diff --git a/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/checkpoints/latest-checkpoint.pt b/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/checkpoints/latest-checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..e438326f0a2ed68621a72fdf71e4fbb6a6a494e0 --- /dev/null +++ b/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/checkpoints/latest-checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaafd5105c885733881cf9f41b32db1dd821896649a2fd6751ea65d171a1e551 +size 15336322587 diff --git a/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/config.json b/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/config.json new file mode 100644 index 0000000000000000000000000000000000000000..225224cc8b64002a34b6661cc10b7e4c130e6f41 --- /dev/null +++ b/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/config.json @@ -0,0 +1,73 @@ +{ + "dataset": { + "align_stage_components": [ + "download/llava-laion-cc-sbu-558k/chat.json", + "download/llava-laion-cc-sbu-558k" + ], + "dataset_id": "llava-v15", + "dataset_resampled": true, + "dataset_root_dir": "data", + "finetune_stage_components": [ + "/home/wzwang/data/llava/llava_phi_3_joint_sharegpt_sft_data_557k.json", + "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/images" + ], + "max_num_images": 6, + "min_num_images": 1, + "train_num_samples": 200000, + "type": "llava-v15", + "workers": 4 + }, + "model": { + "align_epochs": 1, + "align_global_batch_size": 256, + "align_learning_rate": 0.001, + "align_lr_scheduler_type": "linear-warmup+cosine-decay", + "align_max_grad_norm": 1.0, + "align_max_steps": null, + "align_per_device_batch_size": 16, + "align_train_strategy": "fsdp-shard-grad-op", + "align_warmup_ratio": 0.03, + "align_weight_decay": 0.0, + "arch_specifier": "full-align+avgpool", + "enable_gradient_checkpointing": true, + "enable_mixed_precision_training": true, + "finetune_epochs": 1, + "finetune_global_batch_size": 112, + "finetune_learning_rate": 2e-05, + "finetune_lr_scheduler_type": "linear-warmup+cosine-decay", + "finetune_max_grad_norm": 1.0, + "finetune_max_steps": null, + "finetune_per_device_batch_size": 16, + "finetune_train_strategy": "fsdp-full-shard", + "finetune_warmup_ratio": 0.03, + "finetune_weight_decay": 0.1, + "image_resize_strategy": "resize-naive", + "llm_backbone_id": "phi3-3b", + "llm_max_length": 4096, + "model_id": "phi3-3b-continue-training-hq-35-557k-sft", + "pretrain_epochs": 1, + "pretrain_global_batch_size": 512, + "pretrain_learning_rate": 5e-05, + "pretrain_lr_scheduler_type": "linear-warmup+cosine-decay", + "pretrain_max_grad_norm": 1.0, + "pretrain_max_steps": null, + "pretrain_per_device_batch_size": 16, + "pretrain_train_strategy": "fsdp-full-shard", + "pretrain_warmup_ratio": 0.03, + "pretrain_weight_decay": 0.01, + "reduce_in_full_precision": false, + "type": "one-stage+7b", + "vision_backbone_id": "siglip-vit-so400m-384px" + }, + "mount_path": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models", + "pretrained_checkpoint": "/home/wzwang/checkpoints/mllm_pretrain_checkpoints/obelics+phi3-3b-continue-training-hq_35-run1+stage-pretrain+x7/checkpoints/latest-checkpoint.pt", + "run_id": "phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7", + "run_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints/mllm_sft_checkpoints", + "seed": 7, + "stage": "finetune", + "trackers": [ + "jsonl" + ], + "wandb_entity": null, + "wandb_project": "mmpretrain" +} \ No newline at end of file diff --git a/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/config.yaml b/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..549eba5b9387333d7af146811a58baaaa5f40140 --- /dev/null +++ b/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/config.yaml @@ -0,0 +1,66 @@ +dataset: + align_stage_components: + - download/llava-laion-cc-sbu-558k/chat.json + - download/llava-laion-cc-sbu-558k + dataset_id: llava-v15 + dataset_resampled: true + dataset_root_dir: data + finetune_stage_components: + - /home/wzwang/data/llava/llava_phi_3_joint_sharegpt_sft_data_557k.json + - /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/images + max_num_images: 6 + min_num_images: 1 + train_num_samples: 200000 + type: llava-v15 + workers: 4 +model: + align_epochs: 1 + align_global_batch_size: 256 + align_learning_rate: 0.001 + align_lr_scheduler_type: linear-warmup+cosine-decay + align_max_grad_norm: 1.0 + align_max_steps: null + align_per_device_batch_size: 16 + align_train_strategy: fsdp-shard-grad-op + align_warmup_ratio: 0.03 + align_weight_decay: 0.0 + arch_specifier: full-align+avgpool + enable_gradient_checkpointing: true + enable_mixed_precision_training: true + finetune_epochs: 1 + finetune_global_batch_size: 112 + finetune_learning_rate: 2.0e-05 + finetune_lr_scheduler_type: linear-warmup+cosine-decay + finetune_max_grad_norm: 1.0 + finetune_max_steps: null + finetune_per_device_batch_size: 16 + finetune_train_strategy: fsdp-full-shard + finetune_warmup_ratio: 0.03 + finetune_weight_decay: 0.1 + image_resize_strategy: resize-naive + llm_backbone_id: phi3-3b + llm_max_length: 4096 + model_id: phi3-3b-continue-training-hq-35-557k-sft + pretrain_epochs: 1 + pretrain_global_batch_size: 512 + pretrain_learning_rate: 5.0e-05 + pretrain_lr_scheduler_type: linear-warmup+cosine-decay + pretrain_max_grad_norm: 1.0 + pretrain_max_steps: null + pretrain_per_device_batch_size: 16 + pretrain_train_strategy: fsdp-full-shard + pretrain_warmup_ratio: 0.03 + pretrain_weight_decay: 0.01 + reduce_in_full_precision: false + type: one-stage+7b + vision_backbone_id: siglip-vit-so400m-384px +mount_path: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models +pretrained_checkpoint: /home/wzwang/checkpoints/mllm_pretrain_checkpoints/obelics+phi3-3b-continue-training-hq_35-run1+stage-pretrain+x7/checkpoints/latest-checkpoint.pt +run_id: phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7 +run_root_dir: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints/mllm_sft_checkpoints +seed: 7 +stage: finetune +trackers: +- jsonl +wandb_entity: null +wandb_project: mmpretrain diff --git a/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7.jsonl b/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d608cc34919cebf81d0225110bfb53177b0fdb67 --- /dev/null +++ b/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7.jsonl @@ -0,0 +1,4975 @@ +{"Finetune/Learning Rate": 1.342281879194631e-07, "Finetune/Loss": 0.5888769626617432, "Finetune/Loss (Raw)": 0.5888769626617432, "Finetune/Step": 1, "Finetune/Step Time": 27.28826379776001} +{"Finetune/Learning Rate": 2.684563758389262e-07, "Finetune/Loss": 1.0051438808441162, "Finetune/Loss (Raw)": 1.4214106798171997, "Finetune/Step": 2, "Finetune/Step Time": 15.077386140823364} +{"Finetune/Learning Rate": 4.026845637583893e-07, "Finetune/Loss": 0.9348106384277344, "Finetune/Loss (Raw)": 0.7941442131996155, "Finetune/Step": 3, "Finetune/Step Time": 12.260646979014078} +{"Finetune/Learning Rate": 5.369127516778524e-07, "Finetune/Loss": 1.0749013423919678, "Finetune/Loss (Raw)": 1.4951733350753784, "Finetune/Step": 4, "Finetune/Step Time": 9.767219185829163} +{"Finetune/Learning Rate": 6.711409395973155e-07, "Finetune/Loss": 1.1299022436141968, "Finetune/Loss (Raw)": 1.3499054908752441, "Finetune/Step": 5, "Finetune/Step Time": 8.308956003189087} +{"Finetune/Learning Rate": 8.053691275167786e-07, "Finetune/Loss": 1.196791172027588, "Finetune/Loss (Raw)": 1.5312362909317017, "Finetune/Step": 6, "Finetune/Step Time": 7.374405701955159} +{"Finetune/Learning Rate": 9.395973154362417e-07, "Finetune/Loss": 1.2201677560806274, "Finetune/Loss (Raw)": 1.3604263067245483, "Finetune/Step": 7, "Finetune/Step Time": 6.675990002495902} +{"Finetune/Learning Rate": 1.0738255033557048e-06, "Finetune/Loss": 1.2358900308609009, "Finetune/Loss (Raw)": 1.345947027206421, "Finetune/Step": 8, "Finetune/Step Time": 6.11047837138176} +{"Finetune/Learning Rate": 1.208053691275168e-06, "Finetune/Loss": 1.2487096786499023, "Finetune/Loss (Raw)": 1.3512672185897827, "Finetune/Step": 9, "Finetune/Step Time": 5.714061074786716} +{"Finetune/Learning Rate": 1.342281879194631e-06, "Finetune/Loss": 1.2643877267837524, "Finetune/Loss (Raw)": 1.4054903984069824, "Finetune/Step": 10, "Finetune/Step Time": 5.373258709907532} +{"Finetune/Learning Rate": 1.4765100671140942e-06, "Finetune/Loss": 1.2706422805786133, "Finetune/Loss (Raw)": 1.3331876993179321, "Finetune/Step": 11, "Finetune/Step Time": 5.097585049542514} +{"Finetune/Learning Rate": 1.6107382550335572e-06, "Finetune/Loss": 1.2688405513763428, "Finetune/Loss (Raw)": 1.2490202188491821, "Finetune/Step": 12, "Finetune/Step Time": 4.871985375881195} +{"Finetune/Learning Rate": 1.7449664429530203e-06, "Finetune/Loss": 1.2751210927963257, "Finetune/Loss (Raw)": 1.3504892587661743, "Finetune/Step": 13, "Finetune/Step Time": 4.680923296855046} +{"Finetune/Learning Rate": 1.8791946308724835e-06, "Finetune/Loss": 1.275794267654419, "Finetune/Loss (Raw)": 1.2845441102981567, "Finetune/Step": 14, "Finetune/Step Time": 4.515813333647592} +{"Finetune/Learning Rate": 2.013422818791946e-06, "Finetune/Loss": 1.2715760469436646, "Finetune/Loss (Raw)": 1.212520718574524, "Finetune/Step": 15, "Finetune/Step Time": 4.383769226074219} +{"Finetune/Learning Rate": 2.1476510067114096e-06, "Finetune/Loss": 1.2594962120056152, "Finetune/Loss (Raw)": 1.0782991647720337, "Finetune/Step": 16, "Finetune/Step Time": 4.259894788265228} +{"Finetune/Learning Rate": 2.2818791946308725e-06, "Finetune/Loss": 1.2555333375930786, "Finetune/Loss (Raw)": 1.192128300666809, "Finetune/Step": 17, "Finetune/Step Time": 4.160426055683809} +{"Finetune/Learning Rate": 2.416107382550336e-06, "Finetune/Loss": 1.251473069190979, "Finetune/Loss (Raw)": 1.1824500560760498, "Finetune/Step": 18, "Finetune/Step Time": 4.065616528193156} +{"Finetune/Learning Rate": 2.5503355704697992e-06, "Finetune/Loss": 1.2426724433898926, "Finetune/Loss (Raw)": 1.0842598676681519, "Finetune/Step": 19, "Finetune/Step Time": 3.9806667503557707} +{"Finetune/Learning Rate": 2.684563758389262e-06, "Finetune/Loss": 1.2362464666366577, "Finetune/Loss (Raw)": 1.1141526699066162, "Finetune/Step": 20, "Finetune/Step Time": 3.9006011724472045} +{"Finetune/Learning Rate": 2.8187919463087247e-06, "Finetune/Loss": 1.2328091859817505, "Finetune/Loss (Raw)": 1.1640634536743164, "Finetune/Step": 21, "Finetune/Step Time": 3.8250163169134233} +{"Finetune/Learning Rate": 2.9530201342281885e-06, "Finetune/Loss": 1.2267534732818604, "Finetune/Loss (Raw)": 1.0995817184448242, "Finetune/Step": 22, "Finetune/Step Time": 3.7492424032904883} +{"Finetune/Learning Rate": 3.0872483221476514e-06, "Finetune/Loss": 1.2252185344696045, "Finetune/Loss (Raw)": 1.1914503574371338, "Finetune/Step": 23, "Finetune/Step Time": 3.686902502308721} +{"Finetune/Learning Rate": 3.2214765100671143e-06, "Finetune/Loss": 1.2159934043884277, "Finetune/Loss (Raw)": 1.0038138628005981, "Finetune/Step": 24, "Finetune/Step Time": 3.6298204759756723} +{"Finetune/Learning Rate": 3.3557046979865777e-06, "Finetune/Loss": 1.214392900466919, "Finetune/Loss (Raw)": 1.1759834289550781, "Finetune/Step": 25, "Finetune/Step Time": 3.5868405723571777} +{"Finetune/Learning Rate": 3.4899328859060407e-06, "Finetune/Loss": 1.205499291419983, "Finetune/Loss (Raw)": 0.9831574559211731, "Finetune/Step": 26, "Finetune/Step Time": 3.533188535616948} +{"Finetune/Learning Rate": 3.6241610738255036e-06, "Finetune/Loss": 1.1998406648635864, "Finetune/Loss (Raw)": 1.0527154207229614, "Finetune/Step": 27, "Finetune/Step Time": 3.495122953697487} +{"Finetune/Learning Rate": 3.758389261744967e-06, "Finetune/Loss": 1.1932425498962402, "Finetune/Loss (Raw)": 1.0150905847549438, "Finetune/Step": 28, "Finetune/Step Time": 3.458908293928419} +{"Finetune/Learning Rate": 3.8926174496644295e-06, "Finetune/Loss": 1.1865872144699097, "Finetune/Loss (Raw)": 1.0002423524856567, "Finetune/Step": 29, "Finetune/Step Time": 3.4140590305986076} +{"Finetune/Learning Rate": 4.026845637583892e-06, "Finetune/Loss": 1.1831920146942139, "Finetune/Loss (Raw)": 1.0847281217575073, "Finetune/Step": 30, "Finetune/Step Time": 3.382421851158142} +{"Finetune/Learning Rate": 4.161073825503356e-06, "Finetune/Loss": 1.1796386241912842, "Finetune/Loss (Raw)": 1.073039174079895, "Finetune/Step": 31, "Finetune/Step Time": 3.3435328929655013} +{"Finetune/Learning Rate": 4.295302013422819e-06, "Finetune/Loss": 1.1587902307510376, "Finetune/Loss (Raw)": 0.5124914050102234, "Finetune/Step": 32, "Finetune/Step Time": 3.436756767332554} +{"Finetune/Learning Rate": 4.429530201342283e-06, "Finetune/Loss": 1.1534535884857178, "Finetune/Loss (Raw)": 0.9826817512512207, "Finetune/Step": 33, "Finetune/Step Time": 3.4129744298530347} +{"Finetune/Learning Rate": 4.563758389261745e-06, "Finetune/Loss": 1.1489357948303223, "Finetune/Loss (Raw)": 0.9998475909233093, "Finetune/Step": 34, "Finetune/Step Time": 3.3909160249373493} +{"Finetune/Learning Rate": 4.697986577181208e-06, "Finetune/Loss": 1.143308162689209, "Finetune/Loss (Raw)": 0.9519686102867126, "Finetune/Step": 35, "Finetune/Step Time": 3.3633936268942697} +{"Finetune/Learning Rate": 4.832214765100672e-06, "Finetune/Loss": 1.1395604610443115, "Finetune/Loss (Raw)": 1.0083919763565063, "Finetune/Step": 36, "Finetune/Step Time": 3.3540952271885343} +{"Finetune/Learning Rate": 4.966442953020135e-06, "Finetune/Loss": 1.1272300481796265, "Finetune/Loss (Raw)": 0.6833383440971375, "Finetune/Step": 37, "Finetune/Step Time": 3.4078568896731816} +{"Finetune/Learning Rate": 5.1006711409395985e-06, "Finetune/Loss": 1.122550368309021, "Finetune/Loss (Raw)": 0.9493986368179321, "Finetune/Step": 38, "Finetune/Step Time": 3.3931179360339514} +{"Finetune/Learning Rate": 5.234899328859061e-06, "Finetune/Loss": 1.1191747188568115, "Finetune/Loss (Raw)": 0.9909003973007202, "Finetune/Step": 39, "Finetune/Step Time": 3.369653053772755} +{"Finetune/Learning Rate": 5.369127516778524e-06, "Finetune/Loss": 1.1160379648208618, "Finetune/Loss (Raw)": 0.9937025308609009, "Finetune/Step": 40, "Finetune/Step Time": 3.351633197069168} +{"Finetune/Learning Rate": 5.503355704697987e-06, "Finetune/Loss": 1.111807942390442, "Finetune/Loss (Raw)": 0.9426093101501465, "Finetune/Step": 41, "Finetune/Step Time": 3.332437672266146} +{"Finetune/Learning Rate": 5.637583892617449e-06, "Finetune/Loss": 1.1087907552719116, "Finetune/Loss (Raw)": 0.9850851893424988, "Finetune/Step": 42, "Finetune/Step Time": 3.3181200254531134} +{"Finetune/Learning Rate": 5.771812080536914e-06, "Finetune/Loss": 1.1063482761383057, "Finetune/Loss (Raw)": 1.0037617683410645, "Finetune/Step": 43, "Finetune/Step Time": 3.2973347431005435} +{"Finetune/Learning Rate": 5.906040268456377e-06, "Finetune/Loss": 1.1087710857391357, "Finetune/Loss (Raw)": 1.2129544019699097, "Finetune/Step": 44, "Finetune/Step Time": 3.2767571319233286} +{"Finetune/Learning Rate": 6.04026845637584e-06, "Finetune/Loss": 1.1056159734725952, "Finetune/Loss (Raw)": 0.9667943120002747, "Finetune/Step": 45, "Finetune/Step Time": 3.2532543023427327} +{"Finetune/Learning Rate": 6.174496644295303e-06, "Finetune/Loss": 1.1051833629608154, "Finetune/Loss (Raw)": 1.085710883140564, "Finetune/Step": 46, "Finetune/Step Time": 3.2286052548367046} +{"Finetune/Learning Rate": 6.308724832214766e-06, "Finetune/Loss": 1.099886178970337, "Finetune/Loss (Raw)": 0.856221616268158, "Finetune/Step": 47, "Finetune/Step Time": 3.2070622342698116} +{"Finetune/Learning Rate": 6.442953020134229e-06, "Finetune/Loss": 1.0979204177856445, "Finetune/Loss (Raw)": 1.0055227279663086, "Finetune/Step": 48, "Finetune/Step Time": 3.1910817871491113} +{"Finetune/Learning Rate": 6.5771812080536925e-06, "Finetune/Loss": 1.095150351524353, "Finetune/Loss (Raw)": 0.9621927738189697, "Finetune/Step": 49, "Finetune/Step Time": 3.174898230299658} +{"Finetune/Learning Rate": 6.711409395973155e-06, "Finetune/Loss": 1.0941264629364014, "Finetune/Loss (Raw)": 1.0439512729644775, "Finetune/Step": 50, "Finetune/Step Time": 3.1595882511138917} +{"Finetune/Learning Rate": 6.845637583892618e-06, "Finetune/Loss": 1.0924007892608643, "Finetune/Loss (Raw)": 1.0061219930648804, "Finetune/Step": 51, "Finetune/Step Time": 3.1441677551643523} +{"Finetune/Learning Rate": 6.979865771812081e-06, "Finetune/Loss": 1.0886247158050537, "Finetune/Loss (Raw)": 0.8960381746292114, "Finetune/Step": 52, "Finetune/Step Time": 3.1292676421312184} +{"Finetune/Learning Rate": 7.114093959731544e-06, "Finetune/Loss": 1.085991382598877, "Finetune/Loss (Raw)": 0.9490604996681213, "Finetune/Step": 53, "Finetune/Step Time": 3.1190523921318776} +{"Finetune/Learning Rate": 7.248322147651007e-06, "Finetune/Loss": 1.083092451095581, "Finetune/Loss (Raw)": 0.9294496774673462, "Finetune/Step": 54, "Finetune/Step Time": 3.1593409997445567} +{"Finetune/Learning Rate": 7.382550335570471e-06, "Finetune/Loss": 1.0812610387802124, "Finetune/Loss (Raw)": 0.9823691844940186, "Finetune/Step": 55, "Finetune/Step Time": 3.146852879090743} +{"Finetune/Learning Rate": 7.516778523489934e-06, "Finetune/Loss": 1.0808645486831665, "Finetune/Loss (Raw)": 1.0590524673461914, "Finetune/Step": 56, "Finetune/Step Time": 3.1347072337354933} +{"Finetune/Learning Rate": 7.651006711409396e-06, "Finetune/Loss": 1.0799362659454346, "Finetune/Loss (Raw)": 1.0279552936553955, "Finetune/Step": 57, "Finetune/Step Time": 3.118720422711289} +{"Finetune/Learning Rate": 7.785234899328859e-06, "Finetune/Loss": 1.0678281784057617, "Finetune/Loss (Raw)": 0.3776640295982361, "Finetune/Step": 58, "Finetune/Step Time": 3.191015999892662} +{"Finetune/Learning Rate": 7.919463087248322e-06, "Finetune/Loss": 1.0662016868591309, "Finetune/Loss (Raw)": 0.9718707203865051, "Finetune/Step": 59, "Finetune/Step Time": 3.183853981858593} +{"Finetune/Learning Rate": 8.053691275167785e-06, "Finetune/Loss": 1.0601146221160889, "Finetune/Loss (Raw)": 0.7009742856025696, "Finetune/Step": 60, "Finetune/Step Time": 3.219889231522878} +{"Finetune/Learning Rate": 8.18791946308725e-06, "Finetune/Loss": 1.0471320152282715, "Finetune/Loss (Raw)": 0.2681807577610016, "Finetune/Step": 61, "Finetune/Step Time": 3.2806886297757507} +{"Finetune/Learning Rate": 8.322147651006712e-06, "Finetune/Loss": 1.0466595888137817, "Finetune/Loss (Raw)": 1.0178362131118774, "Finetune/Step": 62, "Finetune/Step Time": 3.2620159887498423} +{"Finetune/Learning Rate": 8.456375838926175e-06, "Finetune/Loss": 1.0400516986846924, "Finetune/Loss (Raw)": 0.6303583383560181, "Finetune/Step": 63, "Finetune/Step Time": 3.3044224012465704} +{"Finetune/Learning Rate": 8.590604026845638e-06, "Finetune/Loss": 1.0388271808624268, "Finetune/Loss (Raw)": 0.9616926908493042, "Finetune/Step": 64, "Finetune/Step Time": 3.2946071960031986} +{"Finetune/Learning Rate": 8.724832214765101e-06, "Finetune/Loss": 1.038687825202942, "Finetune/Loss (Raw)": 1.029765248298645, "Finetune/Step": 65, "Finetune/Step Time": 3.2797158791468695} +{"Finetune/Learning Rate": 8.859060402684566e-06, "Finetune/Loss": 1.0382124185562134, "Finetune/Loss (Raw)": 1.0073143243789673, "Finetune/Step": 66, "Finetune/Step Time": 3.2660415208700933} +{"Finetune/Learning Rate": 8.993288590604027e-06, "Finetune/Loss": 1.0387336015701294, "Finetune/Loss (Raw)": 1.0731266736984253, "Finetune/Step": 67, "Finetune/Step Time": 3.2554814922275828} +{"Finetune/Learning Rate": 9.12751677852349e-06, "Finetune/Loss": 1.037485957145691, "Finetune/Loss (Raw)": 0.9538882374763489, "Finetune/Step": 68, "Finetune/Step Time": 3.2376012802124023} +{"Finetune/Learning Rate": 9.261744966442953e-06, "Finetune/Loss": 1.0367186069488525, "Finetune/Loss (Raw)": 0.9845477342605591, "Finetune/Step": 69, "Finetune/Step Time": 3.230592644732931} +{"Finetune/Learning Rate": 9.395973154362416e-06, "Finetune/Loss": 1.0264679193496704, "Finetune/Loss (Raw)": 0.31916189193725586, "Finetune/Step": 70, "Finetune/Step Time": 3.292623083932059} +{"Finetune/Learning Rate": 9.530201342281879e-06, "Finetune/Loss": 1.0256661176681519, "Finetune/Loss (Raw)": 0.9695485830307007, "Finetune/Step": 71, "Finetune/Step Time": 3.2803520484709403} +{"Finetune/Learning Rate": 9.664429530201343e-06, "Finetune/Loss": 1.0237290859222412, "Finetune/Loss (Raw)": 0.886203408241272, "Finetune/Step": 72, "Finetune/Step Time": 3.2683943808078766} +{"Finetune/Learning Rate": 9.798657718120806e-06, "Finetune/Loss": 1.0203765630722046, "Finetune/Loss (Raw)": 0.7789903879165649, "Finetune/Step": 73, "Finetune/Step Time": 3.2968343349352276} +{"Finetune/Learning Rate": 9.93288590604027e-06, "Finetune/Loss": 1.021071434020996, "Finetune/Loss (Raw)": 1.0717964172363281, "Finetune/Step": 74, "Finetune/Step Time": 3.2886225661715947} +{"Finetune/Learning Rate": 1.0067114093959734e-05, "Finetune/Loss": 1.0202360153198242, "Finetune/Loss (Raw)": 0.9584073424339294, "Finetune/Step": 75, "Finetune/Step Time": 3.277001183827718} +{"Finetune/Learning Rate": 1.0201342281879197e-05, "Finetune/Loss": 1.0150365829467773, "Finetune/Loss (Raw)": 0.6250753998756409, "Finetune/Step": 76, "Finetune/Step Time": 3.3109744661732723} +{"Finetune/Learning Rate": 1.033557046979866e-05, "Finetune/Loss": 1.0143545866012573, "Finetune/Loss (Raw)": 0.9625260233879089, "Finetune/Step": 77, "Finetune/Step Time": 3.3039368778080136} +{"Finetune/Learning Rate": 1.0469798657718123e-05, "Finetune/Loss": 1.0132412910461426, "Finetune/Loss (Raw)": 0.9275203347206116, "Finetune/Step": 78, "Finetune/Step Time": 3.2901653723839} +{"Finetune/Learning Rate": 1.0604026845637586e-05, "Finetune/Loss": 1.0143301486968994, "Finetune/Loss (Raw)": 1.0992687940597534, "Finetune/Step": 79, "Finetune/Step Time": 3.2803976475437984} +{"Finetune/Learning Rate": 1.0738255033557049e-05, "Finetune/Loss": 1.0148929357528687, "Finetune/Loss (Raw)": 1.0593557357788086, "Finetune/Step": 80, "Finetune/Step Time": 3.2704851806163786} +{"Finetune/Learning Rate": 1.0872483221476512e-05, "Finetune/Loss": 1.013317346572876, "Finetune/Loss (Raw)": 0.8872678279876709, "Finetune/Step": 81, "Finetune/Step Time": 3.2594797169720686} +{"Finetune/Learning Rate": 1.1006711409395975e-05, "Finetune/Loss": 1.0123505592346191, "Finetune/Loss (Raw)": 0.9340394139289856, "Finetune/Step": 82, "Finetune/Step Time": 3.246036000368072} +{"Finetune/Learning Rate": 1.1140939597315436e-05, "Finetune/Loss": 1.0119653940200806, "Finetune/Loss (Raw)": 0.9803772568702698, "Finetune/Step": 83, "Finetune/Step Time": 3.2312566688261835} +{"Finetune/Learning Rate": 1.1275167785234899e-05, "Finetune/Loss": 1.0115776062011719, "Finetune/Loss (Raw)": 0.9793907999992371, "Finetune/Step": 84, "Finetune/Step Time": 3.224433896087465} +{"Finetune/Learning Rate": 1.1409395973154362e-05, "Finetune/Loss": 1.011654019355774, "Finetune/Loss (Raw)": 1.0180647373199463, "Finetune/Step": 85, "Finetune/Step Time": 3.215974911521463} +{"Finetune/Learning Rate": 1.1543624161073828e-05, "Finetune/Loss": 1.0107041597366333, "Finetune/Loss (Raw)": 0.9299800395965576, "Finetune/Step": 86, "Finetune/Step Time": 3.208341889603193} +{"Finetune/Learning Rate": 1.1677852348993291e-05, "Finetune/Loss": 1.010487675666809, "Finetune/Loss (Raw)": 0.9918702244758606, "Finetune/Step": 87, "Finetune/Step Time": 3.19578471128968} +{"Finetune/Learning Rate": 1.1812080536912754e-05, "Finetune/Loss": 1.009786605834961, "Finetune/Loss (Raw)": 0.9487802982330322, "Finetune/Step": 88, "Finetune/Step Time": 3.186304720965299} +{"Finetune/Learning Rate": 1.1946308724832217e-05, "Finetune/Loss": 1.0091348886489868, "Finetune/Loss (Raw)": 0.9517928957939148, "Finetune/Step": 89, "Finetune/Step Time": 3.1753687322809454} +{"Finetune/Learning Rate": 1.208053691275168e-05, "Finetune/Loss": 1.0084894895553589, "Finetune/Loss (Raw)": 0.9510475993156433, "Finetune/Step": 90, "Finetune/Step Time": 3.1680717759662205} +{"Finetune/Learning Rate": 1.2214765100671143e-05, "Finetune/Loss": 1.0077672004699707, "Finetune/Loss (Raw)": 0.9427634477615356, "Finetune/Step": 91, "Finetune/Step Time": 3.160021653542152} +{"Finetune/Learning Rate": 1.2348993288590606e-05, "Finetune/Loss": 1.0073308944702148, "Finetune/Loss (Raw)": 0.9676169753074646, "Finetune/Step": 92, "Finetune/Step Time": 3.1510847392289536} +{"Finetune/Learning Rate": 1.2483221476510069e-05, "Finetune/Loss": 1.0058846473693848, "Finetune/Loss (Raw)": 0.8728400468826294, "Finetune/Step": 93, "Finetune/Step Time": 3.141736061342301} +{"Finetune/Learning Rate": 1.2617449664429532e-05, "Finetune/Loss": 1.005812406539917, "Finetune/Loss (Raw)": 0.9990875720977783, "Finetune/Step": 94, "Finetune/Step Time": 3.1356048051347125} +{"Finetune/Learning Rate": 1.2751677852348994e-05, "Finetune/Loss": 1.0046749114990234, "Finetune/Loss (Raw)": 0.8977442979812622, "Finetune/Step": 95, "Finetune/Step Time": 3.1270080892663255} +{"Finetune/Learning Rate": 1.2885906040268457e-05, "Finetune/Loss": 1.001072883605957, "Finetune/Loss (Raw)": 0.6588955521583557, "Finetune/Step": 96, "Finetune/Step Time": 3.1558751240372658} +{"Finetune/Learning Rate": 1.302013422818792e-05, "Finetune/Loss": 1.0010122060775757, "Finetune/Loss (Raw)": 0.9951826333999634, "Finetune/Step": 97, "Finetune/Step Time": 3.148203023930186} +{"Finetune/Learning Rate": 1.3154362416107385e-05, "Finetune/Loss": 1.0002679824829102, "Finetune/Loss (Raw)": 0.9280782341957092, "Finetune/Step": 98, "Finetune/Step Time": 3.1402211481211135} +{"Finetune/Learning Rate": 1.3288590604026848e-05, "Finetune/Loss": 0.9993913173675537, "Finetune/Loss (Raw)": 0.9134804606437683, "Finetune/Step": 99, "Finetune/Step Time": 3.133439210930256} +{"Finetune/Learning Rate": 1.342281879194631e-05, "Finetune/Loss": 0.9935000538825989, "Finetune/Loss (Raw)": 0.410264253616333, "Finetune/Step": 100, "Finetune/Step Time": 3.1632324290275573} +{"Finetune/Learning Rate": 1.3557046979865774e-05, "Finetune/Loss": 0.992727518081665, "Finetune/Loss (Raw)": 0.9154756665229797, "Finetune/Step": 101, "Finetune/Step Time": 3.1570507606657423} +{"Finetune/Learning Rate": 1.3691275167785237e-05, "Finetune/Loss": 0.9923859238624573, "Finetune/Loss (Raw)": 0.9578762054443359, "Finetune/Step": 102, "Finetune/Step Time": 3.1476657063353297} +{"Finetune/Learning Rate": 1.38255033557047e-05, "Finetune/Loss": 0.9922310709953308, "Finetune/Loss (Raw)": 0.976442813873291, "Finetune/Step": 103, "Finetune/Step Time": 3.1415738457614935} +{"Finetune/Learning Rate": 1.3959731543624163e-05, "Finetune/Loss": 0.9913679361343384, "Finetune/Loss (Raw)": 0.902463972568512, "Finetune/Step": 104, "Finetune/Step Time": 3.1335814022100887} +{"Finetune/Learning Rate": 1.4093959731543626e-05, "Finetune/Loss": 0.9881733059883118, "Finetune/Loss (Raw)": 0.6559270620346069, "Finetune/Step": 105, "Finetune/Step Time": 3.1588007699875607} +{"Finetune/Learning Rate": 1.4228187919463088e-05, "Finetune/Loss": 0.987740159034729, "Finetune/Loss (Raw)": 0.9422706365585327, "Finetune/Step": 106, "Finetune/Step Time": 3.15539949570062} +{"Finetune/Learning Rate": 1.4362416107382551e-05, "Finetune/Loss": 0.9872580170631409, "Finetune/Loss (Raw)": 0.9361517429351807, "Finetune/Step": 107, "Finetune/Step Time": 3.151565028128223} +{"Finetune/Learning Rate": 1.4496644295302014e-05, "Finetune/Loss": 0.9842857122421265, "Finetune/Loss (Raw)": 0.6662494540214539, "Finetune/Step": 108, "Finetune/Step Time": 3.1797397004233465} +{"Finetune/Learning Rate": 1.4630872483221479e-05, "Finetune/Loss": 0.9838135838508606, "Finetune/Loss (Raw)": 0.9328198432922363, "Finetune/Step": 109, "Finetune/Step Time": 3.173561513970751} +{"Finetune/Learning Rate": 1.4765100671140942e-05, "Finetune/Loss": 0.9830703139305115, "Finetune/Loss (Raw)": 0.9020581245422363, "Finetune/Step": 110, "Finetune/Step Time": 3.1645886594598944} +{"Finetune/Learning Rate": 1.4899328859060405e-05, "Finetune/Loss": 0.9828378558158875, "Finetune/Loss (Raw)": 0.9572692513465881, "Finetune/Step": 111, "Finetune/Step Time": 3.1554214481834895} +{"Finetune/Learning Rate": 1.5033557046979868e-05, "Finetune/Loss": 0.9823920726776123, "Finetune/Loss (Raw)": 0.93290114402771, "Finetune/Step": 112, "Finetune/Step Time": 3.149373825107302} +{"Finetune/Learning Rate": 1.516778523489933e-05, "Finetune/Loss": 0.982812225818634, "Finetune/Loss (Raw)": 1.0298768281936646, "Finetune/Step": 113, "Finetune/Step Time": 3.141856294817629} +{"Finetune/Learning Rate": 1.5302013422818792e-05, "Finetune/Loss": 0.9824655055999756, "Finetune/Loss (Raw)": 0.9432916045188904, "Finetune/Step": 114, "Finetune/Step Time": 3.1346838055995474} +{"Finetune/Learning Rate": 1.5436241610738255e-05, "Finetune/Loss": 0.9818044900894165, "Finetune/Loss (Raw)": 0.9064527153968811, "Finetune/Step": 115, "Finetune/Step Time": 3.1341719233471412} +{"Finetune/Learning Rate": 1.5570469798657718e-05, "Finetune/Loss": 0.9804286360740662, "Finetune/Loss (Raw)": 0.8221957683563232, "Finetune/Step": 116, "Finetune/Step Time": 3.126286009262348} +{"Finetune/Learning Rate": 1.570469798657718e-05, "Finetune/Loss": 0.9796382784843445, "Finetune/Loss (Raw)": 0.8879539966583252, "Finetune/Step": 117, "Finetune/Step Time": 3.120864843710875} +{"Finetune/Learning Rate": 1.5838926174496644e-05, "Finetune/Loss": 0.9792253971099854, "Finetune/Loss (Raw)": 0.9309254884719849, "Finetune/Step": 118, "Finetune/Step Time": 3.1150330062639915} +{"Finetune/Learning Rate": 1.5973154362416107e-05, "Finetune/Loss": 0.9797519445419312, "Finetune/Loss (Raw)": 1.0418787002563477, "Finetune/Step": 119, "Finetune/Step Time": 3.110228907160398} +{"Finetune/Learning Rate": 1.610738255033557e-05, "Finetune/Loss": 0.9796643853187561, "Finetune/Loss (Raw)": 0.9692390561103821, "Finetune/Step": 120, "Finetune/Step Time": 3.104788581530253} +{"Finetune/Learning Rate": 1.6241610738255036e-05, "Finetune/Loss": 0.979566752910614, "Finetune/Loss (Raw)": 0.9678576588630676, "Finetune/Step": 121, "Finetune/Step Time": 3.1008203738977103} +{"Finetune/Learning Rate": 1.63758389261745e-05, "Finetune/Loss": 0.9756864905357361, "Finetune/Loss (Raw)": 0.5061807036399841, "Finetune/Step": 122, "Finetune/Step Time": 3.119858163302062} +{"Finetune/Learning Rate": 1.6510067114093962e-05, "Finetune/Loss": 0.9755328297615051, "Finetune/Loss (Raw)": 0.9567793607711792, "Finetune/Step": 123, "Finetune/Step Time": 3.115418451588328} +{"Finetune/Learning Rate": 1.6644295302013425e-05, "Finetune/Loss": 0.9748932123184204, "Finetune/Loss (Raw)": 0.8962286114692688, "Finetune/Step": 124, "Finetune/Step Time": 3.1109712585326164} +{"Finetune/Learning Rate": 1.6778523489932888e-05, "Finetune/Loss": 0.9744371771812439, "Finetune/Loss (Raw)": 0.9178769588470459, "Finetune/Step": 125, "Finetune/Step Time": 3.106171667098999} +{"Finetune/Learning Rate": 1.691275167785235e-05, "Finetune/Loss": 0.9751742482185364, "Finetune/Loss (Raw)": 1.067301869392395, "Finetune/Step": 126, "Finetune/Step Time": 3.100357354633392} +{"Finetune/Learning Rate": 1.7046979865771814e-05, "Finetune/Loss": 0.9747071862220764, "Finetune/Loss (Raw)": 0.9158646464347839, "Finetune/Step": 127, "Finetune/Step Time": 3.09471431679613} +{"Finetune/Learning Rate": 1.7181208053691277e-05, "Finetune/Loss": 0.9739793539047241, "Finetune/Loss (Raw)": 0.8815452456474304, "Finetune/Step": 128, "Finetune/Step Time": 3.088538095355034} +{"Finetune/Learning Rate": 1.731543624161074e-05, "Finetune/Loss": 0.9766414761543274, "Finetune/Loss (Raw)": 0.9296241998672485, "Finetune/Step": 129, "Finetune/Step Time": 2.892529545351863} +{"Finetune/Learning Rate": 1.7449664429530202e-05, "Finetune/Loss": 0.9724419116973877, "Finetune/Loss (Raw)": 0.8838707804679871, "Finetune/Step": 130, "Finetune/Step Time": 2.8887629937380552} +{"Finetune/Learning Rate": 1.7583892617449665e-05, "Finetune/Loss": 0.9734706282615662, "Finetune/Loss (Raw)": 0.9258204698562622, "Finetune/Step": 131, "Finetune/Step Time": 2.8652896489948034} +{"Finetune/Learning Rate": 1.771812080536913e-05, "Finetune/Loss": 0.9692324995994568, "Finetune/Loss (Raw)": 0.9526899456977844, "Finetune/Step": 132, "Finetune/Step Time": 2.8670009952038527} +{"Finetune/Learning Rate": 1.7852348993288595e-05, "Finetune/Loss": 0.9632289409637451, "Finetune/Loss (Raw)": 0.5814522504806519, "Finetune/Step": 133, "Finetune/Step Time": 2.8887820579111576} +{"Finetune/Learning Rate": 1.7986577181208054e-05, "Finetune/Loss": 0.959236204624176, "Finetune/Loss (Raw)": 1.0201671123504639, "Finetune/Step": 134, "Finetune/Step Time": 2.888211492449045} +{"Finetune/Learning Rate": 1.8120805369127517e-05, "Finetune/Loss": 0.9561020135879517, "Finetune/Loss (Raw)": 0.9592505693435669, "Finetune/Step": 135, "Finetune/Step Time": 2.8867860324680805} +{"Finetune/Learning Rate": 1.825503355704698e-05, "Finetune/Loss": 0.9537481069564819, "Finetune/Loss (Raw)": 1.044641137123108, "Finetune/Step": 136, "Finetune/Step Time": 2.8910926952958107} +{"Finetune/Learning Rate": 1.8389261744966443e-05, "Finetune/Loss": 0.9509221911430359, "Finetune/Loss (Raw)": 0.9895491003990173, "Finetune/Step": 137, "Finetune/Step Time": 2.8901193030178547} +{"Finetune/Learning Rate": 1.8523489932885906e-05, "Finetune/Loss": 0.9472894072532654, "Finetune/Loss (Raw)": 0.9404954314231873, "Finetune/Step": 138, "Finetune/Step Time": 2.8896248377859592} +{"Finetune/Learning Rate": 1.865771812080537e-05, "Finetune/Loss": 0.9414386749267578, "Finetune/Loss (Raw)": 0.5842921137809753, "Finetune/Step": 139, "Finetune/Step Time": 2.913359861820936} +{"Finetune/Learning Rate": 1.8791946308724832e-05, "Finetune/Loss": 0.9391777515411377, "Finetune/Loss (Raw)": 0.959620475769043, "Finetune/Step": 140, "Finetune/Step Time": 2.9161411486566067} +{"Finetune/Learning Rate": 1.8926174496644295e-05, "Finetune/Loss": 0.9357357025146484, "Finetune/Loss (Raw)": 0.909903883934021, "Finetune/Step": 141, "Finetune/Step Time": 2.91669493727386} +{"Finetune/Learning Rate": 1.9060402684563758e-05, "Finetune/Loss": 0.9320431351661682, "Finetune/Loss (Raw)": 0.8119028806686401, "Finetune/Step": 142, "Finetune/Step Time": 2.9389647394418716} +{"Finetune/Learning Rate": 1.919463087248322e-05, "Finetune/Loss": 0.9301812648773193, "Finetune/Loss (Raw)": 0.9741959571838379, "Finetune/Step": 143, "Finetune/Step Time": 2.93907755240798} +{"Finetune/Learning Rate": 1.9328859060402687e-05, "Finetune/Loss": 0.9297739267349243, "Finetune/Loss (Raw)": 1.0261629819869995, "Finetune/Step": 144, "Finetune/Step Time": 2.9368655793368816} +{"Finetune/Learning Rate": 1.946308724832215e-05, "Finetune/Loss": 0.9274366497993469, "Finetune/Loss (Raw)": 0.8929571509361267, "Finetune/Step": 145, "Finetune/Step Time": 2.9385722130537033} +{"Finetune/Learning Rate": 1.9597315436241613e-05, "Finetune/Loss": 0.9261390566825867, "Finetune/Loss (Raw)": 1.016359567642212, "Finetune/Step": 146, "Finetune/Step Time": 2.937741069123149} +{"Finetune/Learning Rate": 1.9731543624161076e-05, "Finetune/Loss": 0.9254530072212219, "Finetune/Loss (Raw)": 0.9964442849159241, "Finetune/Step": 147, "Finetune/Step Time": 2.9382244497537613} +{"Finetune/Learning Rate": 1.986577181208054e-05, "Finetune/Loss": 0.9232670664787292, "Finetune/Loss (Raw)": 0.8343514800071716, "Finetune/Step": 148, "Finetune/Step Time": 2.9405502267181873} +{"Finetune/Learning Rate": 2e-05, "Finetune/Loss": 0.9210284948348999, "Finetune/Loss (Raw)": 0.8775258660316467, "Finetune/Step": 149, "Finetune/Step Time": 2.938542254269123} +{"Finetune/Learning Rate": 1.999999788029659e-05, "Finetune/Loss": 0.9200509190559387, "Finetune/Loss (Raw)": 0.9744482636451721, "Finetune/Step": 150, "Finetune/Step Time": 2.9433276634663343} +{"Finetune/Learning Rate": 1.999999152118725e-05, "Finetune/Loss": 0.9181032180786133, "Finetune/Loss (Raw)": 0.9421463012695312, "Finetune/Step": 151, "Finetune/Step Time": 2.945958439260721} +{"Finetune/Learning Rate": 1.9999980922674677e-05, "Finetune/Loss": 0.9178332686424255, "Finetune/Loss (Raw)": 0.9692622423171997, "Finetune/Step": 152, "Finetune/Step Time": 2.9471214059740305} +{"Finetune/Learning Rate": 1.999996608476337e-05, "Finetune/Loss": 0.916127622127533, "Finetune/Loss (Raw)": 0.9576596021652222, "Finetune/Step": 153, "Finetune/Step Time": 2.9438638258725405} +{"Finetune/Learning Rate": 1.9999947007459616e-05, "Finetune/Loss": 0.9160398840904236, "Finetune/Loss (Raw)": 0.9719282388687134, "Finetune/Step": 154, "Finetune/Step Time": 2.9450223185122013} +{"Finetune/Learning Rate": 1.99999236907715e-05, "Finetune/Loss": 0.9156544208526611, "Finetune/Loss (Raw)": 1.0033780336380005, "Finetune/Step": 155, "Finetune/Step Time": 2.9451619684696198} +{"Finetune/Learning Rate": 1.999989613470891e-05, "Finetune/Loss": 0.9124008417129517, "Finetune/Loss (Raw)": 0.5986331701278687, "Finetune/Step": 156, "Finetune/Step Time": 2.966982064768672} +{"Finetune/Learning Rate": 1.999986433928353e-05, "Finetune/Loss": 0.9115647673606873, "Finetune/Loss (Raw)": 0.8932183384895325, "Finetune/Step": 157, "Finetune/Step Time": 2.968548571690917} +{"Finetune/Learning Rate": 1.9999828304508834e-05, "Finetune/Loss": 0.9098409414291382, "Finetune/Loss (Raw)": 0.8640882968902588, "Finetune/Step": 158, "Finetune/Step Time": 2.965409219264984} +{"Finetune/Learning Rate": 1.99997880304001e-05, "Finetune/Loss": 0.9092889428138733, "Finetune/Loss (Raw)": 1.0023808479309082, "Finetune/Step": 159, "Finetune/Step Time": 2.968307802453637} +{"Finetune/Learning Rate": 1.9999743516974405e-05, "Finetune/Loss": 0.9121576547622681, "Finetune/Loss (Raw)": 0.8796901106834412, "Finetune/Step": 160, "Finetune/Step Time": 2.939820323139429} +{"Finetune/Learning Rate": 1.999969476425062e-05, "Finetune/Loss": 0.9118598699569702, "Finetune/Loss (Raw)": 0.9445592164993286, "Finetune/Step": 161, "Finetune/Step Time": 2.9370645843446255} +{"Finetune/Learning Rate": 1.9999641772249407e-05, "Finetune/Loss": 0.9110158085823059, "Finetune/Loss (Raw)": 0.8918055891990662, "Finetune/Step": 162, "Finetune/Step Time": 2.934148583561182} +{"Finetune/Learning Rate": 1.999958454099324e-05, "Finetune/Loss": 0.9111400246620178, "Finetune/Loss (Raw)": 0.967869758605957, "Finetune/Step": 163, "Finetune/Step Time": 2.932467533275485} +{"Finetune/Learning Rate": 1.9999523070506376e-05, "Finetune/Loss": 0.9099246263504028, "Finetune/Loss (Raw)": 0.8528252243995667, "Finetune/Step": 164, "Finetune/Step Time": 2.9287470281124115} +{"Finetune/Learning Rate": 1.9999457360814873e-05, "Finetune/Loss": 0.9116530418395996, "Finetune/Loss (Raw)": 0.9045671224594116, "Finetune/Step": 165, "Finetune/Step Time": 2.906250972300768} +{"Finetune/Learning Rate": 1.9999387411946598e-05, "Finetune/Loss": 0.9121916890144348, "Finetune/Loss (Raw)": 1.0183500051498413, "Finetune/Step": 166, "Finetune/Step Time": 2.9026975259184837} +{"Finetune/Learning Rate": 1.9999313223931194e-05, "Finetune/Loss": 0.9110990762710571, "Finetune/Loss (Raw)": 0.851051390171051, "Finetune/Step": 167, "Finetune/Step Time": 2.902803311124444} +{"Finetune/Learning Rate": 1.999923479680012e-05, "Finetune/Loss": 0.9106862545013428, "Finetune/Loss (Raw)": 0.9408627152442932, "Finetune/Step": 168, "Finetune/Step Time": 2.9005037751048803} +{"Finetune/Learning Rate": 1.9999152130586617e-05, "Finetune/Loss": 0.9099447727203369, "Finetune/Loss (Raw)": 0.8476876020431519, "Finetune/Step": 169, "Finetune/Step Time": 2.9003366995602846} +{"Finetune/Learning Rate": 1.999906522532574e-05, "Finetune/Loss": 0.9088521003723145, "Finetune/Loss (Raw)": 0.8452277779579163, "Finetune/Step": 170, "Finetune/Step Time": 2.897047409787774} +{"Finetune/Learning Rate": 1.9998974081054323e-05, "Finetune/Loss": 0.9081041216850281, "Finetune/Loss (Raw)": 0.9080255627632141, "Finetune/Step": 171, "Finetune/Step Time": 2.898220542818308} +{"Finetune/Learning Rate": 1.999887869781101e-05, "Finetune/Loss": 0.9057945609092712, "Finetune/Loss (Raw)": 0.9173256754875183, "Finetune/Step": 172, "Finetune/Step Time": 2.898257914930582} +{"Finetune/Learning Rate": 1.999877907563624e-05, "Finetune/Loss": 0.905289888381958, "Finetune/Loss (Raw)": 0.9021909236907959, "Finetune/Step": 173, "Finetune/Step Time": 2.903156539425254} +{"Finetune/Learning Rate": 1.999867521457224e-05, "Finetune/Loss": 0.9044675827026367, "Finetune/Loss (Raw)": 0.9804655909538269, "Finetune/Step": 174, "Finetune/Step Time": 2.904731346294284} +{"Finetune/Learning Rate": 1.9998567114663048e-05, "Finetune/Loss": 0.9026002883911133, "Finetune/Loss (Raw)": 0.6172012686729431, "Finetune/Step": 175, "Finetune/Step Time": 2.9297780971974134} +{"Finetune/Learning Rate": 1.999845477595449e-05, "Finetune/Loss": 0.9022663831710815, "Finetune/Loss (Raw)": 0.9627911448478699, "Finetune/Step": 176, "Finetune/Step Time": 2.9281521514058113} +{"Finetune/Learning Rate": 1.9998338198494184e-05, "Finetune/Loss": 0.8995884656906128, "Finetune/Loss (Raw)": 0.6194105744361877, "Finetune/Step": 177, "Finetune/Step Time": 2.950075425207615} +{"Finetune/Learning Rate": 1.9998217382331564e-05, "Finetune/Loss": 0.8987797498703003, "Finetune/Loss (Raw)": 0.9404382705688477, "Finetune/Step": 178, "Finetune/Step Time": 2.9519882071763277} +{"Finetune/Learning Rate": 1.999809232751784e-05, "Finetune/Loss": 0.8982805013656616, "Finetune/Loss (Raw)": 0.9422170519828796, "Finetune/Step": 179, "Finetune/Step Time": 2.9521403070539236} +{"Finetune/Learning Rate": 1.9997963034106032e-05, "Finetune/Loss": 0.8984349966049194, "Finetune/Loss (Raw)": 0.9158113598823547, "Finetune/Step": 180, "Finetune/Step Time": 2.9547903072088957} +{"Finetune/Learning Rate": 1.999782950215095e-05, "Finetune/Loss": 0.8988125324249268, "Finetune/Loss (Raw)": 0.9973911046981812, "Finetune/Step": 181, "Finetune/Step Time": 2.954090289771557} +{"Finetune/Learning Rate": 1.9997691731709207e-05, "Finetune/Loss": 0.896539032459259, "Finetune/Loss (Raw)": 0.6384431719779968, "Finetune/Step": 182, "Finetune/Step Time": 2.9547316934913397} +{"Finetune/Learning Rate": 1.9997549722839205e-05, "Finetune/Loss": 0.8961107134819031, "Finetune/Loss (Raw)": 0.9275426864624023, "Finetune/Step": 183, "Finetune/Step Time": 2.954938430339098} +{"Finetune/Learning Rate": 1.999740347560115e-05, "Finetune/Loss": 0.8945443630218506, "Finetune/Loss (Raw)": 0.8585623502731323, "Finetune/Step": 184, "Finetune/Step Time": 2.9552886318415403} +{"Finetune/Learning Rate": 1.9997252990057047e-05, "Finetune/Loss": 0.8946375250816345, "Finetune/Loss (Raw)": 1.039876937866211, "Finetune/Step": 185, "Finetune/Step Time": 2.9551964718848467} +{"Finetune/Learning Rate": 1.9997098266270682e-05, "Finetune/Loss": 0.8991464972496033, "Finetune/Loss (Raw)": 0.9548107385635376, "Finetune/Step": 186, "Finetune/Step Time": 2.917347028851509} +{"Finetune/Learning Rate": 1.9996939304307657e-05, "Finetune/Loss": 0.8994000554084778, "Finetune/Loss (Raw)": 1.004326343536377, "Finetune/Step": 187, "Finetune/Step Time": 2.9133400041610003} +{"Finetune/Learning Rate": 1.9996776104235355e-05, "Finetune/Loss": 0.9022074341773987, "Finetune/Loss (Raw)": 1.0603183507919312, "Finetune/Step": 188, "Finetune/Step Time": 2.8908402901142836} +{"Finetune/Learning Rate": 1.9996608666122976e-05, "Finetune/Loss": 0.9068393111228943, "Finetune/Loss (Raw)": 0.8610617518424988, "Finetune/Step": 189, "Finetune/Step Time": 2.8535471949726343} +{"Finetune/Learning Rate": 1.9996436990041493e-05, "Finetune/Loss": 0.9064153432846069, "Finetune/Loss (Raw)": 0.9635728001594543, "Finetune/Step": 190, "Finetune/Step Time": 2.855487357825041} +{"Finetune/Learning Rate": 1.9996261076063688e-05, "Finetune/Loss": 0.9085860252380371, "Finetune/Loss (Raw)": 0.9082064628601074, "Finetune/Step": 191, "Finetune/Step Time": 2.8402029890567064} +{"Finetune/Learning Rate": 1.999608092426414e-05, "Finetune/Loss": 0.9090955853462219, "Finetune/Loss (Raw)": 1.026910424232483, "Finetune/Step": 192, "Finetune/Step Time": 2.8382966723293066} +{"Finetune/Learning Rate": 1.9995896534719223e-05, "Finetune/Loss": 0.9081454873085022, "Finetune/Loss (Raw)": 0.9081544280052185, "Finetune/Step": 193, "Finetune/Step Time": 2.839897843077779} +{"Finetune/Learning Rate": 1.9995707907507107e-05, "Finetune/Loss": 0.907340407371521, "Finetune/Loss (Raw)": 0.9042667150497437, "Finetune/Step": 194, "Finetune/Step Time": 2.839571399614215} +{"Finetune/Learning Rate": 1.9995515042707757e-05, "Finetune/Loss": 0.9064632058143616, "Finetune/Loss (Raw)": 0.9608423709869385, "Finetune/Step": 195, "Finetune/Step Time": 2.8391921930015087} +{"Finetune/Learning Rate": 1.999531794040294e-05, "Finetune/Loss": 0.9064263701438904, "Finetune/Loss (Raw)": 0.9491721391677856, "Finetune/Step": 196, "Finetune/Step Time": 2.840357104316354} +{"Finetune/Learning Rate": 1.999511660067621e-05, "Finetune/Loss": 0.9055448174476624, "Finetune/Loss (Raw)": 0.8717114925384521, "Finetune/Step": 197, "Finetune/Step Time": 2.8401751909404993} +{"Finetune/Learning Rate": 1.9994911023612928e-05, "Finetune/Loss": 0.910964846611023, "Finetune/Loss (Raw)": 1.0129287242889404, "Finetune/Step": 198, "Finetune/Step Time": 2.7984543181955814} +{"Finetune/Learning Rate": 1.9994701209300245e-05, "Finetune/Loss": 0.9086017608642578, "Finetune/Loss (Raw)": 0.667076826095581, "Finetune/Step": 199, "Finetune/Step Time": 2.8208233304321766} +{"Finetune/Learning Rate": 1.9994487157827108e-05, "Finetune/Loss": 0.9092544913291931, "Finetune/Loss (Raw)": 0.9697440266609192, "Finetune/Step": 200, "Finetune/Step Time": 2.8231644872576} +{"Finetune/Learning Rate": 1.9994268869284264e-05, "Finetune/Loss": 0.910863995552063, "Finetune/Loss (Raw)": 0.9850044250488281, "Finetune/Step": 201, "Finetune/Step Time": 2.801523180678487} +{"Finetune/Learning Rate": 1.9994046343764254e-05, "Finetune/Loss": 0.9102444648742676, "Finetune/Loss (Raw)": 0.9925016164779663, "Finetune/Step": 202, "Finetune/Step Time": 2.79650273732841} +{"Finetune/Learning Rate": 1.999381958136142e-05, "Finetune/Loss": 0.9107238054275513, "Finetune/Loss (Raw)": 1.0197566747665405, "Finetune/Step": 203, "Finetune/Step Time": 2.796425648033619} +{"Finetune/Learning Rate": 1.9993588582171886e-05, "Finetune/Loss": 0.9132417440414429, "Finetune/Loss (Raw)": 0.9473726749420166, "Finetune/Step": 204, "Finetune/Step Time": 2.7722268737852573} +{"Finetune/Learning Rate": 1.999335334629359e-05, "Finetune/Loss": 0.9131040573120117, "Finetune/Loss (Raw)": 0.9449008107185364, "Finetune/Step": 205, "Finetune/Step Time": 2.769761275500059} +{"Finetune/Learning Rate": 1.9993113873826252e-05, "Finetune/Loss": 0.9113222360610962, "Finetune/Loss (Raw)": 0.6994464993476868, "Finetune/Step": 206, "Finetune/Step Time": 2.79379253461957} +{"Finetune/Learning Rate": 1.99928701648714e-05, "Finetune/Loss": 0.909739077091217, "Finetune/Loss (Raw)": 0.8966311812400818, "Finetune/Step": 207, "Finetune/Step Time": 2.794583972543478} +{"Finetune/Learning Rate": 1.9992622219532352e-05, "Finetune/Loss": 0.9095609784126282, "Finetune/Loss (Raw)": 1.0365525484085083, "Finetune/Step": 208, "Finetune/Step Time": 2.7988353110849857} +{"Finetune/Learning Rate": 1.9992370037914218e-05, "Finetune/Loss": 0.9094005823135376, "Finetune/Loss (Raw)": 0.8667420744895935, "Finetune/Step": 209, "Finetune/Step Time": 2.800060721114278} +{"Finetune/Learning Rate": 1.999211362012391e-05, "Finetune/Loss": 0.9087574481964111, "Finetune/Loss (Raw)": 0.8517183065414429, "Finetune/Step": 210, "Finetune/Step Time": 2.8047026563435793} +{"Finetune/Learning Rate": 1.9991852966270134e-05, "Finetune/Loss": 0.908379077911377, "Finetune/Loss (Raw)": 0.9319533705711365, "Finetune/Step": 211, "Finetune/Step Time": 2.808035394176841} +{"Finetune/Learning Rate": 1.9991588076463393e-05, "Finetune/Loss": 0.9090510606765747, "Finetune/Loss (Raw)": 1.0653979778289795, "Finetune/Step": 212, "Finetune/Step Time": 2.809745190665126} +{"Finetune/Learning Rate": 1.999131895081598e-05, "Finetune/Loss": 0.908098578453064, "Finetune/Loss (Raw)": 0.8961434960365295, "Finetune/Step": 213, "Finetune/Step Time": 2.806267624720931} +{"Finetune/Learning Rate": 1.9991045589441997e-05, "Finetune/Loss": 0.908687949180603, "Finetune/Loss (Raw)": 1.005426287651062, "Finetune/Step": 214, "Finetune/Step Time": 2.804936809465289} +{"Finetune/Learning Rate": 1.999076799245732e-05, "Finetune/Loss": 0.9074921607971191, "Finetune/Loss (Raw)": 0.8388120532035828, "Finetune/Step": 215, "Finetune/Step Time": 2.805218042805791} +{"Finetune/Learning Rate": 1.9990486159979644e-05, "Finetune/Loss": 0.9076122045516968, "Finetune/Loss (Raw)": 0.9641364216804504, "Finetune/Step": 216, "Finetune/Step Time": 2.80532836727798} +{"Finetune/Learning Rate": 1.999020009212845e-05, "Finetune/Loss": 0.9072517156600952, "Finetune/Loss (Raw)": 0.9056463241577148, "Finetune/Step": 217, "Finetune/Step Time": 2.806768571957946} +{"Finetune/Learning Rate": 1.9989909789025005e-05, "Finetune/Loss": 0.9074903726577759, "Finetune/Loss (Raw)": 0.981605589389801, "Finetune/Step": 218, "Finetune/Step Time": 2.80781676620245} +{"Finetune/Learning Rate": 1.9989615250792392e-05, "Finetune/Loss": 0.9048625826835632, "Finetune/Loss (Raw)": 0.6064027547836304, "Finetune/Step": 219, "Finetune/Step Time": 2.8375983107835054} +{"Finetune/Learning Rate": 1.9989316477555467e-05, "Finetune/Loss": 0.9046213626861572, "Finetune/Loss (Raw)": 0.9367397427558899, "Finetune/Step": 220, "Finetune/Step Time": 2.843037437647581} +{"Finetune/Learning Rate": 1.9989013469440896e-05, "Finetune/Loss": 0.9053781628608704, "Finetune/Loss (Raw)": 0.9697095155715942, "Finetune/Step": 221, "Finetune/Step Time": 2.843483032658696} +{"Finetune/Learning Rate": 1.998870622657714e-05, "Finetune/Loss": 0.9048415422439575, "Finetune/Loss (Raw)": 0.9304037690162659, "Finetune/Step": 222, "Finetune/Step Time": 2.846357436850667} +{"Finetune/Learning Rate": 1.9988394749094448e-05, "Finetune/Loss": 0.9047360420227051, "Finetune/Loss (Raw)": 0.8842408061027527, "Finetune/Step": 223, "Finetune/Step Time": 2.8488342501223087} +{"Finetune/Learning Rate": 1.9988079037124866e-05, "Finetune/Loss": 0.9070606827735901, "Finetune/Loss (Raw)": 0.956445038318634, "Finetune/Step": 224, "Finetune/Step Time": 2.8209084812551737} +{"Finetune/Learning Rate": 1.998775909080224e-05, "Finetune/Loss": 0.9041423797607422, "Finetune/Loss (Raw)": 0.6216384768486023, "Finetune/Step": 225, "Finetune/Step Time": 2.845611421391368} +{"Finetune/Learning Rate": 1.998743491026221e-05, "Finetune/Loss": 0.9041234254837036, "Finetune/Loss (Raw)": 0.9256523251533508, "Finetune/Step": 226, "Finetune/Step Time": 2.849097114056349} +{"Finetune/Learning Rate": 1.9987106495642207e-05, "Finetune/Loss": 0.904617428779602, "Finetune/Loss (Raw)": 0.9767218232154846, "Finetune/Step": 227, "Finetune/Step Time": 2.848520625382662} +{"Finetune/Learning Rate": 1.9986773847081458e-05, "Finetune/Loss": 0.9084824919700623, "Finetune/Loss (Raw)": 0.9049871563911438, "Finetune/Step": 228, "Finetune/Step Time": 2.8200813736766577} +{"Finetune/Learning Rate": 1.9986436964720986e-05, "Finetune/Loss": 0.9082865715026855, "Finetune/Loss (Raw)": 0.8903974294662476, "Finetune/Step": 229, "Finetune/Step Time": 2.8227112721651793} +{"Finetune/Learning Rate": 1.9986095848703616e-05, "Finetune/Loss": 0.9081032276153564, "Finetune/Loss (Raw)": 0.9344038963317871, "Finetune/Step": 230, "Finetune/Step Time": 2.8215779326856136} +{"Finetune/Learning Rate": 1.9985750499173955e-05, "Finetune/Loss": 0.9077904224395752, "Finetune/Loss (Raw)": 0.936414361000061, "Finetune/Step": 231, "Finetune/Step Time": 2.821196911856532} +{"Finetune/Learning Rate": 1.998540091627841e-05, "Finetune/Loss": 0.9079227447509766, "Finetune/Loss (Raw)": 0.9193891882896423, "Finetune/Step": 232, "Finetune/Step Time": 2.8203802797943354} +{"Finetune/Learning Rate": 1.9985047100165188e-05, "Finetune/Loss": 0.9082962274551392, "Finetune/Loss (Raw)": 0.7037320137023926, "Finetune/Step": 233, "Finetune/Step Time": 2.8179223965853453} +{"Finetune/Learning Rate": 1.9984689050984277e-05, "Finetune/Loss": 0.9083128571510315, "Finetune/Loss (Raw)": 0.9444047808647156, "Finetune/Step": 234, "Finetune/Step Time": 2.813519161194563} +{"Finetune/Learning Rate": 1.9984326768887482e-05, "Finetune/Loss": 0.9065855741500854, "Finetune/Loss (Raw)": 0.7150647640228271, "Finetune/Step": 235, "Finetune/Step Time": 2.811097525060177} +{"Finetune/Learning Rate": 1.9983960254028377e-05, "Finetune/Loss": 0.908981204032898, "Finetune/Loss (Raw)": 0.972878098487854, "Finetune/Step": 236, "Finetune/Step Time": 2.7841055560857058} +{"Finetune/Learning Rate": 1.9983589506562348e-05, "Finetune/Loss": 0.9082309603691101, "Finetune/Loss (Raw)": 0.836794912815094, "Finetune/Step": 237, "Finetune/Step Time": 2.785600522533059} +{"Finetune/Learning Rate": 1.9983214526646574e-05, "Finetune/Loss": 0.908126711845398, "Finetune/Loss (Raw)": 0.8887200951576233, "Finetune/Step": 238, "Finetune/Step Time": 2.787697935476899} +{"Finetune/Learning Rate": 1.9982835314440013e-05, "Finetune/Loss": 0.9078961610794067, "Finetune/Loss (Raw)": 0.9277554750442505, "Finetune/Step": 239, "Finetune/Step Time": 2.7892865762114525} +{"Finetune/Learning Rate": 1.998245187010344e-05, "Finetune/Loss": 0.9084139466285706, "Finetune/Loss (Raw)": 0.9991790056228638, "Finetune/Step": 240, "Finetune/Step Time": 2.7895005084574223} +{"Finetune/Learning Rate": 1.9982064193799405e-05, "Finetune/Loss": 0.9080617427825928, "Finetune/Loss (Raw)": 0.9847898483276367, "Finetune/Step": 241, "Finetune/Step Time": 2.7927920036017895} +{"Finetune/Learning Rate": 1.9981672285692265e-05, "Finetune/Loss": 0.9075106978416443, "Finetune/Loss (Raw)": 0.8727607727050781, "Finetune/Step": 242, "Finetune/Step Time": 2.7966329101473093} +{"Finetune/Learning Rate": 1.9981276145948163e-05, "Finetune/Loss": 0.9079594612121582, "Finetune/Loss (Raw)": 0.9638976454734802, "Finetune/Step": 243, "Finetune/Step Time": 2.7923891991376877} +{"Finetune/Learning Rate": 1.9980875774735038e-05, "Finetune/Loss": 0.9066924452781677, "Finetune/Loss (Raw)": 0.6600176095962524, "Finetune/Step": 244, "Finetune/Step Time": 2.817142991349101} +{"Finetune/Learning Rate": 1.9980471172222625e-05, "Finetune/Loss": 0.9070224165916443, "Finetune/Loss (Raw)": 0.9301880598068237, "Finetune/Step": 245, "Finetune/Step Time": 2.8181199058890343} +{"Finetune/Learning Rate": 1.9980062338582452e-05, "Finetune/Loss": 0.9064623117446899, "Finetune/Loss (Raw)": 0.8592278957366943, "Finetune/Step": 246, "Finetune/Step Time": 2.8180122170597315} +{"Finetune/Learning Rate": 1.9979649273987838e-05, "Finetune/Loss": 0.9051147103309631, "Finetune/Loss (Raw)": 0.8693895936012268, "Finetune/Step": 247, "Finetune/Step Time": 2.8212523963302374} +{"Finetune/Learning Rate": 1.9979231978613896e-05, "Finetune/Loss": 0.9040387868881226, "Finetune/Loss (Raw)": 0.8315191268920898, "Finetune/Step": 248, "Finetune/Step Time": 2.829625580459833} +{"Finetune/Learning Rate": 1.9978810452637544e-05, "Finetune/Loss": 0.9026859402656555, "Finetune/Loss (Raw)": 0.7946940064430237, "Finetune/Step": 249, "Finetune/Step Time": 2.853142010048032} +{"Finetune/Learning Rate": 1.9978384696237475e-05, "Finetune/Loss": 0.90496826171875, "Finetune/Loss (Raw)": 0.7983158826828003, "Finetune/Step": 250, "Finetune/Step Time": 2.8308762703090906} +{"Finetune/Learning Rate": 1.9977954709594186e-05, "Finetune/Loss": 0.9044371843338013, "Finetune/Loss (Raw)": 0.888802170753479, "Finetune/Step": 251, "Finetune/Step Time": 2.8279461711645126} +{"Finetune/Learning Rate": 1.9977520492889974e-05, "Finetune/Loss": 0.9030333757400513, "Finetune/Loss (Raw)": 0.7165364027023315, "Finetune/Step": 252, "Finetune/Step Time": 2.8269402254372835} +{"Finetune/Learning Rate": 1.9977082046308907e-05, "Finetune/Loss": 0.9032979607582092, "Finetune/Loss (Raw)": 0.9517515301704407, "Finetune/Step": 253, "Finetune/Step Time": 2.8308205883949995} +{"Finetune/Learning Rate": 1.997663937003687e-05, "Finetune/Loss": 0.9019749760627747, "Finetune/Loss (Raw)": 0.8979575634002686, "Finetune/Step": 254, "Finetune/Step Time": 2.830827835947275} +{"Finetune/Learning Rate": 1.9976192464261528e-05, "Finetune/Loss": 0.9019734859466553, "Finetune/Loss (Raw)": 0.9156753420829773, "Finetune/Step": 255, "Finetune/Step Time": 2.8303944263607264} +{"Finetune/Learning Rate": 1.9975741329172346e-05, "Finetune/Loss": 0.9025543928146362, "Finetune/Loss (Raw)": 0.9559078812599182, "Finetune/Step": 256, "Finetune/Step Time": 2.8324761856347322} +{"Finetune/Learning Rate": 1.997528596496057e-05, "Finetune/Loss": 0.9016510248184204, "Finetune/Loss (Raw)": 0.8139870762825012, "Finetune/Step": 257, "Finetune/Step Time": 2.8378682620823383} +{"Finetune/Learning Rate": 1.997482637181926e-05, "Finetune/Loss": 0.900783896446228, "Finetune/Loss (Raw)": 0.7728762030601501, "Finetune/Step": 258, "Finetune/Step Time": 2.8393551502376795} +{"Finetune/Learning Rate": 1.997436254994325e-05, "Finetune/Loss": 0.9004050493240356, "Finetune/Loss (Raw)": 0.8773290514945984, "Finetune/Step": 259, "Finetune/Step Time": 2.8295150995254517} +{"Finetune/Learning Rate": 1.997389449952917e-05, "Finetune/Loss": 0.8988289833068848, "Finetune/Loss (Raw)": 0.750959038734436, "Finetune/Step": 260, "Finetune/Step Time": 2.827875290066004} +{"Finetune/Learning Rate": 1.9973422220775446e-05, "Finetune/Loss": 0.9012848138809204, "Finetune/Loss (Raw)": 0.8957884907722473, "Finetune/Step": 261, "Finetune/Step Time": 2.808358510956168} +{"Finetune/Learning Rate": 1.9972945713882298e-05, "Finetune/Loss": 0.9005042314529419, "Finetune/Loss (Raw)": 0.9202541708946228, "Finetune/Step": 262, "Finetune/Step Time": 2.8085108306258917} +{"Finetune/Learning Rate": 1.9972464979051743e-05, "Finetune/Loss": 0.9001702666282654, "Finetune/Loss (Raw)": 0.9165034294128418, "Finetune/Step": 263, "Finetune/Step Time": 2.8092174734920263} +{"Finetune/Learning Rate": 1.9971980016487574e-05, "Finetune/Loss": 0.8999385833740234, "Finetune/Loss (Raw)": 1.014986276626587, "Finetune/Step": 264, "Finetune/Step Time": 2.8062475956976414} +{"Finetune/Learning Rate": 1.9971490826395392e-05, "Finetune/Loss": 0.896979808807373, "Finetune/Loss (Raw)": 0.610826313495636, "Finetune/Step": 265, "Finetune/Step Time": 2.8316912800073624} +{"Finetune/Learning Rate": 1.9970997408982585e-05, "Finetune/Loss": 0.897385835647583, "Finetune/Loss (Raw)": 0.9924683570861816, "Finetune/Step": 266, "Finetune/Step Time": 2.833323512226343} +{"Finetune/Learning Rate": 1.9970499764458326e-05, "Finetune/Loss": 0.9004518985748291, "Finetune/Loss (Raw)": 0.9767423868179321, "Finetune/Step": 267, "Finetune/Step Time": 2.8114694580435753} +{"Finetune/Learning Rate": 1.9969997893033594e-05, "Finetune/Loss": 0.9005126953125, "Finetune/Loss (Raw)": 0.9674158692359924, "Finetune/Step": 268, "Finetune/Step Time": 2.8084323592483997} +{"Finetune/Learning Rate": 1.996949179492115e-05, "Finetune/Loss": 0.9008192420005798, "Finetune/Loss (Raw)": 0.9491398930549622, "Finetune/Step": 269, "Finetune/Step Time": 2.8101922180503607} +{"Finetune/Learning Rate": 1.9968981470335552e-05, "Finetune/Loss": 0.9007136821746826, "Finetune/Loss (Raw)": 0.7983847260475159, "Finetune/Step": 270, "Finetune/Step Time": 2.7878756504505873} +{"Finetune/Learning Rate": 1.9968466919493147e-05, "Finetune/Loss": 0.8999767303466797, "Finetune/Loss (Raw)": 0.8798660039901733, "Finetune/Step": 271, "Finetune/Step Time": 2.788102285936475} +{"Finetune/Learning Rate": 1.9967948142612065e-05, "Finetune/Loss": 0.8990734815597534, "Finetune/Loss (Raw)": 0.9105454087257385, "Finetune/Step": 272, "Finetune/Step Time": 2.789181334897876} +{"Finetune/Learning Rate": 1.996742513991225e-05, "Finetune/Loss": 0.8986698389053345, "Finetune/Loss (Raw)": 0.8412973880767822, "Finetune/Step": 273, "Finetune/Step Time": 2.7871250342577696} +{"Finetune/Learning Rate": 1.9966897911615417e-05, "Finetune/Loss": 0.898026168346405, "Finetune/Loss (Raw)": 0.9339650869369507, "Finetune/Step": 274, "Finetune/Step Time": 2.785980887711048} +{"Finetune/Learning Rate": 1.996636645794508e-05, "Finetune/Loss": 0.898235559463501, "Finetune/Loss (Raw)": 1.0232479572296143, "Finetune/Step": 275, "Finetune/Step Time": 2.785013098269701} +{"Finetune/Learning Rate": 1.9965830779126543e-05, "Finetune/Loss": 0.8996439576148987, "Finetune/Loss (Raw)": 1.0146290063858032, "Finetune/Step": 276, "Finetune/Step Time": 2.7820890191942453} +{"Finetune/Learning Rate": 1.9965290875386904e-05, "Finetune/Loss": 0.8969597816467285, "Finetune/Loss (Raw)": 0.5339549779891968, "Finetune/Step": 277, "Finetune/Step Time": 2.809581018984318} +{"Finetune/Learning Rate": 1.996474674695505e-05, "Finetune/Loss": 0.8961727023124695, "Finetune/Loss (Raw)": 0.8736966252326965, "Finetune/Step": 278, "Finetune/Step Time": 2.807266552001238} +{"Finetune/Learning Rate": 1.996419839406166e-05, "Finetune/Loss": 0.8957769870758057, "Finetune/Loss (Raw)": 0.8914942741394043, "Finetune/Step": 279, "Finetune/Step Time": 2.8071917295455933} +{"Finetune/Learning Rate": 1.99636458169392e-05, "Finetune/Loss": 0.8950045108795166, "Finetune/Loss (Raw)": 0.8703862428665161, "Finetune/Step": 280, "Finetune/Step Time": 2.807997714728117} +{"Finetune/Learning Rate": 1.9963089015821934e-05, "Finetune/Loss": 0.893856406211853, "Finetune/Loss (Raw)": 0.8107024431228638, "Finetune/Step": 281, "Finetune/Step Time": 2.8107317946851254} +{"Finetune/Learning Rate": 1.996252799094591e-05, "Finetune/Loss": 0.8931329846382141, "Finetune/Loss (Raw)": 0.879328191280365, "Finetune/Step": 282, "Finetune/Step Time": 2.811747867614031} +{"Finetune/Learning Rate": 1.9961962742548966e-05, "Finetune/Loss": 0.8933786749839783, "Finetune/Loss (Raw)": 1.0348292589187622, "Finetune/Step": 283, "Finetune/Step Time": 2.8127301558852196} +{"Finetune/Learning Rate": 1.9961393270870738e-05, "Finetune/Loss": 0.895696759223938, "Finetune/Loss (Raw)": 0.8953426480293274, "Finetune/Step": 284, "Finetune/Step Time": 2.79347375407815} +{"Finetune/Learning Rate": 1.9960819576152653e-05, "Finetune/Loss": 0.8953344821929932, "Finetune/Loss (Raw)": 0.8468558192253113, "Finetune/Step": 285, "Finetune/Step Time": 2.794562090188265} +{"Finetune/Learning Rate": 1.9960241658637917e-05, "Finetune/Loss": 0.8960244655609131, "Finetune/Loss (Raw)": 0.9524030685424805, "Finetune/Step": 286, "Finetune/Step Time": 2.797174960374832} +{"Finetune/Learning Rate": 1.9959659518571527e-05, "Finetune/Loss": 0.894686222076416, "Finetune/Loss (Raw)": 0.8310865163803101, "Finetune/Step": 287, "Finetune/Step Time": 2.796409025788307} +{"Finetune/Learning Rate": 1.995907315620029e-05, "Finetune/Loss": 0.8953456878662109, "Finetune/Loss (Raw)": 0.9641002416610718, "Finetune/Step": 288, "Finetune/Step Time": 2.795294551178813} +{"Finetune/Learning Rate": 1.995848257177278e-05, "Finetune/Loss": 0.8949370384216309, "Finetune/Loss (Raw)": 0.8922494649887085, "Finetune/Step": 289, "Finetune/Step Time": 2.794205540791154} +{"Finetune/Learning Rate": 1.995788776553937e-05, "Finetune/Loss": 0.8926520347595215, "Finetune/Loss (Raw)": 0.5993216037750244, "Finetune/Step": 290, "Finetune/Step Time": 2.818232409656048} +{"Finetune/Learning Rate": 1.9957288737752226e-05, "Finetune/Loss": 0.8928117752075195, "Finetune/Loss (Raw)": 0.988322913646698, "Finetune/Step": 291, "Finetune/Step Time": 2.82276514172554} +{"Finetune/Learning Rate": 1.99566854886653e-05, "Finetune/Loss": 0.8897308111190796, "Finetune/Loss (Raw)": 0.45845744013786316, "Finetune/Step": 292, "Finetune/Step Time": 2.8502258770167828} +{"Finetune/Learning Rate": 1.9956078018534328e-05, "Finetune/Loss": 0.8897813558578491, "Finetune/Loss (Raw)": 0.9110357165336609, "Finetune/Step": 293, "Finetune/Step Time": 2.8528468124568462} +{"Finetune/Learning Rate": 1.9955466327616846e-05, "Finetune/Loss": 0.8894215822219849, "Finetune/Loss (Raw)": 0.9722986817359924, "Finetune/Step": 294, "Finetune/Step Time": 2.850859496742487} +{"Finetune/Learning Rate": 1.9954850416172177e-05, "Finetune/Loss": 0.8908963203430176, "Finetune/Loss (Raw)": 1.0398221015930176, "Finetune/Step": 295, "Finetune/Step Time": 2.8514441177248955} +{"Finetune/Learning Rate": 1.9954230284461428e-05, "Finetune/Loss": 0.8907403945922852, "Finetune/Loss (Raw)": 0.920900821685791, "Finetune/Step": 296, "Finetune/Step Time": 2.851667134091258} +{"Finetune/Learning Rate": 1.9953605932747493e-05, "Finetune/Loss": 0.8914339542388916, "Finetune/Loss (Raw)": 0.9364654421806335, "Finetune/Step": 297, "Finetune/Step Time": 2.850635202601552} +{"Finetune/Learning Rate": 1.995297736129507e-05, "Finetune/Loss": 0.8896560072898865, "Finetune/Loss (Raw)": 0.6176515817642212, "Finetune/Step": 298, "Finetune/Step Time": 2.8770044557750225} +{"Finetune/Learning Rate": 1.995234457037063e-05, "Finetune/Loss": 0.8891932964324951, "Finetune/Loss (Raw)": 0.8488042950630188, "Finetune/Step": 299, "Finetune/Step Time": 2.87572243437171} +{"Finetune/Learning Rate": 1.9951707560242438e-05, "Finetune/Loss": 0.8895769119262695, "Finetune/Loss (Raw)": 0.9664296507835388, "Finetune/Step": 300, "Finetune/Step Time": 2.8744174782186747} +{"Finetune/Learning Rate": 1.9951066331180555e-05, "Finetune/Loss": 0.8899749517440796, "Finetune/Loss (Raw)": 0.9531359672546387, "Finetune/Step": 301, "Finetune/Step Time": 2.875287188217044} +{"Finetune/Learning Rate": 1.9950420883456813e-05, "Finetune/Loss": 0.8887118101119995, "Finetune/Loss (Raw)": 0.8187867403030396, "Finetune/Step": 302, "Finetune/Step Time": 2.8755610771477222} +{"Finetune/Learning Rate": 1.9949771217344853e-05, "Finetune/Loss": 0.8914625644683838, "Finetune/Loss (Raw)": 0.9692900776863098, "Finetune/Step": 303, "Finetune/Step Time": 2.8512257412075996} +{"Finetune/Learning Rate": 1.9949117333120096e-05, "Finetune/Loss": 0.890626847743988, "Finetune/Loss (Raw)": 0.8558210730552673, "Finetune/Step": 304, "Finetune/Step Time": 2.864104676991701} +{"Finetune/Learning Rate": 1.994845923105974e-05, "Finetune/Loss": 0.892865777015686, "Finetune/Loss (Raw)": 0.9059956669807434, "Finetune/Step": 305, "Finetune/Step Time": 2.8454568665474653} +{"Finetune/Learning Rate": 1.994779691144279e-05, "Finetune/Loss": 0.8919821977615356, "Finetune/Loss (Raw)": 0.8273431062698364, "Finetune/Step": 306, "Finetune/Step Time": 2.8440458551049232} +{"Finetune/Learning Rate": 1.994713037455003e-05, "Finetune/Loss": 0.891252875328064, "Finetune/Loss (Raw)": 0.8488600254058838, "Finetune/Step": 307, "Finetune/Step Time": 2.8447466287761927} +{"Finetune/Learning Rate": 1.9946459620664026e-05, "Finetune/Loss": 0.8909287452697754, "Finetune/Loss (Raw)": 0.8743211627006531, "Finetune/Step": 308, "Finetune/Step Time": 2.843961277976632} +{"Finetune/Learning Rate": 1.9945784650069145e-05, "Finetune/Loss": 0.889403223991394, "Finetune/Loss (Raw)": 0.8021250367164612, "Finetune/Step": 309, "Finetune/Step Time": 2.8425813633948565} +{"Finetune/Learning Rate": 1.994510546305153e-05, "Finetune/Loss": 0.891823410987854, "Finetune/Loss (Raw)": 0.9482272267341614, "Finetune/Step": 310, "Finetune/Step Time": 2.818776184692979} +{"Finetune/Learning Rate": 1.9944422059899116e-05, "Finetune/Loss": 0.8920689225196838, "Finetune/Loss (Raw)": 0.9589657783508301, "Finetune/Step": 311, "Finetune/Step Time": 2.8192380256950855} +{"Finetune/Learning Rate": 1.9943734440901625e-05, "Finetune/Loss": 0.8926369547843933, "Finetune/Loss (Raw)": 0.9312710762023926, "Finetune/Step": 312, "Finetune/Step Time": 2.818748692050576} +{"Finetune/Learning Rate": 1.9943042606350572e-05, "Finetune/Loss": 0.8926239013671875, "Finetune/Loss (Raw)": 1.0382075309753418, "Finetune/Step": 313, "Finetune/Step Time": 2.820219047367573} +{"Finetune/Learning Rate": 1.9942346556539247e-05, "Finetune/Loss": 0.8922764658927917, "Finetune/Loss (Raw)": 0.9103420376777649, "Finetune/Step": 314, "Finetune/Step Time": 2.8195895589888096} +{"Finetune/Learning Rate": 1.9941646291762736e-05, "Finetune/Loss": 0.8904685974121094, "Finetune/Loss (Raw)": 0.7729124426841736, "Finetune/Step": 315, "Finetune/Step Time": 2.817781303077936} +{"Finetune/Learning Rate": 1.9940941812317915e-05, "Finetune/Loss": 0.8898148536682129, "Finetune/Loss (Raw)": 0.9766444563865662, "Finetune/Step": 316, "Finetune/Step Time": 2.816730571910739} +{"Finetune/Learning Rate": 1.9940233118503433e-05, "Finetune/Loss": 0.8901566863059998, "Finetune/Loss (Raw)": 0.9048174619674683, "Finetune/Step": 317, "Finetune/Step Time": 2.8193773832172155} +{"Finetune/Learning Rate": 1.993952021061974e-05, "Finetune/Loss": 0.8898036479949951, "Finetune/Loss (Raw)": 0.9183805584907532, "Finetune/Step": 318, "Finetune/Step Time": 2.822980547323823} +{"Finetune/Learning Rate": 1.9938803088969062e-05, "Finetune/Loss": 0.8888430595397949, "Finetune/Loss (Raw)": 0.7852482199668884, "Finetune/Step": 319, "Finetune/Step Time": 2.811050295829773} +{"Finetune/Learning Rate": 1.9938081753855423e-05, "Finetune/Loss": 0.8890836238861084, "Finetune/Loss (Raw)": 1.0577081441879272, "Finetune/Step": 320, "Finetune/Step Time": 2.8130852915346622} +{"Finetune/Learning Rate": 1.9937356205584623e-05, "Finetune/Loss": 0.888843834400177, "Finetune/Loss (Raw)": 0.8774617314338684, "Finetune/Step": 321, "Finetune/Step Time": 2.8132814280688763} +{"Finetune/Learning Rate": 1.9936626444464245e-05, "Finetune/Loss": 0.8891576528549194, "Finetune/Loss (Raw)": 0.9444333910942078, "Finetune/Step": 322, "Finetune/Step Time": 2.8133379705250263} +{"Finetune/Learning Rate": 1.993589247080367e-05, "Finetune/Loss": 0.8871690630912781, "Finetune/Loss (Raw)": 0.7063040733337402, "Finetune/Step": 323, "Finetune/Step Time": 2.8358039651066065} +{"Finetune/Learning Rate": 1.9935154284914063e-05, "Finetune/Loss": 0.8868495225906372, "Finetune/Loss (Raw)": 0.9082693457603455, "Finetune/Step": 324, "Finetune/Step Time": 2.8395312186330557} +{"Finetune/Learning Rate": 1.9934411887108367e-05, "Finetune/Loss": 0.8878370523452759, "Finetune/Loss (Raw)": 0.9981158375740051, "Finetune/Step": 325, "Finetune/Step Time": 2.836117956787348} +{"Finetune/Learning Rate": 1.9933665277701317e-05, "Finetune/Loss": 0.8877012729644775, "Finetune/Loss (Raw)": 0.9955416917800903, "Finetune/Step": 326, "Finetune/Step Time": 2.8357409853488207} +{"Finetune/Learning Rate": 1.9932914457009425e-05, "Finetune/Loss": 0.8891004323959351, "Finetune/Loss (Raw)": 0.8461746573448181, "Finetune/Step": 327, "Finetune/Step Time": 2.8121060375124216} +{"Finetune/Learning Rate": 1.9932159425351e-05, "Finetune/Loss": 0.8892125487327576, "Finetune/Loss (Raw)": 0.9840969443321228, "Finetune/Step": 328, "Finetune/Step Time": 2.8134037144482136} +{"Finetune/Learning Rate": 1.993140018304613e-05, "Finetune/Loss": 0.8893750905990601, "Finetune/Loss (Raw)": 1.0058099031448364, "Finetune/Step": 329, "Finetune/Step Time": 2.816612560302019} +{"Finetune/Learning Rate": 1.9930636730416687e-05, "Finetune/Loss": 0.8888223171234131, "Finetune/Loss (Raw)": 0.9217467308044434, "Finetune/Step": 330, "Finetune/Step Time": 2.8212603759020567} +{"Finetune/Learning Rate": 1.9929869067786328e-05, "Finetune/Loss": 0.8874253034591675, "Finetune/Loss (Raw)": 0.8409437537193298, "Finetune/Step": 331, "Finetune/Step Time": 2.822239350527525} +{"Finetune/Learning Rate": 1.9929097195480504e-05, "Finetune/Loss": 0.8869553804397583, "Finetune/Loss (Raw)": 0.8872143626213074, "Finetune/Step": 332, "Finetune/Step Time": 2.821600928902626} +{"Finetune/Learning Rate": 1.9928321113826433e-05, "Finetune/Loss": 0.8868651986122131, "Finetune/Loss (Raw)": 0.933362603187561, "Finetune/Step": 333, "Finetune/Step Time": 2.8220263570547104} +{"Finetune/Learning Rate": 1.9927540823153135e-05, "Finetune/Loss": 0.889182448387146, "Finetune/Loss (Raw)": 0.9960430860519409, "Finetune/Step": 334, "Finetune/Step Time": 2.79909485951066} +{"Finetune/Learning Rate": 1.9926756323791405e-05, "Finetune/Loss": 0.8887485861778259, "Finetune/Loss (Raw)": 0.841106653213501, "Finetune/Step": 335, "Finetune/Step Time": 2.79852064140141} +{"Finetune/Learning Rate": 1.9925967616073824e-05, "Finetune/Loss": 0.8847596645355225, "Finetune/Loss (Raw)": 0.5259698033332825, "Finetune/Step": 336, "Finetune/Step Time": 2.81812528334558} +{"Finetune/Learning Rate": 1.9925174700334758e-05, "Finetune/Loss": 0.8849141597747803, "Finetune/Loss (Raw)": 0.8865146040916443, "Finetune/Step": 337, "Finetune/Step Time": 2.8173415772616863} +{"Finetune/Learning Rate": 1.992437757691035e-05, "Finetune/Loss": 0.8854110240936279, "Finetune/Loss (Raw)": 0.9153169393539429, "Finetune/Step": 338, "Finetune/Step Time": 2.8129163961857557} +{"Finetune/Learning Rate": 1.9923576246138543e-05, "Finetune/Loss": 0.8860555291175842, "Finetune/Loss (Raw)": 1.0144548416137695, "Finetune/Step": 339, "Finetune/Step Time": 2.8381201699376106} +{"Finetune/Learning Rate": 1.9922770708359047e-05, "Finetune/Loss": 0.8856025338172913, "Finetune/Loss (Raw)": 1.0074137449264526, "Finetune/Step": 340, "Finetune/Step Time": 2.8362217601388693} +{"Finetune/Learning Rate": 1.9921960963913364e-05, "Finetune/Loss": 0.8865347504615784, "Finetune/Loss (Raw)": 1.0154659748077393, "Finetune/Step": 341, "Finetune/Step Time": 2.836067270487547} +{"Finetune/Learning Rate": 1.9921147013144782e-05, "Finetune/Loss": 0.8853425979614258, "Finetune/Loss (Raw)": 0.8528230786323547, "Finetune/Step": 342, "Finetune/Step Time": 2.8387842755764723} +{"Finetune/Learning Rate": 1.992032885639836e-05, "Finetune/Loss": 0.8859506845474243, "Finetune/Loss (Raw)": 0.916650652885437, "Finetune/Step": 343, "Finetune/Step Time": 2.84293001703918} +{"Finetune/Learning Rate": 1.991950649402095e-05, "Finetune/Loss": 0.8847283124923706, "Finetune/Loss (Raw)": 0.8076806664466858, "Finetune/Step": 344, "Finetune/Step Time": 2.844118934124708} +{"Finetune/Learning Rate": 1.991867992636119e-05, "Finetune/Loss": 0.881507396697998, "Finetune/Loss (Raw)": 0.4933627247810364, "Finetune/Step": 345, "Finetune/Step Time": 2.868336170911789} +{"Finetune/Learning Rate": 1.9917849153769492e-05, "Finetune/Loss": 0.8803854584693909, "Finetune/Loss (Raw)": 0.8379981517791748, "Finetune/Step": 346, "Finetune/Step Time": 2.865577396005392} +{"Finetune/Learning Rate": 1.991701417659805e-05, "Finetune/Loss": 0.8804630041122437, "Finetune/Loss (Raw)": 0.616333544254303, "Finetune/Step": 347, "Finetune/Step Time": 2.8584188371896744} +{"Finetune/Learning Rate": 1.9916174995200853e-05, "Finetune/Loss": 0.880531907081604, "Finetune/Loss (Raw)": 0.9455564618110657, "Finetune/Step": 348, "Finetune/Step Time": 2.8544850163161755} +{"Finetune/Learning Rate": 1.991533160993366e-05, "Finetune/Loss": 0.8798302412033081, "Finetune/Loss (Raw)": 0.8798951506614685, "Finetune/Step": 349, "Finetune/Step Time": 2.854291031137109} +{"Finetune/Learning Rate": 1.9914484021154018e-05, "Finetune/Loss": 0.8789834976196289, "Finetune/Loss (Raw)": 0.822016716003418, "Finetune/Step": 350, "Finetune/Step Time": 2.849848072975874} +{"Finetune/Learning Rate": 1.991363222922125e-05, "Finetune/Loss": 0.8791249394416809, "Finetune/Loss (Raw)": 0.9023500680923462, "Finetune/Step": 351, "Finetune/Step Time": 2.846730435267091} +{"Finetune/Learning Rate": 1.9912776234496468e-05, "Finetune/Loss": 0.8783391714096069, "Finetune/Loss (Raw)": 0.8558602929115295, "Finetune/Step": 352, "Finetune/Step Time": 2.8500681817531586} +{"Finetune/Learning Rate": 1.9911916037342568e-05, "Finetune/Loss": 0.8810100555419922, "Finetune/Loss (Raw)": 0.9635156393051147, "Finetune/Step": 353, "Finetune/Step Time": 2.824684439226985} +{"Finetune/Learning Rate": 1.9911051638124213e-05, "Finetune/Loss": 0.8807111382484436, "Finetune/Loss (Raw)": 0.8873904943466187, "Finetune/Step": 354, "Finetune/Step Time": 2.821441937237978} +{"Finetune/Learning Rate": 1.9910183037207865e-05, "Finetune/Loss": 0.8801702260971069, "Finetune/Loss (Raw)": 0.907489001750946, "Finetune/Step": 355, "Finetune/Step Time": 2.8221805207431316} +{"Finetune/Learning Rate": 1.9909310234961752e-05, "Finetune/Loss": 0.880136251449585, "Finetune/Loss (Raw)": 0.9006317853927612, "Finetune/Step": 356, "Finetune/Step Time": 2.827527714893222} +{"Finetune/Learning Rate": 1.99084332317559e-05, "Finetune/Loss": 0.8795801401138306, "Finetune/Loss (Raw)": 0.8192116022109985, "Finetune/Step": 357, "Finetune/Step Time": 2.82359485514462} +{"Finetune/Learning Rate": 1.9907552027962097e-05, "Finetune/Loss": 0.8793503642082214, "Finetune/Loss (Raw)": 0.9049986004829407, "Finetune/Step": 358, "Finetune/Step Time": 2.827288782224059} +{"Finetune/Learning Rate": 1.9906666623953926e-05, "Finetune/Loss": 0.8799862861633301, "Finetune/Loss (Raw)": 1.0178142786026, "Finetune/Step": 359, "Finetune/Step Time": 2.8251051045954227} +{"Finetune/Learning Rate": 1.9905777020106745e-05, "Finetune/Loss": 0.8797197341918945, "Finetune/Loss (Raw)": 0.8852635622024536, "Finetune/Step": 360, "Finetune/Step Time": 2.8380559012293816} +{"Finetune/Learning Rate": 1.9904883216797693e-05, "Finetune/Loss": 0.8813982605934143, "Finetune/Loss (Raw)": 0.9185880422592163, "Finetune/Step": 361, "Finetune/Step Time": 2.8130411822348833} +{"Finetune/Learning Rate": 1.990398521440569e-05, "Finetune/Loss": 0.8789708614349365, "Finetune/Loss (Raw)": 0.6336981654167175, "Finetune/Step": 362, "Finetune/Step Time": 2.840907085686922} +{"Finetune/Learning Rate": 1.9903083013311434e-05, "Finetune/Loss": 0.8767421245574951, "Finetune/Loss (Raw)": 0.42978981137275696, "Finetune/Step": 363, "Finetune/Step Time": 2.8717814050614834} +{"Finetune/Learning Rate": 1.990217661389741e-05, "Finetune/Loss": 0.8759446144104004, "Finetune/Loss (Raw)": 0.8707976937294006, "Finetune/Step": 364, "Finetune/Step Time": 2.869273705407977} +{"Finetune/Learning Rate": 1.9901266016547865e-05, "Finetune/Loss": 0.8765497207641602, "Finetune/Loss (Raw)": 0.9142424464225769, "Finetune/Step": 365, "Finetune/Step Time": 2.8694314770400524} +{"Finetune/Learning Rate": 1.9900351221648854e-05, "Finetune/Loss": 0.8765599131584167, "Finetune/Loss (Raw)": 0.8900265097618103, "Finetune/Step": 366, "Finetune/Step Time": 2.8675874266773462} +{"Finetune/Learning Rate": 1.9899432229588188e-05, "Finetune/Loss": 0.8758180737495422, "Finetune/Loss (Raw)": 0.8328007459640503, "Finetune/Step": 367, "Finetune/Step Time": 2.868604715913534} +{"Finetune/Learning Rate": 1.989850904075547e-05, "Finetune/Loss": 0.874901533126831, "Finetune/Loss (Raw)": 0.8818589448928833, "Finetune/Step": 368, "Finetune/Step Time": 2.8673097789287567} +{"Finetune/Learning Rate": 1.9897581655542063e-05, "Finetune/Loss": 0.8735601902008057, "Finetune/Loss (Raw)": 0.8130999207496643, "Finetune/Step": 369, "Finetune/Step Time": 2.8660166542977095} +{"Finetune/Learning Rate": 1.989665007434114e-05, "Finetune/Loss": 0.8736168742179871, "Finetune/Loss (Raw)": 0.8800138831138611, "Finetune/Step": 370, "Finetune/Step Time": 2.864717870950699} +{"Finetune/Learning Rate": 1.989571429754763e-05, "Finetune/Loss": 0.8727743625640869, "Finetune/Loss (Raw)": 0.8560581207275391, "Finetune/Step": 371, "Finetune/Step Time": 2.8611404579132795} +{"Finetune/Learning Rate": 1.9894774325558245e-05, "Finetune/Loss": 0.875008761882782, "Finetune/Loss (Raw)": 0.94601970911026, "Finetune/Step": 372, "Finetune/Step Time": 2.8369831293821335} +{"Finetune/Learning Rate": 1.989383015877148e-05, "Finetune/Loss": 0.8758809566497803, "Finetune/Loss (Raw)": 1.0418306589126587, "Finetune/Step": 373, "Finetune/Step Time": 2.837437704205513} +{"Finetune/Learning Rate": 1.98928817975876e-05, "Finetune/Loss": 0.8764781951904297, "Finetune/Loss (Raw)": 0.9356762766838074, "Finetune/Step": 374, "Finetune/Step Time": 2.839862322434783} +{"Finetune/Learning Rate": 1.9891929242408664e-05, "Finetune/Loss": 0.876640260219574, "Finetune/Loss (Raw)": 0.8901365995407104, "Finetune/Step": 375, "Finetune/Step Time": 2.838171871379018} +{"Finetune/Learning Rate": 1.989097249363849e-05, "Finetune/Loss": 0.8768168687820435, "Finetune/Loss (Raw)": 0.8541171550750732, "Finetune/Step": 376, "Finetune/Step Time": 2.828345784917474} +{"Finetune/Learning Rate": 1.9890011551682687e-05, "Finetune/Loss": 0.8773017525672913, "Finetune/Loss (Raw)": 0.8567613959312439, "Finetune/Step": 377, "Finetune/Step Time": 2.8065970335155725} +{"Finetune/Learning Rate": 1.988904641694864e-05, "Finetune/Loss": 0.8778021931648254, "Finetune/Loss (Raw)": 0.862372875213623, "Finetune/Step": 378, "Finetune/Step Time": 2.80534709058702} +{"Finetune/Learning Rate": 1.98880770898455e-05, "Finetune/Loss": 0.8779374361038208, "Finetune/Loss (Raw)": 0.9061116576194763, "Finetune/Step": 379, "Finetune/Step Time": 2.8087284304201603} +{"Finetune/Learning Rate": 1.9887103570784213e-05, "Finetune/Loss": 0.8802498579025269, "Finetune/Loss (Raw)": 1.0125356912612915, "Finetune/Step": 380, "Finetune/Step Time": 2.8058957643806934} +{"Finetune/Learning Rate": 1.9886125860177487e-05, "Finetune/Loss": 0.8794596791267395, "Finetune/Loss (Raw)": 0.85060054063797, "Finetune/Step": 381, "Finetune/Step Time": 2.8060785606503487} +{"Finetune/Learning Rate": 1.9885143958439818e-05, "Finetune/Loss": 0.8793697953224182, "Finetune/Loss (Raw)": 0.8864550590515137, "Finetune/Step": 382, "Finetune/Step Time": 2.8080613054335117} +{"Finetune/Learning Rate": 1.9884157865987472e-05, "Finetune/Loss": 0.8793379664421082, "Finetune/Loss (Raw)": 0.9116016030311584, "Finetune/Step": 383, "Finetune/Step Time": 2.8093662541359663} +{"Finetune/Learning Rate": 1.9883167583238494e-05, "Finetune/Loss": 0.8783692121505737, "Finetune/Loss (Raw)": 0.8319089412689209, "Finetune/Step": 384, "Finetune/Step Time": 2.8132372722029686} +{"Finetune/Learning Rate": 1.9882173110612705e-05, "Finetune/Loss": 0.8791224956512451, "Finetune/Loss (Raw)": 0.9103991985321045, "Finetune/Step": 385, "Finetune/Step Time": 2.8145594522356987} +{"Finetune/Learning Rate": 1.9881174448531705e-05, "Finetune/Loss": 0.8798994421958923, "Finetune/Loss (Raw)": 0.872331440448761, "Finetune/Step": 386, "Finetune/Step Time": 2.8151312861591578} +{"Finetune/Learning Rate": 1.988017159741886e-05, "Finetune/Loss": 0.8800060749053955, "Finetune/Loss (Raw)": 0.8909801244735718, "Finetune/Step": 387, "Finetune/Step Time": 2.8158636186271906} +{"Finetune/Learning Rate": 1.987916455769933e-05, "Finetune/Loss": 0.8814871311187744, "Finetune/Loss (Raw)": 0.9405331611633301, "Finetune/Step": 388, "Finetune/Step Time": 2.8162828758358955} +{"Finetune/Learning Rate": 1.987815332980003e-05, "Finetune/Loss": 0.8808785676956177, "Finetune/Loss (Raw)": 0.8178936243057251, "Finetune/Step": 389, "Finetune/Step Time": 2.8165215589106083} +{"Finetune/Learning Rate": 1.9877137914149664e-05, "Finetune/Loss": 0.8804309368133545, "Finetune/Loss (Raw)": 0.8629552721977234, "Finetune/Step": 390, "Finetune/Step Time": 2.8139328453689814} +{"Finetune/Learning Rate": 1.9876118311178712e-05, "Finetune/Loss": 0.8802734613418579, "Finetune/Loss (Raw)": 0.8963497281074524, "Finetune/Step": 391, "Finetune/Step Time": 2.8170116804540157} +{"Finetune/Learning Rate": 1.9875094521319423e-05, "Finetune/Loss": 0.8798282742500305, "Finetune/Loss (Raw)": 0.9579985737800598, "Finetune/Step": 392, "Finetune/Step Time": 2.8153996001929045} +{"Finetune/Learning Rate": 1.9874066545005823e-05, "Finetune/Loss": 0.8817765712738037, "Finetune/Loss (Raw)": 0.8602069020271301, "Finetune/Step": 393, "Finetune/Step Time": 2.7883451152592897} +{"Finetune/Learning Rate": 1.987303438267371e-05, "Finetune/Loss": 0.878460705280304, "Finetune/Loss (Raw)": 0.5680406093597412, "Finetune/Step": 394, "Finetune/Step Time": 2.8103909641504288} +{"Finetune/Learning Rate": 1.9871998034760663e-05, "Finetune/Loss": 0.878153920173645, "Finetune/Loss (Raw)": 0.9374735951423645, "Finetune/Step": 395, "Finetune/Step Time": 2.8106549959629774} +{"Finetune/Learning Rate": 1.9870957501706033e-05, "Finetune/Loss": 0.8777674436569214, "Finetune/Loss (Raw)": 0.9179520010948181, "Finetune/Step": 396, "Finetune/Step Time": 2.8130796123296022} +{"Finetune/Learning Rate": 1.986991278395094e-05, "Finetune/Loss": 0.877717137336731, "Finetune/Loss (Raw)": 0.9426929950714111, "Finetune/Step": 397, "Finetune/Step Time": 2.8102569971233606} +{"Finetune/Learning Rate": 1.9868863881938285e-05, "Finetune/Loss": 0.8798263669013977, "Finetune/Loss (Raw)": 1.068371057510376, "Finetune/Step": 398, "Finetune/Step Time": 2.812410721555352} +{"Finetune/Learning Rate": 1.9867810796112742e-05, "Finetune/Loss": 0.8791590929031372, "Finetune/Loss (Raw)": 0.79444819688797, "Finetune/Step": 399, "Finetune/Step Time": 2.8123880587518215} +{"Finetune/Learning Rate": 1.9866753526920754e-05, "Finetune/Loss": 0.8794145584106445, "Finetune/Loss (Raw)": 0.943254292011261, "Finetune/Step": 400, "Finetune/Step Time": 2.815810615196824} +{"Finetune/Learning Rate": 1.986569207481054e-05, "Finetune/Loss": 0.8798243403434753, "Finetune/Loss (Raw)": 0.8937435150146484, "Finetune/Step": 401, "Finetune/Step Time": 2.815389048308134} +{"Finetune/Learning Rate": 1.9864626440232097e-05, "Finetune/Loss": 0.8799515962600708, "Finetune/Loss (Raw)": 0.9502525925636292, "Finetune/Step": 402, "Finetune/Step Time": 2.8174398448318243} +{"Finetune/Learning Rate": 1.9863556623637183e-05, "Finetune/Loss": 0.8792901039123535, "Finetune/Loss (Raw)": 0.9385724067687988, "Finetune/Step": 403, "Finetune/Step Time": 2.8175761606544256} +{"Finetune/Learning Rate": 1.9862482625479346e-05, "Finetune/Loss": 0.8787062764167786, "Finetune/Loss (Raw)": 0.9399096965789795, "Finetune/Step": 404, "Finetune/Step Time": 2.819171652197838} +{"Finetune/Learning Rate": 1.986140444621389e-05, "Finetune/Loss": 0.8818565607070923, "Finetune/Loss (Raw)": 0.9371812343597412, "Finetune/Step": 405, "Finetune/Step Time": 2.79351819306612} +{"Finetune/Learning Rate": 1.9860322086297906e-05, "Finetune/Loss": 0.8815748691558838, "Finetune/Loss (Raw)": 0.837645947933197, "Finetune/Step": 406, "Finetune/Step Time": 2.7927111964672804} +{"Finetune/Learning Rate": 1.9859235546190246e-05, "Finetune/Loss": 0.881161093711853, "Finetune/Loss (Raw)": 0.838528573513031, "Finetune/Step": 407, "Finetune/Step Time": 2.791991278529167} +{"Finetune/Learning Rate": 1.9858144826351536e-05, "Finetune/Loss": 0.8809101581573486, "Finetune/Loss (Raw)": 0.8382737040519714, "Finetune/Step": 408, "Finetune/Step Time": 2.793786009773612} +{"Finetune/Learning Rate": 1.9857049927244186e-05, "Finetune/Loss": 0.881279706954956, "Finetune/Loss (Raw)": 0.8579933643341064, "Finetune/Step": 409, "Finetune/Step Time": 2.792505346238613} +{"Finetune/Learning Rate": 1.9855950849332358e-05, "Finetune/Loss": 0.8818918466567993, "Finetune/Loss (Raw)": 0.9576947689056396, "Finetune/Step": 410, "Finetune/Step Time": 2.7924059871584177} +{"Finetune/Learning Rate": 1.9854847593081997e-05, "Finetune/Loss": 0.8805321455001831, "Finetune/Loss (Raw)": 0.8607861995697021, "Finetune/Step": 411, "Finetune/Step Time": 2.79188634455204} +{"Finetune/Learning Rate": 1.9853740158960825e-05, "Finetune/Loss": 0.8802640438079834, "Finetune/Loss (Raw)": 0.8610217571258545, "Finetune/Step": 412, "Finetune/Step Time": 2.7904111612588167} +{"Finetune/Learning Rate": 1.9852628547438322e-05, "Finetune/Loss": 0.8800103664398193, "Finetune/Loss (Raw)": 0.8143806457519531, "Finetune/Step": 413, "Finetune/Step Time": 2.790283853188157} +{"Finetune/Learning Rate": 1.985151275898575e-05, "Finetune/Loss": 0.8792524337768555, "Finetune/Loss (Raw)": 0.8553895354270935, "Finetune/Step": 414, "Finetune/Step Time": 2.7886920291930437} +{"Finetune/Learning Rate": 1.9850392794076133e-05, "Finetune/Loss": 0.8800220489501953, "Finetune/Loss (Raw)": 0.9296004176139832, "Finetune/Step": 415, "Finetune/Step Time": 2.788219226524234} +{"Finetune/Learning Rate": 1.9849268653184276e-05, "Finetune/Loss": 0.8802585005760193, "Finetune/Loss (Raw)": 0.9943650364875793, "Finetune/Step": 416, "Finetune/Step Time": 2.7993634305894375} +{"Finetune/Learning Rate": 1.9848140336786737e-05, "Finetune/Loss": 0.8809149265289307, "Finetune/Loss (Raw)": 0.9762738347053528, "Finetune/Step": 417, "Finetune/Step Time": 2.802083607763052} +{"Finetune/Learning Rate": 1.9847007845361864e-05, "Finetune/Loss": 0.8833682537078857, "Finetune/Loss (Raw)": 0.9133495092391968, "Finetune/Step": 418, "Finetune/Step Time": 2.7774315644055605} +{"Finetune/Learning Rate": 1.9845871179389767e-05, "Finetune/Loss": 0.8824428915977478, "Finetune/Loss (Raw)": 0.8698664307594299, "Finetune/Step": 419, "Finetune/Step Time": 2.7750850412994623} +{"Finetune/Learning Rate": 1.984473033935232e-05, "Finetune/Loss": 0.8858033418655396, "Finetune/Loss (Raw)": 0.8886051177978516, "Finetune/Step": 420, "Finetune/Step Time": 2.7499588541686535} +{"Finetune/Learning Rate": 1.9843585325733174e-05, "Finetune/Loss": 0.8838130235671997, "Finetune/Loss (Raw)": 0.6562657356262207, "Finetune/Step": 421, "Finetune/Step Time": 2.7693272586911917} +{"Finetune/Learning Rate": 1.9842436139017748e-05, "Finetune/Loss": 0.8826097249984741, "Finetune/Loss (Raw)": 0.8182797431945801, "Finetune/Step": 422, "Finetune/Step Time": 2.7707188855856657} +{"Finetune/Learning Rate": 1.9841282779693225e-05, "Finetune/Loss": 0.880439817905426, "Finetune/Loss (Raw)": 0.7620773911476135, "Finetune/Step": 423, "Finetune/Step Time": 2.7691107243299484} +{"Finetune/Learning Rate": 1.9840125248248564e-05, "Finetune/Loss": 0.8806301951408386, "Finetune/Loss (Raw)": 0.9452722668647766, "Finetune/Step": 424, "Finetune/Step Time": 2.766632182523608} +{"Finetune/Learning Rate": 1.983896354517449e-05, "Finetune/Loss": 0.8806864023208618, "Finetune/Loss (Raw)": 0.9436619281768799, "Finetune/Step": 425, "Finetune/Step Time": 2.768265614286065} +{"Finetune/Learning Rate": 1.9837797670963495e-05, "Finetune/Loss": 0.8826848268508911, "Finetune/Loss (Raw)": 0.8734486699104309, "Finetune/Step": 426, "Finetune/Step Time": 2.7420145850628614} +{"Finetune/Learning Rate": 1.9836627626109837e-05, "Finetune/Loss": 0.8829697370529175, "Finetune/Loss (Raw)": 0.8852671980857849, "Finetune/Step": 427, "Finetune/Step Time": 2.745318340137601} +{"Finetune/Learning Rate": 1.9835453411109557e-05, "Finetune/Loss": 0.8824942111968994, "Finetune/Loss (Raw)": 0.9055618047714233, "Finetune/Step": 428, "Finetune/Step Time": 2.7480394896119833} +{"Finetune/Learning Rate": 1.9834275026460438e-05, "Finetune/Loss": 0.8816009759902954, "Finetune/Loss (Raw)": 0.8388106226921082, "Finetune/Step": 429, "Finetune/Step Time": 2.744500422850251} +{"Finetune/Learning Rate": 1.9833092472662053e-05, "Finetune/Loss": 0.8819971680641174, "Finetune/Loss (Raw)": 0.8694870471954346, "Finetune/Step": 430, "Finetune/Step Time": 2.743198461830616} +{"Finetune/Learning Rate": 1.9831905750215736e-05, "Finetune/Loss": 0.8810769319534302, "Finetune/Loss (Raw)": 0.8515071868896484, "Finetune/Step": 431, "Finetune/Step Time": 2.747350526973605} +{"Finetune/Learning Rate": 1.983071485962458e-05, "Finetune/Loss": 0.8811883330345154, "Finetune/Loss (Raw)": 0.8700730204582214, "Finetune/Step": 432, "Finetune/Step Time": 2.7359986882656813} +{"Finetune/Learning Rate": 1.9829519801393463e-05, "Finetune/Loss": 0.8810100555419922, "Finetune/Loss (Raw)": 0.8831809163093567, "Finetune/Step": 433, "Finetune/Step Time": 2.73285648599267} +{"Finetune/Learning Rate": 1.982832057602901e-05, "Finetune/Loss": 0.8813564777374268, "Finetune/Loss (Raw)": 0.8716827630996704, "Finetune/Step": 434, "Finetune/Step Time": 2.733170984312892} +{"Finetune/Learning Rate": 1.982711718403962e-05, "Finetune/Loss": 0.8796819448471069, "Finetune/Loss (Raw)": 0.6345205903053284, "Finetune/Step": 435, "Finetune/Step Time": 2.756442055106163} +{"Finetune/Learning Rate": 1.9825909625935468e-05, "Finetune/Loss": 0.8801882266998291, "Finetune/Loss (Raw)": 0.939132571220398, "Finetune/Step": 436, "Finetune/Step Time": 2.7575491555035114} +{"Finetune/Learning Rate": 1.9824697902228482e-05, "Finetune/Loss": 0.8807240724563599, "Finetune/Loss (Raw)": 0.8707022070884705, "Finetune/Step": 437, "Finetune/Step Time": 2.7564206663519144} +{"Finetune/Learning Rate": 1.982348201343236e-05, "Finetune/Loss": 0.8778139352798462, "Finetune/Loss (Raw)": 0.575735330581665, "Finetune/Step": 438, "Finetune/Step Time": 2.7853818107396364} +{"Finetune/Learning Rate": 1.982226196006257e-05, "Finetune/Loss": 0.8769181966781616, "Finetune/Loss (Raw)": 0.8443036675453186, "Finetune/Step": 439, "Finetune/Step Time": 2.785472324118018} +{"Finetune/Learning Rate": 1.982103774263634e-05, "Finetune/Loss": 0.8766708374023438, "Finetune/Loss (Raw)": 0.8996226787567139, "Finetune/Step": 440, "Finetune/Step Time": 2.7873291317373514} +{"Finetune/Learning Rate": 1.9819809361672668e-05, "Finetune/Loss": 0.8732354640960693, "Finetune/Loss (Raw)": 0.5984708666801453, "Finetune/Step": 441, "Finetune/Step Time": 2.8112009316682816} +{"Finetune/Learning Rate": 1.9818576817692307e-05, "Finetune/Loss": 0.8737220764160156, "Finetune/Loss (Raw)": 0.9726307392120361, "Finetune/Step": 442, "Finetune/Step Time": 2.8125233072787523} +{"Finetune/Learning Rate": 1.9817340111217795e-05, "Finetune/Loss": 0.8752555847167969, "Finetune/Loss (Raw)": 0.9692021012306213, "Finetune/Step": 443, "Finetune/Step Time": 2.8146384973078966} +{"Finetune/Learning Rate": 1.981609924277341e-05, "Finetune/Loss": 0.8755010962486267, "Finetune/Loss (Raw)": 1.008070468902588, "Finetune/Step": 444, "Finetune/Step Time": 2.817552912980318} +{"Finetune/Learning Rate": 1.9814854212885217e-05, "Finetune/Loss": 0.8752562999725342, "Finetune/Loss (Raw)": 0.8734828233718872, "Finetune/Step": 445, "Finetune/Step Time": 2.8178477343171835} +{"Finetune/Learning Rate": 1.9813605022081027e-05, "Finetune/Loss": 0.8753501772880554, "Finetune/Loss (Raw)": 0.9303929805755615, "Finetune/Step": 446, "Finetune/Step Time": 2.815782602876425} +{"Finetune/Learning Rate": 1.9812351670890426e-05, "Finetune/Loss": 0.8765679597854614, "Finetune/Loss (Raw)": 0.9411266446113586, "Finetune/Step": 447, "Finetune/Step Time": 2.81560492888093} +{"Finetune/Learning Rate": 1.981109415984476e-05, "Finetune/Loss": 0.8747955560684204, "Finetune/Loss (Raw)": 0.8308418989181519, "Finetune/Step": 448, "Finetune/Step Time": 2.8182553723454475} +{"Finetune/Learning Rate": 1.9809832489477144e-05, "Finetune/Loss": 0.8751152753829956, "Finetune/Loss (Raw)": 0.9183861613273621, "Finetune/Step": 449, "Finetune/Step Time": 2.821012683212757} +{"Finetune/Learning Rate": 1.9808566660322443e-05, "Finetune/Loss": 0.8740156888961792, "Finetune/Loss (Raw)": 0.8036811947822571, "Finetune/Step": 450, "Finetune/Step Time": 2.822320057079196} +{"Finetune/Learning Rate": 1.9807296672917297e-05, "Finetune/Loss": 0.8753184676170349, "Finetune/Loss (Raw)": 0.8730663657188416, "Finetune/Step": 451, "Finetune/Step Time": 2.7967931423336267} +{"Finetune/Learning Rate": 1.9806022527800107e-05, "Finetune/Loss": 0.8762565851211548, "Finetune/Loss (Raw)": 1.028348684310913, "Finetune/Step": 452, "Finetune/Step Time": 2.7960366290062666} +{"Finetune/Learning Rate": 1.9804744225511034e-05, "Finetune/Loss": 0.8737717866897583, "Finetune/Loss (Raw)": 0.6800516247749329, "Finetune/Step": 453, "Finetune/Step Time": 2.8175305649638176} +{"Finetune/Learning Rate": 1.9803461766591998e-05, "Finetune/Loss": 0.872638463973999, "Finetune/Loss (Raw)": 0.8504874110221863, "Finetune/Step": 454, "Finetune/Step Time": 2.822363482788205} +{"Finetune/Learning Rate": 1.9802175151586693e-05, "Finetune/Loss": 0.8724462389945984, "Finetune/Loss (Raw)": 0.821563184261322, "Finetune/Step": 455, "Finetune/Step Time": 2.8270504977554083} +{"Finetune/Learning Rate": 1.980088438104056e-05, "Finetune/Loss": 0.8720738887786865, "Finetune/Loss (Raw)": 0.9364343881607056, "Finetune/Step": 456, "Finetune/Step Time": 2.824096329510212} +{"Finetune/Learning Rate": 1.979958945550082e-05, "Finetune/Loss": 0.8702576756477356, "Finetune/Loss (Raw)": 0.7733378410339355, "Finetune/Step": 457, "Finetune/Step Time": 2.821673119440675} +{"Finetune/Learning Rate": 1.979829037551643e-05, "Finetune/Loss": 0.8697928190231323, "Finetune/Loss (Raw)": 0.8622422814369202, "Finetune/Step": 458, "Finetune/Step Time": 2.8225557301193476} +{"Finetune/Learning Rate": 1.9796987141638137e-05, "Finetune/Loss": 0.8703986406326294, "Finetune/Loss (Raw)": 0.9184906482696533, "Finetune/Step": 459, "Finetune/Step Time": 2.8214855808764696} +{"Finetune/Learning Rate": 1.9795679754418426e-05, "Finetune/Loss": 0.8697406649589539, "Finetune/Loss (Raw)": 0.8029959201812744, "Finetune/Step": 460, "Finetune/Step Time": 2.8208503872156143} +{"Finetune/Learning Rate": 1.979436821441155e-05, "Finetune/Loss": 0.8684244751930237, "Finetune/Loss (Raw)": 0.7648884654045105, "Finetune/Step": 461, "Finetune/Step Time": 2.822155676782131} +{"Finetune/Learning Rate": 1.9793052522173536e-05, "Finetune/Loss": 0.8670751452445984, "Finetune/Loss (Raw)": 0.8233281970024109, "Finetune/Step": 462, "Finetune/Step Time": 2.8209612891077995} +{"Finetune/Learning Rate": 1.9791732678262144e-05, "Finetune/Loss": 0.8651508092880249, "Finetune/Loss (Raw)": 0.5947927832603455, "Finetune/Step": 463, "Finetune/Step Time": 2.8479469511657953} +{"Finetune/Learning Rate": 1.9790408683236922e-05, "Finetune/Loss": 0.8682553768157959, "Finetune/Loss (Raw)": 0.9233613610267639, "Finetune/Step": 464, "Finetune/Step Time": 2.8248360082507133} +{"Finetune/Learning Rate": 1.978908053765916e-05, "Finetune/Loss": 0.8688933849334717, "Finetune/Loss (Raw)": 0.9681716561317444, "Finetune/Step": 465, "Finetune/Step Time": 2.8266446460038424} +{"Finetune/Learning Rate": 1.9787748242091908e-05, "Finetune/Loss": 0.8683818578720093, "Finetune/Loss (Raw)": 0.8498451113700867, "Finetune/Step": 466, "Finetune/Step Time": 2.8293767143040895} +{"Finetune/Learning Rate": 1.978641179709999e-05, "Finetune/Loss": 0.8669230937957764, "Finetune/Loss (Raw)": 0.8277365565299988, "Finetune/Step": 467, "Finetune/Step Time": 2.8056501913815737} +{"Finetune/Learning Rate": 1.9785071203249976e-05, "Finetune/Loss": 0.8646660447120667, "Finetune/Loss (Raw)": 0.7185042500495911, "Finetune/Step": 468, "Finetune/Step Time": 2.8293664697557688} +{"Finetune/Learning Rate": 1.9783726461110197e-05, "Finetune/Loss": 0.861337423324585, "Finetune/Loss (Raw)": 0.5894016623497009, "Finetune/Step": 469, "Finetune/Step Time": 2.85652919113636} +{"Finetune/Learning Rate": 1.9782377571250745e-05, "Finetune/Loss": 0.8620986938476562, "Finetune/Loss (Raw)": 0.9502670168876648, "Finetune/Step": 470, "Finetune/Step Time": 2.8543944656848907} +{"Finetune/Learning Rate": 1.9781024534243468e-05, "Finetune/Loss": 0.8580220937728882, "Finetune/Loss (Raw)": 0.3948451578617096, "Finetune/Step": 471, "Finetune/Step Time": 2.8887484557926655} +{"Finetune/Learning Rate": 1.9779667350661973e-05, "Finetune/Loss": 0.8583919405937195, "Finetune/Loss (Raw)": 0.8550198078155518, "Finetune/Step": 472, "Finetune/Step Time": 2.9029774833470583} +{"Finetune/Learning Rate": 1.9778306021081627e-05, "Finetune/Loss": 0.8620309829711914, "Finetune/Loss (Raw)": 0.9591663479804993, "Finetune/Step": 473, "Finetune/Step Time": 2.8759214095771313} +{"Finetune/Learning Rate": 1.9776940546079552e-05, "Finetune/Loss": 0.862557053565979, "Finetune/Loss (Raw)": 0.9053387641906738, "Finetune/Step": 474, "Finetune/Step Time": 2.8769931867718697} +{"Finetune/Learning Rate": 1.977557092623463e-05, "Finetune/Loss": 0.8642927408218384, "Finetune/Loss (Raw)": 0.8384937644004822, "Finetune/Step": 475, "Finetune/Step Time": 2.853226451203227} +{"Finetune/Learning Rate": 1.9774197162127496e-05, "Finetune/Loss": 0.8626728057861328, "Finetune/Loss (Raw)": 0.7382084727287292, "Finetune/Step": 476, "Finetune/Step Time": 2.85268778167665} +{"Finetune/Learning Rate": 1.9772819254340545e-05, "Finetune/Loss": 0.8627971410751343, "Finetune/Loss (Raw)": 0.89580237865448, "Finetune/Step": 477, "Finetune/Step Time": 2.8573485631495714} +{"Finetune/Learning Rate": 1.9771437203457934e-05, "Finetune/Loss": 0.8629487752914429, "Finetune/Loss (Raw)": 0.8414294719696045, "Finetune/Step": 478, "Finetune/Step Time": 2.8574170004576445} +{"Finetune/Learning Rate": 1.977005101006556e-05, "Finetune/Loss": 0.863178014755249, "Finetune/Loss (Raw)": 0.9316940903663635, "Finetune/Step": 479, "Finetune/Step Time": 2.8578901812434196} +{"Finetune/Learning Rate": 1.9768660674751094e-05, "Finetune/Loss": 0.8634001612663269, "Finetune/Loss (Raw)": 0.8842944502830505, "Finetune/Step": 480, "Finetune/Step Time": 2.853123089298606} +{"Finetune/Learning Rate": 1.9767266198103954e-05, "Finetune/Loss": 0.8628882169723511, "Finetune/Loss (Raw)": 0.8979889750480652, "Finetune/Step": 481, "Finetune/Step Time": 2.8551131170243025} +{"Finetune/Learning Rate": 1.9765867580715316e-05, "Finetune/Loss": 0.8631548285484314, "Finetune/Loss (Raw)": 0.9215148687362671, "Finetune/Step": 482, "Finetune/Step Time": 2.8544605188071728} +{"Finetune/Learning Rate": 1.976446482317811e-05, "Finetune/Loss": 0.8633246421813965, "Finetune/Loss (Raw)": 0.9292277097702026, "Finetune/Step": 483, "Finetune/Step Time": 2.8538829404860735} +{"Finetune/Learning Rate": 1.9763057926087023e-05, "Finetune/Loss": 0.8628021478652954, "Finetune/Loss (Raw)": 0.833748996257782, "Finetune/Step": 484, "Finetune/Step Time": 2.845906138420105} +{"Finetune/Learning Rate": 1.9761646890038494e-05, "Finetune/Loss": 0.8629334568977356, "Finetune/Loss (Raw)": 0.8360194563865662, "Finetune/Step": 485, "Finetune/Step Time": 2.845893593505025} +{"Finetune/Learning Rate": 1.976023171563072e-05, "Finetune/Loss": 0.8630733489990234, "Finetune/Loss (Raw)": 0.922906219959259, "Finetune/Step": 486, "Finetune/Step Time": 2.8460416942834854} +{"Finetune/Learning Rate": 1.975881240346365e-05, "Finetune/Loss": 0.8622373342514038, "Finetune/Loss (Raw)": 0.910810649394989, "Finetune/Step": 487, "Finetune/Step Time": 2.848822658881545} +{"Finetune/Learning Rate": 1.9757388954138988e-05, "Finetune/Loss": 0.8620113134384155, "Finetune/Loss (Raw)": 0.8563194274902344, "Finetune/Step": 488, "Finetune/Step Time": 2.8361071683466434} +{"Finetune/Learning Rate": 1.9755961368260197e-05, "Finetune/Loss": 0.8620160222053528, "Finetune/Loss (Raw)": 0.9192007184028625, "Finetune/Step": 489, "Finetune/Step Time": 2.8379327710717916} +{"Finetune/Learning Rate": 1.9754529646432484e-05, "Finetune/Loss": 0.8638831377029419, "Finetune/Loss (Raw)": 0.8726837038993835, "Finetune/Step": 490, "Finetune/Step Time": 2.814642194658518} +{"Finetune/Learning Rate": 1.9753093789262813e-05, "Finetune/Loss": 0.8676450848579407, "Finetune/Loss (Raw)": 0.9113250970840454, "Finetune/Step": 491, "Finetune/Step Time": 2.7835042849183083} +{"Finetune/Learning Rate": 1.9751653797359904e-05, "Finetune/Loss": 0.8671557903289795, "Finetune/Loss (Raw)": 0.8081588745117188, "Finetune/Step": 492, "Finetune/Step Time": 2.7831745464354753} +{"Finetune/Learning Rate": 1.9750209671334225e-05, "Finetune/Loss": 0.8666093349456787, "Finetune/Loss (Raw)": 0.8442976474761963, "Finetune/Step": 493, "Finetune/Step Time": 2.779388712719083} +{"Finetune/Learning Rate": 1.974876141179801e-05, "Finetune/Loss": 0.8665777444839478, "Finetune/Loss (Raw)": 0.8859862685203552, "Finetune/Step": 494, "Finetune/Step Time": 2.781295247375965} +{"Finetune/Learning Rate": 1.9747309019365224e-05, "Finetune/Loss": 0.866868793964386, "Finetune/Loss (Raw)": 0.8700568675994873, "Finetune/Step": 495, "Finetune/Step Time": 2.7797138318419456} +{"Finetune/Learning Rate": 1.97458524946516e-05, "Finetune/Loss": 0.8663740158081055, "Finetune/Loss (Raw)": 0.8185205459594727, "Finetune/Step": 496, "Finetune/Step Time": 2.779263848438859} +{"Finetune/Learning Rate": 1.9744391838274615e-05, "Finetune/Loss": 0.8679054975509644, "Finetune/Loss (Raw)": 1.0091358423233032, "Finetune/Step": 497, "Finetune/Step Time": 2.7762014027684927} +{"Finetune/Learning Rate": 1.9742927050853508e-05, "Finetune/Loss": 0.8682067394256592, "Finetune/Loss (Raw)": 0.9185686111450195, "Finetune/Step": 498, "Finetune/Step Time": 2.7767001185566187} +{"Finetune/Learning Rate": 1.9741458133009258e-05, "Finetune/Loss": 0.8683884739875793, "Finetune/Loss (Raw)": 0.8793206214904785, "Finetune/Step": 499, "Finetune/Step Time": 2.7796940859407187} +{"Finetune/Learning Rate": 1.9739985085364593e-05, "Finetune/Loss": 0.867929995059967, "Finetune/Loss (Raw)": 0.8873379826545715, "Finetune/Step": 500, "Finetune/Step Time": 2.7805985882878304} +{"Finetune/Learning Rate": 1.9738507908544006e-05, "Finetune/Loss": 0.8665487766265869, "Finetune/Loss (Raw)": 0.8650306463241577, "Finetune/Step": 501, "Finetune/Step Time": 2.7792226877063513} +{"Finetune/Learning Rate": 1.973702660317373e-05, "Finetune/Loss": 0.8663156628608704, "Finetune/Loss (Raw)": 0.9058381915092468, "Finetune/Step": 502, "Finetune/Step Time": 2.777790129184723} +{"Finetune/Learning Rate": 1.9735541169881748e-05, "Finetune/Loss": 0.866437554359436, "Finetune/Loss (Raw)": 0.9057355523109436, "Finetune/Step": 503, "Finetune/Step Time": 2.7758332807570696} +{"Finetune/Learning Rate": 1.97340516092978e-05, "Finetune/Loss": 0.8666892051696777, "Finetune/Loss (Raw)": 0.8863338232040405, "Finetune/Step": 504, "Finetune/Step Time": 2.778255809098482} +{"Finetune/Learning Rate": 1.9732557922053365e-05, "Finetune/Loss": 0.8679304122924805, "Finetune/Loss (Raw)": 1.0156428813934326, "Finetune/Step": 505, "Finetune/Step Time": 2.7743282075971365} +{"Finetune/Learning Rate": 1.9731060108781682e-05, "Finetune/Loss": 0.8682742118835449, "Finetune/Loss (Raw)": 0.9063753485679626, "Finetune/Step": 506, "Finetune/Step Time": 2.7740279994904995} +{"Finetune/Learning Rate": 1.9729558170117738e-05, "Finetune/Loss": 0.86854088306427, "Finetune/Loss (Raw)": 0.9402400255203247, "Finetune/Step": 507, "Finetune/Step Time": 2.771880853921175} +{"Finetune/Learning Rate": 1.972805210669826e-05, "Finetune/Loss": 0.8684216141700745, "Finetune/Loss (Raw)": 0.9972724318504333, "Finetune/Step": 508, "Finetune/Step Time": 2.772479012608528} +{"Finetune/Learning Rate": 1.9726541919161733e-05, "Finetune/Loss": 0.8689136505126953, "Finetune/Loss (Raw)": 0.9135852456092834, "Finetune/Step": 509, "Finetune/Step Time": 2.7678995188325644} +{"Finetune/Learning Rate": 1.9725027608148388e-05, "Finetune/Loss": 0.8665404915809631, "Finetune/Loss (Raw)": 0.5826848745346069, "Finetune/Step": 510, "Finetune/Step Time": 2.787485444918275} +{"Finetune/Learning Rate": 1.97235091743002e-05, "Finetune/Loss": 0.8665978312492371, "Finetune/Loss (Raw)": 0.9189431071281433, "Finetune/Step": 511, "Finetune/Step Time": 2.787214208394289} +{"Finetune/Learning Rate": 1.9721986618260892e-05, "Finetune/Loss": 0.8669505715370178, "Finetune/Loss (Raw)": 0.8770608305931091, "Finetune/Step": 512, "Finetune/Step Time": 2.7825771663337946} +{"Finetune/Learning Rate": 1.9720459940675946e-05, "Finetune/Loss": 0.8674808740615845, "Finetune/Loss (Raw)": 0.9782822728157043, "Finetune/Step": 513, "Finetune/Step Time": 2.7769149616360664} +{"Finetune/Learning Rate": 1.9718929142192577e-05, "Finetune/Loss": 0.8674803972244263, "Finetune/Loss (Raw)": 0.8722695112228394, "Finetune/Step": 514, "Finetune/Step Time": 2.7762996535748243} +{"Finetune/Learning Rate": 1.9717394223459755e-05, "Finetune/Loss": 0.8667572736740112, "Finetune/Loss (Raw)": 0.798418402671814, "Finetune/Step": 515, "Finetune/Step Time": 2.7773012556135654} +{"Finetune/Learning Rate": 1.971585518512819e-05, "Finetune/Loss": 0.866290807723999, "Finetune/Loss (Raw)": 0.8808274269104004, "Finetune/Step": 516, "Finetune/Step Time": 2.7774707712233067} +{"Finetune/Learning Rate": 1.971431202785035e-05, "Finetune/Loss": 0.8661130666732788, "Finetune/Loss (Raw)": 0.7951359152793884, "Finetune/Step": 517, "Finetune/Step Time": 2.7738627828657627} +{"Finetune/Learning Rate": 1.9712764752280437e-05, "Finetune/Loss": 0.8653576374053955, "Finetune/Loss (Raw)": 0.7662619352340698, "Finetune/Step": 518, "Finetune/Step Time": 2.775683391839266} +{"Finetune/Learning Rate": 1.9711213359074408e-05, "Finetune/Loss": 0.8652887344360352, "Finetune/Loss (Raw)": 0.887524425983429, "Finetune/Step": 519, "Finetune/Step Time": 2.77401234023273} +{"Finetune/Learning Rate": 1.9709657848889956e-05, "Finetune/Loss": 0.8643964529037476, "Finetune/Loss (Raw)": 0.8437996506690979, "Finetune/Step": 520, "Finetune/Step Time": 2.7770151551812887} +{"Finetune/Learning Rate": 1.9708098222386528e-05, "Finetune/Loss": 0.8643794059753418, "Finetune/Loss (Raw)": 0.8580226898193359, "Finetune/Step": 521, "Finetune/Step Time": 2.7808901630342007} +{"Finetune/Learning Rate": 1.9706534480225317e-05, "Finetune/Loss": 0.8666225671768188, "Finetune/Loss (Raw)": 0.8551581501960754, "Finetune/Step": 522, "Finetune/Step Time": 2.7606517113745213} +{"Finetune/Learning Rate": 1.970496662306925e-05, "Finetune/Loss": 0.8665897250175476, "Finetune/Loss (Raw)": 0.933274507522583, "Finetune/Step": 523, "Finetune/Step Time": 2.7584380581974983} +{"Finetune/Learning Rate": 1.970339465158301e-05, "Finetune/Loss": 0.8663855195045471, "Finetune/Loss (Raw)": 0.8918137550354004, "Finetune/Step": 524, "Finetune/Step Time": 2.7557541988790035} +{"Finetune/Learning Rate": 1.970181856643302e-05, "Finetune/Loss": 0.8658545613288879, "Finetune/Loss (Raw)": 0.8747261762619019, "Finetune/Step": 525, "Finetune/Step Time": 2.7567990105599165} +{"Finetune/Learning Rate": 1.970023836828744e-05, "Finetune/Loss": 0.8641372919082642, "Finetune/Loss (Raw)": 0.8485572338104248, "Finetune/Step": 526, "Finetune/Step Time": 2.758561572059989} +{"Finetune/Learning Rate": 1.969865405781619e-05, "Finetune/Loss": 0.859328031539917, "Finetune/Loss (Raw)": 0.17886494100093842, "Finetune/Step": 527, "Finetune/Step Time": 2.787018684670329} +{"Finetune/Learning Rate": 1.969706563569092e-05, "Finetune/Loss": 0.8568940162658691, "Finetune/Loss (Raw)": 0.6317107081413269, "Finetune/Step": 528, "Finetune/Step Time": 2.828856896609068} +{"Finetune/Learning Rate": 1.9695473102585022e-05, "Finetune/Loss": 0.8565497398376465, "Finetune/Loss (Raw)": 0.8496668934822083, "Finetune/Step": 529, "Finetune/Step Time": 2.8298863377422094} +{"Finetune/Learning Rate": 1.969387645917364e-05, "Finetune/Loss": 0.8560216426849365, "Finetune/Loss (Raw)": 0.8826593160629272, "Finetune/Step": 530, "Finetune/Step Time": 2.831057842820883} +{"Finetune/Learning Rate": 1.9692275706133658e-05, "Finetune/Loss": 0.8562257289886475, "Finetune/Loss (Raw)": 0.9646958112716675, "Finetune/Step": 531, "Finetune/Step Time": 2.829961596056819} +{"Finetune/Learning Rate": 1.9690670844143697e-05, "Finetune/Loss": 0.8553220629692078, "Finetune/Loss (Raw)": 0.8242401480674744, "Finetune/Step": 532, "Finetune/Step Time": 2.8264457769691944} +{"Finetune/Learning Rate": 1.968906187388412e-05, "Finetune/Loss": 0.8552790284156799, "Finetune/Loss (Raw)": 0.9316703081130981, "Finetune/Step": 533, "Finetune/Step Time": 2.8285633735358715} +{"Finetune/Learning Rate": 1.9687448796037046e-05, "Finetune/Loss": 0.8563478589057922, "Finetune/Loss (Raw)": 0.9744590520858765, "Finetune/Step": 534, "Finetune/Step Time": 2.8281348533928394} +{"Finetune/Learning Rate": 1.9685831611286312e-05, "Finetune/Loss": 0.8569340705871582, "Finetune/Loss (Raw)": 0.9135622382164001, "Finetune/Step": 535, "Finetune/Step Time": 2.827560342848301} +{"Finetune/Learning Rate": 1.9684210320317518e-05, "Finetune/Loss": 0.8581438660621643, "Finetune/Loss (Raw)": 0.9931301474571228, "Finetune/Step": 536, "Finetune/Step Time": 2.8253490142524242} +{"Finetune/Learning Rate": 1.9682584923817988e-05, "Finetune/Loss": 0.8592972159385681, "Finetune/Loss (Raw)": 1.0056235790252686, "Finetune/Step": 537, "Finetune/Step Time": 2.826809197664261} +{"Finetune/Learning Rate": 1.96809554224768e-05, "Finetune/Loss": 0.8596420884132385, "Finetune/Loss (Raw)": 1.0018353462219238, "Finetune/Step": 538, "Finetune/Step Time": 2.8249083887785673} +{"Finetune/Learning Rate": 1.9679321816984756e-05, "Finetune/Loss": 0.8597425222396851, "Finetune/Loss (Raw)": 0.8736429810523987, "Finetune/Step": 539, "Finetune/Step Time": 2.824641928076744} +{"Finetune/Learning Rate": 1.9677684108034417e-05, "Finetune/Loss": 0.8599264621734619, "Finetune/Loss (Raw)": 0.8845647573471069, "Finetune/Step": 540, "Finetune/Step Time": 2.8224357590079308} +{"Finetune/Learning Rate": 1.9676042296320075e-05, "Finetune/Loss": 0.8612788915634155, "Finetune/Loss (Raw)": 0.9874852895736694, "Finetune/Step": 541, "Finetune/Step Time": 2.8230896778404713} +{"Finetune/Learning Rate": 1.9674396382537756e-05, "Finetune/Loss": 0.8611007928848267, "Finetune/Loss (Raw)": 0.8326031565666199, "Finetune/Step": 542, "Finetune/Step Time": 2.822895599529147} +{"Finetune/Learning Rate": 1.9672746367385228e-05, "Finetune/Loss": 0.8607293367385864, "Finetune/Loss (Raw)": 0.8820503950119019, "Finetune/Step": 543, "Finetune/Step Time": 2.827793676406145} +{"Finetune/Learning Rate": 1.9671092251562006e-05, "Finetune/Loss": 0.8593025207519531, "Finetune/Loss (Raw)": 0.8117308020591736, "Finetune/Step": 544, "Finetune/Step Time": 2.815305884927511} +{"Finetune/Learning Rate": 1.9669434035769335e-05, "Finetune/Loss": 0.8584377765655518, "Finetune/Loss (Raw)": 0.8655902743339539, "Finetune/Step": 545, "Finetune/Step Time": 2.81790972314775} +{"Finetune/Learning Rate": 1.96677717207102e-05, "Finetune/Loss": 0.8577702045440674, "Finetune/Loss (Raw)": 0.8278929591178894, "Finetune/Step": 546, "Finetune/Step Time": 2.8195638600736856} +{"Finetune/Learning Rate": 1.966610530708932e-05, "Finetune/Loss": 0.8582072257995605, "Finetune/Loss (Raw)": 0.9258056879043579, "Finetune/Step": 547, "Finetune/Step Time": 2.8196879010647535} +{"Finetune/Learning Rate": 1.9664434795613162e-05, "Finetune/Loss": 0.8579712510108948, "Finetune/Loss (Raw)": 0.8584044575691223, "Finetune/Step": 548, "Finetune/Step Time": 2.8145667128264904} +{"Finetune/Learning Rate": 1.9662760186989914e-05, "Finetune/Loss": 0.8594664335250854, "Finetune/Loss (Raw)": 0.8476470708847046, "Finetune/Step": 549, "Finetune/Step Time": 2.7913110982626677} +{"Finetune/Learning Rate": 1.9661081481929524e-05, "Finetune/Loss": 0.8603661060333252, "Finetune/Loss (Raw)": 0.9334362149238586, "Finetune/Step": 550, "Finetune/Step Time": 2.7910727690905333} +{"Finetune/Learning Rate": 1.9659398681143657e-05, "Finetune/Loss": 0.8616970181465149, "Finetune/Loss (Raw)": 0.9324431419372559, "Finetune/Step": 551, "Finetune/Step Time": 2.793665809556842} +{"Finetune/Learning Rate": 1.9657711785345713e-05, "Finetune/Loss": 0.8613967299461365, "Finetune/Loss (Raw)": 0.9068307280540466, "Finetune/Step": 552, "Finetune/Step Time": 2.79655783995986} +{"Finetune/Learning Rate": 1.965602079525085e-05, "Finetune/Loss": 0.860785722732544, "Finetune/Loss (Raw)": 0.8654488325119019, "Finetune/Step": 553, "Finetune/Step Time": 2.7955051455646753} +{"Finetune/Learning Rate": 1.9654325711575937e-05, "Finetune/Loss": 0.8607959747314453, "Finetune/Loss (Raw)": 0.8747691512107849, "Finetune/Step": 554, "Finetune/Step Time": 2.796907924115658} +{"Finetune/Learning Rate": 1.9652626535039593e-05, "Finetune/Loss": 0.8608301877975464, "Finetune/Loss (Raw)": 0.8896373510360718, "Finetune/Step": 555, "Finetune/Step Time": 2.795642487704754} +{"Finetune/Learning Rate": 1.9650923266362166e-05, "Finetune/Loss": 0.8600339293479919, "Finetune/Loss (Raw)": 0.8036445379257202, "Finetune/Step": 556, "Finetune/Step Time": 2.794451517984271} +{"Finetune/Learning Rate": 1.9649215906265744e-05, "Finetune/Loss": 0.8592113852500916, "Finetune/Loss (Raw)": 0.7335233688354492, "Finetune/Step": 557, "Finetune/Step Time": 2.8154474440962076} +{"Finetune/Learning Rate": 1.9647504455474145e-05, "Finetune/Loss": 0.8591650724411011, "Finetune/Loss (Raw)": 0.8635644912719727, "Finetune/Step": 558, "Finetune/Step Time": 2.818404244259} +{"Finetune/Learning Rate": 1.964578891471292e-05, "Finetune/Loss": 0.8598206043243408, "Finetune/Loss (Raw)": 0.9354081153869629, "Finetune/Step": 559, "Finetune/Step Time": 2.814336286857724} +{"Finetune/Learning Rate": 1.9644069284709362e-05, "Finetune/Loss": 0.859927773475647, "Finetune/Loss (Raw)": 0.8837953805923462, "Finetune/Step": 560, "Finetune/Step Time": 2.8137337900698185} +{"Finetune/Learning Rate": 1.964234556619249e-05, "Finetune/Loss": 0.8598228096961975, "Finetune/Loss (Raw)": 0.8697417378425598, "Finetune/Step": 561, "Finetune/Step Time": 2.8150604777038097} +{"Finetune/Learning Rate": 1.9640617759893053e-05, "Finetune/Loss": 0.8575501441955566, "Finetune/Loss (Raw)": 0.5807850360870361, "Finetune/Step": 562, "Finetune/Step Time": 2.837858499959111} +{"Finetune/Learning Rate": 1.9638885866543543e-05, "Finetune/Loss": 0.8595680594444275, "Finetune/Loss (Raw)": 0.8928117752075195, "Finetune/Step": 563, "Finetune/Step Time": 2.8146409690380096} +{"Finetune/Learning Rate": 1.9637149886878183e-05, "Finetune/Loss": 0.8596123456954956, "Finetune/Loss (Raw)": 0.9447988867759705, "Finetune/Step": 564, "Finetune/Step Time": 2.8117303382605314} +{"Finetune/Learning Rate": 1.9635409821632923e-05, "Finetune/Loss": 0.860490083694458, "Finetune/Loss (Raw)": 0.9830499887466431, "Finetune/Step": 565, "Finetune/Step Time": 2.8149545826017857} +{"Finetune/Learning Rate": 1.9633665671545443e-05, "Finetune/Loss": 0.8635389804840088, "Finetune/Loss (Raw)": 0.9659969806671143, "Finetune/Step": 566, "Finetune/Step Time": 2.788696214556694} +{"Finetune/Learning Rate": 1.9631917437355166e-05, "Finetune/Loss": 0.8640996813774109, "Finetune/Loss (Raw)": 0.9160807728767395, "Finetune/Step": 567, "Finetune/Step Time": 2.7873531617224216} +{"Finetune/Learning Rate": 1.9630165119803234e-05, "Finetune/Loss": 0.8634829521179199, "Finetune/Loss (Raw)": 0.8206740617752075, "Finetune/Step": 568, "Finetune/Step Time": 2.787228437140584} +{"Finetune/Learning Rate": 1.962840871963253e-05, "Finetune/Loss": 0.865558385848999, "Finetune/Loss (Raw)": 0.8641321063041687, "Finetune/Step": 569, "Finetune/Step Time": 2.7645764648914337} +{"Finetune/Learning Rate": 1.962664823758766e-05, "Finetune/Loss": 0.8648985624313354, "Finetune/Loss (Raw)": 0.8881755471229553, "Finetune/Step": 570, "Finetune/Step Time": 2.767758037894964} +{"Finetune/Learning Rate": 1.9624883674414964e-05, "Finetune/Loss": 0.8643195629119873, "Finetune/Loss (Raw)": 0.8950831890106201, "Finetune/Step": 571, "Finetune/Step Time": 2.768570678308606} +{"Finetune/Learning Rate": 1.9623115030862516e-05, "Finetune/Loss": 0.8632752299308777, "Finetune/Loss (Raw)": 0.8743973970413208, "Finetune/Step": 572, "Finetune/Step Time": 2.7672926615923643} +{"Finetune/Learning Rate": 1.9621342307680117e-05, "Finetune/Loss": 0.8632975220680237, "Finetune/Loss (Raw)": 0.8763372898101807, "Finetune/Step": 573, "Finetune/Step Time": 2.7634761817753315} +{"Finetune/Learning Rate": 1.9619565505619288e-05, "Finetune/Loss": 0.862369179725647, "Finetune/Loss (Raw)": 0.8115593194961548, "Finetune/Step": 574, "Finetune/Step Time": 2.7666606083512306} +{"Finetune/Learning Rate": 1.9617784625433292e-05, "Finetune/Loss": 0.8619257211685181, "Finetune/Loss (Raw)": 0.8843712210655212, "Finetune/Step": 575, "Finetune/Step Time": 2.76800343580544} +{"Finetune/Learning Rate": 1.9615999667877124e-05, "Finetune/Loss": 0.8627063035964966, "Finetune/Loss (Raw)": 0.9307540059089661, "Finetune/Step": 576, "Finetune/Step Time": 2.765551310032606} +{"Finetune/Learning Rate": 1.961421063370749e-05, "Finetune/Loss": 0.8632176518440247, "Finetune/Loss (Raw)": 0.9838383197784424, "Finetune/Step": 577, "Finetune/Step Time": 2.763088261708617} +{"Finetune/Learning Rate": 1.9612417523682838e-05, "Finetune/Loss": 0.8642522096633911, "Finetune/Loss (Raw)": 0.9361037015914917, "Finetune/Step": 578, "Finetune/Step Time": 2.7620114143937826} +{"Finetune/Learning Rate": 1.961062033856334e-05, "Finetune/Loss": 0.8633223176002502, "Finetune/Loss (Raw)": 0.7540388703346252, "Finetune/Step": 579, "Finetune/Step Time": 2.765571665018797} +{"Finetune/Learning Rate": 1.9608819079110895e-05, "Finetune/Loss": 0.8615807890892029, "Finetune/Loss (Raw)": 0.8054357171058655, "Finetune/Step": 580, "Finetune/Step Time": 2.762822838500142} +{"Finetune/Learning Rate": 1.9607013746089133e-05, "Finetune/Loss": 0.8628072738647461, "Finetune/Loss (Raw)": 0.8370433449745178, "Finetune/Step": 581, "Finetune/Step Time": 2.7423261795192957} +{"Finetune/Learning Rate": 1.9605204340263402e-05, "Finetune/Loss": 0.8635766506195068, "Finetune/Loss (Raw)": 0.9489684104919434, "Finetune/Step": 582, "Finetune/Step Time": 2.7392698135226965} +{"Finetune/Learning Rate": 1.960339086240079e-05, "Finetune/Loss": 0.8639569878578186, "Finetune/Loss (Raw)": 0.8702462315559387, "Finetune/Step": 583, "Finetune/Step Time": 2.7366871181875467} +{"Finetune/Learning Rate": 1.9601573313270102e-05, "Finetune/Loss": 0.8644609451293945, "Finetune/Loss (Raw)": 1.000935673713684, "Finetune/Step": 584, "Finetune/Step Time": 2.7444214932620525} +{"Finetune/Learning Rate": 1.959975169364187e-05, "Finetune/Loss": 0.8657569289207458, "Finetune/Loss (Raw)": 0.9392284750938416, "Finetune/Step": 585, "Finetune/Step Time": 2.7444567047059536} +{"Finetune/Learning Rate": 1.9597926004288354e-05, "Finetune/Loss": 0.8642573356628418, "Finetune/Loss (Raw)": 0.670284628868103, "Finetune/Step": 586, "Finetune/Step Time": 2.764846086502075} +{"Finetune/Learning Rate": 1.9596096245983534e-05, "Finetune/Loss": 0.8641297817230225, "Finetune/Loss (Raw)": 0.9021650552749634, "Finetune/Step": 587, "Finetune/Step Time": 2.7652313970029354} +{"Finetune/Learning Rate": 1.9594262419503126e-05, "Finetune/Loss": 0.8641183376312256, "Finetune/Loss (Raw)": 0.8015374541282654, "Finetune/Step": 588, "Finetune/Step Time": 2.7664168998599052} +{"Finetune/Learning Rate": 1.9592424525624555e-05, "Finetune/Loss": 0.864779531955719, "Finetune/Loss (Raw)": 0.8495246171951294, "Finetune/Step": 589, "Finetune/Step Time": 2.764609159901738} +{"Finetune/Learning Rate": 1.959058256512698e-05, "Finetune/Loss": 0.8653832674026489, "Finetune/Loss (Raw)": 0.9006076455116272, "Finetune/Step": 590, "Finetune/Step Time": 2.766647458076477} +{"Finetune/Learning Rate": 1.9588736538791294e-05, "Finetune/Loss": 0.8675295114517212, "Finetune/Loss (Raw)": 0.8695029020309448, "Finetune/Step": 591, "Finetune/Step Time": 2.7371160872280598} +{"Finetune/Learning Rate": 1.9586886447400094e-05, "Finetune/Loss": 0.8671121001243591, "Finetune/Loss (Raw)": 0.8699394464492798, "Finetune/Step": 592, "Finetune/Step Time": 2.739434488117695} +{"Finetune/Learning Rate": 1.9585032291737707e-05, "Finetune/Loss": 0.8669945001602173, "Finetune/Loss (Raw)": 0.9531158804893494, "Finetune/Step": 593, "Finetune/Step Time": 2.7413145378232002} +{"Finetune/Learning Rate": 1.958317407259019e-05, "Finetune/Loss": 0.8667751550674438, "Finetune/Loss (Raw)": 0.8217648863792419, "Finetune/Step": 594, "Finetune/Step Time": 2.7423642855137587} +{"Finetune/Learning Rate": 1.9581311790745316e-05, "Finetune/Loss": 0.8671776652336121, "Finetune/Loss (Raw)": 0.8792586326599121, "Finetune/Step": 595, "Finetune/Step Time": 2.7393516581505537} +{"Finetune/Learning Rate": 1.957944544699258e-05, "Finetune/Loss": 0.8681991100311279, "Finetune/Loss (Raw)": 0.8492582440376282, "Finetune/Step": 596, "Finetune/Step Time": 2.7183256298303604} +{"Finetune/Learning Rate": 1.9577575042123205e-05, "Finetune/Loss": 0.8708088994026184, "Finetune/Loss (Raw)": 0.9234443306922913, "Finetune/Step": 597, "Finetune/Step Time": 2.6948317904025316} +{"Finetune/Learning Rate": 1.957570057693013e-05, "Finetune/Loss": 0.8701256513595581, "Finetune/Loss (Raw)": 0.8628196120262146, "Finetune/Step": 598, "Finetune/Step Time": 2.694917691871524} +{"Finetune/Learning Rate": 1.9573822052208013e-05, "Finetune/Loss": 0.8715897798538208, "Finetune/Loss (Raw)": 0.5822481513023376, "Finetune/Step": 599, "Finetune/Step Time": 2.6798684615641832} +{"Finetune/Learning Rate": 1.9571939468753242e-05, "Finetune/Loss": 0.8714374899864197, "Finetune/Loss (Raw)": 0.8355307579040527, "Finetune/Step": 600, "Finetune/Step Time": 2.6687970254570246} +{"Finetune/Learning Rate": 1.957005282736392e-05, "Finetune/Loss": 0.8716208934783936, "Finetune/Loss (Raw)": 0.9826379418373108, "Finetune/Step": 601, "Finetune/Step Time": 2.6724465638399124} +{"Finetune/Learning Rate": 1.956816212883987e-05, "Finetune/Loss": 0.8709404468536377, "Finetune/Loss (Raw)": 0.8182400465011597, "Finetune/Step": 602, "Finetune/Step Time": 2.673231592401862} +{"Finetune/Learning Rate": 1.956626737398264e-05, "Finetune/Loss": 0.8712749481201172, "Finetune/Loss (Raw)": 0.8813128471374512, "Finetune/Step": 603, "Finetune/Step Time": 2.6762927565723658} +{"Finetune/Learning Rate": 1.9564368563595487e-05, "Finetune/Loss": 0.8728722333908081, "Finetune/Loss (Raw)": 0.9426613450050354, "Finetune/Step": 604, "Finetune/Step Time": 2.673047287389636} +{"Finetune/Learning Rate": 1.9562465698483398e-05, "Finetune/Loss": 0.8725117444992065, "Finetune/Loss (Raw)": 0.8496552109718323, "Finetune/Step": 605, "Finetune/Step Time": 2.6699496656656265} +{"Finetune/Learning Rate": 1.9560558779453073e-05, "Finetune/Loss": 0.8723363876342773, "Finetune/Loss (Raw)": 0.818994402885437, "Finetune/Step": 606, "Finetune/Step Time": 2.6719506289809942} +{"Finetune/Learning Rate": 1.9558647807312934e-05, "Finetune/Loss": 0.8718427419662476, "Finetune/Loss (Raw)": 0.8685026168823242, "Finetune/Step": 607, "Finetune/Step Time": 2.6770178116858006} +{"Finetune/Learning Rate": 1.955673278287312e-05, "Finetune/Loss": 0.8715066909790039, "Finetune/Loss (Raw)": 0.8412826061248779, "Finetune/Step": 608, "Finetune/Step Time": 2.6792640145868063} +{"Finetune/Learning Rate": 1.9554813706945485e-05, "Finetune/Loss": 0.8710746765136719, "Finetune/Loss (Raw)": 0.8426851630210876, "Finetune/Step": 609, "Finetune/Step Time": 2.679780676960945} +{"Finetune/Learning Rate": 1.9552890580343607e-05, "Finetune/Loss": 0.8707189559936523, "Finetune/Loss (Raw)": 0.8759881854057312, "Finetune/Step": 610, "Finetune/Step Time": 2.677708687260747} +{"Finetune/Learning Rate": 1.9550963403882777e-05, "Finetune/Loss": 0.8700203895568848, "Finetune/Loss (Raw)": 0.8398067355155945, "Finetune/Step": 611, "Finetune/Step Time": 2.6791905984282494} +{"Finetune/Learning Rate": 1.9549032178380002e-05, "Finetune/Loss": 0.8704056739807129, "Finetune/Loss (Raw)": 0.8830731511116028, "Finetune/Step": 612, "Finetune/Step Time": 2.6835024505853653} +{"Finetune/Learning Rate": 1.9547096904654007e-05, "Finetune/Loss": 0.8710356950759888, "Finetune/Loss (Raw)": 0.9166505932807922, "Finetune/Step": 613, "Finetune/Step Time": 2.683532329276204} +{"Finetune/Learning Rate": 1.9545157583525235e-05, "Finetune/Loss": 0.8696658611297607, "Finetune/Loss (Raw)": 0.7475703358650208, "Finetune/Step": 614, "Finetune/Step Time": 2.6818752009421587} +{"Finetune/Learning Rate": 1.954321421581584e-05, "Finetune/Loss": 0.8695287108421326, "Finetune/Loss (Raw)": 0.8932556509971619, "Finetune/Step": 615, "Finetune/Step Time": 2.6836996600031853} +{"Finetune/Learning Rate": 1.9541266802349702e-05, "Finetune/Loss": 0.8704813122749329, "Finetune/Loss (Raw)": 0.9782571792602539, "Finetune/Step": 616, "Finetune/Step Time": 2.684255663305521} +{"Finetune/Learning Rate": 1.9539315343952398e-05, "Finetune/Loss": 0.8703408241271973, "Finetune/Loss (Raw)": 0.9012085199356079, "Finetune/Step": 617, "Finetune/Step Time": 2.680906204506755} +{"Finetune/Learning Rate": 1.953735984145124e-05, "Finetune/Loss": 0.8710201382637024, "Finetune/Loss (Raw)": 0.959640622138977, "Finetune/Step": 618, "Finetune/Step Time": 2.6760158613324165} +{"Finetune/Learning Rate": 1.953540029567524e-05, "Finetune/Loss": 0.8713740110397339, "Finetune/Loss (Raw)": 0.956616222858429, "Finetune/Step": 619, "Finetune/Step Time": 2.6746347565203905} +{"Finetune/Learning Rate": 1.9533436707455128e-05, "Finetune/Loss": 0.8717583417892456, "Finetune/Loss (Raw)": 0.8573574423789978, "Finetune/Step": 620, "Finetune/Step Time": 2.677565412595868} +{"Finetune/Learning Rate": 1.9531469077623356e-05, "Finetune/Loss": 0.8717728853225708, "Finetune/Loss (Raw)": 0.8461647629737854, "Finetune/Step": 621, "Finetune/Step Time": 2.679785378277302} +{"Finetune/Learning Rate": 1.9529497407014075e-05, "Finetune/Loss": 0.8717702627182007, "Finetune/Loss (Raw)": 0.8856515288352966, "Finetune/Step": 622, "Finetune/Step Time": 2.6802091374993324} +{"Finetune/Learning Rate": 1.9527521696463157e-05, "Finetune/Loss": 0.8718370795249939, "Finetune/Loss (Raw)": 0.8786077499389648, "Finetune/Step": 623, "Finetune/Step Time": 2.681844837963581} +{"Finetune/Learning Rate": 1.9525541946808187e-05, "Finetune/Loss": 0.8724370002746582, "Finetune/Loss (Raw)": 0.8953117728233337, "Finetune/Step": 624, "Finetune/Step Time": 2.687252586707473} +{"Finetune/Learning Rate": 1.952355815888847e-05, "Finetune/Loss": 0.8717234134674072, "Finetune/Loss (Raw)": 0.9177950620651245, "Finetune/Step": 625, "Finetune/Step Time": 2.6878465842455626} +{"Finetune/Learning Rate": 1.9521570333545e-05, "Finetune/Loss": 0.8701426982879639, "Finetune/Loss (Raw)": 0.7162363529205322, "Finetune/Step": 626, "Finetune/Step Time": 2.7060463316738605} +{"Finetune/Learning Rate": 1.9519578471620506e-05, "Finetune/Loss": 0.8697372674942017, "Finetune/Loss (Raw)": 0.8274244070053101, "Finetune/Step": 627, "Finetune/Step Time": 2.7125727273523808} +{"Finetune/Learning Rate": 1.951758257395942e-05, "Finetune/Loss": 0.8697535395622253, "Finetune/Loss (Raw)": 0.8894230723381042, "Finetune/Step": 628, "Finetune/Step Time": 2.709670254960656} +{"Finetune/Learning Rate": 1.9515582641407877e-05, "Finetune/Loss": 0.8698790669441223, "Finetune/Loss (Raw)": 0.8810992240905762, "Finetune/Step": 629, "Finetune/Step Time": 2.7100559901446104} +{"Finetune/Learning Rate": 1.9513578674813736e-05, "Finetune/Loss": 0.8702511787414551, "Finetune/Loss (Raw)": 0.9534618258476257, "Finetune/Step": 630, "Finetune/Step Time": 2.7099977396428585} +{"Finetune/Learning Rate": 1.951157067502656e-05, "Finetune/Loss": 0.8699126839637756, "Finetune/Loss (Raw)": 0.8624110817909241, "Finetune/Step": 631, "Finetune/Step Time": 2.715318849310279} +{"Finetune/Learning Rate": 1.9509558642897616e-05, "Finetune/Loss": 0.87005615234375, "Finetune/Loss (Raw)": 0.9046999216079712, "Finetune/Step": 632, "Finetune/Step Time": 2.711239540949464} +{"Finetune/Learning Rate": 1.9507542579279894e-05, "Finetune/Loss": 0.8669670224189758, "Finetune/Loss (Raw)": 0.6202349066734314, "Finetune/Step": 633, "Finetune/Step Time": 2.7351064700633287} +{"Finetune/Learning Rate": 1.9505522485028083e-05, "Finetune/Loss": 0.8667967319488525, "Finetune/Loss (Raw)": 0.8845698833465576, "Finetune/Step": 634, "Finetune/Step Time": 2.7379291020333767} +{"Finetune/Learning Rate": 1.9503498360998576e-05, "Finetune/Loss": 0.8664082884788513, "Finetune/Loss (Raw)": 0.8905256390571594, "Finetune/Step": 635, "Finetune/Step Time": 2.741042507812381} +{"Finetune/Learning Rate": 1.9501470208049494e-05, "Finetune/Loss": 0.8650460243225098, "Finetune/Loss (Raw)": 0.8229022026062012, "Finetune/Step": 636, "Finetune/Step Time": 2.7438947185873985} +{"Finetune/Learning Rate": 1.949943802704064e-05, "Finetune/Loss": 0.8650164604187012, "Finetune/Loss (Raw)": 0.9098081588745117, "Finetune/Step": 637, "Finetune/Step Time": 2.745680183172226} +{"Finetune/Learning Rate": 1.949740181883355e-05, "Finetune/Loss": 0.8666494488716125, "Finetune/Loss (Raw)": 0.7917019724845886, "Finetune/Step": 638, "Finetune/Step Time": 2.7266334798187017} +{"Finetune/Learning Rate": 1.949536158429145e-05, "Finetune/Loss": 0.8664112091064453, "Finetune/Loss (Raw)": 0.8884541988372803, "Finetune/Step": 639, "Finetune/Step Time": 2.72688302770257} +{"Finetune/Learning Rate": 1.9493317324279278e-05, "Finetune/Loss": 0.8671761751174927, "Finetune/Loss (Raw)": 0.9749688506126404, "Finetune/Step": 640, "Finetune/Step Time": 2.736443078145385} +{"Finetune/Learning Rate": 1.949126903966368e-05, "Finetune/Loss": 0.8659118413925171, "Finetune/Loss (Raw)": 0.8164513111114502, "Finetune/Step": 641, "Finetune/Step Time": 2.739553676918149} +{"Finetune/Learning Rate": 1.9489216731313007e-05, "Finetune/Loss": 0.8662093877792358, "Finetune/Loss (Raw)": 0.9103546738624573, "Finetune/Step": 642, "Finetune/Step Time": 2.738618714734912} +{"Finetune/Learning Rate": 1.9487160400097316e-05, "Finetune/Loss": 0.8665859699249268, "Finetune/Loss (Raw)": 0.8466205596923828, "Finetune/Step": 643, "Finetune/Step Time": 2.737027797847986} +{"Finetune/Learning Rate": 1.9485100046888374e-05, "Finetune/Loss": 0.8671619892120361, "Finetune/Loss (Raw)": 0.9545602798461914, "Finetune/Step": 644, "Finetune/Step Time": 2.7368980553001165} +{"Finetune/Learning Rate": 1.948303567255964e-05, "Finetune/Loss": 0.8677054047584534, "Finetune/Loss (Raw)": 0.8646939992904663, "Finetune/Step": 645, "Finetune/Step Time": 2.7444816660135984} +{"Finetune/Learning Rate": 1.9480967277986288e-05, "Finetune/Loss": 0.8682084083557129, "Finetune/Loss (Raw)": 0.830637514591217, "Finetune/Step": 646, "Finetune/Step Time": 2.7424071952700615} +{"Finetune/Learning Rate": 1.94788948640452e-05, "Finetune/Loss": 0.8676536083221436, "Finetune/Loss (Raw)": 0.8165093660354614, "Finetune/Step": 647, "Finetune/Step Time": 2.7418526522815228} +{"Finetune/Learning Rate": 1.9476818431614954e-05, "Finetune/Loss": 0.8679462671279907, "Finetune/Loss (Raw)": 0.8812623023986816, "Finetune/Step": 648, "Finetune/Step Time": 2.740748167037964} +{"Finetune/Learning Rate": 1.9474737981575833e-05, "Finetune/Loss": 0.8679193258285522, "Finetune/Loss (Raw)": 0.8545792102813721, "Finetune/Step": 649, "Finetune/Step Time": 2.738449040800333} +{"Finetune/Learning Rate": 1.9472653514809826e-05, "Finetune/Loss": 0.8680529594421387, "Finetune/Loss (Raw)": 0.8722624778747559, "Finetune/Step": 650, "Finetune/Step Time": 2.7371140122413635} +{"Finetune/Learning Rate": 1.9470565032200622e-05, "Finetune/Loss": 0.8677319288253784, "Finetune/Loss (Raw)": 0.8921874761581421, "Finetune/Step": 651, "Finetune/Step Time": 2.739678520709276} +{"Finetune/Learning Rate": 1.9468472534633615e-05, "Finetune/Loss": 0.8668506741523743, "Finetune/Loss (Raw)": 0.7790088653564453, "Finetune/Step": 652, "Finetune/Step Time": 2.74126691929996} +{"Finetune/Learning Rate": 1.94663760229959e-05, "Finetune/Loss": 0.866876482963562, "Finetune/Loss (Raw)": 0.8780246376991272, "Finetune/Step": 653, "Finetune/Step Time": 2.7396045606583357} +{"Finetune/Learning Rate": 1.946427549817627e-05, "Finetune/Loss": 0.8662256002426147, "Finetune/Loss (Raw)": 0.7652415633201599, "Finetune/Step": 654, "Finetune/Step Time": 2.7349747214466333} +{"Finetune/Learning Rate": 1.9462170961065225e-05, "Finetune/Loss": 0.8699859380722046, "Finetune/Loss (Raw)": 0.6601965427398682, "Finetune/Step": 655, "Finetune/Step Time": 2.7286217026412487} +{"Finetune/Learning Rate": 1.946006241255497e-05, "Finetune/Loss": 0.8721820116043091, "Finetune/Loss (Raw)": 0.9128023386001587, "Finetune/Step": 656, "Finetune/Step Time": 2.682614043354988} +{"Finetune/Learning Rate": 1.9457949853539393e-05, "Finetune/Loss": 0.8721082210540771, "Finetune/Loss (Raw)": 0.8402308821678162, "Finetune/Step": 657, "Finetune/Step Time": 2.6804155614227057} +{"Finetune/Learning Rate": 1.9455833284914102e-05, "Finetune/Loss": 0.8708678483963013, "Finetune/Loss (Raw)": 0.723885178565979, "Finetune/Step": 658, "Finetune/Step Time": 2.7030788641422987} +{"Finetune/Learning Rate": 1.9453712707576392e-05, "Finetune/Loss": 0.8702690005302429, "Finetune/Loss (Raw)": 0.8880477547645569, "Finetune/Step": 659, "Finetune/Step Time": 2.7066781409084797} +{"Finetune/Learning Rate": 1.9451588122425266e-05, "Finetune/Loss": 0.8707243800163269, "Finetune/Loss (Raw)": 0.8825300931930542, "Finetune/Step": 660, "Finetune/Step Time": 2.7125903014093637} +{"Finetune/Learning Rate": 1.944945953036142e-05, "Finetune/Loss": 0.8705036640167236, "Finetune/Loss (Raw)": 0.9034166932106018, "Finetune/Step": 661, "Finetune/Step Time": 2.7107282169163227} +{"Finetune/Learning Rate": 1.9447326932287254e-05, "Finetune/Loss": 0.8696058988571167, "Finetune/Loss (Raw)": 0.8595471978187561, "Finetune/Step": 662, "Finetune/Step Time": 2.711397437378764} +{"Finetune/Learning Rate": 1.9445190329106856e-05, "Finetune/Loss": 0.8691368103027344, "Finetune/Loss (Raw)": 0.8535099029541016, "Finetune/Step": 663, "Finetune/Step Time": 2.7113695349544287} +{"Finetune/Learning Rate": 1.9443049721726024e-05, "Finetune/Loss": 0.8681172132492065, "Finetune/Loss (Raw)": 0.8626298308372498, "Finetune/Step": 664, "Finetune/Step Time": 2.711431350558996} +{"Finetune/Learning Rate": 1.944090511105225e-05, "Finetune/Loss": 0.866533637046814, "Finetune/Loss (Raw)": 0.8029206991195679, "Finetune/Step": 665, "Finetune/Step Time": 2.7116167042404413} +{"Finetune/Learning Rate": 1.943875649799472e-05, "Finetune/Loss": 0.8640424013137817, "Finetune/Loss (Raw)": 0.6829544901847839, "Finetune/Step": 666, "Finetune/Step Time": 2.7372076213359833} +{"Finetune/Learning Rate": 1.9436603883464317e-05, "Finetune/Loss": 0.8637399673461914, "Finetune/Loss (Raw)": 0.8349359631538391, "Finetune/Step": 667, "Finetune/Step Time": 2.7392138596624136} +{"Finetune/Learning Rate": 1.943444726837362e-05, "Finetune/Loss": 0.863890528678894, "Finetune/Loss (Raw)": 0.9038389325141907, "Finetune/Step": 668, "Finetune/Step Time": 2.7391445711255074} +{"Finetune/Learning Rate": 1.943228665363691e-05, "Finetune/Loss": 0.863528847694397, "Finetune/Loss (Raw)": 0.9411885738372803, "Finetune/Step": 669, "Finetune/Step Time": 2.7380119152367115} +{"Finetune/Learning Rate": 1.9430122040170157e-05, "Finetune/Loss": 0.8613837957382202, "Finetune/Loss (Raw)": 0.5580313801765442, "Finetune/Step": 670, "Finetune/Step Time": 2.7656642589718103} +{"Finetune/Learning Rate": 1.9427953428891032e-05, "Finetune/Loss": 0.861283004283905, "Finetune/Loss (Raw)": 0.8691523671150208, "Finetune/Step": 671, "Finetune/Step Time": 2.76431324146688} +{"Finetune/Learning Rate": 1.9425780820718895e-05, "Finetune/Loss": 0.8622627258300781, "Finetune/Loss (Raw)": 0.9371321797370911, "Finetune/Step": 672, "Finetune/Step Time": 2.766789758577943} +{"Finetune/Learning Rate": 1.9423604216574804e-05, "Finetune/Loss": 0.862548828125, "Finetune/Loss (Raw)": 0.9022126197814941, "Finetune/Step": 673, "Finetune/Step Time": 2.7646240666508675} +{"Finetune/Learning Rate": 1.942142361738151e-05, "Finetune/Loss": 0.8626885414123535, "Finetune/Loss (Raw)": 0.8457815647125244, "Finetune/Step": 674, "Finetune/Step Time": 2.7653195280581713} +{"Finetune/Learning Rate": 1.9419239024063456e-05, "Finetune/Loss": 0.8622320294380188, "Finetune/Loss (Raw)": 0.8673725128173828, "Finetune/Step": 675, "Finetune/Step Time": 2.763967113569379} +{"Finetune/Learning Rate": 1.941705043754678e-05, "Finetune/Loss": 0.8629381656646729, "Finetune/Loss (Raw)": 0.9487860202789307, "Finetune/Step": 676, "Finetune/Step Time": 2.764203554019332} +{"Finetune/Learning Rate": 1.9414857858759314e-05, "Finetune/Loss": 0.8635862469673157, "Finetune/Loss (Raw)": 0.9306063055992126, "Finetune/Step": 677, "Finetune/Step Time": 2.7670410070568323} +{"Finetune/Learning Rate": 1.9412661288630585e-05, "Finetune/Loss": 0.8629252910614014, "Finetune/Loss (Raw)": 0.8488314151763916, "Finetune/Step": 678, "Finetune/Step Time": 2.766670096665621} +{"Finetune/Learning Rate": 1.9410460728091802e-05, "Finetune/Loss": 0.8631020784378052, "Finetune/Loss (Raw)": 0.9550703763961792, "Finetune/Step": 679, "Finetune/Step Time": 2.764994814991951} +{"Finetune/Learning Rate": 1.9408256178075875e-05, "Finetune/Loss": 0.8622783422470093, "Finetune/Loss (Raw)": 0.8013967275619507, "Finetune/Step": 680, "Finetune/Step Time": 2.7657177913933992} +{"Finetune/Learning Rate": 1.9406047639517402e-05, "Finetune/Loss": 0.8628294467926025, "Finetune/Loss (Raw)": 0.9359879493713379, "Finetune/Step": 681, "Finetune/Step Time": 2.7658576741814613} +{"Finetune/Learning Rate": 1.9403835113352674e-05, "Finetune/Loss": 0.862481951713562, "Finetune/Loss (Raw)": 0.8302803635597229, "Finetune/Step": 682, "Finetune/Step Time": 2.765349142253399} +{"Finetune/Learning Rate": 1.9401618600519668e-05, "Finetune/Loss": 0.8623595833778381, "Finetune/Loss (Raw)": 0.8739800453186035, "Finetune/Step": 683, "Finetune/Step Time": 2.763356188312173} +{"Finetune/Learning Rate": 1.9399398101958054e-05, "Finetune/Loss": 0.8636798858642578, "Finetune/Loss (Raw)": 0.9726483821868896, "Finetune/Step": 684, "Finetune/Step Time": 2.7640759628266096} +{"Finetune/Learning Rate": 1.93971736186092e-05, "Finetune/Loss": 0.8645138740539551, "Finetune/Loss (Raw)": 0.8402730822563171, "Finetune/Step": 685, "Finetune/Step Time": 2.7436567433178425} +{"Finetune/Learning Rate": 1.939494515141614e-05, "Finetune/Loss": 0.8653876185417175, "Finetune/Loss (Raw)": 0.9753987193107605, "Finetune/Step": 686, "Finetune/Step Time": 2.7440946586430073} +{"Finetune/Learning Rate": 1.9392712701323627e-05, "Finetune/Loss": 0.8649004697799683, "Finetune/Loss (Raw)": 0.8730550408363342, "Finetune/Step": 687, "Finetune/Step Time": 2.744905339553952} +{"Finetune/Learning Rate": 1.9390476269278077e-05, "Finetune/Loss": 0.8642632961273193, "Finetune/Loss (Raw)": 0.8022318482398987, "Finetune/Step": 688, "Finetune/Step Time": 2.743574356660247} +{"Finetune/Learning Rate": 1.938823585622761e-05, "Finetune/Loss": 0.8610798120498657, "Finetune/Loss (Raw)": 0.46225738525390625, "Finetune/Step": 689, "Finetune/Step Time": 2.770488951355219} +{"Finetune/Learning Rate": 1.9385991463122022e-05, "Finetune/Loss": 0.8629370927810669, "Finetune/Loss (Raw)": 0.8185205459594727, "Finetune/Step": 690, "Finetune/Step Time": 2.748215703293681} +{"Finetune/Learning Rate": 1.938374309091281e-05, "Finetune/Loss": 0.862324595451355, "Finetune/Loss (Raw)": 0.8144082427024841, "Finetune/Step": 691, "Finetune/Step Time": 2.7466449458152056} +{"Finetune/Learning Rate": 1.9381490740553147e-05, "Finetune/Loss": 0.8610799312591553, "Finetune/Loss (Raw)": 0.7854898571968079, "Finetune/Step": 692, "Finetune/Step Time": 2.748392954468727} +{"Finetune/Learning Rate": 1.93792344129979e-05, "Finetune/Loss": 0.857994556427002, "Finetune/Loss (Raw)": 0.5881182551383972, "Finetune/Step": 693, "Finetune/Step Time": 2.7731165196746588} +{"Finetune/Learning Rate": 1.9376974109203604e-05, "Finetune/Loss": 0.8568354845046997, "Finetune/Loss (Raw)": 0.8176324963569641, "Finetune/Step": 694, "Finetune/Step Time": 2.7723452895879745} +{"Finetune/Learning Rate": 1.937470983012851e-05, "Finetune/Loss": 0.8565315008163452, "Finetune/Loss (Raw)": 0.8771708607673645, "Finetune/Step": 695, "Finetune/Step Time": 2.7748686019331217} +{"Finetune/Learning Rate": 1.9372441576732533e-05, "Finetune/Loss": 0.8576302528381348, "Finetune/Loss (Raw)": 0.9613168239593506, "Finetune/Step": 696, "Finetune/Step Time": 2.782016798853874} +{"Finetune/Learning Rate": 1.9370169349977278e-05, "Finetune/Loss": 0.8574790358543396, "Finetune/Loss (Raw)": 0.8447755575180054, "Finetune/Step": 697, "Finetune/Step Time": 2.7801648303866386} +{"Finetune/Learning Rate": 1.9367893150826033e-05, "Finetune/Loss": 0.8574765920639038, "Finetune/Loss (Raw)": 0.8878591656684875, "Finetune/Step": 698, "Finetune/Step Time": 2.774273058399558} +{"Finetune/Learning Rate": 1.936561298024377e-05, "Finetune/Loss": 0.8578301072120667, "Finetune/Loss (Raw)": 0.9403363466262817, "Finetune/Step": 699, "Finetune/Step Time": 2.7780147530138493} +{"Finetune/Learning Rate": 1.936332883919715e-05, "Finetune/Loss": 0.8574918508529663, "Finetune/Loss (Raw)": 0.8310967087745667, "Finetune/Step": 700, "Finetune/Step Time": 2.77712276019156} +{"Finetune/Learning Rate": 1.936104072865451e-05, "Finetune/Loss": 0.8559082746505737, "Finetune/Loss (Raw)": 0.6736449599266052, "Finetune/Step": 701, "Finetune/Step Time": 2.8028645925223827} +{"Finetune/Learning Rate": 1.9358748649585874e-05, "Finetune/Loss": 0.8570922017097473, "Finetune/Loss (Raw)": 0.9630993604660034, "Finetune/Step": 702, "Finetune/Step Time": 2.801719570532441} +{"Finetune/Learning Rate": 1.9356452602962947e-05, "Finetune/Loss": 0.8557882308959961, "Finetune/Loss (Raw)": 0.7174581289291382, "Finetune/Step": 703, "Finetune/Step Time": 2.8008785750716925} +{"Finetune/Learning Rate": 1.9354152589759114e-05, "Finetune/Loss": 0.8561701774597168, "Finetune/Loss (Raw)": 0.9796499013900757, "Finetune/Step": 704, "Finetune/Step Time": 2.8002044931054115} +{"Finetune/Learning Rate": 1.9351848610949454e-05, "Finetune/Loss": 0.85551917552948, "Finetune/Loss (Raw)": 0.9005162119865417, "Finetune/Step": 705, "Finetune/Step Time": 2.8008424285799265} +{"Finetune/Learning Rate": 1.9349540667510705e-05, "Finetune/Loss": 0.855257511138916, "Finetune/Loss (Raw)": 0.9025982618331909, "Finetune/Step": 706, "Finetune/Step Time": 2.8018156327307224} +{"Finetune/Learning Rate": 1.9347228760421308e-05, "Finetune/Loss": 0.8559055328369141, "Finetune/Loss (Raw)": 0.8369883894920349, "Finetune/Step": 707, "Finetune/Step Time": 2.8012643419206142} +{"Finetune/Learning Rate": 1.934491289066137e-05, "Finetune/Loss": 0.8558690547943115, "Finetune/Loss (Raw)": 0.8007673025131226, "Finetune/Step": 708, "Finetune/Step Time": 2.8040976747870445} +{"Finetune/Learning Rate": 1.934259305921268e-05, "Finetune/Loss": 0.8562892079353333, "Finetune/Loss (Raw)": 0.8908266425132751, "Finetune/Step": 709, "Finetune/Step Time": 2.8065474070608616} +{"Finetune/Learning Rate": 1.9340269267058714e-05, "Finetune/Loss": 0.8555619120597839, "Finetune/Loss (Raw)": 0.8558696508407593, "Finetune/Step": 710, "Finetune/Step Time": 2.8071460258215666} +{"Finetune/Learning Rate": 1.933794151518462e-05, "Finetune/Loss": 0.8558197021484375, "Finetune/Loss (Raw)": 0.9032422304153442, "Finetune/Step": 711, "Finetune/Step Time": 2.806098597124219} +{"Finetune/Learning Rate": 1.9335609804577226e-05, "Finetune/Loss": 0.8547952175140381, "Finetune/Loss (Raw)": 0.8698028922080994, "Finetune/Step": 712, "Finetune/Step Time": 2.7971292193979025} +{"Finetune/Learning Rate": 1.933327413622504e-05, "Finetune/Loss": 0.8514392971992493, "Finetune/Loss (Raw)": 0.5096723437309265, "Finetune/Step": 713, "Finetune/Step Time": 2.825457625091076} +{"Finetune/Learning Rate": 1.933093451111825e-05, "Finetune/Loss": 0.8521100878715515, "Finetune/Loss (Raw)": 0.7561477422714233, "Finetune/Step": 714, "Finetune/Step Time": 2.803629716858268} +{"Finetune/Learning Rate": 1.932859093024871e-05, "Finetune/Loss": 0.8523626327514648, "Finetune/Loss (Raw)": 0.9344879984855652, "Finetune/Step": 715, "Finetune/Step Time": 2.804095294326544} +{"Finetune/Learning Rate": 1.9326243394609966e-05, "Finetune/Loss": 0.8535973429679871, "Finetune/Loss (Raw)": 0.9595827460289001, "Finetune/Step": 716, "Finetune/Step Time": 2.805738525465131} +{"Finetune/Learning Rate": 1.932389190519723e-05, "Finetune/Loss": 0.8536940217018127, "Finetune/Loss (Raw)": 0.8618990778923035, "Finetune/Step": 717, "Finetune/Step Time": 2.8067260179668665} +{"Finetune/Learning Rate": 1.9321536463007396e-05, "Finetune/Loss": 0.8536024689674377, "Finetune/Loss (Raw)": 0.8888906836509705, "Finetune/Step": 718, "Finetune/Step Time": 2.807366529479623} +{"Finetune/Learning Rate": 1.931917706903903e-05, "Finetune/Loss": 0.8531160354614258, "Finetune/Loss (Raw)": 0.80723637342453, "Finetune/Step": 719, "Finetune/Step Time": 2.809699224308133} +{"Finetune/Learning Rate": 1.931681372429238e-05, "Finetune/Loss": 0.8528602123260498, "Finetune/Loss (Raw)": 0.8371882438659668, "Finetune/Step": 720, "Finetune/Step Time": 2.8077668081969023} +{"Finetune/Learning Rate": 1.931444642976936e-05, "Finetune/Loss": 0.8515986800193787, "Finetune/Loss (Raw)": 0.7916483283042908, "Finetune/Step": 721, "Finetune/Step Time": 2.8074117805808783} +{"Finetune/Learning Rate": 1.9312075186473564e-05, "Finetune/Loss": 0.8520527482032776, "Finetune/Loss (Raw)": 0.8798829913139343, "Finetune/Step": 722, "Finetune/Step Time": 2.8053280021995306} +{"Finetune/Learning Rate": 1.9309699995410253e-05, "Finetune/Loss": 0.8513814806938171, "Finetune/Loss (Raw)": 0.7933404445648193, "Finetune/Step": 723, "Finetune/Step Time": 2.8071699179708958} +{"Finetune/Learning Rate": 1.9307320857586377e-05, "Finetune/Loss": 0.8512369394302368, "Finetune/Loss (Raw)": 0.8307515978813171, "Finetune/Step": 724, "Finetune/Step Time": 2.804293777793646} +{"Finetune/Learning Rate": 1.9304937774010542e-05, "Finetune/Loss": 0.8513203263282776, "Finetune/Loss (Raw)": 0.9341264367103577, "Finetune/Step": 725, "Finetune/Step Time": 2.806658986955881} +{"Finetune/Learning Rate": 1.9302550745693035e-05, "Finetune/Loss": 0.8520956635475159, "Finetune/Loss (Raw)": 0.9620549082756042, "Finetune/Step": 726, "Finetune/Step Time": 2.8062395248562098} +{"Finetune/Learning Rate": 1.9300159773645816e-05, "Finetune/Loss": 0.8542320132255554, "Finetune/Loss (Raw)": 0.8557030558586121, "Finetune/Step": 727, "Finetune/Step Time": 2.7838108893483877} +{"Finetune/Learning Rate": 1.9297764858882516e-05, "Finetune/Loss": 0.854483425617218, "Finetune/Loss (Raw)": 0.8677093982696533, "Finetune/Step": 728, "Finetune/Step Time": 2.7824516277760267} +{"Finetune/Learning Rate": 1.9295366002418434e-05, "Finetune/Loss": 0.8534610271453857, "Finetune/Loss (Raw)": 0.8517694473266602, "Finetune/Step": 729, "Finetune/Step Time": 2.7808816134929657} +{"Finetune/Learning Rate": 1.9292963205270546e-05, "Finetune/Loss": 0.8498448729515076, "Finetune/Loss (Raw)": 0.35537779331207275, "Finetune/Step": 730, "Finetune/Step Time": 2.809781387448311} +{"Finetune/Learning Rate": 1.929055646845749e-05, "Finetune/Loss": 0.8500443696975708, "Finetune/Loss (Raw)": 0.9068491458892822, "Finetune/Step": 731, "Finetune/Step Time": 2.8095703218132257} +{"Finetune/Learning Rate": 1.928814579299959e-05, "Finetune/Loss": 0.8481019735336304, "Finetune/Loss (Raw)": 0.6940301656723022, "Finetune/Step": 732, "Finetune/Step Time": 2.83555699698627} +{"Finetune/Learning Rate": 1.928573117991882e-05, "Finetune/Loss": 0.8482322692871094, "Finetune/Loss (Raw)": 0.8663328886032104, "Finetune/Step": 733, "Finetune/Step Time": 2.835772840306163} +{"Finetune/Learning Rate": 1.9283312630238837e-05, "Finetune/Loss": 0.8465777635574341, "Finetune/Loss (Raw)": 0.6072169542312622, "Finetune/Step": 734, "Finetune/Step Time": 2.8582490608096123} +{"Finetune/Learning Rate": 1.928089014498496e-05, "Finetune/Loss": 0.8467377424240112, "Finetune/Loss (Raw)": 0.8889784812927246, "Finetune/Step": 735, "Finetune/Step Time": 2.857128396630287} +{"Finetune/Learning Rate": 1.927846372518418e-05, "Finetune/Loss": 0.8467759490013123, "Finetune/Loss (Raw)": 0.8461776375770569, "Finetune/Step": 736, "Finetune/Step Time": 2.8585571218281984} +{"Finetune/Learning Rate": 1.9276033371865157e-05, "Finetune/Loss": 0.8473026752471924, "Finetune/Loss (Raw)": 0.9101080894470215, "Finetune/Step": 737, "Finetune/Step Time": 2.857412699609995} +{"Finetune/Learning Rate": 1.9273599086058214e-05, "Finetune/Loss": 0.8473715782165527, "Finetune/Loss (Raw)": 0.8848061561584473, "Finetune/Step": 738, "Finetune/Step Time": 2.8620418552309275} +{"Finetune/Learning Rate": 1.927116086879534e-05, "Finetune/Loss": 0.8484698534011841, "Finetune/Loss (Raw)": 0.9803929328918457, "Finetune/Step": 739, "Finetune/Step Time": 2.861607301980257} +{"Finetune/Learning Rate": 1.9268718721110207e-05, "Finetune/Loss": 0.8485580682754517, "Finetune/Loss (Raw)": 0.8943567872047424, "Finetune/Step": 740, "Finetune/Step Time": 2.86500489898026} +{"Finetune/Learning Rate": 1.9266272644038133e-05, "Finetune/Loss": 0.848020613193512, "Finetune/Loss (Raw)": 0.847862720489502, "Finetune/Step": 741, "Finetune/Step Time": 2.8652469515800476} +{"Finetune/Learning Rate": 1.9263822638616107e-05, "Finetune/Loss": 0.8490352034568787, "Finetune/Loss (Raw)": 0.8774303197860718, "Finetune/Step": 742, "Finetune/Step Time": 2.8671641312539577} +{"Finetune/Learning Rate": 1.9261368705882785e-05, "Finetune/Loss": 0.8494163155555725, "Finetune/Loss (Raw)": 0.942039430141449, "Finetune/Step": 743, "Finetune/Step Time": 2.865095155313611} +{"Finetune/Learning Rate": 1.92589108468785e-05, "Finetune/Loss": 0.8477159142494202, "Finetune/Loss (Raw)": 0.7606083154678345, "Finetune/Step": 744, "Finetune/Step Time": 2.865715242922306} +{"Finetune/Learning Rate": 1.9256449062645227e-05, "Finetune/Loss": 0.8471623659133911, "Finetune/Loss (Raw)": 0.830352246761322, "Finetune/Step": 745, "Finetune/Step Time": 2.8695861026644707} +{"Finetune/Learning Rate": 1.925398335422662e-05, "Finetune/Loss": 0.8464028835296631, "Finetune/Loss (Raw)": 0.8624255657196045, "Finetune/Step": 746, "Finetune/Step Time": 2.8720248211175203} +{"Finetune/Learning Rate": 1.9251513722667995e-05, "Finetune/Loss": 0.8456511497497559, "Finetune/Loss (Raw)": 0.8604027628898621, "Finetune/Step": 747, "Finetune/Step Time": 2.874021030962467} +{"Finetune/Learning Rate": 1.9249040169016325e-05, "Finetune/Loss": 0.8460632562637329, "Finetune/Loss (Raw)": 0.9101013541221619, "Finetune/Step": 748, "Finetune/Step Time": 2.8753248304128647} +{"Finetune/Learning Rate": 1.9246562694320258e-05, "Finetune/Loss": 0.8456912040710449, "Finetune/Loss (Raw)": 0.7985453009605408, "Finetune/Step": 749, "Finetune/Step Time": 2.8926052674651146} +{"Finetune/Learning Rate": 1.9244081299630088e-05, "Finetune/Loss": 0.8457813262939453, "Finetune/Loss (Raw)": 0.8971846103668213, "Finetune/Step": 750, "Finetune/Step Time": 2.8931636102497578} +{"Finetune/Learning Rate": 1.9241595985997784e-05, "Finetune/Loss": 0.8456794023513794, "Finetune/Loss (Raw)": 0.8655545115470886, "Finetune/Step": 751, "Finetune/Step Time": 2.8926400374621153} +{"Finetune/Learning Rate": 1.923910675447697e-05, "Finetune/Loss": 0.8457757234573364, "Finetune/Loss (Raw)": 0.9076493382453918, "Finetune/Step": 752, "Finetune/Step Time": 2.8970873672515154} +{"Finetune/Learning Rate": 1.9236613606122927e-05, "Finetune/Loss": 0.8453537225723267, "Finetune/Loss (Raw)": 0.8637759685516357, "Finetune/Step": 753, "Finetune/Step Time": 2.898457497358322} +{"Finetune/Learning Rate": 1.9234116541992615e-05, "Finetune/Loss": 0.8462875485420227, "Finetune/Loss (Raw)": 0.8357638716697693, "Finetune/Step": 754, "Finetune/Step Time": 2.875826647505164} +{"Finetune/Learning Rate": 1.923161556314463e-05, "Finetune/Loss": 0.8447550535202026, "Finetune/Loss (Raw)": 0.6312692165374756, "Finetune/Step": 755, "Finetune/Step Time": 2.8960789795964956} +{"Finetune/Learning Rate": 1.922911067063924e-05, "Finetune/Loss": 0.8441346287727356, "Finetune/Loss (Raw)": 0.8100059032440186, "Finetune/Step": 756, "Finetune/Step Time": 2.9017118513584137} +{"Finetune/Learning Rate": 1.9226601865538377e-05, "Finetune/Loss": 0.8439353704452515, "Finetune/Loss (Raw)": 0.8555973172187805, "Finetune/Step": 757, "Finetune/Step Time": 2.8993005752563477} +{"Finetune/Learning Rate": 1.9224089148905622e-05, "Finetune/Loss": 0.8436843156814575, "Finetune/Loss (Raw)": 0.9213185906410217, "Finetune/Step": 758, "Finetune/Step Time": 2.903050610795617} +{"Finetune/Learning Rate": 1.9221572521806213e-05, "Finetune/Loss": 0.8432313203811646, "Finetune/Loss (Raw)": 0.8044310212135315, "Finetune/Step": 759, "Finetune/Step Time": 2.894847696647048} +{"Finetune/Learning Rate": 1.921905198530706e-05, "Finetune/Loss": 0.8431447148323059, "Finetune/Loss (Raw)": 0.8936156630516052, "Finetune/Step": 760, "Finetune/Step Time": 2.897826539352536} +{"Finetune/Learning Rate": 1.9216527540476713e-05, "Finetune/Loss": 0.8453733921051025, "Finetune/Loss (Raw)": 0.9054969549179077, "Finetune/Step": 761, "Finetune/Step Time": 2.8737327735871077} +{"Finetune/Learning Rate": 1.921399918838539e-05, "Finetune/Loss": 0.8453949689865112, "Finetune/Loss (Raw)": 0.8873355984687805, "Finetune/Step": 762, "Finetune/Step Time": 2.872787293046713} +{"Finetune/Learning Rate": 1.9211466930104963e-05, "Finetune/Loss": 0.8451007604598999, "Finetune/Loss (Raw)": 0.8528712391853333, "Finetune/Step": 763, "Finetune/Step Time": 2.8703175839036703} +{"Finetune/Learning Rate": 1.920893076670896e-05, "Finetune/Loss": 0.8448581695556641, "Finetune/Loss (Raw)": 0.7918498516082764, "Finetune/Step": 764, "Finetune/Step Time": 2.868899704888463} +{"Finetune/Learning Rate": 1.9206390699272558e-05, "Finetune/Loss": 0.8443909883499146, "Finetune/Loss (Raw)": 0.8500088453292847, "Finetune/Step": 765, "Finetune/Step Time": 2.867156248539686} +{"Finetune/Learning Rate": 1.9203846728872603e-05, "Finetune/Loss": 0.8446770906448364, "Finetune/Loss (Raw)": 0.8283286690711975, "Finetune/Step": 766, "Finetune/Step Time": 2.867468999698758} +{"Finetune/Learning Rate": 1.9201298856587584e-05, "Finetune/Loss": 0.8443046808242798, "Finetune/Loss (Raw)": 0.840783417224884, "Finetune/Step": 767, "Finetune/Step Time": 2.8672188110649586} +{"Finetune/Learning Rate": 1.9198747083497643e-05, "Finetune/Loss": 0.8431956768035889, "Finetune/Loss (Raw)": 0.8330150842666626, "Finetune/Step": 768, "Finetune/Step Time": 2.856883829459548} +{"Finetune/Learning Rate": 1.9196191410684588e-05, "Finetune/Loss": 0.8433172106742859, "Finetune/Loss (Raw)": 0.8320063948631287, "Finetune/Step": 769, "Finetune/Step Time": 2.856525456532836} +{"Finetune/Learning Rate": 1.919363183923187e-05, "Finetune/Loss": 0.8435189127922058, "Finetune/Loss (Raw)": 0.9361777305603027, "Finetune/Step": 770, "Finetune/Step Time": 2.8571580350399017} +{"Finetune/Learning Rate": 1.9191068370224595e-05, "Finetune/Loss": 0.8446118831634521, "Finetune/Loss (Raw)": 0.9865193963050842, "Finetune/Step": 771, "Finetune/Step Time": 2.855632282793522} +{"Finetune/Learning Rate": 1.918850100474952e-05, "Finetune/Loss": 0.8443838357925415, "Finetune/Loss (Raw)": 0.9253678917884827, "Finetune/Step": 772, "Finetune/Step Time": 2.856828585267067} +{"Finetune/Learning Rate": 1.918592974389506e-05, "Finetune/Loss": 0.8441676497459412, "Finetune/Loss (Raw)": 0.8370200991630554, "Finetune/Step": 773, "Finetune/Step Time": 2.85020075365901} +{"Finetune/Learning Rate": 1.9183354588751274e-05, "Finetune/Loss": 0.8441128134727478, "Finetune/Loss (Raw)": 0.8236196637153625, "Finetune/Step": 774, "Finetune/Step Time": 2.850800732150674} +{"Finetune/Learning Rate": 1.9180775540409876e-05, "Finetune/Loss": 0.844515323638916, "Finetune/Loss (Raw)": 0.8680344223976135, "Finetune/Step": 775, "Finetune/Step Time": 2.8506648894399405} +{"Finetune/Learning Rate": 1.9178192599964228e-05, "Finetune/Loss": 0.8441163301467896, "Finetune/Loss (Raw)": 0.830187976360321, "Finetune/Step": 776, "Finetune/Step Time": 2.851727169007063} +{"Finetune/Learning Rate": 1.9175605768509348e-05, "Finetune/Loss": 0.8438339829444885, "Finetune/Loss (Raw)": 0.818431556224823, "Finetune/Step": 777, "Finetune/Step Time": 2.8504130486398935} +{"Finetune/Learning Rate": 1.9173015047141888e-05, "Finetune/Loss": 0.8431463837623596, "Finetune/Loss (Raw)": 0.7842519879341125, "Finetune/Step": 778, "Finetune/Step Time": 2.8478928804397583} +{"Finetune/Learning Rate": 1.9170420436960174e-05, "Finetune/Loss": 0.8433048725128174, "Finetune/Loss (Raw)": 0.9124820232391357, "Finetune/Step": 779, "Finetune/Step Time": 2.848009992390871} +{"Finetune/Learning Rate": 1.9167821939064158e-05, "Finetune/Loss": 0.8445826768875122, "Finetune/Loss (Raw)": 0.9425674676895142, "Finetune/Step": 780, "Finetune/Step Time": 2.8509772159159184} +{"Finetune/Learning Rate": 1.9165219554555458e-05, "Finetune/Loss": 0.8448792695999146, "Finetune/Loss (Raw)": 0.9159785509109497, "Finetune/Step": 781, "Finetune/Step Time": 2.8527636881917715} +{"Finetune/Learning Rate": 1.9162613284537318e-05, "Finetune/Loss": 0.8446065187454224, "Finetune/Loss (Raw)": 0.7303354144096375, "Finetune/Step": 782, "Finetune/Step Time": 2.857938602566719} +{"Finetune/Learning Rate": 1.9160003130114653e-05, "Finetune/Loss": 0.8463358283042908, "Finetune/Loss (Raw)": 0.8815483450889587, "Finetune/Step": 783, "Finetune/Step Time": 2.8352576959878206} +{"Finetune/Learning Rate": 1.9157389092394005e-05, "Finetune/Loss": 0.8454570770263672, "Finetune/Loss (Raw)": 0.8003271818161011, "Finetune/Step": 784, "Finetune/Step Time": 2.8363985270261765} +{"Finetune/Learning Rate": 1.9154771172483575e-05, "Finetune/Loss": 0.845067024230957, "Finetune/Loss (Raw)": 0.7903044819831848, "Finetune/Step": 785, "Finetune/Step Time": 2.8388044498860836} +{"Finetune/Learning Rate": 1.9152149371493207e-05, "Finetune/Loss": 0.8459038138389587, "Finetune/Loss (Raw)": 0.830995500087738, "Finetune/Step": 786, "Finetune/Step Time": 2.8192241322249174} +{"Finetune/Learning Rate": 1.9149523690534388e-05, "Finetune/Loss": 0.8455535173416138, "Finetune/Loss (Raw)": 0.8432043194770813, "Finetune/Step": 787, "Finetune/Step Time": 2.8164130859076977} +{"Finetune/Learning Rate": 1.9146894130720252e-05, "Finetune/Loss": 0.8436154723167419, "Finetune/Loss (Raw)": 0.6344605684280396, "Finetune/Step": 788, "Finetune/Step Time": 2.835956085473299} +{"Finetune/Learning Rate": 1.9144260693165573e-05, "Finetune/Loss": 0.8434183597564697, "Finetune/Loss (Raw)": 0.8781839609146118, "Finetune/Step": 789, "Finetune/Step Time": 2.841362252831459} +{"Finetune/Learning Rate": 1.9141623378986772e-05, "Finetune/Loss": 0.8418399095535278, "Finetune/Loss (Raw)": 0.6575061678886414, "Finetune/Step": 790, "Finetune/Step Time": 2.862754672765732} +{"Finetune/Learning Rate": 1.913898218930192e-05, "Finetune/Loss": 0.8424807190895081, "Finetune/Loss (Raw)": 0.9355339407920837, "Finetune/Step": 791, "Finetune/Step Time": 2.86046127602458} +{"Finetune/Learning Rate": 1.913633712523072e-05, "Finetune/Loss": 0.8427723050117493, "Finetune/Loss (Raw)": 0.8999564051628113, "Finetune/Step": 792, "Finetune/Step Time": 2.862661972641945} +{"Finetune/Learning Rate": 1.9133688187894527e-05, "Finetune/Loss": 0.8427443504333496, "Finetune/Loss (Raw)": 0.7993395328521729, "Finetune/Step": 793, "Finetune/Step Time": 2.8614785615354776} +{"Finetune/Learning Rate": 1.9131035378416322e-05, "Finetune/Loss": 0.8444175720214844, "Finetune/Loss (Raw)": 0.8971239924430847, "Finetune/Step": 794, "Finetune/Step Time": 2.837448626756668} +{"Finetune/Learning Rate": 1.912837869792075e-05, "Finetune/Loss": 0.8440673351287842, "Finetune/Loss (Raw)": 0.7901079654693604, "Finetune/Step": 795, "Finetune/Step Time": 2.838234033435583} +{"Finetune/Learning Rate": 1.9125718147534086e-05, "Finetune/Loss": 0.8435468673706055, "Finetune/Loss (Raw)": 0.8372211456298828, "Finetune/Step": 796, "Finetune/Step Time": 2.83953027240932} +{"Finetune/Learning Rate": 1.912305372838424e-05, "Finetune/Loss": 0.8431494235992432, "Finetune/Loss (Raw)": 0.8903101086616516, "Finetune/Step": 797, "Finetune/Step Time": 2.840094557031989} +{"Finetune/Learning Rate": 1.9120385441600766e-05, "Finetune/Loss": 0.8454787731170654, "Finetune/Loss (Raw)": 0.8561895489692688, "Finetune/Step": 798, "Finetune/Step Time": 2.8135951682925224} +{"Finetune/Learning Rate": 1.9117713288314864e-05, "Finetune/Loss": 0.8450392484664917, "Finetune/Loss (Raw)": 0.8129002451896667, "Finetune/Step": 799, "Finetune/Step Time": 2.810041857883334} +{"Finetune/Learning Rate": 1.9115037269659366e-05, "Finetune/Loss": 0.844684898853302, "Finetune/Loss (Raw)": 0.8917773365974426, "Finetune/Step": 800, "Finetune/Step Time": 2.809671161696315} +{"Finetune/Learning Rate": 1.9112357386768748e-05, "Finetune/Loss": 0.8447350859642029, "Finetune/Loss (Raw)": 0.908628523349762, "Finetune/Step": 801, "Finetune/Step Time": 2.810462648048997} +{"Finetune/Learning Rate": 1.9109673640779124e-05, "Finetune/Loss": 0.8463484048843384, "Finetune/Loss (Raw)": 1.0522937774658203, "Finetune/Step": 802, "Finetune/Step Time": 2.8089619744569063} +{"Finetune/Learning Rate": 1.9106986032828233e-05, "Finetune/Loss": 0.8466720581054688, "Finetune/Loss (Raw)": 0.9087918996810913, "Finetune/Step": 803, "Finetune/Step Time": 2.8090484980493784} +{"Finetune/Learning Rate": 1.9104294564055472e-05, "Finetune/Loss": 0.8459048271179199, "Finetune/Loss (Raw)": 0.8505831360816956, "Finetune/Step": 804, "Finetune/Step Time": 2.8155344054102898} +{"Finetune/Learning Rate": 1.910159923560186e-05, "Finetune/Loss": 0.8419482111930847, "Finetune/Loss (Raw)": 0.4241587221622467, "Finetune/Step": 805, "Finetune/Step Time": 2.8422172404825687} +{"Finetune/Learning Rate": 1.9098900048610053e-05, "Finetune/Loss": 0.8431564569473267, "Finetune/Loss (Raw)": 1.0034819841384888, "Finetune/Step": 806, "Finetune/Step Time": 2.8457306679338217} +{"Finetune/Learning Rate": 1.9096197004224347e-05, "Finetune/Loss": 0.8422492742538452, "Finetune/Loss (Raw)": 0.838959813117981, "Finetune/Step": 807, "Finetune/Step Time": 2.849867571145296} +{"Finetune/Learning Rate": 1.9093490103590678e-05, "Finetune/Loss": 0.8424983024597168, "Finetune/Loss (Raw)": 0.8332767486572266, "Finetune/Step": 808, "Finetune/Step Time": 2.8566856998950243} +{"Finetune/Learning Rate": 1.9090779347856607e-05, "Finetune/Loss": 0.8413861989974976, "Finetune/Loss (Raw)": 0.793634295463562, "Finetune/Step": 809, "Finetune/Step Time": 2.854043224826455} +{"Finetune/Learning Rate": 1.9088064738171334e-05, "Finetune/Loss": 0.8436027765274048, "Finetune/Loss (Raw)": 1.113998293876648, "Finetune/Step": 810, "Finetune/Step Time": 2.856924580410123} +{"Finetune/Learning Rate": 1.9085346275685695e-05, "Finetune/Loss": 0.8434871435165405, "Finetune/Loss (Raw)": 0.8591763973236084, "Finetune/Step": 811, "Finetune/Step Time": 2.8549756184220314} +{"Finetune/Learning Rate": 1.9082623961552153e-05, "Finetune/Loss": 0.8429506421089172, "Finetune/Loss (Raw)": 0.9039825797080994, "Finetune/Step": 812, "Finetune/Step Time": 2.8526564855128527} +{"Finetune/Learning Rate": 1.9079897796924808e-05, "Finetune/Loss": 0.8438680171966553, "Finetune/Loss (Raw)": 0.9576975703239441, "Finetune/Step": 813, "Finetune/Step Time": 2.8495049104094505} +{"Finetune/Learning Rate": 1.9077167782959395e-05, "Finetune/Loss": 0.8428893089294434, "Finetune/Loss (Raw)": 0.8501265048980713, "Finetune/Step": 814, "Finetune/Step Time": 2.8494713120162487} +{"Finetune/Learning Rate": 1.9074433920813276e-05, "Finetune/Loss": 0.8423262238502502, "Finetune/Loss (Raw)": 0.8009743690490723, "Finetune/Step": 815, "Finetune/Step Time": 2.8497849106788635} +{"Finetune/Learning Rate": 1.907169621164545e-05, "Finetune/Loss": 0.8431747555732727, "Finetune/Loss (Raw)": 0.9108465909957886, "Finetune/Step": 816, "Finetune/Step Time": 2.8515976890921593} +{"Finetune/Learning Rate": 1.906895465661654e-05, "Finetune/Loss": 0.8467538356781006, "Finetune/Loss (Raw)": 0.9203699827194214, "Finetune/Step": 817, "Finetune/Step Time": 2.824460217729211} +{"Finetune/Learning Rate": 1.9066209256888798e-05, "Finetune/Loss": 0.8473761677742004, "Finetune/Loss (Raw)": 0.8981907367706299, "Finetune/Step": 818, "Finetune/Step Time": 2.8223521392792463} +{"Finetune/Learning Rate": 1.906346001362612e-05, "Finetune/Loss": 0.8479882478713989, "Finetune/Loss (Raw)": 0.8927455544471741, "Finetune/Step": 819, "Finetune/Step Time": 2.826110852882266} +{"Finetune/Learning Rate": 1.9060706927994018e-05, "Finetune/Loss": 0.8494209051132202, "Finetune/Loss (Raw)": 0.9688711166381836, "Finetune/Step": 820, "Finetune/Step Time": 2.8240409549325705} +{"Finetune/Learning Rate": 1.905795000115963e-05, "Finetune/Loss": 0.8516790270805359, "Finetune/Loss (Raw)": 0.8771597146987915, "Finetune/Step": 821, "Finetune/Step Time": 2.797705886885524} +{"Finetune/Learning Rate": 1.9055189234291746e-05, "Finetune/Loss": 0.8522131443023682, "Finetune/Loss (Raw)": 0.8860021233558655, "Finetune/Step": 822, "Finetune/Step Time": 2.797193259000778} +{"Finetune/Learning Rate": 1.905242462856075e-05, "Finetune/Loss": 0.8517621755599976, "Finetune/Loss (Raw)": 0.8194413781166077, "Finetune/Step": 823, "Finetune/Step Time": 2.7978834863752127} +{"Finetune/Learning Rate": 1.904965618513868e-05, "Finetune/Loss": 0.851114809513092, "Finetune/Loss (Raw)": 0.8784589767456055, "Finetune/Step": 824, "Finetune/Step Time": 2.790469642728567} +{"Finetune/Learning Rate": 1.904688390519919e-05, "Finetune/Loss": 0.8509287238121033, "Finetune/Loss (Raw)": 0.8209515810012817, "Finetune/Step": 825, "Finetune/Step Time": 2.79292094707489} +{"Finetune/Learning Rate": 1.9044107789917565e-05, "Finetune/Loss": 0.8503299355506897, "Finetune/Loss (Raw)": 0.8112194538116455, "Finetune/Step": 826, "Finetune/Step Time": 2.796716818585992} +{"Finetune/Learning Rate": 1.904132784047071e-05, "Finetune/Loss": 0.8492285013198853, "Finetune/Loss (Raw)": 0.7993462085723877, "Finetune/Step": 827, "Finetune/Step Time": 2.7968869879841805} +{"Finetune/Learning Rate": 1.9038544058037157e-05, "Finetune/Loss": 0.849435031414032, "Finetune/Loss (Raw)": 0.8575380444526672, "Finetune/Step": 828, "Finetune/Step Time": 2.7971669528633356} +{"Finetune/Learning Rate": 1.903575644379707e-05, "Finetune/Loss": 0.8507623672485352, "Finetune/Loss (Raw)": 0.8435360193252563, "Finetune/Step": 829, "Finetune/Step Time": 2.775538133457303} +{"Finetune/Learning Rate": 1.9032964998932227e-05, "Finetune/Loss": 0.8506436347961426, "Finetune/Loss (Raw)": 0.9479144811630249, "Finetune/Step": 830, "Finetune/Step Time": 2.772094551473856} +{"Finetune/Learning Rate": 1.9030169724626035e-05, "Finetune/Loss": 0.8529990911483765, "Finetune/Loss (Raw)": 1.0189489126205444, "Finetune/Step": 831, "Finetune/Step Time": 2.7720264475792646} +{"Finetune/Learning Rate": 1.902737062206353e-05, "Finetune/Loss": 0.8527509570121765, "Finetune/Loss (Raw)": 0.9478908181190491, "Finetune/Step": 832, "Finetune/Step Time": 2.770475994795561} +{"Finetune/Learning Rate": 1.902456769243136e-05, "Finetune/Loss": 0.8528969287872314, "Finetune/Loss (Raw)": 0.9192035794258118, "Finetune/Step": 833, "Finetune/Step Time": 2.7677722051739693} +{"Finetune/Learning Rate": 1.9021760936917802e-05, "Finetune/Loss": 0.8532341718673706, "Finetune/Loss (Raw)": 0.9457634091377258, "Finetune/Step": 834, "Finetune/Step Time": 2.767409337684512} +{"Finetune/Learning Rate": 1.901895035671276e-05, "Finetune/Loss": 0.8532260656356812, "Finetune/Loss (Raw)": 0.835952639579773, "Finetune/Step": 835, "Finetune/Step Time": 2.769578892737627} +{"Finetune/Learning Rate": 1.9016135953007745e-05, "Finetune/Loss": 0.8534246683120728, "Finetune/Loss (Raw)": 0.8261809349060059, "Finetune/Step": 836, "Finetune/Step Time": 2.7655533235520124} +{"Finetune/Learning Rate": 1.9013317726995896e-05, "Finetune/Loss": 0.852672278881073, "Finetune/Loss (Raw)": 0.7945284247398376, "Finetune/Step": 837, "Finetune/Step Time": 2.7635778952389956} +{"Finetune/Learning Rate": 1.9010495679871984e-05, "Finetune/Loss": 0.8533269166946411, "Finetune/Loss (Raw)": 0.9396570920944214, "Finetune/Step": 838, "Finetune/Step Time": 2.7625708114355803} +{"Finetune/Learning Rate": 1.900766981283238e-05, "Finetune/Loss": 0.8532065153121948, "Finetune/Loss (Raw)": 0.8878340125083923, "Finetune/Step": 839, "Finetune/Step Time": 2.764833377674222} +{"Finetune/Learning Rate": 1.9004840127075085e-05, "Finetune/Loss": 0.853518009185791, "Finetune/Loss (Raw)": 0.9096696376800537, "Finetune/Step": 840, "Finetune/Step Time": 2.7664654292166233} +{"Finetune/Learning Rate": 1.9002006623799723e-05, "Finetune/Loss": 0.8546176552772522, "Finetune/Loss (Raw)": 0.6504330039024353, "Finetune/Step": 841, "Finetune/Step Time": 2.7586925867944956} +{"Finetune/Learning Rate": 1.899916930420753e-05, "Finetune/Loss": 0.855972170829773, "Finetune/Loss (Raw)": 0.9295299053192139, "Finetune/Step": 842, "Finetune/Step Time": 2.7604194562882185} +{"Finetune/Learning Rate": 1.8996328169501362e-05, "Finetune/Loss": 0.8554794788360596, "Finetune/Loss (Raw)": 0.87141352891922, "Finetune/Step": 843, "Finetune/Step Time": 2.7606338169425726} +{"Finetune/Learning Rate": 1.8993483220885688e-05, "Finetune/Loss": 0.854205310344696, "Finetune/Loss (Raw)": 0.7964950799942017, "Finetune/Step": 844, "Finetune/Step Time": 2.7532178964465857} +{"Finetune/Learning Rate": 1.8990634459566596e-05, "Finetune/Loss": 0.8535991907119751, "Finetune/Loss (Raw)": 0.7843097448348999, "Finetune/Step": 845, "Finetune/Step Time": 2.754481380805373} +{"Finetune/Learning Rate": 1.89877818867518e-05, "Finetune/Loss": 0.8533242344856262, "Finetune/Loss (Raw)": 0.8536996841430664, "Finetune/Step": 846, "Finetune/Step Time": 2.7545393351465464} +{"Finetune/Learning Rate": 1.898492550365061e-05, "Finetune/Loss": 0.8537270426750183, "Finetune/Loss (Raw)": 0.8587992787361145, "Finetune/Step": 847, "Finetune/Step Time": 2.7532092928886414} +{"Finetune/Learning Rate": 1.898206531147397e-05, "Finetune/Loss": 0.8543323874473572, "Finetune/Loss (Raw)": 0.9146681427955627, "Finetune/Step": 848, "Finetune/Step Time": 2.750678738579154} +{"Finetune/Learning Rate": 1.8979201311434434e-05, "Finetune/Loss": 0.8500560522079468, "Finetune/Loss (Raw)": 0.2442808598279953, "Finetune/Step": 849, "Finetune/Step Time": 2.7779481112957} +{"Finetune/Learning Rate": 1.8976333504746164e-05, "Finetune/Loss": 0.8505555391311646, "Finetune/Loss (Raw)": 0.9438130259513855, "Finetune/Step": 850, "Finetune/Step Time": 2.778430113568902} +{"Finetune/Learning Rate": 1.8973461892624943e-05, "Finetune/Loss": 0.8517319560050964, "Finetune/Loss (Raw)": 0.9439245462417603, "Finetune/Step": 851, "Finetune/Step Time": 2.7782749962061644} +{"Finetune/Learning Rate": 1.897058647628816e-05, "Finetune/Loss": 0.8517234325408936, "Finetune/Loss (Raw)": 0.8296618461608887, "Finetune/Step": 852, "Finetune/Step Time": 2.775849100202322} +{"Finetune/Learning Rate": 1.8967707256954824e-05, "Finetune/Loss": 0.8514963388442993, "Finetune/Loss (Raw)": 0.9050601720809937, "Finetune/Step": 853, "Finetune/Step Time": 2.7759430166333914} +{"Finetune/Learning Rate": 1.8964824235845557e-05, "Finetune/Loss": 0.8511494398117065, "Finetune/Loss (Raw)": 0.9176461100578308, "Finetune/Step": 854, "Finetune/Step Time": 2.7792059369385242} +{"Finetune/Learning Rate": 1.896193741418258e-05, "Finetune/Loss": 0.851651132106781, "Finetune/Loss (Raw)": 0.9199240803718567, "Finetune/Step": 855, "Finetune/Step Time": 2.780264250934124} +{"Finetune/Learning Rate": 1.895904679318974e-05, "Finetune/Loss": 0.852295994758606, "Finetune/Loss (Raw)": 0.950246274471283, "Finetune/Step": 856, "Finetune/Step Time": 2.7760189957916737} +{"Finetune/Learning Rate": 1.8956152374092493e-05, "Finetune/Loss": 0.8530547618865967, "Finetune/Loss (Raw)": 0.9488935470581055, "Finetune/Step": 857, "Finetune/Step Time": 2.7784934490919113} +{"Finetune/Learning Rate": 1.8953254158117888e-05, "Finetune/Loss": 0.8566832542419434, "Finetune/Loss (Raw)": 0.8198240399360657, "Finetune/Step": 858, "Finetune/Step Time": 2.748389445245266} +{"Finetune/Learning Rate": 1.8950352146494605e-05, "Finetune/Loss": 0.8561040163040161, "Finetune/Loss (Raw)": 0.8327082991600037, "Finetune/Step": 859, "Finetune/Step Time": 2.7473384719341993} +{"Finetune/Learning Rate": 1.8947446340452926e-05, "Finetune/Loss": 0.8575476408004761, "Finetune/Loss (Raw)": 0.8788157105445862, "Finetune/Step": 860, "Finetune/Step Time": 2.7243038043379784} +{"Finetune/Learning Rate": 1.894453674122474e-05, "Finetune/Loss": 0.8577144742012024, "Finetune/Loss (Raw)": 0.8876886367797852, "Finetune/Step": 861, "Finetune/Step Time": 2.726579340174794} +{"Finetune/Learning Rate": 1.894162335004354e-05, "Finetune/Loss": 0.8600338697433472, "Finetune/Loss (Raw)": 0.9040958285331726, "Finetune/Step": 862, "Finetune/Step Time": 2.7029122561216354} +{"Finetune/Learning Rate": 1.8938706168144434e-05, "Finetune/Loss": 0.8599441051483154, "Finetune/Loss (Raw)": 0.8774954676628113, "Finetune/Step": 863, "Finetune/Step Time": 2.7003718744963408} +{"Finetune/Learning Rate": 1.893578519676414e-05, "Finetune/Loss": 0.8595995903015137, "Finetune/Loss (Raw)": 0.8020731210708618, "Finetune/Step": 864, "Finetune/Step Time": 2.7102574445307255} +{"Finetune/Learning Rate": 1.893286043714096e-05, "Finetune/Loss": 0.8596189022064209, "Finetune/Loss (Raw)": 0.9125797152519226, "Finetune/Step": 865, "Finetune/Step Time": 2.7154744043946266} +{"Finetune/Learning Rate": 1.8929931890514836e-05, "Finetune/Loss": 0.8590784072875977, "Finetune/Loss (Raw)": 0.8156223297119141, "Finetune/Step": 866, "Finetune/Step Time": 2.71307079680264} +{"Finetune/Learning Rate": 1.8926999558127293e-05, "Finetune/Loss": 0.8577545881271362, "Finetune/Loss (Raw)": 0.8109528422355652, "Finetune/Step": 867, "Finetune/Step Time": 2.7126543261110783} +{"Finetune/Learning Rate": 1.892406344122146e-05, "Finetune/Loss": 0.8574322462081909, "Finetune/Loss (Raw)": 0.8530969619750977, "Finetune/Step": 868, "Finetune/Step Time": 2.7098733093589544} +{"Finetune/Learning Rate": 1.8921123541042082e-05, "Finetune/Loss": 0.8575625419616699, "Finetune/Loss (Raw)": 0.8645311594009399, "Finetune/Step": 869, "Finetune/Step Time": 2.7096258141100407} +{"Finetune/Learning Rate": 1.89181798588355e-05, "Finetune/Loss": 0.8572980165481567, "Finetune/Loss (Raw)": 0.8435819745063782, "Finetune/Step": 870, "Finetune/Step Time": 2.7084657009691} +{"Finetune/Learning Rate": 1.8915232395849666e-05, "Finetune/Loss": 0.8559126853942871, "Finetune/Loss (Raw)": 0.7647127509117126, "Finetune/Step": 871, "Finetune/Step Time": 2.708931712433696} +{"Finetune/Learning Rate": 1.8912281153334122e-05, "Finetune/Loss": 0.8566699028015137, "Finetune/Loss (Raw)": 0.8575337529182434, "Finetune/Step": 872, "Finetune/Step Time": 2.7121397014707327} +{"Finetune/Learning Rate": 1.8909326132540022e-05, "Finetune/Loss": 0.8570584654808044, "Finetune/Loss (Raw)": 0.880083441734314, "Finetune/Step": 873, "Finetune/Step Time": 2.7105072662234306} +{"Finetune/Learning Rate": 1.8906367334720125e-05, "Finetune/Loss": 0.8577100038528442, "Finetune/Loss (Raw)": 0.9458269476890564, "Finetune/Step": 874, "Finetune/Step Time": 2.7114393189549446} +{"Finetune/Learning Rate": 1.8903404761128774e-05, "Finetune/Loss": 0.8581624031066895, "Finetune/Loss (Raw)": 0.9183125495910645, "Finetune/Step": 875, "Finetune/Step Time": 2.7086694706231356} +{"Finetune/Learning Rate": 1.890043841302194e-05, "Finetune/Loss": 0.8573474884033203, "Finetune/Loss (Raw)": 0.8057919144630432, "Finetune/Step": 876, "Finetune/Step Time": 2.7037387620657682} +{"Finetune/Learning Rate": 1.8897468291657163e-05, "Finetune/Loss": 0.8575047850608826, "Finetune/Loss (Raw)": 0.8186718821525574, "Finetune/Step": 877, "Finetune/Step Time": 2.685559095814824} +{"Finetune/Learning Rate": 1.889449439829361e-05, "Finetune/Loss": 0.8576769828796387, "Finetune/Loss (Raw)": 0.9192347526550293, "Finetune/Step": 878, "Finetune/Step Time": 2.689462212845683} +{"Finetune/Learning Rate": 1.889151673419203e-05, "Finetune/Loss": 0.8584585189819336, "Finetune/Loss (Raw)": 0.9655776619911194, "Finetune/Step": 879, "Finetune/Step Time": 2.689379071816802} +{"Finetune/Learning Rate": 1.8888535300614774e-05, "Finetune/Loss": 0.8578284382820129, "Finetune/Loss (Raw)": 0.8270043730735779, "Finetune/Step": 880, "Finetune/Step Time": 2.680749421939254} +{"Finetune/Learning Rate": 1.8885550098825798e-05, "Finetune/Loss": 0.8579362034797668, "Finetune/Loss (Raw)": 0.8775713443756104, "Finetune/Step": 881, "Finetune/Step Time": 2.6845028065145016} +{"Finetune/Learning Rate": 1.8882561130090648e-05, "Finetune/Loss": 0.8580157160758972, "Finetune/Loss (Raw)": 0.8459416031837463, "Finetune/Step": 882, "Finetune/Step Time": 2.689783029258251} +{"Finetune/Learning Rate": 1.887956839567647e-05, "Finetune/Loss": 0.8597222566604614, "Finetune/Loss (Raw)": 0.8497018218040466, "Finetune/Step": 883, "Finetune/Step Time": 2.664841152727604} +{"Finetune/Learning Rate": 1.887657189685201e-05, "Finetune/Loss": 0.8598698377609253, "Finetune/Loss (Raw)": 0.8289059400558472, "Finetune/Step": 884, "Finetune/Step Time": 2.6631545834243298} +{"Finetune/Learning Rate": 1.887357163488759e-05, "Finetune/Loss": 0.8601951599121094, "Finetune/Loss (Raw)": 0.8972260355949402, "Finetune/Step": 885, "Finetune/Step Time": 2.6646150201559067} +{"Finetune/Learning Rate": 1.8870567611055167e-05, "Finetune/Loss": 0.8582802414894104, "Finetune/Loss (Raw)": 0.67621910572052, "Finetune/Step": 886, "Finetune/Step Time": 2.6807812359184027} +{"Finetune/Learning Rate": 1.886755982662825e-05, "Finetune/Loss": 0.858950138092041, "Finetune/Loss (Raw)": 0.8901764154434204, "Finetune/Step": 887, "Finetune/Step Time": 2.686509782448411} +{"Finetune/Learning Rate": 1.886454828288197e-05, "Finetune/Loss": 0.8581157922744751, "Finetune/Loss (Raw)": 0.7868125438690186, "Finetune/Step": 888, "Finetune/Step Time": 2.6882979162037373} +{"Finetune/Learning Rate": 1.8861532981093038e-05, "Finetune/Loss": 0.8579615354537964, "Finetune/Loss (Raw)": 0.8857631087303162, "Finetune/Step": 889, "Finetune/Step Time": 2.690398095175624} +{"Finetune/Learning Rate": 1.8858513922539766e-05, "Finetune/Loss": 0.8576472997665405, "Finetune/Loss (Raw)": 0.847106397151947, "Finetune/Step": 890, "Finetune/Step Time": 2.6884100064635277} +{"Finetune/Learning Rate": 1.885549110850206e-05, "Finetune/Loss": 0.8576267957687378, "Finetune/Loss (Raw)": 0.8502517342567444, "Finetune/Step": 891, "Finetune/Step Time": 2.6900916192680597} +{"Finetune/Learning Rate": 1.8852464540261403e-05, "Finetune/Loss": 0.8580289483070374, "Finetune/Loss (Raw)": 0.8433218598365784, "Finetune/Step": 892, "Finetune/Step Time": 2.6910694297403097} +{"Finetune/Learning Rate": 1.884943421910089e-05, "Finetune/Loss": 0.8585107922554016, "Finetune/Loss (Raw)": 0.911683976650238, "Finetune/Step": 893, "Finetune/Step Time": 2.6900759898126125} +{"Finetune/Learning Rate": 1.88464001463052e-05, "Finetune/Loss": 0.8592385053634644, "Finetune/Loss (Raw)": 0.9214837551116943, "Finetune/Step": 894, "Finetune/Step Time": 2.687072951346636} +{"Finetune/Learning Rate": 1.8843362323160582e-05, "Finetune/Loss": 0.8596999049186707, "Finetune/Loss (Raw)": 0.8998339772224426, "Finetune/Step": 895, "Finetune/Step Time": 2.683947781100869} +{"Finetune/Learning Rate": 1.8840320750954913e-05, "Finetune/Loss": 0.8583331108093262, "Finetune/Loss (Raw)": 0.658062219619751, "Finetune/Step": 896, "Finetune/Step Time": 2.709503611549735} +{"Finetune/Learning Rate": 1.883727543097763e-05, "Finetune/Loss": 0.8587743639945984, "Finetune/Loss (Raw)": 0.8884938955307007, "Finetune/Step": 897, "Finetune/Step Time": 2.709805019199848} +{"Finetune/Learning Rate": 1.8834226364519766e-05, "Finetune/Loss": 0.859160304069519, "Finetune/Loss (Raw)": 0.9855777025222778, "Finetune/Step": 898, "Finetune/Step Time": 2.7090733125805855} +{"Finetune/Learning Rate": 1.8831173552873946e-05, "Finetune/Loss": 0.8578556776046753, "Finetune/Loss (Raw)": 0.8195264339447021, "Finetune/Step": 899, "Finetune/Step Time": 2.7131178490817547} +{"Finetune/Learning Rate": 1.8828116997334387e-05, "Finetune/Loss": 0.8570225834846497, "Finetune/Loss (Raw)": 0.818729817867279, "Finetune/Step": 900, "Finetune/Step Time": 2.7182484045624733} +{"Finetune/Learning Rate": 1.882505669919688e-05, "Finetune/Loss": 0.8569135069847107, "Finetune/Loss (Raw)": 0.8230565786361694, "Finetune/Step": 901, "Finetune/Step Time": 2.7179795745760202} +{"Finetune/Learning Rate": 1.8821992659758813e-05, "Finetune/Loss": 0.8569872379302979, "Finetune/Loss (Raw)": 0.8330629467964172, "Finetune/Step": 902, "Finetune/Step Time": 2.7227197010070086} +{"Finetune/Learning Rate": 1.8818924880319156e-05, "Finetune/Loss": 0.8570106029510498, "Finetune/Loss (Raw)": 0.8710219860076904, "Finetune/Step": 903, "Finetune/Step Time": 2.724522840231657} +{"Finetune/Learning Rate": 1.881585336217847e-05, "Finetune/Loss": 0.8574241399765015, "Finetune/Loss (Raw)": 0.8831189274787903, "Finetune/Step": 904, "Finetune/Step Time": 2.723348941653967} +{"Finetune/Learning Rate": 1.881277810663889e-05, "Finetune/Loss": 0.8588160276412964, "Finetune/Loss (Raw)": 0.9966020584106445, "Finetune/Step": 905, "Finetune/Step Time": 2.7277637999504805} +{"Finetune/Learning Rate": 1.880969911500414e-05, "Finetune/Loss": 0.859607458114624, "Finetune/Loss (Raw)": 0.8855500817298889, "Finetune/Step": 906, "Finetune/Step Time": 2.730874879285693} +{"Finetune/Learning Rate": 1.880661638857954e-05, "Finetune/Loss": 0.8597214221954346, "Finetune/Loss (Raw)": 0.9270629286766052, "Finetune/Step": 907, "Finetune/Step Time": 2.726650008931756} +{"Finetune/Learning Rate": 1.880352992867197e-05, "Finetune/Loss": 0.8591985106468201, "Finetune/Loss (Raw)": 0.8756414651870728, "Finetune/Step": 908, "Finetune/Step Time": 2.7246340792626143} +{"Finetune/Learning Rate": 1.8800439736589924e-05, "Finetune/Loss": 0.8589402437210083, "Finetune/Loss (Raw)": 0.8829153776168823, "Finetune/Step": 909, "Finetune/Step Time": 2.727094516158104} +{"Finetune/Learning Rate": 1.8797345813643444e-05, "Finetune/Loss": 0.8604140877723694, "Finetune/Loss (Raw)": 0.9189903140068054, "Finetune/Step": 910, "Finetune/Step Time": 2.725724134594202} +{"Finetune/Learning Rate": 1.8794248161144174e-05, "Finetune/Loss": 0.8604294061660767, "Finetune/Loss (Raw)": 0.883509635925293, "Finetune/Step": 911, "Finetune/Step Time": 2.7220899127423763} +{"Finetune/Learning Rate": 1.879114678040534e-05, "Finetune/Loss": 0.8599250316619873, "Finetune/Loss (Raw)": 0.7357632517814636, "Finetune/Step": 912, "Finetune/Step Time": 2.7218752279877663} +{"Finetune/Learning Rate": 1.8788041672741735e-05, "Finetune/Loss": 0.8611568212509155, "Finetune/Loss (Raw)": 0.9479760527610779, "Finetune/Step": 913, "Finetune/Step Time": 2.719337448477745} +{"Finetune/Learning Rate": 1.8784932839469747e-05, "Finetune/Loss": 0.8609803318977356, "Finetune/Loss (Raw)": 0.808407187461853, "Finetune/Step": 914, "Finetune/Step Time": 2.716500084847212} +{"Finetune/Learning Rate": 1.8781820281907335e-05, "Finetune/Loss": 0.858217716217041, "Finetune/Loss (Raw)": 0.4895865023136139, "Finetune/Step": 915, "Finetune/Step Time": 2.7385172601789236} +{"Finetune/Learning Rate": 1.877870400137404e-05, "Finetune/Loss": 0.859686017036438, "Finetune/Loss (Raw)": 0.8224051594734192, "Finetune/Step": 916, "Finetune/Step Time": 2.716255597770214} +{"Finetune/Learning Rate": 1.8775583999190975e-05, "Finetune/Loss": 0.8599787354469299, "Finetune/Loss (Raw)": 0.9156509637832642, "Finetune/Step": 917, "Finetune/Step Time": 2.713147282600403} +{"Finetune/Learning Rate": 1.8772460276680843e-05, "Finetune/Loss": 0.8625132441520691, "Finetune/Loss (Raw)": 0.9819220900535583, "Finetune/Step": 918, "Finetune/Step Time": 2.691563844680786} +{"Finetune/Learning Rate": 1.8769332835167914e-05, "Finetune/Loss": 0.8614385724067688, "Finetune/Loss (Raw)": 0.7979837656021118, "Finetune/Step": 919, "Finetune/Step Time": 2.6959163807332516} +{"Finetune/Learning Rate": 1.8766201675978038e-05, "Finetune/Loss": 0.8617193698883057, "Finetune/Loss (Raw)": 0.9358868598937988, "Finetune/Step": 920, "Finetune/Step Time": 2.7012858614325523} +{"Finetune/Learning Rate": 1.8763066800438638e-05, "Finetune/Loss": 0.8599539995193481, "Finetune/Loss (Raw)": 0.5733767151832581, "Finetune/Step": 921, "Finetune/Step Time": 2.726185319945216} +{"Finetune/Learning Rate": 1.8759928209878718e-05, "Finetune/Loss": 0.860274076461792, "Finetune/Loss (Raw)": 0.9380936026573181, "Finetune/Step": 922, "Finetune/Step Time": 2.7260098550468683} +{"Finetune/Learning Rate": 1.8756785905628852e-05, "Finetune/Loss": 0.859791100025177, "Finetune/Loss (Raw)": 0.7282867431640625, "Finetune/Step": 923, "Finetune/Step Time": 2.746326481923461} +{"Finetune/Learning Rate": 1.8753639889021197e-05, "Finetune/Loss": 0.8596506118774414, "Finetune/Loss (Raw)": 0.8192436099052429, "Finetune/Step": 924, "Finetune/Step Time": 2.7439317535609007} +{"Finetune/Learning Rate": 1.875049016138947e-05, "Finetune/Loss": 0.8598682880401611, "Finetune/Loss (Raw)": 0.9181655049324036, "Finetune/Step": 925, "Finetune/Step Time": 2.744405595585704} +{"Finetune/Learning Rate": 1.874733672406897e-05, "Finetune/Loss": 0.8595991730690002, "Finetune/Loss (Raw)": 0.8217461109161377, "Finetune/Step": 926, "Finetune/Step Time": 2.747593382373452} +{"Finetune/Learning Rate": 1.8744179578396572e-05, "Finetune/Loss": 0.8569222092628479, "Finetune/Loss (Raw)": 0.47025078535079956, "Finetune/Step": 927, "Finetune/Step Time": 2.779120897874236} +{"Finetune/Learning Rate": 1.8741018725710712e-05, "Finetune/Loss": 0.8567782640457153, "Finetune/Loss (Raw)": 0.8733488917350769, "Finetune/Step": 928, "Finetune/Step Time": 2.7775188367813826} +{"Finetune/Learning Rate": 1.873785416735141e-05, "Finetune/Loss": 0.856691837310791, "Finetune/Loss (Raw)": 0.897563636302948, "Finetune/Step": 929, "Finetune/Step Time": 2.776252254843712} +{"Finetune/Learning Rate": 1.8734685904660245e-05, "Finetune/Loss": 0.855384111404419, "Finetune/Loss (Raw)": 0.8849117159843445, "Finetune/Step": 930, "Finetune/Step Time": 2.7775494512170553} +{"Finetune/Learning Rate": 1.873151393898038e-05, "Finetune/Loss": 0.8548191785812378, "Finetune/Loss (Raw)": 0.8364772796630859, "Finetune/Step": 931, "Finetune/Step Time": 2.7800681367516518} +{"Finetune/Learning Rate": 1.8728338271656533e-05, "Finetune/Loss": 0.8553674817085266, "Finetune/Loss (Raw)": 0.9207653999328613, "Finetune/Step": 932, "Finetune/Step Time": 2.7774174623191357} +{"Finetune/Learning Rate": 1.8725158904035005e-05, "Finetune/Loss": 0.8582586050033569, "Finetune/Loss (Raw)": 0.7942192554473877, "Finetune/Step": 933, "Finetune/Step Time": 2.750739023089409} +{"Finetune/Learning Rate": 1.8721975837463656e-05, "Finetune/Loss": 0.8574316501617432, "Finetune/Loss (Raw)": 0.8976355791091919, "Finetune/Step": 934, "Finetune/Step Time": 2.745550986379385} +{"Finetune/Learning Rate": 1.8718789073291915e-05, "Finetune/Loss": 0.8579280376434326, "Finetune/Loss (Raw)": 0.9025009870529175, "Finetune/Step": 935, "Finetune/Step Time": 2.740540862083435} +{"Finetune/Learning Rate": 1.8715598612870783e-05, "Finetune/Loss": 0.858628511428833, "Finetune/Loss (Raw)": 0.9229370355606079, "Finetune/Step": 936, "Finetune/Step Time": 2.72979917563498} +{"Finetune/Learning Rate": 1.8712404457552827e-05, "Finetune/Loss": 0.8593119978904724, "Finetune/Loss (Raw)": 0.8811157941818237, "Finetune/Step": 937, "Finetune/Step Time": 2.732313971966505} +{"Finetune/Learning Rate": 1.8709206608692177e-05, "Finetune/Loss": 0.8575327396392822, "Finetune/Loss (Raw)": 0.8862595558166504, "Finetune/Step": 938, "Finetune/Step Time": 2.731204444542527} +{"Finetune/Learning Rate": 1.8706005067644536e-05, "Finetune/Loss": 0.8578317761421204, "Finetune/Loss (Raw)": 0.8974484205245972, "Finetune/Step": 939, "Finetune/Step Time": 2.732567897066474} +{"Finetune/Learning Rate": 1.8702799835767162e-05, "Finetune/Loss": 0.8579952716827393, "Finetune/Loss (Raw)": 0.9249081015586853, "Finetune/Step": 940, "Finetune/Step Time": 2.7347191609442234} +{"Finetune/Learning Rate": 1.869959091441889e-05, "Finetune/Loss": 0.8568594455718994, "Finetune/Loss (Raw)": 0.8123204708099365, "Finetune/Step": 941, "Finetune/Step Time": 2.739606609568} +{"Finetune/Learning Rate": 1.8696378304960104e-05, "Finetune/Loss": 0.8568377494812012, "Finetune/Loss (Raw)": 0.8473431468009949, "Finetune/Step": 942, "Finetune/Step Time": 2.7428231574594975} +{"Finetune/Learning Rate": 1.8693162008752766e-05, "Finetune/Loss": 0.8576334714889526, "Finetune/Loss (Raw)": 0.9028223752975464, "Finetune/Step": 943, "Finetune/Step Time": 2.742214797064662} +{"Finetune/Learning Rate": 1.868994202716039e-05, "Finetune/Loss": 0.8571996688842773, "Finetune/Loss (Raw)": 0.8553188443183899, "Finetune/Step": 944, "Finetune/Step Time": 2.7394223026931286} +{"Finetune/Learning Rate": 1.868671836154806e-05, "Finetune/Loss": 0.8571344614028931, "Finetune/Loss (Raw)": 0.9120239019393921, "Finetune/Step": 945, "Finetune/Step Time": 2.738796688616276} +{"Finetune/Learning Rate": 1.868349101328242e-05, "Finetune/Loss": 0.8563547134399414, "Finetune/Loss (Raw)": 0.7983871698379517, "Finetune/Step": 946, "Finetune/Step Time": 2.739988636225462} +{"Finetune/Learning Rate": 1.8680259983731674e-05, "Finetune/Loss": 0.8558569550514221, "Finetune/Loss (Raw)": 0.8290337324142456, "Finetune/Step": 947, "Finetune/Step Time": 2.739478964358568} +{"Finetune/Learning Rate": 1.8677025274265585e-05, "Finetune/Loss": 0.8553963899612427, "Finetune/Loss (Raw)": 0.9099236726760864, "Finetune/Step": 948, "Finetune/Step Time": 2.7436586897820234} +{"Finetune/Learning Rate": 1.8673786886255478e-05, "Finetune/Loss": 0.855061411857605, "Finetune/Loss (Raw)": 0.8342715501785278, "Finetune/Step": 949, "Finetune/Step Time": 2.7451119404286146} +{"Finetune/Learning Rate": 1.8670544821074237e-05, "Finetune/Loss": 0.8537377119064331, "Finetune/Loss (Raw)": 0.7165835499763489, "Finetune/Step": 950, "Finetune/Step Time": 2.7496187426149845} +{"Finetune/Learning Rate": 1.866729908009631e-05, "Finetune/Loss": 0.8537755012512207, "Finetune/Loss (Raw)": 0.8242651224136353, "Finetune/Step": 951, "Finetune/Step Time": 2.7457418460398912} +{"Finetune/Learning Rate": 1.866404966469769e-05, "Finetune/Loss": 0.8534278273582458, "Finetune/Loss (Raw)": 0.8339588642120361, "Finetune/Step": 952, "Finetune/Step Time": 2.7450582403689623} +{"Finetune/Learning Rate": 1.8660796576255947e-05, "Finetune/Loss": 0.8535858988761902, "Finetune/Loss (Raw)": 0.841188907623291, "Finetune/Step": 953, "Finetune/Step Time": 2.7436878997832537} +{"Finetune/Learning Rate": 1.865753981615019e-05, "Finetune/Loss": 0.8548580408096313, "Finetune/Loss (Raw)": 0.9740532636642456, "Finetune/Step": 954, "Finetune/Step Time": 2.7433489598333836} +{"Finetune/Learning Rate": 1.8654279385761092e-05, "Finetune/Loss": 0.8533774614334106, "Finetune/Loss (Raw)": 0.6098292469978333, "Finetune/Step": 955, "Finetune/Step Time": 2.7638206016272306} +{"Finetune/Learning Rate": 1.865101528647089e-05, "Finetune/Loss": 0.8532150983810425, "Finetune/Loss (Raw)": 0.8367506265640259, "Finetune/Step": 956, "Finetune/Step Time": 2.769869351759553} +{"Finetune/Learning Rate": 1.864774751966336e-05, "Finetune/Loss": 0.8538196086883545, "Finetune/Loss (Raw)": 0.9209181666374207, "Finetune/Step": 957, "Finetune/Step Time": 2.7686289343982935} +{"Finetune/Learning Rate": 1.8644476086723843e-05, "Finetune/Loss": 0.8540092706680298, "Finetune/Loss (Raw)": 0.9721944332122803, "Finetune/Step": 958, "Finetune/Step Time": 2.7706520948559046} +{"Finetune/Learning Rate": 1.8641200989039238e-05, "Finetune/Loss": 0.8523699045181274, "Finetune/Loss (Raw)": 0.8091090321540833, "Finetune/Step": 959, "Finetune/Step Time": 2.769917355850339} +{"Finetune/Learning Rate": 1.863792222799798e-05, "Finetune/Loss": 0.8521295189857483, "Finetune/Loss (Raw)": 0.9171169400215149, "Finetune/Step": 960, "Finetune/Step Time": 2.7709880992770195} +{"Finetune/Learning Rate": 1.8634639804990084e-05, "Finetune/Loss": 0.8514759540557861, "Finetune/Loss (Raw)": 0.8355550765991211, "Finetune/Step": 961, "Finetune/Step Time": 2.7725873831659555} +{"Finetune/Learning Rate": 1.863135372140709e-05, "Finetune/Loss": 0.8501129150390625, "Finetune/Loss (Raw)": 0.7712886929512024, "Finetune/Step": 962, "Finetune/Step Time": 2.7934407368302345} +{"Finetune/Learning Rate": 1.862806397864211e-05, "Finetune/Loss": 0.8497732877731323, "Finetune/Loss (Raw)": 0.7924811840057373, "Finetune/Step": 963, "Finetune/Step Time": 2.794366765767336} +{"Finetune/Learning Rate": 1.86247705780898e-05, "Finetune/Loss": 0.8506048917770386, "Finetune/Loss (Raw)": 0.9326255917549133, "Finetune/Step": 964, "Finetune/Step Time": 2.7981235533952713} +{"Finetune/Learning Rate": 1.8621473521146366e-05, "Finetune/Loss": 0.8506050705909729, "Finetune/Loss (Raw)": 0.7945491075515747, "Finetune/Step": 965, "Finetune/Step Time": 2.796712124720216} +{"Finetune/Learning Rate": 1.861817280920956e-05, "Finetune/Loss": 0.8501599431037903, "Finetune/Loss (Raw)": 0.8826835751533508, "Finetune/Step": 966, "Finetune/Step Time": 2.7979474309831858} +{"Finetune/Learning Rate": 1.861486844367869e-05, "Finetune/Loss": 0.8499505519866943, "Finetune/Loss (Raw)": 0.8610244989395142, "Finetune/Step": 967, "Finetune/Step Time": 2.800053983926773} +{"Finetune/Learning Rate": 1.861156042595461e-05, "Finetune/Loss": 0.8503109216690063, "Finetune/Loss (Raw)": 0.955805242061615, "Finetune/Step": 968, "Finetune/Step Time": 2.7992740981280804} +{"Finetune/Learning Rate": 1.8608248757439732e-05, "Finetune/Loss": 0.8525931239128113, "Finetune/Loss (Raw)": 0.9425588250160217, "Finetune/Step": 969, "Finetune/Step Time": 2.777187868952751} +{"Finetune/Learning Rate": 1.8604933439537992e-05, "Finetune/Loss": 0.8519343137741089, "Finetune/Loss (Raw)": 0.8451976776123047, "Finetune/Step": 970, "Finetune/Step Time": 2.7732858397066593} +{"Finetune/Learning Rate": 1.86016144736549e-05, "Finetune/Loss": 0.8516168594360352, "Finetune/Loss (Raw)": 0.8307797908782959, "Finetune/Step": 971, "Finetune/Step Time": 2.7747070249170065} +{"Finetune/Learning Rate": 1.8598291861197503e-05, "Finetune/Loss": 0.8526251316070557, "Finetune/Loss (Raw)": 0.9255527257919312, "Finetune/Step": 972, "Finetune/Step Time": 2.780969947576523} +{"Finetune/Learning Rate": 1.859496560357438e-05, "Finetune/Loss": 0.8531676530838013, "Finetune/Loss (Raw)": 0.8537537455558777, "Finetune/Step": 973, "Finetune/Step Time": 2.7798636853694916} +{"Finetune/Learning Rate": 1.8591635702195672e-05, "Finetune/Loss": 0.8535004258155823, "Finetune/Loss (Raw)": 0.8962978720664978, "Finetune/Step": 974, "Finetune/Step Time": 2.7798371985554695} +{"Finetune/Learning Rate": 1.8588302158473063e-05, "Finetune/Loss": 0.8532348275184631, "Finetune/Loss (Raw)": 0.8248007297515869, "Finetune/Step": 975, "Finetune/Step Time": 2.7854633033275604} +{"Finetune/Learning Rate": 1.8584964973819774e-05, "Finetune/Loss": 0.8526268601417542, "Finetune/Loss (Raw)": 0.8368415236473083, "Finetune/Step": 976, "Finetune/Step Time": 2.7970260065048933} +{"Finetune/Learning Rate": 1.8581624149650573e-05, "Finetune/Loss": 0.8579476475715637, "Finetune/Loss (Raw)": 0.9253502488136292, "Finetune/Step": 977, "Finetune/Step Time": 2.7668147161602974} +{"Finetune/Learning Rate": 1.8578279687381776e-05, "Finetune/Loss": 0.8568286895751953, "Finetune/Loss (Raw)": 0.8005870580673218, "Finetune/Step": 978, "Finetune/Step Time": 2.765712033957243} +{"Finetune/Learning Rate": 1.8574931588431233e-05, "Finetune/Loss": 0.8560650944709778, "Finetune/Loss (Raw)": 0.8461770415306091, "Finetune/Step": 979, "Finetune/Step Time": 2.769560571759939} +{"Finetune/Learning Rate": 1.8571579854218337e-05, "Finetune/Loss": 0.8569674491882324, "Finetune/Loss (Raw)": 0.945161759853363, "Finetune/Step": 980, "Finetune/Step Time": 2.772355653345585} +{"Finetune/Learning Rate": 1.856822448616403e-05, "Finetune/Loss": 0.8563319444656372, "Finetune/Loss (Raw)": 0.8237159848213196, "Finetune/Step": 981, "Finetune/Step Time": 2.7713150084018707} +{"Finetune/Learning Rate": 1.8564865485690782e-05, "Finetune/Loss": 0.8560077548027039, "Finetune/Loss (Raw)": 0.8761492371559143, "Finetune/Step": 982, "Finetune/Step Time": 2.771101785823703} +{"Finetune/Learning Rate": 1.8561502854222618e-05, "Finetune/Loss": 0.8555840849876404, "Finetune/Loss (Raw)": 0.8656986951828003, "Finetune/Step": 983, "Finetune/Step Time": 2.7721033543348312} +{"Finetune/Learning Rate": 1.8558136593185087e-05, "Finetune/Loss": 0.8548208475112915, "Finetune/Loss (Raw)": 0.8525531888008118, "Finetune/Step": 984, "Finetune/Step Time": 2.772983781993389} +{"Finetune/Learning Rate": 1.8554766704005292e-05, "Finetune/Loss": 0.8539556860923767, "Finetune/Loss (Raw)": 0.8381555080413818, "Finetune/Step": 985, "Finetune/Step Time": 2.7701204400509596} +{"Finetune/Learning Rate": 1.855139318811186e-05, "Finetune/Loss": 0.854188084602356, "Finetune/Loss (Raw)": 0.849566638469696, "Finetune/Step": 986, "Finetune/Step Time": 2.7695920318365097} +{"Finetune/Learning Rate": 1.854801604693496e-05, "Finetune/Loss": 0.8554428219795227, "Finetune/Loss (Raw)": 0.9933187961578369, "Finetune/Step": 987, "Finetune/Step Time": 2.7688000071793795} +{"Finetune/Learning Rate": 1.8544635281906305e-05, "Finetune/Loss": 0.8548070788383484, "Finetune/Loss (Raw)": 0.7974379062652588, "Finetune/Step": 988, "Finetune/Step Time": 2.7724199034273624} +{"Finetune/Learning Rate": 1.8541250894459137e-05, "Finetune/Loss": 0.8545611500740051, "Finetune/Loss (Raw)": 0.8562095761299133, "Finetune/Step": 989, "Finetune/Step Time": 2.7677333876490593} +{"Finetune/Learning Rate": 1.8537862886028234e-05, "Finetune/Loss": 0.8544671535491943, "Finetune/Loss (Raw)": 0.8920659422874451, "Finetune/Step": 990, "Finetune/Step Time": 2.766397688537836} +{"Finetune/Learning Rate": 1.8534471258049913e-05, "Finetune/Loss": 0.8545520305633545, "Finetune/Loss (Raw)": 0.8883577585220337, "Finetune/Step": 991, "Finetune/Step Time": 2.7693094424903393} +{"Finetune/Learning Rate": 1.853107601196202e-05, "Finetune/Loss": 0.8557888865470886, "Finetune/Loss (Raw)": 0.9603850841522217, "Finetune/Step": 992, "Finetune/Step Time": 2.757215676829219} +{"Finetune/Learning Rate": 1.852767714920394e-05, "Finetune/Loss": 0.8555948138237, "Finetune/Loss (Raw)": 0.8877479434013367, "Finetune/Step": 993, "Finetune/Step Time": 2.751828610897064} +{"Finetune/Learning Rate": 1.8524274671216592e-05, "Finetune/Loss": 0.855797529220581, "Finetune/Loss (Raw)": 0.8415687680244446, "Finetune/Step": 994, "Finetune/Step Time": 2.751686830073595} +{"Finetune/Learning Rate": 1.852086857944242e-05, "Finetune/Loss": 0.8556308746337891, "Finetune/Loss (Raw)": 0.7896131873130798, "Finetune/Step": 995, "Finetune/Step Time": 2.7569987419992685} +{"Finetune/Learning Rate": 1.8517458875325405e-05, "Finetune/Loss": 0.8560508489608765, "Finetune/Loss (Raw)": 0.9068616628646851, "Finetune/Step": 996, "Finetune/Step Time": 2.75504051707685} +{"Finetune/Learning Rate": 1.8514045560311064e-05, "Finetune/Loss": 0.8542766571044922, "Finetune/Loss (Raw)": 0.6374296545982361, "Finetune/Step": 997, "Finetune/Step Time": 2.7787334471940994} +{"Finetune/Learning Rate": 1.8510628635846432e-05, "Finetune/Loss": 0.8529601097106934, "Finetune/Loss (Raw)": 0.6750617027282715, "Finetune/Step": 998, "Finetune/Step Time": 2.8037670459598303} +{"Finetune/Learning Rate": 1.8507208103380093e-05, "Finetune/Loss": 0.8543680906295776, "Finetune/Loss (Raw)": 0.9449428915977478, "Finetune/Step": 999, "Finetune/Step Time": 2.8049432560801506} +{"Finetune/Learning Rate": 1.850378396436214e-05, "Finetune/Loss": 0.8545688390731812, "Finetune/Loss (Raw)": 0.8832259178161621, "Finetune/Step": 1000, "Finetune/Step Time": 2.803832607343793} +{"Finetune/Learning Rate": 1.8500356220244212e-05, "Finetune/Loss": 0.854926586151123, "Finetune/Loss (Raw)": 0.925874650478363, "Finetune/Step": 1001, "Finetune/Step Time": 2.801876522600651} +{"Finetune/Learning Rate": 1.849692487247946e-05, "Finetune/Loss": 0.8548454642295837, "Finetune/Loss (Raw)": 0.9354428648948669, "Finetune/Step": 1002, "Finetune/Step Time": 2.801023880019784} +{"Finetune/Learning Rate": 1.8493489922522585e-05, "Finetune/Loss": 0.8546229600906372, "Finetune/Loss (Raw)": 0.8898329138755798, "Finetune/Step": 1003, "Finetune/Step Time": 2.8035565093159676} +{"Finetune/Learning Rate": 1.8490051371829795e-05, "Finetune/Loss": 0.8548710346221924, "Finetune/Loss (Raw)": 0.8375412821769714, "Finetune/Step": 1004, "Finetune/Step Time": 2.806352239102125} +{"Finetune/Learning Rate": 1.848660922185883e-05, "Finetune/Loss": 0.8550329208374023, "Finetune/Loss (Raw)": 0.8393956422805786, "Finetune/Step": 1005, "Finetune/Step Time": 2.8082610983401537} +{"Finetune/Learning Rate": 1.8483163474068953e-05, "Finetune/Loss": 0.8541486263275146, "Finetune/Loss (Raw)": 0.8060432076454163, "Finetune/Step": 1006, "Finetune/Step Time": 2.8028811644762754} +{"Finetune/Learning Rate": 1.847971412992097e-05, "Finetune/Loss": 0.8533317446708679, "Finetune/Loss (Raw)": 0.8610143661499023, "Finetune/Step": 1007, "Finetune/Step Time": 2.8053071685135365} +{"Finetune/Learning Rate": 1.847626119087719e-05, "Finetune/Loss": 0.8533710241317749, "Finetune/Loss (Raw)": 0.8320336937904358, "Finetune/Step": 1008, "Finetune/Step Time": 2.8074951227754354} +{"Finetune/Learning Rate": 1.8472804658401452e-05, "Finetune/Loss": 0.8537080883979797, "Finetune/Loss (Raw)": 0.920722246170044, "Finetune/Step": 1009, "Finetune/Step Time": 2.806176794692874} +{"Finetune/Learning Rate": 1.846934453395913e-05, "Finetune/Loss": 0.8538399934768677, "Finetune/Loss (Raw)": 0.8628193736076355, "Finetune/Step": 1010, "Finetune/Step Time": 2.80297589302063} +{"Finetune/Learning Rate": 1.8465880819017103e-05, "Finetune/Loss": 0.8543445467948914, "Finetune/Loss (Raw)": 0.9142882823944092, "Finetune/Step": 1011, "Finetune/Step Time": 2.800733556970954} +{"Finetune/Learning Rate": 1.846241351504378e-05, "Finetune/Loss": 0.8556842803955078, "Finetune/Loss (Raw)": 1.0003937482833862, "Finetune/Step": 1012, "Finetune/Step Time": 2.800822149962187} +{"Finetune/Learning Rate": 1.84589426235091e-05, "Finetune/Loss": 0.8551139235496521, "Finetune/Loss (Raw)": 0.8242224454879761, "Finetune/Step": 1013, "Finetune/Step Time": 2.801385883241892} +{"Finetune/Learning Rate": 1.8455468145884507e-05, "Finetune/Loss": 0.856019139289856, "Finetune/Loss (Raw)": 0.7920785546302795, "Finetune/Step": 1014, "Finetune/Step Time": 2.779884774237871} +{"Finetune/Learning Rate": 1.845199008364298e-05, "Finetune/Loss": 0.8557808995246887, "Finetune/Loss (Raw)": 0.8596848845481873, "Finetune/Step": 1015, "Finetune/Step Time": 2.7773829996585846} +{"Finetune/Learning Rate": 1.8448508438259004e-05, "Finetune/Loss": 0.8570491075515747, "Finetune/Loss (Raw)": 0.9491507411003113, "Finetune/Step": 1016, "Finetune/Step Time": 2.7756058499217033} +{"Finetune/Learning Rate": 1.84450232112086e-05, "Finetune/Loss": 0.8569257259368896, "Finetune/Loss (Raw)": 0.8699615597724915, "Finetune/Step": 1017, "Finetune/Step Time": 2.7808533255010843} +{"Finetune/Learning Rate": 1.8441534403969287e-05, "Finetune/Loss": 0.8574308753013611, "Finetune/Loss (Raw)": 0.9117714762687683, "Finetune/Step": 1018, "Finetune/Step Time": 2.7825033888220787} +{"Finetune/Learning Rate": 1.843804201802012e-05, "Finetune/Loss": 0.8559306263923645, "Finetune/Loss (Raw)": 0.6582139730453491, "Finetune/Step": 1019, "Finetune/Step Time": 2.8055717665702105} +{"Finetune/Learning Rate": 1.843454605484166e-05, "Finetune/Loss": 0.8559655547142029, "Finetune/Loss (Raw)": 0.8477923274040222, "Finetune/Step": 1020, "Finetune/Step Time": 2.807498747482896} +{"Finetune/Learning Rate": 1.843104651591599e-05, "Finetune/Loss": 0.8559459447860718, "Finetune/Loss (Raw)": 0.9091804623603821, "Finetune/Step": 1021, "Finetune/Step Time": 2.8081885017454624} +{"Finetune/Learning Rate": 1.8427543402726704e-05, "Finetune/Loss": 0.8556804656982422, "Finetune/Loss (Raw)": 0.8874967098236084, "Finetune/Step": 1022, "Finetune/Step Time": 2.8087484519928694} +{"Finetune/Learning Rate": 1.8424036716758914e-05, "Finetune/Loss": 0.8557765483856201, "Finetune/Loss (Raw)": 0.9121270179748535, "Finetune/Step": 1023, "Finetune/Step Time": 2.810710860416293} +{"Finetune/Learning Rate": 1.8420526459499252e-05, "Finetune/Loss": 0.8573785424232483, "Finetune/Loss (Raw)": 0.8631269931793213, "Finetune/Step": 1024, "Finetune/Step Time": 2.7877203561365604} +{"Finetune/Learning Rate": 1.8417012632435852e-05, "Finetune/Loss": 0.8574771881103516, "Finetune/Loss (Raw)": 0.9011164903640747, "Finetune/Step": 1025, "Finetune/Step Time": 2.786229744553566} +{"Finetune/Learning Rate": 1.841349523705837e-05, "Finetune/Loss": 0.8540182113647461, "Finetune/Loss (Raw)": 0.5428306460380554, "Finetune/Step": 1026, "Finetune/Step Time": 2.8106251377612352} +{"Finetune/Learning Rate": 1.8409974274857984e-05, "Finetune/Loss": 0.8547369241714478, "Finetune/Loss (Raw)": 0.9115188717842102, "Finetune/Step": 1027, "Finetune/Step Time": 2.8065823819488287} +{"Finetune/Learning Rate": 1.8406449747327355e-05, "Finetune/Loss": 0.8544349074363708, "Finetune/Loss (Raw)": 0.7800742983818054, "Finetune/Step": 1028, "Finetune/Step Time": 2.8015756141394377} +{"Finetune/Learning Rate": 1.8402921655960685e-05, "Finetune/Loss": 0.8538577556610107, "Finetune/Loss (Raw)": 0.7491812705993652, "Finetune/Step": 1029, "Finetune/Step Time": 2.7988450191915035} +{"Finetune/Learning Rate": 1.839939000225367e-05, "Finetune/Loss": 0.853382408618927, "Finetune/Loss (Raw)": 0.7722170948982239, "Finetune/Step": 1030, "Finetune/Step Time": 2.797403484582901} +{"Finetune/Learning Rate": 1.839585478770353e-05, "Finetune/Loss": 0.8536168336868286, "Finetune/Loss (Raw)": 0.9010316729545593, "Finetune/Step": 1031, "Finetune/Step Time": 2.795108787715435} +{"Finetune/Learning Rate": 1.839231601380898e-05, "Finetune/Loss": 0.8503009080886841, "Finetune/Loss (Raw)": 0.45867469906806946, "Finetune/Step": 1032, "Finetune/Step Time": 2.8281065113842487} +{"Finetune/Learning Rate": 1.8388773682070247e-05, "Finetune/Loss": 0.8491084575653076, "Finetune/Loss (Raw)": 0.8439713716506958, "Finetune/Step": 1033, "Finetune/Step Time": 2.831000804901123} +{"Finetune/Learning Rate": 1.8385227793989076e-05, "Finetune/Loss": 0.8484185934066772, "Finetune/Loss (Raw)": 0.7972478270530701, "Finetune/Step": 1034, "Finetune/Step Time": 2.830553764477372} +{"Finetune/Learning Rate": 1.8381678351068713e-05, "Finetune/Loss": 0.8478711843490601, "Finetune/Loss (Raw)": 0.8569903373718262, "Finetune/Step": 1035, "Finetune/Step Time": 2.8327851220965385} +{"Finetune/Learning Rate": 1.8378125354813904e-05, "Finetune/Loss": 0.847655713558197, "Finetune/Loss (Raw)": 0.8480624556541443, "Finetune/Step": 1036, "Finetune/Step Time": 2.8313106931746006} +{"Finetune/Learning Rate": 1.837456880673092e-05, "Finetune/Loss": 0.8477851748466492, "Finetune/Loss (Raw)": 0.8994914293289185, "Finetune/Step": 1037, "Finetune/Step Time": 2.8334852308034897} +{"Finetune/Learning Rate": 1.8371008708327514e-05, "Finetune/Loss": 0.847681999206543, "Finetune/Loss (Raw)": 0.9057828187942505, "Finetune/Step": 1038, "Finetune/Step Time": 2.8303193654865026} +{"Finetune/Learning Rate": 1.8367445061112966e-05, "Finetune/Loss": 0.8470573425292969, "Finetune/Loss (Raw)": 0.8035579919815063, "Finetune/Step": 1039, "Finetune/Step Time": 2.8353075683116913} +{"Finetune/Learning Rate": 1.836387786659805e-05, "Finetune/Loss": 0.8478828072547913, "Finetune/Loss (Raw)": 0.8414182066917419, "Finetune/Step": 1040, "Finetune/Step Time": 2.835799913853407} +{"Finetune/Learning Rate": 1.8360307126295035e-05, "Finetune/Loss": 0.847061038017273, "Finetune/Loss (Raw)": 0.8427945971488953, "Finetune/Step": 1041, "Finetune/Step Time": 2.839990470558405} +{"Finetune/Learning Rate": 1.8356732841717715e-05, "Finetune/Loss": 0.8468741178512573, "Finetune/Loss (Raw)": 0.7844790816307068, "Finetune/Step": 1042, "Finetune/Step Time": 2.8389480467885733} +{"Finetune/Learning Rate": 1.835315501438137e-05, "Finetune/Loss": 0.8495951890945435, "Finetune/Loss (Raw)": 0.8378793597221375, "Finetune/Step": 1043, "Finetune/Step Time": 2.8183914721012115} +{"Finetune/Learning Rate": 1.834957364580279e-05, "Finetune/Loss": 0.8500261306762695, "Finetune/Loss (Raw)": 0.877566933631897, "Finetune/Step": 1044, "Finetune/Step Time": 2.8178236298263073} +{"Finetune/Learning Rate": 1.8345988737500255e-05, "Finetune/Loss": 0.8501327037811279, "Finetune/Loss (Raw)": 0.9292929172515869, "Finetune/Step": 1045, "Finetune/Step Time": 2.8193964455276728} +{"Finetune/Learning Rate": 1.834240029099356e-05, "Finetune/Loss": 0.8492822051048279, "Finetune/Loss (Raw)": 0.8730595707893372, "Finetune/Step": 1046, "Finetune/Step Time": 2.8189568612724543} +{"Finetune/Learning Rate": 1.8338808307803994e-05, "Finetune/Loss": 0.8458147048950195, "Finetune/Loss (Raw)": 0.35414618253707886, "Finetune/Step": 1047, "Finetune/Step Time": 2.8457936998456717} +{"Finetune/Learning Rate": 1.8335212789454337e-05, "Finetune/Loss": 0.8459992408752441, "Finetune/Loss (Raw)": 0.9595087170600891, "Finetune/Step": 1048, "Finetune/Step Time": 2.836285689845681} +{"Finetune/Learning Rate": 1.8331613737468888e-05, "Finetune/Loss": 0.8480232954025269, "Finetune/Loss (Raw)": 0.8324522376060486, "Finetune/Step": 1049, "Finetune/Step Time": 2.813656874001026} +{"Finetune/Learning Rate": 1.832801115337342e-05, "Finetune/Loss": 0.8461432456970215, "Finetune/Loss (Raw)": 0.6974427700042725, "Finetune/Step": 1050, "Finetune/Step Time": 2.838463595137} +{"Finetune/Learning Rate": 1.832440503869522e-05, "Finetune/Loss": 0.847350001335144, "Finetune/Loss (Raw)": 0.8827545642852783, "Finetune/Step": 1051, "Finetune/Step Time": 2.8217145074158907} +{"Finetune/Learning Rate": 1.8320795394963063e-05, "Finetune/Loss": 0.8479410409927368, "Finetune/Loss (Raw)": 0.8948902487754822, "Finetune/Step": 1052, "Finetune/Step Time": 2.824871437624097} +{"Finetune/Learning Rate": 1.831718222370723e-05, "Finetune/Loss": 0.8471075296401978, "Finetune/Loss (Raw)": 0.811478316783905, "Finetune/Step": 1053, "Finetune/Step Time": 2.823902901262045} +{"Finetune/Learning Rate": 1.8313565526459492e-05, "Finetune/Loss": 0.8477486968040466, "Finetune/Loss (Raw)": 0.9038202166557312, "Finetune/Step": 1054, "Finetune/Step Time": 2.8248521126806736} +{"Finetune/Learning Rate": 1.8309945304753105e-05, "Finetune/Loss": 0.8508247137069702, "Finetune/Loss (Raw)": 0.8639841675758362, "Finetune/Step": 1055, "Finetune/Step Time": 2.7940707225352526} +{"Finetune/Learning Rate": 1.8306321560122836e-05, "Finetune/Loss": 0.8508708477020264, "Finetune/Loss (Raw)": 0.8792544603347778, "Finetune/Step": 1056, "Finetune/Step Time": 2.7932423669844866} +{"Finetune/Learning Rate": 1.8302694294104934e-05, "Finetune/Loss": 0.850556492805481, "Finetune/Loss (Raw)": 0.8573216199874878, "Finetune/Step": 1057, "Finetune/Step Time": 2.794497564435005} +{"Finetune/Learning Rate": 1.829906350823715e-05, "Finetune/Loss": 0.849970281124115, "Finetune/Loss (Raw)": 0.8098770976066589, "Finetune/Step": 1058, "Finetune/Step Time": 2.794276749715209} +{"Finetune/Learning Rate": 1.829542920405871e-05, "Finetune/Loss": 0.8505257368087769, "Finetune/Loss (Raw)": 0.9075716733932495, "Finetune/Step": 1059, "Finetune/Step Time": 2.7958943992853165} +{"Finetune/Learning Rate": 1.829179138311036e-05, "Finetune/Loss": 0.8504893779754639, "Finetune/Loss (Raw)": 0.9161096215248108, "Finetune/Step": 1060, "Finetune/Step Time": 2.795297771692276} +{"Finetune/Learning Rate": 1.8288150046934308e-05, "Finetune/Loss": 0.8485462665557861, "Finetune/Loss (Raw)": 0.5455125570297241, "Finetune/Step": 1061, "Finetune/Step Time": 2.818940483033657} +{"Finetune/Learning Rate": 1.8284505197074268e-05, "Finetune/Loss": 0.848193347454071, "Finetune/Loss (Raw)": 0.8524596691131592, "Finetune/Step": 1062, "Finetune/Step Time": 2.822521809488535} +{"Finetune/Learning Rate": 1.8280856835075437e-05, "Finetune/Loss": 0.8492808938026428, "Finetune/Loss (Raw)": 1.041700839996338, "Finetune/Step": 1063, "Finetune/Step Time": 2.8218975849449635} +{"Finetune/Learning Rate": 1.8277204962484513e-05, "Finetune/Loss": 0.8488621711730957, "Finetune/Loss (Raw)": 0.8693410754203796, "Finetune/Step": 1064, "Finetune/Step Time": 2.8272423297166824} +{"Finetune/Learning Rate": 1.8273549580849663e-05, "Finetune/Loss": 0.8482298254966736, "Finetune/Loss (Raw)": 0.8001781105995178, "Finetune/Step": 1065, "Finetune/Step Time": 2.8292217403650284} +{"Finetune/Learning Rate": 1.826989069172056e-05, "Finetune/Loss": 0.8476505279541016, "Finetune/Loss (Raw)": 0.8121030330657959, "Finetune/Step": 1066, "Finetune/Step Time": 2.827783841639757} +{"Finetune/Learning Rate": 1.826622829664835e-05, "Finetune/Loss": 0.8475099205970764, "Finetune/Loss (Raw)": 0.8794506788253784, "Finetune/Step": 1067, "Finetune/Step Time": 2.8305773977190256} +{"Finetune/Learning Rate": 1.8262562397185678e-05, "Finetune/Loss": 0.8468923568725586, "Finetune/Loss (Raw)": 0.845856785774231, "Finetune/Step": 1068, "Finetune/Step Time": 2.8315172735601664} +{"Finetune/Learning Rate": 1.8258892994886662e-05, "Finetune/Loss": 0.8475372195243835, "Finetune/Loss (Raw)": 0.8948717713356018, "Finetune/Step": 1069, "Finetune/Step Time": 2.8281588088721037} +{"Finetune/Learning Rate": 1.825522009130691e-05, "Finetune/Loss": 0.847794771194458, "Finetune/Loss (Raw)": 0.8803122043609619, "Finetune/Step": 1070, "Finetune/Step Time": 2.8231827039271593} +{"Finetune/Learning Rate": 1.8251543688003522e-05, "Finetune/Loss": 0.8467661142349243, "Finetune/Loss (Raw)": 0.7711547613143921, "Finetune/Step": 1071, "Finetune/Step Time": 2.8205112535506487} +{"Finetune/Learning Rate": 1.824786378653507e-05, "Finetune/Loss": 0.8464884161949158, "Finetune/Loss (Raw)": 0.8197739124298096, "Finetune/Step": 1072, "Finetune/Step Time": 2.8238096665591} +{"Finetune/Learning Rate": 1.824418038846161e-05, "Finetune/Loss": 0.8456237316131592, "Finetune/Loss (Raw)": 0.8013421297073364, "Finetune/Step": 1073, "Finetune/Step Time": 2.8268868755549192} +{"Finetune/Learning Rate": 1.8240493495344695e-05, "Finetune/Loss": 0.8412153124809265, "Finetune/Loss (Raw)": 0.23411047458648682, "Finetune/Step": 1074, "Finetune/Step Time": 2.87364137545228} +{"Finetune/Learning Rate": 1.823680310874734e-05, "Finetune/Loss": 0.8410912752151489, "Finetune/Loss (Raw)": 0.81315678358078, "Finetune/Step": 1075, "Finetune/Step Time": 2.8741049133241177} +{"Finetune/Learning Rate": 1.8233109230234053e-05, "Finetune/Loss": 0.8400979042053223, "Finetune/Loss (Raw)": 0.7827630043029785, "Finetune/Step": 1076, "Finetune/Step Time": 2.870383096858859} +{"Finetune/Learning Rate": 1.8229411861370822e-05, "Finetune/Loss": 0.8384531736373901, "Finetune/Loss (Raw)": 0.6237586140632629, "Finetune/Step": 1077, "Finetune/Step Time": 2.894324168562889} +{"Finetune/Learning Rate": 1.822571100372511e-05, "Finetune/Loss": 0.8396371006965637, "Finetune/Loss (Raw)": 0.8681206107139587, "Finetune/Step": 1078, "Finetune/Step Time": 2.890911655500531} +{"Finetune/Learning Rate": 1.8222006658865858e-05, "Finetune/Loss": 0.8408089876174927, "Finetune/Loss (Raw)": 0.9742632508277893, "Finetune/Step": 1079, "Finetune/Step Time": 2.8915164172649384} +{"Finetune/Learning Rate": 1.8218298828363493e-05, "Finetune/Loss": 0.8407516479492188, "Finetune/Loss (Raw)": 0.8266239762306213, "Finetune/Step": 1080, "Finetune/Step Time": 2.893552850931883} +{"Finetune/Learning Rate": 1.8214587513789912e-05, "Finetune/Loss": 0.8407769203186035, "Finetune/Loss (Raw)": 0.8444227576255798, "Finetune/Step": 1081, "Finetune/Step Time": 2.8971501123160124} +{"Finetune/Learning Rate": 1.8210872716718496e-05, "Finetune/Loss": 0.8394641876220703, "Finetune/Loss (Raw)": 0.8060250282287598, "Finetune/Step": 1082, "Finetune/Step Time": 2.894839845597744} +{"Finetune/Learning Rate": 1.820715443872409e-05, "Finetune/Loss": 0.8414186239242554, "Finetune/Loss (Raw)": 0.8599966168403625, "Finetune/Step": 1083, "Finetune/Step Time": 2.8696209713816643} +{"Finetune/Learning Rate": 1.8203432681383034e-05, "Finetune/Loss": 0.8419339656829834, "Finetune/Loss (Raw)": 0.902715802192688, "Finetune/Step": 1084, "Finetune/Step Time": 2.8631787076592445} +{"Finetune/Learning Rate": 1.819970744627313e-05, "Finetune/Loss": 0.8422350883483887, "Finetune/Loss (Raw)": 0.9594600200653076, "Finetune/Step": 1085, "Finetune/Step Time": 2.864689029753208} +{"Finetune/Learning Rate": 1.8195978734973653e-05, "Finetune/Loss": 0.84173583984375, "Finetune/Loss (Raw)": 0.9082869291305542, "Finetune/Step": 1086, "Finetune/Step Time": 2.86354523524642} +{"Finetune/Learning Rate": 1.8192246549065355e-05, "Finetune/Loss": 0.8414751291275024, "Finetune/Loss (Raw)": 0.7757444977760315, "Finetune/Step": 1087, "Finetune/Step Time": 2.8645111452788115} +{"Finetune/Learning Rate": 1.8188510890130466e-05, "Finetune/Loss": 0.8413807153701782, "Finetune/Loss (Raw)": 0.9050289392471313, "Finetune/Step": 1088, "Finetune/Step Time": 2.874321050941944} +{"Finetune/Learning Rate": 1.8184771759752683e-05, "Finetune/Loss": 0.8410977125167847, "Finetune/Loss (Raw)": 0.7993354797363281, "Finetune/Step": 1089, "Finetune/Step Time": 2.8759250100702047} +{"Finetune/Learning Rate": 1.818102915951717e-05, "Finetune/Loss": 0.8419036865234375, "Finetune/Loss (Raw)": 0.8744496703147888, "Finetune/Step": 1090, "Finetune/Step Time": 2.8541303388774395} +{"Finetune/Learning Rate": 1.8177283091010573e-05, "Finetune/Loss": 0.8421856760978699, "Finetune/Loss (Raw)": 0.828570544719696, "Finetune/Step": 1091, "Finetune/Step Time": 2.8488007225096226} +{"Finetune/Learning Rate": 1.8173533555821e-05, "Finetune/Loss": 0.8415343761444092, "Finetune/Loss (Raw)": 0.8492637872695923, "Finetune/Step": 1092, "Finetune/Step Time": 2.8459803219884634} +{"Finetune/Learning Rate": 1.8169780555538033e-05, "Finetune/Loss": 0.8427420854568481, "Finetune/Loss (Raw)": 0.9491331577301025, "Finetune/Step": 1093, "Finetune/Step Time": 2.848989361897111} +{"Finetune/Learning Rate": 1.816602409175272e-05, "Finetune/Loss": 0.8428277373313904, "Finetune/Loss (Raw)": 0.8936448097229004, "Finetune/Step": 1094, "Finetune/Step Time": 2.8490872029215097} +{"Finetune/Learning Rate": 1.8162264166057583e-05, "Finetune/Loss": 0.8429622650146484, "Finetune/Loss (Raw)": 0.8782468438148499, "Finetune/Step": 1095, "Finetune/Step Time": 2.8462063260376453} +{"Finetune/Learning Rate": 1.81585007800466e-05, "Finetune/Loss": 0.8415968418121338, "Finetune/Loss (Raw)": 0.7810239791870117, "Finetune/Step": 1096, "Finetune/Step Time": 2.846637111157179} +{"Finetune/Learning Rate": 1.815473393531523e-05, "Finetune/Loss": 0.8385442495346069, "Finetune/Loss (Raw)": 0.5518407821655273, "Finetune/Step": 1097, "Finetune/Step Time": 2.8710964992642403} +{"Finetune/Learning Rate": 1.815096363346039e-05, "Finetune/Loss": 0.8389095067977905, "Finetune/Loss (Raw)": 0.8919385671615601, "Finetune/Step": 1098, "Finetune/Step Time": 2.873477164655924} +{"Finetune/Learning Rate": 1.8147189876080463e-05, "Finetune/Loss": 0.8386924266815186, "Finetune/Loss (Raw)": 0.8030022382736206, "Finetune/Step": 1099, "Finetune/Step Time": 2.873539136722684} +{"Finetune/Learning Rate": 1.8143412664775302e-05, "Finetune/Loss": 0.8381601572036743, "Finetune/Loss (Raw)": 0.8574217557907104, "Finetune/Step": 1100, "Finetune/Step Time": 2.872370919212699} +{"Finetune/Learning Rate": 1.8139632001146214e-05, "Finetune/Loss": 0.8386317491531372, "Finetune/Loss (Raw)": 0.9141179919242859, "Finetune/Step": 1101, "Finetune/Step Time": 2.871065340936184} +{"Finetune/Learning Rate": 1.8135847886795983e-05, "Finetune/Loss": 0.8379530310630798, "Finetune/Loss (Raw)": 0.8094189167022705, "Finetune/Step": 1102, "Finetune/Step Time": 2.8692534379661083} +{"Finetune/Learning Rate": 1.8132060323328843e-05, "Finetune/Loss": 0.8390779495239258, "Finetune/Loss (Raw)": 0.968784749507904, "Finetune/Step": 1103, "Finetune/Step Time": 2.8626644127070904} +{"Finetune/Learning Rate": 1.81282693123505e-05, "Finetune/Loss": 0.8390211462974548, "Finetune/Loss (Raw)": 0.8295727968215942, "Finetune/Step": 1104, "Finetune/Step Time": 2.85449480637908} +{"Finetune/Learning Rate": 1.812447485546812e-05, "Finetune/Loss": 0.8359355926513672, "Finetune/Loss (Raw)": 0.5304065942764282, "Finetune/Step": 1105, "Finetune/Step Time": 2.8758913055062294} +{"Finetune/Learning Rate": 1.812067695429032e-05, "Finetune/Loss": 0.836880087852478, "Finetune/Loss (Raw)": 0.9214762449264526, "Finetune/Step": 1106, "Finetune/Step Time": 2.8781938795000315} +{"Finetune/Learning Rate": 1.8116875610427193e-05, "Finetune/Loss": 0.8321597576141357, "Finetune/Loss (Raw)": 0.2419690489768982, "Finetune/Step": 1107, "Finetune/Step Time": 2.90790381655097} +{"Finetune/Learning Rate": 1.8113070825490276e-05, "Finetune/Loss": 0.8310497999191284, "Finetune/Loss (Raw)": 0.8030967116355896, "Finetune/Step": 1108, "Finetune/Step Time": 2.9085818603634834} +{"Finetune/Learning Rate": 1.8109262601092576e-05, "Finetune/Loss": 0.8319457769393921, "Finetune/Loss (Raw)": 0.9383999109268188, "Finetune/Step": 1109, "Finetune/Step Time": 2.907243298366666} +{"Finetune/Learning Rate": 1.8105450938848555e-05, "Finetune/Loss": 0.8316949605941772, "Finetune/Loss (Raw)": 0.8440450429916382, "Finetune/Step": 1110, "Finetune/Step Time": 2.9059021677821875} +{"Finetune/Learning Rate": 1.8101635840374135e-05, "Finetune/Loss": 0.8310475945472717, "Finetune/Loss (Raw)": 0.7828325033187866, "Finetune/Step": 1111, "Finetune/Step Time": 2.9055334106087685} +{"Finetune/Learning Rate": 1.809781730728668e-05, "Finetune/Loss": 0.8313654661178589, "Finetune/Loss (Raw)": 0.8932393193244934, "Finetune/Step": 1112, "Finetune/Step Time": 2.9070243258029222} +{"Finetune/Learning Rate": 1.8093995341205033e-05, "Finetune/Loss": 0.8317193984985352, "Finetune/Loss (Raw)": 0.8834709525108337, "Finetune/Step": 1113, "Finetune/Step Time": 2.9122127145528793} +{"Finetune/Learning Rate": 1.8090169943749477e-05, "Finetune/Loss": 0.8320087194442749, "Finetune/Loss (Raw)": 0.8865889310836792, "Finetune/Step": 1114, "Finetune/Step Time": 2.9133891630917788} +{"Finetune/Learning Rate": 1.808634111654175e-05, "Finetune/Loss": 0.8309273719787598, "Finetune/Loss (Raw)": 0.8549118041992188, "Finetune/Step": 1115, "Finetune/Step Time": 2.9117232114076614} +{"Finetune/Learning Rate": 1.8082508861205052e-05, "Finetune/Loss": 0.8309823274612427, "Finetune/Loss (Raw)": 0.8044741153717041, "Finetune/Step": 1116, "Finetune/Step Time": 2.906652892008424} +{"Finetune/Learning Rate": 1.8078673179364034e-05, "Finetune/Loss": 0.83051598072052, "Finetune/Loss (Raw)": 0.7965145111083984, "Finetune/Step": 1117, "Finetune/Step Time": 2.9098642989993095} +{"Finetune/Learning Rate": 1.8074834072644793e-05, "Finetune/Loss": 0.829455554485321, "Finetune/Loss (Raw)": 0.7563309073448181, "Finetune/Step": 1118, "Finetune/Step Time": 2.9114862009882927} +{"Finetune/Learning Rate": 1.807099154267488e-05, "Finetune/Loss": 0.8297796845436096, "Finetune/Loss (Raw)": 0.9298433065414429, "Finetune/Step": 1119, "Finetune/Step Time": 2.908681869506836} +{"Finetune/Learning Rate": 1.8067145591083306e-05, "Finetune/Loss": 0.8293339014053345, "Finetune/Loss (Raw)": 0.9033243060112, "Finetune/Step": 1120, "Finetune/Step Time": 2.9096366483718157} +{"Finetune/Learning Rate": 1.8063296219500524e-05, "Finetune/Loss": 0.8288699388504028, "Finetune/Loss (Raw)": 0.8283618688583374, "Finetune/Step": 1121, "Finetune/Step Time": 2.910914469510317} +{"Finetune/Learning Rate": 1.805944342955844e-05, "Finetune/Loss": 0.82908695936203, "Finetune/Loss (Raw)": 0.86934894323349, "Finetune/Step": 1122, "Finetune/Step Time": 2.9134170301258564} +{"Finetune/Learning Rate": 1.8055587222890406e-05, "Finetune/Loss": 0.828961968421936, "Finetune/Loss (Raw)": 0.7736154198646545, "Finetune/Step": 1123, "Finetune/Step Time": 2.907987905666232} +{"Finetune/Learning Rate": 1.8051727601131228e-05, "Finetune/Loss": 0.8292158842086792, "Finetune/Loss (Raw)": 0.939363420009613, "Finetune/Step": 1124, "Finetune/Step Time": 2.908393496647477} +{"Finetune/Learning Rate": 1.8047864565917154e-05, "Finetune/Loss": 0.829992413520813, "Finetune/Loss (Raw)": 0.7368276119232178, "Finetune/Step": 1125, "Finetune/Step Time": 2.887598190456629} +{"Finetune/Learning Rate": 1.8043998118885885e-05, "Finetune/Loss": 0.8303964138031006, "Finetune/Loss (Raw)": 0.7267677783966064, "Finetune/Step": 1126, "Finetune/Step Time": 2.8621399011462927} +{"Finetune/Learning Rate": 1.804012826167656e-05, "Finetune/Loss": 0.829802393913269, "Finetune/Loss (Raw)": 0.8689038157463074, "Finetune/Step": 1127, "Finetune/Step Time": 2.8575406447052956} +{"Finetune/Learning Rate": 1.8036254995929775e-05, "Finetune/Loss": 0.8300841450691223, "Finetune/Loss (Raw)": 0.9192963242530823, "Finetune/Step": 1128, "Finetune/Step Time": 2.8537464514374733} +{"Finetune/Learning Rate": 1.803237832328756e-05, "Finetune/Loss": 0.8273721933364868, "Finetune/Loss (Raw)": 0.57874995470047, "Finetune/Step": 1129, "Finetune/Step Time": 2.879534402862191} +{"Finetune/Learning Rate": 1.8028498245393397e-05, "Finetune/Loss": 0.8267954587936401, "Finetune/Loss (Raw)": 0.8616191148757935, "Finetune/Step": 1130, "Finetune/Step Time": 2.8799852337688208} +{"Finetune/Learning Rate": 1.8024614763892207e-05, "Finetune/Loss": 0.8232102394104004, "Finetune/Loss (Raw)": 0.43092063069343567, "Finetune/Step": 1131, "Finetune/Step Time": 2.9113657139241695} +{"Finetune/Learning Rate": 1.802072788043036e-05, "Finetune/Loss": 0.8239692449569702, "Finetune/Loss (Raw)": 0.9346951842308044, "Finetune/Step": 1132, "Finetune/Step Time": 2.910530375316739} +{"Finetune/Learning Rate": 1.8016837596655657e-05, "Finetune/Loss": 0.8233308792114258, "Finetune/Loss (Raw)": 0.7576805949211121, "Finetune/Step": 1133, "Finetune/Step Time": 2.9057315289974213} +{"Finetune/Learning Rate": 1.8012943914217357e-05, "Finetune/Loss": 0.8244237303733826, "Finetune/Loss (Raw)": 0.945929765701294, "Finetune/Step": 1134, "Finetune/Step Time": 2.909805515781045} +{"Finetune/Learning Rate": 1.800904683476614e-05, "Finetune/Loss": 0.824433445930481, "Finetune/Loss (Raw)": 0.862259566783905, "Finetune/Step": 1135, "Finetune/Step Time": 2.911347836256027} +{"Finetune/Learning Rate": 1.8005146359954143e-05, "Finetune/Loss": 0.8241767287254333, "Finetune/Loss (Raw)": 0.7991714477539062, "Finetune/Step": 1136, "Finetune/Step Time": 2.9089951254427433} +{"Finetune/Learning Rate": 1.8001242491434934e-05, "Finetune/Loss": 0.8235052824020386, "Finetune/Loss (Raw)": 0.8347789645195007, "Finetune/Step": 1137, "Finetune/Step Time": 2.906439770013094} +{"Finetune/Learning Rate": 1.799733523086352e-05, "Finetune/Loss": 0.8238367438316345, "Finetune/Loss (Raw)": 0.9052470326423645, "Finetune/Step": 1138, "Finetune/Step Time": 2.9081817138940096} +{"Finetune/Learning Rate": 1.7993424579896352e-05, "Finetune/Loss": 0.8242336511611938, "Finetune/Loss (Raw)": 0.9650939702987671, "Finetune/Step": 1139, "Finetune/Step Time": 2.909920496866107} +{"Finetune/Learning Rate": 1.7989510540191313e-05, "Finetune/Loss": 0.8227142095565796, "Finetune/Loss (Raw)": 0.8058987259864807, "Finetune/Step": 1140, "Finetune/Step Time": 2.9092983845621347} +{"Finetune/Learning Rate": 1.798559311340772e-05, "Finetune/Loss": 0.8228878974914551, "Finetune/Loss (Raw)": 0.8464592695236206, "Finetune/Step": 1141, "Finetune/Step Time": 2.908956641331315} +{"Finetune/Learning Rate": 1.7981672301206333e-05, "Finetune/Loss": 0.8242424726486206, "Finetune/Loss (Raw)": 0.9654650092124939, "Finetune/Step": 1142, "Finetune/Step Time": 2.9088541083037853} +{"Finetune/Learning Rate": 1.7977748105249343e-05, "Finetune/Loss": 0.824156641960144, "Finetune/Loss (Raw)": 0.8486966490745544, "Finetune/Step": 1143, "Finetune/Step Time": 2.9114139806479216} +{"Finetune/Learning Rate": 1.7973820527200376e-05, "Finetune/Loss": 0.8216421604156494, "Finetune/Loss (Raw)": 0.6272996068000793, "Finetune/Step": 1144, "Finetune/Step Time": 2.9442988354712725} +{"Finetune/Learning Rate": 1.7969889568724493e-05, "Finetune/Loss": 0.8214694261550903, "Finetune/Loss (Raw)": 0.8478556871414185, "Finetune/Step": 1145, "Finetune/Step Time": 2.9382924921810627} +{"Finetune/Learning Rate": 1.7965955231488186e-05, "Finetune/Loss": 0.8210022449493408, "Finetune/Loss (Raw)": 0.8519710302352905, "Finetune/Step": 1146, "Finetune/Step Time": 2.9372876565903425} +{"Finetune/Learning Rate": 1.796201751715938e-05, "Finetune/Loss": 0.8213714361190796, "Finetune/Loss (Raw)": 0.7054672837257385, "Finetune/Step": 1147, "Finetune/Step Time": 2.9350423961877823} +{"Finetune/Learning Rate": 1.7958076427407432e-05, "Finetune/Loss": 0.8212407827377319, "Finetune/Loss (Raw)": 0.8310644626617432, "Finetune/Step": 1148, "Finetune/Step Time": 2.936194436624646} +{"Finetune/Learning Rate": 1.7954131963903134e-05, "Finetune/Loss": 0.8215572834014893, "Finetune/Loss (Raw)": 0.9496984481811523, "Finetune/Step": 1149, "Finetune/Step Time": 2.936708642169833} +{"Finetune/Learning Rate": 1.7950184128318704e-05, "Finetune/Loss": 0.8210591673851013, "Finetune/Loss (Raw)": 0.8237353563308716, "Finetune/Step": 1150, "Finetune/Step Time": 2.9387630838900805} +{"Finetune/Learning Rate": 1.7946232922327785e-05, "Finetune/Loss": 0.8205395936965942, "Finetune/Loss (Raw)": 0.845618724822998, "Finetune/Step": 1151, "Finetune/Step Time": 2.9401720110327005} +{"Finetune/Learning Rate": 1.7942278347605458e-05, "Finetune/Loss": 0.8202767372131348, "Finetune/Loss (Raw)": 0.8294793963432312, "Finetune/Step": 1152, "Finetune/Step Time": 2.9421694818884134} +{"Finetune/Learning Rate": 1.7938320405828232e-05, "Finetune/Loss": 0.82008957862854, "Finetune/Loss (Raw)": 0.8771665692329407, "Finetune/Step": 1153, "Finetune/Step Time": 2.9436525143682957} +{"Finetune/Learning Rate": 1.793435909867403e-05, "Finetune/Loss": 0.8233107328414917, "Finetune/Loss (Raw)": 0.9551309943199158, "Finetune/Step": 1154, "Finetune/Step Time": 2.919680994004011} +{"Finetune/Learning Rate": 1.7930394427822214e-05, "Finetune/Loss": 0.8201440572738647, "Finetune/Loss (Raw)": 0.5061933398246765, "Finetune/Step": 1155, "Finetune/Step Time": 2.946452060714364} +{"Finetune/Learning Rate": 1.7926426394953577e-05, "Finetune/Loss": 0.8210448026657104, "Finetune/Loss (Raw)": 0.8953608274459839, "Finetune/Step": 1156, "Finetune/Step Time": 2.9479935001581907} +{"Finetune/Learning Rate": 1.7922455001750323e-05, "Finetune/Loss": 0.8224008679389954, "Finetune/Loss (Raw)": 0.9227679967880249, "Finetune/Step": 1157, "Finetune/Step Time": 2.9509449172765017} +{"Finetune/Learning Rate": 1.7918480249896085e-05, "Finetune/Loss": 0.8236533403396606, "Finetune/Loss (Raw)": 0.9325240850448608, "Finetune/Step": 1158, "Finetune/Step Time": 2.9484421983361244} +{"Finetune/Learning Rate": 1.7914502141075927e-05, "Finetune/Loss": 0.8234285712242126, "Finetune/Loss (Raw)": 0.8722660541534424, "Finetune/Step": 1159, "Finetune/Step Time": 2.950211660936475} +{"Finetune/Learning Rate": 1.791052067697633e-05, "Finetune/Loss": 0.8221981525421143, "Finetune/Loss (Raw)": 0.301177054643631, "Finetune/Step": 1160, "Finetune/Step Time": 2.9467583764344454} +{"Finetune/Learning Rate": 1.79065358592852e-05, "Finetune/Loss": 0.8225891590118408, "Finetune/Loss (Raw)": 0.8940312266349792, "Finetune/Step": 1161, "Finetune/Step Time": 2.9449753258377314} +{"Finetune/Learning Rate": 1.790254768969186e-05, "Finetune/Loss": 0.8225581645965576, "Finetune/Loss (Raw)": 0.7932759523391724, "Finetune/Step": 1162, "Finetune/Step Time": 2.945971794426441} +{"Finetune/Learning Rate": 1.7898556169887055e-05, "Finetune/Loss": 0.8222160339355469, "Finetune/Loss (Raw)": 0.8131986856460571, "Finetune/Step": 1163, "Finetune/Step Time": 2.947093738242984} +{"Finetune/Learning Rate": 1.789456130156296e-05, "Finetune/Loss": 0.8224443793296814, "Finetune/Loss (Raw)": 0.8772878050804138, "Finetune/Step": 1164, "Finetune/Step Time": 2.949256092309952} +{"Finetune/Learning Rate": 1.7890563086413156e-05, "Finetune/Loss": 0.8215920925140381, "Finetune/Loss (Raw)": 0.7903977632522583, "Finetune/Step": 1165, "Finetune/Step Time": 2.9467471819370985} +{"Finetune/Learning Rate": 1.7886561526132654e-05, "Finetune/Loss": 0.8217595815658569, "Finetune/Loss (Raw)": 0.9272201061248779, "Finetune/Step": 1166, "Finetune/Step Time": 2.946891298517585} +{"Finetune/Learning Rate": 1.7882556622417872e-05, "Finetune/Loss": 0.8220158219337463, "Finetune/Loss (Raw)": 0.8363572359085083, "Finetune/Step": 1167, "Finetune/Step Time": 2.9444543328136206} +{"Finetune/Learning Rate": 1.787854837696666e-05, "Finetune/Loss": 0.8177913427352905, "Finetune/Loss (Raw)": 0.3006804883480072, "Finetune/Step": 1168, "Finetune/Step Time": 2.9745663795620203} +{"Finetune/Learning Rate": 1.7874536791478267e-05, "Finetune/Loss": 0.8182376623153687, "Finetune/Loss (Raw)": 0.8999266028404236, "Finetune/Step": 1169, "Finetune/Step Time": 2.97122005186975} +{"Finetune/Learning Rate": 1.7870521867653377e-05, "Finetune/Loss": 0.8185533881187439, "Finetune/Loss (Raw)": 0.824894368648529, "Finetune/Step": 1170, "Finetune/Step Time": 2.9697351306676865} +{"Finetune/Learning Rate": 1.786650360719407e-05, "Finetune/Loss": 0.81905198097229, "Finetune/Loss (Raw)": 0.9016930460929871, "Finetune/Step": 1171, "Finetune/Step Time": 2.968048866838217} +{"Finetune/Learning Rate": 1.786248201180386e-05, "Finetune/Loss": 0.8180394172668457, "Finetune/Loss (Raw)": 0.7479623556137085, "Finetune/Step": 1172, "Finetune/Step Time": 2.9925451800227165} +{"Finetune/Learning Rate": 1.7858457083187652e-05, "Finetune/Loss": 0.817481279373169, "Finetune/Loss (Raw)": 0.8578556776046753, "Finetune/Step": 1173, "Finetune/Step Time": 2.9895647447556257} +{"Finetune/Learning Rate": 1.785442882305179e-05, "Finetune/Loss": 0.8178812861442566, "Finetune/Loss (Raw)": 0.9242600202560425, "Finetune/Step": 1174, "Finetune/Step Time": 2.9898845069110394} +{"Finetune/Learning Rate": 1.785039723310401e-05, "Finetune/Loss": 0.8220562934875488, "Finetune/Loss (Raw)": 0.8885405659675598, "Finetune/Step": 1175, "Finetune/Step Time": 2.9639097545295954} +{"Finetune/Learning Rate": 1.784636231505347e-05, "Finetune/Loss": 0.821391224861145, "Finetune/Loss (Raw)": 0.8743777871131897, "Finetune/Step": 1176, "Finetune/Step Time": 2.9659228324890137} +{"Finetune/Learning Rate": 1.7842324070610732e-05, "Finetune/Loss": 0.8215508460998535, "Finetune/Loss (Raw)": 0.8528929352760315, "Finetune/Step": 1177, "Finetune/Step Time": 2.9629952032119036} +{"Finetune/Learning Rate": 1.7838282501487777e-05, "Finetune/Loss": 0.823219358921051, "Finetune/Loss (Raw)": 0.9110142588615417, "Finetune/Step": 1178, "Finetune/Step Time": 2.9408136922866106} +{"Finetune/Learning Rate": 1.783423760939799e-05, "Finetune/Loss": 0.8224190473556519, "Finetune/Loss (Raw)": 0.78030925989151, "Finetune/Step": 1179, "Finetune/Step Time": 2.936291651800275} +{"Finetune/Learning Rate": 1.7830189396056157e-05, "Finetune/Loss": 0.8217259049415588, "Finetune/Loss (Raw)": 0.8061709403991699, "Finetune/Step": 1180, "Finetune/Step Time": 2.9333424028009176} +{"Finetune/Learning Rate": 1.7826137863178496e-05, "Finetune/Loss": 0.8223317861557007, "Finetune/Loss (Raw)": 0.8890263438224792, "Finetune/Step": 1181, "Finetune/Step Time": 2.938280127942562} +{"Finetune/Learning Rate": 1.7822083012482603e-05, "Finetune/Loss": 0.8216542601585388, "Finetune/Loss (Raw)": 0.8170973658561707, "Finetune/Step": 1182, "Finetune/Step Time": 2.9363858308643103} +{"Finetune/Learning Rate": 1.78180248456875e-05, "Finetune/Loss": 0.821986973285675, "Finetune/Loss (Raw)": 0.9065706133842468, "Finetune/Step": 1183, "Finetune/Step Time": 2.938156746327877} +{"Finetune/Learning Rate": 1.7813963364513607e-05, "Finetune/Loss": 0.8217037320137024, "Finetune/Loss (Raw)": 0.8430001139640808, "Finetune/Step": 1184, "Finetune/Step Time": 2.93984517455101} +{"Finetune/Learning Rate": 1.780989857068275e-05, "Finetune/Loss": 0.8202667236328125, "Finetune/Loss (Raw)": 0.6733870506286621, "Finetune/Step": 1185, "Finetune/Step Time": 2.959479942917824} +{"Finetune/Learning Rate": 1.7805830465918164e-05, "Finetune/Loss": 0.8203293085098267, "Finetune/Loss (Raw)": 0.8178953528404236, "Finetune/Step": 1186, "Finetune/Step Time": 2.963484074920416} +{"Finetune/Learning Rate": 1.7801759051944483e-05, "Finetune/Loss": 0.8207778930664062, "Finetune/Loss (Raw)": 0.964979350566864, "Finetune/Step": 1187, "Finetune/Step Time": 2.9611375723034143} +{"Finetune/Learning Rate": 1.7797684330487747e-05, "Finetune/Loss": 0.8201485276222229, "Finetune/Loss (Raw)": 0.8355552554130554, "Finetune/Step": 1188, "Finetune/Step Time": 2.9586404468864202} +{"Finetune/Learning Rate": 1.7793606303275388e-05, "Finetune/Loss": 0.8228684663772583, "Finetune/Loss (Raw)": 0.8936678171157837, "Finetune/Step": 1189, "Finetune/Step Time": 2.93340771086514} +{"Finetune/Learning Rate": 1.778952497203626e-05, "Finetune/Loss": 0.8228197693824768, "Finetune/Loss (Raw)": 0.8462283611297607, "Finetune/Step": 1190, "Finetune/Step Time": 2.9364988412708044} +{"Finetune/Learning Rate": 1.7785440338500594e-05, "Finetune/Loss": 0.8212953805923462, "Finetune/Loss (Raw)": 0.8465718030929565, "Finetune/Step": 1191, "Finetune/Step Time": 2.9379660729318857} +{"Finetune/Learning Rate": 1.778135240440004e-05, "Finetune/Loss": 0.8206183314323425, "Finetune/Loss (Raw)": 0.7826811671257019, "Finetune/Step": 1192, "Finetune/Step Time": 2.9375096410512924} +{"Finetune/Learning Rate": 1.777726117146763e-05, "Finetune/Loss": 0.8206549882888794, "Finetune/Loss (Raw)": 0.8048714995384216, "Finetune/Step": 1193, "Finetune/Step Time": 2.933225618675351} +{"Finetune/Learning Rate": 1.777316664143782e-05, "Finetune/Loss": 0.8207249641418457, "Finetune/Loss (Raw)": 0.8210684061050415, "Finetune/Step": 1194, "Finetune/Step Time": 2.9336826987564564} +{"Finetune/Learning Rate": 1.776906881604643e-05, "Finetune/Loss": 0.820100724697113, "Finetune/Loss (Raw)": 0.7995389103889465, "Finetune/Step": 1195, "Finetune/Step Time": 2.9325291384011507} +{"Finetune/Learning Rate": 1.776496769703071e-05, "Finetune/Loss": 0.8202539682388306, "Finetune/Loss (Raw)": 0.8654696941375732, "Finetune/Step": 1196, "Finetune/Step Time": 2.9320342615246773} +{"Finetune/Learning Rate": 1.776086328612928e-05, "Finetune/Loss": 0.8191119432449341, "Finetune/Loss (Raw)": 0.7486876845359802, "Finetune/Step": 1197, "Finetune/Step Time": 2.9301881920546293} +{"Finetune/Learning Rate": 1.7756755585082173e-05, "Finetune/Loss": 0.8197166323661804, "Finetune/Loss (Raw)": 0.9577186107635498, "Finetune/Step": 1198, "Finetune/Step Time": 2.932606253772974} +{"Finetune/Learning Rate": 1.775264459563081e-05, "Finetune/Loss": 0.8193905353546143, "Finetune/Loss (Raw)": 0.7294082045555115, "Finetune/Step": 1199, "Finetune/Step Time": 2.9375077169388533} +{"Finetune/Learning Rate": 1.7748530319518005e-05, "Finetune/Loss": 0.814268946647644, "Finetune/Loss (Raw)": 0.1642189621925354, "Finetune/Step": 1200, "Finetune/Step Time": 2.977916045114398} +{"Finetune/Learning Rate": 1.7744412758487967e-05, "Finetune/Loss": 0.8134097456932068, "Finetune/Loss (Raw)": 0.6913636326789856, "Finetune/Step": 1201, "Finetune/Step Time": 2.9978250171989202} +{"Finetune/Learning Rate": 1.77402919142863e-05, "Finetune/Loss": 0.8177285194396973, "Finetune/Loss (Raw)": 0.7869202494621277, "Finetune/Step": 1202, "Finetune/Step Time": 2.9506385400891304} +{"Finetune/Learning Rate": 1.7736167788659995e-05, "Finetune/Loss": 0.8181400299072266, "Finetune/Loss (Raw)": 0.8658220171928406, "Finetune/Step": 1203, "Finetune/Step Time": 2.951684519648552} +{"Finetune/Learning Rate": 1.7732040383357437e-05, "Finetune/Loss": 0.8184267282485962, "Finetune/Loss (Raw)": 0.819462239742279, "Finetune/Step": 1204, "Finetune/Step Time": 2.9514365792274475} +{"Finetune/Learning Rate": 1.7727909700128403e-05, "Finetune/Loss": 0.8200890421867371, "Finetune/Loss (Raw)": 0.8365297913551331, "Finetune/Step": 1205, "Finetune/Step Time": 2.927281616255641} +{"Finetune/Learning Rate": 1.7723775740724054e-05, "Finetune/Loss": 0.8195751905441284, "Finetune/Loss (Raw)": 0.8023502826690674, "Finetune/Step": 1206, "Finetune/Step Time": 2.9256724286824465} +{"Finetune/Learning Rate": 1.7719638506896946e-05, "Finetune/Loss": 0.8180192708969116, "Finetune/Loss (Raw)": 0.7751105427742004, "Finetune/Step": 1207, "Finetune/Step Time": 2.9289430640637875} +{"Finetune/Learning Rate": 1.7715498000401024e-05, "Finetune/Loss": 0.8186911344528198, "Finetune/Loss (Raw)": 0.9126191735267639, "Finetune/Step": 1208, "Finetune/Step Time": 2.9258264768868685} +{"Finetune/Learning Rate": 1.7711354222991607e-05, "Finetune/Loss": 0.818148136138916, "Finetune/Loss (Raw)": 0.7749196290969849, "Finetune/Step": 1209, "Finetune/Step Time": 2.922195188701153} +{"Finetune/Learning Rate": 1.7707207176425424e-05, "Finetune/Loss": 0.8190805912017822, "Finetune/Loss (Raw)": 0.925378143787384, "Finetune/Step": 1210, "Finetune/Step Time": 2.923501782119274} +{"Finetune/Learning Rate": 1.7703056862460564e-05, "Finetune/Loss": 0.8189985752105713, "Finetune/Loss (Raw)": 0.8494986891746521, "Finetune/Step": 1211, "Finetune/Step Time": 2.925411293283105} +{"Finetune/Learning Rate": 1.7698903282856528e-05, "Finetune/Loss": 0.8193851709365845, "Finetune/Loss (Raw)": 0.9521946310997009, "Finetune/Step": 1212, "Finetune/Step Time": 2.9264229498803616} +{"Finetune/Learning Rate": 1.7694746439374175e-05, "Finetune/Loss": 0.8189669847488403, "Finetune/Loss (Raw)": 0.9059383273124695, "Finetune/Step": 1213, "Finetune/Step Time": 2.9221231918781996} +{"Finetune/Learning Rate": 1.769058633377576e-05, "Finetune/Loss": 0.8193602561950684, "Finetune/Loss (Raw)": 0.9586191773414612, "Finetune/Step": 1214, "Finetune/Step Time": 2.9217383470386267} +{"Finetune/Learning Rate": 1.7686422967824932e-05, "Finetune/Loss": 0.819643497467041, "Finetune/Loss (Raw)": 0.8120007514953613, "Finetune/Step": 1215, "Finetune/Step Time": 2.9243687484413385} +{"Finetune/Learning Rate": 1.7682256343286704e-05, "Finetune/Loss": 0.8196654915809631, "Finetune/Loss (Raw)": 0.9078487157821655, "Finetune/Step": 1216, "Finetune/Step Time": 2.915044730529189} +{"Finetune/Learning Rate": 1.7678086461927474e-05, "Finetune/Loss": 0.8206052780151367, "Finetune/Loss (Raw)": 0.9196204543113708, "Finetune/Step": 1217, "Finetune/Step Time": 2.9146821927279234} +{"Finetune/Learning Rate": 1.7673913325515035e-05, "Finetune/Loss": 0.820159375667572, "Finetune/Loss (Raw)": 0.8173865079879761, "Finetune/Step": 1218, "Finetune/Step Time": 2.919356670230627} +{"Finetune/Learning Rate": 1.766973693581854e-05, "Finetune/Loss": 0.8211678266525269, "Finetune/Loss (Raw)": 0.957646369934082, "Finetune/Step": 1219, "Finetune/Step Time": 2.9270411897450686} +{"Finetune/Learning Rate": 1.7665557294608533e-05, "Finetune/Loss": 0.821157693862915, "Finetune/Loss (Raw)": 0.8479599356651306, "Finetune/Step": 1220, "Finetune/Step Time": 2.927152071148157} +{"Finetune/Learning Rate": 1.7661374403656935e-05, "Finetune/Loss": 0.8211818337440491, "Finetune/Loss (Raw)": 0.9522294402122498, "Finetune/Step": 1221, "Finetune/Step Time": 2.9258810840547085} +{"Finetune/Learning Rate": 1.7657188264737046e-05, "Finetune/Loss": 0.8211615085601807, "Finetune/Loss (Raw)": 0.8910505175590515, "Finetune/Step": 1222, "Finetune/Step Time": 2.924897402524948} +{"Finetune/Learning Rate": 1.7652998879623532e-05, "Finetune/Loss": 0.8207111358642578, "Finetune/Loss (Raw)": 0.8205967545509338, "Finetune/Step": 1223, "Finetune/Step Time": 2.926144640892744} +{"Finetune/Learning Rate": 1.764880625009245e-05, "Finetune/Loss": 0.8209085464477539, "Finetune/Loss (Raw)": 0.8062849044799805, "Finetune/Step": 1224, "Finetune/Step Time": 2.9227301627397537} +{"Finetune/Learning Rate": 1.764461037792123e-05, "Finetune/Loss": 0.823419988155365, "Finetune/Loss (Raw)": 0.8733085989952087, "Finetune/Step": 1225, "Finetune/Step Time": 2.89865237288177} +{"Finetune/Learning Rate": 1.7640411264888665e-05, "Finetune/Loss": 0.8234737515449524, "Finetune/Loss (Raw)": 0.8988242149353027, "Finetune/Step": 1226, "Finetune/Step Time": 2.8990458231419325} +{"Finetune/Learning Rate": 1.7636208912774936e-05, "Finetune/Loss": 0.8234962224960327, "Finetune/Loss (Raw)": 0.8058732748031616, "Finetune/Step": 1227, "Finetune/Step Time": 2.899178296327591} +{"Finetune/Learning Rate": 1.763200332336159e-05, "Finetune/Loss": 0.8231854438781738, "Finetune/Loss (Raw)": 0.8176392316818237, "Finetune/Step": 1228, "Finetune/Step Time": 2.9005535412579775} +{"Finetune/Learning Rate": 1.762779449843154e-05, "Finetune/Loss": 0.8231775760650635, "Finetune/Loss (Raw)": 0.913112461566925, "Finetune/Step": 1229, "Finetune/Step Time": 2.9015186838805676} +{"Finetune/Learning Rate": 1.762358243976909e-05, "Finetune/Loss": 0.8231388330459595, "Finetune/Loss (Raw)": 0.8044567108154297, "Finetune/Step": 1230, "Finetune/Step Time": 2.9010533448308706} +{"Finetune/Learning Rate": 1.7619367149159892e-05, "Finetune/Loss": 0.8226761817932129, "Finetune/Loss (Raw)": 0.9095733761787415, "Finetune/Step": 1231, "Finetune/Step Time": 2.907233027741313} +{"Finetune/Learning Rate": 1.761514862839099e-05, "Finetune/Loss": 0.8221530318260193, "Finetune/Loss (Raw)": 0.7626094222068787, "Finetune/Step": 1232, "Finetune/Step Time": 2.903792917728424} +{"Finetune/Learning Rate": 1.7610926879250776e-05, "Finetune/Loss": 0.8247300386428833, "Finetune/Loss (Raw)": 0.8602655529975891, "Finetune/Step": 1233, "Finetune/Step Time": 2.8828044924885035} +{"Finetune/Learning Rate": 1.760670190352903e-05, "Finetune/Loss": 0.8245747089385986, "Finetune/Loss (Raw)": 0.901593029499054, "Finetune/Step": 1234, "Finetune/Step Time": 2.8833643700927496} +{"Finetune/Learning Rate": 1.7602473703016884e-05, "Finetune/Loss": 0.8297780752182007, "Finetune/Loss (Raw)": 0.9079925417900085, "Finetune/Step": 1235, "Finetune/Step Time": 2.849965177476406} +{"Finetune/Learning Rate": 1.7598242279506848e-05, "Finetune/Loss": 0.8259822130203247, "Finetune/Loss (Raw)": 0.31722745299339294, "Finetune/Step": 1236, "Finetune/Step Time": 2.8759619500488043} +{"Finetune/Learning Rate": 1.7594007634792793e-05, "Finetune/Loss": 0.824927806854248, "Finetune/Loss (Raw)": 0.8034417033195496, "Finetune/Step": 1237, "Finetune/Step Time": 2.8780620712786913} +{"Finetune/Learning Rate": 1.7589769770669963e-05, "Finetune/Loss": 0.8244433403015137, "Finetune/Loss (Raw)": 0.7820340991020203, "Finetune/Step": 1238, "Finetune/Step Time": 2.876834649592638} +{"Finetune/Learning Rate": 1.7585528688934952e-05, "Finetune/Loss": 0.8254809379577637, "Finetune/Loss (Raw)": 0.9156454801559448, "Finetune/Step": 1239, "Finetune/Step Time": 2.8764886632561684} +{"Finetune/Learning Rate": 1.7581284391385732e-05, "Finetune/Loss": 0.8248121738433838, "Finetune/Loss (Raw)": 0.8076284527778625, "Finetune/Step": 1240, "Finetune/Step Time": 2.8753023240715265} +{"Finetune/Learning Rate": 1.7577036879821633e-05, "Finetune/Loss": 0.8250913619995117, "Finetune/Loss (Raw)": 0.9192120432853699, "Finetune/Step": 1241, "Finetune/Step Time": 2.8727694135159254} +{"Finetune/Learning Rate": 1.7572786156043348e-05, "Finetune/Loss": 0.8245981931686401, "Finetune/Loss (Raw)": 0.82347172498703, "Finetune/Step": 1242, "Finetune/Step Time": 2.874479353427887} +{"Finetune/Learning Rate": 1.756853222185293e-05, "Finetune/Loss": 0.8243385553359985, "Finetune/Loss (Raw)": 0.8216677308082581, "Finetune/Step": 1243, "Finetune/Step Time": 2.876783659681678} +{"Finetune/Learning Rate": 1.7564275079053794e-05, "Finetune/Loss": 0.8246037364006042, "Finetune/Loss (Raw)": 0.8384162783622742, "Finetune/Step": 1244, "Finetune/Step Time": 2.87945400364697} +{"Finetune/Learning Rate": 1.756001472945072e-05, "Finetune/Loss": 0.8243917226791382, "Finetune/Loss (Raw)": 0.7693854570388794, "Finetune/Step": 1245, "Finetune/Step Time": 2.88022324629128} +{"Finetune/Learning Rate": 1.7555751174849845e-05, "Finetune/Loss": 0.8245331048965454, "Finetune/Loss (Raw)": 0.7744244337081909, "Finetune/Step": 1246, "Finetune/Step Time": 2.8833756018429995} +{"Finetune/Learning Rate": 1.7551484417058656e-05, "Finetune/Loss": 0.8241488933563232, "Finetune/Loss (Raw)": 0.8806633949279785, "Finetune/Step": 1247, "Finetune/Step Time": 2.882854549214244} +{"Finetune/Learning Rate": 1.754721445788601e-05, "Finetune/Loss": 0.824061930179596, "Finetune/Loss (Raw)": 0.8921958804130554, "Finetune/Step": 1248, "Finetune/Step Time": 2.8855356127023697} +{"Finetune/Learning Rate": 1.7542941299142113e-05, "Finetune/Loss": 0.824261486530304, "Finetune/Loss (Raw)": 0.8539009094238281, "Finetune/Step": 1249, "Finetune/Step Time": 2.887090779840946} +{"Finetune/Learning Rate": 1.7538664942638535e-05, "Finetune/Loss": 0.824816107749939, "Finetune/Loss (Raw)": 0.9403382539749146, "Finetune/Step": 1250, "Finetune/Step Time": 2.8834375254809856} +{"Finetune/Learning Rate": 1.75343853901882e-05, "Finetune/Loss": 0.8249268531799316, "Finetune/Loss (Raw)": 0.7877901792526245, "Finetune/Step": 1251, "Finetune/Step Time": 2.8847699966281652} +{"Finetune/Learning Rate": 1.7530102643605377e-05, "Finetune/Loss": 0.8236620426177979, "Finetune/Loss (Raw)": 0.7774648666381836, "Finetune/Step": 1252, "Finetune/Step Time": 2.8847270756959915} +{"Finetune/Learning Rate": 1.7525816704705697e-05, "Finetune/Loss": 0.8236618041992188, "Finetune/Loss (Raw)": 0.7368030548095703, "Finetune/Step": 1253, "Finetune/Step Time": 2.8863578885793686} +{"Finetune/Learning Rate": 1.752152757530615e-05, "Finetune/Loss": 0.8242040872573853, "Finetune/Loss (Raw)": 0.7961856722831726, "Finetune/Step": 1254, "Finetune/Step Time": 2.8858592566102743} +{"Finetune/Learning Rate": 1.7517235257225066e-05, "Finetune/Loss": 0.824713945388794, "Finetune/Loss (Raw)": 0.934165894985199, "Finetune/Step": 1255, "Finetune/Step Time": 2.8868827242404222} +{"Finetune/Learning Rate": 1.7512939752282137e-05, "Finetune/Loss": 0.8228804469108582, "Finetune/Loss (Raw)": 0.684599757194519, "Finetune/Step": 1256, "Finetune/Step Time": 2.9216024298220873} +{"Finetune/Learning Rate": 1.7508641062298405e-05, "Finetune/Loss": 0.8238235116004944, "Finetune/Loss (Raw)": 0.6994661688804626, "Finetune/Step": 1257, "Finetune/Step Time": 2.898084392771125} +{"Finetune/Learning Rate": 1.7504339189096254e-05, "Finetune/Loss": 0.824343204498291, "Finetune/Loss (Raw)": 0.928135097026825, "Finetune/Step": 1258, "Finetune/Step Time": 2.8964101113379} +{"Finetune/Learning Rate": 1.7500034134499425e-05, "Finetune/Loss": 0.8276161551475525, "Finetune/Loss (Raw)": 0.8498623371124268, "Finetune/Step": 1259, "Finetune/Step Time": 2.8653624393045902} +{"Finetune/Learning Rate": 1.7495725900333008e-05, "Finetune/Loss": 0.8271322250366211, "Finetune/Loss (Raw)": 0.8727522492408752, "Finetune/Step": 1260, "Finetune/Step Time": 2.8671170715242624} +{"Finetune/Learning Rate": 1.7491414488423434e-05, "Finetune/Loss": 0.8280243873596191, "Finetune/Loss (Raw)": 0.8718786239624023, "Finetune/Step": 1261, "Finetune/Step Time": 2.867216130718589} +{"Finetune/Learning Rate": 1.748709990059849e-05, "Finetune/Loss": 0.8266350626945496, "Finetune/Loss (Raw)": 0.7680983543395996, "Finetune/Step": 1262, "Finetune/Step Time": 2.865346586331725} +{"Finetune/Learning Rate": 1.74827821386873e-05, "Finetune/Loss": 0.8266751766204834, "Finetune/Loss (Raw)": 0.8673917651176453, "Finetune/Step": 1263, "Finetune/Step Time": 2.8616067823022604} +{"Finetune/Learning Rate": 1.7478461204520346e-05, "Finetune/Loss": 0.8267332315444946, "Finetune/Loss (Raw)": 0.8065980672836304, "Finetune/Step": 1264, "Finetune/Step Time": 2.8676509503275156} +{"Finetune/Learning Rate": 1.7474137099929448e-05, "Finetune/Loss": 0.8266923427581787, "Finetune/Loss (Raw)": 0.8295460939407349, "Finetune/Step": 1265, "Finetune/Step Time": 2.8676758352667093} +{"Finetune/Learning Rate": 1.746980982674776e-05, "Finetune/Loss": 0.8267546892166138, "Finetune/Loss (Raw)": 0.9132338166236877, "Finetune/Step": 1266, "Finetune/Step Time": 2.8663601726293564} +{"Finetune/Learning Rate": 1.74654793868098e-05, "Finetune/Loss": 0.8259565830230713, "Finetune/Loss (Raw)": 0.8629318475723267, "Finetune/Step": 1267, "Finetune/Step Time": 2.86473935469985} +{"Finetune/Learning Rate": 1.7461145781951412e-05, "Finetune/Loss": 0.8265668153762817, "Finetune/Loss (Raw)": 0.8840107321739197, "Finetune/Step": 1268, "Finetune/Step Time": 2.8661059848964214} +{"Finetune/Learning Rate": 1.745680901400979e-05, "Finetune/Loss": 0.8270605802536011, "Finetune/Loss (Raw)": 0.9096551537513733, "Finetune/Step": 1269, "Finetune/Step Time": 2.866138316690922} +{"Finetune/Learning Rate": 1.7452469084823463e-05, "Finetune/Loss": 0.8254482746124268, "Finetune/Loss (Raw)": 0.7590950131416321, "Finetune/Step": 1270, "Finetune/Step Time": 2.864208372309804} +{"Finetune/Learning Rate": 1.7448125996232307e-05, "Finetune/Loss": 0.8252148628234863, "Finetune/Loss (Raw)": 0.81882244348526, "Finetune/Step": 1271, "Finetune/Step Time": 2.860544266179204} +{"Finetune/Learning Rate": 1.744377975007753e-05, "Finetune/Loss": 0.8262509107589722, "Finetune/Loss (Raw)": 0.7599062323570251, "Finetune/Step": 1272, "Finetune/Step Time": 2.8276347499340773} +{"Finetune/Learning Rate": 1.743943034820169e-05, "Finetune/Loss": 0.8261566162109375, "Finetune/Loss (Raw)": 0.8357954621315002, "Finetune/Step": 1273, "Finetune/Step Time": 2.8276517763733864} +{"Finetune/Learning Rate": 1.7435077792448666e-05, "Finetune/Loss": 0.8264367580413818, "Finetune/Loss (Raw)": 0.8878180980682373, "Finetune/Step": 1274, "Finetune/Step Time": 2.827910704538226} +{"Finetune/Learning Rate": 1.743072208466369e-05, "Finetune/Loss": 0.8278706073760986, "Finetune/Loss (Raw)": 0.8890042304992676, "Finetune/Step": 1275, "Finetune/Step Time": 2.8059075474739075} +{"Finetune/Learning Rate": 1.742636322669332e-05, "Finetune/Loss": 0.828571617603302, "Finetune/Loss (Raw)": 0.9207957983016968, "Finetune/Step": 1276, "Finetune/Step Time": 2.80208820104599} +{"Finetune/Learning Rate": 1.7422001220385457e-05, "Finetune/Loss": 0.8258094787597656, "Finetune/Loss (Raw)": 0.596145749092102, "Finetune/Step": 1277, "Finetune/Step Time": 2.828931584954262} +{"Finetune/Learning Rate": 1.741763606758933e-05, "Finetune/Loss": 0.8263324499130249, "Finetune/Loss (Raw)": 0.8906757235527039, "Finetune/Step": 1278, "Finetune/Step Time": 2.8261817693710327} +{"Finetune/Learning Rate": 1.7413267770155503e-05, "Finetune/Loss": 0.8265384435653687, "Finetune/Loss (Raw)": 0.8719862103462219, "Finetune/Step": 1279, "Finetune/Step Time": 2.827727133408189} +{"Finetune/Learning Rate": 1.740889632993588e-05, "Finetune/Loss": 0.8270899057388306, "Finetune/Loss (Raw)": 0.9000681042671204, "Finetune/Step": 1280, "Finetune/Step Time": 2.822909263893962} +{"Finetune/Learning Rate": 1.740452174878369e-05, "Finetune/Loss": 0.8263621926307678, "Finetune/Loss (Raw)": 0.7840168476104736, "Finetune/Step": 1281, "Finetune/Step Time": 2.818991443142295} +{"Finetune/Learning Rate": 1.7400144028553498e-05, "Finetune/Loss": 0.8259671926498413, "Finetune/Loss (Raw)": 0.9045742750167847, "Finetune/Step": 1282, "Finetune/Step Time": 2.8196030724793673} +{"Finetune/Learning Rate": 1.7395763171101193e-05, "Finetune/Loss": 0.8287447690963745, "Finetune/Loss (Raw)": 0.8617214560508728, "Finetune/Step": 1283, "Finetune/Step Time": 2.799892071634531} +{"Finetune/Learning Rate": 1.7391379178284e-05, "Finetune/Loss": 0.8287234902381897, "Finetune/Loss (Raw)": 0.892633855342865, "Finetune/Step": 1284, "Finetune/Step Time": 2.799760429188609} +{"Finetune/Learning Rate": 1.738699205196048e-05, "Finetune/Loss": 0.8287494778633118, "Finetune/Loss (Raw)": 0.926095724105835, "Finetune/Step": 1285, "Finetune/Step Time": 2.7984043154865503} +{"Finetune/Learning Rate": 1.7382601793990502e-05, "Finetune/Loss": 0.8279927968978882, "Finetune/Loss (Raw)": 0.835668683052063, "Finetune/Step": 1286, "Finetune/Step Time": 2.800574902445078} +{"Finetune/Learning Rate": 1.7378208406235278e-05, "Finetune/Loss": 0.8278073668479919, "Finetune/Loss (Raw)": 0.8485289812088013, "Finetune/Step": 1287, "Finetune/Step Time": 2.7998607996851206} +{"Finetune/Learning Rate": 1.7373811890557352e-05, "Finetune/Loss": 0.8316145539283752, "Finetune/Loss (Raw)": 0.7884959578514099, "Finetune/Step": 1288, "Finetune/Step Time": 2.7714552879333496} +{"Finetune/Learning Rate": 1.736941224882058e-05, "Finetune/Loss": 0.8315534591674805, "Finetune/Loss (Raw)": 0.8862133622169495, "Finetune/Step": 1289, "Finetune/Step Time": 2.766354478895664} +{"Finetune/Learning Rate": 1.7365009482890144e-05, "Finetune/Loss": 0.8320446014404297, "Finetune/Loss (Raw)": 0.8561446666717529, "Finetune/Step": 1290, "Finetune/Step Time": 2.762257795780897} +{"Finetune/Learning Rate": 1.7360603594632565e-05, "Finetune/Loss": 0.832236647605896, "Finetune/Loss (Raw)": 0.837786078453064, "Finetune/Step": 1291, "Finetune/Step Time": 2.765605553984642} +{"Finetune/Learning Rate": 1.7356194585915673e-05, "Finetune/Loss": 0.8272798657417297, "Finetune/Loss (Raw)": 0.242811918258667, "Finetune/Step": 1292, "Finetune/Step Time": 2.7948650550097227} +{"Finetune/Learning Rate": 1.735178245860863e-05, "Finetune/Loss": 0.8285604119300842, "Finetune/Loss (Raw)": 0.9543076753616333, "Finetune/Step": 1293, "Finetune/Step Time": 2.7980703227221966} +{"Finetune/Learning Rate": 1.7347367214581908e-05, "Finetune/Loss": 0.827777624130249, "Finetune/Loss (Raw)": 0.8270289897918701, "Finetune/Step": 1294, "Finetune/Step Time": 2.7967779487371445} +{"Finetune/Learning Rate": 1.734294885570732e-05, "Finetune/Loss": 0.827879786491394, "Finetune/Loss (Raw)": 0.8494250774383545, "Finetune/Step": 1295, "Finetune/Step Time": 2.7960876803845167} +{"Finetune/Learning Rate": 1.7338527383857982e-05, "Finetune/Loss": 0.8314186334609985, "Finetune/Loss (Raw)": 0.7536601424217224, "Finetune/Step": 1296, "Finetune/Step Time": 2.7708311285823584} +{"Finetune/Learning Rate": 1.7334102800908333e-05, "Finetune/Loss": 0.8305166363716125, "Finetune/Loss (Raw)": 0.7844668626785278, "Finetune/Step": 1297, "Finetune/Step Time": 2.772766124457121} +{"Finetune/Learning Rate": 1.7329675108734137e-05, "Finetune/Loss": 0.8303543925285339, "Finetune/Loss (Raw)": 0.8041268587112427, "Finetune/Step": 1298, "Finetune/Step Time": 2.775993812829256} +{"Finetune/Learning Rate": 1.7325244309212476e-05, "Finetune/Loss": 0.8301036357879639, "Finetune/Loss (Raw)": 0.869597315788269, "Finetune/Step": 1299, "Finetune/Step Time": 2.7767428383231163} +{"Finetune/Learning Rate": 1.7320810404221737e-05, "Finetune/Loss": 0.8316055536270142, "Finetune/Loss (Raw)": 0.9402100443840027, "Finetune/Step": 1300, "Finetune/Step Time": 2.752787886187434} +{"Finetune/Learning Rate": 1.7316373395641644e-05, "Finetune/Loss": 0.8322008848190308, "Finetune/Loss (Raw)": 0.9340486526489258, "Finetune/Step": 1301, "Finetune/Step Time": 2.754285706207156} +{"Finetune/Learning Rate": 1.7311933285353216e-05, "Finetune/Loss": 0.8312029242515564, "Finetune/Loss (Raw)": 0.7965303063392639, "Finetune/Step": 1302, "Finetune/Step Time": 2.7537780087441206} +{"Finetune/Learning Rate": 1.7307490075238802e-05, "Finetune/Loss": 0.8289847373962402, "Finetune/Loss (Raw)": 0.6046091318130493, "Finetune/Step": 1303, "Finetune/Step Time": 2.7733097951859236} +{"Finetune/Learning Rate": 1.7303043767182058e-05, "Finetune/Loss": 0.8287599086761475, "Finetune/Loss (Raw)": 0.8456055521965027, "Finetune/Step": 1304, "Finetune/Step Time": 2.775354117155075} +{"Finetune/Learning Rate": 1.7298594363067955e-05, "Finetune/Loss": 0.8290010094642639, "Finetune/Loss (Raw)": 0.8837473392486572, "Finetune/Step": 1305, "Finetune/Step Time": 2.774317616596818} +{"Finetune/Learning Rate": 1.7294141864782777e-05, "Finetune/Loss": 0.8290041089057922, "Finetune/Loss (Raw)": 0.9114137887954712, "Finetune/Step": 1306, "Finetune/Step Time": 2.771095249801874} +{"Finetune/Learning Rate": 1.7289686274214116e-05, "Finetune/Loss": 0.8293048143386841, "Finetune/Loss (Raw)": 0.8187944293022156, "Finetune/Step": 1307, "Finetune/Step Time": 2.7677062954753637} +{"Finetune/Learning Rate": 1.728522759325088e-05, "Finetune/Loss": 0.8295847177505493, "Finetune/Loss (Raw)": 0.8420013785362244, "Finetune/Step": 1308, "Finetune/Step Time": 2.7712046429514885} +{"Finetune/Learning Rate": 1.728076582378329e-05, "Finetune/Loss": 0.8287546634674072, "Finetune/Loss (Raw)": 0.782780647277832, "Finetune/Step": 1309, "Finetune/Step Time": 2.768581159412861} +{"Finetune/Learning Rate": 1.7276300967702863e-05, "Finetune/Loss": 0.8292961120605469, "Finetune/Loss (Raw)": 0.8864094018936157, "Finetune/Step": 1310, "Finetune/Step Time": 2.7663258500397205} +{"Finetune/Learning Rate": 1.727183302690244e-05, "Finetune/Loss": 0.8281892538070679, "Finetune/Loss (Raw)": 0.7648880481719971, "Finetune/Step": 1311, "Finetune/Step Time": 2.764001052826643} +{"Finetune/Learning Rate": 1.7267362003276157e-05, "Finetune/Loss": 0.8284620046615601, "Finetune/Loss (Raw)": 0.8779050707817078, "Finetune/Step": 1312, "Finetune/Step Time": 2.7754263766109943} +{"Finetune/Learning Rate": 1.726288789871947e-05, "Finetune/Loss": 0.8279537558555603, "Finetune/Loss (Raw)": 0.608333170413971, "Finetune/Step": 1313, "Finetune/Step Time": 2.776374828070402} +{"Finetune/Learning Rate": 1.725841071512913e-05, "Finetune/Loss": 0.8291720151901245, "Finetune/Loss (Raw)": 0.9738296866416931, "Finetune/Step": 1314, "Finetune/Step Time": 2.7715102024376392} +{"Finetune/Learning Rate": 1.7253930454403194e-05, "Finetune/Loss": 0.8271011114120483, "Finetune/Loss (Raw)": 0.6999091506004333, "Finetune/Step": 1315, "Finetune/Step Time": 2.7956793140619993} +{"Finetune/Learning Rate": 1.724944711844103e-05, "Finetune/Loss": 0.8268418312072754, "Finetune/Loss (Raw)": 0.8023658990859985, "Finetune/Step": 1316, "Finetune/Step Time": 2.7960953656584024} +{"Finetune/Learning Rate": 1.724496070914331e-05, "Finetune/Loss": 0.8270470499992371, "Finetune/Loss (Raw)": 0.9199334383010864, "Finetune/Step": 1317, "Finetune/Step Time": 2.7948485650122166} +{"Finetune/Learning Rate": 1.7240471228412e-05, "Finetune/Loss": 0.8276950120925903, "Finetune/Loss (Raw)": 0.9291690587997437, "Finetune/Step": 1318, "Finetune/Step Time": 2.7927687037736177} +{"Finetune/Learning Rate": 1.7235978678150375e-05, "Finetune/Loss": 0.8282577395439148, "Finetune/Loss (Raw)": 0.9186044931411743, "Finetune/Step": 1319, "Finetune/Step Time": 2.7914607860147953} +{"Finetune/Learning Rate": 1.7231483060263012e-05, "Finetune/Loss": 0.8284060955047607, "Finetune/Loss (Raw)": 0.8016653060913086, "Finetune/Step": 1320, "Finetune/Step Time": 2.789247941225767} +{"Finetune/Learning Rate": 1.7226984376655784e-05, "Finetune/Loss": 0.8270339369773865, "Finetune/Loss (Raw)": 0.6292393207550049, "Finetune/Step": 1321, "Finetune/Step Time": 2.8155587185174227} +{"Finetune/Learning Rate": 1.7222482629235868e-05, "Finetune/Loss": 0.8270432949066162, "Finetune/Loss (Raw)": 0.8222634792327881, "Finetune/Step": 1322, "Finetune/Step Time": 2.816039362922311} +{"Finetune/Learning Rate": 1.7217977819911732e-05, "Finetune/Loss": 0.8233369588851929, "Finetune/Loss (Raw)": 0.325131356716156, "Finetune/Step": 1323, "Finetune/Step Time": 2.8461615703999996} +{"Finetune/Learning Rate": 1.7213469950593156e-05, "Finetune/Loss": 0.8223837614059448, "Finetune/Loss (Raw)": 0.7434645891189575, "Finetune/Step": 1324, "Finetune/Step Time": 2.844129964709282} +{"Finetune/Learning Rate": 1.7208959023191205e-05, "Finetune/Loss": 0.8199777603149414, "Finetune/Loss (Raw)": 0.44071128964424133, "Finetune/Step": 1325, "Finetune/Step Time": 2.8744548242539167} +{"Finetune/Learning Rate": 1.7204445039618246e-05, "Finetune/Loss": 0.8189324736595154, "Finetune/Loss (Raw)": 0.823924720287323, "Finetune/Step": 1326, "Finetune/Step Time": 2.8758595660328865} +{"Finetune/Learning Rate": 1.719992800178794e-05, "Finetune/Loss": 0.8198385834693909, "Finetune/Loss (Raw)": 0.8453913927078247, "Finetune/Step": 1327, "Finetune/Step Time": 2.873138414695859} +{"Finetune/Learning Rate": 1.7195407911615243e-05, "Finetune/Loss": 0.8259060382843018, "Finetune/Loss (Raw)": 0.9408496618270874, "Finetune/Step": 1328, "Finetune/Step Time": 2.831484703347087} +{"Finetune/Learning Rate": 1.7190884771016404e-05, "Finetune/Loss": 0.8270391225814819, "Finetune/Loss (Raw)": 0.836396336555481, "Finetune/Step": 1329, "Finetune/Step Time": 2.808875150978565} +{"Finetune/Learning Rate": 1.7186358581908965e-05, "Finetune/Loss": 0.827763557434082, "Finetune/Loss (Raw)": 0.8796489834785461, "Finetune/Step": 1330, "Finetune/Step Time": 2.8126947078853846} +{"Finetune/Learning Rate": 1.7181829346211766e-05, "Finetune/Loss": 0.8280712366104126, "Finetune/Loss (Raw)": 0.9052091240882874, "Finetune/Step": 1331, "Finetune/Step Time": 2.8085273392498493} +{"Finetune/Learning Rate": 1.717729706584493e-05, "Finetune/Loss": 0.8286265134811401, "Finetune/Loss (Raw)": 0.8905409574508667, "Finetune/Step": 1332, "Finetune/Step Time": 2.811130542308092} +{"Finetune/Learning Rate": 1.717276174272988e-05, "Finetune/Loss": 0.8282794952392578, "Finetune/Loss (Raw)": 0.7921075224876404, "Finetune/Step": 1333, "Finetune/Step Time": 2.8106034118682146} +{"Finetune/Learning Rate": 1.7168223378789318e-05, "Finetune/Loss": 0.824481725692749, "Finetune/Loss (Raw)": 0.3162355422973633, "Finetune/Step": 1334, "Finetune/Step Time": 2.8437765277922153} +{"Finetune/Learning Rate": 1.716368197594725e-05, "Finetune/Loss": 0.8255643844604492, "Finetune/Loss (Raw)": 0.9136882424354553, "Finetune/Step": 1335, "Finetune/Step Time": 2.843545598909259} +{"Finetune/Learning Rate": 1.715913753612895e-05, "Finetune/Loss": 0.824384331703186, "Finetune/Loss (Raw)": 0.7615746259689331, "Finetune/Step": 1336, "Finetune/Step Time": 2.8456214480102062} +{"Finetune/Learning Rate": 1.7154590061261e-05, "Finetune/Loss": 0.8238672018051147, "Finetune/Loss (Raw)": 0.7087269425392151, "Finetune/Step": 1337, "Finetune/Step Time": 2.8671732041984797} +{"Finetune/Learning Rate": 1.7150039553271252e-05, "Finetune/Loss": 0.8236900568008423, "Finetune/Loss (Raw)": 0.9027078747749329, "Finetune/Step": 1338, "Finetune/Step Time": 2.867493949830532} +{"Finetune/Learning Rate": 1.7145486014088857e-05, "Finetune/Loss": 0.8239618539810181, "Finetune/Loss (Raw)": 0.8842819333076477, "Finetune/Step": 1339, "Finetune/Step Time": 2.86808168515563} +{"Finetune/Learning Rate": 1.7140929445644247e-05, "Finetune/Loss": 0.8230667114257812, "Finetune/Loss (Raw)": 0.8376222848892212, "Finetune/Step": 1340, "Finetune/Step Time": 2.8674010187387466} +{"Finetune/Learning Rate": 1.713636984986913e-05, "Finetune/Loss": 0.8222554922103882, "Finetune/Loss (Raw)": 0.8020974397659302, "Finetune/Step": 1341, "Finetune/Step Time": 2.871249770745635} +{"Finetune/Learning Rate": 1.713180722869651e-05, "Finetune/Loss": 0.8212776184082031, "Finetune/Loss (Raw)": 0.8334483504295349, "Finetune/Step": 1342, "Finetune/Step Time": 2.869814494624734} +{"Finetune/Learning Rate": 1.712724158406067e-05, "Finetune/Loss": 0.8209176659584045, "Finetune/Loss (Raw)": 0.7659353017807007, "Finetune/Step": 1343, "Finetune/Step Time": 2.8666091952472925} +{"Finetune/Learning Rate": 1.712267291789716e-05, "Finetune/Loss": 0.8208556175231934, "Finetune/Loss (Raw)": 0.8999051451683044, "Finetune/Step": 1344, "Finetune/Step Time": 2.8675896171480417} +{"Finetune/Learning Rate": 1.7118101232142838e-05, "Finetune/Loss": 0.8207367062568665, "Finetune/Loss (Raw)": 0.9044011235237122, "Finetune/Step": 1345, "Finetune/Step Time": 2.863860797137022} +{"Finetune/Learning Rate": 1.7113526528735817e-05, "Finetune/Loss": 0.8205784559249878, "Finetune/Loss (Raw)": 0.7971246242523193, "Finetune/Step": 1346, "Finetune/Step Time": 2.863622635602951} +{"Finetune/Learning Rate": 1.7108948809615507e-05, "Finetune/Loss": 0.8184254765510559, "Finetune/Loss (Raw)": 0.6820647120475769, "Finetune/Step": 1347, "Finetune/Step Time": 2.880914878100157} +{"Finetune/Learning Rate": 1.7104368076722585e-05, "Finetune/Loss": 0.8179978132247925, "Finetune/Loss (Raw)": 0.7932178378105164, "Finetune/Step": 1348, "Finetune/Step Time": 2.882136955857277} +{"Finetune/Learning Rate": 1.709978433199901e-05, "Finetune/Loss": 0.8151271343231201, "Finetune/Loss (Raw)": 0.5847909450531006, "Finetune/Step": 1349, "Finetune/Step Time": 2.9038434736430645} +{"Finetune/Learning Rate": 1.7095197577388022e-05, "Finetune/Loss": 0.8142842054367065, "Finetune/Loss (Raw)": 0.7831578850746155, "Finetune/Step": 1350, "Finetune/Step Time": 2.9061166997998953} +{"Finetune/Learning Rate": 1.7090607814834133e-05, "Finetune/Loss": 0.8146638870239258, "Finetune/Loss (Raw)": 0.8691932559013367, "Finetune/Step": 1351, "Finetune/Step Time": 2.904518362134695} +{"Finetune/Learning Rate": 1.7086015046283123e-05, "Finetune/Loss": 0.8128132820129395, "Finetune/Loss (Raw)": 0.5694049596786499, "Finetune/Step": 1352, "Finetune/Step Time": 2.9309081714600325} +{"Finetune/Learning Rate": 1.708141927368206e-05, "Finetune/Loss": 0.8132971525192261, "Finetune/Loss (Raw)": 0.9352414011955261, "Finetune/Step": 1353, "Finetune/Step Time": 2.9298299793154} +{"Finetune/Learning Rate": 1.7076820498979273e-05, "Finetune/Loss": 0.8132354617118835, "Finetune/Loss (Raw)": 0.890933096408844, "Finetune/Step": 1354, "Finetune/Step Time": 2.929266734048724} +{"Finetune/Learning Rate": 1.7072218724124375e-05, "Finetune/Loss": 0.8131794929504395, "Finetune/Loss (Raw)": 0.7987068891525269, "Finetune/Step": 1355, "Finetune/Step Time": 2.933284994214773} +{"Finetune/Learning Rate": 1.706761395106825e-05, "Finetune/Loss": 0.8136583566665649, "Finetune/Loss (Raw)": 0.8789314031600952, "Finetune/Step": 1356, "Finetune/Step Time": 2.9287507757544518} +{"Finetune/Learning Rate": 1.7063006181763037e-05, "Finetune/Loss": 0.8131358623504639, "Finetune/Loss (Raw)": 0.846234142780304, "Finetune/Step": 1357, "Finetune/Step Time": 2.9287733137607574} +{"Finetune/Learning Rate": 1.705839541816216e-05, "Finetune/Loss": 0.8135476112365723, "Finetune/Loss (Raw)": 0.8571632504463196, "Finetune/Step": 1358, "Finetune/Step Time": 2.930003546178341} +{"Finetune/Learning Rate": 1.705378166222032e-05, "Finetune/Loss": 0.8125807046890259, "Finetune/Loss (Raw)": 0.7858079075813293, "Finetune/Step": 1359, "Finetune/Step Time": 2.926152614876628} +{"Finetune/Learning Rate": 1.704916491589346e-05, "Finetune/Loss": 0.8130512237548828, "Finetune/Loss (Raw)": 0.8228393197059631, "Finetune/Step": 1360, "Finetune/Step Time": 2.9288852997124195} +{"Finetune/Learning Rate": 1.7044545181138818e-05, "Finetune/Loss": 0.8131530284881592, "Finetune/Loss (Raw)": 0.8732925653457642, "Finetune/Step": 1361, "Finetune/Step Time": 2.928923584520817} +{"Finetune/Learning Rate": 1.703992245991488e-05, "Finetune/Loss": 0.8121623992919922, "Finetune/Loss (Raw)": 0.7747910618782043, "Finetune/Step": 1362, "Finetune/Step Time": 2.9272761661559343} +{"Finetune/Learning Rate": 1.7035296754181418e-05, "Finetune/Loss": 0.8114166259765625, "Finetune/Loss (Raw)": 0.812537670135498, "Finetune/Step": 1363, "Finetune/Step Time": 2.925477996468544} +{"Finetune/Learning Rate": 1.703066806589944e-05, "Finetune/Loss": 0.8153088092803955, "Finetune/Loss (Raw)": 0.8154289722442627, "Finetune/Step": 1364, "Finetune/Step Time": 2.8985121324658394} +{"Finetune/Learning Rate": 1.702603639703125e-05, "Finetune/Loss": 0.8147493600845337, "Finetune/Loss (Raw)": 0.7318340539932251, "Finetune/Step": 1365, "Finetune/Step Time": 2.8992522954940796} +{"Finetune/Learning Rate": 1.7021401749540386e-05, "Finetune/Loss": 0.815043568611145, "Finetune/Loss (Raw)": 0.8196877241134644, "Finetune/Step": 1366, "Finetune/Step Time": 2.8959046006202698} +{"Finetune/Learning Rate": 1.7016764125391675e-05, "Finetune/Loss": 0.8147196769714355, "Finetune/Loss (Raw)": 0.8741896152496338, "Finetune/Step": 1367, "Finetune/Step Time": 2.898063201457262} +{"Finetune/Learning Rate": 1.7012123526551193e-05, "Finetune/Loss": 0.8148818612098694, "Finetune/Loss (Raw)": 0.8283849358558655, "Finetune/Step": 1368, "Finetune/Step Time": 2.9114043042063713} +{"Finetune/Learning Rate": 1.7007479954986275e-05, "Finetune/Loss": 0.8146287202835083, "Finetune/Loss (Raw)": 0.8868182897567749, "Finetune/Step": 1369, "Finetune/Step Time": 2.907098228111863} +{"Finetune/Learning Rate": 1.7002833412665527e-05, "Finetune/Loss": 0.8156472444534302, "Finetune/Loss (Raw)": 0.9538360238075256, "Finetune/Step": 1370, "Finetune/Step Time": 2.9033732563257217} +{"Finetune/Learning Rate": 1.69981839015588e-05, "Finetune/Loss": 0.815454363822937, "Finetune/Loss (Raw)": 0.796973705291748, "Finetune/Step": 1371, "Finetune/Step Time": 2.9025005474686623} +{"Finetune/Learning Rate": 1.699353142363721e-05, "Finetune/Loss": 0.8153400421142578, "Finetune/Loss (Raw)": 0.8237826824188232, "Finetune/Step": 1372, "Finetune/Step Time": 2.9039213843643665} +{"Finetune/Learning Rate": 1.698887598087314e-05, "Finetune/Loss": 0.8113632202148438, "Finetune/Loss (Raw)": 0.2603510320186615, "Finetune/Step": 1373, "Finetune/Step Time": 2.930434636771679} +{"Finetune/Learning Rate": 1.6984217575240212e-05, "Finetune/Loss": 0.8076145648956299, "Finetune/Loss (Raw)": 0.2945997416973114, "Finetune/Step": 1374, "Finetune/Step Time": 2.960051706060767} +{"Finetune/Learning Rate": 1.6979556208713318e-05, "Finetune/Loss": 0.8079644441604614, "Finetune/Loss (Raw)": 0.9254509210586548, "Finetune/Step": 1375, "Finetune/Step Time": 2.959274163469672} +{"Finetune/Learning Rate": 1.6974891883268605e-05, "Finetune/Loss": 0.8073478937149048, "Finetune/Loss (Raw)": 0.8132804036140442, "Finetune/Step": 1376, "Finetune/Step Time": 2.961322760209441} +{"Finetune/Learning Rate": 1.6970224600883463e-05, "Finetune/Loss": 0.8071286082267761, "Finetune/Loss (Raw)": 0.8258263468742371, "Finetune/Step": 1377, "Finetune/Step Time": 2.9610157143324614} +{"Finetune/Learning Rate": 1.6965554363536546e-05, "Finetune/Loss": 0.8067127466201782, "Finetune/Loss (Raw)": 0.8871038556098938, "Finetune/Step": 1378, "Finetune/Step Time": 2.9624913036823273} +{"Finetune/Learning Rate": 1.6960881173207762e-05, "Finetune/Loss": 0.8070733547210693, "Finetune/Loss (Raw)": 0.8339532613754272, "Finetune/Step": 1379, "Finetune/Step Time": 2.9614545851945877} +{"Finetune/Learning Rate": 1.695620503187826e-05, "Finetune/Loss": 0.808214008808136, "Finetune/Loss (Raw)": 0.9234710335731506, "Finetune/Step": 1380, "Finetune/Step Time": 2.959540292620659} +{"Finetune/Learning Rate": 1.695152594153045e-05, "Finetune/Loss": 0.8097906112670898, "Finetune/Loss (Raw)": 0.938606321811676, "Finetune/Step": 1381, "Finetune/Step Time": 2.954292371869087} +{"Finetune/Learning Rate": 1.6946843904147985e-05, "Finetune/Loss": 0.810154914855957, "Finetune/Loss (Raw)": 0.8428173661231995, "Finetune/Step": 1382, "Finetune/Step Time": 2.954283306375146} +{"Finetune/Learning Rate": 1.6942158921715775e-05, "Finetune/Loss": 0.8088352084159851, "Finetune/Loss (Raw)": 0.7652376294136047, "Finetune/Step": 1383, "Finetune/Step Time": 2.9551924392580986} +{"Finetune/Learning Rate": 1.6937470996219972e-05, "Finetune/Loss": 0.8096778392791748, "Finetune/Loss (Raw)": 0.7924625873565674, "Finetune/Step": 1384, "Finetune/Step Time": 2.921486083418131} +{"Finetune/Learning Rate": 1.6932780129647985e-05, "Finetune/Loss": 0.8103185892105103, "Finetune/Loss (Raw)": 0.7814859747886658, "Finetune/Step": 1385, "Finetune/Step Time": 2.9234440997242928} +{"Finetune/Learning Rate": 1.6928086323988452e-05, "Finetune/Loss": 0.8094232678413391, "Finetune/Loss (Raw)": 0.8135301470756531, "Finetune/Step": 1386, "Finetune/Step Time": 2.923261681571603} +{"Finetune/Learning Rate": 1.6923389581231275e-05, "Finetune/Loss": 0.8091747164726257, "Finetune/Loss (Raw)": 0.8180480599403381, "Finetune/Step": 1387, "Finetune/Step Time": 2.925242794677615} +{"Finetune/Learning Rate": 1.69186899033676e-05, "Finetune/Loss": 0.8090892434120178, "Finetune/Loss (Raw)": 0.8618139028549194, "Finetune/Step": 1388, "Finetune/Step Time": 2.9230000115931034} +{"Finetune/Learning Rate": 1.6913987292389795e-05, "Finetune/Loss": 0.8092223405838013, "Finetune/Loss (Raw)": 0.8889071941375732, "Finetune/Step": 1389, "Finetune/Step Time": 2.9272032603621483} +{"Finetune/Learning Rate": 1.6909281750291504e-05, "Finetune/Loss": 0.8104326128959656, "Finetune/Loss (Raw)": 0.9230192303657532, "Finetune/Step": 1390, "Finetune/Step Time": 2.923554502427578} +{"Finetune/Learning Rate": 1.690457327906759e-05, "Finetune/Loss": 0.8100597858428955, "Finetune/Loss (Raw)": 0.8196653127670288, "Finetune/Step": 1391, "Finetune/Step Time": 2.920533461496234} +{"Finetune/Learning Rate": 1.689986188071417e-05, "Finetune/Loss": 0.8104097843170166, "Finetune/Loss (Raw)": 0.8513957262039185, "Finetune/Step": 1392, "Finetune/Step Time": 2.912935497239232} +{"Finetune/Learning Rate": 1.6895147557228595e-05, "Finetune/Loss": 0.8101239204406738, "Finetune/Loss (Raw)": 0.7929527163505554, "Finetune/Step": 1393, "Finetune/Step Time": 2.915222281590104} +{"Finetune/Learning Rate": 1.6890430310609457e-05, "Finetune/Loss": 0.8099050521850586, "Finetune/Loss (Raw)": 0.8852320313453674, "Finetune/Step": 1394, "Finetune/Step Time": 2.914027715101838} +{"Finetune/Learning Rate": 1.688571014285659e-05, "Finetune/Loss": 0.8100799322128296, "Finetune/Loss (Raw)": 0.8853124976158142, "Finetune/Step": 1395, "Finetune/Step Time": 2.913287753239274} +{"Finetune/Learning Rate": 1.6880987055971064e-05, "Finetune/Loss": 0.8098553419113159, "Finetune/Loss (Raw)": 0.8552638292312622, "Finetune/Step": 1396, "Finetune/Step Time": 2.9084163550287485} +{"Finetune/Learning Rate": 1.6876261051955188e-05, "Finetune/Loss": 0.8095011711120605, "Finetune/Loss (Raw)": 0.8643196821212769, "Finetune/Step": 1397, "Finetune/Step Time": 2.910184197127819} +{"Finetune/Learning Rate": 1.6871532132812513e-05, "Finetune/Loss": 0.8098328709602356, "Finetune/Loss (Raw)": 0.8015516996383667, "Finetune/Step": 1398, "Finetune/Step Time": 2.913956865668297} +{"Finetune/Learning Rate": 1.6866800300547814e-05, "Finetune/Loss": 0.8104369044303894, "Finetune/Loss (Raw)": 0.896135687828064, "Finetune/Step": 1399, "Finetune/Step Time": 2.91362183354795} +{"Finetune/Learning Rate": 1.6862065557167105e-05, "Finetune/Loss": 0.8120484352111816, "Finetune/Loss (Raw)": 0.9661819338798523, "Finetune/Step": 1400, "Finetune/Step Time": 2.911573078483343} +{"Finetune/Learning Rate": 1.6857327904677645e-05, "Finetune/Loss": 0.8098650574684143, "Finetune/Loss (Raw)": 0.556324303150177, "Finetune/Step": 1401, "Finetune/Step Time": 2.934504257515073} +{"Finetune/Learning Rate": 1.685258734508791e-05, "Finetune/Loss": 0.8085996508598328, "Finetune/Loss (Raw)": 0.725848376750946, "Finetune/Step": 1402, "Finetune/Step Time": 2.935074346140027} +{"Finetune/Learning Rate": 1.684784388040762e-05, "Finetune/Loss": 0.8086928129196167, "Finetune/Loss (Raw)": 0.9009284377098083, "Finetune/Step": 1403, "Finetune/Step Time": 2.937621582299471} +{"Finetune/Learning Rate": 1.6843097512647718e-05, "Finetune/Loss": 0.8069424629211426, "Finetune/Loss (Raw)": 0.6967509984970093, "Finetune/Step": 1404, "Finetune/Step Time": 2.9635832142084837} +{"Finetune/Learning Rate": 1.683834824382039e-05, "Finetune/Loss": 0.8087568283081055, "Finetune/Loss (Raw)": 0.8283880949020386, "Finetune/Step": 1405, "Finetune/Step Time": 2.9382103122770786} +{"Finetune/Learning Rate": 1.683359607593904e-05, "Finetune/Loss": 0.8083819150924683, "Finetune/Loss (Raw)": 0.842685878276825, "Finetune/Step": 1406, "Finetune/Step Time": 2.9374268893152475} +{"Finetune/Learning Rate": 1.6828841011018302e-05, "Finetune/Loss": 0.8086236119270325, "Finetune/Loss (Raw)": 0.9029192924499512, "Finetune/Step": 1407, "Finetune/Step Time": 2.9350056927651167} +{"Finetune/Learning Rate": 1.682408305107405e-05, "Finetune/Loss": 0.8079017400741577, "Finetune/Loss (Raw)": 0.8076672554016113, "Finetune/Step": 1408, "Finetune/Step Time": 2.9392901193350554} +{"Finetune/Learning Rate": 1.6819322198123368e-05, "Finetune/Loss": 0.8086084723472595, "Finetune/Loss (Raw)": 0.874478280544281, "Finetune/Step": 1409, "Finetune/Step Time": 2.941698130220175} +{"Finetune/Learning Rate": 1.6814558454184577e-05, "Finetune/Loss": 0.8077136874198914, "Finetune/Loss (Raw)": 0.7900444865226746, "Finetune/Step": 1410, "Finetune/Step Time": 2.941414652392268} +{"Finetune/Learning Rate": 1.6809791821277225e-05, "Finetune/Loss": 0.8071132898330688, "Finetune/Loss (Raw)": 0.7848635911941528, "Finetune/Step": 1411, "Finetune/Step Time": 2.9366426710039377} +{"Finetune/Learning Rate": 1.680502230142208e-05, "Finetune/Loss": 0.806835412979126, "Finetune/Loss (Raw)": 0.857080340385437, "Finetune/Step": 1412, "Finetune/Step Time": 2.93421720713377} +{"Finetune/Learning Rate": 1.6800249896641142e-05, "Finetune/Loss": 0.806259036064148, "Finetune/Loss (Raw)": 0.8523080348968506, "Finetune/Step": 1413, "Finetune/Step Time": 2.9347072783857584} +{"Finetune/Learning Rate": 1.6795474608957615e-05, "Finetune/Loss": 0.8064632415771484, "Finetune/Loss (Raw)": 0.8618108630180359, "Finetune/Step": 1414, "Finetune/Step Time": 2.9334242567420006} +{"Finetune/Learning Rate": 1.6790696440395947e-05, "Finetune/Loss": 0.8060092926025391, "Finetune/Loss (Raw)": 0.7904260158538818, "Finetune/Step": 1415, "Finetune/Step Time": 2.932284252718091} +{"Finetune/Learning Rate": 1.6785915392981795e-05, "Finetune/Loss": 0.8063502311706543, "Finetune/Loss (Raw)": 0.8321311473846436, "Finetune/Step": 1416, "Finetune/Step Time": 2.931516529992223} +{"Finetune/Learning Rate": 1.678113146874204e-05, "Finetune/Loss": 0.8061513900756836, "Finetune/Loss (Raw)": 0.8607637882232666, "Finetune/Step": 1417, "Finetune/Step Time": 2.9336890187114477} +{"Finetune/Learning Rate": 1.6776344669704778e-05, "Finetune/Loss": 0.8062211871147156, "Finetune/Loss (Raw)": 0.8650766015052795, "Finetune/Step": 1418, "Finetune/Step Time": 2.9357437323778868} +{"Finetune/Learning Rate": 1.6771554997899335e-05, "Finetune/Loss": 0.8069403171539307, "Finetune/Loss (Raw)": 0.9298338294029236, "Finetune/Step": 1419, "Finetune/Step Time": 2.9303754568099976} +{"Finetune/Learning Rate": 1.6766762455356242e-05, "Finetune/Loss": 0.8117170333862305, "Finetune/Loss (Raw)": 0.8542407751083374, "Finetune/Step": 1420, "Finetune/Step Time": 2.9005642663687468} +{"Finetune/Learning Rate": 1.6761967044107258e-05, "Finetune/Loss": 0.811343789100647, "Finetune/Loss (Raw)": 0.9065249562263489, "Finetune/Step": 1421, "Finetune/Step Time": 2.895423576235771} +{"Finetune/Learning Rate": 1.675716876618535e-05, "Finetune/Loss": 0.8123241662979126, "Finetune/Loss (Raw)": 0.9525164365768433, "Finetune/Step": 1422, "Finetune/Step Time": 2.8952610082924366} +{"Finetune/Learning Rate": 1.67523676236247e-05, "Finetune/Loss": 0.8123397827148438, "Finetune/Loss (Raw)": 0.851421594619751, "Finetune/Step": 1423, "Finetune/Step Time": 2.8973369263112545} +{"Finetune/Learning Rate": 1.674756361846071e-05, "Finetune/Loss": 0.8131762742996216, "Finetune/Loss (Raw)": 0.8607350587844849, "Finetune/Step": 1424, "Finetune/Step Time": 2.906519927084446} +{"Finetune/Learning Rate": 1.6742756752729996e-05, "Finetune/Loss": 0.814062237739563, "Finetune/Loss (Raw)": 0.8978725671768188, "Finetune/Step": 1425, "Finetune/Step Time": 2.902979088947177} +{"Finetune/Learning Rate": 1.6737947028470386e-05, "Finetune/Loss": 0.8146856427192688, "Finetune/Loss (Raw)": 0.8839178085327148, "Finetune/Step": 1426, "Finetune/Step Time": 2.90107180736959} +{"Finetune/Learning Rate": 1.673313444772091e-05, "Finetune/Loss": 0.8148094415664673, "Finetune/Loss (Raw)": 0.8854425549507141, "Finetune/Step": 1427, "Finetune/Step Time": 2.9005605205893517} +{"Finetune/Learning Rate": 1.672831901252182e-05, "Finetune/Loss": 0.810338020324707, "Finetune/Loss (Raw)": 0.36787888407707214, "Finetune/Step": 1428, "Finetune/Step Time": 2.9344354830682278} +{"Finetune/Learning Rate": 1.6723500724914578e-05, "Finetune/Loss": 0.8090140223503113, "Finetune/Loss (Raw)": 0.7645684480667114, "Finetune/Step": 1429, "Finetune/Step Time": 2.935099456459284} +{"Finetune/Learning Rate": 1.6718679586941847e-05, "Finetune/Loss": 0.809307873249054, "Finetune/Loss (Raw)": 0.834145724773407, "Finetune/Step": 1430, "Finetune/Step Time": 2.9337510615587234} +{"Finetune/Learning Rate": 1.6713855600647512e-05, "Finetune/Loss": 0.8112756013870239, "Finetune/Loss (Raw)": 0.856474757194519, "Finetune/Step": 1431, "Finetune/Step Time": 2.9139499608427286} +{"Finetune/Learning Rate": 1.6709028768076644e-05, "Finetune/Loss": 0.810842752456665, "Finetune/Loss (Raw)": 0.7902098298072815, "Finetune/Step": 1432, "Finetune/Step Time": 2.9103142209351063} +{"Finetune/Learning Rate": 1.6704199091275544e-05, "Finetune/Loss": 0.8100037574768066, "Finetune/Loss (Raw)": 0.7763439416885376, "Finetune/Step": 1433, "Finetune/Step Time": 2.912091040983796} +{"Finetune/Learning Rate": 1.6699366572291704e-05, "Finetune/Loss": 0.809884250164032, "Finetune/Loss (Raw)": 0.8961215615272522, "Finetune/Step": 1434, "Finetune/Step Time": 2.915825130417943} +{"Finetune/Learning Rate": 1.6694531213173828e-05, "Finetune/Loss": 0.8099276423454285, "Finetune/Loss (Raw)": 0.824351966381073, "Finetune/Step": 1435, "Finetune/Step Time": 2.9194276053458452} +{"Finetune/Learning Rate": 1.668969301597182e-05, "Finetune/Loss": 0.810387134552002, "Finetune/Loss (Raw)": 0.9008128643035889, "Finetune/Step": 1436, "Finetune/Step Time": 2.9180111698806286} +{"Finetune/Learning Rate": 1.668485198273679e-05, "Finetune/Loss": 0.8112990856170654, "Finetune/Loss (Raw)": 0.8995105028152466, "Finetune/Step": 1437, "Finetune/Step Time": 2.914508456364274} +{"Finetune/Learning Rate": 1.6680008115521045e-05, "Finetune/Loss": 0.8108209371566772, "Finetune/Loss (Raw)": 0.8252081871032715, "Finetune/Step": 1438, "Finetune/Step Time": 2.9150065183639526} +{"Finetune/Learning Rate": 1.6675161416378103e-05, "Finetune/Loss": 0.8120143413543701, "Finetune/Loss (Raw)": 0.9176447987556458, "Finetune/Step": 1439, "Finetune/Step Time": 2.919325415045023} +{"Finetune/Learning Rate": 1.6670311887362675e-05, "Finetune/Loss": 0.8109617233276367, "Finetune/Loss (Raw)": 0.7431713938713074, "Finetune/Step": 1440, "Finetune/Step Time": 2.908132003620267} +{"Finetune/Learning Rate": 1.6665459530530666e-05, "Finetune/Loss": 0.810479998588562, "Finetune/Loss (Raw)": 0.5466635823249817, "Finetune/Step": 1441, "Finetune/Step Time": 2.9078002646565437} +{"Finetune/Learning Rate": 1.66606043479392e-05, "Finetune/Loss": 0.8097918033599854, "Finetune/Loss (Raw)": 0.8857465982437134, "Finetune/Step": 1442, "Finetune/Step Time": 2.910842167213559} +{"Finetune/Learning Rate": 1.665574634164658e-05, "Finetune/Loss": 0.8109501600265503, "Finetune/Loss (Raw)": 0.848180890083313, "Finetune/Step": 1443, "Finetune/Step Time": 2.90741547010839} +{"Finetune/Learning Rate": 1.6650885513712315e-05, "Finetune/Loss": 0.8092182874679565, "Finetune/Loss (Raw)": 0.5806810855865479, "Finetune/Step": 1444, "Finetune/Step Time": 2.932937955483794} +{"Finetune/Learning Rate": 1.66460218661971e-05, "Finetune/Loss": 0.8087767362594604, "Finetune/Loss (Raw)": 0.8634162545204163, "Finetune/Step": 1445, "Finetune/Step Time": 2.9338436536490917} +{"Finetune/Learning Rate": 1.6641155401162847e-05, "Finetune/Loss": 0.8084396123886108, "Finetune/Loss (Raw)": 0.8860145211219788, "Finetune/Step": 1446, "Finetune/Step Time": 2.931166399270296} +{"Finetune/Learning Rate": 1.6636286120672634e-05, "Finetune/Loss": 0.8079167604446411, "Finetune/Loss (Raw)": 0.8516888618469238, "Finetune/Step": 1447, "Finetune/Step Time": 2.9339020159095526} +{"Finetune/Learning Rate": 1.6631414026790754e-05, "Finetune/Loss": 0.8078420162200928, "Finetune/Loss (Raw)": 0.7920873165130615, "Finetune/Step": 1448, "Finetune/Step Time": 2.9352409318089485} +{"Finetune/Learning Rate": 1.6626539121582687e-05, "Finetune/Loss": 0.8096149563789368, "Finetune/Loss (Raw)": 0.8561807870864868, "Finetune/Step": 1449, "Finetune/Step Time": 2.910572038963437} +{"Finetune/Learning Rate": 1.66216614071151e-05, "Finetune/Loss": 0.8110253810882568, "Finetune/Loss (Raw)": 1.0028040409088135, "Finetune/Step": 1450, "Finetune/Step Time": 2.909728392958641} +{"Finetune/Learning Rate": 1.6616780885455858e-05, "Finetune/Loss": 0.8147268891334534, "Finetune/Loss (Raw)": 0.7989222407341003, "Finetune/Step": 1451, "Finetune/Step Time": 2.8826214354485273} +{"Finetune/Learning Rate": 1.6611897558674012e-05, "Finetune/Loss": 0.8140009641647339, "Finetune/Loss (Raw)": 0.6505494713783264, "Finetune/Step": 1452, "Finetune/Step Time": 2.906060241162777} +{"Finetune/Learning Rate": 1.66070114288398e-05, "Finetune/Loss": 0.816525399684906, "Finetune/Loss (Raw)": 0.7638318538665771, "Finetune/Step": 1453, "Finetune/Step Time": 2.902130538597703} +{"Finetune/Learning Rate": 1.6602122498024655e-05, "Finetune/Loss": 0.8174176216125488, "Finetune/Loss (Raw)": 0.9381242394447327, "Finetune/Step": 1454, "Finetune/Step Time": 2.8996583875268698} +{"Finetune/Learning Rate": 1.659723076830119e-05, "Finetune/Loss": 0.8119146227836609, "Finetune/Loss (Raw)": 0.14101305603981018, "Finetune/Step": 1455, "Finetune/Step Time": 2.935522010549903} +{"Finetune/Learning Rate": 1.6592336241743212e-05, "Finetune/Loss": 0.8114023208618164, "Finetune/Loss (Raw)": 0.8752814531326294, "Finetune/Step": 1456, "Finetune/Step Time": 2.9368241503834724} +{"Finetune/Learning Rate": 1.658743892042571e-05, "Finetune/Loss": 0.8115576505661011, "Finetune/Loss (Raw)": 0.8562743663787842, "Finetune/Step": 1457, "Finetune/Step Time": 2.9366495236754417} +{"Finetune/Learning Rate": 1.658253880642485e-05, "Finetune/Loss": 0.8116490244865417, "Finetune/Loss (Raw)": 0.8913439512252808, "Finetune/Step": 1458, "Finetune/Step Time": 2.934664538130164} +{"Finetune/Learning Rate": 1.6577635901818003e-05, "Finetune/Loss": 0.8104948997497559, "Finetune/Loss (Raw)": 0.7574813961982727, "Finetune/Step": 1459, "Finetune/Step Time": 2.9350168351083994} +{"Finetune/Learning Rate": 1.6572730208683697e-05, "Finetune/Loss": 0.8099862337112427, "Finetune/Loss (Raw)": 0.8254357576370239, "Finetune/Step": 1460, "Finetune/Step Time": 2.9311711080372334} +{"Finetune/Learning Rate": 1.656782172910166e-05, "Finetune/Loss": 0.8107631802558899, "Finetune/Loss (Raw)": 0.8915500044822693, "Finetune/Step": 1461, "Finetune/Step Time": 2.9312369376420975} +{"Finetune/Learning Rate": 1.6562910465152803e-05, "Finetune/Loss": 0.8152887225151062, "Finetune/Loss (Raw)": 0.8955039978027344, "Finetune/Step": 1462, "Finetune/Step Time": 2.8989308904856443} +{"Finetune/Learning Rate": 1.6557996418919198e-05, "Finetune/Loss": 0.8149723410606384, "Finetune/Loss (Raw)": 0.8731929659843445, "Finetune/Step": 1463, "Finetune/Step Time": 2.896170085296035} +{"Finetune/Learning Rate": 1.6553079592484115e-05, "Finetune/Loss": 0.8159275650978088, "Finetune/Loss (Raw)": 0.8838423490524292, "Finetune/Step": 1464, "Finetune/Step Time": 2.892737101763487} +{"Finetune/Learning Rate": 1.6548159987931995e-05, "Finetune/Loss": 0.8167667388916016, "Finetune/Loss (Raw)": 0.8161416053771973, "Finetune/Step": 1465, "Finetune/Step Time": 2.870259340852499} +{"Finetune/Learning Rate": 1.6543237607348467e-05, "Finetune/Loss": 0.8158576488494873, "Finetune/Loss (Raw)": 0.7863509058952332, "Finetune/Step": 1466, "Finetune/Step Time": 2.871262973174453} +{"Finetune/Learning Rate": 1.6538312452820317e-05, "Finetune/Loss": 0.816082775592804, "Finetune/Loss (Raw)": 0.9130920767784119, "Finetune/Step": 1467, "Finetune/Step Time": 2.870772683992982} +{"Finetune/Learning Rate": 1.6533384526435523e-05, "Finetune/Loss": 0.8145730495452881, "Finetune/Loss (Raw)": 0.6443759799003601, "Finetune/Step": 1468, "Finetune/Step Time": 2.8950831070542336} +{"Finetune/Learning Rate": 1.6528453830283234e-05, "Finetune/Loss": 0.8147447109222412, "Finetune/Loss (Raw)": 0.8240699768066406, "Finetune/Step": 1469, "Finetune/Step Time": 2.897565120831132} +{"Finetune/Learning Rate": 1.6523520366453775e-05, "Finetune/Loss": 0.8146548271179199, "Finetune/Loss (Raw)": 0.8219469785690308, "Finetune/Step": 1470, "Finetune/Step Time": 2.9037946723401546} +{"Finetune/Learning Rate": 1.651858413703864e-05, "Finetune/Loss": 0.8152139186859131, "Finetune/Loss (Raw)": 0.8374990820884705, "Finetune/Step": 1471, "Finetune/Step Time": 2.9045087955892086} +{"Finetune/Learning Rate": 1.6513645144130493e-05, "Finetune/Loss": 0.8134476542472839, "Finetune/Loss (Raw)": 0.6738260984420776, "Finetune/Step": 1472, "Finetune/Step Time": 2.900945372879505} +{"Finetune/Learning Rate": 1.6508703389823178e-05, "Finetune/Loss": 0.8127976059913635, "Finetune/Loss (Raw)": 0.821189284324646, "Finetune/Step": 1473, "Finetune/Step Time": 2.9007403887808323} +{"Finetune/Learning Rate": 1.650375887621171e-05, "Finetune/Loss": 0.8130636811256409, "Finetune/Loss (Raw)": 0.8311867713928223, "Finetune/Step": 1474, "Finetune/Step Time": 2.896402293816209} +{"Finetune/Learning Rate": 1.6498811605392258e-05, "Finetune/Loss": 0.8147183656692505, "Finetune/Loss (Raw)": 0.8938608169555664, "Finetune/Step": 1475, "Finetune/Step Time": 2.8767838645726442} +{"Finetune/Learning Rate": 1.6493861579462183e-05, "Finetune/Loss": 0.8149592280387878, "Finetune/Loss (Raw)": 0.8240505456924438, "Finetune/Step": 1476, "Finetune/Step Time": 2.875548157840967} +{"Finetune/Learning Rate": 1.6488908800519996e-05, "Finetune/Loss": 0.8174104690551758, "Finetune/Loss (Raw)": 0.8985465168952942, "Finetune/Step": 1477, "Finetune/Step Time": 2.8528882451355457} +{"Finetune/Learning Rate": 1.6483953270665382e-05, "Finetune/Loss": 0.8185310363769531, "Finetune/Loss (Raw)": 0.9265899062156677, "Finetune/Step": 1478, "Finetune/Step Time": 2.850541276857257} +{"Finetune/Learning Rate": 1.6478994991999197e-05, "Finetune/Loss": 0.8182580471038818, "Finetune/Loss (Raw)": 0.8342538475990295, "Finetune/Step": 1479, "Finetune/Step Time": 2.852278359234333} +{"Finetune/Learning Rate": 1.6474033966623448e-05, "Finetune/Loss": 0.8205538392066956, "Finetune/Loss (Raw)": 0.8632642030715942, "Finetune/Step": 1480, "Finetune/Step Time": 2.8368245884776115} +{"Finetune/Learning Rate": 1.6469070196641324e-05, "Finetune/Loss": 0.8193025588989258, "Finetune/Loss (Raw)": 0.7750760912895203, "Finetune/Step": 1481, "Finetune/Step Time": 2.8372235223650932} +{"Finetune/Learning Rate": 1.6464103684157163e-05, "Finetune/Loss": 0.8192399144172668, "Finetune/Loss (Raw)": 0.8829155564308167, "Finetune/Step": 1482, "Finetune/Step Time": 2.8420539628714323} +{"Finetune/Learning Rate": 1.6459134431276477e-05, "Finetune/Loss": 0.819061279296875, "Finetune/Loss (Raw)": 0.7758435606956482, "Finetune/Step": 1483, "Finetune/Step Time": 2.834002347663045} +{"Finetune/Learning Rate": 1.645416244010593e-05, "Finetune/Loss": 0.8189917802810669, "Finetune/Loss (Raw)": 0.8700303435325623, "Finetune/Step": 1484, "Finetune/Step Time": 2.836320221424103} +{"Finetune/Learning Rate": 1.6449187712753352e-05, "Finetune/Loss": 0.8186520338058472, "Finetune/Loss (Raw)": 0.80275559425354, "Finetune/Step": 1485, "Finetune/Step Time": 2.8346936646848917} +{"Finetune/Learning Rate": 1.644421025132773e-05, "Finetune/Loss": 0.8186847567558289, "Finetune/Loss (Raw)": 0.8613476753234863, "Finetune/Step": 1486, "Finetune/Step Time": 2.837996181100607} +{"Finetune/Learning Rate": 1.6439230057939224e-05, "Finetune/Loss": 0.8192397952079773, "Finetune/Loss (Raw)": 0.8568504452705383, "Finetune/Step": 1487, "Finetune/Step Time": 2.8371635172516108} +{"Finetune/Learning Rate": 1.6434247134699128e-05, "Finetune/Loss": 0.8192612528800964, "Finetune/Loss (Raw)": 0.8255870938301086, "Finetune/Step": 1488, "Finetune/Step Time": 2.838422752916813} +{"Finetune/Learning Rate": 1.6429261483719908e-05, "Finetune/Loss": 0.8184396028518677, "Finetune/Loss (Raw)": 0.7681213617324829, "Finetune/Step": 1489, "Finetune/Step Time": 2.837891325354576} +{"Finetune/Learning Rate": 1.642427310711519e-05, "Finetune/Loss": 0.8170949220657349, "Finetune/Loss (Raw)": 0.6026725769042969, "Finetune/Step": 1490, "Finetune/Step Time": 2.8634475395083427} +{"Finetune/Learning Rate": 1.6419282006999746e-05, "Finetune/Loss": 0.8168669939041138, "Finetune/Loss (Raw)": 0.7833622097969055, "Finetune/Step": 1491, "Finetune/Step Time": 2.865788696333766} +{"Finetune/Learning Rate": 1.6414288185489506e-05, "Finetune/Loss": 0.8178790807723999, "Finetune/Loss (Raw)": 0.9449723362922668, "Finetune/Step": 1492, "Finetune/Step Time": 2.8639952279627323} +{"Finetune/Learning Rate": 1.640929164470155e-05, "Finetune/Loss": 0.8185925483703613, "Finetune/Loss (Raw)": 0.8231632113456726, "Finetune/Step": 1493, "Finetune/Step Time": 2.864770734682679} +{"Finetune/Learning Rate": 1.6404292386754125e-05, "Finetune/Loss": 0.818432629108429, "Finetune/Loss (Raw)": 0.79921555519104, "Finetune/Step": 1494, "Finetune/Step Time": 2.867867585271597} +{"Finetune/Learning Rate": 1.6399290413766613e-05, "Finetune/Loss": 0.8179988861083984, "Finetune/Loss (Raw)": 0.8186700940132141, "Finetune/Step": 1495, "Finetune/Step Time": 2.8685228377580643} +{"Finetune/Learning Rate": 1.6394285727859554e-05, "Finetune/Loss": 0.81771320104599, "Finetune/Loss (Raw)": 0.7918193936347961, "Finetune/Step": 1496, "Finetune/Step Time": 2.856266876682639} +{"Finetune/Learning Rate": 1.6389278331154645e-05, "Finetune/Loss": 0.8173764944076538, "Finetune/Loss (Raw)": 0.8437201976776123, "Finetune/Step": 1497, "Finetune/Step Time": 2.863097531720996} +{"Finetune/Learning Rate": 1.6384268225774712e-05, "Finetune/Loss": 0.8169357776641846, "Finetune/Loss (Raw)": 0.897421658039093, "Finetune/Step": 1498, "Finetune/Step Time": 2.863814003765583} +{"Finetune/Learning Rate": 1.637925541384375e-05, "Finetune/Loss": 0.8165358901023865, "Finetune/Loss (Raw)": 0.7457924485206604, "Finetune/Step": 1499, "Finetune/Step Time": 2.863224571570754} +{"Finetune/Learning Rate": 1.63742398974869e-05, "Finetune/Loss": 0.8163179159164429, "Finetune/Loss (Raw)": 0.7958828806877136, "Finetune/Step": 1500, "Finetune/Step Time": 2.85869630984962} +{"Finetune/Learning Rate": 1.6369221678830435e-05, "Finetune/Loss": 0.8213903903961182, "Finetune/Loss (Raw)": 0.9096266031265259, "Finetune/Step": 1501, "Finetune/Step Time": 2.833226513117552} +{"Finetune/Learning Rate": 1.636420076000178e-05, "Finetune/Loss": 0.8257986307144165, "Finetune/Loss (Raw)": 0.8588549494743347, "Finetune/Step": 1502, "Finetune/Step Time": 2.797535952180624} +{"Finetune/Learning Rate": 1.635917714312951e-05, "Finetune/Loss": 0.8249080181121826, "Finetune/Loss (Raw)": 0.8114508986473083, "Finetune/Step": 1503, "Finetune/Step Time": 2.7991277761757374} +{"Finetune/Learning Rate": 1.635415083034335e-05, "Finetune/Loss": 0.8250490427017212, "Finetune/Loss (Raw)": 0.8313263654708862, "Finetune/Step": 1504, "Finetune/Step Time": 2.7945080120116472} +{"Finetune/Learning Rate": 1.6349121823774144e-05, "Finetune/Loss": 0.8248851299285889, "Finetune/Loss (Raw)": 0.8048515915870667, "Finetune/Step": 1505, "Finetune/Step Time": 2.7950076777487993} +{"Finetune/Learning Rate": 1.63440901255539e-05, "Finetune/Loss": 0.8252299427986145, "Finetune/Loss (Raw)": 0.9312346577644348, "Finetune/Step": 1506, "Finetune/Step Time": 2.7951115146279335} +{"Finetune/Learning Rate": 1.6339055737815758e-05, "Finetune/Loss": 0.8207086324691772, "Finetune/Loss (Raw)": 0.25522929430007935, "Finetune/Step": 1507, "Finetune/Step Time": 2.8239583633840084} +{"Finetune/Learning Rate": 1.6334018662694e-05, "Finetune/Loss": 0.8193339109420776, "Finetune/Loss (Raw)": 0.7474996447563171, "Finetune/Step": 1508, "Finetune/Step Time": 2.8278836719691753} +{"Finetune/Learning Rate": 1.6328978902324045e-05, "Finetune/Loss": 0.8184510469436646, "Finetune/Loss (Raw)": 0.8256089687347412, "Finetune/Step": 1509, "Finetune/Step Time": 2.829732706770301} +{"Finetune/Learning Rate": 1.6323936458842457e-05, "Finetune/Loss": 0.8185403347015381, "Finetune/Loss (Raw)": 0.8542459607124329, "Finetune/Step": 1510, "Finetune/Step Time": 2.830330967903137} +{"Finetune/Learning Rate": 1.631889133438693e-05, "Finetune/Loss": 0.8195466995239258, "Finetune/Loss (Raw)": 0.8940553665161133, "Finetune/Step": 1511, "Finetune/Step Time": 2.8312614001333714} +{"Finetune/Learning Rate": 1.6313843531096296e-05, "Finetune/Loss": 0.8202581405639648, "Finetune/Loss (Raw)": 0.8835180401802063, "Finetune/Step": 1512, "Finetune/Step Time": 2.8338951524347067} +{"Finetune/Learning Rate": 1.6308793051110527e-05, "Finetune/Loss": 0.820462167263031, "Finetune/Loss (Raw)": 0.8076059222221375, "Finetune/Step": 1513, "Finetune/Step Time": 2.835313443094492} +{"Finetune/Learning Rate": 1.630373989657073e-05, "Finetune/Loss": 0.8163844347000122, "Finetune/Loss (Raw)": 0.2915809154510498, "Finetune/Step": 1514, "Finetune/Step Time": 2.8707305416464806} +{"Finetune/Learning Rate": 1.6298684069619132e-05, "Finetune/Loss": 0.8151583075523376, "Finetune/Loss (Raw)": 0.6611036062240601, "Finetune/Step": 1515, "Finetune/Step Time": 2.891703451052308} +{"Finetune/Learning Rate": 1.6293625572399114e-05, "Finetune/Loss": 0.8153352737426758, "Finetune/Loss (Raw)": 0.8844630122184753, "Finetune/Step": 1516, "Finetune/Step Time": 2.893274361267686} +{"Finetune/Learning Rate": 1.6288564407055174e-05, "Finetune/Loss": 0.8145291209220886, "Finetune/Loss (Raw)": 0.7857206463813782, "Finetune/Step": 1517, "Finetune/Step Time": 2.893129702657461} +{"Finetune/Learning Rate": 1.628350057573295e-05, "Finetune/Loss": 0.815121054649353, "Finetune/Loss (Raw)": 0.9987841248512268, "Finetune/Step": 1518, "Finetune/Step Time": 2.8931799326092005} +{"Finetune/Learning Rate": 1.6278434080579196e-05, "Finetune/Loss": 0.8157437443733215, "Finetune/Loss (Raw)": 0.8993779420852661, "Finetune/Step": 1519, "Finetune/Step Time": 2.8976533748209476} +{"Finetune/Learning Rate": 1.627336492374182e-05, "Finetune/Loss": 0.8166356086730957, "Finetune/Loss (Raw)": 0.9655427932739258, "Finetune/Step": 1520, "Finetune/Step Time": 2.8985436223447323} +{"Finetune/Learning Rate": 1.626829310736983e-05, "Finetune/Loss": 0.8176625967025757, "Finetune/Loss (Raw)": 0.9244160652160645, "Finetune/Step": 1521, "Finetune/Step Time": 2.897461434826255} +{"Finetune/Learning Rate": 1.626321863361339e-05, "Finetune/Loss": 0.8160533308982849, "Finetune/Loss (Raw)": 0.679243803024292, "Finetune/Step": 1522, "Finetune/Step Time": 2.921287514269352} +{"Finetune/Learning Rate": 1.6258141504623763e-05, "Finetune/Loss": 0.815360963344574, "Finetune/Loss (Raw)": 0.796692430973053, "Finetune/Step": 1523, "Finetune/Step Time": 2.923464983701706} +{"Finetune/Learning Rate": 1.6253061722553353e-05, "Finetune/Loss": 0.8153398036956787, "Finetune/Loss (Raw)": 0.8525547981262207, "Finetune/Step": 1524, "Finetune/Step Time": 2.9286130480468273} +{"Finetune/Learning Rate": 1.6247979289555692e-05, "Finetune/Loss": 0.8146346807479858, "Finetune/Loss (Raw)": 0.7740602493286133, "Finetune/Step": 1525, "Finetune/Step Time": 2.925702352076769} +{"Finetune/Learning Rate": 1.6242894207785422e-05, "Finetune/Loss": 0.8145226240158081, "Finetune/Loss (Raw)": 0.7872099280357361, "Finetune/Step": 1526, "Finetune/Step Time": 2.925095696002245} +{"Finetune/Learning Rate": 1.6237806479398326e-05, "Finetune/Loss": 0.8142396211624146, "Finetune/Loss (Raw)": 0.8599135875701904, "Finetune/Step": 1527, "Finetune/Step Time": 2.926799926906824} +{"Finetune/Learning Rate": 1.623271610655129e-05, "Finetune/Loss": 0.8136096000671387, "Finetune/Loss (Raw)": 0.8855321407318115, "Finetune/Step": 1528, "Finetune/Step Time": 2.9303748439997435} +{"Finetune/Learning Rate": 1.6227623091402336e-05, "Finetune/Loss": 0.8155144453048706, "Finetune/Loss (Raw)": 0.8001478910446167, "Finetune/Step": 1529, "Finetune/Step Time": 2.9041779916733503} +{"Finetune/Learning Rate": 1.6222527436110596e-05, "Finetune/Loss": 0.8165340423583984, "Finetune/Loss (Raw)": 0.8563589453697205, "Finetune/Step": 1530, "Finetune/Step Time": 2.903287624940276} +{"Finetune/Learning Rate": 1.621742914283633e-05, "Finetune/Loss": 0.8165804743766785, "Finetune/Loss (Raw)": 0.9068711996078491, "Finetune/Step": 1531, "Finetune/Step Time": 2.899484084919095} +{"Finetune/Learning Rate": 1.6212328213740908e-05, "Finetune/Loss": 0.8179277181625366, "Finetune/Loss (Raw)": 0.8692049980163574, "Finetune/Step": 1532, "Finetune/Step Time": 2.8767849318683147} +{"Finetune/Learning Rate": 1.620722465098682e-05, "Finetune/Loss": 0.8180103898048401, "Finetune/Loss (Raw)": 0.8389630317687988, "Finetune/Step": 1533, "Finetune/Step Time": 2.8732729107141495} +{"Finetune/Learning Rate": 1.6202118456737683e-05, "Finetune/Loss": 0.8175398111343384, "Finetune/Loss (Raw)": 0.782451331615448, "Finetune/Step": 1534, "Finetune/Step Time": 2.8745230734348297} +{"Finetune/Learning Rate": 1.6197009633158208e-05, "Finetune/Loss": 0.817109227180481, "Finetune/Loss (Raw)": 0.847810685634613, "Finetune/Step": 1535, "Finetune/Step Time": 2.8756126035004854} +{"Finetune/Learning Rate": 1.6191898182414245e-05, "Finetune/Loss": 0.817340075969696, "Finetune/Loss (Raw)": 0.8372092843055725, "Finetune/Step": 1536, "Finetune/Step Time": 2.884597400203347} +{"Finetune/Learning Rate": 1.6186784106672736e-05, "Finetune/Loss": 0.8172528743743896, "Finetune/Loss (Raw)": 0.8633207678794861, "Finetune/Step": 1537, "Finetune/Step Time": 2.8806094769388437} +{"Finetune/Learning Rate": 1.6181667408101752e-05, "Finetune/Loss": 0.8134064674377441, "Finetune/Loss (Raw)": 0.2977030873298645, "Finetune/Step": 1538, "Finetune/Step Time": 2.913082182407379} +{"Finetune/Learning Rate": 1.617654808887047e-05, "Finetune/Loss": 0.8134078979492188, "Finetune/Loss (Raw)": 0.7850525379180908, "Finetune/Step": 1539, "Finetune/Step Time": 2.915134208276868} +{"Finetune/Learning Rate": 1.617142615114917e-05, "Finetune/Loss": 0.8130183219909668, "Finetune/Loss (Raw)": 0.8072030544281006, "Finetune/Step": 1540, "Finetune/Step Time": 2.914289180189371} +{"Finetune/Learning Rate": 1.6166301597109263e-05, "Finetune/Loss": 0.8126537799835205, "Finetune/Loss (Raw)": 0.805648684501648, "Finetune/Step": 1541, "Finetune/Step Time": 2.9139177221804857} +{"Finetune/Learning Rate": 1.6161174428923243e-05, "Finetune/Loss": 0.8126100897789001, "Finetune/Loss (Raw)": 0.8562204241752625, "Finetune/Step": 1542, "Finetune/Step Time": 2.912169234827161} +{"Finetune/Learning Rate": 1.615604464876473e-05, "Finetune/Loss": 0.8136524558067322, "Finetune/Loss (Raw)": 0.9238485097885132, "Finetune/Step": 1543, "Finetune/Step Time": 2.911715779453516} +{"Finetune/Learning Rate": 1.6150912258808448e-05, "Finetune/Loss": 0.8136112689971924, "Finetune/Loss (Raw)": 0.8268617391586304, "Finetune/Step": 1544, "Finetune/Step Time": 2.912465799599886} +{"Finetune/Learning Rate": 1.6145777261230224e-05, "Finetune/Loss": 0.8139913082122803, "Finetune/Loss (Raw)": 0.9094032049179077, "Finetune/Step": 1545, "Finetune/Step Time": 2.9086457565426826} +{"Finetune/Learning Rate": 1.6140639658206995e-05, "Finetune/Loss": 0.813497006893158, "Finetune/Loss (Raw)": 0.8018114566802979, "Finetune/Step": 1546, "Finetune/Step Time": 2.910566307604313} +{"Finetune/Learning Rate": 1.6135499451916793e-05, "Finetune/Loss": 0.8131754398345947, "Finetune/Loss (Raw)": 0.8886724710464478, "Finetune/Step": 1547, "Finetune/Step Time": 2.912933513522148} +{"Finetune/Learning Rate": 1.613035664453877e-05, "Finetune/Loss": 0.8124203681945801, "Finetune/Loss (Raw)": 0.7575861811637878, "Finetune/Step": 1548, "Finetune/Step Time": 2.909608591347933} +{"Finetune/Learning Rate": 1.612521123825317e-05, "Finetune/Loss": 0.8124991655349731, "Finetune/Loss (Raw)": 0.9166179299354553, "Finetune/Step": 1549, "Finetune/Step Time": 2.910570276901126} +{"Finetune/Learning Rate": 1.612006323524133e-05, "Finetune/Loss": 0.8112562894821167, "Finetune/Loss (Raw)": 0.7934258580207825, "Finetune/Step": 1550, "Finetune/Step Time": 2.911803338676691} +{"Finetune/Learning Rate": 1.6114912637685712e-05, "Finetune/Loss": 0.8106920719146729, "Finetune/Loss (Raw)": 0.7792009115219116, "Finetune/Step": 1551, "Finetune/Step Time": 2.9140558522194624} +{"Finetune/Learning Rate": 1.610975944776985e-05, "Finetune/Loss": 0.8106502294540405, "Finetune/Loss (Raw)": 0.8553839325904846, "Finetune/Step": 1552, "Finetune/Step Time": 2.899142099544406} +{"Finetune/Learning Rate": 1.6104603667678403e-05, "Finetune/Loss": 0.8098971247673035, "Finetune/Loss (Raw)": 0.8014707565307617, "Finetune/Step": 1553, "Finetune/Step Time": 2.900747414678335} +{"Finetune/Learning Rate": 1.6099445299597105e-05, "Finetune/Loss": 0.8090865612030029, "Finetune/Loss (Raw)": 0.7801622152328491, "Finetune/Step": 1554, "Finetune/Step Time": 2.9007522333413363} +{"Finetune/Learning Rate": 1.6094284345712807e-05, "Finetune/Loss": 0.8085713386535645, "Finetune/Loss (Raw)": 0.8194957375526428, "Finetune/Step": 1555, "Finetune/Step Time": 2.902162827551365} +{"Finetune/Learning Rate": 1.6089120808213444e-05, "Finetune/Loss": 0.8127409815788269, "Finetune/Loss (Raw)": 0.9015944004058838, "Finetune/Step": 1556, "Finetune/Step Time": 2.867657346650958} +{"Finetune/Learning Rate": 1.608395468928805e-05, "Finetune/Loss": 0.8139210343360901, "Finetune/Loss (Raw)": 0.9156136512756348, "Finetune/Step": 1557, "Finetune/Step Time": 2.8679046742618084} +{"Finetune/Learning Rate": 1.607878599112675e-05, "Finetune/Loss": 0.813046932220459, "Finetune/Loss (Raw)": 0.7222574353218079, "Finetune/Step": 1558, "Finetune/Step Time": 2.8721805717796087} +{"Finetune/Learning Rate": 1.607361471592077e-05, "Finetune/Loss": 0.8121823072433472, "Finetune/Loss (Raw)": 0.7458051443099976, "Finetune/Step": 1559, "Finetune/Step Time": 2.867634104564786} +{"Finetune/Learning Rate": 1.606844086586242e-05, "Finetune/Loss": 0.8121159076690674, "Finetune/Loss (Raw)": 0.7817165851593018, "Finetune/Step": 1560, "Finetune/Step Time": 2.867384772747755} +{"Finetune/Learning Rate": 1.606326444314511e-05, "Finetune/Loss": 0.8129330277442932, "Finetune/Loss (Raw)": 0.8809282779693604, "Finetune/Step": 1561, "Finetune/Step Time": 2.867655947804451} +{"Finetune/Learning Rate": 1.6058085449963333e-05, "Finetune/Loss": 0.8120170831680298, "Finetune/Loss (Raw)": 0.7788888812065125, "Finetune/Step": 1562, "Finetune/Step Time": 2.866471339017153} +{"Finetune/Learning Rate": 1.6052903888512674e-05, "Finetune/Loss": 0.812542200088501, "Finetune/Loss (Raw)": 0.8915631175041199, "Finetune/Step": 1563, "Finetune/Step Time": 2.8655691985040903} +{"Finetune/Learning Rate": 1.604771976098981e-05, "Finetune/Loss": 0.8120347857475281, "Finetune/Loss (Raw)": 0.8358609080314636, "Finetune/Step": 1564, "Finetune/Step Time": 2.8668163884431124} +{"Finetune/Learning Rate": 1.6042533069592506e-05, "Finetune/Loss": 0.8110388517379761, "Finetune/Loss (Raw)": 0.772035539150238, "Finetune/Step": 1565, "Finetune/Step Time": 2.869195569306612} +{"Finetune/Learning Rate": 1.6037343816519602e-05, "Finetune/Loss": 0.8094241619110107, "Finetune/Loss (Raw)": 0.6185262799263, "Finetune/Step": 1566, "Finetune/Step Time": 2.894224975258112} +{"Finetune/Learning Rate": 1.6032152003971044e-05, "Finetune/Loss": 0.8079860210418701, "Finetune/Loss (Raw)": 0.7335658669471741, "Finetune/Step": 1567, "Finetune/Step Time": 2.8883467242121696} +{"Finetune/Learning Rate": 1.6026957634147845e-05, "Finetune/Loss": 0.8085474967956543, "Finetune/Loss (Raw)": 0.815037190914154, "Finetune/Step": 1568, "Finetune/Step Time": 2.8892899118363857} +{"Finetune/Learning Rate": 1.6021760709252115e-05, "Finetune/Loss": 0.8107748627662659, "Finetune/Loss (Raw)": 0.8317617177963257, "Finetune/Step": 1569, "Finetune/Step Time": 2.8681011088192463} +{"Finetune/Learning Rate": 1.601656123148704e-05, "Finetune/Loss": 0.8104338645935059, "Finetune/Loss (Raw)": 0.8420940637588501, "Finetune/Step": 1570, "Finetune/Step Time": 2.866861280053854} +{"Finetune/Learning Rate": 1.601135920305689e-05, "Finetune/Loss": 0.8099099397659302, "Finetune/Loss (Raw)": 0.7811219692230225, "Finetune/Step": 1571, "Finetune/Step Time": 2.844051143154502} +{"Finetune/Learning Rate": 1.6006154626167016e-05, "Finetune/Loss": 0.8117113709449768, "Finetune/Loss (Raw)": 0.8112668395042419, "Finetune/Step": 1572, "Finetune/Step Time": 2.8192291036248207} +{"Finetune/Learning Rate": 1.600094750302385e-05, "Finetune/Loss": 0.8123363852500916, "Finetune/Loss (Raw)": 0.9434186220169067, "Finetune/Step": 1573, "Finetune/Step Time": 2.8194032926112413} +{"Finetune/Learning Rate": 1.5995737835834905e-05, "Finetune/Loss": 0.8116525411605835, "Finetune/Loss (Raw)": 0.798486053943634, "Finetune/Step": 1574, "Finetune/Step Time": 2.8252692352980375} +{"Finetune/Learning Rate": 1.5990525626808766e-05, "Finetune/Loss": 0.8117595911026001, "Finetune/Loss (Raw)": 0.8653854727745056, "Finetune/Step": 1575, "Finetune/Step Time": 2.8234988171607256} +{"Finetune/Learning Rate": 1.5985310878155108e-05, "Finetune/Loss": 0.8123695850372314, "Finetune/Loss (Raw)": 0.8701735138893127, "Finetune/Step": 1576, "Finetune/Step Time": 2.819613078609109} +{"Finetune/Learning Rate": 1.598009359208467e-05, "Finetune/Loss": 0.8126906156539917, "Finetune/Loss (Raw)": 0.8972673416137695, "Finetune/Step": 1577, "Finetune/Step Time": 2.8189870584756136} +{"Finetune/Learning Rate": 1.597487377080927e-05, "Finetune/Loss": 0.8115508556365967, "Finetune/Loss (Raw)": 0.8569164276123047, "Finetune/Step": 1578, "Finetune/Step Time": 2.8213474731892347} +{"Finetune/Learning Rate": 1.596965141654181e-05, "Finetune/Loss": 0.8118398189544678, "Finetune/Loss (Raw)": 0.8359100222587585, "Finetune/Step": 1579, "Finetune/Step Time": 2.817377457395196} +{"Finetune/Learning Rate": 1.5964426531496254e-05, "Finetune/Loss": 0.8136759996414185, "Finetune/Loss (Raw)": 0.8855780959129333, "Finetune/Step": 1580, "Finetune/Step Time": 2.7955581564456224} +{"Finetune/Learning Rate": 1.5959199117887642e-05, "Finetune/Loss": 0.8141445517539978, "Finetune/Loss (Raw)": 0.8238124847412109, "Finetune/Step": 1581, "Finetune/Step Time": 2.7711747977882624} +{"Finetune/Learning Rate": 1.5953969177932086e-05, "Finetune/Loss": 0.8140007257461548, "Finetune/Loss (Raw)": 0.9197152256965637, "Finetune/Step": 1582, "Finetune/Step Time": 2.7674668822437525} +{"Finetune/Learning Rate": 1.5948736713846775e-05, "Finetune/Loss": 0.8198121786117554, "Finetune/Loss (Raw)": 0.8848704099655151, "Finetune/Step": 1583, "Finetune/Step Time": 2.736586418002844} +{"Finetune/Learning Rate": 1.594350172784996e-05, "Finetune/Loss": 0.8198322057723999, "Finetune/Loss (Raw)": 0.8778467178344727, "Finetune/Step": 1584, "Finetune/Step Time": 2.7354684565216303} +{"Finetune/Learning Rate": 1.5938264222160968e-05, "Finetune/Loss": 0.8194863796234131, "Finetune/Loss (Raw)": 0.8120111227035522, "Finetune/Step": 1585, "Finetune/Step Time": 2.734320241957903} +{"Finetune/Learning Rate": 1.593302419900019e-05, "Finetune/Loss": 0.8190982341766357, "Finetune/Loss (Raw)": 0.8416544198989868, "Finetune/Step": 1586, "Finetune/Step Time": 2.7316276375204325} +{"Finetune/Learning Rate": 1.5927781660589078e-05, "Finetune/Loss": 0.8194730877876282, "Finetune/Loss (Raw)": 0.8054701685905457, "Finetune/Step": 1587, "Finetune/Step Time": 2.735741999000311} +{"Finetune/Learning Rate": 1.592253660915017e-05, "Finetune/Loss": 0.8192312717437744, "Finetune/Loss (Raw)": 0.7944812178611755, "Finetune/Step": 1588, "Finetune/Step Time": 2.7380231320858} +{"Finetune/Learning Rate": 1.5917289046907046e-05, "Finetune/Loss": 0.8187945485115051, "Finetune/Loss (Raw)": 0.8356541991233826, "Finetune/Step": 1589, "Finetune/Step Time": 2.7382826637476683} +{"Finetune/Learning Rate": 1.5912038976084363e-05, "Finetune/Loss": 0.8187187910079956, "Finetune/Loss (Raw)": 0.8858063817024231, "Finetune/Step": 1590, "Finetune/Step Time": 2.736655691638589} +{"Finetune/Learning Rate": 1.5906786398907842e-05, "Finetune/Loss": 0.8187139630317688, "Finetune/Loss (Raw)": 0.872575044631958, "Finetune/Step": 1591, "Finetune/Step Time": 2.7379983011633158} +{"Finetune/Learning Rate": 1.5901531317604265e-05, "Finetune/Loss": 0.8178550004959106, "Finetune/Loss (Raw)": 0.7738895416259766, "Finetune/Step": 1592, "Finetune/Step Time": 2.7502424363046885} +{"Finetune/Learning Rate": 1.589627373440147e-05, "Finetune/Loss": 0.8179464340209961, "Finetune/Loss (Raw)": 0.8278523683547974, "Finetune/Step": 1593, "Finetune/Step Time": 2.7511905282735825} +{"Finetune/Learning Rate": 1.5891013651528368e-05, "Finetune/Loss": 0.8184141516685486, "Finetune/Loss (Raw)": 0.8462116718292236, "Finetune/Step": 1594, "Finetune/Step Time": 2.7517440654337406} +{"Finetune/Learning Rate": 1.5885751071214914e-05, "Finetune/Loss": 0.8178372383117676, "Finetune/Loss (Raw)": 0.8392540216445923, "Finetune/Step": 1595, "Finetune/Step Time": 2.751383861526847} +{"Finetune/Learning Rate": 1.5880485995692136e-05, "Finetune/Loss": 0.8173658847808838, "Finetune/Loss (Raw)": 0.5840332508087158, "Finetune/Step": 1596, "Finetune/Step Time": 2.748856842517853} +{"Finetune/Learning Rate": 1.587521842719211e-05, "Finetune/Loss": 0.8176407217979431, "Finetune/Loss (Raw)": 0.8592569231987, "Finetune/Step": 1597, "Finetune/Step Time": 2.7497461643069983} +{"Finetune/Learning Rate": 1.5869948367947975e-05, "Finetune/Loss": 0.8177931308746338, "Finetune/Loss (Raw)": 0.8414590954780579, "Finetune/Step": 1598, "Finetune/Step Time": 2.7456998638808727} +{"Finetune/Learning Rate": 1.586467582019392e-05, "Finetune/Loss": 0.8178796768188477, "Finetune/Loss (Raw)": 0.8485749959945679, "Finetune/Step": 1599, "Finetune/Step Time": 2.7484488748013973} +{"Finetune/Learning Rate": 1.58594007861652e-05, "Finetune/Loss": 0.8193854093551636, "Finetune/Loss (Raw)": 0.8665568828582764, "Finetune/Step": 1600, "Finetune/Step Time": 2.750189295038581} +{"Finetune/Learning Rate": 1.5854123268098106e-05, "Finetune/Loss": 0.8192054629325867, "Finetune/Loss (Raw)": 0.798157811164856, "Finetune/Step": 1601, "Finetune/Step Time": 2.7544478122144938} +{"Finetune/Learning Rate": 1.5848843268230002e-05, "Finetune/Loss": 0.8192991018295288, "Finetune/Loss (Raw)": 0.8431654572486877, "Finetune/Step": 1602, "Finetune/Step Time": 2.7581747733056545} +{"Finetune/Learning Rate": 1.584356078879929e-05, "Finetune/Loss": 0.8190639019012451, "Finetune/Loss (Raw)": 0.8637599349021912, "Finetune/Step": 1603, "Finetune/Step Time": 2.7542574759572744} +{"Finetune/Learning Rate": 1.5838275832045426e-05, "Finetune/Loss": 0.8191126585006714, "Finetune/Loss (Raw)": 0.8302961587905884, "Finetune/Step": 1604, "Finetune/Step Time": 2.7569903656840324} +{"Finetune/Learning Rate": 1.5832988400208925e-05, "Finetune/Loss": 0.818848192691803, "Finetune/Loss (Raw)": 0.8646931648254395, "Finetune/Step": 1605, "Finetune/Step Time": 2.7573402374982834} +{"Finetune/Learning Rate": 1.5827698495531336e-05, "Finetune/Loss": 0.818101167678833, "Finetune/Loss (Raw)": 0.8309680223464966, "Finetune/Step": 1606, "Finetune/Step Time": 2.757249316200614} +{"Finetune/Learning Rate": 1.5822406120255273e-05, "Finetune/Loss": 0.8183716535568237, "Finetune/Loss (Raw)": 0.8688772320747375, "Finetune/Step": 1607, "Finetune/Step Time": 2.755302669480443} +{"Finetune/Learning Rate": 1.581711127662438e-05, "Finetune/Loss": 0.818365752696991, "Finetune/Loss (Raw)": 0.8625074625015259, "Finetune/Step": 1608, "Finetune/Step Time": 2.7482608444988728} +{"Finetune/Learning Rate": 1.5811813966883368e-05, "Finetune/Loss": 0.8190615177154541, "Finetune/Loss (Raw)": 0.8641341328620911, "Finetune/Step": 1609, "Finetune/Step Time": 2.7502637896686792} +{"Finetune/Learning Rate": 1.5806514193277974e-05, "Finetune/Loss": 0.8187914490699768, "Finetune/Loss (Raw)": 0.8483471870422363, "Finetune/Step": 1610, "Finetune/Step Time": 2.7441372722387314} +{"Finetune/Learning Rate": 1.580121195805499e-05, "Finetune/Loss": 0.817367434501648, "Finetune/Loss (Raw)": 0.5935697555541992, "Finetune/Step": 1611, "Finetune/Step Time": 2.7678810339421034} +{"Finetune/Learning Rate": 1.5795907263462247e-05, "Finetune/Loss": 0.8166259527206421, "Finetune/Loss (Raw)": 0.775118350982666, "Finetune/Step": 1612, "Finetune/Step Time": 2.792558116838336} +{"Finetune/Learning Rate": 1.5790600111748627e-05, "Finetune/Loss": 0.8126728534698486, "Finetune/Loss (Raw)": 0.2967570722103119, "Finetune/Step": 1613, "Finetune/Step Time": 2.825103987008333} +{"Finetune/Learning Rate": 1.5785290505164038e-05, "Finetune/Loss": 0.812362015247345, "Finetune/Loss (Raw)": 0.8215622305870056, "Finetune/Step": 1614, "Finetune/Step Time": 2.821425676345825} +{"Finetune/Learning Rate": 1.5779978445959446e-05, "Finetune/Loss": 0.8126532435417175, "Finetune/Loss (Raw)": 0.8941267132759094, "Finetune/Step": 1615, "Finetune/Step Time": 2.821367934346199} +{"Finetune/Learning Rate": 1.5774663936386848e-05, "Finetune/Loss": 0.8126229047775269, "Finetune/Loss (Raw)": 0.8217113018035889, "Finetune/Step": 1616, "Finetune/Step Time": 2.8177909664809704} +{"Finetune/Learning Rate": 1.576934697869928e-05, "Finetune/Loss": 0.8124597668647766, "Finetune/Loss (Raw)": 0.7472370862960815, "Finetune/Step": 1617, "Finetune/Step Time": 2.817243354395032} +{"Finetune/Learning Rate": 1.576402757515081e-05, "Finetune/Loss": 0.8140131235122681, "Finetune/Loss (Raw)": 0.8014969229698181, "Finetune/Step": 1618, "Finetune/Step Time": 2.794732941314578} +{"Finetune/Learning Rate": 1.5758705727996564e-05, "Finetune/Loss": 0.8142901062965393, "Finetune/Loss (Raw)": 0.8188239336013794, "Finetune/Step": 1619, "Finetune/Step Time": 2.7931838016957045} +{"Finetune/Learning Rate": 1.5753381439492676e-05, "Finetune/Loss": 0.8121893405914307, "Finetune/Loss (Raw)": 0.6760684847831726, "Finetune/Step": 1620, "Finetune/Step Time": 2.793234357610345} +{"Finetune/Learning Rate": 1.5748054711896332e-05, "Finetune/Loss": 0.8111467361450195, "Finetune/Loss (Raw)": 0.6897146105766296, "Finetune/Step": 1621, "Finetune/Step Time": 2.8160596005618572} +{"Finetune/Learning Rate": 1.5742725547465755e-05, "Finetune/Loss": 0.8114893436431885, "Finetune/Loss (Raw)": 0.8430656790733337, "Finetune/Step": 1622, "Finetune/Step Time": 2.8143160976469517} +{"Finetune/Learning Rate": 1.5737393948460186e-05, "Finetune/Loss": 0.8101825714111328, "Finetune/Loss (Raw)": 0.6514040231704712, "Finetune/Step": 1623, "Finetune/Step Time": 2.8351945839822292} +{"Finetune/Learning Rate": 1.5732059917139912e-05, "Finetune/Loss": 0.8105499148368835, "Finetune/Loss (Raw)": 0.8388375043869019, "Finetune/Step": 1624, "Finetune/Step Time": 2.8358542174100876} +{"Finetune/Learning Rate": 1.5726723455766246e-05, "Finetune/Loss": 0.8108881711959839, "Finetune/Loss (Raw)": 0.8870229125022888, "Finetune/Step": 1625, "Finetune/Step Time": 2.8312435429543257} +{"Finetune/Learning Rate": 1.572138456660153e-05, "Finetune/Loss": 0.8103598356246948, "Finetune/Loss (Raw)": 0.829788863658905, "Finetune/Step": 1626, "Finetune/Step Time": 2.832830063998699} +{"Finetune/Learning Rate": 1.571604325190913e-05, "Finetune/Loss": 0.8118235468864441, "Finetune/Loss (Raw)": 0.9331504702568054, "Finetune/Step": 1627, "Finetune/Step Time": 2.8315029814839363} +{"Finetune/Learning Rate": 1.571069951395346e-05, "Finetune/Loss": 0.812597393989563, "Finetune/Loss (Raw)": 0.8949356079101562, "Finetune/Step": 1628, "Finetune/Step Time": 2.834344355389476} +{"Finetune/Learning Rate": 1.5705353354999933e-05, "Finetune/Loss": 0.8125734329223633, "Finetune/Loss (Raw)": 0.9065518975257874, "Finetune/Step": 1629, "Finetune/Step Time": 2.828513231128454} +{"Finetune/Learning Rate": 1.5700004777315014e-05, "Finetune/Loss": 0.8121786117553711, "Finetune/Loss (Raw)": 0.8083208799362183, "Finetune/Step": 1630, "Finetune/Step Time": 2.830264026299119} +{"Finetune/Learning Rate": 1.5694653783166177e-05, "Finetune/Loss": 0.8123157620429993, "Finetune/Loss (Raw)": 0.8290034532546997, "Finetune/Step": 1631, "Finetune/Step Time": 2.829942286014557} +{"Finetune/Learning Rate": 1.5689300374821934e-05, "Finetune/Loss": 0.8123916387557983, "Finetune/Loss (Raw)": 0.8410341739654541, "Finetune/Step": 1632, "Finetune/Step Time": 2.8302558306604624} +{"Finetune/Learning Rate": 1.56839445545518e-05, "Finetune/Loss": 0.8124547004699707, "Finetune/Loss (Raw)": 0.8129294514656067, "Finetune/Step": 1633, "Finetune/Step Time": 2.825946720317006} +{"Finetune/Learning Rate": 1.5678586324626337e-05, "Finetune/Loss": 0.8120560050010681, "Finetune/Loss (Raw)": 0.8802038431167603, "Finetune/Step": 1634, "Finetune/Step Time": 2.825267793610692} +{"Finetune/Learning Rate": 1.5673225687317112e-05, "Finetune/Loss": 0.8158727884292603, "Finetune/Loss (Raw)": 0.7437810301780701, "Finetune/Step": 1635, "Finetune/Step Time": 2.79323510825634} +{"Finetune/Learning Rate": 1.5667862644896712e-05, "Finetune/Loss": 0.8166537284851074, "Finetune/Loss (Raw)": 0.8474609851837158, "Finetune/Step": 1636, "Finetune/Step Time": 2.7932731825858355} +{"Finetune/Learning Rate": 1.5662497199638757e-05, "Finetune/Loss": 0.8166275024414062, "Finetune/Loss (Raw)": 0.8222532272338867, "Finetune/Step": 1637, "Finetune/Step Time": 2.7931063920259476} +{"Finetune/Learning Rate": 1.565712935381788e-05, "Finetune/Loss": 0.8151159286499023, "Finetune/Loss (Raw)": 0.6607546806335449, "Finetune/Step": 1638, "Finetune/Step Time": 2.81668590195477} +{"Finetune/Learning Rate": 1.5651759109709712e-05, "Finetune/Loss": 0.8140469193458557, "Finetune/Loss (Raw)": 0.7572285532951355, "Finetune/Step": 1639, "Finetune/Step Time": 2.8410979826003313} +{"Finetune/Learning Rate": 1.5646386469590934e-05, "Finetune/Loss": 0.8129943609237671, "Finetune/Loss (Raw)": 0.7487926483154297, "Finetune/Step": 1640, "Finetune/Step Time": 2.8409780375659466} +{"Finetune/Learning Rate": 1.5641011435739225e-05, "Finetune/Loss": 0.8130788803100586, "Finetune/Loss (Raw)": 0.8184237480163574, "Finetune/Step": 1641, "Finetune/Step Time": 2.845626000314951} +{"Finetune/Learning Rate": 1.5635634010433277e-05, "Finetune/Loss": 0.8142358660697937, "Finetune/Loss (Raw)": 0.43966758251190186, "Finetune/Step": 1642, "Finetune/Step Time": 2.839825937524438} +{"Finetune/Learning Rate": 1.5630254195952798e-05, "Finetune/Loss": 0.8150265216827393, "Finetune/Loss (Raw)": 0.762313187122345, "Finetune/Step": 1643, "Finetune/Step Time": 2.816270725801587} +{"Finetune/Learning Rate": 1.5624871994578515e-05, "Finetune/Loss": 0.8150843977928162, "Finetune/Loss (Raw)": 0.8918694853782654, "Finetune/Step": 1644, "Finetune/Step Time": 2.8147860653698444} +{"Finetune/Learning Rate": 1.561948740859216e-05, "Finetune/Loss": 0.8153167963027954, "Finetune/Loss (Raw)": 0.8154674768447876, "Finetune/Step": 1645, "Finetune/Step Time": 2.8143071364611387} +{"Finetune/Learning Rate": 1.5614100440276474e-05, "Finetune/Loss": 0.8135491609573364, "Finetune/Loss (Raw)": 0.772525429725647, "Finetune/Step": 1646, "Finetune/Step Time": 2.8181727956980467} +{"Finetune/Learning Rate": 1.5608711091915213e-05, "Finetune/Loss": 0.8121283054351807, "Finetune/Loss (Raw)": 0.7175079584121704, "Finetune/Step": 1647, "Finetune/Step Time": 2.8173509035259485} +{"Finetune/Learning Rate": 1.560331936579315e-05, "Finetune/Loss": 0.8109254240989685, "Finetune/Loss (Raw)": 0.8115729689598083, "Finetune/Step": 1648, "Finetune/Step Time": 2.8293579779565334} +{"Finetune/Learning Rate": 1.5597925264196048e-05, "Finetune/Loss": 0.8101325035095215, "Finetune/Loss (Raw)": 0.8229243755340576, "Finetune/Step": 1649, "Finetune/Step Time": 2.8281039614230394} +{"Finetune/Learning Rate": 1.559252878941069e-05, "Finetune/Loss": 0.8116908073425293, "Finetune/Loss (Raw)": 0.8787049055099487, "Finetune/Step": 1650, "Finetune/Step Time": 2.8060268089175224} +{"Finetune/Learning Rate": 1.5587129943724856e-05, "Finetune/Loss": 0.8078384399414062, "Finetune/Loss (Raw)": 0.3035932779312134, "Finetune/Step": 1651, "Finetune/Step Time": 2.834590746089816} +{"Finetune/Learning Rate": 1.5581728729427346e-05, "Finetune/Loss": 0.8082504868507385, "Finetune/Loss (Raw)": 0.9052953720092773, "Finetune/Step": 1652, "Finetune/Step Time": 2.831275897100568} +{"Finetune/Learning Rate": 1.5576325148807945e-05, "Finetune/Loss": 0.8082952499389648, "Finetune/Loss (Raw)": 0.7797939777374268, "Finetune/Step": 1653, "Finetune/Step Time": 2.8341418020427227} +{"Finetune/Learning Rate": 1.5570919204157453e-05, "Finetune/Loss": 0.8076671957969666, "Finetune/Loss (Raw)": 0.706814169883728, "Finetune/Step": 1654, "Finetune/Step Time": 2.8327309880405664} +{"Finetune/Learning Rate": 1.5565510897767672e-05, "Finetune/Loss": 0.8075652122497559, "Finetune/Loss (Raw)": 0.8468557596206665, "Finetune/Step": 1655, "Finetune/Step Time": 2.834861323237419} +{"Finetune/Learning Rate": 1.5560100231931404e-05, "Finetune/Loss": 0.8030346632003784, "Finetune/Loss (Raw)": 0.3056289255619049, "Finetune/Step": 1656, "Finetune/Step Time": 2.8625276498496532} +{"Finetune/Learning Rate": 1.555468720894245e-05, "Finetune/Loss": 0.8031628131866455, "Finetune/Loss (Raw)": 0.8165507316589355, "Finetune/Step": 1657, "Finetune/Step Time": 2.8669137358665466} +{"Finetune/Learning Rate": 1.5549271831095607e-05, "Finetune/Loss": 0.801906406879425, "Finetune/Loss (Raw)": 0.6955356001853943, "Finetune/Step": 1658, "Finetune/Step Time": 2.889278592541814} +{"Finetune/Learning Rate": 1.5543854100686677e-05, "Finetune/Loss": 0.802057147026062, "Finetune/Loss (Raw)": 0.9261605143547058, "Finetune/Step": 1659, "Finetune/Step Time": 2.891053171828389} +{"Finetune/Learning Rate": 1.5538434020012454e-05, "Finetune/Loss": 0.8020204305648804, "Finetune/Loss (Raw)": 0.8645111918449402, "Finetune/Step": 1660, "Finetune/Step Time": 2.8903850596398115} +{"Finetune/Learning Rate": 1.5533011591370738e-05, "Finetune/Loss": 0.8018551468849182, "Finetune/Loss (Raw)": 0.8178097009658813, "Finetune/Step": 1661, "Finetune/Step Time": 2.893147610127926} +{"Finetune/Learning Rate": 1.5527586817060302e-05, "Finetune/Loss": 0.8003455400466919, "Finetune/Loss (Raw)": 0.5892148613929749, "Finetune/Step": 1662, "Finetune/Step Time": 2.9178250152617693} +{"Finetune/Learning Rate": 1.5522159699380945e-05, "Finetune/Loss": 0.800621509552002, "Finetune/Loss (Raw)": 0.8831419944763184, "Finetune/Step": 1663, "Finetune/Step Time": 2.914667909964919} +{"Finetune/Learning Rate": 1.5516730240633436e-05, "Finetune/Loss": 0.8005067110061646, "Finetune/Loss (Raw)": 0.822510302066803, "Finetune/Step": 1664, "Finetune/Step Time": 2.902402276173234} +{"Finetune/Learning Rate": 1.551129844311954e-05, "Finetune/Loss": 0.8000805377960205, "Finetune/Loss (Raw)": 0.8087775111198425, "Finetune/Step": 1665, "Finetune/Step Time": 2.9064613096415997} +{"Finetune/Learning Rate": 1.5505864309142023e-05, "Finetune/Loss": 0.8039764165878296, "Finetune/Loss (Raw)": 0.7963747978210449, "Finetune/Step": 1666, "Finetune/Step Time": 2.87358982488513} +{"Finetune/Learning Rate": 1.5500427841004633e-05, "Finetune/Loss": 0.804786205291748, "Finetune/Loss (Raw)": 0.8887037634849548, "Finetune/Step": 1667, "Finetune/Step Time": 2.872528310865164} +{"Finetune/Learning Rate": 1.549498904101211e-05, "Finetune/Loss": 0.8042848110198975, "Finetune/Loss (Raw)": 0.7430177330970764, "Finetune/Step": 1668, "Finetune/Step Time": 2.872909564524889} +{"Finetune/Learning Rate": 1.548954791147018e-05, "Finetune/Loss": 0.8043551445007324, "Finetune/Loss (Raw)": 0.8146572113037109, "Finetune/Step": 1669, "Finetune/Step Time": 2.873444275930524} +{"Finetune/Learning Rate": 1.548410445468556e-05, "Finetune/Loss": 0.8043719530105591, "Finetune/Loss (Raw)": 0.8583756685256958, "Finetune/Step": 1670, "Finetune/Step Time": 2.8732730336487293} +{"Finetune/Learning Rate": 1.547865867296596e-05, "Finetune/Loss": 0.8027147054672241, "Finetune/Loss (Raw)": 0.711716890335083, "Finetune/Step": 1671, "Finetune/Step Time": 2.878822561353445} +{"Finetune/Learning Rate": 1.547321056862006e-05, "Finetune/Loss": 0.8032420873641968, "Finetune/Loss (Raw)": 0.8943701386451721, "Finetune/Step": 1672, "Finetune/Step Time": 2.901479959487915} +{"Finetune/Learning Rate": 1.5467760143957534e-05, "Finetune/Loss": 0.8032184839248657, "Finetune/Loss (Raw)": 0.9063747525215149, "Finetune/Step": 1673, "Finetune/Step Time": 2.906040947884321} +{"Finetune/Learning Rate": 1.546230740128904e-05, "Finetune/Loss": 0.8038864135742188, "Finetune/Loss (Raw)": 0.8873056769371033, "Finetune/Step": 1674, "Finetune/Step Time": 2.9071329664438963} +{"Finetune/Learning Rate": 1.545685234292622e-05, "Finetune/Loss": 0.8023695349693298, "Finetune/Loss (Raw)": 0.694515585899353, "Finetune/Step": 1675, "Finetune/Step Time": 2.9059980399906635} +{"Finetune/Learning Rate": 1.5451394971181695e-05, "Finetune/Loss": 0.8028250932693481, "Finetune/Loss (Raw)": 0.8158996105194092, "Finetune/Step": 1676, "Finetune/Step Time": 2.9056634288281202} +{"Finetune/Learning Rate": 1.5445935288369067e-05, "Finetune/Loss": 0.8019459247589111, "Finetune/Loss (Raw)": 0.8040858507156372, "Finetune/Step": 1677, "Finetune/Step Time": 2.9049380347132683} +{"Finetune/Learning Rate": 1.544047329680291e-05, "Finetune/Loss": 0.8023058176040649, "Finetune/Loss (Raw)": 0.8394929766654968, "Finetune/Step": 1678, "Finetune/Step Time": 2.9088070783764124} +{"Finetune/Learning Rate": 1.5435008998798794e-05, "Finetune/Loss": 0.8029959201812744, "Finetune/Loss (Raw)": 0.8675341606140137, "Finetune/Step": 1679, "Finetune/Step Time": 2.906088836491108} +{"Finetune/Learning Rate": 1.542954239667325e-05, "Finetune/Loss": 0.802395761013031, "Finetune/Loss (Raw)": 0.7785586714744568, "Finetune/Step": 1680, "Finetune/Step Time": 2.909033777192235} +{"Finetune/Learning Rate": 1.5424073492743802e-05, "Finetune/Loss": 0.8023732900619507, "Finetune/Loss (Raw)": 0.7985934615135193, "Finetune/Step": 1681, "Finetune/Step Time": 2.907745001837611} +{"Finetune/Learning Rate": 1.541860228932893e-05, "Finetune/Loss": 0.802440345287323, "Finetune/Loss (Raw)": 0.7887446284294128, "Finetune/Step": 1682, "Finetune/Step Time": 2.9127829372882843} +{"Finetune/Learning Rate": 1.5413128788748105e-05, "Finetune/Loss": 0.8022363185882568, "Finetune/Loss (Raw)": 0.793379545211792, "Finetune/Step": 1683, "Finetune/Step Time": 2.9086880553513765} +{"Finetune/Learning Rate": 1.540765299332177e-05, "Finetune/Loss": 0.8013885021209717, "Finetune/Loss (Raw)": 0.7930783033370972, "Finetune/Step": 1684, "Finetune/Step Time": 2.9096885845065117} +{"Finetune/Learning Rate": 1.5402174905371334e-05, "Finetune/Loss": 0.8011461496353149, "Finetune/Loss (Raw)": 0.8845922946929932, "Finetune/Step": 1685, "Finetune/Step Time": 2.9089133851230145} +{"Finetune/Learning Rate": 1.539669452721918e-05, "Finetune/Loss": 0.8017722368240356, "Finetune/Loss (Raw)": 0.8023988008499146, "Finetune/Step": 1686, "Finetune/Step Time": 2.909667057916522} +{"Finetune/Learning Rate": 1.5391211861188666e-05, "Finetune/Loss": 0.7994682788848877, "Finetune/Loss (Raw)": 0.45089706778526306, "Finetune/Step": 1687, "Finetune/Step Time": 2.9403298683464527} +{"Finetune/Learning Rate": 1.5385726909604113e-05, "Finetune/Loss": 0.7995665073394775, "Finetune/Loss (Raw)": 0.794293224811554, "Finetune/Step": 1688, "Finetune/Step Time": 2.944685496389866} +{"Finetune/Learning Rate": 1.538023967479082e-05, "Finetune/Loss": 0.7994080781936646, "Finetune/Loss (Raw)": 0.8606433868408203, "Finetune/Step": 1689, "Finetune/Step Time": 2.9451893530786037} +{"Finetune/Learning Rate": 1.5374750159075048e-05, "Finetune/Loss": 0.8000061511993408, "Finetune/Loss (Raw)": 0.8554482460021973, "Finetune/Step": 1690, "Finetune/Step Time": 2.944144658744335} +{"Finetune/Learning Rate": 1.5369258364784023e-05, "Finetune/Loss": 0.8004090785980225, "Finetune/Loss (Raw)": 0.943138837814331, "Finetune/Step": 1691, "Finetune/Step Time": 2.939279394224286} +{"Finetune/Learning Rate": 1.5363764294245946e-05, "Finetune/Loss": 0.8007160425186157, "Finetune/Loss (Raw)": 0.8751471638679504, "Finetune/Step": 1692, "Finetune/Step Time": 2.9412175212055445} +{"Finetune/Learning Rate": 1.5358267949789968e-05, "Finetune/Loss": 0.8008833527565002, "Finetune/Loss (Raw)": 0.7934474945068359, "Finetune/Step": 1693, "Finetune/Step Time": 2.9395704939961433} +{"Finetune/Learning Rate": 1.535276933374622e-05, "Finetune/Loss": 0.8021398782730103, "Finetune/Loss (Raw)": 0.7793703675270081, "Finetune/Step": 1694, "Finetune/Step Time": 2.9160661920905113} +{"Finetune/Learning Rate": 1.534726844844579e-05, "Finetune/Loss": 0.8020455837249756, "Finetune/Loss (Raw)": 0.7214947938919067, "Finetune/Step": 1695, "Finetune/Step Time": 2.917876984924078} +{"Finetune/Learning Rate": 1.534176529622072e-05, "Finetune/Loss": 0.802334189414978, "Finetune/Loss (Raw)": 0.8519719243049622, "Finetune/Step": 1696, "Finetune/Step Time": 2.9182102736085653} +{"Finetune/Learning Rate": 1.5336259879404024e-05, "Finetune/Loss": 0.802153468132019, "Finetune/Loss (Raw)": 0.8086293935775757, "Finetune/Step": 1697, "Finetune/Step Time": 2.9173595048487186} +{"Finetune/Learning Rate": 1.5330752200329676e-05, "Finetune/Loss": 0.8018759489059448, "Finetune/Loss (Raw)": 0.8065763711929321, "Finetune/Step": 1698, "Finetune/Step Time": 2.9156334567815065} +{"Finetune/Learning Rate": 1.53252422613326e-05, "Finetune/Loss": 0.8025719523429871, "Finetune/Loss (Raw)": 0.8702089190483093, "Finetune/Step": 1699, "Finetune/Step Time": 2.918139811605215} +{"Finetune/Learning Rate": 1.5319730064748686e-05, "Finetune/Loss": 0.8032020330429077, "Finetune/Loss (Raw)": 0.8919100761413574, "Finetune/Step": 1700, "Finetune/Step Time": 2.9173902887851} +{"Finetune/Learning Rate": 1.5314215612914776e-05, "Finetune/Loss": 0.8023841381072998, "Finetune/Loss (Raw)": 0.8387295603752136, "Finetune/Step": 1701, "Finetune/Step Time": 2.9225355722010136} +{"Finetune/Learning Rate": 1.5308698908168674e-05, "Finetune/Loss": 0.8025520443916321, "Finetune/Loss (Raw)": 0.8199883699417114, "Finetune/Step": 1702, "Finetune/Step Time": 2.9170765355229378} +{"Finetune/Learning Rate": 1.530317995284913e-05, "Finetune/Loss": 0.8020946979522705, "Finetune/Loss (Raw)": 0.8068468570709229, "Finetune/Step": 1703, "Finetune/Step Time": 2.920717952772975} +{"Finetune/Learning Rate": 1.529765874929586e-05, "Finetune/Loss": 0.8021261692047119, "Finetune/Loss (Raw)": 0.8741933107376099, "Finetune/Step": 1704, "Finetune/Step Time": 2.936544109135866} +{"Finetune/Learning Rate": 1.5292135299849526e-05, "Finetune/Loss": 0.8017717003822327, "Finetune/Loss (Raw)": 0.8518986105918884, "Finetune/Step": 1705, "Finetune/Step Time": 2.937224879860878} +{"Finetune/Learning Rate": 1.5286609606851735e-05, "Finetune/Loss": 0.8020423650741577, "Finetune/Loss (Raw)": 0.8915578722953796, "Finetune/Step": 1706, "Finetune/Step Time": 2.934496620669961} +{"Finetune/Learning Rate": 1.5281081672645065e-05, "Finetune/Loss": 0.8019736409187317, "Finetune/Loss (Raw)": 0.8271145224571228, "Finetune/Step": 1707, "Finetune/Step Time": 2.9355697948485613} +{"Finetune/Learning Rate": 1.527555149957302e-05, "Finetune/Loss": 0.8018203377723694, "Finetune/Loss (Raw)": 0.8659532070159912, "Finetune/Step": 1708, "Finetune/Step Time": 2.9362918827682734} +{"Finetune/Learning Rate": 1.5270019089980076e-05, "Finetune/Loss": 0.8015568256378174, "Finetune/Loss (Raw)": 0.7900841236114502, "Finetune/Step": 1709, "Finetune/Step Time": 2.937088618054986} +{"Finetune/Learning Rate": 1.5264484446211643e-05, "Finetune/Loss": 0.8007748126983643, "Finetune/Loss (Raw)": 0.8196250200271606, "Finetune/Step": 1710, "Finetune/Step Time": 2.9396495930850506} +{"Finetune/Learning Rate": 1.5258947570614074e-05, "Finetune/Loss": 0.7981499433517456, "Finetune/Loss (Raw)": 0.5488760471343994, "Finetune/Step": 1711, "Finetune/Step Time": 2.959938943386078} +{"Finetune/Learning Rate": 1.5253408465534692e-05, "Finetune/Loss": 0.797870397567749, "Finetune/Loss (Raw)": 0.842075765132904, "Finetune/Step": 1712, "Finetune/Step Time": 2.9643262829631567} +{"Finetune/Learning Rate": 1.5247867133321732e-05, "Finetune/Loss": 0.797630786895752, "Finetune/Loss (Raw)": 0.781340479850769, "Finetune/Step": 1713, "Finetune/Step Time": 2.9648809153586626} +{"Finetune/Learning Rate": 1.5242323576324403e-05, "Finetune/Loss": 0.7983459234237671, "Finetune/Loss (Raw)": 0.9331889152526855, "Finetune/Step": 1714, "Finetune/Step Time": 2.9693064391613007} +{"Finetune/Learning Rate": 1.5236777796892837e-05, "Finetune/Loss": 0.7989967465400696, "Finetune/Loss (Raw)": 0.8887712955474854, "Finetune/Step": 1715, "Finetune/Step Time": 2.9668435640633106} +{"Finetune/Learning Rate": 1.5231229797378112e-05, "Finetune/Loss": 0.8000073432922363, "Finetune/Loss (Raw)": 0.9238343834877014, "Finetune/Step": 1716, "Finetune/Step Time": 2.9678574707359076} +{"Finetune/Learning Rate": 1.5225679580132262e-05, "Finetune/Loss": 0.8001894354820251, "Finetune/Loss (Raw)": 0.8589678406715393, "Finetune/Step": 1717, "Finetune/Step Time": 2.9690378587692976} +{"Finetune/Learning Rate": 1.5220127147508246e-05, "Finetune/Loss": 0.8001376390457153, "Finetune/Loss (Raw)": 0.8791797161102295, "Finetune/Step": 1718, "Finetune/Step Time": 2.970140617340803} +{"Finetune/Learning Rate": 1.5214572501859959e-05, "Finetune/Loss": 0.7993104457855225, "Finetune/Loss (Raw)": 0.7666926383972168, "Finetune/Step": 1719, "Finetune/Step Time": 2.9694491121917963} +{"Finetune/Learning Rate": 1.5209015645542251e-05, "Finetune/Loss": 0.8009345531463623, "Finetune/Loss (Raw)": 0.981774091720581, "Finetune/Step": 1720, "Finetune/Step Time": 2.959601594135165} +{"Finetune/Learning Rate": 1.520345658091089e-05, "Finetune/Loss": 0.800947904586792, "Finetune/Loss (Raw)": 0.8295637965202332, "Finetune/Step": 1721, "Finetune/Step Time": 2.9603038150817156} +{"Finetune/Learning Rate": 1.5197895310322598e-05, "Finetune/Loss": 0.8010783791542053, "Finetune/Loss (Raw)": 0.8629087805747986, "Finetune/Step": 1722, "Finetune/Step Time": 2.9607599824666977} +{"Finetune/Learning Rate": 1.5192331836135016e-05, "Finetune/Loss": 0.8007486462593079, "Finetune/Loss (Raw)": 0.7970479130744934, "Finetune/Step": 1723, "Finetune/Step Time": 2.9599851835519075} +{"Finetune/Learning Rate": 1.5186766160706738e-05, "Finetune/Loss": 0.802432656288147, "Finetune/Loss (Raw)": 0.7995866537094116, "Finetune/Step": 1724, "Finetune/Step Time": 2.9384438395500183} +{"Finetune/Learning Rate": 1.5181198286397268e-05, "Finetune/Loss": 0.8024529218673706, "Finetune/Loss (Raw)": 0.8618578314781189, "Finetune/Step": 1725, "Finetune/Step Time": 2.934660416096449} +{"Finetune/Learning Rate": 1.5175628215567062e-05, "Finetune/Loss": 0.8022096157073975, "Finetune/Loss (Raw)": 0.8103169798851013, "Finetune/Step": 1726, "Finetune/Step Time": 2.9369051679968834} +{"Finetune/Learning Rate": 1.51700559505775e-05, "Finetune/Loss": 0.802448034286499, "Finetune/Loss (Raw)": 0.8790887594223022, "Finetune/Step": 1727, "Finetune/Step Time": 2.9331345818936825} +{"Finetune/Learning Rate": 1.5164481493790887e-05, "Finetune/Loss": 0.8030749559402466, "Finetune/Loss (Raw)": 0.9467966556549072, "Finetune/Step": 1728, "Finetune/Step Time": 2.9334573969244957} +{"Finetune/Learning Rate": 1.5158904847570467e-05, "Finetune/Loss": 0.8037874698638916, "Finetune/Loss (Raw)": 0.8893682956695557, "Finetune/Step": 1729, "Finetune/Step Time": 2.931601408869028} +{"Finetune/Learning Rate": 1.51533260142804e-05, "Finetune/Loss": 0.8047784566879272, "Finetune/Loss (Raw)": 0.9700006246566772, "Finetune/Step": 1730, "Finetune/Step Time": 2.9288887977600098} +{"Finetune/Learning Rate": 1.514774499628579e-05, "Finetune/Loss": 0.8039833307266235, "Finetune/Loss (Raw)": 0.7619919180870056, "Finetune/Step": 1731, "Finetune/Step Time": 2.9297124072909355} +{"Finetune/Learning Rate": 1.5142161795952653e-05, "Finetune/Loss": 0.803329586982727, "Finetune/Loss (Raw)": 0.7466094493865967, "Finetune/Step": 1732, "Finetune/Step Time": 2.92852034047246} +{"Finetune/Learning Rate": 1.5136576415647932e-05, "Finetune/Loss": 0.8022671937942505, "Finetune/Loss (Raw)": 0.7287166714668274, "Finetune/Step": 1733, "Finetune/Step Time": 2.9279368706047535} +{"Finetune/Learning Rate": 1.51309888577395e-05, "Finetune/Loss": 0.8014915585517883, "Finetune/Loss (Raw)": 0.731684148311615, "Finetune/Step": 1734, "Finetune/Step Time": 2.926416525617242} +{"Finetune/Learning Rate": 1.5125399124596148e-05, "Finetune/Loss": 0.7990150451660156, "Finetune/Loss (Raw)": 0.5518773794174194, "Finetune/Step": 1735, "Finetune/Step Time": 2.951449440792203} +{"Finetune/Learning Rate": 1.5119807218587594e-05, "Finetune/Loss": 0.797291100025177, "Finetune/Loss (Raw)": 0.641845703125, "Finetune/Step": 1736, "Finetune/Step Time": 2.973878202959895} +{"Finetune/Learning Rate": 1.5114213142084473e-05, "Finetune/Loss": 0.796703577041626, "Finetune/Loss (Raw)": 0.7889271974563599, "Finetune/Step": 1737, "Finetune/Step Time": 2.9708973225206137} +{"Finetune/Learning Rate": 1.5108616897458343e-05, "Finetune/Loss": 0.7958114743232727, "Finetune/Loss (Raw)": 0.7341625690460205, "Finetune/Step": 1738, "Finetune/Step Time": 2.9699452351778746} +{"Finetune/Learning Rate": 1.5103018487081678e-05, "Finetune/Loss": 0.7974703311920166, "Finetune/Loss (Raw)": 0.8058986663818359, "Finetune/Step": 1739, "Finetune/Step Time": 2.9468287751078606} +{"Finetune/Learning Rate": 1.5097417913327872e-05, "Finetune/Loss": 0.7965932488441467, "Finetune/Loss (Raw)": 0.6628563404083252, "Finetune/Step": 1740, "Finetune/Step Time": 2.9457090254873037} +{"Finetune/Learning Rate": 1.5091815178571238e-05, "Finetune/Loss": 0.8013286590576172, "Finetune/Loss (Raw)": 0.9028888940811157, "Finetune/Step": 1741, "Finetune/Step Time": 2.916234776377678} +{"Finetune/Learning Rate": 1.5086210285187002e-05, "Finetune/Loss": 0.800796627998352, "Finetune/Loss (Raw)": 0.7534643411636353, "Finetune/Step": 1742, "Finetune/Step Time": 2.915620280429721} +{"Finetune/Learning Rate": 1.5080603235551305e-05, "Finetune/Loss": 0.8003469705581665, "Finetune/Loss (Raw)": 0.8365731835365295, "Finetune/Step": 1743, "Finetune/Step Time": 2.9193688482046127} +{"Finetune/Learning Rate": 1.5074994032041204e-05, "Finetune/Loss": 0.7999894618988037, "Finetune/Loss (Raw)": 0.7759479880332947, "Finetune/Step": 1744, "Finetune/Step Time": 2.9196633100509644} +{"Finetune/Learning Rate": 1.5069382677034669e-05, "Finetune/Loss": 0.7992163896560669, "Finetune/Loss (Raw)": 0.6482810974121094, "Finetune/Step": 1745, "Finetune/Step Time": 2.921939192339778} +{"Finetune/Learning Rate": 1.5063769172910585e-05, "Finetune/Loss": 0.7993499040603638, "Finetune/Loss (Raw)": 0.8185885548591614, "Finetune/Step": 1746, "Finetune/Step Time": 2.9183266554027796} +{"Finetune/Learning Rate": 1.5058153522048739e-05, "Finetune/Loss": 0.7994440793991089, "Finetune/Loss (Raw)": 0.8308742046356201, "Finetune/Step": 1747, "Finetune/Step Time": 2.920200066640973} +{"Finetune/Learning Rate": 1.505253572682984e-05, "Finetune/Loss": 0.8013370037078857, "Finetune/Loss (Raw)": 0.9183701276779175, "Finetune/Step": 1748, "Finetune/Step Time": 2.919742004945874} +{"Finetune/Learning Rate": 1.504691578963549e-05, "Finetune/Loss": 0.8033934831619263, "Finetune/Loss (Raw)": 0.95293790102005, "Finetune/Step": 1749, "Finetune/Step Time": 2.893907753750682} +{"Finetune/Learning Rate": 1.504129371284822e-05, "Finetune/Loss": 0.8030939102172852, "Finetune/Loss (Raw)": 0.8047274351119995, "Finetune/Step": 1750, "Finetune/Step Time": 2.8960269652307034} +{"Finetune/Learning Rate": 1.5035669498851451e-05, "Finetune/Loss": 0.8047382831573486, "Finetune/Loss (Raw)": 0.8618744611740112, "Finetune/Step": 1751, "Finetune/Step Time": 2.875987619161606} +{"Finetune/Learning Rate": 1.5030043150029521e-05, "Finetune/Loss": 0.804673433303833, "Finetune/Loss (Raw)": 0.8305342197418213, "Finetune/Step": 1752, "Finetune/Step Time": 2.8737760186195374} +{"Finetune/Learning Rate": 1.502441466876766e-05, "Finetune/Loss": 0.8016660213470459, "Finetune/Loss (Raw)": 0.5020845532417297, "Finetune/Step": 1753, "Finetune/Step Time": 2.8973725717514753} +{"Finetune/Learning Rate": 1.5018784057452016e-05, "Finetune/Loss": 0.8014637231826782, "Finetune/Loss (Raw)": 0.8038959503173828, "Finetune/Step": 1754, "Finetune/Step Time": 2.902695832774043} +{"Finetune/Learning Rate": 1.5013151318469634e-05, "Finetune/Loss": 0.8005356788635254, "Finetune/Loss (Raw)": 0.8143511414527893, "Finetune/Step": 1755, "Finetune/Step Time": 2.904332173988223} +{"Finetune/Learning Rate": 1.5007516454208462e-05, "Finetune/Loss": 0.8004168272018433, "Finetune/Loss (Raw)": 0.8797268867492676, "Finetune/Step": 1756, "Finetune/Step Time": 2.902025455608964} +{"Finetune/Learning Rate": 1.5001879467057345e-05, "Finetune/Loss": 0.799978494644165, "Finetune/Loss (Raw)": 0.8504464626312256, "Finetune/Step": 1757, "Finetune/Step Time": 2.904727363958955} +{"Finetune/Learning Rate": 1.4996240359406032e-05, "Finetune/Loss": 0.8005596399307251, "Finetune/Loss (Raw)": 0.8827043175697327, "Finetune/Step": 1758, "Finetune/Step Time": 2.904956454411149} +{"Finetune/Learning Rate": 1.4990599133645173e-05, "Finetune/Loss": 0.8006901144981384, "Finetune/Loss (Raw)": 0.8457062840461731, "Finetune/Step": 1759, "Finetune/Step Time": 2.9037123806774616} +{"Finetune/Learning Rate": 1.4984955792166308e-05, "Finetune/Loss": 0.8008024096488953, "Finetune/Loss (Raw)": 0.8554072380065918, "Finetune/Step": 1760, "Finetune/Step Time": 2.9129304718226194} +{"Finetune/Learning Rate": 1.4979310337361886e-05, "Finetune/Loss": 0.8011572360992432, "Finetune/Loss (Raw)": 0.8583457469940186, "Finetune/Step": 1761, "Finetune/Step Time": 2.9122487287968397} +{"Finetune/Learning Rate": 1.4973662771625237e-05, "Finetune/Loss": 0.8011857271194458, "Finetune/Loss (Raw)": 0.8838599920272827, "Finetune/Step": 1762, "Finetune/Step Time": 2.9151015523821115} +{"Finetune/Learning Rate": 1.49680130973506e-05, "Finetune/Loss": 0.8022523522377014, "Finetune/Loss (Raw)": 0.8803026676177979, "Finetune/Step": 1763, "Finetune/Step Time": 2.9171885214746} +{"Finetune/Learning Rate": 1.4962361316933099e-05, "Finetune/Loss": 0.8014940023422241, "Finetune/Loss (Raw)": 0.7503941059112549, "Finetune/Step": 1764, "Finetune/Step Time": 2.911925921216607} +{"Finetune/Learning Rate": 1.4956707432768753e-05, "Finetune/Loss": 0.8017213344573975, "Finetune/Loss (Raw)": 0.8513542413711548, "Finetune/Step": 1765, "Finetune/Step Time": 2.914132921025157} +{"Finetune/Learning Rate": 1.4951051447254478e-05, "Finetune/Loss": 0.8031440377235413, "Finetune/Loss (Raw)": 0.8428593277931213, "Finetune/Step": 1766, "Finetune/Step Time": 2.8947500195354223} +{"Finetune/Learning Rate": 1.4945393362788072e-05, "Finetune/Loss": 0.8041220903396606, "Finetune/Loss (Raw)": 0.8824152946472168, "Finetune/Step": 1767, "Finetune/Step Time": 2.869985105469823} +{"Finetune/Learning Rate": 1.4939733181768226e-05, "Finetune/Loss": 0.8043836355209351, "Finetune/Loss (Raw)": 0.7822640538215637, "Finetune/Step": 1768, "Finetune/Step Time": 2.8690575640648603} +{"Finetune/Learning Rate": 1.4934070906594527e-05, "Finetune/Loss": 0.8040820360183716, "Finetune/Loss (Raw)": 0.7798261046409607, "Finetune/Step": 1769, "Finetune/Step Time": 2.862061494961381} +{"Finetune/Learning Rate": 1.4928406539667438e-05, "Finetune/Loss": 0.8079450726509094, "Finetune/Loss (Raw)": 0.9341392517089844, "Finetune/Step": 1770, "Finetune/Step Time": 2.832667613402009} +{"Finetune/Learning Rate": 1.4922740083388316e-05, "Finetune/Loss": 0.8083212375640869, "Finetune/Loss (Raw)": 0.8104578852653503, "Finetune/Step": 1771, "Finetune/Step Time": 2.8297665249556303} +{"Finetune/Learning Rate": 1.4917071540159404e-05, "Finetune/Loss": 0.8078770637512207, "Finetune/Loss (Raw)": 0.8350138664245605, "Finetune/Step": 1772, "Finetune/Step Time": 2.831167872995138} +{"Finetune/Learning Rate": 1.4911400912383829e-05, "Finetune/Loss": 0.8084158301353455, "Finetune/Loss (Raw)": 0.8844323754310608, "Finetune/Step": 1773, "Finetune/Step Time": 2.829099114984274} +{"Finetune/Learning Rate": 1.4905728202465596e-05, "Finetune/Loss": 0.8088948130607605, "Finetune/Loss (Raw)": 0.833833634853363, "Finetune/Step": 1774, "Finetune/Step Time": 2.8277798909693956} +{"Finetune/Learning Rate": 1.4900053412809602e-05, "Finetune/Loss": 0.8095849752426147, "Finetune/Loss (Raw)": 0.8058471083641052, "Finetune/Step": 1775, "Finetune/Step Time": 2.829905405640602} +{"Finetune/Learning Rate": 1.4894376545821621e-05, "Finetune/Loss": 0.8099778890609741, "Finetune/Loss (Raw)": 0.8618676662445068, "Finetune/Step": 1776, "Finetune/Step Time": 2.8199244681745768} +{"Finetune/Learning Rate": 1.4888697603908305e-05, "Finetune/Loss": 0.8092746734619141, "Finetune/Loss (Raw)": 0.732918381690979, "Finetune/Step": 1777, "Finetune/Step Time": 2.8218619134277105} +{"Finetune/Learning Rate": 1.488301658947719e-05, "Finetune/Loss": 0.8084210157394409, "Finetune/Loss (Raw)": 0.7694375514984131, "Finetune/Step": 1778, "Finetune/Step Time": 2.8234381452202797} +{"Finetune/Learning Rate": 1.4877333504936688e-05, "Finetune/Loss": 0.8123027086257935, "Finetune/Loss (Raw)": 0.800449550151825, "Finetune/Step": 1779, "Finetune/Step Time": 2.792844448238611} +{"Finetune/Learning Rate": 1.4871648352696096e-05, "Finetune/Loss": 0.8113558888435364, "Finetune/Loss (Raw)": 0.7841013073921204, "Finetune/Step": 1780, "Finetune/Step Time": 2.7925982158631086} +{"Finetune/Learning Rate": 1.4865961135165572e-05, "Finetune/Loss": 0.8112529516220093, "Finetune/Loss (Raw)": 0.7666123509407043, "Finetune/Step": 1781, "Finetune/Step Time": 2.78992728702724} +{"Finetune/Learning Rate": 1.4860271854756163e-05, "Finetune/Loss": 0.8129053711891174, "Finetune/Loss (Raw)": 0.9183253645896912, "Finetune/Step": 1782, "Finetune/Step Time": 2.7925068233162165} +{"Finetune/Learning Rate": 1.4854580513879787e-05, "Finetune/Loss": 0.8123269081115723, "Finetune/Loss (Raw)": 0.7728176712989807, "Finetune/Step": 1783, "Finetune/Step Time": 2.7954461127519608} +{"Finetune/Learning Rate": 1.4848887114949236e-05, "Finetune/Loss": 0.8166966438293457, "Finetune/Loss (Raw)": 0.864945650100708, "Finetune/Step": 1784, "Finetune/Step Time": 2.7661897130310535} +{"Finetune/Learning Rate": 1.484319166037817e-05, "Finetune/Loss": 0.8177305459976196, "Finetune/Loss (Raw)": 0.9488906264305115, "Finetune/Step": 1785, "Finetune/Step Time": 2.7630962878465652} +{"Finetune/Learning Rate": 1.4837494152581124e-05, "Finetune/Loss": 0.8184967041015625, "Finetune/Loss (Raw)": 0.7936093807220459, "Finetune/Step": 1786, "Finetune/Step Time": 2.74126435816288} +{"Finetune/Learning Rate": 1.483179459397351e-05, "Finetune/Loss": 0.8179104328155518, "Finetune/Loss (Raw)": 0.8511104583740234, "Finetune/Step": 1787, "Finetune/Step Time": 2.7421451173722744} +{"Finetune/Learning Rate": 1.4826092986971596e-05, "Finetune/Loss": 0.8172872066497803, "Finetune/Loss (Raw)": 0.7847391963005066, "Finetune/Step": 1788, "Finetune/Step Time": 2.739210944622755} +{"Finetune/Learning Rate": 1.482038933399253e-05, "Finetune/Loss": 0.8177722096443176, "Finetune/Loss (Raw)": 0.8798970580101013, "Finetune/Step": 1789, "Finetune/Step Time": 2.737814115360379} +{"Finetune/Learning Rate": 1.4814683637454315e-05, "Finetune/Loss": 0.8198021650314331, "Finetune/Loss (Raw)": 0.8490437865257263, "Finetune/Step": 1790, "Finetune/Step Time": 2.7144826035946608} +{"Finetune/Learning Rate": 1.4808975899775832e-05, "Finetune/Loss": 0.8192061185836792, "Finetune/Loss (Raw)": 0.8068458437919617, "Finetune/Step": 1791, "Finetune/Step Time": 2.7209260631352663} +{"Finetune/Learning Rate": 1.4803266123376827e-05, "Finetune/Loss": 0.8190958499908447, "Finetune/Loss (Raw)": 0.8084041476249695, "Finetune/Step": 1792, "Finetune/Step Time": 2.7203212548047304} +{"Finetune/Learning Rate": 1.4797554310677902e-05, "Finetune/Loss": 0.8195450901985168, "Finetune/Loss (Raw)": 0.8662793636322021, "Finetune/Step": 1793, "Finetune/Step Time": 2.7189438808709383} +{"Finetune/Learning Rate": 1.4791840464100528e-05, "Finetune/Loss": 0.8185587525367737, "Finetune/Loss (Raw)": 0.6701225638389587, "Finetune/Step": 1794, "Finetune/Step Time": 2.7167924474924803} +{"Finetune/Learning Rate": 1.4786124586067039e-05, "Finetune/Loss": 0.8188005685806274, "Finetune/Loss (Raw)": 0.9196574091911316, "Finetune/Step": 1795, "Finetune/Step Time": 2.717540794983506} +{"Finetune/Learning Rate": 1.4780406679000623e-05, "Finetune/Loss": 0.8190889358520508, "Finetune/Loss (Raw)": 0.7799293398857117, "Finetune/Step": 1796, "Finetune/Step Time": 2.7174110636115074} +{"Finetune/Learning Rate": 1.4774686745325337e-05, "Finetune/Loss": 0.819556474685669, "Finetune/Loss (Raw)": 0.8745026588439941, "Finetune/Step": 1797, "Finetune/Step Time": 2.7194962203502655} +{"Finetune/Learning Rate": 1.4768964787466096e-05, "Finetune/Loss": 0.8199741840362549, "Finetune/Loss (Raw)": 0.9118381142616272, "Finetune/Step": 1798, "Finetune/Step Time": 2.721130793914199} +{"Finetune/Learning Rate": 1.4763240807848667e-05, "Finetune/Loss": 0.8203645944595337, "Finetune/Loss (Raw)": 0.7616933584213257, "Finetune/Step": 1799, "Finetune/Step Time": 2.7203701455146074} +{"Finetune/Learning Rate": 1.4757514808899675e-05, "Finetune/Loss": 0.8190716505050659, "Finetune/Loss (Raw)": 0.7288693189620972, "Finetune/Step": 1800, "Finetune/Step Time": 2.696662636473775} +{"Finetune/Learning Rate": 1.4751786793046611e-05, "Finetune/Loss": 0.8181978464126587, "Finetune/Loss (Raw)": 0.7945308089256287, "Finetune/Step": 1801, "Finetune/Step Time": 2.695230457931757} +{"Finetune/Learning Rate": 1.4746056762717813e-05, "Finetune/Loss": 0.8183240294456482, "Finetune/Loss (Raw)": 0.9034565687179565, "Finetune/Step": 1802, "Finetune/Step Time": 2.6917022597044706} +{"Finetune/Learning Rate": 1.4740324720342469e-05, "Finetune/Loss": 0.8189520239830017, "Finetune/Loss (Raw)": 0.7748974561691284, "Finetune/Step": 1803, "Finetune/Step Time": 2.6939496099948883} +{"Finetune/Learning Rate": 1.4734590668350631e-05, "Finetune/Loss": 0.8187337517738342, "Finetune/Loss (Raw)": 0.7879638075828552, "Finetune/Step": 1804, "Finetune/Step Time": 2.6981977000832558} +{"Finetune/Learning Rate": 1.4728854609173187e-05, "Finetune/Loss": 0.819293737411499, "Finetune/Loss (Raw)": 0.8757623434066772, "Finetune/Step": 1805, "Finetune/Step Time": 2.698892133310437} +{"Finetune/Learning Rate": 1.4723116545241896e-05, "Finetune/Loss": 0.8192431926727295, "Finetune/Loss (Raw)": 0.8330245018005371, "Finetune/Step": 1806, "Finetune/Step Time": 2.6940202116966248} +{"Finetune/Learning Rate": 1.4717376478989354e-05, "Finetune/Loss": 0.8179773092269897, "Finetune/Loss (Raw)": 0.705504298210144, "Finetune/Step": 1807, "Finetune/Step Time": 2.696793794631958} +{"Finetune/Learning Rate": 1.4711634412849005e-05, "Finetune/Loss": 0.8191719055175781, "Finetune/Loss (Raw)": 0.9314697980880737, "Finetune/Step": 1808, "Finetune/Step Time": 2.6942587550729513} +{"Finetune/Learning Rate": 1.4705890349255149e-05, "Finetune/Loss": 0.8199625611305237, "Finetune/Loss (Raw)": 0.89979088306427, "Finetune/Step": 1809, "Finetune/Step Time": 2.693976305425167} +{"Finetune/Learning Rate": 1.4700144290642926e-05, "Finetune/Loss": 0.8194350004196167, "Finetune/Loss (Raw)": 0.7212238311767578, "Finetune/Step": 1810, "Finetune/Step Time": 2.6880265437066555} +{"Finetune/Learning Rate": 1.4694396239448325e-05, "Finetune/Loss": 0.8193244934082031, "Finetune/Loss (Raw)": 0.7792286276817322, "Finetune/Step": 1811, "Finetune/Step Time": 2.6907811872661114} +{"Finetune/Learning Rate": 1.4688646198108178e-05, "Finetune/Loss": 0.8194761276245117, "Finetune/Loss (Raw)": 0.8124915361404419, "Finetune/Step": 1812, "Finetune/Step Time": 2.6884732879698277} +{"Finetune/Learning Rate": 1.4682894169060163e-05, "Finetune/Loss": 0.8196566104888916, "Finetune/Loss (Raw)": 0.9076914191246033, "Finetune/Step": 1813, "Finetune/Step Time": 2.6888939682394266} +{"Finetune/Learning Rate": 1.4677140154742792e-05, "Finetune/Loss": 0.819568395614624, "Finetune/Loss (Raw)": 0.7911025881767273, "Finetune/Step": 1814, "Finetune/Step Time": 2.6873911265283823} +{"Finetune/Learning Rate": 1.4671384157595436e-05, "Finetune/Loss": 0.8222601413726807, "Finetune/Loss (Raw)": 0.7954434752464294, "Finetune/Step": 1815, "Finetune/Step Time": 2.6605947632342577} +{"Finetune/Learning Rate": 1.4665626180058295e-05, "Finetune/Loss": 0.8230014443397522, "Finetune/Loss (Raw)": 0.8891777992248535, "Finetune/Step": 1816, "Finetune/Step Time": 2.668483706191182} +{"Finetune/Learning Rate": 1.46598662245724e-05, "Finetune/Loss": 0.822806715965271, "Finetune/Loss (Raw)": 0.8357164263725281, "Finetune/Step": 1817, "Finetune/Step Time": 2.6660183127969503} +{"Finetune/Learning Rate": 1.4654104293579643e-05, "Finetune/Loss": 0.8219201564788818, "Finetune/Loss (Raw)": 0.7419772148132324, "Finetune/Step": 1818, "Finetune/Step Time": 2.665224965661764} +{"Finetune/Learning Rate": 1.464834038952273e-05, "Finetune/Loss": 0.8212075233459473, "Finetune/Loss (Raw)": 0.8519165515899658, "Finetune/Step": 1819, "Finetune/Step Time": 2.6683296654373407} +{"Finetune/Learning Rate": 1.4642574514845223e-05, "Finetune/Loss": 0.8214240074157715, "Finetune/Loss (Raw)": 0.9028580188751221, "Finetune/Step": 1820, "Finetune/Step Time": 2.663939779624343} +{"Finetune/Learning Rate": 1.4636806671991508e-05, "Finetune/Loss": 0.821468710899353, "Finetune/Loss (Raw)": 0.7991629242897034, "Finetune/Step": 1821, "Finetune/Step Time": 2.6644166875630617} +{"Finetune/Learning Rate": 1.4631036863406805e-05, "Finetune/Loss": 0.8218839168548584, "Finetune/Loss (Raw)": 0.8325310945510864, "Finetune/Step": 1822, "Finetune/Step Time": 2.6620133463293314} +{"Finetune/Learning Rate": 1.4625265091537175e-05, "Finetune/Loss": 0.8224614858627319, "Finetune/Loss (Raw)": 0.7954154014587402, "Finetune/Step": 1823, "Finetune/Step Time": 2.6620475854724646} +{"Finetune/Learning Rate": 1.4619491358829502e-05, "Finetune/Loss": 0.8228256702423096, "Finetune/Loss (Raw)": 0.8985925316810608, "Finetune/Step": 1824, "Finetune/Step Time": 2.6599929723888636} +{"Finetune/Learning Rate": 1.4613715667731513e-05, "Finetune/Loss": 0.8232954144477844, "Finetune/Loss (Raw)": 0.8687517046928406, "Finetune/Step": 1825, "Finetune/Step Time": 2.6603613570332527} +{"Finetune/Learning Rate": 1.4607938020691755e-05, "Finetune/Loss": 0.823444128036499, "Finetune/Loss (Raw)": 0.8256111741065979, "Finetune/Step": 1826, "Finetune/Step Time": 2.6633263397961855} +{"Finetune/Learning Rate": 1.4602158420159606e-05, "Finetune/Loss": 0.8222697377204895, "Finetune/Loss (Raw)": 0.7198877930641174, "Finetune/Step": 1827, "Finetune/Step Time": 2.684471609070897} +{"Finetune/Learning Rate": 1.4596376868585276e-05, "Finetune/Loss": 0.8221749067306519, "Finetune/Loss (Raw)": 0.8797715306282043, "Finetune/Step": 1828, "Finetune/Step Time": 2.6860988419502974} +{"Finetune/Learning Rate": 1.4590593368419796e-05, "Finetune/Loss": 0.8219045400619507, "Finetune/Loss (Raw)": 0.8041225671768188, "Finetune/Step": 1829, "Finetune/Step Time": 2.681982923299074} +{"Finetune/Learning Rate": 1.4584807922115034e-05, "Finetune/Loss": 0.8215683102607727, "Finetune/Loss (Raw)": 0.7769491672515869, "Finetune/Step": 1830, "Finetune/Step Time": 2.685616722330451} +{"Finetune/Learning Rate": 1.457902053212367e-05, "Finetune/Loss": 0.8228458166122437, "Finetune/Loss (Raw)": 0.9703748226165771, "Finetune/Step": 1831, "Finetune/Step Time": 2.684756813570857} +{"Finetune/Learning Rate": 1.4573231200899218e-05, "Finetune/Loss": 0.8224542140960693, "Finetune/Loss (Raw)": 0.8240675926208496, "Finetune/Step": 1832, "Finetune/Step Time": 2.674637356773019} +{"Finetune/Learning Rate": 1.4567439930896008e-05, "Finetune/Loss": 0.8219836950302124, "Finetune/Loss (Raw)": 0.7916716933250427, "Finetune/Step": 1833, "Finetune/Step Time": 2.6766629740595818} +{"Finetune/Learning Rate": 1.4561646724569199e-05, "Finetune/Loss": 0.8221184015274048, "Finetune/Loss (Raw)": 0.9087961316108704, "Finetune/Step": 1834, "Finetune/Step Time": 2.6770412418991327} +{"Finetune/Learning Rate": 1.455585158437476e-05, "Finetune/Loss": 0.8222471475601196, "Finetune/Loss (Raw)": 0.8435885310173035, "Finetune/Step": 1835, "Finetune/Step Time": 2.675841636955738} +{"Finetune/Learning Rate": 1.4550054512769493e-05, "Finetune/Loss": 0.8227603435516357, "Finetune/Loss (Raw)": 0.9316474795341492, "Finetune/Step": 1836, "Finetune/Step Time": 2.67321434058249} +{"Finetune/Learning Rate": 1.4544255512211009e-05, "Finetune/Loss": 0.8232210874557495, "Finetune/Loss (Raw)": 0.8490564227104187, "Finetune/Step": 1837, "Finetune/Step Time": 2.6732690818607807} +{"Finetune/Learning Rate": 1.4538454585157742e-05, "Finetune/Loss": 0.8232006430625916, "Finetune/Loss (Raw)": 0.8170177340507507, "Finetune/Step": 1838, "Finetune/Step Time": 2.6744120940566063} +{"Finetune/Learning Rate": 1.453265173406894e-05, "Finetune/Loss": 0.8250501155853271, "Finetune/Loss (Raw)": 0.7856023907661438, "Finetune/Step": 1839, "Finetune/Step Time": 2.650361755862832} +{"Finetune/Learning Rate": 1.452684696140467e-05, "Finetune/Loss": 0.8253594040870667, "Finetune/Loss (Raw)": 0.8816630840301514, "Finetune/Step": 1840, "Finetune/Step Time": 2.646949578076601} +{"Finetune/Learning Rate": 1.452104026962581e-05, "Finetune/Loss": 0.8264015913009644, "Finetune/Loss (Raw)": 0.9147416353225708, "Finetune/Step": 1841, "Finetune/Step Time": 2.6459813322871923} +{"Finetune/Learning Rate": 1.4515231661194052e-05, "Finetune/Loss": 0.8260283470153809, "Finetune/Loss (Raw)": 0.8854108452796936, "Finetune/Step": 1842, "Finetune/Step Time": 2.6451032757759094} +{"Finetune/Learning Rate": 1.4509421138571898e-05, "Finetune/Loss": 0.825090765953064, "Finetune/Loss (Raw)": 0.7687599658966064, "Finetune/Step": 1843, "Finetune/Step Time": 2.6453541964292526} +{"Finetune/Learning Rate": 1.4503608704222672e-05, "Finetune/Loss": 0.8254833221435547, "Finetune/Loss (Raw)": 0.9740810990333557, "Finetune/Step": 1844, "Finetune/Step Time": 2.64632435888052} +{"Finetune/Learning Rate": 1.4497794360610498e-05, "Finetune/Loss": 0.8260120749473572, "Finetune/Loss (Raw)": 0.9266525506973267, "Finetune/Step": 1845, "Finetune/Step Time": 2.6440892051905394} +{"Finetune/Learning Rate": 1.449197811020031e-05, "Finetune/Loss": 0.8254852890968323, "Finetune/Loss (Raw)": 0.811752200126648, "Finetune/Step": 1846, "Finetune/Step Time": 2.6464663427323103} +{"Finetune/Learning Rate": 1.4486159955457857e-05, "Finetune/Loss": 0.8258739709854126, "Finetune/Loss (Raw)": 0.8164394497871399, "Finetune/Step": 1847, "Finetune/Step Time": 2.646707221865654} +{"Finetune/Learning Rate": 1.4480339898849694e-05, "Finetune/Loss": 0.8242899775505066, "Finetune/Loss (Raw)": 0.7790248990058899, "Finetune/Step": 1848, "Finetune/Step Time": 2.6463134679943323} +{"Finetune/Learning Rate": 1.4474517942843173e-05, "Finetune/Loss": 0.8253183364868164, "Finetune/Loss (Raw)": 0.9611983895301819, "Finetune/Step": 1849, "Finetune/Step Time": 2.6456008851528168} +{"Finetune/Learning Rate": 1.4468694089906463e-05, "Finetune/Loss": 0.8248521089553833, "Finetune/Loss (Raw)": 0.8032286167144775, "Finetune/Step": 1850, "Finetune/Step Time": 2.643134055659175} +{"Finetune/Learning Rate": 1.4462868342508529e-05, "Finetune/Loss": 0.8249375820159912, "Finetune/Loss (Raw)": 0.8079923391342163, "Finetune/Step": 1851, "Finetune/Step Time": 2.642423540353775} +{"Finetune/Learning Rate": 1.4457040703119143e-05, "Finetune/Loss": 0.824480414390564, "Finetune/Loss (Raw)": 0.7410650253295898, "Finetune/Step": 1852, "Finetune/Step Time": 2.642965318635106} +{"Finetune/Learning Rate": 1.4451211174208882e-05, "Finetune/Loss": 0.82435542345047, "Finetune/Loss (Raw)": 0.8458552360534668, "Finetune/Step": 1853, "Finetune/Step Time": 2.640711933374405} +{"Finetune/Learning Rate": 1.4445379758249117e-05, "Finetune/Loss": 0.8245368599891663, "Finetune/Loss (Raw)": 0.8335461020469666, "Finetune/Step": 1854, "Finetune/Step Time": 2.6378717366605997} +{"Finetune/Learning Rate": 1.443954645771202e-05, "Finetune/Loss": 0.8190518617630005, "Finetune/Loss (Raw)": 0.17700453102588654, "Finetune/Step": 1855, "Finetune/Step Time": 2.6714558266103268} +{"Finetune/Learning Rate": 1.4433711275070572e-05, "Finetune/Loss": 0.8176456093788147, "Finetune/Loss (Raw)": 0.7667949795722961, "Finetune/Step": 1856, "Finetune/Step Time": 2.693955909460783} +{"Finetune/Learning Rate": 1.4427874212798536e-05, "Finetune/Loss": 0.8169068098068237, "Finetune/Loss (Raw)": 0.7947995066642761, "Finetune/Step": 1857, "Finetune/Step Time": 2.6975424271076918} +{"Finetune/Learning Rate": 1.4422035273370488e-05, "Finetune/Loss": 0.8155808448791504, "Finetune/Loss (Raw)": 0.8002811074256897, "Finetune/Step": 1858, "Finetune/Step Time": 2.6957223024219275} +{"Finetune/Learning Rate": 1.4416194459261785e-05, "Finetune/Loss": 0.8153270483016968, "Finetune/Loss (Raw)": 0.7295145988464355, "Finetune/Step": 1859, "Finetune/Step Time": 2.7183726131916046} +{"Finetune/Learning Rate": 1.441035177294859e-05, "Finetune/Loss": 0.8160961270332336, "Finetune/Loss (Raw)": 0.8450427651405334, "Finetune/Step": 1860, "Finetune/Step Time": 2.7185934614390135} +{"Finetune/Learning Rate": 1.4404507216907853e-05, "Finetune/Loss": 0.816556453704834, "Finetune/Loss (Raw)": 0.7876402735710144, "Finetune/Step": 1861, "Finetune/Step Time": 2.719500271603465} +{"Finetune/Learning Rate": 1.439866079361732e-05, "Finetune/Loss": 0.8173816204071045, "Finetune/Loss (Raw)": 0.8373050689697266, "Finetune/Step": 1862, "Finetune/Step Time": 2.7227920163422823} +{"Finetune/Learning Rate": 1.4392812505555531e-05, "Finetune/Loss": 0.8209156394004822, "Finetune/Loss (Raw)": 1.004236102104187, "Finetune/Step": 1863, "Finetune/Step Time": 2.695583315566182} +{"Finetune/Learning Rate": 1.4386962355201809e-05, "Finetune/Loss": 0.8226261138916016, "Finetune/Loss (Raw)": 0.8607861995697021, "Finetune/Step": 1864, "Finetune/Step Time": 2.672641871497035} +{"Finetune/Learning Rate": 1.4381110345036268e-05, "Finetune/Loss": 0.8235106468200684, "Finetune/Loss (Raw)": 0.9021410942077637, "Finetune/Step": 1865, "Finetune/Step Time": 2.6753633860498667} +{"Finetune/Learning Rate": 1.437525647753982e-05, "Finetune/Loss": 0.823611855506897, "Finetune/Loss (Raw)": 0.7471106052398682, "Finetune/Step": 1866, "Finetune/Step Time": 2.6764626130461693} +{"Finetune/Learning Rate": 1.4369400755194156e-05, "Finetune/Loss": 0.8249158263206482, "Finetune/Loss (Raw)": 0.9728149771690369, "Finetune/Step": 1867, "Finetune/Step Time": 2.6781699620187283} +{"Finetune/Learning Rate": 1.4363543180481752e-05, "Finetune/Loss": 0.8262598514556885, "Finetune/Loss (Raw)": 0.8348913192749023, "Finetune/Step": 1868, "Finetune/Step Time": 2.6540192496031523} +{"Finetune/Learning Rate": 1.4357683755885875e-05, "Finetune/Loss": 0.825872540473938, "Finetune/Loss (Raw)": 0.853310227394104, "Finetune/Step": 1869, "Finetune/Step Time": 2.6524741742759943} +{"Finetune/Learning Rate": 1.435182248389057e-05, "Finetune/Loss": 0.8262595534324646, "Finetune/Loss (Raw)": 0.8030047416687012, "Finetune/Step": 1870, "Finetune/Step Time": 2.658134201541543} +{"Finetune/Learning Rate": 1.434595936698067e-05, "Finetune/Loss": 0.8263338804244995, "Finetune/Loss (Raw)": 0.8460947275161743, "Finetune/Step": 1871, "Finetune/Step Time": 2.655606919899583} +{"Finetune/Learning Rate": 1.4340094407641794e-05, "Finetune/Loss": 0.826841413974762, "Finetune/Loss (Raw)": 0.8409009575843811, "Finetune/Step": 1872, "Finetune/Step Time": 2.664742724969983} +{"Finetune/Learning Rate": 1.433422760836033e-05, "Finetune/Loss": 0.8282151222229004, "Finetune/Loss (Raw)": 0.8241176009178162, "Finetune/Step": 1873, "Finetune/Step Time": 2.6637284625321627} +{"Finetune/Learning Rate": 1.4328358971623455e-05, "Finetune/Loss": 0.8285950422286987, "Finetune/Loss (Raw)": 0.8672202229499817, "Finetune/Step": 1874, "Finetune/Step Time": 2.6646016966551542} +{"Finetune/Learning Rate": 1.4322488499919123e-05, "Finetune/Loss": 0.8281144499778748, "Finetune/Loss (Raw)": 0.7693583965301514, "Finetune/Step": 1875, "Finetune/Step Time": 2.663726296275854} +{"Finetune/Learning Rate": 1.4316616195736068e-05, "Finetune/Loss": 0.828387975692749, "Finetune/Loss (Raw)": 0.9533839225769043, "Finetune/Step": 1876, "Finetune/Step Time": 2.6650126464664936} +{"Finetune/Learning Rate": 1.4310742061563796e-05, "Finetune/Loss": 0.8278810381889343, "Finetune/Loss (Raw)": 0.8880443572998047, "Finetune/Step": 1877, "Finetune/Step Time": 2.6632660254836082} +{"Finetune/Learning Rate": 1.4304866099892594e-05, "Finetune/Loss": 0.82796311378479, "Finetune/Loss (Raw)": 0.8152328729629517, "Finetune/Step": 1878, "Finetune/Step Time": 2.6658522710204124} +{"Finetune/Learning Rate": 1.4298988313213516e-05, "Finetune/Loss": 0.8278229832649231, "Finetune/Loss (Raw)": 0.8439444899559021, "Finetune/Step": 1879, "Finetune/Step Time": 2.664173297584057} +{"Finetune/Learning Rate": 1.4293108704018397e-05, "Finetune/Loss": 0.8270882368087769, "Finetune/Loss (Raw)": 0.7364852428436279, "Finetune/Step": 1880, "Finetune/Step Time": 2.665186356753111} +{"Finetune/Learning Rate": 1.4287227274799848e-05, "Finetune/Loss": 0.8291144371032715, "Finetune/Loss (Raw)": 0.7614390254020691, "Finetune/Step": 1881, "Finetune/Step Time": 2.6469584442675114} +{"Finetune/Learning Rate": 1.4281344028051241e-05, "Finetune/Loss": 0.8299670219421387, "Finetune/Loss (Raw)": 0.9130287170410156, "Finetune/Step": 1882, "Finetune/Step Time": 2.6458948757499456} +{"Finetune/Learning Rate": 1.4275458966266723e-05, "Finetune/Loss": 0.8306784629821777, "Finetune/Loss (Raw)": 0.9054094552993774, "Finetune/Step": 1883, "Finetune/Step Time": 2.646720675751567} +{"Finetune/Learning Rate": 1.4269572091941215e-05, "Finetune/Loss": 0.8296959400177002, "Finetune/Loss (Raw)": 0.7539703845977783, "Finetune/Step": 1884, "Finetune/Step Time": 2.6502370834350586} +{"Finetune/Learning Rate": 1.4263683407570396e-05, "Finetune/Loss": 0.8301843404769897, "Finetune/Loss (Raw)": 0.9129518866539001, "Finetune/Step": 1885, "Finetune/Step Time": 2.651038510724902} +{"Finetune/Learning Rate": 1.4257792915650728e-05, "Finetune/Loss": 0.8301000595092773, "Finetune/Loss (Raw)": 0.871926486492157, "Finetune/Step": 1886, "Finetune/Step Time": 2.6539660152047873} +{"Finetune/Learning Rate": 1.4251900618679424e-05, "Finetune/Loss": 0.8294285535812378, "Finetune/Loss (Raw)": 0.7597553730010986, "Finetune/Step": 1887, "Finetune/Step Time": 2.652595577761531} +{"Finetune/Learning Rate": 1.424600651915447e-05, "Finetune/Loss": 0.8287422060966492, "Finetune/Loss (Raw)": 0.7675488591194153, "Finetune/Step": 1888, "Finetune/Step Time": 2.6456915698945522} +{"Finetune/Learning Rate": 1.424011061957461e-05, "Finetune/Loss": 0.8286271691322327, "Finetune/Loss (Raw)": 0.8436177372932434, "Finetune/Step": 1889, "Finetune/Step Time": 2.6465058363974094} +{"Finetune/Learning Rate": 1.4234212922439364e-05, "Finetune/Loss": 0.8284609317779541, "Finetune/Loss (Raw)": 0.8625843524932861, "Finetune/Step": 1890, "Finetune/Step Time": 2.6452251095324755} +{"Finetune/Learning Rate": 1.4228313430249001e-05, "Finetune/Loss": 0.8283879160881042, "Finetune/Loss (Raw)": 0.870954692363739, "Finetune/Step": 1891, "Finetune/Step Time": 2.645697785541415} +{"Finetune/Learning Rate": 1.4222412145504554e-05, "Finetune/Loss": 0.829247236251831, "Finetune/Loss (Raw)": 0.8603828549385071, "Finetune/Step": 1892, "Finetune/Step Time": 2.6486543845385313} +{"Finetune/Learning Rate": 1.4216509070707822e-05, "Finetune/Loss": 0.8293846845626831, "Finetune/Loss (Raw)": 0.8689532279968262, "Finetune/Step": 1893, "Finetune/Step Time": 2.645349096506834} +{"Finetune/Learning Rate": 1.4210604208361355e-05, "Finetune/Loss": 0.8294922113418579, "Finetune/Loss (Raw)": 0.85662841796875, "Finetune/Step": 1894, "Finetune/Step Time": 2.6435376815497875} +{"Finetune/Learning Rate": 1.420469756096847e-05, "Finetune/Loss": 0.8298171758651733, "Finetune/Loss (Raw)": 0.924004077911377, "Finetune/Step": 1895, "Finetune/Step Time": 2.640261773020029} +{"Finetune/Learning Rate": 1.4198789131033227e-05, "Finetune/Loss": 0.8298222422599792, "Finetune/Loss (Raw)": 0.7829148173332214, "Finetune/Step": 1896, "Finetune/Step Time": 2.6433934029191732} +{"Finetune/Learning Rate": 1.4192878921060458e-05, "Finetune/Loss": 0.8299893736839294, "Finetune/Loss (Raw)": 0.8012174367904663, "Finetune/Step": 1897, "Finetune/Step Time": 2.6434338372200727} +{"Finetune/Learning Rate": 1.4186966933555735e-05, "Finetune/Loss": 0.8290536403656006, "Finetune/Loss (Raw)": 0.8143687844276428, "Finetune/Step": 1898, "Finetune/Step Time": 2.646687986329198} +{"Finetune/Learning Rate": 1.4181053171025392e-05, "Finetune/Loss": 0.8292750120162964, "Finetune/Loss (Raw)": 0.8387923240661621, "Finetune/Step": 1899, "Finetune/Step Time": 2.650279166176915} +{"Finetune/Learning Rate": 1.4175137635976515e-05, "Finetune/Loss": 0.8284364938735962, "Finetune/Loss (Raw)": 0.7276753187179565, "Finetune/Step": 1900, "Finetune/Step Time": 2.6461349707096815} +{"Finetune/Learning Rate": 1.4169220330916939e-05, "Finetune/Loss": 0.8276022672653198, "Finetune/Loss (Raw)": 0.777654767036438, "Finetune/Step": 1901, "Finetune/Step Time": 2.648345524445176} +{"Finetune/Learning Rate": 1.4163301258355249e-05, "Finetune/Loss": 0.8232738971710205, "Finetune/Loss (Raw)": 0.2798071801662445, "Finetune/Step": 1902, "Finetune/Step Time": 2.678231777623296} +{"Finetune/Learning Rate": 1.4157380420800784e-05, "Finetune/Loss": 0.8234512805938721, "Finetune/Loss (Raw)": 0.8285449743270874, "Finetune/Step": 1903, "Finetune/Step Time": 2.675668105483055} +{"Finetune/Learning Rate": 1.4151457820763624e-05, "Finetune/Loss": 0.8233731985092163, "Finetune/Loss (Raw)": 0.851884663105011, "Finetune/Step": 1904, "Finetune/Step Time": 2.6730658523738384} +{"Finetune/Learning Rate": 1.41455334607546e-05, "Finetune/Loss": 0.8239136934280396, "Finetune/Loss (Raw)": 0.8020908832550049, "Finetune/Step": 1905, "Finetune/Step Time": 2.6748647689819336} +{"Finetune/Learning Rate": 1.4139607343285296e-05, "Finetune/Loss": 0.8248029947280884, "Finetune/Loss (Raw)": 0.8832690119743347, "Finetune/Step": 1906, "Finetune/Step Time": 2.6721682492643595} +{"Finetune/Learning Rate": 1.4133679470868027e-05, "Finetune/Loss": 0.8253860473632812, "Finetune/Loss (Raw)": 0.8750849366188049, "Finetune/Step": 1907, "Finetune/Step Time": 2.6756233032792807} +{"Finetune/Learning Rate": 1.412774984601586e-05, "Finetune/Loss": 0.8256661891937256, "Finetune/Loss (Raw)": 0.8199577331542969, "Finetune/Step": 1908, "Finetune/Step Time": 2.6755711007863283} +{"Finetune/Learning Rate": 1.4121818471242608e-05, "Finetune/Loss": 0.8257500529289246, "Finetune/Loss (Raw)": 0.7773475646972656, "Finetune/Step": 1909, "Finetune/Step Time": 2.682747373357415} +{"Finetune/Learning Rate": 1.4115885349062818e-05, "Finetune/Loss": 0.825331449508667, "Finetune/Loss (Raw)": 0.8647472858428955, "Finetune/Step": 1910, "Finetune/Step Time": 2.680012084543705} +{"Finetune/Learning Rate": 1.4109950481991788e-05, "Finetune/Loss": 0.8242810964584351, "Finetune/Loss (Raw)": 0.6383667588233948, "Finetune/Step": 1911, "Finetune/Step Time": 2.6958875358104706} +{"Finetune/Learning Rate": 1.4104013872545544e-05, "Finetune/Loss": 0.824026346206665, "Finetune/Loss (Raw)": 0.8323401808738708, "Finetune/Step": 1912, "Finetune/Step Time": 2.698196928948164} +{"Finetune/Learning Rate": 1.4098075523240856e-05, "Finetune/Loss": 0.8228086829185486, "Finetune/Loss (Raw)": 0.7930288910865784, "Finetune/Step": 1913, "Finetune/Step Time": 2.699764298275113} +{"Finetune/Learning Rate": 1.4092135436595234e-05, "Finetune/Loss": 0.8234893083572388, "Finetune/Loss (Raw)": 0.8807306289672852, "Finetune/Step": 1914, "Finetune/Step Time": 2.7004006821662188} +{"Finetune/Learning Rate": 1.4086193615126922e-05, "Finetune/Loss": 0.8238708972930908, "Finetune/Loss (Raw)": 0.8999535441398621, "Finetune/Step": 1915, "Finetune/Step Time": 2.697760868817568} +{"Finetune/Learning Rate": 1.4080250061354899e-05, "Finetune/Loss": 0.8242921829223633, "Finetune/Loss (Raw)": 0.8386611938476562, "Finetune/Step": 1916, "Finetune/Step Time": 2.7036478091031313} +{"Finetune/Learning Rate": 1.4074304777798882e-05, "Finetune/Loss": 0.8238574862480164, "Finetune/Loss (Raw)": 0.8242572546005249, "Finetune/Step": 1917, "Finetune/Step Time": 2.7031599897891283} +{"Finetune/Learning Rate": 1.4068357766979314e-05, "Finetune/Loss": 0.8234518766403198, "Finetune/Loss (Raw)": 0.79712975025177, "Finetune/Step": 1918, "Finetune/Step Time": 2.702278131619096} +{"Finetune/Learning Rate": 1.406240903141738e-05, "Finetune/Loss": 0.8234198093414307, "Finetune/Loss (Raw)": 0.8027342557907104, "Finetune/Step": 1919, "Finetune/Step Time": 2.7014946155250072} +{"Finetune/Learning Rate": 1.4056458573634988e-05, "Finetune/Loss": 0.8242738246917725, "Finetune/Loss (Raw)": 0.917716383934021, "Finetune/Step": 1920, "Finetune/Step Time": 2.7022007368505} +{"Finetune/Learning Rate": 1.4050506396154779e-05, "Finetune/Loss": 0.8240509033203125, "Finetune/Loss (Raw)": 0.8377450108528137, "Finetune/Step": 1921, "Finetune/Step Time": 2.7016131207346916} +{"Finetune/Learning Rate": 1.4044552501500124e-05, "Finetune/Loss": 0.824833869934082, "Finetune/Loss (Raw)": 0.7703537344932556, "Finetune/Step": 1922, "Finetune/Step Time": 2.7002746406942606} +{"Finetune/Learning Rate": 1.403859689219512e-05, "Finetune/Loss": 0.8238319158554077, "Finetune/Loss (Raw)": 0.7914015054702759, "Finetune/Step": 1923, "Finetune/Step Time": 2.698708765208721} +{"Finetune/Learning Rate": 1.4032639570764595e-05, "Finetune/Loss": 0.8238909244537354, "Finetune/Loss (Raw)": 0.7874855995178223, "Finetune/Step": 1924, "Finetune/Step Time": 2.7024566419422626} +{"Finetune/Learning Rate": 1.4026680539734096e-05, "Finetune/Loss": 0.8234909176826477, "Finetune/Loss (Raw)": 0.8232948780059814, "Finetune/Step": 1925, "Finetune/Step Time": 2.7013067081570625} +{"Finetune/Learning Rate": 1.4020719801629902e-05, "Finetune/Loss": 0.821542501449585, "Finetune/Loss (Raw)": 0.6624454855918884, "Finetune/Step": 1926, "Finetune/Step Time": 2.7222059313207865} +{"Finetune/Learning Rate": 1.401475735897901e-05, "Finetune/Loss": 0.8212729692459106, "Finetune/Loss (Raw)": 0.7271931171417236, "Finetune/Step": 1927, "Finetune/Step Time": 2.7247347682714462} +{"Finetune/Learning Rate": 1.4008793214309147e-05, "Finetune/Loss": 0.8223748207092285, "Finetune/Loss (Raw)": 0.8699021339416504, "Finetune/Step": 1928, "Finetune/Step Time": 2.7346863225102425} +{"Finetune/Learning Rate": 1.4002827370148747e-05, "Finetune/Loss": 0.822655439376831, "Finetune/Loss (Raw)": 0.830448567867279, "Finetune/Step": 1929, "Finetune/Step Time": 2.7348890230059624} +{"Finetune/Learning Rate": 1.3996859829026983e-05, "Finetune/Loss": 0.8218845725059509, "Finetune/Loss (Raw)": 0.8047902584075928, "Finetune/Step": 1930, "Finetune/Step Time": 2.740561766549945} +{"Finetune/Learning Rate": 1.3990890593473734e-05, "Finetune/Loss": 0.8221964836120605, "Finetune/Loss (Raw)": 0.8148189187049866, "Finetune/Step": 1931, "Finetune/Step Time": 2.741430191323161} +{"Finetune/Learning Rate": 1.3984919666019603e-05, "Finetune/Loss": 0.8234387040138245, "Finetune/Loss (Raw)": 0.9469688534736633, "Finetune/Step": 1932, "Finetune/Step Time": 2.7368758097290993} +{"Finetune/Learning Rate": 1.3978947049195909e-05, "Finetune/Loss": 0.823167085647583, "Finetune/Loss (Raw)": 0.8409982323646545, "Finetune/Step": 1933, "Finetune/Step Time": 2.7338974364101887} +{"Finetune/Learning Rate": 1.3972972745534685e-05, "Finetune/Loss": 0.8241647481918335, "Finetune/Loss (Raw)": 0.9607287049293518, "Finetune/Step": 1934, "Finetune/Step Time": 2.7392000425606966} +{"Finetune/Learning Rate": 1.3966996757568686e-05, "Finetune/Loss": 0.8245556354522705, "Finetune/Loss (Raw)": 0.7555340528488159, "Finetune/Step": 1935, "Finetune/Step Time": 2.7346264254301786} +{"Finetune/Learning Rate": 1.3961019087831373e-05, "Finetune/Loss": 0.8240675330162048, "Finetune/Loss (Raw)": 0.8689895868301392, "Finetune/Step": 1936, "Finetune/Step Time": 2.7360127363353968} +{"Finetune/Learning Rate": 1.3955039738856924e-05, "Finetune/Loss": 0.820306658744812, "Finetune/Loss (Raw)": 0.4184010624885559, "Finetune/Step": 1937, "Finetune/Step Time": 2.772854048758745} +{"Finetune/Learning Rate": 1.394905871318023e-05, "Finetune/Loss": 0.8218050003051758, "Finetune/Loss (Raw)": 0.9130138754844666, "Finetune/Step": 1938, "Finetune/Step Time": 2.771618578583002} +{"Finetune/Learning Rate": 1.3943076013336891e-05, "Finetune/Loss": 0.8225786685943604, "Finetune/Loss (Raw)": 0.8782536387443542, "Finetune/Step": 1939, "Finetune/Step Time": 2.7714467272162437} +{"Finetune/Learning Rate": 1.3937091641863213e-05, "Finetune/Loss": 0.8229711651802063, "Finetune/Loss (Raw)": 0.8627387881278992, "Finetune/Step": 1940, "Finetune/Step Time": 2.7712764274328947} +{"Finetune/Learning Rate": 1.3931105601296217e-05, "Finetune/Loss": 0.8221558928489685, "Finetune/Loss (Raw)": 0.8033323884010315, "Finetune/Step": 1941, "Finetune/Step Time": 2.77191274240613} +{"Finetune/Learning Rate": 1.392511789417363e-05, "Finetune/Loss": 0.8221193552017212, "Finetune/Loss (Raw)": 0.7864324450492859, "Finetune/Step": 1942, "Finetune/Step Time": 2.7711655627936125} +{"Finetune/Learning Rate": 1.3919128523033885e-05, "Finetune/Loss": 0.8221962451934814, "Finetune/Loss (Raw)": 0.8052806854248047, "Finetune/Step": 1943, "Finetune/Step Time": 2.770521717146039} +{"Finetune/Learning Rate": 1.3913137490416117e-05, "Finetune/Loss": 0.821124255657196, "Finetune/Loss (Raw)": 0.7519562244415283, "Finetune/Step": 1944, "Finetune/Step Time": 2.759060714393854} +{"Finetune/Learning Rate": 1.3907144798860172e-05, "Finetune/Loss": 0.8161913156509399, "Finetune/Loss (Raw)": 0.20430395007133484, "Finetune/Step": 1945, "Finetune/Step Time": 2.7953069377690554} +{"Finetune/Learning Rate": 1.3901150450906593e-05, "Finetune/Loss": 0.8169927597045898, "Finetune/Loss (Raw)": 0.8445656895637512, "Finetune/Step": 1946, "Finetune/Step Time": 2.7985548209398985} +{"Finetune/Learning Rate": 1.3895154449096631e-05, "Finetune/Loss": 0.8165217638015747, "Finetune/Loss (Raw)": 0.791622519493103, "Finetune/Step": 1947, "Finetune/Step Time": 2.803079703822732} +{"Finetune/Learning Rate": 1.3889156795972231e-05, "Finetune/Loss": 0.8152368068695068, "Finetune/Loss (Raw)": 0.7383872866630554, "Finetune/Step": 1948, "Finetune/Step Time": 2.802030296996236} +{"Finetune/Learning Rate": 1.3883157494076048e-05, "Finetune/Loss": 0.815790057182312, "Finetune/Loss (Raw)": 0.8699792623519897, "Finetune/Step": 1949, "Finetune/Step Time": 2.801534404978156} +{"Finetune/Learning Rate": 1.3877156545951423e-05, "Finetune/Loss": 0.8170521259307861, "Finetune/Loss (Raw)": 0.994083821773529, "Finetune/Step": 1950, "Finetune/Step Time": 2.8033977691084146} +{"Finetune/Learning Rate": 1.3871153954142406e-05, "Finetune/Loss": 0.8172114491462708, "Finetune/Loss (Raw)": 0.8158003091812134, "Finetune/Step": 1951, "Finetune/Step Time": 2.8032592236995697} +{"Finetune/Learning Rate": 1.3865149721193741e-05, "Finetune/Loss": 0.8179308176040649, "Finetune/Loss (Raw)": 0.9906662702560425, "Finetune/Step": 1952, "Finetune/Step Time": 2.8038894329220057} +{"Finetune/Learning Rate": 1.3859143849650865e-05, "Finetune/Loss": 0.8178868293762207, "Finetune/Loss (Raw)": 0.8631272912025452, "Finetune/Step": 1953, "Finetune/Step Time": 2.80556758120656} +{"Finetune/Learning Rate": 1.385313634205991e-05, "Finetune/Loss": 0.8176074028015137, "Finetune/Loss (Raw)": 0.789848268032074, "Finetune/Step": 1954, "Finetune/Step Time": 2.8025815673172474} +{"Finetune/Learning Rate": 1.3847127200967703e-05, "Finetune/Loss": 0.8187397718429565, "Finetune/Loss (Raw)": 0.8648275136947632, "Finetune/Step": 1955, "Finetune/Step Time": 2.7799064964056015} +{"Finetune/Learning Rate": 1.3841116428921768e-05, "Finetune/Loss": 0.8134727478027344, "Finetune/Loss (Raw)": 0.20559483766555786, "Finetune/Step": 1956, "Finetune/Step Time": 2.811705155298114} +{"Finetune/Learning Rate": 1.3835104028470312e-05, "Finetune/Loss": 0.8136199116706848, "Finetune/Loss (Raw)": 0.8229617476463318, "Finetune/Step": 1957, "Finetune/Step Time": 2.813931543380022} +{"Finetune/Learning Rate": 1.3829090002162235e-05, "Finetune/Loss": 0.814154326915741, "Finetune/Loss (Raw)": 0.8453516364097595, "Finetune/Step": 1958, "Finetune/Step Time": 2.808105256408453} +{"Finetune/Learning Rate": 1.382307435254713e-05, "Finetune/Loss": 0.812552809715271, "Finetune/Loss (Raw)": 0.765374481678009, "Finetune/Step": 1959, "Finetune/Step Time": 2.803169572725892} +{"Finetune/Learning Rate": 1.3817057082175272e-05, "Finetune/Loss": 0.8127124309539795, "Finetune/Loss (Raw)": 0.8445010781288147, "Finetune/Step": 1960, "Finetune/Step Time": 2.798642011359334} +{"Finetune/Learning Rate": 1.3811038193597633e-05, "Finetune/Loss": 0.813080906867981, "Finetune/Loss (Raw)": 0.8388370871543884, "Finetune/Step": 1961, "Finetune/Step Time": 2.794994378462434} +{"Finetune/Learning Rate": 1.3805017689365859e-05, "Finetune/Loss": 0.8123396635055542, "Finetune/Loss (Raw)": 0.8139178156852722, "Finetune/Step": 1962, "Finetune/Step Time": 2.796778989955783} +{"Finetune/Learning Rate": 1.379899557203229e-05, "Finetune/Loss": 0.8124899864196777, "Finetune/Loss (Raw)": 0.8628327250480652, "Finetune/Step": 1963, "Finetune/Step Time": 2.7975211907178164} +{"Finetune/Learning Rate": 1.3792971844149942e-05, "Finetune/Loss": 0.812139630317688, "Finetune/Loss (Raw)": 0.8868054151535034, "Finetune/Step": 1964, "Finetune/Step Time": 2.798398671671748} +{"Finetune/Learning Rate": 1.3786946508272526e-05, "Finetune/Loss": 0.8116370439529419, "Finetune/Loss (Raw)": 0.7847181558609009, "Finetune/Step": 1965, "Finetune/Step Time": 2.7967530991882086} +{"Finetune/Learning Rate": 1.3780919566954418e-05, "Finetune/Loss": 0.8121440410614014, "Finetune/Loss (Raw)": 0.881913423538208, "Finetune/Step": 1966, "Finetune/Step Time": 2.7978053633123636} +{"Finetune/Learning Rate": 1.3774891022750691e-05, "Finetune/Loss": 0.8116360902786255, "Finetune/Loss (Raw)": 0.720585823059082, "Finetune/Step": 1967, "Finetune/Step Time": 2.7958614323288202} +{"Finetune/Learning Rate": 1.3768860878217087e-05, "Finetune/Loss": 0.8109897375106812, "Finetune/Loss (Raw)": 0.798927366733551, "Finetune/Step": 1968, "Finetune/Step Time": 2.796508826315403} +{"Finetune/Learning Rate": 1.376282913591003e-05, "Finetune/Loss": 0.8099169731140137, "Finetune/Loss (Raw)": 0.7774317860603333, "Finetune/Step": 1969, "Finetune/Step Time": 2.7994972970336676} +{"Finetune/Learning Rate": 1.375679579838662e-05, "Finetune/Loss": 0.8081933259963989, "Finetune/Loss (Raw)": 0.6647883057594299, "Finetune/Step": 1970, "Finetune/Step Time": 2.82220022380352} +{"Finetune/Learning Rate": 1.3750760868204635e-05, "Finetune/Loss": 0.8084486126899719, "Finetune/Loss (Raw)": 0.8014317154884338, "Finetune/Step": 1971, "Finetune/Step Time": 2.8204433117061853} +{"Finetune/Learning Rate": 1.3744724347922528e-05, "Finetune/Loss": 0.8069136142730713, "Finetune/Loss (Raw)": 0.7776023149490356, "Finetune/Step": 1972, "Finetune/Step Time": 2.817115182057023} +{"Finetune/Learning Rate": 1.3738686240099428e-05, "Finetune/Loss": 0.8043563961982727, "Finetune/Loss (Raw)": 0.5993297696113586, "Finetune/Step": 1973, "Finetune/Step Time": 2.84407433308661} +{"Finetune/Learning Rate": 1.3732646547295128e-05, "Finetune/Loss": 0.8044132590293884, "Finetune/Loss (Raw)": 0.819030225276947, "Finetune/Step": 1974, "Finetune/Step Time": 2.841584926471114} +{"Finetune/Learning Rate": 1.3726605272070103e-05, "Finetune/Loss": 0.8040919303894043, "Finetune/Loss (Raw)": 0.7753095030784607, "Finetune/Step": 1975, "Finetune/Step Time": 2.8404316157102585} +{"Finetune/Learning Rate": 1.3720562416985497e-05, "Finetune/Loss": 0.8046318292617798, "Finetune/Loss (Raw)": 0.8481297492980957, "Finetune/Step": 1976, "Finetune/Step Time": 2.845148764550686} +{"Finetune/Learning Rate": 1.371451798460312e-05, "Finetune/Loss": 0.8026195168495178, "Finetune/Loss (Raw)": 0.7036236524581909, "Finetune/Step": 1977, "Finetune/Step Time": 2.846070248633623} +{"Finetune/Learning Rate": 1.3708471977485454e-05, "Finetune/Loss": 0.8032270669937134, "Finetune/Loss (Raw)": 0.8809912800788879, "Finetune/Step": 1978, "Finetune/Step Time": 2.8459876868873835} +{"Finetune/Learning Rate": 1.3702424398195644e-05, "Finetune/Loss": 0.8033643960952759, "Finetune/Loss (Raw)": 0.8255752325057983, "Finetune/Step": 1979, "Finetune/Step Time": 2.8481340892612934} +{"Finetune/Learning Rate": 1.3696375249297509e-05, "Finetune/Loss": 0.8033983111381531, "Finetune/Loss (Raw)": 0.745408833026886, "Finetune/Step": 1980, "Finetune/Step Time": 2.8713412024080753} +{"Finetune/Learning Rate": 1.3690324533355528e-05, "Finetune/Loss": 0.8029953241348267, "Finetune/Loss (Raw)": 0.7942650318145752, "Finetune/Step": 1981, "Finetune/Step Time": 2.874026231467724} +{"Finetune/Learning Rate": 1.3684272252934847e-05, "Finetune/Loss": 0.8030663728713989, "Finetune/Loss (Raw)": 0.8426374197006226, "Finetune/Step": 1982, "Finetune/Step Time": 2.8743587005883455} +{"Finetune/Learning Rate": 1.3678218410601269e-05, "Finetune/Loss": 0.8072159886360168, "Finetune/Loss (Raw)": 0.7081629633903503, "Finetune/Step": 1983, "Finetune/Step Time": 2.844303263351321} +{"Finetune/Learning Rate": 1.3672163008921271e-05, "Finetune/Loss": 0.8058817386627197, "Finetune/Loss (Raw)": 0.5960091948509216, "Finetune/Step": 1984, "Finetune/Step Time": 2.853349572047591} +{"Finetune/Learning Rate": 1.3666106050461979e-05, "Finetune/Loss": 0.8063779473304749, "Finetune/Loss (Raw)": 0.8583175539970398, "Finetune/Step": 1985, "Finetune/Step Time": 2.8512886855751276} +{"Finetune/Learning Rate": 1.3660047537791186e-05, "Finetune/Loss": 0.8063244223594666, "Finetune/Loss (Raw)": 0.7934301495552063, "Finetune/Step": 1986, "Finetune/Step Time": 2.8532081581652164} +{"Finetune/Learning Rate": 1.3653987473477344e-05, "Finetune/Loss": 0.8071635961532593, "Finetune/Loss (Raw)": 0.83692467212677, "Finetune/Step": 1987, "Finetune/Step Time": 2.828841833397746} +{"Finetune/Learning Rate": 1.3647925860089552e-05, "Finetune/Loss": 0.8062455654144287, "Finetune/Loss (Raw)": 0.727533221244812, "Finetune/Step": 1988, "Finetune/Step Time": 2.8304566647857428} +{"Finetune/Learning Rate": 1.3641862700197589e-05, "Finetune/Loss": 0.8064950704574585, "Finetune/Loss (Raw)": 0.8195774555206299, "Finetune/Step": 1989, "Finetune/Step Time": 2.8332248721271753} +{"Finetune/Learning Rate": 1.3635797996371862e-05, "Finetune/Loss": 0.8065457344055176, "Finetune/Loss (Raw)": 0.8437917828559875, "Finetune/Step": 1990, "Finetune/Step Time": 2.828514091670513} +{"Finetune/Learning Rate": 1.3629731751183452e-05, "Finetune/Loss": 0.8055894374847412, "Finetune/Loss (Raw)": 0.8818271160125732, "Finetune/Step": 1991, "Finetune/Step Time": 2.829095335677266} +{"Finetune/Learning Rate": 1.3623663967204088e-05, "Finetune/Loss": 0.8044531941413879, "Finetune/Loss (Raw)": 0.7153487205505371, "Finetune/Step": 1992, "Finetune/Step Time": 2.853278897702694} +{"Finetune/Learning Rate": 1.3617594647006146e-05, "Finetune/Loss": 0.8040931820869446, "Finetune/Loss (Raw)": 0.8560616374015808, "Finetune/Step": 1993, "Finetune/Step Time": 2.851950766518712} +{"Finetune/Learning Rate": 1.361152379316266e-05, "Finetune/Loss": 0.8044835329055786, "Finetune/Loss (Raw)": 0.7970743775367737, "Finetune/Step": 1994, "Finetune/Step Time": 2.851376364007592} +{"Finetune/Learning Rate": 1.3605451408247312e-05, "Finetune/Loss": 0.8030427694320679, "Finetune/Loss (Raw)": 0.7883942723274231, "Finetune/Step": 1995, "Finetune/Step Time": 2.849392104893923} +{"Finetune/Learning Rate": 1.3599377494834436e-05, "Finetune/Loss": 0.8035651445388794, "Finetune/Loss (Raw)": 0.9017603397369385, "Finetune/Step": 1996, "Finetune/Step Time": 2.8558958806097507} +{"Finetune/Learning Rate": 1.3593302055499004e-05, "Finetune/Loss": 0.8035392761230469, "Finetune/Loss (Raw)": 0.8499939441680908, "Finetune/Step": 1997, "Finetune/Step Time": 2.852925790473819} +{"Finetune/Learning Rate": 1.358722509281665e-05, "Finetune/Loss": 0.803615927696228, "Finetune/Loss (Raw)": 0.8128198385238647, "Finetune/Step": 1998, "Finetune/Step Time": 2.846982216462493} +{"Finetune/Learning Rate": 1.358114660936364e-05, "Finetune/Loss": 0.8034722805023193, "Finetune/Loss (Raw)": 0.8277091979980469, "Finetune/Step": 1999, "Finetune/Step Time": 2.846588743850589} +{"Finetune/Learning Rate": 1.3575066607716893e-05, "Finetune/Loss": 0.8033682107925415, "Finetune/Loss (Raw)": 0.827580988407135, "Finetune/Step": 2000, "Finetune/Step Time": 2.8403333723545074} +{"Finetune/Learning Rate": 1.3568985090453968e-05, "Finetune/Loss": 0.8032670617103577, "Finetune/Loss (Raw)": 0.8111690878868103, "Finetune/Step": 2001, "Finetune/Step Time": 2.840240841731429} +{"Finetune/Learning Rate": 1.3562902060153065e-05, "Finetune/Loss": 0.8024976253509521, "Finetune/Loss (Raw)": 0.7687345743179321, "Finetune/Step": 2002, "Finetune/Step Time": 2.839326862245798} +{"Finetune/Learning Rate": 1.3556817519393033e-05, "Finetune/Loss": 0.8018862009048462, "Finetune/Loss (Raw)": 0.6910865306854248, "Finetune/Step": 2003, "Finetune/Step Time": 2.8633541520684958} +{"Finetune/Learning Rate": 1.3550731470753355e-05, "Finetune/Loss": 0.801486611366272, "Finetune/Loss (Raw)": 0.902247428894043, "Finetune/Step": 2004, "Finetune/Step Time": 2.8641608245670795} +{"Finetune/Learning Rate": 1.3544643916814152e-05, "Finetune/Loss": 0.799837589263916, "Finetune/Loss (Raw)": 0.6769669055938721, "Finetune/Step": 2005, "Finetune/Step Time": 2.887780385091901} +{"Finetune/Learning Rate": 1.353855486015619e-05, "Finetune/Loss": 0.8005207777023315, "Finetune/Loss (Raw)": 0.9026756286621094, "Finetune/Step": 2006, "Finetune/Step Time": 2.8874506689608097} +{"Finetune/Learning Rate": 1.3532464303360862e-05, "Finetune/Loss": 0.8005893230438232, "Finetune/Loss (Raw)": 0.852722704410553, "Finetune/Step": 2007, "Finetune/Step Time": 2.886059433221817} +{"Finetune/Learning Rate": 1.3526372249010209e-05, "Finetune/Loss": 0.8017472624778748, "Finetune/Loss (Raw)": 0.884697675704956, "Finetune/Step": 2008, "Finetune/Step Time": 2.885010113939643} +{"Finetune/Learning Rate": 1.3520278699686897e-05, "Finetune/Loss": 0.8020710349082947, "Finetune/Loss (Raw)": 0.8028908371925354, "Finetune/Step": 2009, "Finetune/Step Time": 2.8826831933110952} +{"Finetune/Learning Rate": 1.3514183657974232e-05, "Finetune/Loss": 0.8017681837081909, "Finetune/Loss (Raw)": 0.8742511868476868, "Finetune/Step": 2010, "Finetune/Step Time": 2.880582692101598} +{"Finetune/Learning Rate": 1.3508087126456144e-05, "Finetune/Loss": 0.8015191555023193, "Finetune/Loss (Raw)": 0.8735414743423462, "Finetune/Step": 2011, "Finetune/Step Time": 2.8806926365941763} +{"Finetune/Learning Rate": 1.3501989107717209e-05, "Finetune/Loss": 0.8015820384025574, "Finetune/Loss (Raw)": 0.7620205283164978, "Finetune/Step": 2012, "Finetune/Step Time": 2.8811908420175314} +{"Finetune/Learning Rate": 1.349588960434262e-05, "Finetune/Loss": 0.8011205196380615, "Finetune/Loss (Raw)": 0.853870153427124, "Finetune/Step": 2013, "Finetune/Step Time": 2.8807583823800087} +{"Finetune/Learning Rate": 1.3489788618918207e-05, "Finetune/Loss": 0.7986675500869751, "Finetune/Loss (Raw)": 0.5579518675804138, "Finetune/Step": 2014, "Finetune/Step Time": 2.903407573699951} +{"Finetune/Learning Rate": 1.3483686154030423e-05, "Finetune/Loss": 0.7987072467803955, "Finetune/Loss (Raw)": 0.7648332715034485, "Finetune/Step": 2015, "Finetune/Step Time": 2.9065645411610603} +{"Finetune/Learning Rate": 1.3477582212266355e-05, "Finetune/Loss": 0.7994195222854614, "Finetune/Loss (Raw)": 0.8587223887443542, "Finetune/Step": 2016, "Finetune/Step Time": 2.9068840835243464} +{"Finetune/Learning Rate": 1.3471476796213709e-05, "Finetune/Loss": 0.7985938787460327, "Finetune/Loss (Raw)": 0.7379338145256042, "Finetune/Step": 2017, "Finetune/Step Time": 2.9066019374877214} +{"Finetune/Learning Rate": 1.3465369908460824e-05, "Finetune/Loss": 0.7979121804237366, "Finetune/Loss (Raw)": 0.7753276824951172, "Finetune/Step": 2018, "Finetune/Step Time": 2.906638430431485} +{"Finetune/Learning Rate": 1.3459261551596653e-05, "Finetune/Loss": 0.7977422475814819, "Finetune/Loss (Raw)": 0.8492037653923035, "Finetune/Step": 2019, "Finetune/Step Time": 2.9064676482230425} +{"Finetune/Learning Rate": 1.3453151728210779e-05, "Finetune/Loss": 0.7978267669677734, "Finetune/Loss (Raw)": 0.8712020516395569, "Finetune/Step": 2020, "Finetune/Step Time": 2.9070540573447943} +{"Finetune/Learning Rate": 1.34470404408934e-05, "Finetune/Loss": 0.796708881855011, "Finetune/Loss (Raw)": 0.7258660197257996, "Finetune/Step": 2021, "Finetune/Step Time": 2.911238182336092} +{"Finetune/Learning Rate": 1.3440927692235348e-05, "Finetune/Loss": 0.7944549918174744, "Finetune/Loss (Raw)": 0.5681261420249939, "Finetune/Step": 2022, "Finetune/Step Time": 2.9317122232168913} +{"Finetune/Learning Rate": 1.343481348482806e-05, "Finetune/Loss": 0.7937966585159302, "Finetune/Loss (Raw)": 0.8397378921508789, "Finetune/Step": 2023, "Finetune/Step Time": 2.9413090720772743} +{"Finetune/Learning Rate": 1.34286978212636e-05, "Finetune/Loss": 0.7953984141349792, "Finetune/Loss (Raw)": 0.9879417419433594, "Finetune/Step": 2024, "Finetune/Step Time": 2.93539634719491} +{"Finetune/Learning Rate": 1.3422580704134645e-05, "Finetune/Loss": 0.7913036942481995, "Finetune/Loss (Raw)": 0.2770964503288269, "Finetune/Step": 2025, "Finetune/Step Time": 2.9652248080819845} +{"Finetune/Learning Rate": 1.341646213603449e-05, "Finetune/Loss": 0.7916136980056763, "Finetune/Loss (Raw)": 0.854047417640686, "Finetune/Step": 2026, "Finetune/Step Time": 2.9633353371173143} +{"Finetune/Learning Rate": 1.3410342119557046e-05, "Finetune/Loss": 0.7912813425064087, "Finetune/Loss (Raw)": 0.7962522506713867, "Finetune/Step": 2027, "Finetune/Step Time": 2.9623022824525833} +{"Finetune/Learning Rate": 1.3404220657296836e-05, "Finetune/Loss": 0.7921043038368225, "Finetune/Loss (Raw)": 0.8330160975456238, "Finetune/Step": 2028, "Finetune/Step Time": 2.9656729213893414} +{"Finetune/Learning Rate": 1.3398097751848997e-05, "Finetune/Loss": 0.7923729419708252, "Finetune/Loss (Raw)": 0.8120394945144653, "Finetune/Step": 2029, "Finetune/Step Time": 2.9688197560608387} +{"Finetune/Learning Rate": 1.3391973405809275e-05, "Finetune/Loss": 0.7964569330215454, "Finetune/Loss (Raw)": 0.8025581240653992, "Finetune/Step": 2030, "Finetune/Step Time": 2.9422586262226105} +{"Finetune/Learning Rate": 1.3385847621774035e-05, "Finetune/Loss": 0.7963008880615234, "Finetune/Loss (Raw)": 0.8085616827011108, "Finetune/Step": 2031, "Finetune/Step Time": 2.9437590558081865} +{"Finetune/Learning Rate": 1.3379720402340243e-05, "Finetune/Loss": 0.7958380579948425, "Finetune/Loss (Raw)": 0.7926499843597412, "Finetune/Step": 2032, "Finetune/Step Time": 2.9438593946397305} +{"Finetune/Learning Rate": 1.3373591750105479e-05, "Finetune/Loss": 0.7961361408233643, "Finetune/Loss (Raw)": 0.8402467370033264, "Finetune/Step": 2033, "Finetune/Step Time": 2.9422334786504507} +{"Finetune/Learning Rate": 1.3367461667667922e-05, "Finetune/Loss": 0.7957196235656738, "Finetune/Loss (Raw)": 0.8299477696418762, "Finetune/Step": 2034, "Finetune/Step Time": 2.9449410438537598} +{"Finetune/Learning Rate": 1.336133015762637e-05, "Finetune/Loss": 0.7952141761779785, "Finetune/Loss (Raw)": 0.8103954792022705, "Finetune/Step": 2035, "Finetune/Step Time": 2.9468309190124273} +{"Finetune/Learning Rate": 1.3355197222580213e-05, "Finetune/Loss": 0.7964246273040771, "Finetune/Loss (Raw)": 0.9748932719230652, "Finetune/Step": 2036, "Finetune/Step Time": 2.947965767234564} +{"Finetune/Learning Rate": 1.334906286512946e-05, "Finetune/Loss": 0.7966562509536743, "Finetune/Loss (Raw)": 0.8069992065429688, "Finetune/Step": 2037, "Finetune/Step Time": 2.943320531398058} +{"Finetune/Learning Rate": 1.334292708787471e-05, "Finetune/Loss": 0.7949660420417786, "Finetune/Loss (Raw)": 0.6483936905860901, "Finetune/Step": 2038, "Finetune/Step Time": 2.9671442098915577} +{"Finetune/Learning Rate": 1.3336789893417163e-05, "Finetune/Loss": 0.7963759899139404, "Finetune/Loss (Raw)": 0.8188386559486389, "Finetune/Step": 2039, "Finetune/Step Time": 2.9438079614192247} +{"Finetune/Learning Rate": 1.3330651284358635e-05, "Finetune/Loss": 0.794495701789856, "Finetune/Loss (Raw)": 0.591667890548706, "Finetune/Step": 2040, "Finetune/Step Time": 2.975827319547534} +{"Finetune/Learning Rate": 1.332451126330153e-05, "Finetune/Loss": 0.7944331169128418, "Finetune/Loss (Raw)": 0.7850221991539001, "Finetune/Step": 2041, "Finetune/Step Time": 2.9791086185723543} +{"Finetune/Learning Rate": 1.3318369832848848e-05, "Finetune/Loss": 0.7946204543113708, "Finetune/Loss (Raw)": 0.904704213142395, "Finetune/Step": 2042, "Finetune/Step Time": 2.9784170668572187} +{"Finetune/Learning Rate": 1.3312226995604195e-05, "Finetune/Loss": 0.793975830078125, "Finetune/Loss (Raw)": 0.81744784116745, "Finetune/Step": 2043, "Finetune/Step Time": 2.9836772177368402} +{"Finetune/Learning Rate": 1.3306082754171767e-05, "Finetune/Loss": 0.7934552431106567, "Finetune/Loss (Raw)": 0.7720279097557068, "Finetune/Step": 2044, "Finetune/Step Time": 2.9812660962343216} +{"Finetune/Learning Rate": 1.3299937111156363e-05, "Finetune/Loss": 0.793937087059021, "Finetune/Loss (Raw)": 0.8859262466430664, "Finetune/Step": 2045, "Finetune/Step Time": 2.9852891862392426} +{"Finetune/Learning Rate": 1.3293790069163366e-05, "Finetune/Loss": 0.7942999601364136, "Finetune/Loss (Raw)": 0.8435785174369812, "Finetune/Step": 2046, "Finetune/Step Time": 2.9895444568246603} +{"Finetune/Learning Rate": 1.328764163079876e-05, "Finetune/Loss": 0.7945507764816284, "Finetune/Loss (Raw)": 0.8348372578620911, "Finetune/Step": 2047, "Finetune/Step Time": 2.98485186137259} +{"Finetune/Learning Rate": 1.3281491798669118e-05, "Finetune/Loss": 0.794281005859375, "Finetune/Loss (Raw)": 0.883184015750885, "Finetune/Step": 2048, "Finetune/Step Time": 2.984154125675559} +{"Finetune/Learning Rate": 1.32753405753816e-05, "Finetune/Loss": 0.7938578128814697, "Finetune/Loss (Raw)": 0.7835858464241028, "Finetune/Step": 2049, "Finetune/Step Time": 2.985723378136754} +{"Finetune/Learning Rate": 1.3269187963543963e-05, "Finetune/Loss": 0.792499840259552, "Finetune/Loss (Raw)": 0.5965257883071899, "Finetune/Step": 2050, "Finetune/Step Time": 3.011838909238577} +{"Finetune/Learning Rate": 1.326303396576455e-05, "Finetune/Loss": 0.7928619384765625, "Finetune/Loss (Raw)": 0.8377536535263062, "Finetune/Step": 2051, "Finetune/Step Time": 3.009605599567294} +{"Finetune/Learning Rate": 1.3256878584652293e-05, "Finetune/Loss": 0.7936742901802063, "Finetune/Loss (Raw)": 0.8914663195610046, "Finetune/Step": 2052, "Finetune/Step Time": 3.0073985811322927} +{"Finetune/Learning Rate": 1.3250721822816703e-05, "Finetune/Loss": 0.7932747602462769, "Finetune/Loss (Raw)": 0.7721508741378784, "Finetune/Step": 2053, "Finetune/Step Time": 3.0111281871795654} +{"Finetune/Learning Rate": 1.3244563682867886e-05, "Finetune/Loss": 0.7947884798049927, "Finetune/Loss (Raw)": 0.8561988472938538, "Finetune/Step": 2054, "Finetune/Step Time": 2.9862339347600937} +{"Finetune/Learning Rate": 1.3238404167416527e-05, "Finetune/Loss": 0.7960037589073181, "Finetune/Loss (Raw)": 0.8827544450759888, "Finetune/Step": 2055, "Finetune/Step Time": 2.979597557336092} +{"Finetune/Learning Rate": 1.3232243279073896e-05, "Finetune/Loss": 0.7945594191551208, "Finetune/Loss (Raw)": 0.6850232481956482, "Finetune/Step": 2056, "Finetune/Step Time": 2.9708880465477705} +{"Finetune/Learning Rate": 1.3226081020451843e-05, "Finetune/Loss": 0.794385552406311, "Finetune/Loss (Raw)": 0.8082036375999451, "Finetune/Step": 2057, "Finetune/Step Time": 2.97499905154109} +{"Finetune/Learning Rate": 1.3219917394162796e-05, "Finetune/Loss": 0.7951548099517822, "Finetune/Loss (Raw)": 0.9032472968101501, "Finetune/Step": 2058, "Finetune/Step Time": 2.9697773344814777} +{"Finetune/Learning Rate": 1.3213752402819773e-05, "Finetune/Loss": 0.7946490049362183, "Finetune/Loss (Raw)": 0.7500720024108887, "Finetune/Step": 2059, "Finetune/Step Time": 2.9652197640389204} +{"Finetune/Learning Rate": 1.3207586049036366e-05, "Finetune/Loss": 0.7939221858978271, "Finetune/Loss (Raw)": 0.8539363741874695, "Finetune/Step": 2060, "Finetune/Step Time": 2.9648517314344645} +{"Finetune/Learning Rate": 1.3201418335426737e-05, "Finetune/Loss": 0.7934225797653198, "Finetune/Loss (Raw)": 0.7770588397979736, "Finetune/Step": 2061, "Finetune/Step Time": 2.966604843735695} +{"Finetune/Learning Rate": 1.3195249264605635e-05, "Finetune/Loss": 0.7926063537597656, "Finetune/Loss (Raw)": 0.856250524520874, "Finetune/Step": 2062, "Finetune/Step Time": 2.9627085216343403} +{"Finetune/Learning Rate": 1.3189078839188376e-05, "Finetune/Loss": 0.7937612533569336, "Finetune/Loss (Raw)": 0.9033555388450623, "Finetune/Step": 2063, "Finetune/Step Time": 2.9649646636098623} +{"Finetune/Learning Rate": 1.3182907061790862e-05, "Finetune/Loss": 0.7931501269340515, "Finetune/Loss (Raw)": 0.7907659411430359, "Finetune/Step": 2064, "Finetune/Step Time": 2.966403007507324} +{"Finetune/Learning Rate": 1.3176733935029552e-05, "Finetune/Loss": 0.7961611747741699, "Finetune/Loss (Raw)": 0.8038164377212524, "Finetune/Step": 2065, "Finetune/Step Time": 2.930623061954975} +{"Finetune/Learning Rate": 1.3170559461521492e-05, "Finetune/Loss": 0.7960795164108276, "Finetune/Loss (Raw)": 0.9025609493255615, "Finetune/Step": 2066, "Finetune/Step Time": 2.9327681362628937} +{"Finetune/Learning Rate": 1.3164383643884291e-05, "Finetune/Loss": 0.7953732013702393, "Finetune/Loss (Raw)": 0.7878459095954895, "Finetune/Step": 2067, "Finetune/Step Time": 2.9335682597011328} +{"Finetune/Learning Rate": 1.3158206484736122e-05, "Finetune/Loss": 0.7953879833221436, "Finetune/Loss (Raw)": 0.8646278977394104, "Finetune/Step": 2068, "Finetune/Step Time": 2.9344428535550833} +{"Finetune/Learning Rate": 1.3152027986695745e-05, "Finetune/Loss": 0.7955193519592285, "Finetune/Loss (Raw)": 0.8201547861099243, "Finetune/Step": 2069, "Finetune/Step Time": 2.932164369150996} +{"Finetune/Learning Rate": 1.3145848152382472e-05, "Finetune/Loss": 0.7956272959709167, "Finetune/Loss (Raw)": 0.8002440929412842, "Finetune/Step": 2070, "Finetune/Step Time": 2.9335620384663343} +{"Finetune/Learning Rate": 1.3139666984416187e-05, "Finetune/Loss": 0.795069694519043, "Finetune/Loss (Raw)": 0.7339130640029907, "Finetune/Step": 2071, "Finetune/Step Time": 2.933463878929615} +{"Finetune/Learning Rate": 1.3133484485417333e-05, "Finetune/Loss": 0.7962257862091064, "Finetune/Loss (Raw)": 0.8999283313751221, "Finetune/Step": 2072, "Finetune/Step Time": 2.934624830260873} +{"Finetune/Learning Rate": 1.3127300658006932e-05, "Finetune/Loss": 0.8011397123336792, "Finetune/Loss (Raw)": 0.833285927772522, "Finetune/Step": 2073, "Finetune/Step Time": 2.9008747413754463} +{"Finetune/Learning Rate": 1.3121115504806554e-05, "Finetune/Loss": 0.8004930019378662, "Finetune/Loss (Raw)": 0.7617870569229126, "Finetune/Step": 2074, "Finetune/Step Time": 2.89912973344326} +{"Finetune/Learning Rate": 1.311492902843834e-05, "Finetune/Loss": 0.8001051545143127, "Finetune/Loss (Raw)": 0.7419768571853638, "Finetune/Step": 2075, "Finetune/Step Time": 2.8945069797337055} +{"Finetune/Learning Rate": 1.3108741231524986e-05, "Finetune/Loss": 0.8009201884269714, "Finetune/Loss (Raw)": 0.8427141904830933, "Finetune/Step": 2076, "Finetune/Step Time": 2.8955971375107765} +{"Finetune/Learning Rate": 1.310255211668975e-05, "Finetune/Loss": 0.8007181882858276, "Finetune/Loss (Raw)": 0.8441309928894043, "Finetune/Step": 2077, "Finetune/Step Time": 2.8962913677096367} +{"Finetune/Learning Rate": 1.3096361686556457e-05, "Finetune/Loss": 0.7996764779090881, "Finetune/Loss (Raw)": 0.8607357144355774, "Finetune/Step": 2078, "Finetune/Step Time": 2.897369908168912} +{"Finetune/Learning Rate": 1.3090169943749475e-05, "Finetune/Loss": 0.7981433868408203, "Finetune/Loss (Raw)": 0.6195641160011292, "Finetune/Step": 2079, "Finetune/Step Time": 2.920021539554} +{"Finetune/Learning Rate": 1.308397689089374e-05, "Finetune/Loss": 0.7967606782913208, "Finetune/Loss (Raw)": 0.8136845231056213, "Finetune/Step": 2080, "Finetune/Step Time": 2.9205181039869785} +{"Finetune/Learning Rate": 1.3077782530614736e-05, "Finetune/Loss": 0.7964717149734497, "Finetune/Loss (Raw)": 0.8261333703994751, "Finetune/Step": 2081, "Finetune/Step Time": 2.920632019639015} +{"Finetune/Learning Rate": 1.3071586865538502e-05, "Finetune/Loss": 0.796249508857727, "Finetune/Loss (Raw)": 0.7614095211029053, "Finetune/Step": 2082, "Finetune/Step Time": 2.9217383451759815} +{"Finetune/Learning Rate": 1.3065389898291638e-05, "Finetune/Loss": 0.7968871593475342, "Finetune/Loss (Raw)": 0.9464503526687622, "Finetune/Step": 2083, "Finetune/Step Time": 2.922554025426507} +{"Finetune/Learning Rate": 1.305919163150129e-05, "Finetune/Loss": 0.8013910055160522, "Finetune/Loss (Raw)": 0.7820799946784973, "Finetune/Step": 2084, "Finetune/Step Time": 2.8897459506988525} +{"Finetune/Learning Rate": 1.3052992067795152e-05, "Finetune/Loss": 0.8014062643051147, "Finetune/Loss (Raw)": 0.82492595911026, "Finetune/Step": 2085, "Finetune/Step Time": 2.8888110257685184} +{"Finetune/Learning Rate": 1.3046791209801471e-05, "Finetune/Loss": 0.8010238409042358, "Finetune/Loss (Raw)": 0.7963886260986328, "Finetune/Step": 2086, "Finetune/Step Time": 2.8910971581935883} +{"Finetune/Learning Rate": 1.3040589060149045e-05, "Finetune/Loss": 0.8024489879608154, "Finetune/Loss (Raw)": 0.9477980732917786, "Finetune/Step": 2087, "Finetune/Step Time": 2.893422670662403} +{"Finetune/Learning Rate": 1.303438562146722e-05, "Finetune/Loss": 0.8013783097267151, "Finetune/Loss (Raw)": 0.7074550986289978, "Finetune/Step": 2088, "Finetune/Step Time": 2.919549286365509} +{"Finetune/Learning Rate": 1.3028180896385885e-05, "Finetune/Loss": 0.801673173904419, "Finetune/Loss (Raw)": 0.8765754699707031, "Finetune/Step": 2089, "Finetune/Step Time": 2.9220611937344074} +{"Finetune/Learning Rate": 1.3021974887535471e-05, "Finetune/Loss": 0.8004026412963867, "Finetune/Loss (Raw)": 0.6512885093688965, "Finetune/Step": 2090, "Finetune/Step Time": 2.942221838980913} +{"Finetune/Learning Rate": 1.301576759754696e-05, "Finetune/Loss": 0.8006453514099121, "Finetune/Loss (Raw)": 0.8938986659049988, "Finetune/Step": 2091, "Finetune/Step Time": 2.943787781521678} +{"Finetune/Learning Rate": 1.3009559029051878e-05, "Finetune/Loss": 0.8001701831817627, "Finetune/Loss (Raw)": 0.8259948492050171, "Finetune/Step": 2092, "Finetune/Step Time": 2.943794371560216} +{"Finetune/Learning Rate": 1.3003349184682285e-05, "Finetune/Loss": 0.8005748391151428, "Finetune/Loss (Raw)": 0.8365102410316467, "Finetune/Step": 2093, "Finetune/Step Time": 2.9426421876996756} +{"Finetune/Learning Rate": 1.2997138067070791e-05, "Finetune/Loss": 0.8003635406494141, "Finetune/Loss (Raw)": 0.8548619151115417, "Finetune/Step": 2094, "Finetune/Step Time": 2.942090367898345} +{"Finetune/Learning Rate": 1.2990925678850539e-05, "Finetune/Loss": 0.802150547504425, "Finetune/Loss (Raw)": 0.9493258595466614, "Finetune/Step": 2095, "Finetune/Step Time": 2.9445409905165434} +{"Finetune/Learning Rate": 1.298471202265521e-05, "Finetune/Loss": 0.8020737767219543, "Finetune/Loss (Raw)": 0.7891017198562622, "Finetune/Step": 2096, "Finetune/Step Time": 2.952205128967762} +{"Finetune/Learning Rate": 1.2978497101119032e-05, "Finetune/Loss": 0.8021593689918518, "Finetune/Loss (Raw)": 0.7883892059326172, "Finetune/Step": 2097, "Finetune/Step Time": 2.9494134075939655} +{"Finetune/Learning Rate": 1.2972280916876758e-05, "Finetune/Loss": 0.8039352893829346, "Finetune/Loss (Raw)": 0.8921046257019043, "Finetune/Step": 2098, "Finetune/Step Time": 2.925574269145727} +{"Finetune/Learning Rate": 1.2966063472563686e-05, "Finetune/Loss": 0.8041993379592896, "Finetune/Loss (Raw)": 0.835227370262146, "Finetune/Step": 2099, "Finetune/Step Time": 2.930500527843833} +{"Finetune/Learning Rate": 1.2959844770815636e-05, "Finetune/Loss": 0.8052854537963867, "Finetune/Loss (Raw)": 0.9166294932365417, "Finetune/Step": 2100, "Finetune/Step Time": 2.93171601369977} +{"Finetune/Learning Rate": 1.2953624814268979e-05, "Finetune/Loss": 0.8077993392944336, "Finetune/Loss (Raw)": 0.9211081266403198, "Finetune/Step": 2101, "Finetune/Step Time": 2.9044210352003574} +{"Finetune/Learning Rate": 1.29474036055606e-05, "Finetune/Loss": 0.8078904747962952, "Finetune/Loss (Raw)": 0.830693781375885, "Finetune/Step": 2102, "Finetune/Step Time": 2.9028517305850983} +{"Finetune/Learning Rate": 1.2941181147327926e-05, "Finetune/Loss": 0.8081612586975098, "Finetune/Loss (Raw)": 0.8099719285964966, "Finetune/Step": 2103, "Finetune/Step Time": 2.908432772383094} +{"Finetune/Learning Rate": 1.2934957442208908e-05, "Finetune/Loss": 0.8081613183021545, "Finetune/Loss (Raw)": 0.8481360077857971, "Finetune/Step": 2104, "Finetune/Step Time": 2.9038548804819584} +{"Finetune/Learning Rate": 1.2928732492842029e-05, "Finetune/Loss": 0.8088005781173706, "Finetune/Loss (Raw)": 0.7854505777359009, "Finetune/Step": 2105, "Finetune/Step Time": 2.9012400340288877} +{"Finetune/Learning Rate": 1.2922506301866298e-05, "Finetune/Loss": 0.8079181909561157, "Finetune/Loss (Raw)": 0.7680379748344421, "Finetune/Step": 2106, "Finetune/Step Time": 2.900590181350708} +{"Finetune/Learning Rate": 1.291627887192125e-05, "Finetune/Loss": 0.8084462881088257, "Finetune/Loss (Raw)": 0.8931717276573181, "Finetune/Step": 2107, "Finetune/Step Time": 2.899821622297168} +{"Finetune/Learning Rate": 1.2910050205646947e-05, "Finetune/Loss": 0.8094007968902588, "Finetune/Loss (Raw)": 0.8675896525382996, "Finetune/Step": 2108, "Finetune/Step Time": 2.8783676382154226} +{"Finetune/Learning Rate": 1.2903820305683973e-05, "Finetune/Loss": 0.8099367618560791, "Finetune/Loss (Raw)": 0.8628685474395752, "Finetune/Step": 2109, "Finetune/Step Time": 2.8793254923075438} +{"Finetune/Learning Rate": 1.2897589174673437e-05, "Finetune/Loss": 0.8100919723510742, "Finetune/Loss (Raw)": 0.8625053763389587, "Finetune/Step": 2110, "Finetune/Step Time": 2.8782647121697664} +{"Finetune/Learning Rate": 1.2891356815256968e-05, "Finetune/Loss": 0.8112406134605408, "Finetune/Loss (Raw)": 0.855189323425293, "Finetune/Step": 2111, "Finetune/Step Time": 2.8765597715973854} +{"Finetune/Learning Rate": 1.288512323007672e-05, "Finetune/Loss": 0.8129787445068359, "Finetune/Loss (Raw)": 0.8184877634048462, "Finetune/Step": 2112, "Finetune/Step Time": 2.846087047830224} +{"Finetune/Learning Rate": 1.287888842177536e-05, "Finetune/Loss": 0.8121484518051147, "Finetune/Loss (Raw)": 0.7520421147346497, "Finetune/Step": 2113, "Finetune/Step Time": 2.844230268150568} +{"Finetune/Learning Rate": 1.2872652392996074e-05, "Finetune/Loss": 0.8133830428123474, "Finetune/Loss (Raw)": 0.9514566659927368, "Finetune/Step": 2114, "Finetune/Step Time": 2.8430322036147118} +{"Finetune/Learning Rate": 1.2866415146382574e-05, "Finetune/Loss": 0.8131340742111206, "Finetune/Loss (Raw)": 0.805061936378479, "Finetune/Step": 2115, "Finetune/Step Time": 2.844895616173744} +{"Finetune/Learning Rate": 1.286017668457908e-05, "Finetune/Loss": 0.8098486065864563, "Finetune/Loss (Raw)": 0.3069899082183838, "Finetune/Step": 2116, "Finetune/Step Time": 2.8723197747021914} +{"Finetune/Learning Rate": 1.2853937010230334e-05, "Finetune/Loss": 0.8104953765869141, "Finetune/Loss (Raw)": 0.9023659825325012, "Finetune/Step": 2117, "Finetune/Step Time": 2.8703872710466385} +{"Finetune/Learning Rate": 1.284769612598158e-05, "Finetune/Loss": 0.8102835416793823, "Finetune/Loss (Raw)": 0.816677987575531, "Finetune/Step": 2118, "Finetune/Step Time": 2.875341797247529} +{"Finetune/Learning Rate": 1.2841454034478584e-05, "Finetune/Loss": 0.8099718689918518, "Finetune/Loss (Raw)": 0.8419291973114014, "Finetune/Step": 2119, "Finetune/Step Time": 2.8766608368605375} +{"Finetune/Learning Rate": 1.283521073836763e-05, "Finetune/Loss": 0.8107092380523682, "Finetune/Loss (Raw)": 0.8097285032272339, "Finetune/Step": 2120, "Finetune/Step Time": 2.851908566430211} +{"Finetune/Learning Rate": 1.2828966240295499e-05, "Finetune/Loss": 0.8103770017623901, "Finetune/Loss (Raw)": 0.8135414719581604, "Finetune/Step": 2121, "Finetune/Step Time": 2.8536941185593605} +{"Finetune/Learning Rate": 1.2822720542909491e-05, "Finetune/Loss": 0.8101162910461426, "Finetune/Loss (Raw)": 0.7636956572532654, "Finetune/Step": 2122, "Finetune/Step Time": 2.8549633622169495} +{"Finetune/Learning Rate": 1.2816473648857408e-05, "Finetune/Loss": 0.8103890419006348, "Finetune/Loss (Raw)": 0.8233146071434021, "Finetune/Step": 2123, "Finetune/Step Time": 2.855945101007819} +{"Finetune/Learning Rate": 1.2810225560787561e-05, "Finetune/Loss": 0.8092566132545471, "Finetune/Loss (Raw)": 0.7568073272705078, "Finetune/Step": 2124, "Finetune/Step Time": 2.8486658111214638} +{"Finetune/Learning Rate": 1.2803976281348774e-05, "Finetune/Loss": 0.8088862299919128, "Finetune/Loss (Raw)": 0.8025785088539124, "Finetune/Step": 2125, "Finetune/Step Time": 2.8538948353379965} +{"Finetune/Learning Rate": 1.2797725813190369e-05, "Finetune/Loss": 0.8091219663619995, "Finetune/Loss (Raw)": 0.8429991602897644, "Finetune/Step": 2126, "Finetune/Step Time": 2.855249771848321} +{"Finetune/Learning Rate": 1.2791474158962173e-05, "Finetune/Loss": 0.8090418577194214, "Finetune/Loss (Raw)": 0.8174530267715454, "Finetune/Step": 2127, "Finetune/Step Time": 2.8540485482662916} +{"Finetune/Learning Rate": 1.2785221321314517e-05, "Finetune/Loss": 0.8093781471252441, "Finetune/Loss (Raw)": 0.8706309199333191, "Finetune/Step": 2128, "Finetune/Step Time": 2.853078765794635} +{"Finetune/Learning Rate": 1.277896730289823e-05, "Finetune/Loss": 0.8088387846946716, "Finetune/Loss (Raw)": 0.742124617099762, "Finetune/Step": 2129, "Finetune/Step Time": 2.8769491966813803} +{"Finetune/Learning Rate": 1.2772712106364653e-05, "Finetune/Loss": 0.8072024583816528, "Finetune/Loss (Raw)": 0.5592821836471558, "Finetune/Step": 2130, "Finetune/Step Time": 2.9004673790186644} +{"Finetune/Learning Rate": 1.2766455734365611e-05, "Finetune/Loss": 0.8042094111442566, "Finetune/Loss (Raw)": 0.30797988176345825, "Finetune/Step": 2131, "Finetune/Step Time": 2.909613437950611} +{"Finetune/Learning Rate": 1.2760198189553437e-05, "Finetune/Loss": 0.8034125566482544, "Finetune/Loss (Raw)": 0.8002520799636841, "Finetune/Step": 2132, "Finetune/Step Time": 2.906769698485732} +{"Finetune/Learning Rate": 1.2753939474580956e-05, "Finetune/Loss": 0.8045508861541748, "Finetune/Loss (Raw)": 0.8226707577705383, "Finetune/Step": 2133, "Finetune/Step Time": 2.882692452520132} +{"Finetune/Learning Rate": 1.2747679592101498e-05, "Finetune/Loss": 0.8042141199111938, "Finetune/Loss (Raw)": 0.8595747351646423, "Finetune/Step": 2134, "Finetune/Step Time": 2.882996339350939} +{"Finetune/Learning Rate": 1.2741418544768878e-05, "Finetune/Loss": 0.804003119468689, "Finetune/Loss (Raw)": 0.8257116079330444, "Finetune/Step": 2135, "Finetune/Step Time": 2.881313495337963} +{"Finetune/Learning Rate": 1.2735156335237407e-05, "Finetune/Loss": 0.8038654327392578, "Finetune/Loss (Raw)": 0.8670724034309387, "Finetune/Step": 2136, "Finetune/Step Time": 2.883497778326273} +{"Finetune/Learning Rate": 1.2728892966161893e-05, "Finetune/Loss": 0.8048186302185059, "Finetune/Loss (Raw)": 0.924899697303772, "Finetune/Step": 2137, "Finetune/Step Time": 2.8814873956143856} +{"Finetune/Learning Rate": 1.2722628440197631e-05, "Finetune/Loss": 0.804004967212677, "Finetune/Loss (Raw)": 0.7701027989387512, "Finetune/Step": 2138, "Finetune/Step Time": 2.880681600421667} +{"Finetune/Learning Rate": 1.2716362760000412e-05, "Finetune/Loss": 0.8037577867507935, "Finetune/Loss (Raw)": 0.8419072031974792, "Finetune/Step": 2139, "Finetune/Step Time": 2.8800314888358116} +{"Finetune/Learning Rate": 1.2710095928226509e-05, "Finetune/Loss": 0.8036669492721558, "Finetune/Loss (Raw)": 0.7503842711448669, "Finetune/Step": 2140, "Finetune/Step Time": 2.8967111017555} +{"Finetune/Learning Rate": 1.2703827947532692e-05, "Finetune/Loss": 0.8031540513038635, "Finetune/Loss (Raw)": 0.7882214784622192, "Finetune/Step": 2141, "Finetune/Step Time": 2.8992175925523043} +{"Finetune/Learning Rate": 1.2697558820576205e-05, "Finetune/Loss": 0.8058586120605469, "Finetune/Loss (Raw)": 0.9041446447372437, "Finetune/Step": 2142, "Finetune/Step Time": 2.874392669647932} +{"Finetune/Learning Rate": 1.2691288550014794e-05, "Finetune/Loss": 0.804797887802124, "Finetune/Loss (Raw)": 0.6290533542633057, "Finetune/Step": 2143, "Finetune/Step Time": 2.896033465862274} +{"Finetune/Learning Rate": 1.2685017138506675e-05, "Finetune/Loss": 0.804088294506073, "Finetune/Loss (Raw)": 0.7678961157798767, "Finetune/Step": 2144, "Finetune/Step Time": 2.8971058651804924} +{"Finetune/Learning Rate": 1.2678744588710558e-05, "Finetune/Loss": 0.8047276735305786, "Finetune/Loss (Raw)": 0.8197725415229797, "Finetune/Step": 2145, "Finetune/Step Time": 2.897051475942135} +{"Finetune/Learning Rate": 1.2672470903285634e-05, "Finetune/Loss": 0.801817774772644, "Finetune/Loss (Raw)": 0.4028666317462921, "Finetune/Step": 2146, "Finetune/Step Time": 2.928426394239068} +{"Finetune/Learning Rate": 1.266619608489157e-05, "Finetune/Loss": 0.8001194596290588, "Finetune/Loss (Raw)": 0.6318085789680481, "Finetune/Step": 2147, "Finetune/Step Time": 2.951778117567301} +{"Finetune/Learning Rate": 1.2659920136188517e-05, "Finetune/Loss": 0.7998010516166687, "Finetune/Loss (Raw)": 0.8304502367973328, "Finetune/Step": 2148, "Finetune/Step Time": 2.9511050302535295} +{"Finetune/Learning Rate": 1.2653643059837109e-05, "Finetune/Loss": 0.8004173636436462, "Finetune/Loss (Raw)": 0.8047520518302917, "Finetune/Step": 2149, "Finetune/Step Time": 2.9493888821452856} +{"Finetune/Learning Rate": 1.2647364858498448e-05, "Finetune/Loss": 0.8030767440795898, "Finetune/Loss (Raw)": 0.9085320830345154, "Finetune/Step": 2150, "Finetune/Step Time": 2.9284581523388624} +{"Finetune/Learning Rate": 1.2641085534834124e-05, "Finetune/Loss": 0.8036354184150696, "Finetune/Loss (Raw)": 0.9112415313720703, "Finetune/Step": 2151, "Finetune/Step Time": 2.9207694102078676} +{"Finetune/Learning Rate": 1.2634805091506192e-05, "Finetune/Loss": 0.8029438257217407, "Finetune/Loss (Raw)": 0.8994249701499939, "Finetune/Step": 2152, "Finetune/Step Time": 2.9295001067221165} +{"Finetune/Learning Rate": 1.2628523531177194e-05, "Finetune/Loss": 0.8070699572563171, "Finetune/Loss (Raw)": 0.8052369952201843, "Finetune/Step": 2153, "Finetune/Step Time": 2.903739219531417} +{"Finetune/Learning Rate": 1.2622240856510137e-05, "Finetune/Loss": 0.8071504831314087, "Finetune/Loss (Raw)": 0.8643596172332764, "Finetune/Step": 2154, "Finetune/Step Time": 2.9008166436105967} +{"Finetune/Learning Rate": 1.26159570701685e-05, "Finetune/Loss": 0.8072940707206726, "Finetune/Loss (Raw)": 0.8146262764930725, "Finetune/Step": 2155, "Finetune/Step Time": 2.9000330567359924} +{"Finetune/Learning Rate": 1.2609672174816239e-05, "Finetune/Loss": 0.8073749542236328, "Finetune/Loss (Raw)": 0.8433685302734375, "Finetune/Step": 2156, "Finetune/Step Time": 2.8989589028060436} +{"Finetune/Learning Rate": 1.2603386173117771e-05, "Finetune/Loss": 0.8060212135314941, "Finetune/Loss (Raw)": 0.6387612223625183, "Finetune/Step": 2157, "Finetune/Step Time": 2.9209322202950716} +{"Finetune/Learning Rate": 1.2597099067737995e-05, "Finetune/Loss": 0.8064931035041809, "Finetune/Loss (Raw)": 0.862964391708374, "Finetune/Step": 2158, "Finetune/Step Time": 2.9169730376452208} +{"Finetune/Learning Rate": 1.2590810861342267e-05, "Finetune/Loss": 0.8069019317626953, "Finetune/Loss (Raw)": 0.8608847260475159, "Finetune/Step": 2159, "Finetune/Step Time": 2.9148078206926584} +{"Finetune/Learning Rate": 1.2584521556596414e-05, "Finetune/Loss": 0.8069007992744446, "Finetune/Loss (Raw)": 0.7925092577934265, "Finetune/Step": 2160, "Finetune/Step Time": 2.9194827266037464} +{"Finetune/Learning Rate": 1.257823115616673e-05, "Finetune/Loss": 0.806445837020874, "Finetune/Loss (Raw)": 0.782008171081543, "Finetune/Step": 2161, "Finetune/Step Time": 2.91755199059844} +{"Finetune/Learning Rate": 1.2571939662719968e-05, "Finetune/Loss": 0.8060268759727478, "Finetune/Loss (Raw)": 0.7763301730155945, "Finetune/Step": 2162, "Finetune/Step Time": 2.913127204403281} +{"Finetune/Learning Rate": 1.2565647078923351e-05, "Finetune/Loss": 0.8062434196472168, "Finetune/Loss (Raw)": 0.8381052017211914, "Finetune/Step": 2163, "Finetune/Step Time": 2.909328855574131} +{"Finetune/Learning Rate": 1.2559353407444559e-05, "Finetune/Loss": 0.805335283279419, "Finetune/Loss (Raw)": 0.8586453795433044, "Finetune/Step": 2164, "Finetune/Step Time": 2.9112629778683186} +{"Finetune/Learning Rate": 1.2553058650951737e-05, "Finetune/Loss": 0.8050235509872437, "Finetune/Loss (Raw)": 0.7671042084693909, "Finetune/Step": 2165, "Finetune/Step Time": 2.91032119654119} +{"Finetune/Learning Rate": 1.2546762812113486e-05, "Finetune/Loss": 0.8060718774795532, "Finetune/Loss (Raw)": 0.782579779624939, "Finetune/Step": 2166, "Finetune/Step Time": 2.8874998819082975} +{"Finetune/Learning Rate": 1.2540465893598874e-05, "Finetune/Loss": 0.8037830591201782, "Finetune/Loss (Raw)": 0.5258662700653076, "Finetune/Step": 2167, "Finetune/Step Time": 2.9130032416433096} +{"Finetune/Learning Rate": 1.2534167898077413e-05, "Finetune/Loss": 0.8057488203048706, "Finetune/Loss (Raw)": 0.8432945013046265, "Finetune/Step": 2168, "Finetune/Step Time": 2.8801621180027723} +{"Finetune/Learning Rate": 1.2527868828219087e-05, "Finetune/Loss": 0.8058229684829712, "Finetune/Loss (Raw)": 0.79450523853302, "Finetune/Step": 2169, "Finetune/Step Time": 2.8765495996922255} +{"Finetune/Learning Rate": 1.2521568686694325e-05, "Finetune/Loss": 0.8063993453979492, "Finetune/Loss (Raw)": 0.978481113910675, "Finetune/Step": 2170, "Finetune/Step Time": 2.875475697219372} +{"Finetune/Learning Rate": 1.2515267476174012e-05, "Finetune/Loss": 0.8057413101196289, "Finetune/Loss (Raw)": 0.7332184314727783, "Finetune/Step": 2171, "Finetune/Step Time": 2.8744837380945683} +{"Finetune/Learning Rate": 1.2508965199329486e-05, "Finetune/Loss": 0.8059012293815613, "Finetune/Loss (Raw)": 0.7924978137016296, "Finetune/Step": 2172, "Finetune/Step Time": 2.871399700641632} +{"Finetune/Learning Rate": 1.2502661858832543e-05, "Finetune/Loss": 0.8058019876480103, "Finetune/Loss (Raw)": 0.8732225298881531, "Finetune/Step": 2173, "Finetune/Step Time": 2.8698245119303465} +{"Finetune/Learning Rate": 1.2496357457355423e-05, "Finetune/Loss": 0.8055010437965393, "Finetune/Loss (Raw)": 0.8050649166107178, "Finetune/Step": 2174, "Finetune/Step Time": 2.8659568708389997} +{"Finetune/Learning Rate": 1.2490051997570818e-05, "Finetune/Loss": 0.8055634498596191, "Finetune/Loss (Raw)": 0.8428188562393188, "Finetune/Step": 2175, "Finetune/Step Time": 2.8667602632194757} +{"Finetune/Learning Rate": 1.248374548215187e-05, "Finetune/Loss": 0.8047105669975281, "Finetune/Loss (Raw)": 0.7740198373794556, "Finetune/Step": 2176, "Finetune/Step Time": 2.867810193449259} +{"Finetune/Learning Rate": 1.2477437913772169e-05, "Finetune/Loss": 0.8028624653816223, "Finetune/Loss (Raw)": 0.5470283031463623, "Finetune/Step": 2177, "Finetune/Step Time": 2.8892084173858166} +{"Finetune/Learning Rate": 1.2471129295105746e-05, "Finetune/Loss": 0.8050099611282349, "Finetune/Loss (Raw)": 0.8714115023612976, "Finetune/Step": 2178, "Finetune/Step Time": 2.8674556519836187} +{"Finetune/Learning Rate": 1.2464819628827085e-05, "Finetune/Loss": 0.8046479821205139, "Finetune/Loss (Raw)": 0.7914105653762817, "Finetune/Step": 2179, "Finetune/Step Time": 2.8695913776755333} +{"Finetune/Learning Rate": 1.2458508917611105e-05, "Finetune/Loss": 0.8033472299575806, "Finetune/Loss (Raw)": 0.7249767184257507, "Finetune/Step": 2180, "Finetune/Step Time": 2.8711323607712984} +{"Finetune/Learning Rate": 1.2452197164133177e-05, "Finetune/Loss": 0.8033331036567688, "Finetune/Loss (Raw)": 0.7703409194946289, "Finetune/Step": 2181, "Finetune/Step Time": 2.868020987138152} +{"Finetune/Learning Rate": 1.2445884371069112e-05, "Finetune/Loss": 0.802593469619751, "Finetune/Loss (Raw)": 0.7615285515785217, "Finetune/Step": 2182, "Finetune/Step Time": 2.871117392554879} +{"Finetune/Learning Rate": 1.2439570541095157e-05, "Finetune/Loss": 0.8020786046981812, "Finetune/Loss (Raw)": 0.8168478012084961, "Finetune/Step": 2183, "Finetune/Step Time": 2.8695948105305433} +{"Finetune/Learning Rate": 1.2433255676888001e-05, "Finetune/Loss": 0.8019530773162842, "Finetune/Loss (Raw)": 0.6689541935920715, "Finetune/Step": 2184, "Finetune/Step Time": 2.89252757281065} +{"Finetune/Learning Rate": 1.242693978112477e-05, "Finetune/Loss": 0.8025017976760864, "Finetune/Loss (Raw)": 0.8784487247467041, "Finetune/Step": 2185, "Finetune/Step Time": 2.8885652236640453} +{"Finetune/Learning Rate": 1.2420622856483034e-05, "Finetune/Loss": 0.8028780817985535, "Finetune/Loss (Raw)": 0.9514040946960449, "Finetune/Step": 2186, "Finetune/Step Time": 2.888866340741515} +{"Finetune/Learning Rate": 1.2414304905640793e-05, "Finetune/Loss": 0.8040490746498108, "Finetune/Loss (Raw)": 0.8999578952789307, "Finetune/Step": 2187, "Finetune/Step Time": 2.8912608958780766} +{"Finetune/Learning Rate": 1.240798593127648e-05, "Finetune/Loss": 0.803486704826355, "Finetune/Loss (Raw)": 0.7819586992263794, "Finetune/Step": 2188, "Finetune/Step Time": 2.8937098030000925} +{"Finetune/Learning Rate": 1.2401665936068967e-05, "Finetune/Loss": 0.7990067601203918, "Finetune/Loss (Raw)": 0.20361967384815216, "Finetune/Step": 2189, "Finetune/Step Time": 2.926076654344797} +{"Finetune/Learning Rate": 1.239534492269756e-05, "Finetune/Loss": 0.7989829778671265, "Finetune/Loss (Raw)": 0.8532044291496277, "Finetune/Step": 2190, "Finetune/Step Time": 2.927554337307811} +{"Finetune/Learning Rate": 1.2389022893841993e-05, "Finetune/Loss": 0.7984438538551331, "Finetune/Loss (Raw)": 0.8343514800071716, "Finetune/Step": 2191, "Finetune/Step Time": 2.9259198866784573} +{"Finetune/Learning Rate": 1.238269985218243e-05, "Finetune/Loss": 0.7990104556083679, "Finetune/Loss (Raw)": 0.8632938265800476, "Finetune/Step": 2192, "Finetune/Step Time": 2.922071373090148} +{"Finetune/Learning Rate": 1.2376375800399463e-05, "Finetune/Loss": 0.7994835376739502, "Finetune/Loss (Raw)": 0.8643695116043091, "Finetune/Step": 2193, "Finetune/Step Time": 2.9242059998214245} +{"Finetune/Learning Rate": 1.2370050741174116e-05, "Finetune/Loss": 0.799186110496521, "Finetune/Loss (Raw)": 0.8644849061965942, "Finetune/Step": 2194, "Finetune/Step Time": 2.9225679617375135} +{"Finetune/Learning Rate": 1.2363724677187843e-05, "Finetune/Loss": 0.7947049140930176, "Finetune/Loss (Raw)": 0.21425382792949677, "Finetune/Step": 2195, "Finetune/Step Time": 2.9545095674693584} +{"Finetune/Learning Rate": 1.2357397611122516e-05, "Finetune/Loss": 0.794213056564331, "Finetune/Loss (Raw)": 0.8016782999038696, "Finetune/Step": 2196, "Finetune/Step Time": 2.957680430263281} +{"Finetune/Learning Rate": 1.2351069545660437e-05, "Finetune/Loss": 0.7948448657989502, "Finetune/Loss (Raw)": 0.9010236263275146, "Finetune/Step": 2197, "Finetune/Step Time": 2.958186488598585} +{"Finetune/Learning Rate": 1.234474048348433e-05, "Finetune/Loss": 0.7937585711479187, "Finetune/Loss (Raw)": 0.6611923575401306, "Finetune/Step": 2198, "Finetune/Step Time": 2.977849956601858} +{"Finetune/Learning Rate": 1.2338410427277342e-05, "Finetune/Loss": 0.7953377962112427, "Finetune/Loss (Raw)": 0.9360632300376892, "Finetune/Step": 2199, "Finetune/Step Time": 2.9771440643817186} +{"Finetune/Learning Rate": 1.2332079379723042e-05, "Finetune/Loss": 0.7945091128349304, "Finetune/Loss (Raw)": 0.7938523888587952, "Finetune/Step": 2200, "Finetune/Step Time": 2.976934790611267} +{"Finetune/Learning Rate": 1.2325747343505416e-05, "Finetune/Loss": 0.7953304052352905, "Finetune/Loss (Raw)": 0.9384140372276306, "Finetune/Step": 2201, "Finetune/Step Time": 3.003349833190441} +{"Finetune/Learning Rate": 1.2319414321308876e-05, "Finetune/Loss": 0.7963485717773438, "Finetune/Loss (Raw)": 0.8921135663986206, "Finetune/Step": 2202, "Finetune/Step Time": 3.0003439374268055} +{"Finetune/Learning Rate": 1.2313080315818243e-05, "Finetune/Loss": 0.7973179817199707, "Finetune/Loss (Raw)": 0.8660507798194885, "Finetune/Step": 2203, "Finetune/Step Time": 3.0017050690948963} +{"Finetune/Learning Rate": 1.2306745329718764e-05, "Finetune/Loss": 0.7941356301307678, "Finetune/Loss (Raw)": 0.435378760099411, "Finetune/Step": 2204, "Finetune/Step Time": 3.0353885907679796} +{"Finetune/Learning Rate": 1.2300409365696095e-05, "Finetune/Loss": 0.7928464412689209, "Finetune/Loss (Raw)": 0.6791108250617981, "Finetune/Step": 2205, "Finetune/Step Time": 3.0359567385166883} +{"Finetune/Learning Rate": 1.2294072426436311e-05, "Finetune/Loss": 0.7925937175750732, "Finetune/Loss (Raw)": 0.828393280506134, "Finetune/Step": 2206, "Finetune/Step Time": 3.0342973433434963} +{"Finetune/Learning Rate": 1.2287734514625896e-05, "Finetune/Loss": 0.7932496070861816, "Finetune/Loss (Raw)": 0.7035143971443176, "Finetune/Step": 2207, "Finetune/Step Time": 3.01413494348526} +{"Finetune/Learning Rate": 1.2281395632951747e-05, "Finetune/Loss": 0.794165313243866, "Finetune/Loss (Raw)": 0.9308977127075195, "Finetune/Step": 2208, "Finetune/Step Time": 3.0227806866168976} +{"Finetune/Learning Rate": 1.2275055784101178e-05, "Finetune/Loss": 0.7943565249443054, "Finetune/Loss (Raw)": 0.8506056666374207, "Finetune/Step": 2209, "Finetune/Step Time": 3.0209643188863993} +{"Finetune/Learning Rate": 1.2268714970761908e-05, "Finetune/Loss": 0.7948896288871765, "Finetune/Loss (Raw)": 0.8296462893486023, "Finetune/Step": 2210, "Finetune/Step Time": 3.0218278113752604} +{"Finetune/Learning Rate": 1.2262373195622064e-05, "Finetune/Loss": 0.7939637899398804, "Finetune/Loss (Raw)": 0.8279438018798828, "Finetune/Step": 2211, "Finetune/Step Time": 3.0215448644012213} +{"Finetune/Learning Rate": 1.2256030461370183e-05, "Finetune/Loss": 0.7939565181732178, "Finetune/Loss (Raw)": 0.781143069267273, "Finetune/Step": 2212, "Finetune/Step Time": 3.0219696648418903} +{"Finetune/Learning Rate": 1.2249686770695208e-05, "Finetune/Loss": 0.7937405109405518, "Finetune/Loss (Raw)": 0.797285795211792, "Finetune/Step": 2213, "Finetune/Step Time": 3.017237439751625} +{"Finetune/Learning Rate": 1.2243342126286488e-05, "Finetune/Loss": 0.7944458723068237, "Finetune/Loss (Raw)": 0.8866652846336365, "Finetune/Step": 2214, "Finetune/Step Time": 3.0177024137228727} +{"Finetune/Learning Rate": 1.2236996530833778e-05, "Finetune/Loss": 0.7923199534416199, "Finetune/Loss (Raw)": 0.6756923198699951, "Finetune/Step": 2215, "Finetune/Step Time": 3.03862614184618} +{"Finetune/Learning Rate": 1.223064998702723e-05, "Finetune/Loss": 0.7934515476226807, "Finetune/Loss (Raw)": 0.8522960543632507, "Finetune/Step": 2216, "Finetune/Step Time": 3.016271313652396} +{"Finetune/Learning Rate": 1.2224302497557405e-05, "Finetune/Loss": 0.7925944924354553, "Finetune/Loss (Raw)": 0.7668719291687012, "Finetune/Step": 2217, "Finetune/Step Time": 3.0176988765597343} +{"Finetune/Learning Rate": 1.2217954065115258e-05, "Finetune/Loss": 0.7944856286048889, "Finetune/Loss (Raw)": 0.8933574557304382, "Finetune/Step": 2218, "Finetune/Step Time": 2.994396671652794} +{"Finetune/Learning Rate": 1.2211604692392154e-05, "Finetune/Loss": 0.7934262752532959, "Finetune/Loss (Raw)": 0.7582989931106567, "Finetune/Step": 2219, "Finetune/Step Time": 2.9926477894186974} +{"Finetune/Learning Rate": 1.2205254382079848e-05, "Finetune/Loss": 0.7931122779846191, "Finetune/Loss (Raw)": 0.7857958674430847, "Finetune/Step": 2220, "Finetune/Step Time": 2.9908353462815285} +{"Finetune/Learning Rate": 1.2198903136870493e-05, "Finetune/Loss": 0.7921708822250366, "Finetune/Loss (Raw)": 0.7160099744796753, "Finetune/Step": 2221, "Finetune/Step Time": 2.9937785901129246} +{"Finetune/Learning Rate": 1.2192550959456638e-05, "Finetune/Loss": 0.7924729585647583, "Finetune/Loss (Raw)": 0.8935319185256958, "Finetune/Step": 2222, "Finetune/Step Time": 2.989033818244934} +{"Finetune/Learning Rate": 1.2186197852531237e-05, "Finetune/Loss": 0.7915037870407104, "Finetune/Loss (Raw)": 0.8252791166305542, "Finetune/Step": 2223, "Finetune/Step Time": 2.9887390732765198} +{"Finetune/Learning Rate": 1.2179843818787625e-05, "Finetune/Loss": 0.7916812300682068, "Finetune/Loss (Raw)": 0.8118100762367249, "Finetune/Step": 2224, "Finetune/Step Time": 2.9798069298267365} +{"Finetune/Learning Rate": 1.2173488860919536e-05, "Finetune/Loss": 0.7925964593887329, "Finetune/Loss (Raw)": 0.9055376052856445, "Finetune/Step": 2225, "Finetune/Step Time": 2.981666162610054} +{"Finetune/Learning Rate": 1.2167132981621097e-05, "Finetune/Loss": 0.7914398908615112, "Finetune/Loss (Raw)": 0.7440603971481323, "Finetune/Step": 2226, "Finetune/Step Time": 2.9820699635893106} +{"Finetune/Learning Rate": 1.216077618358682e-05, "Finetune/Loss": 0.7913281917572021, "Finetune/Loss (Raw)": 0.8209313154220581, "Finetune/Step": 2227, "Finetune/Step Time": 2.976763477548957} +{"Finetune/Learning Rate": 1.2154418469511612e-05, "Finetune/Loss": 0.7910556793212891, "Finetune/Loss (Raw)": 0.8817517161369324, "Finetune/Step": 2228, "Finetune/Step Time": 2.9783174823969603} +{"Finetune/Learning Rate": 1.2148059842090772e-05, "Finetune/Loss": 0.7907241582870483, "Finetune/Loss (Raw)": 0.8786722421646118, "Finetune/Step": 2229, "Finetune/Step Time": 2.977306453511119} +{"Finetune/Learning Rate": 1.2141700304019977e-05, "Finetune/Loss": 0.791301965713501, "Finetune/Loss (Raw)": 0.9046521782875061, "Finetune/Step": 2230, "Finetune/Step Time": 2.9793319813907146} +{"Finetune/Learning Rate": 1.2135339857995289e-05, "Finetune/Loss": 0.7919520139694214, "Finetune/Loss (Raw)": 0.8931827545166016, "Finetune/Step": 2231, "Finetune/Step Time": 2.9749285969883204} +{"Finetune/Learning Rate": 1.2128978506713164e-05, "Finetune/Loss": 0.7922594547271729, "Finetune/Loss (Raw)": 0.887479841709137, "Finetune/Step": 2232, "Finetune/Step Time": 2.9737106040120125} +{"Finetune/Learning Rate": 1.2122616252870443e-05, "Finetune/Loss": 0.7922121286392212, "Finetune/Loss (Raw)": 0.7794004678726196, "Finetune/Step": 2233, "Finetune/Step Time": 2.978293526917696} +{"Finetune/Learning Rate": 1.2116253099164335e-05, "Finetune/Loss": 0.7920622825622559, "Finetune/Loss (Raw)": 0.7488607168197632, "Finetune/Step": 2234, "Finetune/Step Time": 2.978182116523385} +{"Finetune/Learning Rate": 1.2109889048292444e-05, "Finetune/Loss": 0.7919548749923706, "Finetune/Loss (Raw)": 0.8794196844100952, "Finetune/Step": 2235, "Finetune/Step Time": 2.975995544344187} +{"Finetune/Learning Rate": 1.2103524102952751e-05, "Finetune/Loss": 0.7919420599937439, "Finetune/Loss (Raw)": 0.8659473657608032, "Finetune/Step": 2236, "Finetune/Step Time": 2.9725667275488377} +{"Finetune/Learning Rate": 1.2097158265843611e-05, "Finetune/Loss": 0.7912775278091431, "Finetune/Loss (Raw)": 0.7778139114379883, "Finetune/Step": 2237, "Finetune/Step Time": 2.972831239923835} +{"Finetune/Learning Rate": 1.209079153966377e-05, "Finetune/Loss": 0.7906643152236938, "Finetune/Loss (Raw)": 0.7840057611465454, "Finetune/Step": 2238, "Finetune/Step Time": 2.9766103457659483} +{"Finetune/Learning Rate": 1.2084423927112332e-05, "Finetune/Loss": 0.7912346124649048, "Finetune/Loss (Raw)": 0.9281976222991943, "Finetune/Step": 2239, "Finetune/Step Time": 2.9770842641592026} +{"Finetune/Learning Rate": 1.2078055430888793e-05, "Finetune/Loss": 0.7903856039047241, "Finetune/Loss (Raw)": 0.7098041772842407, "Finetune/Step": 2240, "Finetune/Step Time": 2.9751874916255474} +{"Finetune/Learning Rate": 1.2071686053693015e-05, "Finetune/Loss": 0.7913866639137268, "Finetune/Loss (Raw)": 0.8801796436309814, "Finetune/Step": 2241, "Finetune/Step Time": 2.972462961450219} +{"Finetune/Learning Rate": 1.2065315798225239e-05, "Finetune/Loss": 0.7899606227874756, "Finetune/Loss (Raw)": 0.7689294219017029, "Finetune/Step": 2242, "Finetune/Step Time": 2.975642219185829} +{"Finetune/Learning Rate": 1.2058944667186075e-05, "Finetune/Loss": 0.7898092269897461, "Finetune/Loss (Raw)": 0.7856816053390503, "Finetune/Step": 2243, "Finetune/Step Time": 2.9724337588995695} +{"Finetune/Learning Rate": 1.2052572663276502e-05, "Finetune/Loss": 0.793747067451477, "Finetune/Loss (Raw)": 0.8110361099243164, "Finetune/Step": 2244, "Finetune/Step Time": 2.942846190184355} +{"Finetune/Learning Rate": 1.2046199789197874e-05, "Finetune/Loss": 0.7928464412689209, "Finetune/Loss (Raw)": 0.787082314491272, "Finetune/Step": 2245, "Finetune/Step Time": 2.9394975807517767} +{"Finetune/Learning Rate": 1.2039826047651908e-05, "Finetune/Loss": 0.7876710295677185, "Finetune/Loss (Raw)": 0.15422596037387848, "Finetune/Step": 2246, "Finetune/Step Time": 2.9677308220416307} +{"Finetune/Learning Rate": 1.2033451441340698e-05, "Finetune/Loss": 0.7878671884536743, "Finetune/Loss (Raw)": 0.8670347332954407, "Finetune/Step": 2247, "Finetune/Step Time": 2.9696303121745586} +{"Finetune/Learning Rate": 1.2027075972966696e-05, "Finetune/Loss": 0.7875216007232666, "Finetune/Loss (Raw)": 0.765489935874939, "Finetune/Step": 2248, "Finetune/Step Time": 2.9690905436873436} +{"Finetune/Learning Rate": 1.202069964523272e-05, "Finetune/Loss": 0.787608802318573, "Finetune/Loss (Raw)": 0.8247069120407104, "Finetune/Step": 2249, "Finetune/Step Time": 2.970223095268011} +{"Finetune/Learning Rate": 1.2014322460841958e-05, "Finetune/Loss": 0.7872205972671509, "Finetune/Loss (Raw)": 0.714012622833252, "Finetune/Step": 2250, "Finetune/Step Time": 2.9718583561480045} +{"Finetune/Learning Rate": 1.200794442249796e-05, "Finetune/Loss": 0.7850775122642517, "Finetune/Loss (Raw)": 0.5489951372146606, "Finetune/Step": 2251, "Finetune/Step Time": 2.9948134813457727} +{"Finetune/Learning Rate": 1.200156553290463e-05, "Finetune/Loss": 0.7827934622764587, "Finetune/Loss (Raw)": 0.46445003151893616, "Finetune/Step": 2252, "Finetune/Step Time": 3.029526786878705} +{"Finetune/Learning Rate": 1.1995185794766245e-05, "Finetune/Loss": 0.7827786207199097, "Finetune/Loss (Raw)": 0.8006739616394043, "Finetune/Step": 2253, "Finetune/Step Time": 3.028174478560686} +{"Finetune/Learning Rate": 1.1988805210787428e-05, "Finetune/Loss": 0.783257007598877, "Finetune/Loss (Raw)": 0.9042335748672485, "Finetune/Step": 2254, "Finetune/Step Time": 3.029997754842043} +{"Finetune/Learning Rate": 1.1982423783673174e-05, "Finetune/Loss": 0.7844374179840088, "Finetune/Loss (Raw)": 0.9685471057891846, "Finetune/Step": 2255, "Finetune/Step Time": 3.028254287317395} +{"Finetune/Learning Rate": 1.1976041516128829e-05, "Finetune/Loss": 0.7842597365379333, "Finetune/Loss (Raw)": 0.8478857278823853, "Finetune/Step": 2256, "Finetune/Step Time": 3.0243224147707224} +{"Finetune/Learning Rate": 1.1969658410860094e-05, "Finetune/Loss": 0.7846969962120056, "Finetune/Loss (Raw)": 0.7980915904045105, "Finetune/Step": 2257, "Finetune/Step Time": 3.0012506041675806} +{"Finetune/Learning Rate": 1.196327447057303e-05, "Finetune/Loss": 0.784887969493866, "Finetune/Loss (Raw)": 0.5837267637252808, "Finetune/Step": 2258, "Finetune/Step Time": 2.9995440039783716} +{"Finetune/Learning Rate": 1.1956889697974046e-05, "Finetune/Loss": 0.787273108959198, "Finetune/Loss (Raw)": 0.6132813692092896, "Finetune/Step": 2259, "Finetune/Step Time": 2.9877827651798725} +{"Finetune/Learning Rate": 1.1950504095769907e-05, "Finetune/Loss": 0.7869937419891357, "Finetune/Loss (Raw)": 0.7644981741905212, "Finetune/Step": 2260, "Finetune/Step Time": 2.9940538480877876} +{"Finetune/Learning Rate": 1.194411766666773e-05, "Finetune/Loss": 0.7878259420394897, "Finetune/Loss (Raw)": 0.9291873574256897, "Finetune/Step": 2261, "Finetune/Step Time": 2.9955516811460257} +{"Finetune/Learning Rate": 1.1937730413374983e-05, "Finetune/Loss": 0.7875534296035767, "Finetune/Loss (Raw)": 0.8246908783912659, "Finetune/Step": 2262, "Finetune/Step Time": 2.9921283423900604} +{"Finetune/Learning Rate": 1.1931342338599483e-05, "Finetune/Loss": 0.7872113585472107, "Finetune/Loss (Raw)": 0.7819292545318604, "Finetune/Step": 2263, "Finetune/Step Time": 2.9962774012237787} +{"Finetune/Learning Rate": 1.192495344504939e-05, "Finetune/Loss": 0.7863829731941223, "Finetune/Loss (Raw)": 0.7610394954681396, "Finetune/Step": 2264, "Finetune/Step Time": 3.009649744257331} +{"Finetune/Learning Rate": 1.1918563735433224e-05, "Finetune/Loss": 0.7852166891098022, "Finetune/Loss (Raw)": 0.7756146192550659, "Finetune/Step": 2265, "Finetune/Step Time": 3.0086052753031254} +{"Finetune/Learning Rate": 1.1912173212459836e-05, "Finetune/Loss": 0.7858409881591797, "Finetune/Loss (Raw)": 0.8500135540962219, "Finetune/Step": 2266, "Finetune/Step Time": 3.006030287593603} +{"Finetune/Learning Rate": 1.1905781878838433e-05, "Finetune/Loss": 0.7859898805618286, "Finetune/Loss (Raw)": 0.8609596490859985, "Finetune/Step": 2267, "Finetune/Step Time": 3.009871568530798} +{"Finetune/Learning Rate": 1.189938973727856e-05, "Finetune/Loss": 0.7860370874404907, "Finetune/Loss (Raw)": 0.7564285397529602, "Finetune/Step": 2268, "Finetune/Step Time": 2.9900214225053787} +{"Finetune/Learning Rate": 1.1892996790490102e-05, "Finetune/Loss": 0.7859607934951782, "Finetune/Loss (Raw)": 0.7784635424613953, "Finetune/Step": 2269, "Finetune/Step Time": 2.9891068898141384} +{"Finetune/Learning Rate": 1.1886603041183295e-05, "Finetune/Loss": 0.785607099533081, "Finetune/Loss (Raw)": 0.8588680028915405, "Finetune/Step": 2270, "Finetune/Step Time": 2.9891620073467493} +{"Finetune/Learning Rate": 1.1880208492068707e-05, "Finetune/Loss": 0.7875608801841736, "Finetune/Loss (Raw)": 0.8791344165802002, "Finetune/Step": 2271, "Finetune/Step Time": 2.9680499490350485} +{"Finetune/Learning Rate": 1.187381314585725e-05, "Finetune/Loss": 0.7884997129440308, "Finetune/Loss (Raw)": 0.8880661725997925, "Finetune/Step": 2272, "Finetune/Step Time": 2.964208271354437} +{"Finetune/Learning Rate": 1.1867417005260165e-05, "Finetune/Loss": 0.7886145114898682, "Finetune/Loss (Raw)": 0.834470272064209, "Finetune/Step": 2273, "Finetune/Step Time": 2.968699825927615} +{"Finetune/Learning Rate": 1.186102007298904e-05, "Finetune/Loss": 0.7917913198471069, "Finetune/Loss (Raw)": 0.8094934225082397, "Finetune/Step": 2274, "Finetune/Step Time": 2.9375375360250473} +{"Finetune/Learning Rate": 1.1854622351755795e-05, "Finetune/Loss": 0.793188214302063, "Finetune/Loss (Raw)": 0.8106173872947693, "Finetune/Step": 2275, "Finetune/Step Time": 2.914720766246319} +{"Finetune/Learning Rate": 1.1848223844272688e-05, "Finetune/Loss": 0.7930437326431274, "Finetune/Loss (Raw)": 0.811952531337738, "Finetune/Step": 2276, "Finetune/Step Time": 2.914735736325383} +{"Finetune/Learning Rate": 1.1841824553252302e-05, "Finetune/Loss": 0.7930392622947693, "Finetune/Loss (Raw)": 0.804186999797821, "Finetune/Step": 2277, "Finetune/Step Time": 2.9117922466248274} +{"Finetune/Learning Rate": 1.1835424481407553e-05, "Finetune/Loss": 0.7924184799194336, "Finetune/Loss (Raw)": 0.8290690779685974, "Finetune/Step": 2278, "Finetune/Step Time": 2.912016497924924} +{"Finetune/Learning Rate": 1.1829023631451701e-05, "Finetune/Loss": 0.7920348048210144, "Finetune/Loss (Raw)": 0.8621265292167664, "Finetune/Step": 2279, "Finetune/Step Time": 2.9138837475329638} +{"Finetune/Learning Rate": 1.1822622006098323e-05, "Finetune/Loss": 0.7913775444030762, "Finetune/Loss (Raw)": 0.8152946829795837, "Finetune/Step": 2280, "Finetune/Step Time": 2.9063054155558348} +{"Finetune/Learning Rate": 1.1816219608061325e-05, "Finetune/Loss": 0.790787398815155, "Finetune/Loss (Raw)": 0.7297043800354004, "Finetune/Step": 2281, "Finetune/Step Time": 2.901917127892375} +{"Finetune/Learning Rate": 1.1809816440054948e-05, "Finetune/Loss": 0.7857239246368408, "Finetune/Loss (Raw)": 0.21622642874717712, "Finetune/Step": 2282, "Finetune/Step Time": 2.938203977420926} +{"Finetune/Learning Rate": 1.1803412504793755e-05, "Finetune/Loss": 0.7855528593063354, "Finetune/Loss (Raw)": 0.7927291393280029, "Finetune/Step": 2283, "Finetune/Step Time": 2.939157633110881} +{"Finetune/Learning Rate": 1.1797007804992633e-05, "Finetune/Loss": 0.7851201295852661, "Finetune/Loss (Raw)": 0.7879858016967773, "Finetune/Step": 2284, "Finetune/Step Time": 2.9393952190876007} +{"Finetune/Learning Rate": 1.1790602343366795e-05, "Finetune/Loss": 0.7853636145591736, "Finetune/Loss (Raw)": 0.6699244976043701, "Finetune/Step": 2285, "Finetune/Step Time": 2.9140335097908974} +{"Finetune/Learning Rate": 1.1784196122631779e-05, "Finetune/Loss": 0.7844460606575012, "Finetune/Loss (Raw)": 0.7455196976661682, "Finetune/Step": 2286, "Finetune/Step Time": 2.9205507785081863} +{"Finetune/Learning Rate": 1.1777789145503439e-05, "Finetune/Loss": 0.7848204374313354, "Finetune/Loss (Raw)": 0.908808708190918, "Finetune/Step": 2287, "Finetune/Step Time": 2.9214341659098864} +{"Finetune/Learning Rate": 1.1771381414697956e-05, "Finetune/Loss": 0.7852324843406677, "Finetune/Loss (Raw)": 0.8452498316764832, "Finetune/Step": 2288, "Finetune/Step Time": 2.918974345549941} +{"Finetune/Learning Rate": 1.1764972932931826e-05, "Finetune/Loss": 0.7850974798202515, "Finetune/Loss (Raw)": 0.7647337317466736, "Finetune/Step": 2289, "Finetune/Step Time": 2.920206133276224} +{"Finetune/Learning Rate": 1.1758563702921869e-05, "Finetune/Loss": 0.7853311896324158, "Finetune/Loss (Raw)": 0.8062312602996826, "Finetune/Step": 2290, "Finetune/Step Time": 2.9251314904540777} +{"Finetune/Learning Rate": 1.1752153727385214e-05, "Finetune/Loss": 0.7855100631713867, "Finetune/Loss (Raw)": 0.8610090017318726, "Finetune/Step": 2291, "Finetune/Step Time": 2.92740292660892} +{"Finetune/Learning Rate": 1.1745743009039311e-05, "Finetune/Loss": 0.7851901054382324, "Finetune/Loss (Raw)": 0.8176851272583008, "Finetune/Step": 2292, "Finetune/Step Time": 2.9256358053535223} +{"Finetune/Learning Rate": 1.1739331550601927e-05, "Finetune/Loss": 0.7853872776031494, "Finetune/Loss (Raw)": 0.7923521995544434, "Finetune/Step": 2293, "Finetune/Step Time": 2.9242033213377} +{"Finetune/Learning Rate": 1.1732919354791137e-05, "Finetune/Loss": 0.7855838537216187, "Finetune/Loss (Raw)": 0.8077300786972046, "Finetune/Step": 2294, "Finetune/Step Time": 2.925995796918869} +{"Finetune/Learning Rate": 1.1726506424325333e-05, "Finetune/Loss": 0.7883071899414062, "Finetune/Loss (Raw)": 0.8744631409645081, "Finetune/Step": 2295, "Finetune/Step Time": 2.9039021972566843} +{"Finetune/Learning Rate": 1.1720092761923219e-05, "Finetune/Loss": 0.7877548933029175, "Finetune/Loss (Raw)": 0.7725942730903625, "Finetune/Step": 2296, "Finetune/Step Time": 2.9031360428780317} +{"Finetune/Learning Rate": 1.17136783703038e-05, "Finetune/Loss": 0.7877000570297241, "Finetune/Loss (Raw)": 0.7874864339828491, "Finetune/Step": 2297, "Finetune/Step Time": 2.901230489835143} +{"Finetune/Learning Rate": 1.1707263252186407e-05, "Finetune/Loss": 0.7865282893180847, "Finetune/Loss (Raw)": 0.8284912705421448, "Finetune/Step": 2298, "Finetune/Step Time": 2.904257409274578} +{"Finetune/Learning Rate": 1.1700847410290667e-05, "Finetune/Loss": 0.7873218059539795, "Finetune/Loss (Raw)": 0.8347931504249573, "Finetune/Step": 2299, "Finetune/Step Time": 2.9000201765447855} +{"Finetune/Learning Rate": 1.1694430847336513e-05, "Finetune/Loss": 0.7876712083816528, "Finetune/Loss (Raw)": 0.8372185230255127, "Finetune/Step": 2300, "Finetune/Step Time": 2.9012299347668886} +{"Finetune/Learning Rate": 1.1688013566044191e-05, "Finetune/Loss": 0.7871484756469727, "Finetune/Loss (Raw)": 0.8063178062438965, "Finetune/Step": 2301, "Finetune/Step Time": 2.8989978544414043} +{"Finetune/Learning Rate": 1.168159556913424e-05, "Finetune/Loss": 0.7879839539527893, "Finetune/Loss (Raw)": 0.9120011329650879, "Finetune/Step": 2302, "Finetune/Step Time": 2.9033660385757685} +{"Finetune/Learning Rate": 1.1675176859327521e-05, "Finetune/Loss": 0.7875370383262634, "Finetune/Loss (Raw)": 0.7856196165084839, "Finetune/Step": 2303, "Finetune/Step Time": 2.9049698133021593} +{"Finetune/Learning Rate": 1.1668757439345181e-05, "Finetune/Loss": 0.7887939214706421, "Finetune/Loss (Raw)": 0.9348960518836975, "Finetune/Step": 2304, "Finetune/Step Time": 2.902976782992482} +{"Finetune/Learning Rate": 1.1662337311908671e-05, "Finetune/Loss": 0.7910627126693726, "Finetune/Loss (Raw)": 0.8374318480491638, "Finetune/Step": 2305, "Finetune/Step Time": 2.881740814074874} +{"Finetune/Learning Rate": 1.1655916479739748e-05, "Finetune/Loss": 0.7900258898735046, "Finetune/Loss (Raw)": 0.7386964559555054, "Finetune/Step": 2306, "Finetune/Step Time": 2.8828080240637064} +{"Finetune/Learning Rate": 1.164949494556046e-05, "Finetune/Loss": 0.790489912033081, "Finetune/Loss (Raw)": 0.8508182168006897, "Finetune/Step": 2307, "Finetune/Step Time": 2.882694708183408} +{"Finetune/Learning Rate": 1.1643072712093162e-05, "Finetune/Loss": 0.7922642230987549, "Finetune/Loss (Raw)": 0.9520822167396545, "Finetune/Step": 2308, "Finetune/Step Time": 2.8829940389841795} +{"Finetune/Learning Rate": 1.1636649782060496e-05, "Finetune/Loss": 0.7931943535804749, "Finetune/Loss (Raw)": 0.8893980979919434, "Finetune/Step": 2309, "Finetune/Step Time": 2.8830234967172146} +{"Finetune/Learning Rate": 1.1630226158185406e-05, "Finetune/Loss": 0.7936699390411377, "Finetune/Loss (Raw)": 0.8224044442176819, "Finetune/Step": 2310, "Finetune/Step Time": 2.887284839525819} +{"Finetune/Learning Rate": 1.162380184319112e-05, "Finetune/Loss": 0.7935734987258911, "Finetune/Loss (Raw)": 0.804509699344635, "Finetune/Step": 2311, "Finetune/Step Time": 2.890367092564702} +{"Finetune/Learning Rate": 1.1617376839801176e-05, "Finetune/Loss": 0.794644832611084, "Finetune/Loss (Raw)": 0.8060727119445801, "Finetune/Step": 2312, "Finetune/Step Time": 2.86387724801898} +{"Finetune/Learning Rate": 1.1610951150739391e-05, "Finetune/Loss": 0.794303297996521, "Finetune/Loss (Raw)": 0.8347415924072266, "Finetune/Step": 2313, "Finetune/Step Time": 2.8627826515585184} +{"Finetune/Learning Rate": 1.1604524778729875e-05, "Finetune/Loss": 0.7932683229446411, "Finetune/Loss (Raw)": 0.8189206719398499, "Finetune/Step": 2314, "Finetune/Step Time": 2.867119688540697} +{"Finetune/Learning Rate": 1.159809772649703e-05, "Finetune/Loss": 0.7924975156784058, "Finetune/Loss (Raw)": 0.8012945652008057, "Finetune/Step": 2315, "Finetune/Step Time": 2.8641423620283604} +{"Finetune/Learning Rate": 1.1591669996765543e-05, "Finetune/Loss": 0.7932525873184204, "Finetune/Loss (Raw)": 0.8786049485206604, "Finetune/Step": 2316, "Finetune/Step Time": 2.8648703414946795} +{"Finetune/Learning Rate": 1.158524159226039e-05, "Finetune/Loss": 0.7985354661941528, "Finetune/Loss (Raw)": 0.8798362016677856, "Finetune/Step": 2317, "Finetune/Step Time": 2.832461068406701} +{"Finetune/Learning Rate": 1.1578812515706836e-05, "Finetune/Loss": 0.7972894310951233, "Finetune/Loss (Raw)": 0.6937071681022644, "Finetune/Step": 2318, "Finetune/Step Time": 2.83553477935493} +{"Finetune/Learning Rate": 1.1572382769830428e-05, "Finetune/Loss": 0.7976402640342712, "Finetune/Loss (Raw)": 0.8792588710784912, "Finetune/Step": 2319, "Finetune/Step Time": 2.83802324347198} +{"Finetune/Learning Rate": 1.1565952357356996e-05, "Finetune/Loss": 0.7975396513938904, "Finetune/Loss (Raw)": 0.8504083752632141, "Finetune/Step": 2320, "Finetune/Step Time": 2.846486125141382} +{"Finetune/Learning Rate": 1.1559521281012648e-05, "Finetune/Loss": 0.7969571948051453, "Finetune/Loss (Raw)": 0.7898203730583191, "Finetune/Step": 2321, "Finetune/Step Time": 2.8495500702410936} +{"Finetune/Learning Rate": 1.1553089543523786e-05, "Finetune/Loss": 0.7961194515228271, "Finetune/Loss (Raw)": 0.7572485208511353, "Finetune/Step": 2322, "Finetune/Step Time": 2.85090477950871} +{"Finetune/Learning Rate": 1.1546657147617083e-05, "Finetune/Loss": 0.8009229898452759, "Finetune/Loss (Raw)": 0.8291118741035461, "Finetune/Step": 2323, "Finetune/Step Time": 2.818898167461157} +{"Finetune/Learning Rate": 1.1540224096019495e-05, "Finetune/Loss": 0.8005586266517639, "Finetune/Loss (Raw)": 0.7550395131111145, "Finetune/Step": 2324, "Finetune/Step Time": 2.818287242203951} +{"Finetune/Learning Rate": 1.1533790391458249e-05, "Finetune/Loss": 0.7977946996688843, "Finetune/Loss (Raw)": 0.547240674495697, "Finetune/Step": 2325, "Finetune/Step Time": 2.8402773682028055} +{"Finetune/Learning Rate": 1.1527356036660859e-05, "Finetune/Loss": 0.7994714379310608, "Finetune/Loss (Raw)": 0.8758205771446228, "Finetune/Step": 2326, "Finetune/Step Time": 2.818185558542609} +{"Finetune/Learning Rate": 1.152092103435511e-05, "Finetune/Loss": 0.7981176376342773, "Finetune/Loss (Raw)": 0.7627756595611572, "Finetune/Step": 2327, "Finetune/Step Time": 2.817281387746334} +{"Finetune/Learning Rate": 1.151448538726906e-05, "Finetune/Loss": 0.7985693216323853, "Finetune/Loss (Raw)": 0.8516592979431152, "Finetune/Step": 2328, "Finetune/Step Time": 2.8189666606485844} +{"Finetune/Learning Rate": 1.1508049098131038e-05, "Finetune/Loss": 0.7987193465232849, "Finetune/Loss (Raw)": 0.9576225876808167, "Finetune/Step": 2329, "Finetune/Step Time": 2.789691301062703} +{"Finetune/Learning Rate": 1.1501612169669652e-05, "Finetune/Loss": 0.7990435361862183, "Finetune/Loss (Raw)": 0.9336113929748535, "Finetune/Step": 2330, "Finetune/Step Time": 2.790533371269703} +{"Finetune/Learning Rate": 1.149517460461378e-05, "Finetune/Loss": 0.7988770008087158, "Finetune/Loss (Raw)": 0.8447306752204895, "Finetune/Step": 2331, "Finetune/Step Time": 2.7876999005675316} +{"Finetune/Learning Rate": 1.1488736405692567e-05, "Finetune/Loss": 0.8021827936172485, "Finetune/Loss (Raw)": 0.8585265874862671, "Finetune/Step": 2332, "Finetune/Step Time": 2.7536868285387754} +{"Finetune/Learning Rate": 1.1482297575635424e-05, "Finetune/Loss": 0.798548698425293, "Finetune/Loss (Raw)": 0.21394315361976624, "Finetune/Step": 2333, "Finetune/Step Time": 2.7843781672418118} +{"Finetune/Learning Rate": 1.1475858117172034e-05, "Finetune/Loss": 0.7980698347091675, "Finetune/Loss (Raw)": 0.7670977115631104, "Finetune/Step": 2334, "Finetune/Step Time": 2.7842579297721386} +{"Finetune/Learning Rate": 1.1469418033032347e-05, "Finetune/Loss": 0.7986783385276794, "Finetune/Loss (Raw)": 0.7814007997512817, "Finetune/Step": 2335, "Finetune/Step Time": 2.7850245721638203} +{"Finetune/Learning Rate": 1.1462977325946576e-05, "Finetune/Loss": 0.7974894046783447, "Finetune/Loss (Raw)": 0.778709352016449, "Finetune/Step": 2336, "Finetune/Step Time": 2.776945421472192} +{"Finetune/Learning Rate": 1.1456535998645203e-05, "Finetune/Loss": 0.7975297570228577, "Finetune/Loss (Raw)": 0.855777382850647, "Finetune/Step": 2337, "Finetune/Step Time": 2.7785670086741447} +{"Finetune/Learning Rate": 1.145009405385896e-05, "Finetune/Loss": 0.797608494758606, "Finetune/Loss (Raw)": 0.8397225141525269, "Finetune/Step": 2338, "Finetune/Step Time": 2.777433218434453} +{"Finetune/Learning Rate": 1.1443651494318853e-05, "Finetune/Loss": 0.797405481338501, "Finetune/Loss (Raw)": 0.8019655346870422, "Finetune/Step": 2339, "Finetune/Step Time": 2.7771370988339186} +{"Finetune/Learning Rate": 1.143720832275615e-05, "Finetune/Loss": 0.7960638999938965, "Finetune/Loss (Raw)": 0.6094167828559875, "Finetune/Step": 2340, "Finetune/Step Time": 2.799777237698436} +{"Finetune/Learning Rate": 1.1430764541902368e-05, "Finetune/Loss": 0.7958440184593201, "Finetune/Loss (Raw)": 0.7691400647163391, "Finetune/Step": 2341, "Finetune/Step Time": 2.8020108211785555} +{"Finetune/Learning Rate": 1.142432015448929e-05, "Finetune/Loss": 0.7952487468719482, "Finetune/Loss (Raw)": 0.8104690909385681, "Finetune/Step": 2342, "Finetune/Step Time": 2.808816382661462} +{"Finetune/Learning Rate": 1.1417875163248954e-05, "Finetune/Loss": 0.7958554029464722, "Finetune/Loss (Raw)": 0.7533490657806396, "Finetune/Step": 2343, "Finetune/Step Time": 2.786941349506378} +{"Finetune/Learning Rate": 1.1411429570913652e-05, "Finetune/Loss": 0.7953029274940491, "Finetune/Loss (Raw)": 0.7815725803375244, "Finetune/Step": 2344, "Finetune/Step Time": 2.783242514356971} +{"Finetune/Learning Rate": 1.1404983380215934e-05, "Finetune/Loss": 0.7951545119285583, "Finetune/Loss (Raw)": 0.7478745579719543, "Finetune/Step": 2345, "Finetune/Step Time": 2.7785121016204357} +{"Finetune/Learning Rate": 1.1398536593888606e-05, "Finetune/Loss": 0.7945257425308228, "Finetune/Loss (Raw)": 0.8128746747970581, "Finetune/Step": 2346, "Finetune/Step Time": 2.780981933698058} +{"Finetune/Learning Rate": 1.1392089214664717e-05, "Finetune/Loss": 0.7958090305328369, "Finetune/Loss (Raw)": 0.9225664138793945, "Finetune/Step": 2347, "Finetune/Step Time": 2.7807365376502275} +{"Finetune/Learning Rate": 1.1385641245277579e-05, "Finetune/Loss": 0.7942278385162354, "Finetune/Loss (Raw)": 0.5833961367607117, "Finetune/Step": 2348, "Finetune/Step Time": 2.8049076441675425} +{"Finetune/Learning Rate": 1.137919268846074e-05, "Finetune/Loss": 0.794818103313446, "Finetune/Loss (Raw)": 0.7915675044059753, "Finetune/Step": 2349, "Finetune/Step Time": 2.806842390447855} +{"Finetune/Learning Rate": 1.1372743546948017e-05, "Finetune/Loss": 0.7944608926773071, "Finetune/Loss (Raw)": 0.8478123545646667, "Finetune/Step": 2350, "Finetune/Step Time": 2.8108841478824615} +{"Finetune/Learning Rate": 1.1366293823473455e-05, "Finetune/Loss": 0.7948715686798096, "Finetune/Loss (Raw)": 0.8778470158576965, "Finetune/Step": 2351, "Finetune/Step Time": 2.8080836441367865} +{"Finetune/Learning Rate": 1.1359843520771359e-05, "Finetune/Loss": 0.794366180896759, "Finetune/Loss (Raw)": 0.7471104264259338, "Finetune/Step": 2352, "Finetune/Step Time": 2.809438394382596} +{"Finetune/Learning Rate": 1.1353392641576272e-05, "Finetune/Loss": 0.7939397096633911, "Finetune/Loss (Raw)": 0.8509503602981567, "Finetune/Step": 2353, "Finetune/Step Time": 2.8091737255454063} +{"Finetune/Learning Rate": 1.1346941188622982e-05, "Finetune/Loss": 0.7953594923019409, "Finetune/Loss (Raw)": 0.9257931709289551, "Finetune/Step": 2354, "Finetune/Step Time": 2.806110305711627} +{"Finetune/Learning Rate": 1.134048916464653e-05, "Finetune/Loss": 0.7912903428077698, "Finetune/Loss (Raw)": 0.3000885546207428, "Finetune/Step": 2355, "Finetune/Step Time": 2.838467614725232} +{"Finetune/Learning Rate": 1.1334036572382182e-05, "Finetune/Loss": 0.7905224561691284, "Finetune/Loss (Raw)": 0.7834548354148865, "Finetune/Step": 2356, "Finetune/Step Time": 2.835250273346901} +{"Finetune/Learning Rate": 1.1327583414565461e-05, "Finetune/Loss": 0.7867796421051025, "Finetune/Loss (Raw)": 0.3995952606201172, "Finetune/Step": 2357, "Finetune/Step Time": 2.8667218796908855} +{"Finetune/Learning Rate": 1.132112969393212e-05, "Finetune/Loss": 0.786504864692688, "Finetune/Loss (Raw)": 0.8694800734519958, "Finetune/Step": 2358, "Finetune/Step Time": 2.8694929219782352} +{"Finetune/Learning Rate": 1.1314675413218157e-05, "Finetune/Loss": 0.7860094904899597, "Finetune/Loss (Raw)": 0.8297824859619141, "Finetune/Step": 2359, "Finetune/Step Time": 2.8683590441942215} +{"Finetune/Learning Rate": 1.13082205751598e-05, "Finetune/Loss": 0.7859719395637512, "Finetune/Loss (Raw)": 0.8826643824577332, "Finetune/Step": 2360, "Finetune/Step Time": 2.8689568359404802} +{"Finetune/Learning Rate": 1.1301765182493523e-05, "Finetune/Loss": 0.7868412733078003, "Finetune/Loss (Raw)": 0.8906754851341248, "Finetune/Step": 2361, "Finetune/Step Time": 2.8663674853742123} +{"Finetune/Learning Rate": 1.1295309237956022e-05, "Finetune/Loss": 0.7861410975456238, "Finetune/Loss (Raw)": 0.6592397689819336, "Finetune/Step": 2362, "Finetune/Step Time": 2.8913979195058346} +{"Finetune/Learning Rate": 1.128885274428424e-05, "Finetune/Loss": 0.7856333255767822, "Finetune/Loss (Raw)": 0.8144294023513794, "Finetune/Step": 2363, "Finetune/Step Time": 2.8926082588732243} +{"Finetune/Learning Rate": 1.1282395704215346e-05, "Finetune/Loss": 0.7837410569190979, "Finetune/Loss (Raw)": 0.6237336993217468, "Finetune/Step": 2364, "Finetune/Step Time": 2.9169695116579533} +{"Finetune/Learning Rate": 1.1275938120486743e-05, "Finetune/Loss": 0.7840825915336609, "Finetune/Loss (Raw)": 0.8215263485908508, "Finetune/Step": 2365, "Finetune/Step Time": 2.9153372198343277} +{"Finetune/Learning Rate": 1.1269479995836062e-05, "Finetune/Loss": 0.7847182154655457, "Finetune/Loss (Raw)": 0.8653698563575745, "Finetune/Step": 2366, "Finetune/Step Time": 2.9114357326179743} +{"Finetune/Learning Rate": 1.1263021333001164e-05, "Finetune/Loss": 0.7826648950576782, "Finetune/Loss (Raw)": 0.6653749346733093, "Finetune/Step": 2367, "Finetune/Step Time": 2.9080713987350464} +{"Finetune/Learning Rate": 1.1256562134720137e-05, "Finetune/Loss": 0.7841463685035706, "Finetune/Loss (Raw)": 0.8994285464286804, "Finetune/Step": 2368, "Finetune/Step Time": 2.904839903116226} +{"Finetune/Learning Rate": 1.1250102403731305e-05, "Finetune/Loss": 0.7838799953460693, "Finetune/Loss (Raw)": 0.8460875153541565, "Finetune/Step": 2369, "Finetune/Step Time": 2.911748008802533} +{"Finetune/Learning Rate": 1.1243642142773206e-05, "Finetune/Loss": 0.7844737768173218, "Finetune/Loss (Raw)": 0.8449270725250244, "Finetune/Step": 2370, "Finetune/Step Time": 2.9072779193520546} +{"Finetune/Learning Rate": 1.1237181354584608e-05, "Finetune/Loss": 0.7844858765602112, "Finetune/Loss (Raw)": 0.7872311472892761, "Finetune/Step": 2371, "Finetune/Step Time": 2.9078854769468307} +{"Finetune/Learning Rate": 1.12307200419045e-05, "Finetune/Loss": 0.7842196226119995, "Finetune/Loss (Raw)": 0.776958703994751, "Finetune/Step": 2372, "Finetune/Step Time": 2.9080917593091726} +{"Finetune/Learning Rate": 1.1224258207472101e-05, "Finetune/Loss": 0.783650279045105, "Finetune/Loss (Raw)": 0.7142107486724854, "Finetune/Step": 2373, "Finetune/Step Time": 2.9088936783373356} +{"Finetune/Learning Rate": 1.121779585402684e-05, "Finetune/Loss": 0.789000928401947, "Finetune/Loss (Raw)": 0.8391062021255493, "Finetune/Step": 2374, "Finetune/Step Time": 2.877377614378929} +{"Finetune/Learning Rate": 1.1211332984308373e-05, "Finetune/Loss": 0.7890433073043823, "Finetune/Loss (Raw)": 0.8724559545516968, "Finetune/Step": 2375, "Finetune/Step Time": 2.8741719890385866} +{"Finetune/Learning Rate": 1.1204869601056579e-05, "Finetune/Loss": 0.787665843963623, "Finetune/Loss (Raw)": 0.5891755819320679, "Finetune/Step": 2376, "Finetune/Step Time": 2.9074666555970907} +{"Finetune/Learning Rate": 1.1198405707011536e-05, "Finetune/Loss": 0.7871595621109009, "Finetune/Loss (Raw)": 0.75989830493927, "Finetune/Step": 2377, "Finetune/Step Time": 2.9049772024154663} +{"Finetune/Learning Rate": 1.1191941304913564e-05, "Finetune/Loss": 0.7835158109664917, "Finetune/Loss (Raw)": 0.24761860072612762, "Finetune/Step": 2378, "Finetune/Step Time": 2.933143785223365} +{"Finetune/Learning Rate": 1.1185476397503181e-05, "Finetune/Loss": 0.7856351733207703, "Finetune/Loss (Raw)": 0.820269763469696, "Finetune/Step": 2379, "Finetune/Step Time": 2.9145771954208612} +{"Finetune/Learning Rate": 1.1179010987521125e-05, "Finetune/Loss": 0.7879672050476074, "Finetune/Loss (Raw)": 0.7629607319831848, "Finetune/Step": 2380, "Finetune/Step Time": 2.8810198083519936} +{"Finetune/Learning Rate": 1.1172545077708348e-05, "Finetune/Loss": 0.7887095212936401, "Finetune/Loss (Raw)": 0.8956848978996277, "Finetune/Step": 2381, "Finetune/Step Time": 2.8783483933657408} +{"Finetune/Learning Rate": 1.1166078670806006e-05, "Finetune/Loss": 0.7884811162948608, "Finetune/Loss (Raw)": 0.8749969005584717, "Finetune/Step": 2382, "Finetune/Step Time": 2.878973612561822} +{"Finetune/Learning Rate": 1.1159611769555481e-05, "Finetune/Loss": 0.7879327535629272, "Finetune/Loss (Raw)": 0.8983548283576965, "Finetune/Step": 2383, "Finetune/Step Time": 2.881476992741227} +{"Finetune/Learning Rate": 1.1153144376698349e-05, "Finetune/Loss": 0.7873486280441284, "Finetune/Loss (Raw)": 0.7731180191040039, "Finetune/Step": 2384, "Finetune/Step Time": 2.883928682655096} +{"Finetune/Learning Rate": 1.1146676494976402e-05, "Finetune/Loss": 0.7877283096313477, "Finetune/Loss (Raw)": 0.8466900587081909, "Finetune/Step": 2385, "Finetune/Step Time": 2.8841711468994617} +{"Finetune/Learning Rate": 1.1140208127131638e-05, "Finetune/Loss": 0.7897775173187256, "Finetune/Loss (Raw)": 0.8460203409194946, "Finetune/Step": 2386, "Finetune/Step Time": 2.862957451492548} +{"Finetune/Learning Rate": 1.1133739275906266e-05, "Finetune/Loss": 0.7906939387321472, "Finetune/Loss (Raw)": 0.7305837869644165, "Finetune/Step": 2387, "Finetune/Step Time": 2.841997830197215} +{"Finetune/Learning Rate": 1.1127269944042688e-05, "Finetune/Loss": 0.790870189666748, "Finetune/Loss (Raw)": 0.7870668768882751, "Finetune/Step": 2388, "Finetune/Step Time": 2.8377414736896753} +{"Finetune/Learning Rate": 1.1120800134283525e-05, "Finetune/Loss": 0.7909220457077026, "Finetune/Loss (Raw)": 0.9358264803886414, "Finetune/Step": 2389, "Finetune/Step Time": 2.837489804252982} +{"Finetune/Learning Rate": 1.1114329849371586e-05, "Finetune/Loss": 0.7908437848091125, "Finetune/Loss (Raw)": 0.8146660327911377, "Finetune/Step": 2390, "Finetune/Step Time": 2.8369703479111195} +{"Finetune/Learning Rate": 1.1107859092049886e-05, "Finetune/Loss": 0.790406346321106, "Finetune/Loss (Raw)": 0.725939154624939, "Finetune/Step": 2391, "Finetune/Step Time": 2.833096681162715} +{"Finetune/Learning Rate": 1.110138786506165e-05, "Finetune/Loss": 0.7906416058540344, "Finetune/Loss (Raw)": 0.7911537885665894, "Finetune/Step": 2392, "Finetune/Step Time": 2.820010783150792} +{"Finetune/Learning Rate": 1.1094916171150291e-05, "Finetune/Loss": 0.790926992893219, "Finetune/Loss (Raw)": 0.8121420741081238, "Finetune/Step": 2393, "Finetune/Step Time": 2.8231950849294662} +{"Finetune/Learning Rate": 1.1088444013059423e-05, "Finetune/Loss": 0.7912017703056335, "Finetune/Loss (Raw)": 0.8851839900016785, "Finetune/Step": 2394, "Finetune/Step Time": 2.8240768257528543} +{"Finetune/Learning Rate": 1.1081971393532858e-05, "Finetune/Loss": 0.7912280559539795, "Finetune/Loss (Raw)": 0.8643178939819336, "Finetune/Step": 2395, "Finetune/Step Time": 2.8195241522043943} +{"Finetune/Learning Rate": 1.1075498315314598e-05, "Finetune/Loss": 0.7914867401123047, "Finetune/Loss (Raw)": 0.789552628993988, "Finetune/Step": 2396, "Finetune/Step Time": 2.8204457350075245} +{"Finetune/Learning Rate": 1.1069024781148852e-05, "Finetune/Loss": 0.791996955871582, "Finetune/Loss (Raw)": 0.8437661528587341, "Finetune/Step": 2397, "Finetune/Step Time": 2.8190004508942366} +{"Finetune/Learning Rate": 1.1062550793780011e-05, "Finetune/Loss": 0.7915077805519104, "Finetune/Loss (Raw)": 0.7962520718574524, "Finetune/Step": 2398, "Finetune/Step Time": 2.819967694580555} +{"Finetune/Learning Rate": 1.105607635595266e-05, "Finetune/Loss": 0.7907042503356934, "Finetune/Loss (Raw)": 0.7762831449508667, "Finetune/Step": 2399, "Finetune/Step Time": 2.8190448880195618} +{"Finetune/Learning Rate": 1.1049601470411575e-05, "Finetune/Loss": 0.7905583381652832, "Finetune/Loss (Raw)": 0.8693886399269104, "Finetune/Step": 2400, "Finetune/Step Time": 2.8177688252180815} +{"Finetune/Learning Rate": 1.104312613990173e-05, "Finetune/Loss": 0.790181040763855, "Finetune/Loss (Raw)": 0.7861801385879517, "Finetune/Step": 2401, "Finetune/Step Time": 2.8167459592223167} +{"Finetune/Learning Rate": 1.1036650367168276e-05, "Finetune/Loss": 0.7905086874961853, "Finetune/Loss (Raw)": 0.851429283618927, "Finetune/Step": 2402, "Finetune/Step Time": 2.8182556983083487} +{"Finetune/Learning Rate": 1.1030174154956558e-05, "Finetune/Loss": 0.7910881042480469, "Finetune/Loss (Raw)": 0.8847827911376953, "Finetune/Step": 2403, "Finetune/Step Time": 2.8161783162504435} +{"Finetune/Learning Rate": 1.1023697506012108e-05, "Finetune/Loss": 0.7908856868743896, "Finetune/Loss (Raw)": 0.7860449552536011, "Finetune/Step": 2404, "Finetune/Step Time": 2.8147791791707277} +{"Finetune/Learning Rate": 1.1017220423080634e-05, "Finetune/Loss": 0.7913088202476501, "Finetune/Loss (Raw)": 0.8583457469940186, "Finetune/Step": 2405, "Finetune/Step Time": 2.8168187830597162} +{"Finetune/Learning Rate": 1.1010742908908041e-05, "Finetune/Loss": 0.7910314798355103, "Finetune/Loss (Raw)": 0.7935692667961121, "Finetune/Step": 2406, "Finetune/Step Time": 2.8120507765561342} +{"Finetune/Learning Rate": 1.1004264966240413e-05, "Finetune/Loss": 0.790886640548706, "Finetune/Loss (Raw)": 0.8435856699943542, "Finetune/Step": 2407, "Finetune/Step Time": 2.8148718513548374} +{"Finetune/Learning Rate": 1.0997786597824006e-05, "Finetune/Loss": 0.790415346622467, "Finetune/Loss (Raw)": 0.7549676299095154, "Finetune/Step": 2408, "Finetune/Step Time": 2.8139073345810175} +{"Finetune/Learning Rate": 1.099130780640527e-05, "Finetune/Loss": 0.7900428771972656, "Finetune/Loss (Raw)": 0.682039201259613, "Finetune/Step": 2409, "Finetune/Step Time": 2.8358868416398764} +{"Finetune/Learning Rate": 1.0984828594730821e-05, "Finetune/Loss": 0.7948065400123596, "Finetune/Loss (Raw)": 0.8259706497192383, "Finetune/Step": 2410, "Finetune/Step Time": 2.803141251206398} +{"Finetune/Learning Rate": 1.0978348965547469e-05, "Finetune/Loss": 0.7952556610107422, "Finetune/Loss (Raw)": 0.85020911693573, "Finetune/Step": 2411, "Finetune/Step Time": 2.802321108058095} +{"Finetune/Learning Rate": 1.0971868921602189e-05, "Finetune/Loss": 0.7955545783042908, "Finetune/Loss (Raw)": 0.8262514472007751, "Finetune/Step": 2412, "Finetune/Step Time": 2.8030895106494427} +{"Finetune/Learning Rate": 1.0965388465642135e-05, "Finetune/Loss": 0.796257495880127, "Finetune/Loss (Raw)": 0.7598998546600342, "Finetune/Step": 2413, "Finetune/Step Time": 2.802002055570483} +{"Finetune/Learning Rate": 1.0958907600414634e-05, "Finetune/Loss": 0.7962225675582886, "Finetune/Loss (Raw)": 0.7410535216331482, "Finetune/Step": 2414, "Finetune/Step Time": 2.7955089285969734} +{"Finetune/Learning Rate": 1.0952426328667191e-05, "Finetune/Loss": 0.7962571978569031, "Finetune/Loss (Raw)": 0.9132395386695862, "Finetune/Step": 2415, "Finetune/Step Time": 2.793936649337411} +{"Finetune/Learning Rate": 1.0945944653147482e-05, "Finetune/Loss": 0.7960711717605591, "Finetune/Loss (Raw)": 0.8214356899261475, "Finetune/Step": 2416, "Finetune/Step Time": 2.794273314997554} +{"Finetune/Learning Rate": 1.0939462576603352e-05, "Finetune/Loss": 0.7920280694961548, "Finetune/Loss (Raw)": 0.24721607565879822, "Finetune/Step": 2417, "Finetune/Step Time": 2.8248419892042875} +{"Finetune/Learning Rate": 1.0932980101782815e-05, "Finetune/Loss": 0.792370617389679, "Finetune/Loss (Raw)": 0.8500755429267883, "Finetune/Step": 2418, "Finetune/Step Time": 2.8223144300282} +{"Finetune/Learning Rate": 1.0926497231434055e-05, "Finetune/Loss": 0.7917066812515259, "Finetune/Loss (Raw)": 0.776028573513031, "Finetune/Step": 2419, "Finetune/Step Time": 2.820254223421216} +{"Finetune/Learning Rate": 1.0920013968305427e-05, "Finetune/Loss": 0.7913797497749329, "Finetune/Loss (Raw)": 0.7758370041847229, "Finetune/Step": 2420, "Finetune/Step Time": 2.823055235669017} +{"Finetune/Learning Rate": 1.091353031514545e-05, "Finetune/Loss": 0.7911731600761414, "Finetune/Loss (Raw)": 0.765904426574707, "Finetune/Step": 2421, "Finetune/Step Time": 2.822915766388178} +{"Finetune/Learning Rate": 1.0907046274702809e-05, "Finetune/Loss": 0.7920543551445007, "Finetune/Loss (Raw)": 0.9205291271209717, "Finetune/Step": 2422, "Finetune/Step Time": 2.820659063756466} +{"Finetune/Learning Rate": 1.090056184972635e-05, "Finetune/Loss": 0.7915489673614502, "Finetune/Loss (Raw)": 0.8097729682922363, "Finetune/Step": 2423, "Finetune/Step Time": 2.8206261191517115} +{"Finetune/Learning Rate": 1.0894077042965084e-05, "Finetune/Loss": 0.7916643619537354, "Finetune/Loss (Raw)": 0.7873611450195312, "Finetune/Step": 2424, "Finetune/Step Time": 2.8217580169439316} +{"Finetune/Learning Rate": 1.0887591857168187e-05, "Finetune/Loss": 0.7929293513298035, "Finetune/Loss (Raw)": 0.949411928653717, "Finetune/Step": 2425, "Finetune/Step Time": 2.82392224855721} +{"Finetune/Learning Rate": 1.0881106295084993e-05, "Finetune/Loss": 0.7935450077056885, "Finetune/Loss (Raw)": 0.907288670539856, "Finetune/Step": 2426, "Finetune/Step Time": 2.8200320471078157} +{"Finetune/Learning Rate": 1.0874620359464996e-05, "Finetune/Loss": 0.7932931780815125, "Finetune/Loss (Raw)": 0.8025588393211365, "Finetune/Step": 2427, "Finetune/Step Time": 2.8192427456378937} +{"Finetune/Learning Rate": 1.0868134053057844e-05, "Finetune/Loss": 0.792526125907898, "Finetune/Loss (Raw)": 0.739036500453949, "Finetune/Step": 2428, "Finetune/Step Time": 2.818535577505827} +{"Finetune/Learning Rate": 1.086164737861335e-05, "Finetune/Loss": 0.7926845550537109, "Finetune/Loss (Raw)": 0.8265945315361023, "Finetune/Step": 2429, "Finetune/Step Time": 2.8223766274750233} +{"Finetune/Learning Rate": 1.0855160338881478e-05, "Finetune/Loss": 0.7927604913711548, "Finetune/Loss (Raw)": 0.9217246174812317, "Finetune/Step": 2430, "Finetune/Step Time": 2.8170722518116236} +{"Finetune/Learning Rate": 1.084867293661235e-05, "Finetune/Loss": 0.793097972869873, "Finetune/Loss (Raw)": 0.8288202881813049, "Finetune/Step": 2431, "Finetune/Step Time": 2.8158200066536665} +{"Finetune/Learning Rate": 1.084218517455624e-05, "Finetune/Loss": 0.7923880815505981, "Finetune/Loss (Raw)": 0.844025731086731, "Finetune/Step": 2432, "Finetune/Step Time": 2.8299299888312817} +{"Finetune/Learning Rate": 1.0835697055463565e-05, "Finetune/Loss": 0.7919288873672485, "Finetune/Loss (Raw)": 0.7786594033241272, "Finetune/Step": 2433, "Finetune/Step Time": 2.828819217160344} +{"Finetune/Learning Rate": 1.0829208582084915e-05, "Finetune/Loss": 0.7920130491256714, "Finetune/Loss (Raw)": 0.7494654059410095, "Finetune/Step": 2434, "Finetune/Step Time": 2.826600978150964} +{"Finetune/Learning Rate": 1.0822719757171014e-05, "Finetune/Loss": 0.7920091152191162, "Finetune/Loss (Raw)": 0.850321352481842, "Finetune/Step": 2435, "Finetune/Step Time": 2.82592667452991} +{"Finetune/Learning Rate": 1.0816230583472735e-05, "Finetune/Loss": 0.7900815010070801, "Finetune/Loss (Raw)": 0.705341100692749, "Finetune/Step": 2436, "Finetune/Step Time": 2.826298637315631} +{"Finetune/Learning Rate": 1.0809741063741106e-05, "Finetune/Loss": 0.7900911569595337, "Finetune/Loss (Raw)": 0.8906310200691223, "Finetune/Step": 2437, "Finetune/Step Time": 2.8250682074576616} +{"Finetune/Learning Rate": 1.0803251200727296e-05, "Finetune/Loss": 0.7900826930999756, "Finetune/Loss (Raw)": 0.821325957775116, "Finetune/Step": 2438, "Finetune/Step Time": 2.8196952417492867} +{"Finetune/Learning Rate": 1.0796760997182627e-05, "Finetune/Loss": 0.7903379797935486, "Finetune/Loss (Raw)": 0.837186336517334, "Finetune/Step": 2439, "Finetune/Step Time": 2.8180190231651068} +{"Finetune/Learning Rate": 1.0790270455858555e-05, "Finetune/Loss": 0.789635181427002, "Finetune/Loss (Raw)": 0.7161094546318054, "Finetune/Step": 2440, "Finetune/Step Time": 2.8178149592131376} +{"Finetune/Learning Rate": 1.0783779579506687e-05, "Finetune/Loss": 0.790515124797821, "Finetune/Loss (Raw)": 0.9473804831504822, "Finetune/Step": 2441, "Finetune/Step Time": 2.8196114618331194} +{"Finetune/Learning Rate": 1.077728837087877e-05, "Finetune/Loss": 0.7893387079238892, "Finetune/Loss (Raw)": 0.6683362722396851, "Finetune/Step": 2442, "Finetune/Step Time": 2.815889287739992} +{"Finetune/Learning Rate": 1.0770796832726689e-05, "Finetune/Loss": 0.7902860641479492, "Finetune/Loss (Raw)": 0.9225550889968872, "Finetune/Step": 2443, "Finetune/Step Time": 2.816659213975072} +{"Finetune/Learning Rate": 1.0764304967802472e-05, "Finetune/Loss": 0.7894443273544312, "Finetune/Loss (Raw)": 0.7708651423454285, "Finetune/Step": 2444, "Finetune/Step Time": 2.8150062821805477} +{"Finetune/Learning Rate": 1.0757812778858288e-05, "Finetune/Loss": 0.7885569334030151, "Finetune/Loss (Raw)": 0.766255259513855, "Finetune/Step": 2445, "Finetune/Step Time": 2.8177071399986744} +{"Finetune/Learning Rate": 1.0751320268646436e-05, "Finetune/Loss": 0.7897274494171143, "Finetune/Loss (Raw)": 0.8435295224189758, "Finetune/Step": 2446, "Finetune/Step Time": 2.8150027077645063} +{"Finetune/Learning Rate": 1.0744827439919354e-05, "Finetune/Loss": 0.7891029119491577, "Finetune/Loss (Raw)": 0.7993232607841492, "Finetune/Step": 2447, "Finetune/Step Time": 2.8134491741657257} +{"Finetune/Learning Rate": 1.0738334295429622e-05, "Finetune/Loss": 0.7883227467536926, "Finetune/Loss (Raw)": 0.7505410313606262, "Finetune/Step": 2448, "Finetune/Step Time": 2.8084431812167168} +{"Finetune/Learning Rate": 1.0731840837929946e-05, "Finetune/Loss": 0.7884324789047241, "Finetune/Loss (Raw)": 0.8038597702980042, "Finetune/Step": 2449, "Finetune/Step Time": 2.8074115198105574} +{"Finetune/Learning Rate": 1.0725347070173162e-05, "Finetune/Loss": 0.7862047553062439, "Finetune/Loss (Raw)": 0.47210872173309326, "Finetune/Step": 2450, "Finetune/Step Time": 2.8397311847656965} +{"Finetune/Learning Rate": 1.071885299491225e-05, "Finetune/Loss": 0.7867586612701416, "Finetune/Loss (Raw)": 0.9000062346458435, "Finetune/Step": 2451, "Finetune/Step Time": 2.843338217586279} +{"Finetune/Learning Rate": 1.0712358614900305e-05, "Finetune/Loss": 0.7863905429840088, "Finetune/Loss (Raw)": 0.7079194188117981, "Finetune/Step": 2452, "Finetune/Step Time": 2.8637037593871355} +{"Finetune/Learning Rate": 1.0705863932890564e-05, "Finetune/Loss": 0.7883856296539307, "Finetune/Loss (Raw)": 0.8026120066642761, "Finetune/Step": 2453, "Finetune/Step Time": 2.8414903301745653} +{"Finetune/Learning Rate": 1.0699368951636384e-05, "Finetune/Loss": 0.7874913811683655, "Finetune/Loss (Raw)": 0.7613570690155029, "Finetune/Step": 2454, "Finetune/Step Time": 2.84595375880599} +{"Finetune/Learning Rate": 1.0692873673891256e-05, "Finetune/Loss": 0.7881977558135986, "Finetune/Loss (Raw)": 0.8531970381736755, "Finetune/Step": 2455, "Finetune/Step Time": 2.845774846151471} +{"Finetune/Learning Rate": 1.0686378102408787e-05, "Finetune/Loss": 0.7879766225814819, "Finetune/Loss (Raw)": 0.8233473300933838, "Finetune/Step": 2456, "Finetune/Step Time": 2.8425727877765894} +{"Finetune/Learning Rate": 1.0679882239942718e-05, "Finetune/Loss": 0.7870767116546631, "Finetune/Loss (Raw)": 0.8424388766288757, "Finetune/Step": 2457, "Finetune/Step Time": 2.8470369931310415} +{"Finetune/Learning Rate": 1.0673386089246908e-05, "Finetune/Loss": 0.7860832810401917, "Finetune/Loss (Raw)": 0.806454062461853, "Finetune/Step": 2458, "Finetune/Step Time": 2.8501338865607977} +{"Finetune/Learning Rate": 1.0666889653075341e-05, "Finetune/Loss": 0.7860066294670105, "Finetune/Loss (Raw)": 0.8349183201789856, "Finetune/Step": 2459, "Finetune/Step Time": 2.8530772924423218} +{"Finetune/Learning Rate": 1.066039293418212e-05, "Finetune/Loss": 0.7847024202346802, "Finetune/Loss (Raw)": 0.6915825605392456, "Finetune/Step": 2460, "Finetune/Step Time": 2.8545981738716364} +{"Finetune/Learning Rate": 1.0653895935321462e-05, "Finetune/Loss": 0.7892365455627441, "Finetune/Loss (Raw)": 0.7943093776702881, "Finetune/Step": 2461, "Finetune/Step Time": 2.823795238509774} +{"Finetune/Learning Rate": 1.064739865924772e-05, "Finetune/Loss": 0.7862764596939087, "Finetune/Loss (Raw)": 0.3882092535495758, "Finetune/Step": 2462, "Finetune/Step Time": 2.848075957968831} +{"Finetune/Learning Rate": 1.0640901108715348e-05, "Finetune/Loss": 0.7868266105651855, "Finetune/Loss (Raw)": 0.8518261909484863, "Finetune/Step": 2463, "Finetune/Step Time": 2.8464494682848454} +{"Finetune/Learning Rate": 1.0634403286478926e-05, "Finetune/Loss": 0.7824538350105286, "Finetune/Loss (Raw)": 0.2189905047416687, "Finetune/Step": 2464, "Finetune/Step Time": 2.8755887541919947} +{"Finetune/Learning Rate": 1.0627905195293135e-05, "Finetune/Loss": 0.7824956774711609, "Finetune/Loss (Raw)": 0.8611290454864502, "Finetune/Step": 2465, "Finetune/Step Time": 2.8747631181031466} +{"Finetune/Learning Rate": 1.0621406837912789e-05, "Finetune/Loss": 0.7831331491470337, "Finetune/Loss (Raw)": 0.9213297963142395, "Finetune/Step": 2466, "Finetune/Step Time": 2.8729913663119078} +{"Finetune/Learning Rate": 1.0614908217092805e-05, "Finetune/Loss": 0.7833247184753418, "Finetune/Loss (Raw)": 0.8264771103858948, "Finetune/Step": 2467, "Finetune/Step Time": 2.873615600168705} +{"Finetune/Learning Rate": 1.0608409335588212e-05, "Finetune/Loss": 0.7841429114341736, "Finetune/Loss (Raw)": 0.7141482830047607, "Finetune/Step": 2468, "Finetune/Step Time": 2.873803861439228} +{"Finetune/Learning Rate": 1.060191019615415e-05, "Finetune/Loss": 0.7806541323661804, "Finetune/Loss (Raw)": 0.3225756287574768, "Finetune/Step": 2469, "Finetune/Step Time": 2.907226936891675} +{"Finetune/Learning Rate": 1.059541080154587e-05, "Finetune/Loss": 0.7807562351226807, "Finetune/Loss (Raw)": 0.8235390782356262, "Finetune/Step": 2470, "Finetune/Step Time": 2.902095379307866} +{"Finetune/Learning Rate": 1.0588911154518725e-05, "Finetune/Loss": 0.780487060546875, "Finetune/Loss (Raw)": 0.7189010977745056, "Finetune/Step": 2471, "Finetune/Step Time": 2.9027321748435497} +{"Finetune/Learning Rate": 1.0582411257828185e-05, "Finetune/Loss": 0.7816691398620605, "Finetune/Loss (Raw)": 0.9328698515892029, "Finetune/Step": 2472, "Finetune/Step Time": 2.908259518444538} +{"Finetune/Learning Rate": 1.0575911114229818e-05, "Finetune/Loss": 0.7818199396133423, "Finetune/Loss (Raw)": 0.7671725749969482, "Finetune/Step": 2473, "Finetune/Step Time": 2.9132244139909744} +{"Finetune/Learning Rate": 1.0569410726479301e-05, "Finetune/Loss": 0.782053530216217, "Finetune/Loss (Raw)": 0.8427791595458984, "Finetune/Step": 2474, "Finetune/Step Time": 2.9123460557311773} +{"Finetune/Learning Rate": 1.0562910097332411e-05, "Finetune/Loss": 0.7810077667236328, "Finetune/Loss (Raw)": 0.7887169718742371, "Finetune/Step": 2475, "Finetune/Step Time": 2.911138167604804} +{"Finetune/Learning Rate": 1.055640922954503e-05, "Finetune/Loss": 0.7831085920333862, "Finetune/Loss (Raw)": 0.8522895574569702, "Finetune/Step": 2476, "Finetune/Step Time": 2.8883830793201923} +{"Finetune/Learning Rate": 1.054990812587314e-05, "Finetune/Loss": 0.7838730812072754, "Finetune/Loss (Raw)": 0.8894277215003967, "Finetune/Step": 2477, "Finetune/Step Time": 2.889890296384692} +{"Finetune/Learning Rate": 1.0543406789072827e-05, "Finetune/Loss": 0.782971203327179, "Finetune/Loss (Raw)": 0.7323727011680603, "Finetune/Step": 2478, "Finetune/Step Time": 2.887015998363495} +{"Finetune/Learning Rate": 1.0536905221900268e-05, "Finetune/Loss": 0.7815693616867065, "Finetune/Loss (Raw)": 0.6984090805053711, "Finetune/Step": 2479, "Finetune/Step Time": 2.889461712911725} +{"Finetune/Learning Rate": 1.0530403427111739e-05, "Finetune/Loss": 0.7797069549560547, "Finetune/Loss (Raw)": 0.5087239742279053, "Finetune/Step": 2480, "Finetune/Step Time": 2.916675617918372} +{"Finetune/Learning Rate": 1.0523901407463624e-05, "Finetune/Loss": 0.7795453667640686, "Finetune/Loss (Raw)": 0.8302679657936096, "Finetune/Step": 2481, "Finetune/Step Time": 2.9190468080341816} +{"Finetune/Learning Rate": 1.0517399165712385e-05, "Finetune/Loss": 0.7785565853118896, "Finetune/Loss (Raw)": 0.7992252707481384, "Finetune/Step": 2482, "Finetune/Step Time": 2.919671906158328} +{"Finetune/Learning Rate": 1.0510896704614593e-05, "Finetune/Loss": 0.7820466160774231, "Finetune/Loss (Raw)": 0.7468163371086121, "Finetune/Step": 2483, "Finetune/Step Time": 2.8890827372670174} +{"Finetune/Learning Rate": 1.0504394026926902e-05, "Finetune/Loss": 0.7820266485214233, "Finetune/Loss (Raw)": 0.780894935131073, "Finetune/Step": 2484, "Finetune/Step Time": 2.891528397798538} +{"Finetune/Learning Rate": 1.0497891135406064e-05, "Finetune/Loss": 0.7859081625938416, "Finetune/Loss (Raw)": 0.8964330554008484, "Finetune/Step": 2485, "Finetune/Step Time": 2.861883796751499} +{"Finetune/Learning Rate": 1.0491388032808918e-05, "Finetune/Loss": 0.7849532961845398, "Finetune/Loss (Raw)": 0.7472615242004395, "Finetune/Step": 2486, "Finetune/Step Time": 2.8587519638240337} +{"Finetune/Learning Rate": 1.0484884721892394e-05, "Finetune/Loss": 0.7851190567016602, "Finetune/Loss (Raw)": 0.8509975671768188, "Finetune/Step": 2487, "Finetune/Step Time": 2.8626360055059195} +{"Finetune/Learning Rate": 1.047838120541351e-05, "Finetune/Loss": 0.7846633791923523, "Finetune/Loss (Raw)": 0.8243343830108643, "Finetune/Step": 2488, "Finetune/Step Time": 2.873709661886096} +{"Finetune/Learning Rate": 1.0471877486129369e-05, "Finetune/Loss": 0.7834371328353882, "Finetune/Loss (Raw)": 0.7337188720703125, "Finetune/Step": 2489, "Finetune/Step Time": 2.872252831235528} +{"Finetune/Learning Rate": 1.0465373566797166e-05, "Finetune/Loss": 0.7850430011749268, "Finetune/Loss (Raw)": 0.8647870421409607, "Finetune/Step": 2490, "Finetune/Step Time": 2.8485474940389395} +{"Finetune/Learning Rate": 1.0458869450174177e-05, "Finetune/Loss": 0.7847594022750854, "Finetune/Loss (Raw)": 0.7781299948692322, "Finetune/Step": 2491, "Finetune/Step Time": 2.852695031091571} +{"Finetune/Learning Rate": 1.0452365139017759e-05, "Finetune/Loss": 0.786605954170227, "Finetune/Loss (Raw)": 0.860099196434021, "Finetune/Step": 2492, "Finetune/Step Time": 2.8310823794454336} +{"Finetune/Learning Rate": 1.0445860636085357e-05, "Finetune/Loss": 0.7869532108306885, "Finetune/Loss (Raw)": 0.8659678101539612, "Finetune/Step": 2493, "Finetune/Step Time": 2.830800335854292} +{"Finetune/Learning Rate": 1.0439355944134487e-05, "Finetune/Loss": 0.7864120006561279, "Finetune/Loss (Raw)": 0.7960938215255737, "Finetune/Step": 2494, "Finetune/Step Time": 2.830698683857918} +{"Finetune/Learning Rate": 1.0432851065922764e-05, "Finetune/Loss": 0.7879745364189148, "Finetune/Loss (Raw)": 0.8653807640075684, "Finetune/Step": 2495, "Finetune/Step Time": 2.83381106890738} +{"Finetune/Learning Rate": 1.0426346004207863e-05, "Finetune/Loss": 0.7881087064743042, "Finetune/Loss (Raw)": 0.9165973663330078, "Finetune/Step": 2496, "Finetune/Step Time": 2.838287826627493} +{"Finetune/Learning Rate": 1.0419840761747547e-05, "Finetune/Loss": 0.7883516550064087, "Finetune/Loss (Raw)": 0.877196729183197, "Finetune/Step": 2497, "Finetune/Step Time": 2.8341592233628035} +{"Finetune/Learning Rate": 1.0413335341299649e-05, "Finetune/Loss": 0.788256824016571, "Finetune/Loss (Raw)": 0.8327831029891968, "Finetune/Step": 2498, "Finetune/Step Time": 2.835963813588023} +{"Finetune/Learning Rate": 1.0406829745622085e-05, "Finetune/Loss": 0.7892613410949707, "Finetune/Loss (Raw)": 0.9158033728599548, "Finetune/Step": 2499, "Finetune/Step Time": 2.8402621801942587} +{"Finetune/Learning Rate": 1.0400323977472842e-05, "Finetune/Loss": 0.7898594737052917, "Finetune/Loss (Raw)": 0.8535273671150208, "Finetune/Step": 2500, "Finetune/Step Time": 2.838387869298458} +{"Finetune/Learning Rate": 1.0393818039609979e-05, "Finetune/Loss": 0.7904644012451172, "Finetune/Loss (Raw)": 0.7916371822357178, "Finetune/Step": 2501, "Finetune/Step Time": 2.8403171449899673} +{"Finetune/Learning Rate": 1.0387311934791627e-05, "Finetune/Loss": 0.7905711531639099, "Finetune/Loss (Raw)": 0.8527755737304688, "Finetune/Step": 2502, "Finetune/Step Time": 2.8436282202601433} +{"Finetune/Learning Rate": 1.0380805665775988e-05, "Finetune/Loss": 0.7898604869842529, "Finetune/Loss (Raw)": 0.7814907431602478, "Finetune/Step": 2503, "Finetune/Step Time": 2.848036389797926} +{"Finetune/Learning Rate": 1.0374299235321337e-05, "Finetune/Loss": 0.7920690774917603, "Finetune/Loss (Raw)": 0.8718705177307129, "Finetune/Step": 2504, "Finetune/Step Time": 2.8162284418940544} +{"Finetune/Learning Rate": 1.0367792646186012e-05, "Finetune/Loss": 0.7923051118850708, "Finetune/Loss (Raw)": 0.7901155948638916, "Finetune/Step": 2505, "Finetune/Step Time": 2.812791895121336} +{"Finetune/Learning Rate": 1.0361285901128421e-05, "Finetune/Loss": 0.7975825071334839, "Finetune/Loss (Raw)": 0.9231181740760803, "Finetune/Step": 2506, "Finetune/Step Time": 2.779073351994157} +{"Finetune/Learning Rate": 1.0354779002907041e-05, "Finetune/Loss": 0.7980501055717468, "Finetune/Loss (Raw)": 0.8801279067993164, "Finetune/Step": 2507, "Finetune/Step Time": 2.7806472089141607} +{"Finetune/Learning Rate": 1.0348271954280403e-05, "Finetune/Loss": 0.7984490394592285, "Finetune/Loss (Raw)": 0.8140239119529724, "Finetune/Step": 2508, "Finetune/Step Time": 2.7803668212145567} +{"Finetune/Learning Rate": 1.0341764758007118e-05, "Finetune/Loss": 0.7981191277503967, "Finetune/Loss (Raw)": 0.8534553647041321, "Finetune/Step": 2509, "Finetune/Step Time": 2.7807234060019255} +{"Finetune/Learning Rate": 1.033525741684585e-05, "Finetune/Loss": 0.796913743019104, "Finetune/Loss (Raw)": 0.7207117676734924, "Finetune/Step": 2510, "Finetune/Step Time": 2.779985025525093} +{"Finetune/Learning Rate": 1.0328749933555322e-05, "Finetune/Loss": 0.7968580722808838, "Finetune/Loss (Raw)": 0.8912250399589539, "Finetune/Step": 2511, "Finetune/Step Time": 2.784722052514553} +{"Finetune/Learning Rate": 1.0322242310894323e-05, "Finetune/Loss": 0.7971771359443665, "Finetune/Loss (Raw)": 0.813958466053009, "Finetune/Step": 2512, "Finetune/Step Time": 2.7840224355459213} +{"Finetune/Learning Rate": 1.0315734551621699e-05, "Finetune/Loss": 0.7944521903991699, "Finetune/Loss (Raw)": 0.4978988468647003, "Finetune/Step": 2513, "Finetune/Step Time": 2.804088268429041} +{"Finetune/Learning Rate": 1.0309226658496355e-05, "Finetune/Loss": 0.7939190864562988, "Finetune/Loss (Raw)": 0.7777836322784424, "Finetune/Step": 2514, "Finetune/Step Time": 2.811424743384123} +{"Finetune/Learning Rate": 1.0302718634277248e-05, "Finetune/Loss": 0.7929381132125854, "Finetune/Loss (Raw)": 0.6050127744674683, "Finetune/Step": 2515, "Finetune/Step Time": 2.8333640545606613} +{"Finetune/Learning Rate": 1.0296210481723396e-05, "Finetune/Loss": 0.7935721278190613, "Finetune/Loss (Raw)": 0.868225634098053, "Finetune/Step": 2516, "Finetune/Step Time": 2.836706342175603} +{"Finetune/Learning Rate": 1.0289702203593872e-05, "Finetune/Loss": 0.7919944524765015, "Finetune/Loss (Raw)": 0.7338758707046509, "Finetune/Step": 2517, "Finetune/Step Time": 2.8366283793002367} +{"Finetune/Learning Rate": 1.0283193802647797e-05, "Finetune/Loss": 0.7923814058303833, "Finetune/Loss (Raw)": 0.8641977906227112, "Finetune/Step": 2518, "Finetune/Step Time": 2.8391376715153456} +{"Finetune/Learning Rate": 1.027668528164435e-05, "Finetune/Loss": 0.7930022478103638, "Finetune/Loss (Raw)": 0.8054072856903076, "Finetune/Step": 2519, "Finetune/Step Time": 2.837095880880952} +{"Finetune/Learning Rate": 1.0270176643342755e-05, "Finetune/Loss": 0.7921248078346252, "Finetune/Loss (Raw)": 0.67884761095047, "Finetune/Step": 2520, "Finetune/Step Time": 2.8604928478598595} +{"Finetune/Learning Rate": 1.026366789050229e-05, "Finetune/Loss": 0.7920304536819458, "Finetune/Loss (Raw)": 0.8000643253326416, "Finetune/Step": 2521, "Finetune/Step Time": 2.8590819109231234} +{"Finetune/Learning Rate": 1.0257159025882278e-05, "Finetune/Loss": 0.792011559009552, "Finetune/Loss (Raw)": 0.8827620148658752, "Finetune/Step": 2522, "Finetune/Step Time": 2.859524490311742} +{"Finetune/Learning Rate": 1.0250650052242092e-05, "Finetune/Loss": 0.791938066482544, "Finetune/Loss (Raw)": 0.8549081683158875, "Finetune/Step": 2523, "Finetune/Step Time": 2.863203015178442} +{"Finetune/Learning Rate": 1.0244140972341155e-05, "Finetune/Loss": 0.7918634414672852, "Finetune/Loss (Raw)": 0.7800061702728271, "Finetune/Step": 2524, "Finetune/Step Time": 2.8634910732507706} +{"Finetune/Learning Rate": 1.0237631788938926e-05, "Finetune/Loss": 0.7907357215881348, "Finetune/Loss (Raw)": 0.6994158625602722, "Finetune/Step": 2525, "Finetune/Step Time": 2.8848241716623306} +{"Finetune/Learning Rate": 1.0231122504794916e-05, "Finetune/Loss": 0.7914512157440186, "Finetune/Loss (Raw)": 0.8878387212753296, "Finetune/Step": 2526, "Finetune/Step Time": 2.886627808213234} +{"Finetune/Learning Rate": 1.022461312266867e-05, "Finetune/Loss": 0.791589081287384, "Finetune/Loss (Raw)": 0.7939258217811584, "Finetune/Step": 2527, "Finetune/Step Time": 2.8850731253623962} +{"Finetune/Learning Rate": 1.0218103645319784e-05, "Finetune/Loss": 0.7889552712440491, "Finetune/Loss (Raw)": 0.5322683453559875, "Finetune/Step": 2528, "Finetune/Step Time": 2.9100569654256105} +{"Finetune/Learning Rate": 1.021159407550789e-05, "Finetune/Loss": 0.7893505096435547, "Finetune/Loss (Raw)": 0.836768627166748, "Finetune/Step": 2529, "Finetune/Step Time": 2.912741666659713} +{"Finetune/Learning Rate": 1.0205084415992664e-05, "Finetune/Loss": 0.7890692949295044, "Finetune/Loss (Raw)": 0.8154285550117493, "Finetune/Step": 2530, "Finetune/Step Time": 2.9101959355175495} +{"Finetune/Learning Rate": 1.0198574669533805e-05, "Finetune/Loss": 0.7887696027755737, "Finetune/Loss (Raw)": 0.846425473690033, "Finetune/Step": 2531, "Finetune/Step Time": 2.9115469995886087} +{"Finetune/Learning Rate": 1.0192064838891065e-05, "Finetune/Loss": 0.7892998456954956, "Finetune/Loss (Raw)": 0.8539185523986816, "Finetune/Step": 2532, "Finetune/Step Time": 2.913021843880415} +{"Finetune/Learning Rate": 1.0185554926824229e-05, "Finetune/Loss": 0.7896861433982849, "Finetune/Loss (Raw)": 0.9077807068824768, "Finetune/Step": 2533, "Finetune/Step Time": 2.915542995557189} +{"Finetune/Learning Rate": 1.0179044936093109e-05, "Finetune/Loss": 0.7898277044296265, "Finetune/Loss (Raw)": 0.8116928339004517, "Finetune/Step": 2534, "Finetune/Step Time": 2.918755602091551} +{"Finetune/Learning Rate": 1.017253486945756e-05, "Finetune/Loss": 0.7883468866348267, "Finetune/Loss (Raw)": 0.6540436744689941, "Finetune/Step": 2535, "Finetune/Step Time": 2.9374098610132933} +{"Finetune/Learning Rate": 1.0166024729677455e-05, "Finetune/Loss": 0.789939284324646, "Finetune/Loss (Raw)": 0.9587951302528381, "Finetune/Step": 2536, "Finetune/Step Time": 2.945190714672208} +{"Finetune/Learning Rate": 1.0159514519512716e-05, "Finetune/Loss": 0.7895524501800537, "Finetune/Loss (Raw)": 0.6325159072875977, "Finetune/Step": 2537, "Finetune/Step Time": 2.9452741909772158} +{"Finetune/Learning Rate": 1.0153004241723283e-05, "Finetune/Loss": 0.7889927625656128, "Finetune/Loss (Raw)": 0.7543354630470276, "Finetune/Step": 2538, "Finetune/Step Time": 2.9466187302023172} +{"Finetune/Learning Rate": 1.0146493899069128e-05, "Finetune/Loss": 0.7884396314620972, "Finetune/Loss (Raw)": 0.779413640499115, "Finetune/Step": 2539, "Finetune/Step Time": 2.951145324856043} +{"Finetune/Learning Rate": 1.0139983494310249e-05, "Finetune/Loss": 0.7884937524795532, "Finetune/Loss (Raw)": 0.8331770300865173, "Finetune/Step": 2540, "Finetune/Step Time": 2.950845941901207} +{"Finetune/Learning Rate": 1.0133473030206669e-05, "Finetune/Loss": 0.7869974374771118, "Finetune/Loss (Raw)": 0.5683687329292297, "Finetune/Step": 2541, "Finetune/Step Time": 2.9758227542042732} +{"Finetune/Learning Rate": 1.0126962509518443e-05, "Finetune/Loss": 0.7874010801315308, "Finetune/Loss (Raw)": 0.7927280068397522, "Finetune/Step": 2542, "Finetune/Step Time": 2.9744498170912266} +{"Finetune/Learning Rate": 1.0120451935005647e-05, "Finetune/Loss": 0.7865836024284363, "Finetune/Loss (Raw)": 0.8085944056510925, "Finetune/Step": 2543, "Finetune/Step Time": 2.975035874173045} +{"Finetune/Learning Rate": 1.0113941309428373e-05, "Finetune/Loss": 0.7867828607559204, "Finetune/Loss (Raw)": 0.8469408750534058, "Finetune/Step": 2544, "Finetune/Step Time": 2.985834028571844} +{"Finetune/Learning Rate": 1.0107430635546741e-05, "Finetune/Loss": 0.7916586399078369, "Finetune/Loss (Raw)": 0.8713192343711853, "Finetune/Step": 2545, "Finetune/Step Time": 2.952527606859803} +{"Finetune/Learning Rate": 1.0100919916120892e-05, "Finetune/Loss": 0.7908706665039062, "Finetune/Loss (Raw)": 0.7492128610610962, "Finetune/Step": 2546, "Finetune/Step Time": 2.9516644403338432} +{"Finetune/Learning Rate": 1.009440915391099e-05, "Finetune/Loss": 0.7913246154785156, "Finetune/Loss (Raw)": 0.8341339230537415, "Finetune/Step": 2547, "Finetune/Step Time": 2.9515437185764313} +{"Finetune/Learning Rate": 1.0087898351677204e-05, "Finetune/Loss": 0.7911806106567383, "Finetune/Loss (Raw)": 0.7574064135551453, "Finetune/Step": 2548, "Finetune/Step Time": 2.949759528040886} +{"Finetune/Learning Rate": 1.008138751217973e-05, "Finetune/Loss": 0.7900357246398926, "Finetune/Loss (Raw)": 0.6193583011627197, "Finetune/Step": 2549, "Finetune/Step Time": 2.9746143855154514} +{"Finetune/Learning Rate": 1.0074876638178777e-05, "Finetune/Loss": 0.7892844676971436, "Finetune/Loss (Raw)": 0.824375569820404, "Finetune/Step": 2550, "Finetune/Step Time": 2.9758803248405457} +{"Finetune/Learning Rate": 1.0068365732434573e-05, "Finetune/Loss": 0.7888038158416748, "Finetune/Loss (Raw)": 0.7482381463050842, "Finetune/Step": 2551, "Finetune/Step Time": 2.9752956219017506} +{"Finetune/Learning Rate": 1.0061854797707353e-05, "Finetune/Loss": 0.7886129021644592, "Finetune/Loss (Raw)": 0.7629292011260986, "Finetune/Step": 2552, "Finetune/Step Time": 2.977130362764001} +{"Finetune/Learning Rate": 1.005534383675737e-05, "Finetune/Loss": 0.7873858213424683, "Finetune/Loss (Raw)": 0.7923396229743958, "Finetune/Step": 2553, "Finetune/Step Time": 2.978003468364477} +{"Finetune/Learning Rate": 1.0048832852344881e-05, "Finetune/Loss": 0.7874451875686646, "Finetune/Loss (Raw)": 0.9148914813995361, "Finetune/Step": 2554, "Finetune/Step Time": 2.977655118331313} +{"Finetune/Learning Rate": 1.0042321847230156e-05, "Finetune/Loss": 0.7876170873641968, "Finetune/Loss (Raw)": 0.8245593905448914, "Finetune/Step": 2555, "Finetune/Step Time": 2.980812294408679} +{"Finetune/Learning Rate": 1.0035810824173483e-05, "Finetune/Loss": 0.7881137132644653, "Finetune/Loss (Raw)": 0.8026098608970642, "Finetune/Step": 2556, "Finetune/Step Time": 2.981486512348056} +{"Finetune/Learning Rate": 1.0029299785935144e-05, "Finetune/Loss": 0.7883763313293457, "Finetune/Loss (Raw)": 0.8602063655853271, "Finetune/Step": 2557, "Finetune/Step Time": 2.9778023343533278} +{"Finetune/Learning Rate": 1.0022788735275434e-05, "Finetune/Loss": 0.7877441644668579, "Finetune/Loss (Raw)": 0.8408096432685852, "Finetune/Step": 2558, "Finetune/Step Time": 2.9775139819830656} +{"Finetune/Learning Rate": 1.0016277674954651e-05, "Finetune/Loss": 0.7875562906265259, "Finetune/Loss (Raw)": 0.8047695159912109, "Finetune/Step": 2559, "Finetune/Step Time": 2.978408310562372} +{"Finetune/Learning Rate": 1.0009766607733098e-05, "Finetune/Loss": 0.7875620722770691, "Finetune/Loss (Raw)": 0.8447667360305786, "Finetune/Step": 2560, "Finetune/Step Time": 2.9693483747541904} +{"Finetune/Learning Rate": 1.0003255536371086e-05, "Finetune/Loss": 0.7865120768547058, "Finetune/Loss (Raw)": 0.644257664680481, "Finetune/Step": 2561, "Finetune/Step Time": 2.98941863887012} +{"Finetune/Learning Rate": 9.996744463628917e-06, "Finetune/Loss": 0.7866989970207214, "Finetune/Loss (Raw)": 0.7733972668647766, "Finetune/Step": 2562, "Finetune/Step Time": 2.9940206818282604} +{"Finetune/Learning Rate": 9.990233392266904e-06, "Finetune/Loss": 0.7863912582397461, "Finetune/Loss (Raw)": 0.8109317421913147, "Finetune/Step": 2563, "Finetune/Step Time": 2.994314804673195} +{"Finetune/Learning Rate": 9.98372232504535e-06, "Finetune/Loss": 0.7877975106239319, "Finetune/Loss (Raw)": 0.8853350877761841, "Finetune/Step": 2564, "Finetune/Step Time": 2.9888846296817064} +{"Finetune/Learning Rate": 9.97721126472457e-06, "Finetune/Loss": 0.7872905731201172, "Finetune/Loss (Raw)": 0.8257431387901306, "Finetune/Step": 2565, "Finetune/Step Time": 2.990712096914649} +{"Finetune/Learning Rate": 9.97070021406486e-06, "Finetune/Loss": 0.7876346111297607, "Finetune/Loss (Raw)": 0.865374743938446, "Finetune/Step": 2566, "Finetune/Step Time": 2.9917781986296177} +{"Finetune/Learning Rate": 9.96418917582652e-06, "Finetune/Loss": 0.7871071100234985, "Finetune/Loss (Raw)": 0.7696588635444641, "Finetune/Step": 2567, "Finetune/Step Time": 2.9927173741161823} +{"Finetune/Learning Rate": 9.957678152769844e-06, "Finetune/Loss": 0.7879584431648254, "Finetune/Loss (Raw)": 0.8250776529312134, "Finetune/Step": 2568, "Finetune/Step Time": 2.995472675189376} +{"Finetune/Learning Rate": 9.951167147655126e-06, "Finetune/Loss": 0.7869364023208618, "Finetune/Loss (Raw)": 0.816557765007019, "Finetune/Step": 2569, "Finetune/Step Time": 2.996663875877857} +{"Finetune/Learning Rate": 9.944656163242634e-06, "Finetune/Loss": 0.7879735231399536, "Finetune/Loss (Raw)": 0.8010926246643066, "Finetune/Step": 2570, "Finetune/Step Time": 2.998708490282297} +{"Finetune/Learning Rate": 9.938145202292649e-06, "Finetune/Loss": 0.786540150642395, "Finetune/Loss (Raw)": 0.7390808463096619, "Finetune/Step": 2571, "Finetune/Step Time": 3.003482958301902} +{"Finetune/Learning Rate": 9.931634267565432e-06, "Finetune/Loss": 0.7867854833602905, "Finetune/Loss (Raw)": 0.8022704720497131, "Finetune/Step": 2572, "Finetune/Step Time": 3.005362682044506} +{"Finetune/Learning Rate": 9.925123361821227e-06, "Finetune/Loss": 0.7874279618263245, "Finetune/Loss (Raw)": 0.8484911918640137, "Finetune/Step": 2573, "Finetune/Step Time": 3.0037692207843065} +{"Finetune/Learning Rate": 9.918612487820274e-06, "Finetune/Loss": 0.7862752676010132, "Finetune/Loss (Raw)": 0.6959818601608276, "Finetune/Step": 2574, "Finetune/Step Time": 3.002202734351158} +{"Finetune/Learning Rate": 9.912101648322801e-06, "Finetune/Loss": 0.7865287661552429, "Finetune/Loss (Raw)": 0.8317732810974121, "Finetune/Step": 2575, "Finetune/Step Time": 3.003522263839841} +{"Finetune/Learning Rate": 9.905590846089015e-06, "Finetune/Loss": 0.786595344543457, "Finetune/Loss (Raw)": 0.7590616941452026, "Finetune/Step": 2576, "Finetune/Step Time": 3.0035812314599752} +{"Finetune/Learning Rate": 9.89908008387911e-06, "Finetune/Loss": 0.7873750925064087, "Finetune/Loss (Raw)": 0.9036694765090942, "Finetune/Step": 2577, "Finetune/Step Time": 3.002633422613144} +{"Finetune/Learning Rate": 9.89256936445326e-06, "Finetune/Loss": 0.7903446555137634, "Finetune/Loss (Raw)": 0.8522135615348816, "Finetune/Step": 2578, "Finetune/Step Time": 2.9690176229923964} +{"Finetune/Learning Rate": 9.886058690571632e-06, "Finetune/Loss": 0.789212703704834, "Finetune/Loss (Raw)": 0.7551122903823853, "Finetune/Step": 2579, "Finetune/Step Time": 2.96698609739542} +{"Finetune/Learning Rate": 9.879548064994356e-06, "Finetune/Loss": 0.7894721627235413, "Finetune/Loss (Raw)": 0.7411292791366577, "Finetune/Step": 2580, "Finetune/Step Time": 2.945662410929799} +{"Finetune/Learning Rate": 9.87303749048156e-06, "Finetune/Loss": 0.7894490361213684, "Finetune/Loss (Raw)": 0.7996569871902466, "Finetune/Step": 2581, "Finetune/Step Time": 2.946587663143873} +{"Finetune/Learning Rate": 9.866526969793331e-06, "Finetune/Loss": 0.7896268367767334, "Finetune/Loss (Raw)": 0.7841163873672485, "Finetune/Step": 2582, "Finetune/Step Time": 2.944584235548973} +{"Finetune/Learning Rate": 9.860016505689756e-06, "Finetune/Loss": 0.7894480228424072, "Finetune/Loss (Raw)": 0.8303087949752808, "Finetune/Step": 2583, "Finetune/Step Time": 2.9467943254858255} +{"Finetune/Learning Rate": 9.853506100930875e-06, "Finetune/Loss": 0.7892183065414429, "Finetune/Loss (Raw)": 0.7939419746398926, "Finetune/Step": 2584, "Finetune/Step Time": 2.9481128621846437} +{"Finetune/Learning Rate": 9.846995758276719e-06, "Finetune/Loss": 0.7892756462097168, "Finetune/Loss (Raw)": 0.8497729897499084, "Finetune/Step": 2585, "Finetune/Step Time": 2.9444261454045773} +{"Finetune/Learning Rate": 9.840485480487289e-06, "Finetune/Loss": 0.7892342805862427, "Finetune/Loss (Raw)": 0.8011613488197327, "Finetune/Step": 2586, "Finetune/Step Time": 2.9416768848896027} +{"Finetune/Learning Rate": 9.833975270322548e-06, "Finetune/Loss": 0.7889280319213867, "Finetune/Loss (Raw)": 0.7957205176353455, "Finetune/Step": 2587, "Finetune/Step Time": 2.9414897579699755} +{"Finetune/Learning Rate": 9.827465130542444e-06, "Finetune/Loss": 0.790184736251831, "Finetune/Loss (Raw)": 0.8524406552314758, "Finetune/Step": 2588, "Finetune/Step Time": 2.941210813820362} +{"Finetune/Learning Rate": 9.820955063906893e-06, "Finetune/Loss": 0.7908785939216614, "Finetune/Loss (Raw)": 0.8831244111061096, "Finetune/Step": 2589, "Finetune/Step Time": 2.94163747318089} +{"Finetune/Learning Rate": 9.814445073175773e-06, "Finetune/Loss": 0.7942484021186829, "Finetune/Loss (Raw)": 0.819542407989502, "Finetune/Step": 2590, "Finetune/Step Time": 2.917305190116167} +{"Finetune/Learning Rate": 9.807935161108937e-06, "Finetune/Loss": 0.7942701578140259, "Finetune/Loss (Raw)": 0.8546171188354492, "Finetune/Step": 2591, "Finetune/Step Time": 2.918091854080558} +{"Finetune/Learning Rate": 9.801425330466199e-06, "Finetune/Loss": 0.7983226180076599, "Finetune/Loss (Raw)": 0.7376983165740967, "Finetune/Step": 2592, "Finetune/Step Time": 2.8853614516556263} +{"Finetune/Learning Rate": 9.794915584007343e-06, "Finetune/Loss": 0.7977676391601562, "Finetune/Loss (Raw)": 0.7900975942611694, "Finetune/Step": 2593, "Finetune/Step Time": 2.8857110645622015} +{"Finetune/Learning Rate": 9.788405924492111e-06, "Finetune/Loss": 0.7958019971847534, "Finetune/Loss (Raw)": 0.6697236895561218, "Finetune/Step": 2594, "Finetune/Step Time": 2.912915799766779} +{"Finetune/Learning Rate": 9.781896354680218e-06, "Finetune/Loss": 0.7951990962028503, "Finetune/Loss (Raw)": 0.7493082284927368, "Finetune/Step": 2595, "Finetune/Step Time": 2.9132700469344854} +{"Finetune/Learning Rate": 9.775386877331332e-06, "Finetune/Loss": 0.7960618734359741, "Finetune/Loss (Raw)": 0.8245797753334045, "Finetune/Step": 2596, "Finetune/Step Time": 2.8904918879270554} +{"Finetune/Learning Rate": 9.76887749520509e-06, "Finetune/Loss": 0.7995157837867737, "Finetune/Loss (Raw)": 0.7646784782409668, "Finetune/Step": 2597, "Finetune/Step Time": 2.854587133973837} +{"Finetune/Learning Rate": 9.762368211061077e-06, "Finetune/Loss": 0.800249457359314, "Finetune/Loss (Raw)": 0.9174449443817139, "Finetune/Step": 2598, "Finetune/Step Time": 2.854114079847932} +{"Finetune/Learning Rate": 9.755859027658848e-06, "Finetune/Loss": 0.8017795085906982, "Finetune/Loss (Raw)": 0.9147524237632751, "Finetune/Step": 2599, "Finetune/Step Time": 2.852471735328436} +{"Finetune/Learning Rate": 9.749349947757912e-06, "Finetune/Loss": 0.800658106803894, "Finetune/Loss (Raw)": 0.7893300652503967, "Finetune/Step": 2600, "Finetune/Step Time": 2.859274758026004} +{"Finetune/Learning Rate": 9.742840974117727e-06, "Finetune/Loss": 0.8007146120071411, "Finetune/Loss (Raw)": 0.7744114995002747, "Finetune/Step": 2601, "Finetune/Step Time": 2.856351776048541} +{"Finetune/Learning Rate": 9.736332109497714e-06, "Finetune/Loss": 0.8003522157669067, "Finetune/Loss (Raw)": 0.7963848114013672, "Finetune/Step": 2602, "Finetune/Step Time": 2.8614109102636576} +{"Finetune/Learning Rate": 9.729823356657247e-06, "Finetune/Loss": 0.8003860712051392, "Finetune/Loss (Raw)": 0.793049156665802, "Finetune/Step": 2603, "Finetune/Step Time": 2.8610380850732327} +{"Finetune/Learning Rate": 9.723314718355653e-06, "Finetune/Loss": 0.7990731000900269, "Finetune/Loss (Raw)": 0.6842296719551086, "Finetune/Step": 2604, "Finetune/Step Time": 2.8829847052693367} +{"Finetune/Learning Rate": 9.716806197352205e-06, "Finetune/Loss": 0.7987949252128601, "Finetune/Loss (Raw)": 0.8538235425949097, "Finetune/Step": 2605, "Finetune/Step Time": 2.8812794778496027} +{"Finetune/Learning Rate": 9.71029779640613e-06, "Finetune/Loss": 0.7998074293136597, "Finetune/Loss (Raw)": 0.8619710803031921, "Finetune/Step": 2606, "Finetune/Step Time": 2.882898984476924} +{"Finetune/Learning Rate": 9.703789518276608e-06, "Finetune/Loss": 0.8001089096069336, "Finetune/Loss (Raw)": 0.7370064854621887, "Finetune/Step": 2607, "Finetune/Step Time": 2.882639493793249} +{"Finetune/Learning Rate": 9.697281365722754e-06, "Finetune/Loss": 0.8029510974884033, "Finetune/Loss (Raw)": 0.8725093603134155, "Finetune/Step": 2608, "Finetune/Step Time": 2.853980991989374} +{"Finetune/Learning Rate": 9.69077334150365e-06, "Finetune/Loss": 0.8028168082237244, "Finetune/Loss (Raw)": 0.813089907169342, "Finetune/Step": 2609, "Finetune/Step Time": 2.853029564023018} +{"Finetune/Learning Rate": 9.684265448378302e-06, "Finetune/Loss": 0.8029733896255493, "Finetune/Loss (Raw)": 0.8192540407180786, "Finetune/Step": 2610, "Finetune/Step Time": 2.8541310727596283} +{"Finetune/Learning Rate": 9.677757689105682e-06, "Finetune/Loss": 0.8031337261199951, "Finetune/Loss (Raw)": 0.7673555016517639, "Finetune/Step": 2611, "Finetune/Step Time": 2.852534681558609} +{"Finetune/Learning Rate": 9.671250066444681e-06, "Finetune/Loss": 0.8039439916610718, "Finetune/Loss (Raw)": 0.8846030235290527, "Finetune/Step": 2612, "Finetune/Step Time": 2.8519476670771837} +{"Finetune/Learning Rate": 9.664742583154153e-06, "Finetune/Loss": 0.8037556409835815, "Finetune/Loss (Raw)": 0.8723279237747192, "Finetune/Step": 2613, "Finetune/Step Time": 2.85385262966156} +{"Finetune/Learning Rate": 9.658235241992886e-06, "Finetune/Loss": 0.8041610717773438, "Finetune/Loss (Raw)": 0.7991560697555542, "Finetune/Step": 2614, "Finetune/Step Time": 2.8531303461641073} +{"Finetune/Learning Rate": 9.651728045719599e-06, "Finetune/Loss": 0.8035809993743896, "Finetune/Loss (Raw)": 0.7767443656921387, "Finetune/Step": 2615, "Finetune/Step Time": 2.8472862634807825} +{"Finetune/Learning Rate": 9.645220997092964e-06, "Finetune/Loss": 0.8026393055915833, "Finetune/Loss (Raw)": 0.703796923160553, "Finetune/Step": 2616, "Finetune/Step Time": 2.8358506113290787} +{"Finetune/Learning Rate": 9.638714098871582e-06, "Finetune/Loss": 0.803307831287384, "Finetune/Loss (Raw)": 0.8192956447601318, "Finetune/Step": 2617, "Finetune/Step Time": 2.8377564139664173} +{"Finetune/Learning Rate": 9.632207353813992e-06, "Finetune/Loss": 0.8022758960723877, "Finetune/Loss (Raw)": 0.7326969504356384, "Finetune/Step": 2618, "Finetune/Step Time": 2.8394792284816504} +{"Finetune/Learning Rate": 9.625700764678666e-06, "Finetune/Loss": 0.8029431104660034, "Finetune/Loss (Raw)": 0.8635315895080566, "Finetune/Step": 2619, "Finetune/Step Time": 2.8339074552059174} +{"Finetune/Learning Rate": 9.619194334224013e-06, "Finetune/Loss": 0.8026314377784729, "Finetune/Loss (Raw)": 0.820204496383667, "Finetune/Step": 2620, "Finetune/Step Time": 2.831140039488673} +{"Finetune/Learning Rate": 9.612688065208378e-06, "Finetune/Loss": 0.8012567162513733, "Finetune/Loss (Raw)": 0.6900036334991455, "Finetune/Step": 2621, "Finetune/Step Time": 2.830015279352665} +{"Finetune/Learning Rate": 9.606181960390024e-06, "Finetune/Loss": 0.801734209060669, "Finetune/Loss (Raw)": 0.8572125434875488, "Finetune/Step": 2622, "Finetune/Step Time": 2.8314100932329893} +{"Finetune/Learning Rate": 9.599676022527161e-06, "Finetune/Loss": 0.8014426231384277, "Finetune/Loss (Raw)": 0.8280649781227112, "Finetune/Step": 2623, "Finetune/Step Time": 2.82855555601418} +{"Finetune/Learning Rate": 9.593170254377915e-06, "Finetune/Loss": 0.7998141050338745, "Finetune/Loss (Raw)": 0.7081342339515686, "Finetune/Step": 2624, "Finetune/Step Time": 2.824839912354946} +{"Finetune/Learning Rate": 9.586664658700356e-06, "Finetune/Loss": 0.7990648150444031, "Finetune/Loss (Raw)": 0.7812952399253845, "Finetune/Step": 2625, "Finetune/Step Time": 2.826379455626011} +{"Finetune/Learning Rate": 9.580159238252458e-06, "Finetune/Loss": 0.7994688749313354, "Finetune/Loss (Raw)": 0.8845015168190002, "Finetune/Step": 2626, "Finetune/Step Time": 2.8244257420301437} +{"Finetune/Learning Rate": 9.57365399579214e-06, "Finetune/Loss": 0.7975540161132812, "Finetune/Loss (Raw)": 0.6707080006599426, "Finetune/Step": 2627, "Finetune/Step Time": 2.8235006891191006} +{"Finetune/Learning Rate": 9.56714893407724e-06, "Finetune/Loss": 0.7973867058753967, "Finetune/Loss (Raw)": 0.8321035504341125, "Finetune/Step": 2628, "Finetune/Step Time": 2.8260951172560453} +{"Finetune/Learning Rate": 9.560644055865514e-06, "Finetune/Loss": 0.7975479364395142, "Finetune/Loss (Raw)": 0.8122769594192505, "Finetune/Step": 2629, "Finetune/Step Time": 2.823904547840357} +{"Finetune/Learning Rate": 9.554139363914647e-06, "Finetune/Loss": 0.7967352867126465, "Finetune/Loss (Raw)": 0.7487523555755615, "Finetune/Step": 2630, "Finetune/Step Time": 2.823936888948083} +{"Finetune/Learning Rate": 9.547634860982243e-06, "Finetune/Loss": 0.7963168621063232, "Finetune/Loss (Raw)": 0.7279384732246399, "Finetune/Step": 2631, "Finetune/Step Time": 2.820823049172759} +{"Finetune/Learning Rate": 9.541130549825825e-06, "Finetune/Loss": 0.7960721850395203, "Finetune/Loss (Raw)": 0.8405494093894958, "Finetune/Step": 2632, "Finetune/Step Time": 2.8204660788178444} +{"Finetune/Learning Rate": 9.534626433202835e-06, "Finetune/Loss": 0.7961465716362, "Finetune/Loss (Raw)": 0.7996399998664856, "Finetune/Step": 2633, "Finetune/Step Time": 2.822464916855097} +{"Finetune/Learning Rate": 9.528122513870633e-06, "Finetune/Loss": 0.79505455493927, "Finetune/Loss (Raw)": 0.7833320498466492, "Finetune/Step": 2634, "Finetune/Step Time": 2.8249933682382107} +{"Finetune/Learning Rate": 9.521618794586496e-06, "Finetune/Loss": 0.7942962646484375, "Finetune/Loss (Raw)": 0.7830692529678345, "Finetune/Step": 2635, "Finetune/Step Time": 2.820571806281805} +{"Finetune/Learning Rate": 9.515115278107609e-06, "Finetune/Loss": 0.7939956784248352, "Finetune/Loss (Raw)": 0.7755500078201294, "Finetune/Step": 2636, "Finetune/Step Time": 2.82034713588655} +{"Finetune/Learning Rate": 9.508611967191085e-06, "Finetune/Loss": 0.7940799593925476, "Finetune/Loss (Raw)": 0.8642476201057434, "Finetune/Step": 2637, "Finetune/Step Time": 2.822296040132642} +{"Finetune/Learning Rate": 9.502108864593938e-06, "Finetune/Loss": 0.794305682182312, "Finetune/Loss (Raw)": 0.7495980262756348, "Finetune/Step": 2638, "Finetune/Step Time": 2.8243549317121506} +{"Finetune/Learning Rate": 9.495605973073101e-06, "Finetune/Loss": 0.7936698794364929, "Finetune/Loss (Raw)": 0.809846043586731, "Finetune/Step": 2639, "Finetune/Step Time": 2.819675186648965} +{"Finetune/Learning Rate": 9.489103295385409e-06, "Finetune/Loss": 0.7935454845428467, "Finetune/Loss (Raw)": 0.7980395555496216, "Finetune/Step": 2640, "Finetune/Step Time": 2.819487424567342} +{"Finetune/Learning Rate": 9.482600834287617e-06, "Finetune/Loss": 0.7963148355484009, "Finetune/Loss (Raw)": 0.8523693084716797, "Finetune/Step": 2641, "Finetune/Step Time": 2.7969331480562687} +{"Finetune/Learning Rate": 9.47609859253638e-06, "Finetune/Loss": 0.7970930337905884, "Finetune/Loss (Raw)": 0.8773972392082214, "Finetune/Step": 2642, "Finetune/Step Time": 2.794268559664488} +{"Finetune/Learning Rate": 9.469596572888263e-06, "Finetune/Loss": 0.7986399531364441, "Finetune/Loss (Raw)": 0.8030156493186951, "Finetune/Step": 2643, "Finetune/Step Time": 2.7718832567334175} +{"Finetune/Learning Rate": 9.463094778099735e-06, "Finetune/Loss": 0.7982900142669678, "Finetune/Loss (Raw)": 0.8234363794326782, "Finetune/Step": 2644, "Finetune/Step Time": 2.7672533243894577} +{"Finetune/Learning Rate": 9.456593210927173e-06, "Finetune/Loss": 0.7973934412002563, "Finetune/Loss (Raw)": 0.6191166043281555, "Finetune/Step": 2645, "Finetune/Step Time": 2.7911454625427723} +{"Finetune/Learning Rate": 9.450091874126861e-06, "Finetune/Loss": 0.796451210975647, "Finetune/Loss (Raw)": 0.7435905933380127, "Finetune/Step": 2646, "Finetune/Step Time": 2.7882970590144396} +{"Finetune/Learning Rate": 9.443590770454973e-06, "Finetune/Loss": 0.7938986420631409, "Finetune/Loss (Raw)": 0.47867515683174133, "Finetune/Step": 2647, "Finetune/Step Time": 2.8116939943283796} +{"Finetune/Learning Rate": 9.43708990266759e-06, "Finetune/Loss": 0.7955851554870605, "Finetune/Loss (Raw)": 0.8947246074676514, "Finetune/Step": 2648, "Finetune/Step Time": 2.790503364056349} +{"Finetune/Learning Rate": 9.430589273520704e-06, "Finetune/Loss": 0.7955173254013062, "Finetune/Loss (Raw)": 0.7913838624954224, "Finetune/Step": 2649, "Finetune/Step Time": 2.7897237092256546} +{"Finetune/Learning Rate": 9.424088885770185e-06, "Finetune/Loss": 0.7940986156463623, "Finetune/Loss (Raw)": 0.7011657357215881, "Finetune/Step": 2650, "Finetune/Step Time": 2.7913476396352053} +{"Finetune/Learning Rate": 9.41758874217182e-06, "Finetune/Loss": 0.7934500575065613, "Finetune/Loss (Raw)": 0.7718862891197205, "Finetune/Step": 2651, "Finetune/Step Time": 2.788678815588355} +{"Finetune/Learning Rate": 9.411088845481277e-06, "Finetune/Loss": 0.7927525043487549, "Finetune/Loss (Raw)": 0.6907208561897278, "Finetune/Step": 2652, "Finetune/Step Time": 2.791121982038021} +{"Finetune/Learning Rate": 9.404589198454136e-06, "Finetune/Loss": 0.7935464978218079, "Finetune/Loss (Raw)": 0.801051914691925, "Finetune/Step": 2653, "Finetune/Step Time": 2.770593173801899} +{"Finetune/Learning Rate": 9.398089803845852e-06, "Finetune/Loss": 0.7881299257278442, "Finetune/Loss (Raw)": 0.1945182979106903, "Finetune/Step": 2654, "Finetune/Step Time": 2.799999926239252} +{"Finetune/Learning Rate": 9.391590664411791e-06, "Finetune/Loss": 0.788916826248169, "Finetune/Loss (Raw)": 0.894646406173706, "Finetune/Step": 2655, "Finetune/Step Time": 2.8004308082163334} +{"Finetune/Learning Rate": 9.385091782907198e-06, "Finetune/Loss": 0.791192889213562, "Finetune/Loss (Raw)": 0.8236021399497986, "Finetune/Step": 2656, "Finetune/Step Time": 2.7859849836677313} +{"Finetune/Learning Rate": 9.378593162087215e-06, "Finetune/Loss": 0.7913107872009277, "Finetune/Loss (Raw)": 0.851858377456665, "Finetune/Step": 2657, "Finetune/Step Time": 2.7817486487329006} +{"Finetune/Learning Rate": 9.372094804706867e-06, "Finetune/Loss": 0.7917211055755615, "Finetune/Loss (Raw)": 0.8679571747779846, "Finetune/Step": 2658, "Finetune/Step Time": 2.786948326975107} +{"Finetune/Learning Rate": 9.365596713521076e-06, "Finetune/Loss": 0.7895771265029907, "Finetune/Loss (Raw)": 0.5719866156578064, "Finetune/Step": 2659, "Finetune/Step Time": 2.8093379251658916} +{"Finetune/Learning Rate": 9.359098891284653e-06, "Finetune/Loss": 0.7890397906303406, "Finetune/Loss (Raw)": 0.7851460576057434, "Finetune/Step": 2660, "Finetune/Step Time": 2.8108105957508087} +{"Finetune/Learning Rate": 9.352601340752282e-06, "Finetune/Loss": 0.7880407571792603, "Finetune/Loss (Raw)": 0.7798988223075867, "Finetune/Step": 2661, "Finetune/Step Time": 2.809352580457926} +{"Finetune/Learning Rate": 9.346104064678537e-06, "Finetune/Loss": 0.7878934144973755, "Finetune/Loss (Raw)": 0.7928340435028076, "Finetune/Step": 2662, "Finetune/Step Time": 2.80808412283659} +{"Finetune/Learning Rate": 9.339607065817886e-06, "Finetune/Loss": 0.7886853218078613, "Finetune/Loss (Raw)": 0.7554082274436951, "Finetune/Step": 2663, "Finetune/Step Time": 2.7858910132199526} +{"Finetune/Learning Rate": 9.33311034692466e-06, "Finetune/Loss": 0.7885820865631104, "Finetune/Loss (Raw)": 0.9455779790878296, "Finetune/Step": 2664, "Finetune/Step Time": 2.781913975253701} +{"Finetune/Learning Rate": 9.326613910753093e-06, "Finetune/Loss": 0.7899633646011353, "Finetune/Loss (Raw)": 0.8093273043632507, "Finetune/Step": 2665, "Finetune/Step Time": 2.7591818049550056} +{"Finetune/Learning Rate": 9.320117760057282e-06, "Finetune/Loss": 0.7911912798881531, "Finetune/Loss (Raw)": 0.9115036725997925, "Finetune/Step": 2666, "Finetune/Step Time": 2.755239248275757} +{"Finetune/Learning Rate": 9.313621897591216e-06, "Finetune/Loss": 0.791512131690979, "Finetune/Loss (Raw)": 0.8204845786094666, "Finetune/Step": 2667, "Finetune/Step Time": 2.7538352012634277} +{"Finetune/Learning Rate": 9.307126326108747e-06, "Finetune/Loss": 0.7909899950027466, "Finetune/Loss (Raw)": 0.7663427591323853, "Finetune/Step": 2668, "Finetune/Step Time": 2.752777649089694} +{"Finetune/Learning Rate": 9.300631048363618e-06, "Finetune/Loss": 0.7927048802375793, "Finetune/Loss (Raw)": 0.7878749370574951, "Finetune/Step": 2669, "Finetune/Step Time": 2.7308644521981478} +{"Finetune/Learning Rate": 9.294136067109441e-06, "Finetune/Loss": 0.7921395897865295, "Finetune/Loss (Raw)": 0.720369279384613, "Finetune/Step": 2670, "Finetune/Step Time": 2.7337881810963154} +{"Finetune/Learning Rate": 9.287641385099699e-06, "Finetune/Loss": 0.7920828461647034, "Finetune/Loss (Raw)": 0.8013319373130798, "Finetune/Step": 2671, "Finetune/Step Time": 2.7339226715266705} +{"Finetune/Learning Rate": 9.281147005087754e-06, "Finetune/Loss": 0.7916498184204102, "Finetune/Loss (Raw)": 0.7915108799934387, "Finetune/Step": 2672, "Finetune/Step Time": 2.720546267926693} +{"Finetune/Learning Rate": 9.274652929826838e-06, "Finetune/Loss": 0.7912609577178955, "Finetune/Loss (Raw)": 0.8215497732162476, "Finetune/Step": 2673, "Finetune/Step Time": 2.7258552834391594} +{"Finetune/Learning Rate": 9.268159162070058e-06, "Finetune/Loss": 0.7915905714035034, "Finetune/Loss (Raw)": 0.791397750377655, "Finetune/Step": 2674, "Finetune/Step Time": 2.726009974256158} +{"Finetune/Learning Rate": 9.26166570457038e-06, "Finetune/Loss": 0.7920001745223999, "Finetune/Loss (Raw)": 0.8865663409233093, "Finetune/Step": 2675, "Finetune/Step Time": 2.727547151967883} +{"Finetune/Learning Rate": 9.255172560080645e-06, "Finetune/Loss": 0.7917572259902954, "Finetune/Loss (Raw)": 0.7263080477714539, "Finetune/Step": 2676, "Finetune/Step Time": 2.729486668482423} +{"Finetune/Learning Rate": 9.248679731353569e-06, "Finetune/Loss": 0.7935166358947754, "Finetune/Loss (Raw)": 0.8445626497268677, "Finetune/Step": 2677, "Finetune/Step Time": 2.7058531306684017} +{"Finetune/Learning Rate": 9.242187221141716e-06, "Finetune/Loss": 0.7913353443145752, "Finetune/Loss (Raw)": 0.5451744198799133, "Finetune/Step": 2678, "Finetune/Step Time": 2.727689675986767} +{"Finetune/Learning Rate": 9.23569503219753e-06, "Finetune/Loss": 0.7914709448814392, "Finetune/Loss (Raw)": 0.76558917760849, "Finetune/Step": 2679, "Finetune/Step Time": 2.7280691489577293} +{"Finetune/Learning Rate": 9.229203167273313e-06, "Finetune/Loss": 0.7915759086608887, "Finetune/Loss (Raw)": 0.7763678431510925, "Finetune/Step": 2680, "Finetune/Step Time": 2.727453228086233} +{"Finetune/Learning Rate": 9.222711629121235e-06, "Finetune/Loss": 0.7918550968170166, "Finetune/Loss (Raw)": 0.8280807137489319, "Finetune/Step": 2681, "Finetune/Step Time": 2.724509097635746} +{"Finetune/Learning Rate": 9.216220420493314e-06, "Finetune/Loss": 0.7906653881072998, "Finetune/Loss (Raw)": 0.7626022100448608, "Finetune/Step": 2682, "Finetune/Step Time": 2.7253795228898525} +{"Finetune/Learning Rate": 9.209729544141448e-06, "Finetune/Loss": 0.79097580909729, "Finetune/Loss (Raw)": 0.864295482635498, "Finetune/Step": 2683, "Finetune/Step Time": 2.725081916898489} +{"Finetune/Learning Rate": 9.203239002817378e-06, "Finetune/Loss": 0.7904214859008789, "Finetune/Loss (Raw)": 0.7316520810127258, "Finetune/Step": 2684, "Finetune/Step Time": 2.7251039557158947} +{"Finetune/Learning Rate": 9.196748799272706e-06, "Finetune/Loss": 0.7903664708137512, "Finetune/Loss (Raw)": 0.8531674146652222, "Finetune/Step": 2685, "Finetune/Step Time": 2.731148784980178} +{"Finetune/Learning Rate": 9.190258936258896e-06, "Finetune/Loss": 0.7908598184585571, "Finetune/Loss (Raw)": 0.9039546251296997, "Finetune/Step": 2686, "Finetune/Step Time": 2.7296663857996464} +{"Finetune/Learning Rate": 9.183769416527265e-06, "Finetune/Loss": 0.7904714345932007, "Finetune/Loss (Raw)": 0.7550564408302307, "Finetune/Step": 2687, "Finetune/Step Time": 2.7340288311243057} +{"Finetune/Learning Rate": 9.177280242828989e-06, "Finetune/Loss": 0.7908861637115479, "Finetune/Loss (Raw)": 0.8978546857833862, "Finetune/Step": 2688, "Finetune/Step Time": 2.728467745706439} +{"Finetune/Learning Rate": 9.170791417915086e-06, "Finetune/Loss": 0.7918770909309387, "Finetune/Loss (Raw)": 0.7711018919944763, "Finetune/Step": 2689, "Finetune/Step Time": 2.709507005289197} +{"Finetune/Learning Rate": 9.164302944536435e-06, "Finetune/Loss": 0.7930169105529785, "Finetune/Loss (Raw)": 0.9192824363708496, "Finetune/Step": 2690, "Finetune/Step Time": 2.7038889583200216} +{"Finetune/Learning Rate": 9.157814825443767e-06, "Finetune/Loss": 0.7925222516059875, "Finetune/Loss (Raw)": 0.7476233839988708, "Finetune/Step": 2691, "Finetune/Step Time": 2.702480334788561} +{"Finetune/Learning Rate": 9.151327063387652e-06, "Finetune/Loss": 0.7917124629020691, "Finetune/Loss (Raw)": 0.7816804051399231, "Finetune/Step": 2692, "Finetune/Step Time": 2.709935124963522} +{"Finetune/Learning Rate": 9.144839661118523e-06, "Finetune/Loss": 0.7917394042015076, "Finetune/Loss (Raw)": 0.8291955590248108, "Finetune/Step": 2693, "Finetune/Step Time": 2.706897422671318} +{"Finetune/Learning Rate": 9.13835262138665e-06, "Finetune/Loss": 0.790944516658783, "Finetune/Loss (Raw)": 0.7636284828186035, "Finetune/Step": 2694, "Finetune/Step Time": 2.7075041476637125} +{"Finetune/Learning Rate": 9.13186594694216e-06, "Finetune/Loss": 0.7910540699958801, "Finetune/Loss (Raw)": 0.7836742997169495, "Finetune/Step": 2695, "Finetune/Step Time": 2.710261272266507} +{"Finetune/Learning Rate": 9.125379640535007e-06, "Finetune/Loss": 0.7909332513809204, "Finetune/Loss (Raw)": 0.8096145391464233, "Finetune/Step": 2696, "Finetune/Step Time": 2.7118795849382877} +{"Finetune/Learning Rate": 9.118893704915009e-06, "Finetune/Loss": 0.7912144064903259, "Finetune/Loss (Raw)": 0.8525511622428894, "Finetune/Step": 2697, "Finetune/Step Time": 2.7062895074486732} +{"Finetune/Learning Rate": 9.112408142831816e-06, "Finetune/Loss": 0.7908634543418884, "Finetune/Loss (Raw)": 0.7561662793159485, "Finetune/Step": 2698, "Finetune/Step Time": 2.7058305088430643} +{"Finetune/Learning Rate": 9.105922957034921e-06, "Finetune/Loss": 0.7910419702529907, "Finetune/Loss (Raw)": 0.7619374990463257, "Finetune/Step": 2699, "Finetune/Step Time": 2.7064583841711283} +{"Finetune/Learning Rate": 9.099438150273654e-06, "Finetune/Loss": 0.7909526824951172, "Finetune/Loss (Raw)": 0.7908383011817932, "Finetune/Step": 2700, "Finetune/Step Time": 2.7054832447320223} +{"Finetune/Learning Rate": 9.092953725297191e-06, "Finetune/Loss": 0.7910329103469849, "Finetune/Loss (Raw)": 0.8587561249732971, "Finetune/Step": 2701, "Finetune/Step Time": 2.7011576667428017} +{"Finetune/Learning Rate": 9.086469684854553e-06, "Finetune/Loss": 0.7921515703201294, "Finetune/Loss (Raw)": 0.8391755223274231, "Finetune/Step": 2702, "Finetune/Step Time": 2.7021371368318796} +{"Finetune/Learning Rate": 9.079986031694576e-06, "Finetune/Loss": 0.791211724281311, "Finetune/Loss (Raw)": 0.7114689350128174, "Finetune/Step": 2703, "Finetune/Step Time": 2.701248165220022} +{"Finetune/Learning Rate": 9.073502768565947e-06, "Finetune/Loss": 0.7914042472839355, "Finetune/Loss (Raw)": 0.7837007641792297, "Finetune/Step": 2704, "Finetune/Step Time": 2.704673655331135} +{"Finetune/Learning Rate": 9.067019898217192e-06, "Finetune/Loss": 0.7903127670288086, "Finetune/Loss (Raw)": 0.7639622688293457, "Finetune/Step": 2705, "Finetune/Step Time": 2.700817756354809} +{"Finetune/Learning Rate": 9.060537423396651e-06, "Finetune/Loss": 0.7885539531707764, "Finetune/Loss (Raw)": 0.6270826458930969, "Finetune/Step": 2706, "Finetune/Step Time": 2.7271605543792248} +{"Finetune/Learning Rate": 9.05405534685252e-06, "Finetune/Loss": 0.7887946367263794, "Finetune/Loss (Raw)": 0.7859287261962891, "Finetune/Step": 2707, "Finetune/Step Time": 2.7258677165955305} +{"Finetune/Learning Rate": 9.047573671332807e-06, "Finetune/Loss": 0.789543867111206, "Finetune/Loss (Raw)": 0.8370242714881897, "Finetune/Step": 2708, "Finetune/Step Time": 2.7253180909901857} +{"Finetune/Learning Rate": 9.041092399585369e-06, "Finetune/Loss": 0.7895157337188721, "Finetune/Loss (Raw)": 0.7960660457611084, "Finetune/Step": 2709, "Finetune/Step Time": 2.7233687099069357} +{"Finetune/Learning Rate": 9.034611534357868e-06, "Finetune/Loss": 0.7896835207939148, "Finetune/Loss (Raw)": 0.805587887763977, "Finetune/Step": 2710, "Finetune/Step Time": 2.72129724919796} +{"Finetune/Learning Rate": 9.028131078397814e-06, "Finetune/Loss": 0.7907856702804565, "Finetune/Loss (Raw)": 0.9713755249977112, "Finetune/Step": 2711, "Finetune/Step Time": 2.720784669741988} +{"Finetune/Learning Rate": 9.021651034452535e-06, "Finetune/Loss": 0.7904927730560303, "Finetune/Loss (Raw)": 0.7564559578895569, "Finetune/Step": 2712, "Finetune/Step Time": 2.728260651230812} +{"Finetune/Learning Rate": 9.015171405269182e-06, "Finetune/Loss": 0.7900662422180176, "Finetune/Loss (Raw)": 0.7951754331588745, "Finetune/Step": 2713, "Finetune/Step Time": 2.7313696034252644} +{"Finetune/Learning Rate": 9.008692193594735e-06, "Finetune/Loss": 0.7902384996414185, "Finetune/Loss (Raw)": 0.8232138156890869, "Finetune/Step": 2714, "Finetune/Step Time": 2.7330450024455786} +{"Finetune/Learning Rate": 9.002213402175996e-06, "Finetune/Loss": 0.7901310920715332, "Finetune/Loss (Raw)": 0.7819769978523254, "Finetune/Step": 2715, "Finetune/Step Time": 2.7315294295549393} +{"Finetune/Learning Rate": 8.995735033759593e-06, "Finetune/Loss": 0.7908051013946533, "Finetune/Loss (Raw)": 0.9387039542198181, "Finetune/Step": 2716, "Finetune/Step Time": 2.7316269036382437} +{"Finetune/Learning Rate": 8.98925709109196e-06, "Finetune/Loss": 0.7913733720779419, "Finetune/Loss (Raw)": 0.9558709859848022, "Finetune/Step": 2717, "Finetune/Step Time": 2.7276766039431095} +{"Finetune/Learning Rate": 8.982779576919367e-06, "Finetune/Loss": 0.7908822298049927, "Finetune/Loss (Raw)": 0.7566726207733154, "Finetune/Step": 2718, "Finetune/Step Time": 2.729679988697171} +{"Finetune/Learning Rate": 8.976302493987898e-06, "Finetune/Loss": 0.7901217341423035, "Finetune/Loss (Raw)": 0.7572754621505737, "Finetune/Step": 2719, "Finetune/Step Time": 2.7278025150299072} +{"Finetune/Learning Rate": 8.969825845043443e-06, "Finetune/Loss": 0.7901108264923096, "Finetune/Loss (Raw)": 0.7363060116767883, "Finetune/Step": 2720, "Finetune/Step Time": 2.7285932432860136} +{"Finetune/Learning Rate": 8.963349632831725e-06, "Finetune/Loss": 0.790290117263794, "Finetune/Loss (Raw)": 0.813042402267456, "Finetune/Step": 2721, "Finetune/Step Time": 2.7273873537778854} +{"Finetune/Learning Rate": 8.956873860098275e-06, "Finetune/Loss": 0.7917160987854004, "Finetune/Loss (Raw)": 0.8522473573684692, "Finetune/Step": 2722, "Finetune/Step Time": 2.7009358629584312} +{"Finetune/Learning Rate": 8.950398529588427e-06, "Finetune/Loss": 0.7919377088546753, "Finetune/Loss (Raw)": 0.7776724696159363, "Finetune/Step": 2723, "Finetune/Step Time": 2.7086685691028833} +{"Finetune/Learning Rate": 8.943923644047343e-06, "Finetune/Loss": 0.7917656898498535, "Finetune/Loss (Raw)": 0.8025690913200378, "Finetune/Step": 2724, "Finetune/Step Time": 2.706827348098159} +{"Finetune/Learning Rate": 8.937449206219992e-06, "Finetune/Loss": 0.7918909788131714, "Finetune/Loss (Raw)": 0.7807075381278992, "Finetune/Step": 2725, "Finetune/Step Time": 2.7101902160793543} +{"Finetune/Learning Rate": 8.93097521885115e-06, "Finetune/Loss": 0.7912468910217285, "Finetune/Loss (Raw)": 0.8350040316581726, "Finetune/Step": 2726, "Finetune/Step Time": 2.709962382912636} +{"Finetune/Learning Rate": 8.924501684685403e-06, "Finetune/Loss": 0.7903828024864197, "Finetune/Loss (Raw)": 0.8041505813598633, "Finetune/Step": 2727, "Finetune/Step Time": 2.7149934489279985} +{"Finetune/Learning Rate": 8.918028606467145e-06, "Finetune/Loss": 0.7900542616844177, "Finetune/Loss (Raw)": 0.7472798228263855, "Finetune/Step": 2728, "Finetune/Step Time": 2.706034427508712} +{"Finetune/Learning Rate": 8.91155598694058e-06, "Finetune/Loss": 0.7902196049690247, "Finetune/Loss (Raw)": 0.7955687642097473, "Finetune/Step": 2729, "Finetune/Step Time": 2.7061482667922974} +{"Finetune/Learning Rate": 8.90508382884971e-06, "Finetune/Loss": 0.790591835975647, "Finetune/Loss (Raw)": 0.844034731388092, "Finetune/Step": 2730, "Finetune/Step Time": 2.704273471608758} +{"Finetune/Learning Rate": 8.898612134938353e-06, "Finetune/Loss": 0.7906065583229065, "Finetune/Loss (Raw)": 0.7949337363243103, "Finetune/Step": 2731, "Finetune/Step Time": 2.7078196983784437} +{"Finetune/Learning Rate": 8.892140907950114e-06, "Finetune/Loss": 0.7888513803482056, "Finetune/Loss (Raw)": 0.4595712125301361, "Finetune/Step": 2732, "Finetune/Step Time": 2.715482957661152} +{"Finetune/Learning Rate": 8.885670150628421e-06, "Finetune/Loss": 0.7885834574699402, "Finetune/Loss (Raw)": 0.8195263743400574, "Finetune/Step": 2733, "Finetune/Step Time": 2.715195532888174} +{"Finetune/Learning Rate": 8.879199865716478e-06, "Finetune/Loss": 0.7874389886856079, "Finetune/Loss (Raw)": 0.7154790163040161, "Finetune/Step": 2734, "Finetune/Step Time": 2.7155331056565046} +{"Finetune/Learning Rate": 8.872730055957313e-06, "Finetune/Loss": 0.7890524864196777, "Finetune/Loss (Raw)": 0.9435333013534546, "Finetune/Step": 2735, "Finetune/Step Time": 2.713515777140856} +{"Finetune/Learning Rate": 8.86626072409374e-06, "Finetune/Loss": 0.7889294624328613, "Finetune/Loss (Raw)": 0.8567706346511841, "Finetune/Step": 2736, "Finetune/Step Time": 2.714184954762459} +{"Finetune/Learning Rate": 8.859791872868363e-06, "Finetune/Loss": 0.7845489978790283, "Finetune/Loss (Raw)": 0.25237444043159485, "Finetune/Step": 2737, "Finetune/Step Time": 2.74119003303349} +{"Finetune/Learning Rate": 8.853323505023601e-06, "Finetune/Loss": 0.7853646278381348, "Finetune/Loss (Raw)": 0.9236662983894348, "Finetune/Step": 2738, "Finetune/Step Time": 2.7657898757606745} +{"Finetune/Learning Rate": 8.846855623301654e-06, "Finetune/Loss": 0.785548210144043, "Finetune/Loss (Raw)": 0.7908437848091125, "Finetune/Step": 2739, "Finetune/Step Time": 2.765573685988784} +{"Finetune/Learning Rate": 8.840388230444524e-06, "Finetune/Loss": 0.7856276631355286, "Finetune/Loss (Raw)": 0.8947808146476746, "Finetune/Step": 2740, "Finetune/Step Time": 2.7632066141813993} +{"Finetune/Learning Rate": 8.833921329193996e-06, "Finetune/Loss": 0.7845696210861206, "Finetune/Loss (Raw)": 0.7369005680084229, "Finetune/Step": 2741, "Finetune/Step Time": 2.759931145235896} +{"Finetune/Learning Rate": 8.827454922291656e-06, "Finetune/Loss": 0.7854811549186707, "Finetune/Loss (Raw)": 0.9158299565315247, "Finetune/Step": 2742, "Finetune/Step Time": 2.758285079151392} +{"Finetune/Learning Rate": 8.82098901247888e-06, "Finetune/Loss": 0.7857931852340698, "Finetune/Loss (Raw)": 0.8166900873184204, "Finetune/Step": 2743, "Finetune/Step Time": 2.7626943551003933} +{"Finetune/Learning Rate": 8.814523602496822e-06, "Finetune/Loss": 0.7853294610977173, "Finetune/Loss (Raw)": 0.6444341540336609, "Finetune/Step": 2744, "Finetune/Step Time": 2.7864697482436895} +{"Finetune/Learning Rate": 8.808058695086439e-06, "Finetune/Loss": 0.7848736047744751, "Finetune/Loss (Raw)": 0.7609439492225647, "Finetune/Step": 2745, "Finetune/Step Time": 2.789981983602047} +{"Finetune/Learning Rate": 8.801594292988465e-06, "Finetune/Loss": 0.785423219203949, "Finetune/Loss (Raw)": 0.8030537366867065, "Finetune/Step": 2746, "Finetune/Step Time": 2.787576638162136} +{"Finetune/Learning Rate": 8.795130398943428e-06, "Finetune/Loss": 0.7847325205802917, "Finetune/Loss (Raw)": 0.7751176357269287, "Finetune/Step": 2747, "Finetune/Step Time": 2.7872081324458122} +{"Finetune/Learning Rate": 8.788667015691628e-06, "Finetune/Loss": 0.7848119735717773, "Finetune/Loss (Raw)": 0.8303750157356262, "Finetune/Step": 2748, "Finetune/Step Time": 2.788779454305768} +{"Finetune/Learning Rate": 8.782204145973162e-06, "Finetune/Loss": 0.7856641411781311, "Finetune/Loss (Raw)": 0.7990819215774536, "Finetune/Step": 2749, "Finetune/Step Time": 2.78986082598567} +{"Finetune/Learning Rate": 8.775741792527902e-06, "Finetune/Loss": 0.7840352058410645, "Finetune/Loss (Raw)": 0.6487099528312683, "Finetune/Step": 2750, "Finetune/Step Time": 2.8105024099349976} +{"Finetune/Learning Rate": 8.769279958095503e-06, "Finetune/Loss": 0.783805787563324, "Finetune/Loss (Raw)": 0.7986987233161926, "Finetune/Step": 2751, "Finetune/Step Time": 2.8121880535036325} +{"Finetune/Learning Rate": 8.762818645415393e-06, "Finetune/Loss": 0.7846629023551941, "Finetune/Loss (Raw)": 0.8178483247756958, "Finetune/Step": 2752, "Finetune/Step Time": 2.8123370558023453} +{"Finetune/Learning Rate": 8.756357857226798e-06, "Finetune/Loss": 0.7850282192230225, "Finetune/Loss (Raw)": 0.8280500173568726, "Finetune/Step": 2753, "Finetune/Step Time": 2.81084662117064} +{"Finetune/Learning Rate": 8.749897596268698e-06, "Finetune/Loss": 0.7845404148101807, "Finetune/Loss (Raw)": 0.8220675587654114, "Finetune/Step": 2754, "Finetune/Step Time": 2.8136365488171577} +{"Finetune/Learning Rate": 8.743437865279866e-06, "Finetune/Loss": 0.7862409353256226, "Finetune/Loss (Raw)": 0.8883673548698425, "Finetune/Step": 2755, "Finetune/Step Time": 2.811558071523905} +{"Finetune/Learning Rate": 8.73697866699884e-06, "Finetune/Loss": 0.7859435677528381, "Finetune/Loss (Raw)": 0.7940423488616943, "Finetune/Step": 2756, "Finetune/Step Time": 2.8127835635095835} +{"Finetune/Learning Rate": 8.730520004163945e-06, "Finetune/Loss": 0.7860730290412903, "Finetune/Loss (Raw)": 0.8288504481315613, "Finetune/Step": 2757, "Finetune/Step Time": 2.816296309232712} +{"Finetune/Learning Rate": 8.72406187951326e-06, "Finetune/Loss": 0.7874722480773926, "Finetune/Loss (Raw)": 0.9278565049171448, "Finetune/Step": 2758, "Finetune/Step Time": 2.8115470204502344} +{"Finetune/Learning Rate": 8.717604295784658e-06, "Finetune/Loss": 0.7841410636901855, "Finetune/Loss (Raw)": 0.3015425205230713, "Finetune/Step": 2759, "Finetune/Step Time": 2.8463767673820257} +{"Finetune/Learning Rate": 8.711147255715761e-06, "Finetune/Loss": 0.7840591073036194, "Finetune/Loss (Raw)": 0.8300611972808838, "Finetune/Step": 2760, "Finetune/Step Time": 2.846228927373886} +{"Finetune/Learning Rate": 8.704690762043981e-06, "Finetune/Loss": 0.7844644784927368, "Finetune/Loss (Raw)": 0.8515236973762512, "Finetune/Step": 2761, "Finetune/Step Time": 2.8442744370549917} +{"Finetune/Learning Rate": 8.698234817506482e-06, "Finetune/Loss": 0.7852421998977661, "Finetune/Loss (Raw)": 0.8828873634338379, "Finetune/Step": 2762, "Finetune/Step Time": 2.8438255060464144} +{"Finetune/Learning Rate": 8.691779424840201e-06, "Finetune/Loss": 0.7858996987342834, "Finetune/Loss (Raw)": 0.8672240376472473, "Finetune/Step": 2763, "Finetune/Step Time": 2.8447980750352144} +{"Finetune/Learning Rate": 8.685324586781846e-06, "Finetune/Loss": 0.7851401567459106, "Finetune/Loss (Raw)": 0.6783264875411987, "Finetune/Step": 2764, "Finetune/Step Time": 2.84562505222857} +{"Finetune/Learning Rate": 8.678870306067882e-06, "Finetune/Loss": 0.7843978404998779, "Finetune/Loss (Raw)": 0.7692291140556335, "Finetune/Step": 2765, "Finetune/Step Time": 2.843164835125208} +{"Finetune/Learning Rate": 8.67241658543454e-06, "Finetune/Loss": 0.7849907875061035, "Finetune/Loss (Raw)": 0.8254915475845337, "Finetune/Step": 2766, "Finetune/Step Time": 2.837371814996004} +{"Finetune/Learning Rate": 8.665963427617817e-06, "Finetune/Loss": 0.7854360342025757, "Finetune/Loss (Raw)": 0.8668425679206848, "Finetune/Step": 2767, "Finetune/Step Time": 2.8378197085112333} +{"Finetune/Learning Rate": 8.659510835353474e-06, "Finetune/Loss": 0.785742998123169, "Finetune/Loss (Raw)": 0.8373329639434814, "Finetune/Step": 2768, "Finetune/Step Time": 2.8535146322101355} +{"Finetune/Learning Rate": 8.65305881137702e-06, "Finetune/Loss": 0.7859581112861633, "Finetune/Loss (Raw)": 0.8799043297767639, "Finetune/Step": 2769, "Finetune/Step Time": 2.854691334068775} +{"Finetune/Learning Rate": 8.64660735842373e-06, "Finetune/Loss": 0.7857552766799927, "Finetune/Loss (Raw)": 0.8514370918273926, "Finetune/Step": 2770, "Finetune/Step Time": 2.849726578220725} +{"Finetune/Learning Rate": 8.640156479228645e-06, "Finetune/Loss": 0.7868325710296631, "Finetune/Loss (Raw)": 0.9409130811691284, "Finetune/Step": 2771, "Finetune/Step Time": 2.8495284616947174} +{"Finetune/Learning Rate": 8.633706176526547e-06, "Finetune/Loss": 0.7871789336204529, "Finetune/Loss (Raw)": 0.867765486240387, "Finetune/Step": 2772, "Finetune/Step Time": 2.8491437900811434} +{"Finetune/Learning Rate": 8.627256453051987e-06, "Finetune/Loss": 0.789304256439209, "Finetune/Loss (Raw)": 0.8911523222923279, "Finetune/Step": 2773, "Finetune/Step Time": 2.8237511944025755} +{"Finetune/Learning Rate": 8.620807311539258e-06, "Finetune/Loss": 0.7902036905288696, "Finetune/Loss (Raw)": 0.8587246537208557, "Finetune/Step": 2774, "Finetune/Step Time": 2.8259234372526407} +{"Finetune/Learning Rate": 8.614358754722428e-06, "Finetune/Loss": 0.7930461168289185, "Finetune/Loss (Raw)": 0.8425024747848511, "Finetune/Step": 2775, "Finetune/Step Time": 2.808104209601879} +{"Finetune/Learning Rate": 8.607910785335284e-06, "Finetune/Loss": 0.7924740314483643, "Finetune/Loss (Raw)": 0.8215065002441406, "Finetune/Step": 2776, "Finetune/Step Time": 2.805589061230421} +{"Finetune/Learning Rate": 8.601463406111398e-06, "Finetune/Loss": 0.7931833267211914, "Finetune/Loss (Raw)": 0.8821619749069214, "Finetune/Step": 2777, "Finetune/Step Time": 2.805486746132374} +{"Finetune/Learning Rate": 8.595016619784067e-06, "Finetune/Loss": 0.7941612601280212, "Finetune/Loss (Raw)": 0.8263456225395203, "Finetune/Step": 2778, "Finetune/Step Time": 2.802890768274665} +{"Finetune/Learning Rate": 8.588570429086351e-06, "Finetune/Loss": 0.7938390970230103, "Finetune/Loss (Raw)": 0.7306491732597351, "Finetune/Step": 2779, "Finetune/Step Time": 2.805716287344694} +{"Finetune/Learning Rate": 8.582124836751049e-06, "Finetune/Loss": 0.7950529456138611, "Finetune/Loss (Raw)": 0.8460990786552429, "Finetune/Step": 2780, "Finetune/Step Time": 2.8050857838243246} +{"Finetune/Learning Rate": 8.57567984551071e-06, "Finetune/Loss": 0.7946628928184509, "Finetune/Loss (Raw)": 0.7511184811592102, "Finetune/Step": 2781, "Finetune/Step Time": 2.803903728723526} +{"Finetune/Learning Rate": 8.569235458097634e-06, "Finetune/Loss": 0.7957375049591064, "Finetune/Loss (Raw)": 0.3320641815662384, "Finetune/Step": 2782, "Finetune/Step Time": 2.8012911714613438} +{"Finetune/Learning Rate": 8.562791677243854e-06, "Finetune/Loss": 0.7947711944580078, "Finetune/Loss (Raw)": 0.77095627784729, "Finetune/Step": 2783, "Finetune/Step Time": 2.8016318269073963} +{"Finetune/Learning Rate": 8.556348505681147e-06, "Finetune/Loss": 0.7945892810821533, "Finetune/Loss (Raw)": 0.8003231883049011, "Finetune/Step": 2784, "Finetune/Step Time": 2.7929958030581474} +{"Finetune/Learning Rate": 8.549905946141045e-06, "Finetune/Loss": 0.7943339347839355, "Finetune/Loss (Raw)": 0.8191692233085632, "Finetune/Step": 2785, "Finetune/Step Time": 2.8156562093645334} +{"Finetune/Learning Rate": 8.543464001354802e-06, "Finetune/Loss": 0.7940793633460999, "Finetune/Loss (Raw)": 0.8353763222694397, "Finetune/Step": 2786, "Finetune/Step Time": 2.811137583106756} +{"Finetune/Learning Rate": 8.537022674053425e-06, "Finetune/Loss": 0.7964895963668823, "Finetune/Loss (Raw)": 0.8805018663406372, "Finetune/Step": 2787, "Finetune/Step Time": 2.7869977932423353} +{"Finetune/Learning Rate": 8.530581966967653e-06, "Finetune/Loss": 0.7969517111778259, "Finetune/Loss (Raw)": 0.8442973494529724, "Finetune/Step": 2788, "Finetune/Step Time": 2.783692594617605} +{"Finetune/Learning Rate": 8.524141882827969e-06, "Finetune/Loss": 0.7973524928092957, "Finetune/Loss (Raw)": 0.8311921954154968, "Finetune/Step": 2789, "Finetune/Step Time": 2.7868180125951767} +{"Finetune/Learning Rate": 8.517702424364581e-06, "Finetune/Loss": 0.7974075675010681, "Finetune/Loss (Raw)": 0.7998902201652527, "Finetune/Step": 2790, "Finetune/Step Time": 2.78938889503479} +{"Finetune/Learning Rate": 8.511263594307437e-06, "Finetune/Loss": 0.7972023487091064, "Finetune/Loss (Raw)": 0.7291364669799805, "Finetune/Step": 2791, "Finetune/Step Time": 2.791081950068474} +{"Finetune/Learning Rate": 8.504825395386222e-06, "Finetune/Loss": 0.7952876687049866, "Finetune/Loss (Raw)": 0.7005031108856201, "Finetune/Step": 2792, "Finetune/Step Time": 2.790279060602188} +{"Finetune/Learning Rate": 8.49838783033035e-06, "Finetune/Loss": 0.7954692840576172, "Finetune/Loss (Raw)": 0.8325691223144531, "Finetune/Step": 2793, "Finetune/Step Time": 2.7945932876318693} +{"Finetune/Learning Rate": 8.491950901868963e-06, "Finetune/Loss": 0.793895959854126, "Finetune/Loss (Raw)": 0.7101193070411682, "Finetune/Step": 2794, "Finetune/Step Time": 2.7975163366645575} +{"Finetune/Learning Rate": 8.485514612730942e-06, "Finetune/Loss": 0.793537974357605, "Finetune/Loss (Raw)": 0.7746613025665283, "Finetune/Step": 2795, "Finetune/Step Time": 2.795187858864665} +{"Finetune/Learning Rate": 8.479078965644893e-06, "Finetune/Loss": 0.7937584519386292, "Finetune/Loss (Raw)": 0.7945657968521118, "Finetune/Step": 2796, "Finetune/Step Time": 2.7945947628468275} +{"Finetune/Learning Rate": 8.472643963339143e-06, "Finetune/Loss": 0.7945672273635864, "Finetune/Loss (Raw)": 0.891391932964325, "Finetune/Step": 2797, "Finetune/Step Time": 2.794377328827977} +{"Finetune/Learning Rate": 8.466209608541753e-06, "Finetune/Loss": 0.7952085733413696, "Finetune/Loss (Raw)": 0.8024702668190002, "Finetune/Step": 2798, "Finetune/Step Time": 2.791656395420432} +{"Finetune/Learning Rate": 8.45977590398051e-06, "Finetune/Loss": 0.7955288887023926, "Finetune/Loss (Raw)": 0.8423259854316711, "Finetune/Step": 2799, "Finetune/Step Time": 2.792574306949973} +{"Finetune/Learning Rate": 8.45334285238292e-06, "Finetune/Loss": 0.7946668267250061, "Finetune/Loss (Raw)": 0.6811727285385132, "Finetune/Step": 2800, "Finetune/Step Time": 2.8189723193645477} +{"Finetune/Learning Rate": 8.446910456476216e-06, "Finetune/Loss": 0.7946274280548096, "Finetune/Loss (Raw)": 0.8164989352226257, "Finetune/Step": 2801, "Finetune/Step Time": 2.8157884143292904} +{"Finetune/Learning Rate": 8.440478718987352e-06, "Finetune/Loss": 0.7952473163604736, "Finetune/Loss (Raw)": 0.8707493543624878, "Finetune/Step": 2802, "Finetune/Step Time": 2.8166874684393406} +{"Finetune/Learning Rate": 8.43404764264301e-06, "Finetune/Loss": 0.7948018312454224, "Finetune/Loss (Raw)": 0.8295387625694275, "Finetune/Step": 2803, "Finetune/Step Time": 2.8131557423621416} +{"Finetune/Learning Rate": 8.427617230169574e-06, "Finetune/Loss": 0.7948043346405029, "Finetune/Loss (Raw)": 0.7266331315040588, "Finetune/Step": 2804, "Finetune/Step Time": 2.8143651504069567} +{"Finetune/Learning Rate": 8.421187484293166e-06, "Finetune/Loss": 0.7940170764923096, "Finetune/Loss (Raw)": 0.7437866926193237, "Finetune/Step": 2805, "Finetune/Step Time": 2.813420431688428} +{"Finetune/Learning Rate": 8.414758407739612e-06, "Finetune/Loss": 0.7960225343704224, "Finetune/Loss (Raw)": 0.8018782138824463, "Finetune/Step": 2806, "Finetune/Step Time": 2.791871489956975} +{"Finetune/Learning Rate": 8.40833000323446e-06, "Finetune/Loss": 0.7962139844894409, "Finetune/Loss (Raw)": 0.790091335773468, "Finetune/Step": 2807, "Finetune/Step Time": 2.7893674448132515} +{"Finetune/Learning Rate": 8.401902273502972e-06, "Finetune/Loss": 0.796625018119812, "Finetune/Loss (Raw)": 0.8289835453033447, "Finetune/Step": 2808, "Finetune/Step Time": 2.78862776607275} +{"Finetune/Learning Rate": 8.395475221270125e-06, "Finetune/Loss": 0.7960152626037598, "Finetune/Loss (Raw)": 0.7500328421592712, "Finetune/Step": 2809, "Finetune/Step Time": 2.794044766575098} +{"Finetune/Learning Rate": 8.389048849260612e-06, "Finetune/Loss": 0.7967446446418762, "Finetune/Loss (Raw)": 0.8559584617614746, "Finetune/Step": 2810, "Finetune/Step Time": 2.795197846367955} +{"Finetune/Learning Rate": 8.382623160198826e-06, "Finetune/Loss": 0.7961522340774536, "Finetune/Loss (Raw)": 0.7884684205055237, "Finetune/Step": 2811, "Finetune/Step Time": 2.793713014572859} +{"Finetune/Learning Rate": 8.376198156808881e-06, "Finetune/Loss": 0.7967060804367065, "Finetune/Loss (Raw)": 0.8025521039962769, "Finetune/Step": 2812, "Finetune/Step Time": 2.7945691663771868} +{"Finetune/Learning Rate": 8.369773841814601e-06, "Finetune/Loss": 0.7947716116905212, "Finetune/Loss (Raw)": 0.6055479645729065, "Finetune/Step": 2813, "Finetune/Step Time": 2.811444589868188} +{"Finetune/Learning Rate": 8.363350217939507e-06, "Finetune/Loss": 0.7941133975982666, "Finetune/Loss (Raw)": 0.8197113275527954, "Finetune/Step": 2814, "Finetune/Step Time": 2.8124002162367105} +{"Finetune/Learning Rate": 8.356927287906841e-06, "Finetune/Loss": 0.7946005463600159, "Finetune/Loss (Raw)": 0.8174058794975281, "Finetune/Step": 2815, "Finetune/Step Time": 2.810297206044197} +{"Finetune/Learning Rate": 8.350505054439539e-06, "Finetune/Loss": 0.7938687801361084, "Finetune/Loss (Raw)": 0.8041919469833374, "Finetune/Step": 2816, "Finetune/Step Time": 2.8128274343907833} +{"Finetune/Learning Rate": 8.344083520260256e-06, "Finetune/Loss": 0.7934514880180359, "Finetune/Loss (Raw)": 0.7176860570907593, "Finetune/Step": 2817, "Finetune/Step Time": 2.813462106510997} +{"Finetune/Learning Rate": 8.33766268809133e-06, "Finetune/Loss": 0.7927178144454956, "Finetune/Loss (Raw)": 0.8253703117370605, "Finetune/Step": 2818, "Finetune/Step Time": 2.8125754054635763} +{"Finetune/Learning Rate": 8.331242560654822e-06, "Finetune/Loss": 0.7937661409378052, "Finetune/Loss (Raw)": 0.8818061351776123, "Finetune/Step": 2819, "Finetune/Step Time": 2.8161632530391216} +{"Finetune/Learning Rate": 8.32482314067248e-06, "Finetune/Loss": 0.7937394976615906, "Finetune/Loss (Raw)": 0.7782737016677856, "Finetune/Step": 2820, "Finetune/Step Time": 2.810041854158044} +{"Finetune/Learning Rate": 8.318404430865761e-06, "Finetune/Loss": 0.7944631576538086, "Finetune/Loss (Raw)": 0.9218211770057678, "Finetune/Step": 2821, "Finetune/Step Time": 2.810655143111944} +{"Finetune/Learning Rate": 8.311986433955812e-06, "Finetune/Loss": 0.7949310541152954, "Finetune/Loss (Raw)": 0.8235176205635071, "Finetune/Step": 2822, "Finetune/Step Time": 2.811181791126728} +{"Finetune/Learning Rate": 8.305569152663486e-06, "Finetune/Loss": 0.7953590154647827, "Finetune/Loss (Raw)": 0.8384637832641602, "Finetune/Step": 2823, "Finetune/Step Time": 2.8084697145968676} +{"Finetune/Learning Rate": 8.299152589709336e-06, "Finetune/Loss": 0.7958542108535767, "Finetune/Loss (Raw)": 0.8729947805404663, "Finetune/Step": 2824, "Finetune/Step Time": 2.8157229088246822} +{"Finetune/Learning Rate": 8.292736747813594e-06, "Finetune/Loss": 0.7953152656555176, "Finetune/Loss (Raw)": 0.7835623621940613, "Finetune/Step": 2825, "Finetune/Step Time": 2.8178415689617395} +{"Finetune/Learning Rate": 8.2863216296962e-06, "Finetune/Loss": 0.794721245765686, "Finetune/Loss (Raw)": 0.6801316738128662, "Finetune/Step": 2826, "Finetune/Step Time": 2.840299976989627} +{"Finetune/Learning Rate": 8.279907238076788e-06, "Finetune/Loss": 0.7954233884811401, "Finetune/Loss (Raw)": 0.851810097694397, "Finetune/Step": 2827, "Finetune/Step Time": 2.8363496102392673} +{"Finetune/Learning Rate": 8.273493575674669e-06, "Finetune/Loss": 0.7946764230728149, "Finetune/Loss (Raw)": 0.6952374577522278, "Finetune/Step": 2828, "Finetune/Step Time": 2.837522514164448} +{"Finetune/Learning Rate": 8.267080645208866e-06, "Finetune/Loss": 0.7939441800117493, "Finetune/Loss (Raw)": 0.7650230526924133, "Finetune/Step": 2829, "Finetune/Step Time": 2.839408800005913} +{"Finetune/Learning Rate": 8.260668449398075e-06, "Finetune/Loss": 0.7924960255622864, "Finetune/Loss (Raw)": 0.6538102626800537, "Finetune/Step": 2830, "Finetune/Step Time": 2.862280908972025} +{"Finetune/Learning Rate": 8.254256990960692e-06, "Finetune/Loss": 0.7917817831039429, "Finetune/Loss (Raw)": 0.6200435757637024, "Finetune/Step": 2831, "Finetune/Step Time": 2.8872657660394907} +{"Finetune/Learning Rate": 8.247846272614788e-06, "Finetune/Loss": 0.7921686768531799, "Finetune/Loss (Raw)": 0.8332231044769287, "Finetune/Step": 2832, "Finetune/Step Time": 2.880584402009845} +{"Finetune/Learning Rate": 8.241436297078133e-06, "Finetune/Loss": 0.7926547527313232, "Finetune/Loss (Raw)": 0.8261866569519043, "Finetune/Step": 2833, "Finetune/Step Time": 2.879775542765856} +{"Finetune/Learning Rate": 8.235027067068176e-06, "Finetune/Loss": 0.794704258441925, "Finetune/Loss (Raw)": 0.8894174695014954, "Finetune/Step": 2834, "Finetune/Step Time": 2.8526728060096502} +{"Finetune/Learning Rate": 8.228618585302047e-06, "Finetune/Loss": 0.7949151992797852, "Finetune/Loss (Raw)": 0.8129204511642456, "Finetune/Step": 2835, "Finetune/Step Time": 2.8558558970689774} +{"Finetune/Learning Rate": 8.222210854496562e-06, "Finetune/Loss": 0.7942009568214417, "Finetune/Loss (Raw)": 0.7456086277961731, "Finetune/Step": 2836, "Finetune/Step Time": 2.860014410689473} +{"Finetune/Learning Rate": 8.215803877368221e-06, "Finetune/Loss": 0.794144332408905, "Finetune/Loss (Raw)": 0.7888216376304626, "Finetune/Step": 2837, "Finetune/Step Time": 2.858056614175439} +{"Finetune/Learning Rate": 8.209397656633207e-06, "Finetune/Loss": 0.7942308187484741, "Finetune/Loss (Raw)": 0.8166492581367493, "Finetune/Step": 2838, "Finetune/Step Time": 2.857255879789591} +{"Finetune/Learning Rate": 8.202992195007372e-06, "Finetune/Loss": 0.7928694486618042, "Finetune/Loss (Raw)": 0.7971278429031372, "Finetune/Step": 2839, "Finetune/Step Time": 2.8573791962116957} +{"Finetune/Learning Rate": 8.196587495206247e-06, "Finetune/Loss": 0.7922924160957336, "Finetune/Loss (Raw)": 0.6825980544090271, "Finetune/Step": 2840, "Finetune/Step Time": 2.851853158324957} +{"Finetune/Learning Rate": 8.190183559945055e-06, "Finetune/Loss": 0.7933101654052734, "Finetune/Loss (Raw)": 0.9254468679428101, "Finetune/Step": 2841, "Finetune/Step Time": 2.853572767227888} +{"Finetune/Learning Rate": 8.183780391938677e-06, "Finetune/Loss": 0.7929325699806213, "Finetune/Loss (Raw)": 0.7748798131942749, "Finetune/Step": 2842, "Finetune/Step Time": 2.852923331782222} +{"Finetune/Learning Rate": 8.17737799390168e-06, "Finetune/Loss": 0.7906839847564697, "Finetune/Loss (Raw)": 0.4941507875919342, "Finetune/Step": 2843, "Finetune/Step Time": 2.8768084682524204} +{"Finetune/Learning Rate": 8.170976368548299e-06, "Finetune/Loss": 0.789738655090332, "Finetune/Loss (Raw)": 0.8177080750465393, "Finetune/Step": 2844, "Finetune/Step Time": 2.875273386016488} +{"Finetune/Learning Rate": 8.164575518592449e-06, "Finetune/Loss": 0.7890796661376953, "Finetune/Loss (Raw)": 0.8715213537216187, "Finetune/Step": 2845, "Finetune/Step Time": 2.8782641403377056} +{"Finetune/Learning Rate": 8.158175446747702e-06, "Finetune/Loss": 0.7901328206062317, "Finetune/Loss (Raw)": 0.8914718627929688, "Finetune/Step": 2846, "Finetune/Step Time": 2.877247739583254} +{"Finetune/Learning Rate": 8.151776155727314e-06, "Finetune/Loss": 0.7898706793785095, "Finetune/Loss (Raw)": 0.7237222790718079, "Finetune/Step": 2847, "Finetune/Step Time": 2.8785908091813326} +{"Finetune/Learning Rate": 8.145377648244207e-06, "Finetune/Loss": 0.7908010482788086, "Finetune/Loss (Raw)": 0.8553926944732666, "Finetune/Step": 2848, "Finetune/Step Time": 2.8813912086188793} +{"Finetune/Learning Rate": 8.138979927010964e-06, "Finetune/Loss": 0.7890243530273438, "Finetune/Loss (Raw)": 0.5856293439865112, "Finetune/Step": 2849, "Finetune/Step Time": 2.9064711928367615} +{"Finetune/Learning Rate": 8.132582994739838e-06, "Finetune/Loss": 0.7893171310424805, "Finetune/Loss (Raw)": 0.8897247910499573, "Finetune/Step": 2850, "Finetune/Step Time": 2.906040959060192} +{"Finetune/Learning Rate": 8.126186854142752e-06, "Finetune/Loss": 0.7876603007316589, "Finetune/Loss (Raw)": 0.5655953288078308, "Finetune/Step": 2851, "Finetune/Step Time": 2.9191534724086523} +{"Finetune/Learning Rate": 8.119791507931294e-06, "Finetune/Loss": 0.7865930199623108, "Finetune/Loss (Raw)": 0.6659590005874634, "Finetune/Step": 2852, "Finetune/Step Time": 2.9220023714005947} +{"Finetune/Learning Rate": 8.113396958816707e-06, "Finetune/Loss": 0.7865778207778931, "Finetune/Loss (Raw)": 0.7787601351737976, "Finetune/Step": 2853, "Finetune/Step Time": 2.921172760426998} +{"Finetune/Learning Rate": 8.107003209509898e-06, "Finetune/Loss": 0.7872679829597473, "Finetune/Loss (Raw)": 0.923344612121582, "Finetune/Step": 2854, "Finetune/Step Time": 2.9213484581559896} +{"Finetune/Learning Rate": 8.100610262721445e-06, "Finetune/Loss": 0.7877422571182251, "Finetune/Loss (Raw)": 0.8648586869239807, "Finetune/Step": 2855, "Finetune/Step Time": 2.917709104716778} +{"Finetune/Learning Rate": 8.094218121161568e-06, "Finetune/Loss": 0.7884871959686279, "Finetune/Loss (Raw)": 0.8426313996315002, "Finetune/Step": 2856, "Finetune/Step Time": 2.9158466272056103} +{"Finetune/Learning Rate": 8.087826787540165e-06, "Finetune/Loss": 0.78888338804245, "Finetune/Loss (Raw)": 0.8462753891944885, "Finetune/Step": 2857, "Finetune/Step Time": 2.9148234706372023} +{"Finetune/Learning Rate": 8.081436264566777e-06, "Finetune/Loss": 0.788200855255127, "Finetune/Loss (Raw)": 0.756673276424408, "Finetune/Step": 2858, "Finetune/Step Time": 2.910270670428872} +{"Finetune/Learning Rate": 8.075046554950612e-06, "Finetune/Loss": 0.7885500192642212, "Finetune/Loss (Raw)": 0.839629054069519, "Finetune/Step": 2859, "Finetune/Step Time": 2.9084963891655207} +{"Finetune/Learning Rate": 8.06865766140052e-06, "Finetune/Loss": 0.7913903594017029, "Finetune/Loss (Raw)": 0.8231340646743774, "Finetune/Step": 2860, "Finetune/Step Time": 2.880503112450242} +{"Finetune/Learning Rate": 8.06226958662502e-06, "Finetune/Loss": 0.7915329933166504, "Finetune/Loss (Raw)": 0.8377823829650879, "Finetune/Step": 2861, "Finetune/Step Time": 2.8805004619061947} +{"Finetune/Learning Rate": 8.055882333332274e-06, "Finetune/Loss": 0.7925571799278259, "Finetune/Loss (Raw)": 0.8465789556503296, "Finetune/Step": 2862, "Finetune/Step Time": 2.8797317650169134} +{"Finetune/Learning Rate": 8.049495904230098e-06, "Finetune/Loss": 0.7902416586875916, "Finetune/Loss (Raw)": 0.6471484303474426, "Finetune/Step": 2863, "Finetune/Step Time": 2.879316534847021} +{"Finetune/Learning Rate": 8.043110302025957e-06, "Finetune/Loss": 0.7904844880104065, "Finetune/Loss (Raw)": 0.8878434896469116, "Finetune/Step": 2864, "Finetune/Step Time": 2.879704402759671} +{"Finetune/Learning Rate": 8.03672552942697e-06, "Finetune/Loss": 0.7954702973365784, "Finetune/Loss (Raw)": 0.8905643820762634, "Finetune/Step": 2865, "Finetune/Step Time": 2.8535193540155888} +{"Finetune/Learning Rate": 8.030341589139908e-06, "Finetune/Loss": 0.7953273057937622, "Finetune/Loss (Raw)": 0.9053571224212646, "Finetune/Step": 2866, "Finetune/Step Time": 2.8253410682082176} +{"Finetune/Learning Rate": 8.023958483871174e-06, "Finetune/Loss": 0.7951937913894653, "Finetune/Loss (Raw)": 0.7737570405006409, "Finetune/Step": 2867, "Finetune/Step Time": 2.829875560477376} +{"Finetune/Learning Rate": 8.017576216326826e-06, "Finetune/Loss": 0.794894814491272, "Finetune/Loss (Raw)": 0.856510579586029, "Finetune/Step": 2868, "Finetune/Step Time": 2.8319999035447836} +{"Finetune/Learning Rate": 8.011194789212577e-06, "Finetune/Loss": 0.7958465218544006, "Finetune/Loss (Raw)": 0.8587203621864319, "Finetune/Step": 2869, "Finetune/Step Time": 2.832649488002062} +{"Finetune/Learning Rate": 8.004814205233759e-06, "Finetune/Loss": 0.7947039604187012, "Finetune/Loss (Raw)": 0.7695810198783875, "Finetune/Step": 2870, "Finetune/Step Time": 2.8362955283373594} +{"Finetune/Learning Rate": 7.998434467095373e-06, "Finetune/Loss": 0.7947509288787842, "Finetune/Loss (Raw)": 0.8227068185806274, "Finetune/Step": 2871, "Finetune/Step Time": 2.8332968037575483} +{"Finetune/Learning Rate": 7.992055577502042e-06, "Finetune/Loss": 0.7958635687828064, "Finetune/Loss (Raw)": 0.7868453860282898, "Finetune/Step": 2872, "Finetune/Step Time": 2.8104828912764788} +{"Finetune/Learning Rate": 7.985677539158044e-06, "Finetune/Loss": 0.7966600656509399, "Finetune/Loss (Raw)": 0.8628987669944763, "Finetune/Step": 2873, "Finetune/Step Time": 2.8058016318827868} +{"Finetune/Learning Rate": 7.979300354767282e-06, "Finetune/Loss": 0.7966556549072266, "Finetune/Loss (Raw)": 0.8024850487709045, "Finetune/Step": 2874, "Finetune/Step Time": 2.8029833752661943} +{"Finetune/Learning Rate": 7.972924027033307e-06, "Finetune/Loss": 0.7944164872169495, "Finetune/Loss (Raw)": 0.48851093649864197, "Finetune/Step": 2875, "Finetune/Step Time": 2.8277155477553606} +{"Finetune/Learning Rate": 7.966548558659305e-06, "Finetune/Loss": 0.7938191890716553, "Finetune/Loss (Raw)": 0.7539241313934326, "Finetune/Step": 2876, "Finetune/Step Time": 2.8328464161604643} +{"Finetune/Learning Rate": 7.960173952348094e-06, "Finetune/Loss": 0.7936939001083374, "Finetune/Loss (Raw)": 0.7830387949943542, "Finetune/Step": 2877, "Finetune/Step Time": 2.8324347492307425} +{"Finetune/Learning Rate": 7.95380021080213e-06, "Finetune/Loss": 0.7951822280883789, "Finetune/Loss (Raw)": 0.8392199873924255, "Finetune/Step": 2878, "Finetune/Step Time": 2.8089216127991676} +{"Finetune/Learning Rate": 7.947427336723503e-06, "Finetune/Loss": 0.7956268787384033, "Finetune/Loss (Raw)": 0.8556196093559265, "Finetune/Step": 2879, "Finetune/Step Time": 2.8089576978236437} +{"Finetune/Learning Rate": 7.941055332813929e-06, "Finetune/Loss": 0.7952027916908264, "Finetune/Loss (Raw)": 0.7635565400123596, "Finetune/Step": 2880, "Finetune/Step Time": 2.82439211755991} +{"Finetune/Learning Rate": 7.934684201774763e-06, "Finetune/Loss": 0.7956918478012085, "Finetune/Loss (Raw)": 0.8906476497650146, "Finetune/Step": 2881, "Finetune/Step Time": 2.824373133480549} +{"Finetune/Learning Rate": 7.928313946306985e-06, "Finetune/Loss": 0.7958344221115112, "Finetune/Loss (Raw)": 0.8403169512748718, "Finetune/Step": 2882, "Finetune/Step Time": 2.8230353239923716} +{"Finetune/Learning Rate": 7.92194456911121e-06, "Finetune/Loss": 0.7959003448486328, "Finetune/Loss (Raw)": 0.8968067765235901, "Finetune/Step": 2883, "Finetune/Step Time": 2.822573209181428} +{"Finetune/Learning Rate": 7.91557607288767e-06, "Finetune/Loss": 0.795986533164978, "Finetune/Loss (Raw)": 0.8050701022148132, "Finetune/Step": 2884, "Finetune/Step Time": 2.8246799279004335} +{"Finetune/Learning Rate": 7.909208460336234e-06, "Finetune/Loss": 0.7955790758132935, "Finetune/Loss (Raw)": 0.7766982316970825, "Finetune/Step": 2885, "Finetune/Step Time": 2.824305072426796} +{"Finetune/Learning Rate": 7.90284173415639e-06, "Finetune/Loss": 0.7951791286468506, "Finetune/Loss (Raw)": 0.8766629695892334, "Finetune/Step": 2886, "Finetune/Step Time": 2.8267759829759598} +{"Finetune/Learning Rate": 7.896475897047254e-06, "Finetune/Loss": 0.7991192936897278, "Finetune/Loss (Raw)": 0.8058885335922241, "Finetune/Step": 2887, "Finetune/Step Time": 2.7903777845203876} +{"Finetune/Learning Rate": 7.890110951707558e-06, "Finetune/Loss": 0.7984221577644348, "Finetune/Loss (Raw)": 0.7408248782157898, "Finetune/Step": 2888, "Finetune/Step Time": 2.792567430064082} +{"Finetune/Learning Rate": 7.883746900835668e-06, "Finetune/Loss": 0.798383891582489, "Finetune/Loss (Raw)": 0.846630334854126, "Finetune/Step": 2889, "Finetune/Step Time": 2.79573574103415} +{"Finetune/Learning Rate": 7.877383747129562e-06, "Finetune/Loss": 0.7966338396072388, "Finetune/Loss (Raw)": 0.6588788032531738, "Finetune/Step": 2890, "Finetune/Step Time": 2.7988836262375116} +{"Finetune/Learning Rate": 7.871021493286837e-06, "Finetune/Loss": 0.7963488101959229, "Finetune/Loss (Raw)": 0.8307415843009949, "Finetune/Step": 2891, "Finetune/Step Time": 2.7979431692510843} +{"Finetune/Learning Rate": 7.864660142004713e-06, "Finetune/Loss": 0.797614574432373, "Finetune/Loss (Raw)": 0.8403380513191223, "Finetune/Step": 2892, "Finetune/Step Time": 2.800671959295869} +{"Finetune/Learning Rate": 7.85829969598003e-06, "Finetune/Loss": 0.7936134338378906, "Finetune/Loss (Raw)": 0.25708967447280884, "Finetune/Step": 2893, "Finetune/Step Time": 2.8305138535797596} +{"Finetune/Learning Rate": 7.85194015790923e-06, "Finetune/Loss": 0.7942161560058594, "Finetune/Loss (Raw)": 0.9026371836662292, "Finetune/Step": 2894, "Finetune/Step Time": 2.834799161180854} +{"Finetune/Learning Rate": 7.84558153048839e-06, "Finetune/Loss": 0.7938859462738037, "Finetune/Loss (Raw)": 0.8245739340782166, "Finetune/Step": 2895, "Finetune/Step Time": 2.834630087018013} +{"Finetune/Learning Rate": 7.839223816413181e-06, "Finetune/Loss": 0.7938611507415771, "Finetune/Loss (Raw)": 0.8341687321662903, "Finetune/Step": 2896, "Finetune/Step Time": 2.8187064100056887} +{"Finetune/Learning Rate": 7.83286701837891e-06, "Finetune/Loss": 0.7943736910820007, "Finetune/Loss (Raw)": 0.9454983472824097, "Finetune/Step": 2897, "Finetune/Step Time": 2.8208794202655554} +{"Finetune/Learning Rate": 7.826511139080468e-06, "Finetune/Loss": 0.7947283983230591, "Finetune/Loss (Raw)": 0.8968464136123657, "Finetune/Step": 2898, "Finetune/Step Time": 2.8253716323524714} +{"Finetune/Learning Rate": 7.82015618121238e-06, "Finetune/Loss": 0.7933171987533569, "Finetune/Loss (Raw)": 0.7602791786193848, "Finetune/Step": 2899, "Finetune/Step Time": 2.825619675219059} +{"Finetune/Learning Rate": 7.813802147468768e-06, "Finetune/Loss": 0.7930604219436646, "Finetune/Loss (Raw)": 0.8348918557167053, "Finetune/Step": 2900, "Finetune/Step Time": 2.8272470515221357} +{"Finetune/Learning Rate": 7.807449040543366e-06, "Finetune/Loss": 0.7930251359939575, "Finetune/Loss (Raw)": 0.8866422772407532, "Finetune/Step": 2901, "Finetune/Step Time": 2.826807327568531} +{"Finetune/Learning Rate": 7.801096863129512e-06, "Finetune/Loss": 0.7931087017059326, "Finetune/Loss (Raw)": 0.8694136738777161, "Finetune/Step": 2902, "Finetune/Step Time": 2.829969462007284} +{"Finetune/Learning Rate": 7.794745617920154e-06, "Finetune/Loss": 0.7923564910888672, "Finetune/Loss (Raw)": 0.7462213635444641, "Finetune/Step": 2903, "Finetune/Step Time": 2.8277691565454006} +{"Finetune/Learning Rate": 7.78839530760785e-06, "Finetune/Loss": 0.7920070886611938, "Finetune/Loss (Raw)": 0.7767927050590515, "Finetune/Step": 2904, "Finetune/Step Time": 2.8244234267622232} +{"Finetune/Learning Rate": 7.782045934884744e-06, "Finetune/Loss": 0.791537880897522, "Finetune/Loss (Raw)": 0.8220964670181274, "Finetune/Step": 2905, "Finetune/Step Time": 2.827496061101556} +{"Finetune/Learning Rate": 7.775697502442598e-06, "Finetune/Loss": 0.7919066548347473, "Finetune/Loss (Raw)": 0.8735519051551819, "Finetune/Step": 2906, "Finetune/Step Time": 2.82968557626009} +{"Finetune/Learning Rate": 7.769350012972774e-06, "Finetune/Loss": 0.7926926612854004, "Finetune/Loss (Raw)": 0.8312527537345886, "Finetune/Step": 2907, "Finetune/Step Time": 2.8296777214854956} +{"Finetune/Learning Rate": 7.763003469166225e-06, "Finetune/Loss": 0.7928831577301025, "Finetune/Loss (Raw)": 0.8704817295074463, "Finetune/Step": 2908, "Finetune/Step Time": 2.826195364817977} +{"Finetune/Learning Rate": 7.756657873713513e-06, "Finetune/Loss": 0.7934958934783936, "Finetune/Loss (Raw)": 0.829553484916687, "Finetune/Step": 2909, "Finetune/Step Time": 2.827631799504161} +{"Finetune/Learning Rate": 7.750313229304794e-06, "Finetune/Loss": 0.7974360585212708, "Finetune/Loss (Raw)": 0.8364059329032898, "Finetune/Step": 2910, "Finetune/Step Time": 2.8004536759108305} +{"Finetune/Learning Rate": 7.74396953862982e-06, "Finetune/Loss": 0.7978153824806213, "Finetune/Loss (Raw)": 0.8195089101791382, "Finetune/Step": 2911, "Finetune/Step Time": 2.8003441020846367} +{"Finetune/Learning Rate": 7.737626804377938e-06, "Finetune/Loss": 0.7981302738189697, "Finetune/Loss (Raw)": 0.8406245112419128, "Finetune/Step": 2912, "Finetune/Step Time": 2.798977419734001} +{"Finetune/Learning Rate": 7.731285029238094e-06, "Finetune/Loss": 0.7978464365005493, "Finetune/Loss (Raw)": 0.782834529876709, "Finetune/Step": 2913, "Finetune/Step Time": 2.774796301499009} +{"Finetune/Learning Rate": 7.724944215898823e-06, "Finetune/Loss": 0.7970572710037231, "Finetune/Loss (Raw)": 0.7343730330467224, "Finetune/Step": 2914, "Finetune/Step Time": 2.777727887034416} +{"Finetune/Learning Rate": 7.718604367048255e-06, "Finetune/Loss": 0.7958468794822693, "Finetune/Loss (Raw)": 0.7255683541297913, "Finetune/Step": 2915, "Finetune/Step Time": 2.7782534826546907} +{"Finetune/Learning Rate": 7.712265485374106e-06, "Finetune/Loss": 0.7959235906600952, "Finetune/Loss (Raw)": 0.8541198372840881, "Finetune/Step": 2916, "Finetune/Step Time": 2.777429984882474} +{"Finetune/Learning Rate": 7.70592757356369e-06, "Finetune/Loss": 0.7951045036315918, "Finetune/Loss (Raw)": 0.7263473272323608, "Finetune/Step": 2917, "Finetune/Step Time": 2.7713538184762} +{"Finetune/Learning Rate": 7.699590634303907e-06, "Finetune/Loss": 0.7946585416793823, "Finetune/Loss (Raw)": 0.7428093552589417, "Finetune/Step": 2918, "Finetune/Step Time": 2.766576301306486} +{"Finetune/Learning Rate": 7.693254670281238e-06, "Finetune/Loss": 0.7945542335510254, "Finetune/Loss (Raw)": 0.7157846093177795, "Finetune/Step": 2919, "Finetune/Step Time": 2.766036234796047} +{"Finetune/Learning Rate": 7.686919684181757e-06, "Finetune/Loss": 0.7951699495315552, "Finetune/Loss (Raw)": 0.779320240020752, "Finetune/Step": 2920, "Finetune/Step Time": 2.764412662014365} +{"Finetune/Learning Rate": 7.680585678691129e-06, "Finetune/Loss": 0.7951093316078186, "Finetune/Loss (Raw)": 0.8247976899147034, "Finetune/Step": 2921, "Finetune/Step Time": 2.7612697575241327} +{"Finetune/Learning Rate": 7.674252656494586e-06, "Finetune/Loss": 0.7958089113235474, "Finetune/Loss (Raw)": 0.7996704578399658, "Finetune/Step": 2922, "Finetune/Step Time": 2.7591299563646317} +{"Finetune/Learning Rate": 7.667920620276963e-06, "Finetune/Loss": 0.795838475227356, "Finetune/Loss (Raw)": 0.7784423828125, "Finetune/Step": 2923, "Finetune/Step Time": 2.7622623778879642} +{"Finetune/Learning Rate": 7.66158957272266e-06, "Finetune/Loss": 0.7962416410446167, "Finetune/Loss (Raw)": 0.8461784720420837, "Finetune/Step": 2924, "Finetune/Step Time": 2.763636227697134} +{"Finetune/Learning Rate": 7.655259516515674e-06, "Finetune/Loss": 0.7955362796783447, "Finetune/Loss (Raw)": 0.8010998368263245, "Finetune/Step": 2925, "Finetune/Step Time": 2.761736897751689} +{"Finetune/Learning Rate": 7.648930454339566e-06, "Finetune/Loss": 0.7962108254432678, "Finetune/Loss (Raw)": 0.8888168334960938, "Finetune/Step": 2926, "Finetune/Step Time": 2.7622895408421755} +{"Finetune/Learning Rate": 7.642602388877487e-06, "Finetune/Loss": 0.7957723736763, "Finetune/Loss (Raw)": 0.7862028479576111, "Finetune/Step": 2927, "Finetune/Step Time": 2.7641461342573166} +{"Finetune/Learning Rate": 7.63627532281216e-06, "Finetune/Loss": 0.7965436577796936, "Finetune/Loss (Raw)": 0.7798975706100464, "Finetune/Step": 2928, "Finetune/Step Time": 2.740592060610652} +{"Finetune/Learning Rate": 7.629949258825886e-06, "Finetune/Loss": 0.7965576648712158, "Finetune/Loss (Raw)": 0.818285346031189, "Finetune/Step": 2929, "Finetune/Step Time": 2.7397897839546204} +{"Finetune/Learning Rate": 7.62362419960054e-06, "Finetune/Loss": 0.7963654398918152, "Finetune/Loss (Raw)": 0.846145749092102, "Finetune/Step": 2930, "Finetune/Step Time": 2.741496032103896} +{"Finetune/Learning Rate": 7.617300147817572e-06, "Finetune/Loss": 0.796042263507843, "Finetune/Loss (Raw)": 0.7881777882575989, "Finetune/Step": 2931, "Finetune/Step Time": 2.7468122262507677} +{"Finetune/Learning Rate": 7.610977106158009e-06, "Finetune/Loss": 0.796481192111969, "Finetune/Loss (Raw)": 0.7828136086463928, "Finetune/Step": 2932, "Finetune/Step Time": 2.742657992988825} +{"Finetune/Learning Rate": 7.6046550773024405e-06, "Finetune/Loss": 0.7972787618637085, "Finetune/Loss (Raw)": 0.845874011516571, "Finetune/Step": 2933, "Finetune/Step Time": 2.7429919485002756} +{"Finetune/Learning Rate": 7.5983340639310325e-06, "Finetune/Loss": 0.7967066764831543, "Finetune/Loss (Raw)": 0.7286540865898132, "Finetune/Step": 2934, "Finetune/Step Time": 2.7400336023420095} +{"Finetune/Learning Rate": 7.592014068723525e-06, "Finetune/Loss": 0.7965120077133179, "Finetune/Loss (Raw)": 0.7651801109313965, "Finetune/Step": 2935, "Finetune/Step Time": 2.74254890345037} +{"Finetune/Learning Rate": 7.585695094359211e-06, "Finetune/Loss": 0.7969414591789246, "Finetune/Loss (Raw)": 0.8839467167854309, "Finetune/Step": 2936, "Finetune/Step Time": 2.749486954882741} +{"Finetune/Learning Rate": 7.579377143516969e-06, "Finetune/Loss": 0.7977838516235352, "Finetune/Loss (Raw)": 0.8578511476516724, "Finetune/Step": 2937, "Finetune/Step Time": 2.749513080343604} +{"Finetune/Learning Rate": 7.573060218875231e-06, "Finetune/Loss": 0.7960071563720703, "Finetune/Loss (Raw)": 0.6285433769226074, "Finetune/Step": 2938, "Finetune/Step Time": 2.7734073642641306} +{"Finetune/Learning Rate": 7.5667443231120056e-06, "Finetune/Loss": 0.791619062423706, "Finetune/Loss (Raw)": 0.22679343819618225, "Finetune/Step": 2939, "Finetune/Step Time": 2.8081361558288336} +{"Finetune/Learning Rate": 7.560429458904847e-06, "Finetune/Loss": 0.7895058393478394, "Finetune/Loss (Raw)": 0.5320615172386169, "Finetune/Step": 2940, "Finetune/Step Time": 2.8287666980177164} +{"Finetune/Learning Rate": 7.5541156289308915e-06, "Finetune/Loss": 0.7906105518341064, "Finetune/Loss (Raw)": 0.7469531297683716, "Finetune/Step": 2941, "Finetune/Step Time": 2.803947104141116} +{"Finetune/Learning Rate": 7.547802835866826e-06, "Finetune/Loss": 0.7901958227157593, "Finetune/Loss (Raw)": 0.7666274905204773, "Finetune/Step": 2942, "Finetune/Step Time": 2.8079578038305044} +{"Finetune/Learning Rate": 7.541491082388898e-06, "Finetune/Loss": 0.7903424501419067, "Finetune/Loss (Raw)": 0.8361718654632568, "Finetune/Step": 2943, "Finetune/Step Time": 2.805040316656232} +{"Finetune/Learning Rate": 7.535180371172919e-06, "Finetune/Loss": 0.7898388504981995, "Finetune/Loss (Raw)": 0.7397313714027405, "Finetune/Step": 2944, "Finetune/Step Time": 2.8043184839189053} +{"Finetune/Learning Rate": 7.528870704894255e-06, "Finetune/Loss": 0.7907912731170654, "Finetune/Loss (Raw)": 0.8395949006080627, "Finetune/Step": 2945, "Finetune/Step Time": 2.8021835014224052} +{"Finetune/Learning Rate": 7.522562086227834e-06, "Finetune/Loss": 0.7905387878417969, "Finetune/Loss (Raw)": 0.7930519580841064, "Finetune/Step": 2946, "Finetune/Step Time": 2.80315094999969} +{"Finetune/Learning Rate": 7.516254517848132e-06, "Finetune/Loss": 0.789551317691803, "Finetune/Loss (Raw)": 0.7554160356521606, "Finetune/Step": 2947, "Finetune/Step Time": 2.801977166905999} +{"Finetune/Learning Rate": 7.5099480024291824e-06, "Finetune/Loss": 0.7898005247116089, "Finetune/Loss (Raw)": 0.8101658821105957, "Finetune/Step": 2948, "Finetune/Step Time": 2.8025531210005283} +{"Finetune/Learning Rate": 7.503642542644581e-06, "Finetune/Loss": 0.7882089614868164, "Finetune/Loss (Raw)": 0.7181035876274109, "Finetune/Step": 2949, "Finetune/Step Time": 2.801840478554368} +{"Finetune/Learning Rate": 7.49733814116746e-06, "Finetune/Loss": 0.7857988476753235, "Finetune/Loss (Raw)": 0.515022873878479, "Finetune/Step": 2950, "Finetune/Step Time": 2.825806898996234} +{"Finetune/Learning Rate": 7.491034800670517e-06, "Finetune/Loss": 0.7856297492980957, "Finetune/Loss (Raw)": 0.8168240785598755, "Finetune/Step": 2951, "Finetune/Step Time": 2.82291610725224} +{"Finetune/Learning Rate": 7.48473252382599e-06, "Finetune/Loss": 0.785554826259613, "Finetune/Loss (Raw)": 0.8633975386619568, "Finetune/Step": 2952, "Finetune/Step Time": 2.813222983852029} +{"Finetune/Learning Rate": 7.47843131330568e-06, "Finetune/Loss": 0.7859431505203247, "Finetune/Loss (Raw)": 0.833260715007782, "Finetune/Step": 2953, "Finetune/Step Time": 2.8107862267643213} +{"Finetune/Learning Rate": 7.472131171780914e-06, "Finetune/Loss": 0.7866420745849609, "Finetune/Loss (Raw)": 0.7696035504341125, "Finetune/Step": 2954, "Finetune/Step Time": 2.7858287431299686} +{"Finetune/Learning Rate": 7.4658321019225875e-06, "Finetune/Loss": 0.7862696647644043, "Finetune/Loss (Raw)": 0.8041377067565918, "Finetune/Step": 2955, "Finetune/Step Time": 2.7875631283968687} +{"Finetune/Learning Rate": 7.4595341064011296e-06, "Finetune/Loss": 0.7875720262527466, "Finetune/Loss (Raw)": 0.8619433641433716, "Finetune/Step": 2956, "Finetune/Step Time": 2.787392234429717} +{"Finetune/Learning Rate": 7.453237187886517e-06, "Finetune/Loss": 0.7874060869216919, "Finetune/Loss (Raw)": 0.7437842488288879, "Finetune/Step": 2957, "Finetune/Step Time": 2.8121780920773745} +{"Finetune/Learning Rate": 7.446941349048265e-06, "Finetune/Loss": 0.7884567379951477, "Finetune/Loss (Raw)": 0.7882893085479736, "Finetune/Step": 2958, "Finetune/Step Time": 2.7894037570804358} +{"Finetune/Learning Rate": 7.440646592555443e-06, "Finetune/Loss": 0.7905312776565552, "Finetune/Loss (Raw)": 0.885586142539978, "Finetune/Step": 2959, "Finetune/Step Time": 2.7643087916076183} +{"Finetune/Learning Rate": 7.434352921076653e-06, "Finetune/Loss": 0.7903741002082825, "Finetune/Loss (Raw)": 0.8130994439125061, "Finetune/Step": 2960, "Finetune/Step Time": 2.764714188873768} +{"Finetune/Learning Rate": 7.428060337280036e-06, "Finetune/Loss": 0.7897752523422241, "Finetune/Loss (Raw)": 0.7495348453521729, "Finetune/Step": 2961, "Finetune/Step Time": 2.770960895344615} +{"Finetune/Learning Rate": 7.4217688438332725e-06, "Finetune/Loss": 0.7882329225540161, "Finetune/Loss (Raw)": 0.692008912563324, "Finetune/Step": 2962, "Finetune/Step Time": 2.7952122148126364} +{"Finetune/Learning Rate": 7.415478443403589e-06, "Finetune/Loss": 0.7837126851081848, "Finetune/Loss (Raw)": 0.2343285232782364, "Finetune/Step": 2963, "Finetune/Step Time": 2.8279167525470257} +{"Finetune/Learning Rate": 7.409189138657735e-06, "Finetune/Loss": 0.7844357490539551, "Finetune/Loss (Raw)": 0.838162899017334, "Finetune/Step": 2964, "Finetune/Step Time": 2.8282267209142447} +{"Finetune/Learning Rate": 7.402900932262007e-06, "Finetune/Loss": 0.7842682600021362, "Finetune/Loss (Raw)": 0.7673710584640503, "Finetune/Step": 2965, "Finetune/Step Time": 2.8302889708429575} +{"Finetune/Learning Rate": 7.396613826882229e-06, "Finetune/Loss": 0.7836490273475647, "Finetune/Loss (Raw)": 0.7373954057693481, "Finetune/Step": 2966, "Finetune/Step Time": 2.835844559594989} +{"Finetune/Learning Rate": 7.390327825183767e-06, "Finetune/Loss": 0.7819322347640991, "Finetune/Loss (Raw)": 0.5773769617080688, "Finetune/Step": 2967, "Finetune/Step Time": 2.855427708476782} +{"Finetune/Learning Rate": 7.384042929831503e-06, "Finetune/Loss": 0.7786597013473511, "Finetune/Loss (Raw)": 0.263714998960495, "Finetune/Step": 2968, "Finetune/Step Time": 2.8838642071932554} +{"Finetune/Learning Rate": 7.377759143489867e-06, "Finetune/Loss": 0.7775688171386719, "Finetune/Loss (Raw)": 0.7858020067214966, "Finetune/Step": 2969, "Finetune/Step Time": 2.881388947367668} +{"Finetune/Learning Rate": 7.371476468822809e-06, "Finetune/Loss": 0.7776446342468262, "Finetune/Loss (Raw)": 0.7845995426177979, "Finetune/Step": 2970, "Finetune/Step Time": 2.8783540911972523} +{"Finetune/Learning Rate": 7.365194908493811e-06, "Finetune/Loss": 0.7797918915748596, "Finetune/Loss (Raw)": 0.7689926624298096, "Finetune/Step": 2971, "Finetune/Step Time": 2.854405388236046} +{"Finetune/Learning Rate": 7.35891446516588e-06, "Finetune/Loss": 0.7789708375930786, "Finetune/Loss (Raw)": 0.7126191854476929, "Finetune/Step": 2972, "Finetune/Step Time": 2.858747970312834} +{"Finetune/Learning Rate": 7.352635141501553e-06, "Finetune/Loss": 0.7784810066223145, "Finetune/Loss (Raw)": 0.8088216781616211, "Finetune/Step": 2973, "Finetune/Step Time": 2.8579323310405016} +{"Finetune/Learning Rate": 7.346356940162895e-06, "Finetune/Loss": 0.7776100635528564, "Finetune/Loss (Raw)": 0.7799863815307617, "Finetune/Step": 2974, "Finetune/Step Time": 2.856334626674652} +{"Finetune/Learning Rate": 7.340079863811485e-06, "Finetune/Loss": 0.7782076597213745, "Finetune/Loss (Raw)": 0.8002191185951233, "Finetune/Step": 2975, "Finetune/Step Time": 2.8549837060272694} +{"Finetune/Learning Rate": 7.333803915108433e-06, "Finetune/Loss": 0.7776345014572144, "Finetune/Loss (Raw)": 0.7820261716842651, "Finetune/Step": 2976, "Finetune/Step Time": 2.8547773230820894} +{"Finetune/Learning Rate": 7.327529096714371e-06, "Finetune/Loss": 0.7798606157302856, "Finetune/Loss (Raw)": 0.8705729246139526, "Finetune/Step": 2977, "Finetune/Step Time": 2.8282662611454725} +{"Finetune/Learning Rate": 7.321255411289443e-06, "Finetune/Loss": 0.7798150777816772, "Finetune/Loss (Raw)": 0.8838986158370972, "Finetune/Step": 2978, "Finetune/Step Time": 2.827704915776849} +{"Finetune/Learning Rate": 7.314982861493328e-06, "Finetune/Loss": 0.7816647291183472, "Finetune/Loss (Raw)": 0.8023440837860107, "Finetune/Step": 2979, "Finetune/Step Time": 2.804908251389861} +{"Finetune/Learning Rate": 7.308711449985209e-06, "Finetune/Loss": 0.7817897200584412, "Finetune/Loss (Raw)": 0.6819599270820618, "Finetune/Step": 2980, "Finetune/Step Time": 2.8070539981126785} +{"Finetune/Learning Rate": 7.302441179423798e-06, "Finetune/Loss": 0.7819646596908569, "Finetune/Loss (Raw)": 0.8011495471000671, "Finetune/Step": 2981, "Finetune/Step Time": 2.8040798138827085} +{"Finetune/Learning Rate": 7.296172052467312e-06, "Finetune/Loss": 0.7806018590927124, "Finetune/Loss (Raw)": 0.7489061951637268, "Finetune/Step": 2982, "Finetune/Step Time": 2.8028494268655777} +{"Finetune/Learning Rate": 7.289904071773492e-06, "Finetune/Loss": 0.7796202898025513, "Finetune/Loss (Raw)": 0.7392227649688721, "Finetune/Step": 2983, "Finetune/Step Time": 2.803245946764946} +{"Finetune/Learning Rate": 7.2836372399995905e-06, "Finetune/Loss": 0.7784099578857422, "Finetune/Loss (Raw)": 0.6877071261405945, "Finetune/Step": 2984, "Finetune/Step Time": 2.807979604229331} +{"Finetune/Learning Rate": 7.277371559802371e-06, "Finetune/Loss": 0.7777109146118164, "Finetune/Loss (Raw)": 0.7567890286445618, "Finetune/Step": 2985, "Finetune/Step Time": 2.81033499725163} +{"Finetune/Learning Rate": 7.27110703383811e-06, "Finetune/Loss": 0.7770878672599792, "Finetune/Loss (Raw)": 0.6769322156906128, "Finetune/Step": 2986, "Finetune/Step Time": 2.811547080054879} +{"Finetune/Learning Rate": 7.264843664762594e-06, "Finetune/Loss": 0.7772830724716187, "Finetune/Loss (Raw)": 0.8646165132522583, "Finetune/Step": 2987, "Finetune/Step Time": 2.811501795426011} +{"Finetune/Learning Rate": 7.258581455231126e-06, "Finetune/Loss": 0.7773777842521667, "Finetune/Loss (Raw)": 0.8352544903755188, "Finetune/Step": 2988, "Finetune/Step Time": 2.8134187664836645} +{"Finetune/Learning Rate": 7.2523204078985055e-06, "Finetune/Loss": 0.77773118019104, "Finetune/Loss (Raw)": 0.8830114006996155, "Finetune/Step": 2989, "Finetune/Step Time": 2.8116111159324646} +{"Finetune/Learning Rate": 7.246060525419044e-06, "Finetune/Loss": 0.7772151231765747, "Finetune/Loss (Raw)": 0.7805277109146118, "Finetune/Step": 2990, "Finetune/Step Time": 2.814244616776705} +{"Finetune/Learning Rate": 7.239801810446567e-06, "Finetune/Loss": 0.7742422819137573, "Finetune/Loss (Raw)": 0.26662901043891907, "Finetune/Step": 2991, "Finetune/Step Time": 2.847758224233985} +{"Finetune/Learning Rate": 7.2335442656343915e-06, "Finetune/Loss": 0.7718484401702881, "Finetune/Loss (Raw)": 0.5814253687858582, "Finetune/Step": 2992, "Finetune/Step Time": 2.8787052389234304} +{"Finetune/Learning Rate": 7.2272878936353495e-06, "Finetune/Loss": 0.7713460922241211, "Finetune/Loss (Raw)": 0.826259970664978, "Finetune/Step": 2993, "Finetune/Step Time": 2.877773055806756} +{"Finetune/Learning Rate": 7.221032697101769e-06, "Finetune/Loss": 0.7696757316589355, "Finetune/Loss (Raw)": 0.6915602087974548, "Finetune/Step": 2994, "Finetune/Step Time": 2.903491698205471} +{"Finetune/Learning Rate": 7.214778678685487e-06, "Finetune/Loss": 0.7698568105697632, "Finetune/Loss (Raw)": 0.7969306111335754, "Finetune/Step": 2995, "Finetune/Step Time": 2.9025493282824755} +{"Finetune/Learning Rate": 7.208525841037829e-06, "Finetune/Loss": 0.7676748037338257, "Finetune/Loss (Raw)": 0.5772135257720947, "Finetune/Step": 2996, "Finetune/Step Time": 2.926177207380533} +{"Finetune/Learning Rate": 7.202274186809634e-06, "Finetune/Loss": 0.767479658126831, "Finetune/Loss (Raw)": 0.8337383270263672, "Finetune/Step": 2997, "Finetune/Step Time": 2.9268699027597904} +{"Finetune/Learning Rate": 7.196023718651229e-06, "Finetune/Loss": 0.7673701047897339, "Finetune/Loss (Raw)": 0.7555636167526245, "Finetune/Step": 2998, "Finetune/Step Time": 2.9244272094219923} +{"Finetune/Learning Rate": 7.189774439212442e-06, "Finetune/Loss": 0.767744779586792, "Finetune/Loss (Raw)": 0.8706608414649963, "Finetune/Step": 2999, "Finetune/Step Time": 2.9291524663567543} +{"Finetune/Learning Rate": 7.183526351142596e-06, "Finetune/Loss": 0.7670059204101562, "Finetune/Loss (Raw)": 0.6922746300697327, "Finetune/Step": 3000, "Finetune/Step Time": 2.951419796794653} +{"Finetune/Learning Rate": 7.177279457090512e-06, "Finetune/Loss": 0.7668391466140747, "Finetune/Loss (Raw)": 0.8415532112121582, "Finetune/Step": 3001, "Finetune/Step Time": 2.951943129301071} +{"Finetune/Learning Rate": 7.171033759704504e-06, "Finetune/Loss": 0.7667983770370483, "Finetune/Loss (Raw)": 0.7972638010978699, "Finetune/Step": 3002, "Finetune/Step Time": 2.956308888271451} +{"Finetune/Learning Rate": 7.164789261632373e-06, "Finetune/Loss": 0.7686470746994019, "Finetune/Loss (Raw)": 0.7251440286636353, "Finetune/Step": 3003, "Finetune/Step Time": 2.9348643720149994} +{"Finetune/Learning Rate": 7.158545965521415e-06, "Finetune/Loss": 0.7699311375617981, "Finetune/Loss (Raw)": 0.9182886481285095, "Finetune/Step": 3004, "Finetune/Step Time": 2.928940949961543} +{"Finetune/Learning Rate": 7.152303874018426e-06, "Finetune/Loss": 0.7690443396568298, "Finetune/Loss (Raw)": 0.6695217490196228, "Finetune/Step": 3005, "Finetune/Step Time": 2.949641702696681} +{"Finetune/Learning Rate": 7.146062989769671e-06, "Finetune/Loss": 0.7681915163993835, "Finetune/Loss (Raw)": 0.730065643787384, "Finetune/Step": 3006, "Finetune/Step Time": 2.9509560223668814} +{"Finetune/Learning Rate": 7.139823315420922e-06, "Finetune/Loss": 0.7681717276573181, "Finetune/Loss (Raw)": 0.8530876636505127, "Finetune/Step": 3007, "Finetune/Step Time": 2.9531791005283594} +{"Finetune/Learning Rate": 7.133584853617427e-06, "Finetune/Loss": 0.7685245275497437, "Finetune/Loss (Raw)": 0.8087190389633179, "Finetune/Step": 3008, "Finetune/Step Time": 2.9383082035928965} +{"Finetune/Learning Rate": 7.127347607003929e-06, "Finetune/Loss": 0.7673321962356567, "Finetune/Loss (Raw)": 0.7380228042602539, "Finetune/Step": 3009, "Finetune/Step Time": 2.9389462154358625} +{"Finetune/Learning Rate": 7.121111578224644e-06, "Finetune/Loss": 0.7669774293899536, "Finetune/Loss (Raw)": 0.7949104905128479, "Finetune/Step": 3010, "Finetune/Step Time": 2.942379193380475} +{"Finetune/Learning Rate": 7.114876769923282e-06, "Finetune/Loss": 0.7666743993759155, "Finetune/Loss (Raw)": 0.8580109477043152, "Finetune/Step": 3011, "Finetune/Step Time": 2.9422608092427254} +{"Finetune/Learning Rate": 7.108643184743033e-06, "Finetune/Loss": 0.7666118144989014, "Finetune/Loss (Raw)": 0.7970648407936096, "Finetune/Step": 3012, "Finetune/Step Time": 2.938866026699543} +{"Finetune/Learning Rate": 7.1024108253265665e-06, "Finetune/Loss": 0.7670323848724365, "Finetune/Loss (Raw)": 0.8305259346961975, "Finetune/Step": 3013, "Finetune/Step Time": 2.9397806618362665} +{"Finetune/Learning Rate": 7.096179694316027e-06, "Finetune/Loss": 0.7669541835784912, "Finetune/Loss (Raw)": 0.8666526079177856, "Finetune/Step": 3014, "Finetune/Step Time": 2.9427842143923044} +{"Finetune/Learning Rate": 7.089949794353052e-06, "Finetune/Loss": 0.7677042484283447, "Finetune/Loss (Raw)": 0.9019047021865845, "Finetune/Step": 3015, "Finetune/Step Time": 2.943995827808976} +{"Finetune/Learning Rate": 7.083721128078753e-06, "Finetune/Loss": 0.7674087285995483, "Finetune/Loss (Raw)": 0.7030029892921448, "Finetune/Step": 3016, "Finetune/Step Time": 2.9407972916960716} +{"Finetune/Learning Rate": 7.077493698133706e-06, "Finetune/Loss": 0.7669351100921631, "Finetune/Loss (Raw)": 0.7859983444213867, "Finetune/Step": 3017, "Finetune/Step Time": 2.9429070726037025} +{"Finetune/Learning Rate": 7.071267507157973e-06, "Finetune/Loss": 0.7679557800292969, "Finetune/Loss (Raw)": 0.789522647857666, "Finetune/Step": 3018, "Finetune/Step Time": 2.942363290116191} +{"Finetune/Learning Rate": 7.065042557791096e-06, "Finetune/Loss": 0.767608106136322, "Finetune/Loss (Raw)": 0.7862417101860046, "Finetune/Step": 3019, "Finetune/Step Time": 2.9412777833640575} +{"Finetune/Learning Rate": 7.058818852672077e-06, "Finetune/Loss": 0.7673981189727783, "Finetune/Loss (Raw)": 0.8134698867797852, "Finetune/Step": 3020, "Finetune/Step Time": 2.9379502162337303} +{"Finetune/Learning Rate": 7.052596394439401e-06, "Finetune/Loss": 0.7730023264884949, "Finetune/Loss (Raw)": 0.9744173288345337, "Finetune/Step": 3021, "Finetune/Step Time": 2.9354332983493805} +{"Finetune/Learning Rate": 7.0463751857310225e-06, "Finetune/Loss": 0.7726471424102783, "Finetune/Loss (Raw)": 0.8571709394454956, "Finetune/Step": 3022, "Finetune/Step Time": 2.933667842298746} +{"Finetune/Learning Rate": 7.040155229184365e-06, "Finetune/Loss": 0.7722552418708801, "Finetune/Loss (Raw)": 0.7744183540344238, "Finetune/Step": 3023, "Finetune/Step Time": 2.938274757936597} +{"Finetune/Learning Rate": 7.033936527436318e-06, "Finetune/Loss": 0.7715221643447876, "Finetune/Loss (Raw)": 0.7403375506401062, "Finetune/Step": 3024, "Finetune/Step Time": 2.9396604113280773} +{"Finetune/Learning Rate": 7.027719083123242e-06, "Finetune/Loss": 0.7713032960891724, "Finetune/Loss (Raw)": 0.9174766540527344, "Finetune/Step": 3025, "Finetune/Step Time": 2.939139312133193} +{"Finetune/Learning Rate": 7.021502898880972e-06, "Finetune/Loss": 0.7703529596328735, "Finetune/Loss (Raw)": 0.7752078175544739, "Finetune/Step": 3026, "Finetune/Step Time": 2.9343886598944664} +{"Finetune/Learning Rate": 7.0152879773447935e-06, "Finetune/Loss": 0.7690012454986572, "Finetune/Loss (Raw)": 0.5872534513473511, "Finetune/Step": 3027, "Finetune/Step Time": 2.9575115106999874} +{"Finetune/Learning Rate": 7.009074321149465e-06, "Finetune/Loss": 0.7679775953292847, "Finetune/Loss (Raw)": 0.7038712501525879, "Finetune/Step": 3028, "Finetune/Step Time": 2.959648732095957} +{"Finetune/Learning Rate": 7.0028619329292145e-06, "Finetune/Loss": 0.7677643299102783, "Finetune/Loss (Raw)": 0.8593440651893616, "Finetune/Step": 3029, "Finetune/Step Time": 2.961515324190259} +{"Finetune/Learning Rate": 6.996650815317717e-06, "Finetune/Loss": 0.7676221132278442, "Finetune/Loss (Raw)": 0.8512013554573059, "Finetune/Step": 3030, "Finetune/Step Time": 2.95812276750803} +{"Finetune/Learning Rate": 6.990440970948125e-06, "Finetune/Loss": 0.7677483558654785, "Finetune/Loss (Raw)": 0.7623842358589172, "Finetune/Step": 3031, "Finetune/Step Time": 2.9607052970677614} +{"Finetune/Learning Rate": 6.984232402453039e-06, "Finetune/Loss": 0.768303394317627, "Finetune/Loss (Raw)": 0.8478425741195679, "Finetune/Step": 3032, "Finetune/Step Time": 2.963092938065529} +{"Finetune/Learning Rate": 6.978025112464533e-06, "Finetune/Loss": 0.7681225538253784, "Finetune/Loss (Raw)": 0.7989403605461121, "Finetune/Step": 3033, "Finetune/Step Time": 2.9611006397753954} +{"Finetune/Learning Rate": 6.9718191036141195e-06, "Finetune/Loss": 0.7676507234573364, "Finetune/Loss (Raw)": 0.8131672739982605, "Finetune/Step": 3034, "Finetune/Step Time": 2.958312889561057} +{"Finetune/Learning Rate": 6.965614378532781e-06, "Finetune/Loss": 0.7677291631698608, "Finetune/Loss (Raw)": 0.8412928581237793, "Finetune/Step": 3035, "Finetune/Step Time": 2.960723513737321} +{"Finetune/Learning Rate": 6.959410939850957e-06, "Finetune/Loss": 0.7679077386856079, "Finetune/Loss (Raw)": 0.893341600894928, "Finetune/Step": 3036, "Finetune/Step Time": 2.963516978546977} +{"Finetune/Learning Rate": 6.953208790198533e-06, "Finetune/Loss": 0.7674559354782104, "Finetune/Loss (Raw)": 0.7717170119285583, "Finetune/Step": 3037, "Finetune/Step Time": 2.9608301278203726} +{"Finetune/Learning Rate": 6.9470079322048525e-06, "Finetune/Loss": 0.7665090560913086, "Finetune/Loss (Raw)": 0.7151996493339539, "Finetune/Step": 3038, "Finetune/Step Time": 2.95841858163476} +{"Finetune/Learning Rate": 6.940808368498713e-06, "Finetune/Loss": 0.7671558260917664, "Finetune/Loss (Raw)": 0.9022992849349976, "Finetune/Step": 3039, "Finetune/Step Time": 2.957767754793167} +{"Finetune/Learning Rate": 6.934610101708366e-06, "Finetune/Loss": 0.7652931213378906, "Finetune/Loss (Raw)": 0.6022008657455444, "Finetune/Step": 3040, "Finetune/Step Time": 2.9805648997426033} +{"Finetune/Learning Rate": 6.9284131344615025e-06, "Finetune/Loss": 0.7660213708877563, "Finetune/Loss (Raw)": 0.8760449886322021, "Finetune/Step": 3041, "Finetune/Step Time": 2.982002839446068} +{"Finetune/Learning Rate": 6.922217469385268e-06, "Finetune/Loss": 0.7664742469787598, "Finetune/Loss (Raw)": 0.7923487424850464, "Finetune/Step": 3042, "Finetune/Step Time": 2.9793253373354673} +{"Finetune/Learning Rate": 6.916023109106266e-06, "Finetune/Loss": 0.7666529417037964, "Finetune/Loss (Raw)": 0.7484413981437683, "Finetune/Step": 3043, "Finetune/Step Time": 2.9827802665531635} +{"Finetune/Learning Rate": 6.909830056250527e-06, "Finetune/Loss": 0.7668901681900024, "Finetune/Loss (Raw)": 0.8844813108444214, "Finetune/Step": 3044, "Finetune/Step Time": 2.9830337204039097} +{"Finetune/Learning Rate": 6.903638313443546e-06, "Finetune/Loss": 0.7674367427825928, "Finetune/Loss (Raw)": 0.7963142395019531, "Finetune/Step": 3045, "Finetune/Step Time": 2.984651828184724} +{"Finetune/Learning Rate": 6.897447883310249e-06, "Finetune/Loss": 0.766274094581604, "Finetune/Loss (Raw)": 0.593987762928009, "Finetune/Step": 3046, "Finetune/Step Time": 3.009689746424556} +{"Finetune/Learning Rate": 6.891258768475018e-06, "Finetune/Loss": 0.767385721206665, "Finetune/Loss (Raw)": 0.8580711483955383, "Finetune/Step": 3047, "Finetune/Step Time": 3.0084479432553053} +{"Finetune/Learning Rate": 6.885070971561663e-06, "Finetune/Loss": 0.7673373818397522, "Finetune/Loss (Raw)": 0.7731322646141052, "Finetune/Step": 3048, "Finetune/Step Time": 3.020220033824444} +{"Finetune/Learning Rate": 6.878884495193448e-06, "Finetune/Loss": 0.7672432661056519, "Finetune/Loss (Raw)": 0.8127486705780029, "Finetune/Step": 3049, "Finetune/Step Time": 3.019609348848462} +{"Finetune/Learning Rate": 6.87269934199307e-06, "Finetune/Loss": 0.76716148853302, "Finetune/Loss (Raw)": 0.7892070412635803, "Finetune/Step": 3050, "Finetune/Step Time": 3.0179783515632153} +{"Finetune/Learning Rate": 6.866515514582668e-06, "Finetune/Loss": 0.7677270174026489, "Finetune/Loss (Raw)": 0.8508222699165344, "Finetune/Step": 3051, "Finetune/Step Time": 3.013949975371361} +{"Finetune/Learning Rate": 6.860333015583815e-06, "Finetune/Loss": 0.7680350542068481, "Finetune/Loss (Raw)": 0.885614812374115, "Finetune/Step": 3052, "Finetune/Step Time": 3.015188790857792} +{"Finetune/Learning Rate": 6.8541518476175275e-06, "Finetune/Loss": 0.7678006291389465, "Finetune/Loss (Raw)": 0.7710915207862854, "Finetune/Step": 3053, "Finetune/Step Time": 3.0157984141260386} +{"Finetune/Learning Rate": 6.847972013304256e-06, "Finetune/Loss": 0.7664327025413513, "Finetune/Loss (Raw)": 0.7137191891670227, "Finetune/Step": 3054, "Finetune/Step Time": 3.01580798253417} +{"Finetune/Learning Rate": 6.841793515263879e-06, "Finetune/Loss": 0.7664434313774109, "Finetune/Loss (Raw)": 0.7875747084617615, "Finetune/Step": 3055, "Finetune/Step Time": 3.0137453228235245} +{"Finetune/Learning Rate": 6.835616356115713e-06, "Finetune/Loss": 0.7665229439735413, "Finetune/Loss (Raw)": 0.7900817394256592, "Finetune/Step": 3056, "Finetune/Step Time": 3.0105564035475254} +{"Finetune/Learning Rate": 6.8294405384785114e-06, "Finetune/Loss": 0.7665498852729797, "Finetune/Loss (Raw)": 0.8217324614524841, "Finetune/Step": 3057, "Finetune/Step Time": 3.011289807036519} +{"Finetune/Learning Rate": 6.823266064970448e-06, "Finetune/Loss": 0.7665964365005493, "Finetune/Loss (Raw)": 0.8521089553833008, "Finetune/Step": 3058, "Finetune/Step Time": 3.009335221722722} +{"Finetune/Learning Rate": 6.817092938209141e-06, "Finetune/Loss": 0.7667785882949829, "Finetune/Loss (Raw)": 0.8114782571792603, "Finetune/Step": 3059, "Finetune/Step Time": 3.0041843615472317} +{"Finetune/Learning Rate": 6.8109211608116236e-06, "Finetune/Loss": 0.7669230699539185, "Finetune/Loss (Raw)": 0.8013208508491516, "Finetune/Step": 3060, "Finetune/Step Time": 3.005974745377898} +{"Finetune/Learning Rate": 6.804750735394369e-06, "Finetune/Loss": 0.7673373818397522, "Finetune/Loss (Raw)": 0.8989010453224182, "Finetune/Step": 3061, "Finetune/Step Time": 3.006702920421958} +{"Finetune/Learning Rate": 6.798581664573265e-06, "Finetune/Loss": 0.7674412727355957, "Finetune/Loss (Raw)": 0.7419499754905701, "Finetune/Step": 3062, "Finetune/Step Time": 3.0090594720095396} +{"Finetune/Learning Rate": 6.792413950963638e-06, "Finetune/Loss": 0.767526388168335, "Finetune/Loss (Raw)": 0.7760710716247559, "Finetune/Step": 3063, "Finetune/Step Time": 3.007386786863208} +{"Finetune/Learning Rate": 6.786247597180229e-06, "Finetune/Loss": 0.7667943835258484, "Finetune/Loss (Raw)": 0.7902578115463257, "Finetune/Step": 3064, "Finetune/Step Time": 2.999798897653818} +{"Finetune/Learning Rate": 6.780082605837208e-06, "Finetune/Loss": 0.7657626271247864, "Finetune/Loss (Raw)": 0.7257838845252991, "Finetune/Step": 3065, "Finetune/Step Time": 2.995731508359313} +{"Finetune/Learning Rate": 6.773918979548162e-06, "Finetune/Loss": 0.7664909958839417, "Finetune/Loss (Raw)": 0.721777617931366, "Finetune/Step": 3066, "Finetune/Step Time": 2.972092254087329} +{"Finetune/Learning Rate": 6.767756720926106e-06, "Finetune/Loss": 0.7707895040512085, "Finetune/Loss (Raw)": 0.7769975066184998, "Finetune/Step": 3067, "Finetune/Step Time": 2.9362293481826782} +{"Finetune/Learning Rate": 6.761595832583476e-06, "Finetune/Loss": 0.7732961177825928, "Finetune/Loss (Raw)": 0.8529137969017029, "Finetune/Step": 3068, "Finetune/Step Time": 2.9144536182284355} +{"Finetune/Learning Rate": 6.755436317132117e-06, "Finetune/Loss": 0.7726134657859802, "Finetune/Loss (Raw)": 0.6595747470855713, "Finetune/Step": 3069, "Finetune/Step Time": 2.9173851553350687} +{"Finetune/Learning Rate": 6.749278177183299e-06, "Finetune/Loss": 0.7728763818740845, "Finetune/Loss (Raw)": 0.800274133682251, "Finetune/Step": 3070, "Finetune/Step Time": 2.9148741122335196} +{"Finetune/Learning Rate": 6.7431214153477106e-06, "Finetune/Loss": 0.7726279497146606, "Finetune/Loss (Raw)": 0.804373562335968, "Finetune/Step": 3071, "Finetune/Step Time": 2.916494570672512} +{"Finetune/Learning Rate": 6.73696603423545e-06, "Finetune/Loss": 0.7727096080780029, "Finetune/Loss (Raw)": 0.75018709897995, "Finetune/Step": 3072, "Finetune/Step Time": 2.9175260439515114} +{"Finetune/Learning Rate": 6.730812036456039e-06, "Finetune/Loss": 0.7732360363006592, "Finetune/Loss (Raw)": 0.9069798588752747, "Finetune/Step": 3073, "Finetune/Step Time": 2.9212088733911514} +{"Finetune/Learning Rate": 6.724659424618401e-06, "Finetune/Loss": 0.7737565636634827, "Finetune/Loss (Raw)": 0.8596764206886292, "Finetune/Step": 3074, "Finetune/Step Time": 2.921298338100314} +{"Finetune/Learning Rate": 6.718508201330888e-06, "Finetune/Loss": 0.773948609828949, "Finetune/Loss (Raw)": 0.779992401599884, "Finetune/Step": 3075, "Finetune/Step Time": 2.92133242636919} +{"Finetune/Learning Rate": 6.712358369201242e-06, "Finetune/Loss": 0.7743161916732788, "Finetune/Loss (Raw)": 0.8572232127189636, "Finetune/Step": 3076, "Finetune/Step Time": 2.9238911028951406} +{"Finetune/Learning Rate": 6.706209930836636e-06, "Finetune/Loss": 0.7733908891677856, "Finetune/Loss (Raw)": 0.5996639132499695, "Finetune/Step": 3077, "Finetune/Step Time": 2.9523095060139894} +{"Finetune/Learning Rate": 6.700062888843639e-06, "Finetune/Loss": 0.7752432823181152, "Finetune/Loss (Raw)": 0.7521237134933472, "Finetune/Step": 3078, "Finetune/Step Time": 2.9265599828213453} +{"Finetune/Learning Rate": 6.693917245828234e-06, "Finetune/Loss": 0.7743500471115112, "Finetune/Loss (Raw)": 0.7024943232536316, "Finetune/Step": 3079, "Finetune/Step Time": 2.951679630205035} +{"Finetune/Learning Rate": 6.687773004395808e-06, "Finetune/Loss": 0.7740265130996704, "Finetune/Loss (Raw)": 0.8219836950302124, "Finetune/Step": 3080, "Finetune/Step Time": 2.9545083455741405} +{"Finetune/Learning Rate": 6.681630167151152e-06, "Finetune/Loss": 0.7742109298706055, "Finetune/Loss (Raw)": 0.8568686246871948, "Finetune/Step": 3081, "Finetune/Step Time": 2.9815758280456066} +{"Finetune/Learning Rate": 6.675488736698474e-06, "Finetune/Loss": 0.7742440700531006, "Finetune/Loss (Raw)": 0.7738497257232666, "Finetune/Step": 3082, "Finetune/Step Time": 2.9839325062930584} +{"Finetune/Learning Rate": 6.669348715641367e-06, "Finetune/Loss": 0.7749570608139038, "Finetune/Loss (Raw)": 0.8954001069068909, "Finetune/Step": 3083, "Finetune/Step Time": 2.9802488535642624} +{"Finetune/Learning Rate": 6.663210106582838e-06, "Finetune/Loss": 0.7751801013946533, "Finetune/Loss (Raw)": 0.890485405921936, "Finetune/Step": 3084, "Finetune/Step Time": 2.979785894975066} +{"Finetune/Learning Rate": 6.657072912125297e-06, "Finetune/Loss": 0.7761672735214233, "Finetune/Loss (Raw)": 0.8701471090316772, "Finetune/Step": 3085, "Finetune/Step Time": 2.9587739501148462} +{"Finetune/Learning Rate": 6.6509371348705436e-06, "Finetune/Loss": 0.7752748727798462, "Finetune/Loss (Raw)": 0.6740627884864807, "Finetune/Step": 3086, "Finetune/Step Time": 2.9587582163512707} +{"Finetune/Learning Rate": 6.6448027774197875e-06, "Finetune/Loss": 0.7740685939788818, "Finetune/Loss (Raw)": 0.7311730980873108, "Finetune/Step": 3087, "Finetune/Step Time": 2.9589552134275436} +{"Finetune/Learning Rate": 6.638669842373633e-06, "Finetune/Loss": 0.7743880152702332, "Finetune/Loss (Raw)": 0.8539891242980957, "Finetune/Step": 3088, "Finetune/Step Time": 2.9595339465886354} +{"Finetune/Learning Rate": 6.632538332332081e-06, "Finetune/Loss": 0.7756471633911133, "Finetune/Loss (Raw)": 0.9107099771499634, "Finetune/Step": 3089, "Finetune/Step Time": 2.9585587959736586} +{"Finetune/Learning Rate": 6.626408249894525e-06, "Finetune/Loss": 0.7758466005325317, "Finetune/Loss (Raw)": 0.7175338864326477, "Finetune/Step": 3090, "Finetune/Step Time": 2.9372697733342648} +{"Finetune/Learning Rate": 6.620279597659758e-06, "Finetune/Loss": 0.7796821594238281, "Finetune/Loss (Raw)": 0.7252823114395142, "Finetune/Step": 3091, "Finetune/Step Time": 2.9011095724999905} +{"Finetune/Learning Rate": 6.614152378225966e-06, "Finetune/Loss": 0.7792542576789856, "Finetune/Loss (Raw)": 0.783388078212738, "Finetune/Step": 3092, "Finetune/Step Time": 2.8981934655457735} +{"Finetune/Learning Rate": 6.608026594190726e-06, "Finetune/Loss": 0.7806200981140137, "Finetune/Loss (Raw)": 0.9421960711479187, "Finetune/Step": 3093, "Finetune/Step Time": 2.901777295395732} +{"Finetune/Learning Rate": 6.601902248151006e-06, "Finetune/Loss": 0.7813737392425537, "Finetune/Loss (Raw)": 0.8338602781295776, "Finetune/Step": 3094, "Finetune/Step Time": 2.9013931080698967} +{"Finetune/Learning Rate": 6.595779342703165e-06, "Finetune/Loss": 0.7832303047180176, "Finetune/Loss (Raw)": 0.8150196075439453, "Finetune/Step": 3095, "Finetune/Step Time": 2.8773193806409836} +{"Finetune/Learning Rate": 6.589657880442957e-06, "Finetune/Loss": 0.787877082824707, "Finetune/Loss (Raw)": 0.8585049510002136, "Finetune/Step": 3096, "Finetune/Step Time": 2.8450995329767466} +{"Finetune/Learning Rate": 6.583537863965512e-06, "Finetune/Loss": 0.7883230447769165, "Finetune/Loss (Raw)": 0.8428821563720703, "Finetune/Step": 3097, "Finetune/Step Time": 2.846471818163991} +{"Finetune/Learning Rate": 6.577419295865357e-06, "Finetune/Loss": 0.7884133458137512, "Finetune/Loss (Raw)": 0.7961635589599609, "Finetune/Step": 3098, "Finetune/Step Time": 2.8510279655456543} +{"Finetune/Learning Rate": 6.571302178736404e-06, "Finetune/Loss": 0.7889186143875122, "Finetune/Loss (Raw)": 0.8336626291275024, "Finetune/Step": 3099, "Finetune/Step Time": 2.852097300812602} +{"Finetune/Learning Rate": 6.5651865151719415e-06, "Finetune/Loss": 0.7892330884933472, "Finetune/Loss (Raw)": 0.7528729438781738, "Finetune/Step": 3100, "Finetune/Step Time": 2.8488569483160973} +{"Finetune/Learning Rate": 6.559072307764656e-06, "Finetune/Loss": 0.7897263765335083, "Finetune/Loss (Raw)": 0.8719702363014221, "Finetune/Step": 3101, "Finetune/Step Time": 2.852626085281372} +{"Finetune/Learning Rate": 6.552959559106601e-06, "Finetune/Loss": 0.788512110710144, "Finetune/Loss (Raw)": 0.6245514154434204, "Finetune/Step": 3102, "Finetune/Step Time": 2.875660205259919} +{"Finetune/Learning Rate": 6.546848271789228e-06, "Finetune/Loss": 0.7868143916130066, "Finetune/Loss (Raw)": 0.5829159021377563, "Finetune/Step": 3103, "Finetune/Step Time": 2.901235591620207} +{"Finetune/Learning Rate": 6.540738448403351e-06, "Finetune/Loss": 0.7869234085083008, "Finetune/Loss (Raw)": 0.7959798574447632, "Finetune/Step": 3104, "Finetune/Step Time": 2.9089265931397676} +{"Finetune/Learning Rate": 6.534630091539181e-06, "Finetune/Loss": 0.786101758480072, "Finetune/Loss (Raw)": 0.7654001116752625, "Finetune/Step": 3105, "Finetune/Step Time": 2.911440011113882} +{"Finetune/Learning Rate": 6.528523203786292e-06, "Finetune/Loss": 0.7851203680038452, "Finetune/Loss (Raw)": 0.7582794427871704, "Finetune/Step": 3106, "Finetune/Step Time": 2.9169015418738127} +{"Finetune/Learning Rate": 6.522417787733648e-06, "Finetune/Loss": 0.7832838892936707, "Finetune/Loss (Raw)": 0.5672762393951416, "Finetune/Step": 3107, "Finetune/Step Time": 2.941057026386261} +{"Finetune/Learning Rate": 6.516313845969577e-06, "Finetune/Loss": 0.7842632532119751, "Finetune/Loss (Raw)": 0.8073176145553589, "Finetune/Step": 3108, "Finetune/Step Time": 2.9370663836598396} +{"Finetune/Learning Rate": 6.510211381081793e-06, "Finetune/Loss": 0.7840362787246704, "Finetune/Loss (Raw)": 0.7720987796783447, "Finetune/Step": 3109, "Finetune/Step Time": 2.9408664237707853} +{"Finetune/Learning Rate": 6.504110395657383e-06, "Finetune/Loss": 0.7848591208457947, "Finetune/Loss (Raw)": 0.854228138923645, "Finetune/Step": 3110, "Finetune/Step Time": 2.941701576113701} +{"Finetune/Learning Rate": 6.498010892282794e-06, "Finetune/Loss": 0.7841129899024963, "Finetune/Loss (Raw)": 0.6437209248542786, "Finetune/Step": 3111, "Finetune/Step Time": 2.963929794728756} +{"Finetune/Learning Rate": 6.491912873543856e-06, "Finetune/Loss": 0.7859722375869751, "Finetune/Loss (Raw)": 0.9256935715675354, "Finetune/Step": 3112, "Finetune/Step Time": 2.9624475706368685} +{"Finetune/Learning Rate": 6.485816342025774e-06, "Finetune/Loss": 0.7869502305984497, "Finetune/Loss (Raw)": 0.8819675445556641, "Finetune/Step": 3113, "Finetune/Step Time": 2.961801826953888} +{"Finetune/Learning Rate": 6.4797213003131055e-06, "Finetune/Loss": 0.7877424359321594, "Finetune/Loss (Raw)": 0.7783368825912476, "Finetune/Step": 3114, "Finetune/Step Time": 2.962312662974} +{"Finetune/Learning Rate": 6.473627750989794e-06, "Finetune/Loss": 0.7874919772148132, "Finetune/Loss (Raw)": 0.8325586915016174, "Finetune/Step": 3115, "Finetune/Step Time": 2.9635088220238686} +{"Finetune/Learning Rate": 6.467535696639137e-06, "Finetune/Loss": 0.7877416014671326, "Finetune/Loss (Raw)": 0.8672022223472595, "Finetune/Step": 3116, "Finetune/Step Time": 2.964038146659732} +{"Finetune/Learning Rate": 6.461445139843815e-06, "Finetune/Loss": 0.7877906560897827, "Finetune/Loss (Raw)": 0.889289915561676, "Finetune/Step": 3117, "Finetune/Step Time": 2.964753355830908} +{"Finetune/Learning Rate": 6.45535608318585e-06, "Finetune/Loss": 0.7876272201538086, "Finetune/Loss (Raw)": 0.7596073150634766, "Finetune/Step": 3118, "Finetune/Step Time": 2.9860095977783203} +{"Finetune/Learning Rate": 6.449268529246648e-06, "Finetune/Loss": 0.7917389869689941, "Finetune/Loss (Raw)": 0.7929435968399048, "Finetune/Step": 3119, "Finetune/Step Time": 2.960331179201603} +{"Finetune/Learning Rate": 6.443182480606969e-06, "Finetune/Loss": 0.7942860722541809, "Finetune/Loss (Raw)": 0.9074465036392212, "Finetune/Step": 3120, "Finetune/Step Time": 2.928478639572859} +{"Finetune/Learning Rate": 6.437097939846938e-06, "Finetune/Loss": 0.79388028383255, "Finetune/Loss (Raw)": 0.7743197083473206, "Finetune/Step": 3121, "Finetune/Step Time": 2.9285394735634327} +{"Finetune/Learning Rate": 6.431014909546036e-06, "Finetune/Loss": 0.7948411703109741, "Finetune/Loss (Raw)": 0.8145594596862793, "Finetune/Step": 3122, "Finetune/Step Time": 2.9049104675650597} +{"Finetune/Learning Rate": 6.424933392283108e-06, "Finetune/Loss": 0.7952929735183716, "Finetune/Loss (Raw)": 0.8547617793083191, "Finetune/Step": 3123, "Finetune/Step Time": 2.90741078928113} +{"Finetune/Learning Rate": 6.418853390636363e-06, "Finetune/Loss": 0.7970544099807739, "Finetune/Loss (Raw)": 0.8026700019836426, "Finetune/Step": 3124, "Finetune/Step Time": 2.883666755631566} +{"Finetune/Learning Rate": 6.412774907183353e-06, "Finetune/Loss": 0.7969450354576111, "Finetune/Loss (Raw)": 0.8197450637817383, "Finetune/Step": 3125, "Finetune/Step Time": 2.8834326341748238} +{"Finetune/Learning Rate": 6.406697944500997e-06, "Finetune/Loss": 0.7970489263534546, "Finetune/Loss (Raw)": 0.7688654065132141, "Finetune/Step": 3126, "Finetune/Step Time": 2.8882585652172565} +{"Finetune/Learning Rate": 6.400622505165569e-06, "Finetune/Loss": 0.7962424755096436, "Finetune/Loss (Raw)": 0.7674291133880615, "Finetune/Step": 3127, "Finetune/Step Time": 2.884734271094203} +{"Finetune/Learning Rate": 6.39454859175269e-06, "Finetune/Loss": 0.7970719337463379, "Finetune/Loss (Raw)": 0.7984414100646973, "Finetune/Step": 3128, "Finetune/Step Time": 2.8638341017067432} +{"Finetune/Learning Rate": 6.388476206837343e-06, "Finetune/Loss": 0.7969413995742798, "Finetune/Loss (Raw)": 0.8248481750488281, "Finetune/Step": 3129, "Finetune/Step Time": 2.8686720114201307} +{"Finetune/Learning Rate": 6.382405352993857e-06, "Finetune/Loss": 0.7968319654464722, "Finetune/Loss (Raw)": 0.7832563519477844, "Finetune/Step": 3130, "Finetune/Step Time": 2.8710870314389467} +{"Finetune/Learning Rate": 6.3763360327959176e-06, "Finetune/Loss": 0.7975538372993469, "Finetune/Loss (Raw)": 0.8175423741340637, "Finetune/Step": 3131, "Finetune/Step Time": 2.872245281934738} +{"Finetune/Learning Rate": 6.37026824881655e-06, "Finetune/Loss": 0.7969293594360352, "Finetune/Loss (Raw)": 0.8383505940437317, "Finetune/Step": 3132, "Finetune/Step Time": 2.8695291317999363} +{"Finetune/Learning Rate": 6.364202003628142e-06, "Finetune/Loss": 0.7978546619415283, "Finetune/Loss (Raw)": 0.787969172000885, "Finetune/Step": 3133, "Finetune/Step Time": 2.849542737007141} +{"Finetune/Learning Rate": 6.358137299802416e-06, "Finetune/Loss": 0.7980650067329407, "Finetune/Loss (Raw)": 0.7569836974143982, "Finetune/Step": 3134, "Finetune/Step Time": 2.8550710640847683} +{"Finetune/Learning Rate": 6.3520741399104495e-06, "Finetune/Loss": 0.7973065376281738, "Finetune/Loss (Raw)": 0.7560037970542908, "Finetune/Step": 3135, "Finetune/Step Time": 2.8532075490802526} +{"Finetune/Learning Rate": 6.34601252652266e-06, "Finetune/Loss": 0.7964609265327454, "Finetune/Loss (Raw)": 0.700475811958313, "Finetune/Step": 3136, "Finetune/Step Time": 2.8571540284901857} +{"Finetune/Learning Rate": 6.339952462208814e-06, "Finetune/Loss": 0.7972493171691895, "Finetune/Loss (Raw)": 0.8389415740966797, "Finetune/Step": 3137, "Finetune/Step Time": 2.8555553406476974} +{"Finetune/Learning Rate": 6.333893949538024e-06, "Finetune/Loss": 0.795102059841156, "Finetune/Loss (Raw)": 0.5200645923614502, "Finetune/Step": 3138, "Finetune/Step Time": 2.874966708943248} +{"Finetune/Learning Rate": 6.327836991078733e-06, "Finetune/Loss": 0.7951839566230774, "Finetune/Loss (Raw)": 0.8684958815574646, "Finetune/Step": 3139, "Finetune/Step Time": 2.8764800932258368} +{"Finetune/Learning Rate": 6.321781589398731e-06, "Finetune/Loss": 0.7954554557800293, "Finetune/Loss (Raw)": 0.8318061232566833, "Finetune/Step": 3140, "Finetune/Step Time": 2.878312923014164} +{"Finetune/Learning Rate": 6.3157277470651575e-06, "Finetune/Loss": 0.7956282496452332, "Finetune/Loss (Raw)": 0.8526555895805359, "Finetune/Step": 3141, "Finetune/Step Time": 2.879360605031252} +{"Finetune/Learning Rate": 6.309675466644474e-06, "Finetune/Loss": 0.7960747480392456, "Finetune/Loss (Raw)": 0.9238019585609436, "Finetune/Step": 3142, "Finetune/Step Time": 2.877204639837146} +{"Finetune/Learning Rate": 6.303624750702494e-06, "Finetune/Loss": 0.7959062457084656, "Finetune/Loss (Raw)": 0.8803325891494751, "Finetune/Step": 3143, "Finetune/Step Time": 2.8769941963255405} +{"Finetune/Learning Rate": 6.297575601804357e-06, "Finetune/Loss": 0.7952951192855835, "Finetune/Loss (Raw)": 0.6247766613960266, "Finetune/Step": 3144, "Finetune/Step Time": 2.90020009316504} +{"Finetune/Learning Rate": 6.291528022514552e-06, "Finetune/Loss": 0.7952584028244019, "Finetune/Loss (Raw)": 0.7812950611114502, "Finetune/Step": 3145, "Finetune/Step Time": 2.8983842488378286} +{"Finetune/Learning Rate": 6.285482015396883e-06, "Finetune/Loss": 0.7948448061943054, "Finetune/Loss (Raw)": 0.7365853190422058, "Finetune/Step": 3146, "Finetune/Step Time": 2.8976217191666365} +{"Finetune/Learning Rate": 6.279437583014507e-06, "Finetune/Loss": 0.7944980263710022, "Finetune/Loss (Raw)": 0.7418573498725891, "Finetune/Step": 3147, "Finetune/Step Time": 2.8941808100789785} +{"Finetune/Learning Rate": 6.2733947279299e-06, "Finetune/Loss": 0.7935575246810913, "Finetune/Loss (Raw)": 0.6930826902389526, "Finetune/Step": 3148, "Finetune/Step Time": 2.918668959289789} +{"Finetune/Learning Rate": 6.267353452704876e-06, "Finetune/Loss": 0.7922766208648682, "Finetune/Loss (Raw)": 0.8104715943336487, "Finetune/Step": 3149, "Finetune/Step Time": 2.8908056188374758} +{"Finetune/Learning Rate": 6.261313759900576e-06, "Finetune/Loss": 0.791592001914978, "Finetune/Loss (Raw)": 0.769528329372406, "Finetune/Step": 3150, "Finetune/Step Time": 2.888464320451021} +{"Finetune/Learning Rate": 6.255275652077471e-06, "Finetune/Loss": 0.7918277382850647, "Finetune/Loss (Raw)": 0.8045996427536011, "Finetune/Step": 3151, "Finetune/Step Time": 2.8845875337719917} +{"Finetune/Learning Rate": 6.249239131795366e-06, "Finetune/Loss": 0.7927178740501404, "Finetune/Loss (Raw)": 0.8542672991752625, "Finetune/Step": 3152, "Finetune/Step Time": 2.882567936554551} +{"Finetune/Learning Rate": 6.243204201613382e-06, "Finetune/Loss": 0.7923518419265747, "Finetune/Loss (Raw)": 0.8706256151199341, "Finetune/Step": 3153, "Finetune/Step Time": 2.8818075489252806} +{"Finetune/Learning Rate": 6.237170864089972e-06, "Finetune/Loss": 0.7924712896347046, "Finetune/Loss (Raw)": 0.7904937863349915, "Finetune/Step": 3154, "Finetune/Step Time": 2.881623176857829} +{"Finetune/Learning Rate": 6.231139121782916e-06, "Finetune/Loss": 0.7934455871582031, "Finetune/Loss (Raw)": 0.7119746804237366, "Finetune/Step": 3155, "Finetune/Step Time": 2.85960035584867} +{"Finetune/Learning Rate": 6.225108977249311e-06, "Finetune/Loss": 0.7936956882476807, "Finetune/Loss (Raw)": 0.7358801960945129, "Finetune/Step": 3156, "Finetune/Step Time": 2.855078436434269} +{"Finetune/Learning Rate": 6.219080433045583e-06, "Finetune/Loss": 0.7935510277748108, "Finetune/Loss (Raw)": 0.8408279418945312, "Finetune/Step": 3157, "Finetune/Step Time": 2.855701567605138} +{"Finetune/Learning Rate": 6.213053491727477e-06, "Finetune/Loss": 0.7934717535972595, "Finetune/Loss (Raw)": 0.84104984998703, "Finetune/Step": 3158, "Finetune/Step Time": 2.8550879154354334} +{"Finetune/Learning Rate": 6.207028155850061e-06, "Finetune/Loss": 0.7940018773078918, "Finetune/Loss (Raw)": 0.8302424550056458, "Finetune/Step": 3159, "Finetune/Step Time": 2.853317905217409} +{"Finetune/Learning Rate": 6.201004427967714e-06, "Finetune/Loss": 0.7939659953117371, "Finetune/Loss (Raw)": 0.8432533144950867, "Finetune/Step": 3160, "Finetune/Step Time": 2.8630202785134315} +{"Finetune/Learning Rate": 6.194982310634143e-06, "Finetune/Loss": 0.794032633304596, "Finetune/Loss (Raw)": 0.8074652552604675, "Finetune/Step": 3161, "Finetune/Step Time": 2.8632417023181915} +{"Finetune/Learning Rate": 6.188961806402371e-06, "Finetune/Loss": 0.794035792350769, "Finetune/Loss (Raw)": 0.8135654330253601, "Finetune/Step": 3162, "Finetune/Step Time": 2.8624145351350307} +{"Finetune/Learning Rate": 6.18294291782473e-06, "Finetune/Loss": 0.794089674949646, "Finetune/Loss (Raw)": 0.8481987714767456, "Finetune/Step": 3163, "Finetune/Step Time": 2.8567461390048265} +{"Finetune/Learning Rate": 6.1769256474528734e-06, "Finetune/Loss": 0.7929867506027222, "Finetune/Loss (Raw)": 0.7521679997444153, "Finetune/Step": 3164, "Finetune/Step Time": 2.8566414173692465} +{"Finetune/Learning Rate": 6.170909997837767e-06, "Finetune/Loss": 0.793541669845581, "Finetune/Loss (Raw)": 0.8427474498748779, "Finetune/Step": 3165, "Finetune/Step Time": 2.8579000402241945} +{"Finetune/Learning Rate": 6.164895971529692e-06, "Finetune/Loss": 0.7949177622795105, "Finetune/Loss (Raw)": 0.8913357257843018, "Finetune/Step": 3166, "Finetune/Step Time": 2.8591707590967417} +{"Finetune/Learning Rate": 6.158883571078236e-06, "Finetune/Loss": 0.7930859327316284, "Finetune/Loss (Raw)": 0.6678286194801331, "Finetune/Step": 3167, "Finetune/Step Time": 2.864615036174655} +{"Finetune/Learning Rate": 6.152872799032297e-06, "Finetune/Loss": 0.7942424416542053, "Finetune/Loss (Raw)": 0.7502322793006897, "Finetune/Step": 3168, "Finetune/Step Time": 2.845817821100354} +{"Finetune/Learning Rate": 6.146863657940094e-06, "Finetune/Loss": 0.7937374711036682, "Finetune/Loss (Raw)": 0.811407744884491, "Finetune/Step": 3169, "Finetune/Step Time": 2.8473098445683718} +{"Finetune/Learning Rate": 6.14085615034914e-06, "Finetune/Loss": 0.7934972047805786, "Finetune/Loss (Raw)": 0.7615954875946045, "Finetune/Step": 3170, "Finetune/Step Time": 2.8470974657684565} +{"Finetune/Learning Rate": 6.1348502788062625e-06, "Finetune/Loss": 0.7931832075119019, "Finetune/Loss (Raw)": 0.7082510590553284, "Finetune/Step": 3171, "Finetune/Step Time": 2.8448360841721296} +{"Finetune/Learning Rate": 6.128846045857595e-06, "Finetune/Loss": 0.7928521633148193, "Finetune/Loss (Raw)": 0.8421066999435425, "Finetune/Step": 3172, "Finetune/Step Time": 2.8461394235491753} +{"Finetune/Learning Rate": 6.122843454048581e-06, "Finetune/Loss": 0.7931132316589355, "Finetune/Loss (Raw)": 0.829724907875061, "Finetune/Step": 3173, "Finetune/Step Time": 2.8453003726899624} +{"Finetune/Learning Rate": 6.116842505923955e-06, "Finetune/Loss": 0.7951616644859314, "Finetune/Loss (Raw)": 0.8561912775039673, "Finetune/Step": 3174, "Finetune/Step Time": 2.82093702070415} +{"Finetune/Learning Rate": 6.110843204027768e-06, "Finetune/Loss": 0.7962620854377747, "Finetune/Loss (Raw)": 0.9989243149757385, "Finetune/Step": 3175, "Finetune/Step Time": 2.825265634804964} +{"Finetune/Learning Rate": 6.104845550903372e-06, "Finetune/Loss": 0.7963359951972961, "Finetune/Loss (Raw)": 0.7826000452041626, "Finetune/Step": 3176, "Finetune/Step Time": 2.8152798246592283} +{"Finetune/Learning Rate": 6.098849549093408e-06, "Finetune/Loss": 0.7961483001708984, "Finetune/Loss (Raw)": 0.7887230515480042, "Finetune/Step": 3177, "Finetune/Step Time": 2.8172635473310947} +{"Finetune/Learning Rate": 6.092855201139829e-06, "Finetune/Loss": 0.7968807220458984, "Finetune/Loss (Raw)": 0.8829577565193176, "Finetune/Step": 3178, "Finetune/Step Time": 2.8197783529758453} +{"Finetune/Learning Rate": 6.086862509583882e-06, "Finetune/Loss": 0.7970354557037354, "Finetune/Loss (Raw)": 0.8706179857254028, "Finetune/Step": 3179, "Finetune/Step Time": 2.8209627363830805} +{"Finetune/Learning Rate": 6.080871476966117e-06, "Finetune/Loss": 0.7971532940864563, "Finetune/Loss (Raw)": 0.9007032513618469, "Finetune/Step": 3180, "Finetune/Step Time": 2.818946836516261} +{"Finetune/Learning Rate": 6.074882105826372e-06, "Finetune/Loss": 0.7968580722808838, "Finetune/Loss (Raw)": 0.7333008646965027, "Finetune/Step": 3181, "Finetune/Step Time": 2.8184956833720207} +{"Finetune/Learning Rate": 6.068894398703784e-06, "Finetune/Loss": 0.7975820302963257, "Finetune/Loss (Raw)": 0.8063902258872986, "Finetune/Step": 3182, "Finetune/Step Time": 2.8210882283747196} +{"Finetune/Learning Rate": 6.062908358136792e-06, "Finetune/Loss": 0.797667384147644, "Finetune/Loss (Raw)": 0.7984998226165771, "Finetune/Step": 3183, "Finetune/Step Time": 2.8243791200220585} +{"Finetune/Learning Rate": 6.056923986663112e-06, "Finetune/Loss": 0.7971594333648682, "Finetune/Loss (Raw)": 0.7250623106956482, "Finetune/Step": 3184, "Finetune/Step Time": 2.8276126496493816} +{"Finetune/Learning Rate": 6.050941286819771e-06, "Finetune/Loss": 0.7977802753448486, "Finetune/Loss (Raw)": 0.901198148727417, "Finetune/Step": 3185, "Finetune/Step Time": 2.82951651327312} +{"Finetune/Learning Rate": 6.044960261143078e-06, "Finetune/Loss": 0.7983837723731995, "Finetune/Loss (Raw)": 0.9293574690818787, "Finetune/Step": 3186, "Finetune/Step Time": 2.8281480725854635} +{"Finetune/Learning Rate": 6.03898091216863e-06, "Finetune/Loss": 0.7981986403465271, "Finetune/Loss (Raw)": 0.7877774238586426, "Finetune/Step": 3187, "Finetune/Step Time": 2.8298668079078197} +{"Finetune/Learning Rate": 6.033003242431315e-06, "Finetune/Loss": 0.7984120845794678, "Finetune/Loss (Raw)": 0.8286426663398743, "Finetune/Step": 3188, "Finetune/Step Time": 2.826721204444766} +{"Finetune/Learning Rate": 6.027027254465314e-06, "Finetune/Loss": 0.7976193428039551, "Finetune/Loss (Raw)": 0.7974320650100708, "Finetune/Step": 3189, "Finetune/Step Time": 2.8265479542315006} +{"Finetune/Learning Rate": 6.021052950804095e-06, "Finetune/Loss": 0.7983262538909912, "Finetune/Loss (Raw)": 0.8324390649795532, "Finetune/Step": 3190, "Finetune/Step Time": 2.825399188324809} +{"Finetune/Learning Rate": 6.015080333980401e-06, "Finetune/Loss": 0.7990046143531799, "Finetune/Loss (Raw)": 0.8628969192504883, "Finetune/Step": 3191, "Finetune/Step Time": 2.82833912037313} +{"Finetune/Learning Rate": 6.009109406526268e-06, "Finetune/Loss": 0.7993378043174744, "Finetune/Loss (Raw)": 0.8329088091850281, "Finetune/Step": 3192, "Finetune/Step Time": 2.828648528084159} +{"Finetune/Learning Rate": 6.003140170973022e-06, "Finetune/Loss": 0.8000199198722839, "Finetune/Loss (Raw)": 0.8130942583084106, "Finetune/Step": 3193, "Finetune/Step Time": 2.8295463360846043} +{"Finetune/Learning Rate": 5.997172629851256e-06, "Finetune/Loss": 0.8007591962814331, "Finetune/Loss (Raw)": 0.8164075613021851, "Finetune/Step": 3194, "Finetune/Step Time": 2.82859324850142} +{"Finetune/Learning Rate": 5.991206785690858e-06, "Finetune/Loss": 0.801023006439209, "Finetune/Loss (Raw)": 0.8107530474662781, "Finetune/Step": 3195, "Finetune/Step Time": 2.8341145385056734} +{"Finetune/Learning Rate": 5.985242641020989e-06, "Finetune/Loss": 0.8003184795379639, "Finetune/Loss (Raw)": 0.7627463340759277, "Finetune/Step": 3196, "Finetune/Step Time": 2.833511110395193} +{"Finetune/Learning Rate": 5.979280198370101e-06, "Finetune/Loss": 0.8010956645011902, "Finetune/Loss (Raw)": 0.7590476870536804, "Finetune/Step": 3197, "Finetune/Step Time": 2.834688825532794} +{"Finetune/Learning Rate": 5.973319460265905e-06, "Finetune/Loss": 0.8016927242279053, "Finetune/Loss (Raw)": 0.8767032623291016, "Finetune/Step": 3198, "Finetune/Step Time": 2.832386337220669} +{"Finetune/Learning Rate": 5.967360429235407e-06, "Finetune/Loss": 0.8018399477005005, "Finetune/Loss (Raw)": 0.8232117891311646, "Finetune/Step": 3199, "Finetune/Step Time": 2.832560380920768} +{"Finetune/Learning Rate": 5.961403107804882e-06, "Finetune/Loss": 0.8023996949195862, "Finetune/Loss (Raw)": 0.821839451789856, "Finetune/Step": 3200, "Finetune/Step Time": 2.8302157055586576} +{"Finetune/Learning Rate": 5.95544749849988e-06, "Finetune/Loss": 0.8020647764205933, "Finetune/Loss (Raw)": 0.8641118407249451, "Finetune/Step": 3201, "Finetune/Step Time": 2.8276413548737764} +{"Finetune/Learning Rate": 5.949493603845222e-06, "Finetune/Loss": 0.800406813621521, "Finetune/Loss (Raw)": 0.6474589705467224, "Finetune/Step": 3202, "Finetune/Step Time": 2.850366909056902} +{"Finetune/Learning Rate": 5.943541426365013e-06, "Finetune/Loss": 0.8009317517280579, "Finetune/Loss (Raw)": 0.847176730632782, "Finetune/Step": 3203, "Finetune/Step Time": 2.85092150606215} +{"Finetune/Learning Rate": 5.937590968582623e-06, "Finetune/Loss": 0.7996188998222351, "Finetune/Loss (Raw)": 0.6891805529594421, "Finetune/Step": 3204, "Finetune/Step Time": 2.8516383450478315} +{"Finetune/Learning Rate": 5.931642233020688e-06, "Finetune/Loss": 0.801407516002655, "Finetune/Loss (Raw)": 0.8286088109016418, "Finetune/Step": 3205, "Finetune/Step Time": 2.8324128556996584} +{"Finetune/Learning Rate": 5.92569522220112e-06, "Finetune/Loss": 0.8025864362716675, "Finetune/Loss (Raw)": 0.9030203819274902, "Finetune/Step": 3206, "Finetune/Step Time": 2.8359832670539618} +{"Finetune/Learning Rate": 5.919749938645105e-06, "Finetune/Loss": 0.8042097091674805, "Finetune/Loss (Raw)": 0.9102799892425537, "Finetune/Step": 3207, "Finetune/Step Time": 2.8124795351177454} +{"Finetune/Learning Rate": 5.913806384873082e-06, "Finetune/Loss": 0.8036667704582214, "Finetune/Loss (Raw)": 0.7524867653846741, "Finetune/Step": 3208, "Finetune/Step Time": 2.8077888544648886} +{"Finetune/Learning Rate": 5.90786456340477e-06, "Finetune/Loss": 0.8035398721694946, "Finetune/Loss (Raw)": 0.8406261205673218, "Finetune/Step": 3209, "Finetune/Step Time": 2.783087158575654} +{"Finetune/Learning Rate": 5.901924476759147e-06, "Finetune/Loss": 0.8022282123565674, "Finetune/Loss (Raw)": 0.6059525012969971, "Finetune/Step": 3210, "Finetune/Step Time": 2.800466012209654} +{"Finetune/Learning Rate": 5.895986127454463e-06, "Finetune/Loss": 0.7966973781585693, "Finetune/Loss (Raw)": 0.18745644390583038, "Finetune/Step": 3211, "Finetune/Step Time": 2.839972123503685} +{"Finetune/Learning Rate": 5.890049518008215e-06, "Finetune/Loss": 0.796289324760437, "Finetune/Loss (Raw)": 0.838252067565918, "Finetune/Step": 3212, "Finetune/Step Time": 2.8408583346754313} +{"Finetune/Learning Rate": 5.884114650937182e-06, "Finetune/Loss": 0.7964522242546082, "Finetune/Loss (Raw)": 0.8909990191459656, "Finetune/Step": 3213, "Finetune/Step Time": 2.8375442661345005} +{"Finetune/Learning Rate": 5.8781815287573955e-06, "Finetune/Loss": 0.7978169918060303, "Finetune/Loss (Raw)": 0.8487533926963806, "Finetune/Step": 3214, "Finetune/Step Time": 2.838863894343376} +{"Finetune/Learning Rate": 5.872250153984143e-06, "Finetune/Loss": 0.7952375411987305, "Finetune/Loss (Raw)": 0.4010007977485657, "Finetune/Step": 3215, "Finetune/Step Time": 2.8715646769851446} +{"Finetune/Learning Rate": 5.8663205291319765e-06, "Finetune/Loss": 0.7947167754173279, "Finetune/Loss (Raw)": 0.7873346209526062, "Finetune/Step": 3216, "Finetune/Step Time": 2.881837274879217} +{"Finetune/Learning Rate": 5.860392656714706e-06, "Finetune/Loss": 0.7933419346809387, "Finetune/Loss (Raw)": 0.7347316741943359, "Finetune/Step": 3217, "Finetune/Step Time": 2.8811895735561848} +{"Finetune/Learning Rate": 5.854466539245403e-06, "Finetune/Loss": 0.7932077646255493, "Finetune/Loss (Raw)": 0.7003628015518188, "Finetune/Step": 3218, "Finetune/Step Time": 2.881284885108471} +{"Finetune/Learning Rate": 5.8485421792363804e-06, "Finetune/Loss": 0.7935808897018433, "Finetune/Loss (Raw)": 0.7730415463447571, "Finetune/Step": 3219, "Finetune/Step Time": 2.8831539265811443} +{"Finetune/Learning Rate": 5.84261957919922e-06, "Finetune/Loss": 0.7942742109298706, "Finetune/Loss (Raw)": 0.8721365928649902, "Finetune/Step": 3220, "Finetune/Step Time": 2.882594721391797} +{"Finetune/Learning Rate": 5.836698741644753e-06, "Finetune/Loss": 0.793769121170044, "Finetune/Loss (Raw)": 0.8775347471237183, "Finetune/Step": 3221, "Finetune/Step Time": 2.882714692503214} +{"Finetune/Learning Rate": 5.830779669083064e-06, "Finetune/Loss": 0.7920109033584595, "Finetune/Loss (Raw)": 0.6088135838508606, "Finetune/Step": 3222, "Finetune/Step Time": 2.902213351801038} +{"Finetune/Learning Rate": 5.824862364023489e-06, "Finetune/Loss": 0.7914498448371887, "Finetune/Loss (Raw)": 0.7432056665420532, "Finetune/Step": 3223, "Finetune/Step Time": 2.904023999348283} +{"Finetune/Learning Rate": 5.8189468289746075e-06, "Finetune/Loss": 0.7901250123977661, "Finetune/Loss (Raw)": 0.6889198422431946, "Finetune/Step": 3224, "Finetune/Step Time": 2.9071794487535954} +{"Finetune/Learning Rate": 5.813033066444269e-06, "Finetune/Loss": 0.7899086475372314, "Finetune/Loss (Raw)": 0.8151918649673462, "Finetune/Step": 3225, "Finetune/Step Time": 2.9052460063248873} +{"Finetune/Learning Rate": 5.807121078939546e-06, "Finetune/Loss": 0.7892157435417175, "Finetune/Loss (Raw)": 0.7074707746505737, "Finetune/Step": 3226, "Finetune/Step Time": 2.903778627514839} +{"Finetune/Learning Rate": 5.801210868966771e-06, "Finetune/Loss": 0.7885848879814148, "Finetune/Loss (Raw)": 0.7529146671295166, "Finetune/Step": 3227, "Finetune/Step Time": 2.9021867979317904} +{"Finetune/Learning Rate": 5.7953024390315345e-06, "Finetune/Loss": 0.788954496383667, "Finetune/Loss (Raw)": 0.8001846075057983, "Finetune/Step": 3228, "Finetune/Step Time": 2.9031023792922497} +{"Finetune/Learning Rate": 5.789395791638643e-06, "Finetune/Loss": 0.7882925271987915, "Finetune/Loss (Raw)": 0.7872352600097656, "Finetune/Step": 3229, "Finetune/Step Time": 2.8979397378861904} +{"Finetune/Learning Rate": 5.783490929292179e-06, "Finetune/Loss": 0.7881358861923218, "Finetune/Loss (Raw)": 0.6045020222663879, "Finetune/Step": 3230, "Finetune/Step Time": 2.9010586570948362} +{"Finetune/Learning Rate": 5.777587854495448e-06, "Finetune/Loss": 0.7898745536804199, "Finetune/Loss (Raw)": 0.8054654598236084, "Finetune/Step": 3231, "Finetune/Step Time": 2.8750078473240137} +{"Finetune/Learning Rate": 5.771686569751002e-06, "Finetune/Loss": 0.7899375557899475, "Finetune/Loss (Raw)": 0.8040398955345154, "Finetune/Step": 3232, "Finetune/Step Time": 2.8663707952946424} +{"Finetune/Learning Rate": 5.76578707756064e-06, "Finetune/Loss": 0.7908946871757507, "Finetune/Loss (Raw)": 0.8879140615463257, "Finetune/Step": 3233, "Finetune/Step Time": 2.8678845148533583} +{"Finetune/Learning Rate": 5.759889380425393e-06, "Finetune/Loss": 0.7916345596313477, "Finetune/Loss (Raw)": 0.8529813885688782, "Finetune/Step": 3234, "Finetune/Step Time": 2.8635756820440292} +{"Finetune/Learning Rate": 5.753993480845537e-06, "Finetune/Loss": 0.7937803268432617, "Finetune/Loss (Raw)": 0.841944694519043, "Finetune/Step": 3235, "Finetune/Step Time": 2.8426508996635675} +{"Finetune/Learning Rate": 5.748099381320582e-06, "Finetune/Loss": 0.7941224575042725, "Finetune/Loss (Raw)": 0.8510995507240295, "Finetune/Step": 3236, "Finetune/Step Time": 2.8429300636053085} +{"Finetune/Learning Rate": 5.742207084349274e-06, "Finetune/Loss": 0.7940530776977539, "Finetune/Loss (Raw)": 0.7632289528846741, "Finetune/Step": 3237, "Finetune/Step Time": 2.8422014247626066} +{"Finetune/Learning Rate": 5.736316592429603e-06, "Finetune/Loss": 0.7941091060638428, "Finetune/Loss (Raw)": 0.8613986968994141, "Finetune/Step": 3238, "Finetune/Step Time": 2.8429087810218334} +{"Finetune/Learning Rate": 5.730427908058788e-06, "Finetune/Loss": 0.794420599937439, "Finetune/Loss (Raw)": 0.683587372303009, "Finetune/Step": 3239, "Finetune/Step Time": 2.8217712324112654} +{"Finetune/Learning Rate": 5.724541033733278e-06, "Finetune/Loss": 0.7936100959777832, "Finetune/Loss (Raw)": 0.8219437599182129, "Finetune/Step": 3240, "Finetune/Step Time": 2.8216169327497482} +{"Finetune/Learning Rate": 5.718655971948762e-06, "Finetune/Loss": 0.7933950424194336, "Finetune/Loss (Raw)": 0.8544427156448364, "Finetune/Step": 3241, "Finetune/Step Time": 2.81912081502378} +{"Finetune/Learning Rate": 5.712772725200155e-06, "Finetune/Loss": 0.7941253185272217, "Finetune/Loss (Raw)": 0.8718204498291016, "Finetune/Step": 3242, "Finetune/Step Time": 2.8181958328932524} +{"Finetune/Learning Rate": 5.706891295981605e-06, "Finetune/Loss": 0.7940913438796997, "Finetune/Loss (Raw)": 0.8282111287117004, "Finetune/Step": 3243, "Finetune/Step Time": 2.816649954766035} +{"Finetune/Learning Rate": 5.701011686786488e-06, "Finetune/Loss": 0.7934897541999817, "Finetune/Loss (Raw)": 0.7901906371116638, "Finetune/Step": 3244, "Finetune/Step Time": 2.8128220662474632} +{"Finetune/Learning Rate": 5.695133900107408e-06, "Finetune/Loss": 0.7936984300613403, "Finetune/Loss (Raw)": 0.9160011410713196, "Finetune/Step": 3245, "Finetune/Step Time": 2.8108244258910418} +{"Finetune/Learning Rate": 5.689257938436209e-06, "Finetune/Loss": 0.794095516204834, "Finetune/Loss (Raw)": 0.8104372024536133, "Finetune/Step": 3246, "Finetune/Step Time": 2.7897272743284702} +{"Finetune/Learning Rate": 5.6833838042639335e-06, "Finetune/Loss": 0.7942060232162476, "Finetune/Loss (Raw)": 0.8070802688598633, "Finetune/Step": 3247, "Finetune/Step Time": 2.785243671387434} +{"Finetune/Learning Rate": 5.677511500080878e-06, "Finetune/Loss": 0.7924100756645203, "Finetune/Loss (Raw)": 0.6775702834129333, "Finetune/Step": 3248, "Finetune/Step Time": 2.786568069830537} +{"Finetune/Learning Rate": 5.671641028376547e-06, "Finetune/Loss": 0.7925733327865601, "Finetune/Loss (Raw)": 0.7952096462249756, "Finetune/Step": 3249, "Finetune/Step Time": 2.7848538365215063} +{"Finetune/Learning Rate": 5.665772391639672e-06, "Finetune/Loss": 0.7924096584320068, "Finetune/Loss (Raw)": 0.7936133742332458, "Finetune/Step": 3250, "Finetune/Step Time": 2.7853578869253397} +{"Finetune/Learning Rate": 5.65990559235821e-06, "Finetune/Loss": 0.7915531396865845, "Finetune/Loss (Raw)": 0.745137631893158, "Finetune/Step": 3251, "Finetune/Step Time": 2.780358573421836} +{"Finetune/Learning Rate": 5.654040633019328e-06, "Finetune/Loss": 0.7912183403968811, "Finetune/Loss (Raw)": 0.7598064541816711, "Finetune/Step": 3252, "Finetune/Step Time": 2.780302641913295} +{"Finetune/Learning Rate": 5.648177516109435e-06, "Finetune/Loss": 0.7913986444473267, "Finetune/Loss (Raw)": 0.8428282737731934, "Finetune/Step": 3253, "Finetune/Step Time": 2.778971403837204} +{"Finetune/Learning Rate": 5.642316244114131e-06, "Finetune/Loss": 0.7913410067558289, "Finetune/Loss (Raw)": 0.7614865303039551, "Finetune/Step": 3254, "Finetune/Step Time": 2.775910332798958} +{"Finetune/Learning Rate": 5.63645681951825e-06, "Finetune/Loss": 0.7914794087409973, "Finetune/Loss (Raw)": 0.7851406335830688, "Finetune/Step": 3255, "Finetune/Step Time": 2.7768466398119926} +{"Finetune/Learning Rate": 5.63059924480585e-06, "Finetune/Loss": 0.7890293598175049, "Finetune/Loss (Raw)": 0.4848380386829376, "Finetune/Step": 3256, "Finetune/Step Time": 2.798098396509886} +{"Finetune/Learning Rate": 5.624743522460181e-06, "Finetune/Loss": 0.7892285585403442, "Finetune/Loss (Raw)": 0.8503496646881104, "Finetune/Step": 3257, "Finetune/Step Time": 2.7950851060450077} +{"Finetune/Learning Rate": 5.6188896549637325e-06, "Finetune/Loss": 0.7896794080734253, "Finetune/Loss (Raw)": 0.840959906578064, "Finetune/Step": 3258, "Finetune/Step Time": 2.7945214081555605} +{"Finetune/Learning Rate": 5.613037644798196e-06, "Finetune/Loss": 0.7900220155715942, "Finetune/Loss (Raw)": 0.8613964915275574, "Finetune/Step": 3259, "Finetune/Step Time": 2.7922309171408415} +{"Finetune/Learning Rate": 5.607187494444473e-06, "Finetune/Loss": 0.7889272570610046, "Finetune/Loss (Raw)": 0.6982240676879883, "Finetune/Step": 3260, "Finetune/Step Time": 2.7944966331124306} +{"Finetune/Learning Rate": 5.601339206382682e-06, "Finetune/Loss": 0.7891702651977539, "Finetune/Loss (Raw)": 0.8190733790397644, "Finetune/Step": 3261, "Finetune/Step Time": 2.793227968737483} +{"Finetune/Learning Rate": 5.595492783092151e-06, "Finetune/Loss": 0.7906800508499146, "Finetune/Loss (Raw)": 0.9502354860305786, "Finetune/Step": 3262, "Finetune/Step Time": 2.789754591882229} +{"Finetune/Learning Rate": 5.5896482270514144e-06, "Finetune/Loss": 0.7907798290252686, "Finetune/Loss (Raw)": 0.7687795758247375, "Finetune/Step": 3263, "Finetune/Step Time": 2.7905463073402643} +{"Finetune/Learning Rate": 5.58380554073822e-06, "Finetune/Loss": 0.7917272448539734, "Finetune/Loss (Raw)": 0.8217427134513855, "Finetune/Step": 3264, "Finetune/Step Time": 2.786354139447212} +{"Finetune/Learning Rate": 5.577964726629515e-06, "Finetune/Loss": 0.7909404039382935, "Finetune/Loss (Raw)": 0.7382221817970276, "Finetune/Step": 3265, "Finetune/Step Time": 2.786599103361368} +{"Finetune/Learning Rate": 5.572125787201464e-06, "Finetune/Loss": 0.7933797240257263, "Finetune/Loss (Raw)": 0.8322991132736206, "Finetune/Step": 3266, "Finetune/Step Time": 2.763786753639579} +{"Finetune/Learning Rate": 5.56628872492943e-06, "Finetune/Loss": 0.7922086715698242, "Finetune/Loss (Raw)": 0.7186021208763123, "Finetune/Step": 3267, "Finetune/Step Time": 2.7667696848511696} +{"Finetune/Learning Rate": 5.56045354228798e-06, "Finetune/Loss": 0.7913849353790283, "Finetune/Loss (Raw)": 0.7263695001602173, "Finetune/Step": 3268, "Finetune/Step Time": 2.786635233089328} +{"Finetune/Learning Rate": 5.554620241750887e-06, "Finetune/Loss": 0.7890598177909851, "Finetune/Loss (Raw)": 0.5550392270088196, "Finetune/Step": 3269, "Finetune/Step Time": 2.809534987434745} +{"Finetune/Learning Rate": 5.548788825791122e-06, "Finetune/Loss": 0.7884777784347534, "Finetune/Loss (Raw)": 0.8493064045906067, "Finetune/Step": 3270, "Finetune/Step Time": 2.808730587363243} +{"Finetune/Learning Rate": 5.542959296880859e-06, "Finetune/Loss": 0.7885472774505615, "Finetune/Loss (Raw)": 0.8892185091972351, "Finetune/Step": 3271, "Finetune/Step Time": 2.8112926594913006} +{"Finetune/Learning Rate": 5.537131657491475e-06, "Finetune/Loss": 0.7904577255249023, "Finetune/Loss (Raw)": 0.8693234324455261, "Finetune/Step": 3272, "Finetune/Step Time": 2.801078239455819} +{"Finetune/Learning Rate": 5.531305910093538e-06, "Finetune/Loss": 0.7906421422958374, "Finetune/Loss (Raw)": 0.8049020171165466, "Finetune/Step": 3273, "Finetune/Step Time": 2.79835469648242} +{"Finetune/Learning Rate": 5.525482057156833e-06, "Finetune/Loss": 0.7904545068740845, "Finetune/Loss (Raw)": 0.7125537991523743, "Finetune/Step": 3274, "Finetune/Step Time": 2.798356842249632} +{"Finetune/Learning Rate": 5.519660101150308e-06, "Finetune/Loss": 0.7887803912162781, "Finetune/Loss (Raw)": 0.5275796055793762, "Finetune/Step": 3275, "Finetune/Step Time": 2.8242562022060156} +{"Finetune/Learning Rate": 5.513840044542142e-06, "Finetune/Loss": 0.7898118495941162, "Finetune/Loss (Raw)": 0.825103759765625, "Finetune/Step": 3276, "Finetune/Step Time": 2.7969011943787336} +{"Finetune/Learning Rate": 5.50802188979969e-06, "Finetune/Loss": 0.7893627882003784, "Finetune/Loss (Raw)": 0.7529990077018738, "Finetune/Step": 3277, "Finetune/Step Time": 2.7974678482860327} +{"Finetune/Learning Rate": 5.502205639389507e-06, "Finetune/Loss": 0.7901602983474731, "Finetune/Loss (Raw)": 0.8716081976890564, "Finetune/Step": 3278, "Finetune/Step Time": 2.801004173234105} +{"Finetune/Learning Rate": 5.496391295777331e-06, "Finetune/Loss": 0.7905644774436951, "Finetune/Loss (Raw)": 0.8563324809074402, "Finetune/Step": 3279, "Finetune/Step Time": 2.802364921197295} +{"Finetune/Learning Rate": 5.4905788614281005e-06, "Finetune/Loss": 0.791067898273468, "Finetune/Loss (Raw)": 0.9187084436416626, "Finetune/Step": 3280, "Finetune/Step Time": 2.8045805487781763} +{"Finetune/Learning Rate": 5.484768338805955e-06, "Finetune/Loss": 0.790460467338562, "Finetune/Loss (Raw)": 0.7928749322891235, "Finetune/Step": 3281, "Finetune/Step Time": 2.802963687106967} +{"Finetune/Learning Rate": 5.478959730374195e-06, "Finetune/Loss": 0.7906794548034668, "Finetune/Loss (Raw)": 0.8185216188430786, "Finetune/Step": 3282, "Finetune/Step Time": 2.806681739166379} +{"Finetune/Learning Rate": 5.473153038595329e-06, "Finetune/Loss": 0.7918555736541748, "Finetune/Loss (Raw)": 0.8625203967094421, "Finetune/Step": 3283, "Finetune/Step Time": 2.8089049961417913} +{"Finetune/Learning Rate": 5.467348265931063e-06, "Finetune/Loss": 0.7926359176635742, "Finetune/Loss (Raw)": 0.8357582092285156, "Finetune/Step": 3284, "Finetune/Step Time": 2.8109868559986353} +{"Finetune/Learning Rate": 5.461545414842259e-06, "Finetune/Loss": 0.7927946448326111, "Finetune/Loss (Raw)": 0.8611479997634888, "Finetune/Step": 3285, "Finetune/Step Time": 2.809923132881522} +{"Finetune/Learning Rate": 5.455744487788992e-06, "Finetune/Loss": 0.7920611500740051, "Finetune/Loss (Raw)": 0.7471656203269958, "Finetune/Step": 3286, "Finetune/Step Time": 2.8133266493678093} +{"Finetune/Learning Rate": 5.44994548723051e-06, "Finetune/Loss": 0.7922238111495972, "Finetune/Loss (Raw)": 0.8510575294494629, "Finetune/Step": 3287, "Finetune/Step Time": 2.813087409362197} +{"Finetune/Learning Rate": 5.4441484156252425e-06, "Finetune/Loss": 0.7917085886001587, "Finetune/Loss (Raw)": 0.7773039937019348, "Finetune/Step": 3288, "Finetune/Step Time": 2.8033634200692177} +{"Finetune/Learning Rate": 5.4383532754308055e-06, "Finetune/Loss": 0.7919861078262329, "Finetune/Loss (Raw)": 0.8429919481277466, "Finetune/Step": 3289, "Finetune/Step Time": 2.8024598583579063} +{"Finetune/Learning Rate": 5.432560069103991e-06, "Finetune/Loss": 0.7919882535934448, "Finetune/Loss (Raw)": 0.813834011554718, "Finetune/Step": 3290, "Finetune/Step Time": 2.8047786597162485} +{"Finetune/Learning Rate": 5.426768799100785e-06, "Finetune/Loss": 0.7905930280685425, "Finetune/Loss (Raw)": 0.6696213483810425, "Finetune/Step": 3291, "Finetune/Step Time": 2.827277034521103} +{"Finetune/Learning Rate": 5.420979467876333e-06, "Finetune/Loss": 0.7906148433685303, "Finetune/Loss (Raw)": 0.7549517750740051, "Finetune/Step": 3292, "Finetune/Step Time": 2.826556947082281} +{"Finetune/Learning Rate": 5.415192077884967e-06, "Finetune/Loss": 0.7897883653640747, "Finetune/Loss (Raw)": 0.7369611859321594, "Finetune/Step": 3293, "Finetune/Step Time": 2.826930332928896} +{"Finetune/Learning Rate": 5.409406631580203e-06, "Finetune/Loss": 0.7874041795730591, "Finetune/Loss (Raw)": 0.5861560702323914, "Finetune/Step": 3294, "Finetune/Step Time": 2.848649498075247} +{"Finetune/Learning Rate": 5.4036231314147255e-06, "Finetune/Loss": 0.7880438566207886, "Finetune/Loss (Raw)": 0.7497101426124573, "Finetune/Step": 3295, "Finetune/Step Time": 2.843910278752446} +{"Finetune/Learning Rate": 5.397841579840396e-06, "Finetune/Loss": 0.7884790897369385, "Finetune/Loss (Raw)": 0.8059479594230652, "Finetune/Step": 3296, "Finetune/Step Time": 2.840346137061715} +{"Finetune/Learning Rate": 5.392061979308247e-06, "Finetune/Loss": 0.7884078621864319, "Finetune/Loss (Raw)": 0.8022844195365906, "Finetune/Step": 3297, "Finetune/Step Time": 2.8425931222736835} +{"Finetune/Learning Rate": 5.386284332268489e-06, "Finetune/Loss": 0.7890963554382324, "Finetune/Loss (Raw)": 0.8497240543365479, "Finetune/Step": 3298, "Finetune/Step Time": 2.842581393197179} +{"Finetune/Learning Rate": 5.380508641170499e-06, "Finetune/Loss": 0.789696216583252, "Finetune/Loss (Raw)": 0.7850310802459717, "Finetune/Step": 3299, "Finetune/Step Time": 2.8438722379505634} +{"Finetune/Learning Rate": 5.374734908462829e-06, "Finetune/Loss": 0.7881404161453247, "Finetune/Loss (Raw)": 0.6429659724235535, "Finetune/Step": 3300, "Finetune/Step Time": 2.8693603929132223} +{"Finetune/Learning Rate": 5.368963136593195e-06, "Finetune/Loss": 0.7881503701210022, "Finetune/Loss (Raw)": 0.8309993743896484, "Finetune/Step": 3301, "Finetune/Step Time": 2.872192258015275} +{"Finetune/Learning Rate": 5.363193328008498e-06, "Finetune/Loss": 0.7875136137008667, "Finetune/Loss (Raw)": 0.7746904492378235, "Finetune/Step": 3302, "Finetune/Step Time": 2.875595111399889} +{"Finetune/Learning Rate": 5.357425485154778e-06, "Finetune/Loss": 0.7859939932823181, "Finetune/Loss (Raw)": 0.8044089674949646, "Finetune/Step": 3303, "Finetune/Step Time": 2.8735810592770576} +{"Finetune/Learning Rate": 5.3516596104772715e-06, "Finetune/Loss": 0.7865908741950989, "Finetune/Loss (Raw)": 0.8589997291564941, "Finetune/Step": 3304, "Finetune/Step Time": 2.8718615528196096} +{"Finetune/Learning Rate": 5.345895706420361e-06, "Finetune/Loss": 0.7865563631057739, "Finetune/Loss (Raw)": 0.7843090891838074, "Finetune/Step": 3305, "Finetune/Step Time": 2.869565799832344} +{"Finetune/Learning Rate": 5.340133775427601e-06, "Finetune/Loss": 0.786310076713562, "Finetune/Loss (Raw)": 0.851434588432312, "Finetune/Step": 3306, "Finetune/Step Time": 2.874217452481389} +{"Finetune/Learning Rate": 5.334373819941709e-06, "Finetune/Loss": 0.7864484786987305, "Finetune/Loss (Raw)": 0.8883217573165894, "Finetune/Step": 3307, "Finetune/Step Time": 2.8775605596601963} +{"Finetune/Learning Rate": 5.3286158424045605e-06, "Finetune/Loss": 0.7853667140007019, "Finetune/Loss (Raw)": 0.7622491121292114, "Finetune/Step": 3308, "Finetune/Step Time": 2.879496632143855} +{"Finetune/Learning Rate": 5.3228598452572086e-06, "Finetune/Loss": 0.7865985631942749, "Finetune/Loss (Raw)": 0.8909774422645569, "Finetune/Step": 3309, "Finetune/Step Time": 2.8773694336414337} +{"Finetune/Learning Rate": 5.317105830939843e-06, "Finetune/Loss": 0.7825421690940857, "Finetune/Loss (Raw)": 0.287168949842453, "Finetune/Step": 3310, "Finetune/Step Time": 2.905612960457802} +{"Finetune/Learning Rate": 5.311353801891823e-06, "Finetune/Loss": 0.7826894521713257, "Finetune/Loss (Raw)": 0.8173494935035706, "Finetune/Step": 3311, "Finetune/Step Time": 2.9024002514779568} +{"Finetune/Learning Rate": 5.30560376055168e-06, "Finetune/Loss": 0.7838352918624878, "Finetune/Loss (Raw)": 0.8717352747917175, "Finetune/Step": 3312, "Finetune/Step Time": 2.8990692887455225} +{"Finetune/Learning Rate": 5.299855709357074e-06, "Finetune/Loss": 0.7829947471618652, "Finetune/Loss (Raw)": 0.793607771396637, "Finetune/Step": 3313, "Finetune/Step Time": 2.8980921898037195} +{"Finetune/Learning Rate": 5.294109650744852e-06, "Finetune/Loss": 0.7815811634063721, "Finetune/Loss (Raw)": 0.7484174370765686, "Finetune/Step": 3314, "Finetune/Step Time": 2.900303453207016} +{"Finetune/Learning Rate": 5.288365587150996e-06, "Finetune/Loss": 0.7813209891319275, "Finetune/Loss (Raw)": 0.7544704079627991, "Finetune/Step": 3315, "Finetune/Step Time": 2.8991011660546064} +{"Finetune/Learning Rate": 5.282623521010649e-06, "Finetune/Loss": 0.7811336517333984, "Finetune/Loss (Raw)": 0.8046693801879883, "Finetune/Step": 3316, "Finetune/Step Time": 2.900176538154483} +{"Finetune/Learning Rate": 5.276883454758106e-06, "Finetune/Loss": 0.7811720371246338, "Finetune/Loss (Raw)": 0.8023415803909302, "Finetune/Step": 3317, "Finetune/Step Time": 2.8972103353589773} +{"Finetune/Learning Rate": 5.271145390826812e-06, "Finetune/Loss": 0.7810869216918945, "Finetune/Loss (Raw)": 0.8215486407279968, "Finetune/Step": 3318, "Finetune/Step Time": 2.900378881022334} +{"Finetune/Learning Rate": 5.265409331649376e-06, "Finetune/Loss": 0.7787890434265137, "Finetune/Loss (Raw)": 0.5687669515609741, "Finetune/Step": 3319, "Finetune/Step Time": 2.919835666194558} +{"Finetune/Learning Rate": 5.259675279657534e-06, "Finetune/Loss": 0.7796787619590759, "Finetune/Loss (Raw)": 0.9467901587486267, "Finetune/Step": 3320, "Finetune/Step Time": 2.9193674195557833} +{"Finetune/Learning Rate": 5.253943237282189e-06, "Finetune/Loss": 0.7799967527389526, "Finetune/Loss (Raw)": 0.8537952899932861, "Finetune/Step": 3321, "Finetune/Step Time": 2.9207020960748196} +{"Finetune/Learning Rate": 5.248213206953388e-06, "Finetune/Loss": 0.7748587131500244, "Finetune/Loss (Raw)": 0.15873582661151886, "Finetune/Step": 3322, "Finetune/Step Time": 2.953846665099263} +{"Finetune/Learning Rate": 5.242485191100324e-06, "Finetune/Loss": 0.7742841243743896, "Finetune/Loss (Raw)": 0.7372063398361206, "Finetune/Step": 3323, "Finetune/Step Time": 2.9506207276135683} +{"Finetune/Learning Rate": 5.236759192151336e-06, "Finetune/Loss": 0.7745962142944336, "Finetune/Loss (Raw)": 0.8027001619338989, "Finetune/Step": 3324, "Finetune/Step Time": 2.949692102149129} +{"Finetune/Learning Rate": 5.231035212533907e-06, "Finetune/Loss": 0.7744393348693848, "Finetune/Loss (Raw)": 0.7389650940895081, "Finetune/Step": 3325, "Finetune/Step Time": 2.948765469714999} +{"Finetune/Learning Rate": 5.225313254674664e-06, "Finetune/Loss": 0.7738005518913269, "Finetune/Loss (Raw)": 0.7949340343475342, "Finetune/Step": 3326, "Finetune/Step Time": 2.953097615391016} +{"Finetune/Learning Rate": 5.219593320999381e-06, "Finetune/Loss": 0.7725352048873901, "Finetune/Loss (Raw)": 0.6612520217895508, "Finetune/Step": 3327, "Finetune/Step Time": 2.9519287273287773} +{"Finetune/Learning Rate": 5.213875413932966e-06, "Finetune/Loss": 0.7724862694740295, "Finetune/Loss (Raw)": 0.8155776858329773, "Finetune/Step": 3328, "Finetune/Step Time": 2.9607442282140255} +{"Finetune/Learning Rate": 5.208159535899472e-06, "Finetune/Loss": 0.772453248500824, "Finetune/Loss (Raw)": 0.8598873615264893, "Finetune/Step": 3329, "Finetune/Step Time": 2.9596667643636465} +{"Finetune/Learning Rate": 5.202445689322102e-06, "Finetune/Loss": 0.7739230394363403, "Finetune/Loss (Raw)": 0.835580050945282, "Finetune/Step": 3330, "Finetune/Step Time": 2.935971897095442} +{"Finetune/Learning Rate": 5.196733876623174e-06, "Finetune/Loss": 0.7730740308761597, "Finetune/Loss (Raw)": 0.7385084629058838, "Finetune/Step": 3331, "Finetune/Step Time": 2.935824790969491} +{"Finetune/Learning Rate": 5.191024100224169e-06, "Finetune/Loss": 0.7742973566055298, "Finetune/Loss (Raw)": 0.8457692265510559, "Finetune/Step": 3332, "Finetune/Step Time": 2.9333434849977493} +{"Finetune/Learning Rate": 5.185316362545688e-06, "Finetune/Loss": 0.7744532823562622, "Finetune/Loss (Raw)": 0.8485645651817322, "Finetune/Step": 3333, "Finetune/Step Time": 2.926018189638853} +{"Finetune/Learning Rate": 5.179610666007475e-06, "Finetune/Loss": 0.7736098766326904, "Finetune/Loss (Raw)": 0.7950671315193176, "Finetune/Step": 3334, "Finetune/Step Time": 2.9268484823405743} +{"Finetune/Learning Rate": 5.1739070130284066e-06, "Finetune/Loss": 0.7735339403152466, "Finetune/Loss (Raw)": 0.9005585312843323, "Finetune/Step": 3335, "Finetune/Step Time": 2.9276885390281677} +{"Finetune/Learning Rate": 5.168205406026489e-06, "Finetune/Loss": 0.7731669545173645, "Finetune/Loss (Raw)": 0.7055103778839111, "Finetune/Step": 3336, "Finetune/Step Time": 2.9531935527920723} +{"Finetune/Learning Rate": 5.162505847418877e-06, "Finetune/Loss": 0.7728759050369263, "Finetune/Loss (Raw)": 0.8033773303031921, "Finetune/Step": 3337, "Finetune/Step Time": 2.954886684194207} +{"Finetune/Learning Rate": 5.156808339621835e-06, "Finetune/Loss": 0.7748185396194458, "Finetune/Loss (Raw)": 0.8546016812324524, "Finetune/Step": 3338, "Finetune/Step Time": 2.9376065749675035} +{"Finetune/Learning Rate": 5.151112885050767e-06, "Finetune/Loss": 0.7797015905380249, "Finetune/Loss (Raw)": 0.812492311000824, "Finetune/Step": 3339, "Finetune/Step Time": 2.9016787856817245} +{"Finetune/Learning Rate": 5.145419486120218e-06, "Finetune/Loss": 0.7802361249923706, "Finetune/Loss (Raw)": 0.906674325466156, "Finetune/Step": 3340, "Finetune/Step Time": 2.9005566872656345} +{"Finetune/Learning Rate": 5.139728145243839e-06, "Finetune/Loss": 0.7797129154205322, "Finetune/Loss (Raw)": 0.8240225911140442, "Finetune/Step": 3341, "Finetune/Step Time": 2.9009308461099863} +{"Finetune/Learning Rate": 5.134038864834432e-06, "Finetune/Loss": 0.778857946395874, "Finetune/Loss (Raw)": 0.7393181920051575, "Finetune/Step": 3342, "Finetune/Step Time": 2.9017643332481384} +{"Finetune/Learning Rate": 5.128351647303908e-06, "Finetune/Loss": 0.7824267148971558, "Finetune/Loss (Raw)": 0.8578017950057983, "Finetune/Step": 3343, "Finetune/Step Time": 2.866558799520135} +{"Finetune/Learning Rate": 5.122666495063313e-06, "Finetune/Loss": 0.7820619344711304, "Finetune/Loss (Raw)": 0.7406518459320068, "Finetune/Step": 3344, "Finetune/Step Time": 2.857661882415414} +{"Finetune/Learning Rate": 5.116983410522813e-06, "Finetune/Loss": 0.7822808623313904, "Finetune/Loss (Raw)": 0.7627537846565247, "Finetune/Step": 3345, "Finetune/Step Time": 2.854586658999324} +{"Finetune/Learning Rate": 5.111302396091695e-06, "Finetune/Loss": 0.7827823162078857, "Finetune/Loss (Raw)": 0.7645520567893982, "Finetune/Step": 3346, "Finetune/Step Time": 2.8766643591225147} +{"Finetune/Learning Rate": 5.105623454178383e-06, "Finetune/Loss": 0.7834667563438416, "Finetune/Loss (Raw)": 0.860640823841095, "Finetune/Step": 3347, "Finetune/Step Time": 2.872149705886841} +{"Finetune/Learning Rate": 5.099946587190401e-06, "Finetune/Loss": 0.7837725877761841, "Finetune/Loss (Raw)": 0.9112896919250488, "Finetune/Step": 3348, "Finetune/Step Time": 2.871554972603917} +{"Finetune/Learning Rate": 5.094271797534404e-06, "Finetune/Loss": 0.7831012010574341, "Finetune/Loss (Raw)": 0.7915880680084229, "Finetune/Step": 3349, "Finetune/Step Time": 2.87279761582613} +{"Finetune/Learning Rate": 5.088599087616177e-06, "Finetune/Loss": 0.785122275352478, "Finetune/Loss (Raw)": 0.8675107359886169, "Finetune/Step": 3350, "Finetune/Step Time": 2.849060555920005} +{"Finetune/Learning Rate": 5.082928459840597e-06, "Finetune/Loss": 0.7851510047912598, "Finetune/Loss (Raw)": 0.7468825578689575, "Finetune/Step": 3351, "Finetune/Step Time": 2.8498972840607166} +{"Finetune/Learning Rate": 5.077259916611685e-06, "Finetune/Loss": 0.7837350368499756, "Finetune/Loss (Raw)": 0.507675290107727, "Finetune/Step": 3352, "Finetune/Step Time": 2.872248539701104} +{"Finetune/Learning Rate": 5.071593460332565e-06, "Finetune/Loss": 0.7831094861030579, "Finetune/Loss (Raw)": 0.7351292371749878, "Finetune/Step": 3353, "Finetune/Step Time": 2.871272085234523} +{"Finetune/Learning Rate": 5.065929093405477e-06, "Finetune/Loss": 0.7837926149368286, "Finetune/Loss (Raw)": 0.7949095964431763, "Finetune/Step": 3354, "Finetune/Step Time": 2.87171415053308} +{"Finetune/Learning Rate": 5.060266818231776e-06, "Finetune/Loss": 0.7836441993713379, "Finetune/Loss (Raw)": 0.7339127659797668, "Finetune/Step": 3355, "Finetune/Step Time": 2.872706774622202} +{"Finetune/Learning Rate": 5.054606637211933e-06, "Finetune/Loss": 0.7827574014663696, "Finetune/Loss (Raw)": 0.6866762042045593, "Finetune/Step": 3356, "Finetune/Step Time": 2.876666756346822} +{"Finetune/Learning Rate": 5.048948552745527e-06, "Finetune/Loss": 0.782957136631012, "Finetune/Loss (Raw)": 0.8128024935722351, "Finetune/Step": 3357, "Finetune/Step Time": 2.8765070997178555} +{"Finetune/Learning Rate": 5.0432925672312505e-06, "Finetune/Loss": 0.7844390869140625, "Finetune/Loss (Raw)": 0.7941911816596985, "Finetune/Step": 3358, "Finetune/Step Time": 2.8501667361706495} +{"Finetune/Learning Rate": 5.037638683066903e-06, "Finetune/Loss": 0.7830781936645508, "Finetune/Loss (Raw)": 0.6312652230262756, "Finetune/Step": 3359, "Finetune/Step Time": 2.8506377432495356} +{"Finetune/Learning Rate": 5.031986902649402e-06, "Finetune/Loss": 0.7826899290084839, "Finetune/Loss (Raw)": 0.7543479204177856, "Finetune/Step": 3360, "Finetune/Step Time": 2.850832626223564} +{"Finetune/Learning Rate": 5.026337228374765e-06, "Finetune/Loss": 0.7821638584136963, "Finetune/Loss (Raw)": 0.8205761909484863, "Finetune/Step": 3361, "Finetune/Step Time": 2.8476532120257616} +{"Finetune/Learning Rate": 5.020689662638118e-06, "Finetune/Loss": 0.7810770869255066, "Finetune/Loss (Raw)": 0.7138826847076416, "Finetune/Step": 3362, "Finetune/Step Time": 2.847721790894866} +{"Finetune/Learning Rate": 5.015044207833695e-06, "Finetune/Loss": 0.779861569404602, "Finetune/Loss (Raw)": 0.6863536238670349, "Finetune/Step": 3363, "Finetune/Step Time": 2.845521792769432} +{"Finetune/Learning Rate": 5.0094008663548325e-06, "Finetune/Loss": 0.7800997495651245, "Finetune/Loss (Raw)": 0.88158118724823, "Finetune/Step": 3364, "Finetune/Step Time": 2.8445193246006966} +{"Finetune/Learning Rate": 5.003759640593971e-06, "Finetune/Loss": 0.7804239988327026, "Finetune/Loss (Raw)": 0.8047304749488831, "Finetune/Step": 3365, "Finetune/Step Time": 2.846776569262147} +{"Finetune/Learning Rate": 4.9981205329426596e-06, "Finetune/Loss": 0.7799912691116333, "Finetune/Loss (Raw)": 0.8060238361358643, "Finetune/Step": 3366, "Finetune/Step Time": 2.8449552450329065} +{"Finetune/Learning Rate": 4.992483545791539e-06, "Finetune/Loss": 0.7806433439254761, "Finetune/Loss (Raw)": 0.767044186592102, "Finetune/Step": 3367, "Finetune/Step Time": 2.8429814241826534} +{"Finetune/Learning Rate": 4.98684868153037e-06, "Finetune/Loss": 0.780898928642273, "Finetune/Loss (Raw)": 0.854664146900177, "Finetune/Step": 3368, "Finetune/Step Time": 2.841136323288083} +{"Finetune/Learning Rate": 4.981215942547985e-06, "Finetune/Loss": 0.7807300090789795, "Finetune/Loss (Raw)": 0.832813024520874, "Finetune/Step": 3369, "Finetune/Step Time": 2.846459647640586} +{"Finetune/Learning Rate": 4.9755853312323425e-06, "Finetune/Loss": 0.7798627614974976, "Finetune/Loss (Raw)": 0.7608112692832947, "Finetune/Step": 3370, "Finetune/Step Time": 2.846791474148631} +{"Finetune/Learning Rate": 4.969956849970483e-06, "Finetune/Loss": 0.7803270816802979, "Finetune/Loss (Raw)": 0.8876499533653259, "Finetune/Step": 3371, "Finetune/Step Time": 2.8448955677449703} +{"Finetune/Learning Rate": 4.9643305011485506e-06, "Finetune/Loss": 0.7810193300247192, "Finetune/Loss (Raw)": 0.8787983059883118, "Finetune/Step": 3372, "Finetune/Step Time": 2.8459212463349104} +{"Finetune/Learning Rate": 4.9587062871517825e-06, "Finetune/Loss": 0.7810389995574951, "Finetune/Loss (Raw)": 0.9185152649879456, "Finetune/Step": 3373, "Finetune/Step Time": 2.8504899833351374} +{"Finetune/Learning Rate": 4.953084210364508e-06, "Finetune/Loss": 0.7812662124633789, "Finetune/Loss (Raw)": 0.8395213484764099, "Finetune/Step": 3374, "Finetune/Step Time": 2.8492538817226887} +{"Finetune/Learning Rate": 4.947464273170166e-06, "Finetune/Loss": 0.7809256911277771, "Finetune/Loss (Raw)": 0.7634952068328857, "Finetune/Step": 3375, "Finetune/Step Time": 2.8464285526424646} +{"Finetune/Learning Rate": 4.941846477951264e-06, "Finetune/Loss": 0.7822292447090149, "Finetune/Loss (Raw)": 0.844429612159729, "Finetune/Step": 3376, "Finetune/Step Time": 2.8422942347824574} +{"Finetune/Learning Rate": 4.936230827089416e-06, "Finetune/Loss": 0.7817348837852478, "Finetune/Loss (Raw)": 0.7319287657737732, "Finetune/Step": 3377, "Finetune/Step Time": 2.8437272794544697} +{"Finetune/Learning Rate": 4.9306173229653344e-06, "Finetune/Loss": 0.7805660963058472, "Finetune/Loss (Raw)": 0.6440079808235168, "Finetune/Step": 3378, "Finetune/Step Time": 2.867514155805111} +{"Finetune/Learning Rate": 4.925005967958797e-06, "Finetune/Loss": 0.7814978361129761, "Finetune/Loss (Raw)": 0.8643994331359863, "Finetune/Step": 3379, "Finetune/Step Time": 2.8680400270968676} +{"Finetune/Learning Rate": 4.9193967644486975e-06, "Finetune/Loss": 0.7818328738212585, "Finetune/Loss (Raw)": 0.8026906847953796, "Finetune/Step": 3380, "Finetune/Step Time": 2.8724679481238127} +{"Finetune/Learning Rate": 4.913789714813001e-06, "Finetune/Loss": 0.7811763286590576, "Finetune/Loss (Raw)": 0.7587873339653015, "Finetune/Step": 3381, "Finetune/Step Time": 2.874442821368575} +{"Finetune/Learning Rate": 4.9081848214287644e-06, "Finetune/Loss": 0.7813405990600586, "Finetune/Loss (Raw)": 0.782524049282074, "Finetune/Step": 3382, "Finetune/Step Time": 2.8733312785625458} +{"Finetune/Learning Rate": 4.902582086672131e-06, "Finetune/Loss": 0.7810536623001099, "Finetune/Loss (Raw)": 0.7484095692634583, "Finetune/Step": 3383, "Finetune/Step Time": 2.8742744345217943} +{"Finetune/Learning Rate": 4.896981512918325e-06, "Finetune/Loss": 0.7830866575241089, "Finetune/Loss (Raw)": 0.7450600862503052, "Finetune/Step": 3384, "Finetune/Step Time": 2.8633986096829176} +{"Finetune/Learning Rate": 4.891383102541662e-06, "Finetune/Loss": 0.7827622890472412, "Finetune/Loss (Raw)": 0.8088350296020508, "Finetune/Step": 3385, "Finetune/Step Time": 2.863326435908675} +{"Finetune/Learning Rate": 4.885786857915531e-06, "Finetune/Loss": 0.782860279083252, "Finetune/Loss (Raw)": 0.8534970283508301, "Finetune/Step": 3386, "Finetune/Step Time": 2.860300349071622} +{"Finetune/Learning Rate": 4.880192781412407e-06, "Finetune/Loss": 0.7828267812728882, "Finetune/Loss (Raw)": 0.8571096062660217, "Finetune/Step": 3387, "Finetune/Step Time": 2.8633146602660418} +{"Finetune/Learning Rate": 4.874600875403854e-06, "Finetune/Loss": 0.7836530208587646, "Finetune/Loss (Raw)": 0.8039780259132385, "Finetune/Step": 3388, "Finetune/Step Time": 2.8618877697736025} +{"Finetune/Learning Rate": 4.8690111422605036e-06, "Finetune/Loss": 0.7822118997573853, "Finetune/Loss (Raw)": 0.6346091628074646, "Finetune/Step": 3389, "Finetune/Step Time": 2.863665597513318} +{"Finetune/Learning Rate": 4.863423584352072e-06, "Finetune/Loss": 0.780422568321228, "Finetune/Loss (Raw)": 0.7212090492248535, "Finetune/Step": 3390, "Finetune/Step Time": 2.86362892575562} +{"Finetune/Learning Rate": 4.857838204047351e-06, "Finetune/Loss": 0.7806165218353271, "Finetune/Loss (Raw)": 0.7936000823974609, "Finetune/Step": 3391, "Finetune/Step Time": 2.86428564786911} +{"Finetune/Learning Rate": 4.8522550037142136e-06, "Finetune/Loss": 0.7806671261787415, "Finetune/Loss (Raw)": 0.8282243013381958, "Finetune/Step": 3392, "Finetune/Step Time": 2.8679814264178276} +{"Finetune/Learning Rate": 4.8466739857196024e-06, "Finetune/Loss": 0.7816002368927002, "Finetune/Loss (Raw)": 0.8576633930206299, "Finetune/Step": 3393, "Finetune/Step Time": 2.8679143395274878} +{"Finetune/Learning Rate": 4.841095152429538e-06, "Finetune/Loss": 0.7804087400436401, "Finetune/Loss (Raw)": 0.6797816753387451, "Finetune/Step": 3394, "Finetune/Step Time": 2.868356980383396} +{"Finetune/Learning Rate": 4.835518506209113e-06, "Finetune/Loss": 0.7810944318771362, "Finetune/Loss (Raw)": 0.8063662648200989, "Finetune/Step": 3395, "Finetune/Step Time": 2.869692685082555} +{"Finetune/Learning Rate": 4.829944049422504e-06, "Finetune/Loss": 0.7826575040817261, "Finetune/Loss (Raw)": 0.926443338394165, "Finetune/Step": 3396, "Finetune/Step Time": 2.8504776135087013} +{"Finetune/Learning Rate": 4.824371784432937e-06, "Finetune/Loss": 0.7842491269111633, "Finetune/Loss (Raw)": 0.7587728500366211, "Finetune/Step": 3397, "Finetune/Step Time": 2.823886498808861} +{"Finetune/Learning Rate": 4.8188017136027335e-06, "Finetune/Loss": 0.7842310070991516, "Finetune/Loss (Raw)": 0.8469911217689514, "Finetune/Step": 3398, "Finetune/Step Time": 2.8228311762213707} +{"Finetune/Learning Rate": 4.813233839293265e-06, "Finetune/Loss": 0.7826626300811768, "Finetune/Loss (Raw)": 0.6884565949440002, "Finetune/Step": 3399, "Finetune/Step Time": 2.8220610599964857} +{"Finetune/Learning Rate": 4.8076681638649845e-06, "Finetune/Loss": 0.7820972800254822, "Finetune/Loss (Raw)": 0.7969635128974915, "Finetune/Step": 3400, "Finetune/Step Time": 2.8064835257828236} +{"Finetune/Learning Rate": 4.802104689677406e-06, "Finetune/Loss": 0.7818993926048279, "Finetune/Loss (Raw)": 0.7795719504356384, "Finetune/Step": 3401, "Finetune/Step Time": 2.807288834825158} +{"Finetune/Learning Rate": 4.796543419089109e-06, "Finetune/Loss": 0.7821604609489441, "Finetune/Loss (Raw)": 0.7459763884544373, "Finetune/Step": 3402, "Finetune/Step Time": 2.8053413070738316} +{"Finetune/Learning Rate": 4.790984354457755e-06, "Finetune/Loss": 0.7838788032531738, "Finetune/Loss (Raw)": 0.7475247979164124, "Finetune/Step": 3403, "Finetune/Step Time": 2.7810106612741947} +{"Finetune/Learning Rate": 4.7854274981400454e-06, "Finetune/Loss": 0.7837961912155151, "Finetune/Loss (Raw)": 0.8145257234573364, "Finetune/Step": 3404, "Finetune/Step Time": 2.7877360936254263} +{"Finetune/Learning Rate": 4.779872852491757e-06, "Finetune/Loss": 0.7837656736373901, "Finetune/Loss (Raw)": 0.7490909695625305, "Finetune/Step": 3405, "Finetune/Step Time": 2.7881701439619064} +{"Finetune/Learning Rate": 4.774320419867742e-06, "Finetune/Loss": 0.7832133173942566, "Finetune/Loss (Raw)": 0.8009143471717834, "Finetune/Step": 3406, "Finetune/Step Time": 2.7859983574599028} +{"Finetune/Learning Rate": 4.7687702026218875e-06, "Finetune/Loss": 0.7825697660446167, "Finetune/Loss (Raw)": 0.7739462852478027, "Finetune/Step": 3407, "Finetune/Step Time": 2.7825010921806097} +{"Finetune/Learning Rate": 4.763222203107167e-06, "Finetune/Loss": 0.7813413143157959, "Finetune/Loss (Raw)": 0.7614704370498657, "Finetune/Step": 3408, "Finetune/Step Time": 2.785509580746293} +{"Finetune/Learning Rate": 4.7576764236756e-06, "Finetune/Loss": 0.7816250920295715, "Finetune/Loss (Raw)": 0.829200804233551, "Finetune/Step": 3409, "Finetune/Step Time": 2.7830458637326956} +{"Finetune/Learning Rate": 4.7521328666782695e-06, "Finetune/Loss": 0.7818224430084229, "Finetune/Loss (Raw)": 0.8437817692756653, "Finetune/Step": 3410, "Finetune/Step Time": 2.7820095364004374} +{"Finetune/Learning Rate": 4.746591534465312e-06, "Finetune/Loss": 0.781046986579895, "Finetune/Loss (Raw)": 0.763258695602417, "Finetune/Step": 3411, "Finetune/Step Time": 2.778031734749675} +{"Finetune/Learning Rate": 4.741052429385926e-06, "Finetune/Loss": 0.780060887336731, "Finetune/Loss (Raw)": 0.709534764289856, "Finetune/Step": 3412, "Finetune/Step Time": 2.7809784654527903} +{"Finetune/Learning Rate": 4.735515553788361e-06, "Finetune/Loss": 0.7802646160125732, "Finetune/Loss (Raw)": 0.8872367143630981, "Finetune/Step": 3413, "Finetune/Step Time": 2.78115538880229} +{"Finetune/Learning Rate": 4.7299809100199265e-06, "Finetune/Loss": 0.7800987362861633, "Finetune/Loss (Raw)": 0.7259359955787659, "Finetune/Step": 3414, "Finetune/Step Time": 2.7758783902972937} +{"Finetune/Learning Rate": 4.724448500426978e-06, "Finetune/Loss": 0.7805048227310181, "Finetune/Loss (Raw)": 0.9030199646949768, "Finetune/Step": 3415, "Finetune/Step Time": 2.7760703153908253} +{"Finetune/Learning Rate": 4.718918327354938e-06, "Finetune/Loss": 0.7804664373397827, "Finetune/Loss (Raw)": 0.7724015712738037, "Finetune/Step": 3416, "Finetune/Step Time": 2.799893582239747} +{"Finetune/Learning Rate": 4.713390393148265e-06, "Finetune/Loss": 0.7792441844940186, "Finetune/Loss (Raw)": 0.6865450143814087, "Finetune/Step": 3417, "Finetune/Step Time": 2.7997013069689274} +{"Finetune/Learning Rate": 4.707864700150478e-06, "Finetune/Loss": 0.7792922258377075, "Finetune/Loss (Raw)": 0.8199865221977234, "Finetune/Step": 3418, "Finetune/Step Time": 2.7974536195397377} +{"Finetune/Learning Rate": 4.702341250704141e-06, "Finetune/Loss": 0.7808254361152649, "Finetune/Loss (Raw)": 0.865866482257843, "Finetune/Step": 3419, "Finetune/Step Time": 2.776766525581479} +{"Finetune/Learning Rate": 4.696820047150872e-06, "Finetune/Loss": 0.7800923585891724, "Finetune/Loss (Raw)": 0.6611152291297913, "Finetune/Step": 3420, "Finetune/Step Time": 2.7739499378949404} +{"Finetune/Learning Rate": 4.69130109183133e-06, "Finetune/Loss": 0.781124472618103, "Finetune/Loss (Raw)": 0.8690767288208008, "Finetune/Step": 3421, "Finetune/Step Time": 2.7719052117317915} +{"Finetune/Learning Rate": 4.685784387085227e-06, "Finetune/Loss": 0.783501148223877, "Finetune/Loss (Raw)": 0.8903704285621643, "Finetune/Step": 3422, "Finetune/Step Time": 2.748962190002203} +{"Finetune/Learning Rate": 4.6802699352513145e-06, "Finetune/Loss": 0.7848184704780579, "Finetune/Loss (Raw)": 0.9183221459388733, "Finetune/Step": 3423, "Finetune/Step Time": 2.7487046346068382} +{"Finetune/Learning Rate": 4.674757738667405e-06, "Finetune/Loss": 0.7842627763748169, "Finetune/Loss (Raw)": 0.7348262071609497, "Finetune/Step": 3424, "Finetune/Step Time": 2.7477387078106403} +{"Finetune/Learning Rate": 4.669247799670325e-06, "Finetune/Loss": 0.784543514251709, "Finetune/Loss (Raw)": 0.8382102847099304, "Finetune/Step": 3425, "Finetune/Step Time": 2.7450263742357492} +{"Finetune/Learning Rate": 4.663740120595976e-06, "Finetune/Loss": 0.7842996120452881, "Finetune/Loss (Raw)": 0.8185157775878906, "Finetune/Step": 3426, "Finetune/Step Time": 2.74422300606966} +{"Finetune/Learning Rate": 4.658234703779283e-06, "Finetune/Loss": 0.7798938751220703, "Finetune/Loss (Raw)": 0.22108641266822815, "Finetune/Step": 3427, "Finetune/Step Time": 2.7765533588826656} +{"Finetune/Learning Rate": 4.652731551554215e-06, "Finetune/Loss": 0.7796204686164856, "Finetune/Loss (Raw)": 0.6079674959182739, "Finetune/Step": 3428, "Finetune/Step Time": 2.774007311090827} +{"Finetune/Learning Rate": 4.647230666253782e-06, "Finetune/Loss": 0.7788594961166382, "Finetune/Loss (Raw)": 0.7336024641990662, "Finetune/Step": 3429, "Finetune/Step Time": 2.7728853970766068} +{"Finetune/Learning Rate": 4.641732050210032e-06, "Finetune/Loss": 0.779446005821228, "Finetune/Loss (Raw)": 0.849768877029419, "Finetune/Step": 3430, "Finetune/Step Time": 2.774109922349453} +{"Finetune/Learning Rate": 4.63623570575406e-06, "Finetune/Loss": 0.7796989679336548, "Finetune/Loss (Raw)": 0.8367829918861389, "Finetune/Step": 3431, "Finetune/Step Time": 2.7710419315844774} +{"Finetune/Learning Rate": 4.630741635215981e-06, "Finetune/Loss": 0.7796320915222168, "Finetune/Loss (Raw)": 0.8504339456558228, "Finetune/Step": 3432, "Finetune/Step Time": 2.7705160807818174} +{"Finetune/Learning Rate": 4.625249840924954e-06, "Finetune/Loss": 0.7804504632949829, "Finetune/Loss (Raw)": 0.8890649676322937, "Finetune/Step": 3433, "Finetune/Step Time": 2.771090293303132} +{"Finetune/Learning Rate": 4.6197603252091834e-06, "Finetune/Loss": 0.78009432554245, "Finetune/Loss (Raw)": 0.8058484196662903, "Finetune/Step": 3434, "Finetune/Step Time": 2.7669860795140266} +{"Finetune/Learning Rate": 4.6142730903958876e-06, "Finetune/Loss": 0.779118537902832, "Finetune/Loss (Raw)": 0.7634201049804688, "Finetune/Step": 3435, "Finetune/Step Time": 2.7616402059793472} +{"Finetune/Learning Rate": 4.608788138811336e-06, "Finetune/Loss": 0.7791182994842529, "Finetune/Loss (Raw)": 0.7622194886207581, "Finetune/Step": 3436, "Finetune/Step Time": 2.759803008288145} +{"Finetune/Learning Rate": 4.603305472780822e-06, "Finetune/Loss": 0.7752233743667603, "Finetune/Loss (Raw)": 0.3924311101436615, "Finetune/Step": 3437, "Finetune/Step Time": 2.7925969567149878} +{"Finetune/Learning Rate": 4.597825094628669e-06, "Finetune/Loss": 0.7794536352157593, "Finetune/Loss (Raw)": 0.8286420702934265, "Finetune/Step": 3438, "Finetune/Step Time": 2.7649709694087505} +{"Finetune/Learning Rate": 4.5923470066782325e-06, "Finetune/Loss": 0.7792787551879883, "Finetune/Loss (Raw)": 0.7949594855308533, "Finetune/Step": 3439, "Finetune/Step Time": 2.7647589165717363} +{"Finetune/Learning Rate": 4.586871211251893e-06, "Finetune/Loss": 0.7786935567855835, "Finetune/Loss (Raw)": 0.7968320846557617, "Finetune/Step": 3440, "Finetune/Step Time": 2.775497203692794} +{"Finetune/Learning Rate": 4.581397710671074e-06, "Finetune/Loss": 0.7788089513778687, "Finetune/Loss (Raw)": 0.8083761930465698, "Finetune/Step": 3441, "Finetune/Step Time": 2.7961775846779346} +{"Finetune/Learning Rate": 4.575926507256204e-06, "Finetune/Loss": 0.77961665391922, "Finetune/Loss (Raw)": 0.8518063426017761, "Finetune/Step": 3442, "Finetune/Step Time": 2.795926770195365} +{"Finetune/Learning Rate": 4.57045760332675e-06, "Finetune/Loss": 0.7801942825317383, "Finetune/Loss (Raw)": 0.8284006714820862, "Finetune/Step": 3443, "Finetune/Step Time": 2.7953913751989603} +{"Finetune/Learning Rate": 4.564991001201209e-06, "Finetune/Loss": 0.7805957794189453, "Finetune/Loss (Raw)": 0.8560651540756226, "Finetune/Step": 3444, "Finetune/Step Time": 2.7941567432135344} +{"Finetune/Learning Rate": 4.559526703197091e-06, "Finetune/Loss": 0.7805894613265991, "Finetune/Loss (Raw)": 0.8015248775482178, "Finetune/Step": 3445, "Finetune/Step Time": 2.796539820730686} +{"Finetune/Learning Rate": 4.554064711630938e-06, "Finetune/Loss": 0.7803961038589478, "Finetune/Loss (Raw)": 0.7968060970306396, "Finetune/Step": 3446, "Finetune/Step Time": 2.7946474347263575} +{"Finetune/Learning Rate": 4.548605028818307e-06, "Finetune/Loss": 0.7818547487258911, "Finetune/Loss (Raw)": 0.7554721236228943, "Finetune/Step": 3447, "Finetune/Step Time": 2.773949759081006} +{"Finetune/Learning Rate": 4.543147657073781e-06, "Finetune/Loss": 0.7802470922470093, "Finetune/Loss (Raw)": 0.7410128712654114, "Finetune/Step": 3448, "Finetune/Step Time": 2.774808080866933} +{"Finetune/Learning Rate": 4.537692598710962e-06, "Finetune/Loss": 0.7784948348999023, "Finetune/Loss (Raw)": 0.6295097470283508, "Finetune/Step": 3449, "Finetune/Step Time": 2.7976186349987984} +{"Finetune/Learning Rate": 4.53223985604247e-06, "Finetune/Loss": 0.7829524278640747, "Finetune/Loss (Raw)": 0.7292945384979248, "Finetune/Step": 3450, "Finetune/Step Time": 2.7660427317023277} +{"Finetune/Learning Rate": 4.526789431379943e-06, "Finetune/Loss": 0.7838712930679321, "Finetune/Loss (Raw)": 0.8548270463943481, "Finetune/Step": 3451, "Finetune/Step Time": 2.7654045820236206} +{"Finetune/Learning Rate": 4.521341327034046e-06, "Finetune/Loss": 0.7792363166809082, "Finetune/Loss (Raw)": 0.2094230055809021, "Finetune/Step": 3452, "Finetune/Step Time": 2.79609602317214} +{"Finetune/Learning Rate": 4.51589554531444e-06, "Finetune/Loss": 0.7775263786315918, "Finetune/Loss (Raw)": 0.5200904011726379, "Finetune/Step": 3453, "Finetune/Step Time": 2.8181109074503183} +{"Finetune/Learning Rate": 4.5104520885298235e-06, "Finetune/Loss": 0.7771680355072021, "Finetune/Loss (Raw)": 0.7490704655647278, "Finetune/Step": 3454, "Finetune/Step Time": 2.8153799772262573} +{"Finetune/Learning Rate": 4.505010958987896e-06, "Finetune/Loss": 0.7784018516540527, "Finetune/Loss (Raw)": 0.819181501865387, "Finetune/Step": 3455, "Finetune/Step Time": 2.821190332993865} +{"Finetune/Learning Rate": 4.499572158995371e-06, "Finetune/Loss": 0.7784342765808105, "Finetune/Loss (Raw)": 0.8197299242019653, "Finetune/Step": 3456, "Finetune/Step Time": 2.814458819106221} +{"Finetune/Learning Rate": 4.49413569085798e-06, "Finetune/Loss": 0.7782299518585205, "Finetune/Loss (Raw)": 0.833730936050415, "Finetune/Step": 3457, "Finetune/Step Time": 2.816371437162161} +{"Finetune/Learning Rate": 4.4887015568804594e-06, "Finetune/Loss": 0.778281569480896, "Finetune/Loss (Raw)": 0.8421852588653564, "Finetune/Step": 3458, "Finetune/Step Time": 2.82164522819221} +{"Finetune/Learning Rate": 4.483269759366569e-06, "Finetune/Loss": 0.778919517993927, "Finetune/Loss (Raw)": 0.8201667666435242, "Finetune/Step": 3459, "Finetune/Step Time": 2.8212619815021753} +{"Finetune/Learning Rate": 4.477840300619059e-06, "Finetune/Loss": 0.7790601849555969, "Finetune/Loss (Raw)": 0.8637762069702148, "Finetune/Step": 3460, "Finetune/Step Time": 2.8193602338433266} +{"Finetune/Learning Rate": 4.472413182939697e-06, "Finetune/Loss": 0.7779834270477295, "Finetune/Loss (Raw)": 0.7107330560684204, "Finetune/Step": 3461, "Finetune/Step Time": 2.8213071171194315} +{"Finetune/Learning Rate": 4.46698840862927e-06, "Finetune/Loss": 0.7765963077545166, "Finetune/Loss (Raw)": 0.6175186038017273, "Finetune/Step": 3462, "Finetune/Step Time": 2.8412403035908937} +{"Finetune/Learning Rate": 4.4615659799875465e-06, "Finetune/Loss": 0.7730929851531982, "Finetune/Loss (Raw)": 0.45213523507118225, "Finetune/Step": 3463, "Finetune/Step Time": 2.8717058952897787} +{"Finetune/Learning Rate": 4.456145899313325e-06, "Finetune/Loss": 0.7738367319107056, "Finetune/Loss (Raw)": 0.8007104396820068, "Finetune/Step": 3464, "Finetune/Step Time": 2.8502488136291504} +{"Finetune/Learning Rate": 4.450728168904396e-06, "Finetune/Loss": 0.7739744186401367, "Finetune/Loss (Raw)": 0.8210001587867737, "Finetune/Step": 3465, "Finetune/Step Time": 2.8480483889579773} +{"Finetune/Learning Rate": 4.445312791057553e-06, "Finetune/Loss": 0.7723469734191895, "Finetune/Loss (Raw)": 0.6462904810905457, "Finetune/Step": 3466, "Finetune/Step Time": 2.844744762405753} +{"Finetune/Learning Rate": 4.439899768068598e-06, "Finetune/Loss": 0.7730083465576172, "Finetune/Loss (Raw)": 0.8971508145332336, "Finetune/Step": 3467, "Finetune/Step Time": 2.840696319937706} +{"Finetune/Learning Rate": 4.434489102232327e-06, "Finetune/Loss": 0.7720673680305481, "Finetune/Loss (Raw)": 0.7862245440483093, "Finetune/Step": 3468, "Finetune/Step Time": 2.842944188043475} +{"Finetune/Learning Rate": 4.429080795842551e-06, "Finetune/Loss": 0.7722940444946289, "Finetune/Loss (Raw)": 0.8530418872833252, "Finetune/Step": 3469, "Finetune/Step Time": 2.8428684156388044} +{"Finetune/Learning Rate": 4.423674851192061e-06, "Finetune/Loss": 0.7721259593963623, "Finetune/Loss (Raw)": 0.7177963256835938, "Finetune/Step": 3470, "Finetune/Step Time": 2.8400522228330374} +{"Finetune/Learning Rate": 4.418271270572657e-06, "Finetune/Loss": 0.7716569900512695, "Finetune/Loss (Raw)": 0.7977784872055054, "Finetune/Step": 3471, "Finetune/Step Time": 2.841400183737278} +{"Finetune/Learning Rate": 4.412870056275145e-06, "Finetune/Loss": 0.7719054222106934, "Finetune/Loss (Raw)": 0.7724534869194031, "Finetune/Step": 3472, "Finetune/Step Time": 2.843944985419512} +{"Finetune/Learning Rate": 4.407471210589314e-06, "Finetune/Loss": 0.77196204662323, "Finetune/Loss (Raw)": 0.7699989676475525, "Finetune/Step": 3473, "Finetune/Step Time": 2.841654412448406} +{"Finetune/Learning Rate": 4.402074735803955e-06, "Finetune/Loss": 0.7728764414787292, "Finetune/Loss (Raw)": 0.8815919756889343, "Finetune/Step": 3474, "Finetune/Step Time": 2.8168799243867397} +{"Finetune/Learning Rate": 4.3966806342068535e-06, "Finetune/Loss": 0.7722159624099731, "Finetune/Loss (Raw)": 0.7761046290397644, "Finetune/Step": 3475, "Finetune/Step Time": 2.821982705965638} +{"Finetune/Learning Rate": 4.391288908084788e-06, "Finetune/Loss": 0.7715521454811096, "Finetune/Loss (Raw)": 0.8263158202171326, "Finetune/Step": 3476, "Finetune/Step Time": 2.8242634888738394} +{"Finetune/Learning Rate": 4.385899559723531e-06, "Finetune/Loss": 0.7711181640625, "Finetune/Loss (Raw)": 0.7360431551933289, "Finetune/Step": 3477, "Finetune/Step Time": 2.8177009131759405} +{"Finetune/Learning Rate": 4.3805125914078475e-06, "Finetune/Loss": 0.7705978155136108, "Finetune/Loss (Raw)": 0.8009021878242493, "Finetune/Step": 3478, "Finetune/Step Time": 2.8165846038609743} +{"Finetune/Learning Rate": 4.375128005421486e-06, "Finetune/Loss": 0.7708097100257874, "Finetune/Loss (Raw)": 0.7740041613578796, "Finetune/Step": 3479, "Finetune/Step Time": 2.8172077536582947} +{"Finetune/Learning Rate": 4.369745804047206e-06, "Finetune/Loss": 0.7729842662811279, "Finetune/Loss (Raw)": 0.7860242128372192, "Finetune/Step": 3480, "Finetune/Step Time": 2.7955528497695923} +{"Finetune/Learning Rate": 4.364365989566725e-06, "Finetune/Loss": 0.7734173536300659, "Finetune/Loss (Raw)": 0.790562629699707, "Finetune/Step": 3481, "Finetune/Step Time": 2.796020893380046} +{"Finetune/Learning Rate": 4.358988564260777e-06, "Finetune/Loss": 0.7734596133232117, "Finetune/Loss (Raw)": 0.8003150820732117, "Finetune/Step": 3482, "Finetune/Step Time": 2.7944360580295324} +{"Finetune/Learning Rate": 4.353613530409067e-06, "Finetune/Loss": 0.7735437154769897, "Finetune/Loss (Raw)": 0.7446835041046143, "Finetune/Step": 3483, "Finetune/Step Time": 2.792202653363347} +{"Finetune/Learning Rate": 4.348240890290289e-06, "Finetune/Loss": 0.7734119296073914, "Finetune/Loss (Raw)": 0.6698048114776611, "Finetune/Step": 3484, "Finetune/Step Time": 2.811802649870515} +{"Finetune/Learning Rate": 4.342870646182128e-06, "Finetune/Loss": 0.7738907337188721, "Finetune/Loss (Raw)": 0.8740893006324768, "Finetune/Step": 3485, "Finetune/Step Time": 2.814208472147584} +{"Finetune/Learning Rate": 4.337502800361242e-06, "Finetune/Loss": 0.7746418118476868, "Finetune/Loss (Raw)": 0.8903275728225708, "Finetune/Step": 3486, "Finetune/Step Time": 2.81486283428967} +{"Finetune/Learning Rate": 4.332137355103291e-06, "Finetune/Loss": 0.7762391567230225, "Finetune/Loss (Raw)": 0.8357224464416504, "Finetune/Step": 3487, "Finetune/Step Time": 2.8140636701136827} +{"Finetune/Learning Rate": 4.326774312682894e-06, "Finetune/Loss": 0.776193380355835, "Finetune/Loss (Raw)": 0.7484946250915527, "Finetune/Step": 3488, "Finetune/Step Time": 2.8158080764114857} +{"Finetune/Learning Rate": 4.321413675373664e-06, "Finetune/Loss": 0.7757581472396851, "Finetune/Loss (Raw)": 0.7648608684539795, "Finetune/Step": 3489, "Finetune/Step Time": 2.8152394257485867} +{"Finetune/Learning Rate": 4.3160554454482025e-06, "Finetune/Loss": 0.776070237159729, "Finetune/Loss (Raw)": 0.7538382411003113, "Finetune/Step": 3490, "Finetune/Step Time": 2.8166641425341368} +{"Finetune/Learning Rate": 4.31069962517807e-06, "Finetune/Loss": 0.7776128053665161, "Finetune/Loss (Raw)": 0.8837978839874268, "Finetune/Step": 3491, "Finetune/Step Time": 2.815970454365015} +{"Finetune/Learning Rate": 4.3053462168338235e-06, "Finetune/Loss": 0.775670051574707, "Finetune/Loss (Raw)": 0.6329134702682495, "Finetune/Step": 3492, "Finetune/Step Time": 2.8399210926145315} +{"Finetune/Learning Rate": 4.299995222684988e-06, "Finetune/Loss": 0.7755383253097534, "Finetune/Loss (Raw)": 0.7878674864768982, "Finetune/Step": 3493, "Finetune/Step Time": 2.838645737618208} +{"Finetune/Learning Rate": 4.29464664500007e-06, "Finetune/Loss": 0.7760339975357056, "Finetune/Loss (Raw)": 0.8694751858711243, "Finetune/Step": 3494, "Finetune/Step Time": 2.8375518191605806} +{"Finetune/Learning Rate": 4.289300486046546e-06, "Finetune/Loss": 0.7758893966674805, "Finetune/Loss (Raw)": 0.7485288381576538, "Finetune/Step": 3495, "Finetune/Step Time": 2.8382899053394794} +{"Finetune/Learning Rate": 4.283956748090869e-06, "Finetune/Loss": 0.7748774290084839, "Finetune/Loss (Raw)": 0.7251269817352295, "Finetune/Step": 3496, "Finetune/Step Time": 2.8473404329270124} +{"Finetune/Learning Rate": 4.278615433398476e-06, "Finetune/Loss": 0.7746523022651672, "Finetune/Loss (Raw)": 0.8040013313293457, "Finetune/Step": 3497, "Finetune/Step Time": 2.8442961182445288} +{"Finetune/Learning Rate": 4.273276544233759e-06, "Finetune/Loss": 0.7747147083282471, "Finetune/Loss (Raw)": 0.7687973976135254, "Finetune/Step": 3498, "Finetune/Step Time": 2.8468803260475397} +{"Finetune/Learning Rate": 4.267940082860088e-06, "Finetune/Loss": 0.7749476432800293, "Finetune/Loss (Raw)": 0.9174643754959106, "Finetune/Step": 3499, "Finetune/Step Time": 2.8492670096457005} +{"Finetune/Learning Rate": 4.262606051539818e-06, "Finetune/Loss": 0.7743567228317261, "Finetune/Loss (Raw)": 0.8031592965126038, "Finetune/Step": 3500, "Finetune/Step Time": 2.8492605816572905} +{"Finetune/Learning Rate": 4.257274452534248e-06, "Finetune/Loss": 0.7734265327453613, "Finetune/Loss (Raw)": 0.7994502186775208, "Finetune/Step": 3501, "Finetune/Step Time": 2.845313536003232} +{"Finetune/Learning Rate": 4.251945288103668e-06, "Finetune/Loss": 0.773105263710022, "Finetune/Loss (Raw)": 0.7984015345573425, "Finetune/Step": 3502, "Finetune/Step Time": 2.8444673512130976} +{"Finetune/Learning Rate": 4.2466185605073275e-06, "Finetune/Loss": 0.7726635932922363, "Finetune/Loss (Raw)": 0.7069631814956665, "Finetune/Step": 3503, "Finetune/Step Time": 2.848361177369952} +{"Finetune/Learning Rate": 4.241294272003441e-06, "Finetune/Loss": 0.7722622752189636, "Finetune/Loss (Raw)": 0.7930639982223511, "Finetune/Step": 3504, "Finetune/Step Time": 2.8505989592522383} +{"Finetune/Learning Rate": 4.235972424849191e-06, "Finetune/Loss": 0.7734742760658264, "Finetune/Loss (Raw)": 0.8870618343353271, "Finetune/Step": 3505, "Finetune/Step Time": 2.849196195602417} +{"Finetune/Learning Rate": 4.230653021300726e-06, "Finetune/Loss": 0.775017261505127, "Finetune/Loss (Raw)": 0.8415101170539856, "Finetune/Step": 3506, "Finetune/Step Time": 2.8263579476624727} +{"Finetune/Learning Rate": 4.225336063613155e-06, "Finetune/Loss": 0.7739505767822266, "Finetune/Loss (Raw)": 0.7278649210929871, "Finetune/Step": 3507, "Finetune/Step Time": 2.8321077674627304} +{"Finetune/Learning Rate": 4.220021554040558e-06, "Finetune/Loss": 0.7740522623062134, "Finetune/Loss (Raw)": 0.8157029747962952, "Finetune/Step": 3508, "Finetune/Step Time": 2.8291299622505903} +{"Finetune/Learning Rate": 4.214709494835963e-06, "Finetune/Loss": 0.7738422155380249, "Finetune/Loss (Raw)": 0.7318994402885437, "Finetune/Step": 3509, "Finetune/Step Time": 2.82973544113338} +{"Finetune/Learning Rate": 4.209399888251377e-06, "Finetune/Loss": 0.774478554725647, "Finetune/Loss (Raw)": 0.8639807105064392, "Finetune/Step": 3510, "Finetune/Step Time": 2.8318094201385975} +{"Finetune/Learning Rate": 4.204092736537754e-06, "Finetune/Loss": 0.7757121324539185, "Finetune/Loss (Raw)": 0.9063063263893127, "Finetune/Step": 3511, "Finetune/Step Time": 2.8310489021241665} +{"Finetune/Learning Rate": 4.198788041945013e-06, "Finetune/Loss": 0.775976300239563, "Finetune/Loss (Raw)": 0.7788691520690918, "Finetune/Step": 3512, "Finetune/Step Time": 2.819192146882415} +{"Finetune/Learning Rate": 4.193485806722029e-06, "Finetune/Loss": 0.7758388519287109, "Finetune/Loss (Raw)": 0.7912439107894897, "Finetune/Step": 3513, "Finetune/Step Time": 2.8177669364959} +{"Finetune/Learning Rate": 4.188186033116634e-06, "Finetune/Loss": 0.7745603322982788, "Finetune/Loss (Raw)": 0.6898485422134399, "Finetune/Step": 3514, "Finetune/Step Time": 2.8183576688170433} +{"Finetune/Learning Rate": 4.182888723375621e-06, "Finetune/Loss": 0.7739812135696411, "Finetune/Loss (Raw)": 0.7829827070236206, "Finetune/Step": 3515, "Finetune/Step Time": 2.81868046335876} +{"Finetune/Learning Rate": 4.1775938797447325e-06, "Finetune/Loss": 0.7738405466079712, "Finetune/Loss (Raw)": 0.7859725952148438, "Finetune/Step": 3516, "Finetune/Step Time": 2.820599965751171} +{"Finetune/Learning Rate": 4.172301504468664e-06, "Finetune/Loss": 0.7750704884529114, "Finetune/Loss (Raw)": 0.7920408248901367, "Finetune/Step": 3517, "Finetune/Step Time": 2.8194758407771587} +{"Finetune/Learning Rate": 4.167011599791082e-06, "Finetune/Loss": 0.7746142148971558, "Finetune/Loss (Raw)": 0.6628034114837646, "Finetune/Step": 3518, "Finetune/Step Time": 2.8414509650319815} +{"Finetune/Learning Rate": 4.161724167954575e-06, "Finetune/Loss": 0.7740554809570312, "Finetune/Loss (Raw)": 0.7220842838287354, "Finetune/Step": 3519, "Finetune/Step Time": 2.8374694790691137} +{"Finetune/Learning Rate": 4.1564392112007135e-06, "Finetune/Loss": 0.7723926305770874, "Finetune/Loss (Raw)": 0.6153784394264221, "Finetune/Step": 3520, "Finetune/Step Time": 2.8592192586511374} +{"Finetune/Learning Rate": 4.15115673177e-06, "Finetune/Loss": 0.7725534439086914, "Finetune/Loss (Raw)": 0.878253698348999, "Finetune/Step": 3521, "Finetune/Step Time": 2.858656607568264} +{"Finetune/Learning Rate": 4.145876731901895e-06, "Finetune/Loss": 0.7732135057449341, "Finetune/Loss (Raw)": 0.7642630338668823, "Finetune/Step": 3522, "Finetune/Step Time": 2.8557417076081038} +{"Finetune/Learning Rate": 4.140599213834804e-06, "Finetune/Loss": 0.7729285955429077, "Finetune/Loss (Raw)": 0.7698975801467896, "Finetune/Step": 3523, "Finetune/Step Time": 2.849544186145067} +{"Finetune/Learning Rate": 4.135324179806079e-06, "Finetune/Loss": 0.7717489004135132, "Finetune/Loss (Raw)": 0.7754467129707336, "Finetune/Step": 3524, "Finetune/Step Time": 2.845252137631178} +{"Finetune/Learning Rate": 4.130051632052029e-06, "Finetune/Loss": 0.7721904516220093, "Finetune/Loss (Raw)": 0.8152948617935181, "Finetune/Step": 3525, "Finetune/Step Time": 2.8483449555933475} +{"Finetune/Learning Rate": 4.124781572807894e-06, "Finetune/Loss": 0.7715557217597961, "Finetune/Loss (Raw)": 0.7657408118247986, "Finetune/Step": 3526, "Finetune/Step Time": 2.8496904391795397} +{"Finetune/Learning Rate": 4.119514004307865e-06, "Finetune/Loss": 0.7717071771621704, "Finetune/Loss (Raw)": 0.7078441381454468, "Finetune/Step": 3527, "Finetune/Step Time": 2.848857395350933} +{"Finetune/Learning Rate": 4.11424892878509e-06, "Finetune/Loss": 0.7718989849090576, "Finetune/Loss (Raw)": 0.8215103149414062, "Finetune/Step": 3528, "Finetune/Step Time": 2.8531168531626463} +{"Finetune/Learning Rate": 4.108986348471634e-06, "Finetune/Loss": 0.772085964679718, "Finetune/Loss (Raw)": 0.8035114407539368, "Finetune/Step": 3529, "Finetune/Step Time": 2.853933395817876} +{"Finetune/Learning Rate": 4.103726265598531e-06, "Finetune/Loss": 0.7725135087966919, "Finetune/Loss (Raw)": 0.8007025122642517, "Finetune/Step": 3530, "Finetune/Step Time": 2.8575008753687143} +{"Finetune/Learning Rate": 4.098468682395738e-06, "Finetune/Loss": 0.7730425000190735, "Finetune/Loss (Raw)": 0.8152334690093994, "Finetune/Step": 3531, "Finetune/Step Time": 2.8602232839912176} +{"Finetune/Learning Rate": 4.093213601092161e-06, "Finetune/Loss": 0.7729182839393616, "Finetune/Loss (Raw)": 0.7986254692077637, "Finetune/Step": 3532, "Finetune/Step Time": 2.856646928936243} +{"Finetune/Learning Rate": 4.087961023915641e-06, "Finetune/Loss": 0.7737017869949341, "Finetune/Loss (Raw)": 0.849382221698761, "Finetune/Step": 3533, "Finetune/Step Time": 2.860111143440008} +{"Finetune/Learning Rate": 4.0827109530929595e-06, "Finetune/Loss": 0.7740328311920166, "Finetune/Loss (Raw)": 0.8432909250259399, "Finetune/Step": 3534, "Finetune/Step Time": 2.862239919602871} +{"Finetune/Learning Rate": 4.0774633908498365e-06, "Finetune/Loss": 0.7741131782531738, "Finetune/Loss (Raw)": 0.7842243313789368, "Finetune/Step": 3535, "Finetune/Step Time": 2.863585837185383} +{"Finetune/Learning Rate": 4.072218339410924e-06, "Finetune/Loss": 0.7744323015213013, "Finetune/Loss (Raw)": 0.8023157119750977, "Finetune/Step": 3536, "Finetune/Step Time": 2.8589648976922035} +{"Finetune/Learning Rate": 4.066975800999812e-06, "Finetune/Loss": 0.7737089395523071, "Finetune/Loss (Raw)": 0.7366088032722473, "Finetune/Step": 3537, "Finetune/Step Time": 2.8651326801627874} +{"Finetune/Learning Rate": 4.061735777839032e-06, "Finetune/Loss": 0.7744361162185669, "Finetune/Loss (Raw)": 0.9368632435798645, "Finetune/Step": 3538, "Finetune/Step Time": 2.863901497796178} +{"Finetune/Learning Rate": 4.05649827215004e-06, "Finetune/Loss": 0.7746669054031372, "Finetune/Loss (Raw)": 0.7927974462509155, "Finetune/Step": 3539, "Finetune/Step Time": 2.8659774009138346} +{"Finetune/Learning Rate": 4.051263286153226e-06, "Finetune/Loss": 0.7750552892684937, "Finetune/Loss (Raw)": 0.7592564821243286, "Finetune/Step": 3540, "Finetune/Step Time": 2.8632897082716227} +{"Finetune/Learning Rate": 4.046030822067916e-06, "Finetune/Loss": 0.7741175889968872, "Finetune/Loss (Raw)": 0.7672046422958374, "Finetune/Step": 3541, "Finetune/Step Time": 2.865571990609169} +{"Finetune/Learning Rate": 4.040800882112362e-06, "Finetune/Loss": 0.7750676870346069, "Finetune/Loss (Raw)": 0.8475520014762878, "Finetune/Step": 3542, "Finetune/Step Time": 2.866341695189476} +{"Finetune/Learning Rate": 4.035573468503751e-06, "Finetune/Loss": 0.774484395980835, "Finetune/Loss (Raw)": 0.8283517956733704, "Finetune/Step": 3543, "Finetune/Step Time": 2.8668798711150885} +{"Finetune/Learning Rate": 4.030348583458192e-06, "Finetune/Loss": 0.7743678092956543, "Finetune/Loss (Raw)": 0.7574880123138428, "Finetune/Step": 3544, "Finetune/Step Time": 2.8444620352238417} +{"Finetune/Learning Rate": 4.025126229190728e-06, "Finetune/Loss": 0.7702451944351196, "Finetune/Loss (Raw)": 0.15884347259998322, "Finetune/Step": 3545, "Finetune/Step Time": 2.8783209156244993} +{"Finetune/Learning Rate": 4.019906407915335e-06, "Finetune/Loss": 0.7698162794113159, "Finetune/Loss (Raw)": 0.765090823173523, "Finetune/Step": 3546, "Finetune/Step Time": 2.880127467215061} +{"Finetune/Learning Rate": 4.014689121844894e-06, "Finetune/Loss": 0.7687740325927734, "Finetune/Loss (Raw)": 0.7324530482292175, "Finetune/Step": 3547, "Finetune/Step Time": 2.883548628538847} +{"Finetune/Learning Rate": 4.009474373191234e-06, "Finetune/Loss": 0.7699217200279236, "Finetune/Loss (Raw)": 0.8080214262008667, "Finetune/Step": 3548, "Finetune/Step Time": 2.885213930159807} +{"Finetune/Learning Rate": 4.004262164165098e-06, "Finetune/Loss": 0.7664802670478821, "Finetune/Loss (Raw)": 0.4285755157470703, "Finetune/Step": 3549, "Finetune/Step Time": 2.9175606314092875} +{"Finetune/Learning Rate": 3.999052496976152e-06, "Finetune/Loss": 0.7659680843353271, "Finetune/Loss (Raw)": 0.8248049020767212, "Finetune/Step": 3550, "Finetune/Step Time": 2.9184485767036676} +{"Finetune/Learning Rate": 3.993845373832987e-06, "Finetune/Loss": 0.7639049887657166, "Finetune/Loss (Raw)": 0.6542434692382812, "Finetune/Step": 3551, "Finetune/Step Time": 2.9191994462162256} +{"Finetune/Learning Rate": 3.988640796943111e-06, "Finetune/Loss": 0.7639549970626831, "Finetune/Loss (Raw)": 0.7412306070327759, "Finetune/Step": 3552, "Finetune/Step Time": 2.9296573381870985} +{"Finetune/Learning Rate": 3.983438768512964e-06, "Finetune/Loss": 0.7633493542671204, "Finetune/Loss (Raw)": 0.7606848478317261, "Finetune/Step": 3553, "Finetune/Step Time": 2.931549835950136} +{"Finetune/Learning Rate": 3.978239290747888e-06, "Finetune/Loss": 0.7612466812133789, "Finetune/Loss (Raw)": 0.5493759512901306, "Finetune/Step": 3554, "Finetune/Step Time": 2.95470330119133} +{"Finetune/Learning Rate": 3.973042365852155e-06, "Finetune/Loss": 0.7659227848052979, "Finetune/Loss (Raw)": 0.8196315169334412, "Finetune/Step": 3555, "Finetune/Step Time": 2.919307788833976} +{"Finetune/Learning Rate": 3.967847996028962e-06, "Finetune/Loss": 0.7659174203872681, "Finetune/Loss (Raw)": 0.6072843670845032, "Finetune/Step": 3556, "Finetune/Step Time": 2.9200605042278767} +{"Finetune/Learning Rate": 3.9626561834804e-06, "Finetune/Loss": 0.767315149307251, "Finetune/Loss (Raw)": 0.9125041365623474, "Finetune/Step": 3557, "Finetune/Step Time": 2.920164782553911} +{"Finetune/Learning Rate": 3.957466930407499e-06, "Finetune/Loss": 0.7667034268379211, "Finetune/Loss (Raw)": 0.771473228931427, "Finetune/Step": 3558, "Finetune/Step Time": 2.9178598783910275} +{"Finetune/Learning Rate": 3.952280239010193e-06, "Finetune/Loss": 0.7628558874130249, "Finetune/Loss (Raw)": 0.34429213404655457, "Finetune/Step": 3559, "Finetune/Step Time": 2.9501927085220814} +{"Finetune/Learning Rate": 3.947096111487328e-06, "Finetune/Loss": 0.7621948719024658, "Finetune/Loss (Raw)": 0.7658260464668274, "Finetune/Step": 3560, "Finetune/Step Time": 2.953252039849758} +{"Finetune/Learning Rate": 3.9419145500366706e-06, "Finetune/Loss": 0.7610903978347778, "Finetune/Loss (Raw)": 0.7476913332939148, "Finetune/Step": 3561, "Finetune/Step Time": 2.957054963335395} +{"Finetune/Learning Rate": 3.936735556854889e-06, "Finetune/Loss": 0.7606964111328125, "Finetune/Loss (Raw)": 0.7554205656051636, "Finetune/Step": 3562, "Finetune/Step Time": 2.9549145996570587} +{"Finetune/Learning Rate": 3.931559134137583e-06, "Finetune/Loss": 0.7599455714225769, "Finetune/Loss (Raw)": 0.667312741279602, "Finetune/Step": 3563, "Finetune/Step Time": 2.953846963122487} +{"Finetune/Learning Rate": 3.926385284079234e-06, "Finetune/Loss": 0.7609256505966187, "Finetune/Loss (Raw)": 0.8876652121543884, "Finetune/Step": 3564, "Finetune/Step Time": 2.9536443762481213} +{"Finetune/Learning Rate": 3.92121400887325e-06, "Finetune/Loss": 0.7642639875411987, "Finetune/Loss (Raw)": 0.8197397589683533, "Finetune/Step": 3565, "Finetune/Step Time": 2.924079755321145} +{"Finetune/Learning Rate": 3.916045310711952e-06, "Finetune/Loss": 0.7643921971321106, "Finetune/Loss (Raw)": 0.8450567126274109, "Finetune/Step": 3566, "Finetune/Step Time": 2.9192944522947073} +{"Finetune/Learning Rate": 3.910879191786557e-06, "Finetune/Loss": 0.7641203999519348, "Finetune/Loss (Raw)": 0.7601677775382996, "Finetune/Step": 3567, "Finetune/Step Time": 2.915971664711833} +{"Finetune/Learning Rate": 3.905715654287194e-06, "Finetune/Loss": 0.764346718788147, "Finetune/Loss (Raw)": 0.8258017897605896, "Finetune/Step": 3568, "Finetune/Step Time": 2.909008665010333} +{"Finetune/Learning Rate": 3.900554700402896e-06, "Finetune/Loss": 0.7637808918952942, "Finetune/Loss (Raw)": 0.7359461188316345, "Finetune/Step": 3569, "Finetune/Step Time": 2.886622104793787} +{"Finetune/Learning Rate": 3.895396332321601e-06, "Finetune/Loss": 0.7651822566986084, "Finetune/Loss (Raw)": 1.0311824083328247, "Finetune/Step": 3570, "Finetune/Step Time": 2.8896665014326572} +{"Finetune/Learning Rate": 3.890240552230153e-06, "Finetune/Loss": 0.7635519504547119, "Finetune/Loss (Raw)": 0.619724452495575, "Finetune/Step": 3571, "Finetune/Step Time": 2.9134868029505014} +{"Finetune/Learning Rate": 3.885087362314294e-06, "Finetune/Loss": 0.7626751661300659, "Finetune/Loss (Raw)": 0.7438346743583679, "Finetune/Step": 3572, "Finetune/Step Time": 2.9193733520805836} +{"Finetune/Learning Rate": 3.8799367647586695e-06, "Finetune/Loss": 0.7612437009811401, "Finetune/Loss (Raw)": 0.6183027625083923, "Finetune/Step": 3573, "Finetune/Step Time": 2.9163317549973726} +{"Finetune/Learning Rate": 3.874788761746836e-06, "Finetune/Loss": 0.7614469528198242, "Finetune/Loss (Raw)": 0.8228186964988708, "Finetune/Step": 3574, "Finetune/Step Time": 2.9154387656599283} +{"Finetune/Learning Rate": 3.86964335546123e-06, "Finetune/Loss": 0.7617545127868652, "Finetune/Loss (Raw)": 0.7948355078697205, "Finetune/Step": 3575, "Finetune/Step Time": 2.9139803051948547} +{"Finetune/Learning Rate": 3.8645005480832065e-06, "Finetune/Loss": 0.7603106498718262, "Finetune/Loss (Raw)": 0.5562070608139038, "Finetune/Step": 3576, "Finetune/Step Time": 2.93710009008646} +{"Finetune/Learning Rate": 3.859360341793009e-06, "Finetune/Loss": 0.7614482641220093, "Finetune/Loss (Raw)": 0.7751224637031555, "Finetune/Step": 3577, "Finetune/Step Time": 2.914602557197213} +{"Finetune/Learning Rate": 3.854222738769778e-06, "Finetune/Loss": 0.7614116668701172, "Finetune/Loss (Raw)": 0.7246052026748657, "Finetune/Step": 3578, "Finetune/Step Time": 2.9134377166628838} +{"Finetune/Learning Rate": 3.849087741191556e-06, "Finetune/Loss": 0.7604788541793823, "Finetune/Loss (Raw)": 0.7354303598403931, "Finetune/Step": 3579, "Finetune/Step Time": 2.9138104803860188} +{"Finetune/Learning Rate": 3.843955351235271e-06, "Finetune/Loss": 0.764563798904419, "Finetune/Loss (Raw)": 0.7322883605957031, "Finetune/Step": 3580, "Finetune/Step Time": 2.883921340107918} +{"Finetune/Learning Rate": 3.838825571076763e-06, "Finetune/Loss": 0.7676728367805481, "Finetune/Loss (Raw)": 0.9180513620376587, "Finetune/Step": 3581, "Finetune/Step Time": 2.863957377150655} +{"Finetune/Learning Rate": 3.833698402890743e-06, "Finetune/Loss": 0.767880916595459, "Finetune/Loss (Raw)": 0.775702953338623, "Finetune/Step": 3582, "Finetune/Step Time": 2.8640878088772297} +{"Finetune/Learning Rate": 3.8285738488508286e-06, "Finetune/Loss": 0.7674449682235718, "Finetune/Loss (Raw)": 0.7633823156356812, "Finetune/Step": 3583, "Finetune/Step Time": 2.858361005783081} +{"Finetune/Learning Rate": 3.823451911129536e-06, "Finetune/Loss": 0.7655701637268066, "Finetune/Loss (Raw)": 0.5797630548477173, "Finetune/Step": 3584, "Finetune/Step Time": 2.8805949185043573} +{"Finetune/Learning Rate": 3.8183325918982485e-06, "Finetune/Loss": 0.7647339105606079, "Finetune/Loss (Raw)": 0.7266812324523926, "Finetune/Step": 3585, "Finetune/Step Time": 2.8872599247843027} +{"Finetune/Learning Rate": 3.8132158933272644e-06, "Finetune/Loss": 0.764607310295105, "Finetune/Loss (Raw)": 0.825980007648468, "Finetune/Step": 3586, "Finetune/Step Time": 2.887893795967102} +{"Finetune/Learning Rate": 3.8081018175857577e-06, "Finetune/Loss": 0.764281153678894, "Finetune/Loss (Raw)": 0.7784231901168823, "Finetune/Step": 3587, "Finetune/Step Time": 2.8862519692629576} +{"Finetune/Learning Rate": 3.8029903668417935e-06, "Finetune/Loss": 0.763603687286377, "Finetune/Loss (Raw)": 0.777052104473114, "Finetune/Step": 3588, "Finetune/Step Time": 2.8876899629831314} +{"Finetune/Learning Rate": 3.7978815432623216e-06, "Finetune/Loss": 0.7633340358734131, "Finetune/Loss (Raw)": 0.6762297749519348, "Finetune/Step": 3589, "Finetune/Step Time": 2.885709622874856} +{"Finetune/Learning Rate": 3.792775349013178e-06, "Finetune/Loss": 0.7647461891174316, "Finetune/Loss (Raw)": 0.7982679605484009, "Finetune/Step": 3590, "Finetune/Step Time": 2.864199126139283} +{"Finetune/Learning Rate": 3.7876717862590973e-06, "Finetune/Loss": 0.7677335143089294, "Finetune/Loss (Raw)": 0.8345108032226562, "Finetune/Step": 3591, "Finetune/Step Time": 2.8363501224666834} +{"Finetune/Learning Rate": 3.7825708571636756e-06, "Finetune/Loss": 0.7672120928764343, "Finetune/Loss (Raw)": 0.7339726686477661, "Finetune/Step": 3592, "Finetune/Step Time": 2.836026307195425} +{"Finetune/Learning Rate": 3.777472563889405e-06, "Finetune/Loss": 0.7677834033966064, "Finetune/Loss (Raw)": 0.8941284418106079, "Finetune/Step": 3593, "Finetune/Step Time": 2.8365568723529577} +{"Finetune/Learning Rate": 3.7723769085976658e-06, "Finetune/Loss": 0.7687504887580872, "Finetune/Loss (Raw)": 0.7700725793838501, "Finetune/Step": 3594, "Finetune/Step Time": 2.8421786911785603} +{"Finetune/Learning Rate": 3.767283893448711e-06, "Finetune/Loss": 0.7690621614456177, "Finetune/Loss (Raw)": 0.9370478987693787, "Finetune/Step": 3595, "Finetune/Step Time": 2.8423737566918135} +{"Finetune/Learning Rate": 3.7621935206016767e-06, "Finetune/Loss": 0.7690914869308472, "Finetune/Loss (Raw)": 0.7899726629257202, "Finetune/Step": 3596, "Finetune/Step Time": 2.8401881493628025} +{"Finetune/Learning Rate": 3.757105792214579e-06, "Finetune/Loss": 0.7680017352104187, "Finetune/Loss (Raw)": 0.7135642170906067, "Finetune/Step": 3597, "Finetune/Step Time": 2.8427941538393497} +{"Finetune/Learning Rate": 3.7520207104443118e-06, "Finetune/Loss": 0.7662915587425232, "Finetune/Loss (Raw)": 0.49888941645622253, "Finetune/Step": 3598, "Finetune/Step Time": 2.8677675761282444} +{"Finetune/Learning Rate": 3.74693827744665e-06, "Finetune/Loss": 0.7655866146087646, "Finetune/Loss (Raw)": 0.7075442671775818, "Finetune/Step": 3599, "Finetune/Step Time": 2.8691323455423117} +{"Finetune/Learning Rate": 3.7418584953762427e-06, "Finetune/Loss": 0.7661186456680298, "Finetune/Loss (Raw)": 0.8405601978302002, "Finetune/Step": 3600, "Finetune/Step Time": 2.8667383305728436} +{"Finetune/Learning Rate": 3.7367813663866124e-06, "Finetune/Loss": 0.7663056254386902, "Finetune/Loss (Raw)": 0.7939246892929077, "Finetune/Step": 3601, "Finetune/Step Time": 2.872932903468609} +{"Finetune/Learning Rate": 3.7317068926301716e-06, "Finetune/Loss": 0.7651514410972595, "Finetune/Loss (Raw)": 0.7338557839393616, "Finetune/Step": 3602, "Finetune/Step Time": 2.873008171096444} +{"Finetune/Learning Rate": 3.7266350762581826e-06, "Finetune/Loss": 0.7651422619819641, "Finetune/Loss (Raw)": 0.7749302983283997, "Finetune/Step": 3603, "Finetune/Step Time": 2.89363276027143} +{"Finetune/Learning Rate": 3.721565919420804e-06, "Finetune/Loss": 0.7647684812545776, "Finetune/Loss (Raw)": 0.7784760594367981, "Finetune/Step": 3604, "Finetune/Step Time": 2.894146151840687} +{"Finetune/Learning Rate": 3.716499424267055e-06, "Finetune/Loss": 0.7637980580329895, "Finetune/Loss (Raw)": 0.611830472946167, "Finetune/Step": 3605, "Finetune/Step Time": 2.9184828586876392} +{"Finetune/Learning Rate": 3.7114355929448285e-06, "Finetune/Loss": 0.7641472816467285, "Finetune/Loss (Raw)": 0.8455996513366699, "Finetune/Step": 3606, "Finetune/Step Time": 2.9261369779706} +{"Finetune/Learning Rate": 3.7063744276008897e-06, "Finetune/Loss": 0.7640589475631714, "Finetune/Loss (Raw)": 0.7626922726631165, "Finetune/Step": 3607, "Finetune/Step Time": 2.9273688942193985} +{"Finetune/Learning Rate": 3.7013159303808675e-06, "Finetune/Loss": 0.7640243172645569, "Finetune/Loss (Raw)": 0.7815915942192078, "Finetune/Step": 3608, "Finetune/Step Time": 2.934411395341158} +{"Finetune/Learning Rate": 3.6962601034292766e-06, "Finetune/Loss": 0.7640313506126404, "Finetune/Loss (Raw)": 0.7914651036262512, "Finetune/Step": 3609, "Finetune/Step Time": 2.935216225683689} +{"Finetune/Learning Rate": 3.691206948889476e-06, "Finetune/Loss": 0.7646393775939941, "Finetune/Loss (Raw)": 0.8781396746635437, "Finetune/Step": 3610, "Finetune/Step Time": 2.9405616763979197} +{"Finetune/Learning Rate": 3.6861564689037046e-06, "Finetune/Loss": 0.7633354663848877, "Finetune/Loss (Raw)": 0.5777900218963623, "Finetune/Step": 3611, "Finetune/Step Time": 2.9649513699114323} +{"Finetune/Learning Rate": 3.681108665613076e-06, "Finetune/Loss": 0.7637760043144226, "Finetune/Loss (Raw)": 0.7261912822723389, "Finetune/Step": 3612, "Finetune/Step Time": 2.9444271866232157} +{"Finetune/Learning Rate": 3.676063541157544e-06, "Finetune/Loss": 0.762690007686615, "Finetune/Loss (Raw)": 0.7350853681564331, "Finetune/Step": 3613, "Finetune/Step Time": 2.9455342888832092} +{"Finetune/Learning Rate": 3.6710210976759563e-06, "Finetune/Loss": 0.7622625827789307, "Finetune/Loss (Raw)": 0.8356103897094727, "Finetune/Step": 3614, "Finetune/Step Time": 2.9459834061563015} +{"Finetune/Learning Rate": 3.6659813373060026e-06, "Finetune/Loss": 0.7607715129852295, "Finetune/Loss (Raw)": 0.6448652744293213, "Finetune/Step": 3615, "Finetune/Step Time": 2.969936054199934} +{"Finetune/Learning Rate": 3.660944262184245e-06, "Finetune/Loss": 0.7608093023300171, "Finetune/Loss (Raw)": 0.7533335089683533, "Finetune/Step": 3616, "Finetune/Step Time": 2.9692859314382076} +{"Finetune/Learning Rate": 3.655909874446103e-06, "Finetune/Loss": 0.7595479488372803, "Finetune/Loss (Raw)": 0.6034103631973267, "Finetune/Step": 3617, "Finetune/Step Time": 2.9934374317526817} +{"Finetune/Learning Rate": 3.650878176225856e-06, "Finetune/Loss": 0.7598887085914612, "Finetune/Loss (Raw)": 0.7974513173103333, "Finetune/Step": 3618, "Finetune/Step Time": 2.993578841909766} +{"Finetune/Learning Rate": 3.6458491696566558e-06, "Finetune/Loss": 0.7584251165390015, "Finetune/Loss (Raw)": 0.696461021900177, "Finetune/Step": 3619, "Finetune/Step Time": 2.994961950927973} +{"Finetune/Learning Rate": 3.6408228568704905e-06, "Finetune/Loss": 0.7599323987960815, "Finetune/Loss (Raw)": 0.825848400592804, "Finetune/Step": 3620, "Finetune/Step Time": 2.973851267248392} +{"Finetune/Learning Rate": 3.635799239998221e-06, "Finetune/Loss": 0.7589609622955322, "Finetune/Loss (Raw)": 0.6635218858718872, "Finetune/Step": 3621, "Finetune/Step Time": 2.973800325766206} +{"Finetune/Learning Rate": 3.6307783211695693e-06, "Finetune/Loss": 0.7580690383911133, "Finetune/Loss (Raw)": 0.7553113698959351, "Finetune/Step": 3622, "Finetune/Step Time": 2.976045122370124} +{"Finetune/Learning Rate": 3.625760102513103e-06, "Finetune/Loss": 0.756413459777832, "Finetune/Loss (Raw)": 0.5366128087043762, "Finetune/Step": 3623, "Finetune/Step Time": 2.9977608546614647} +{"Finetune/Learning Rate": 3.6207445861562497e-06, "Finetune/Loss": 0.7569879293441772, "Finetune/Loss (Raw)": 0.7986536026000977, "Finetune/Step": 3624, "Finetune/Step Time": 2.9899216424673796} +{"Finetune/Learning Rate": 3.6157317742252907e-06, "Finetune/Loss": 0.7551190853118896, "Finetune/Loss (Raw)": 0.5647940039634705, "Finetune/Step": 3625, "Finetune/Step Time": 3.013512933626771} +{"Finetune/Learning Rate": 3.6107216688453607e-06, "Finetune/Loss": 0.7554663419723511, "Finetune/Loss (Raw)": 0.8132447004318237, "Finetune/Step": 3626, "Finetune/Step Time": 3.011711934581399} +{"Finetune/Learning Rate": 3.605714272140447e-06, "Finetune/Loss": 0.7547063231468201, "Finetune/Loss (Raw)": 0.8201828002929688, "Finetune/Step": 3627, "Finetune/Step Time": 3.011000035330653} +{"Finetune/Learning Rate": 3.6007095862333897e-06, "Finetune/Loss": 0.7543426752090454, "Finetune/Loss (Raw)": 0.7566109299659729, "Finetune/Step": 3628, "Finetune/Step Time": 3.012741504237056} +{"Finetune/Learning Rate": 3.5957076132458747e-06, "Finetune/Loss": 0.7540531754493713, "Finetune/Loss (Raw)": 0.7623949646949768, "Finetune/Step": 3629, "Finetune/Step Time": 3.012311588972807} +{"Finetune/Learning Rate": 3.5907083552984513e-06, "Finetune/Loss": 0.7540456652641296, "Finetune/Loss (Raw)": 0.797437846660614, "Finetune/Step": 3630, "Finetune/Step Time": 3.0120821725577116} +{"Finetune/Learning Rate": 3.5857118145104963e-06, "Finetune/Loss": 0.754372239112854, "Finetune/Loss (Raw)": 0.7487711310386658, "Finetune/Step": 3631, "Finetune/Step Time": 3.0124629624187946} +{"Finetune/Learning Rate": 3.5807179930002556e-06, "Finetune/Loss": 0.7541337013244629, "Finetune/Loss (Raw)": 0.7625315189361572, "Finetune/Step": 3632, "Finetune/Step Time": 3.015574559569359} +{"Finetune/Learning Rate": 3.575726892884811e-06, "Finetune/Loss": 0.7537781000137329, "Finetune/Loss (Raw)": 0.8415377736091614, "Finetune/Step": 3633, "Finetune/Step Time": 3.0154895428568125} +{"Finetune/Learning Rate": 3.570738516280092e-06, "Finetune/Loss": 0.7533779740333557, "Finetune/Loss (Raw)": 0.7902939319610596, "Finetune/Step": 3634, "Finetune/Step Time": 3.0169279612600803} +{"Finetune/Learning Rate": 3.5657528653008744e-06, "Finetune/Loss": 0.7525652050971985, "Finetune/Loss (Raw)": 0.6238341927528381, "Finetune/Step": 3635, "Finetune/Step Time": 3.0350348483771086} +{"Finetune/Learning Rate": 3.5607699420607753e-06, "Finetune/Loss": 0.752285361289978, "Finetune/Loss (Raw)": 0.7798873782157898, "Finetune/Step": 3636, "Finetune/Step Time": 3.0323869176208973} +{"Finetune/Learning Rate": 3.5557897486722693e-06, "Finetune/Loss": 0.7530537843704224, "Finetune/Loss (Raw)": 0.8302499055862427, "Finetune/Step": 3637, "Finetune/Step Time": 3.030662029981613} +{"Finetune/Learning Rate": 3.5508122872466523e-06, "Finetune/Loss": 0.7520486116409302, "Finetune/Loss (Raw)": 0.7353150248527527, "Finetune/Step": 3638, "Finetune/Step Time": 3.0266086980700493} +{"Finetune/Learning Rate": 3.545837559894072e-06, "Finetune/Loss": 0.7516316175460815, "Finetune/Loss (Raw)": 0.852932870388031, "Finetune/Step": 3639, "Finetune/Step Time": 3.0284137967973948} +{"Finetune/Learning Rate": 3.5408655687235282e-06, "Finetune/Loss": 0.7515172958374023, "Finetune/Loss (Raw)": 0.7642399072647095, "Finetune/Step": 3640, "Finetune/Step Time": 3.0289676003158092} +{"Finetune/Learning Rate": 3.535896315842838e-06, "Finetune/Loss": 0.7519351243972778, "Finetune/Loss (Raw)": 0.8447243571281433, "Finetune/Step": 3641, "Finetune/Step Time": 3.028962856158614} +{"Finetune/Learning Rate": 3.530929803358678e-06, "Finetune/Loss": 0.7526648044586182, "Finetune/Loss (Raw)": 0.783250093460083, "Finetune/Step": 3642, "Finetune/Step Time": 3.0288859009742737} +{"Finetune/Learning Rate": 3.5259660333765533e-06, "Finetune/Loss": 0.7511587738990784, "Finetune/Loss (Raw)": 0.5902102589607239, "Finetune/Step": 3643, "Finetune/Step Time": 3.0514939222484827} +{"Finetune/Learning Rate": 3.5210050080008074e-06, "Finetune/Loss": 0.7513833045959473, "Finetune/Loss (Raw)": 0.8147148489952087, "Finetune/Step": 3644, "Finetune/Step Time": 3.0541997775435448} +{"Finetune/Learning Rate": 3.5160467293346202e-06, "Finetune/Loss": 0.7515594363212585, "Finetune/Loss (Raw)": 0.8145840167999268, "Finetune/Step": 3645, "Finetune/Step Time": 3.0572405513375998} +{"Finetune/Learning Rate": 3.5110911994800043e-06, "Finetune/Loss": 0.7527315616607666, "Finetune/Loss (Raw)": 0.8128326535224915, "Finetune/Step": 3646, "Finetune/Step Time": 3.0309895426034927} +{"Finetune/Learning Rate": 3.5061384205378225e-06, "Finetune/Loss": 0.753502607345581, "Finetune/Loss (Raw)": 0.8207778334617615, "Finetune/Step": 3647, "Finetune/Step Time": 3.0335416607558727} +{"Finetune/Learning Rate": 3.5011883946077462e-06, "Finetune/Loss": 0.7555999755859375, "Finetune/Loss (Raw)": 0.8838425874710083, "Finetune/Step": 3648, "Finetune/Step Time": 3.0131960101425648} +{"Finetune/Learning Rate": 3.4962411237882945e-06, "Finetune/Loss": 0.7539085149765015, "Finetune/Loss (Raw)": 0.6617516875267029, "Finetune/Step": 3649, "Finetune/Step Time": 3.016745375469327} +{"Finetune/Learning Rate": 3.491296610176823e-06, "Finetune/Loss": 0.7545487880706787, "Finetune/Loss (Raw)": 0.8462185263633728, "Finetune/Step": 3650, "Finetune/Step Time": 3.0200699362903833} +{"Finetune/Learning Rate": 3.4863548558695094e-06, "Finetune/Loss": 0.7536904215812683, "Finetune/Loss (Raw)": 0.6600190997123718, "Finetune/Step": 3651, "Finetune/Step Time": 3.0212152171880007} +{"Finetune/Learning Rate": 3.481415862961365e-06, "Finetune/Loss": 0.7537497282028198, "Finetune/Loss (Raw)": 0.7830468416213989, "Finetune/Step": 3652, "Finetune/Step Time": 3.0233922451734543} +{"Finetune/Learning Rate": 3.4764796335462268e-06, "Finetune/Loss": 0.7534346580505371, "Finetune/Loss (Raw)": 0.7749609351158142, "Finetune/Step": 3653, "Finetune/Step Time": 3.0209651067852974} +{"Finetune/Learning Rate": 3.4715461697167663e-06, "Finetune/Loss": 0.7546178102493286, "Finetune/Loss (Raw)": 0.9171833992004395, "Finetune/Step": 3654, "Finetune/Step Time": 3.023608786985278} +{"Finetune/Learning Rate": 3.4666154735644785e-06, "Finetune/Loss": 0.7553931474685669, "Finetune/Loss (Raw)": 0.8070874214172363, "Finetune/Step": 3655, "Finetune/Step Time": 3.0226472206413746} +{"Finetune/Learning Rate": 3.4616875471796863e-06, "Finetune/Loss": 0.755603551864624, "Finetune/Loss (Raw)": 0.8484421372413635, "Finetune/Step": 3656, "Finetune/Step Time": 3.023439794778824} +{"Finetune/Learning Rate": 3.456762392651538e-06, "Finetune/Loss": 0.7554107308387756, "Finetune/Loss (Raw)": 0.7788283824920654, "Finetune/Step": 3657, "Finetune/Step Time": 3.025578686967492} +{"Finetune/Learning Rate": 3.4518400120680074e-06, "Finetune/Loss": 0.7555182576179504, "Finetune/Loss (Raw)": 0.8144679069519043, "Finetune/Step": 3658, "Finetune/Step Time": 3.023814605548978} +{"Finetune/Learning Rate": 3.4469204075158867e-06, "Finetune/Loss": 0.7550277709960938, "Finetune/Loss (Raw)": 0.7524543404579163, "Finetune/Step": 3659, "Finetune/Step Time": 3.0208130795508623} +{"Finetune/Learning Rate": 3.442003581080805e-06, "Finetune/Loss": 0.7549299597740173, "Finetune/Loss (Raw)": 0.7861025333404541, "Finetune/Step": 3660, "Finetune/Step Time": 3.0210134126245975} +{"Finetune/Learning Rate": 3.4370895348472024e-06, "Finetune/Loss": 0.7544463872909546, "Finetune/Loss (Raw)": 0.7874919176101685, "Finetune/Step": 3661, "Finetune/Step Time": 3.0235334895551205} +{"Finetune/Learning Rate": 3.432178270898341e-06, "Finetune/Loss": 0.7539222240447998, "Finetune/Loss (Raw)": 0.7761950492858887, "Finetune/Step": 3662, "Finetune/Step Time": 3.0226001534610987} +{"Finetune/Learning Rate": 3.4272697913163054e-06, "Finetune/Loss": 0.7542476654052734, "Finetune/Loss (Raw)": 0.8258703947067261, "Finetune/Step": 3663, "Finetune/Step Time": 3.021764513105154} +{"Finetune/Learning Rate": 3.4223640981820016e-06, "Finetune/Loss": 0.7537096738815308, "Finetune/Loss (Raw)": 0.7334609031677246, "Finetune/Step": 3664, "Finetune/Step Time": 3.03098201751709} +{"Finetune/Learning Rate": 3.417461193575151e-06, "Finetune/Loss": 0.7540530562400818, "Finetune/Loss (Raw)": 0.7805624604225159, "Finetune/Step": 3665, "Finetune/Step Time": 3.029332334175706} +{"Finetune/Learning Rate": 3.4125610795742956e-06, "Finetune/Loss": 0.7526453733444214, "Finetune/Loss (Raw)": 0.7566863894462585, "Finetune/Step": 3666, "Finetune/Step Time": 3.0275344233959913} +{"Finetune/Learning Rate": 3.4076637582567882e-06, "Finetune/Loss": 0.752937376499176, "Finetune/Loss (Raw)": 0.8301617503166199, "Finetune/Step": 3667, "Finetune/Step Time": 3.026454845443368} +{"Finetune/Learning Rate": 3.4027692316988138e-06, "Finetune/Loss": 0.7517795562744141, "Finetune/Loss (Raw)": 0.6110657453536987, "Finetune/Step": 3668, "Finetune/Step Time": 3.050087520852685} +{"Finetune/Learning Rate": 3.3978775019753476e-06, "Finetune/Loss": 0.7508724331855774, "Finetune/Loss (Raw)": 0.6510887145996094, "Finetune/Step": 3669, "Finetune/Step Time": 3.0700449254363775} +{"Finetune/Learning Rate": 3.392988571160203e-06, "Finetune/Loss": 0.7492849826812744, "Finetune/Loss (Raw)": 0.6443576216697693, "Finetune/Step": 3670, "Finetune/Step Time": 3.094821633771062} +{"Finetune/Learning Rate": 3.388102441325992e-06, "Finetune/Loss": 0.7491944432258606, "Finetune/Loss (Raw)": 0.8167592883110046, "Finetune/Step": 3671, "Finetune/Step Time": 3.092810608446598} +{"Finetune/Learning Rate": 3.383219114544145e-06, "Finetune/Loss": 0.7494074106216431, "Finetune/Loss (Raw)": 0.7847463488578796, "Finetune/Step": 3672, "Finetune/Step Time": 3.089391615241766} +{"Finetune/Learning Rate": 3.378338592884903e-06, "Finetune/Loss": 0.752991795539856, "Finetune/Loss (Raw)": 0.617647647857666, "Finetune/Step": 3673, "Finetune/Step Time": 3.0798524226993322} +{"Finetune/Learning Rate": 3.373460878417315e-06, "Finetune/Loss": 0.7529800534248352, "Finetune/Loss (Raw)": 0.7635942697525024, "Finetune/Step": 3674, "Finetune/Step Time": 3.077128041535616} +{"Finetune/Learning Rate": 3.3685859732092507e-06, "Finetune/Loss": 0.7534879446029663, "Finetune/Loss (Raw)": 0.797460675239563, "Finetune/Step": 3675, "Finetune/Step Time": 3.072579424828291} +{"Finetune/Learning Rate": 3.363713879327373e-06, "Finetune/Loss": 0.7531809210777283, "Finetune/Loss (Raw)": 0.7687200307846069, "Finetune/Step": 3676, "Finetune/Step Time": 3.072138139978051} +{"Finetune/Learning Rate": 3.3588445988371575e-06, "Finetune/Loss": 0.7556971311569214, "Finetune/Loss (Raw)": 0.7506463527679443, "Finetune/Step": 3677, "Finetune/Step Time": 3.0432347655296326} +{"Finetune/Learning Rate": 3.3539781338029044e-06, "Finetune/Loss": 0.7554379105567932, "Finetune/Loss (Raw)": 0.7916293144226074, "Finetune/Step": 3678, "Finetune/Step Time": 3.0438251458108425} +{"Finetune/Learning Rate": 3.349114486287689e-06, "Finetune/Loss": 0.7563011646270752, "Finetune/Loss (Raw)": 0.7647349238395691, "Finetune/Step": 3679, "Finetune/Step Time": 3.043652920052409} +{"Finetune/Learning Rate": 3.3442536583534225e-06, "Finetune/Loss": 0.7569886445999146, "Finetune/Loss (Raw)": 0.8292372226715088, "Finetune/Step": 3680, "Finetune/Step Time": 3.0341506265103817} +{"Finetune/Learning Rate": 3.3393956520608018e-06, "Finetune/Loss": 0.7577141523361206, "Finetune/Loss (Raw)": 0.8535481095314026, "Finetune/Step": 3681, "Finetune/Step Time": 3.032349204644561} +{"Finetune/Learning Rate": 3.334540469469335e-06, "Finetune/Loss": 0.7598497867584229, "Finetune/Loss (Raw)": 0.8227375149726868, "Finetune/Step": 3682, "Finetune/Step Time": 3.0096044577658176} +{"Finetune/Learning Rate": 3.3296881126373315e-06, "Finetune/Loss": 0.759307861328125, "Finetune/Loss (Raw)": 0.7502577304840088, "Finetune/Step": 3683, "Finetune/Step Time": 3.012363463640213} +{"Finetune/Learning Rate": 3.3248385836218977e-06, "Finetune/Loss": 0.7609902620315552, "Finetune/Loss (Raw)": 0.8226361274719238, "Finetune/Step": 3684, "Finetune/Step Time": 2.9888024292886257} +{"Finetune/Learning Rate": 3.319991884478958e-06, "Finetune/Loss": 0.760124921798706, "Finetune/Loss (Raw)": 0.8017432689666748, "Finetune/Step": 3685, "Finetune/Step Time": 2.986487537622452} +{"Finetune/Learning Rate": 3.3151480172632157e-06, "Finetune/Loss": 0.7603620290756226, "Finetune/Loss (Raw)": 0.8018162846565247, "Finetune/Step": 3686, "Finetune/Step Time": 2.9864066373556852} +{"Finetune/Learning Rate": 3.310306984028181e-06, "Finetune/Loss": 0.7644054889678955, "Finetune/Loss (Raw)": 0.8618549108505249, "Finetune/Step": 3687, "Finetune/Step Time": 2.9546284824609756} +{"Finetune/Learning Rate": 3.3054687868261735e-06, "Finetune/Loss": 0.764289379119873, "Finetune/Loss (Raw)": 0.7509604096412659, "Finetune/Step": 3688, "Finetune/Step Time": 2.950623217970133} +{"Finetune/Learning Rate": 3.3006334277082974e-06, "Finetune/Loss": 0.7654212713241577, "Finetune/Loss (Raw)": 0.8925892114639282, "Finetune/Step": 3689, "Finetune/Step Time": 2.9450392965227365} +{"Finetune/Learning Rate": 3.295800908724459e-06, "Finetune/Loss": 0.7647937536239624, "Finetune/Loss (Raw)": 0.6750901341438293, "Finetune/Step": 3690, "Finetune/Step Time": 2.97171787917614} +{"Finetune/Learning Rate": 3.290971231923359e-06, "Finetune/Loss": 0.7641489505767822, "Finetune/Loss (Raw)": 0.5847814083099365, "Finetune/Step": 3691, "Finetune/Step Time": 2.9992192145437} +{"Finetune/Learning Rate": 3.2861443993524944e-06, "Finetune/Loss": 0.7635490894317627, "Finetune/Loss (Raw)": 0.8108837604522705, "Finetune/Step": 3692, "Finetune/Step Time": 2.9999625086784363} +{"Finetune/Learning Rate": 3.2813204130581557e-06, "Finetune/Loss": 0.7611878514289856, "Finetune/Loss (Raw)": 0.5174943208694458, "Finetune/Step": 3693, "Finetune/Step Time": 3.021712761372328} +{"Finetune/Learning Rate": 3.276499275085426e-06, "Finetune/Loss": 0.7600990533828735, "Finetune/Loss (Raw)": 0.7056953310966492, "Finetune/Step": 3694, "Finetune/Step Time": 3.0258578546345234} +{"Finetune/Learning Rate": 3.2716809874781794e-06, "Finetune/Loss": 0.7599225640296936, "Finetune/Loss (Raw)": 0.737572193145752, "Finetune/Step": 3695, "Finetune/Step Time": 3.0319662801921368} +{"Finetune/Learning Rate": 3.266865552279095e-06, "Finetune/Loss": 0.7599021792411804, "Finetune/Loss (Raw)": 0.8231949210166931, "Finetune/Step": 3696, "Finetune/Step Time": 3.0292773451656103} +{"Finetune/Learning Rate": 3.262052971529617e-06, "Finetune/Loss": 0.7601068019866943, "Finetune/Loss (Raw)": 0.7621365189552307, "Finetune/Step": 3697, "Finetune/Step Time": 3.029282409697771} +{"Finetune/Learning Rate": 3.2572432472700034e-06, "Finetune/Loss": 0.7553102374076843, "Finetune/Loss (Raw)": 0.4172247350215912, "Finetune/Step": 3698, "Finetune/Step Time": 3.0571062210947275} +{"Finetune/Learning Rate": 3.252436381539291e-06, "Finetune/Loss": 0.7555974125862122, "Finetune/Loss (Raw)": 0.6564813852310181, "Finetune/Step": 3699, "Finetune/Step Time": 3.033297050744295} +{"Finetune/Learning Rate": 3.2476323763753035e-06, "Finetune/Loss": 0.7556847929954529, "Finetune/Loss (Raw)": 0.7550146579742432, "Finetune/Step": 3700, "Finetune/Step Time": 3.028229432180524} +{"Finetune/Learning Rate": 3.242831233814656e-06, "Finetune/Loss": 0.7580533027648926, "Finetune/Loss (Raw)": 0.9214752316474915, "Finetune/Step": 3701, "Finetune/Step Time": 3.035280615091324} +{"Finetune/Learning Rate": 3.238032955892744e-06, "Finetune/Loss": 0.7578585147857666, "Finetune/Loss (Raw)": 0.7978882193565369, "Finetune/Step": 3702, "Finetune/Step Time": 3.0355540737509727} +{"Finetune/Learning Rate": 3.233237544643761e-06, "Finetune/Loss": 0.7577725648880005, "Finetune/Loss (Raw)": 0.7838355898857117, "Finetune/Step": 3703, "Finetune/Step Time": 3.038396619260311} +{"Finetune/Learning Rate": 3.2284450021006697e-06, "Finetune/Loss": 0.7596299648284912, "Finetune/Loss (Raw)": 0.7939536571502686, "Finetune/Step": 3704, "Finetune/Step Time": 3.010222151875496} +{"Finetune/Learning Rate": 3.2236553302952233e-06, "Finetune/Loss": 0.7550342082977295, "Finetune/Loss (Raw)": 0.18686099350452423, "Finetune/Step": 3705, "Finetune/Step Time": 3.040321731939912} +{"Finetune/Learning Rate": 3.218868531257967e-06, "Finetune/Loss": 0.7547140717506409, "Finetune/Loss (Raw)": 0.6836264729499817, "Finetune/Step": 3706, "Finetune/Step Time": 3.0408954713493586} +{"Finetune/Learning Rate": 3.2140846070182074e-06, "Finetune/Loss": 0.7554779648780823, "Finetune/Loss (Raw)": 0.8332183361053467, "Finetune/Step": 3707, "Finetune/Step Time": 3.042792648077011} +{"Finetune/Learning Rate": 3.2093035596040554e-06, "Finetune/Loss": 0.7568763494491577, "Finetune/Loss (Raw)": 0.9112744927406311, "Finetune/Step": 3708, "Finetune/Step Time": 3.040740270167589} +{"Finetune/Learning Rate": 3.2045253910423867e-06, "Finetune/Loss": 0.7552443742752075, "Finetune/Loss (Raw)": 0.7091575264930725, "Finetune/Step": 3709, "Finetune/Step Time": 3.0367987398058176} +{"Finetune/Learning Rate": 3.199750103358862e-06, "Finetune/Loss": 0.753049373626709, "Finetune/Loss (Raw)": 0.4947480261325836, "Finetune/Step": 3710, "Finetune/Step Time": 3.0673693399876356} +{"Finetune/Learning Rate": 3.1949776985779193e-06, "Finetune/Loss": 0.7531124949455261, "Finetune/Loss (Raw)": 0.7714554071426392, "Finetune/Step": 3711, "Finetune/Step Time": 3.0650779362767935} +{"Finetune/Learning Rate": 3.1902081787227734e-06, "Finetune/Loss": 0.754294216632843, "Finetune/Loss (Raw)": 0.7310217022895813, "Finetune/Step": 3712, "Finetune/Step Time": 3.042440000921488} +{"Finetune/Learning Rate": 3.1854415458154253e-06, "Finetune/Loss": 0.7553049921989441, "Finetune/Loss (Raw)": 0.856063187122345, "Finetune/Step": 3713, "Finetune/Step Time": 3.0330996718257666} +{"Finetune/Learning Rate": 3.180677801876637e-06, "Finetune/Loss": 0.754298210144043, "Finetune/Loss (Raw)": 0.6971126794815063, "Finetune/Step": 3714, "Finetune/Step Time": 3.051588673144579} +{"Finetune/Learning Rate": 3.1759169489259536e-06, "Finetune/Loss": 0.7536194920539856, "Finetune/Loss (Raw)": 0.691551923751831, "Finetune/Step": 3715, "Finetune/Step Time": 3.0749096162617207} +{"Finetune/Learning Rate": 3.1711589889816986e-06, "Finetune/Loss": 0.7493663430213928, "Finetune/Loss (Raw)": 0.2326425313949585, "Finetune/Step": 3716, "Finetune/Step Time": 3.106972085312009} +{"Finetune/Learning Rate": 3.1664039240609624e-06, "Finetune/Loss": 0.7507965564727783, "Finetune/Loss (Raw)": 0.8592982888221741, "Finetune/Step": 3717, "Finetune/Step Time": 3.109597686678171} +{"Finetune/Learning Rate": 3.161651756179612e-06, "Finetune/Loss": 0.7500245571136475, "Finetune/Loss (Raw)": 0.6994521021842957, "Finetune/Step": 3718, "Finetune/Step Time": 3.1069211047142744} +{"Finetune/Learning Rate": 3.1569024873522823e-06, "Finetune/Loss": 0.7499409914016724, "Finetune/Loss (Raw)": 0.8238216042518616, "Finetune/Step": 3719, "Finetune/Step Time": 3.1062782760709524} +{"Finetune/Learning Rate": 3.1521561195923833e-06, "Finetune/Loss": 0.7497583627700806, "Finetune/Loss (Raw)": 0.7105857729911804, "Finetune/Step": 3720, "Finetune/Step Time": 3.1156836170703173} +{"Finetune/Learning Rate": 3.1474126549120932e-06, "Finetune/Loss": 0.7492103576660156, "Finetune/Loss (Raw)": 0.8239917755126953, "Finetune/Step": 3721, "Finetune/Step Time": 3.1153337452560663} +{"Finetune/Learning Rate": 3.14267209532236e-06, "Finetune/Loss": 0.7487014532089233, "Finetune/Loss (Raw)": 0.7049286961555481, "Finetune/Step": 3722, "Finetune/Step Time": 3.1139890793710947} +{"Finetune/Learning Rate": 3.137934442832894e-06, "Finetune/Loss": 0.7478730082511902, "Finetune/Loss (Raw)": 0.8310133814811707, "Finetune/Step": 3723, "Finetune/Step Time": 3.113670729100704} +{"Finetune/Learning Rate": 3.1331996994521917e-06, "Finetune/Loss": 0.7480114102363586, "Finetune/Loss (Raw)": 0.8076810240745544, "Finetune/Step": 3724, "Finetune/Step Time": 3.1142123118042946} +{"Finetune/Learning Rate": 3.1284678671874893e-06, "Finetune/Loss": 0.7490048408508301, "Finetune/Loss (Raw)": 0.8407211899757385, "Finetune/Step": 3725, "Finetune/Step Time": 3.1138064805418253} +{"Finetune/Learning Rate": 3.123738948044812e-06, "Finetune/Loss": 0.7501314878463745, "Finetune/Loss (Raw)": 0.6431093811988831, "Finetune/Step": 3726, "Finetune/Step Time": 3.0908836778253317} +{"Finetune/Learning Rate": 3.1190129440289385e-06, "Finetune/Loss": 0.7503739595413208, "Finetune/Loss (Raw)": 0.7385791540145874, "Finetune/Step": 3727, "Finetune/Step Time": 3.0910038482397795} +{"Finetune/Learning Rate": 3.1142898571434145e-06, "Finetune/Loss": 0.7483025193214417, "Finetune/Loss (Raw)": 0.5754093527793884, "Finetune/Step": 3728, "Finetune/Step Time": 3.114026052877307} +{"Finetune/Learning Rate": 3.109569689390547e-06, "Finetune/Loss": 0.7482185363769531, "Finetune/Loss (Raw)": 0.7831783890724182, "Finetune/Step": 3729, "Finetune/Step Time": 3.112937856465578} +{"Finetune/Learning Rate": 3.1048524427714066e-06, "Finetune/Loss": 0.7480170130729675, "Finetune/Loss (Raw)": 0.7080585956573486, "Finetune/Step": 3730, "Finetune/Step Time": 3.112789459526539} +{"Finetune/Learning Rate": 3.100138119285834e-06, "Finetune/Loss": 0.7473146915435791, "Finetune/Loss (Raw)": 0.6850399971008301, "Finetune/Step": 3731, "Finetune/Step Time": 3.1118573118001223} +{"Finetune/Learning Rate": 3.0954267209324117e-06, "Finetune/Loss": 0.7479015588760376, "Finetune/Loss (Raw)": 0.8535913825035095, "Finetune/Step": 3732, "Finetune/Step Time": 3.113540418446064} +{"Finetune/Learning Rate": 3.0907182497084964e-06, "Finetune/Loss": 0.7499079704284668, "Finetune/Loss (Raw)": 0.8686565160751343, "Finetune/Step": 3733, "Finetune/Step Time": 3.0882025621831417} +{"Finetune/Learning Rate": 3.0860127076102087e-06, "Finetune/Loss": 0.749397873878479, "Finetune/Loss (Raw)": 0.7802994847297668, "Finetune/Step": 3734, "Finetune/Step Time": 3.0813022796064615} +{"Finetune/Learning Rate": 3.081310096632406e-06, "Finetune/Loss": 0.7453320026397705, "Finetune/Loss (Raw)": 0.2422615885734558, "Finetune/Step": 3735, "Finetune/Step Time": 3.1075590439140797} +{"Finetune/Learning Rate": 3.0766104187687262e-06, "Finetune/Loss": 0.7451634407043457, "Finetune/Loss (Raw)": 0.7600165605545044, "Finetune/Step": 3736, "Finetune/Step Time": 3.1003951895982027} +{"Finetune/Learning Rate": 3.071913676011551e-06, "Finetune/Loss": 0.7446160912513733, "Finetune/Loss (Raw)": 0.7214066982269287, "Finetune/Step": 3737, "Finetune/Step Time": 3.0997211653739214} +{"Finetune/Learning Rate": 3.0672198703520205e-06, "Finetune/Loss": 0.7435966730117798, "Finetune/Loss (Raw)": 0.7476519346237183, "Finetune/Step": 3738, "Finetune/Step Time": 3.09582463093102} +{"Finetune/Learning Rate": 3.0625290037800303e-06, "Finetune/Loss": 0.745582103729248, "Finetune/Loss (Raw)": 0.8319296836853027, "Finetune/Step": 3739, "Finetune/Step Time": 3.0765700191259384} +{"Finetune/Learning Rate": 3.057841078284226e-06, "Finetune/Loss": 0.7459149360656738, "Finetune/Loss (Raw)": 0.7687817811965942, "Finetune/Step": 3740, "Finetune/Step Time": 3.073263632133603} +{"Finetune/Learning Rate": 3.053156095852019e-06, "Finetune/Loss": 0.7466093301773071, "Finetune/Loss (Raw)": 0.8239802122116089, "Finetune/Step": 3741, "Finetune/Step Time": 3.0711090806871653} +{"Finetune/Learning Rate": 3.048474058469556e-06, "Finetune/Loss": 0.7467375993728638, "Finetune/Loss (Raw)": 0.8520249128341675, "Finetune/Step": 3742, "Finetune/Step Time": 3.0704329311847687} +{"Finetune/Learning Rate": 3.0437949681217414e-06, "Finetune/Loss": 0.7476334571838379, "Finetune/Loss (Raw)": 0.7595339417457581, "Finetune/Step": 3743, "Finetune/Step Time": 3.0501662977039814} +{"Finetune/Learning Rate": 3.03911882679224e-06, "Finetune/Loss": 0.7482808828353882, "Finetune/Loss (Raw)": 0.8362109661102295, "Finetune/Step": 3744, "Finetune/Step Time": 3.048741217702627} +{"Finetune/Learning Rate": 3.0344456364634546e-06, "Finetune/Loss": 0.7491326928138733, "Finetune/Loss (Raw)": 0.7124351859092712, "Finetune/Step": 3745, "Finetune/Step Time": 3.0231637563556433} +{"Finetune/Learning Rate": 3.029775399116539e-06, "Finetune/Loss": 0.7495355606079102, "Finetune/Loss (Raw)": 0.8490164279937744, "Finetune/Step": 3746, "Finetune/Step Time": 3.023218745365739} +{"Finetune/Learning Rate": 3.025108116731399e-06, "Finetune/Loss": 0.7504943609237671, "Finetune/Loss (Raw)": 0.8191915154457092, "Finetune/Step": 3747, "Finetune/Step Time": 3.023741152137518} +{"Finetune/Learning Rate": 3.0204437912866834e-06, "Finetune/Loss": 0.750395655632019, "Finetune/Loss (Raw)": 0.8132097125053406, "Finetune/Step": 3748, "Finetune/Step Time": 3.021785171702504} +{"Finetune/Learning Rate": 3.015782424759792e-06, "Finetune/Loss": 0.7516690492630005, "Finetune/Loss (Raw)": 0.8265178203582764, "Finetune/Step": 3749, "Finetune/Step Time": 3.0216067414730787} +{"Finetune/Learning Rate": 3.0111240191268663e-06, "Finetune/Loss": 0.7518625259399414, "Finetune/Loss (Raw)": 0.7800815105438232, "Finetune/Step": 3750, "Finetune/Step Time": 3.020614607259631} +{"Finetune/Learning Rate": 3.00646857636279e-06, "Finetune/Loss": 0.752853512763977, "Finetune/Loss (Raw)": 0.6634542346000671, "Finetune/Step": 3751, "Finetune/Step Time": 3.000479258596897} +{"Finetune/Learning Rate": 3.001816098441206e-06, "Finetune/Loss": 0.7525374889373779, "Finetune/Loss (Raw)": 0.7582055330276489, "Finetune/Step": 3752, "Finetune/Step Time": 2.9980115722864866} +{"Finetune/Learning Rate": 2.997166587334476e-06, "Finetune/Loss": 0.7543253898620605, "Finetune/Loss (Raw)": 0.7936422824859619, "Finetune/Step": 3753, "Finetune/Step Time": 2.975301545113325} +{"Finetune/Learning Rate": 2.992520045013725e-06, "Finetune/Loss": 0.7541486024856567, "Finetune/Loss (Raw)": 0.7906121611595154, "Finetune/Step": 3754, "Finetune/Step Time": 2.9724839255213737} +{"Finetune/Learning Rate": 2.9878764734488088e-06, "Finetune/Loss": 0.7539803981781006, "Finetune/Loss (Raw)": 0.7986606955528259, "Finetune/Step": 3755, "Finetune/Step Time": 2.9729428607970476} +{"Finetune/Learning Rate": 2.9832358746083268e-06, "Finetune/Loss": 0.7544435858726501, "Finetune/Loss (Raw)": 0.8158944249153137, "Finetune/Step": 3756, "Finetune/Step Time": 2.9722564350813627} +{"Finetune/Learning Rate": 2.9785982504596165e-06, "Finetune/Loss": 0.7549136281013489, "Finetune/Loss (Raw)": 0.8225613236427307, "Finetune/Step": 3757, "Finetune/Step Time": 2.9724273681640625} +{"Finetune/Learning Rate": 2.9739636029687547e-06, "Finetune/Loss": 0.7555087208747864, "Finetune/Loss (Raw)": 0.873608410358429, "Finetune/Step": 3758, "Finetune/Step Time": 2.972177628427744} +{"Finetune/Learning Rate": 2.9693319341005632e-06, "Finetune/Loss": 0.7560933828353882, "Finetune/Loss (Raw)": 0.8236074447631836, "Finetune/Step": 3759, "Finetune/Step Time": 2.9722190648317337} +{"Finetune/Learning Rate": 2.9647032458185887e-06, "Finetune/Loss": 0.756506085395813, "Finetune/Loss (Raw)": 0.8153626322746277, "Finetune/Step": 3760, "Finetune/Step Time": 2.9701997358351946} +{"Finetune/Learning Rate": 2.960077540085118e-06, "Finetune/Loss": 0.7564595341682434, "Finetune/Loss (Raw)": 0.8355788588523865, "Finetune/Step": 3761, "Finetune/Step Time": 2.968835102394223} +{"Finetune/Learning Rate": 2.9554548188611866e-06, "Finetune/Loss": 0.7562304735183716, "Finetune/Loss (Raw)": 0.7609691023826599, "Finetune/Step": 3762, "Finetune/Step Time": 2.9678088035434484} +{"Finetune/Learning Rate": 2.95083508410654e-06, "Finetune/Loss": 0.7563890218734741, "Finetune/Loss (Raw)": 0.6441323757171631, "Finetune/Step": 3763, "Finetune/Step Time": 2.9448106940835714} +{"Finetune/Learning Rate": 2.946218337779684e-06, "Finetune/Loss": 0.75618976354599, "Finetune/Loss (Raw)": 0.754380464553833, "Finetune/Step": 3764, "Finetune/Step Time": 2.9449165109544992} +{"Finetune/Learning Rate": 2.941604581837839e-06, "Finetune/Loss": 0.7564482688903809, "Finetune/Loss (Raw)": 0.8633378744125366, "Finetune/Step": 3765, "Finetune/Step Time": 2.9444525167346} +{"Finetune/Learning Rate": 2.936993818236966e-06, "Finetune/Loss": 0.7567193508148193, "Finetune/Loss (Raw)": 0.770018458366394, "Finetune/Step": 3766, "Finetune/Step Time": 2.9461307637393475} +{"Finetune/Learning Rate": 2.9323860489317547e-06, "Finetune/Loss": 0.7561823129653931, "Finetune/Loss (Raw)": 0.7841888070106506, "Finetune/Step": 3767, "Finetune/Step Time": 2.9437427204102278} +{"Finetune/Learning Rate": 2.9277812758756217e-06, "Finetune/Loss": 0.7566617727279663, "Finetune/Loss (Raw)": 0.8256118297576904, "Finetune/Step": 3768, "Finetune/Step Time": 2.9446000903844833} +{"Finetune/Learning Rate": 2.9231795010207285e-06, "Finetune/Loss": 0.7559759616851807, "Finetune/Loss (Raw)": 0.756940484046936, "Finetune/Step": 3769, "Finetune/Step Time": 2.9450113400816917} +{"Finetune/Learning Rate": 2.9185807263179457e-06, "Finetune/Loss": 0.7562720775604248, "Finetune/Loss (Raw)": 0.8211500644683838, "Finetune/Step": 3770, "Finetune/Step Time": 2.94490123167634} +{"Finetune/Learning Rate": 2.9139849537168786e-06, "Finetune/Loss": 0.7564033269882202, "Finetune/Loss (Raw)": 0.6070160269737244, "Finetune/Step": 3771, "Finetune/Step Time": 2.9427579008042812} +{"Finetune/Learning Rate": 2.90939218516587e-06, "Finetune/Loss": 0.7557084560394287, "Finetune/Loss (Raw)": 0.7257679104804993, "Finetune/Step": 3772, "Finetune/Step Time": 2.9423314966261387} +{"Finetune/Learning Rate": 2.9048024226119786e-06, "Finetune/Loss": 0.75486820936203, "Finetune/Loss (Raw)": 0.7070279717445374, "Finetune/Step": 3773, "Finetune/Step Time": 2.9384911078959703} +{"Finetune/Learning Rate": 2.900215668000991e-06, "Finetune/Loss": 0.7531983256340027, "Finetune/Loss (Raw)": 0.5990939140319824, "Finetune/Step": 3774, "Finetune/Step Time": 2.9663194455206394} +{"Finetune/Learning Rate": 2.895631923277418e-06, "Finetune/Loss": 0.7528291940689087, "Finetune/Loss (Raw)": 0.7735199928283691, "Finetune/Step": 3775, "Finetune/Step Time": 2.962986608967185} +{"Finetune/Learning Rate": 2.891051190384496e-06, "Finetune/Loss": 0.7515865564346313, "Finetune/Loss (Raw)": 0.724793016910553, "Finetune/Step": 3776, "Finetune/Step Time": 2.9681738447397947} +{"Finetune/Learning Rate": 2.886473471264186e-06, "Finetune/Loss": 0.7516577243804932, "Finetune/Loss (Raw)": 0.6708559989929199, "Finetune/Step": 3777, "Finetune/Step Time": 2.966841757297516} +{"Finetune/Learning Rate": 2.8818987678571675e-06, "Finetune/Loss": 0.7506340146064758, "Finetune/Loss (Raw)": 0.7151859402656555, "Finetune/Step": 3778, "Finetune/Step Time": 2.965116485953331} +{"Finetune/Learning Rate": 2.8773270821028397e-06, "Finetune/Loss": 0.7518577575683594, "Finetune/Loss (Raw)": 0.816662073135376, "Finetune/Step": 3779, "Finetune/Step Time": 2.963881514966488} +{"Finetune/Learning Rate": 2.8727584159393374e-06, "Finetune/Loss": 0.7516047954559326, "Finetune/Loss (Raw)": 0.7506697773933411, "Finetune/Step": 3780, "Finetune/Step Time": 2.964404344558716} +{"Finetune/Learning Rate": 2.8681927713034907e-06, "Finetune/Loss": 0.7519456148147583, "Finetune/Loss (Raw)": 0.8185789585113525, "Finetune/Step": 3781, "Finetune/Step Time": 2.9630260206758976} +{"Finetune/Learning Rate": 2.8636301501308707e-06, "Finetune/Loss": 0.7505381107330322, "Finetune/Loss (Raw)": 0.7370270490646362, "Finetune/Step": 3782, "Finetune/Step Time": 2.962258119136095} +{"Finetune/Learning Rate": 2.8590705543557564e-06, "Finetune/Loss": 0.7509427070617676, "Finetune/Loss (Raw)": 0.8588738441467285, "Finetune/Step": 3783, "Finetune/Step Time": 2.964141398668289} +{"Finetune/Learning Rate": 2.8545139859111446e-06, "Finetune/Loss": 0.7500261068344116, "Finetune/Loss (Raw)": 0.7311166524887085, "Finetune/Step": 3784, "Finetune/Step Time": 2.96133672259748} +{"Finetune/Learning Rate": 2.8499604467287513e-06, "Finetune/Loss": 0.7507542371749878, "Finetune/Loss (Raw)": 0.8720259070396423, "Finetune/Step": 3785, "Finetune/Step Time": 2.9625337347388268} +{"Finetune/Learning Rate": 2.845409938739002e-06, "Finetune/Loss": 0.7501184940338135, "Finetune/Loss (Raw)": 0.7330977916717529, "Finetune/Step": 3786, "Finetune/Step Time": 2.9601135160773993} +{"Finetune/Learning Rate": 2.840862463871055e-06, "Finetune/Loss": 0.7513043284416199, "Finetune/Loss (Raw)": 0.9042400121688843, "Finetune/Step": 3787, "Finetune/Step Time": 2.961438648402691} +{"Finetune/Learning Rate": 2.8363180240527566e-06, "Finetune/Loss": 0.7521798014640808, "Finetune/Loss (Raw)": 0.8981634974479675, "Finetune/Step": 3788, "Finetune/Step Time": 2.9595080465078354} +{"Finetune/Learning Rate": 2.831776621210681e-06, "Finetune/Loss": 0.7518402934074402, "Finetune/Loss (Raw)": 0.744034469127655, "Finetune/Step": 3789, "Finetune/Step Time": 2.9563742484897375} +{"Finetune/Learning Rate": 2.827238257270125e-06, "Finetune/Loss": 0.7522299289703369, "Finetune/Loss (Raw)": 0.8260693550109863, "Finetune/Step": 3790, "Finetune/Step Time": 2.96052672713995} +{"Finetune/Learning Rate": 2.8227029341550705e-06, "Finetune/Loss": 0.7524135112762451, "Finetune/Loss (Raw)": 0.8493704795837402, "Finetune/Step": 3791, "Finetune/Step Time": 2.963743792846799} +{"Finetune/Learning Rate": 2.818170653788237e-06, "Finetune/Loss": 0.7538112998008728, "Finetune/Loss (Raw)": 0.912375807762146, "Finetune/Step": 3792, "Finetune/Step Time": 2.955221813172102} +{"Finetune/Learning Rate": 2.8136414180910376e-06, "Finetune/Loss": 0.7498005628585815, "Finetune/Loss (Raw)": 0.2671826481819153, "Finetune/Step": 3793, "Finetune/Step Time": 2.9861616510897875} +{"Finetune/Learning Rate": 2.809115228983601e-06, "Finetune/Loss": 0.7491433024406433, "Finetune/Loss (Raw)": 0.6725615859031677, "Finetune/Step": 3794, "Finetune/Step Time": 3.010435175150633} +{"Finetune/Learning Rate": 2.8045920883847612e-06, "Finetune/Loss": 0.7483513355255127, "Finetune/Loss (Raw)": 0.728786051273346, "Finetune/Step": 3795, "Finetune/Step Time": 3.0137253999710083} +{"Finetune/Learning Rate": 2.8000719982120606e-06, "Finetune/Loss": 0.7477313280105591, "Finetune/Loss (Raw)": 0.5317051410675049, "Finetune/Step": 3796, "Finetune/Step Time": 3.013095697388053} +{"Finetune/Learning Rate": 2.7955549603817565e-06, "Finetune/Loss": 0.7487058639526367, "Finetune/Loss (Raw)": 0.7758355736732483, "Finetune/Step": 3797, "Finetune/Step Time": 2.9933861196041107} +{"Finetune/Learning Rate": 2.7910409768087975e-06, "Finetune/Loss": 0.7507432699203491, "Finetune/Loss (Raw)": 0.9051395058631897, "Finetune/Step": 3798, "Finetune/Step Time": 2.968773275613785} +{"Finetune/Learning Rate": 2.786530049406844e-06, "Finetune/Loss": 0.7506361603736877, "Finetune/Loss (Raw)": 0.8030562996864319, "Finetune/Step": 3799, "Finetune/Step Time": 2.9687157068401575} +{"Finetune/Learning Rate": 2.7820221800882687e-06, "Finetune/Loss": 0.7499691247940063, "Finetune/Loss (Raw)": 0.699363112449646, "Finetune/Step": 3800, "Finetune/Step Time": 2.9706292059272528} +{"Finetune/Learning Rate": 2.7775173707641357e-06, "Finetune/Loss": 0.7519190311431885, "Finetune/Loss (Raw)": 0.867236852645874, "Finetune/Step": 3801, "Finetune/Step Time": 2.945180268958211} +{"Finetune/Learning Rate": 2.7730156233442185e-06, "Finetune/Loss": 0.7519867420196533, "Finetune/Loss (Raw)": 0.7722585201263428, "Finetune/Step": 3802, "Finetune/Step Time": 2.948759652674198} +{"Finetune/Learning Rate": 2.7685169397369902e-06, "Finetune/Loss": 0.752264142036438, "Finetune/Loss (Raw)": 0.8329628109931946, "Finetune/Step": 3803, "Finetune/Step Time": 2.9493352565914392} +{"Finetune/Learning Rate": 2.764021321849627e-06, "Finetune/Loss": 0.7530045509338379, "Finetune/Loss (Raw)": 0.8634974956512451, "Finetune/Step": 3804, "Finetune/Step Time": 2.950526311993599} +{"Finetune/Learning Rate": 2.7595287715880025e-06, "Finetune/Loss": 0.753031849861145, "Finetune/Loss (Raw)": 0.7541449666023254, "Finetune/Step": 3805, "Finetune/Step Time": 2.9484862741082907} +{"Finetune/Learning Rate": 2.7550392908566903e-06, "Finetune/Loss": 0.7539149522781372, "Finetune/Loss (Raw)": 0.9046564698219299, "Finetune/Step": 3806, "Finetune/Step Time": 2.9486744720488787} +{"Finetune/Learning Rate": 2.7505528815589723e-06, "Finetune/Loss": 0.7551491260528564, "Finetune/Loss (Raw)": 0.9227121472358704, "Finetune/Step": 3807, "Finetune/Step Time": 2.949523698538542} +{"Finetune/Learning Rate": 2.74606954559681e-06, "Finetune/Loss": 0.7542939186096191, "Finetune/Loss (Raw)": 0.7197814583778381, "Finetune/Step": 3808, "Finetune/Step Time": 2.9470872953534126} +{"Finetune/Learning Rate": 2.7415892848708725e-06, "Finetune/Loss": 0.7528448104858398, "Finetune/Loss (Raw)": 0.668053925037384, "Finetune/Step": 3809, "Finetune/Step Time": 2.9427886437624693} +{"Finetune/Learning Rate": 2.737112101280531e-06, "Finetune/Loss": 0.7506073713302612, "Finetune/Loss (Raw)": 0.5363410711288452, "Finetune/Step": 3810, "Finetune/Step Time": 2.9669955652207136} +{"Finetune/Learning Rate": 2.7326379967238427e-06, "Finetune/Loss": 0.7516505718231201, "Finetune/Loss (Raw)": 0.8837896585464478, "Finetune/Step": 3811, "Finetune/Step Time": 2.966164417564869} +{"Finetune/Learning Rate": 2.7281669730975625e-06, "Finetune/Loss": 0.7523032426834106, "Finetune/Loss (Raw)": 0.9061766266822815, "Finetune/Step": 3812, "Finetune/Step Time": 2.9666795562952757} +{"Finetune/Learning Rate": 2.723699032297139e-06, "Finetune/Loss": 0.7524405717849731, "Finetune/Loss (Raw)": 0.8193285465240479, "Finetune/Step": 3813, "Finetune/Step Time": 2.9666626881808043} +{"Finetune/Learning Rate": 2.719234176216713e-06, "Finetune/Loss": 0.7529390454292297, "Finetune/Loss (Raw)": 0.8656174540519714, "Finetune/Step": 3814, "Finetune/Step Time": 2.9667376168072224} +{"Finetune/Learning Rate": 2.714772406749121e-06, "Finetune/Loss": 0.7530142068862915, "Finetune/Loss (Raw)": 0.8714828491210938, "Finetune/Step": 3815, "Finetune/Step Time": 2.965336464345455} +{"Finetune/Learning Rate": 2.7103137257858867e-06, "Finetune/Loss": 0.7534700036048889, "Finetune/Loss (Raw)": 0.8092972636222839, "Finetune/Step": 3816, "Finetune/Step Time": 2.968921644613147} +{"Finetune/Learning Rate": 2.7058581352172242e-06, "Finetune/Loss": 0.7534687519073486, "Finetune/Loss (Raw)": 0.8924320340156555, "Finetune/Step": 3817, "Finetune/Step Time": 2.9708667881786823} +{"Finetune/Learning Rate": 2.7014056369320486e-06, "Finetune/Loss": 0.7548084259033203, "Finetune/Loss (Raw)": 0.8465558886528015, "Finetune/Step": 3818, "Finetune/Step Time": 2.944249678403139} +{"Finetune/Learning Rate": 2.6969562328179423e-06, "Finetune/Loss": 0.7555080056190491, "Finetune/Loss (Raw)": 0.6743341088294983, "Finetune/Step": 3819, "Finetune/Step Time": 2.918890008702874} +{"Finetune/Learning Rate": 2.6925099247611985e-06, "Finetune/Loss": 0.7558237910270691, "Finetune/Loss (Raw)": 0.851306676864624, "Finetune/Step": 3820, "Finetune/Step Time": 2.9261927474290133} +{"Finetune/Learning Rate": 2.6880667146467854e-06, "Finetune/Loss": 0.7564127445220947, "Finetune/Loss (Raw)": 0.5928739309310913, "Finetune/Step": 3821, "Finetune/Step Time": 2.929336676374078} +{"Finetune/Learning Rate": 2.6836266043583593e-06, "Finetune/Loss": 0.7565311193466187, "Finetune/Loss (Raw)": 0.7208502292633057, "Finetune/Step": 3822, "Finetune/Step Time": 2.92938194796443} +{"Finetune/Learning Rate": 2.679189595778264e-06, "Finetune/Loss": 0.756634533405304, "Finetune/Loss (Raw)": 0.7508122324943542, "Finetune/Step": 3823, "Finetune/Step Time": 2.92833037301898} +{"Finetune/Learning Rate": 2.674755690787526e-06, "Finetune/Loss": 0.7558329105377197, "Finetune/Loss (Raw)": 0.7205865979194641, "Finetune/Step": 3824, "Finetune/Step Time": 2.950606692582369} +{"Finetune/Learning Rate": 2.6703248912658653e-06, "Finetune/Loss": 0.7560673952102661, "Finetune/Loss (Raw)": 0.7921498417854309, "Finetune/Step": 3825, "Finetune/Step Time": 2.951846070587635} +{"Finetune/Learning Rate": 2.6658971990916704e-06, "Finetune/Loss": 0.7590943574905396, "Finetune/Loss (Raw)": 0.8046790361404419, "Finetune/Step": 3826, "Finetune/Step Time": 2.920150935649872} +{"Finetune/Learning Rate": 2.66147261614202e-06, "Finetune/Loss": 0.7599086165428162, "Finetune/Loss (Raw)": 0.7607056498527527, "Finetune/Step": 3827, "Finetune/Step Time": 2.9242165461182594} +{"Finetune/Learning Rate": 2.657051144292684e-06, "Finetune/Loss": 0.7600008845329285, "Finetune/Loss (Raw)": 0.7668256163597107, "Finetune/Step": 3828, "Finetune/Step Time": 2.924792991951108} +{"Finetune/Learning Rate": 2.6526327854180913e-06, "Finetune/Loss": 0.7589148879051208, "Finetune/Loss (Raw)": 0.7824637293815613, "Finetune/Step": 3829, "Finetune/Step Time": 2.920600313693285} +{"Finetune/Learning Rate": 2.6482175413913723e-06, "Finetune/Loss": 0.75836181640625, "Finetune/Loss (Raw)": 0.7270919680595398, "Finetune/Step": 3830, "Finetune/Step Time": 2.9221428837627172} +{"Finetune/Learning Rate": 2.6438054140843284e-06, "Finetune/Loss": 0.7582684755325317, "Finetune/Loss (Raw)": 0.7718886137008667, "Finetune/Step": 3831, "Finetune/Step Time": 2.9212346244603395} +{"Finetune/Learning Rate": 2.639396405367437e-06, "Finetune/Loss": 0.7578514814376831, "Finetune/Loss (Raw)": 0.7405808568000793, "Finetune/Step": 3832, "Finetune/Step Time": 2.9317315611988306} +{"Finetune/Learning Rate": 2.6349905171098576e-06, "Finetune/Loss": 0.7630070447921753, "Finetune/Loss (Raw)": 0.8467704057693481, "Finetune/Step": 3833, "Finetune/Step Time": 2.8995028622448444} +{"Finetune/Learning Rate": 2.630587751179422e-06, "Finetune/Loss": 0.7639780640602112, "Finetune/Loss (Raw)": 0.8079156875610352, "Finetune/Step": 3834, "Finetune/Step Time": 2.9010192696005106} +{"Finetune/Learning Rate": 2.626188109442652e-06, "Finetune/Loss": 0.7631789445877075, "Finetune/Loss (Raw)": 0.7309398055076599, "Finetune/Step": 3835, "Finetune/Step Time": 2.8992924075573683} +{"Finetune/Learning Rate": 2.621791593764724e-06, "Finetune/Loss": 0.7624398469924927, "Finetune/Loss (Raw)": 0.8166660070419312, "Finetune/Step": 3836, "Finetune/Step Time": 2.90165751054883} +{"Finetune/Learning Rate": 2.6173982060095005e-06, "Finetune/Loss": 0.7624545097351074, "Finetune/Loss (Raw)": 0.7110360264778137, "Finetune/Step": 3837, "Finetune/Step Time": 2.9020184986293316} +{"Finetune/Learning Rate": 2.613007948039524e-06, "Finetune/Loss": 0.7647644877433777, "Finetune/Loss (Raw)": 0.7904230356216431, "Finetune/Step": 3838, "Finetune/Step Time": 2.8719826284796} +{"Finetune/Learning Rate": 2.6086208217160003e-06, "Finetune/Loss": 0.7661844491958618, "Finetune/Loss (Raw)": 0.9532080292701721, "Finetune/Step": 3839, "Finetune/Step Time": 2.8732850924134254} +{"Finetune/Learning Rate": 2.6042368288988097e-06, "Finetune/Loss": 0.7622780799865723, "Finetune/Loss (Raw)": 0.23100852966308594, "Finetune/Step": 3840, "Finetune/Step Time": 2.903391068801284} +{"Finetune/Learning Rate": 2.5998559714465053e-06, "Finetune/Loss": 0.761637806892395, "Finetune/Loss (Raw)": 0.7741132378578186, "Finetune/Step": 3841, "Finetune/Step Time": 2.907303299754858} +{"Finetune/Learning Rate": 2.5954782512163123e-06, "Finetune/Loss": 0.7619743347167969, "Finetune/Loss (Raw)": 0.7401888370513916, "Finetune/Step": 3842, "Finetune/Step Time": 2.8844484109431505} +{"Finetune/Learning Rate": 2.5911036700641225e-06, "Finetune/Loss": 0.762471616268158, "Finetune/Loss (Raw)": 0.7551994919776917, "Finetune/Step": 3843, "Finetune/Step Time": 2.864693321287632} +{"Finetune/Learning Rate": 2.5867322298444995e-06, "Finetune/Loss": 0.7653379440307617, "Finetune/Loss (Raw)": 0.5995326042175293, "Finetune/Step": 3844, "Finetune/Step Time": 2.856772927567363} +{"Finetune/Learning Rate": 2.582363932410673e-06, "Finetune/Loss": 0.7649333477020264, "Finetune/Loss (Raw)": 0.8075057864189148, "Finetune/Step": 3845, "Finetune/Step Time": 2.8561359755694866} +{"Finetune/Learning Rate": 2.5779987796145487e-06, "Finetune/Loss": 0.7664024829864502, "Finetune/Loss (Raw)": 0.88750159740448, "Finetune/Step": 3846, "Finetune/Step Time": 2.8566725850105286} +{"Finetune/Learning Rate": 2.5736367733066824e-06, "Finetune/Loss": 0.7660781741142273, "Finetune/Loss (Raw)": 0.7823138236999512, "Finetune/Step": 3847, "Finetune/Step Time": 2.856197528541088} +{"Finetune/Learning Rate": 2.5692779153363133e-06, "Finetune/Loss": 0.7668688893318176, "Finetune/Loss (Raw)": 0.8117945790290833, "Finetune/Step": 3848, "Finetune/Step Time": 2.8466696981340647} +{"Finetune/Learning Rate": 2.564922207551337e-06, "Finetune/Loss": 0.7661228179931641, "Finetune/Loss (Raw)": 0.7284995913505554, "Finetune/Step": 3849, "Finetune/Step Time": 2.8454916030168533} +{"Finetune/Learning Rate": 2.560569651798315e-06, "Finetune/Loss": 0.7667328715324402, "Finetune/Loss (Raw)": 0.783012330532074, "Finetune/Step": 3850, "Finetune/Step Time": 2.8393670860677958} +{"Finetune/Learning Rate": 2.556220249922472e-06, "Finetune/Loss": 0.7668235301971436, "Finetune/Loss (Raw)": 0.8426129817962646, "Finetune/Step": 3851, "Finetune/Step Time": 2.8421255704015493} +{"Finetune/Learning Rate": 2.5518740037676947e-06, "Finetune/Loss": 0.7678667306900024, "Finetune/Loss (Raw)": 0.9412161707878113, "Finetune/Step": 3852, "Finetune/Step Time": 2.8437255024909973} +{"Finetune/Learning Rate": 2.5475309151765413e-06, "Finetune/Loss": 0.7677097320556641, "Finetune/Loss (Raw)": 0.820629358291626, "Finetune/Step": 3853, "Finetune/Step Time": 2.8441736418753862} +{"Finetune/Learning Rate": 2.543190985990215e-06, "Finetune/Loss": 0.7691035270690918, "Finetune/Loss (Raw)": 0.8215087056159973, "Finetune/Step": 3854, "Finetune/Step Time": 2.840564666315913} +{"Finetune/Learning Rate": 2.5388542180485897e-06, "Finetune/Loss": 0.7690917253494263, "Finetune/Loss (Raw)": 0.7370760440826416, "Finetune/Step": 3855, "Finetune/Step Time": 2.861632853746414} +{"Finetune/Learning Rate": 2.5345206131902044e-06, "Finetune/Loss": 0.770889401435852, "Finetune/Loss (Raw)": 0.805503249168396, "Finetune/Step": 3856, "Finetune/Step Time": 2.838866012170911} +{"Finetune/Learning Rate": 2.5301901732522407e-06, "Finetune/Loss": 0.7699242830276489, "Finetune/Loss (Raw)": 0.6596524715423584, "Finetune/Step": 3857, "Finetune/Step Time": 2.8565524872392416} +{"Finetune/Learning Rate": 2.525862900070556e-06, "Finetune/Loss": 0.7696956992149353, "Finetune/Loss (Raw)": 0.6787956953048706, "Finetune/Step": 3858, "Finetune/Step Time": 2.862566363066435} +{"Finetune/Learning Rate": 2.5215387954796554e-06, "Finetune/Loss": 0.7705867290496826, "Finetune/Loss (Raw)": 0.799085795879364, "Finetune/Step": 3859, "Finetune/Step Time": 2.8407659269869328} +{"Finetune/Learning Rate": 2.517217861312702e-06, "Finetune/Loss": 0.7706365585327148, "Finetune/Loss (Raw)": 0.8599714636802673, "Finetune/Step": 3860, "Finetune/Step Time": 2.836938040331006} +{"Finetune/Learning Rate": 2.512900099401515e-06, "Finetune/Loss": 0.7700332403182983, "Finetune/Loss (Raw)": 0.7914379239082336, "Finetune/Step": 3861, "Finetune/Step Time": 2.839941818267107} +{"Finetune/Learning Rate": 2.5085855115765678e-06, "Finetune/Loss": 0.7703095078468323, "Finetune/Loss (Raw)": 0.8156596422195435, "Finetune/Step": 3862, "Finetune/Step Time": 2.8401870038360357} +{"Finetune/Learning Rate": 2.504274099666998e-06, "Finetune/Loss": 0.774433970451355, "Finetune/Loss (Raw)": 0.770196259021759, "Finetune/Step": 3863, "Finetune/Step Time": 2.8193089179694653} +{"Finetune/Learning Rate": 2.4999658655005786e-06, "Finetune/Loss": 0.7750158309936523, "Finetune/Loss (Raw)": 0.8344841599464417, "Finetune/Step": 3864, "Finetune/Step Time": 2.82047931663692} +{"Finetune/Learning Rate": 2.4956608109037473e-06, "Finetune/Loss": 0.7740720510482788, "Finetune/Loss (Raw)": 0.6006121635437012, "Finetune/Step": 3865, "Finetune/Step Time": 2.843832843005657} +{"Finetune/Learning Rate": 2.491358937701597e-06, "Finetune/Loss": 0.7725982666015625, "Finetune/Loss (Raw)": 0.5590041279792786, "Finetune/Step": 3866, "Finetune/Step Time": 2.867025265470147} +{"Finetune/Learning Rate": 2.4870602477178627e-06, "Finetune/Loss": 0.772048830986023, "Finetune/Loss (Raw)": 0.761601984500885, "Finetune/Step": 3867, "Finetune/Step Time": 2.862342095002532} +{"Finetune/Learning Rate": 2.4827647427749347e-06, "Finetune/Loss": 0.7723792195320129, "Finetune/Loss (Raw)": 0.8110778331756592, "Finetune/Step": 3868, "Finetune/Step Time": 2.8615731466561556} +{"Finetune/Learning Rate": 2.478472424693853e-06, "Finetune/Loss": 0.77182936668396, "Finetune/Loss (Raw)": 0.7535924315452576, "Finetune/Step": 3869, "Finetune/Step Time": 2.861426306888461} +{"Finetune/Learning Rate": 2.474183295294306e-06, "Finetune/Loss": 0.7708942890167236, "Finetune/Loss (Raw)": 0.7323339581489563, "Finetune/Step": 3870, "Finetune/Step Time": 2.8644998241215944} +{"Finetune/Learning Rate": 2.4698973563946284e-06, "Finetune/Loss": 0.7700207233428955, "Finetune/Loss (Raw)": 0.6477208137512207, "Finetune/Step": 3871, "Finetune/Step Time": 2.8609564024955034} +{"Finetune/Learning Rate": 2.465614609811805e-06, "Finetune/Loss": 0.7696669101715088, "Finetune/Loss (Raw)": 0.7909173369407654, "Finetune/Step": 3872, "Finetune/Step Time": 2.863843984901905} +{"Finetune/Learning Rate": 2.4613350573614637e-06, "Finetune/Loss": 0.7704333662986755, "Finetune/Loss (Raw)": 0.8105505704879761, "Finetune/Step": 3873, "Finetune/Step Time": 2.8691172897815704} +{"Finetune/Learning Rate": 2.4570587008578896e-06, "Finetune/Loss": 0.7699742913246155, "Finetune/Loss (Raw)": 0.7902455925941467, "Finetune/Step": 3874, "Finetune/Step Time": 2.8678809888660908} +{"Finetune/Learning Rate": 2.4527855421139923e-06, "Finetune/Loss": 0.7694146633148193, "Finetune/Loss (Raw)": 0.7475622892379761, "Finetune/Step": 3875, "Finetune/Step Time": 2.8682956658303738} +{"Finetune/Learning Rate": 2.4485155829413466e-06, "Finetune/Loss": 0.7690597176551819, "Finetune/Loss (Raw)": 0.7677735686302185, "Finetune/Step": 3876, "Finetune/Step Time": 2.8692217990756035} +{"Finetune/Learning Rate": 2.4442488251501597e-06, "Finetune/Loss": 0.768999457359314, "Finetune/Loss (Raw)": 0.818812906742096, "Finetune/Step": 3877, "Finetune/Step Time": 2.867555718868971} +{"Finetune/Learning Rate": 2.439985270549281e-06, "Finetune/Loss": 0.7690272331237793, "Finetune/Loss (Raw)": 0.7836358547210693, "Finetune/Step": 3878, "Finetune/Step Time": 2.869023445993662} +{"Finetune/Learning Rate": 2.4357249209462087e-06, "Finetune/Loss": 0.7698973417282104, "Finetune/Loss (Raw)": 0.7748238444328308, "Finetune/Step": 3879, "Finetune/Step Time": 2.8708404172211885} +{"Finetune/Learning Rate": 2.4314677781470717e-06, "Finetune/Loss": 0.77081698179245, "Finetune/Loss (Raw)": 0.8759170770645142, "Finetune/Step": 3880, "Finetune/Step Time": 2.8703889045864344} +{"Finetune/Learning Rate": 2.4272138439566574e-06, "Finetune/Loss": 0.77155601978302, "Finetune/Loss (Raw)": 0.8882465958595276, "Finetune/Step": 3881, "Finetune/Step Time": 2.8697401508688927} +{"Finetune/Learning Rate": 2.422963120178372e-06, "Finetune/Loss": 0.7713414430618286, "Finetune/Loss (Raw)": 0.7631480693817139, "Finetune/Step": 3882, "Finetune/Step Time": 2.8706920817494392} +{"Finetune/Learning Rate": 2.4187156086142692e-06, "Finetune/Loss": 0.7706619501113892, "Finetune/Loss (Raw)": 0.7116758823394775, "Finetune/Step": 3883, "Finetune/Step Time": 2.8715258594602346} +{"Finetune/Learning Rate": 2.414471311065053e-06, "Finetune/Loss": 0.7701433897018433, "Finetune/Loss (Raw)": 0.7495203614234924, "Finetune/Step": 3884, "Finetune/Step Time": 2.8744386937469244} +{"Finetune/Learning Rate": 2.4102302293300393e-06, "Finetune/Loss": 0.7694213390350342, "Finetune/Loss (Raw)": 0.7301414608955383, "Finetune/Step": 3885, "Finetune/Step Time": 2.8754476197063923} +{"Finetune/Learning Rate": 2.405992365207207e-06, "Finetune/Loss": 0.7686237096786499, "Finetune/Loss (Raw)": 0.7715108394622803, "Finetune/Step": 3886, "Finetune/Step Time": 2.8768854569643736} +{"Finetune/Learning Rate": 2.401757720493153e-06, "Finetune/Loss": 0.7684744596481323, "Finetune/Loss (Raw)": 0.8044971823692322, "Finetune/Step": 3887, "Finetune/Step Time": 2.8784010242670774} +{"Finetune/Learning Rate": 2.397526296983118e-06, "Finetune/Loss": 0.7681199312210083, "Finetune/Loss (Raw)": 0.769989013671875, "Finetune/Step": 3888, "Finetune/Step Time": 2.88581277243793} +{"Finetune/Learning Rate": 2.393298096470974e-06, "Finetune/Loss": 0.7674379348754883, "Finetune/Loss (Raw)": 0.7482861876487732, "Finetune/Step": 3889, "Finetune/Step Time": 2.8883382957428694} +{"Finetune/Learning Rate": 2.3890731207492235e-06, "Finetune/Loss": 0.768593430519104, "Finetune/Loss (Raw)": 0.9088642597198486, "Finetune/Step": 3890, "Finetune/Step Time": 2.8844914715737104} +{"Finetune/Learning Rate": 2.384851371609014e-06, "Finetune/Loss": 0.7702163457870483, "Finetune/Loss (Raw)": 0.8518663644790649, "Finetune/Step": 3891, "Finetune/Step Time": 2.883530095219612} +{"Finetune/Learning Rate": 2.38063285084011e-06, "Finetune/Loss": 0.7686996459960938, "Finetune/Loss (Raw)": 0.5602492690086365, "Finetune/Step": 3892, "Finetune/Step Time": 2.907153218984604} +{"Finetune/Learning Rate": 2.3764175602309113e-06, "Finetune/Loss": 0.7681385278701782, "Finetune/Loss (Raw)": 0.7915142774581909, "Finetune/Step": 3893, "Finetune/Step Time": 2.9083181750029325} +{"Finetune/Learning Rate": 2.3722055015684598e-06, "Finetune/Loss": 0.7677052021026611, "Finetune/Loss (Raw)": 0.7145580053329468, "Finetune/Step": 3894, "Finetune/Step Time": 2.910875715315342} +{"Finetune/Learning Rate": 2.3679966766384145e-06, "Finetune/Loss": 0.7677249312400818, "Finetune/Loss (Raw)": 0.78670734167099, "Finetune/Step": 3895, "Finetune/Step Time": 2.911773217841983} +{"Finetune/Learning Rate": 2.3637910872250656e-06, "Finetune/Loss": 0.767427384853363, "Finetune/Loss (Raw)": 0.7875263094902039, "Finetune/Step": 3896, "Finetune/Step Time": 2.910482831299305} +{"Finetune/Learning Rate": 2.3595887351113367e-06, "Finetune/Loss": 0.7673834562301636, "Finetune/Loss (Raw)": 0.7513245344161987, "Finetune/Step": 3897, "Finetune/Step Time": 2.910957148298621} +{"Finetune/Learning Rate": 2.355389622078773e-06, "Finetune/Loss": 0.7669785022735596, "Finetune/Loss (Raw)": 0.7693138122558594, "Finetune/Step": 3898, "Finetune/Step Time": 2.913807211443782} +{"Finetune/Learning Rate": 2.351193749907551e-06, "Finetune/Loss": 0.7684677243232727, "Finetune/Loss (Raw)": 0.7976307272911072, "Finetune/Step": 3899, "Finetune/Step Time": 2.889749813824892} +{"Finetune/Learning Rate": 2.347001120376472e-06, "Finetune/Loss": 0.769400954246521, "Finetune/Loss (Raw)": 0.8452160954475403, "Finetune/Step": 3900, "Finetune/Step Time": 2.886842254549265} +{"Finetune/Learning Rate": 2.3428117352629586e-06, "Finetune/Loss": 0.7705361843109131, "Finetune/Loss (Raw)": 0.85234135389328, "Finetune/Step": 3901, "Finetune/Step Time": 2.887822376564145} +{"Finetune/Learning Rate": 2.338625596343069e-06, "Finetune/Loss": 0.7724298238754272, "Finetune/Loss (Raw)": 0.8414897918701172, "Finetune/Step": 3902, "Finetune/Step Time": 2.863616842776537} +{"Finetune/Learning Rate": 2.334442705391469e-06, "Finetune/Loss": 0.7705475091934204, "Finetune/Loss (Raw)": 0.5325758457183838, "Finetune/Step": 3903, "Finetune/Step Time": 2.8883251268416643} +{"Finetune/Learning Rate": 2.3302630641814626e-06, "Finetune/Loss": 0.7712099552154541, "Finetune/Loss (Raw)": 0.8095853924751282, "Finetune/Step": 3904, "Finetune/Step Time": 2.8810892403125763} +{"Finetune/Learning Rate": 2.3260866744849677e-06, "Finetune/Loss": 0.7720696926116943, "Finetune/Loss (Raw)": 0.7809075117111206, "Finetune/Step": 3905, "Finetune/Step Time": 2.8821069207042456} +{"Finetune/Learning Rate": 2.3219135380725254e-06, "Finetune/Loss": 0.7686349749565125, "Finetune/Loss (Raw)": 0.2755361795425415, "Finetune/Step": 3906, "Finetune/Step Time": 2.9162902049720287} +{"Finetune/Learning Rate": 2.3177436567132994e-06, "Finetune/Loss": 0.7687863707542419, "Finetune/Loss (Raw)": 0.8360390067100525, "Finetune/Step": 3907, "Finetune/Step Time": 2.9213421791791916} +{"Finetune/Learning Rate": 2.313577032175067e-06, "Finetune/Loss": 0.7645293474197388, "Finetune/Loss (Raw)": 0.2057756930589676, "Finetune/Step": 3908, "Finetune/Step Time": 2.9473104123026133} +{"Finetune/Learning Rate": 2.3094136662242406e-06, "Finetune/Loss": 0.7633217573165894, "Finetune/Loss (Raw)": 0.6640072464942932, "Finetune/Step": 3909, "Finetune/Step Time": 2.949350342154503} +{"Finetune/Learning Rate": 2.3052535606258297e-06, "Finetune/Loss": 0.7639725208282471, "Finetune/Loss (Raw)": 0.8203223347663879, "Finetune/Step": 3910, "Finetune/Step Time": 2.950237674638629} +{"Finetune/Learning Rate": 2.3010967171434752e-06, "Finetune/Loss": 0.7636237144470215, "Finetune/Loss (Raw)": 0.8142304420471191, "Finetune/Step": 3911, "Finetune/Step Time": 2.946661254391074} +{"Finetune/Learning Rate": 2.296943137539437e-06, "Finetune/Loss": 0.7635757923126221, "Finetune/Loss (Raw)": 0.7249746918678284, "Finetune/Step": 3912, "Finetune/Step Time": 2.9470976144075394} +{"Finetune/Learning Rate": 2.292792823574578e-06, "Finetune/Loss": 0.7626208066940308, "Finetune/Loss (Raw)": 0.7497992515563965, "Finetune/Step": 3913, "Finetune/Step Time": 2.944720344617963} +{"Finetune/Learning Rate": 2.2886457770083923e-06, "Finetune/Loss": 0.7638840675354004, "Finetune/Loss (Raw)": 0.8947931528091431, "Finetune/Step": 3914, "Finetune/Step Time": 2.9487015437334776} +{"Finetune/Learning Rate": 2.2845019995989794e-06, "Finetune/Loss": 0.7630050182342529, "Finetune/Loss (Raw)": 0.7917150855064392, "Finetune/Step": 3915, "Finetune/Step Time": 2.955129159614444} +{"Finetune/Learning Rate": 2.280361493103055e-06, "Finetune/Loss": 0.7623734474182129, "Finetune/Loss (Raw)": 0.8173215389251709, "Finetune/Step": 3916, "Finetune/Step Time": 2.9565642904490232} +{"Finetune/Learning Rate": 2.2762242592759476e-06, "Finetune/Loss": 0.7621486186981201, "Finetune/Loss (Raw)": 0.7152635455131531, "Finetune/Step": 3917, "Finetune/Step Time": 2.9539470933377743} +{"Finetune/Learning Rate": 2.2720902998715976e-06, "Finetune/Loss": 0.7611533403396606, "Finetune/Loss (Raw)": 0.6986679434776306, "Finetune/Step": 3918, "Finetune/Step Time": 2.9515038188546896} +{"Finetune/Learning Rate": 2.2679596166425653e-06, "Finetune/Loss": 0.7613822221755981, "Finetune/Loss (Raw)": 0.8786657452583313, "Finetune/Step": 3919, "Finetune/Step Time": 2.95059273019433} +{"Finetune/Learning Rate": 2.263832211340008e-06, "Finetune/Loss": 0.7598593831062317, "Finetune/Loss (Raw)": 0.7174543738365173, "Finetune/Step": 3920, "Finetune/Step Time": 2.950543152168393} +{"Finetune/Learning Rate": 2.2597080857137e-06, "Finetune/Loss": 0.7642793655395508, "Finetune/Loss (Raw)": 0.8329392671585083, "Finetune/Step": 3921, "Finetune/Step Time": 2.917309645563364} +{"Finetune/Learning Rate": 2.255587241512033e-06, "Finetune/Loss": 0.7650172710418701, "Finetune/Loss (Raw)": 0.7670166492462158, "Finetune/Step": 3922, "Finetune/Step Time": 2.895363114774227} +{"Finetune/Learning Rate": 2.2514696804819957e-06, "Finetune/Loss": 0.7643157839775085, "Finetune/Loss (Raw)": 0.6389925479888916, "Finetune/Step": 3923, "Finetune/Step Time": 2.8922094497829676} +{"Finetune/Learning Rate": 2.2473554043691915e-06, "Finetune/Loss": 0.7666870355606079, "Finetune/Loss (Raw)": 0.8352286219596863, "Finetune/Step": 3924, "Finetune/Step Time": 2.868541205301881} +{"Finetune/Learning Rate": 2.243244414917828e-06, "Finetune/Loss": 0.7668102383613586, "Finetune/Loss (Raw)": 0.7916057705879211, "Finetune/Step": 3925, "Finetune/Step Time": 2.86544849909842} +{"Finetune/Learning Rate": 2.239136713870722e-06, "Finetune/Loss": 0.7656046748161316, "Finetune/Loss (Raw)": 0.7508283853530884, "Finetune/Step": 3926, "Finetune/Step Time": 2.8666711542755365} +{"Finetune/Learning Rate": 2.2350323029692944e-06, "Finetune/Loss": 0.7650336027145386, "Finetune/Loss (Raw)": 0.7299599051475525, "Finetune/Step": 3927, "Finetune/Step Time": 2.866604493930936} +{"Finetune/Learning Rate": 2.2309311839535717e-06, "Finetune/Loss": 0.7652698159217834, "Finetune/Loss (Raw)": 0.7295957803726196, "Finetune/Step": 3928, "Finetune/Step Time": 2.8901225831359625} +{"Finetune/Learning Rate": 2.226833358562184e-06, "Finetune/Loss": 0.7653166055679321, "Finetune/Loss (Raw)": 0.8732327818870544, "Finetune/Step": 3929, "Finetune/Step Time": 2.895277826115489} +{"Finetune/Learning Rate": 2.2227388285323726e-06, "Finetune/Loss": 0.7650190591812134, "Finetune/Loss (Raw)": 0.7341621518135071, "Finetune/Step": 3930, "Finetune/Step Time": 2.895443746820092} +{"Finetune/Learning Rate": 2.2186475955999642e-06, "Finetune/Loss": 0.7648166418075562, "Finetune/Loss (Raw)": 0.8070572018623352, "Finetune/Step": 3931, "Finetune/Step Time": 2.8944316767156124} +{"Finetune/Learning Rate": 2.214559661499409e-06, "Finetune/Loss": 0.7594597339630127, "Finetune/Loss (Raw)": 0.1778133362531662, "Finetune/Step": 3932, "Finetune/Step Time": 2.921141877770424} +{"Finetune/Learning Rate": 2.2104750279637443e-06, "Finetune/Loss": 0.7600739002227783, "Finetune/Loss (Raw)": 0.8327558636665344, "Finetune/Step": 3933, "Finetune/Step Time": 2.9223480708897114} +{"Finetune/Learning Rate": 2.2063936967246136e-06, "Finetune/Loss": 0.758698046207428, "Finetune/Loss (Raw)": 0.7285529375076294, "Finetune/Step": 3934, "Finetune/Step Time": 2.9203990697860718} +{"Finetune/Learning Rate": 2.202315669512257e-06, "Finetune/Loss": 0.7582172155380249, "Finetune/Loss (Raw)": 0.8611612915992737, "Finetune/Step": 3935, "Finetune/Step Time": 2.9201306123286486} +{"Finetune/Learning Rate": 2.1982409480555165e-06, "Finetune/Loss": 0.7593284249305725, "Finetune/Loss (Raw)": 0.8620193004608154, "Finetune/Step": 3936, "Finetune/Step Time": 2.9222754649817944} +{"Finetune/Learning Rate": 2.194169534081838e-06, "Finetune/Loss": 0.7606930732727051, "Finetune/Loss (Raw)": 0.8427278399467468, "Finetune/Step": 3937, "Finetune/Step Time": 2.925356015563011} +{"Finetune/Learning Rate": 2.190101429317253e-06, "Finetune/Loss": 0.7628402709960938, "Finetune/Loss (Raw)": 0.8111889362335205, "Finetune/Step": 3938, "Finetune/Step Time": 2.90206753090024} +{"Finetune/Learning Rate": 2.186036635486395e-06, "Finetune/Loss": 0.762374222278595, "Finetune/Loss (Raw)": 0.8241322040557861, "Finetune/Step": 3939, "Finetune/Step Time": 2.903919830918312} +{"Finetune/Learning Rate": 2.1819751543125055e-06, "Finetune/Loss": 0.7612974643707275, "Finetune/Loss (Raw)": 0.7683576941490173, "Finetune/Step": 3940, "Finetune/Step Time": 2.9050878547132015} +{"Finetune/Learning Rate": 2.177916987517399e-06, "Finetune/Loss": 0.7603294849395752, "Finetune/Loss (Raw)": 0.6954168677330017, "Finetune/Step": 3941, "Finetune/Step Time": 2.9049608148634434} +{"Finetune/Learning Rate": 2.1738621368215075e-06, "Finetune/Loss": 0.7604987621307373, "Finetune/Loss (Raw)": 0.8872827291488647, "Finetune/Step": 3942, "Finetune/Step Time": 2.904194224625826} +{"Finetune/Learning Rate": 2.1698106039438416e-06, "Finetune/Loss": 0.7596901059150696, "Finetune/Loss (Raw)": 0.7679758667945862, "Finetune/Step": 3943, "Finetune/Step Time": 2.907074837014079} +{"Finetune/Learning Rate": 2.165762390602014e-06, "Finetune/Loss": 0.7589970827102661, "Finetune/Loss (Raw)": 0.7205955386161804, "Finetune/Step": 3944, "Finetune/Step Time": 2.9195152390748262} +{"Finetune/Learning Rate": 2.1617174985122247e-06, "Finetune/Loss": 0.7583115100860596, "Finetune/Loss (Raw)": 0.8046687245368958, "Finetune/Step": 3945, "Finetune/Step Time": 2.919460402801633} +{"Finetune/Learning Rate": 2.157675929389267e-06, "Finetune/Loss": 0.7581422328948975, "Finetune/Loss (Raw)": 0.8248951435089111, "Finetune/Step": 3946, "Finetune/Step Time": 2.9214448630809784} +{"Finetune/Learning Rate": 2.1536376849465347e-06, "Finetune/Loss": 0.7588654160499573, "Finetune/Loss (Raw)": 0.7669037580490112, "Finetune/Step": 3947, "Finetune/Step Time": 2.9247683715075254} +{"Finetune/Learning Rate": 2.149602766895994e-06, "Finetune/Loss": 0.7590917348861694, "Finetune/Loss (Raw)": 0.8802731037139893, "Finetune/Step": 3948, "Finetune/Step Time": 2.9177939891815186} +{"Finetune/Learning Rate": 2.1455711769482113e-06, "Finetune/Loss": 0.7611099481582642, "Finetune/Loss (Raw)": 0.8512105345726013, "Finetune/Step": 3949, "Finetune/Step Time": 2.8916318248957396} +{"Finetune/Learning Rate": 2.141542916812348e-06, "Finetune/Loss": 0.7617379426956177, "Finetune/Loss (Raw)": 0.8012305498123169, "Finetune/Step": 3950, "Finetune/Step Time": 2.890214219689369} +{"Finetune/Learning Rate": 2.137517988196144e-06, "Finetune/Loss": 0.7613793611526489, "Finetune/Loss (Raw)": 0.7049062848091125, "Finetune/Step": 3951, "Finetune/Step Time": 2.891932053491473} +{"Finetune/Learning Rate": 2.1334963928059315e-06, "Finetune/Loss": 0.7621487379074097, "Finetune/Loss (Raw)": 0.8190751075744629, "Finetune/Step": 3952, "Finetune/Step Time": 2.8708183839917183} +{"Finetune/Learning Rate": 2.129478132346626e-06, "Finetune/Loss": 0.7574853897094727, "Finetune/Loss (Raw)": 0.1952398270368576, "Finetune/Step": 3953, "Finetune/Step Time": 2.898781456053257} +{"Finetune/Learning Rate": 2.1254632085217344e-06, "Finetune/Loss": 0.7539397478103638, "Finetune/Loss (Raw)": 0.35083675384521484, "Finetune/Step": 3954, "Finetune/Step Time": 2.931826200336218} +{"Finetune/Learning Rate": 2.1214516230333438e-06, "Finetune/Loss": 0.7544476985931396, "Finetune/Loss (Raw)": 0.8257285356521606, "Finetune/Step": 3955, "Finetune/Step Time": 2.928719559684396} +{"Finetune/Learning Rate": 2.117443377582128e-06, "Finetune/Loss": 0.7550152540206909, "Finetune/Loss (Raw)": 0.8394626379013062, "Finetune/Step": 3956, "Finetune/Step Time": 2.9319185595959425} +{"Finetune/Learning Rate": 2.1134384738673487e-06, "Finetune/Loss": 0.7556494474411011, "Finetune/Loss (Raw)": 0.8636475801467896, "Finetune/Step": 3957, "Finetune/Step Time": 2.9327566511929035} +{"Finetune/Learning Rate": 2.1094369135868473e-06, "Finetune/Loss": 0.7565804719924927, "Finetune/Loss (Raw)": 0.8462597727775574, "Finetune/Step": 3958, "Finetune/Step Time": 2.9324897583574057} +{"Finetune/Learning Rate": 2.1054386984370425e-06, "Finetune/Loss": 0.7560998201370239, "Finetune/Loss (Raw)": 0.710366427898407, "Finetune/Step": 3959, "Finetune/Step Time": 2.9286990351974964} +{"Finetune/Learning Rate": 2.101443830112947e-06, "Finetune/Loss": 0.7566198110580444, "Finetune/Loss (Raw)": 0.8071339130401611, "Finetune/Step": 3960, "Finetune/Step Time": 2.928492233157158} +{"Finetune/Learning Rate": 2.0974523103081445e-06, "Finetune/Loss": 0.7569440603256226, "Finetune/Loss (Raw)": 0.8882797956466675, "Finetune/Step": 3961, "Finetune/Step Time": 2.928536307066679} +{"Finetune/Learning Rate": 2.0934641407148038e-06, "Finetune/Loss": 0.7567490339279175, "Finetune/Loss (Raw)": 0.7829508781433105, "Finetune/Step": 3962, "Finetune/Step Time": 2.924131700769067} +{"Finetune/Learning Rate": 2.089479323023672e-06, "Finetune/Loss": 0.7576179504394531, "Finetune/Loss (Raw)": 0.8421687483787537, "Finetune/Step": 3963, "Finetune/Step Time": 2.921993672847748} +{"Finetune/Learning Rate": 2.0854978589240747e-06, "Finetune/Loss": 0.7575151324272156, "Finetune/Loss (Raw)": 0.8034975528717041, "Finetune/Step": 3964, "Finetune/Step Time": 2.9245975762605667} +{"Finetune/Learning Rate": 2.0815197501039163e-06, "Finetune/Loss": 0.7584712505340576, "Finetune/Loss (Raw)": 0.8334213495254517, "Finetune/Step": 3965, "Finetune/Step Time": 2.9254821818321943} +{"Finetune/Learning Rate": 2.0775449982496807e-06, "Finetune/Loss": 0.7586565613746643, "Finetune/Loss (Raw)": 0.8141368627548218, "Finetune/Step": 3966, "Finetune/Step Time": 2.924095204100013} +{"Finetune/Learning Rate": 2.073573605046424e-06, "Finetune/Loss": 0.7566310167312622, "Finetune/Loss (Raw)": 0.6939429640769958, "Finetune/Step": 3967, "Finetune/Step Time": 2.9485993422567844} +{"Finetune/Learning Rate": 2.0696055721777875e-06, "Finetune/Loss": 0.7611940503120422, "Finetune/Loss (Raw)": 0.8150755763053894, "Finetune/Step": 3968, "Finetune/Step Time": 2.918063562363386} +{"Finetune/Learning Rate": 2.065640901325973e-06, "Finetune/Loss": 0.762075662612915, "Finetune/Loss (Raw)": 0.8869596719741821, "Finetune/Step": 3969, "Finetune/Step Time": 2.916060008108616} +{"Finetune/Learning Rate": 2.0616795941717715e-06, "Finetune/Loss": 0.7604815363883972, "Finetune/Loss (Raw)": 0.5361374020576477, "Finetune/Step": 3970, "Finetune/Step Time": 2.9394467622041702} +{"Finetune/Learning Rate": 2.057721652394542e-06, "Finetune/Loss": 0.759233832359314, "Finetune/Loss (Raw)": 0.5954940319061279, "Finetune/Step": 3971, "Finetune/Step Time": 2.9601137209683657} +{"Finetune/Learning Rate": 2.0537670776722164e-06, "Finetune/Loss": 0.7607530355453491, "Finetune/Loss (Raw)": 0.7939856052398682, "Finetune/Step": 3972, "Finetune/Step Time": 2.934699270874262} +{"Finetune/Learning Rate": 2.049815871681299e-06, "Finetune/Loss": 0.7611984610557556, "Finetune/Loss (Raw)": 0.8645287752151489, "Finetune/Step": 3973, "Finetune/Step Time": 2.9349738024175167} +{"Finetune/Learning Rate": 2.045868036096864e-06, "Finetune/Loss": 0.7607300281524658, "Finetune/Loss (Raw)": 0.827538788318634, "Finetune/Step": 3974, "Finetune/Step Time": 2.933993261307478} +{"Finetune/Learning Rate": 2.041923572592569e-06, "Finetune/Loss": 0.7612178325653076, "Finetune/Loss (Raw)": 0.8447557091712952, "Finetune/Step": 3975, "Finetune/Step Time": 2.9290144350379705} +{"Finetune/Learning Rate": 2.0379824828406234e-06, "Finetune/Loss": 0.7620295286178589, "Finetune/Loss (Raw)": 0.9156854152679443, "Finetune/Step": 3976, "Finetune/Step Time": 2.9296976905316114} +{"Finetune/Learning Rate": 2.034044768511816e-06, "Finetune/Loss": 0.7621047496795654, "Finetune/Loss (Raw)": 0.7381368279457092, "Finetune/Step": 3977, "Finetune/Step Time": 2.9347403161227703} +{"Finetune/Learning Rate": 2.0301104312755115e-06, "Finetune/Loss": 0.7620002627372742, "Finetune/Loss (Raw)": 0.769633948802948, "Finetune/Step": 3978, "Finetune/Step Time": 2.935441993176937} +{"Finetune/Learning Rate": 2.0261794727996265e-06, "Finetune/Loss": 0.7607545852661133, "Finetune/Loss (Raw)": 0.683167576789856, "Finetune/Step": 3979, "Finetune/Step Time": 2.934456717222929} +{"Finetune/Learning Rate": 2.0222518947506587e-06, "Finetune/Loss": 0.7597379684448242, "Finetune/Loss (Raw)": 0.8110889196395874, "Finetune/Step": 3980, "Finetune/Step Time": 2.9322069454938173} +{"Finetune/Learning Rate": 2.0183276987936696e-06, "Finetune/Loss": 0.7588157653808594, "Finetune/Loss (Raw)": 0.7025905251502991, "Finetune/Step": 3981, "Finetune/Step Time": 2.9329413548111916} +{"Finetune/Learning Rate": 2.0144068865922826e-06, "Finetune/Loss": 0.7590574622154236, "Finetune/Loss (Raw)": 0.8524407148361206, "Finetune/Step": 3982, "Finetune/Step Time": 2.93346581235528} +{"Finetune/Learning Rate": 2.010489459808691e-06, "Finetune/Loss": 0.7600635290145874, "Finetune/Loss (Raw)": 0.8658502101898193, "Finetune/Step": 3983, "Finetune/Step Time": 2.9080243911594152} +{"Finetune/Learning Rate": 2.0065754201036482e-06, "Finetune/Loss": 0.7598817348480225, "Finetune/Loss (Raw)": 0.7822415828704834, "Finetune/Step": 3984, "Finetune/Step Time": 2.907702213153243} +{"Finetune/Learning Rate": 2.002664769136483e-06, "Finetune/Loss": 0.7607599496841431, "Finetune/Loss (Raw)": 0.7720630168914795, "Finetune/Step": 3985, "Finetune/Step Time": 2.888444045558572} +{"Finetune/Learning Rate": 1.998757508565071e-06, "Finetune/Loss": 0.7618730068206787, "Finetune/Loss (Raw)": 0.8212665915489197, "Finetune/Step": 3986, "Finetune/Step Time": 2.886993136256933} +{"Finetune/Learning Rate": 1.9948536400458598e-06, "Finetune/Loss": 0.7620452642440796, "Finetune/Loss (Raw)": 0.8211377859115601, "Finetune/Step": 3987, "Finetune/Step Time": 2.887021876871586} +{"Finetune/Learning Rate": 1.990953165233862e-06, "Finetune/Loss": 0.7594296932220459, "Finetune/Loss (Raw)": 0.525177538394928, "Finetune/Step": 3988, "Finetune/Step Time": 2.9092752281576395} +{"Finetune/Learning Rate": 1.9870560857826473e-06, "Finetune/Loss": 0.7603815793991089, "Finetune/Loss (Raw)": 0.9132750630378723, "Finetune/Step": 3989, "Finetune/Step Time": 2.9118584785610437} +{"Finetune/Learning Rate": 1.983162403344343e-06, "Finetune/Loss": 0.759518027305603, "Finetune/Loss (Raw)": 0.7051182985305786, "Finetune/Step": 3990, "Finetune/Step Time": 2.9124021492898464} +{"Finetune/Learning Rate": 1.979272119569643e-06, "Finetune/Loss": 0.7599455714225769, "Finetune/Loss (Raw)": 0.8249295353889465, "Finetune/Step": 3991, "Finetune/Step Time": 2.905976699665189} +{"Finetune/Learning Rate": 1.9753852361077942e-06, "Finetune/Loss": 0.7593666315078735, "Finetune/Loss (Raw)": 0.7603713274002075, "Finetune/Step": 3992, "Finetune/Step Time": 2.905320258811116} +{"Finetune/Learning Rate": 1.971501754606605e-06, "Finetune/Loss": 0.7610694766044617, "Finetune/Loss (Raw)": 0.8185828328132629, "Finetune/Step": 3993, "Finetune/Step Time": 2.8831223025918007} +{"Finetune/Learning Rate": 1.9676216767124422e-06, "Finetune/Loss": 0.76214599609375, "Finetune/Loss (Raw)": 0.6967980861663818, "Finetune/Step": 3994, "Finetune/Step Time": 2.8594781793653965} +{"Finetune/Learning Rate": 1.9637450040702268e-06, "Finetune/Loss": 0.7626015543937683, "Finetune/Loss (Raw)": 0.819911539554596, "Finetune/Step": 3995, "Finetune/Step Time": 2.8633186481893063} +{"Finetune/Learning Rate": 1.9598717383234423e-06, "Finetune/Loss": 0.7626616954803467, "Finetune/Loss (Raw)": 0.8187827467918396, "Finetune/Step": 3996, "Finetune/Step Time": 2.8658282663673162} +{"Finetune/Learning Rate": 1.956001881114117e-06, "Finetune/Loss": 0.7635750770568848, "Finetune/Loss (Raw)": 0.8704986572265625, "Finetune/Step": 3997, "Finetune/Step Time": 2.8690122924745083} +{"Finetune/Learning Rate": 1.952135434082847e-06, "Finetune/Loss": 0.7640050649642944, "Finetune/Loss (Raw)": 0.7873752117156982, "Finetune/Step": 3998, "Finetune/Step Time": 2.867152478545904} +{"Finetune/Learning Rate": 1.9482723988687734e-06, "Finetune/Loss": 0.7655605673789978, "Finetune/Loss (Raw)": 0.8468238711357117, "Finetune/Step": 3999, "Finetune/Step Time": 2.867609765380621} +{"Finetune/Learning Rate": 1.9444127771095955e-06, "Finetune/Loss": 0.7655638456344604, "Finetune/Loss (Raw)": 0.791339099407196, "Finetune/Step": 4000, "Finetune/Step Time": 2.8744683042168617} +{"Finetune/Learning Rate": 1.940556570441563e-06, "Finetune/Loss": 0.7662176489830017, "Finetune/Loss (Raw)": 0.8942372798919678, "Finetune/Step": 4001, "Finetune/Step Time": 2.872342126443982} +{"Finetune/Learning Rate": 1.936703780499476e-06, "Finetune/Loss": 0.7654403448104858, "Finetune/Loss (Raw)": 0.6907529234886169, "Finetune/Step": 4002, "Finetune/Step Time": 2.8718088399618864} +{"Finetune/Learning Rate": 1.9328544089166967e-06, "Finetune/Loss": 0.7660790681838989, "Finetune/Loss (Raw)": 0.8293141722679138, "Finetune/Step": 4003, "Finetune/Step Time": 2.870525950565934} +{"Finetune/Learning Rate": 1.929008457325123e-06, "Finetune/Loss": 0.7657636404037476, "Finetune/Loss (Raw)": 0.7274062037467957, "Finetune/Step": 4004, "Finetune/Step Time": 2.8731738440692425} +{"Finetune/Learning Rate": 1.9251659273552104e-06, "Finetune/Loss": 0.765813946723938, "Finetune/Loss (Raw)": 0.8252468705177307, "Finetune/Step": 4005, "Finetune/Step Time": 2.876082954928279} +{"Finetune/Learning Rate": 1.9213268206359714e-06, "Finetune/Loss": 0.7662436962127686, "Finetune/Loss (Raw)": 0.8386371731758118, "Finetune/Step": 4006, "Finetune/Step Time": 2.8761812057346106} +{"Finetune/Learning Rate": 1.917491138794948e-06, "Finetune/Loss": 0.7665702104568481, "Finetune/Loss (Raw)": 0.8166243433952332, "Finetune/Step": 4007, "Finetune/Step Time": 2.8703370708972216} +{"Finetune/Learning Rate": 1.9136588834582516e-06, "Finetune/Loss": 0.7650837898254395, "Finetune/Loss (Raw)": 0.6856504082679749, "Finetune/Step": 4008, "Finetune/Step Time": 2.875120623037219} +{"Finetune/Learning Rate": 1.9098300562505266e-06, "Finetune/Loss": 0.7644673585891724, "Finetune/Loss (Raw)": 0.8093509078025818, "Finetune/Step": 4009, "Finetune/Step Time": 2.8716975394636393} +{"Finetune/Learning Rate": 1.9060046587949699e-06, "Finetune/Loss": 0.7632400989532471, "Finetune/Loss (Raw)": 0.6060512661933899, "Finetune/Step": 4010, "Finetune/Step Time": 2.8957879319787025} +{"Finetune/Learning Rate": 1.9021826927133213e-06, "Finetune/Loss": 0.7636082172393799, "Finetune/Loss (Raw)": 0.758804440498352, "Finetune/Step": 4011, "Finetune/Step Time": 2.899231782183051} +{"Finetune/Learning Rate": 1.8983641596258674e-06, "Finetune/Loss": 0.7636066675186157, "Finetune/Loss (Raw)": 0.7493213415145874, "Finetune/Step": 4012, "Finetune/Step Time": 2.895915597677231} +{"Finetune/Learning Rate": 1.8945490611514472e-06, "Finetune/Loss": 0.764525294303894, "Finetune/Loss (Raw)": 0.8477200269699097, "Finetune/Step": 4013, "Finetune/Step Time": 2.892496895045042} +{"Finetune/Learning Rate": 1.8907373989074263e-06, "Finetune/Loss": 0.7651844024658203, "Finetune/Loss (Raw)": 0.8558829426765442, "Finetune/Step": 4014, "Finetune/Step Time": 2.8906047865748405} +{"Finetune/Learning Rate": 1.8869291745097252e-06, "Finetune/Loss": 0.7656778693199158, "Finetune/Loss (Raw)": 0.867656409740448, "Finetune/Step": 4015, "Finetune/Step Time": 2.8895188737660646} +{"Finetune/Learning Rate": 1.8831243895728101e-06, "Finetune/Loss": 0.7659681439399719, "Finetune/Loss (Raw)": 0.8071449995040894, "Finetune/Step": 4016, "Finetune/Step Time": 2.8794792536646128} +{"Finetune/Learning Rate": 1.8793230457096823e-06, "Finetune/Loss": 0.7660852670669556, "Finetune/Loss (Raw)": 0.7632756233215332, "Finetune/Step": 4017, "Finetune/Step Time": 2.8768138010054827} +{"Finetune/Learning Rate": 1.8755251445318834e-06, "Finetune/Loss": 0.7641757130622864, "Finetune/Loss (Raw)": 0.6644426584243774, "Finetune/Step": 4018, "Finetune/Step Time": 2.881880035623908} +{"Finetune/Learning Rate": 1.871730687649501e-06, "Finetune/Loss": 0.763056755065918, "Finetune/Loss (Raw)": 0.7086371779441833, "Finetune/Step": 4019, "Finetune/Step Time": 2.8828865233808756} +{"Finetune/Learning Rate": 1.867939676671159e-06, "Finetune/Loss": 0.7642141580581665, "Finetune/Loss (Raw)": 0.7084012627601624, "Finetune/Step": 4020, "Finetune/Step Time": 2.8597943522036076} +{"Finetune/Learning Rate": 1.8641521132040207e-06, "Finetune/Loss": 0.7654210329055786, "Finetune/Loss (Raw)": 0.9459910988807678, "Finetune/Step": 4021, "Finetune/Step Time": 2.8580592814832926} +{"Finetune/Learning Rate": 1.8603679988537882e-06, "Finetune/Loss": 0.7657666206359863, "Finetune/Loss (Raw)": 0.7587972283363342, "Finetune/Step": 4022, "Finetune/Step Time": 2.8559934087097645} +{"Finetune/Learning Rate": 1.8565873352246999e-06, "Finetune/Loss": 0.7663243412971497, "Finetune/Loss (Raw)": 0.8580899238586426, "Finetune/Step": 4023, "Finetune/Step Time": 2.859823890030384} +{"Finetune/Learning Rate": 1.8528101239195394e-06, "Finetune/Loss": 0.7669923305511475, "Finetune/Loss (Raw)": 0.8730374574661255, "Finetune/Step": 4024, "Finetune/Step Time": 2.8583513852208853} +{"Finetune/Learning Rate": 1.8490363665396106e-06, "Finetune/Loss": 0.7669528722763062, "Finetune/Loss (Raw)": 0.7462638020515442, "Finetune/Step": 4025, "Finetune/Step Time": 2.856485301628709} +{"Finetune/Learning Rate": 1.845266064684771e-06, "Finetune/Loss": 0.7673384547233582, "Finetune/Loss (Raw)": 0.8186736106872559, "Finetune/Step": 4026, "Finetune/Step Time": 2.8542273342609406} +{"Finetune/Learning Rate": 1.841499219953401e-06, "Finetune/Loss": 0.7671247720718384, "Finetune/Loss (Raw)": 0.7702792882919312, "Finetune/Step": 4027, "Finetune/Step Time": 2.8577499259263277} +{"Finetune/Learning Rate": 1.8377358339424212e-06, "Finetune/Loss": 0.7647809982299805, "Finetune/Loss (Raw)": 0.5452054142951965, "Finetune/Step": 4028, "Finetune/Step Time": 2.8802299443632364} +{"Finetune/Learning Rate": 1.833975908247282e-06, "Finetune/Loss": 0.7651623487472534, "Finetune/Loss (Raw)": 0.9011589884757996, "Finetune/Step": 4029, "Finetune/Step Time": 2.8830697499215603} +{"Finetune/Learning Rate": 1.830219444461968e-06, "Finetune/Loss": 0.7646099328994751, "Finetune/Loss (Raw)": 0.7707912921905518, "Finetune/Step": 4030, "Finetune/Step Time": 2.8813878409564495} +{"Finetune/Learning Rate": 1.8264664441790037e-06, "Finetune/Loss": 0.7666475176811218, "Finetune/Loss (Raw)": 0.7933787107467651, "Finetune/Step": 4031, "Finetune/Step Time": 2.8570194337517023} +{"Finetune/Learning Rate": 1.8227169089894315e-06, "Finetune/Loss": 0.765994668006897, "Finetune/Loss (Raw)": 0.7260153889656067, "Finetune/Step": 4032, "Finetune/Step Time": 2.8777126017957926} +{"Finetune/Learning Rate": 1.818970840482832e-06, "Finetune/Loss": 0.7664557695388794, "Finetune/Loss (Raw)": 0.8399365544319153, "Finetune/Step": 4033, "Finetune/Step Time": 2.8780578766018152} +{"Finetune/Learning Rate": 1.8152282402473232e-06, "Finetune/Loss": 0.7704575657844543, "Finetune/Loss (Raw)": 0.787761926651001, "Finetune/Step": 4034, "Finetune/Step Time": 2.8451705127954483} +{"Finetune/Learning Rate": 1.8114891098695354e-06, "Finetune/Loss": 0.7699089050292969, "Finetune/Loss (Raw)": 0.7658129930496216, "Finetune/Step": 4035, "Finetune/Step Time": 2.838871458545327} +{"Finetune/Learning Rate": 1.807753450934645e-06, "Finetune/Loss": 0.7743197679519653, "Finetune/Loss (Raw)": 0.7703568935394287, "Finetune/Step": 4036, "Finetune/Step Time": 2.80890242010355} +{"Finetune/Learning Rate": 1.8040212650263488e-06, "Finetune/Loss": 0.7702760696411133, "Finetune/Loss (Raw)": 0.14641986787319183, "Finetune/Step": 4037, "Finetune/Step Time": 2.836517868563533} +{"Finetune/Learning Rate": 1.8002925537268724e-06, "Finetune/Loss": 0.7694514989852905, "Finetune/Loss (Raw)": 0.7147778272628784, "Finetune/Step": 4038, "Finetune/Step Time": 2.8328602388501167} +{"Finetune/Learning Rate": 1.7965673186169662e-06, "Finetune/Loss": 0.7660739421844482, "Finetune/Loss (Raw)": 0.38189971446990967, "Finetune/Step": 4039, "Finetune/Step Time": 2.866741916164756} +{"Finetune/Learning Rate": 1.7928455612759076e-06, "Finetune/Loss": 0.7651219367980957, "Finetune/Loss (Raw)": 0.6031233668327332, "Finetune/Step": 4040, "Finetune/Step Time": 2.8909199740737677} +{"Finetune/Learning Rate": 1.7891272832815098e-06, "Finetune/Loss": 0.7636655569076538, "Finetune/Loss (Raw)": 0.563381016254425, "Finetune/Step": 4041, "Finetune/Step Time": 2.916408272460103} +{"Finetune/Learning Rate": 1.785412486210092e-06, "Finetune/Loss": 0.7637825012207031, "Finetune/Loss (Raw)": 0.9097627997398376, "Finetune/Step": 4042, "Finetune/Step Time": 2.915791204199195} +{"Finetune/Learning Rate": 1.7817011716365096e-06, "Finetune/Loss": 0.7595866918563843, "Finetune/Loss (Raw)": 0.25464481115341187, "Finetune/Step": 4043, "Finetune/Step Time": 2.9395081754773855} +{"Finetune/Learning Rate": 1.7779933411341444e-06, "Finetune/Loss": 0.75789475440979, "Finetune/Loss (Raw)": 0.6007522344589233, "Finetune/Step": 4044, "Finetune/Step Time": 2.96190376766026} +{"Finetune/Learning Rate": 1.7742889962748933e-06, "Finetune/Loss": 0.7585500478744507, "Finetune/Loss (Raw)": 0.7991428971290588, "Finetune/Step": 4045, "Finetune/Step Time": 2.964436350390315} +{"Finetune/Learning Rate": 1.77058813862918e-06, "Finetune/Loss": 0.7596213221549988, "Finetune/Loss (Raw)": 0.8357974886894226, "Finetune/Step": 4046, "Finetune/Step Time": 2.964008964598179} +{"Finetune/Learning Rate": 1.7668907697659476e-06, "Finetune/Loss": 0.7596309185028076, "Finetune/Loss (Raw)": 0.8798934817314148, "Finetune/Step": 4047, "Finetune/Step Time": 2.961930198594928} +{"Finetune/Learning Rate": 1.763196891252662e-06, "Finetune/Loss": 0.7599208354949951, "Finetune/Loss (Raw)": 0.7545665502548218, "Finetune/Step": 4048, "Finetune/Step Time": 2.962517572566867} +{"Finetune/Learning Rate": 1.7595065046553085e-06, "Finetune/Loss": 0.7600481510162354, "Finetune/Loss (Raw)": 0.8492339253425598, "Finetune/Step": 4049, "Finetune/Step Time": 2.962411191314459} +{"Finetune/Learning Rate": 1.7558196115383918e-06, "Finetune/Loss": 0.7601518630981445, "Finetune/Loss (Raw)": 0.7802911996841431, "Finetune/Step": 4050, "Finetune/Step Time": 2.9636207055300474} +{"Finetune/Learning Rate": 1.7521362134649333e-06, "Finetune/Loss": 0.7596431970596313, "Finetune/Loss (Raw)": 0.5738857984542847, "Finetune/Step": 4051, "Finetune/Step Time": 2.9843890629708767} +{"Finetune/Learning Rate": 1.7484563119964827e-06, "Finetune/Loss": 0.759183406829834, "Finetune/Loss (Raw)": 0.7763760089874268, "Finetune/Step": 4052, "Finetune/Step Time": 2.9848420079797506} +{"Finetune/Learning Rate": 1.7447799086930906e-06, "Finetune/Loss": 0.7595812082290649, "Finetune/Loss (Raw)": 0.8425200581550598, "Finetune/Step": 4053, "Finetune/Step Time": 2.988808359950781} +{"Finetune/Learning Rate": 1.7411070051133405e-06, "Finetune/Loss": 0.7597838044166565, "Finetune/Loss (Raw)": 0.7767602205276489, "Finetune/Step": 4054, "Finetune/Step Time": 2.9902178067713976} +{"Finetune/Learning Rate": 1.7374376028143247e-06, "Finetune/Loss": 0.7605518102645874, "Finetune/Loss (Raw)": 0.8282617926597595, "Finetune/Step": 4055, "Finetune/Step Time": 2.990631990134716} +{"Finetune/Learning Rate": 1.73377170335165e-06, "Finetune/Loss": 0.7611421346664429, "Finetune/Loss (Raw)": 0.8051565289497375, "Finetune/Step": 4056, "Finetune/Step Time": 2.9774818811565638} +{"Finetune/Learning Rate": 1.7301093082794417e-06, "Finetune/Loss": 0.7602900266647339, "Finetune/Loss (Raw)": 0.7641726136207581, "Finetune/Step": 4057, "Finetune/Step Time": 2.9750515669584274} +{"Finetune/Learning Rate": 1.7264504191503362e-06, "Finetune/Loss": 0.7605221271514893, "Finetune/Loss (Raw)": 0.7638627290725708, "Finetune/Step": 4058, "Finetune/Step Time": 2.973974946886301} +{"Finetune/Learning Rate": 1.722795037515491e-06, "Finetune/Loss": 0.76006019115448, "Finetune/Loss (Raw)": 0.7479379773139954, "Finetune/Step": 4059, "Finetune/Step Time": 2.9751798901706934} +{"Finetune/Learning Rate": 1.719143164924565e-06, "Finetune/Loss": 0.7645031809806824, "Finetune/Loss (Raw)": 0.7465054392814636, "Finetune/Step": 4060, "Finetune/Step Time": 2.9518349040299654} +{"Finetune/Learning Rate": 1.7154948029257345e-06, "Finetune/Loss": 0.7638840675354004, "Finetune/Loss (Raw)": 0.7535163760185242, "Finetune/Step": 4061, "Finetune/Step Time": 2.948925670236349} +{"Finetune/Learning Rate": 1.7118499530656973e-06, "Finetune/Loss": 0.7643276453018188, "Finetune/Loss (Raw)": 0.7853253483772278, "Finetune/Step": 4062, "Finetune/Step Time": 2.9485027752816677} +{"Finetune/Learning Rate": 1.7082086168896429e-06, "Finetune/Loss": 0.7635691165924072, "Finetune/Loss (Raw)": 0.7640755772590637, "Finetune/Step": 4063, "Finetune/Step Time": 2.950096582993865} +{"Finetune/Learning Rate": 1.7045707959412893e-06, "Finetune/Loss": 0.7624768018722534, "Finetune/Loss (Raw)": 0.7222055196762085, "Finetune/Step": 4064, "Finetune/Step Time": 2.9515944216400385} +{"Finetune/Learning Rate": 1.7009364917628546e-06, "Finetune/Loss": 0.7627418041229248, "Finetune/Loss (Raw)": 0.8766488432884216, "Finetune/Step": 4065, "Finetune/Step Time": 2.9506776183843613} +{"Finetune/Learning Rate": 1.697305705895068e-06, "Finetune/Loss": 0.7572869062423706, "Finetune/Loss (Raw)": 0.11295948177576065, "Finetune/Step": 4066, "Finetune/Step Time": 2.9844582118093967} +{"Finetune/Learning Rate": 1.6936784398771666e-06, "Finetune/Loss": 0.7575745582580566, "Finetune/Loss (Raw)": 0.8609466552734375, "Finetune/Step": 4067, "Finetune/Step Time": 2.9835693407803774} +{"Finetune/Learning Rate": 1.6900546952468955e-06, "Finetune/Loss": 0.7581585049629211, "Finetune/Loss (Raw)": 0.8431087136268616, "Finetune/Step": 4068, "Finetune/Step Time": 2.982633214443922} +{"Finetune/Learning Rate": 1.6864344735405125e-06, "Finetune/Loss": 0.7591439485549927, "Finetune/Loss (Raw)": 0.8215504288673401, "Finetune/Step": 4069, "Finetune/Step Time": 2.9802488517016172} +{"Finetune/Learning Rate": 1.6828177762927722e-06, "Finetune/Loss": 0.7579694390296936, "Finetune/Loss (Raw)": 0.736947774887085, "Finetune/Step": 4070, "Finetune/Step Time": 2.9796627648174763} +{"Finetune/Learning Rate": 1.679204605036937e-06, "Finetune/Loss": 0.7583732604980469, "Finetune/Loss (Raw)": 0.819660484790802, "Finetune/Step": 4071, "Finetune/Step Time": 2.9807549081742764} +{"Finetune/Learning Rate": 1.675594961304783e-06, "Finetune/Loss": 0.7572777271270752, "Finetune/Loss (Raw)": 0.5803734660148621, "Finetune/Step": 4072, "Finetune/Step Time": 2.989841278642416} +{"Finetune/Learning Rate": 1.6719888466265833e-06, "Finetune/Loss": 0.7577153444290161, "Finetune/Loss (Raw)": 0.8606816530227661, "Finetune/Step": 4073, "Finetune/Step Time": 2.989085493609309} +{"Finetune/Learning Rate": 1.6683862625311165e-06, "Finetune/Loss": 0.7576881647109985, "Finetune/Loss (Raw)": 0.8214089870452881, "Finetune/Step": 4074, "Finetune/Step Time": 2.9913523718714714} +{"Finetune/Learning Rate": 1.6647872105456642e-06, "Finetune/Loss": 0.758414089679718, "Finetune/Loss (Raw)": 0.8598277568817139, "Finetune/Step": 4075, "Finetune/Step Time": 2.9879285469651222} +{"Finetune/Learning Rate": 1.6611916921960102e-06, "Finetune/Loss": 0.7581499814987183, "Finetune/Loss (Raw)": 0.8464664816856384, "Finetune/Step": 4076, "Finetune/Step Time": 2.987752130255103} +{"Finetune/Learning Rate": 1.6575997090064422e-06, "Finetune/Loss": 0.7561801075935364, "Finetune/Loss (Raw)": 0.5990692973136902, "Finetune/Step": 4077, "Finetune/Step Time": 3.0127736758440733} +{"Finetune/Learning Rate": 1.6540112624997451e-06, "Finetune/Loss": 0.7562417984008789, "Finetune/Loss (Raw)": 0.8091254830360413, "Finetune/Step": 4078, "Finetune/Step Time": 3.0128704700618982} +{"Finetune/Learning Rate": 1.6504263541972121e-06, "Finetune/Loss": 0.7570188045501709, "Finetune/Loss (Raw)": 0.8043635487556458, "Finetune/Step": 4079, "Finetune/Step Time": 3.0112394876778126} +{"Finetune/Learning Rate": 1.6468449856186319e-06, "Finetune/Loss": 0.7566943764686584, "Finetune/Loss (Raw)": 0.7775476574897766, "Finetune/Step": 4080, "Finetune/Step Time": 3.017796805128455} +{"Finetune/Learning Rate": 1.6432671582822857e-06, "Finetune/Loss": 0.7613914012908936, "Finetune/Loss (Raw)": 0.7964619994163513, "Finetune/Step": 4081, "Finetune/Step Time": 2.987709192559123} +{"Finetune/Learning Rate": 1.6396928737049656e-06, "Finetune/Loss": 0.7649160027503967, "Finetune/Loss (Raw)": 0.8019821047782898, "Finetune/Step": 4082, "Finetune/Step Time": 2.953437926247716} +{"Finetune/Learning Rate": 1.6361221334019561e-06, "Finetune/Loss": 0.7655074000358582, "Finetune/Loss (Raw)": 0.9014256000518799, "Finetune/Step": 4083, "Finetune/Step Time": 2.9511925000697374} +{"Finetune/Learning Rate": 1.6325549388870365e-06, "Finetune/Loss": 0.7652184367179871, "Finetune/Loss (Raw)": 0.802478015422821, "Finetune/Step": 4084, "Finetune/Step Time": 2.946342471987009} +{"Finetune/Learning Rate": 1.628991291672488e-06, "Finetune/Loss": 0.764196515083313, "Finetune/Loss (Raw)": 0.7328416109085083, "Finetune/Step": 4085, "Finetune/Step Time": 2.9492987859994173} +{"Finetune/Learning Rate": 1.6254311932690826e-06, "Finetune/Loss": 0.7637456655502319, "Finetune/Loss (Raw)": 0.7885585427284241, "Finetune/Step": 4086, "Finetune/Step Time": 2.9457356221973896} +{"Finetune/Learning Rate": 1.621874645186098e-06, "Finetune/Loss": 0.7644042372703552, "Finetune/Loss (Raw)": 0.7946537733078003, "Finetune/Step": 4087, "Finetune/Step Time": 2.9466138426214457} +{"Finetune/Learning Rate": 1.6183216489312913e-06, "Finetune/Loss": 0.7641497850418091, "Finetune/Loss (Raw)": 0.7745686173439026, "Finetune/Step": 4088, "Finetune/Step Time": 2.9387102965265512} +{"Finetune/Learning Rate": 1.614772206010924e-06, "Finetune/Loss": 0.7636375427246094, "Finetune/Loss (Raw)": 0.8227140307426453, "Finetune/Step": 4089, "Finetune/Step Time": 2.9408177081495523} +{"Finetune/Learning Rate": 1.611226317929756e-06, "Finetune/Loss": 0.7646400928497314, "Finetune/Loss (Raw)": 0.9112788438796997, "Finetune/Step": 4090, "Finetune/Step Time": 2.9410846065729856} +{"Finetune/Learning Rate": 1.607683986191023e-06, "Finetune/Loss": 0.7645519375801086, "Finetune/Loss (Raw)": 0.8308784365653992, "Finetune/Step": 4091, "Finetune/Step Time": 2.942759484052658} +{"Finetune/Learning Rate": 1.6041452122964718e-06, "Finetune/Loss": 0.7644476890563965, "Finetune/Loss (Raw)": 0.7901604771614075, "Finetune/Step": 4092, "Finetune/Step Time": 2.939324526116252} +{"Finetune/Learning Rate": 1.6006099977463295e-06, "Finetune/Loss": 0.7642835378646851, "Finetune/Loss (Raw)": 0.8124018907546997, "Finetune/Step": 4093, "Finetune/Step Time": 2.9408070277422667} +{"Finetune/Learning Rate": 1.597078344039318e-06, "Finetune/Loss": 0.7638845443725586, "Finetune/Loss (Raw)": 0.7630704045295715, "Finetune/Step": 4094, "Finetune/Step Time": 2.9418324399739504} +{"Finetune/Learning Rate": 1.5935502526726475e-06, "Finetune/Loss": 0.7643296718597412, "Finetune/Loss (Raw)": 0.7509212493896484, "Finetune/Step": 4095, "Finetune/Step Time": 2.919442068785429} +{"Finetune/Learning Rate": 1.5900257251420193e-06, "Finetune/Loss": 0.7646034955978394, "Finetune/Loss (Raw)": 0.8501139879226685, "Finetune/Step": 4096, "Finetune/Step Time": 2.9190076999366283} +{"Finetune/Learning Rate": 1.5865047629416297e-06, "Finetune/Loss": 0.7633181214332581, "Finetune/Loss (Raw)": 0.7224379181861877, "Finetune/Step": 4097, "Finetune/Step Time": 2.9230747018009424} +{"Finetune/Learning Rate": 1.5829873675641516e-06, "Finetune/Loss": 0.764960527420044, "Finetune/Loss (Raw)": 0.7463608980178833, "Finetune/Step": 4098, "Finetune/Step Time": 2.8979841098189354} +{"Finetune/Learning Rate": 1.579473540500751e-06, "Finetune/Loss": 0.7672256231307983, "Finetune/Loss (Raw)": 0.8854333162307739, "Finetune/Step": 4099, "Finetune/Step Time": 2.8742776550352573} +{"Finetune/Learning Rate": 1.5759632832410875e-06, "Finetune/Loss": 0.7668662071228027, "Finetune/Loss (Raw)": 0.7479787468910217, "Finetune/Step": 4100, "Finetune/Step Time": 2.874137597158551} +{"Finetune/Learning Rate": 1.5724565972732996e-06, "Finetune/Loss": 0.7664966583251953, "Finetune/Loss (Raw)": 0.8172284364700317, "Finetune/Step": 4101, "Finetune/Step Time": 2.875864200294018} +{"Finetune/Learning Rate": 1.5689534840840138e-06, "Finetune/Loss": 0.7658772468566895, "Finetune/Loss (Raw)": 0.7482569217681885, "Finetune/Step": 4102, "Finetune/Step Time": 2.8738891426473856} +{"Finetune/Learning Rate": 1.5654539451583418e-06, "Finetune/Loss": 0.7654123902320862, "Finetune/Loss (Raw)": 0.7852442860603333, "Finetune/Step": 4103, "Finetune/Step Time": 2.8760684989392757} +{"Finetune/Learning Rate": 1.5619579819798814e-06, "Finetune/Loss": 0.7641333937644958, "Finetune/Loss (Raw)": 0.7519745230674744, "Finetune/Step": 4104, "Finetune/Step Time": 2.873990684747696} +{"Finetune/Learning Rate": 1.5584655960307137e-06, "Finetune/Loss": 0.763181209564209, "Finetune/Loss (Raw)": 0.6162576079368591, "Finetune/Step": 4105, "Finetune/Step Time": 2.8944269120693207} +{"Finetune/Learning Rate": 1.5549767887914013e-06, "Finetune/Loss": 0.763609766960144, "Finetune/Loss (Raw)": 0.8244951367378235, "Finetune/Step": 4106, "Finetune/Step Time": 2.8993247505277395} +{"Finetune/Learning Rate": 1.5514915617409942e-06, "Finetune/Loss": 0.7647362947463989, "Finetune/Loss (Raw)": 0.827361524105072, "Finetune/Step": 4107, "Finetune/Step Time": 2.9005498439073563} +{"Finetune/Learning Rate": 1.548009916357024e-06, "Finetune/Loss": 0.764025866985321, "Finetune/Loss (Raw)": 0.7201509475708008, "Finetune/Step": 4108, "Finetune/Step Time": 2.903643136844039} +{"Finetune/Learning Rate": 1.5445318541154941e-06, "Finetune/Loss": 0.7647603750228882, "Finetune/Loss (Raw)": 0.7966145277023315, "Finetune/Step": 4109, "Finetune/Step Time": 2.9027039725333452} +{"Finetune/Learning Rate": 1.5410573764909032e-06, "Finetune/Loss": 0.7642797231674194, "Finetune/Loss (Raw)": 0.7909138202667236, "Finetune/Step": 4110, "Finetune/Step Time": 2.904078084975481} +{"Finetune/Learning Rate": 1.5375864849562206e-06, "Finetune/Loss": 0.7639497518539429, "Finetune/Loss (Raw)": 0.8236192464828491, "Finetune/Step": 4111, "Finetune/Step Time": 2.9078307412564754} +{"Finetune/Learning Rate": 1.5341191809829004e-06, "Finetune/Loss": 0.7640427350997925, "Finetune/Loss (Raw)": 0.7941287755966187, "Finetune/Step": 4112, "Finetune/Step Time": 2.9193497207015753} +{"Finetune/Learning Rate": 1.5306554660408734e-06, "Finetune/Loss": 0.764660656452179, "Finetune/Loss (Raw)": 0.8511670231819153, "Finetune/Step": 4113, "Finetune/Step Time": 2.916993238031864} +{"Finetune/Learning Rate": 1.5271953415985464e-06, "Finetune/Loss": 0.7645081281661987, "Finetune/Loss (Raw)": 0.8017446398735046, "Finetune/Step": 4114, "Finetune/Step Time": 2.9142730869352818} +{"Finetune/Learning Rate": 1.5237388091228134e-06, "Finetune/Loss": 0.7645149230957031, "Finetune/Loss (Raw)": 0.8220024704933167, "Finetune/Step": 4115, "Finetune/Step Time": 2.912679996341467} +{"Finetune/Learning Rate": 1.5202858700790325e-06, "Finetune/Loss": 0.76710045337677, "Finetune/Loss (Raw)": 0.8561298847198486, "Finetune/Step": 4116, "Finetune/Step Time": 2.8911331426352262} +{"Finetune/Learning Rate": 1.5168365259310458e-06, "Finetune/Loss": 0.7652803659439087, "Finetune/Loss (Raw)": 0.6802995800971985, "Finetune/Step": 4117, "Finetune/Step Time": 2.888686390593648} +{"Finetune/Learning Rate": 1.513390778141177e-06, "Finetune/Loss": 0.7666700482368469, "Finetune/Loss (Raw)": 0.8830007314682007, "Finetune/Step": 4118, "Finetune/Step Time": 2.8890267815440893} +{"Finetune/Learning Rate": 1.509948628170209e-06, "Finetune/Loss": 0.7667622566223145, "Finetune/Loss (Raw)": 0.8367295265197754, "Finetune/Step": 4119, "Finetune/Step Time": 2.8892911039292812} +{"Finetune/Learning Rate": 1.5065100774774167e-06, "Finetune/Loss": 0.7668516635894775, "Finetune/Loss (Raw)": 0.7718121409416199, "Finetune/Step": 4120, "Finetune/Step Time": 2.8870506081730127} +{"Finetune/Learning Rate": 1.5030751275205402e-06, "Finetune/Loss": 0.7658698558807373, "Finetune/Loss (Raw)": 0.6929169297218323, "Finetune/Step": 4121, "Finetune/Step Time": 2.8860596250742674} +{"Finetune/Learning Rate": 1.4996437797557928e-06, "Finetune/Loss": 0.7661745548248291, "Finetune/Loss (Raw)": 0.7357999682426453, "Finetune/Step": 4122, "Finetune/Step Time": 2.886607861146331} +{"Finetune/Learning Rate": 1.496216035637863e-06, "Finetune/Loss": 0.7663472890853882, "Finetune/Loss (Raw)": 0.8420242667198181, "Finetune/Step": 4123, "Finetune/Step Time": 2.883342621847987} +{"Finetune/Learning Rate": 1.4927918966199095e-06, "Finetune/Loss": 0.7651933431625366, "Finetune/Loss (Raw)": 0.671076238155365, "Finetune/Step": 4124, "Finetune/Step Time": 2.9057906847447157} +{"Finetune/Learning Rate": 1.48937136415357e-06, "Finetune/Loss": 0.7640659213066101, "Finetune/Loss (Raw)": 0.7261881232261658, "Finetune/Step": 4125, "Finetune/Step Time": 2.9041282571852207} +{"Finetune/Learning Rate": 1.4859544396889413e-06, "Finetune/Loss": 0.7636526823043823, "Finetune/Loss (Raw)": 0.7344763875007629, "Finetune/Step": 4126, "Finetune/Step Time": 2.929022777825594} +{"Finetune/Learning Rate": 1.4825411246745968e-06, "Finetune/Loss": 0.7630679607391357, "Finetune/Loss (Raw)": 0.7719805240631104, "Finetune/Step": 4127, "Finetune/Step Time": 2.929691769182682} +{"Finetune/Learning Rate": 1.4791314205575846e-06, "Finetune/Loss": 0.7633860111236572, "Finetune/Loss (Raw)": 0.8320457339286804, "Finetune/Step": 4128, "Finetune/Step Time": 2.919959617778659} +{"Finetune/Learning Rate": 1.4757253287834105e-06, "Finetune/Loss": 0.7626239657402039, "Finetune/Loss (Raw)": 0.7966998219490051, "Finetune/Step": 4129, "Finetune/Step Time": 2.919235147535801} +{"Finetune/Learning Rate": 1.4723228507960608e-06, "Finetune/Loss": 0.76357102394104, "Finetune/Loss (Raw)": 0.8119780421257019, "Finetune/Step": 4130, "Finetune/Step Time": 2.9239180479198694} +{"Finetune/Learning Rate": 1.4689239880379814e-06, "Finetune/Loss": 0.7636337876319885, "Finetune/Loss (Raw)": 0.8373486399650574, "Finetune/Step": 4131, "Finetune/Step Time": 2.9212422873824835} +{"Finetune/Learning Rate": 1.4655287419500897e-06, "Finetune/Loss": 0.7642295956611633, "Finetune/Loss (Raw)": 0.8036680817604065, "Finetune/Step": 4132, "Finetune/Step Time": 2.916801767423749} +{"Finetune/Learning Rate": 1.4621371139717677e-06, "Finetune/Loss": 0.764087438583374, "Finetune/Loss (Raw)": 0.807050883769989, "Finetune/Step": 4133, "Finetune/Step Time": 2.916840810328722} +{"Finetune/Learning Rate": 1.4587491055408632e-06, "Finetune/Loss": 0.7633116245269775, "Finetune/Loss (Raw)": 0.7393330931663513, "Finetune/Step": 4134, "Finetune/Step Time": 2.9186043832451105} +{"Finetune/Learning Rate": 1.4553647180936981e-06, "Finetune/Loss": 0.7632414102554321, "Finetune/Loss (Raw)": 0.8076356649398804, "Finetune/Step": 4135, "Finetune/Step Time": 2.920837789773941} +{"Finetune/Learning Rate": 1.4519839530650426e-06, "Finetune/Loss": 0.7647203803062439, "Finetune/Loss (Raw)": 0.8749586343765259, "Finetune/Step": 4136, "Finetune/Step Time": 2.9166824463754892} +{"Finetune/Learning Rate": 1.4486068118881435e-06, "Finetune/Loss": 0.7649244070053101, "Finetune/Loss (Raw)": 0.8354659080505371, "Finetune/Step": 4137, "Finetune/Step Time": 2.9199417270720005} +{"Finetune/Learning Rate": 1.44523329599471e-06, "Finetune/Loss": 0.7663277387619019, "Finetune/Loss (Raw)": 0.7856725454330444, "Finetune/Step": 4138, "Finetune/Step Time": 2.897279093042016} +{"Finetune/Learning Rate": 1.441863406814913e-06, "Finetune/Loss": 0.7669262290000916, "Finetune/Loss (Raw)": 0.8354148268699646, "Finetune/Step": 4139, "Finetune/Step Time": 2.8940229024738073} +{"Finetune/Learning Rate": 1.4384971457773844e-06, "Finetune/Loss": 0.766851544380188, "Finetune/Loss (Raw)": 0.7397684454917908, "Finetune/Step": 4140, "Finetune/Step Time": 2.895163532346487} +{"Finetune/Learning Rate": 1.4351345143092198e-06, "Finetune/Loss": 0.7660613656044006, "Finetune/Loss (Raw)": 0.7465733289718628, "Finetune/Step": 4141, "Finetune/Step Time": 2.8965584225952625} +{"Finetune/Learning Rate": 1.4317755138359745e-06, "Finetune/Loss": 0.7614625096321106, "Finetune/Loss (Raw)": 0.26722201704978943, "Finetune/Step": 4142, "Finetune/Step Time": 2.9258019849658012} +{"Finetune/Learning Rate": 1.428420145781666e-06, "Finetune/Loss": 0.7610388994216919, "Finetune/Loss (Raw)": 0.813437283039093, "Finetune/Step": 4143, "Finetune/Step Time": 2.921917036175728} +{"Finetune/Learning Rate": 1.4250684115687718e-06, "Finetune/Loss": 0.7602285146713257, "Finetune/Loss (Raw)": 0.703420102596283, "Finetune/Step": 4144, "Finetune/Step Time": 2.9218310602009296} +{"Finetune/Learning Rate": 1.4217203126182244e-06, "Finetune/Loss": 0.759518563747406, "Finetune/Loss (Raw)": 0.6723979115486145, "Finetune/Step": 4145, "Finetune/Step Time": 2.925385508686304} +{"Finetune/Learning Rate": 1.4183758503494283e-06, "Finetune/Loss": 0.7607383728027344, "Finetune/Loss (Raw)": 0.8205806612968445, "Finetune/Step": 4146, "Finetune/Step Time": 2.9230857118964195} +{"Finetune/Learning Rate": 1.415035026180227e-06, "Finetune/Loss": 0.7612311840057373, "Finetune/Loss (Raw)": 0.7717183828353882, "Finetune/Step": 4147, "Finetune/Step Time": 2.922732099890709} +{"Finetune/Learning Rate": 1.4116978415269378e-06, "Finetune/Loss": 0.763015627861023, "Finetune/Loss (Raw)": 0.936805248260498, "Finetune/Step": 4148, "Finetune/Step Time": 2.9212222695350647} +{"Finetune/Learning Rate": 1.4083642978043278e-06, "Finetune/Loss": 0.7618666887283325, "Finetune/Loss (Raw)": 0.798936665058136, "Finetune/Step": 4149, "Finetune/Step Time": 2.9238762129098177} +{"Finetune/Learning Rate": 1.405034396425622e-06, "Finetune/Loss": 0.7619047164916992, "Finetune/Loss (Raw)": 0.7636559009552002, "Finetune/Step": 4150, "Finetune/Step Time": 2.922900840640068} +{"Finetune/Learning Rate": 1.4017081388025e-06, "Finetune/Loss": 0.7611784934997559, "Finetune/Loss (Raw)": 0.765134334564209, "Finetune/Step": 4151, "Finetune/Step Time": 2.919863525778055} +{"Finetune/Learning Rate": 1.3983855263450963e-06, "Finetune/Loss": 0.7599036693572998, "Finetune/Loss (Raw)": 0.7098574638366699, "Finetune/Step": 4152, "Finetune/Step Time": 2.9214039966464043} +{"Finetune/Learning Rate": 1.3950665604620084e-06, "Finetune/Loss": 0.7600070238113403, "Finetune/Loss (Raw)": 0.759496808052063, "Finetune/Step": 4153, "Finetune/Step Time": 2.9238335229456425} +{"Finetune/Learning Rate": 1.391751242560273e-06, "Finetune/Loss": 0.7597628831863403, "Finetune/Loss (Raw)": 0.7874155640602112, "Finetune/Step": 4154, "Finetune/Step Time": 2.9210571367293596} +{"Finetune/Learning Rate": 1.3884395740453892e-06, "Finetune/Loss": 0.7606813907623291, "Finetune/Loss (Raw)": 0.8878518342971802, "Finetune/Step": 4155, "Finetune/Step Time": 2.9178923424333334} +{"Finetune/Learning Rate": 1.3851315563213152e-06, "Finetune/Loss": 0.7610353231430054, "Finetune/Loss (Raw)": 0.5905135273933411, "Finetune/Step": 4156, "Finetune/Step Time": 2.921169066801667} +{"Finetune/Learning Rate": 1.3818271907904446e-06, "Finetune/Loss": 0.7587671279907227, "Finetune/Loss (Raw)": 0.6108318567276001, "Finetune/Step": 4157, "Finetune/Step Time": 2.9422008469700813} +{"Finetune/Learning Rate": 1.378526478853639e-06, "Finetune/Loss": 0.7593834400177002, "Finetune/Loss (Raw)": 0.8496716022491455, "Finetune/Step": 4158, "Finetune/Step Time": 2.944369588047266} +{"Finetune/Learning Rate": 1.3752294219102024e-06, "Finetune/Loss": 0.7588291168212891, "Finetune/Loss (Raw)": 0.722429096698761, "Finetune/Step": 4159, "Finetune/Step Time": 2.9498306773602962} +{"Finetune/Learning Rate": 1.3719360213578914e-06, "Finetune/Loss": 0.7591561079025269, "Finetune/Loss (Raw)": 0.7678695321083069, "Finetune/Step": 4160, "Finetune/Step Time": 2.9295268822461367} +{"Finetune/Learning Rate": 1.3686462785929121e-06, "Finetune/Loss": 0.7587162256240845, "Finetune/Loss (Raw)": 0.7836341857910156, "Finetune/Step": 4161, "Finetune/Step Time": 2.9272293467074633} +{"Finetune/Learning Rate": 1.3653601950099181e-06, "Finetune/Loss": 0.7592461109161377, "Finetune/Loss (Raw)": 0.8555890321731567, "Finetune/Step": 4162, "Finetune/Step Time": 2.92688937112689} +{"Finetune/Learning Rate": 1.3620777720020218e-06, "Finetune/Loss": 0.7594724893569946, "Finetune/Loss (Raw)": 0.7947860360145569, "Finetune/Step": 4163, "Finetune/Step Time": 2.929932991042733} +{"Finetune/Learning Rate": 1.3587990109607685e-06, "Finetune/Loss": 0.7595160007476807, "Finetune/Loss (Raw)": 0.7759313583374023, "Finetune/Step": 4164, "Finetune/Step Time": 2.9337710421532393} +{"Finetune/Learning Rate": 1.3555239132761577e-06, "Finetune/Loss": 0.7645564675331116, "Finetune/Loss (Raw)": 0.7915979623794556, "Finetune/Step": 4165, "Finetune/Step Time": 2.9068843629211187} +{"Finetune/Learning Rate": 1.3522524803366422e-06, "Finetune/Loss": 0.7646160125732422, "Finetune/Loss (Raw)": 0.7223931550979614, "Finetune/Step": 4166, "Finetune/Step Time": 2.907125597819686} +{"Finetune/Learning Rate": 1.3489847135291123e-06, "Finetune/Loss": 0.7671595811843872, "Finetune/Loss (Raw)": 0.7074820399284363, "Finetune/Step": 4167, "Finetune/Step Time": 2.880584765225649} +{"Finetune/Learning Rate": 1.3457206142389068e-06, "Finetune/Loss": 0.7695097923278809, "Finetune/Loss (Raw)": 0.903950035572052, "Finetune/Step": 4168, "Finetune/Step Time": 2.865722807124257} +{"Finetune/Learning Rate": 1.342460183849812e-06, "Finetune/Loss": 0.7718918323516846, "Finetune/Loss (Raw)": 0.8682899475097656, "Finetune/Step": 4169, "Finetune/Step Time": 2.840369123965502} +{"Finetune/Learning Rate": 1.3392034237440554e-06, "Finetune/Loss": 0.7707224488258362, "Finetune/Loss (Raw)": 0.7600743174552917, "Finetune/Step": 4170, "Finetune/Step Time": 2.841089015826583} +{"Finetune/Learning Rate": 1.3359503353023107e-06, "Finetune/Loss": 0.774590015411377, "Finetune/Loss (Raw)": 0.7496949434280396, "Finetune/Step": 4171, "Finetune/Step Time": 2.815294934436679} +{"Finetune/Learning Rate": 1.3327009199036944e-06, "Finetune/Loss": 0.7756608724594116, "Finetune/Loss (Raw)": 0.7378190159797668, "Finetune/Step": 4172, "Finetune/Step Time": 2.792767509818077} +{"Finetune/Learning Rate": 1.3294551789257638e-06, "Finetune/Loss": 0.7744482755661011, "Finetune/Loss (Raw)": 0.6439335346221924, "Finetune/Step": 4173, "Finetune/Step Time": 2.814085651189089} +{"Finetune/Learning Rate": 1.3262131137445266e-06, "Finetune/Loss": 0.7736132144927979, "Finetune/Loss (Raw)": 0.7289102077484131, "Finetune/Step": 4174, "Finetune/Step Time": 2.8131181951612234} +{"Finetune/Learning Rate": 1.3229747257344184e-06, "Finetune/Loss": 0.7734999656677246, "Finetune/Loss (Raw)": 0.8653964400291443, "Finetune/Step": 4175, "Finetune/Step Time": 2.8137486409395933} +{"Finetune/Learning Rate": 1.3197400162683294e-06, "Finetune/Loss": 0.7727268934249878, "Finetune/Loss (Raw)": 0.6556078791618347, "Finetune/Step": 4176, "Finetune/Step Time": 2.8140365164726973} +{"Finetune/Learning Rate": 1.3165089867175818e-06, "Finetune/Loss": 0.771716833114624, "Finetune/Loss (Raw)": 0.719952404499054, "Finetune/Step": 4177, "Finetune/Step Time": 2.814305944368243} +{"Finetune/Learning Rate": 1.313281638451942e-06, "Finetune/Loss": 0.7720319032669067, "Finetune/Loss (Raw)": 0.8206210136413574, "Finetune/Step": 4178, "Finetune/Step Time": 2.8109062779694796} +{"Finetune/Learning Rate": 1.3100579728396135e-06, "Finetune/Loss": 0.7738102674484253, "Finetune/Loss (Raw)": 0.8015196323394775, "Finetune/Step": 4179, "Finetune/Step Time": 2.7902932595461607} +{"Finetune/Learning Rate": 1.3068379912472362e-06, "Finetune/Loss": 0.7731693983078003, "Finetune/Loss (Raw)": 0.6943407654762268, "Finetune/Step": 4180, "Finetune/Step Time": 2.7885920628905296} +{"Finetune/Learning Rate": 1.3036216950398994e-06, "Finetune/Loss": 0.773044228553772, "Finetune/Loss (Raw)": 0.826501727104187, "Finetune/Step": 4181, "Finetune/Step Time": 2.785675276070833} +{"Finetune/Learning Rate": 1.3004090855811147e-06, "Finetune/Loss": 0.7728546261787415, "Finetune/Loss (Raw)": 0.752487301826477, "Finetune/Step": 4182, "Finetune/Step Time": 2.783242939040065} +{"Finetune/Learning Rate": 1.297200164232838e-06, "Finetune/Loss": 0.7730903625488281, "Finetune/Loss (Raw)": 0.8584343791007996, "Finetune/Step": 4183, "Finetune/Step Time": 2.7840765099972486} +{"Finetune/Learning Rate": 1.2939949323554668e-06, "Finetune/Loss": 0.7736196517944336, "Finetune/Loss (Raw)": 0.8729068040847778, "Finetune/Step": 4184, "Finetune/Step Time": 2.771663723513484} +{"Finetune/Learning Rate": 1.290793391307823e-06, "Finetune/Loss": 0.7745893597602844, "Finetune/Loss (Raw)": 0.88829505443573, "Finetune/Step": 4185, "Finetune/Step Time": 2.773715289309621} +{"Finetune/Learning Rate": 1.2875955424471753e-06, "Finetune/Loss": 0.7745234966278076, "Finetune/Loss (Raw)": 0.7554306983947754, "Finetune/Step": 4186, "Finetune/Step Time": 2.7726310826838017} +{"Finetune/Learning Rate": 1.2844013871292193e-06, "Finetune/Loss": 0.7753099203109741, "Finetune/Loss (Raw)": 0.8486019372940063, "Finetune/Step": 4187, "Finetune/Step Time": 2.7684204168617725} +{"Finetune/Learning Rate": 1.2812109267080886e-06, "Finetune/Loss": 0.7761356830596924, "Finetune/Loss (Raw)": 0.8522018194198608, "Finetune/Step": 4188, "Finetune/Step Time": 2.766350032761693} +{"Finetune/Learning Rate": 1.2780241625363477e-06, "Finetune/Loss": 0.7766858339309692, "Finetune/Loss (Raw)": 0.8239314556121826, "Finetune/Step": 4189, "Finetune/Step Time": 2.7688208874315023} +{"Finetune/Learning Rate": 1.274841095964995e-06, "Finetune/Loss": 0.7762987017631531, "Finetune/Loss (Raw)": 0.7357777953147888, "Finetune/Step": 4190, "Finetune/Step Time": 2.773540051653981} +{"Finetune/Learning Rate": 1.2716617283434673e-06, "Finetune/Loss": 0.7760065793991089, "Finetune/Loss (Raw)": 0.7266896963119507, "Finetune/Step": 4191, "Finetune/Step Time": 2.794529665261507} +{"Finetune/Learning Rate": 1.2684860610196225e-06, "Finetune/Loss": 0.7762769460678101, "Finetune/Loss (Raw)": 0.756801187992096, "Finetune/Step": 4192, "Finetune/Step Time": 2.797212852165103} +{"Finetune/Learning Rate": 1.2653140953397536e-06, "Finetune/Loss": 0.7753000259399414, "Finetune/Loss (Raw)": 0.7516100406646729, "Finetune/Step": 4193, "Finetune/Step Time": 2.797453448176384} +{"Finetune/Learning Rate": 1.2621458326485913e-06, "Finetune/Loss": 0.780511736869812, "Finetune/Loss (Raw)": 0.7800593972206116, "Finetune/Step": 4194, "Finetune/Step Time": 2.762684389948845} +{"Finetune/Learning Rate": 1.2589812742892882e-06, "Finetune/Loss": 0.779248833656311, "Finetune/Loss (Raw)": 0.6992874145507812, "Finetune/Step": 4195, "Finetune/Step Time": 2.763989806175232} +{"Finetune/Learning Rate": 1.255820421603431e-06, "Finetune/Loss": 0.7788216471672058, "Finetune/Loss (Raw)": 0.7884334921836853, "Finetune/Step": 4196, "Finetune/Step Time": 2.7675001714378595} +{"Finetune/Learning Rate": 1.2526632759310308e-06, "Finetune/Loss": 0.7784546613693237, "Finetune/Loss (Raw)": 0.7745736837387085, "Finetune/Step": 4197, "Finetune/Step Time": 2.7715104576200247} +{"Finetune/Learning Rate": 1.249509838610533e-06, "Finetune/Loss": 0.7785708904266357, "Finetune/Loss (Raw)": 0.7518265843391418, "Finetune/Step": 4198, "Finetune/Step Time": 2.7724812105298042} +{"Finetune/Learning Rate": 1.2463601109788058e-06, "Finetune/Loss": 0.7775294184684753, "Finetune/Loss (Raw)": 0.6863513588905334, "Finetune/Step": 4199, "Finetune/Step Time": 2.7703481819480658} +{"Finetune/Learning Rate": 1.2432140943711469e-06, "Finetune/Loss": 0.778498649597168, "Finetune/Loss (Raw)": 0.7044360041618347, "Finetune/Step": 4200, "Finetune/Step Time": 2.746857674792409} +{"Finetune/Learning Rate": 1.2400717901212834e-06, "Finetune/Loss": 0.7778029441833496, "Finetune/Loss (Raw)": 0.7716299891471863, "Finetune/Step": 4201, "Finetune/Step Time": 2.745993034914136} +{"Finetune/Learning Rate": 1.2369331995613664e-06, "Finetune/Loss": 0.7769046425819397, "Finetune/Loss (Raw)": 0.706427812576294, "Finetune/Step": 4202, "Finetune/Step Time": 2.7424650117754936} +{"Finetune/Learning Rate": 1.2337983240219653e-06, "Finetune/Loss": 0.7765109539031982, "Finetune/Loss (Raw)": 0.8094301223754883, "Finetune/Step": 4203, "Finetune/Step Time": 2.743861434981227} +{"Finetune/Learning Rate": 1.2306671648320877e-06, "Finetune/Loss": 0.771752119064331, "Finetune/Loss (Raw)": 0.2373371720314026, "Finetune/Step": 4204, "Finetune/Step Time": 2.78613094240427} +{"Finetune/Learning Rate": 1.2275397233191577e-06, "Finetune/Loss": 0.7733420133590698, "Finetune/Loss (Raw)": 0.8025794625282288, "Finetune/Step": 4205, "Finetune/Step Time": 2.761592570692301} +{"Finetune/Learning Rate": 1.2244160008090256e-06, "Finetune/Loss": 0.7734650373458862, "Finetune/Loss (Raw)": 0.8248740434646606, "Finetune/Step": 4206, "Finetune/Step Time": 2.7640906739979982} +{"Finetune/Learning Rate": 1.2212959986259643e-06, "Finetune/Loss": 0.7732345461845398, "Finetune/Loss (Raw)": 0.7748598456382751, "Finetune/Step": 4207, "Finetune/Step Time": 2.761400517076254} +{"Finetune/Learning Rate": 1.2181797180926658e-06, "Finetune/Loss": 0.7734355926513672, "Finetune/Loss (Raw)": 0.803276538848877, "Finetune/Step": 4208, "Finetune/Step Time": 2.75368382781744} +{"Finetune/Learning Rate": 1.2150671605302567e-06, "Finetune/Loss": 0.7735297083854675, "Finetune/Loss (Raw)": 0.8085187673568726, "Finetune/Step": 4209, "Finetune/Step Time": 2.7547129653394222} +{"Finetune/Learning Rate": 1.2119583272582692e-06, "Finetune/Loss": 0.7738209962844849, "Finetune/Loss (Raw)": 0.8392626047134399, "Finetune/Step": 4210, "Finetune/Step Time": 2.754934836179018} +{"Finetune/Learning Rate": 1.2088532195946633e-06, "Finetune/Loss": 0.7735645771026611, "Finetune/Loss (Raw)": 0.8686032891273499, "Finetune/Step": 4211, "Finetune/Step Time": 2.7610109373927116} +{"Finetune/Learning Rate": 1.2057518388558298e-06, "Finetune/Loss": 0.7729580402374268, "Finetune/Loss (Raw)": 0.7248457670211792, "Finetune/Step": 4212, "Finetune/Step Time": 2.7622093465179205} +{"Finetune/Learning Rate": 1.202654186356559e-06, "Finetune/Loss": 0.773678719997406, "Finetune/Loss (Raw)": 0.8250812888145447, "Finetune/Step": 4213, "Finetune/Step Time": 2.7589134611189365} +{"Finetune/Learning Rate": 1.199560263410079e-06, "Finetune/Loss": 0.7737983465194702, "Finetune/Loss (Raw)": 0.8038691282272339, "Finetune/Step": 4214, "Finetune/Step Time": 2.7677862606942654} +{"Finetune/Learning Rate": 1.1964700713280275e-06, "Finetune/Loss": 0.7738128900527954, "Finetune/Loss (Raw)": 0.796522855758667, "Finetune/Step": 4215, "Finetune/Step Time": 2.768182246014476} +{"Finetune/Learning Rate": 1.1933836114204634e-06, "Finetune/Loss": 0.7745923399925232, "Finetune/Loss (Raw)": 0.8743396401405334, "Finetune/Step": 4216, "Finetune/Step Time": 2.769523374736309} +{"Finetune/Learning Rate": 1.190300884995862e-06, "Finetune/Loss": 0.7736174464225769, "Finetune/Loss (Raw)": 0.6979276537895203, "Finetune/Step": 4217, "Finetune/Step Time": 2.7720873672515154} +{"Finetune/Learning Rate": 1.1872218933611134e-06, "Finetune/Loss": 0.7722323536872864, "Finetune/Loss (Raw)": 0.7339852452278137, "Finetune/Step": 4218, "Finetune/Step Time": 2.7758513428270817} +{"Finetune/Learning Rate": 1.184146637821535e-06, "Finetune/Loss": 0.7717067003250122, "Finetune/Loss (Raw)": 0.7635962963104248, "Finetune/Step": 4219, "Finetune/Step Time": 2.7764156069606543} +{"Finetune/Learning Rate": 1.1810751196808456e-06, "Finetune/Loss": 0.7720445394515991, "Finetune/Loss (Raw)": 0.8334016799926758, "Finetune/Step": 4220, "Finetune/Step Time": 2.778029875829816} +{"Finetune/Learning Rate": 1.1780073402411873e-06, "Finetune/Loss": 0.7714102864265442, "Finetune/Loss (Raw)": 0.7312144637107849, "Finetune/Step": 4221, "Finetune/Step Time": 2.7758361101150513} +{"Finetune/Learning Rate": 1.1749433008031208e-06, "Finetune/Loss": 0.7721506953239441, "Finetune/Loss (Raw)": 0.8578439950942993, "Finetune/Step": 4222, "Finetune/Step Time": 2.7768805027008057} +{"Finetune/Learning Rate": 1.1718830026656158e-06, "Finetune/Loss": 0.7717335224151611, "Finetune/Loss (Raw)": 0.6975283622741699, "Finetune/Step": 4223, "Finetune/Step Time": 2.7744528502225876} +{"Finetune/Learning Rate": 1.1688264471260546e-06, "Finetune/Loss": 0.7709499597549438, "Finetune/Loss (Raw)": 0.7498157024383545, "Finetune/Step": 4224, "Finetune/Step Time": 2.7815081533044577} +{"Finetune/Learning Rate": 1.1657736354802373e-06, "Finetune/Loss": 0.7715268135070801, "Finetune/Loss (Raw)": 0.7962718605995178, "Finetune/Step": 4225, "Finetune/Step Time": 2.7773531060665846} +{"Finetune/Learning Rate": 1.1627245690223754e-06, "Finetune/Loss": 0.7718571424484253, "Finetune/Loss (Raw)": 0.7886466383934021, "Finetune/Step": 4226, "Finetune/Step Time": 2.7835713773965836} +{"Finetune/Learning Rate": 1.1596792490450915e-06, "Finetune/Loss": 0.7712863683700562, "Finetune/Loss (Raw)": 0.8123738765716553, "Finetune/Step": 4227, "Finetune/Step Time": 2.7828353848308325} +{"Finetune/Learning Rate": 1.1566376768394172e-06, "Finetune/Loss": 0.7687129378318787, "Finetune/Loss (Raw)": 0.41857782006263733, "Finetune/Step": 4228, "Finetune/Step Time": 2.8145232666283846} +{"Finetune/Learning Rate": 1.1535998536948057e-06, "Finetune/Loss": 0.7677980661392212, "Finetune/Loss (Raw)": 0.7001190185546875, "Finetune/Step": 4229, "Finetune/Step Time": 2.8156336061656475} +{"Finetune/Learning Rate": 1.150565780899111e-06, "Finetune/Loss": 0.7678993344306946, "Finetune/Loss (Raw)": 0.7612255215644836, "Finetune/Step": 4230, "Finetune/Step Time": 2.8182365484535694} +{"Finetune/Learning Rate": 1.1475354597385969e-06, "Finetune/Loss": 0.7679436802864075, "Finetune/Loss (Raw)": 0.7909239530563354, "Finetune/Step": 4231, "Finetune/Step Time": 2.820935297757387} +{"Finetune/Learning Rate": 1.144508891497943e-06, "Finetune/Loss": 0.7685158252716064, "Finetune/Loss (Raw)": 0.8252084255218506, "Finetune/Step": 4232, "Finetune/Step Time": 2.824656644836068} +{"Finetune/Learning Rate": 1.1414860774602332e-06, "Finetune/Loss": 0.7692333459854126, "Finetune/Loss (Raw)": 0.7081005573272705, "Finetune/Step": 4233, "Finetune/Step Time": 2.8062005136162043} +{"Finetune/Learning Rate": 1.1384670189069635e-06, "Finetune/Loss": 0.7687802314758301, "Finetune/Loss (Raw)": 0.7665008902549744, "Finetune/Step": 4234, "Finetune/Step Time": 2.803979769349098} +{"Finetune/Learning Rate": 1.1354517171180335e-06, "Finetune/Loss": 0.7686907052993774, "Finetune/Loss (Raw)": 0.8158949613571167, "Finetune/Step": 4235, "Finetune/Step Time": 2.8020849879831076} +{"Finetune/Learning Rate": 1.1324401733717506e-06, "Finetune/Loss": 0.7701705694198608, "Finetune/Loss (Raw)": 0.9095792174339294, "Finetune/Step": 4236, "Finetune/Step Time": 2.797512037679553} +{"Finetune/Learning Rate": 1.1294323889448366e-06, "Finetune/Loss": 0.7702200412750244, "Finetune/Loss (Raw)": 0.802931547164917, "Finetune/Step": 4237, "Finetune/Step Time": 2.794926021248102} +{"Finetune/Learning Rate": 1.1264283651124087e-06, "Finetune/Loss": 0.770683765411377, "Finetune/Loss (Raw)": 0.850281834602356, "Finetune/Step": 4238, "Finetune/Step Time": 2.795391444116831} +{"Finetune/Learning Rate": 1.1234281031479943e-06, "Finetune/Loss": 0.7717041969299316, "Finetune/Loss (Raw)": 0.9542362689971924, "Finetune/Step": 4239, "Finetune/Step Time": 2.796846177428961} +{"Finetune/Learning Rate": 1.120431604323533e-06, "Finetune/Loss": 0.7715820074081421, "Finetune/Loss (Raw)": 0.7784826755523682, "Finetune/Step": 4240, "Finetune/Step Time": 2.788722598925233} +{"Finetune/Learning Rate": 1.117438869909353e-06, "Finetune/Loss": 0.7707275152206421, "Finetune/Loss (Raw)": 0.7417888045310974, "Finetune/Step": 4241, "Finetune/Step Time": 2.7900140024721622} +{"Finetune/Learning Rate": 1.114449901174204e-06, "Finetune/Loss": 0.7707957029342651, "Finetune/Loss (Raw)": 0.8104736804962158, "Finetune/Step": 4242, "Finetune/Step Time": 2.7899644933640957} +{"Finetune/Learning Rate": 1.1114646993852285e-06, "Finetune/Loss": 0.770511269569397, "Finetune/Loss (Raw)": 0.7855908870697021, "Finetune/Step": 4243, "Finetune/Step Time": 2.7908649686723948} +{"Finetune/Learning Rate": 1.1084832658079748e-06, "Finetune/Loss": 0.7703119516372681, "Finetune/Loss (Raw)": 0.8306307792663574, "Finetune/Step": 4244, "Finetune/Step Time": 2.7911682426929474} +{"Finetune/Learning Rate": 1.1055056017063936e-06, "Finetune/Loss": 0.771192193031311, "Finetune/Loss (Raw)": 0.792967677116394, "Finetune/Step": 4245, "Finetune/Step Time": 2.7906242962926626} +{"Finetune/Learning Rate": 1.1025317083428377e-06, "Finetune/Loss": 0.7701543569564819, "Finetune/Loss (Raw)": 0.7501543760299683, "Finetune/Step": 4246, "Finetune/Step Time": 2.7935655526816845} +{"Finetune/Learning Rate": 1.0995615869780651e-06, "Finetune/Loss": 0.7697558999061584, "Finetune/Loss (Raw)": 0.7857246994972229, "Finetune/Step": 4247, "Finetune/Step Time": 2.8155407905578613} +{"Finetune/Learning Rate": 1.0965952388712275e-06, "Finetune/Loss": 0.770061731338501, "Finetune/Loss (Raw)": 0.8109595775604248, "Finetune/Step": 4248, "Finetune/Step Time": 2.814299486577511} +{"Finetune/Learning Rate": 1.093632665279878e-06, "Finetune/Loss": 0.7706770896911621, "Finetune/Loss (Raw)": 0.7716843485832214, "Finetune/Step": 4249, "Finetune/Step Time": 2.8143879305571318} +{"Finetune/Learning Rate": 1.0906738674599782e-06, "Finetune/Loss": 0.771189272403717, "Finetune/Loss (Raw)": 0.8013578653335571, "Finetune/Step": 4250, "Finetune/Step Time": 2.8166015427559614} +{"Finetune/Learning Rate": 1.0877188466658794e-06, "Finetune/Loss": 0.7700642347335815, "Finetune/Loss (Raw)": 0.6980192065238953, "Finetune/Step": 4251, "Finetune/Step Time": 2.82008995115757} +{"Finetune/Learning Rate": 1.0847676041503363e-06, "Finetune/Loss": 0.7708753347396851, "Finetune/Loss (Raw)": 0.7748996615409851, "Finetune/Step": 4252, "Finetune/Step Time": 2.795499764382839} +{"Finetune/Learning Rate": 1.0818201411644992e-06, "Finetune/Loss": 0.7713425159454346, "Finetune/Loss (Raw)": 0.7859835624694824, "Finetune/Step": 4253, "Finetune/Step Time": 2.795386053621769} +{"Finetune/Learning Rate": 1.0788764589579192e-06, "Finetune/Loss": 0.7719497680664062, "Finetune/Loss (Raw)": 0.8122116923332214, "Finetune/Step": 4254, "Finetune/Step Time": 2.768605262041092} +{"Finetune/Learning Rate": 1.075936558778542e-06, "Finetune/Loss": 0.7711766362190247, "Finetune/Loss (Raw)": 0.6730139851570129, "Finetune/Step": 4255, "Finetune/Step Time": 2.7686397712677717} +{"Finetune/Learning Rate": 1.0730004418727092e-06, "Finetune/Loss": 0.7713167071342468, "Finetune/Loss (Raw)": 0.8499795794487, "Finetune/Step": 4256, "Finetune/Step Time": 2.7647013925015926} +{"Finetune/Learning Rate": 1.070068109485164e-06, "Finetune/Loss": 0.7717635631561279, "Finetune/Loss (Raw)": 0.8538931012153625, "Finetune/Step": 4257, "Finetune/Step Time": 2.762318106368184} +{"Finetune/Learning Rate": 1.0671395628590408e-06, "Finetune/Loss": 0.7719746828079224, "Finetune/Loss (Raw)": 0.8390046954154968, "Finetune/Step": 4258, "Finetune/Step Time": 2.7596603985875845} +{"Finetune/Learning Rate": 1.0642148032358645e-06, "Finetune/Loss": 0.7713943719863892, "Finetune/Loss (Raw)": 0.7630687952041626, "Finetune/Step": 4259, "Finetune/Step Time": 2.7616492230445147} +{"Finetune/Learning Rate": 1.0612938318555665e-06, "Finetune/Loss": 0.7716703414916992, "Finetune/Loss (Raw)": 0.8389931321144104, "Finetune/Step": 4260, "Finetune/Step Time": 2.76324731297791} +{"Finetune/Learning Rate": 1.0583766499564618e-06, "Finetune/Loss": 0.7702008485794067, "Finetune/Loss (Raw)": 0.6189582943916321, "Finetune/Step": 4261, "Finetune/Step Time": 2.7621644902974367} +{"Finetune/Learning Rate": 1.0554632587752634e-06, "Finetune/Loss": 0.7712537050247192, "Finetune/Loss (Raw)": 0.8740941882133484, "Finetune/Step": 4262, "Finetune/Step Time": 2.7581642661243677} +{"Finetune/Learning Rate": 1.0525536595470753e-06, "Finetune/Loss": 0.7707964181900024, "Finetune/Loss (Raw)": 0.7490999102592468, "Finetune/Step": 4263, "Finetune/Step Time": 2.758838066831231} +{"Finetune/Learning Rate": 1.0496478535053944e-06, "Finetune/Loss": 0.7701327800750732, "Finetune/Loss (Raw)": 0.790012538433075, "Finetune/Step": 4264, "Finetune/Step Time": 2.760164661332965} +{"Finetune/Learning Rate": 1.0467458418821152e-06, "Finetune/Loss": 0.7698832750320435, "Finetune/Loss (Raw)": 0.8035281300544739, "Finetune/Step": 4265, "Finetune/Step Time": 2.7597183417528868} +{"Finetune/Learning Rate": 1.0438476259075136e-06, "Finetune/Loss": 0.7701918482780457, "Finetune/Loss (Raw)": 0.8251689672470093, "Finetune/Step": 4266, "Finetune/Step Time": 2.7584923151880503} +{"Finetune/Learning Rate": 1.040953206810259e-06, "Finetune/Loss": 0.7704133987426758, "Finetune/Loss (Raw)": 0.8637790083885193, "Finetune/Step": 4267, "Finetune/Step Time": 2.7602748703211546} +{"Finetune/Learning Rate": 1.0380625858174221e-06, "Finetune/Loss": 0.771030843257904, "Finetune/Loss (Raw)": 0.8188026547431946, "Finetune/Step": 4268, "Finetune/Step Time": 2.7610374316573143} +{"Finetune/Learning Rate": 1.0351757641544446e-06, "Finetune/Loss": 0.770334005355835, "Finetune/Loss (Raw)": 0.6573746204376221, "Finetune/Step": 4269, "Finetune/Step Time": 2.763221399858594} +{"Finetune/Learning Rate": 1.0322927430451745e-06, "Finetune/Loss": 0.7745550870895386, "Finetune/Loss (Raw)": 0.8075215816497803, "Finetune/Step": 4270, "Finetune/Step Time": 2.7342923525720835} +{"Finetune/Learning Rate": 1.0294135237118396e-06, "Finetune/Loss": 0.773894190788269, "Finetune/Loss (Raw)": 0.7288431525230408, "Finetune/Step": 4271, "Finetune/Step Time": 2.735421234741807} +{"Finetune/Learning Rate": 1.026538107375059e-06, "Finetune/Loss": 0.7746909856796265, "Finetune/Loss (Raw)": 0.8054082989692688, "Finetune/Step": 4272, "Finetune/Step Time": 2.7394962310791016} +{"Finetune/Learning Rate": 1.0236664952538377e-06, "Finetune/Loss": 0.7718284726142883, "Finetune/Loss (Raw)": 0.30599457025527954, "Finetune/Step": 4273, "Finetune/Step Time": 2.7705248594284058} +{"Finetune/Learning Rate": 1.0207986885655664e-06, "Finetune/Loss": 0.7717835903167725, "Finetune/Loss (Raw)": 0.8148360252380371, "Finetune/Step": 4274, "Finetune/Step Time": 2.7733764238655567} +{"Finetune/Learning Rate": 1.017934688526032e-06, "Finetune/Loss": 0.7722936272621155, "Finetune/Loss (Raw)": 0.8370062708854675, "Finetune/Step": 4275, "Finetune/Step Time": 2.7723719347268343} +{"Finetune/Learning Rate": 1.0150744963493952e-06, "Finetune/Loss": 0.7715468406677246, "Finetune/Loss (Raw)": 0.8412112593650818, "Finetune/Step": 4276, "Finetune/Step Time": 2.7726008128374815} +{"Finetune/Learning Rate": 1.0122181132482056e-06, "Finetune/Loss": 0.771820068359375, "Finetune/Loss (Raw)": 0.8339167833328247, "Finetune/Step": 4277, "Finetune/Step Time": 2.769986718893051} +{"Finetune/Learning Rate": 1.0093655404334079e-06, "Finetune/Loss": 0.7716995477676392, "Finetune/Loss (Raw)": 0.7482326626777649, "Finetune/Step": 4278, "Finetune/Step Time": 2.769715568050742} +{"Finetune/Learning Rate": 1.006516779114316e-06, "Finetune/Loss": 0.771234929561615, "Finetune/Loss (Raw)": 0.7056553363800049, "Finetune/Step": 4279, "Finetune/Step Time": 2.7703739441931248} +{"Finetune/Learning Rate": 1.0036718304986414e-06, "Finetune/Loss": 0.7704095840454102, "Finetune/Loss (Raw)": 0.6042157411575317, "Finetune/Step": 4280, "Finetune/Step Time": 2.8020848780870438} +{"Finetune/Learning Rate": 1.0008306957924708e-06, "Finetune/Loss": 0.7709583044052124, "Finetune/Loss (Raw)": 0.8297306895256042, "Finetune/Step": 4281, "Finetune/Step Time": 2.80469636246562} +{"Finetune/Learning Rate": 9.979933762002768e-07, "Finetune/Loss": 0.7705719470977783, "Finetune/Loss (Raw)": 0.737964391708374, "Finetune/Step": 4282, "Finetune/Step Time": 2.808791970834136} +{"Finetune/Learning Rate": 9.951598729249157e-07, "Finetune/Loss": 0.7675219774246216, "Finetune/Loss (Raw)": 0.49745726585388184, "Finetune/Step": 4283, "Finetune/Step Time": 2.8318163380026817} +{"Finetune/Learning Rate": 9.923301871676227e-07, "Finetune/Loss": 0.7684634923934937, "Finetune/Loss (Raw)": 0.7110202312469482, "Finetune/Step": 4284, "Finetune/Step Time": 2.8097510281950235} +{"Finetune/Learning Rate": 9.895043201280208e-07, "Finetune/Loss": 0.7693372368812561, "Finetune/Loss (Raw)": 0.7226759791374207, "Finetune/Step": 4285, "Finetune/Step Time": 2.787454828619957} +{"Finetune/Learning Rate": 9.86682273004107e-07, "Finetune/Loss": 0.7687656283378601, "Finetune/Loss (Raw)": 0.7765051126480103, "Finetune/Step": 4286, "Finetune/Step Time": 2.788044946268201} +{"Finetune/Learning Rate": 9.83864046992259e-07, "Finetune/Loss": 0.7694472074508667, "Finetune/Loss (Raw)": 0.8096737265586853, "Finetune/Step": 4287, "Finetune/Step Time": 2.7894484251737595} +{"Finetune/Learning Rate": 9.810496432872441e-07, "Finetune/Loss": 0.7699809670448303, "Finetune/Loss (Raw)": 0.8361834287643433, "Finetune/Step": 4288, "Finetune/Step Time": 2.7880559898912907} +{"Finetune/Learning Rate": 9.782390630821981e-07, "Finetune/Loss": 0.7707252502441406, "Finetune/Loss (Raw)": 0.8789021968841553, "Finetune/Step": 4289, "Finetune/Step Time": 2.788660693913698} +{"Finetune/Learning Rate": 9.754323075686422e-07, "Finetune/Loss": 0.7701550722122192, "Finetune/Loss (Raw)": 0.7826064825057983, "Finetune/Step": 4290, "Finetune/Step Time": 2.7880792170763016} +{"Finetune/Learning Rate": 9.726293779364726e-07, "Finetune/Loss": 0.77001953125, "Finetune/Loss (Raw)": 0.7774444818496704, "Finetune/Step": 4291, "Finetune/Step Time": 2.7892864923924208} +{"Finetune/Learning Rate": 9.698302753739664e-07, "Finetune/Loss": 0.7701531648635864, "Finetune/Loss (Raw)": 0.7930364012718201, "Finetune/Step": 4292, "Finetune/Step Time": 2.789132161065936} +{"Finetune/Learning Rate": 9.670350010677764e-07, "Finetune/Loss": 0.7667580246925354, "Finetune/Loss (Raw)": 0.35701560974121094, "Finetune/Step": 4293, "Finetune/Step Time": 2.817033786326647} +{"Finetune/Learning Rate": 9.642435562029339e-07, "Finetune/Loss": 0.7664300799369812, "Finetune/Loss (Raw)": 0.6804183125495911, "Finetune/Step": 4294, "Finetune/Step Time": 2.8200017027556896} +{"Finetune/Learning Rate": 9.614559419628433e-07, "Finetune/Loss": 0.7673673629760742, "Finetune/Loss (Raw)": 0.8274465799331665, "Finetune/Step": 4295, "Finetune/Step Time": 2.814755341038108} +{"Finetune/Learning Rate": 9.586721595292937e-07, "Finetune/Loss": 0.7655327320098877, "Finetune/Loss (Raw)": 0.6691265106201172, "Finetune/Step": 4296, "Finetune/Step Time": 2.8047293201088905} +{"Finetune/Learning Rate": 9.558922100824364e-07, "Finetune/Loss": 0.7651172876358032, "Finetune/Loss (Raw)": 0.8151110410690308, "Finetune/Step": 4297, "Finetune/Step Time": 2.80239475145936} +{"Finetune/Learning Rate": 9.5311609480081e-07, "Finetune/Loss": 0.7649476528167725, "Finetune/Loss (Raw)": 0.7383619546890259, "Finetune/Step": 4298, "Finetune/Step Time": 2.8031047750264406} +{"Finetune/Learning Rate": 9.503438148613208e-07, "Finetune/Loss": 0.7656270265579224, "Finetune/Loss (Raw)": 0.8366571664810181, "Finetune/Step": 4299, "Finetune/Step Time": 2.799228623509407} +{"Finetune/Learning Rate": 9.475753714392522e-07, "Finetune/Loss": 0.7659465670585632, "Finetune/Loss (Raw)": 0.7787138819694519, "Finetune/Step": 4300, "Finetune/Step Time": 2.797906093299389} +{"Finetune/Learning Rate": 9.448107657082594e-07, "Finetune/Loss": 0.7674815058708191, "Finetune/Loss (Raw)": 0.8404061198234558, "Finetune/Step": 4301, "Finetune/Step Time": 2.7745524141937494} +{"Finetune/Learning Rate": 9.420499988403686e-07, "Finetune/Loss": 0.7682815790176392, "Finetune/Loss (Raw)": 0.8313269019126892, "Finetune/Step": 4302, "Finetune/Step Time": 2.7766069937497377} +{"Finetune/Learning Rate": 9.392930720059878e-07, "Finetune/Loss": 0.7681819200515747, "Finetune/Loss (Raw)": 0.8526390790939331, "Finetune/Step": 4303, "Finetune/Step Time": 2.7761502861976624} +{"Finetune/Learning Rate": 9.365399863738834e-07, "Finetune/Loss": 0.7689759731292725, "Finetune/Loss (Raw)": 0.7572361826896667, "Finetune/Step": 4304, "Finetune/Step Time": 2.7754588276147842} +{"Finetune/Learning Rate": 9.337907431112026e-07, "Finetune/Loss": 0.7695190906524658, "Finetune/Loss (Raw)": 0.7894792556762695, "Finetune/Step": 4305, "Finetune/Step Time": 2.7748592142015696} +{"Finetune/Learning Rate": 9.310453433834654e-07, "Finetune/Loss": 0.7649217844009399, "Finetune/Loss (Raw)": 0.2321651428937912, "Finetune/Step": 4306, "Finetune/Step Time": 2.8035161402076483} +{"Finetune/Learning Rate": 9.283037883545521e-07, "Finetune/Loss": 0.7649562358856201, "Finetune/Loss (Raw)": 0.8059269785881042, "Finetune/Step": 4307, "Finetune/Step Time": 2.8029457218945026} +{"Finetune/Learning Rate": 9.255660791867238e-07, "Finetune/Loss": 0.7659571766853333, "Finetune/Loss (Raw)": 0.8224644660949707, "Finetune/Step": 4308, "Finetune/Step Time": 2.8035515677183867} +{"Finetune/Learning Rate": 9.228322170406057e-07, "Finetune/Loss": 0.7657446265220642, "Finetune/Loss (Raw)": 0.7992911338806152, "Finetune/Step": 4309, "Finetune/Step Time": 2.8055358193814754} +{"Finetune/Learning Rate": 9.201022030751938e-07, "Finetune/Loss": 0.7669785022735596, "Finetune/Loss (Raw)": 0.9104312658309937, "Finetune/Step": 4310, "Finetune/Step Time": 2.803732179105282} +{"Finetune/Learning Rate": 9.173760384478502e-07, "Finetune/Loss": 0.7667773962020874, "Finetune/Loss (Raw)": 0.8326923251152039, "Finetune/Step": 4311, "Finetune/Step Time": 2.799638532102108} +{"Finetune/Learning Rate": 9.146537243143072e-07, "Finetune/Loss": 0.7661454081535339, "Finetune/Loss (Raw)": 0.7920063138008118, "Finetune/Step": 4312, "Finetune/Step Time": 2.8000083658844233} +{"Finetune/Learning Rate": 9.119352618286681e-07, "Finetune/Loss": 0.7646684050559998, "Finetune/Loss (Raw)": 0.6992385983467102, "Finetune/Step": 4313, "Finetune/Step Time": 2.8016219828277826} +{"Finetune/Learning Rate": 9.092206521433956e-07, "Finetune/Loss": 0.7652304172515869, "Finetune/Loss (Raw)": 0.8273624181747437, "Finetune/Step": 4314, "Finetune/Step Time": 2.801522048190236} +{"Finetune/Learning Rate": 9.065098964093233e-07, "Finetune/Loss": 0.7642086744308472, "Finetune/Loss (Raw)": 0.7178305387496948, "Finetune/Step": 4315, "Finetune/Step Time": 2.807328885421157} +{"Finetune/Learning Rate": 9.038029957756534e-07, "Finetune/Loss": 0.7642801403999329, "Finetune/Loss (Raw)": 0.8613415956497192, "Finetune/Step": 4316, "Finetune/Step Time": 2.8068901374936104} +{"Finetune/Learning Rate": 9.010999513899499e-07, "Finetune/Loss": 0.7643775343894958, "Finetune/Loss (Raw)": 0.836396336555481, "Finetune/Step": 4317, "Finetune/Step Time": 2.8071440402418375} +{"Finetune/Learning Rate": 8.984007643981441e-07, "Finetune/Loss": 0.7648561000823975, "Finetune/Loss (Raw)": 0.7970435619354248, "Finetune/Step": 4318, "Finetune/Step Time": 2.8035048712044954} +{"Finetune/Learning Rate": 8.957054359445294e-07, "Finetune/Loss": 0.7658483982086182, "Finetune/Loss (Raw)": 0.8537035584449768, "Finetune/Step": 4319, "Finetune/Step Time": 2.7852877471596003} +{"Finetune/Learning Rate": 8.930139671717675e-07, "Finetune/Loss": 0.765560507774353, "Finetune/Loss (Raw)": 0.7199477553367615, "Finetune/Step": 4320, "Finetune/Step Time": 2.7819679994136095} +{"Finetune/Learning Rate": 8.903263592208789e-07, "Finetune/Loss": 0.7617939710617065, "Finetune/Loss (Raw)": 0.26948827505111694, "Finetune/Step": 4321, "Finetune/Step Time": 2.815634485334158} +{"Finetune/Learning Rate": 8.876426132312521e-07, "Finetune/Loss": 0.7621340155601501, "Finetune/Loss (Raw)": 0.8235911130905151, "Finetune/Step": 4322, "Finetune/Step Time": 2.8186143934726715} +{"Finetune/Learning Rate": 8.849627303406327e-07, "Finetune/Loss": 0.7627866864204407, "Finetune/Loss (Raw)": 0.7828308939933777, "Finetune/Step": 4323, "Finetune/Step Time": 2.8200669642537832} +{"Finetune/Learning Rate": 8.822867116851397e-07, "Finetune/Loss": 0.7626686096191406, "Finetune/Loss (Raw)": 0.773319661617279, "Finetune/Step": 4324, "Finetune/Step Time": 2.8168680388480425} +{"Finetune/Learning Rate": 8.796145583992366e-07, "Finetune/Loss": 0.7628430128097534, "Finetune/Loss (Raw)": 0.7968900799751282, "Finetune/Step": 4325, "Finetune/Step Time": 2.8171585761010647} +{"Finetune/Learning Rate": 8.769462716157651e-07, "Finetune/Loss": 0.7624309659004211, "Finetune/Loss (Raw)": 0.699089765548706, "Finetune/Step": 4326, "Finetune/Step Time": 2.8208174612373114} +{"Finetune/Learning Rate": 8.742818524659181e-07, "Finetune/Loss": 0.7633731365203857, "Finetune/Loss (Raw)": 0.8069546818733215, "Finetune/Step": 4327, "Finetune/Step Time": 2.8218016531318426} +{"Finetune/Learning Rate": 8.716213020792508e-07, "Finetune/Loss": 0.7640267610549927, "Finetune/Loss (Raw)": 0.7880978584289551, "Finetune/Step": 4328, "Finetune/Step Time": 2.820805534720421} +{"Finetune/Learning Rate": 8.689646215836789e-07, "Finetune/Loss": 0.7641001343727112, "Finetune/Loss (Raw)": 0.7810186743736267, "Finetune/Step": 4329, "Finetune/Step Time": 2.8249129112809896} +{"Finetune/Learning Rate": 8.663118121054759e-07, "Finetune/Loss": 0.7646608352661133, "Finetune/Loss (Raw)": 0.7781965732574463, "Finetune/Step": 4330, "Finetune/Step Time": 2.826739203184843} +{"Finetune/Learning Rate": 8.63662874769281e-07, "Finetune/Loss": 0.7647354602813721, "Finetune/Loss (Raw)": 0.8189868330955505, "Finetune/Step": 4331, "Finetune/Step Time": 2.8298023883253336} +{"Finetune/Learning Rate": 8.610178106980816e-07, "Finetune/Loss": 0.7693880796432495, "Finetune/Loss (Raw)": 0.832861065864563, "Finetune/Step": 4332, "Finetune/Step Time": 2.789546921849251} +{"Finetune/Learning Rate": 8.583766210132272e-07, "Finetune/Loss": 0.7687640190124512, "Finetune/Loss (Raw)": 0.7227036356925964, "Finetune/Step": 4333, "Finetune/Step Time": 2.809125754982233} +{"Finetune/Learning Rate": 8.557393068344311e-07, "Finetune/Loss": 0.76900315284729, "Finetune/Loss (Raw)": 0.8554913997650146, "Finetune/Step": 4334, "Finetune/Step Time": 2.8083783388137817} +{"Finetune/Learning Rate": 8.531058692797511e-07, "Finetune/Loss": 0.7697176933288574, "Finetune/Loss (Raw)": 0.8663181066513062, "Finetune/Step": 4335, "Finetune/Step Time": 2.8100211564451456} +{"Finetune/Learning Rate": 8.504763094656133e-07, "Finetune/Loss": 0.7702814340591431, "Finetune/Loss (Raw)": 0.8754268884658813, "Finetune/Step": 4336, "Finetune/Step Time": 2.8189867716282606} +{"Finetune/Learning Rate": 8.478506285067944e-07, "Finetune/Loss": 0.7696859836578369, "Finetune/Loss (Raw)": 0.7323035597801208, "Finetune/Step": 4337, "Finetune/Step Time": 2.8188406843692064} +{"Finetune/Learning Rate": 8.452288275164266e-07, "Finetune/Loss": 0.7695927619934082, "Finetune/Loss (Raw)": 0.8273394107818604, "Finetune/Step": 4338, "Finetune/Step Time": 2.8188584595918655} +{"Finetune/Learning Rate": 8.426109076059974e-07, "Finetune/Loss": 0.7690556049346924, "Finetune/Loss (Raw)": 0.7998412251472473, "Finetune/Step": 4339, "Finetune/Step Time": 2.814847035333514} +{"Finetune/Learning Rate": 8.3999686988535e-07, "Finetune/Loss": 0.7690587639808655, "Finetune/Loss (Raw)": 0.725249171257019, "Finetune/Step": 4340, "Finetune/Step Time": 2.813844323158264} +{"Finetune/Learning Rate": 8.373867154626836e-07, "Finetune/Loss": 0.7697654962539673, "Finetune/Loss (Raw)": 0.9155449271202087, "Finetune/Step": 4341, "Finetune/Step Time": 2.8116367030888796} +{"Finetune/Learning Rate": 8.347804454445463e-07, "Finetune/Loss": 0.7695948481559753, "Finetune/Loss (Raw)": 0.7820256352424622, "Finetune/Step": 4342, "Finetune/Step Time": 2.808220561593771} +{"Finetune/Learning Rate": 8.321780609358399e-07, "Finetune/Loss": 0.7694985866546631, "Finetune/Loss (Raw)": 0.7842040061950684, "Finetune/Step": 4343, "Finetune/Step Time": 2.806633934378624} +{"Finetune/Learning Rate": 8.295795630398263e-07, "Finetune/Loss": 0.7691818475723267, "Finetune/Loss (Raw)": 0.8337926268577576, "Finetune/Step": 4344, "Finetune/Step Time": 2.8092476967722178} +{"Finetune/Learning Rate": 8.26984952858112e-07, "Finetune/Loss": 0.7695971727371216, "Finetune/Loss (Raw)": 0.7510923147201538, "Finetune/Step": 4345, "Finetune/Step Time": 2.8053407594561577} +{"Finetune/Learning Rate": 8.243942314906572e-07, "Finetune/Loss": 0.7706190347671509, "Finetune/Loss (Raw)": 0.8647855520248413, "Finetune/Step": 4346, "Finetune/Step Time": 2.8059031069278717} +{"Finetune/Learning Rate": 8.218074000357745e-07, "Finetune/Loss": 0.7705467939376831, "Finetune/Loss (Raw)": 0.7543410658836365, "Finetune/Step": 4347, "Finetune/Step Time": 2.8053161315619946} +{"Finetune/Learning Rate": 8.192244595901266e-07, "Finetune/Loss": 0.7693201899528503, "Finetune/Loss (Raw)": 0.6763997673988342, "Finetune/Step": 4348, "Finetune/Step Time": 2.827338246628642} +{"Finetune/Learning Rate": 8.166454112487287e-07, "Finetune/Loss": 0.7694708108901978, "Finetune/Loss (Raw)": 0.7504931092262268, "Finetune/Step": 4349, "Finetune/Step Time": 2.832870326936245} +{"Finetune/Learning Rate": 8.140702561049408e-07, "Finetune/Loss": 0.7684042453765869, "Finetune/Loss (Raw)": 0.7213312983512878, "Finetune/Step": 4350, "Finetune/Step Time": 2.842092551290989} +{"Finetune/Learning Rate": 8.114989952504804e-07, "Finetune/Loss": 0.7703925371170044, "Finetune/Loss (Raw)": 0.9520230889320374, "Finetune/Step": 4351, "Finetune/Step Time": 2.840981127694249} +{"Finetune/Learning Rate": 8.089316297754079e-07, "Finetune/Loss": 0.7704806923866272, "Finetune/Loss (Raw)": 0.7611004710197449, "Finetune/Step": 4352, "Finetune/Step Time": 2.837976798415184} +{"Finetune/Learning Rate": 8.063681607681318e-07, "Finetune/Loss": 0.7711219191551208, "Finetune/Loss (Raw)": 0.8783493638038635, "Finetune/Step": 4353, "Finetune/Step Time": 2.838295442983508} +{"Finetune/Learning Rate": 8.038085893154135e-07, "Finetune/Loss": 0.7714453935623169, "Finetune/Loss (Raw)": 0.830051839351654, "Finetune/Step": 4354, "Finetune/Step Time": 2.8362499121576548} +{"Finetune/Learning Rate": 8.012529165023586e-07, "Finetune/Loss": 0.7713801264762878, "Finetune/Loss (Raw)": 0.8040226697921753, "Finetune/Step": 4355, "Finetune/Step Time": 2.836697267368436} +{"Finetune/Learning Rate": 7.987011434124203e-07, "Finetune/Loss": 0.7735812067985535, "Finetune/Loss (Raw)": 0.7003130912780762, "Finetune/Step": 4356, "Finetune/Step Time": 2.8079953771084547} +{"Finetune/Learning Rate": 7.961532711274e-07, "Finetune/Loss": 0.7739209532737732, "Finetune/Loss (Raw)": 0.7436097860336304, "Finetune/Step": 4357, "Finetune/Step Time": 2.799394767731428} +{"Finetune/Learning Rate": 7.936093007274426e-07, "Finetune/Loss": 0.7739582061767578, "Finetune/Loss (Raw)": 0.7659900188446045, "Finetune/Step": 4358, "Finetune/Step Time": 2.79934767074883} +{"Finetune/Learning Rate": 7.910692332910452e-07, "Finetune/Loss": 0.773676872253418, "Finetune/Loss (Raw)": 0.7549157738685608, "Finetune/Step": 4359, "Finetune/Step Time": 2.7979756742715836} +{"Finetune/Learning Rate": 7.885330698950411e-07, "Finetune/Loss": 0.7729871869087219, "Finetune/Loss (Raw)": 0.7369207739830017, "Finetune/Step": 4360, "Finetune/Step Time": 2.798713181167841} +{"Finetune/Learning Rate": 7.860008116146122e-07, "Finetune/Loss": 0.769235372543335, "Finetune/Loss (Raw)": 0.22787687182426453, "Finetune/Step": 4361, "Finetune/Step Time": 2.826576467603445} +{"Finetune/Learning Rate": 7.834724595232912e-07, "Finetune/Loss": 0.7694276571273804, "Finetune/Loss (Raw)": 0.791110098361969, "Finetune/Step": 4362, "Finetune/Step Time": 2.827546676620841} +{"Finetune/Learning Rate": 7.809480146929438e-07, "Finetune/Loss": 0.7700656652450562, "Finetune/Loss (Raw)": 0.8975631594657898, "Finetune/Step": 4363, "Finetune/Step Time": 2.8304960802197456} +{"Finetune/Learning Rate": 7.784274781937884e-07, "Finetune/Loss": 0.7694684267044067, "Finetune/Loss (Raw)": 0.8331325054168701, "Finetune/Step": 4364, "Finetune/Step Time": 2.831683998927474} +{"Finetune/Learning Rate": 7.759108510943825e-07, "Finetune/Loss": 0.7693312168121338, "Finetune/Loss (Raw)": 0.7853642106056213, "Finetune/Step": 4365, "Finetune/Step Time": 2.8314462080597878} +{"Finetune/Learning Rate": 7.73398134461626e-07, "Finetune/Loss": 0.7692611217498779, "Finetune/Loss (Raw)": 0.8413150310516357, "Finetune/Step": 4366, "Finetune/Step Time": 2.8285113628953695} +{"Finetune/Learning Rate": 7.708893293607611e-07, "Finetune/Loss": 0.7683391571044922, "Finetune/Loss (Raw)": 0.8362240791320801, "Finetune/Step": 4367, "Finetune/Step Time": 2.827414248138666} +{"Finetune/Learning Rate": 7.683844368553728e-07, "Finetune/Loss": 0.7679682970046997, "Finetune/Loss (Raw)": 0.7310101389884949, "Finetune/Step": 4368, "Finetune/Step Time": 2.822738464921713} +{"Finetune/Learning Rate": 7.658834580073904e-07, "Finetune/Loss": 0.7671185731887817, "Finetune/Loss (Raw)": 0.6330230236053467, "Finetune/Step": 4369, "Finetune/Step Time": 2.844916244968772} +{"Finetune/Learning Rate": 7.633863938770747e-07, "Finetune/Loss": 0.7657095193862915, "Finetune/Loss (Raw)": 0.6301134824752808, "Finetune/Step": 4370, "Finetune/Step Time": 2.869406506419182} +{"Finetune/Learning Rate": 7.608932455230344e-07, "Finetune/Loss": 0.7661826014518738, "Finetune/Loss (Raw)": 0.846147358417511, "Finetune/Step": 4371, "Finetune/Step Time": 2.8711136151105165} +{"Finetune/Learning Rate": 7.584040140022197e-07, "Finetune/Loss": 0.7652065753936768, "Finetune/Loss (Raw)": 0.705695390701294, "Finetune/Step": 4372, "Finetune/Step Time": 2.8706508968025446} +{"Finetune/Learning Rate": 7.559187003699153e-07, "Finetune/Loss": 0.764679491519928, "Finetune/Loss (Raw)": 0.7255048155784607, "Finetune/Step": 4373, "Finetune/Step Time": 2.8720971569418907} +{"Finetune/Learning Rate": 7.534373056797451e-07, "Finetune/Loss": 0.765274167060852, "Finetune/Loss (Raw)": 0.8262735605239868, "Finetune/Step": 4374, "Finetune/Step Time": 2.8703845478594303} +{"Finetune/Learning Rate": 7.509598309836763e-07, "Finetune/Loss": 0.7648343443870544, "Finetune/Loss (Raw)": 0.7294282913208008, "Finetune/Step": 4375, "Finetune/Step Time": 2.847706224769354} +{"Finetune/Learning Rate": 7.48486277332009e-07, "Finetune/Loss": 0.7646160125732422, "Finetune/Loss (Raw)": 0.7830114960670471, "Finetune/Step": 4376, "Finetune/Step Time": 2.852882541716099} +{"Finetune/Learning Rate": 7.460166457733831e-07, "Finetune/Loss": 0.7644377946853638, "Finetune/Loss (Raw)": 0.7488638162612915, "Finetune/Step": 4377, "Finetune/Step Time": 2.857614226639271} +{"Finetune/Learning Rate": 7.435509373547756e-07, "Finetune/Loss": 0.7641133069992065, "Finetune/Loss (Raw)": 0.7598341107368469, "Finetune/Step": 4378, "Finetune/Step Time": 2.856022333726287} +{"Finetune/Learning Rate": 7.410891531215026e-07, "Finetune/Loss": 0.7648818492889404, "Finetune/Loss (Raw)": 0.7963860034942627, "Finetune/Step": 4379, "Finetune/Step Time": 2.855673484504223} +{"Finetune/Learning Rate": 7.386312941172158e-07, "Finetune/Loss": 0.764999270439148, "Finetune/Loss (Raw)": 0.7899296879768372, "Finetune/Step": 4380, "Finetune/Step Time": 2.8585504107177258} +{"Finetune/Learning Rate": 7.361773613838963e-07, "Finetune/Loss": 0.7656991481781006, "Finetune/Loss (Raw)": 0.8755718469619751, "Finetune/Step": 4381, "Finetune/Step Time": 2.8589833341538906} +{"Finetune/Learning Rate": 7.337273559618707e-07, "Finetune/Loss": 0.7645434737205505, "Finetune/Loss (Raw)": 0.6642860770225525, "Finetune/Step": 4382, "Finetune/Step Time": 2.8608411606401205} +{"Finetune/Learning Rate": 7.312812788897939e-07, "Finetune/Loss": 0.7644309997558594, "Finetune/Loss (Raw)": 0.6586135029792786, "Finetune/Step": 4383, "Finetune/Step Time": 2.8609554395079613} +{"Finetune/Learning Rate": 7.288391312046583e-07, "Finetune/Loss": 0.7629896998405457, "Finetune/Loss (Raw)": 0.6654928922653198, "Finetune/Step": 4384, "Finetune/Step Time": 2.8669152539223433} +{"Finetune/Learning Rate": 7.264009139417893e-07, "Finetune/Loss": 0.7623578310012817, "Finetune/Loss (Raw)": 0.7730156183242798, "Finetune/Step": 4385, "Finetune/Step Time": 2.8688576575368643} +{"Finetune/Learning Rate": 7.239666281348445e-07, "Finetune/Loss": 0.7621468901634216, "Finetune/Loss (Raw)": 0.8120030164718628, "Finetune/Step": 4386, "Finetune/Step Time": 2.8674498219043016} +{"Finetune/Learning Rate": 7.215362748158228e-07, "Finetune/Loss": 0.7629768252372742, "Finetune/Loss (Raw)": 0.8693004846572876, "Finetune/Step": 4387, "Finetune/Step Time": 2.867015091702342} +{"Finetune/Learning Rate": 7.191098550150433e-07, "Finetune/Loss": 0.7632080912590027, "Finetune/Loss (Raw)": 0.8685941100120544, "Finetune/Step": 4388, "Finetune/Step Time": 2.8673742208629847} +{"Finetune/Learning Rate": 7.166873697611654e-07, "Finetune/Loss": 0.7644612789154053, "Finetune/Loss (Raw)": 0.7793686985969543, "Finetune/Step": 4389, "Finetune/Step Time": 2.867043238133192} +{"Finetune/Learning Rate": 7.14268820081182e-07, "Finetune/Loss": 0.7634507417678833, "Finetune/Loss (Raw)": 0.7447429299354553, "Finetune/Step": 4390, "Finetune/Step Time": 2.8685260750353336} +{"Finetune/Learning Rate": 7.118542070004108e-07, "Finetune/Loss": 0.7635773420333862, "Finetune/Loss (Raw)": 0.7653124928474426, "Finetune/Step": 4391, "Finetune/Step Time": 2.867852922528982} +{"Finetune/Learning Rate": 7.094435315425086e-07, "Finetune/Loss": 0.7635706663131714, "Finetune/Loss (Raw)": 0.7891525030136108, "Finetune/Step": 4392, "Finetune/Step Time": 2.8803037013858557} +{"Finetune/Learning Rate": 7.070367947294554e-07, "Finetune/Loss": 0.7628622651100159, "Finetune/Loss (Raw)": 0.7128525376319885, "Finetune/Step": 4393, "Finetune/Step Time": 2.881486674770713} +{"Finetune/Learning Rate": 7.046339975815675e-07, "Finetune/Loss": 0.7626673579216003, "Finetune/Loss (Raw)": 0.8002185225486755, "Finetune/Step": 4394, "Finetune/Step Time": 2.8822326231747866} +{"Finetune/Learning Rate": 7.022351411174866e-07, "Finetune/Loss": 0.7621450424194336, "Finetune/Loss (Raw)": 0.7969275116920471, "Finetune/Step": 4395, "Finetune/Step Time": 2.8800700809806585} +{"Finetune/Learning Rate": 6.998402263541848e-07, "Finetune/Loss": 0.7612324953079224, "Finetune/Loss (Raw)": 0.7019919157028198, "Finetune/Step": 4396, "Finetune/Step Time": 2.88012583181262} +{"Finetune/Learning Rate": 6.974492543069677e-07, "Finetune/Loss": 0.7630525827407837, "Finetune/Loss (Raw)": 0.8903453946113586, "Finetune/Step": 4397, "Finetune/Step Time": 2.8791180104017258} +{"Finetune/Learning Rate": 6.950622259894624e-07, "Finetune/Loss": 0.7624938488006592, "Finetune/Loss (Raw)": 0.7360097169876099, "Finetune/Step": 4398, "Finetune/Step Time": 2.8803653307259083} +{"Finetune/Learning Rate": 6.926791424136259e-07, "Finetune/Loss": 0.7634904384613037, "Finetune/Loss (Raw)": 0.8564079403877258, "Finetune/Step": 4399, "Finetune/Step Time": 2.8805323783308268} +{"Finetune/Learning Rate": 6.903000045897478e-07, "Finetune/Loss": 0.7633065581321716, "Finetune/Loss (Raw)": 0.7818630337715149, "Finetune/Step": 4400, "Finetune/Step Time": 2.88012589327991} +{"Finetune/Learning Rate": 6.879248135264394e-07, "Finetune/Loss": 0.7676928639411926, "Finetune/Loss (Raw)": 0.8674505949020386, "Finetune/Step": 4401, "Finetune/Step Time": 2.845933483913541} +{"Finetune/Learning Rate": 6.855535702306426e-07, "Finetune/Loss": 0.7669329047203064, "Finetune/Loss (Raw)": 0.717555820941925, "Finetune/Step": 4402, "Finetune/Step Time": 2.8435907680541277} +{"Finetune/Learning Rate": 6.831862757076224e-07, "Finetune/Loss": 0.766911506652832, "Finetune/Loss (Raw)": 0.8342711329460144, "Finetune/Step": 4403, "Finetune/Step Time": 2.842281185090542} +{"Finetune/Learning Rate": 6.808229309609704e-07, "Finetune/Loss": 0.7672363519668579, "Finetune/Loss (Raw)": 0.882785975933075, "Finetune/Step": 4404, "Finetune/Step Time": 2.8460400458425283} +{"Finetune/Learning Rate": 6.784635369926073e-07, "Finetune/Loss": 0.7676178216934204, "Finetune/Loss (Raw)": 0.8827469348907471, "Finetune/Step": 4405, "Finetune/Step Time": 2.8497688621282578} +{"Finetune/Learning Rate": 6.761080948027721e-07, "Finetune/Loss": 0.7668932676315308, "Finetune/Loss (Raw)": 0.6554962396621704, "Finetune/Step": 4406, "Finetune/Step Time": 2.873837873339653} +{"Finetune/Learning Rate": 6.737566053900368e-07, "Finetune/Loss": 0.7678707838058472, "Finetune/Loss (Raw)": 0.830775260925293, "Finetune/Step": 4407, "Finetune/Step Time": 2.870678948238492} +{"Finetune/Learning Rate": 6.714090697512943e-07, "Finetune/Loss": 0.7697632908821106, "Finetune/Loss (Raw)": 0.8464506268501282, "Finetune/Step": 4408, "Finetune/Step Time": 2.838590458035469} +{"Finetune/Learning Rate": 6.690654888817538e-07, "Finetune/Loss": 0.7692981362342834, "Finetune/Loss (Raw)": 0.7701975107192993, "Finetune/Step": 4409, "Finetune/Step Time": 2.8343500439077616} +{"Finetune/Learning Rate": 6.667258637749597e-07, "Finetune/Loss": 0.7694822549819946, "Finetune/Loss (Raw)": 0.7615299224853516, "Finetune/Step": 4410, "Finetune/Step Time": 2.830915091559291} +{"Finetune/Learning Rate": 6.643901954227738e-07, "Finetune/Loss": 0.7711759209632874, "Finetune/Loss (Raw)": 0.7142476439476013, "Finetune/Step": 4411, "Finetune/Step Time": 2.8103707805275917} +{"Finetune/Learning Rate": 6.620584848153811e-07, "Finetune/Loss": 0.77133709192276, "Finetune/Loss (Raw)": 0.7316467761993408, "Finetune/Step": 4412, "Finetune/Step Time": 2.8073353972285986} +{"Finetune/Learning Rate": 6.597307329412872e-07, "Finetune/Loss": 0.7730337381362915, "Finetune/Loss (Raw)": 0.9398439526557922, "Finetune/Step": 4413, "Finetune/Step Time": 2.8051989879459143} +{"Finetune/Learning Rate": 6.574069407873196e-07, "Finetune/Loss": 0.7726936340332031, "Finetune/Loss (Raw)": 0.732972264289856, "Finetune/Step": 4414, "Finetune/Step Time": 2.804774446412921} +{"Finetune/Learning Rate": 6.550871093386335e-07, "Finetune/Loss": 0.7728781700134277, "Finetune/Loss (Raw)": 0.8333005309104919, "Finetune/Step": 4415, "Finetune/Step Time": 2.8044158909469843} +{"Finetune/Learning Rate": 6.527712395786956e-07, "Finetune/Loss": 0.7722454071044922, "Finetune/Loss (Raw)": 0.7551847696304321, "Finetune/Step": 4416, "Finetune/Step Time": 2.803823783993721} +{"Finetune/Learning Rate": 6.50459332489296e-07, "Finetune/Loss": 0.7714041471481323, "Finetune/Loss (Raw)": 0.771221399307251, "Finetune/Step": 4417, "Finetune/Step Time": 2.804115440696478} +{"Finetune/Learning Rate": 6.481513890505519e-07, "Finetune/Loss": 0.7717938423156738, "Finetune/Loss (Raw)": 0.8324841260910034, "Finetune/Step": 4418, "Finetune/Step Time": 2.8072927556931973} +{"Finetune/Learning Rate": 6.458474102408873e-07, "Finetune/Loss": 0.7721673250198364, "Finetune/Loss (Raw)": 0.8252553939819336, "Finetune/Step": 4419, "Finetune/Step Time": 2.805666720494628} +{"Finetune/Learning Rate": 6.435473970370576e-07, "Finetune/Loss": 0.7711629867553711, "Finetune/Loss (Raw)": 0.6644772291183472, "Finetune/Step": 4420, "Finetune/Step Time": 2.8270669784396887} +{"Finetune/Learning Rate": 6.412513504141316e-07, "Finetune/Loss": 0.7749872803688049, "Finetune/Loss (Raw)": 0.8465253114700317, "Finetune/Step": 4421, "Finetune/Step Time": 2.7966486178338528} +{"Finetune/Learning Rate": 6.389592713454951e-07, "Finetune/Loss": 0.7767430543899536, "Finetune/Loss (Raw)": 0.9051593542098999, "Finetune/Step": 4422, "Finetune/Step Time": 2.801340851932764} +{"Finetune/Learning Rate": 6.366711608028542e-07, "Finetune/Loss": 0.7762899398803711, "Finetune/Loss (Raw)": 0.7694571614265442, "Finetune/Step": 4423, "Finetune/Step Time": 2.801418384537101} +{"Finetune/Learning Rate": 6.343870197562307e-07, "Finetune/Loss": 0.7766427993774414, "Finetune/Loss (Raw)": 0.7142897844314575, "Finetune/Step": 4424, "Finetune/Step Time": 2.8072115983814} +{"Finetune/Learning Rate": 6.321068491739701e-07, "Finetune/Loss": 0.776374340057373, "Finetune/Loss (Raw)": 0.7807462811470032, "Finetune/Step": 4425, "Finetune/Step Time": 2.81030135974288} +{"Finetune/Learning Rate": 6.298306500227236e-07, "Finetune/Loss": 0.7768029570579529, "Finetune/Loss (Raw)": 0.7932239770889282, "Finetune/Step": 4426, "Finetune/Step Time": 2.8139610681682825} +{"Finetune/Learning Rate": 6.275584232674659e-07, "Finetune/Loss": 0.7765569090843201, "Finetune/Loss (Raw)": 0.8051624298095703, "Finetune/Step": 4427, "Finetune/Step Time": 2.814965793862939} +{"Finetune/Learning Rate": 6.252901698714886e-07, "Finetune/Loss": 0.7765474319458008, "Finetune/Loss (Raw)": 0.7775065302848816, "Finetune/Step": 4428, "Finetune/Step Time": 2.817490641027689} +{"Finetune/Learning Rate": 6.230258907963949e-07, "Finetune/Loss": 0.7760621309280396, "Finetune/Loss (Raw)": 0.7782814502716064, "Finetune/Step": 4429, "Finetune/Step Time": 2.822717510163784} +{"Finetune/Learning Rate": 6.207655870021057e-07, "Finetune/Loss": 0.7754348516464233, "Finetune/Loss (Raw)": 0.7510417699813843, "Finetune/Step": 4430, "Finetune/Step Time": 2.8206224404275417} +{"Finetune/Learning Rate": 6.185092594468545e-07, "Finetune/Loss": 0.7752952575683594, "Finetune/Loss (Raw)": 0.8347613215446472, "Finetune/Step": 4431, "Finetune/Step Time": 2.819999258965254} +{"Finetune/Learning Rate": 6.162569090871917e-07, "Finetune/Loss": 0.7757075428962708, "Finetune/Loss (Raw)": 0.8100120425224304, "Finetune/Step": 4432, "Finetune/Step Time": 2.820833181962371} +{"Finetune/Learning Rate": 6.140085368779791e-07, "Finetune/Loss": 0.7754127979278564, "Finetune/Loss (Raw)": 0.7517502903938293, "Finetune/Step": 4433, "Finetune/Step Time": 2.822095587849617} +{"Finetune/Learning Rate": 6.117641437723931e-07, "Finetune/Loss": 0.7788078784942627, "Finetune/Loss (Raw)": 0.6667320728302002, "Finetune/Step": 4434, "Finetune/Step Time": 2.79483275860548} +{"Finetune/Learning Rate": 6.095237307219259e-07, "Finetune/Loss": 0.7791405916213989, "Finetune/Loss (Raw)": 0.8485223054885864, "Finetune/Step": 4435, "Finetune/Step Time": 2.79316820576787} +{"Finetune/Learning Rate": 6.072872986763767e-07, "Finetune/Loss": 0.7790321111679077, "Finetune/Loss (Raw)": 0.8085770010948181, "Finetune/Step": 4436, "Finetune/Step Time": 2.793198624625802} +{"Finetune/Learning Rate": 6.050548485838592e-07, "Finetune/Loss": 0.778834879398346, "Finetune/Loss (Raw)": 0.7740433812141418, "Finetune/Step": 4437, "Finetune/Step Time": 2.7903509940952063} +{"Finetune/Learning Rate": 6.028263813908031e-07, "Finetune/Loss": 0.777290940284729, "Finetune/Loss (Raw)": 0.7128134369850159, "Finetune/Step": 4438, "Finetune/Step Time": 2.7958831656724215} +{"Finetune/Learning Rate": 6.006018980419448e-07, "Finetune/Loss": 0.7775769233703613, "Finetune/Loss (Raw)": 0.8692975640296936, "Finetune/Step": 4439, "Finetune/Step Time": 2.7969202399253845} +{"Finetune/Learning Rate": 5.983813994803334e-07, "Finetune/Loss": 0.7765998244285583, "Finetune/Loss (Raw)": 0.6669303178787231, "Finetune/Step": 4440, "Finetune/Step Time": 2.7989150304347277} +{"Finetune/Learning Rate": 5.96164886647329e-07, "Finetune/Loss": 0.7776315808296204, "Finetune/Loss (Raw)": 0.8313077688217163, "Finetune/Step": 4441, "Finetune/Step Time": 2.7924984116107225} +{"Finetune/Learning Rate": 5.939523604826003e-07, "Finetune/Loss": 0.7763733267784119, "Finetune/Loss (Raw)": 0.6663028597831726, "Finetune/Step": 4442, "Finetune/Step Time": 2.7946679331362247} +{"Finetune/Learning Rate": 5.917438219241278e-07, "Finetune/Loss": 0.7769063711166382, "Finetune/Loss (Raw)": 0.7860656380653381, "Finetune/Step": 4443, "Finetune/Step Time": 2.79097843170166} +{"Finetune/Learning Rate": 5.895392719082016e-07, "Finetune/Loss": 0.7764525413513184, "Finetune/Loss (Raw)": 0.8032460808753967, "Finetune/Step": 4444, "Finetune/Step Time": 2.791462643072009} +{"Finetune/Learning Rate": 5.873387113694173e-07, "Finetune/Loss": 0.7762324810028076, "Finetune/Loss (Raw)": 0.8082294464111328, "Finetune/Step": 4445, "Finetune/Step Time": 2.7912192195653915} +{"Finetune/Learning Rate": 5.851421412406877e-07, "Finetune/Loss": 0.7761756181716919, "Finetune/Loss (Raw)": 0.7897698879241943, "Finetune/Step": 4446, "Finetune/Step Time": 2.794073846191168} +{"Finetune/Learning Rate": 5.829495624532211e-07, "Finetune/Loss": 0.7751415967941284, "Finetune/Loss (Raw)": 0.721344530582428, "Finetune/Step": 4447, "Finetune/Step Time": 2.7866503670811653} +{"Finetune/Learning Rate": 5.807609759365473e-07, "Finetune/Loss": 0.7758020162582397, "Finetune/Loss (Raw)": 0.8044757843017578, "Finetune/Step": 4448, "Finetune/Step Time": 2.795965190976858} +{"Finetune/Learning Rate": 5.785763826184931e-07, "Finetune/Loss": 0.7805185317993164, "Finetune/Loss (Raw)": 0.8732074499130249, "Finetune/Step": 4449, "Finetune/Step Time": 2.766608187928796} +{"Finetune/Learning Rate": 5.763957834251977e-07, "Finetune/Loss": 0.7807379961013794, "Finetune/Loss (Raw)": 0.8516817688941956, "Finetune/Step": 4450, "Finetune/Step Time": 2.7608423959463835} +{"Finetune/Learning Rate": 5.742191792811069e-07, "Finetune/Loss": 0.7819496393203735, "Finetune/Loss (Raw)": 0.9379170536994934, "Finetune/Step": 4451, "Finetune/Step Time": 2.759271366521716} +{"Finetune/Learning Rate": 5.720465711089684e-07, "Finetune/Loss": 0.7821335792541504, "Finetune/Loss (Raw)": 0.7968675494194031, "Finetune/Step": 4452, "Finetune/Step Time": 2.758945757523179} +{"Finetune/Learning Rate": 5.698779598298442e-07, "Finetune/Loss": 0.7821273803710938, "Finetune/Loss (Raw)": 0.7960997819900513, "Finetune/Step": 4453, "Finetune/Step Time": 2.760536892339587} +{"Finetune/Learning Rate": 5.677133463630935e-07, "Finetune/Loss": 0.7821968197822571, "Finetune/Loss (Raw)": 0.7079741954803467, "Finetune/Step": 4454, "Finetune/Step Time": 2.7603754680603743} +{"Finetune/Learning Rate": 5.65552731626382e-07, "Finetune/Loss": 0.7821307182312012, "Finetune/Loss (Raw)": 0.7984974384307861, "Finetune/Step": 4455, "Finetune/Step Time": 2.763508092612028} +{"Finetune/Learning Rate": 5.633961165356893e-07, "Finetune/Loss": 0.7825455069541931, "Finetune/Loss (Raw)": 0.8411876559257507, "Finetune/Step": 4456, "Finetune/Step Time": 2.766765581443906} +{"Finetune/Learning Rate": 5.612435020052831e-07, "Finetune/Loss": 0.7821935415267944, "Finetune/Loss (Raw)": 0.7359700798988342, "Finetune/Step": 4457, "Finetune/Step Time": 2.765988251194358} +{"Finetune/Learning Rate": 5.590948889477521e-07, "Finetune/Loss": 0.7822819948196411, "Finetune/Loss (Raw)": 0.7895199656486511, "Finetune/Step": 4458, "Finetune/Step Time": 2.7665411792695522} +{"Finetune/Learning Rate": 5.569502782739766e-07, "Finetune/Loss": 0.7814786434173584, "Finetune/Loss (Raw)": 0.7161516547203064, "Finetune/Step": 4459, "Finetune/Step Time": 2.764289101585746} +{"Finetune/Learning Rate": 5.548096708931461e-07, "Finetune/Loss": 0.7810691595077515, "Finetune/Loss (Raw)": 0.7804500460624695, "Finetune/Step": 4460, "Finetune/Step Time": 2.7621344663202763} +{"Finetune/Learning Rate": 5.526730677127501e-07, "Finetune/Loss": 0.7811083197593689, "Finetune/Loss (Raw)": 0.7277154326438904, "Finetune/Step": 4461, "Finetune/Step Time": 2.7418710850179195} +{"Finetune/Learning Rate": 5.505404696385796e-07, "Finetune/Loss": 0.780745267868042, "Finetune/Loss (Raw)": 0.8090218305587769, "Finetune/Step": 4462, "Finetune/Step Time": 2.737592473626137} +{"Finetune/Learning Rate": 5.48411877574736e-07, "Finetune/Loss": 0.7792222499847412, "Finetune/Loss (Raw)": 0.6713696718215942, "Finetune/Step": 4463, "Finetune/Step Time": 2.736717727035284} +{"Finetune/Learning Rate": 5.462872924236106e-07, "Finetune/Loss": 0.7786800265312195, "Finetune/Loss (Raw)": 0.806021511554718, "Finetune/Step": 4464, "Finetune/Step Time": 2.7271559685468674} +{"Finetune/Learning Rate": 5.441667150859009e-07, "Finetune/Loss": 0.7788116931915283, "Finetune/Loss (Raw)": 0.7491661310195923, "Finetune/Step": 4465, "Finetune/Step Time": 2.7309701573103666} +{"Finetune/Learning Rate": 5.420501464606098e-07, "Finetune/Loss": 0.7785576581954956, "Finetune/Loss (Raw)": 0.7948217988014221, "Finetune/Step": 4466, "Finetune/Step Time": 2.73236733302474} +{"Finetune/Learning Rate": 5.399375874450352e-07, "Finetune/Loss": 0.7792902588844299, "Finetune/Loss (Raw)": 0.8936070203781128, "Finetune/Step": 4467, "Finetune/Step Time": 2.7316033262759447} +{"Finetune/Learning Rate": 5.378290389347762e-07, "Finetune/Loss": 0.7800301909446716, "Finetune/Loss (Raw)": 0.8199567198753357, "Finetune/Step": 4468, "Finetune/Step Time": 2.7349412608891726} +{"Finetune/Learning Rate": 5.357245018237334e-07, "Finetune/Loss": 0.7745810747146606, "Finetune/Loss (Raw)": 0.21806782484054565, "Finetune/Step": 4469, "Finetune/Step Time": 2.769242128357291} +{"Finetune/Learning Rate": 5.336239770041041e-07, "Finetune/Loss": 0.7745416164398193, "Finetune/Loss (Raw)": 0.7769619226455688, "Finetune/Step": 4470, "Finetune/Step Time": 2.7661019433289766} +{"Finetune/Learning Rate": 5.315274653663882e-07, "Finetune/Loss": 0.774078369140625, "Finetune/Loss (Raw)": 0.7249137759208679, "Finetune/Step": 4471, "Finetune/Step Time": 2.7757463045418262} +{"Finetune/Learning Rate": 5.294349677993793e-07, "Finetune/Loss": 0.7729081511497498, "Finetune/Loss (Raw)": 0.6840072870254517, "Finetune/Step": 4472, "Finetune/Step Time": 2.768950954079628} +{"Finetune/Learning Rate": 5.273464851901755e-07, "Finetune/Loss": 0.7713185548782349, "Finetune/Loss (Raw)": 0.5476280450820923, "Finetune/Step": 4473, "Finetune/Step Time": 2.790458958595991} +{"Finetune/Learning Rate": 5.252620184241697e-07, "Finetune/Loss": 0.7709469199180603, "Finetune/Loss (Raw)": 0.817213773727417, "Finetune/Step": 4474, "Finetune/Step Time": 2.7908773440867662} +{"Finetune/Learning Rate": 5.231815683850472e-07, "Finetune/Loss": 0.7709662914276123, "Finetune/Loss (Raw)": 0.7568233609199524, "Finetune/Step": 4475, "Finetune/Step Time": 2.7911697905510664} +{"Finetune/Learning Rate": 5.211051359548013e-07, "Finetune/Loss": 0.7723826169967651, "Finetune/Loss (Raw)": 0.8576789498329163, "Finetune/Step": 4476, "Finetune/Step Time": 2.7671089321374893} +{"Finetune/Learning Rate": 5.190327220137137e-07, "Finetune/Loss": 0.7732245922088623, "Finetune/Loss (Raw)": 0.8582754135131836, "Finetune/Step": 4477, "Finetune/Step Time": 2.7646388839930296} +{"Finetune/Learning Rate": 5.169643274403647e-07, "Finetune/Loss": 0.7735811471939087, "Finetune/Loss (Raw)": 0.7669651508331299, "Finetune/Step": 4478, "Finetune/Step Time": 2.7582068610936403} +{"Finetune/Learning Rate": 5.148999531116306e-07, "Finetune/Loss": 0.7684003114700317, "Finetune/Loss (Raw)": 0.28887662291526794, "Finetune/Step": 4479, "Finetune/Step Time": 2.7919186260551214} +{"Finetune/Learning Rate": 5.128395999026836e-07, "Finetune/Loss": 0.7688961029052734, "Finetune/Loss (Raw)": 0.824565589427948, "Finetune/Step": 4480, "Finetune/Step Time": 2.788766600191593} +{"Finetune/Learning Rate": 5.107832686869951e-07, "Finetune/Loss": 0.7682846784591675, "Finetune/Loss (Raw)": 0.800084114074707, "Finetune/Step": 4481, "Finetune/Step Time": 2.7937815748155117} +{"Finetune/Learning Rate": 5.087309603363222e-07, "Finetune/Loss": 0.7687621116638184, "Finetune/Loss (Raw)": 0.8911696672439575, "Finetune/Step": 4482, "Finetune/Step Time": 2.7917136903852224} +{"Finetune/Learning Rate": 5.066826757207233e-07, "Finetune/Loss": 0.7678982019424438, "Finetune/Loss (Raw)": 0.6934380531311035, "Finetune/Step": 4483, "Finetune/Step Time": 2.7920322977006435} +{"Finetune/Learning Rate": 5.046384157085538e-07, "Finetune/Loss": 0.766838014125824, "Finetune/Loss (Raw)": 0.5646036863327026, "Finetune/Step": 4484, "Finetune/Step Time": 2.8146988805383444} +{"Finetune/Learning Rate": 5.025981811664515e-07, "Finetune/Loss": 0.7671405673027039, "Finetune/Loss (Raw)": 0.7823426127433777, "Finetune/Step": 4485, "Finetune/Step Time": 2.8180046528577805} +{"Finetune/Learning Rate": 5.005619729593602e-07, "Finetune/Loss": 0.7678427696228027, "Finetune/Loss (Raw)": 0.8558690547943115, "Finetune/Step": 4486, "Finetune/Step Time": 2.8158321883529425} +{"Finetune/Learning Rate": 4.985297919505106e-07, "Finetune/Loss": 0.7681606411933899, "Finetune/Loss (Raw)": 0.7956032156944275, "Finetune/Step": 4487, "Finetune/Step Time": 2.814477814361453} +{"Finetune/Learning Rate": 4.965016390014255e-07, "Finetune/Loss": 0.7677388787269592, "Finetune/Loss (Raw)": 0.6829336881637573, "Finetune/Step": 4488, "Finetune/Step Time": 2.8349120058119297} +{"Finetune/Learning Rate": 4.944775149719217e-07, "Finetune/Loss": 0.7718411087989807, "Finetune/Loss (Raw)": 0.7529694437980652, "Finetune/Step": 4489, "Finetune/Step Time": 2.8020719178020954} +{"Finetune/Learning Rate": 4.924574207201071e-07, "Finetune/Loss": 0.7713351845741272, "Finetune/Loss (Raw)": 0.7263470888137817, "Finetune/Step": 4490, "Finetune/Step Time": 2.8004289027303457} +{"Finetune/Learning Rate": 4.904413571023847e-07, "Finetune/Loss": 0.770004153251648, "Finetune/Loss (Raw)": 0.7271900177001953, "Finetune/Step": 4491, "Finetune/Step Time": 2.7998984679579735} +{"Finetune/Learning Rate": 4.88429324973444e-07, "Finetune/Loss": 0.7698855400085449, "Finetune/Loss (Raw)": 0.8179514408111572, "Finetune/Step": 4492, "Finetune/Step Time": 2.797107730060816} +{"Finetune/Learning Rate": 4.864213251862648e-07, "Finetune/Loss": 0.7706500291824341, "Finetune/Loss (Raw)": 0.8832138180732727, "Finetune/Step": 4493, "Finetune/Step Time": 2.799913829192519} +{"Finetune/Learning Rate": 4.844173585921252e-07, "Finetune/Loss": 0.7694518566131592, "Finetune/Loss (Raw)": 0.68794846534729, "Finetune/Step": 4494, "Finetune/Step Time": 2.799926556646824} +{"Finetune/Learning Rate": 4.824174260405834e-07, "Finetune/Loss": 0.7693252563476562, "Finetune/Loss (Raw)": 0.8200269937515259, "Finetune/Step": 4495, "Finetune/Step Time": 2.7990060206502676} +{"Finetune/Learning Rate": 4.804215283794955e-07, "Finetune/Loss": 0.7701247930526733, "Finetune/Loss (Raw)": 0.8333520293235779, "Finetune/Step": 4496, "Finetune/Step Time": 2.7992763593792915} +{"Finetune/Learning Rate": 4.784296664550026e-07, "Finetune/Loss": 0.7717667818069458, "Finetune/Loss (Raw)": 0.8432013392448425, "Finetune/Step": 4497, "Finetune/Step Time": 2.778500748798251} +{"Finetune/Learning Rate": 4.7644184111153455e-07, "Finetune/Loss": 0.7723639011383057, "Finetune/Loss (Raw)": 0.706532895565033, "Finetune/Step": 4498, "Finetune/Step Time": 2.752771656960249} +{"Finetune/Learning Rate": 4.7445805319181305e-07, "Finetune/Loss": 0.7722932696342468, "Finetune/Loss (Raw)": 0.8371093273162842, "Finetune/Step": 4499, "Finetune/Step Time": 2.7550988867878914} +{"Finetune/Learning Rate": 4.724783035368452e-07, "Finetune/Loss": 0.7732163667678833, "Finetune/Loss (Raw)": 0.8238574862480164, "Finetune/Step": 4500, "Finetune/Step Time": 2.7542500346899033} +{"Finetune/Learning Rate": 4.705025929859286e-07, "Finetune/Loss": 0.7739741206169128, "Finetune/Loss (Raw)": 0.8224944472312927, "Finetune/Step": 4501, "Finetune/Step Time": 2.7534351106733084} +{"Finetune/Learning Rate": 4.6853092237664875e-07, "Finetune/Loss": 0.7742170691490173, "Finetune/Loss (Raw)": 0.8573641180992126, "Finetune/Step": 4502, "Finetune/Step Time": 2.7539936006069183} +{"Finetune/Learning Rate": 4.665632925448726e-07, "Finetune/Loss": 0.7745891809463501, "Finetune/Loss (Raw)": 0.77706378698349, "Finetune/Step": 4503, "Finetune/Step Time": 2.7525823824107647} +{"Finetune/Learning Rate": 4.6459970432476297e-07, "Finetune/Loss": 0.7749542593955994, "Finetune/Loss (Raw)": 0.8297409415245056, "Finetune/Step": 4504, "Finetune/Step Time": 2.7570851165801287} +{"Finetune/Learning Rate": 4.6264015854876275e-07, "Finetune/Loss": 0.7750244140625, "Finetune/Loss (Raw)": 0.7578439116477966, "Finetune/Step": 4505, "Finetune/Step Time": 2.7526328060775995} +{"Finetune/Learning Rate": 4.6068465604760306e-07, "Finetune/Loss": 0.7750285267829895, "Finetune/Loss (Raw)": 0.7603616714477539, "Finetune/Step": 4506, "Finetune/Step Time": 2.75040365755558} +{"Finetune/Learning Rate": 4.587331976503018e-07, "Finetune/Loss": 0.775651216506958, "Finetune/Loss (Raw)": 0.8760861754417419, "Finetune/Step": 4507, "Finetune/Step Time": 2.7512528151273727} +{"Finetune/Learning Rate": 4.567857841841583e-07, "Finetune/Loss": 0.7757270336151123, "Finetune/Loss (Raw)": 0.7996434569358826, "Finetune/Step": 4508, "Finetune/Step Time": 2.7472215220332146} +{"Finetune/Learning Rate": 4.5484241647476667e-07, "Finetune/Loss": 0.775566816329956, "Finetune/Loss (Raw)": 0.855057418346405, "Finetune/Step": 4509, "Finetune/Step Time": 2.7488097939640284} +{"Finetune/Learning Rate": 4.529030953459945e-07, "Finetune/Loss": 0.7764536142349243, "Finetune/Loss (Raw)": 0.7777889370918274, "Finetune/Step": 4510, "Finetune/Step Time": 2.747793497517705} +{"Finetune/Learning Rate": 4.5096782161999975e-07, "Finetune/Loss": 0.777141273021698, "Finetune/Loss (Raw)": 0.7466452717781067, "Finetune/Step": 4511, "Finetune/Step Time": 2.7480857726186514} +{"Finetune/Learning Rate": 4.4903659611722607e-07, "Finetune/Loss": 0.779013991355896, "Finetune/Loss (Raw)": 0.9052014350891113, "Finetune/Step": 4512, "Finetune/Step Time": 2.744156239554286} +{"Finetune/Learning Rate": 4.471094196563941e-07, "Finetune/Loss": 0.7785851955413818, "Finetune/Loss (Raw)": 0.7181265354156494, "Finetune/Step": 4513, "Finetune/Step Time": 2.74428559653461} +{"Finetune/Learning Rate": 4.45186293054517e-07, "Finetune/Loss": 0.7774273753166199, "Finetune/Loss (Raw)": 0.6638001799583435, "Finetune/Step": 4514, "Finetune/Step Time": 2.7452844977378845} +{"Finetune/Learning Rate": 4.432672171268837e-07, "Finetune/Loss": 0.7773886322975159, "Finetune/Loss (Raw)": 0.8643439412117004, "Finetune/Step": 4515, "Finetune/Step Time": 2.7490721344947815} +{"Finetune/Learning Rate": 4.4135219268706895e-07, "Finetune/Loss": 0.7772672176361084, "Finetune/Loss (Raw)": 0.8530566692352295, "Finetune/Step": 4516, "Finetune/Step Time": 2.7501866184175014} +{"Finetune/Learning Rate": 4.394412205469301e-07, "Finetune/Loss": 0.7749108076095581, "Finetune/Loss (Raw)": 0.47774145007133484, "Finetune/Step": 4517, "Finetune/Step Time": 2.771669778972864} +{"Finetune/Learning Rate": 4.3753430151660445e-07, "Finetune/Loss": 0.7752596735954285, "Finetune/Loss (Raw)": 0.78939288854599, "Finetune/Step": 4518, "Finetune/Step Time": 2.774559700861573} +{"Finetune/Learning Rate": 4.3563143640451664e-07, "Finetune/Loss": 0.7752890586853027, "Finetune/Loss (Raw)": 0.76907879114151, "Finetune/Step": 4519, "Finetune/Step Time": 2.775536898523569} +{"Finetune/Learning Rate": 4.3373262601736354e-07, "Finetune/Loss": 0.77454674243927, "Finetune/Loss (Raw)": 0.6941347718238831, "Finetune/Step": 4520, "Finetune/Step Time": 2.7636949717998505} +{"Finetune/Learning Rate": 4.318378711601301e-07, "Finetune/Loss": 0.7749814987182617, "Finetune/Loss (Raw)": 0.7685002088546753, "Finetune/Step": 4521, "Finetune/Step Time": 2.7633684538304806} +{"Finetune/Learning Rate": 4.299471726360804e-07, "Finetune/Loss": 0.7739324569702148, "Finetune/Loss (Raw)": 0.6659425497055054, "Finetune/Step": 4522, "Finetune/Step Time": 2.7858545910567045} +{"Finetune/Learning Rate": 4.2806053124675897e-07, "Finetune/Loss": 0.7742030024528503, "Finetune/Loss (Raw)": 0.8315606713294983, "Finetune/Step": 4523, "Finetune/Step Time": 2.7852412182837725} +{"Finetune/Learning Rate": 4.261779477919892e-07, "Finetune/Loss": 0.7750598192214966, "Finetune/Loss (Raw)": 0.8116648197174072, "Finetune/Step": 4524, "Finetune/Step Time": 2.7802150454372168} +{"Finetune/Learning Rate": 4.242994230698738e-07, "Finetune/Loss": 0.7741931676864624, "Finetune/Loss (Raw)": 0.779413104057312, "Finetune/Step": 4525, "Finetune/Step Time": 2.7866605557501316} +{"Finetune/Learning Rate": 4.2242495787679803e-07, "Finetune/Loss": 0.7746074199676514, "Finetune/Loss (Raw)": 0.7890273332595825, "Finetune/Step": 4526, "Finetune/Step Time": 2.786770533770323} +{"Finetune/Learning Rate": 4.2055455300742175e-07, "Finetune/Loss": 0.7722556591033936, "Finetune/Loss (Raw)": 0.5553892254829407, "Finetune/Step": 4527, "Finetune/Step Time": 2.8062505200505257} +{"Finetune/Learning Rate": 4.1868820925468625e-07, "Finetune/Loss": 0.7722765207290649, "Finetune/Loss (Raw)": 0.78453528881073, "Finetune/Step": 4528, "Finetune/Step Time": 2.807783279567957} +{"Finetune/Learning Rate": 4.1682592740981074e-07, "Finetune/Loss": 0.7705197334289551, "Finetune/Loss (Raw)": 0.6425776481628418, "Finetune/Step": 4529, "Finetune/Step Time": 2.8329697530716658} +{"Finetune/Learning Rate": 4.1496770826229494e-07, "Finetune/Loss": 0.7713858485221863, "Finetune/Loss (Raw)": 0.8284164667129517, "Finetune/Step": 4530, "Finetune/Step Time": 2.8352810218930244} +{"Finetune/Learning Rate": 4.131135525999086e-07, "Finetune/Loss": 0.7702726721763611, "Finetune/Loss (Raw)": 0.6917906999588013, "Finetune/Step": 4531, "Finetune/Step Time": 2.8357501719146967} +{"Finetune/Learning Rate": 4.112634612087063e-07, "Finetune/Loss": 0.7695744633674622, "Finetune/Loss (Raw)": 0.7934120893478394, "Finetune/Step": 4532, "Finetune/Step Time": 2.8357600439339876} +{"Finetune/Learning Rate": 4.094174348730184e-07, "Finetune/Loss": 0.7688027620315552, "Finetune/Loss (Raw)": 0.7839645147323608, "Finetune/Step": 4533, "Finetune/Step Time": 2.83606163226068} +{"Finetune/Learning Rate": 4.075754743754479e-07, "Finetune/Loss": 0.769123375415802, "Finetune/Loss (Raw)": 0.6965346336364746, "Finetune/Step": 4534, "Finetune/Step Time": 2.8140446580946445} +{"Finetune/Learning Rate": 4.0573758049687883e-07, "Finetune/Loss": 0.768722653388977, "Finetune/Loss (Raw)": 0.7794851064682007, "Finetune/Step": 4535, "Finetune/Step Time": 2.813164146617055} +{"Finetune/Learning Rate": 4.03903754016467e-07, "Finetune/Loss": 0.7678443193435669, "Finetune/Loss (Raw)": 0.7340281009674072, "Finetune/Step": 4536, "Finetune/Step Time": 2.8151507899165154} +{"Finetune/Learning Rate": 4.020739957116493e-07, "Finetune/Loss": 0.767544686794281, "Finetune/Loss (Raw)": 0.7318438291549683, "Finetune/Step": 4537, "Finetune/Step Time": 2.814491208642721} +{"Finetune/Learning Rate": 4.0024830635813193e-07, "Finetune/Loss": 0.7685259580612183, "Finetune/Loss (Raw)": 0.8871276378631592, "Finetune/Step": 4538, "Finetune/Step Time": 2.8180878590792418} +{"Finetune/Learning Rate": 3.9842668672989803e-07, "Finetune/Loss": 0.7691119909286499, "Finetune/Loss (Raw)": 0.7892628312110901, "Finetune/Step": 4539, "Finetune/Step Time": 2.815935930237174} +{"Finetune/Learning Rate": 3.9660913759921095e-07, "Finetune/Loss": 0.7688542604446411, "Finetune/Loss (Raw)": 0.6986532807350159, "Finetune/Step": 4540, "Finetune/Step Time": 2.8367083240300417} +{"Finetune/Learning Rate": 3.9479565973659874e-07, "Finetune/Loss": 0.7672385573387146, "Finetune/Loss (Raw)": 0.7330387830734253, "Finetune/Step": 4541, "Finetune/Step Time": 2.8412903398275375} +{"Finetune/Learning Rate": 3.9298625391087084e-07, "Finetune/Loss": 0.7674748301506042, "Finetune/Loss (Raw)": 0.7632149457931519, "Finetune/Step": 4542, "Finetune/Step Time": 2.8395126797258854} +{"Finetune/Learning Rate": 3.911809208891082e-07, "Finetune/Loss": 0.767401397228241, "Finetune/Loss (Raw)": 0.8238996863365173, "Finetune/Step": 4543, "Finetune/Step Time": 2.8333131186664104} +{"Finetune/Learning Rate": 3.8937966143666406e-07, "Finetune/Loss": 0.7674853801727295, "Finetune/Loss (Raw)": 0.7659431099891663, "Finetune/Step": 4544, "Finetune/Step Time": 2.8337438944727182} +{"Finetune/Learning Rate": 3.875824763171654e-07, "Finetune/Loss": 0.767794132232666, "Finetune/Loss (Raw)": 0.8107401728630066, "Finetune/Step": 4545, "Finetune/Step Time": 2.830596065148711} +{"Finetune/Learning Rate": 3.8578936629251165e-07, "Finetune/Loss": 0.7669127583503723, "Finetune/Loss (Raw)": 0.7196628451347351, "Finetune/Step": 4546, "Finetune/Step Time": 2.8301659915596247} +{"Finetune/Learning Rate": 3.840003321228791e-07, "Finetune/Loss": 0.7666320204734802, "Finetune/Loss (Raw)": 0.7893240451812744, "Finetune/Step": 4547, "Finetune/Step Time": 2.829250678420067} +{"Finetune/Learning Rate": 3.8221537456670786e-07, "Finetune/Loss": 0.767487108707428, "Finetune/Loss (Raw)": 0.7739270329475403, "Finetune/Step": 4548, "Finetune/Step Time": 2.8041199054569006} +{"Finetune/Learning Rate": 3.804344943807126e-07, "Finetune/Loss": 0.7666918039321899, "Finetune/Loss (Raw)": 0.7447208762168884, "Finetune/Step": 4549, "Finetune/Step Time": 2.802534619346261} +{"Finetune/Learning Rate": 3.7865769231988593e-07, "Finetune/Loss": 0.7657034397125244, "Finetune/Loss (Raw)": 0.7786536812782288, "Finetune/Step": 4550, "Finetune/Step Time": 2.7969774063676596} +{"Finetune/Learning Rate": 3.768849691374843e-07, "Finetune/Loss": 0.765399694442749, "Finetune/Loss (Raw)": 0.7305766940116882, "Finetune/Step": 4551, "Finetune/Step Time": 2.7970264721661806} +{"Finetune/Learning Rate": 3.7511632558503655e-07, "Finetune/Loss": 0.765965461730957, "Finetune/Loss (Raw)": 0.7867095470428467, "Finetune/Step": 4552, "Finetune/Step Time": 2.791768966242671} +{"Finetune/Learning Rate": 3.733517624123428e-07, "Finetune/Loss": 0.7654285430908203, "Finetune/Loss (Raw)": 0.7120179533958435, "Finetune/Step": 4553, "Finetune/Step Time": 2.7911911569535732} +{"Finetune/Learning Rate": 3.715912803674737e-07, "Finetune/Loss": 0.7661173343658447, "Finetune/Loss (Raw)": 0.8813860416412354, "Finetune/Step": 4554, "Finetune/Step Time": 2.7893213126808405} +{"Finetune/Learning Rate": 3.698348801967688e-07, "Finetune/Loss": 0.7661154270172119, "Finetune/Loss (Raw)": 0.8049222826957703, "Finetune/Step": 4555, "Finetune/Step Time": 2.7882757615298033} +{"Finetune/Learning Rate": 3.68082562644837e-07, "Finetune/Loss": 0.7660039067268372, "Finetune/Loss (Raw)": 0.7632274627685547, "Finetune/Step": 4556, "Finetune/Step Time": 2.7884331606328487} +{"Finetune/Learning Rate": 3.6633432845455843e-07, "Finetune/Loss": 0.7654852867126465, "Finetune/Loss (Raw)": 0.7119016647338867, "Finetune/Step": 4557, "Finetune/Step Time": 2.7825521863996983} +{"Finetune/Learning Rate": 3.6459017836708134e-07, "Finetune/Loss": 0.7655735015869141, "Finetune/Loss (Raw)": 0.7623380422592163, "Finetune/Step": 4558, "Finetune/Step Time": 2.7835998460650444} +{"Finetune/Learning Rate": 3.628501131218187e-07, "Finetune/Loss": 0.764491081237793, "Finetune/Loss (Raw)": 0.6962075233459473, "Finetune/Step": 4559, "Finetune/Step Time": 2.807087177410722} +{"Finetune/Learning Rate": 3.611141334564572e-07, "Finetune/Loss": 0.7638101577758789, "Finetune/Loss (Raw)": 0.7228531241416931, "Finetune/Step": 4560, "Finetune/Step Time": 2.816442832350731} +{"Finetune/Learning Rate": 3.593822401069491e-07, "Finetune/Loss": 0.7640736103057861, "Finetune/Loss (Raw)": 0.7854781746864319, "Finetune/Step": 4561, "Finetune/Step Time": 2.8179678320884705} +{"Finetune/Learning Rate": 3.5765443380751385e-07, "Finetune/Loss": 0.764956533908844, "Finetune/Loss (Raw)": 0.7797409296035767, "Finetune/Step": 4562, "Finetune/Step Time": 2.818530660122633} +{"Finetune/Learning Rate": 3.5593071529063996e-07, "Finetune/Loss": 0.7597289681434631, "Finetune/Loss (Raw)": 0.1793973743915558, "Finetune/Step": 4563, "Finetune/Step Time": 2.8534254785627127} +{"Finetune/Learning Rate": 3.542110852870795e-07, "Finetune/Loss": 0.7588322162628174, "Finetune/Loss (Raw)": 0.6937934160232544, "Finetune/Step": 4564, "Finetune/Step Time": 2.877643033862114} +{"Finetune/Learning Rate": 3.524955445258582e-07, "Finetune/Loss": 0.7605065107345581, "Finetune/Loss (Raw)": 0.9883463382720947, "Finetune/Step": 4565, "Finetune/Step Time": 2.8779912628233433} +{"Finetune/Learning Rate": 3.507840937342588e-07, "Finetune/Loss": 0.7607802152633667, "Finetune/Loss (Raw)": 0.7478551268577576, "Finetune/Step": 4566, "Finetune/Step Time": 2.878843354061246} +{"Finetune/Learning Rate": 3.4907673363783535e-07, "Finetune/Loss": 0.7594341039657593, "Finetune/Loss (Raw)": 0.6969912648200989, "Finetune/Step": 4567, "Finetune/Step Time": 2.8799710106104612} +{"Finetune/Learning Rate": 3.4737346496041105e-07, "Finetune/Loss": 0.7602885961532593, "Finetune/Loss (Raw)": 0.7763041257858276, "Finetune/Step": 4568, "Finetune/Step Time": 2.8792422898113728} +{"Finetune/Learning Rate": 3.4567428842406603e-07, "Finetune/Loss": 0.7595517635345459, "Finetune/Loss (Raw)": 0.7369881272315979, "Finetune/Step": 4569, "Finetune/Step Time": 2.8793509155511856} +{"Finetune/Learning Rate": 3.439792047491541e-07, "Finetune/Loss": 0.7599438428878784, "Finetune/Loss (Raw)": 0.7165006399154663, "Finetune/Step": 4570, "Finetune/Step Time": 2.8823529053479433} +{"Finetune/Learning Rate": 3.422882146542883e-07, "Finetune/Loss": 0.7601778507232666, "Finetune/Loss (Raw)": 0.816015362739563, "Finetune/Step": 4571, "Finetune/Step Time": 2.885321967303753} +{"Finetune/Learning Rate": 3.406013188563484e-07, "Finetune/Loss": 0.7602691650390625, "Finetune/Loss (Raw)": 0.8149252533912659, "Finetune/Step": 4572, "Finetune/Step Time": 2.882482685148716} +{"Finetune/Learning Rate": 3.3891851807047795e-07, "Finetune/Loss": 0.7597115635871887, "Finetune/Loss (Raw)": 0.7368630766868591, "Finetune/Step": 4573, "Finetune/Step Time": 2.879781361669302} +{"Finetune/Learning Rate": 3.372398130100851e-07, "Finetune/Loss": 0.7579771280288696, "Finetune/Loss (Raw)": 0.5677677392959595, "Finetune/Step": 4574, "Finetune/Step Time": 2.899736400693655} +{"Finetune/Learning Rate": 3.355652043868418e-07, "Finetune/Loss": 0.7591349482536316, "Finetune/Loss (Raw)": 0.8695401549339294, "Finetune/Step": 4575, "Finetune/Step Time": 2.9008726868778467} +{"Finetune/Learning Rate": 3.3389469291068235e-07, "Finetune/Loss": 0.7588359117507935, "Finetune/Loss (Raw)": 0.7661980390548706, "Finetune/Step": 4576, "Finetune/Step Time": 2.893348153680563} +{"Finetune/Learning Rate": 3.322282792898024e-07, "Finetune/Loss": 0.7585180997848511, "Finetune/Loss (Raw)": 0.8325249552726746, "Finetune/Step": 4577, "Finetune/Step Time": 2.891683530062437} +{"Finetune/Learning Rate": 3.3056596423066576e-07, "Finetune/Loss": 0.757502555847168, "Finetune/Loss (Raw)": 0.7216939330101013, "Finetune/Step": 4578, "Finetune/Step Time": 2.895348249003291} +{"Finetune/Learning Rate": 3.289077484379943e-07, "Finetune/Loss": 0.7565106153488159, "Finetune/Loss (Raw)": 0.8109562397003174, "Finetune/Step": 4579, "Finetune/Step Time": 2.891571694985032} +{"Finetune/Learning Rate": 3.272536326147724e-07, "Finetune/Loss": 0.7569886445999146, "Finetune/Loss (Raw)": 0.8580540418624878, "Finetune/Step": 4580, "Finetune/Step Time": 2.889151841402054} +{"Finetune/Learning Rate": 3.256036174622479e-07, "Finetune/Loss": 0.7574458718299866, "Finetune/Loss (Raw)": 0.8546198010444641, "Finetune/Step": 4581, "Finetune/Step Time": 2.8895243164151907} +{"Finetune/Learning Rate": 3.2395770367992793e-07, "Finetune/Loss": 0.7579189538955688, "Finetune/Loss (Raw)": 0.7685279846191406, "Finetune/Step": 4582, "Finetune/Step Time": 2.8881361465901136} +{"Finetune/Learning Rate": 3.2231589196558443e-07, "Finetune/Loss": 0.7582862377166748, "Finetune/Loss (Raw)": 0.8455190658569336, "Finetune/Step": 4583, "Finetune/Step Time": 2.883352566510439} +{"Finetune/Learning Rate": 3.20678183015245e-07, "Finetune/Loss": 0.7571710348129272, "Finetune/Loss (Raw)": 0.6984326243400574, "Finetune/Step": 4584, "Finetune/Step Time": 2.8806854132562876} +{"Finetune/Learning Rate": 3.190445775232065e-07, "Finetune/Loss": 0.7582657933235168, "Finetune/Loss (Raw)": 0.876102864742279, "Finetune/Step": 4585, "Finetune/Step Time": 2.8787773698568344} +{"Finetune/Learning Rate": 3.174150761820161e-07, "Finetune/Loss": 0.7579517960548401, "Finetune/Loss (Raw)": 0.7493266463279724, "Finetune/Step": 4586, "Finetune/Step Time": 2.875568827614188} +{"Finetune/Learning Rate": 3.157896796824855e-07, "Finetune/Loss": 0.7585254907608032, "Finetune/Loss (Raw)": 0.7895880341529846, "Finetune/Step": 4587, "Finetune/Step Time": 2.8746272809803486} +{"Finetune/Learning Rate": 3.1416838871368925e-07, "Finetune/Loss": 0.7584470510482788, "Finetune/Loss (Raw)": 0.7703986167907715, "Finetune/Step": 4588, "Finetune/Step Time": 2.8754782248288393} +{"Finetune/Learning Rate": 3.1255120396295634e-07, "Finetune/Loss": 0.7574412822723389, "Finetune/Loss (Raw)": 0.5989839434623718, "Finetune/Step": 4589, "Finetune/Step Time": 2.9018256198614836} +{"Finetune/Learning Rate": 3.109381261158795e-07, "Finetune/Loss": 0.7574855089187622, "Finetune/Loss (Raw)": 0.8146839141845703, "Finetune/Step": 4590, "Finetune/Step Time": 2.9034484531730413} +{"Finetune/Learning Rate": 3.093291558563061e-07, "Finetune/Loss": 0.75840163230896, "Finetune/Loss (Raw)": 0.788628339767456, "Finetune/Step": 4591, "Finetune/Step Time": 2.902720907703042} +{"Finetune/Learning Rate": 3.0772429386634383e-07, "Finetune/Loss": 0.7588781714439392, "Finetune/Loss (Raw)": 0.8670275211334229, "Finetune/Step": 4592, "Finetune/Step Time": 2.9071648102253675} +{"Finetune/Learning Rate": 3.0612354082636076e-07, "Finetune/Loss": 0.7578226327896118, "Finetune/Loss (Raw)": 0.6140510439872742, "Finetune/Step": 4593, "Finetune/Step Time": 2.9273960646241903} +{"Finetune/Learning Rate": 3.0452689741497955e-07, "Finetune/Loss": 0.7547168135643005, "Finetune/Loss (Raw)": 0.3972785770893097, "Finetune/Step": 4594, "Finetune/Step Time": 2.956282563507557} +{"Finetune/Learning Rate": 3.029343643090832e-07, "Finetune/Loss": 0.7541818618774414, "Finetune/Loss (Raw)": 0.8251305222511292, "Finetune/Step": 4595, "Finetune/Step Time": 2.9581796005368233} +{"Finetune/Learning Rate": 3.0134594218381163e-07, "Finetune/Loss": 0.7547940015792847, "Finetune/Loss (Raw)": 0.8983059525489807, "Finetune/Step": 4596, "Finetune/Step Time": 2.955568315461278} +{"Finetune/Learning Rate": 2.9976163171255955e-07, "Finetune/Loss": 0.7574354410171509, "Finetune/Loss (Raw)": 0.556175708770752, "Finetune/Step": 4597, "Finetune/Step Time": 2.945820001885295} +{"Finetune/Learning Rate": 2.9818143356698305e-07, "Finetune/Loss": 0.7577594518661499, "Finetune/Loss (Raw)": 0.8184459805488586, "Finetune/Step": 4598, "Finetune/Step Time": 2.946240046992898} +{"Finetune/Learning Rate": 2.9660534841699175e-07, "Finetune/Loss": 0.7580628395080566, "Finetune/Loss (Raw)": 0.7637461423873901, "Finetune/Step": 4599, "Finetune/Step Time": 2.9392915181815624} +{"Finetune/Learning Rate": 2.950333769307523e-07, "Finetune/Loss": 0.7584753036499023, "Finetune/Loss (Raw)": 0.7367933988571167, "Finetune/Step": 4600, "Finetune/Step Time": 2.9444586653262377} +{"Finetune/Learning Rate": 2.9346551977468605e-07, "Finetune/Loss": 0.7604626417160034, "Finetune/Loss (Raw)": 0.8020114302635193, "Finetune/Step": 4601, "Finetune/Step Time": 2.9205741584300995} +{"Finetune/Learning Rate": 2.919017776134725e-07, "Finetune/Loss": 0.7611329555511475, "Finetune/Loss (Raw)": 0.9030167460441589, "Finetune/Step": 4602, "Finetune/Step Time": 2.917600989341736} +{"Finetune/Learning Rate": 2.903421511100468e-07, "Finetune/Loss": 0.7608040571212769, "Finetune/Loss (Raw)": 0.7147220969200134, "Finetune/Step": 4603, "Finetune/Step Time": 2.9163320921361446} +{"Finetune/Learning Rate": 2.887866409255957e-07, "Finetune/Loss": 0.7607017755508423, "Finetune/Loss (Raw)": 0.8445814847946167, "Finetune/Step": 4604, "Finetune/Step Time": 2.921072117984295} +{"Finetune/Learning Rate": 2.872352477195639e-07, "Finetune/Loss": 0.7601732611656189, "Finetune/Loss (Raw)": 0.7906328439712524, "Finetune/Step": 4605, "Finetune/Step Time": 2.9195950739085674} +{"Finetune/Learning Rate": 2.8568797214965194e-07, "Finetune/Loss": 0.7609273791313171, "Finetune/Loss (Raw)": 0.8634915351867676, "Finetune/Step": 4606, "Finetune/Step Time": 2.916862966492772} +{"Finetune/Learning Rate": 2.8414481487180956e-07, "Finetune/Loss": 0.7626453042030334, "Finetune/Loss (Raw)": 0.5087686777114868, "Finetune/Step": 4607, "Finetune/Step Time": 2.9079337157309055} +{"Finetune/Learning Rate": 2.826057765402468e-07, "Finetune/Loss": 0.7629494667053223, "Finetune/Loss (Raw)": 0.8634960651397705, "Finetune/Step": 4608, "Finetune/Step Time": 2.908874996006489} +{"Finetune/Learning Rate": 2.8107085780742394e-07, "Finetune/Loss": 0.7628207206726074, "Finetune/Loss (Raw)": 0.783614456653595, "Finetune/Step": 4609, "Finetune/Step Time": 2.9055784977972507} +{"Finetune/Learning Rate": 2.7954005932405493e-07, "Finetune/Loss": 0.7619205713272095, "Finetune/Loss (Raw)": 0.7759460210800171, "Finetune/Step": 4610, "Finetune/Step Time": 2.9069587849080563} +{"Finetune/Learning Rate": 2.780133817391073e-07, "Finetune/Loss": 0.7621523141860962, "Finetune/Loss (Raw)": 0.7230940461158752, "Finetune/Step": 4611, "Finetune/Step Time": 2.90806738846004} +{"Finetune/Learning Rate": 2.7649082569980225e-07, "Finetune/Loss": 0.7639598846435547, "Finetune/Loss (Raw)": 0.7959737181663513, "Finetune/Step": 4612, "Finetune/Step Time": 2.8831956442445517} +{"Finetune/Learning Rate": 2.749723918516145e-07, "Finetune/Loss": 0.7642680406570435, "Finetune/Loss (Raw)": 0.8217957019805908, "Finetune/Step": 4613, "Finetune/Step Time": 2.8810577653348446} +{"Finetune/Learning Rate": 2.734580808382681e-07, "Finetune/Loss": 0.7633060812950134, "Finetune/Loss (Raw)": 0.7327380180358887, "Finetune/Step": 4614, "Finetune/Step Time": 2.883859423920512} +{"Finetune/Learning Rate": 2.7194789330174054e-07, "Finetune/Loss": 0.7630763053894043, "Finetune/Loss (Raw)": 0.766189694404602, "Finetune/Step": 4615, "Finetune/Step Time": 2.8851262368261814} +{"Finetune/Learning Rate": 2.704418298822631e-07, "Finetune/Loss": 0.7642996311187744, "Finetune/Loss (Raw)": 0.8395242094993591, "Finetune/Step": 4616, "Finetune/Step Time": 2.870472678914666} +{"Finetune/Learning Rate": 2.689398912183183e-07, "Finetune/Loss": 0.764742910861969, "Finetune/Loss (Raw)": 0.809704065322876, "Finetune/Step": 4617, "Finetune/Step Time": 2.869530249387026} +{"Finetune/Learning Rate": 2.674420779466369e-07, "Finetune/Loss": 0.7650099396705627, "Finetune/Loss (Raw)": 0.7605271935462952, "Finetune/Step": 4618, "Finetune/Step Time": 2.869593683630228} +{"Finetune/Learning Rate": 2.6594839070220424e-07, "Finetune/Loss": 0.7645162343978882, "Finetune/Loss (Raw)": 0.6639966368675232, "Finetune/Step": 4619, "Finetune/Step Time": 2.8703898321837187} +{"Finetune/Learning Rate": 2.644588301182538e-07, "Finetune/Loss": 0.7647407650947571, "Finetune/Loss (Raw)": 0.8466876149177551, "Finetune/Step": 4620, "Finetune/Step Time": 2.874771174043417} +{"Finetune/Learning Rate": 2.6297339682627266e-07, "Finetune/Loss": 0.7642291784286499, "Finetune/Loss (Raw)": 0.8177304863929749, "Finetune/Step": 4621, "Finetune/Step Time": 2.873254181817174} +{"Finetune/Learning Rate": 2.6149209145599485e-07, "Finetune/Loss": 0.7658233642578125, "Finetune/Loss (Raw)": 0.8920060396194458, "Finetune/Step": 4622, "Finetune/Step Time": 2.8730661179870367} +{"Finetune/Learning Rate": 2.6001491463540695e-07, "Finetune/Loss": 0.765360951423645, "Finetune/Loss (Raw)": 0.7608385682106018, "Finetune/Step": 4623, "Finetune/Step Time": 2.8779661655426025} +{"Finetune/Learning Rate": 2.585418669907458e-07, "Finetune/Loss": 0.7654476165771484, "Finetune/Loss (Raw)": 0.8444393873214722, "Finetune/Step": 4624, "Finetune/Step Time": 2.8794318232685328} +{"Finetune/Learning Rate": 2.570729491464918e-07, "Finetune/Loss": 0.761059045791626, "Finetune/Loss (Raw)": 0.28146523237228394, "Finetune/Step": 4625, "Finetune/Step Time": 2.911180976778269} +{"Finetune/Learning Rate": 2.556081617253836e-07, "Finetune/Loss": 0.7571487426757812, "Finetune/Loss (Raw)": 0.20602235198020935, "Finetune/Step": 4626, "Finetune/Step Time": 2.9456035029143095} +{"Finetune/Learning Rate": 2.5414750534840105e-07, "Finetune/Loss": 0.7565425634384155, "Finetune/Loss (Raw)": 0.759507954120636, "Finetune/Step": 4627, "Finetune/Step Time": 2.945886190980673} +{"Finetune/Learning Rate": 2.526909806347777e-07, "Finetune/Loss": 0.7559301853179932, "Finetune/Loss (Raw)": 0.7454766631126404, "Finetune/Step": 4628, "Finetune/Step Time": 2.9473257046192884} +{"Finetune/Learning Rate": 2.51238588201993e-07, "Finetune/Loss": 0.755071759223938, "Finetune/Loss (Raw)": 0.7126147150993347, "Finetune/Step": 4629, "Finetune/Step Time": 2.9465866908431053} +{"Finetune/Learning Rate": 2.4979032866577323e-07, "Finetune/Loss": 0.7547001838684082, "Finetune/Loss (Raw)": 0.8098071813583374, "Finetune/Step": 4630, "Finetune/Step Time": 2.9456669874489307} +{"Finetune/Learning Rate": 2.483462026400996e-07, "Finetune/Loss": 0.7546442747116089, "Finetune/Loss (Raw)": 0.7699078321456909, "Finetune/Step": 4631, "Finetune/Step Time": 2.9467636235058308} +{"Finetune/Learning Rate": 2.4690621073719114e-07, "Finetune/Loss": 0.7543612122535706, "Finetune/Loss (Raw)": 0.7935110926628113, "Finetune/Step": 4632, "Finetune/Step Time": 2.9380526412278414} +{"Finetune/Learning Rate": 2.454703535675196e-07, "Finetune/Loss": 0.7541379332542419, "Finetune/Loss (Raw)": 0.7292603850364685, "Finetune/Step": 4633, "Finetune/Step Time": 2.935669358819723} +{"Finetune/Learning Rate": 2.440386317398058e-07, "Finetune/Loss": 0.7536557912826538, "Finetune/Loss (Raw)": 0.6986448764801025, "Finetune/Step": 4634, "Finetune/Step Time": 2.9346767384558916} +{"Finetune/Learning Rate": 2.42611045861012e-07, "Finetune/Loss": 0.7528946399688721, "Finetune/Loss (Raw)": 0.7786619663238525, "Finetune/Step": 4635, "Finetune/Step Time": 2.9300234001129866} +{"Finetune/Learning Rate": 2.411875965363519e-07, "Finetune/Loss": 0.7535161972045898, "Finetune/Loss (Raw)": 0.879206120967865, "Finetune/Step": 4636, "Finetune/Step Time": 2.934573298320174} +{"Finetune/Learning Rate": 2.397682843692828e-07, "Finetune/Loss": 0.7535790205001831, "Finetune/Loss (Raw)": 0.8630882501602173, "Finetune/Step": 4637, "Finetune/Step Time": 2.9320657160133123} +{"Finetune/Learning Rate": 2.3835310996150886e-07, "Finetune/Loss": 0.7535960674285889, "Finetune/Loss (Raw)": 0.7799711227416992, "Finetune/Step": 4638, "Finetune/Step Time": 2.9298978466540575} +{"Finetune/Learning Rate": 2.3694207391298018e-07, "Finetune/Loss": 0.7525344491004944, "Finetune/Loss (Raw)": 0.610761284828186, "Finetune/Step": 4639, "Finetune/Step Time": 2.954451499506831} +{"Finetune/Learning Rate": 2.3553517682189163e-07, "Finetune/Loss": 0.751875638961792, "Finetune/Loss (Raw)": 0.8208767771720886, "Finetune/Step": 4640, "Finetune/Step Time": 2.957678370177746} +{"Finetune/Learning Rate": 2.341324192846861e-07, "Finetune/Loss": 0.7521979808807373, "Finetune/Loss (Raw)": 0.7593863606452942, "Finetune/Step": 4641, "Finetune/Step Time": 2.960367465391755} +{"Finetune/Learning Rate": 2.32733801896049e-07, "Finetune/Loss": 0.7527598738670349, "Finetune/Loss (Raw)": 0.7357248663902283, "Finetune/Step": 4642, "Finetune/Step Time": 2.9598907250910997} +{"Finetune/Learning Rate": 2.3133932524890822e-07, "Finetune/Loss": 0.7519094347953796, "Finetune/Loss (Raw)": 0.7554827332496643, "Finetune/Step": 4643, "Finetune/Step Time": 2.960381304845214} +{"Finetune/Learning Rate": 2.2994898993444204e-07, "Finetune/Loss": 0.7510082125663757, "Finetune/Loss (Raw)": 0.7377023696899414, "Finetune/Step": 4644, "Finetune/Step Time": 2.961267914623022} +{"Finetune/Learning Rate": 2.2856279654207002e-07, "Finetune/Loss": 0.7534147500991821, "Finetune/Loss (Raw)": 0.7857798933982849, "Finetune/Step": 4645, "Finetune/Step Time": 2.941008983179927} +{"Finetune/Learning Rate": 2.2718074565945547e-07, "Finetune/Loss": 0.7527058124542236, "Finetune/Loss (Raw)": 0.698645293712616, "Finetune/Step": 4646, "Finetune/Step Time": 2.9396797195076942} +{"Finetune/Learning Rate": 2.2580283787250523e-07, "Finetune/Loss": 0.7522913217544556, "Finetune/Loss (Raw)": 0.7160284519195557, "Finetune/Step": 4647, "Finetune/Step Time": 2.9405784364789724} +{"Finetune/Learning Rate": 2.2442907376537204e-07, "Finetune/Loss": 0.7532604932785034, "Finetune/Loss (Raw)": 0.8181856870651245, "Finetune/Step": 4648, "Finetune/Step Time": 2.9387136679142714} +{"Finetune/Learning Rate": 2.2305945392044893e-07, "Finetune/Loss": 0.7535186409950256, "Finetune/Loss (Raw)": 0.8015430569648743, "Finetune/Step": 4649, "Finetune/Step Time": 2.9381882566958666} +{"Finetune/Learning Rate": 2.2169397891837363e-07, "Finetune/Loss": 0.7540596723556519, "Finetune/Loss (Raw)": 0.7351989150047302, "Finetune/Step": 4650, "Finetune/Step Time": 2.9188102819025517} +{"Finetune/Learning Rate": 2.2033264933802757e-07, "Finetune/Loss": 0.7534321546554565, "Finetune/Loss (Raw)": 0.7512310743331909, "Finetune/Step": 4651, "Finetune/Step Time": 2.9224710650742054} +{"Finetune/Learning Rate": 2.189754657565346e-07, "Finetune/Loss": 0.7536302804946899, "Finetune/Loss (Raw)": 0.8370368480682373, "Finetune/Step": 4652, "Finetune/Step Time": 2.925343420356512} +{"Finetune/Learning Rate": 2.1762242874925676e-07, "Finetune/Loss": 0.7542819976806641, "Finetune/Loss (Raw)": 0.8628215193748474, "Finetune/Step": 4653, "Finetune/Step Time": 2.9204657059162855} +{"Finetune/Learning Rate": 2.1627353888980296e-07, "Finetune/Loss": 0.7527369260787964, "Finetune/Loss (Raw)": 0.5912559032440186, "Finetune/Step": 4654, "Finetune/Step Time": 2.9439834132790565} +{"Finetune/Learning Rate": 2.1492879675002465e-07, "Finetune/Loss": 0.7535181045532227, "Finetune/Loss (Raw)": 0.6553853750228882, "Finetune/Step": 4655, "Finetune/Step Time": 2.9470265172421932} +{"Finetune/Learning Rate": 2.1358820290000915e-07, "Finetune/Loss": 0.75380539894104, "Finetune/Loss (Raw)": 0.8213086128234863, "Finetune/Step": 4656, "Finetune/Step Time": 2.9493987914174795} +{"Finetune/Learning Rate": 2.1225175790809183e-07, "Finetune/Loss": 0.7547668218612671, "Finetune/Loss (Raw)": 0.7656428217887878, "Finetune/Step": 4657, "Finetune/Step Time": 2.924742603674531} +{"Finetune/Learning Rate": 2.1091946234084282e-07, "Finetune/Loss": 0.7542921304702759, "Finetune/Loss (Raw)": 0.7676534652709961, "Finetune/Step": 4658, "Finetune/Step Time": 2.9216513633728027} +{"Finetune/Learning Rate": 2.0959131676308142e-07, "Finetune/Loss": 0.7557399272918701, "Finetune/Loss (Raw)": 0.8771084547042847, "Finetune/Step": 4659, "Finetune/Step Time": 2.923432594165206} +{"Finetune/Learning Rate": 2.0826732173785725e-07, "Finetune/Loss": 0.7556881904602051, "Finetune/Loss (Raw)": 0.7867928147315979, "Finetune/Step": 4660, "Finetune/Step Time": 2.923808502033353} +{"Finetune/Learning Rate": 2.0694747782646796e-07, "Finetune/Loss": 0.7559144496917725, "Finetune/Loss (Raw)": 0.8129235506057739, "Finetune/Step": 4661, "Finetune/Step Time": 2.922042513266206} +{"Finetune/Learning Rate": 2.0563178558845042e-07, "Finetune/Loss": 0.7563159465789795, "Finetune/Loss (Raw)": 0.7479282021522522, "Finetune/Step": 4662, "Finetune/Step Time": 2.9200745429843664} +{"Finetune/Learning Rate": 2.0432024558157738e-07, "Finetune/Loss": 0.7561298608779907, "Finetune/Loss (Raw)": 0.7556709051132202, "Finetune/Step": 4663, "Finetune/Step Time": 2.921268954873085} +{"Finetune/Learning Rate": 2.0301285836186625e-07, "Finetune/Loss": 0.7562767267227173, "Finetune/Loss (Raw)": 0.7528154850006104, "Finetune/Step": 4664, "Finetune/Step Time": 2.9201083201915026} +{"Finetune/Learning Rate": 2.0170962448357035e-07, "Finetune/Loss": 0.7569803595542908, "Finetune/Loss (Raw)": 0.8219085335731506, "Finetune/Step": 4665, "Finetune/Step Time": 2.923449032008648} +{"Finetune/Learning Rate": 2.004105444991844e-07, "Finetune/Loss": 0.757123589515686, "Finetune/Loss (Raw)": 0.90546715259552, "Finetune/Step": 4666, "Finetune/Step Time": 2.917167032137513} +{"Finetune/Learning Rate": 1.9911561895944008e-07, "Finetune/Loss": 0.7564505338668823, "Finetune/Loss (Raw)": 0.7031084299087524, "Finetune/Step": 4667, "Finetune/Step Time": 2.9160877224057913} +{"Finetune/Learning Rate": 1.978248484133094e-07, "Finetune/Loss": 0.7569722533226013, "Finetune/Loss (Raw)": 0.7654364109039307, "Finetune/Step": 4668, "Finetune/Step Time": 2.8991878367960453} +{"Finetune/Learning Rate": 1.965382334080046e-07, "Finetune/Loss": 0.7573482990264893, "Finetune/Loss (Raw)": 0.7811739444732666, "Finetune/Step": 4669, "Finetune/Step Time": 2.895270800217986} +{"Finetune/Learning Rate": 1.952557744889716e-07, "Finetune/Loss": 0.75713050365448, "Finetune/Loss (Raw)": 0.7353294491767883, "Finetune/Step": 4670, "Finetune/Step Time": 2.898289021104574} +{"Finetune/Learning Rate": 1.939774721998966e-07, "Finetune/Loss": 0.7537680864334106, "Finetune/Loss (Raw)": 0.3935224413871765, "Finetune/Step": 4671, "Finetune/Step Time": 2.9328331612050533} +{"Finetune/Learning Rate": 1.9270332708270612e-07, "Finetune/Loss": 0.7532660961151123, "Finetune/Loss (Raw)": 0.7016838788986206, "Finetune/Step": 4672, "Finetune/Step Time": 2.963684670627117} +{"Finetune/Learning Rate": 1.914333396775603e-07, "Finetune/Loss": 0.7533656358718872, "Finetune/Loss (Raw)": 0.8234717845916748, "Finetune/Step": 4673, "Finetune/Step Time": 2.966813003644347} +{"Finetune/Learning Rate": 1.9016751052285952e-07, "Finetune/Loss": 0.7537779808044434, "Finetune/Loss (Raw)": 0.7724441289901733, "Finetune/Step": 4674, "Finetune/Step Time": 2.967306647449732} +{"Finetune/Learning Rate": 1.8890584015524016e-07, "Finetune/Loss": 0.7536846995353699, "Finetune/Loss (Raw)": 0.7773931622505188, "Finetune/Step": 4675, "Finetune/Step Time": 2.968430010601878} +{"Finetune/Learning Rate": 1.8764832910957543e-07, "Finetune/Loss": 0.7545009255409241, "Finetune/Loss (Raw)": 0.8784030079841614, "Finetune/Step": 4676, "Finetune/Step Time": 2.9720781091600657} +{"Finetune/Learning Rate": 1.8639497791897444e-07, "Finetune/Loss": 0.7528998851776123, "Finetune/Loss (Raw)": 0.5397913455963135, "Finetune/Step": 4677, "Finetune/Step Time": 2.9990402664989233} +{"Finetune/Learning Rate": 1.851457871147855e-07, "Finetune/Loss": 0.7529041767120361, "Finetune/Loss (Raw)": 0.7792017459869385, "Finetune/Step": 4678, "Finetune/Step Time": 2.999391110613942} +{"Finetune/Learning Rate": 1.8390075722659052e-07, "Finetune/Loss": 0.7533186674118042, "Finetune/Loss (Raw)": 0.7836352586746216, "Finetune/Step": 4679, "Finetune/Step Time": 2.9965501986443996} +{"Finetune/Learning Rate": 1.8265988878220842e-07, "Finetune/Loss": 0.7518398761749268, "Finetune/Loss (Raw)": 0.5974200963973999, "Finetune/Step": 4680, "Finetune/Step Time": 3.0207531843334436} +{"Finetune/Learning Rate": 1.8142318230769284e-07, "Finetune/Loss": 0.7518917322158813, "Finetune/Loss (Raw)": 0.7186470627784729, "Finetune/Step": 4681, "Finetune/Step Time": 3.0211032293736935} +{"Finetune/Learning Rate": 1.8019063832733552e-07, "Finetune/Loss": 0.7510745525360107, "Finetune/Loss (Raw)": 0.7767891883850098, "Finetune/Step": 4682, "Finetune/Step Time": 3.0185162387788296} +{"Finetune/Learning Rate": 1.789622573636618e-07, "Finetune/Loss": 0.7515451908111572, "Finetune/Loss (Raw)": 0.8651629090309143, "Finetune/Step": 4683, "Finetune/Step Time": 3.020724007859826} +{"Finetune/Learning Rate": 1.7773803993743178e-07, "Finetune/Loss": 0.7517651319503784, "Finetune/Loss (Raw)": 0.7913854718208313, "Finetune/Step": 4684, "Finetune/Step Time": 3.018177770078182} +{"Finetune/Learning Rate": 1.765179865676414e-07, "Finetune/Loss": 0.7525032758712769, "Finetune/Loss (Raw)": 0.8063883781433105, "Finetune/Step": 4685, "Finetune/Step Time": 3.021226057782769} +{"Finetune/Learning Rate": 1.753020977715192e-07, "Finetune/Loss": 0.75327467918396, "Finetune/Loss (Raw)": 0.8610711693763733, "Finetune/Step": 4686, "Finetune/Step Time": 3.018020808696747} +{"Finetune/Learning Rate": 1.7409037406453388e-07, "Finetune/Loss": 0.7536770701408386, "Finetune/Loss (Raw)": 0.7477180361747742, "Finetune/Step": 4687, "Finetune/Step Time": 2.9985081516206264} +{"Finetune/Learning Rate": 1.7288281596038013e-07, "Finetune/Loss": 0.7542238235473633, "Finetune/Loss (Raw)": 0.7928266525268555, "Finetune/Step": 4688, "Finetune/Step Time": 2.986893158406019} +{"Finetune/Learning Rate": 1.7167942397099292e-07, "Finetune/Loss": 0.7543145418167114, "Finetune/Loss (Raw)": 0.7970990538597107, "Finetune/Step": 4689, "Finetune/Step Time": 2.98491046205163} +{"Finetune/Learning Rate": 1.7048019860654074e-07, "Finetune/Loss": 0.7550716400146484, "Finetune/Loss (Raw)": 0.8766396045684814, "Finetune/Step": 4690, "Finetune/Step Time": 2.983738349750638} +{"Finetune/Learning Rate": 1.6928514037541922e-07, "Finetune/Loss": 0.7594975829124451, "Finetune/Loss (Raw)": 0.7459294199943542, "Finetune/Step": 4691, "Finetune/Step Time": 2.949635621160269} +{"Finetune/Learning Rate": 1.6809424978426635e-07, "Finetune/Loss": 0.7605747580528259, "Finetune/Loss (Raw)": 0.8316682577133179, "Finetune/Step": 4692, "Finetune/Step Time": 2.927078301087022} +{"Finetune/Learning Rate": 1.6690752733794834e-07, "Finetune/Loss": 0.7593669295310974, "Finetune/Loss (Raw)": 0.833747923374176, "Finetune/Step": 4693, "Finetune/Step Time": 2.927490135654807} +{"Finetune/Learning Rate": 1.6572497353956496e-07, "Finetune/Loss": 0.7596933841705322, "Finetune/Loss (Raw)": 0.7896409034729004, "Finetune/Step": 4694, "Finetune/Step Time": 2.9461222626268864} +{"Finetune/Learning Rate": 1.645465888904485e-07, "Finetune/Loss": 0.7602760195732117, "Finetune/Loss (Raw)": 0.7715663313865662, "Finetune/Step": 4695, "Finetune/Step Time": 2.9534901212900877} +{"Finetune/Learning Rate": 1.633723738901627e-07, "Finetune/Loss": 0.761184573173523, "Finetune/Loss (Raw)": 0.8925973176956177, "Finetune/Step": 4696, "Finetune/Step Time": 2.954434299841523} +{"Finetune/Learning Rate": 1.6220232903650822e-07, "Finetune/Loss": 0.7609480619430542, "Finetune/Loss (Raw)": 0.7067108750343323, "Finetune/Step": 4697, "Finetune/Step Time": 2.954351533204317} +{"Finetune/Learning Rate": 1.6103645482551277e-07, "Finetune/Loss": 0.7618191838264465, "Finetune/Loss (Raw)": 0.8280069231987, "Finetune/Step": 4698, "Finetune/Step Time": 2.950672024860978} +{"Finetune/Learning Rate": 1.598747517514365e-07, "Finetune/Loss": 0.7612112164497375, "Finetune/Loss (Raw)": 0.7381961941719055, "Finetune/Step": 4699, "Finetune/Step Time": 2.94942538253963} +{"Finetune/Learning Rate": 1.587172203067766e-07, "Finetune/Loss": 0.7606003880500793, "Finetune/Loss (Raw)": 0.7367355823516846, "Finetune/Step": 4700, "Finetune/Step Time": 2.9519661646336317} +{"Finetune/Learning Rate": 1.5756386098225386e-07, "Finetune/Loss": 0.7612923383712769, "Finetune/Loss (Raw)": 0.8254355788230896, "Finetune/Step": 4701, "Finetune/Step Time": 2.9560499656945467} +{"Finetune/Learning Rate": 1.56414674266826e-07, "Finetune/Loss": 0.7633686065673828, "Finetune/Loss (Raw)": 0.8335295915603638, "Finetune/Step": 4702, "Finetune/Step Time": 2.9348320309072733} +{"Finetune/Learning Rate": 1.5526966064768e-07, "Finetune/Loss": 0.762851357460022, "Finetune/Loss (Raw)": 0.803339421749115, "Finetune/Step": 4703, "Finetune/Step Time": 2.937182182446122} +{"Finetune/Learning Rate": 1.5412882061023427e-07, "Finetune/Loss": 0.7627561092376709, "Finetune/Loss (Raw)": 0.7540003061294556, "Finetune/Step": 4704, "Finetune/Step Time": 2.935276446864009} +{"Finetune/Learning Rate": 1.5299215463813522e-07, "Finetune/Loss": 0.76175856590271, "Finetune/Loss (Raw)": 0.7048362493515015, "Finetune/Step": 4705, "Finetune/Step Time": 2.9317501448094845} +{"Finetune/Learning Rate": 1.5185966321326294e-07, "Finetune/Loss": 0.7625386714935303, "Finetune/Loss (Raw)": 0.8215506076812744, "Finetune/Step": 4706, "Finetune/Step Time": 2.9343940801918507} +{"Finetune/Learning Rate": 1.5073134681572787e-07, "Finetune/Loss": 0.7621204853057861, "Finetune/Loss (Raw)": 0.7574297189712524, "Finetune/Step": 4707, "Finetune/Step Time": 2.9396331030875444} +{"Finetune/Learning Rate": 1.4960720592386847e-07, "Finetune/Loss": 0.7610512971878052, "Finetune/Loss (Raw)": 0.7211998701095581, "Finetune/Step": 4708, "Finetune/Step Time": 2.9410413671284914} +{"Finetune/Learning Rate": 1.4848724101425128e-07, "Finetune/Loss": 0.7603330612182617, "Finetune/Loss (Raw)": 0.762679398059845, "Finetune/Step": 4709, "Finetune/Step Time": 2.9362856559455395} +{"Finetune/Learning Rate": 1.4737145256167872e-07, "Finetune/Loss": 0.7607836723327637, "Finetune/Loss (Raw)": 0.8262138962745667, "Finetune/Step": 4710, "Finetune/Step Time": 2.936682416126132} +{"Finetune/Learning Rate": 1.462598410391769e-07, "Finetune/Loss": 0.7606253027915955, "Finetune/Loss (Raw)": 0.8252432346343994, "Finetune/Step": 4711, "Finetune/Step Time": 2.935661131516099} +{"Finetune/Learning Rate": 1.4515240691800437e-07, "Finetune/Loss": 0.7618215084075928, "Finetune/Loss (Raw)": 0.8515459299087524, "Finetune/Step": 4712, "Finetune/Step Time": 2.9348044749349356} +{"Finetune/Learning Rate": 1.4404915066764557e-07, "Finetune/Loss": 0.761565089225769, "Finetune/Loss (Raw)": 0.8432835340499878, "Finetune/Step": 4713, "Finetune/Step Time": 2.9316157158464193} +{"Finetune/Learning Rate": 1.4295007275581752e-07, "Finetune/Loss": 0.7616000771522522, "Finetune/Loss (Raw)": 0.7538020014762878, "Finetune/Step": 4714, "Finetune/Step Time": 2.9361556321382523} +{"Finetune/Learning Rate": 1.4185517364846414e-07, "Finetune/Loss": 0.7617272138595581, "Finetune/Loss (Raw)": 0.8058611750602722, "Finetune/Step": 4715, "Finetune/Step Time": 2.934627629816532} +{"Finetune/Learning Rate": 1.4076445380975524e-07, "Finetune/Loss": 0.7618110179901123, "Finetune/Loss (Raw)": 0.7811277508735657, "Finetune/Step": 4716, "Finetune/Step Time": 2.9354292545467615} +{"Finetune/Learning Rate": 1.3967791370209427e-07, "Finetune/Loss": 0.7594516277313232, "Finetune/Loss (Raw)": 0.29697614908218384, "Finetune/Step": 4717, "Finetune/Step Time": 2.942355301231146} +{"Finetune/Learning Rate": 1.3859555378610944e-07, "Finetune/Loss": 0.7590023875236511, "Finetune/Loss (Raw)": 0.7571902871131897, "Finetune/Step": 4718, "Finetune/Step Time": 2.9406492728739977} +{"Finetune/Learning Rate": 1.3751737452065483e-07, "Finetune/Loss": 0.7588087320327759, "Finetune/Loss (Raw)": 0.7638369202613831, "Finetune/Step": 4719, "Finetune/Step Time": 2.9427252989262342} +{"Finetune/Learning Rate": 1.3644337636281702e-07, "Finetune/Loss": 0.7578073143959045, "Finetune/Loss (Raw)": 0.7388508915901184, "Finetune/Step": 4720, "Finetune/Step Time": 2.939447194337845} +{"Finetune/Learning Rate": 1.3537355976790622e-07, "Finetune/Loss": 0.7591990232467651, "Finetune/Loss (Raw)": 0.792186975479126, "Finetune/Step": 4721, "Finetune/Step Time": 2.9187266137450933} +{"Finetune/Learning Rate": 1.343079251894608e-07, "Finetune/Loss": 0.7623236179351807, "Finetune/Loss (Raw)": 0.7972273230552673, "Finetune/Step": 4722, "Finetune/Step Time": 2.891390787437558} +{"Finetune/Learning Rate": 1.3324647307924821e-07, "Finetune/Loss": 0.7620477080345154, "Finetune/Loss (Raw)": 0.7898097634315491, "Finetune/Step": 4723, "Finetune/Step Time": 2.8907837998121977} +{"Finetune/Learning Rate": 1.3218920388725853e-07, "Finetune/Loss": 0.7610988616943359, "Finetune/Loss (Raw)": 0.7768495678901672, "Finetune/Step": 4724, "Finetune/Step Time": 2.890358278527856} +{"Finetune/Learning Rate": 1.3113611806171545e-07, "Finetune/Loss": 0.7623236179351807, "Finetune/Loss (Raw)": 0.7129543423652649, "Finetune/Step": 4725, "Finetune/Step Time": 2.871891925111413} +{"Finetune/Learning Rate": 1.300872160490607e-07, "Finetune/Loss": 0.7623778581619263, "Finetune/Loss (Raw)": 0.8253894448280334, "Finetune/Step": 4726, "Finetune/Step Time": 2.8720610588788986} +{"Finetune/Learning Rate": 1.2904249829396864e-07, "Finetune/Loss": 0.7623987793922424, "Finetune/Loss (Raw)": 0.7664194703102112, "Finetune/Step": 4727, "Finetune/Step Time": 2.872058928012848} +{"Finetune/Learning Rate": 1.2800196523933717e-07, "Finetune/Loss": 0.7624391317367554, "Finetune/Loss (Raw)": 0.7419551014900208, "Finetune/Step": 4728, "Finetune/Step Time": 2.880092980340123} +{"Finetune/Learning Rate": 1.269656173262901e-07, "Finetune/Loss": 0.760600209236145, "Finetune/Loss (Raw)": 0.5666300058364868, "Finetune/Step": 4729, "Finetune/Step Time": 2.904895370826125} +{"Finetune/Learning Rate": 1.2593345499417819e-07, "Finetune/Loss": 0.7598521113395691, "Finetune/Loss (Raw)": 0.8072639107704163, "Finetune/Step": 4730, "Finetune/Step Time": 2.9050642531365156} +{"Finetune/Learning Rate": 1.24905478680577e-07, "Finetune/Loss": 0.7605186700820923, "Finetune/Loss (Raw)": 0.800041139125824, "Finetune/Step": 4731, "Finetune/Step Time": 2.906055236235261} +{"Finetune/Learning Rate": 1.2388168882128791e-07, "Finetune/Loss": 0.7601594924926758, "Finetune/Loss (Raw)": 0.7986094951629639, "Finetune/Step": 4732, "Finetune/Step Time": 2.902107572183013} +{"Finetune/Learning Rate": 1.22862085850336e-07, "Finetune/Loss": 0.7608581185340881, "Finetune/Loss (Raw)": 0.8800492882728577, "Finetune/Step": 4733, "Finetune/Step Time": 2.90189216658473} +{"Finetune/Learning Rate": 1.218466701999721e-07, "Finetune/Loss": 0.7606058716773987, "Finetune/Loss (Raw)": 0.8312125205993652, "Finetune/Step": 4734, "Finetune/Step Time": 2.8999642692506313} +{"Finetune/Learning Rate": 1.2083544230067412e-07, "Finetune/Loss": 0.7613363265991211, "Finetune/Loss (Raw)": 0.6022560596466064, "Finetune/Step": 4735, "Finetune/Step Time": 2.9007711820304394} +{"Finetune/Learning Rate": 1.1982840258114137e-07, "Finetune/Loss": 0.7608278393745422, "Finetune/Loss (Raw)": 0.7984215617179871, "Finetune/Step": 4736, "Finetune/Step Time": 2.9003032855689526} +{"Finetune/Learning Rate": 1.18825551468299e-07, "Finetune/Loss": 0.7575128078460693, "Finetune/Loss (Raw)": 0.3592780828475952, "Finetune/Step": 4737, "Finetune/Step Time": 2.928621966391802} +{"Finetune/Learning Rate": 1.1782688938729692e-07, "Finetune/Loss": 0.7589398622512817, "Finetune/Loss (Raw)": 0.9586222767829895, "Finetune/Step": 4738, "Finetune/Step Time": 2.929185602813959} +{"Finetune/Learning Rate": 1.1683241676150758e-07, "Finetune/Loss": 0.7587354183197021, "Finetune/Loss (Raw)": 0.6969133615493774, "Finetune/Step": 4739, "Finetune/Step Time": 2.9277010057121515} +{"Finetune/Learning Rate": 1.1584213401252931e-07, "Finetune/Loss": 0.7582494616508484, "Finetune/Loss (Raw)": 0.7337753772735596, "Finetune/Step": 4740, "Finetune/Step Time": 2.9317090529948473} +{"Finetune/Learning Rate": 1.1485604156018404e-07, "Finetune/Loss": 0.7579711675643921, "Finetune/Loss (Raw)": 0.786172091960907, "Finetune/Step": 4741, "Finetune/Step Time": 2.9371448066085577} +{"Finetune/Learning Rate": 1.1387413982251516e-07, "Finetune/Loss": 0.7584744691848755, "Finetune/Loss (Raw)": 0.7971704006195068, "Finetune/Step": 4742, "Finetune/Step Time": 2.936649028211832} +{"Finetune/Learning Rate": 1.128964292157908e-07, "Finetune/Loss": 0.7585147023200989, "Finetune/Loss (Raw)": 0.7713306546211243, "Finetune/Step": 4743, "Finetune/Step Time": 2.93473095074296} +{"Finetune/Learning Rate": 1.1192291015450164e-07, "Finetune/Loss": 0.7579213976860046, "Finetune/Loss (Raw)": 0.7635828256607056, "Finetune/Step": 4744, "Finetune/Step Time": 2.926321590319276} +{"Finetune/Learning Rate": 1.1095358305136417e-07, "Finetune/Loss": 0.7579426765441895, "Finetune/Loss (Raw)": 0.812433660030365, "Finetune/Step": 4745, "Finetune/Step Time": 2.9304109010845423} +{"Finetune/Learning Rate": 1.0998844831731415e-07, "Finetune/Loss": 0.7580034732818604, "Finetune/Loss (Raw)": 0.7683010697364807, "Finetune/Step": 4746, "Finetune/Step Time": 2.9302948620170355} +{"Finetune/Learning Rate": 1.0902750636151093e-07, "Finetune/Loss": 0.7593878507614136, "Finetune/Loss (Raw)": 0.8411984443664551, "Finetune/Step": 4747, "Finetune/Step Time": 2.927089683711529} +{"Finetune/Learning Rate": 1.0807075759133867e-07, "Finetune/Loss": 0.7588851451873779, "Finetune/Loss (Raw)": 0.782343327999115, "Finetune/Step": 4748, "Finetune/Step Time": 2.924837652593851} +{"Finetune/Learning Rate": 1.0711820241240067e-07, "Finetune/Loss": 0.758136510848999, "Finetune/Loss (Raw)": 0.7218982577323914, "Finetune/Step": 4749, "Finetune/Step Time": 2.926705926656723} +{"Finetune/Learning Rate": 1.0616984122852391e-07, "Finetune/Loss": 0.7568264007568359, "Finetune/Loss (Raw)": 0.7243182063102722, "Finetune/Step": 4750, "Finetune/Step Time": 2.930279215797782} +{"Finetune/Learning Rate": 1.0522567444175791e-07, "Finetune/Loss": 0.7570639848709106, "Finetune/Loss (Raw)": 0.7912412881851196, "Finetune/Step": 4751, "Finetune/Step Time": 2.9240858536213636} +{"Finetune/Learning Rate": 1.0428570245237247e-07, "Finetune/Loss": 0.7562321424484253, "Finetune/Loss (Raw)": 0.7379760146141052, "Finetune/Step": 4752, "Finetune/Step Time": 2.9259658474475145} +{"Finetune/Learning Rate": 1.0334992565886214e-07, "Finetune/Loss": 0.7602302432060242, "Finetune/Loss (Raw)": 0.7932180762290955, "Finetune/Step": 4753, "Finetune/Step Time": 2.8955382145941257} +{"Finetune/Learning Rate": 1.0241834445793742e-07, "Finetune/Loss": 0.7651265859603882, "Finetune/Loss (Raw)": 0.8327511548995972, "Finetune/Step": 4754, "Finetune/Step Time": 2.8616437762975693} +{"Finetune/Learning Rate": 1.0149095924453567e-07, "Finetune/Loss": 0.7653191089630127, "Finetune/Loss (Raw)": 0.7841586470603943, "Finetune/Step": 4755, "Finetune/Step Time": 2.858393892645836} +{"Finetune/Learning Rate": 1.0056777041181354e-07, "Finetune/Loss": 0.7651766538619995, "Finetune/Loss (Raw)": 0.727232813835144, "Finetune/Step": 4756, "Finetune/Step Time": 2.8569614198058844} +{"Finetune/Learning Rate": 9.964877835114684e-08, "Finetune/Loss": 0.7669402360916138, "Finetune/Loss (Raw)": 0.9383567571640015, "Finetune/Step": 4757, "Finetune/Step Time": 2.859916877001524} +{"Finetune/Learning Rate": 9.873398345213393e-08, "Finetune/Loss": 0.7668602466583252, "Finetune/Loss (Raw)": 0.799575686454773, "Finetune/Step": 4758, "Finetune/Step Time": 2.858173655346036} +{"Finetune/Learning Rate": 9.782338610259456e-08, "Finetune/Loss": 0.7671283483505249, "Finetune/Loss (Raw)": 0.8042161464691162, "Finetune/Step": 4759, "Finetune/Step Time": 2.857867993414402} +{"Finetune/Learning Rate": 9.691698668856774e-08, "Finetune/Loss": 0.7674751281738281, "Finetune/Loss (Raw)": 0.8378989100456238, "Finetune/Step": 4760, "Finetune/Step Time": 2.857483444735408} +{"Finetune/Learning Rate": 9.601478559431277e-08, "Finetune/Loss": 0.7674524784088135, "Finetune/Loss (Raw)": 0.7263615131378174, "Finetune/Step": 4761, "Finetune/Step Time": 2.860180029645562} +{"Finetune/Learning Rate": 9.511678320230921e-08, "Finetune/Loss": 0.7670626044273376, "Finetune/Loss (Raw)": 0.6487449407577515, "Finetune/Step": 4762, "Finetune/Step Time": 2.8845407627522945} +{"Finetune/Learning Rate": 9.422297989325813e-08, "Finetune/Loss": 0.7670064568519592, "Finetune/Loss (Raw)": 0.7714731097221375, "Finetune/Step": 4763, "Finetune/Step Time": 2.887292480096221} +{"Finetune/Learning Rate": 9.33333760460764e-08, "Finetune/Loss": 0.7655383348464966, "Finetune/Loss (Raw)": 0.691282331943512, "Finetune/Step": 4764, "Finetune/Step Time": 2.908741507679224} +{"Finetune/Learning Rate": 9.244797203790568e-08, "Finetune/Loss": 0.7647514343261719, "Finetune/Loss (Raw)": 0.7623691558837891, "Finetune/Step": 4765, "Finetune/Step Time": 2.9103026930242777} +{"Finetune/Learning Rate": 9.15667682441035e-08, "Finetune/Loss": 0.7648892402648926, "Finetune/Loss (Raw)": 0.7976105213165283, "Finetune/Step": 4766, "Finetune/Step Time": 2.913802456110716} +{"Finetune/Learning Rate": 9.068976503824877e-08, "Finetune/Loss": 0.7666707038879395, "Finetune/Loss (Raw)": 0.8387850522994995, "Finetune/Step": 4767, "Finetune/Step Time": 2.889634544029832} +{"Finetune/Learning Rate": 8.981696279213858e-08, "Finetune/Loss": 0.7669409513473511, "Finetune/Loss (Raw)": 0.8554729223251343, "Finetune/Step": 4768, "Finetune/Step Time": 2.8880379926413298} +{"Finetune/Learning Rate": 8.894836187578914e-08, "Finetune/Loss": 0.7677991986274719, "Finetune/Loss (Raw)": 0.8692427277565002, "Finetune/Step": 4769, "Finetune/Step Time": 2.886523960158229} +{"Finetune/Learning Rate": 8.808396265743701e-08, "Finetune/Loss": 0.7685315012931824, "Finetune/Loss (Raw)": 0.8294591307640076, "Finetune/Step": 4770, "Finetune/Step Time": 2.886318299919367} +{"Finetune/Learning Rate": 8.722376550353351e-08, "Finetune/Loss": 0.7691109776496887, "Finetune/Loss (Raw)": 0.8296535611152649, "Finetune/Step": 4771, "Finetune/Step Time": 2.882974887266755} +{"Finetune/Learning Rate": 8.636777077875247e-08, "Finetune/Loss": 0.7699394822120667, "Finetune/Loss (Raw)": 0.8437540531158447, "Finetune/Step": 4772, "Finetune/Step Time": 2.876956135034561} +{"Finetune/Learning Rate": 8.551597884598584e-08, "Finetune/Loss": 0.769623875617981, "Finetune/Loss (Raw)": 0.7453799843788147, "Finetune/Step": 4773, "Finetune/Step Time": 2.874385368078947} +{"Finetune/Learning Rate": 8.466839006634364e-08, "Finetune/Loss": 0.7709157466888428, "Finetune/Loss (Raw)": 0.8639973402023315, "Finetune/Step": 4774, "Finetune/Step Time": 2.874516362324357} +{"Finetune/Learning Rate": 8.382500479914957e-08, "Finetune/Loss": 0.7716858386993408, "Finetune/Loss (Raw)": 0.8146030902862549, "Finetune/Step": 4775, "Finetune/Step Time": 2.8746361155062914} +{"Finetune/Learning Rate": 8.298582340195205e-08, "Finetune/Loss": 0.7727593779563904, "Finetune/Loss (Raw)": 0.9556063413619995, "Finetune/Step": 4776, "Finetune/Step Time": 2.875173442065716} +{"Finetune/Learning Rate": 8.215084623051207e-08, "Finetune/Loss": 0.7725632190704346, "Finetune/Loss (Raw)": 0.7764322757720947, "Finetune/Step": 4777, "Finetune/Step Time": 2.8760712891817093} +{"Finetune/Learning Rate": 8.132007363881311e-08, "Finetune/Loss": 0.7724133729934692, "Finetune/Loss (Raw)": 0.716020405292511, "Finetune/Step": 4778, "Finetune/Step Time": 2.8718372862786055} +{"Finetune/Learning Rate": 8.049350597905126e-08, "Finetune/Loss": 0.7726083993911743, "Finetune/Loss (Raw)": 0.7761914730072021, "Finetune/Step": 4779, "Finetune/Step Time": 2.869843455031514} +{"Finetune/Learning Rate": 7.967114360164286e-08, "Finetune/Loss": 0.7719860076904297, "Finetune/Loss (Raw)": 0.7573792934417725, "Finetune/Step": 4780, "Finetune/Step Time": 2.8692111149430275} +{"Finetune/Learning Rate": 7.885298685522235e-08, "Finetune/Loss": 0.7712708711624146, "Finetune/Loss (Raw)": 0.7712742686271667, "Finetune/Step": 4781, "Finetune/Step Time": 2.8698381446301937} +{"Finetune/Learning Rate": 7.803903608663677e-08, "Finetune/Loss": 0.7716879844665527, "Finetune/Loss (Raw)": 0.6446412801742554, "Finetune/Step": 4782, "Finetune/Step Time": 2.868148051202297} +{"Finetune/Learning Rate": 7.72292916409545e-08, "Finetune/Loss": 0.7728493213653564, "Finetune/Loss (Raw)": 0.8040491342544556, "Finetune/Step": 4783, "Finetune/Step Time": 2.84625911898911} +{"Finetune/Learning Rate": 7.642375386145873e-08, "Finetune/Loss": 0.7714698314666748, "Finetune/Loss (Raw)": 0.6447296142578125, "Finetune/Step": 4784, "Finetune/Step Time": 2.8736645244061947} +{"Finetune/Learning Rate": 7.562242308965073e-08, "Finetune/Loss": 0.7712526321411133, "Finetune/Loss (Raw)": 0.7378382682800293, "Finetune/Step": 4785, "Finetune/Step Time": 2.8777791503816843} +{"Finetune/Learning Rate": 7.482529966524543e-08, "Finetune/Loss": 0.7716996669769287, "Finetune/Loss (Raw)": 0.8248782157897949, "Finetune/Step": 4786, "Finetune/Step Time": 2.878986045718193} +{"Finetune/Learning Rate": 7.403238392617806e-08, "Finetune/Loss": 0.7705861330032349, "Finetune/Loss (Raw)": 0.7345719337463379, "Finetune/Step": 4787, "Finetune/Step Time": 2.9019035305827856} +{"Finetune/Learning Rate": 7.32436762085964e-08, "Finetune/Loss": 0.7707188129425049, "Finetune/Loss (Raw)": 0.8037838339805603, "Finetune/Step": 4788, "Finetune/Step Time": 2.901514858007431} +{"Finetune/Learning Rate": 7.245917684686521e-08, "Finetune/Loss": 0.7703789472579956, "Finetune/Loss (Raw)": 0.7694109678268433, "Finetune/Step": 4789, "Finetune/Step Time": 2.89921616576612} +{"Finetune/Learning Rate": 7.167888617356622e-08, "Finetune/Loss": 0.7704381942749023, "Finetune/Loss (Raw)": 0.7555151581764221, "Finetune/Step": 4790, "Finetune/Step Time": 2.9001847002655268} +{"Finetune/Learning Rate": 7.090280451949816e-08, "Finetune/Loss": 0.7700620889663696, "Finetune/Loss (Raw)": 0.7075371146202087, "Finetune/Step": 4791, "Finetune/Step Time": 2.902007184922695} +{"Finetune/Learning Rate": 7.013093221367229e-08, "Finetune/Loss": 0.770440936088562, "Finetune/Loss (Raw)": 0.8013019561767578, "Finetune/Step": 4792, "Finetune/Step Time": 2.898824580013752} +{"Finetune/Learning Rate": 6.936326958331463e-08, "Finetune/Loss": 0.7699567675590515, "Finetune/Loss (Raw)": 0.7599344849586487, "Finetune/Step": 4793, "Finetune/Step Time": 2.896893609315157} +{"Finetune/Learning Rate": 6.859981695387153e-08, "Finetune/Loss": 0.7698121070861816, "Finetune/Loss (Raw)": 0.8869503140449524, "Finetune/Step": 4794, "Finetune/Step Time": 2.9001441337168217} +{"Finetune/Learning Rate": 6.784057464900073e-08, "Finetune/Loss": 0.7699007987976074, "Finetune/Loss (Raw)": 0.7144564986228943, "Finetune/Step": 4795, "Finetune/Step Time": 2.901535304263234} +{"Finetune/Learning Rate": 6.70855429905759e-08, "Finetune/Loss": 0.770046055316925, "Finetune/Loss (Raw)": 0.784038245677948, "Finetune/Step": 4796, "Finetune/Step Time": 2.898079141974449} +{"Finetune/Learning Rate": 6.633472229868543e-08, "Finetune/Loss": 0.7702968120574951, "Finetune/Loss (Raw)": 0.8132647275924683, "Finetune/Step": 4797, "Finetune/Step Time": 2.89892858825624} +{"Finetune/Learning Rate": 6.558811289163359e-08, "Finetune/Loss": 0.7706311941146851, "Finetune/Loss (Raw)": 0.7781316041946411, "Finetune/Step": 4798, "Finetune/Step Time": 2.8966970052570105} +{"Finetune/Learning Rate": 6.484571508593718e-08, "Finetune/Loss": 0.7746672630310059, "Finetune/Loss (Raw)": 0.910143256187439, "Finetune/Step": 4799, "Finetune/Step Time": 2.8637889344245195} +{"Finetune/Learning Rate": 6.41075291963289e-08, "Finetune/Loss": 0.7739130258560181, "Finetune/Loss (Raw)": 0.605141818523407, "Finetune/Step": 4800, "Finetune/Step Time": 2.8556070532649755} +{"Finetune/Learning Rate": 6.33735555357562e-08, "Finetune/Loss": 0.7737904787063599, "Finetune/Loss (Raw)": 0.8077829480171204, "Finetune/Step": 4801, "Finetune/Step Time": 2.854965951293707} +{"Finetune/Learning Rate": 6.264379441538126e-08, "Finetune/Loss": 0.7742292881011963, "Finetune/Loss (Raw)": 0.8286086916923523, "Finetune/Step": 4802, "Finetune/Step Time": 2.855741538107395} +{"Finetune/Learning Rate": 6.191824614457887e-08, "Finetune/Loss": 0.7744662165641785, "Finetune/Loss (Raw)": 0.8077226281166077, "Finetune/Step": 4803, "Finetune/Step Time": 2.8525977469980717} +{"Finetune/Learning Rate": 6.119691103093739e-08, "Finetune/Loss": 0.7739447355270386, "Finetune/Loss (Raw)": 0.8116529583930969, "Finetune/Step": 4804, "Finetune/Step Time": 2.8550798520445824} +{"Finetune/Learning Rate": 6.047978938026222e-08, "Finetune/Loss": 0.7751557230949402, "Finetune/Loss (Raw)": 0.6947960257530212, "Finetune/Step": 4805, "Finetune/Step Time": 2.8322281390428543} +{"Finetune/Learning Rate": 5.976688149656907e-08, "Finetune/Loss": 0.7740931510925293, "Finetune/Loss (Raw)": 0.6431944966316223, "Finetune/Step": 4806, "Finetune/Step Time": 2.8332500513643026} +{"Finetune/Learning Rate": 5.905818768208838e-08, "Finetune/Loss": 0.7735668420791626, "Finetune/Loss (Raw)": 0.716271698474884, "Finetune/Step": 4807, "Finetune/Step Time": 2.8362726494669914} +{"Finetune/Learning Rate": 5.835370823726316e-08, "Finetune/Loss": 0.7745994329452515, "Finetune/Loss (Raw)": 0.729590892791748, "Finetune/Step": 4808, "Finetune/Step Time": 2.8095227126032114} +{"Finetune/Learning Rate": 5.765344346075452e-08, "Finetune/Loss": 0.7745675444602966, "Finetune/Loss (Raw)": 0.7145634293556213, "Finetune/Step": 4809, "Finetune/Step Time": 2.8081803303211927} +{"Finetune/Learning Rate": 5.695739364943054e-08, "Finetune/Loss": 0.7752679586410522, "Finetune/Loss (Raw)": 0.8664449453353882, "Finetune/Step": 4810, "Finetune/Step Time": 2.806786624714732} +{"Finetune/Learning Rate": 5.6265559098375165e-08, "Finetune/Loss": 0.7746277451515198, "Finetune/Loss (Raw)": 0.7832098007202148, "Finetune/Step": 4811, "Finetune/Step Time": 2.806869490072131} +{"Finetune/Learning Rate": 5.557794010088713e-08, "Finetune/Loss": 0.7746380567550659, "Finetune/Loss (Raw)": 0.7927063703536987, "Finetune/Step": 4812, "Finetune/Step Time": 2.805809900164604} +{"Finetune/Learning Rate": 5.489453694847324e-08, "Finetune/Loss": 0.7746270298957825, "Finetune/Loss (Raw)": 0.804977297782898, "Finetune/Step": 4813, "Finetune/Step Time": 2.8011232893913984} +{"Finetune/Learning Rate": 5.421534993085731e-08, "Finetune/Loss": 0.7746559977531433, "Finetune/Loss (Raw)": 0.8647772669792175, "Finetune/Step": 4814, "Finetune/Step Time": 2.8013789616525173} +{"Finetune/Learning Rate": 5.354037933597456e-08, "Finetune/Loss": 0.7752185463905334, "Finetune/Loss (Raw)": 0.8197271823883057, "Finetune/Step": 4815, "Finetune/Step Time": 2.7994214221835136} +{"Finetune/Learning Rate": 5.2869625449971654e-08, "Finetune/Loss": 0.7730212807655334, "Finetune/Loss (Raw)": 0.5115765333175659, "Finetune/Step": 4816, "Finetune/Step Time": 2.8309346344321966} +{"Finetune/Learning Rate": 5.220308855721001e-08, "Finetune/Loss": 0.7736583948135376, "Finetune/Loss (Raw)": 0.8786417841911316, "Finetune/Step": 4817, "Finetune/Step Time": 2.831344271078706} +{"Finetune/Learning Rate": 5.1540768940260276e-08, "Finetune/Loss": 0.7726925611495972, "Finetune/Loss (Raw)": 0.7530195116996765, "Finetune/Step": 4818, "Finetune/Step Time": 2.8348384499549866} +{"Finetune/Learning Rate": 5.088266687990784e-08, "Finetune/Loss": 0.7731325626373291, "Finetune/Loss (Raw)": 0.8022511601448059, "Finetune/Step": 4819, "Finetune/Step Time": 2.835918551310897} +{"Finetune/Learning Rate": 5.0228782655147304e-08, "Finetune/Loss": 0.7741531729698181, "Finetune/Loss (Raw)": 0.9623022675514221, "Finetune/Step": 4820, "Finetune/Step Time": 2.835636643692851} +{"Finetune/Learning Rate": 4.9579116543188035e-08, "Finetune/Loss": 0.7738012671470642, "Finetune/Loss (Raw)": 0.7887084484100342, "Finetune/Step": 4821, "Finetune/Step Time": 2.838683657348156} +{"Finetune/Learning Rate": 4.893366881944972e-08, "Finetune/Loss": 0.772982120513916, "Finetune/Loss (Raw)": 0.6847827434539795, "Finetune/Step": 4822, "Finetune/Step Time": 2.8156705256551504} +{"Finetune/Learning Rate": 4.829243975756348e-08, "Finetune/Loss": 0.7732860445976257, "Finetune/Loss (Raw)": 0.8104749321937561, "Finetune/Step": 4823, "Finetune/Step Time": 2.8074776269495487} +{"Finetune/Learning Rate": 4.7655429629372975e-08, "Finetune/Loss": 0.7723000049591064, "Finetune/Loss (Raw)": 0.7663887739181519, "Finetune/Step": 4824, "Finetune/Step Time": 2.808769615367055} +{"Finetune/Learning Rate": 4.702263870493218e-08, "Finetune/Loss": 0.7686014175415039, "Finetune/Loss (Raw)": 0.2332809716463089, "Finetune/Step": 4825, "Finetune/Step Time": 2.841809829697013} +{"Finetune/Learning Rate": 4.639406725250761e-08, "Finetune/Loss": 0.7677096724510193, "Finetune/Loss (Raw)": 0.7138689756393433, "Finetune/Step": 4826, "Finetune/Step Time": 2.841191601008177} +{"Finetune/Learning Rate": 4.576971553857612e-08, "Finetune/Loss": 0.7686600685119629, "Finetune/Loss (Raw)": 0.8598467111587524, "Finetune/Step": 4827, "Finetune/Step Time": 2.84359965659678} +{"Finetune/Learning Rate": 4.514958382782486e-08, "Finetune/Loss": 0.7689521312713623, "Finetune/Loss (Raw)": 0.7741169929504395, "Finetune/Step": 4828, "Finetune/Step Time": 2.8439392540603876} +{"Finetune/Learning Rate": 4.453367238315465e-08, "Finetune/Loss": 0.7687785625457764, "Finetune/Loss (Raw)": 0.8032263517379761, "Finetune/Step": 4829, "Finetune/Step Time": 2.8403230365365744} +{"Finetune/Learning Rate": 4.392198146567439e-08, "Finetune/Loss": 0.7686373591423035, "Finetune/Loss (Raw)": 0.8154515624046326, "Finetune/Step": 4830, "Finetune/Step Time": 2.839664900675416} +{"Finetune/Learning Rate": 4.331451133470332e-08, "Finetune/Loss": 0.7686941623687744, "Finetune/Loss (Raw)": 0.810608446598053, "Finetune/Step": 4831, "Finetune/Step Time": 2.8401981443166733} +{"Finetune/Learning Rate": 4.271126224777433e-08, "Finetune/Loss": 0.770209014415741, "Finetune/Loss (Raw)": 0.9478997588157654, "Finetune/Step": 4832, "Finetune/Step Time": 2.842843083664775} +{"Finetune/Learning Rate": 4.211223446063062e-08, "Finetune/Loss": 0.7708141803741455, "Finetune/Loss (Raw)": 0.7822942733764648, "Finetune/Step": 4833, "Finetune/Step Time": 2.8442313466221094} +{"Finetune/Learning Rate": 4.151742822722127e-08, "Finetune/Loss": 0.770612359046936, "Finetune/Loss (Raw)": 0.7957230806350708, "Finetune/Step": 4834, "Finetune/Step Time": 2.839079024270177} +{"Finetune/Learning Rate": 4.0926843799711234e-08, "Finetune/Loss": 0.7709275484085083, "Finetune/Loss (Raw)": 0.7977805137634277, "Finetune/Step": 4835, "Finetune/Step Time": 2.83258942887187} +{"Finetune/Learning Rate": 4.034048142847136e-08, "Finetune/Loss": 0.7713649272918701, "Finetune/Loss (Raw)": 0.7771781086921692, "Finetune/Step": 4836, "Finetune/Step Time": 2.8319376781582832} +{"Finetune/Learning Rate": 3.9758341362087226e-08, "Finetune/Loss": 0.7719366550445557, "Finetune/Loss (Raw)": 0.8358618021011353, "Finetune/Step": 4837, "Finetune/Step Time": 2.835682235658169} +{"Finetune/Learning Rate": 3.918042384734921e-08, "Finetune/Loss": 0.7723817825317383, "Finetune/Loss (Raw)": 0.8831848502159119, "Finetune/Step": 4838, "Finetune/Step Time": 2.8351785484701395} +{"Finetune/Learning Rate": 3.8606729129261336e-08, "Finetune/Loss": 0.771987795829773, "Finetune/Loss (Raw)": 0.7748207449913025, "Finetune/Step": 4839, "Finetune/Step Time": 2.8355388902127743} +{"Finetune/Learning Rate": 3.8037257451035705e-08, "Finetune/Loss": 0.7716143131256104, "Finetune/Loss (Raw)": 0.8037328720092773, "Finetune/Step": 4840, "Finetune/Step Time": 2.848724592477083} +{"Finetune/Learning Rate": 3.747200905409476e-08, "Finetune/Loss": 0.7706650495529175, "Finetune/Loss (Raw)": 0.7217825651168823, "Finetune/Step": 4841, "Finetune/Step Time": 2.8525987826287746} +{"Finetune/Learning Rate": 3.6910984178069044e-08, "Finetune/Loss": 0.7712368369102478, "Finetune/Loss (Raw)": 0.8269860744476318, "Finetune/Step": 4842, "Finetune/Step Time": 2.850144900381565} +{"Finetune/Learning Rate": 3.635418306080163e-08, "Finetune/Loss": 0.7696124315261841, "Finetune/Loss (Raw)": 0.5979450941085815, "Finetune/Step": 4843, "Finetune/Step Time": 2.878817219287157} +{"Finetune/Learning Rate": 3.5801605938342585e-08, "Finetune/Loss": 0.7694615125656128, "Finetune/Loss (Raw)": 0.761803388595581, "Finetune/Step": 4844, "Finetune/Step Time": 2.879563733935356} +{"Finetune/Learning Rate": 3.5253253044951194e-08, "Finetune/Loss": 0.7683333158493042, "Finetune/Loss (Raw)": 0.152572900056839, "Finetune/Step": 4845, "Finetune/Step Time": 2.8774075005203485} +{"Finetune/Learning Rate": 3.4709124613097055e-08, "Finetune/Loss": 0.7687535285949707, "Finetune/Loss (Raw)": 0.8109790086746216, "Finetune/Step": 4846, "Finetune/Step Time": 2.881539950147271} +{"Finetune/Learning Rate": 3.4169220873458976e-08, "Finetune/Loss": 0.7694109678268433, "Finetune/Loss (Raw)": 0.8479886651039124, "Finetune/Step": 4847, "Finetune/Step Time": 2.877753907814622} +{"Finetune/Learning Rate": 3.363354205492386e-08, "Finetune/Loss": 0.7709869742393494, "Finetune/Loss (Raw)": 0.9405716061592102, "Finetune/Step": 4848, "Finetune/Step Time": 2.8784405644983053} +{"Finetune/Learning Rate": 3.310208838458562e-08, "Finetune/Loss": 0.7711173295974731, "Finetune/Loss (Raw)": 0.8088738322257996, "Finetune/Step": 4849, "Finetune/Step Time": 2.877323020249605} +{"Finetune/Learning Rate": 3.2574860087751793e-08, "Finetune/Loss": 0.7706863284111023, "Finetune/Loss (Raw)": 0.7420572638511658, "Finetune/Step": 4850, "Finetune/Step Time": 2.8756204042583704} +{"Finetune/Learning Rate": 3.20518573879347e-08, "Finetune/Loss": 0.7703381776809692, "Finetune/Loss (Raw)": 0.7452464699745178, "Finetune/Step": 4851, "Finetune/Step Time": 2.8755790665745735} +{"Finetune/Learning Rate": 3.153308050685699e-08, "Finetune/Loss": 0.7696263194084167, "Finetune/Loss (Raw)": 0.6857372522354126, "Finetune/Step": 4852, "Finetune/Step Time": 2.8767110630869865} +{"Finetune/Learning Rate": 3.1018529664449404e-08, "Finetune/Loss": 0.7704992294311523, "Finetune/Loss (Raw)": 0.8246850967407227, "Finetune/Step": 4853, "Finetune/Step Time": 2.873377664014697} +{"Finetune/Learning Rate": 3.050820507884966e-08, "Finetune/Loss": 0.7695842981338501, "Finetune/Loss (Raw)": 0.708274245262146, "Finetune/Step": 4854, "Finetune/Step Time": 2.876493973657489} +{"Finetune/Learning Rate": 3.000210696640693e-08, "Finetune/Loss": 0.7693467140197754, "Finetune/Loss (Raw)": 0.7360201478004456, "Finetune/Step": 4855, "Finetune/Step Time": 2.8764251861721277} +{"Finetune/Learning Rate": 2.9500235541675136e-08, "Finetune/Loss": 0.7699934840202332, "Finetune/Loss (Raw)": 0.8247384428977966, "Finetune/Step": 4856, "Finetune/Step Time": 2.866233415901661} +{"Finetune/Learning Rate": 2.9002591017418535e-08, "Finetune/Loss": 0.7718974351882935, "Finetune/Loss (Raw)": 0.8103336095809937, "Finetune/Step": 4857, "Finetune/Step Time": 2.8454911150038242} +{"Finetune/Learning Rate": 2.8509173604609474e-08, "Finetune/Loss": 0.7723718881607056, "Finetune/Loss (Raw)": 0.867992103099823, "Finetune/Step": 4858, "Finetune/Step Time": 2.8447805624455214} +{"Finetune/Learning Rate": 2.8019983512427295e-08, "Finetune/Loss": 0.7726672887802124, "Finetune/Loss (Raw)": 0.8378534913063049, "Finetune/Step": 4859, "Finetune/Step Time": 2.843580547720194} +{"Finetune/Learning Rate": 2.7535020948259437e-08, "Finetune/Loss": 0.7723726034164429, "Finetune/Loss (Raw)": 0.7608869671821594, "Finetune/Step": 4860, "Finetune/Step Time": 2.844408979639411} +{"Finetune/Learning Rate": 2.7054286117701446e-08, "Finetune/Loss": 0.7716168165206909, "Finetune/Loss (Raw)": 0.7833101153373718, "Finetune/Step": 4861, "Finetune/Step Time": 2.84315481595695} +{"Finetune/Learning Rate": 2.6577779224556955e-08, "Finetune/Loss": 0.7708529233932495, "Finetune/Loss (Raw)": 0.7334357500076294, "Finetune/Step": 4862, "Finetune/Step Time": 2.843602865934372} +{"Finetune/Learning Rate": 2.6105500470835488e-08, "Finetune/Loss": 0.7729541063308716, "Finetune/Loss (Raw)": 0.8712091445922852, "Finetune/Step": 4863, "Finetune/Step Time": 2.8202975913882256} +{"Finetune/Learning Rate": 2.5637450056754666e-08, "Finetune/Loss": 0.77226722240448, "Finetune/Loss (Raw)": 0.7105000615119934, "Finetune/Step": 4864, "Finetune/Step Time": 2.817733809351921} +{"Finetune/Learning Rate": 2.5173628180742426e-08, "Finetune/Loss": 0.7759472131729126, "Finetune/Loss (Raw)": 0.8303117752075195, "Finetune/Step": 4865, "Finetune/Step Time": 2.7860426772385836} +{"Finetune/Learning Rate": 2.4714035039430373e-08, "Finetune/Loss": 0.7747201919555664, "Finetune/Loss (Raw)": 0.801568329334259, "Finetune/Step": 4866, "Finetune/Step Time": 2.781965274363756} +{"Finetune/Learning Rate": 2.4258670827658203e-08, "Finetune/Loss": 0.7752982378005981, "Finetune/Loss (Raw)": 0.7709026336669922, "Finetune/Step": 4867, "Finetune/Step Time": 2.783187808468938} +{"Finetune/Learning Rate": 2.380753573847483e-08, "Finetune/Loss": 0.7760357856750488, "Finetune/Loss (Raw)": 0.828174352645874, "Finetune/Step": 4868, "Finetune/Step Time": 2.780899178236723} +{"Finetune/Learning Rate": 2.336062996313282e-08, "Finetune/Loss": 0.7741674184799194, "Finetune/Loss (Raw)": 0.5470297336578369, "Finetune/Step": 4869, "Finetune/Step Time": 2.801810571923852} +{"Finetune/Learning Rate": 2.2917953691095064e-08, "Finetune/Loss": 0.7745922803878784, "Finetune/Loss (Raw)": 0.8515458703041077, "Finetune/Step": 4870, "Finetune/Step Time": 2.803553795441985} +{"Finetune/Learning Rate": 2.247950711003033e-08, "Finetune/Loss": 0.7747195959091187, "Finetune/Loss (Raw)": 0.787631630897522, "Finetune/Step": 4871, "Finetune/Step Time": 2.8302927184849977} +{"Finetune/Learning Rate": 2.204529040581327e-08, "Finetune/Loss": 0.7754449844360352, "Finetune/Loss (Raw)": 0.8564372658729553, "Finetune/Step": 4872, "Finetune/Step Time": 2.828317893669009} +{"Finetune/Learning Rate": 2.1615303762525518e-08, "Finetune/Loss": 0.7746226191520691, "Finetune/Loss (Raw)": 0.7071647047996521, "Finetune/Step": 4873, "Finetune/Step Time": 2.825175715610385} +{"Finetune/Learning Rate": 2.118954736245682e-08, "Finetune/Loss": 0.7749831080436707, "Finetune/Loss (Raw)": 0.8144434690475464, "Finetune/Step": 4874, "Finetune/Step Time": 2.826574021950364} +{"Finetune/Learning Rate": 2.0768021386102788e-08, "Finetune/Loss": 0.7742868065834045, "Finetune/Loss (Raw)": 0.7520719766616821, "Finetune/Step": 4875, "Finetune/Step Time": 2.831361459568143} +{"Finetune/Learning Rate": 2.0350726012164922e-08, "Finetune/Loss": 0.7747759819030762, "Finetune/Loss (Raw)": 0.844961404800415, "Finetune/Step": 4876, "Finetune/Step Time": 2.8345602601766586} +{"Finetune/Learning Rate": 1.9937661417550603e-08, "Finetune/Loss": 0.7754817008972168, "Finetune/Loss (Raw)": 0.8122314810752869, "Finetune/Step": 4877, "Finetune/Step Time": 2.831340480595827} +{"Finetune/Learning Rate": 1.9528827777377524e-08, "Finetune/Loss": 0.7762901186943054, "Finetune/Loss (Raw)": 0.8277899622917175, "Finetune/Step": 4878, "Finetune/Step Time": 2.829046895727515} +{"Finetune/Learning Rate": 1.9124225264963713e-08, "Finetune/Loss": 0.7759048938751221, "Finetune/Loss (Raw)": 0.7419331669807434, "Finetune/Step": 4879, "Finetune/Step Time": 2.8321230057626963} +{"Finetune/Learning Rate": 1.872385405183863e-08, "Finetune/Loss": 0.7758296132087708, "Finetune/Loss (Raw)": 0.7283399701118469, "Finetune/Step": 4880, "Finetune/Step Time": 2.8297619353979826} +{"Finetune/Learning Rate": 1.8327714307736498e-08, "Finetune/Loss": 0.7755953073501587, "Finetune/Loss (Raw)": 0.763231098651886, "Finetune/Step": 4881, "Finetune/Step Time": 2.8282861821353436} +{"Finetune/Learning Rate": 1.7935806200595206e-08, "Finetune/Loss": 0.7756654024124146, "Finetune/Loss (Raw)": 0.8417239189147949, "Finetune/Step": 4882, "Finetune/Step Time": 2.8290049955248833} +{"Finetune/Learning Rate": 1.754812989656185e-08, "Finetune/Loss": 0.7753282785415649, "Finetune/Loss (Raw)": 0.7409974336624146, "Finetune/Step": 4883, "Finetune/Step Time": 2.828317780047655} +{"Finetune/Learning Rate": 1.7164685559986072e-08, "Finetune/Loss": 0.7759371995925903, "Finetune/Loss (Raw)": 0.8051822781562805, "Finetune/Step": 4884, "Finetune/Step Time": 2.828446062281728} +{"Finetune/Learning Rate": 1.678547335342895e-08, "Finetune/Loss": 0.7748885750770569, "Finetune/Loss (Raw)": 0.8041313290596008, "Finetune/Step": 4885, "Finetune/Step Time": 2.8292465042322874} +{"Finetune/Learning Rate": 1.6410493437651886e-08, "Finetune/Loss": 0.7745901346206665, "Finetune/Loss (Raw)": 0.7613698840141296, "Finetune/Step": 4886, "Finetune/Step Time": 2.8299318328499794} +{"Finetune/Learning Rate": 1.6039745971624388e-08, "Finetune/Loss": 0.7741146683692932, "Finetune/Loss (Raw)": 0.7433595657348633, "Finetune/Step": 4887, "Finetune/Step Time": 2.8338515367358923} +{"Finetune/Learning Rate": 1.5673231112520725e-08, "Finetune/Loss": 0.773409366607666, "Finetune/Loss (Raw)": 0.7476247549057007, "Finetune/Step": 4888, "Finetune/Step Time": 2.834262454882264} +{"Finetune/Learning Rate": 1.5310949015722167e-08, "Finetune/Loss": 0.7721812725067139, "Finetune/Loss (Raw)": 0.5691572427749634, "Finetune/Step": 4889, "Finetune/Step Time": 2.855645090341568} +{"Finetune/Learning Rate": 1.495289983481585e-08, "Finetune/Loss": 0.7729957103729248, "Finetune/Loss (Raw)": 0.7529963254928589, "Finetune/Step": 4890, "Finetune/Step Time": 2.8346789572387934} +{"Finetune/Learning Rate": 1.4599083721591468e-08, "Finetune/Loss": 0.7727906107902527, "Finetune/Loss (Raw)": 0.7452236413955688, "Finetune/Step": 4891, "Finetune/Step Time": 2.8316978942602873} +{"Finetune/Learning Rate": 1.4249500826046814e-08, "Finetune/Loss": 0.7742199897766113, "Finetune/Loss (Raw)": 0.8742493987083435, "Finetune/Step": 4892, "Finetune/Step Time": 2.8064886331558228} +{"Finetune/Learning Rate": 1.390415129638556e-08, "Finetune/Loss": 0.7719213962554932, "Finetune/Loss (Raw)": 0.46813663840293884, "Finetune/Step": 4893, "Finetune/Step Time": 2.8284253999590874} +{"Finetune/Learning Rate": 1.3563035279012815e-08, "Finetune/Loss": 0.7721951007843018, "Finetune/Loss (Raw)": 0.8326468467712402, "Finetune/Step": 4894, "Finetune/Step Time": 2.8252579774707556} +{"Finetune/Learning Rate": 1.322615291854401e-08, "Finetune/Loss": 0.771936297416687, "Finetune/Loss (Raw)": 0.8056610226631165, "Finetune/Step": 4895, "Finetune/Step Time": 2.823090311139822} +{"Finetune/Learning Rate": 1.2893504357796016e-08, "Finetune/Loss": 0.7704408168792725, "Finetune/Loss (Raw)": 0.6640427112579346, "Finetune/Step": 4896, "Finetune/Step Time": 2.855939643457532} +{"Finetune/Learning Rate": 1.256508973779269e-08, "Finetune/Loss": 0.7699704766273499, "Finetune/Loss (Raw)": 0.8090491890907288, "Finetune/Step": 4897, "Finetune/Step Time": 2.854548256844282} +{"Finetune/Learning Rate": 1.2240909197761553e-08, "Finetune/Loss": 0.7692562937736511, "Finetune/Loss (Raw)": 0.7380437850952148, "Finetune/Step": 4898, "Finetune/Step Time": 2.8545813392847776} +{"Finetune/Learning Rate": 1.1920962875137109e-08, "Finetune/Loss": 0.7686433792114258, "Finetune/Loss (Raw)": 0.7511971592903137, "Finetune/Step": 4899, "Finetune/Step Time": 2.854896554723382} +{"Finetune/Learning Rate": 1.160525090555642e-08, "Finetune/Loss": 0.7674203515052795, "Finetune/Loss (Raw)": 0.6872095465660095, "Finetune/Step": 4900, "Finetune/Step Time": 2.8595171999186277} +{"Finetune/Learning Rate": 1.1293773422862419e-08, "Finetune/Loss": 0.7673988342285156, "Finetune/Loss (Raw)": 0.742627739906311, "Finetune/Step": 4901, "Finetune/Step Time": 2.8595144730061293} +{"Finetune/Learning Rate": 1.0986530559105035e-08, "Finetune/Loss": 0.7625100612640381, "Finetune/Loss (Raw)": 0.238228440284729, "Finetune/Step": 4902, "Finetune/Step Time": 2.8867088332772255} +{"Finetune/Learning Rate": 1.0683522444534522e-08, "Finetune/Loss": 0.7626650333404541, "Finetune/Loss (Raw)": 0.8344446420669556, "Finetune/Step": 4903, "Finetune/Step Time": 2.8912428114563227} +{"Finetune/Learning Rate": 1.0384749207610346e-08, "Finetune/Loss": 0.7616232633590698, "Finetune/Loss (Raw)": 0.82225501537323, "Finetune/Step": 4904, "Finetune/Step Time": 2.890482846647501} +{"Finetune/Learning Rate": 1.009021097499452e-08, "Finetune/Loss": 0.7614477872848511, "Finetune/Loss (Raw)": 0.7539703249931335, "Finetune/Step": 4905, "Finetune/Step Time": 2.8887837007641792} +{"Finetune/Learning Rate": 9.799907871551607e-09, "Finetune/Loss": 0.7618948221206665, "Finetune/Loss (Raw)": 0.7732482552528381, "Finetune/Step": 4906, "Finetune/Step Time": 2.8866432160139084} +{"Finetune/Learning Rate": 9.51384002035538e-09, "Finetune/Loss": 0.7616955041885376, "Finetune/Loss (Raw)": 0.7506728172302246, "Finetune/Step": 4907, "Finetune/Step Time": 2.8823521155864} +{"Finetune/Learning Rate": 9.232007542681054e-09, "Finetune/Loss": 0.761807918548584, "Finetune/Loss (Raw)": 0.7717742919921875, "Finetune/Step": 4908, "Finetune/Step Time": 2.8827564157545567} +{"Finetune/Learning Rate": 8.954410558007498e-09, "Finetune/Loss": 0.761264443397522, "Finetune/Loss (Raw)": 0.7017115354537964, "Finetune/Step": 4909, "Finetune/Step Time": 2.904308410361409} +{"Finetune/Learning Rate": 8.681049184021684e-09, "Finetune/Loss": 0.7624335289001465, "Finetune/Loss (Raw)": 0.7942776679992676, "Finetune/Step": 4910, "Finetune/Step Time": 2.8801485039293766} +{"Finetune/Learning Rate": 8.411923536609801e-09, "Finetune/Loss": 0.7618314623832703, "Finetune/Loss (Raw)": 0.7269896268844604, "Finetune/Step": 4911, "Finetune/Step Time": 2.880791913717985} +{"Finetune/Learning Rate": 8.147033729867248e-09, "Finetune/Loss": 0.7625465393066406, "Finetune/Loss (Raw)": 0.7362505793571472, "Finetune/Step": 4912, "Finetune/Step Time": 2.8494306057691574} +{"Finetune/Learning Rate": 7.886379876091976e-09, "Finetune/Loss": 0.7629891633987427, "Finetune/Loss (Raw)": 0.7945025563240051, "Finetune/Step": 4913, "Finetune/Step Time": 2.8445713203400373} +{"Finetune/Learning Rate": 7.629962085784482e-09, "Finetune/Loss": 0.7624541521072388, "Finetune/Loss (Raw)": 0.75639808177948, "Finetune/Step": 4914, "Finetune/Step Time": 2.8479615058749914} +{"Finetune/Learning Rate": 7.377780467650031e-09, "Finetune/Loss": 0.7623888850212097, "Finetune/Loss (Raw)": 0.7262135148048401, "Finetune/Step": 4915, "Finetune/Step Time": 2.8245760407298803} +{"Finetune/Learning Rate": 7.129835128600882e-09, "Finetune/Loss": 0.7615543603897095, "Finetune/Loss (Raw)": 0.6969618201255798, "Finetune/Step": 4916, "Finetune/Step Time": 2.8204904925078154} +{"Finetune/Learning Rate": 6.8861261737485085e-09, "Finetune/Loss": 0.7621363401412964, "Finetune/Loss (Raw)": 0.8439018130302429, "Finetune/Step": 4917, "Finetune/Step Time": 2.822530459612608} +{"Finetune/Learning Rate": 6.646653706413597e-09, "Finetune/Loss": 0.7630484104156494, "Finetune/Loss (Raw)": 0.8722637891769409, "Finetune/Step": 4918, "Finetune/Step Time": 2.822549395263195} +{"Finetune/Learning Rate": 6.411417828117161e-09, "Finetune/Loss": 0.7642086744308472, "Finetune/Loss (Raw)": 0.8560536503791809, "Finetune/Step": 4919, "Finetune/Step Time": 2.8189739901572466} +{"Finetune/Learning Rate": 6.180418638584984e-09, "Finetune/Loss": 0.7636950016021729, "Finetune/Loss (Raw)": 0.7355479001998901, "Finetune/Step": 4920, "Finetune/Step Time": 2.8227099403738976} +{"Finetune/Learning Rate": 5.953656235747618e-09, "Finetune/Loss": 0.7643749117851257, "Finetune/Loss (Raw)": 0.8469632267951965, "Finetune/Step": 4921, "Finetune/Step Time": 2.82157139852643} +{"Finetune/Learning Rate": 5.731130715738165e-09, "Finetune/Loss": 0.7638643383979797, "Finetune/Loss (Raw)": 0.8216022253036499, "Finetune/Step": 4922, "Finetune/Step Time": 2.8231224324554205} +{"Finetune/Learning Rate": 5.5128421728944945e-09, "Finetune/Loss": 0.7630409002304077, "Finetune/Loss (Raw)": 0.6090476512908936, "Finetune/Step": 4923, "Finetune/Step Time": 2.8452393282204866} +{"Finetune/Learning Rate": 5.2987906997581385e-09, "Finetune/Loss": 0.7631517648696899, "Finetune/Loss (Raw)": 0.79823899269104, "Finetune/Step": 4924, "Finetune/Step Time": 2.844673288986087} +{"Finetune/Learning Rate": 5.088976387074285e-09, "Finetune/Loss": 0.7636906504631042, "Finetune/Loss (Raw)": 0.8822407722473145, "Finetune/Step": 4925, "Finetune/Step Time": 2.8450089003890753} +{"Finetune/Learning Rate": 4.883399323791782e-09, "Finetune/Loss": 0.7636646628379822, "Finetune/Loss (Raw)": 0.7748026847839355, "Finetune/Step": 4926, "Finetune/Step Time": 2.844467656686902} +{"Finetune/Learning Rate": 4.6820595970631376e-09, "Finetune/Loss": 0.7624285817146301, "Finetune/Loss (Raw)": 0.7519261837005615, "Finetune/Step": 4927, "Finetune/Step Time": 2.846775021404028} +{"Finetune/Learning Rate": 4.484957292244518e-09, "Finetune/Loss": 0.7639517784118652, "Finetune/Loss (Raw)": 0.8001052141189575, "Finetune/Step": 4928, "Finetune/Step Time": 2.8243428096175194} +{"Finetune/Learning Rate": 4.2920924928946395e-09, "Finetune/Loss": 0.759681224822998, "Finetune/Loss (Raw)": 0.26114949584007263, "Finetune/Step": 4929, "Finetune/Step Time": 2.8707872983068228} +{"Finetune/Learning Rate": 4.103465280778096e-09, "Finetune/Loss": 0.759319543838501, "Finetune/Loss (Raw)": 0.782313346862793, "Finetune/Step": 4930, "Finetune/Step Time": 2.8720607832074165} +{"Finetune/Learning Rate": 3.919075735860922e-09, "Finetune/Loss": 0.7599101066589355, "Finetune/Loss (Raw)": 0.8833208084106445, "Finetune/Step": 4931, "Finetune/Step Time": 2.878638170659542} +{"Finetune/Learning Rate": 3.7389239363139206e-09, "Finetune/Loss": 0.759514331817627, "Finetune/Loss (Raw)": 0.7609905004501343, "Finetune/Step": 4932, "Finetune/Step Time": 2.875658353790641} +{"Finetune/Learning Rate": 3.5630099585104437e-09, "Finetune/Loss": 0.761597752571106, "Finetune/Loss (Raw)": 0.9614782929420471, "Finetune/Step": 4933, "Finetune/Step Time": 2.870561109855771} +{"Finetune/Learning Rate": 3.3913338770263924e-09, "Finetune/Loss": 0.7622199058532715, "Finetune/Loss (Raw)": 0.7228304147720337, "Finetune/Step": 4934, "Finetune/Step Time": 2.864823153242469} +{"Finetune/Learning Rate": 3.2238957646446577e-09, "Finetune/Loss": 0.7615368366241455, "Finetune/Loss (Raw)": 0.62883460521698, "Finetune/Step": 4935, "Finetune/Step Time": 2.8876439090818167} +{"Finetune/Learning Rate": 3.0606956923462383e-09, "Finetune/Loss": 0.7621650695800781, "Finetune/Loss (Raw)": 0.8100056648254395, "Finetune/Step": 4936, "Finetune/Step Time": 2.8918878994882107} +{"Finetune/Learning Rate": 2.9017337293213433e-09, "Finetune/Loss": 0.7618030309677124, "Finetune/Loss (Raw)": 0.6682207584381104, "Finetune/Step": 4937, "Finetune/Step Time": 2.8893239479511976} +{"Finetune/Learning Rate": 2.7470099429571795e-09, "Finetune/Loss": 0.7604477405548096, "Finetune/Loss (Raw)": 0.6929742097854614, "Finetune/Step": 4938, "Finetune/Step Time": 2.8904479946941137} +{"Finetune/Learning Rate": 2.596524398850164e-09, "Finetune/Loss": 0.760466992855072, "Finetune/Loss (Raw)": 0.7856698632240295, "Finetune/Step": 4939, "Finetune/Step Time": 2.8903278298676014} +{"Finetune/Learning Rate": 2.450277160795933e-09, "Finetune/Loss": 0.7605777978897095, "Finetune/Loss (Raw)": 0.8068955540657043, "Finetune/Step": 4940, "Finetune/Step Time": 2.891213709488511} +{"Finetune/Learning Rate": 2.3082682907948908e-09, "Finetune/Loss": 0.7602828741073608, "Finetune/Loss (Raw)": 0.7672279477119446, "Finetune/Step": 4941, "Finetune/Step Time": 2.8925880175083876} +{"Finetune/Learning Rate": 2.170497849051101e-09, "Finetune/Loss": 0.7600356936454773, "Finetune/Loss (Raw)": 0.8331364393234253, "Finetune/Step": 4942, "Finetune/Step Time": 2.8941636849194765} +{"Finetune/Learning Rate": 2.0369658939700665e-09, "Finetune/Loss": 0.7595868706703186, "Finetune/Loss (Raw)": 0.7622737884521484, "Finetune/Step": 4943, "Finetune/Step Time": 2.889769660308957} +{"Finetune/Learning Rate": 1.9076724821609496e-09, "Finetune/Loss": 0.7611802816390991, "Finetune/Loss (Raw)": 0.7155311703681946, "Finetune/Step": 4944, "Finetune/Step Time": 2.862261738628149} +{"Finetune/Learning Rate": 1.7826176684376806e-09, "Finetune/Loss": 0.7602677345275879, "Finetune/Loss (Raw)": 0.7618369460105896, "Finetune/Step": 4945, "Finetune/Step Time": 2.862619323655963} +{"Finetune/Learning Rate": 1.66180150581563e-09, "Finetune/Loss": 0.7614759206771851, "Finetune/Loss (Raw)": 0.9076628088951111, "Finetune/Step": 4946, "Finetune/Step Time": 2.859964517876506} +{"Finetune/Learning Rate": 1.5452240455138267e-09, "Finetune/Loss": 0.760507345199585, "Finetune/Loss (Raw)": 0.6782757639884949, "Finetune/Step": 4947, "Finetune/Step Time": 2.879828343167901} +{"Finetune/Learning Rate": 1.4328853369538486e-09, "Finetune/Loss": 0.7581158876419067, "Finetune/Loss (Raw)": 0.6561971306800842, "Finetune/Step": 4948, "Finetune/Step Time": 2.879552874714136} +{"Finetune/Learning Rate": 1.324785427760933e-09, "Finetune/Loss": 0.7561646103858948, "Finetune/Loss (Raw)": 0.5389512777328491, "Finetune/Step": 4949, "Finetune/Step Time": 2.8991908840835094} +{"Finetune/Learning Rate": 1.2209243637628654e-09, "Finetune/Loss": 0.7570309638977051, "Finetune/Loss (Raw)": 0.7956738471984863, "Finetune/Step": 4950, "Finetune/Step Time": 2.902917478233576} +{"Finetune/Learning Rate": 1.1213021889910914e-09, "Finetune/Loss": 0.7571340799331665, "Finetune/Loss (Raw)": 0.823672354221344, "Finetune/Step": 4951, "Finetune/Step Time": 2.9079772792756557} +{"Finetune/Learning Rate": 1.0259189456784946e-09, "Finetune/Loss": 0.7577998638153076, "Finetune/Loss (Raw)": 0.8516054749488831, "Finetune/Step": 4952, "Finetune/Step Time": 2.9195608720183372} +{"Finetune/Learning Rate": 9.347746742627285e-10, "Finetune/Loss": 0.7611773014068604, "Finetune/Loss (Raw)": 0.6655902862548828, "Finetune/Step": 4953, "Finetune/Step Time": 2.8894282523542643} +{"Finetune/Learning Rate": 8.478694133839949e-10, "Finetune/Loss": 0.7616968154907227, "Finetune/Loss (Raw)": 0.7803731560707092, "Finetune/Step": 4954, "Finetune/Step Time": 2.8887156024575233} +{"Finetune/Learning Rate": 7.652031998839349e-10, "Finetune/Loss": 0.7614886164665222, "Finetune/Loss (Raw)": 0.8331968188285828, "Finetune/Step": 4955, "Finetune/Step Time": 2.885131161659956} +{"Finetune/Learning Rate": 6.867760688078484e-10, "Finetune/Loss": 0.7616228461265564, "Finetune/Loss (Raw)": 0.7912993431091309, "Finetune/Step": 4956, "Finetune/Step Time": 2.8894465286284685} +{"Finetune/Learning Rate": 6.125880534046946e-10, "Finetune/Loss": 0.7608153820037842, "Finetune/Loss (Raw)": 0.6998674273490906, "Finetune/Step": 4957, "Finetune/Step Time": 2.890362123027444} +{"Finetune/Learning Rate": 5.426391851270918e-10, "Finetune/Loss": 0.7612266540527344, "Finetune/Loss (Raw)": 0.868102490901947, "Finetune/Step": 4958, "Finetune/Step Time": 2.8905344381928444} +{"Finetune/Learning Rate": 4.769294936268764e-10, "Finetune/Loss": 0.7610744833946228, "Finetune/Loss (Raw)": 0.7911228537559509, "Finetune/Step": 4959, "Finetune/Step Time": 2.8924355264753103} +{"Finetune/Learning Rate": 4.1545900676287496e-10, "Finetune/Loss": 0.7607240676879883, "Finetune/Loss (Raw)": 0.9030498266220093, "Finetune/Step": 4960, "Finetune/Step Time": 2.889499593526125} +{"Finetune/Learning Rate": 3.582277505942422e-10, "Finetune/Loss": 0.7609701752662659, "Finetune/Loss (Raw)": 0.8137897849082947, "Finetune/Step": 4961, "Finetune/Step Time": 2.888265883550048} +{"Finetune/Learning Rate": 3.0523574938379207e-10, "Finetune/Loss": 0.7601804137229919, "Finetune/Loss (Raw)": 0.6946359276771545, "Finetune/Step": 4962, "Finetune/Step Time": 2.891882276162505} +{"Finetune/Learning Rate": 2.5648302559688754e-10, "Finetune/Loss": 0.760269284248352, "Finetune/Loss (Raw)": 0.8091566562652588, "Finetune/Step": 4963, "Finetune/Step Time": 2.8987713661044836} +{"Finetune/Learning Rate": 2.119695999014404e-10, "Finetune/Loss": 0.7608625888824463, "Finetune/Loss (Raw)": 0.8531209826469421, "Finetune/Step": 4964, "Finetune/Step Time": 2.897393999621272} +{"Finetune/Learning Rate": 1.7169549116902161e-10, "Finetune/Loss": 0.7594816088676453, "Finetune/Loss (Raw)": 0.6591008305549622, "Finetune/Step": 4965, "Finetune/Step Time": 2.9188317246735096} +{"Finetune/Learning Rate": 1.3566071647375113e-10, "Finetune/Loss": 0.7589930295944214, "Finetune/Loss (Raw)": 0.8206406235694885, "Finetune/Step": 4966, "Finetune/Step Time": 2.9210250191390514} +{"Finetune/Learning Rate": 1.0386529109118749e-10, "Finetune/Loss": 0.7587618827819824, "Finetune/Loss (Raw)": 0.7452346086502075, "Finetune/Step": 4967, "Finetune/Step Time": 2.923173639923334} +{"Finetune/Learning Rate": 7.630922850054844e-11, "Finetune/Loss": 0.7590128183364868, "Finetune/Loss (Raw)": 0.8358520865440369, "Finetune/Step": 4968, "Finetune/Step Time": 2.9112496618181467} +{"Finetune/Learning Rate": 5.299254038582113e-11, "Finetune/Loss": 0.7590820789337158, "Finetune/Loss (Raw)": 0.7306535840034485, "Finetune/Step": 4969, "Finetune/Step Time": 2.9082301445305347} +{"Finetune/Learning Rate": 3.39152366302109e-11, "Finetune/Loss": 0.7587769031524658, "Finetune/Loss (Raw)": 0.787918746471405, "Finetune/Step": 4970, "Finetune/Step Time": 2.910550005733967} +{"Finetune/Learning Rate": 1.9077325322802708e-11, "Finetune/Loss": 0.760064423084259, "Finetune/Loss (Raw)": 0.7627471685409546, "Finetune/Step": 4971, "Finetune/Step Time": 2.8829449750483036} +{"Finetune/Learning Rate": 8.478812751899768e-12, "Finetune/Loss": 0.7602291107177734, "Finetune/Loss (Raw)": 0.7828897833824158, "Finetune/Step": 4972, "Finetune/Step Time": 2.878889048472047} +{"Finetune/Learning Rate": 2.1197034127951043e-12, "Finetune/Loss": 0.7652972936630249, "Finetune/Loss (Raw)": 0.8013003468513489, "Finetune/Step": 4973, "Finetune/Step Time": 2.8444697223603725} +{"Finetune/Learning Rate": 0.0, "Finetune/Loss": 0.7650017738342285, "Finetune/Loss (Raw)": 0.7731505632400513, "Finetune/Step": 4974, "Finetune/Step Time": 2.8424946516752243} +{"Finetune/Learning Rate": 2.1197034127951043e-12, "Finetune/Loss": 0.76496821641922, "Finetune/Loss (Raw)": 0.84368896484375, "Finetune/Step": 4975, "Finetune/Step Time": 2.846069421619177} diff --git a/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/run-metrics.jsonl b/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/run-metrics.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7a753fbd8b2d6120b86e9578d2740e465e68fea7 --- /dev/null +++ b/phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7/run-metrics.jsonl @@ -0,0 +1 @@ +{"hparams": {"dataset": {"align_stage_components": ["download/llava-laion-cc-sbu-558k/chat.json", "download/llava-laion-cc-sbu-558k"], "dataset_id": "llava-v15", "dataset_resampled": true, "dataset_root_dir": "data", "finetune_stage_components": ["/home/wzwang/data/llava/llava_phi_3_joint_sharegpt_sft_data_557k.json", "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/images"], "max_num_images": 6, "min_num_images": 1, "train_num_samples": 200000, "type": "llava-v15", "workers": 4}, "model": {"align_epochs": 1, "align_global_batch_size": 256, "align_learning_rate": 0.001, "align_lr_scheduler_type": "linear-warmup+cosine-decay", "align_max_grad_norm": 1.0, "align_max_steps": null, "align_per_device_batch_size": 16, "align_train_strategy": "fsdp-shard-grad-op", "align_warmup_ratio": 0.03, "align_weight_decay": 0.0, "arch_specifier": "full-align+avgpool", "enable_gradient_checkpointing": true, "enable_mixed_precision_training": true, "finetune_epochs": 1, "finetune_global_batch_size": 112, "finetune_learning_rate": 2e-05, "finetune_lr_scheduler_type": "linear-warmup+cosine-decay", "finetune_max_grad_norm": 1.0, "finetune_max_steps": null, "finetune_per_device_batch_size": 16, "finetune_train_strategy": "fsdp-full-shard", "finetune_warmup_ratio": 0.03, "finetune_weight_decay": 0.1, "image_resize_strategy": "resize-naive", "llm_backbone_id": "phi3-3b", "llm_max_length": 4096, "model_id": "phi3-3b-continue-training-hq-35-557k-sft", "pretrain_epochs": 1, "pretrain_global_batch_size": 512, "pretrain_learning_rate": 5e-05, "pretrain_lr_scheduler_type": "linear-warmup+cosine-decay", "pretrain_max_grad_norm": 1.0, "pretrain_max_steps": null, "pretrain_per_device_batch_size": 16, "pretrain_train_strategy": "fsdp-full-shard", "pretrain_warmup_ratio": 0.03, "pretrain_weight_decay": 0.01, "reduce_in_full_precision": false, "type": "one-stage+7b", "vision_backbone_id": "siglip-vit-so400m-384px"}, "mount_path": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models", "pretrained_checkpoint": "/home/wzwang/checkpoints/mllm_pretrain_checkpoints/obelics+phi3-3b-continue-training-hq_35-run1+stage-pretrain+x7/checkpoints/latest-checkpoint.pt", "run_id": "phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7", "run_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints/mllm_sft_checkpoints", "seed": 7, "stage": "finetune", "trackers": ["jsonl"], "wandb_entity": null, "wandb_project": "mmpretrain"}, "run_id": "phi3-3b-continue-training-hq-35-557k-sft+stage-finetune+x7"}