{"hparams": {"dataset": {"align_stage_components": ["download/llava-laion-cc-sbu-558k/chat.json", "download/llava-laion-cc-sbu-558k"], "dataset_id": "llava-v15", "dataset_root_dir": "data", "finetune_stage_components": ["download/llava-v1.5-instruct/llava_v1_5_mix665k.json", "download/llava-v1.5-instruct"], "type": "llava-v15"}, "hf_token": ".hf_token", "model": {"align_epochs": 1, "align_global_batch_size": 256, "align_learning_rate": 0.001, "align_lr_scheduler_type": "linear-warmup+cosine-decay", "align_max_grad_norm": 1.0, "align_max_steps": null, "align_per_device_batch_size": 16, "align_train_strategy": "fsdp-shard-grad-op", "align_warmup_ratio": 0.03, "align_weight_decay": 0.0, "arch_specifier": "no-align+gelu-mlp", "enable_gradient_checkpointing": true, "enable_mixed_precision_training": true, "finetune_epochs": 1, "finetune_global_batch_size": 128, "finetune_learning_rate": 2e-05, "finetune_lr_scheduler_type": "linear-warmup+cosine-decay", "finetune_max_grad_norm": 1.0, "finetune_max_steps": null, "finetune_per_device_batch_size": 16, "finetune_train_strategy": "fsdp-full-shard", "finetune_warmup_ratio": 0.03, "finetune_weight_decay": 0.1, "image_resize_strategy": "letterbox", "llm_backbone_id": "vicuna-v15-7b", "llm_max_length": 2048, "model_id": "full-ft-one-stage+7b", "reduce_in_full_precision": false, "type": "full-ft-one-stage+7b", "vision_backbone_id": "clip-vit-l-336px"}, "pretrained_checkpoint": null, "run_id": "full-ft-one-stage+7b", "run_root_dir": "runs", "seed": 7, "stage": "full-finetune", "trackers": ["jsonl", "wandb"], "wandb_entity": null, "wandb_project": "prismatic"}, "run_id": "full-ft-one-stage+7b+stage-full-finetune+x7"} {"Full-finetune/Learning Rate": 1.2903225806451614e-07, "Full-finetune/Loss": 5.405529975891113, "Full-finetune/Loss (Raw)": 5.405529975891113, "Full-finetune/Step": 1, "Full-finetune/Step Time": 24.873047828674316} {"Full-finetune/Learning Rate": 2.580645161290323e-07, "Full-finetune/Loss": 5.691460609436035, "Full-finetune/Loss (Raw)": 5.977391242980957, "Full-finetune/Step": 2, "Full-finetune/Step Time": 17.0067218542099} {"Full-finetune/Learning Rate": 3.870967741935484e-07, "Full-finetune/Loss": 5.075779438018799, "Full-finetune/Loss (Raw)": 3.844416618347168, "Full-finetune/Step": 3, "Full-finetune/Step Time": 13.212823867797852} {"Full-finetune/Learning Rate": 5.161290322580646e-07, "Full-finetune/Loss": 4.617429733276367, "Full-finetune/Loss (Raw)": 3.242382049560547, "Full-finetune/Step": 4, "Full-finetune/Step Time": 11.360151648521423} {"Full-finetune/Learning Rate": 6.451612903225807e-07, "Full-finetune/Loss": 4.254143714904785, "Full-finetune/Loss (Raw)": 2.800996780395508, "Full-finetune/Step": 5, "Full-finetune/Step Time": 10.448075342178345} {"Full-finetune/Learning Rate": 7.741935483870968e-07, "Full-finetune/Loss": 3.9795215129852295, "Full-finetune/Loss (Raw)": 2.606409788131714, "Full-finetune/Step": 6, "Full-finetune/Step Time": 9.752447168032328} {"Full-finetune/Learning Rate": 9.032258064516129e-07, "Full-finetune/Loss": 3.7876386642456055, "Full-finetune/Loss (Raw)": 2.636342763900757, "Full-finetune/Step": 7, "Full-finetune/Step Time": 9.254452671323504} {"Full-finetune/Learning Rate": 1.0322580645161291e-06, "Full-finetune/Loss": 3.634507656097412, "Full-finetune/Loss (Raw)": 2.5625929832458496, "Full-finetune/Step": 8, "Full-finetune/Step Time": 9.038153737783432} {"Full-finetune/Learning Rate": 1.1612903225806454e-06, "Full-finetune/Loss": 3.4805455207824707, "Full-finetune/Loss (Raw)": 2.2488460540771484, "Full-finetune/Step": 9, "Full-finetune/Step Time": 8.745264848073324} {"Full-finetune/Learning Rate": 1.2903225806451614e-06, "Full-finetune/Loss": 3.387449026107788, "Full-finetune/Loss (Raw)": 2.5495810508728027, "Full-finetune/Step": 10, "Full-finetune/Step Time": 8.748241186141968} {"Full-finetune/Learning Rate": 1.4193548387096776e-06, "Full-finetune/Loss": 3.29166316986084, "Full-finetune/Loss (Raw)": 2.333806276321411, "Full-finetune/Step": 11, "Full-finetune/Step Time": 8.500518907200206} {"Full-finetune/Learning Rate": 1.5483870967741937e-06, "Full-finetune/Loss": 3.2047955989837646, "Full-finetune/Loss (Raw)": 2.249253511428833, "Full-finetune/Step": 12, "Full-finetune/Step Time": 8.306091566880545} {"Full-finetune/Learning Rate": 1.67741935483871e-06, "Full-finetune/Loss": 3.118471384048462, "Full-finetune/Loss (Raw)": 2.08258056640625, "Full-finetune/Step": 13, "Full-finetune/Step Time": 8.140230637330275} {"Full-finetune/Learning Rate": 1.8064516129032258e-06, "Full-finetune/Loss": 3.063769817352295, "Full-finetune/Loss (Raw)": 2.3526504039764404, "Full-finetune/Step": 14, "Full-finetune/Step Time": 7.969228182520185} {"Full-finetune/Learning Rate": 1.935483870967742e-06, "Full-finetune/Loss": 2.9911749362945557, "Full-finetune/Loss (Raw)": 1.9748440980911255, "Full-finetune/Step": 15, "Full-finetune/Step Time": 7.920398314793904} {"Full-finetune/Learning Rate": 2.0645161290322582e-06, "Full-finetune/Loss": 2.8918004035949707, "Full-finetune/Loss (Raw)": 1.4011839628219604, "Full-finetune/Step": 16, "Full-finetune/Step Time": 7.885233923792839} {"Full-finetune/Learning Rate": 2.1935483870967745e-06, "Full-finetune/Loss": 2.8317625522613525, "Full-finetune/Loss (Raw)": 1.871152639389038, "Full-finetune/Step": 17, "Full-finetune/Step Time": 7.792490187813254} {"Full-finetune/Learning Rate": 2.3225806451612907e-06, "Full-finetune/Loss": 2.753575563430786, "Full-finetune/Loss (Raw)": 1.4243980646133423, "Full-finetune/Step": 18, "Full-finetune/Step Time": 7.734779437383016} {"Full-finetune/Learning Rate": 2.4516129032258066e-06, "Full-finetune/Loss": 2.700429677963257, "Full-finetune/Loss (Raw)": 1.7438017129898071, "Full-finetune/Step": 19, "Full-finetune/Step Time": 7.635772905851665} {"Full-finetune/Learning Rate": 2.580645161290323e-06, "Full-finetune/Loss": 2.648192882537842, "Full-finetune/Loss (Raw)": 1.6556954383850098, "Full-finetune/Step": 20, "Full-finetune/Step Time": 7.5344293236732485} {"Full-finetune/Learning Rate": 2.709677419354839e-06, "Full-finetune/Loss": 2.5919506549835205, "Full-finetune/Loss (Raw)": 1.4671074151992798, "Full-finetune/Step": 21, "Full-finetune/Step Time": 7.5275374707721525} {"Full-finetune/Learning Rate": 2.8387096774193553e-06, "Full-finetune/Loss": 2.5337655544281006, "Full-finetune/Loss (Raw)": 1.3118785619735718, "Full-finetune/Step": 22, "Full-finetune/Step Time": 7.472153208472512} {"Full-finetune/Learning Rate": 2.967741935483871e-06, "Full-finetune/Loss": 2.4332449436187744, "Full-finetune/Loss (Raw)": 0.22178851068019867, "Full-finetune/Step": 23, "Full-finetune/Step Time": 7.54178524017334} {"Full-finetune/Learning Rate": 3.0967741935483874e-06, "Full-finetune/Loss": 2.396077871322632, "Full-finetune/Loss (Raw)": 1.541238784790039, "Full-finetune/Step": 24, "Full-finetune/Step Time": 7.464219391345978} {"Full-finetune/Learning Rate": 3.225806451612903e-06, "Full-finetune/Loss": 2.3562369346618652, "Full-finetune/Loss (Raw)": 1.4000520706176758, "Full-finetune/Step": 25, "Full-finetune/Step Time": 7.416970367431641} {"Full-finetune/Learning Rate": 3.35483870967742e-06, "Full-finetune/Loss": 2.2758491039276123, "Full-finetune/Loss (Raw)": 0.26615452766418457, "Full-finetune/Step": 26, "Full-finetune/Step Time": 7.499482778402475} {"Full-finetune/Learning Rate": 3.4838709677419357e-06, "Full-finetune/Loss": 2.2485928535461426, "Full-finetune/Loss (Raw)": 1.5399322509765625, "Full-finetune/Step": 27, "Full-finetune/Step Time": 7.4244534439510765} {"Full-finetune/Learning Rate": 3.6129032258064515e-06, "Full-finetune/Loss": 2.216071128845215, "Full-finetune/Loss (Raw)": 1.3379814624786377, "Full-finetune/Step": 28, "Full-finetune/Step Time": 7.3624633720942905} {"Full-finetune/Learning Rate": 3.741935483870968e-06, "Full-finetune/Loss": 2.18984317779541, "Full-finetune/Loss (Raw)": 1.4554681777954102, "Full-finetune/Step": 29, "Full-finetune/Step Time": 7.354638420302292} {"Full-finetune/Learning Rate": 3.870967741935484e-06, "Full-finetune/Loss": 2.1595351696014404, "Full-finetune/Loss (Raw)": 1.280592918395996, "Full-finetune/Step": 30, "Full-finetune/Step Time": 7.350450841585795} {"Full-finetune/Learning Rate": 4.000000000000001e-06, "Full-finetune/Loss": 2.137584924697876, "Full-finetune/Loss (Raw)": 1.4790880680084229, "Full-finetune/Step": 31, "Full-finetune/Step Time": 7.3210450218569845} {"Full-finetune/Learning Rate": 4.1290322580645165e-06, "Full-finetune/Loss": 2.1120643615722656, "Full-finetune/Loss (Raw)": 1.3209233283996582, "Full-finetune/Step": 32, "Full-finetune/Step Time": 7.347361341118813} {"Full-finetune/Learning Rate": 4.258064516129032e-06, "Full-finetune/Loss": 2.0841848850250244, "Full-finetune/Loss (Raw)": 1.192038655281067, "Full-finetune/Step": 33, "Full-finetune/Step Time": 7.327375787677187} {"Full-finetune/Learning Rate": 4.387096774193549e-06, "Full-finetune/Loss": 2.0558159351348877, "Full-finetune/Loss (Raw)": 1.119642972946167, "Full-finetune/Step": 34, "Full-finetune/Step Time": 7.290866129538593} {"Full-finetune/Learning Rate": 4.516129032258065e-06, "Full-finetune/Loss": 2.03924298286438, "Full-finetune/Loss (Raw)": 1.4757580757141113, "Full-finetune/Step": 35, "Full-finetune/Step Time": 7.265568011147636} {"Full-finetune/Learning Rate": 4.6451612903225815e-06, "Full-finetune/Loss": 2.016756296157837, "Full-finetune/Loss (Raw)": 1.22972571849823, "Full-finetune/Step": 36, "Full-finetune/Step Time": 7.277163889673021} {"Full-finetune/Learning Rate": 4.774193548387097e-06, "Full-finetune/Loss": 1.9994300603866577, "Full-finetune/Loss (Raw)": 1.3756883144378662, "Full-finetune/Step": 37, "Full-finetune/Step Time": 7.327691870766717} {"Full-finetune/Learning Rate": 4.903225806451613e-06, "Full-finetune/Loss": 1.9794384241104126, "Full-finetune/Loss (Raw)": 1.2397491931915283, "Full-finetune/Step": 38, "Full-finetune/Step Time": 7.2841218584462215} {"Full-finetune/Learning Rate": 5.032258064516129e-06, "Full-finetune/Loss": 1.9597368240356445, "Full-finetune/Loss (Raw)": 1.2110638618469238, "Full-finetune/Step": 39, "Full-finetune/Step Time": 7.2425770942981424} {"Full-finetune/Learning Rate": 5.161290322580646e-06, "Full-finetune/Loss": 1.941470742225647, "Full-finetune/Loss (Raw)": 1.2290953397750854, "Full-finetune/Step": 40, "Full-finetune/Step Time": 7.249567645788193} {"Full-finetune/Learning Rate": 5.290322580645162e-06, "Full-finetune/Loss": 1.926000952720642, "Full-finetune/Loss (Raw)": 1.3072172403335571, "Full-finetune/Step": 41, "Full-finetune/Step Time": 7.1994601168283605} {"Full-finetune/Learning Rate": 5.419354838709678e-06, "Full-finetune/Loss": 1.9101881980895996, "Full-finetune/Loss (Raw)": 1.261858344078064, "Full-finetune/Step": 42, "Full-finetune/Step Time": 7.162840201741173} {"Full-finetune/Learning Rate": 5.548387096774194e-06, "Full-finetune/Loss": 1.8938034772872925, "Full-finetune/Loss (Raw)": 1.2056440114974976, "Full-finetune/Step": 43, "Full-finetune/Step Time": 7.161245651023332} {"Full-finetune/Learning Rate": 5.677419354838711e-06, "Full-finetune/Loss": 1.8788068294525146, "Full-finetune/Loss (Raw)": 1.233952522277832, "Full-finetune/Step": 44, "Full-finetune/Step Time": 7.153590072285045} {"Full-finetune/Learning Rate": 5.806451612903226e-06, "Full-finetune/Loss": 1.8611574172973633, "Full-finetune/Loss (Raw)": 1.0845835208892822, "Full-finetune/Step": 45, "Full-finetune/Step Time": 7.210298485226101} {"Full-finetune/Learning Rate": 5.935483870967742e-06, "Full-finetune/Loss": 1.8261123895645142, "Full-finetune/Loss (Raw)": 0.24908331036567688, "Full-finetune/Step": 46, "Full-finetune/Step Time": 7.25814281857532} {"Full-finetune/Learning Rate": 6.064516129032259e-06, "Full-finetune/Loss": 1.8121179342269897, "Full-finetune/Loss (Raw)": 1.1683827638626099, "Full-finetune/Step": 47, "Full-finetune/Step Time": 7.23298139775053} {"Full-finetune/Learning Rate": 6.193548387096775e-06, "Full-finetune/Loss": 1.798335313796997, "Full-finetune/Loss (Raw)": 1.1505458354949951, "Full-finetune/Step": 48, "Full-finetune/Step Time": 7.241590430339177} {"Full-finetune/Learning Rate": 6.3225806451612906e-06, "Full-finetune/Loss": 1.785848617553711, "Full-finetune/Loss (Raw)": 1.1864912509918213, "Full-finetune/Step": 49, "Full-finetune/Step Time": 7.245148566304421} {"Full-finetune/Learning Rate": 6.451612903225806e-06, "Full-finetune/Loss": 1.7709547281265259, "Full-finetune/Loss (Raw)": 1.0411523580551147, "Full-finetune/Step": 50, "Full-finetune/Step Time": 7.211849203109741} {"Full-finetune/Learning Rate": 6.580645161290323e-06, "Full-finetune/Loss": 1.7589061260223389, "Full-finetune/Loss (Raw)": 1.156473994255066, "Full-finetune/Step": 51, "Full-finetune/Step Time": 7.187453816918766} {"Full-finetune/Learning Rate": 6.70967741935484e-06, "Full-finetune/Loss": 1.7486885786056519, "Full-finetune/Loss (Raw)": 1.2275891304016113, "Full-finetune/Step": 52, "Full-finetune/Step Time": 7.180780002704034} {"Full-finetune/Learning Rate": 6.838709677419355e-06, "Full-finetune/Loss": 1.7333500385284424, "Full-finetune/Loss (Raw)": 0.9357542395591736, "Full-finetune/Step": 53, "Full-finetune/Step Time": 7.195158513087146} {"Full-finetune/Learning Rate": 6.967741935483871e-06, "Full-finetune/Loss": 1.7189359664916992, "Full-finetune/Loss (Raw)": 0.9549887180328369, "Full-finetune/Step": 54, "Full-finetune/Step Time": 7.19052071041531} {"Full-finetune/Learning Rate": 7.096774193548388e-06, "Full-finetune/Loss": 1.7090120315551758, "Full-finetune/Loss (Raw)": 1.1731278896331787, "Full-finetune/Step": 55, "Full-finetune/Step Time": 7.21635159145702} {"Full-finetune/Learning Rate": 7.225806451612903e-06, "Full-finetune/Loss": 1.6985946893692017, "Full-finetune/Loss (Raw)": 1.125628113746643, "Full-finetune/Step": 56, "Full-finetune/Step Time": 7.226866087743214} {"Full-finetune/Learning Rate": 7.35483870967742e-06, "Full-finetune/Loss": 1.6867800951004028, "Full-finetune/Loss (Raw)": 1.0251621007919312, "Full-finetune/Step": 57, "Full-finetune/Step Time": 7.205622233842549} {"Full-finetune/Learning Rate": 7.483870967741936e-06, "Full-finetune/Loss": 1.6762996912002563, "Full-finetune/Loss (Raw)": 1.0789188146591187, "Full-finetune/Step": 58, "Full-finetune/Step Time": 7.253985996904044} {"Full-finetune/Learning Rate": 7.612903225806451e-06, "Full-finetune/Loss": 1.6664742231369019, "Full-finetune/Loss (Raw)": 1.096597671508789, "Full-finetune/Step": 59, "Full-finetune/Step Time": 7.261630296707153} {"Full-finetune/Learning Rate": 7.741935483870968e-06, "Full-finetune/Loss": 1.6569240093231201, "Full-finetune/Loss (Raw)": 1.0934547185897827, "Full-finetune/Step": 60, "Full-finetune/Step Time": 7.237884803613027} {"Full-finetune/Learning Rate": 7.870967741935484e-06, "Full-finetune/Loss": 1.6486470699310303, "Full-finetune/Loss (Raw)": 1.152044415473938, "Full-finetune/Step": 61, "Full-finetune/Step Time": 7.223698096197159} {"Full-finetune/Learning Rate": 8.000000000000001e-06, "Full-finetune/Loss": 1.6414639949798584, "Full-finetune/Loss (Raw)": 1.2032910585403442, "Full-finetune/Step": 62, "Full-finetune/Step Time": 7.199110088809844} {"Full-finetune/Learning Rate": 8.129032258064517e-06, "Full-finetune/Loss": 1.6347345113754272, "Full-finetune/Loss (Raw)": 1.2175010442733765, "Full-finetune/Step": 63, "Full-finetune/Step Time": 7.179618282923623} {"Full-finetune/Learning Rate": 8.258064516129033e-06, "Full-finetune/Loss": 1.6257590055465698, "Full-finetune/Loss (Raw)": 1.0603084564208984, "Full-finetune/Step": 64, "Full-finetune/Step Time": 7.213766172528267} {"Full-finetune/Learning Rate": 8.387096774193549e-06, "Full-finetune/Loss": 1.6170358657836914, "Full-finetune/Loss (Raw)": 1.058752417564392, "Full-finetune/Step": 65, "Full-finetune/Step Time": 7.208144187927246} {"Full-finetune/Learning Rate": 8.516129032258065e-06, "Full-finetune/Loss": 1.607863426208496, "Full-finetune/Loss (Raw)": 1.011643648147583, "Full-finetune/Step": 66, "Full-finetune/Step Time": 7.194636084816673} {"Full-finetune/Learning Rate": 8.64516129032258e-06, "Full-finetune/Loss": 1.59743070602417, "Full-finetune/Loss (Raw)": 0.9088878631591797, "Full-finetune/Step": 67, "Full-finetune/Step Time": 7.171497017589967} {"Full-finetune/Learning Rate": 8.774193548387098e-06, "Full-finetune/Loss": 1.5904793739318848, "Full-finetune/Loss (Raw)": 1.1247285604476929, "Full-finetune/Step": 68, "Full-finetune/Step Time": 7.1699129939079285} {"Full-finetune/Learning Rate": 8.903225806451614e-06, "Full-finetune/Loss": 1.584189534187317, "Full-finetune/Loss (Raw)": 1.156488060951233, "Full-finetune/Step": 69, "Full-finetune/Step Time": 7.147656458011572} {"Full-finetune/Learning Rate": 9.03225806451613e-06, "Full-finetune/Loss": 1.5785820484161377, "Full-finetune/Loss (Raw)": 1.191664457321167, "Full-finetune/Step": 70, "Full-finetune/Step Time": 7.129142250333514} {"Full-finetune/Learning Rate": 9.161290322580645e-06, "Full-finetune/Loss": 1.569289207458496, "Full-finetune/Loss (Raw)": 0.9187872409820557, "Full-finetune/Step": 71, "Full-finetune/Step Time": 7.112867127002125} {"Full-finetune/Learning Rate": 9.290322580645163e-06, "Full-finetune/Loss": 1.5618520975112915, "Full-finetune/Loss (Raw)": 1.0338118076324463, "Full-finetune/Step": 72, "Full-finetune/Step Time": 7.090715388456981} {"Full-finetune/Learning Rate": 9.419354838709677e-06, "Full-finetune/Loss": 1.553261637687683, "Full-finetune/Loss (Raw)": 0.9347618222236633, "Full-finetune/Step": 73, "Full-finetune/Step Time": 7.074011805939348} {"Full-finetune/Learning Rate": 9.548387096774195e-06, "Full-finetune/Loss": 1.544954538345337, "Full-finetune/Loss (Raw)": 0.9385353922843933, "Full-finetune/Step": 74, "Full-finetune/Step Time": 7.058714666882077} {"Full-finetune/Learning Rate": 9.67741935483871e-06, "Full-finetune/Loss": 1.5352888107299805, "Full-finetune/Loss (Raw)": 0.820017397403717, "Full-finetune/Step": 75, "Full-finetune/Step Time": 7.053771743774414} {"Full-finetune/Learning Rate": 9.806451612903226e-06, "Full-finetune/Loss": 1.5280263423919678, "Full-finetune/Loss (Raw)": 0.9833366274833679, "Full-finetune/Step": 76, "Full-finetune/Step Time": 7.048488648314225} {"Full-finetune/Learning Rate": 9.935483870967742e-06, "Full-finetune/Loss": 1.5228153467178345, "Full-finetune/Loss (Raw)": 1.1267871856689453, "Full-finetune/Step": 77, "Full-finetune/Step Time": 7.0284574186647095} {"Full-finetune/Learning Rate": 1.0064516129032258e-05, "Full-finetune/Loss": 1.5187678337097168, "Full-finetune/Loss (Raw)": 1.2071059942245483, "Full-finetune/Step": 78, "Full-finetune/Step Time": 7.009898592264224} {"Full-finetune/Learning Rate": 1.0193548387096774e-05, "Full-finetune/Loss": 1.5144834518432617, "Full-finetune/Loss (Raw)": 1.180302619934082, "Full-finetune/Step": 79, "Full-finetune/Step Time": 6.996029651617702} {"Full-finetune/Learning Rate": 1.0322580645161291e-05, "Full-finetune/Loss": 1.5076943635940552, "Full-finetune/Loss (Raw)": 0.9713600277900696, "Full-finetune/Step": 80, "Full-finetune/Step Time": 7.003210914134979} {"Full-finetune/Learning Rate": 1.0451612903225807e-05, "Full-finetune/Loss": 1.5032709836959839, "Full-finetune/Loss (Raw)": 1.149398684501648, "Full-finetune/Step": 81, "Full-finetune/Step Time": 7.001917397534406} {"Full-finetune/Learning Rate": 1.0580645161290325e-05, "Full-finetune/Loss": 1.4983125925064087, "Full-finetune/Loss (Raw)": 1.0966989994049072, "Full-finetune/Step": 82, "Full-finetune/Step Time": 6.987029750172685} {"Full-finetune/Learning Rate": 1.070967741935484e-05, "Full-finetune/Loss": 1.491774082183838, "Full-finetune/Loss (Raw)": 0.9556095600128174, "Full-finetune/Step": 83, "Full-finetune/Step Time": 6.9965082191559205} {"Full-finetune/Learning Rate": 1.0838709677419356e-05, "Full-finetune/Loss": 1.4883114099502563, "Full-finetune/Loss (Raw)": 1.2009048461914062, "Full-finetune/Step": 84, "Full-finetune/Step Time": 6.999910964852288} {"Full-finetune/Learning Rate": 1.096774193548387e-05, "Full-finetune/Loss": 1.4830647706985474, "Full-finetune/Loss (Raw)": 1.0423426628112793, "Full-finetune/Step": 85, "Full-finetune/Step Time": 6.987997753479902} {"Full-finetune/Learning Rate": 1.1096774193548388e-05, "Full-finetune/Loss": 1.4697409868240356, "Full-finetune/Loss (Raw)": 0.3372296690940857, "Full-finetune/Step": 86, "Full-finetune/Step Time": 7.002829094265783} {"Full-finetune/Learning Rate": 1.1225806451612904e-05, "Full-finetune/Loss": 1.4647413492202759, "Full-finetune/Loss (Raw)": 1.0347652435302734, "Full-finetune/Step": 87, "Full-finetune/Step Time": 6.991022477204773} {"Full-finetune/Learning Rate": 1.1354838709677421e-05, "Full-finetune/Loss": 1.462084412574768, "Full-finetune/Loss (Raw)": 1.2309184074401855, "Full-finetune/Step": 88, "Full-finetune/Step Time": 7.000790067694404} {"Full-finetune/Learning Rate": 1.1483870967741937e-05, "Full-finetune/Loss": 1.457628607749939, "Full-finetune/Loss (Raw)": 1.0655336380004883, "Full-finetune/Step": 89, "Full-finetune/Step Time": 6.989445884576004} {"Full-finetune/Learning Rate": 1.1612903225806453e-05, "Full-finetune/Loss": 1.4541114568710327, "Full-finetune/Loss (Raw)": 1.1410720348358154, "Full-finetune/Step": 90, "Full-finetune/Step Time": 6.999344295925564} {"Full-finetune/Learning Rate": 1.1741935483870967e-05, "Full-finetune/Loss": 1.4508087635040283, "Full-finetune/Loss (Raw)": 1.1535725593566895, "Full-finetune/Step": 91, "Full-finetune/Step Time": 7.0037712919843065} {"Full-finetune/Learning Rate": 1.1870967741935484e-05, "Full-finetune/Loss": 1.4480760097503662, "Full-finetune/Loss (Raw)": 1.1993885040283203, "Full-finetune/Step": 92, "Full-finetune/Step Time": 6.994451712007108} {"Full-finetune/Learning Rate": 1.2e-05, "Full-finetune/Loss": 1.4425047636032104, "Full-finetune/Loss (Raw)": 0.9299607872962952, "Full-finetune/Step": 93, "Full-finetune/Step Time": 6.988060279559064} {"Full-finetune/Learning Rate": 1.2129032258064518e-05, "Full-finetune/Loss": 1.4394694566726685, "Full-finetune/Loss (Raw)": 1.1571937799453735, "Full-finetune/Step": 94, "Full-finetune/Step Time": 6.972927752961504} {"Full-finetune/Learning Rate": 1.2258064516129034e-05, "Full-finetune/Loss": 1.4357081651687622, "Full-finetune/Loss (Raw)": 1.082128882408142, "Full-finetune/Step": 95, "Full-finetune/Step Time": 6.962757765619378} {"Full-finetune/Learning Rate": 1.238709677419355e-05, "Full-finetune/Loss": 1.4319560527801514, "Full-finetune/Loss (Raw)": 1.0755012035369873, "Full-finetune/Step": 96, "Full-finetune/Step Time": 6.967276573181152} {"Full-finetune/Learning Rate": 1.2516129032258067e-05, "Full-finetune/Loss": 1.427771806716919, "Full-finetune/Loss (Raw)": 1.0260896682739258, "Full-finetune/Step": 97, "Full-finetune/Step Time": 6.963979450697751} {"Full-finetune/Learning Rate": 1.2645161290322581e-05, "Full-finetune/Loss": 1.424576759338379, "Full-finetune/Loss (Raw)": 1.1146527528762817, "Full-finetune/Step": 98, "Full-finetune/Step Time": 6.953314737397797} {"Full-finetune/Learning Rate": 1.2774193548387097e-05, "Full-finetune/Loss": 1.412203073501587, "Full-finetune/Loss (Raw)": 0.1995886117219925, "Full-finetune/Step": 99, "Full-finetune/Step Time": 6.965923386390763} {"Full-finetune/Learning Rate": 1.2903225806451613e-05, "Full-finetune/Loss": 1.4101654291152954, "Full-finetune/Loss (Raw)": 1.2084518671035767, "Full-finetune/Step": 100, "Full-finetune/Step Time": 6.960215444564819} {"Full-finetune/Learning Rate": 1.303225806451613e-05, "Full-finetune/Loss": 1.406559705734253, "Full-finetune/Loss (Raw)": 1.0459705591201782, "Full-finetune/Step": 101, "Full-finetune/Step Time": 6.963319903553122} {"Full-finetune/Learning Rate": 1.3161290322580646e-05, "Full-finetune/Loss": 1.404595971107483, "Full-finetune/Loss (Raw)": 1.2062615156173706, "Full-finetune/Step": 102, "Full-finetune/Step Time": 6.948697978375005} {"Full-finetune/Learning Rate": 1.3290322580645164e-05, "Full-finetune/Loss": 1.3937327861785889, "Full-finetune/Loss (Raw)": 0.28570228815078735, "Full-finetune/Step": 103, "Full-finetune/Step Time": 6.962654507275924} {"Full-finetune/Learning Rate": 1.341935483870968e-05, "Full-finetune/Loss": 1.3913586139678955, "Full-finetune/Loss (Raw)": 1.146819829940796, "Full-finetune/Step": 104, "Full-finetune/Step Time": 6.951257547506919} {"Full-finetune/Learning Rate": 1.3548387096774194e-05, "Full-finetune/Loss": 1.3880906105041504, "Full-finetune/Loss (Raw)": 1.048222541809082, "Full-finetune/Step": 105, "Full-finetune/Step Time": 6.936406253633045} {"Full-finetune/Learning Rate": 1.367741935483871e-05, "Full-finetune/Loss": 1.384995698928833, "Full-finetune/Loss (Raw)": 1.0600049495697021, "Full-finetune/Step": 106, "Full-finetune/Step Time": 6.925615652552191} {"Full-finetune/Learning Rate": 1.3806451612903227e-05, "Full-finetune/Loss": 1.382573127746582, "Full-finetune/Loss (Raw)": 1.125802993774414, "Full-finetune/Step": 107, "Full-finetune/Step Time": 6.915776718442685} {"Full-finetune/Learning Rate": 1.3935483870967743e-05, "Full-finetune/Loss": 1.379143476486206, "Full-finetune/Loss (Raw)": 1.0121617317199707, "Full-finetune/Step": 108, "Full-finetune/Step Time": 6.90835146550779} {"Full-finetune/Learning Rate": 1.406451612903226e-05, "Full-finetune/Loss": 1.376923680305481, "Full-finetune/Loss (Raw)": 1.137197732925415, "Full-finetune/Step": 109, "Full-finetune/Step Time": 6.898590827206953} {"Full-finetune/Learning Rate": 1.4193548387096776e-05, "Full-finetune/Loss": 1.3738592863082886, "Full-finetune/Loss (Raw)": 1.0398370027542114, "Full-finetune/Step": 110, "Full-finetune/Step Time": 6.899720690467141} {"Full-finetune/Learning Rate": 1.4322580645161292e-05, "Full-finetune/Loss": 1.3714792728424072, "Full-finetune/Loss (Raw)": 1.1096713542938232, "Full-finetune/Step": 111, "Full-finetune/Step Time": 6.9067274965681476} {"Full-finetune/Learning Rate": 1.4451612903225806e-05, "Full-finetune/Loss": 1.3688321113586426, "Full-finetune/Loss (Raw)": 1.0749876499176025, "Full-finetune/Step": 112, "Full-finetune/Step Time": 6.903085842728615} {"Full-finetune/Learning Rate": 1.4580645161290324e-05, "Full-finetune/Loss": 1.366636037826538, "Full-finetune/Loss (Raw)": 1.1206867694854736, "Full-finetune/Step": 113, "Full-finetune/Step Time": 6.907210871181657} {"Full-finetune/Learning Rate": 1.470967741935484e-05, "Full-finetune/Loss": 1.3567042350769043, "Full-finetune/Loss (Raw)": 0.23440256714820862, "Full-finetune/Step": 114, "Full-finetune/Step Time": 6.940682329629597} {"Full-finetune/Learning Rate": 1.4838709677419357e-05, "Full-finetune/Loss": 1.354309320449829, "Full-finetune/Loss (Raw)": 1.0812960863113403, "Full-finetune/Step": 115, "Full-finetune/Step Time": 6.931930083813874} {"Full-finetune/Learning Rate": 1.4967741935483873e-05, "Full-finetune/Loss": 1.350560188293457, "Full-finetune/Loss (Raw)": 0.9193953275680542, "Full-finetune/Step": 116, "Full-finetune/Step Time": 6.9381501736312075} {"Full-finetune/Learning Rate": 1.5096774193548389e-05, "Full-finetune/Loss": 1.3484892845153809, "Full-finetune/Loss (Raw)": 1.1082671880722046, "Full-finetune/Step": 117, "Full-finetune/Step Time": 6.945686057082608} {"Full-finetune/Learning Rate": 1.5225806451612903e-05, "Full-finetune/Loss": 1.3467111587524414, "Full-finetune/Loss (Raw)": 1.1386771202087402, "Full-finetune/Step": 118, "Full-finetune/Step Time": 6.936145277346595} {"Full-finetune/Learning Rate": 1.535483870967742e-05, "Full-finetune/Loss": 1.3441168069839478, "Full-finetune/Loss (Raw)": 1.037977695465088, "Full-finetune/Step": 119, "Full-finetune/Step Time": 6.928299078420431} {"Full-finetune/Learning Rate": 1.5483870967741936e-05, "Full-finetune/Loss": 1.3419520854949951, "Full-finetune/Loss (Raw)": 1.0843558311462402, "Full-finetune/Step": 120, "Full-finetune/Step Time": 6.92472327152888} {"Full-finetune/Learning Rate": 1.5612903225806454e-05, "Full-finetune/Loss": 1.3393019437789917, "Full-finetune/Loss (Raw)": 1.0212832689285278, "Full-finetune/Step": 121, "Full-finetune/Step Time": 6.933842621558954} {"Full-finetune/Learning Rate": 1.5741935483870968e-05, "Full-finetune/Loss": 1.3362418413162231, "Full-finetune/Loss (Raw)": 0.965973436832428, "Full-finetune/Step": 122, "Full-finetune/Step Time": 6.9246280779604055} {"Full-finetune/Learning Rate": 1.5870967741935485e-05, "Full-finetune/Loss": 1.333601951599121, "Full-finetune/Loss (Raw)": 1.0115351676940918, "Full-finetune/Step": 123, "Full-finetune/Step Time": 6.916174739356933} {"Full-finetune/Learning Rate": 1.6000000000000003e-05, "Full-finetune/Loss": 1.3319159746170044, "Full-finetune/Loss (Raw)": 1.1245570182800293, "Full-finetune/Step": 124, "Full-finetune/Step Time": 6.910293290691991} {"Full-finetune/Learning Rate": 1.6129032258064517e-05, "Full-finetune/Loss": 1.3293272256851196, "Full-finetune/Loss (Raw)": 1.0083006620407104, "Full-finetune/Step": 125, "Full-finetune/Step Time": 6.903874397277832} {"Full-finetune/Learning Rate": 1.6258064516129034e-05, "Full-finetune/Loss": 1.327489972114563, "Full-finetune/Loss (Raw)": 1.0978449583053589, "Full-finetune/Step": 126, "Full-finetune/Step Time": 6.916098602234372} {"Full-finetune/Learning Rate": 1.638709677419355e-05, "Full-finetune/Loss": 1.3248164653778076, "Full-finetune/Loss (Raw)": 0.9879487156867981, "Full-finetune/Step": 127, "Full-finetune/Step Time": 6.906585135797816} {"Full-finetune/Learning Rate": 1.6516129032258066e-05, "Full-finetune/Loss": 1.3232429027557373, "Full-finetune/Loss (Raw)": 1.123399257659912, "Full-finetune/Step": 128, "Full-finetune/Step Time": 6.900461431592703} {"Full-finetune/Learning Rate": 1.6645161290322583e-05, "Full-finetune/Loss": 1.2899725437164307, "Full-finetune/Loss (Raw)": 1.146921157836914, "Full-finetune/Step": 129, "Full-finetune/Step Time": 6.7525866981595755} {"Full-finetune/Learning Rate": 1.6774193548387098e-05, "Full-finetune/Loss": 1.2521171569824219, "Full-finetune/Loss (Raw)": 1.1319116353988647, "Full-finetune/Step": 130, "Full-finetune/Step Time": 6.735816486179829} {"Full-finetune/Learning Rate": 1.6903225806451615e-05, "Full-finetune/Loss": 1.2306275367736816, "Full-finetune/Loss (Raw)": 1.0937461853027344, "Full-finetune/Step": 131, "Full-finetune/Step Time": 6.73596597276628} {"Full-finetune/Learning Rate": 1.703225806451613e-05, "Full-finetune/Loss": 1.2139315605163574, "Full-finetune/Loss (Raw)": 1.1052932739257812, "Full-finetune/Step": 132, "Full-finetune/Step Time": 6.736608635634184} {"Full-finetune/Learning Rate": 1.7161290322580647e-05, "Full-finetune/Loss": 1.1990251541137695, "Full-finetune/Loss (Raw)": 0.892977237701416, "Full-finetune/Step": 133, "Full-finetune/Step Time": 6.7463807053864} {"Full-finetune/Learning Rate": 1.729032258064516e-05, "Full-finetune/Loss": 1.1883482933044434, "Full-finetune/Loss (Raw)": 1.2397656440734863, "Full-finetune/Step": 134, "Full-finetune/Step Time": 6.743133643642068} {"Full-finetune/Learning Rate": 1.741935483870968e-05, "Full-finetune/Loss": 1.1755445003509521, "Full-finetune/Loss (Raw)": 0.9974704384803772, "Full-finetune/Step": 135, "Full-finetune/Step Time": 6.744930535554886} {"Full-finetune/Learning Rate": 1.7548387096774196e-05, "Full-finetune/Loss": 1.1639339923858643, "Full-finetune/Loss (Raw)": 1.0764409303665161, "Full-finetune/Step": 136, "Full-finetune/Step Time": 6.7310119066387415} {"Full-finetune/Learning Rate": 1.7677419354838713e-05, "Full-finetune/Loss": 1.1539876461029053, "Full-finetune/Loss (Raw)": 0.9757031202316284, "Full-finetune/Step": 137, "Full-finetune/Step Time": 6.733546933159232} {"Full-finetune/Learning Rate": 1.7806451612903228e-05, "Full-finetune/Loss": 1.14277982711792, "Full-finetune/Loss (Raw)": 1.1149832010269165, "Full-finetune/Step": 138, "Full-finetune/Step Time": 6.706450009718537} {"Full-finetune/Learning Rate": 1.7935483870967742e-05, "Full-finetune/Loss": 1.1316771507263184, "Full-finetune/Loss (Raw)": 0.9126586318016052, "Full-finetune/Step": 139, "Full-finetune/Step Time": 6.708650974556804} {"Full-finetune/Learning Rate": 1.806451612903226e-05, "Full-finetune/Loss": 1.1240980625152588, "Full-finetune/Loss (Raw)": 1.279141902923584, "Full-finetune/Step": 140, "Full-finetune/Step Time": 6.703326208516955} {"Full-finetune/Learning Rate": 1.8193548387096777e-05, "Full-finetune/Loss": 1.1158654689788818, "Full-finetune/Loss (Raw)": 1.028814435005188, "Full-finetune/Step": 141, "Full-finetune/Step Time": 6.697620004415512} {"Full-finetune/Learning Rate": 1.832258064516129e-05, "Full-finetune/Loss": 1.1054675579071045, "Full-finetune/Loss (Raw)": 1.0216975212097168, "Full-finetune/Step": 142, "Full-finetune/Step Time": 6.738394359126687} {"Full-finetune/Learning Rate": 1.845161290322581e-05, "Full-finetune/Loss": 1.0975465774536133, "Full-finetune/Loss (Raw)": 0.9609792232513428, "Full-finetune/Step": 143, "Full-finetune/Step Time": 6.753427874296904} {"Full-finetune/Learning Rate": 1.8580645161290326e-05, "Full-finetune/Loss": 1.0894136428833008, "Full-finetune/Loss (Raw)": 0.36015984416007996, "Full-finetune/Step": 144, "Full-finetune/Step Time": 6.764564082026482} {"Full-finetune/Learning Rate": 1.870967741935484e-05, "Full-finetune/Loss": 1.0773868560791016, "Full-finetune/Loss (Raw)": 0.33171746134757996, "Full-finetune/Step": 145, "Full-finetune/Step Time": 6.7864699605852365} {"Full-finetune/Learning Rate": 1.8838709677419354e-05, "Full-finetune/Loss": 1.0737518072128296, "Full-finetune/Loss (Raw)": 0.9591213464736938, "Full-finetune/Step": 146, "Full-finetune/Step Time": 6.778028443455696} {"Full-finetune/Learning Rate": 1.896774193548387e-05, "Full-finetune/Loss": 1.0670636892318726, "Full-finetune/Loss (Raw)": 0.8877229690551758, "Full-finetune/Step": 147, "Full-finetune/Step Time": 6.784637911245227} {"Full-finetune/Learning Rate": 1.909677419354839e-05, "Full-finetune/Loss": 1.0624663829803467, "Full-finetune/Loss (Raw)": 1.0672411918640137, "Full-finetune/Step": 148, "Full-finetune/Step Time": 6.787620175629854} {"Full-finetune/Learning Rate": 1.9225806451612907e-05, "Full-finetune/Loss": 1.0596638917922974, "Full-finetune/Loss (Raw)": 1.1083766222000122, "Full-finetune/Step": 149, "Full-finetune/Step Time": 6.777797874063253} {"Full-finetune/Learning Rate": 1.935483870967742e-05, "Full-finetune/Loss": 1.0581881999969482, "Full-finetune/Loss (Raw)": 1.122999668121338, "Full-finetune/Step": 150, "Full-finetune/Step Time": 6.78206211514771} {"Full-finetune/Learning Rate": 1.948387096774194e-05, "Full-finetune/Loss": 1.0649657249450684, "Full-finetune/Loss (Raw)": 1.089297890663147, "Full-finetune/Step": 151, "Full-finetune/Step Time": 6.761695126071572} {"Full-finetune/Learning Rate": 1.9612903225806452e-05, "Full-finetune/Loss": 1.0610580444335938, "Full-finetune/Loss (Raw)": 1.0410733222961426, "Full-finetune/Step": 152, "Full-finetune/Step Time": 6.76713677123189} {"Full-finetune/Learning Rate": 1.974193548387097e-05, "Full-finetune/Loss": 1.0591042041778564, "Full-finetune/Loss (Raw)": 1.1499592065811157, "Full-finetune/Step": 153, "Full-finetune/Step Time": 6.777296468615532} {"Full-finetune/Learning Rate": 1.9870967741935484e-05, "Full-finetune/Loss": 1.0658280849456787, "Full-finetune/Loss (Raw)": 1.1268043518066406, "Full-finetune/Step": 154, "Full-finetune/Step Time": 6.750060608610511} {"Full-finetune/Learning Rate": 2e-05, "Full-finetune/Loss": 1.0631670951843262, "Full-finetune/Loss (Raw)": 1.1993376016616821, "Full-finetune/Step": 155, "Full-finetune/Step Time": 6.758458856493235} {"Full-finetune/Learning Rate": 1.9999998059597617e-05, "Full-finetune/Loss": 1.0555944442749023, "Full-finetune/Loss (Raw)": 0.36866137385368347, "Full-finetune/Step": 156, "Full-finetune/Step Time": 6.780053878203034} {"Full-finetune/Learning Rate": 1.9999992238391222e-05, "Full-finetune/Loss": 1.052583932876587, "Full-finetune/Loss (Raw)": 1.0701282024383545, "Full-finetune/Step": 157, "Full-finetune/Step Time": 6.7709692027419806} {"Full-finetune/Learning Rate": 1.999998253638307e-05, "Full-finetune/Loss": 1.0512139797210693, "Full-finetune/Loss (Raw)": 1.1052438020706177, "Full-finetune/Step": 158, "Full-finetune/Step Time": 6.762851316481829} {"Full-finetune/Learning Rate": 1.999996895357693e-05, "Full-finetune/Loss": 1.048051357269287, "Full-finetune/Loss (Raw)": 1.0742701292037964, "Full-finetune/Step": 159, "Full-finetune/Step Time": 6.7557044718414545} {"Full-finetune/Learning Rate": 1.9999951489978074e-05, "Full-finetune/Loss": 1.0456123352050781, "Full-finetune/Loss (Raw)": 1.0087393522262573, "Full-finetune/Step": 160, "Full-finetune/Step Time": 6.746077422052622} {"Full-finetune/Learning Rate": 1.9999930145593275e-05, "Full-finetune/Loss": 1.0442790985107422, "Full-finetune/Loss (Raw)": 1.0213696956634521, "Full-finetune/Step": 161, "Full-finetune/Step Time": 6.742759542539716} {"Full-finetune/Learning Rate": 1.9999904920430818e-05, "Full-finetune/Loss": 1.0453304052352905, "Full-finetune/Loss (Raw)": 1.2542226314544678, "Full-finetune/Step": 162, "Full-finetune/Step Time": 6.741814650595188} {"Full-finetune/Learning Rate": 1.9999875814500492e-05, "Full-finetune/Loss": 1.0421969890594482, "Full-finetune/Loss (Raw)": 1.074676275253296, "Full-finetune/Step": 163, "Full-finetune/Step Time": 6.743121484294534} {"Full-finetune/Learning Rate": 1.99998428278136e-05, "Full-finetune/Loss": 1.0400539636611938, "Full-finetune/Loss (Raw)": 0.9554197192192078, "Full-finetune/Step": 164, "Full-finetune/Step Time": 6.7415273655205965} {"Full-finetune/Learning Rate": 1.9999805960382928e-05, "Full-finetune/Loss": 1.0374630689620972, "Full-finetune/Loss (Raw)": 1.0440492630004883, "Full-finetune/Step": 165, "Full-finetune/Step Time": 6.719664342701435} {"Full-finetune/Learning Rate": 1.99997652122228e-05, "Full-finetune/Loss": 1.0354994535446167, "Full-finetune/Loss (Raw)": 0.9884102940559387, "Full-finetune/Step": 166, "Full-finetune/Step Time": 6.72241672873497} {"Full-finetune/Learning Rate": 1.9999720583349015e-05, "Full-finetune/Loss": 1.0349429845809937, "Full-finetune/Loss (Raw)": 1.1398333311080933, "Full-finetune/Step": 167, "Full-finetune/Step Time": 6.724332857877016} {"Full-finetune/Learning Rate": 1.9999672073778905e-05, "Full-finetune/Loss": 1.032962679862976, "Full-finetune/Loss (Raw)": 0.9756137132644653, "Full-finetune/Step": 168, "Full-finetune/Step Time": 6.713953198865056} {"Full-finetune/Learning Rate": 1.999961968353129e-05, "Full-finetune/Loss": 1.0302939414978027, "Full-finetune/Loss (Raw)": 0.9656187891960144, "Full-finetune/Step": 169, "Full-finetune/Step Time": 6.729220515117049} {"Full-finetune/Learning Rate": 1.9999563412626503e-05, "Full-finetune/Loss": 1.023183822631836, "Full-finetune/Loss (Raw)": 0.35177767276763916, "Full-finetune/Step": 170, "Full-finetune/Step Time": 6.758419014513493} {"Full-finetune/Learning Rate": 1.9999503261086378e-05, "Full-finetune/Loss": 1.021570086479187, "Full-finetune/Loss (Raw)": 0.9990805983543396, "Full-finetune/Step": 171, "Full-finetune/Step Time": 6.757160674780607} {"Full-finetune/Learning Rate": 1.999943922893426e-05, "Full-finetune/Loss": 1.0196306705474854, "Full-finetune/Loss (Raw)": 0.9857032895088196, "Full-finetune/Step": 172, "Full-finetune/Step Time": 6.760331321507692} {"Full-finetune/Learning Rate": 1.9999371316195005e-05, "Full-finetune/Loss": 1.0204583406448364, "Full-finetune/Loss (Raw)": 1.1905255317687988, "Full-finetune/Step": 173, "Full-finetune/Step Time": 6.729773320257664} {"Full-finetune/Learning Rate": 1.9999299522894957e-05, "Full-finetune/Loss": 1.0254504680633545, "Full-finetune/Loss (Raw)": 0.8880649209022522, "Full-finetune/Step": 174, "Full-finetune/Step Time": 6.717814091593027} {"Full-finetune/Learning Rate": 1.9999223849061987e-05, "Full-finetune/Loss": 1.0256633758544922, "Full-finetune/Loss (Raw)": 1.1956452131271362, "Full-finetune/Step": 175, "Full-finetune/Step Time": 6.714859388768673} {"Full-finetune/Learning Rate": 1.999914429472546e-05, "Full-finetune/Loss": 1.0194023847579956, "Full-finetune/Loss (Raw)": 0.3491418957710266, "Full-finetune/Step": 176, "Full-finetune/Step Time": 6.719585865736008} {"Full-finetune/Learning Rate": 1.9999060859916247e-05, "Full-finetune/Loss": 1.0177438259124756, "Full-finetune/Loss (Raw)": 0.9741896390914917, "Full-finetune/Step": 177, "Full-finetune/Step Time": 6.712315985932946} {"Full-finetune/Learning Rate": 1.9998973544666734e-05, "Full-finetune/Loss": 1.018908977508545, "Full-finetune/Loss (Raw)": 1.1902981996536255, "Full-finetune/Step": 178, "Full-finetune/Step Time": 6.719766523689032} {"Full-finetune/Learning Rate": 1.9998882349010798e-05, "Full-finetune/Loss": 1.0168894529342651, "Full-finetune/Loss (Raw)": 0.8979662656784058, "Full-finetune/Step": 179, "Full-finetune/Step Time": 6.724142827093601} {"Full-finetune/Learning Rate": 1.999878727298384e-05, "Full-finetune/Loss": 1.0156477689743042, "Full-finetune/Loss (Raw)": 1.0686562061309814, "Full-finetune/Step": 180, "Full-finetune/Step Time": 6.720515040680766} {"Full-finetune/Learning Rate": 1.999868831662274e-05, "Full-finetune/Loss": 1.0162529945373535, "Full-finetune/Loss (Raw)": 1.0132231712341309, "Full-finetune/Step": 181, "Full-finetune/Step Time": 6.701189681887627} {"Full-finetune/Learning Rate": 1.9998585479965918e-05, "Full-finetune/Loss": 1.0170063972473145, "Full-finetune/Loss (Raw)": 1.0514296293258667, "Full-finetune/Step": 182, "Full-finetune/Step Time": 6.694804389029741} {"Full-finetune/Learning Rate": 1.999847876305328e-05, "Full-finetune/Loss": 1.0156779289245605, "Full-finetune/Loss (Raw)": 1.003076434135437, "Full-finetune/Step": 183, "Full-finetune/Step Time": 6.668055942282081} {"Full-finetune/Learning Rate": 1.9998368165926237e-05, "Full-finetune/Loss": 1.0159075260162354, "Full-finetune/Loss (Raw)": 1.1550238132476807, "Full-finetune/Step": 184, "Full-finetune/Step Time": 6.6550397500395775} {"Full-finetune/Learning Rate": 1.9998253688627706e-05, "Full-finetune/Loss": 1.015138864517212, "Full-finetune/Loss (Raw)": 0.9267560839653015, "Full-finetune/Step": 185, "Full-finetune/Step Time": 6.6527930330485106} {"Full-finetune/Learning Rate": 1.9998135331202124e-05, "Full-finetune/Loss": 1.0146095752716064, "Full-finetune/Loss (Raw)": 1.0111804008483887, "Full-finetune/Step": 186, "Full-finetune/Step Time": 6.633690459653735} {"Full-finetune/Learning Rate": 1.9998013093695413e-05, "Full-finetune/Loss": 1.0138765573501587, "Full-finetune/Loss (Raw)": 1.002772569656372, "Full-finetune/Step": 187, "Full-finetune/Step Time": 6.619842471554875} {"Full-finetune/Learning Rate": 1.9997886976155018e-05, "Full-finetune/Loss": 1.0140953063964844, "Full-finetune/Loss (Raw)": 1.1214419603347778, "Full-finetune/Step": 188, "Full-finetune/Step Time": 6.618378823623061} {"Full-finetune/Learning Rate": 1.9997756978629876e-05, "Full-finetune/Loss": 1.0129148960113525, "Full-finetune/Loss (Raw)": 1.000970482826233, "Full-finetune/Step": 189, "Full-finetune/Step Time": 6.628813698887825} {"Full-finetune/Learning Rate": 1.999762310117044e-05, "Full-finetune/Loss": 1.011829137802124, "Full-finetune/Loss (Raw)": 1.0643080472946167, "Full-finetune/Step": 190, "Full-finetune/Step Time": 6.635139396414161} {"Full-finetune/Learning Rate": 1.999748534382867e-05, "Full-finetune/Loss": 1.010723352432251, "Full-finetune/Loss (Raw)": 1.0759515762329102, "Full-finetune/Step": 191, "Full-finetune/Step Time": 6.640145804733038} {"Full-finetune/Learning Rate": 1.9997343706658023e-05, "Full-finetune/Loss": 1.010736107826233, "Full-finetune/Loss (Raw)": 1.0619539022445679, "Full-finetune/Step": 192, "Full-finetune/Step Time": 6.620580269023776} {"Full-finetune/Learning Rate": 1.9997198189713462e-05, "Full-finetune/Loss": 1.0097718238830566, "Full-finetune/Loss (Raw)": 0.9353206157684326, "Full-finetune/Step": 193, "Full-finetune/Step Time": 6.614434918388724} {"Full-finetune/Learning Rate": 1.9997048793051463e-05, "Full-finetune/Loss": 1.0100467205047607, "Full-finetune/Loss (Raw)": 1.046823263168335, "Full-finetune/Step": 194, "Full-finetune/Step Time": 6.61353263258934} {"Full-finetune/Learning Rate": 1.9996895516730005e-05, "Full-finetune/Loss": 1.0108104944229126, "Full-finetune/Loss (Raw)": 1.0066524744033813, "Full-finetune/Step": 195, "Full-finetune/Step Time": 6.620114933699369} {"Full-finetune/Learning Rate": 1.9996738360808566e-05, "Full-finetune/Loss": 1.0095770359039307, "Full-finetune/Loss (Raw)": 0.9668467044830322, "Full-finetune/Step": 196, "Full-finetune/Step Time": 6.6159367971122265} {"Full-finetune/Learning Rate": 1.999657732534814e-05, "Full-finetune/Loss": 1.0087454319000244, "Full-finetune/Loss (Raw)": 1.0500458478927612, "Full-finetune/Step": 197, "Full-finetune/Step Time": 6.62291000969708} {"Full-finetune/Learning Rate": 1.9996412410411224e-05, "Full-finetune/Loss": 1.007401466369629, "Full-finetune/Loss (Raw)": 1.019623041152954, "Full-finetune/Step": 198, "Full-finetune/Step Time": 6.6219203025102615} {"Full-finetune/Learning Rate": 1.9996243616061812e-05, "Full-finetune/Loss": 1.008023977279663, "Full-finetune/Loss (Raw)": 0.9984822869300842, "Full-finetune/Step": 199, "Full-finetune/Step Time": 6.626630339771509} {"Full-finetune/Learning Rate": 1.9996070942365416e-05, "Full-finetune/Loss": 1.007940411567688, "Full-finetune/Loss (Raw)": 1.0231207609176636, "Full-finetune/Step": 200, "Full-finetune/Step Time": 6.630290182307363} {"Full-finetune/Learning Rate": 1.9995894389389038e-05, "Full-finetune/Loss": 1.0094246864318848, "Full-finetune/Loss (Raw)": 1.1247501373291016, "Full-finetune/Step": 201, "Full-finetune/Step Time": 6.635226730257273} {"Full-finetune/Learning Rate": 1.9995713957201208e-05, "Full-finetune/Loss": 1.0108983516693115, "Full-finetune/Loss (Raw)": 1.1271659135818481, "Full-finetune/Step": 202, "Full-finetune/Step Time": 6.637440608814359} {"Full-finetune/Learning Rate": 1.9995529645871938e-05, "Full-finetune/Loss": 1.0127696990966797, "Full-finetune/Loss (Raw)": 1.0595440864562988, "Full-finetune/Step": 203, "Full-finetune/Step Time": 6.632611386477947} {"Full-finetune/Learning Rate": 1.999534145547276e-05, "Full-finetune/Loss": 1.0133228302001953, "Full-finetune/Loss (Raw)": 1.054126501083374, "Full-finetune/Step": 204, "Full-finetune/Step Time": 6.6264484990388155} {"Full-finetune/Learning Rate": 1.99951493860767e-05, "Full-finetune/Loss": 1.0069453716278076, "Full-finetune/Loss (Raw)": 0.31049278378486633, "Full-finetune/Step": 205, "Full-finetune/Step Time": 6.648833129554987} {"Full-finetune/Learning Rate": 1.9994953437758305e-05, "Full-finetune/Loss": 1.0053861141204834, "Full-finetune/Loss (Raw)": 1.0075019598007202, "Full-finetune/Step": 206, "Full-finetune/Step Time": 6.658460212871432} {"Full-finetune/Learning Rate": 1.999475361059362e-05, "Full-finetune/Loss": 1.00525963306427, "Full-finetune/Loss (Raw)": 1.164118766784668, "Full-finetune/Step": 207, "Full-finetune/Step Time": 6.681055173277855} {"Full-finetune/Learning Rate": 1.9994549904660187e-05, "Full-finetune/Loss": 1.0057069063186646, "Full-finetune/Loss (Raw)": 1.0286197662353516, "Full-finetune/Step": 208, "Full-finetune/Step Time": 6.666445374488831} {"Full-finetune/Learning Rate": 1.9994342320037065e-05, "Full-finetune/Loss": 1.0045912265777588, "Full-finetune/Loss (Raw)": 1.0065852403640747, "Full-finetune/Step": 209, "Full-finetune/Step Time": 6.6609472669661045} {"Full-finetune/Learning Rate": 1.9994130856804808e-05, "Full-finetune/Loss": 0.998447835445404, "Full-finetune/Loss (Raw)": 0.3103441894054413, "Full-finetune/Step": 210, "Full-finetune/Step Time": 6.684796145185828} {"Full-finetune/Learning Rate": 1.9993915515045485e-05, "Full-finetune/Loss": 0.9986621141433716, "Full-finetune/Loss (Raw)": 0.9830355048179626, "Full-finetune/Step": 211, "Full-finetune/Step Time": 6.677761234343052} {"Full-finetune/Learning Rate": 1.999369629484267e-05, "Full-finetune/Loss": 0.9976366758346558, "Full-finetune/Loss (Raw)": 1.0696485042572021, "Full-finetune/Step": 212, "Full-finetune/Step Time": 6.6752297561615705} {"Full-finetune/Learning Rate": 1.999347319628143e-05, "Full-finetune/Loss": 0.9987139701843262, "Full-finetune/Loss (Raw)": 1.1802406311035156, "Full-finetune/Step": 213, "Full-finetune/Step Time": 6.677765233442187} {"Full-finetune/Learning Rate": 1.9993246219448347e-05, "Full-finetune/Loss": 1.003701090812683, "Full-finetune/Loss (Raw)": 0.9755708575248718, "Full-finetune/Step": 214, "Full-finetune/Step Time": 6.677234189584851} {"Full-finetune/Learning Rate": 1.999301536443151e-05, "Full-finetune/Loss": 1.003014326095581, "Full-finetune/Loss (Raw)": 0.9468662142753601, "Full-finetune/Step": 215, "Full-finetune/Step Time": 6.676505740731955} {"Full-finetune/Learning Rate": 1.9992780631320508e-05, "Full-finetune/Loss": 1.0005838871002197, "Full-finetune/Loss (Raw)": 0.9198281168937683, "Full-finetune/Step": 216, "Full-finetune/Step Time": 6.67462857067585} {"Full-finetune/Learning Rate": 1.9992542020206432e-05, "Full-finetune/Loss": 1.0009397268295288, "Full-finetune/Loss (Raw)": 1.1110724210739136, "Full-finetune/Step": 217, "Full-finetune/Step Time": 6.672125084325671} {"Full-finetune/Learning Rate": 1.9992299531181892e-05, "Full-finetune/Loss": 1.0002868175506592, "Full-finetune/Loss (Raw)": 1.0575147867202759, "Full-finetune/Step": 218, "Full-finetune/Step Time": 6.661059312522411} {"Full-finetune/Learning Rate": 1.999205316434098e-05, "Full-finetune/Loss": 1.0006134510040283, "Full-finetune/Loss (Raw)": 1.1953879594802856, "Full-finetune/Step": 219, "Full-finetune/Step Time": 6.6493974309414625} {"Full-finetune/Learning Rate": 1.9991802919779318e-05, "Full-finetune/Loss": 0.9987640380859375, "Full-finetune/Loss (Raw)": 0.9626498222351074, "Full-finetune/Step": 220, "Full-finetune/Step Time": 6.645963456481695} {"Full-finetune/Learning Rate": 1.9991548797594017e-05, "Full-finetune/Loss": 1.0000097751617432, "Full-finetune/Loss (Raw)": 1.0894207954406738, "Full-finetune/Step": 221, "Full-finetune/Step Time": 6.6485504768788815} {"Full-finetune/Learning Rate": 1.9991290797883693e-05, "Full-finetune/Loss": 0.9984073042869568, "Full-finetune/Loss (Raw)": 0.9520640969276428, "Full-finetune/Step": 222, "Full-finetune/Step Time": 6.654704697430134} {"Full-finetune/Learning Rate": 1.9991028920748475e-05, "Full-finetune/Loss": 0.9975602030754089, "Full-finetune/Loss (Raw)": 0.9737041592597961, "Full-finetune/Step": 223, "Full-finetune/Step Time": 6.655788222327828} {"Full-finetune/Learning Rate": 1.9990763166289993e-05, "Full-finetune/Loss": 0.9918261766433716, "Full-finetune/Loss (Raw)": 0.3415534794330597, "Full-finetune/Step": 224, "Full-finetune/Step Time": 6.662541653960943} {"Full-finetune/Learning Rate": 1.9990493534611376e-05, "Full-finetune/Loss": 0.9919589757919312, "Full-finetune/Loss (Raw)": 1.0430883169174194, "Full-finetune/Step": 225, "Full-finetune/Step Time": 6.662616141140461} {"Full-finetune/Learning Rate": 1.9990220025817268e-05, "Full-finetune/Loss": 0.9924999475479126, "Full-finetune/Loss (Raw)": 1.183883786201477, "Full-finetune/Step": 226, "Full-finetune/Step Time": 6.659811487421393} {"Full-finetune/Learning Rate": 1.998994264001381e-05, "Full-finetune/Loss": 1.0001368522644043, "Full-finetune/Loss (Raw)": 1.1771225929260254, "Full-finetune/Step": 227, "Full-finetune/Step Time": 6.640182284638286} {"Full-finetune/Learning Rate": 1.9989661377308654e-05, "Full-finetune/Loss": 0.9995043277740479, "Full-finetune/Loss (Raw)": 1.127489686012268, "Full-finetune/Step": 228, "Full-finetune/Step Time": 6.634920476004481} {"Full-finetune/Learning Rate": 1.9989376237810944e-05, "Full-finetune/Loss": 0.9994055032730103, "Full-finetune/Loss (Raw)": 1.0333243608474731, "Full-finetune/Step": 229, "Full-finetune/Step Time": 6.628377988934517} {"Full-finetune/Learning Rate": 1.9989087221631344e-05, "Full-finetune/Loss": 0.9989721775054932, "Full-finetune/Loss (Raw)": 1.150782585144043, "Full-finetune/Step": 230, "Full-finetune/Step Time": 6.65118145942688} {"Full-finetune/Learning Rate": 1.9988794328882017e-05, "Full-finetune/Loss": 1.004667043685913, "Full-finetune/Loss (Raw)": 1.0146571397781372, "Full-finetune/Step": 231, "Full-finetune/Step Time": 6.642969051375985} {"Full-finetune/Learning Rate": 1.9988497559676622e-05, "Full-finetune/Loss": 1.0039594173431396, "Full-finetune/Loss (Raw)": 1.0562489032745361, "Full-finetune/Step": 232, "Full-finetune/Step Time": 6.645514642819762} {"Full-finetune/Learning Rate": 1.9988196914130332e-05, "Full-finetune/Loss": 0.9981529712677002, "Full-finetune/Loss (Raw)": 0.30498412251472473, "Full-finetune/Step": 233, "Full-finetune/Step Time": 6.667694544419646} {"Full-finetune/Learning Rate": 1.9987892392359827e-05, "Full-finetune/Loss": 0.9988669753074646, "Full-finetune/Loss (Raw)": 1.1513981819152832, "Full-finetune/Step": 234, "Full-finetune/Step Time": 6.6866518296301365} {"Full-finetune/Learning Rate": 1.998758399448328e-05, "Full-finetune/Loss": 0.9993671774864197, "Full-finetune/Loss (Raw)": 1.1898301839828491, "Full-finetune/Step": 235, "Full-finetune/Step Time": 6.72601062245667} {"Full-finetune/Learning Rate": 1.9987271720620376e-05, "Full-finetune/Loss": 0.9993091821670532, "Full-finetune/Loss (Raw)": 1.0047451257705688, "Full-finetune/Step": 236, "Full-finetune/Step Time": 6.726451847702265} {"Full-finetune/Learning Rate": 1.9986955570892302e-05, "Full-finetune/Loss": 0.9987431168556213, "Full-finetune/Loss (Raw)": 1.0647311210632324, "Full-finetune/Step": 237, "Full-finetune/Step Time": 6.759727979078889} {"Full-finetune/Learning Rate": 1.998663554542175e-05, "Full-finetune/Loss": 0.9985087513923645, "Full-finetune/Loss (Raw)": 1.009843111038208, "Full-finetune/Step": 238, "Full-finetune/Step Time": 6.753252871334553} {"Full-finetune/Learning Rate": 1.9986311644332913e-05, "Full-finetune/Loss": 0.9967096447944641, "Full-finetune/Loss (Raw)": 0.8793903589248657, "Full-finetune/Step": 239, "Full-finetune/Step Time": 6.737318364903331} {"Full-finetune/Learning Rate": 1.9985983867751497e-05, "Full-finetune/Loss": 0.9957898855209351, "Full-finetune/Loss (Raw)": 0.9572595357894897, "Full-finetune/Step": 240, "Full-finetune/Step Time": 6.7355131059885025} {"Full-finetune/Learning Rate": 1.99856522158047e-05, "Full-finetune/Loss": 0.9956234097480774, "Full-finetune/Loss (Raw)": 1.099368929862976, "Full-finetune/Step": 241, "Full-finetune/Step Time": 6.722710965201259} {"Full-finetune/Learning Rate": 1.998531668862123e-05, "Full-finetune/Loss": 1.0019779205322266, "Full-finetune/Loss (Raw)": 1.0477834939956665, "Full-finetune/Step": 242, "Full-finetune/Step Time": 6.688224205747247} {"Full-finetune/Learning Rate": 1.9984977286331302e-05, "Full-finetune/Loss": 1.0017725229263306, "Full-finetune/Loss (Raw)": 1.0550107955932617, "Full-finetune/Step": 243, "Full-finetune/Step Time": 6.698446325957775} {"Full-finetune/Learning Rate": 1.998463400906663e-05, "Full-finetune/Loss": 1.0016841888427734, "Full-finetune/Loss (Raw)": 0.9080930352210999, "Full-finetune/Step": 244, "Full-finetune/Step Time": 6.683624884113669} {"Full-finetune/Learning Rate": 1.998428685696043e-05, "Full-finetune/Loss": 1.0023009777069092, "Full-finetune/Loss (Raw)": 1.1872105598449707, "Full-finetune/Step": 245, "Full-finetune/Step Time": 6.665829136967659} {"Full-finetune/Learning Rate": 1.998393583014743e-05, "Full-finetune/Loss": 1.0023894309997559, "Full-finetune/Loss (Raw)": 1.1500017642974854, "Full-finetune/Step": 246, "Full-finetune/Step Time": 6.6751536671072245} {"Full-finetune/Learning Rate": 1.9983580928763852e-05, "Full-finetune/Loss": 1.0025155544281006, "Full-finetune/Loss (Raw)": 1.0541146993637085, "Full-finetune/Step": 247, "Full-finetune/Step Time": 6.675916833803058} {"Full-finetune/Learning Rate": 1.998322215294743e-05, "Full-finetune/Loss": 1.0017569065093994, "Full-finetune/Loss (Raw)": 0.9872586727142334, "Full-finetune/Step": 248, "Full-finetune/Step Time": 6.679457280784845} {"Full-finetune/Learning Rate": 1.9982859502837395e-05, "Full-finetune/Loss": 1.001699447631836, "Full-finetune/Loss (Raw)": 1.0139079093933105, "Full-finetune/Step": 249, "Full-finetune/Step Time": 6.660097802057862} {"Full-finetune/Learning Rate": 1.998249297857449e-05, "Full-finetune/Loss": 1.0024727582931519, "Full-finetune/Loss (Raw)": 1.0649737119674683, "Full-finetune/Step": 250, "Full-finetune/Step Time": 6.660042580217123} {"Full-finetune/Learning Rate": 1.9982122580300947e-05, "Full-finetune/Loss": 1.0033320188522339, "Full-finetune/Loss (Raw)": 1.1215107440948486, "Full-finetune/Step": 251, "Full-finetune/Step Time": 6.673996267840266} {"Full-finetune/Learning Rate": 1.9981748308160517e-05, "Full-finetune/Loss": 1.0024728775024414, "Full-finetune/Loss (Raw)": 1.0146005153656006, "Full-finetune/Step": 252, "Full-finetune/Step Time": 6.672732666134834} {"Full-finetune/Learning Rate": 1.9981370162298444e-05, "Full-finetune/Loss": 1.002947211265564, "Full-finetune/Loss (Raw)": 1.0690008401870728, "Full-finetune/Step": 253, "Full-finetune/Step Time": 6.667998049408197} {"Full-finetune/Learning Rate": 1.9980988142861486e-05, "Full-finetune/Loss": 1.0018856525421143, "Full-finetune/Loss (Raw)": 0.9619656205177307, "Full-finetune/Step": 254, "Full-finetune/Step Time": 6.6488719172775745} {"Full-finetune/Learning Rate": 1.998060224999789e-05, "Full-finetune/Loss": 0.9965946674346924, "Full-finetune/Loss (Raw)": 0.310712069272995, "Full-finetune/Step": 255, "Full-finetune/Step Time": 6.666898883879185} {"Full-finetune/Learning Rate": 1.9980212483857412e-05, "Full-finetune/Loss": 0.9952138662338257, "Full-finetune/Loss (Raw)": 0.9466479420661926, "Full-finetune/Step": 256, "Full-finetune/Step Time": 6.667195463553071} {"Full-finetune/Learning Rate": 1.9979818844591318e-05, "Full-finetune/Loss": 0.9952986240386963, "Full-finetune/Loss (Raw)": 1.1577644348144531, "Full-finetune/Step": 257, "Full-finetune/Step Time": 6.666392398998141} {"Full-finetune/Learning Rate": 1.9979421332352372e-05, "Full-finetune/Loss": 0.9950552582740784, "Full-finetune/Loss (Raw)": 1.1007678508758545, "Full-finetune/Step": 258, "Full-finetune/Step Time": 6.665809862315655} {"Full-finetune/Learning Rate": 1.9979019947294836e-05, "Full-finetune/Loss": 0.994897723197937, "Full-finetune/Loss (Raw)": 1.073588490486145, "Full-finetune/Step": 259, "Full-finetune/Step Time": 6.667481122538447} {"Full-finetune/Learning Rate": 1.9978614689574486e-05, "Full-finetune/Loss": 0.9947230219841003, "Full-finetune/Loss (Raw)": 1.0829237699508667, "Full-finetune/Step": 260, "Full-finetune/Step Time": 6.686379015445709} {"Full-finetune/Learning Rate": 1.9978205559348586e-05, "Full-finetune/Loss": 0.9943703413009644, "Full-finetune/Loss (Raw)": 0.8478307127952576, "Full-finetune/Step": 261, "Full-finetune/Step Time": 6.66922140866518} {"Full-finetune/Learning Rate": 1.997779255677592e-05, "Full-finetune/Loss": 0.9911924004554749, "Full-finetune/Loss (Raw)": 0.8329997062683105, "Full-finetune/Step": 262, "Full-finetune/Step Time": 6.679513867944479} {"Full-finetune/Learning Rate": 1.997737568201676e-05, "Full-finetune/Loss": 0.9913412928581238, "Full-finetune/Loss (Raw)": 1.0165212154388428, "Full-finetune/Step": 263, "Full-finetune/Step Time": 6.677817748859525} {"Full-finetune/Learning Rate": 1.9976954935232892e-05, "Full-finetune/Loss": 0.9904103875160217, "Full-finetune/Loss (Raw)": 0.9572818875312805, "Full-finetune/Step": 264, "Full-finetune/Step Time": 6.691670445725322} {"Full-finetune/Learning Rate": 1.99765303165876e-05, "Full-finetune/Loss": 0.990333616733551, "Full-finetune/Loss (Raw)": 0.9658747911453247, "Full-finetune/Step": 265, "Full-finetune/Step Time": 6.687855836004019} {"Full-finetune/Learning Rate": 1.997610182624566e-05, "Full-finetune/Loss": 0.991024374961853, "Full-finetune/Loss (Raw)": 1.2034093141555786, "Full-finetune/Step": 266, "Full-finetune/Step Time": 6.69834528118372} {"Full-finetune/Learning Rate": 1.9975669464373377e-05, "Full-finetune/Loss": 0.9908663034439087, "Full-finetune/Loss (Raw)": 0.8924224376678467, "Full-finetune/Step": 267, "Full-finetune/Step Time": 6.695327993482351} {"Full-finetune/Learning Rate": 1.9975233231138525e-05, "Full-finetune/Loss": 0.9893953800201416, "Full-finetune/Loss (Raw)": 1.090859293937683, "Full-finetune/Step": 268, "Full-finetune/Step Time": 6.69849899969995} {"Full-finetune/Learning Rate": 1.997479312671041e-05, "Full-finetune/Loss": 0.9893960952758789, "Full-finetune/Loss (Raw)": 1.0289119482040405, "Full-finetune/Step": 269, "Full-finetune/Step Time": 6.704436281695962} {"Full-finetune/Learning Rate": 1.9974349151259824e-05, "Full-finetune/Loss": 0.9894992113113403, "Full-finetune/Loss (Raw)": 1.034900426864624, "Full-finetune/Step": 270, "Full-finetune/Step Time": 6.668909991160035} {"Full-finetune/Learning Rate": 1.9973901304959066e-05, "Full-finetune/Loss": 0.9899471998214722, "Full-finetune/Loss (Raw)": 1.0183212757110596, "Full-finetune/Step": 271, "Full-finetune/Step Time": 6.659265233203769} {"Full-finetune/Learning Rate": 1.9973449587981935e-05, "Full-finetune/Loss": 0.9956377148628235, "Full-finetune/Loss (Raw)": 1.0885353088378906, "Full-finetune/Step": 272, "Full-finetune/Step Time": 6.640229359269142} {"Full-finetune/Learning Rate": 1.9972994000503734e-05, "Full-finetune/Loss": 1.0012288093566895, "Full-finetune/Loss (Raw)": 1.0473694801330566, "Full-finetune/Step": 273, "Full-finetune/Step Time": 6.618218149989843} {"Full-finetune/Learning Rate": 1.997253454270127e-05, "Full-finetune/Loss": 1.002220869064331, "Full-finetune/Loss (Raw)": 1.0861268043518066, "Full-finetune/Step": 274, "Full-finetune/Step Time": 6.62435688264668} {"Full-finetune/Learning Rate": 1.9972071214752843e-05, "Full-finetune/Loss": 1.0031819343566895, "Full-finetune/Loss (Raw)": 1.0107344388961792, "Full-finetune/Step": 275, "Full-finetune/Step Time": 6.620882961899042} {"Full-finetune/Learning Rate": 1.9971604016838264e-05, "Full-finetune/Loss": 1.0010327100753784, "Full-finetune/Loss (Raw)": 0.7921382784843445, "Full-finetune/Step": 276, "Full-finetune/Step Time": 6.653237810358405} {"Full-finetune/Learning Rate": 1.997113294913885e-05, "Full-finetune/Loss": 1.000203013420105, "Full-finetune/Loss (Raw)": 1.0021779537200928, "Full-finetune/Step": 277, "Full-finetune/Step Time": 6.6522652339190245} {"Full-finetune/Learning Rate": 1.9970658011837404e-05, "Full-finetune/Loss": 0.9994254112243652, "Full-finetune/Loss (Raw)": 1.0234721899032593, "Full-finetune/Step": 278, "Full-finetune/Step Time": 6.6445177718997} {"Full-finetune/Learning Rate": 1.997017920511825e-05, "Full-finetune/Loss": 1.0002084970474243, "Full-finetune/Loss (Raw)": 1.1895270347595215, "Full-finetune/Step": 279, "Full-finetune/Step Time": 6.6500291135162115} {"Full-finetune/Learning Rate": 1.9969696529167197e-05, "Full-finetune/Loss": 0.9996591806411743, "Full-finetune/Loss (Raw)": 0.9707567691802979, "Full-finetune/Step": 280, "Full-finetune/Step Time": 6.649602364748716} {"Full-finetune/Learning Rate": 1.996920998417156e-05, "Full-finetune/Loss": 0.998898983001709, "Full-finetune/Loss (Raw)": 1.052657127380371, "Full-finetune/Step": 281, "Full-finetune/Step Time": 6.6443180199712515} {"Full-finetune/Learning Rate": 1.996871957032016e-05, "Full-finetune/Loss": 0.9979428052902222, "Full-finetune/Loss (Raw)": 1.004415512084961, "Full-finetune/Step": 282, "Full-finetune/Step Time": 6.643098682165146} {"Full-finetune/Learning Rate": 1.996822528780332e-05, "Full-finetune/Loss": 0.9973607659339905, "Full-finetune/Loss (Raw)": 1.1248334646224976, "Full-finetune/Step": 283, "Full-finetune/Step Time": 6.640354223549366} {"Full-finetune/Learning Rate": 1.996772713681286e-05, "Full-finetune/Loss": 1.0032544136047363, "Full-finetune/Loss (Raw)": 1.123048186302185, "Full-finetune/Step": 284, "Full-finetune/Step Time": 6.618691314011812} {"Full-finetune/Learning Rate": 1.9967225117542097e-05, "Full-finetune/Loss": 1.0025404691696167, "Full-finetune/Loss (Raw)": 0.9787458777427673, "Full-finetune/Step": 285, "Full-finetune/Step Time": 6.646245809271932} {"Full-finetune/Learning Rate": 1.9966719230185864e-05, "Full-finetune/Loss": 1.0020155906677246, "Full-finetune/Loss (Raw)": 1.038057804107666, "Full-finetune/Step": 286, "Full-finetune/Step Time": 6.660590525716543} {"Full-finetune/Learning Rate": 1.9966209474940477e-05, "Full-finetune/Loss": 1.001859188079834, "Full-finetune/Loss (Raw)": 1.0542572736740112, "Full-finetune/Step": 287, "Full-finetune/Step Time": 6.6682945843786} {"Full-finetune/Learning Rate": 1.996569585200377e-05, "Full-finetune/Loss": 1.000907063484192, "Full-finetune/Loss (Raw)": 0.8868600130081177, "Full-finetune/Step": 288, "Full-finetune/Step Time": 6.675380120053887} {"Full-finetune/Learning Rate": 1.9965178361575068e-05, "Full-finetune/Loss": 1.0015286207199097, "Full-finetune/Loss (Raw)": 1.1009222269058228, "Full-finetune/Step": 289, "Full-finetune/Step Time": 6.67955019697547} {"Full-finetune/Learning Rate": 1.9964657003855197e-05, "Full-finetune/Loss": 0.9990672469139099, "Full-finetune/Loss (Raw)": 0.9391735792160034, "Full-finetune/Step": 290, "Full-finetune/Step Time": 6.690821370109916} {"Full-finetune/Learning Rate": 1.9964131779046484e-05, "Full-finetune/Loss": 0.9992409944534302, "Full-finetune/Loss (Raw)": 1.0969136953353882, "Full-finetune/Step": 291, "Full-finetune/Step Time": 6.694844391196966} {"Full-finetune/Learning Rate": 1.996360268735276e-05, "Full-finetune/Loss": 1.0002182722091675, "Full-finetune/Loss (Raw)": 1.0805174112319946, "Full-finetune/Step": 292, "Full-finetune/Step Time": 6.683501608669758} {"Full-finetune/Learning Rate": 1.9963069728979357e-05, "Full-finetune/Loss": 1.0007526874542236, "Full-finetune/Loss (Raw)": 1.1124650239944458, "Full-finetune/Step": 293, "Full-finetune/Step Time": 6.67924920283258} {"Full-finetune/Learning Rate": 1.9962532904133107e-05, "Full-finetune/Loss": 0.9986391067504883, "Full-finetune/Loss (Raw)": 0.7178556323051453, "Full-finetune/Step": 294, "Full-finetune/Step Time": 6.684977792203426} {"Full-finetune/Learning Rate": 1.996199221302234e-05, "Full-finetune/Loss": 0.9981013536453247, "Full-finetune/Loss (Raw)": 1.070997714996338, "Full-finetune/Step": 295, "Full-finetune/Step Time": 6.69131494499743} {"Full-finetune/Learning Rate": 1.9961447655856883e-05, "Full-finetune/Loss": 0.998320460319519, "Full-finetune/Loss (Raw)": 1.003668189048767, "Full-finetune/Step": 296, "Full-finetune/Step Time": 6.695368397980928} {"Full-finetune/Learning Rate": 1.9960899232848074e-05, "Full-finetune/Loss": 0.9994006156921387, "Full-finetune/Loss (Raw)": 1.1038750410079956, "Full-finetune/Step": 297, "Full-finetune/Step Time": 6.688296057283878} {"Full-finetune/Learning Rate": 1.9960346944208743e-05, "Full-finetune/Loss": 1.0034103393554688, "Full-finetune/Loss (Raw)": 0.8650240302085876, "Full-finetune/Step": 298, "Full-finetune/Step Time": 6.684439918026328} {"Full-finetune/Learning Rate": 1.995979079015322e-05, "Full-finetune/Loss": 0.9980194568634033, "Full-finetune/Loss (Raw)": 0.30904996395111084, "Full-finetune/Step": 299, "Full-finetune/Step Time": 6.6955436281859875} {"Full-finetune/Learning Rate": 1.995923077089734e-05, "Full-finetune/Loss": 0.9931076765060425, "Full-finetune/Loss (Raw)": 0.35699132084846497, "Full-finetune/Step": 300, "Full-finetune/Step Time": 6.702679386362433} {"Full-finetune/Learning Rate": 1.9958666886658436e-05, "Full-finetune/Loss": 0.9868544340133667, "Full-finetune/Loss (Raw)": 0.39011454582214355, "Full-finetune/Step": 301, "Full-finetune/Step Time": 6.722332226112485} {"Full-finetune/Learning Rate": 1.995809913765534e-05, "Full-finetune/Loss": 0.9865648746490479, "Full-finetune/Loss (Raw)": 0.8509942293167114, "Full-finetune/Step": 302, "Full-finetune/Step Time": 6.720217831432819} {"Full-finetune/Learning Rate": 1.9957527524108386e-05, "Full-finetune/Loss": 0.9796984195709229, "Full-finetune/Loss (Raw)": 0.316741019487381, "Full-finetune/Step": 303, "Full-finetune/Step Time": 6.739495085552335} {"Full-finetune/Learning Rate": 1.99569520462394e-05, "Full-finetune/Loss": 0.9854307174682617, "Full-finetune/Loss (Raw)": 1.0828783512115479, "Full-finetune/Step": 304, "Full-finetune/Step Time": 6.722192132845521} {"Full-finetune/Learning Rate": 1.995637270427172e-05, "Full-finetune/Loss": 0.9858934879302979, "Full-finetune/Loss (Raw)": 1.0334173440933228, "Full-finetune/Step": 305, "Full-finetune/Step Time": 6.714480882510543} {"Full-finetune/Learning Rate": 1.9955789498430178e-05, "Full-finetune/Loss": 0.9837585091590881, "Full-finetune/Loss (Raw)": 0.917026937007904, "Full-finetune/Step": 306, "Full-finetune/Step Time": 6.716049583628774} {"Full-finetune/Learning Rate": 1.99552024289411e-05, "Full-finetune/Loss": 0.9856686592102051, "Full-finetune/Loss (Raw)": 1.1424585580825806, "Full-finetune/Step": 307, "Full-finetune/Step Time": 6.717806443572044} {"Full-finetune/Learning Rate": 1.995461149603232e-05, "Full-finetune/Loss": 0.9852457046508789, "Full-finetune/Loss (Raw)": 1.0145251750946045, "Full-finetune/Step": 308, "Full-finetune/Step Time": 6.718717932701111} {"Full-finetune/Learning Rate": 1.9954016699933163e-05, "Full-finetune/Loss": 0.9860614538192749, "Full-finetune/Loss (Raw)": 1.1176469326019287, "Full-finetune/Step": 309, "Full-finetune/Step Time": 6.7328887693583965} {"Full-finetune/Learning Rate": 1.995341804087446e-05, "Full-finetune/Loss": 0.9855118989944458, "Full-finetune/Loss (Raw)": 0.9810852408409119, "Full-finetune/Step": 310, "Full-finetune/Step Time": 6.733201313763857} {"Full-finetune/Learning Rate": 1.9952815519088544e-05, "Full-finetune/Loss": 0.9855063557624817, "Full-finetune/Loss (Raw)": 1.002353310585022, "Full-finetune/Step": 311, "Full-finetune/Step Time": 6.73977580294013} {"Full-finetune/Learning Rate": 1.9952209134809234e-05, "Full-finetune/Loss": 0.9838961362838745, "Full-finetune/Loss (Raw)": 0.9489185214042664, "Full-finetune/Step": 312, "Full-finetune/Step Time": 6.739001547917724} {"Full-finetune/Learning Rate": 1.995159888827186e-05, "Full-finetune/Loss": 0.98514723777771, "Full-finetune/Loss (Raw)": 1.0868924856185913, "Full-finetune/Step": 313, "Full-finetune/Step Time": 6.747237669304013} {"Full-finetune/Learning Rate": 1.9950984779713244e-05, "Full-finetune/Loss": 0.9862253665924072, "Full-finetune/Loss (Raw)": 1.1491895914077759, "Full-finetune/Step": 314, "Full-finetune/Step Time": 6.73039667122066} {"Full-finetune/Learning Rate": 1.9950366809371713e-05, "Full-finetune/Loss": 0.985815703868866, "Full-finetune/Loss (Raw)": 0.950334370136261, "Full-finetune/Step": 315, "Full-finetune/Step Time": 6.7361533381044865} {"Full-finetune/Learning Rate": 1.9949744977487087e-05, "Full-finetune/Loss": 0.9799855351448059, "Full-finetune/Loss (Raw)": 0.375185489654541, "Full-finetune/Step": 316, "Full-finetune/Step Time": 6.7556432373821735} {"Full-finetune/Learning Rate": 1.994911928430069e-05, "Full-finetune/Loss": 0.9795327186584473, "Full-finetune/Loss (Raw)": 0.9430071711540222, "Full-finetune/Step": 317, "Full-finetune/Step Time": 6.746722871437669} {"Full-finetune/Learning Rate": 1.994848973005534e-05, "Full-finetune/Loss": 0.9792920351028442, "Full-finetune/Loss (Raw)": 1.0335018634796143, "Full-finetune/Step": 318, "Full-finetune/Step Time": 6.739320756867528} {"Full-finetune/Learning Rate": 1.994785631499535e-05, "Full-finetune/Loss": 0.9782342314720154, "Full-finetune/Loss (Raw)": 0.9405488967895508, "Full-finetune/Step": 319, "Full-finetune/Step Time": 6.746613513678312} {"Full-finetune/Learning Rate": 1.994721903936654e-05, "Full-finetune/Loss": 0.9770101308822632, "Full-finetune/Loss (Raw)": 0.9052658677101135, "Full-finetune/Step": 320, "Full-finetune/Step Time": 6.743084628134966} {"Full-finetune/Learning Rate": 1.9946577903416224e-05, "Full-finetune/Loss": 0.9722164869308472, "Full-finetune/Loss (Raw)": 0.32173097133636475, "Full-finetune/Step": 321, "Full-finetune/Step Time": 6.768894895911217} {"Full-finetune/Learning Rate": 1.994593290739322e-05, "Full-finetune/Loss": 0.9714419841766357, "Full-finetune/Loss (Raw)": 0.9476927518844604, "Full-finetune/Step": 322, "Full-finetune/Step Time": 6.769489225000143} {"Full-finetune/Learning Rate": 1.9945284051547823e-05, "Full-finetune/Loss": 0.9716284275054932, "Full-finetune/Loss (Raw)": 1.0305132865905762, "Full-finetune/Step": 323, "Full-finetune/Step Time": 6.7644677478820086} {"Full-finetune/Learning Rate": 1.9944631336131856e-05, "Full-finetune/Loss": 0.9725157022476196, "Full-finetune/Loss (Raw)": 1.080417513847351, "Full-finetune/Step": 324, "Full-finetune/Step Time": 6.764162318781018} {"Full-finetune/Learning Rate": 1.994397476139862e-05, "Full-finetune/Loss": 0.9722548127174377, "Full-finetune/Loss (Raw)": 1.0166661739349365, "Full-finetune/Step": 325, "Full-finetune/Step Time": 6.760146506130695} {"Full-finetune/Learning Rate": 1.994331432760292e-05, "Full-finetune/Loss": 0.9733830690383911, "Full-finetune/Loss (Raw)": 1.164031744003296, "Full-finetune/Step": 326, "Full-finetune/Step Time": 6.761234674602747} {"Full-finetune/Learning Rate": 1.9942650035001053e-05, "Full-finetune/Loss": 0.9733346700668335, "Full-finetune/Loss (Raw)": 0.9922836422920227, "Full-finetune/Step": 327, "Full-finetune/Step Time": 6.754985170438886} {"Full-finetune/Learning Rate": 1.994198188385082e-05, "Full-finetune/Loss": 0.9734207391738892, "Full-finetune/Loss (Raw)": 1.0341360569000244, "Full-finetune/Step": 328, "Full-finetune/Step Time": 6.76317491941154} {"Full-finetune/Learning Rate": 1.9941309874411525e-05, "Full-finetune/Loss": 0.9716593027114868, "Full-finetune/Loss (Raw)": 0.8992949724197388, "Full-finetune/Step": 329, "Full-finetune/Step Time": 6.778144869953394} {"Full-finetune/Learning Rate": 1.9940634006943952e-05, "Full-finetune/Loss": 0.9696035385131836, "Full-finetune/Loss (Raw)": 0.864022970199585, "Full-finetune/Step": 330, "Full-finetune/Step Time": 6.783362926915288} {"Full-finetune/Learning Rate": 1.9939954281710395e-05, "Full-finetune/Loss": 0.9693759083747864, "Full-finetune/Loss (Raw)": 1.0304077863693237, "Full-finetune/Step": 331, "Full-finetune/Step Time": 6.787240218371153} {"Full-finetune/Learning Rate": 1.9939270698974643e-05, "Full-finetune/Loss": 0.9673815965652466, "Full-finetune/Loss (Raw)": 0.7988589406013489, "Full-finetune/Step": 332, "Full-finetune/Step Time": 6.803405361250043} {"Full-finetune/Learning Rate": 1.9938583259001983e-05, "Full-finetune/Loss": 0.9727815985679626, "Full-finetune/Loss (Raw)": 1.0016897916793823, "Full-finetune/Step": 333, "Full-finetune/Step Time": 6.789121540263295} {"Full-finetune/Learning Rate": 1.993789196205919e-05, "Full-finetune/Loss": 0.9724398851394653, "Full-finetune/Loss (Raw)": 0.9637572765350342, "Full-finetune/Step": 334, "Full-finetune/Step Time": 6.78246746212244} {"Full-finetune/Learning Rate": 1.9937196808414552e-05, "Full-finetune/Loss": 0.9709623456001282, "Full-finetune/Loss (Raw)": 0.9749985337257385, "Full-finetune/Step": 335, "Full-finetune/Step Time": 6.76982156932354} {"Full-finetune/Learning Rate": 1.993649779833784e-05, "Full-finetune/Loss": 0.9712246656417847, "Full-finetune/Loss (Raw)": 1.062198281288147, "Full-finetune/Step": 336, "Full-finetune/Step Time": 6.7724576238542795} {"Full-finetune/Learning Rate": 1.993579493210032e-05, "Full-finetune/Loss": 0.9725908041000366, "Full-finetune/Loss (Raw)": 1.181445837020874, "Full-finetune/Step": 337, "Full-finetune/Step Time": 6.767139233648777} {"Full-finetune/Learning Rate": 1.9935088209974774e-05, "Full-finetune/Loss": 0.9775350093841553, "Full-finetune/Loss (Raw)": 0.9432070255279541, "Full-finetune/Step": 338, "Full-finetune/Step Time": 6.751550646498799} {"Full-finetune/Learning Rate": 1.9934377632235455e-05, "Full-finetune/Loss": 0.9770570397377014, "Full-finetune/Loss (Raw)": 0.9218509793281555, "Full-finetune/Step": 339, "Full-finetune/Step Time": 6.753648662939668} {"Full-finetune/Learning Rate": 1.9933663199158135e-05, "Full-finetune/Loss": 0.9756458401679993, "Full-finetune/Loss (Raw)": 0.8890144228935242, "Full-finetune/Step": 340, "Full-finetune/Step Time": 6.751441737636924} {"Full-finetune/Learning Rate": 1.993294491102006e-05, "Full-finetune/Loss": 0.9742013216018677, "Full-finetune/Loss (Raw)": 0.9953504800796509, "Full-finetune/Step": 341, "Full-finetune/Step Time": 6.7526800613850355} {"Full-finetune/Learning Rate": 1.9932222768099992e-05, "Full-finetune/Loss": 0.9746805429458618, "Full-finetune/Loss (Raw)": 1.0369056463241577, "Full-finetune/Step": 342, "Full-finetune/Step Time": 6.733711460605264} {"Full-finetune/Learning Rate": 1.9931496770678178e-05, "Full-finetune/Loss": 0.9750314950942993, "Full-finetune/Loss (Raw)": 0.9917992949485779, "Full-finetune/Step": 343, "Full-finetune/Step Time": 6.742192110046744} {"Full-finetune/Learning Rate": 1.993076691903636e-05, "Full-finetune/Loss": 0.9760118722915649, "Full-finetune/Loss (Raw)": 1.0453065633773804, "Full-finetune/Step": 344, "Full-finetune/Step Time": 6.727173218503594} {"Full-finetune/Learning Rate": 1.993003321345779e-05, "Full-finetune/Loss": 0.9758082628250122, "Full-finetune/Loss (Raw)": 1.0850142240524292, "Full-finetune/Step": 345, "Full-finetune/Step Time": 6.7295973766595125} {"Full-finetune/Learning Rate": 1.9929295654227193e-05, "Full-finetune/Loss": 0.9759368300437927, "Full-finetune/Loss (Raw)": 1.073970079421997, "Full-finetune/Step": 346, "Full-finetune/Step Time": 6.7357934676110744} {"Full-finetune/Learning Rate": 1.9928554241630804e-05, "Full-finetune/Loss": 0.9753250479698181, "Full-finetune/Loss (Raw)": 1.117080807685852, "Full-finetune/Step": 347, "Full-finetune/Step Time": 6.749806568026543} {"Full-finetune/Learning Rate": 1.9927808975956354e-05, "Full-finetune/Loss": 0.9758628010749817, "Full-finetune/Loss (Raw)": 1.0314841270446777, "Full-finetune/Step": 348, "Full-finetune/Step Time": 6.768736615777016} {"Full-finetune/Learning Rate": 1.9927059857493068e-05, "Full-finetune/Loss": 0.975969135761261, "Full-finetune/Loss (Raw)": 1.1030302047729492, "Full-finetune/Step": 349, "Full-finetune/Step Time": 6.776687050238252} {"Full-finetune/Learning Rate": 1.9926306886531658e-05, "Full-finetune/Loss": 0.9757005572319031, "Full-finetune/Loss (Raw)": 0.9176791906356812, "Full-finetune/Step": 350, "Full-finetune/Step Time": 6.790885653346777} {"Full-finetune/Learning Rate": 1.9925550063364337e-05, "Full-finetune/Loss": 0.9756007790565491, "Full-finetune/Loss (Raw)": 0.9609397053718567, "Full-finetune/Step": 351, "Full-finetune/Step Time": 6.813703637570143} {"Full-finetune/Learning Rate": 1.992478938828482e-05, "Full-finetune/Loss": 0.9805017709732056, "Full-finetune/Loss (Raw)": 0.9688799381256104, "Full-finetune/Step": 352, "Full-finetune/Step Time": 6.804827922955155} {"Full-finetune/Learning Rate": 1.9924024861588307e-05, "Full-finetune/Loss": 0.9796600937843323, "Full-finetune/Loss (Raw)": 0.9353480339050293, "Full-finetune/Step": 353, "Full-finetune/Step Time": 6.803297709673643} {"Full-finetune/Learning Rate": 1.9923256483571495e-05, "Full-finetune/Loss": 0.9772205352783203, "Full-finetune/Loss (Raw)": 0.8716247081756592, "Full-finetune/Step": 354, "Full-finetune/Step Time": 6.810477390885353} {"Full-finetune/Learning Rate": 1.9922484254532578e-05, "Full-finetune/Loss": 0.9760921001434326, "Full-finetune/Loss (Raw)": 1.032683253288269, "Full-finetune/Step": 355, "Full-finetune/Step Time": 6.819715840741992} {"Full-finetune/Learning Rate": 1.9921708174771237e-05, "Full-finetune/Loss": 0.9740802645683289, "Full-finetune/Loss (Raw)": 0.8699723482131958, "Full-finetune/Step": 356, "Full-finetune/Step Time": 6.826636761426926} {"Full-finetune/Learning Rate": 1.9920928244588662e-05, "Full-finetune/Loss": 0.9727760553359985, "Full-finetune/Loss (Raw)": 0.866386353969574, "Full-finetune/Step": 357, "Full-finetune/Step Time": 6.840113420039415} {"Full-finetune/Learning Rate": 1.9920144464287527e-05, "Full-finetune/Loss": 0.9666122198104858, "Full-finetune/Loss (Raw)": 0.3618101477622986, "Full-finetune/Step": 358, "Full-finetune/Step Time": 6.8372822888195515} {"Full-finetune/Learning Rate": 1.9919356834171996e-05, "Full-finetune/Loss": 0.9651146531105042, "Full-finetune/Loss (Raw)": 0.8229726552963257, "Full-finetune/Step": 359, "Full-finetune/Step Time": 6.8279728796333075} {"Full-finetune/Learning Rate": 1.9918565354547738e-05, "Full-finetune/Loss": 0.9643071889877319, "Full-finetune/Loss (Raw)": 0.9528841376304626, "Full-finetune/Step": 360, "Full-finetune/Step Time": 6.8285251557827} {"Full-finetune/Learning Rate": 1.991777002572191e-05, "Full-finetune/Loss": 0.9685494899749756, "Full-finetune/Loss (Raw)": 0.8479987978935242, "Full-finetune/Step": 361, "Full-finetune/Step Time": 6.809316297993064} {"Full-finetune/Learning Rate": 1.9916970848003166e-05, "Full-finetune/Loss": 0.9669127464294434, "Full-finetune/Loss (Raw)": 0.9419023394584656, "Full-finetune/Step": 362, "Full-finetune/Step Time": 6.801498424261808} {"Full-finetune/Learning Rate": 1.9916167821701645e-05, "Full-finetune/Loss": 0.9657807946205139, "Full-finetune/Loss (Raw)": 1.0449429750442505, "Full-finetune/Step": 363, "Full-finetune/Step Time": 6.761375682428479} {"Full-finetune/Learning Rate": 1.991536094712899e-05, "Full-finetune/Loss": 0.9660916924476624, "Full-finetune/Loss (Raw)": 1.0445362329483032, "Full-finetune/Step": 364, "Full-finetune/Step Time": 6.760043101385236} {"Full-finetune/Learning Rate": 1.991455022459833e-05, "Full-finetune/Loss": 0.9662183523178101, "Full-finetune/Loss (Raw)": 1.080944538116455, "Full-finetune/Step": 365, "Full-finetune/Step Time": 6.72997285798192} {"Full-finetune/Learning Rate": 1.9913735654424297e-05, "Full-finetune/Loss": 0.9652704000473022, "Full-finetune/Loss (Raw)": 0.8884998559951782, "Full-finetune/Step": 366, "Full-finetune/Step Time": 6.735317142680287} {"Full-finetune/Learning Rate": 1.9912917236923003e-05, "Full-finetune/Loss": 0.9660395383834839, "Full-finetune/Loss (Raw)": 0.9778491258621216, "Full-finetune/Step": 367, "Full-finetune/Step Time": 6.740860532969236} {"Full-finetune/Learning Rate": 1.9912094972412067e-05, "Full-finetune/Loss": 0.9662197828292847, "Full-finetune/Loss (Raw)": 0.9803214073181152, "Full-finetune/Step": 368, "Full-finetune/Step Time": 6.741165539249778} {"Full-finetune/Learning Rate": 1.9911268861210584e-05, "Full-finetune/Loss": 0.9650020599365234, "Full-finetune/Loss (Raw)": 0.9434981942176819, "Full-finetune/Step": 369, "Full-finetune/Step Time": 6.741736611351371} {"Full-finetune/Learning Rate": 1.991043890363916e-05, "Full-finetune/Loss": 0.965427041053772, "Full-finetune/Loss (Raw)": 1.1021894216537476, "Full-finetune/Step": 370, "Full-finetune/Step Time": 6.74093497171998} {"Full-finetune/Learning Rate": 1.9909605100019883e-05, "Full-finetune/Loss": 0.9659465551376343, "Full-finetune/Loss (Raw)": 1.1215136051177979, "Full-finetune/Step": 371, "Full-finetune/Step Time": 6.731689635664225} {"Full-finetune/Learning Rate": 1.9908767450676336e-05, "Full-finetune/Loss": 0.9667278528213501, "Full-finetune/Loss (Raw)": 1.0080955028533936, "Full-finetune/Step": 372, "Full-finetune/Step Time": 6.740511115640402} {"Full-finetune/Learning Rate": 1.9907925955933593e-05, "Full-finetune/Loss": 0.960849404335022, "Full-finetune/Loss (Raw)": 0.4347710609436035, "Full-finetune/Step": 373, "Full-finetune/Step Time": 6.761194717139006} {"Full-finetune/Learning Rate": 1.9907080616118223e-05, "Full-finetune/Loss": 0.9546267986297607, "Full-finetune/Loss (Raw)": 0.35349905490875244, "Full-finetune/Step": 374, "Full-finetune/Step Time": 6.771211255341768} {"Full-finetune/Learning Rate": 1.9906231431558283e-05, "Full-finetune/Loss": 0.954660177230835, "Full-finetune/Loss (Raw)": 1.058386206626892, "Full-finetune/Step": 375, "Full-finetune/Step Time": 6.768415624275804} {"Full-finetune/Learning Rate": 1.990537840258333e-05, "Full-finetune/Loss": 0.9536601305007935, "Full-finetune/Loss (Raw)": 0.8592510223388672, "Full-finetune/Step": 376, "Full-finetune/Step Time": 6.768436688929796} {"Full-finetune/Learning Rate": 1.9904521529524402e-05, "Full-finetune/Loss": 0.9531524777412415, "Full-finetune/Loss (Raw)": 0.9489357471466064, "Full-finetune/Step": 377, "Full-finetune/Step Time": 6.770076045766473} {"Full-finetune/Learning Rate": 1.990366081271404e-05, "Full-finetune/Loss": 0.9539734125137329, "Full-finetune/Loss (Raw)": 1.170046329498291, "Full-finetune/Step": 378, "Full-finetune/Step Time": 6.7695980258286} {"Full-finetune/Learning Rate": 1.990279625248627e-05, "Full-finetune/Loss": 0.9540013074874878, "Full-finetune/Loss (Raw)": 1.125087022781372, "Full-finetune/Step": 379, "Full-finetune/Step Time": 6.757298123091459} {"Full-finetune/Learning Rate": 1.990192784917661e-05, "Full-finetune/Loss": 0.9538376927375793, "Full-finetune/Loss (Raw)": 0.9936546087265015, "Full-finetune/Step": 380, "Full-finetune/Step Time": 6.755304144695401} {"Full-finetune/Learning Rate": 1.9901055603122067e-05, "Full-finetune/Loss": 0.9535458087921143, "Full-finetune/Loss (Raw)": 1.0316393375396729, "Full-finetune/Step": 381, "Full-finetune/Step Time": 6.764117047190666} {"Full-finetune/Learning Rate": 1.9900179514661148e-05, "Full-finetune/Loss": 0.9530300498008728, "Full-finetune/Loss (Raw)": 0.8959493637084961, "Full-finetune/Step": 382, "Full-finetune/Step Time": 6.802916349843144} {"Full-finetune/Learning Rate": 1.9899299584133848e-05, "Full-finetune/Loss": 0.9574453830718994, "Full-finetune/Loss (Raw)": 0.875883936882019, "Full-finetune/Step": 383, "Full-finetune/Step Time": 6.818765740841627} {"Full-finetune/Learning Rate": 1.9898415811881643e-05, "Full-finetune/Loss": 0.9537956118583679, "Full-finetune/Loss (Raw)": 0.4794636070728302, "Full-finetune/Step": 384, "Full-finetune/Step Time": 6.834419397637248} {"Full-finetune/Learning Rate": 1.989752819824751e-05, "Full-finetune/Loss": 0.9521933794021606, "Full-finetune/Loss (Raw)": 0.9526877999305725, "Full-finetune/Step": 385, "Full-finetune/Step Time": 6.832224605605006} {"Full-finetune/Learning Rate": 1.989663674357592e-05, "Full-finetune/Loss": 0.9509553909301758, "Full-finetune/Loss (Raw)": 0.9423004984855652, "Full-finetune/Step": 386, "Full-finetune/Step Time": 6.832552097737789} {"Full-finetune/Learning Rate": 1.9895741448212822e-05, "Full-finetune/Loss": 0.949065089225769, "Full-finetune/Loss (Raw)": 0.8316363096237183, "Full-finetune/Step": 387, "Full-finetune/Step Time": 6.834887184202671} {"Full-finetune/Learning Rate": 1.9894842312505673e-05, "Full-finetune/Loss": 0.947533369064331, "Full-finetune/Loss (Raw)": 0.8868602514266968, "Full-finetune/Step": 388, "Full-finetune/Step Time": 6.813779043033719} {"Full-finetune/Learning Rate": 1.9893939336803396e-05, "Full-finetune/Loss": 0.9478805065155029, "Full-finetune/Loss (Raw)": 0.8922685980796814, "Full-finetune/Step": 389, "Full-finetune/Step Time": 6.813575869426131} {"Full-finetune/Learning Rate": 1.989303252145643e-05, "Full-finetune/Loss": 0.9475687146186829, "Full-finetune/Loss (Raw)": 0.7930838465690613, "Full-finetune/Step": 390, "Full-finetune/Step Time": 6.80147809535265} {"Full-finetune/Learning Rate": 1.9892121866816682e-05, "Full-finetune/Loss": 0.947129487991333, "Full-finetune/Loss (Raw)": 0.9603118300437927, "Full-finetune/Step": 391, "Full-finetune/Step Time": 6.797041727229953} {"Full-finetune/Learning Rate": 1.989120737323757e-05, "Full-finetune/Loss": 0.9467912316322327, "Full-finetune/Loss (Raw)": 0.9139785766601562, "Full-finetune/Step": 392, "Full-finetune/Step Time": 6.794422330334783} {"Full-finetune/Learning Rate": 1.9890289041073984e-05, "Full-finetune/Loss": 0.9454168677330017, "Full-finetune/Loss (Raw)": 0.7899583578109741, "Full-finetune/Step": 393, "Full-finetune/Step Time": 6.807048475369811} {"Full-finetune/Learning Rate": 1.988936687068231e-05, "Full-finetune/Loss": 0.9421267509460449, "Full-finetune/Loss (Raw)": 0.7822694182395935, "Full-finetune/Step": 394, "Full-finetune/Step Time": 6.823004473000765} {"Full-finetune/Learning Rate": 1.9888440862420433e-05, "Full-finetune/Loss": 0.9443185329437256, "Full-finetune/Loss (Raw)": 1.172977328300476, "Full-finetune/Step": 395, "Full-finetune/Step Time": 6.833263518288732} {"Full-finetune/Learning Rate": 1.988751101664771e-05, "Full-finetune/Loss": 0.9441335201263428, "Full-finetune/Loss (Raw)": 1.0671693086624146, "Full-finetune/Step": 396, "Full-finetune/Step Time": 6.833776732906699} {"Full-finetune/Learning Rate": 1.9886577333724995e-05, "Full-finetune/Loss": 0.942063570022583, "Full-finetune/Loss (Raw)": 0.7639634609222412, "Full-finetune/Step": 397, "Full-finetune/Step Time": 6.849282868206501} {"Full-finetune/Learning Rate": 1.9885639814014642e-05, "Full-finetune/Loss": 0.942791223526001, "Full-finetune/Loss (Raw)": 1.128036379814148, "Full-finetune/Step": 398, "Full-finetune/Step Time": 6.843757381662726} {"Full-finetune/Learning Rate": 1.9884698457880476e-05, "Full-finetune/Loss": 0.9415065050125122, "Full-finetune/Loss (Raw)": 0.8538822531700134, "Full-finetune/Step": 399, "Full-finetune/Step Time": 6.831856530159712} {"Full-finetune/Learning Rate": 1.988375326568782e-05, "Full-finetune/Loss": 0.9400741457939148, "Full-finetune/Loss (Raw)": 0.9051837921142578, "Full-finetune/Step": 400, "Full-finetune/Step Time": 6.829872600734234} {"Full-finetune/Learning Rate": 1.9882804237803487e-05, "Full-finetune/Loss": 0.9400559663772583, "Full-finetune/Loss (Raw)": 1.0450526475906372, "Full-finetune/Step": 401, "Full-finetune/Step Time": 6.833027608692646} {"Full-finetune/Learning Rate": 1.9881851374595774e-05, "Full-finetune/Loss": 0.9389433264732361, "Full-finetune/Loss (Raw)": 0.9437037706375122, "Full-finetune/Step": 402, "Full-finetune/Step Time": 6.844234850257635} {"Full-finetune/Learning Rate": 1.988089467643447e-05, "Full-finetune/Loss": 0.938308835029602, "Full-finetune/Loss (Raw)": 0.9295189380645752, "Full-finetune/Step": 403, "Full-finetune/Step Time": 6.854528371244669} {"Full-finetune/Learning Rate": 1.9879934143690848e-05, "Full-finetune/Loss": 0.9402301907539368, "Full-finetune/Loss (Raw)": 1.0380738973617554, "Full-finetune/Step": 404, "Full-finetune/Step Time": 6.822238923981786} {"Full-finetune/Learning Rate": 1.9878969776737675e-05, "Full-finetune/Loss": 0.9379261136054993, "Full-finetune/Loss (Raw)": 0.7072559595108032, "Full-finetune/Step": 405, "Full-finetune/Step Time": 6.844324978068471} {"Full-finetune/Learning Rate": 1.9878001575949205e-05, "Full-finetune/Loss": 0.933634877204895, "Full-finetune/Loss (Raw)": 0.4741896688938141, "Full-finetune/Step": 406, "Full-finetune/Step Time": 6.863943435251713} {"Full-finetune/Learning Rate": 1.9877029541701174e-05, "Full-finetune/Loss": 0.9275821447372437, "Full-finetune/Loss (Raw)": 0.41478922963142395, "Full-finetune/Step": 407, "Full-finetune/Step Time": 6.871242867782712} {"Full-finetune/Learning Rate": 1.9876053674370806e-05, "Full-finetune/Loss": 0.9271909594535828, "Full-finetune/Loss (Raw)": 0.9206768274307251, "Full-finetune/Step": 408, "Full-finetune/Step Time": 6.870517810806632} {"Full-finetune/Learning Rate": 1.9875073974336827e-05, "Full-finetune/Loss": 0.9278941750526428, "Full-finetune/Loss (Raw)": 1.1426712274551392, "Full-finetune/Step": 409, "Full-finetune/Step Time": 6.861414194107056} {"Full-finetune/Learning Rate": 1.9874090441979433e-05, "Full-finetune/Loss": 0.9293383359909058, "Full-finetune/Loss (Raw)": 1.1892637014389038, "Full-finetune/Step": 410, "Full-finetune/Step Time": 6.859198780730367} {"Full-finetune/Learning Rate": 1.987310307768031e-05, "Full-finetune/Loss": 0.9280077219009399, "Full-finetune/Loss (Raw)": 0.9545207023620605, "Full-finetune/Step": 411, "Full-finetune/Step Time": 6.861653491854668} {"Full-finetune/Learning Rate": 1.987211188182264e-05, "Full-finetune/Loss": 0.922072172164917, "Full-finetune/Loss (Raw)": 0.3632970452308655, "Full-finetune/Step": 412, "Full-finetune/Step Time": 6.881961910054088} {"Full-finetune/Learning Rate": 1.9871116854791085e-05, "Full-finetune/Loss": 0.9224429130554199, "Full-finetune/Loss (Raw)": 1.026198148727417, "Full-finetune/Step": 413, "Full-finetune/Step Time": 6.8492469768971205} {"Full-finetune/Learning Rate": 1.9870117996971797e-05, "Full-finetune/Loss": 0.9212765693664551, "Full-finetune/Loss (Raw)": 0.888767421245575, "Full-finetune/Step": 414, "Full-finetune/Step Time": 6.834034755825996} {"Full-finetune/Learning Rate": 1.986911530875241e-05, "Full-finetune/Loss": 0.9208014011383057, "Full-finetune/Loss (Raw)": 0.9934403300285339, "Full-finetune/Step": 415, "Full-finetune/Step Time": 6.830289613455534} {"Full-finetune/Learning Rate": 1.9868108790522052e-05, "Full-finetune/Loss": 0.9223156571388245, "Full-finetune/Loss (Raw)": 1.080674648284912, "Full-finetune/Step": 416, "Full-finetune/Step Time": 6.816066723316908} {"Full-finetune/Learning Rate": 1.986709844267133e-05, "Full-finetune/Loss": 0.9213889837265015, "Full-finetune/Loss (Raw)": 0.9823114275932312, "Full-finetune/Step": 417, "Full-finetune/Step Time": 6.810662599280477} {"Full-finetune/Learning Rate": 1.9866084265592343e-05, "Full-finetune/Loss": 0.922142505645752, "Full-finetune/Loss (Raw)": 1.0356205701828003, "Full-finetune/Step": 418, "Full-finetune/Step Time": 6.7973498068749905} {"Full-finetune/Learning Rate": 1.986506625967867e-05, "Full-finetune/Loss": 0.9205290079116821, "Full-finetune/Loss (Raw)": 0.8903844356536865, "Full-finetune/Step": 419, "Full-finetune/Step Time": 6.804023949429393} {"Full-finetune/Learning Rate": 1.9864044425325382e-05, "Full-finetune/Loss": 0.9148885607719421, "Full-finetune/Loss (Raw)": 0.3585420846939087, "Full-finetune/Step": 420, "Full-finetune/Step Time": 6.820506365969777} {"Full-finetune/Learning Rate": 1.986301876292903e-05, "Full-finetune/Loss": 0.9138627648353577, "Full-finetune/Loss (Raw)": 0.9811651110649109, "Full-finetune/Step": 421, "Full-finetune/Step Time": 6.819948852062225} {"Full-finetune/Learning Rate": 1.986198927288766e-05, "Full-finetune/Loss": 0.9156758785247803, "Full-finetune/Loss (Raw)": 0.9499325156211853, "Full-finetune/Step": 422, "Full-finetune/Step Time": 6.825425677001476} {"Full-finetune/Learning Rate": 1.9860955955600784e-05, "Full-finetune/Loss": 0.9156078100204468, "Full-finetune/Loss (Raw)": 1.0622951984405518, "Full-finetune/Step": 423, "Full-finetune/Step Time": 6.818714765831828} {"Full-finetune/Learning Rate": 1.9859918811469424e-05, "Full-finetune/Loss": 0.9156004786491394, "Full-finetune/Loss (Raw)": 1.0027161836624146, "Full-finetune/Step": 424, "Full-finetune/Step Time": 6.817671639844775} {"Full-finetune/Learning Rate": 1.9858877840896076e-05, "Full-finetune/Loss": 0.9122538566589355, "Full-finetune/Loss (Raw)": 0.6755152344703674, "Full-finetune/Step": 425, "Full-finetune/Step Time": 6.8515023328363895} {"Full-finetune/Learning Rate": 1.9857833044284714e-05, "Full-finetune/Loss": 0.9128073453903198, "Full-finetune/Loss (Raw)": 0.9358680844306946, "Full-finetune/Step": 426, "Full-finetune/Step Time": 6.830632586032152} {"Full-finetune/Learning Rate": 1.9856784422040802e-05, "Full-finetune/Loss": 0.9176323413848877, "Full-finetune/Loss (Raw)": 0.9266515374183655, "Full-finetune/Step": 427, "Full-finetune/Step Time": 6.818890776485205} {"Full-finetune/Learning Rate": 1.98557319745713e-05, "Full-finetune/Loss": 0.9231113791465759, "Full-finetune/Loss (Raw)": 1.0583038330078125, "Full-finetune/Step": 428, "Full-finetune/Step Time": 6.799381414428353} {"Full-finetune/Learning Rate": 1.985467570228463e-05, "Full-finetune/Loss": 0.9281359314918518, "Full-finetune/Loss (Raw)": 1.0332608222961426, "Full-finetune/Step": 429, "Full-finetune/Step Time": 6.783903781324625} {"Full-finetune/Learning Rate": 1.985361560559072e-05, "Full-finetune/Loss": 0.9281302690505981, "Full-finetune/Loss (Raw)": 0.8502670526504517, "Full-finetune/Step": 430, "Full-finetune/Step Time": 6.777762804180384} {"Full-finetune/Learning Rate": 1.9852551684900964e-05, "Full-finetune/Loss": 0.9332046508789062, "Full-finetune/Loss (Raw)": 0.9662670493125916, "Full-finetune/Step": 431, "Full-finetune/Step Time": 6.767272813245654} {"Full-finetune/Learning Rate": 1.9851483940628256e-05, "Full-finetune/Loss": 0.9316370487213135, "Full-finetune/Loss (Raw)": 0.8822160363197327, "Full-finetune/Step": 432, "Full-finetune/Step Time": 6.773818677291274} {"Full-finetune/Learning Rate": 1.9850412373186967e-05, "Full-finetune/Loss": 0.9302371740341187, "Full-finetune/Loss (Raw)": 0.8542373776435852, "Full-finetune/Step": 433, "Full-finetune/Step Time": 6.776614286005497} {"Full-finetune/Learning Rate": 1.9849336982992948e-05, "Full-finetune/Loss": 0.9302408695220947, "Full-finetune/Loss (Raw)": 0.9174985289573669, "Full-finetune/Step": 434, "Full-finetune/Step Time": 6.776703780516982} {"Full-finetune/Learning Rate": 1.984825777046354e-05, "Full-finetune/Loss": 0.9274241924285889, "Full-finetune/Loss (Raw)": 0.7819206118583679, "Full-finetune/Step": 435, "Full-finetune/Step Time": 6.767500221729279} {"Full-finetune/Learning Rate": 1.9847174736017557e-05, "Full-finetune/Loss": 0.9262905120849609, "Full-finetune/Loss (Raw)": 0.8694213628768921, "Full-finetune/Step": 436, "Full-finetune/Step Time": 6.764448158442974} {"Full-finetune/Learning Rate": 1.9846087880075314e-05, "Full-finetune/Loss": 0.9249585866928101, "Full-finetune/Loss (Raw)": 0.9471577405929565, "Full-finetune/Step": 437, "Full-finetune/Step Time": 6.755550231784582} {"Full-finetune/Learning Rate": 1.984499720305859e-05, "Full-finetune/Loss": 0.9236435890197754, "Full-finetune/Loss (Raw)": 0.8127610087394714, "Full-finetune/Step": 438, "Full-finetune/Step Time": 6.753563264384866} {"Full-finetune/Learning Rate": 1.984390270539066e-05, "Full-finetune/Loss": 0.9228079319000244, "Full-finetune/Loss (Raw)": 0.8953991532325745, "Full-finetune/Step": 439, "Full-finetune/Step Time": 6.759744018316269} {"Full-finetune/Learning Rate": 1.9842804387496276e-05, "Full-finetune/Loss": 0.9229922294616699, "Full-finetune/Loss (Raw)": 0.9725048542022705, "Full-finetune/Step": 440, "Full-finetune/Step Time": 6.760561620816588} {"Full-finetune/Learning Rate": 1.9841702249801677e-05, "Full-finetune/Loss": 0.9222227334976196, "Full-finetune/Loss (Raw)": 0.9883917570114136, "Full-finetune/Step": 441, "Full-finetune/Step Time": 6.7576618529856205} {"Full-finetune/Learning Rate": 1.9840596292734573e-05, "Full-finetune/Loss": 0.9165771007537842, "Full-finetune/Loss (Raw)": 0.4265539050102234, "Full-finetune/Step": 442, "Full-finetune/Step Time": 6.77933463640511} {"Full-finetune/Learning Rate": 1.9839486516724173e-05, "Full-finetune/Loss": 0.9169849157333374, "Full-finetune/Loss (Raw)": 1.0025346279144287, "Full-finetune/Step": 443, "Full-finetune/Step Time": 6.784551996737719} {"Full-finetune/Learning Rate": 1.983837292220115e-05, "Full-finetune/Loss": 0.9223381280899048, "Full-finetune/Loss (Raw)": 1.0603899955749512, "Full-finetune/Step": 444, "Full-finetune/Step Time": 6.766097743064165} {"Full-finetune/Learning Rate": 1.983725550959768e-05, "Full-finetune/Loss": 0.9223035573959351, "Full-finetune/Loss (Raw)": 0.9385830760002136, "Full-finetune/Step": 445, "Full-finetune/Step Time": 6.761347085237503} {"Full-finetune/Learning Rate": 1.98361342793474e-05, "Full-finetune/Loss": 0.9221857786178589, "Full-finetune/Loss (Raw)": 1.018425464630127, "Full-finetune/Step": 446, "Full-finetune/Step Time": 6.764598270878196} {"Full-finetune/Learning Rate": 1.9835009231885444e-05, "Full-finetune/Loss": 0.9224035739898682, "Full-finetune/Loss (Raw)": 0.9684274792671204, "Full-finetune/Step": 447, "Full-finetune/Step Time": 6.755031354725361} {"Full-finetune/Learning Rate": 1.9833880367648412e-05, "Full-finetune/Loss": 0.922524094581604, "Full-finetune/Loss (Raw)": 0.9207044243812561, "Full-finetune/Step": 448, "Full-finetune/Step Time": 6.75484542734921} {"Full-finetune/Learning Rate": 1.9832747687074403e-05, "Full-finetune/Loss": 0.9285800457000732, "Full-finetune/Loss (Raw)": 1.096885323524475, "Full-finetune/Step": 449, "Full-finetune/Step Time": 6.7318852301687} {"Full-finetune/Learning Rate": 1.9831611190602984e-05, "Full-finetune/Loss": 0.9280520677566528, "Full-finetune/Loss (Raw)": 0.8801136612892151, "Full-finetune/Step": 450, "Full-finetune/Step Time": 6.731470685452223} {"Full-finetune/Learning Rate": 1.983047087867521e-05, "Full-finetune/Loss": 0.9270988702774048, "Full-finetune/Loss (Raw)": 0.908503532409668, "Full-finetune/Step": 451, "Full-finetune/Step Time": 6.735380539670587} {"Full-finetune/Learning Rate": 1.9829326751733607e-05, "Full-finetune/Loss": 0.9258438944816589, "Full-finetune/Loss (Raw)": 0.9197771549224854, "Full-finetune/Step": 452, "Full-finetune/Step Time": 6.728901691734791} {"Full-finetune/Learning Rate": 1.9828178810222197e-05, "Full-finetune/Loss": 0.9265363216400146, "Full-finetune/Loss (Raw)": 1.1052958965301514, "Full-finetune/Step": 453, "Full-finetune/Step Time": 6.73505000770092} {"Full-finetune/Learning Rate": 1.9827027054586468e-05, "Full-finetune/Loss": 0.9245777130126953, "Full-finetune/Loss (Raw)": 0.9133280515670776, "Full-finetune/Step": 454, "Full-finetune/Step Time": 6.749954413622618} {"Full-finetune/Learning Rate": 1.9825871485273395e-05, "Full-finetune/Loss": 0.9246969223022461, "Full-finetune/Loss (Raw)": 1.007542610168457, "Full-finetune/Step": 455, "Full-finetune/Step Time": 6.749009562656283} {"Full-finetune/Learning Rate": 1.9824712102731435e-05, "Full-finetune/Loss": 0.9191671013832092, "Full-finetune/Loss (Raw)": 0.326324462890625, "Full-finetune/Step": 456, "Full-finetune/Step Time": 6.755038870498538} {"Full-finetune/Learning Rate": 1.982354890741052e-05, "Full-finetune/Loss": 0.9185703992843628, "Full-finetune/Loss (Raw)": 0.8229184746742249, "Full-finetune/Step": 457, "Full-finetune/Step Time": 6.736603826284409} {"Full-finetune/Learning Rate": 1.982238189976206e-05, "Full-finetune/Loss": 0.9204541444778442, "Full-finetune/Loss (Raw)": 1.1051336526870728, "Full-finetune/Step": 458, "Full-finetune/Step Time": 6.7333365343511105} {"Full-finetune/Learning Rate": 1.9821211080238953e-05, "Full-finetune/Loss": 0.9194255471229553, "Full-finetune/Loss (Raw)": 0.8987531661987305, "Full-finetune/Step": 459, "Full-finetune/Step Time": 6.735584827139974} {"Full-finetune/Learning Rate": 1.9820036449295564e-05, "Full-finetune/Loss": 0.9190959334373474, "Full-finetune/Loss (Raw)": 0.7566658854484558, "Full-finetune/Step": 460, "Full-finetune/Step Time": 6.73475512675941} {"Full-finetune/Learning Rate": 1.9818858007387753e-05, "Full-finetune/Loss": 0.9182552099227905, "Full-finetune/Loss (Raw)": 0.8940783143043518, "Full-finetune/Step": 461, "Full-finetune/Step Time": 6.7433804757893085} {"Full-finetune/Learning Rate": 1.9817675754972846e-05, "Full-finetune/Loss": 0.917888879776001, "Full-finetune/Loss (Raw)": 0.9168663024902344, "Full-finetune/Step": 462, "Full-finetune/Step Time": 6.743018366396427} {"Full-finetune/Learning Rate": 1.9816489692509654e-05, "Full-finetune/Loss": 0.9189726114273071, "Full-finetune/Loss (Raw)": 1.113715410232544, "Full-finetune/Step": 463, "Full-finetune/Step Time": 6.747586939483881} {"Full-finetune/Learning Rate": 1.9815299820458458e-05, "Full-finetune/Loss": 0.9128326773643494, "Full-finetune/Loss (Raw)": 0.2762943208217621, "Full-finetune/Step": 464, "Full-finetune/Step Time": 6.764756757766008} {"Full-finetune/Learning Rate": 1.9814106139281033e-05, "Full-finetune/Loss": 0.9112406373023987, "Full-finetune/Loss (Raw)": 0.9776617884635925, "Full-finetune/Step": 465, "Full-finetune/Step Time": 6.772254958748817} {"Full-finetune/Learning Rate": 1.9812908649440618e-05, "Full-finetune/Loss": 0.9099953174591064, "Full-finetune/Loss (Raw)": 0.7838071584701538, "Full-finetune/Step": 466, "Full-finetune/Step Time": 6.776372781023383} {"Full-finetune/Learning Rate": 1.981170735140194e-05, "Full-finetune/Loss": 0.9103745222091675, "Full-finetune/Loss (Raw)": 0.9703860282897949, "Full-finetune/Step": 467, "Full-finetune/Step Time": 6.776174748316407} {"Full-finetune/Learning Rate": 1.9810502245631194e-05, "Full-finetune/Loss": 0.9093478322029114, "Full-finetune/Loss (Raw)": 0.7575958967208862, "Full-finetune/Step": 468, "Full-finetune/Step Time": 6.7877803687006235} {"Full-finetune/Learning Rate": 1.980929333259606e-05, "Full-finetune/Loss": 0.9042583703994751, "Full-finetune/Loss (Raw)": 0.3439035415649414, "Full-finetune/Step": 469, "Full-finetune/Step Time": 6.801436267793179} {"Full-finetune/Learning Rate": 1.9808080612765694e-05, "Full-finetune/Loss": 0.9032268524169922, "Full-finetune/Loss (Raw)": 0.9048680067062378, "Full-finetune/Step": 470, "Full-finetune/Step Time": 6.801516143605113} {"Full-finetune/Learning Rate": 1.980686408661073e-05, "Full-finetune/Loss": 0.902594804763794, "Full-finetune/Loss (Raw)": 0.9109011292457581, "Full-finetune/Step": 471, "Full-finetune/Step Time": 6.805770663544536} {"Full-finetune/Learning Rate": 1.9805643754603275e-05, "Full-finetune/Loss": 0.9027161598205566, "Full-finetune/Loss (Raw)": 1.0608311891555786, "Full-finetune/Step": 472, "Full-finetune/Step Time": 6.807291127741337} {"Full-finetune/Learning Rate": 1.9804419617216922e-05, "Full-finetune/Loss": 0.9007571935653687, "Full-finetune/Loss (Raw)": 0.8342745900154114, "Full-finetune/Step": 473, "Full-finetune/Step Time": 6.804924512282014} {"Full-finetune/Learning Rate": 1.9803191674926727e-05, "Full-finetune/Loss": 0.9000002145767212, "Full-finetune/Loss (Raw)": 0.9770727753639221, "Full-finetune/Step": 474, "Full-finetune/Step Time": 6.801197053864598} {"Full-finetune/Learning Rate": 1.9801959928209236e-05, "Full-finetune/Loss": 0.8987421989440918, "Full-finetune/Loss (Raw)": 0.9560592174530029, "Full-finetune/Step": 475, "Full-finetune/Step Time": 6.789334746077657} {"Full-finetune/Learning Rate": 1.9800724377542463e-05, "Full-finetune/Loss": 0.8980752229690552, "Full-finetune/Loss (Raw)": 0.9461047053337097, "Full-finetune/Step": 476, "Full-finetune/Step Time": 6.774629244580865} {"Full-finetune/Learning Rate": 1.9799485023405904e-05, "Full-finetune/Loss": 0.8965784311294556, "Full-finetune/Loss (Raw)": 0.91144859790802, "Full-finetune/Step": 477, "Full-finetune/Step Time": 6.780022291466594} {"Full-finetune/Learning Rate": 1.9798241866280523e-05, "Full-finetune/Loss": 0.8962462544441223, "Full-finetune/Loss (Raw)": 0.8751582503318787, "Full-finetune/Step": 478, "Full-finetune/Step Time": 6.757074078544974} {"Full-finetune/Learning Rate": 1.979699490664877e-05, "Full-finetune/Loss": 0.8961275219917297, "Full-finetune/Loss (Raw)": 0.9457411170005798, "Full-finetune/Step": 479, "Full-finetune/Step Time": 6.732107708230615} {"Full-finetune/Learning Rate": 1.9795744144994562e-05, "Full-finetune/Loss": 0.8964284658432007, "Full-finetune/Loss (Raw)": 1.0074025392532349, "Full-finetune/Step": 480, "Full-finetune/Step Time": 6.724769465625286} {"Full-finetune/Learning Rate": 1.97944895818033e-05, "Full-finetune/Loss": 0.8964800834655762, "Full-finetune/Loss (Raw)": 0.941957414150238, "Full-finetune/Step": 481, "Full-finetune/Step Time": 6.728770148009062} {"Full-finetune/Learning Rate": 1.979323121756185e-05, "Full-finetune/Loss": 0.8972073793411255, "Full-finetune/Loss (Raw)": 0.9647189378738403, "Full-finetune/Step": 482, "Full-finetune/Step Time": 6.73735960200429} {"Full-finetune/Learning Rate": 1.9791969052758563e-05, "Full-finetune/Loss": 0.8964189887046814, "Full-finetune/Loss (Raw)": 0.9317675828933716, "Full-finetune/Step": 483, "Full-finetune/Step Time": 6.748490000143647} {"Full-finetune/Learning Rate": 1.9790703087883258e-05, "Full-finetune/Loss": 0.896016001701355, "Full-finetune/Loss (Raw)": 0.8183877468109131, "Full-finetune/Step": 484, "Full-finetune/Step Time": 6.752502603456378} {"Full-finetune/Learning Rate": 1.9789433323427233e-05, "Full-finetune/Loss": 0.894493818283081, "Full-finetune/Loss (Raw)": 0.6715545058250427, "Full-finetune/Step": 485, "Full-finetune/Step Time": 6.756224058568478} {"Full-finetune/Learning Rate": 1.9788159759883258e-05, "Full-finetune/Loss": 0.8984394669532776, "Full-finetune/Loss (Raw)": 0.8668437004089355, "Full-finetune/Step": 486, "Full-finetune/Step Time": 6.750580197200179} {"Full-finetune/Learning Rate": 1.9786882397745573e-05, "Full-finetune/Loss": 0.8993988037109375, "Full-finetune/Loss (Raw)": 0.9457663893699646, "Full-finetune/Step": 487, "Full-finetune/Step Time": 6.749863179400563} {"Full-finetune/Learning Rate": 1.9785601237509907e-05, "Full-finetune/Loss": 0.8996611833572388, "Full-finetune/Loss (Raw)": 0.9864639043807983, "Full-finetune/Step": 488, "Full-finetune/Step Time": 6.746501436457038} {"Full-finetune/Learning Rate": 1.978431627967345e-05, "Full-finetune/Loss": 0.8994255661964417, "Full-finetune/Loss (Raw)": 0.8178490400314331, "Full-finetune/Step": 489, "Full-finetune/Step Time": 6.751204153522849} {"Full-finetune/Learning Rate": 1.9783027524734865e-05, "Full-finetune/Loss": 0.8983098268508911, "Full-finetune/Loss (Raw)": 0.799089252948761, "Full-finetune/Step": 490, "Full-finetune/Step Time": 6.757466584444046} {"Full-finetune/Learning Rate": 1.9781734973194294e-05, "Full-finetune/Loss": 0.8943162560462952, "Full-finetune/Loss (Raw)": 0.5337634682655334, "Full-finetune/Step": 491, "Full-finetune/Step Time": 6.785541420802474} {"Full-finetune/Learning Rate": 1.9780438625553352e-05, "Full-finetune/Loss": 0.8928204774856567, "Full-finetune/Loss (Raw)": 0.8530715703964233, "Full-finetune/Step": 492, "Full-finetune/Step Time": 6.79113132879138} {"Full-finetune/Learning Rate": 1.9779138482315128e-05, "Full-finetune/Loss": 0.8918083906173706, "Full-finetune/Loss (Raw)": 0.9514026641845703, "Full-finetune/Step": 493, "Full-finetune/Step Time": 6.792975448071957} {"Full-finetune/Learning Rate": 1.977783454398418e-05, "Full-finetune/Loss": 0.8917232751846313, "Full-finetune/Loss (Raw)": 0.8776055574417114, "Full-finetune/Step": 494, "Full-finetune/Step Time": 6.803497681394219} {"Full-finetune/Learning Rate": 1.9776526811066543e-05, "Full-finetune/Loss": 0.8913081288337708, "Full-finetune/Loss (Raw)": 0.9247116446495056, "Full-finetune/Step": 495, "Full-finetune/Step Time": 6.803448487073183} {"Full-finetune/Learning Rate": 1.977521528406972e-05, "Full-finetune/Loss": 0.8910720348358154, "Full-finetune/Loss (Raw)": 0.9500960111618042, "Full-finetune/Step": 496, "Full-finetune/Step Time": 6.816502066329122} {"Full-finetune/Learning Rate": 1.9773899963502693e-05, "Full-finetune/Loss": 0.8905866146087646, "Full-finetune/Loss (Raw)": 0.8813765048980713, "Full-finetune/Step": 497, "Full-finetune/Step Time": 6.818866902962327} {"Full-finetune/Learning Rate": 1.9772580849875905e-05, "Full-finetune/Loss": 0.8896497488021851, "Full-finetune/Loss (Raw)": 0.9822635054588318, "Full-finetune/Step": 498, "Full-finetune/Step Time": 6.816743534058332} {"Full-finetune/Learning Rate": 1.9771257943701284e-05, "Full-finetune/Loss": 0.8875026106834412, "Full-finetune/Loss (Raw)": 0.8466761708259583, "Full-finetune/Step": 499, "Full-finetune/Step Time": 6.818089893087745} {"Full-finetune/Learning Rate": 1.9769931245492225e-05, "Full-finetune/Loss": 0.8866829872131348, "Full-finetune/Loss (Raw)": 0.9031886458396912, "Full-finetune/Step": 500, "Full-finetune/Step Time": 6.822269771248102} {"Full-finetune/Learning Rate": 1.976860075576359e-05, "Full-finetune/Loss": 0.8887683153152466, "Full-finetune/Loss (Raw)": 0.7016966938972473, "Full-finetune/Step": 501, "Full-finetune/Step Time": 6.815641349181533} {"Full-finetune/Learning Rate": 1.9767266475031716e-05, "Full-finetune/Loss": 0.891963541507721, "Full-finetune/Loss (Raw)": 0.7624824047088623, "Full-finetune/Step": 502, "Full-finetune/Step Time": 6.815023589879274} {"Full-finetune/Learning Rate": 1.9765928403814416e-05, "Full-finetune/Loss": 0.8901321887969971, "Full-finetune/Loss (Raw)": 0.8239773511886597, "Full-finetune/Step": 503, "Full-finetune/Step Time": 6.831241603940725} {"Full-finetune/Learning Rate": 1.9764586542630965e-05, "Full-finetune/Loss": 0.8907719850540161, "Full-finetune/Loss (Raw)": 0.9411329030990601, "Full-finetune/Step": 504, "Full-finetune/Step Time": 6.836978523060679} {"Full-finetune/Learning Rate": 1.9763240892002113e-05, "Full-finetune/Loss": 0.8907583951950073, "Full-finetune/Loss (Raw)": 0.9472051858901978, "Full-finetune/Step": 505, "Full-finetune/Step Time": 6.837253576144576} {"Full-finetune/Learning Rate": 1.9761891452450082e-05, "Full-finetune/Loss": 0.8868318200111389, "Full-finetune/Loss (Raw)": 0.6674431562423706, "Full-finetune/Step": 506, "Full-finetune/Step Time": 6.848820239305496} {"Full-finetune/Learning Rate": 1.9760538224498563e-05, "Full-finetune/Loss": 0.8854743838310242, "Full-finetune/Loss (Raw)": 0.9513328075408936, "Full-finetune/Step": 507, "Full-finetune/Step Time": 6.84416201338172} {"Full-finetune/Learning Rate": 1.975918120867272e-05, "Full-finetune/Loss": 0.8845937252044678, "Full-finetune/Loss (Raw)": 0.8809348344802856, "Full-finetune/Step": 508, "Full-finetune/Step Time": 6.844103667885065} {"Full-finetune/Learning Rate": 1.975782040549918e-05, "Full-finetune/Loss": 0.883379340171814, "Full-finetune/Loss (Raw)": 0.8761922717094421, "Full-finetune/Step": 509, "Full-finetune/Step Time": 6.847593268379569} {"Full-finetune/Learning Rate": 1.9756455815506045e-05, "Full-finetune/Loss": 0.8830717206001282, "Full-finetune/Loss (Raw)": 0.8565767407417297, "Full-finetune/Step": 510, "Full-finetune/Step Time": 6.808808041736484} {"Full-finetune/Learning Rate": 1.9755087439222888e-05, "Full-finetune/Loss": 0.8838131427764893, "Full-finetune/Loss (Raw)": 0.9707828164100647, "Full-finetune/Step": 511, "Full-finetune/Step Time": 6.7795468512922525} {"Full-finetune/Learning Rate": 1.975371527718075e-05, "Full-finetune/Loss": 0.8872507810592651, "Full-finetune/Loss (Raw)": 0.9194797873497009, "Full-finetune/Step": 512, "Full-finetune/Step Time": 6.761874057352543} {"Full-finetune/Learning Rate": 1.9752339329912137e-05, "Full-finetune/Loss": 0.8875848650932312, "Full-finetune/Loss (Raw)": 0.9954575300216675, "Full-finetune/Step": 513, "Full-finetune/Step Time": 6.7759435176849365} {"Full-finetune/Learning Rate": 1.9750959597951026e-05, "Full-finetune/Loss": 0.8876513242721558, "Full-finetune/Loss (Raw)": 0.9508041143417358, "Full-finetune/Step": 514, "Full-finetune/Step Time": 6.788897780701518} {"Full-finetune/Learning Rate": 1.9749576081832865e-05, "Full-finetune/Loss": 0.8841841220855713, "Full-finetune/Loss (Raw)": 0.38783350586891174, "Full-finetune/Step": 515, "Full-finetune/Step Time": 6.806010769680142} {"Full-finetune/Learning Rate": 1.9748188782094576e-05, "Full-finetune/Loss": 0.8848369717597961, "Full-finetune/Loss (Raw)": 0.9704286456108093, "Full-finetune/Step": 516, "Full-finetune/Step Time": 6.809146529063582} {"Full-finetune/Learning Rate": 1.9746797699274535e-05, "Full-finetune/Loss": 0.8854252696037292, "Full-finetune/Loss (Raw)": 0.9675731062889099, "Full-finetune/Step": 517, "Full-finetune/Step Time": 6.807980356737971} {"Full-finetune/Learning Rate": 1.9745402833912598e-05, "Full-finetune/Loss": 0.8865183591842651, "Full-finetune/Loss (Raw)": 0.9329923391342163, "Full-finetune/Step": 518, "Full-finetune/Step Time": 6.819949543103576} {"Full-finetune/Learning Rate": 1.9744004186550086e-05, "Full-finetune/Loss": 0.8865715265274048, "Full-finetune/Loss (Raw)": 0.9671187996864319, "Full-finetune/Step": 519, "Full-finetune/Step Time": 6.834311045706272} {"Full-finetune/Learning Rate": 1.974260175772978e-05, "Full-finetune/Loss": 0.8857754468917847, "Full-finetune/Loss (Raw)": 0.812082827091217, "Full-finetune/Step": 520, "Full-finetune/Step Time": 6.833692815154791} {"Full-finetune/Learning Rate": 1.9741195547995944e-05, "Full-finetune/Loss": 0.8871396780014038, "Full-finetune/Loss (Raw)": 0.9645841717720032, "Full-finetune/Step": 521, "Full-finetune/Step Time": 6.825001198798418} {"Full-finetune/Learning Rate": 1.9739785557894296e-05, "Full-finetune/Loss": 0.8878414630889893, "Full-finetune/Loss (Raw)": 0.8720908761024475, "Full-finetune/Step": 522, "Full-finetune/Step Time": 6.80589678324759} {"Full-finetune/Learning Rate": 1.9738371787972025e-05, "Full-finetune/Loss": 0.8841618299484253, "Full-finetune/Loss (Raw)": 0.701989471912384, "Full-finetune/Step": 523, "Full-finetune/Step Time": 6.8010879550129175} {"Full-finetune/Learning Rate": 1.9736954238777793e-05, "Full-finetune/Loss": 0.8829643726348877, "Full-finetune/Loss (Raw)": 0.9138895869255066, "Full-finetune/Step": 524, "Full-finetune/Step Time": 6.797620303928852} {"Full-finetune/Learning Rate": 1.9735532910861713e-05, "Full-finetune/Loss": 0.8844503164291382, "Full-finetune/Loss (Raw)": 0.9541647434234619, "Full-finetune/Step": 525, "Full-finetune/Step Time": 6.780645417049527} {"Full-finetune/Learning Rate": 1.9734107804775385e-05, "Full-finetune/Loss": 0.8822505474090576, "Full-finetune/Loss (Raw)": 0.846466064453125, "Full-finetune/Step": 526, "Full-finetune/Step Time": 6.792968537658453} {"Full-finetune/Learning Rate": 1.9732678921071858e-05, "Full-finetune/Loss": 0.8821960091590881, "Full-finetune/Loss (Raw)": 0.8468981385231018, "Full-finetune/Step": 527, "Full-finetune/Step Time": 6.787036580964923} {"Full-finetune/Learning Rate": 1.9731246260305657e-05, "Full-finetune/Loss": 0.8825328350067139, "Full-finetune/Loss (Raw)": 0.9482966065406799, "Full-finetune/Step": 528, "Full-finetune/Step Time": 6.781725747510791} {"Full-finetune/Learning Rate": 1.9729809823032767e-05, "Full-finetune/Loss": 0.88170325756073, "Full-finetune/Loss (Raw)": 0.9388730525970459, "Full-finetune/Step": 529, "Full-finetune/Step Time": 6.7804726622998714} {"Full-finetune/Learning Rate": 1.9728369609810648e-05, "Full-finetune/Loss": 0.8820807933807373, "Full-finetune/Loss (Raw)": 0.9920273423194885, "Full-finetune/Step": 530, "Full-finetune/Step Time": 6.765283837914467} {"Full-finetune/Learning Rate": 1.972692562119821e-05, "Full-finetune/Loss": 0.8829667568206787, "Full-finetune/Loss (Raw)": 1.0429223775863647, "Full-finetune/Step": 531, "Full-finetune/Step Time": 6.750523487105966} {"Full-finetune/Learning Rate": 1.9725477857755842e-05, "Full-finetune/Loss": 0.8816230297088623, "Full-finetune/Loss (Raw)": 0.8660790920257568, "Full-finetune/Step": 532, "Full-finetune/Step Time": 6.747928451746702} {"Full-finetune/Learning Rate": 1.9724026320045393e-05, "Full-finetune/Loss": 0.8829514384269714, "Full-finetune/Loss (Raw)": 0.8772919178009033, "Full-finetune/Step": 533, "Full-finetune/Step Time": 6.734003426507115} {"Full-finetune/Learning Rate": 1.9722571008630172e-05, "Full-finetune/Loss": 0.8862267732620239, "Full-finetune/Loss (Raw)": 0.8934305906295776, "Full-finetune/Step": 534, "Full-finetune/Step Time": 6.722134595736861} {"Full-finetune/Learning Rate": 1.9721111924074958e-05, "Full-finetune/Loss": 0.8892934322357178, "Full-finetune/Loss (Raw)": 0.8073216080665588, "Full-finetune/Step": 535, "Full-finetune/Step Time": 6.714880893006921} {"Full-finetune/Learning Rate": 1.9719649066946e-05, "Full-finetune/Loss": 0.8881890773773193, "Full-finetune/Loss (Raw)": 0.7793150544166565, "Full-finetune/Step": 536, "Full-finetune/Step Time": 6.736416256055236} {"Full-finetune/Learning Rate": 1.9718182437810996e-05, "Full-finetune/Loss": 0.8865972757339478, "Full-finetune/Loss (Raw)": 0.9389239549636841, "Full-finetune/Step": 537, "Full-finetune/Step Time": 6.738436745479703} {"Full-finetune/Learning Rate": 1.971671203723912e-05, "Full-finetune/Loss": 0.8846898078918457, "Full-finetune/Loss (Raw)": 0.9451084733009338, "Full-finetune/Step": 538, "Full-finetune/Step Time": 6.747958680614829} {"Full-finetune/Learning Rate": 1.9715237865801007e-05, "Full-finetune/Loss": 0.8851518630981445, "Full-finetune/Loss (Raw)": 1.0136542320251465, "Full-finetune/Step": 539, "Full-finetune/Step Time": 6.741146435961127} {"Full-finetune/Learning Rate": 1.971375992406875e-05, "Full-finetune/Loss": 0.8892137408256531, "Full-finetune/Loss (Raw)": 0.8832244277000427, "Full-finetune/Step": 540, "Full-finetune/Step Time": 6.720710059627891} {"Full-finetune/Learning Rate": 1.9712278212615913e-05, "Full-finetune/Loss": 0.8882355093955994, "Full-finetune/Loss (Raw)": 0.9009891748428345, "Full-finetune/Step": 541, "Full-finetune/Step Time": 6.727940700948238} {"Full-finetune/Learning Rate": 1.9710792732017517e-05, "Full-finetune/Loss": 0.8883875608444214, "Full-finetune/Loss (Raw)": 0.9082292318344116, "Full-finetune/Step": 542, "Full-finetune/Step Time": 6.726644909009337} {"Full-finetune/Learning Rate": 1.9709303482850047e-05, "Full-finetune/Loss": 0.8887462615966797, "Full-finetune/Loss (Raw)": 1.039347767829895, "Full-finetune/Step": 543, "Full-finetune/Step Time": 6.726643094792962} {"Full-finetune/Learning Rate": 1.9707810465691456e-05, "Full-finetune/Loss": 0.8878340721130371, "Full-finetune/Loss (Raw)": 0.9639157056808472, "Full-finetune/Step": 544, "Full-finetune/Step Time": 6.727489706128836} {"Full-finetune/Learning Rate": 1.970631368112115e-05, "Full-finetune/Loss": 0.8874686360359192, "Full-finetune/Loss (Raw)": 0.9355329871177673, "Full-finetune/Step": 545, "Full-finetune/Step Time": 6.7246248088777065} {"Full-finetune/Learning Rate": 1.970481312972001e-05, "Full-finetune/Loss": 0.8862670063972473, "Full-finetune/Loss (Raw)": 0.8818159103393555, "Full-finetune/Step": 546, "Full-finetune/Step Time": 6.726214054971933} {"Full-finetune/Learning Rate": 1.9703308812070358e-05, "Full-finetune/Loss": 0.8871527910232544, "Full-finetune/Loss (Raw)": 1.0037617683410645, "Full-finetune/Step": 547, "Full-finetune/Step Time": 6.717605721205473} {"Full-finetune/Learning Rate": 1.9701800728756e-05, "Full-finetune/Loss": 0.8904893398284912, "Full-finetune/Loss (Raw)": 0.7856295704841614, "Full-finetune/Step": 548, "Full-finetune/Step Time": 6.714006012305617} {"Full-finetune/Learning Rate": 1.970028888036219e-05, "Full-finetune/Loss": 0.8882325887680054, "Full-finetune/Loss (Raw)": 0.6922958493232727, "Full-finetune/Step": 549, "Full-finetune/Step Time": 6.722766950726509} {"Full-finetune/Learning Rate": 1.9698773267475652e-05, "Full-finetune/Loss": 0.8875125646591187, "Full-finetune/Loss (Raw)": 0.8577774167060852, "Full-finetune/Step": 550, "Full-finetune/Step Time": 6.705225616693497} {"Full-finetune/Learning Rate": 1.9697253890684556e-05, "Full-finetune/Loss": 0.8857043981552124, "Full-finetune/Loss (Raw)": 0.8308419585227966, "Full-finetune/Step": 551, "Full-finetune/Step Time": 6.706265095621347} {"Full-finetune/Learning Rate": 1.969573075057855e-05, "Full-finetune/Loss": 0.8856892585754395, "Full-finetune/Loss (Raw)": 1.0007843971252441, "Full-finetune/Step": 552, "Full-finetune/Step Time": 6.702293144538999} {"Full-finetune/Learning Rate": 1.9694203847748734e-05, "Full-finetune/Loss": 0.885949432849884, "Full-finetune/Loss (Raw)": 0.7088074088096619, "Full-finetune/Step": 553, "Full-finetune/Step Time": 6.666728256270289} {"Full-finetune/Learning Rate": 1.969267318278767e-05, "Full-finetune/Loss": 0.8863548636436462, "Full-finetune/Loss (Raw)": 0.9877712726593018, "Full-finetune/Step": 554, "Full-finetune/Step Time": 6.664140051230788} {"Full-finetune/Learning Rate": 1.969113875628937e-05, "Full-finetune/Loss": 0.8860740065574646, "Full-finetune/Loss (Raw)": 0.8906940817832947, "Full-finetune/Step": 555, "Full-finetune/Step Time": 6.677550604566932} {"Full-finetune/Learning Rate": 1.9689600568849328e-05, "Full-finetune/Loss": 0.8846721649169922, "Full-finetune/Loss (Raw)": 0.8788670301437378, "Full-finetune/Step": 556, "Full-finetune/Step Time": 6.690119702368975} {"Full-finetune/Learning Rate": 1.968805862106448e-05, "Full-finetune/Loss": 0.8832725286483765, "Full-finetune/Loss (Raw)": 0.8541154861450195, "Full-finetune/Step": 557, "Full-finetune/Step Time": 6.686637561768293} {"Full-finetune/Learning Rate": 1.968651291353322e-05, "Full-finetune/Loss": 0.8784757852554321, "Full-finetune/Loss (Raw)": 0.23628593981266022, "Full-finetune/Step": 558, "Full-finetune/Step Time": 6.698172798380256} {"Full-finetune/Learning Rate": 1.968496344685541e-05, "Full-finetune/Loss": 0.8778201937675476, "Full-finetune/Loss (Raw)": 0.8823449015617371, "Full-finetune/Step": 559, "Full-finetune/Step Time": 6.692676508799195} {"Full-finetune/Learning Rate": 1.9683410221632374e-05, "Full-finetune/Loss": 0.8770358562469482, "Full-finetune/Loss (Raw)": 0.7818291187286377, "Full-finetune/Step": 560, "Full-finetune/Step Time": 6.687317872419953} {"Full-finetune/Learning Rate": 1.9681853238466883e-05, "Full-finetune/Loss": 0.8766689896583557, "Full-finetune/Loss (Raw)": 0.807268500328064, "Full-finetune/Step": 561, "Full-finetune/Step Time": 6.688822690397501} {"Full-finetune/Learning Rate": 1.9680292497963172e-05, "Full-finetune/Loss": 0.8758383989334106, "Full-finetune/Loss (Raw)": 0.8111852407455444, "Full-finetune/Step": 562, "Full-finetune/Step Time": 6.696273075416684} {"Full-finetune/Learning Rate": 1.9678728000726936e-05, "Full-finetune/Loss": 0.8772444725036621, "Full-finetune/Loss (Raw)": 0.9618998765945435, "Full-finetune/Step": 563, "Full-finetune/Step Time": 6.697156649082899} {"Full-finetune/Learning Rate": 1.967715974736532e-05, "Full-finetune/Loss": 0.8777020573616028, "Full-finetune/Loss (Raw)": 0.9279909729957581, "Full-finetune/Step": 564, "Full-finetune/Step Time": 6.706398256123066} {"Full-finetune/Learning Rate": 1.9675587738486935e-05, "Full-finetune/Loss": 0.8762062191963196, "Full-finetune/Loss (Raw)": 0.7556894421577454, "Full-finetune/Step": 565, "Full-finetune/Step Time": 6.715926507487893} {"Full-finetune/Learning Rate": 1.9674011974701855e-05, "Full-finetune/Loss": 0.8777616024017334, "Full-finetune/Loss (Raw)": 1.011858582496643, "Full-finetune/Step": 566, "Full-finetune/Step Time": 6.717367295175791} {"Full-finetune/Learning Rate": 1.9672432456621597e-05, "Full-finetune/Loss": 0.877197265625, "Full-finetune/Loss (Raw)": 0.8231551647186279, "Full-finetune/Step": 567, "Full-finetune/Step Time": 6.71903320774436} {"Full-finetune/Learning Rate": 1.9670849184859136e-05, "Full-finetune/Loss": 0.8717461824417114, "Full-finetune/Loss (Raw)": 0.2747742831707001, "Full-finetune/Step": 568, "Full-finetune/Step Time": 6.733570234850049} {"Full-finetune/Learning Rate": 1.9669262160028916e-05, "Full-finetune/Loss": 0.8705133199691772, "Full-finetune/Loss (Raw)": 0.83058100938797, "Full-finetune/Step": 569, "Full-finetune/Step Time": 6.739395204931498} {"Full-finetune/Learning Rate": 1.966767138274683e-05, "Full-finetune/Loss": 0.8742251992225647, "Full-finetune/Loss (Raw)": 0.9016789793968201, "Full-finetune/Step": 570, "Full-finetune/Step Time": 6.72536513209343} {"Full-finetune/Learning Rate": 1.966607685363022e-05, "Full-finetune/Loss": 0.8727588653564453, "Full-finetune/Loss (Raw)": 0.814838171005249, "Full-finetune/Step": 571, "Full-finetune/Step Time": 6.7304077837616205} {"Full-finetune/Learning Rate": 1.96644785732979e-05, "Full-finetune/Loss": 0.871860146522522, "Full-finetune/Loss (Raw)": 0.9453592300415039, "Full-finetune/Step": 572, "Full-finetune/Step Time": 6.730028530582786} {"Full-finetune/Learning Rate": 1.966287654237013e-05, "Full-finetune/Loss": 0.8724818229675293, "Full-finetune/Loss (Raw)": 1.0181541442871094, "Full-finetune/Step": 573, "Full-finetune/Step Time": 6.745058868080378} {"Full-finetune/Learning Rate": 1.9661270761468625e-05, "Full-finetune/Loss": 0.8724194765090942, "Full-finetune/Loss (Raw)": 1.0104453563690186, "Full-finetune/Step": 574, "Full-finetune/Step Time": 6.742280291393399} {"Full-finetune/Learning Rate": 1.965966123121656e-05, "Full-finetune/Loss": 0.872812032699585, "Full-finetune/Loss (Raw)": 1.018668293952942, "Full-finetune/Step": 575, "Full-finetune/Step Time": 6.760527169331908} {"Full-finetune/Learning Rate": 1.965804795223856e-05, "Full-finetune/Loss": 0.8724520206451416, "Full-finetune/Loss (Raw)": 0.8746284246444702, "Full-finetune/Step": 576, "Full-finetune/Step Time": 6.761846125125885} {"Full-finetune/Learning Rate": 1.9656430925160704e-05, "Full-finetune/Loss": 0.8707462549209595, "Full-finetune/Loss (Raw)": 0.878544270992279, "Full-finetune/Step": 577, "Full-finetune/Step Time": 6.757871512323618} {"Full-finetune/Learning Rate": 1.9654810150610536e-05, "Full-finetune/Loss": 0.8703271746635437, "Full-finetune/Loss (Raw)": 0.8264710307121277, "Full-finetune/Step": 578, "Full-finetune/Step Time": 6.75344174169004} {"Full-finetune/Learning Rate": 1.9653185629217038e-05, "Full-finetune/Loss": 0.8691565990447998, "Full-finetune/Loss (Raw)": 0.7586666345596313, "Full-finetune/Step": 579, "Full-finetune/Step Time": 6.766376500949264} {"Full-finetune/Learning Rate": 1.9651557361610663e-05, "Full-finetune/Loss": 0.8694406747817993, "Full-finetune/Loss (Raw)": 0.9561429023742676, "Full-finetune/Step": 580, "Full-finetune/Step Time": 6.768070187419653} {"Full-finetune/Learning Rate": 1.9649925348423308e-05, "Full-finetune/Loss": 0.8686960935592651, "Full-finetune/Loss (Raw)": 1.00998854637146, "Full-finetune/Step": 581, "Full-finetune/Step Time": 6.772284962236881} {"Full-finetune/Learning Rate": 1.964828959028832e-05, "Full-finetune/Loss": 0.8693559169769287, "Full-finetune/Loss (Raw)": 0.997782826423645, "Full-finetune/Step": 582, "Full-finetune/Step Time": 6.767884908244014} {"Full-finetune/Learning Rate": 1.964665008784051e-05, "Full-finetune/Loss": 0.8676886558532715, "Full-finetune/Loss (Raw)": 0.7941357493400574, "Full-finetune/Step": 583, "Full-finetune/Step Time": 6.772963270545006} {"Full-finetune/Learning Rate": 1.9645006841716137e-05, "Full-finetune/Loss": 0.8722048997879028, "Full-finetune/Loss (Raw)": 0.9044080972671509, "Full-finetune/Step": 584, "Full-finetune/Step Time": 6.764840740710497} {"Full-finetune/Learning Rate": 1.9643359852552912e-05, "Full-finetune/Loss": 0.8733595013618469, "Full-finetune/Loss (Raw)": 0.9707033038139343, "Full-finetune/Step": 585, "Full-finetune/Step Time": 6.766733147203922} {"Full-finetune/Learning Rate": 1.9641709120989996e-05, "Full-finetune/Loss": 0.8673443794250488, "Full-finetune/Loss (Raw)": 0.3352009654045105, "Full-finetune/Step": 586, "Full-finetune/Step Time": 6.7804783415049314} {"Full-finetune/Learning Rate": 1.9640054647668015e-05, "Full-finetune/Loss": 0.8686485886573792, "Full-finetune/Loss (Raw)": 1.0656938552856445, "Full-finetune/Step": 587, "Full-finetune/Step Time": 6.77293573319912} {"Full-finetune/Learning Rate": 1.9638396433229025e-05, "Full-finetune/Loss": 0.8689509034156799, "Full-finetune/Loss (Raw)": 0.7953647375106812, "Full-finetune/Step": 588, "Full-finetune/Step Time": 6.781574577093124} {"Full-finetune/Learning Rate": 1.963673447831656e-05, "Full-finetune/Loss": 0.8697845339775085, "Full-finetune/Loss (Raw)": 1.0007802248001099, "Full-finetune/Step": 589, "Full-finetune/Step Time": 6.7671578992158175} {"Full-finetune/Learning Rate": 1.9635068783575577e-05, "Full-finetune/Loss": 0.8706871271133423, "Full-finetune/Loss (Raw)": 1.0323936939239502, "Full-finetune/Step": 590, "Full-finetune/Step Time": 6.769103460013866} {"Full-finetune/Learning Rate": 1.9633399349652512e-05, "Full-finetune/Loss": 0.8684844970703125, "Full-finetune/Loss (Raw)": 0.8317828178405762, "Full-finetune/Step": 591, "Full-finetune/Step Time": 6.761219184845686} {"Full-finetune/Learning Rate": 1.9631726177195235e-05, "Full-finetune/Loss": 0.873222291469574, "Full-finetune/Loss (Raw)": 0.8827323317527771, "Full-finetune/Step": 592, "Full-finetune/Step Time": 6.742931112647057} {"Full-finetune/Learning Rate": 1.9630049266853076e-05, "Full-finetune/Loss": 0.8723483085632324, "Full-finetune/Loss (Raw)": 0.8657943606376648, "Full-finetune/Step": 593, "Full-finetune/Step Time": 6.757748395204544} {"Full-finetune/Learning Rate": 1.96283686192768e-05, "Full-finetune/Loss": 0.8734435439109802, "Full-finetune/Loss (Raw)": 0.9239910840988159, "Full-finetune/Step": 594, "Full-finetune/Step Time": 6.746564006432891} {"Full-finetune/Learning Rate": 1.9626684235118646e-05, "Full-finetune/Loss": 0.873252272605896, "Full-finetune/Loss (Raw)": 0.9458996653556824, "Full-finetune/Step": 595, "Full-finetune/Step Time": 6.737553138285875} {"Full-finetune/Learning Rate": 1.9624996115032287e-05, "Full-finetune/Loss": 0.8738224506378174, "Full-finetune/Loss (Raw)": 0.8305879235267639, "Full-finetune/Step": 596, "Full-finetune/Step Time": 6.721233732998371} {"Full-finetune/Learning Rate": 1.9623304259672844e-05, "Full-finetune/Loss": 0.8772674798965454, "Full-finetune/Loss (Raw)": 0.7848614454269409, "Full-finetune/Step": 597, "Full-finetune/Step Time": 6.706239715218544} {"Full-finetune/Learning Rate": 1.96216086696969e-05, "Full-finetune/Loss": 0.8769813776016235, "Full-finetune/Loss (Raw)": 0.8682466149330139, "Full-finetune/Step": 598, "Full-finetune/Step Time": 6.7285499311983585} {"Full-finetune/Learning Rate": 1.9619909345762474e-05, "Full-finetune/Loss": 0.8774212598800659, "Full-finetune/Loss (Raw)": 0.9672157168388367, "Full-finetune/Step": 599, "Full-finetune/Step Time": 6.711649840697646} {"Full-finetune/Learning Rate": 1.961820628852905e-05, "Full-finetune/Loss": 0.8767748475074768, "Full-finetune/Loss (Raw)": 0.978087842464447, "Full-finetune/Step": 600, "Full-finetune/Step Time": 6.7168983314186335} {"Full-finetune/Learning Rate": 1.9616499498657537e-05, "Full-finetune/Loss": 0.8768103718757629, "Full-finetune/Loss (Raw)": 0.8388180136680603, "Full-finetune/Step": 601, "Full-finetune/Step Time": 6.741420868784189} {"Full-finetune/Learning Rate": 1.961478897681032e-05, "Full-finetune/Loss": 0.8765624761581421, "Full-finetune/Loss (Raw)": 0.9453436732292175, "Full-finetune/Step": 602, "Full-finetune/Step Time": 6.735013579949737} {"Full-finetune/Learning Rate": 1.9613074723651214e-05, "Full-finetune/Loss": 0.8750108480453491, "Full-finetune/Loss (Raw)": 0.7574474215507507, "Full-finetune/Step": 603, "Full-finetune/Step Time": 6.740424023941159} {"Full-finetune/Learning Rate": 1.9611356739845484e-05, "Full-finetune/Loss": 0.8753107190132141, "Full-finetune/Loss (Raw)": 0.9844945073127747, "Full-finetune/Step": 604, "Full-finetune/Step Time": 6.740537658333778} {"Full-finetune/Learning Rate": 1.9609635026059855e-05, "Full-finetune/Loss": 0.8743268251419067, "Full-finetune/Loss (Raw)": 0.785507082939148, "Full-finetune/Step": 605, "Full-finetune/Step Time": 6.736689314246178} {"Full-finetune/Learning Rate": 1.9607909582962478e-05, "Full-finetune/Loss": 0.8738465309143066, "Full-finetune/Loss (Raw)": 0.8136788606643677, "Full-finetune/Step": 606, "Full-finetune/Step Time": 6.753834776580334} {"Full-finetune/Learning Rate": 1.9606180411222974e-05, "Full-finetune/Loss": 0.8717595934867859, "Full-finetune/Loss (Raw)": 0.678613543510437, "Full-finetune/Step": 607, "Full-finetune/Step Time": 6.783220482990146} {"Full-finetune/Learning Rate": 1.9604447511512396e-05, "Full-finetune/Loss": 0.8717436790466309, "Full-finetune/Loss (Raw)": 1.0053653717041016, "Full-finetune/Step": 608, "Full-finetune/Step Time": 6.780082073062658} {"Full-finetune/Learning Rate": 1.960271088450325e-05, "Full-finetune/Loss": 0.870756983757019, "Full-finetune/Loss (Raw)": 0.8156588077545166, "Full-finetune/Step": 609, "Full-finetune/Step Time": 6.77584763430059} {"Full-finetune/Learning Rate": 1.960097053086949e-05, "Full-finetune/Loss": 0.8702364563941956, "Full-finetune/Loss (Raw)": 0.8980914354324341, "Full-finetune/Step": 610, "Full-finetune/Step Time": 6.766440410166979} {"Full-finetune/Learning Rate": 1.9599226451286504e-05, "Full-finetune/Loss": 0.8700354695320129, "Full-finetune/Loss (Raw)": 0.9060408473014832, "Full-finetune/Step": 611, "Full-finetune/Step Time": 6.7444338742643595} {"Full-finetune/Learning Rate": 1.9597478646431147e-05, "Full-finetune/Loss": 0.8721398115158081, "Full-finetune/Loss (Raw)": 1.087746262550354, "Full-finetune/Step": 612, "Full-finetune/Step Time": 6.742320891469717} {"Full-finetune/Learning Rate": 1.95957271169817e-05, "Full-finetune/Loss": 0.8727575540542603, "Full-finetune/Loss (Raw)": 0.7506245374679565, "Full-finetune/Step": 613, "Full-finetune/Step Time": 6.7337669264525175} {"Full-finetune/Learning Rate": 1.95939718636179e-05, "Full-finetune/Loss": 0.8732792735099792, "Full-finetune/Loss (Raw)": 0.9336221218109131, "Full-finetune/Step": 614, "Full-finetune/Step Time": 6.719254085794091} {"Full-finetune/Learning Rate": 1.9592212887020923e-05, "Full-finetune/Loss": 0.8729860186576843, "Full-finetune/Loss (Raw)": 0.9082337021827698, "Full-finetune/Step": 615, "Full-finetune/Step Time": 6.725080501288176} {"Full-finetune/Learning Rate": 1.9590450187873403e-05, "Full-finetune/Loss": 0.8725071549415588, "Full-finetune/Loss (Raw)": 0.9251697063446045, "Full-finetune/Step": 616, "Full-finetune/Step Time": 6.727271130308509} {"Full-finetune/Learning Rate": 1.95886837668594e-05, "Full-finetune/Loss": 0.8733524084091187, "Full-finetune/Loss (Raw)": 0.9260445237159729, "Full-finetune/Step": 617, "Full-finetune/Step Time": 6.719090234488249} {"Full-finetune/Learning Rate": 1.958691362466443e-05, "Full-finetune/Loss": 0.8743455410003662, "Full-finetune/Loss (Raw)": 0.9262040853500366, "Full-finetune/Step": 618, "Full-finetune/Step Time": 6.712639460340142} {"Full-finetune/Learning Rate": 1.958513976197545e-05, "Full-finetune/Loss": 0.8767357468605042, "Full-finetune/Loss (Raw)": 0.8397084474563599, "Full-finetune/Step": 619, "Full-finetune/Step Time": 6.716620909050107} {"Full-finetune/Learning Rate": 1.9583362179480866e-05, "Full-finetune/Loss": 0.8774466514587402, "Full-finetune/Loss (Raw)": 0.9440757632255554, "Full-finetune/Step": 620, "Full-finetune/Step Time": 6.707060193642974} {"Full-finetune/Learning Rate": 1.9581580877870514e-05, "Full-finetune/Loss": 0.8772329092025757, "Full-finetune/Loss (Raw)": 0.9240338802337646, "Full-finetune/Step": 621, "Full-finetune/Step Time": 6.7254161313176155} {"Full-finetune/Learning Rate": 1.9579795857835692e-05, "Full-finetune/Loss": 0.8772475719451904, "Full-finetune/Loss (Raw)": 0.8794896602630615, "Full-finetune/Step": 622, "Full-finetune/Step Time": 6.712916977703571} {"Full-finetune/Learning Rate": 1.9578007120069123e-05, "Full-finetune/Loss": 0.8774938583374023, "Full-finetune/Loss (Raw)": 0.9562296867370605, "Full-finetune/Step": 623, "Full-finetune/Step Time": 6.713977202773094} {"Full-finetune/Learning Rate": 1.957621466526499e-05, "Full-finetune/Loss": 0.8772458434104919, "Full-finetune/Loss (Raw)": 0.9183549880981445, "Full-finetune/Step": 624, "Full-finetune/Step Time": 6.699496516957879} {"Full-finetune/Learning Rate": 1.9574418494118905e-05, "Full-finetune/Loss": 0.8778198957443237, "Full-finetune/Loss (Raw)": 0.954858124256134, "Full-finetune/Step": 625, "Full-finetune/Step Time": 6.699232717975974} {"Full-finetune/Learning Rate": 1.9572618607327928e-05, "Full-finetune/Loss": 0.8777757287025452, "Full-finetune/Loss (Raw)": 0.9766024351119995, "Full-finetune/Step": 626, "Full-finetune/Step Time": 6.6969460509717464} {"Full-finetune/Learning Rate": 1.9570815005590556e-05, "Full-finetune/Loss": 0.8783372640609741, "Full-finetune/Loss (Raw)": 0.9185580015182495, "Full-finetune/Step": 627, "Full-finetune/Step Time": 6.699141327291727} {"Full-finetune/Learning Rate": 1.9569007689606735e-05, "Full-finetune/Loss": 0.8779945373535156, "Full-finetune/Loss (Raw)": 0.8593126535415649, "Full-finetune/Step": 628, "Full-finetune/Step Time": 6.689466927200556} {"Full-finetune/Learning Rate": 1.9567196660077848e-05, "Full-finetune/Loss": 0.8798081874847412, "Full-finetune/Loss (Raw)": 0.9338473081588745, "Full-finetune/Step": 629, "Full-finetune/Step Time": 6.678557233884931} {"Full-finetune/Learning Rate": 1.9565381917706726e-05, "Full-finetune/Loss": 0.8823469281196594, "Full-finetune/Loss (Raw)": 1.0874384641647339, "Full-finetune/Step": 630, "Full-finetune/Step Time": 6.659748217090964} {"Full-finetune/Learning Rate": 1.9563563463197625e-05, "Full-finetune/Loss": 0.8818162083625793, "Full-finetune/Loss (Raw)": 0.7560480237007141, "Full-finetune/Step": 631, "Full-finetune/Step Time": 6.645011570304632} {"Full-finetune/Learning Rate": 1.9561741297256257e-05, "Full-finetune/Loss": 0.8824659585952759, "Full-finetune/Loss (Raw)": 1.0242974758148193, "Full-finetune/Step": 632, "Full-finetune/Step Time": 6.632281206548214} {"Full-finetune/Learning Rate": 1.955991542058977e-05, "Full-finetune/Loss": 0.8838647603988647, "Full-finetune/Loss (Raw)": 1.1262576580047607, "Full-finetune/Step": 633, "Full-finetune/Step Time": 6.644569143652916} {"Full-finetune/Learning Rate": 1.9558085833906753e-05, "Full-finetune/Loss": 0.8850309252738953, "Full-finetune/Loss (Raw)": 0.8167049288749695, "Full-finetune/Step": 634, "Full-finetune/Step Time": 6.634628016501665} {"Full-finetune/Learning Rate": 1.9556252537917228e-05, "Full-finetune/Loss": 0.8849458694458008, "Full-finetune/Loss (Raw)": 0.9404531717300415, "Full-finetune/Step": 635, "Full-finetune/Step Time": 6.638467833399773} {"Full-finetune/Learning Rate": 1.955441553333266e-05, "Full-finetune/Loss": 0.8851429224014282, "Full-finetune/Loss (Raw)": 0.9061495661735535, "Full-finetune/Step": 636, "Full-finetune/Step Time": 6.663024816662073} {"Full-finetune/Learning Rate": 1.955257482086596e-05, "Full-finetune/Loss": 0.8861361742019653, "Full-finetune/Loss (Raw)": 1.0033355951309204, "Full-finetune/Step": 637, "Full-finetune/Step Time": 6.652056036517024} {"Full-finetune/Learning Rate": 1.955073040123147e-05, "Full-finetune/Loss": 0.8870161175727844, "Full-finetune/Loss (Raw)": 0.9692118763923645, "Full-finetune/Step": 638, "Full-finetune/Step Time": 6.653021233156323} {"Full-finetune/Learning Rate": 1.9548882275144974e-05, "Full-finetune/Loss": 0.8863593339920044, "Full-finetune/Loss (Raw)": 0.8867130279541016, "Full-finetune/Step": 639, "Full-finetune/Step Time": 6.649490373209119} {"Full-finetune/Learning Rate": 1.9547030443323695e-05, "Full-finetune/Loss": 0.8862255811691284, "Full-finetune/Loss (Raw)": 0.9023600220680237, "Full-finetune/Step": 640, "Full-finetune/Step Time": 6.6500851679593325} {"Full-finetune/Learning Rate": 1.9545174906486287e-05, "Full-finetune/Loss": 0.8849613666534424, "Full-finetune/Loss (Raw)": 0.8336426019668579, "Full-finetune/Step": 641, "Full-finetune/Step Time": 6.647166201844811} {"Full-finetune/Learning Rate": 1.9543315665352855e-05, "Full-finetune/Loss": 0.8802087306976318, "Full-finetune/Loss (Raw)": 0.34245723485946655, "Full-finetune/Step": 642, "Full-finetune/Step Time": 6.644052727147937} {"Full-finetune/Learning Rate": 1.954145272064493e-05, "Full-finetune/Loss": 0.8841422200202942, "Full-finetune/Loss (Raw)": 0.8913237452507019, "Full-finetune/Step": 643, "Full-finetune/Step Time": 6.635339925065637} {"Full-finetune/Learning Rate": 1.9539586073085482e-05, "Full-finetune/Loss": 0.8839781284332275, "Full-finetune/Loss (Raw)": 0.9494189620018005, "Full-finetune/Step": 644, "Full-finetune/Step Time": 6.639497891068459} {"Full-finetune/Learning Rate": 1.9537715723398926e-05, "Full-finetune/Loss": 0.8842988610267639, "Full-finetune/Loss (Raw)": 1.0086305141448975, "Full-finetune/Step": 645, "Full-finetune/Step Time": 6.637593053281307} {"Full-finetune/Learning Rate": 1.9535841672311106e-05, "Full-finetune/Loss": 0.8842092752456665, "Full-finetune/Loss (Raw)": 0.9215277433395386, "Full-finetune/Step": 646, "Full-finetune/Step Time": 6.638249929994345} {"Full-finetune/Learning Rate": 1.9533963920549307e-05, "Full-finetune/Loss": 0.8832585215568542, "Full-finetune/Loss (Raw)": 0.8454177975654602, "Full-finetune/Step": 647, "Full-finetune/Step Time": 6.637431262061} {"Full-finetune/Learning Rate": 1.9532082468842243e-05, "Full-finetune/Loss": 0.8842318058013916, "Full-finetune/Loss (Raw)": 0.9366663098335266, "Full-finetune/Step": 648, "Full-finetune/Step Time": 6.635361585766077} {"Full-finetune/Learning Rate": 1.953019731792007e-05, "Full-finetune/Loss": 0.8831796646118164, "Full-finetune/Loss (Raw)": 0.8299105763435364, "Full-finetune/Step": 649, "Full-finetune/Step Time": 6.629933273419738} {"Full-finetune/Learning Rate": 1.9528308468514383e-05, "Full-finetune/Loss": 0.8827767372131348, "Full-finetune/Loss (Raw)": 0.8205127716064453, "Full-finetune/Step": 650, "Full-finetune/Step Time": 6.642974924296141} {"Full-finetune/Learning Rate": 1.9526415921358202e-05, "Full-finetune/Loss": 0.8842836618423462, "Full-finetune/Loss (Raw)": 0.8948765993118286, "Full-finetune/Step": 651, "Full-finetune/Step Time": 6.651139175519347} {"Full-finetune/Learning Rate": 1.952451967718599e-05, "Full-finetune/Loss": 0.8840286135673523, "Full-finetune/Loss (Raw)": 0.8812394142150879, "Full-finetune/Step": 652, "Full-finetune/Step Time": 6.655011508613825} {"Full-finetune/Learning Rate": 1.952261973673364e-05, "Full-finetune/Loss": 0.8833541870117188, "Full-finetune/Loss (Raw)": 0.8678475022315979, "Full-finetune/Step": 653, "Full-finetune/Step Time": 6.657154835760593} {"Full-finetune/Learning Rate": 1.9520716100738487e-05, "Full-finetune/Loss": 0.8856803178787231, "Full-finetune/Loss (Raw)": 1.1442116498947144, "Full-finetune/Step": 654, "Full-finetune/Step Time": 6.648515120148659} {"Full-finetune/Learning Rate": 1.9518808769939287e-05, "Full-finetune/Loss": 0.8857823610305786, "Full-finetune/Loss (Raw)": 0.8599579334259033, "Full-finetune/Step": 655, "Full-finetune/Step Time": 6.656839283183217} {"Full-finetune/Learning Rate": 1.9516897745076243e-05, "Full-finetune/Loss": 0.8850089311599731, "Full-finetune/Loss (Raw)": 0.8492947816848755, "Full-finetune/Step": 656, "Full-finetune/Step Time": 6.6598782036453485} {"Full-finetune/Learning Rate": 1.9514983026890988e-05, "Full-finetune/Loss": 0.8840798735618591, "Full-finetune/Loss (Raw)": 0.8199589252471924, "Full-finetune/Step": 657, "Full-finetune/Step Time": 6.679985702037811} {"Full-finetune/Learning Rate": 1.9513064616126588e-05, "Full-finetune/Loss": 0.8834865689277649, "Full-finetune/Loss (Raw)": 0.9160783886909485, "Full-finetune/Step": 658, "Full-finetune/Step Time": 6.681905809789896} {"Full-finetune/Learning Rate": 1.951114251352753e-05, "Full-finetune/Loss": 0.8808434009552002, "Full-finetune/Loss (Raw)": 0.7045941948890686, "Full-finetune/Step": 659, "Full-finetune/Step Time": 6.703522369265556} {"Full-finetune/Learning Rate": 1.950921671983976e-05, "Full-finetune/Loss": 0.8820457458496094, "Full-finetune/Loss (Raw)": 1.0199811458587646, "Full-finetune/Step": 660, "Full-finetune/Step Time": 6.708587182685733} {"Full-finetune/Learning Rate": 1.9507287235810625e-05, "Full-finetune/Loss": 0.8823196887969971, "Full-finetune/Loss (Raw)": 0.9123568534851074, "Full-finetune/Step": 661, "Full-finetune/Step Time": 6.7005083076655865} {"Full-finetune/Learning Rate": 1.9505354062188934e-05, "Full-finetune/Loss": 0.8829998970031738, "Full-finetune/Loss (Raw)": 0.9805043339729309, "Full-finetune/Step": 662, "Full-finetune/Step Time": 6.690041853114963} {"Full-finetune/Learning Rate": 1.9503417199724904e-05, "Full-finetune/Loss": 0.8843512535095215, "Full-finetune/Loss (Raw)": 0.9802838563919067, "Full-finetune/Step": 663, "Full-finetune/Step Time": 6.679643979296088} {"Full-finetune/Learning Rate": 1.95014766491702e-05, "Full-finetune/Loss": 0.8849880695343018, "Full-finetune/Loss (Raw)": 0.8608428239822388, "Full-finetune/Step": 664, "Full-finetune/Step Time": 6.667207980528474} {"Full-finetune/Learning Rate": 1.9499532411277907e-05, "Full-finetune/Loss": 0.8854691386222839, "Full-finetune/Loss (Raw)": 1.0004922151565552, "Full-finetune/Step": 665, "Full-finetune/Step Time": 6.674812778830528} {"Full-finetune/Learning Rate": 1.9497584486802548e-05, "Full-finetune/Loss": 0.8864655494689941, "Full-finetune/Loss (Raw)": 1.0726414918899536, "Full-finetune/Step": 666, "Full-finetune/Step Time": 6.667296372354031} {"Full-finetune/Learning Rate": 1.9495632876500076e-05, "Full-finetune/Loss": 0.8861957788467407, "Full-finetune/Loss (Raw)": 0.9791280627250671, "Full-finetune/Step": 667, "Full-finetune/Step Time": 6.681051526218653} {"Full-finetune/Learning Rate": 1.949367758112787e-05, "Full-finetune/Loss": 0.8852337598800659, "Full-finetune/Loss (Raw)": 0.7600895762443542, "Full-finetune/Step": 668, "Full-finetune/Step Time": 6.686456589028239} {"Full-finetune/Learning Rate": 1.949171860144474e-05, "Full-finetune/Loss": 0.8855104446411133, "Full-finetune/Loss (Raw)": 0.9364060759544373, "Full-finetune/Step": 669, "Full-finetune/Step Time": 6.680926537141204} {"Full-finetune/Learning Rate": 1.9489755938210936e-05, "Full-finetune/Loss": 0.8850146532058716, "Full-finetune/Loss (Raw)": 0.844762921333313, "Full-finetune/Step": 670, "Full-finetune/Step Time": 6.68395764939487} {"Full-finetune/Learning Rate": 1.9487789592188123e-05, "Full-finetune/Loss": 0.8837631344795227, "Full-finetune/Loss (Raw)": 0.8791547417640686, "Full-finetune/Step": 671, "Full-finetune/Step Time": 6.68284734338522} {"Full-finetune/Learning Rate": 1.9485819564139404e-05, "Full-finetune/Loss": 0.883652925491333, "Full-finetune/Loss (Raw)": 0.9498088955879211, "Full-finetune/Step": 672, "Full-finetune/Step Time": 6.679427703842521} {"Full-finetune/Learning Rate": 1.9483845854829304e-05, "Full-finetune/Loss": 0.8843376636505127, "Full-finetune/Loss (Raw)": 1.0231812000274658, "Full-finetune/Step": 673, "Full-finetune/Step Time": 6.681215377524495} {"Full-finetune/Learning Rate": 1.9481868465023788e-05, "Full-finetune/Loss": 0.8856920003890991, "Full-finetune/Loss (Raw)": 1.0551674365997314, "Full-finetune/Step": 674, "Full-finetune/Step Time": 6.681861858814955} {"Full-finetune/Learning Rate": 1.9479887395490234e-05, "Full-finetune/Loss": 0.8853582739830017, "Full-finetune/Loss (Raw)": 0.9610430598258972, "Full-finetune/Step": 675, "Full-finetune/Step Time": 6.684501223266125} {"Full-finetune/Learning Rate": 1.9477902646997464e-05, "Full-finetune/Loss": 0.8866583108901978, "Full-finetune/Loss (Raw)": 0.9520394206047058, "Full-finetune/Step": 676, "Full-finetune/Step Time": 6.679602252319455} {"Full-finetune/Learning Rate": 1.947591422031572e-05, "Full-finetune/Loss": 0.8872496485710144, "Full-finetune/Loss (Raw)": 0.7679866552352905, "Full-finetune/Step": 677, "Full-finetune/Step Time": 6.711450824514031} {"Full-finetune/Learning Rate": 1.9473922116216664e-05, "Full-finetune/Loss": 0.8884205222129822, "Full-finetune/Loss (Raw)": 1.0076537132263184, "Full-finetune/Step": 678, "Full-finetune/Step Time": 6.7345457542687654} {"Full-finetune/Learning Rate": 1.9471926335473396e-05, "Full-finetune/Loss": 0.8898879289627075, "Full-finetune/Loss (Raw)": 1.018662929534912, "Full-finetune/Step": 679, "Full-finetune/Step Time": 6.739751383662224} {"Full-finetune/Learning Rate": 1.9469926878860447e-05, "Full-finetune/Loss": 0.888702392578125, "Full-finetune/Loss (Raw)": 0.8490422964096069, "Full-finetune/Step": 680, "Full-finetune/Step Time": 6.7379649095237255} {"Full-finetune/Learning Rate": 1.9467923747153756e-05, "Full-finetune/Loss": 0.8907755613327026, "Full-finetune/Loss (Raw)": 0.9741680026054382, "Full-finetune/Step": 681, "Full-finetune/Step Time": 6.737030118703842} {"Full-finetune/Learning Rate": 1.9465916941130705e-05, "Full-finetune/Loss": 0.8907365798950195, "Full-finetune/Loss (Raw)": 0.9827839732170105, "Full-finetune/Step": 682, "Full-finetune/Step Time": 6.75451535359025} {"Full-finetune/Learning Rate": 1.9463906461570098e-05, "Full-finetune/Loss": 0.8917954564094543, "Full-finetune/Loss (Raw)": 1.026229739189148, "Full-finetune/Step": 683, "Full-finetune/Step Time": 6.736625572666526} {"Full-finetune/Learning Rate": 1.9461892309252158e-05, "Full-finetune/Loss": 0.8913854956626892, "Full-finetune/Loss (Raw)": 0.8263932466506958, "Full-finetune/Step": 684, "Full-finetune/Step Time": 6.725895598530769} {"Full-finetune/Learning Rate": 1.945987448495854e-05, "Full-finetune/Loss": 0.8899946212768555, "Full-finetune/Loss (Raw)": 0.6760890483856201, "Full-finetune/Step": 685, "Full-finetune/Step Time": 6.741742936894298} {"Full-finetune/Learning Rate": 1.945785298947233e-05, "Full-finetune/Loss": 0.8939498662948608, "Full-finetune/Loss (Raw)": 0.7425545454025269, "Full-finetune/Step": 686, "Full-finetune/Step Time": 6.736904783174396} {"Full-finetune/Learning Rate": 1.9455827823578017e-05, "Full-finetune/Loss": 0.8939114212989807, "Full-finetune/Loss (Raw)": 0.8774188160896301, "Full-finetune/Step": 687, "Full-finetune/Step Time": 6.734184289351106} {"Full-finetune/Learning Rate": 1.9453798988061535e-05, "Full-finetune/Loss": 0.8948262333869934, "Full-finetune/Loss (Raw)": 0.8989254832267761, "Full-finetune/Step": 688, "Full-finetune/Step Time": 6.733300667256117} {"Full-finetune/Learning Rate": 1.9451766483710236e-05, "Full-finetune/Loss": 0.8928373456001282, "Full-finetune/Loss (Raw)": 0.5526899695396423, "Full-finetune/Step": 689, "Full-finetune/Step Time": 6.746639283373952} {"Full-finetune/Learning Rate": 1.94497303113129e-05, "Full-finetune/Loss": 0.8918948173522949, "Full-finetune/Loss (Raw)": 0.6905373334884644, "Full-finetune/Step": 690, "Full-finetune/Step Time": 6.7714688293635845} {"Full-finetune/Learning Rate": 1.9447690471659715e-05, "Full-finetune/Loss": 0.8919639587402344, "Full-finetune/Loss (Raw)": 0.9707529544830322, "Full-finetune/Step": 691, "Full-finetune/Step Time": 6.7733992245048285} {"Full-finetune/Learning Rate": 1.944564696554231e-05, "Full-finetune/Loss": 0.8908740282058716, "Full-finetune/Loss (Raw)": 0.7884793877601624, "Full-finetune/Step": 692, "Full-finetune/Step Time": 6.79156300984323} {"Full-finetune/Learning Rate": 1.944359979375373e-05, "Full-finetune/Loss": 0.8911411762237549, "Full-finetune/Loss (Raw)": 0.7898849844932556, "Full-finetune/Step": 693, "Full-finetune/Step Time": 6.791525773704052} {"Full-finetune/Learning Rate": 1.9441548957088438e-05, "Full-finetune/Loss": 0.8862562775611877, "Full-finetune/Loss (Raw)": 0.3865954875946045, "Full-finetune/Step": 694, "Full-finetune/Step Time": 6.819276515394449} {"Full-finetune/Learning Rate": 1.9439494456342327e-05, "Full-finetune/Loss": 0.8854542970657349, "Full-finetune/Loss (Raw)": 0.7205008268356323, "Full-finetune/Step": 695, "Full-finetune/Step Time": 6.826131533831358} {"Full-finetune/Learning Rate": 1.943743629231271e-05, "Full-finetune/Loss": 0.8911154270172119, "Full-finetune/Loss (Raw)": 0.9994001388549805, "Full-finetune/Step": 696, "Full-finetune/Step Time": 6.813712252303958} {"Full-finetune/Learning Rate": 1.9435374465798318e-05, "Full-finetune/Loss": 0.8908953070640564, "Full-finetune/Loss (Raw)": 0.8023989796638489, "Full-finetune/Step": 697, "Full-finetune/Step Time": 6.820273645222187} {"Full-finetune/Learning Rate": 1.9433308977599306e-05, "Full-finetune/Loss": 0.8920599222183228, "Full-finetune/Loss (Raw)": 1.0507522821426392, "Full-finetune/Step": 698, "Full-finetune/Step Time": 6.813816679641604} {"Full-finetune/Learning Rate": 1.943123982851725e-05, "Full-finetune/Loss": 0.8941537141799927, "Full-finetune/Loss (Raw)": 1.0828452110290527, "Full-finetune/Step": 699, "Full-finetune/Step Time": 6.810995636507869} {"Full-finetune/Learning Rate": 1.9429167019355143e-05, "Full-finetune/Loss": 0.8931503295898438, "Full-finetune/Loss (Raw)": 0.8169228434562683, "Full-finetune/Step": 700, "Full-finetune/Step Time": 6.830914556980133} {"Full-finetune/Learning Rate": 1.9427090550917407e-05, "Full-finetune/Loss": 0.8875417113304138, "Full-finetune/Loss (Raw)": 0.3002544343471527, "Full-finetune/Step": 701, "Full-finetune/Step Time": 6.8349436074495316} {"Full-finetune/Learning Rate": 1.9425010424009876e-05, "Full-finetune/Loss": 0.8865036964416504, "Full-finetune/Loss (Raw)": 0.877578616142273, "Full-finetune/Step": 702, "Full-finetune/Step Time": 6.84272450581193} {"Full-finetune/Learning Rate": 1.9422926639439806e-05, "Full-finetune/Loss": 0.884353756904602, "Full-finetune/Loss (Raw)": 0.743476152420044, "Full-finetune/Step": 703, "Full-finetune/Step Time": 6.833361586555839} {"Full-finetune/Learning Rate": 1.9420839198015878e-05, "Full-finetune/Loss": 0.8848674297332764, "Full-finetune/Loss (Raw)": 0.9403806328773499, "Full-finetune/Step": 704, "Full-finetune/Step Time": 6.84625699929893} {"Full-finetune/Learning Rate": 1.941874810054818e-05, "Full-finetune/Loss": 0.8852795362472534, "Full-finetune/Loss (Raw)": 0.9312957525253296, "Full-finetune/Step": 705, "Full-finetune/Step Time": 6.845820331946015} {"Full-finetune/Learning Rate": 1.941665334784823e-05, "Full-finetune/Loss": 0.8839406967163086, "Full-finetune/Loss (Raw)": 0.6550949215888977, "Full-finetune/Step": 706, "Full-finetune/Step Time": 6.848631182685494} {"Full-finetune/Learning Rate": 1.9414554940728963e-05, "Full-finetune/Loss": 0.8844606876373291, "Full-finetune/Loss (Raw)": 0.8252257108688354, "Full-finetune/Step": 707, "Full-finetune/Step Time": 6.834234591573477} {"Full-finetune/Learning Rate": 1.9412452880004728e-05, "Full-finetune/Loss": 0.8852076530456543, "Full-finetune/Loss (Raw)": 1.051755428314209, "Full-finetune/Step": 708, "Full-finetune/Step Time": 6.839970089495182} {"Full-finetune/Learning Rate": 1.941034716649129e-05, "Full-finetune/Loss": 0.8836636543273926, "Full-finetune/Loss (Raw)": 0.8123522996902466, "Full-finetune/Step": 709, "Full-finetune/Step Time": 6.830362541601062} {"Full-finetune/Learning Rate": 1.9408237801005837e-05, "Full-finetune/Loss": 0.882276177406311, "Full-finetune/Loss (Raw)": 0.820190966129303, "Full-finetune/Step": 710, "Full-finetune/Step Time": 6.818919388577342} {"Full-finetune/Learning Rate": 1.9406124784366976e-05, "Full-finetune/Loss": 0.8832330703735352, "Full-finetune/Loss (Raw)": 0.9166146516799927, "Full-finetune/Step": 711, "Full-finetune/Step Time": 6.833177458494902} {"Full-finetune/Learning Rate": 1.9404008117394726e-05, "Full-finetune/Loss": 0.8809194564819336, "Full-finetune/Loss (Raw)": 0.6082762479782104, "Full-finetune/Step": 712, "Full-finetune/Step Time": 6.843723848462105} {"Full-finetune/Learning Rate": 1.9401887800910525e-05, "Full-finetune/Loss": 0.8804992437362671, "Full-finetune/Loss (Raw)": 0.9169090390205383, "Full-finetune/Step": 713, "Full-finetune/Step Time": 6.84423609264195} {"Full-finetune/Learning Rate": 1.939976383573722e-05, "Full-finetune/Loss": 0.8839859366416931, "Full-finetune/Loss (Raw)": 0.7814944386482239, "Full-finetune/Step": 714, "Full-finetune/Step Time": 6.83168912678957} {"Full-finetune/Learning Rate": 1.9397636222699088e-05, "Full-finetune/Loss": 0.8835098743438721, "Full-finetune/Loss (Raw)": 1.004761815071106, "Full-finetune/Step": 715, "Full-finetune/Step Time": 6.830757953226566} {"Full-finetune/Learning Rate": 1.939550496262181e-05, "Full-finetune/Loss": 0.8834320306777954, "Full-finetune/Loss (Raw)": 0.7854014039039612, "Full-finetune/Step": 716, "Full-finetune/Step Time": 6.805957909673452} {"Full-finetune/Learning Rate": 1.939337005633249e-05, "Full-finetune/Loss": 0.8832484483718872, "Full-finetune/Loss (Raw)": 0.977277934551239, "Full-finetune/Step": 717, "Full-finetune/Step Time": 6.818448657169938} {"Full-finetune/Learning Rate": 1.939123150465964e-05, "Full-finetune/Loss": 0.8824193477630615, "Full-finetune/Loss (Raw)": 0.9262658953666687, "Full-finetune/Step": 718, "Full-finetune/Step Time": 6.822634195908904} {"Full-finetune/Learning Rate": 1.938908930843319e-05, "Full-finetune/Loss": 0.8832932710647583, "Full-finetune/Loss (Raw)": 0.9436445236206055, "Full-finetune/Step": 719, "Full-finetune/Step Time": 6.823497470468283} {"Full-finetune/Learning Rate": 1.9386943468484487e-05, "Full-finetune/Loss": 0.8847248554229736, "Full-finetune/Loss (Raw)": 1.0659809112548828, "Full-finetune/Step": 720, "Full-finetune/Step Time": 6.825896956026554} {"Full-finetune/Learning Rate": 1.938479398564629e-05, "Full-finetune/Loss": 0.8845428228378296, "Full-finetune/Loss (Raw)": 0.8424922823905945, "Full-finetune/Step": 721, "Full-finetune/Step Time": 6.829932099208236} {"Full-finetune/Learning Rate": 1.938264086075277e-05, "Full-finetune/Loss": 0.8840877413749695, "Full-finetune/Loss (Raw)": 0.8657420873641968, "Full-finetune/Step": 722, "Full-finetune/Step Time": 6.856620520353317} {"Full-finetune/Learning Rate": 1.938048409463951e-05, "Full-finetune/Loss": 0.8845993280410767, "Full-finetune/Loss (Raw)": 1.0113807916641235, "Full-finetune/Step": 723, "Full-finetune/Step Time": 6.85412591136992} {"Full-finetune/Learning Rate": 1.9378323688143515e-05, "Full-finetune/Loss": 0.885631263256073, "Full-finetune/Loss (Raw)": 0.9626774191856384, "Full-finetune/Step": 724, "Full-finetune/Step Time": 6.869696134701371} {"Full-finetune/Learning Rate": 1.937615964210319e-05, "Full-finetune/Loss": 0.8878486752510071, "Full-finetune/Loss (Raw)": 1.068687081336975, "Full-finetune/Step": 725, "Full-finetune/Step Time": 6.86883787997067} {"Full-finetune/Learning Rate": 1.9373991957358362e-05, "Full-finetune/Loss": 0.8858273029327393, "Full-finetune/Loss (Raw)": 0.6095180511474609, "Full-finetune/Step": 726, "Full-finetune/Step Time": 6.857156842947006} {"Full-finetune/Learning Rate": 1.9371820634750266e-05, "Full-finetune/Loss": 0.8854572772979736, "Full-finetune/Loss (Raw)": 0.9198462963104248, "Full-finetune/Step": 727, "Full-finetune/Step Time": 6.863920448347926} {"Full-finetune/Learning Rate": 1.9369645675121554e-05, "Full-finetune/Loss": 0.8859850764274597, "Full-finetune/Loss (Raw)": 1.0456531047821045, "Full-finetune/Step": 728, "Full-finetune/Step Time": 6.863139241933823} {"Full-finetune/Learning Rate": 1.936746707931628e-05, "Full-finetune/Loss": 0.88334059715271, "Full-finetune/Loss (Raw)": 0.5003182888031006, "Full-finetune/Step": 729, "Full-finetune/Step Time": 6.852692319080234} {"Full-finetune/Learning Rate": 1.9365284848179917e-05, "Full-finetune/Loss": 0.8832918405532837, "Full-finetune/Loss (Raw)": 0.9391049146652222, "Full-finetune/Step": 730, "Full-finetune/Step Time": 6.856535730883479} {"Full-finetune/Learning Rate": 1.9363098982559346e-05, "Full-finetune/Loss": 0.8846721053123474, "Full-finetune/Loss (Raw)": 0.9341213703155518, "Full-finetune/Step": 731, "Full-finetune/Step Time": 6.863549441099167} {"Full-finetune/Learning Rate": 1.9360909483302862e-05, "Full-finetune/Loss": 0.8832029104232788, "Full-finetune/Loss (Raw)": 0.7964363098144531, "Full-finetune/Step": 732, "Full-finetune/Step Time": 6.894514111801982} {"Full-finetune/Learning Rate": 1.9358716351260164e-05, "Full-finetune/Loss": 0.8837887048721313, "Full-finetune/Loss (Raw)": 0.860491156578064, "Full-finetune/Step": 733, "Full-finetune/Step Time": 6.8925083838403225} {"Full-finetune/Learning Rate": 1.935651958728236e-05, "Full-finetune/Loss": 0.8835006952285767, "Full-finetune/Loss (Raw)": 0.7768095135688782, "Full-finetune/Step": 734, "Full-finetune/Step Time": 6.880415972322226} {"Full-finetune/Learning Rate": 1.9354319192221975e-05, "Full-finetune/Loss": 0.8840289115905762, "Full-finetune/Loss (Raw)": 0.7462282776832581, "Full-finetune/Step": 735, "Full-finetune/Step Time": 6.858019633218646} {"Full-finetune/Learning Rate": 1.9352115166932943e-05, "Full-finetune/Loss": 0.8830690383911133, "Full-finetune/Loss (Raw)": 0.8825016617774963, "Full-finetune/Step": 736, "Full-finetune/Step Time": 6.903074413537979} {"Full-finetune/Learning Rate": 1.9349907512270597e-05, "Full-finetune/Loss": 0.8847223520278931, "Full-finetune/Loss (Raw)": 1.0272835493087769, "Full-finetune/Step": 737, "Full-finetune/Step Time": 6.908897114917636} {"Full-finetune/Learning Rate": 1.9347696229091685e-05, "Full-finetune/Loss": 0.885157585144043, "Full-finetune/Loss (Raw)": 0.9537962079048157, "Full-finetune/Step": 738, "Full-finetune/Step Time": 6.905960761010647} {"Full-finetune/Learning Rate": 1.934548131825437e-05, "Full-finetune/Loss": 0.8815264701843262, "Full-finetune/Loss (Raw)": 0.44126471877098083, "Full-finetune/Step": 739, "Full-finetune/Step Time": 6.928459761664271} {"Full-finetune/Learning Rate": 1.9343262780618206e-05, "Full-finetune/Loss": 0.881168782711029, "Full-finetune/Loss (Raw)": 1.0419554710388184, "Full-finetune/Step": 740, "Full-finetune/Step Time": 6.930437874048948} {"Full-finetune/Learning Rate": 1.934104061704417e-05, "Full-finetune/Loss": 0.8805669546127319, "Full-finetune/Loss (Raw)": 0.6735942959785461, "Full-finetune/Step": 741, "Full-finetune/Step Time": 6.949691338464618} {"Full-finetune/Learning Rate": 1.9338814828394638e-05, "Full-finetune/Loss": 0.8802128434181213, "Full-finetune/Loss (Raw)": 0.8882978558540344, "Full-finetune/Step": 742, "Full-finetune/Step Time": 6.954925751313567} {"Full-finetune/Learning Rate": 1.9336585415533398e-05, "Full-finetune/Loss": 0.8809472322463989, "Full-finetune/Loss (Raw)": 1.0022343397140503, "Full-finetune/Step": 743, "Full-finetune/Step Time": 6.949239017441869} {"Full-finetune/Learning Rate": 1.9334352379325638e-05, "Full-finetune/Loss": 0.8810640573501587, "Full-finetune/Loss (Raw)": 0.940126895904541, "Full-finetune/Step": 744, "Full-finetune/Step Time": 6.950596088543534} {"Full-finetune/Learning Rate": 1.9332115720637957e-05, "Full-finetune/Loss": 0.8798332214355469, "Full-finetune/Loss (Raw)": 0.7684877514839172, "Full-finetune/Step": 745, "Full-finetune/Step Time": 6.9692642372101545} {"Full-finetune/Learning Rate": 1.9329875440338363e-05, "Full-finetune/Loss": 0.8804630041122437, "Full-finetune/Loss (Raw)": 1.0068155527114868, "Full-finetune/Step": 746, "Full-finetune/Step Time": 6.960570691153407} {"Full-finetune/Learning Rate": 1.9327631539296258e-05, "Full-finetune/Loss": 0.8818063139915466, "Full-finetune/Loss (Raw)": 1.011658787727356, "Full-finetune/Step": 747, "Full-finetune/Step Time": 6.931144241243601} {"Full-finetune/Learning Rate": 1.932538401838246e-05, "Full-finetune/Loss": 0.8823630809783936, "Full-finetune/Loss (Raw)": 1.0153398513793945, "Full-finetune/Step": 748, "Full-finetune/Step Time": 6.933192644268274} {"Full-finetune/Learning Rate": 1.9323132878469185e-05, "Full-finetune/Loss": 0.8817772269248962, "Full-finetune/Loss (Raw)": 0.8490450382232666, "Full-finetune/Step": 749, "Full-finetune/Step Time": 6.933891294524074} {"Full-finetune/Learning Rate": 1.9320878120430063e-05, "Full-finetune/Loss": 0.8814784288406372, "Full-finetune/Loss (Raw)": 0.8412390351295471, "Full-finetune/Step": 750, "Full-finetune/Step Time": 6.939841004088521} {"Full-finetune/Learning Rate": 1.9318619745140115e-05, "Full-finetune/Loss": 0.8799142837524414, "Full-finetune/Loss (Raw)": 0.7560241222381592, "Full-finetune/Step": 751, "Full-finetune/Step Time": 6.942830011248589} {"Full-finetune/Learning Rate": 1.9316357753475776e-05, "Full-finetune/Loss": 0.880413293838501, "Full-finetune/Loss (Raw)": 0.9822270274162292, "Full-finetune/Step": 752, "Full-finetune/Step Time": 6.944229809567332} {"Full-finetune/Learning Rate": 1.9314092146314872e-05, "Full-finetune/Loss": 0.8760019540786743, "Full-finetune/Loss (Raw)": 0.3902059495449066, "Full-finetune/Step": 753, "Full-finetune/Step Time": 6.960533292964101} {"Full-finetune/Learning Rate": 1.9311822924536656e-05, "Full-finetune/Loss": 0.874578595161438, "Full-finetune/Loss (Raw)": 0.7944117188453674, "Full-finetune/Step": 754, "Full-finetune/Step Time": 6.960605842992663} {"Full-finetune/Learning Rate": 1.930955008902176e-05, "Full-finetune/Loss": 0.873191237449646, "Full-finetune/Loss (Raw)": 0.7409770488739014, "Full-finetune/Step": 755, "Full-finetune/Step Time": 6.982270002365112} {"Full-finetune/Learning Rate": 1.9307273640652228e-05, "Full-finetune/Loss": 0.873108983039856, "Full-finetune/Loss (Raw)": 0.8487803936004639, "Full-finetune/Step": 756, "Full-finetune/Step Time": 6.979007301852107} {"Full-finetune/Learning Rate": 1.9304993580311505e-05, "Full-finetune/Loss": 0.8723006248474121, "Full-finetune/Loss (Raw)": 0.8303804993629456, "Full-finetune/Step": 757, "Full-finetune/Step Time": 6.99170171096921} {"Full-finetune/Learning Rate": 1.9302709908884437e-05, "Full-finetune/Loss": 0.8715806603431702, "Full-finetune/Loss (Raw)": 0.9952816963195801, "Full-finetune/Step": 758, "Full-finetune/Step Time": 7.0001465901732445} {"Full-finetune/Learning Rate": 1.9300422627257275e-05, "Full-finetune/Loss": 0.8730804920196533, "Full-finetune/Loss (Raw)": 0.948029100894928, "Full-finetune/Step": 759, "Full-finetune/Step Time": 6.99998171441257} {"Full-finetune/Learning Rate": 1.9298131736317666e-05, "Full-finetune/Loss": 0.8722119927406311, "Full-finetune/Loss (Raw)": 0.9131321907043457, "Full-finetune/Step": 760, "Full-finetune/Step Time": 6.9936150796711445} {"Full-finetune/Learning Rate": 1.929583723695466e-05, "Full-finetune/Loss": 0.8704874515533447, "Full-finetune/Loss (Raw)": 0.9055092930793762, "Full-finetune/Step": 761, "Full-finetune/Step Time": 6.986708000302315} {"Full-finetune/Learning Rate": 1.9293539130058708e-05, "Full-finetune/Loss": 0.8669590950012207, "Full-finetune/Loss (Raw)": 0.36507588624954224, "Full-finetune/Step": 762, "Full-finetune/Step Time": 7.011457359418273} {"Full-finetune/Learning Rate": 1.9291237416521662e-05, "Full-finetune/Loss": 0.8654763102531433, "Full-finetune/Loss (Raw)": 0.7506616115570068, "Full-finetune/Step": 763, "Full-finetune/Step Time": 7.015238465741277} {"Full-finetune/Learning Rate": 1.9288932097236772e-05, "Full-finetune/Loss": 0.8651211261749268, "Full-finetune/Loss (Raw)": 0.860686182975769, "Full-finetune/Step": 764, "Full-finetune/Step Time": 6.993360774591565} {"Full-finetune/Learning Rate": 1.9286623173098683e-05, "Full-finetune/Loss": 0.8643162846565247, "Full-finetune/Loss (Raw)": 0.9003136157989502, "Full-finetune/Step": 765, "Full-finetune/Step Time": 6.997152408584952} {"Full-finetune/Learning Rate": 1.928431064500345e-05, "Full-finetune/Loss": 0.8645120859146118, "Full-finetune/Loss (Raw)": 0.9942727088928223, "Full-finetune/Step": 766, "Full-finetune/Step Time": 7.015309173613787} {"Full-finetune/Learning Rate": 1.9281994513848515e-05, "Full-finetune/Loss": 0.8644769787788391, "Full-finetune/Loss (Raw)": 0.8822233080863953, "Full-finetune/Step": 767, "Full-finetune/Step Time": 7.024326166138053} {"Full-finetune/Learning Rate": 1.9279674780532726e-05, "Full-finetune/Loss": 0.8640515804290771, "Full-finetune/Loss (Raw)": 0.8479058742523193, "Full-finetune/Step": 768, "Full-finetune/Step Time": 7.03386277705431} {"Full-finetune/Learning Rate": 1.9277351445956323e-05, "Full-finetune/Loss": 0.8632379770278931, "Full-finetune/Loss (Raw)": 0.7295022010803223, "Full-finetune/Step": 769, "Full-finetune/Step Time": 7.041397463530302} {"Full-finetune/Learning Rate": 1.927502451102095e-05, "Full-finetune/Loss": 0.8672598600387573, "Full-finetune/Loss (Raw)": 0.8572632670402527, "Full-finetune/Step": 770, "Full-finetune/Step Time": 7.030682412907481} {"Full-finetune/Learning Rate": 1.9272693976629642e-05, "Full-finetune/Loss": 0.8680388927459717, "Full-finetune/Loss (Raw)": 0.9910414814949036, "Full-finetune/Step": 771, "Full-finetune/Step Time": 7.024990951642394} {"Full-finetune/Learning Rate": 1.9270359843686837e-05, "Full-finetune/Loss": 0.8678065538406372, "Full-finetune/Loss (Raw)": 0.919678807258606, "Full-finetune/Step": 772, "Full-finetune/Step Time": 7.0186149422079325} {"Full-finetune/Learning Rate": 1.9268022113098366e-05, "Full-finetune/Loss": 0.8674279451370239, "Full-finetune/Loss (Raw)": 0.960158109664917, "Full-finetune/Step": 773, "Full-finetune/Step Time": 7.017497573047876} {"Full-finetune/Learning Rate": 1.9265680785771455e-05, "Full-finetune/Loss": 0.8661585450172424, "Full-finetune/Loss (Raw)": 0.7590470910072327, "Full-finetune/Step": 774, "Full-finetune/Step Time": 7.027669671922922} {"Full-finetune/Learning Rate": 1.926333586261473e-05, "Full-finetune/Loss": 0.8670678734779358, "Full-finetune/Loss (Raw)": 0.9618148803710938, "Full-finetune/Step": 775, "Full-finetune/Step Time": 7.030967751517892} {"Full-finetune/Learning Rate": 1.9260987344538205e-05, "Full-finetune/Loss": 0.8651084899902344, "Full-finetune/Loss (Raw)": 0.6858706474304199, "Full-finetune/Step": 776, "Full-finetune/Step Time": 7.0323069747537374} {"Full-finetune/Learning Rate": 1.9258635232453296e-05, "Full-finetune/Loss": 0.8664741516113281, "Full-finetune/Loss (Raw)": 1.0047070980072021, "Full-finetune/Step": 777, "Full-finetune/Step Time": 7.04891231097281} {"Full-finetune/Learning Rate": 1.9256279527272815e-05, "Full-finetune/Loss": 0.8677282333374023, "Full-finetune/Loss (Raw)": 0.9810360074043274, "Full-finetune/Step": 778, "Full-finetune/Step Time": 7.0340971276164055} {"Full-finetune/Learning Rate": 1.9253920229910966e-05, "Full-finetune/Loss": 0.8675527572631836, "Full-finetune/Loss (Raw)": 0.8724190592765808, "Full-finetune/Step": 779, "Full-finetune/Step Time": 7.031088825315237} {"Full-finetune/Learning Rate": 1.925155734128334e-05, "Full-finetune/Loss": 0.8631770014762878, "Full-finetune/Loss (Raw)": 0.32114365696907043, "Full-finetune/Step": 780, "Full-finetune/Step Time": 7.048901479691267} {"Full-finetune/Learning Rate": 1.9249190862306935e-05, "Full-finetune/Loss": 0.8628628253936768, "Full-finetune/Loss (Raw)": 0.8276313543319702, "Full-finetune/Step": 781, "Full-finetune/Step Time": 7.049033593386412} {"Full-finetune/Learning Rate": 1.9246820793900127e-05, "Full-finetune/Loss": 0.8585001230239868, "Full-finetune/Loss (Raw)": 0.5857914686203003, "Full-finetune/Step": 782, "Full-finetune/Step Time": 7.0785021763294935} {"Full-finetune/Learning Rate": 1.92444471369827e-05, "Full-finetune/Loss": 0.8584246039390564, "Full-finetune/Loss (Raw)": 0.8502863049507141, "Full-finetune/Step": 783, "Full-finetune/Step Time": 7.110319329425693} {"Full-finetune/Learning Rate": 1.924206989247582e-05, "Full-finetune/Loss": 0.8567048907279968, "Full-finetune/Loss (Raw)": 0.6291731595993042, "Full-finetune/Step": 784, "Full-finetune/Step Time": 7.1272804364562035} {"Full-finetune/Learning Rate": 1.9239689061302053e-05, "Full-finetune/Loss": 0.8579168319702148, "Full-finetune/Loss (Raw)": 0.9750915765762329, "Full-finetune/Step": 785, "Full-finetune/Step Time": 7.122702023014426} {"Full-finetune/Learning Rate": 1.923730464438535e-05, "Full-finetune/Loss": 0.8586033582687378, "Full-finetune/Loss (Raw)": 1.003953218460083, "Full-finetune/Step": 786, "Full-finetune/Step Time": 7.12005315348506} {"Full-finetune/Learning Rate": 1.923491664265106e-05, "Full-finetune/Loss": 0.8604633212089539, "Full-finetune/Loss (Raw)": 0.9426641464233398, "Full-finetune/Step": 787, "Full-finetune/Step Time": 7.124617420136929} {"Full-finetune/Learning Rate": 1.9232525057025915e-05, "Full-finetune/Loss": 0.86052006483078, "Full-finetune/Loss (Raw)": 1.0272443294525146, "Full-finetune/Step": 788, "Full-finetune/Step Time": 7.121066149324179} {"Full-finetune/Learning Rate": 1.9230129888438046e-05, "Full-finetune/Loss": 0.8606244325637817, "Full-finetune/Loss (Raw)": 0.9257156252861023, "Full-finetune/Step": 789, "Full-finetune/Step Time": 7.120172681286931} {"Full-finetune/Learning Rate": 1.922773113781697e-05, "Full-finetune/Loss": 0.8573826551437378, "Full-finetune/Loss (Raw)": 0.5655542016029358, "Full-finetune/Step": 790, "Full-finetune/Step Time": 7.159611029550433} {"Full-finetune/Learning Rate": 1.9225328806093596e-05, "Full-finetune/Loss": 0.8564245104789734, "Full-finetune/Loss (Raw)": 0.8576481938362122, "Full-finetune/Step": 791, "Full-finetune/Step Time": 7.171044362708926} {"Full-finetune/Learning Rate": 1.922292289420022e-05, "Full-finetune/Loss": 0.8557848930358887, "Full-finetune/Loss (Raw)": 0.778968095779419, "Full-finetune/Step": 792, "Full-finetune/Step Time": 7.172749120742083} {"Full-finetune/Learning Rate": 1.9220513403070534e-05, "Full-finetune/Loss": 0.8548524379730225, "Full-finetune/Loss (Raw)": 0.8811410665512085, "Full-finetune/Step": 793, "Full-finetune/Step Time": 7.175344796851277} {"Full-finetune/Learning Rate": 1.9218100333639608e-05, "Full-finetune/Loss": 0.8530852794647217, "Full-finetune/Loss (Raw)": 0.8464410901069641, "Full-finetune/Step": 794, "Full-finetune/Step Time": 7.17749160528183} {"Full-finetune/Learning Rate": 1.9215683686843912e-05, "Full-finetune/Loss": 0.8526065945625305, "Full-finetune/Loss (Raw)": 0.9178581833839417, "Full-finetune/Step": 795, "Full-finetune/Step Time": 7.181297034025192} {"Full-finetune/Learning Rate": 1.92132634636213e-05, "Full-finetune/Loss": 0.8535414338111877, "Full-finetune/Loss (Raw)": 0.8797513842582703, "Full-finetune/Step": 796, "Full-finetune/Step Time": 7.177702968940139} {"Full-finetune/Learning Rate": 1.9210839664911013e-05, "Full-finetune/Loss": 0.8530200123786926, "Full-finetune/Loss (Raw)": 0.8696637749671936, "Full-finetune/Step": 797, "Full-finetune/Step Time": 7.184747712686658} {"Full-finetune/Learning Rate": 1.9208412291653674e-05, "Full-finetune/Loss": 0.8538609743118286, "Full-finetune/Loss (Raw)": 0.9524098038673401, "Full-finetune/Step": 798, "Full-finetune/Step Time": 7.186182228848338} {"Full-finetune/Learning Rate": 1.9205981344791307e-05, "Full-finetune/Loss": 0.8531873226165771, "Full-finetune/Loss (Raw)": 0.7929261326789856, "Full-finetune/Step": 799, "Full-finetune/Step Time": 7.193658724427223} {"Full-finetune/Learning Rate": 1.9203546825267313e-05, "Full-finetune/Loss": 0.8528482913970947, "Full-finetune/Loss (Raw)": 0.9064124822616577, "Full-finetune/Step": 800, "Full-finetune/Step Time": 7.199292229488492} {"Full-finetune/Learning Rate": 1.9201108734026477e-05, "Full-finetune/Loss": 0.8522375226020813, "Full-finetune/Loss (Raw)": 0.9450014233589172, "Full-finetune/Step": 801, "Full-finetune/Step Time": 7.223139299079776} {"Full-finetune/Learning Rate": 1.9198667072014978e-05, "Full-finetune/Loss": 0.8503739833831787, "Full-finetune/Loss (Raw)": 0.8166287541389465, "Full-finetune/Step": 802, "Full-finetune/Step Time": 7.227332388982177} {"Full-finetune/Learning Rate": 1.9196221840180378e-05, "Full-finetune/Loss": 0.8485125303268433, "Full-finetune/Loss (Raw)": 0.7227751016616821, "Full-finetune/Step": 803, "Full-finetune/Step Time": 7.233147298917174} {"Full-finetune/Learning Rate": 1.9193773039471622e-05, "Full-finetune/Loss": 0.8480836153030396, "Full-finetune/Loss (Raw)": 0.8971449732780457, "Full-finetune/Step": 804, "Full-finetune/Step Time": 7.224605668336153} {"Full-finetune/Learning Rate": 1.9191320670839047e-05, "Full-finetune/Loss": 0.8492369055747986, "Full-finetune/Loss (Raw)": 0.9156063199043274, "Full-finetune/Step": 805, "Full-finetune/Step Time": 7.195298615843058} {"Full-finetune/Learning Rate": 1.918886473523436e-05, "Full-finetune/Loss": 0.8470188975334167, "Full-finetune/Loss (Raw)": 0.7237497568130493, "Full-finetune/Step": 806, "Full-finetune/Step Time": 7.198719713836908} {"Full-finetune/Learning Rate": 1.918640523361067e-05, "Full-finetune/Loss": 0.8458812832832336, "Full-finetune/Loss (Raw)": 0.8730517029762268, "Full-finetune/Step": 807, "Full-finetune/Step Time": 7.191186409443617} {"Full-finetune/Learning Rate": 1.9183942166922455e-05, "Full-finetune/Loss": 0.8458694219589233, "Full-finetune/Loss (Raw)": 0.8475238084793091, "Full-finetune/Step": 808, "Full-finetune/Step Time": 7.2114292830228806} {"Full-finetune/Learning Rate": 1.9181475536125588e-05, "Full-finetune/Loss": 0.8453009724617004, "Full-finetune/Loss (Raw)": 0.9014059901237488, "Full-finetune/Step": 809, "Full-finetune/Step Time": 7.225035509094596} {"Full-finetune/Learning Rate": 1.917900534217732e-05, "Full-finetune/Loss": 0.8454068899154663, "Full-finetune/Loss (Raw)": 0.9963365197181702, "Full-finetune/Step": 810, "Full-finetune/Step Time": 7.208323819562793} {"Full-finetune/Learning Rate": 1.9176531586036282e-05, "Full-finetune/Loss": 0.8434902429580688, "Full-finetune/Loss (Raw)": 0.7808930277824402, "Full-finetune/Step": 811, "Full-finetune/Step Time": 7.205140875652432} {"Full-finetune/Learning Rate": 1.917405426866249e-05, "Full-finetune/Loss": 0.8455095291137695, "Full-finetune/Loss (Raw)": 1.0848654508590698, "Full-finetune/Step": 812, "Full-finetune/Step Time": 7.202825576066971} {"Full-finetune/Learning Rate": 1.9171573391017348e-05, "Full-finetune/Loss": 0.8473668098449707, "Full-finetune/Loss (Raw)": 0.9138243794441223, "Full-finetune/Step": 813, "Full-finetune/Step Time": 7.190301293507218} {"Full-finetune/Learning Rate": 1.9169088954063634e-05, "Full-finetune/Loss": 0.8483433723449707, "Full-finetune/Loss (Raw)": 0.8675591349601746, "Full-finetune/Step": 814, "Full-finetune/Step Time": 7.179303698241711} {"Full-finetune/Learning Rate": 1.9166600958765508e-05, "Full-finetune/Loss": 0.848336935043335, "Full-finetune/Loss (Raw)": 0.8765888214111328, "Full-finetune/Step": 815, "Full-finetune/Step Time": 7.1836222764104605} {"Full-finetune/Learning Rate": 1.916410940608851e-05, "Full-finetune/Loss": 0.8488202095031738, "Full-finetune/Loss (Raw)": 0.9607887864112854, "Full-finetune/Step": 816, "Full-finetune/Step Time": 7.183138890191913} {"Full-finetune/Learning Rate": 1.9161614296999565e-05, "Full-finetune/Loss": 0.8518182039260864, "Full-finetune/Loss (Raw)": 0.9364319443702698, "Full-finetune/Step": 817, "Full-finetune/Step Time": 7.172475781291723} {"Full-finetune/Learning Rate": 1.9159115632466978e-05, "Full-finetune/Loss": 0.8489142656326294, "Full-finetune/Loss (Raw)": 0.3188316822052002, "Full-finetune/Step": 818, "Full-finetune/Step Time": 7.15221256390214} {"Full-finetune/Learning Rate": 1.9156613413460432e-05, "Full-finetune/Loss": 0.8470548391342163, "Full-finetune/Loss (Raw)": 0.7327389717102051, "Full-finetune/Step": 819, "Full-finetune/Step Time": 7.152467809617519} {"Full-finetune/Learning Rate": 1.9154107640950986e-05, "Full-finetune/Loss": 0.8457680344581604, "Full-finetune/Loss (Raw)": 0.6237791776657104, "Full-finetune/Step": 820, "Full-finetune/Step Time": 7.133815975859761} {"Full-finetune/Learning Rate": 1.9151598315911088e-05, "Full-finetune/Loss": 0.8462754487991333, "Full-finetune/Loss (Raw)": 0.8548267483711243, "Full-finetune/Step": 821, "Full-finetune/Step Time": 7.134425580501556} {"Full-finetune/Learning Rate": 1.9149085439314548e-05, "Full-finetune/Loss": 0.8497250080108643, "Full-finetune/Loss (Raw)": 0.828140914440155, "Full-finetune/Step": 822, "Full-finetune/Step Time": 7.109656071290374} {"Full-finetune/Learning Rate": 1.9146569012136572e-05, "Full-finetune/Loss": 0.8520875573158264, "Full-finetune/Loss (Raw)": 1.022911548614502, "Full-finetune/Step": 823, "Full-finetune/Step Time": 7.095734246075153} {"Full-finetune/Learning Rate": 1.914404903535373e-05, "Full-finetune/Loss": 0.851629376411438, "Full-finetune/Loss (Raw)": 0.9407528042793274, "Full-finetune/Step": 824, "Full-finetune/Step Time": 7.093244846910238} {"Full-finetune/Learning Rate": 1.9141525509943987e-05, "Full-finetune/Loss": 0.8519376516342163, "Full-finetune/Loss (Raw)": 0.8418594598770142, "Full-finetune/Step": 825, "Full-finetune/Step Time": 7.084149727597833} {"Full-finetune/Learning Rate": 1.9138998436886664e-05, "Full-finetune/Loss": 0.8495744466781616, "Full-finetune/Loss (Raw)": 0.7482596039772034, "Full-finetune/Step": 826, "Full-finetune/Step Time": 7.09017032943666} {"Full-finetune/Learning Rate": 1.913646781716247e-05, "Full-finetune/Loss": 0.8475818634033203, "Full-finetune/Loss (Raw)": 0.8277970552444458, "Full-finetune/Step": 827, "Full-finetune/Step Time": 7.076582105830312} {"Full-finetune/Learning Rate": 1.9133933651753493e-05, "Full-finetune/Loss": 0.8440682888031006, "Full-finetune/Loss (Raw)": 0.3671785295009613, "Full-finetune/Step": 828, "Full-finetune/Step Time": 7.0747878439724445} {"Full-finetune/Learning Rate": 1.913139594164319e-05, "Full-finetune/Loss": 0.8483130931854248, "Full-finetune/Loss (Raw)": 0.8435959219932556, "Full-finetune/Step": 829, "Full-finetune/Step Time": 7.069210691377521} {"Full-finetune/Learning Rate": 1.9128854687816394e-05, "Full-finetune/Loss": 0.8485041856765747, "Full-finetune/Loss (Raw)": 0.9020389318466187, "Full-finetune/Step": 830, "Full-finetune/Step Time": 7.0669221095740795} {"Full-finetune/Learning Rate": 1.9126309891259324e-05, "Full-finetune/Loss": 0.8493243455886841, "Full-finetune/Loss (Raw)": 0.84846031665802, "Full-finetune/Step": 831, "Full-finetune/Step Time": 7.072074549272656} {"Full-finetune/Learning Rate": 1.9123761552959562e-05, "Full-finetune/Loss": 0.8496110439300537, "Full-finetune/Loss (Raw)": 0.9770663976669312, "Full-finetune/Step": 832, "Full-finetune/Step Time": 7.052938366308808} {"Full-finetune/Learning Rate": 1.9121209673906064e-05, "Full-finetune/Loss": 0.8455312252044678, "Full-finetune/Loss (Raw)": 0.4090763330459595, "Full-finetune/Step": 833, "Full-finetune/Step Time": 7.072774758562446} {"Full-finetune/Learning Rate": 1.911865425508917e-05, "Full-finetune/Loss": 0.8475568294525146, "Full-finetune/Loss (Raw)": 0.9143770933151245, "Full-finetune/Step": 834, "Full-finetune/Step Time": 7.0810725428164005} {"Full-finetune/Learning Rate": 1.9116095297500588e-05, "Full-finetune/Loss": 0.848028302192688, "Full-finetune/Loss (Raw)": 0.8855724930763245, "Full-finetune/Step": 835, "Full-finetune/Step Time": 7.08629147708416} {"Full-finetune/Learning Rate": 1.9113532802133394e-05, "Full-finetune/Loss": 0.8466398119926453, "Full-finetune/Loss (Raw)": 0.8740335702896118, "Full-finetune/Step": 836, "Full-finetune/Step Time": 7.080330688506365} {"Full-finetune/Learning Rate": 1.911096676998205e-05, "Full-finetune/Loss": 0.8462015986442566, "Full-finetune/Loss (Raw)": 0.7562603950500488, "Full-finetune/Step": 837, "Full-finetune/Step Time": 7.0903244614601135} {"Full-finetune/Learning Rate": 1.9108397202042376e-05, "Full-finetune/Loss": 0.8462622165679932, "Full-finetune/Loss (Raw)": 0.8279524445533752, "Full-finetune/Step": 838, "Full-finetune/Step Time": 7.095017395913601} {"Full-finetune/Learning Rate": 1.910582409931158e-05, "Full-finetune/Loss": 0.845253586769104, "Full-finetune/Loss (Raw)": 0.7875076532363892, "Full-finetune/Step": 839, "Full-finetune/Step Time": 7.0866104159504175} {"Full-finetune/Learning Rate": 1.910324746278822e-05, "Full-finetune/Loss": 0.8484809398651123, "Full-finetune/Loss (Raw)": 1.0213737487792969, "Full-finetune/Step": 840, "Full-finetune/Step Time": 7.074801616370678} {"Full-finetune/Learning Rate": 1.9100667293472252e-05, "Full-finetune/Loss": 0.8476752042770386, "Full-finetune/Loss (Raw)": 0.8137821555137634, "Full-finetune/Step": 841, "Full-finetune/Step Time": 7.0785350240767} {"Full-finetune/Learning Rate": 1.9098083592364976e-05, "Full-finetune/Loss": 0.8489007949829102, "Full-finetune/Loss (Raw)": 0.9383625388145447, "Full-finetune/Step": 842, "Full-finetune/Step Time": 7.077905463054776} {"Full-finetune/Learning Rate": 1.9095496360469087e-05, "Full-finetune/Loss": 0.8481073379516602, "Full-finetune/Loss (Raw)": 0.9032053351402283, "Full-finetune/Step": 843, "Full-finetune/Step Time": 7.090231269598007} {"Full-finetune/Learning Rate": 1.9092905598788633e-05, "Full-finetune/Loss": 0.8486159443855286, "Full-finetune/Loss (Raw)": 0.8504963517189026, "Full-finetune/Step": 844, "Full-finetune/Step Time": 7.091156980022788} {"Full-finetune/Learning Rate": 1.9090311308329045e-05, "Full-finetune/Loss": 0.848273754119873, "Full-finetune/Loss (Raw)": 0.9334849119186401, "Full-finetune/Step": 845, "Full-finetune/Step Time": 7.087590225040913} {"Full-finetune/Learning Rate": 1.9087713490097108e-05, "Full-finetune/Loss": 0.8484689593315125, "Full-finetune/Loss (Raw)": 0.9512501955032349, "Full-finetune/Step": 846, "Full-finetune/Step Time": 7.078859277069569} {"Full-finetune/Learning Rate": 1.9085112145100987e-05, "Full-finetune/Loss": 0.8446696996688843, "Full-finetune/Loss (Raw)": 0.4573451280593872, "Full-finetune/Step": 847, "Full-finetune/Step Time": 7.096722036600113} {"Full-finetune/Learning Rate": 1.9082507274350216e-05, "Full-finetune/Loss": 0.8423013687133789, "Full-finetune/Loss (Raw)": 0.7628253698348999, "Full-finetune/Step": 848, "Full-finetune/Step Time": 7.108946124091744} {"Full-finetune/Learning Rate": 1.9079898878855695e-05, "Full-finetune/Loss": 0.8428103923797607, "Full-finetune/Loss (Raw)": 0.907648503780365, "Full-finetune/Step": 849, "Full-finetune/Step Time": 7.08560542948544} {"Full-finetune/Learning Rate": 1.9077286959629684e-05, "Full-finetune/Loss": 0.8423296809196472, "Full-finetune/Loss (Raw)": 0.8042100071907043, "Full-finetune/Step": 850, "Full-finetune/Step Time": 7.078926069661975} {"Full-finetune/Learning Rate": 1.907467151768583e-05, "Full-finetune/Loss": 0.8415775299072266, "Full-finetune/Loss (Raw)": 0.9151127934455872, "Full-finetune/Step": 851, "Full-finetune/Step Time": 7.085340259596705} {"Full-finetune/Learning Rate": 1.9072052554039123e-05, "Full-finetune/Loss": 0.8400803804397583, "Full-finetune/Loss (Raw)": 0.7710402011871338, "Full-finetune/Step": 852, "Full-finetune/Step Time": 7.068289192393422} {"Full-finetune/Learning Rate": 1.9069430069705936e-05, "Full-finetune/Loss": 0.8386111259460449, "Full-finetune/Loss (Raw)": 0.8806215524673462, "Full-finetune/Step": 853, "Full-finetune/Step Time": 7.0639893040061} {"Full-finetune/Learning Rate": 1.9066804065704006e-05, "Full-finetune/Loss": 0.8403326272964478, "Full-finetune/Loss (Raw)": 0.8298673033714294, "Full-finetune/Step": 854, "Full-finetune/Step Time": 7.065345864742994} {"Full-finetune/Learning Rate": 1.9064174543052435e-05, "Full-finetune/Loss": 0.8381751179695129, "Full-finetune/Loss (Raw)": 0.6436862349510193, "Full-finetune/Step": 855, "Full-finetune/Step Time": 7.099756104871631} {"Full-finetune/Learning Rate": 1.9061541502771682e-05, "Full-finetune/Loss": 0.8368605375289917, "Full-finetune/Loss (Raw)": 0.8773874640464783, "Full-finetune/Step": 856, "Full-finetune/Step Time": 7.096923869103193} {"Full-finetune/Learning Rate": 1.905890494588359e-05, "Full-finetune/Loss": 0.8392270803451538, "Full-finetune/Loss (Raw)": 0.8032346963882446, "Full-finetune/Step": 857, "Full-finetune/Step Time": 7.086165769025683} {"Full-finetune/Learning Rate": 1.9056264873411343e-05, "Full-finetune/Loss": 0.8404742479324341, "Full-finetune/Loss (Raw)": 1.0987412929534912, "Full-finetune/Step": 858, "Full-finetune/Step Time": 7.082712510600686} {"Full-finetune/Learning Rate": 1.905362128637951e-05, "Full-finetune/Loss": 0.840508222579956, "Full-finetune/Loss (Raw)": 0.9384785294532776, "Full-finetune/Step": 859, "Full-finetune/Step Time": 7.085709044709802} {"Full-finetune/Learning Rate": 1.905097418581401e-05, "Full-finetune/Loss": 0.8408373594284058, "Full-finetune/Loss (Raw)": 0.8385508060455322, "Full-finetune/Step": 860, "Full-finetune/Step Time": 7.054319102317095} {"Full-finetune/Learning Rate": 1.904832357274214e-05, "Full-finetune/Loss": 0.8390163779258728, "Full-finetune/Loss (Raw)": 0.6274107098579407, "Full-finetune/Step": 861, "Full-finetune/Step Time": 7.043558983132243} {"Full-finetune/Learning Rate": 1.9045669448192537e-05, "Full-finetune/Loss": 0.8400412797927856, "Full-finetune/Loss (Raw)": 0.9079996347427368, "Full-finetune/Step": 862, "Full-finetune/Step Time": 7.0464111771434546} {"Full-finetune/Learning Rate": 1.904301181319523e-05, "Full-finetune/Loss": 0.8397895693778992, "Full-finetune/Loss (Raw)": 0.7140152454376221, "Full-finetune/Step": 863, "Full-finetune/Step Time": 7.051672229543328} {"Full-finetune/Learning Rate": 1.9040350668781584e-05, "Full-finetune/Loss": 0.8403133153915405, "Full-finetune/Loss (Raw)": 0.9495348930358887, "Full-finetune/Step": 864, "Full-finetune/Step Time": 7.010057657957077} {"Full-finetune/Learning Rate": 1.9037686015984343e-05, "Full-finetune/Loss": 0.8388509750366211, "Full-finetune/Loss (Raw)": 0.8401051163673401, "Full-finetune/Step": 865, "Full-finetune/Step Time": 7.021776106208563} {"Full-finetune/Learning Rate": 1.9035017855837604e-05, "Full-finetune/Loss": 0.8393340110778809, "Full-finetune/Loss (Raw)": 1.0156193971633911, "Full-finetune/Step": 866, "Full-finetune/Step Time": 7.0332984663546085} {"Full-finetune/Learning Rate": 1.9032346189376828e-05, "Full-finetune/Loss": 0.8435502052307129, "Full-finetune/Loss (Raw)": 0.9809436798095703, "Full-finetune/Step": 867, "Full-finetune/Step Time": 7.014464840292931} {"Full-finetune/Learning Rate": 1.902967101763884e-05, "Full-finetune/Loss": 0.8418097496032715, "Full-finetune/Loss (Raw)": 0.8191748261451721, "Full-finetune/Step": 868, "Full-finetune/Step Time": 7.007206032052636} {"Full-finetune/Learning Rate": 1.902699234166182e-05, "Full-finetune/Loss": 0.844354510307312, "Full-finetune/Loss (Raw)": 0.9993219375610352, "Full-finetune/Step": 869, "Full-finetune/Step Time": 6.997834250330925} {"Full-finetune/Learning Rate": 1.9024310162485308e-05, "Full-finetune/Loss": 0.8436610698699951, "Full-finetune/Loss (Raw)": 0.7995332479476929, "Full-finetune/Step": 870, "Full-finetune/Step Time": 7.001348050311208} {"Full-finetune/Learning Rate": 1.9021624481150208e-05, "Full-finetune/Loss": 0.8413547873497009, "Full-finetune/Loss (Raw)": 0.7070363163948059, "Full-finetune/Step": 871, "Full-finetune/Step Time": 7.004685111343861} {"Full-finetune/Learning Rate": 1.9018935298698777e-05, "Full-finetune/Loss": 0.8409415483474731, "Full-finetune/Loss (Raw)": 0.8872360587120056, "Full-finetune/Step": 872, "Full-finetune/Step Time": 7.0051426980644464} {"Full-finetune/Learning Rate": 1.9016242616174637e-05, "Full-finetune/Loss": 0.8424394726753235, "Full-finetune/Loss (Raw)": 0.9602194428443909, "Full-finetune/Step": 873, "Full-finetune/Step Time": 6.987962547689676} {"Full-finetune/Learning Rate": 1.9013546434622766e-05, "Full-finetune/Loss": 0.8404502868652344, "Full-finetune/Loss (Raw)": 0.7521988749504089, "Full-finetune/Step": 874, "Full-finetune/Step Time": 6.99296104349196} {"Full-finetune/Learning Rate": 1.90108467550895e-05, "Full-finetune/Loss": 0.8387041091918945, "Full-finetune/Loss (Raw)": 0.7881515622138977, "Full-finetune/Step": 875, "Full-finetune/Step Time": 7.004391750320792} {"Full-finetune/Learning Rate": 1.9008143578622527e-05, "Full-finetune/Loss": 0.8375203609466553, "Full-finetune/Loss (Raw)": 0.8638110756874084, "Full-finetune/Step": 876, "Full-finetune/Step Time": 7.0054258573800325} {"Full-finetune/Learning Rate": 1.9005436906270902e-05, "Full-finetune/Loss": 0.8377388119697571, "Full-finetune/Loss (Raw)": 0.877013623714447, "Full-finetune/Step": 877, "Full-finetune/Step Time": 6.993189884349704} {"Full-finetune/Learning Rate": 1.9002726739085027e-05, "Full-finetune/Loss": 0.838047981262207, "Full-finetune/Loss (Raw)": 0.8808093667030334, "Full-finetune/Step": 878, "Full-finetune/Step Time": 6.986254269257188} {"Full-finetune/Learning Rate": 1.900001307811667e-05, "Full-finetune/Loss": 0.8385120034217834, "Full-finetune/Loss (Raw)": 0.8154240846633911, "Full-finetune/Step": 879, "Full-finetune/Step Time": 7.006396947428584} {"Full-finetune/Learning Rate": 1.899729592441895e-05, "Full-finetune/Loss": 0.8374610543251038, "Full-finetune/Loss (Raw)": 0.8476981520652771, "Full-finetune/Step": 880, "Full-finetune/Step Time": 7.0103839710354805} {"Full-finetune/Learning Rate": 1.899457527904634e-05, "Full-finetune/Loss": 0.8397330045700073, "Full-finetune/Loss (Raw)": 0.6810210347175598, "Full-finetune/Step": 881, "Full-finetune/Step Time": 7.00653094984591} {"Full-finetune/Learning Rate": 1.8991851143054662e-05, "Full-finetune/Loss": 0.8403365015983582, "Full-finetune/Loss (Raw)": 0.8716558218002319, "Full-finetune/Step": 882, "Full-finetune/Step Time": 7.006704807281494} {"Full-finetune/Learning Rate": 1.8989123517501112e-05, "Full-finetune/Loss": 0.8421928882598877, "Full-finetune/Loss (Raw)": 0.9785974025726318, "Full-finetune/Step": 883, "Full-finetune/Step Time": 6.978250177577138} {"Full-finetune/Learning Rate": 1.8986392403444222e-05, "Full-finetune/Loss": 0.843359112739563, "Full-finetune/Loss (Raw)": 0.9980534911155701, "Full-finetune/Step": 884, "Full-finetune/Step Time": 6.9786939304322} {"Full-finetune/Learning Rate": 1.8983657801943884e-05, "Full-finetune/Loss": 0.8386197090148926, "Full-finetune/Loss (Raw)": 0.22374732792377472, "Full-finetune/Step": 885, "Full-finetune/Step Time": 6.984416134655476} {"Full-finetune/Learning Rate": 1.8980919714061343e-05, "Full-finetune/Loss": 0.837682843208313, "Full-finetune/Loss (Raw)": 0.8753587603569031, "Full-finetune/Step": 886, "Full-finetune/Step Time": 6.988092754036188} {"Full-finetune/Learning Rate": 1.89781781408592e-05, "Full-finetune/Loss": 0.8333420753479004, "Full-finetune/Loss (Raw)": 0.39241108298301697, "Full-finetune/Step": 887, "Full-finetune/Step Time": 7.014899510890245} {"Full-finetune/Learning Rate": 1.8975433083401403e-05, "Full-finetune/Loss": 0.833800733089447, "Full-finetune/Loss (Raw)": 0.9718345999717712, "Full-finetune/Step": 888, "Full-finetune/Step Time": 7.02084144949913} {"Full-finetune/Learning Rate": 1.897268454275326e-05, "Full-finetune/Loss": 0.8338832855224609, "Full-finetune/Loss (Raw)": 0.9160822629928589, "Full-finetune/Step": 889, "Full-finetune/Step Time": 7.026156943291426} {"Full-finetune/Learning Rate": 1.896993251998142e-05, "Full-finetune/Loss": 0.8378349542617798, "Full-finetune/Loss (Raw)": 0.8708889484405518, "Full-finetune/Step": 890, "Full-finetune/Step Time": 7.0035196132957935} {"Full-finetune/Learning Rate": 1.8967177016153895e-05, "Full-finetune/Loss": 0.8388253450393677, "Full-finetune/Loss (Raw)": 0.8774260878562927, "Full-finetune/Step": 891, "Full-finetune/Step Time": 7.007338508963585} {"Full-finetune/Learning Rate": 1.8964418032340037e-05, "Full-finetune/Loss": 0.8384125232696533, "Full-finetune/Loss (Raw)": 0.8078460097312927, "Full-finetune/Step": 892, "Full-finetune/Step Time": 7.0106876995414495} {"Full-finetune/Learning Rate": 1.8961655569610557e-05, "Full-finetune/Loss": 0.8390368223190308, "Full-finetune/Loss (Raw)": 0.9802236557006836, "Full-finetune/Step": 893, "Full-finetune/Step Time": 7.007214825600386} {"Full-finetune/Learning Rate": 1.8958889629037514e-05, "Full-finetune/Loss": 0.8385117053985596, "Full-finetune/Loss (Raw)": 0.9270586967468262, "Full-finetune/Step": 894, "Full-finetune/Step Time": 6.991791378706694} {"Full-finetune/Learning Rate": 1.895612021169431e-05, "Full-finetune/Loss": 0.8377838134765625, "Full-finetune/Loss (Raw)": 0.7890506982803345, "Full-finetune/Step": 895, "Full-finetune/Step Time": 6.998422987759113} {"Full-finetune/Learning Rate": 1.8953347318655704e-05, "Full-finetune/Loss": 0.8384360074996948, "Full-finetune/Loss (Raw)": 0.9313889145851135, "Full-finetune/Step": 896, "Full-finetune/Step Time": 6.991317169740796} {"Full-finetune/Learning Rate": 1.8950570950997808e-05, "Full-finetune/Loss": 0.837955117225647, "Full-finetune/Loss (Raw)": 0.6679542660713196, "Full-finetune/Step": 897, "Full-finetune/Step Time": 6.995175840333104} {"Full-finetune/Learning Rate": 1.894779110979807e-05, "Full-finetune/Loss": 0.8341006636619568, "Full-finetune/Loss (Raw)": 0.36388349533081055, "Full-finetune/Step": 898, "Full-finetune/Step Time": 7.015927407890558} {"Full-finetune/Learning Rate": 1.894500779613529e-05, "Full-finetune/Loss": 0.8323959112167358, "Full-finetune/Loss (Raw)": 0.7728416323661804, "Full-finetune/Step": 899, "Full-finetune/Step Time": 7.050039684399962} {"Full-finetune/Learning Rate": 1.8942221011089623e-05, "Full-finetune/Loss": 0.8326734900474548, "Full-finetune/Loss (Raw)": 0.9552048444747925, "Full-finetune/Step": 900, "Full-finetune/Step Time": 7.060354169458151} {"Full-finetune/Learning Rate": 1.8939430755742564e-05, "Full-finetune/Loss": 0.8330340385437012, "Full-finetune/Loss (Raw)": 1.0063111782073975, "Full-finetune/Step": 901, "Full-finetune/Step Time": 7.0664770398288965} {"Full-finetune/Learning Rate": 1.8936637031176957e-05, "Full-finetune/Loss": 0.834048867225647, "Full-finetune/Loss (Raw)": 0.8889395594596863, "Full-finetune/Step": 902, "Full-finetune/Step Time": 7.049973905086517} {"Full-finetune/Learning Rate": 1.893383983847699e-05, "Full-finetune/Loss": 0.8335601091384888, "Full-finetune/Loss (Raw)": 0.899250328540802, "Full-finetune/Step": 903, "Full-finetune/Step Time": 7.060114361345768} {"Full-finetune/Learning Rate": 1.89310391787282e-05, "Full-finetune/Loss": 0.8345785140991211, "Full-finetune/Loss (Raw)": 0.8162302374839783, "Full-finetune/Step": 904, "Full-finetune/Step Time": 7.056717487052083} {"Full-finetune/Learning Rate": 1.892823505301747e-05, "Full-finetune/Loss": 0.8343425989151001, "Full-finetune/Loss (Raw)": 0.9745155572891235, "Full-finetune/Step": 905, "Full-finetune/Step Time": 7.037207555025816} {"Full-finetune/Learning Rate": 1.8925427462433027e-05, "Full-finetune/Loss": 0.8330181837081909, "Full-finetune/Loss (Raw)": 0.8115028738975525, "Full-finetune/Step": 906, "Full-finetune/Step Time": 7.035074852406979} {"Full-finetune/Learning Rate": 1.8922616408064436e-05, "Full-finetune/Loss": 0.8334544897079468, "Full-finetune/Loss (Raw)": 0.928266167640686, "Full-finetune/Step": 907, "Full-finetune/Step Time": 7.023092927411199} {"Full-finetune/Learning Rate": 1.8919801891002615e-05, "Full-finetune/Loss": 0.8379799723625183, "Full-finetune/Loss (Raw)": 0.9004080891609192, "Full-finetune/Step": 908, "Full-finetune/Step Time": 7.005412302911282} {"Full-finetune/Learning Rate": 1.891698391233983e-05, "Full-finetune/Loss": 0.8380682468414307, "Full-finetune/Loss (Raw)": 0.838925838470459, "Full-finetune/Step": 909, "Full-finetune/Step Time": 7.0104570761322975} {"Full-finetune/Learning Rate": 1.8914162473169676e-05, "Full-finetune/Loss": 0.8402101397514343, "Full-finetune/Loss (Raw)": 0.8599622845649719, "Full-finetune/Step": 910, "Full-finetune/Step Time": 6.9830782897770405} {"Full-finetune/Learning Rate": 1.8911337574587098e-05, "Full-finetune/Loss": 0.8402556777000427, "Full-finetune/Loss (Raw)": 0.8561065196990967, "Full-finetune/Step": 911, "Full-finetune/Step Time": 6.9576727245002985} {"Full-finetune/Learning Rate": 1.8908509217688387e-05, "Full-finetune/Loss": 0.8430522680282593, "Full-finetune/Loss (Raw)": 0.987143337726593, "Full-finetune/Step": 912, "Full-finetune/Step Time": 6.949814546853304} {"Full-finetune/Learning Rate": 1.8905677403571177e-05, "Full-finetune/Loss": 0.8404112458229065, "Full-finetune/Loss (Raw)": 0.6370416879653931, "Full-finetune/Step": 913, "Full-finetune/Step Time": 6.9447109419852495} {"Full-finetune/Learning Rate": 1.890284213333443e-05, "Full-finetune/Loss": 0.8408346176147461, "Full-finetune/Loss (Raw)": 1.0581353902816772, "Full-finetune/Step": 914, "Full-finetune/Step Time": 6.948774224147201} {"Full-finetune/Learning Rate": 1.8900003408078468e-05, "Full-finetune/Loss": 0.8406933546066284, "Full-finetune/Loss (Raw)": 0.924593985080719, "Full-finetune/Step": 915, "Full-finetune/Step Time": 6.921964479610324} {"Full-finetune/Learning Rate": 1.889716122890494e-05, "Full-finetune/Loss": 0.8399548530578613, "Full-finetune/Loss (Raw)": 0.9327144622802734, "Full-finetune/Step": 916, "Full-finetune/Step Time": 6.9290347173810005} {"Full-finetune/Learning Rate": 1.889431559691684e-05, "Full-finetune/Loss": 0.840866208076477, "Full-finetune/Loss (Raw)": 1.0423587560653687, "Full-finetune/Step": 917, "Full-finetune/Step Time": 6.9703715573996305} {"Full-finetune/Learning Rate": 1.8891466513218507e-05, "Full-finetune/Loss": 0.8430820107460022, "Full-finetune/Loss (Raw)": 0.8491820693016052, "Full-finetune/Step": 918, "Full-finetune/Step Time": 6.938204374164343} {"Full-finetune/Learning Rate": 1.888861397891561e-05, "Full-finetune/Loss": 0.8411051034927368, "Full-finetune/Loss (Raw)": 0.604600191116333, "Full-finetune/Step": 919, "Full-finetune/Step Time": 6.952615750953555} {"Full-finetune/Learning Rate": 1.888575799511516e-05, "Full-finetune/Loss": 0.8407760262489319, "Full-finetune/Loss (Raw)": 0.736855685710907, "Full-finetune/Step": 920, "Full-finetune/Step Time": 6.949133509770036} {"Full-finetune/Learning Rate": 1.888289856292552e-05, "Full-finetune/Loss": 0.8412550091743469, "Full-finetune/Loss (Raw)": 0.9424515962600708, "Full-finetune/Step": 921, "Full-finetune/Step Time": 6.9384299255907536} {"Full-finetune/Learning Rate": 1.8880035683456365e-05, "Full-finetune/Loss": 0.8412360548973083, "Full-finetune/Loss (Raw)": 0.8440099954605103, "Full-finetune/Step": 922, "Full-finetune/Step Time": 6.937602769583464} {"Full-finetune/Learning Rate": 1.887716935781873e-05, "Full-finetune/Loss": 0.8414863348007202, "Full-finetune/Loss (Raw)": 0.9498958587646484, "Full-finetune/Step": 923, "Full-finetune/Step Time": 6.929125647991896} {"Full-finetune/Learning Rate": 1.887429958712498e-05, "Full-finetune/Loss": 0.8409214019775391, "Full-finetune/Loss (Raw)": 0.8074380159378052, "Full-finetune/Step": 924, "Full-finetune/Step Time": 6.937614373862743} {"Full-finetune/Learning Rate": 1.8871426372488818e-05, "Full-finetune/Loss": 0.8398748636245728, "Full-finetune/Loss (Raw)": 0.7357010245323181, "Full-finetune/Step": 925, "Full-finetune/Step Time": 6.956451402977109} {"Full-finetune/Learning Rate": 1.886854971502528e-05, "Full-finetune/Loss": 0.8373492956161499, "Full-finetune/Loss (Raw)": 0.6291388869285583, "Full-finetune/Step": 926, "Full-finetune/Step Time": 6.961366679519415} {"Full-finetune/Learning Rate": 1.886566961585074e-05, "Full-finetune/Loss": 0.8380071520805359, "Full-finetune/Loss (Raw)": 0.8771345019340515, "Full-finetune/Step": 927, "Full-finetune/Step Time": 6.953933887183666} {"Full-finetune/Learning Rate": 1.886278607608291e-05, "Full-finetune/Loss": 0.8380848169326782, "Full-finetune/Loss (Raw)": 0.9163574576377869, "Full-finetune/Step": 928, "Full-finetune/Step Time": 6.945969607681036} {"Full-finetune/Learning Rate": 1.8859899096840836e-05, "Full-finetune/Loss": 0.8374101519584656, "Full-finetune/Loss (Raw)": 0.8586468696594238, "Full-finetune/Step": 929, "Full-finetune/Step Time": 6.923026621341705} {"Full-finetune/Learning Rate": 1.8857008679244897e-05, "Full-finetune/Loss": 0.8373703956604004, "Full-finetune/Loss (Raw)": 0.811532199382782, "Full-finetune/Step": 930, "Full-finetune/Step Time": 6.9269226882606745} {"Full-finetune/Learning Rate": 1.885411482441681e-05, "Full-finetune/Loss": 0.838887095451355, "Full-finetune/Loss (Raw)": 0.916919469833374, "Full-finetune/Step": 931, "Full-finetune/Step Time": 6.908398086205125} {"Full-finetune/Learning Rate": 1.885121753347962e-05, "Full-finetune/Loss": 0.8393413424491882, "Full-finetune/Loss (Raw)": 0.9552868008613586, "Full-finetune/Step": 932, "Full-finetune/Step Time": 6.9146995190531015} {"Full-finetune/Learning Rate": 1.884831680755771e-05, "Full-finetune/Loss": 0.8388177156448364, "Full-finetune/Loss (Raw)": 0.8485837578773499, "Full-finetune/Step": 933, "Full-finetune/Step Time": 6.924797559157014} {"Full-finetune/Learning Rate": 1.8845412647776795e-05, "Full-finetune/Loss": 0.8405444025993347, "Full-finetune/Loss (Raw)": 0.9447615742683411, "Full-finetune/Step": 934, "Full-finetune/Step Time": 6.911794442683458} {"Full-finetune/Learning Rate": 1.8842505055263928e-05, "Full-finetune/Loss": 0.8390686511993408, "Full-finetune/Loss (Raw)": 0.6841520667076111, "Full-finetune/Step": 935, "Full-finetune/Step Time": 6.911527192220092} {"Full-finetune/Learning Rate": 1.883959403114748e-05, "Full-finetune/Loss": 0.8385943174362183, "Full-finetune/Loss (Raw)": 0.7868145108222961, "Full-finetune/Step": 936, "Full-finetune/Step Time": 6.9040263295173645} {"Full-finetune/Learning Rate": 1.8836679576557165e-05, "Full-finetune/Loss": 0.8395937085151672, "Full-finetune/Loss (Raw)": 1.029332160949707, "Full-finetune/Step": 937, "Full-finetune/Step Time": 6.88930974714458} {"Full-finetune/Learning Rate": 1.8833761692624034e-05, "Full-finetune/Loss": 0.840013325214386, "Full-finetune/Loss (Raw)": 1.0500447750091553, "Full-finetune/Step": 938, "Full-finetune/Step Time": 6.893530126661062} {"Full-finetune/Learning Rate": 1.883084038048045e-05, "Full-finetune/Loss": 0.8405816555023193, "Full-finetune/Loss (Raw)": 0.8536391258239746, "Full-finetune/Step": 939, "Full-finetune/Step Time": 6.894495809450746} {"Full-finetune/Learning Rate": 1.8827915641260127e-05, "Full-finetune/Loss": 0.8395532369613647, "Full-finetune/Loss (Raw)": 0.9532318115234375, "Full-finetune/Step": 940, "Full-finetune/Step Time": 6.896943151950836} {"Full-finetune/Learning Rate": 1.882498747609809e-05, "Full-finetune/Loss": 0.8393895626068115, "Full-finetune/Loss (Raw)": 0.8928717374801636, "Full-finetune/Step": 941, "Full-finetune/Step Time": 6.895858947187662} {"Full-finetune/Learning Rate": 1.8822055886130708e-05, "Full-finetune/Loss": 0.8380579948425293, "Full-finetune/Loss (Raw)": 0.6971122622489929, "Full-finetune/Step": 942, "Full-finetune/Step Time": 6.902901206165552} {"Full-finetune/Learning Rate": 1.8819120872495675e-05, "Full-finetune/Loss": 0.8380779027938843, "Full-finetune/Loss (Raw)": 0.8791397213935852, "Full-finetune/Step": 943, "Full-finetune/Step Time": 6.902292715385556} {"Full-finetune/Learning Rate": 1.8816182436332006e-05, "Full-finetune/Loss": 0.8369951248168945, "Full-finetune/Loss (Raw)": 0.8221933245658875, "Full-finetune/Step": 944, "Full-finetune/Step Time": 6.897806107997894} {"Full-finetune/Learning Rate": 1.881324057878006e-05, "Full-finetune/Loss": 0.8358473181724548, "Full-finetune/Loss (Raw)": 0.7895200848579407, "Full-finetune/Step": 945, "Full-finetune/Step Time": 6.918344859033823} {"Full-finetune/Learning Rate": 1.8810295300981504e-05, "Full-finetune/Loss": 0.8389818072319031, "Full-finetune/Loss (Raw)": 0.7200405597686768, "Full-finetune/Step": 946, "Full-finetune/Step Time": 6.916854171082377} {"Full-finetune/Learning Rate": 1.8807346604079352e-05, "Full-finetune/Loss": 0.8397329449653625, "Full-finetune/Loss (Raw)": 0.828881561756134, "Full-finetune/Step": 947, "Full-finetune/Step Time": 6.935632508248091} {"Full-finetune/Learning Rate": 1.880439448921793e-05, "Full-finetune/Loss": 0.8378921747207642, "Full-finetune/Loss (Raw)": 0.3881644904613495, "Full-finetune/Step": 948, "Full-finetune/Step Time": 6.943372460082173} {"Full-finetune/Learning Rate": 1.88014389575429e-05, "Full-finetune/Loss": 0.8392380475997925, "Full-finetune/Loss (Raw)": 1.0271023511886597, "Full-finetune/Step": 949, "Full-finetune/Step Time": 6.928166365250945} {"Full-finetune/Learning Rate": 1.879848001020124e-05, "Full-finetune/Loss": 0.8394824862480164, "Full-finetune/Loss (Raw)": 0.8594223260879517, "Full-finetune/Step": 950, "Full-finetune/Step Time": 6.925377165898681} {"Full-finetune/Learning Rate": 1.8795517648341267e-05, "Full-finetune/Loss": 0.8398760557174683, "Full-finetune/Loss (Raw)": 1.0732876062393188, "Full-finetune/Step": 951, "Full-finetune/Step Time": 6.918237404897809} {"Full-finetune/Learning Rate": 1.8792551873112614e-05, "Full-finetune/Loss": 0.8387736082077026, "Full-finetune/Loss (Raw)": 0.799640953540802, "Full-finetune/Step": 952, "Full-finetune/Step Time": 6.923158334568143} {"Full-finetune/Learning Rate": 1.8789582685666237e-05, "Full-finetune/Loss": 0.8391285538673401, "Full-finetune/Loss (Raw)": 0.887294352054596, "Full-finetune/Step": 953, "Full-finetune/Step Time": 6.914960755035281} {"Full-finetune/Learning Rate": 1.878661008715442e-05, "Full-finetune/Loss": 0.8397729396820068, "Full-finetune/Loss (Raw)": 0.830738365650177, "Full-finetune/Step": 954, "Full-finetune/Step Time": 6.91154495254159} {"Full-finetune/Learning Rate": 1.8783634078730774e-05, "Full-finetune/Loss": 0.8402318358421326, "Full-finetune/Loss (Raw)": 0.8865348100662231, "Full-finetune/Step": 955, "Full-finetune/Step Time": 6.9104711022228} {"Full-finetune/Learning Rate": 1.878065466155023e-05, "Full-finetune/Loss": 0.8445972204208374, "Full-finetune/Loss (Raw)": 0.9259505271911621, "Full-finetune/Step": 956, "Full-finetune/Step Time": 6.894188839942217} {"Full-finetune/Learning Rate": 1.877767183676904e-05, "Full-finetune/Loss": 0.8444763422012329, "Full-finetune/Loss (Raw)": 0.8281223177909851, "Full-finetune/Step": 957, "Full-finetune/Step Time": 6.890467597171664} {"Full-finetune/Learning Rate": 1.8774685605544776e-05, "Full-finetune/Loss": 0.8439532518386841, "Full-finetune/Loss (Raw)": 0.8350881934165955, "Full-finetune/Step": 958, "Full-finetune/Step Time": 6.897140244022012} {"Full-finetune/Learning Rate": 1.8771695969036342e-05, "Full-finetune/Loss": 0.8432170152664185, "Full-finetune/Loss (Raw)": 0.7542129755020142, "Full-finetune/Step": 959, "Full-finetune/Step Time": 6.8783975057303905} {"Full-finetune/Learning Rate": 1.8768702928403954e-05, "Full-finetune/Loss": 0.8423997759819031, "Full-finetune/Loss (Raw)": 0.8724664449691772, "Full-finetune/Step": 960, "Full-finetune/Step Time": 6.880343317985535} {"Full-finetune/Learning Rate": 1.8765706484809155e-05, "Full-finetune/Loss": 0.8451558947563171, "Full-finetune/Loss (Raw)": 0.7618628144264221, "Full-finetune/Step": 961, "Full-finetune/Step Time": 6.861659187823534} {"Full-finetune/Learning Rate": 1.8762706639414806e-05, "Full-finetune/Loss": 0.845646321773529, "Full-finetune/Loss (Raw)": 0.9771454930305481, "Full-finetune/Step": 962, "Full-finetune/Step Time": 6.857798928394914} {"Full-finetune/Learning Rate": 1.8759703393385087e-05, "Full-finetune/Loss": 0.8453026413917542, "Full-finetune/Loss (Raw)": 0.8415825366973877, "Full-finetune/Step": 963, "Full-finetune/Step Time": 6.850355288013816} {"Full-finetune/Learning Rate": 1.87566967478855e-05, "Full-finetune/Loss": 0.8451893329620361, "Full-finetune/Loss (Raw)": 0.8595267534255981, "Full-finetune/Step": 964, "Full-finetune/Step Time": 6.849129166454077} {"Full-finetune/Learning Rate": 1.8753686704082868e-05, "Full-finetune/Loss": 0.8450813293457031, "Full-finetune/Loss (Raw)": 0.7424429655075073, "Full-finetune/Step": 965, "Full-finetune/Step Time": 6.8535634726285934} {"Full-finetune/Learning Rate": 1.8750673263145323e-05, "Full-finetune/Loss": 0.8451600670814514, "Full-finetune/Loss (Raw)": 0.8380308151245117, "Full-finetune/Step": 966, "Full-finetune/Step Time": 6.8545436430722475} {"Full-finetune/Learning Rate": 1.874765642624233e-05, "Full-finetune/Loss": 0.8453052639961243, "Full-finetune/Loss (Raw)": 0.8060898184776306, "Full-finetune/Step": 967, "Full-finetune/Step Time": 6.858278781175613} {"Full-finetune/Learning Rate": 1.874463619454466e-05, "Full-finetune/Loss": 0.8446340560913086, "Full-finetune/Loss (Raw)": 0.9354658126831055, "Full-finetune/Step": 968, "Full-finetune/Step Time": 6.856315018609166} {"Full-finetune/Learning Rate": 1.874161256922441e-05, "Full-finetune/Loss": 0.8446008563041687, "Full-finetune/Loss (Raw)": 0.809524655342102, "Full-finetune/Step": 969, "Full-finetune/Step Time": 6.864026423543692} {"Full-finetune/Learning Rate": 1.8738585551454982e-05, "Full-finetune/Loss": 0.8416017293930054, "Full-finetune/Loss (Raw)": 0.5544684529304504, "Full-finetune/Step": 970, "Full-finetune/Step Time": 6.8700422290712595} {"Full-finetune/Learning Rate": 1.873555514241111e-05, "Full-finetune/Loss": 0.8413487672805786, "Full-finetune/Loss (Raw)": 0.8708372712135315, "Full-finetune/Step": 971, "Full-finetune/Step Time": 6.893948324024677} {"Full-finetune/Learning Rate": 1.8732521343268838e-05, "Full-finetune/Loss": 0.8376302719116211, "Full-finetune/Loss (Raw)": 0.37453025579452515, "Full-finetune/Step": 972, "Full-finetune/Step Time": 6.910900980234146} {"Full-finetune/Learning Rate": 1.8729484155205517e-05, "Full-finetune/Loss": 0.8364763259887695, "Full-finetune/Loss (Raw)": 0.7857756614685059, "Full-finetune/Step": 973, "Full-finetune/Step Time": 6.915748471394181} {"Full-finetune/Learning Rate": 1.8726443579399828e-05, "Full-finetune/Loss": 0.8354395627975464, "Full-finetune/Loss (Raw)": 0.8185429573059082, "Full-finetune/Step": 974, "Full-finetune/Step Time": 6.9312774091959} {"Full-finetune/Learning Rate": 1.8723399617031754e-05, "Full-finetune/Loss": 0.83977210521698, "Full-finetune/Loss (Raw)": 1.011914610862732, "Full-finetune/Step": 975, "Full-finetune/Step Time": 6.924415493384004} {"Full-finetune/Learning Rate": 1.8720352269282592e-05, "Full-finetune/Loss": 0.8404663801193237, "Full-finetune/Loss (Raw)": 0.8516960144042969, "Full-finetune/Step": 976, "Full-finetune/Step Time": 6.910149831324816} {"Full-finetune/Learning Rate": 1.8717301537334975e-05, "Full-finetune/Loss": 0.841032862663269, "Full-finetune/Loss (Raw)": 0.9801512956619263, "Full-finetune/Step": 977, "Full-finetune/Step Time": 6.917178258299828} {"Full-finetune/Learning Rate": 1.8714247422372816e-05, "Full-finetune/Loss": 0.8412870168685913, "Full-finetune/Loss (Raw)": 0.83674156665802, "Full-finetune/Step": 978, "Full-finetune/Step Time": 6.891792941838503} {"Full-finetune/Learning Rate": 1.8711189925581366e-05, "Full-finetune/Loss": 0.8407472372055054, "Full-finetune/Loss (Raw)": 0.8460249304771423, "Full-finetune/Step": 979, "Full-finetune/Step Time": 6.891928844153881} {"Full-finetune/Learning Rate": 1.8708129048147176e-05, "Full-finetune/Loss": 0.8428755402565002, "Full-finetune/Loss (Raw)": 1.0434575080871582, "Full-finetune/Step": 980, "Full-finetune/Step Time": 6.890594432130456} {"Full-finetune/Learning Rate": 1.8705064791258118e-05, "Full-finetune/Loss": 0.8426394462585449, "Full-finetune/Loss (Raw)": 0.8504013419151306, "Full-finetune/Step": 981, "Full-finetune/Step Time": 6.89126623980701} {"Full-finetune/Learning Rate": 1.870199715610336e-05, "Full-finetune/Loss": 0.843595564365387, "Full-finetune/Loss (Raw)": 0.9522560238838196, "Full-finetune/Step": 982, "Full-finetune/Step Time": 6.879958653822541} {"Full-finetune/Learning Rate": 1.8698926143873404e-05, "Full-finetune/Loss": 0.8456524014472961, "Full-finetune/Loss (Raw)": 0.906960129737854, "Full-finetune/Step": 983, "Full-finetune/Step Time": 6.844333365559578} {"Full-finetune/Learning Rate": 1.8695851755760042e-05, "Full-finetune/Loss": 0.8447455763816833, "Full-finetune/Loss (Raw)": 0.761313796043396, "Full-finetune/Step": 984, "Full-finetune/Step Time": 6.854094384238124} {"Full-finetune/Learning Rate": 1.8692773992956383e-05, "Full-finetune/Loss": 0.8453478813171387, "Full-finetune/Loss (Raw)": 0.8803253173828125, "Full-finetune/Step": 985, "Full-finetune/Step Time": 6.852780604735017} {"Full-finetune/Learning Rate": 1.8689692856656854e-05, "Full-finetune/Loss": 0.8428860902786255, "Full-finetune/Loss (Raw)": 0.783638060092926, "Full-finetune/Step": 986, "Full-finetune/Step Time": 6.856447756290436} {"Full-finetune/Learning Rate": 1.8686608348057178e-05, "Full-finetune/Loss": 0.8426113128662109, "Full-finetune/Loss (Raw)": 0.9033030867576599, "Full-finetune/Step": 987, "Full-finetune/Step Time": 6.853561567142606} {"Full-finetune/Learning Rate": 1.868352046835439e-05, "Full-finetune/Loss": 0.8413254618644714, "Full-finetune/Loss (Raw)": 0.6739636063575745, "Full-finetune/Step": 988, "Full-finetune/Step Time": 6.855844935402274} {"Full-finetune/Learning Rate": 1.8680429218746842e-05, "Full-finetune/Loss": 0.843798041343689, "Full-finetune/Loss (Raw)": 0.9438953399658203, "Full-finetune/Step": 989, "Full-finetune/Step Time": 6.860074123367667} {"Full-finetune/Learning Rate": 1.867733460043419e-05, "Full-finetune/Loss": 0.8415610790252686, "Full-finetune/Loss (Raw)": 0.6216749548912048, "Full-finetune/Step": 990, "Full-finetune/Step Time": 6.864043673500419} {"Full-finetune/Learning Rate": 1.8674236614617386e-05, "Full-finetune/Loss": 0.8434357643127441, "Full-finetune/Loss (Raw)": 0.9539679884910583, "Full-finetune/Step": 991, "Full-finetune/Step Time": 6.855322791263461} {"Full-finetune/Learning Rate": 1.86711352624987e-05, "Full-finetune/Loss": 0.8429291248321533, "Full-finetune/Loss (Raw)": 0.8846951127052307, "Full-finetune/Step": 992, "Full-finetune/Step Time": 6.852718431502581} {"Full-finetune/Learning Rate": 1.866803054528171e-05, "Full-finetune/Loss": 0.8428646326065063, "Full-finetune/Loss (Raw)": 0.8318454027175903, "Full-finetune/Step": 993, "Full-finetune/Step Time": 6.8628816511482} {"Full-finetune/Learning Rate": 1.8664922464171295e-05, "Full-finetune/Loss": 0.8401705622673035, "Full-finetune/Loss (Raw)": 0.6707755327224731, "Full-finetune/Step": 994, "Full-finetune/Step Time": 6.860531209036708} {"Full-finetune/Learning Rate": 1.866181102037364e-05, "Full-finetune/Loss": 0.8393481969833374, "Full-finetune/Loss (Raw)": 0.875686764717102, "Full-finetune/Step": 995, "Full-finetune/Step Time": 6.859330590814352} {"Full-finetune/Learning Rate": 1.8658696215096235e-05, "Full-finetune/Loss": 0.8390319347381592, "Full-finetune/Loss (Raw)": 0.7786822319030762, "Full-finetune/Step": 996, "Full-finetune/Step Time": 6.8633712492883205} {"Full-finetune/Learning Rate": 1.8655578049547878e-05, "Full-finetune/Loss": 0.8379201292991638, "Full-finetune/Loss (Raw)": 0.8570154905319214, "Full-finetune/Step": 997, "Full-finetune/Step Time": 6.843530040234327} {"Full-finetune/Learning Rate": 1.8652456524938665e-05, "Full-finetune/Loss": 0.8376870155334473, "Full-finetune/Loss (Raw)": 0.7696922421455383, "Full-finetune/Step": 998, "Full-finetune/Step Time": 6.856624823063612} {"Full-finetune/Learning Rate": 1.864933164248e-05, "Full-finetune/Loss": 0.8396921157836914, "Full-finetune/Loss (Raw)": 0.9636925458908081, "Full-finetune/Step": 999, "Full-finetune/Step Time": 6.860476324334741} {"Full-finetune/Learning Rate": 1.8646203403384583e-05, "Full-finetune/Loss": 0.8406932353973389, "Full-finetune/Loss (Raw)": 1.015376329421997, "Full-finetune/Step": 1000, "Full-finetune/Step Time": 6.8533825892955065} {"Full-finetune/Learning Rate": 1.8643071808866434e-05, "Full-finetune/Loss": 0.8357714414596558, "Full-finetune/Loss (Raw)": 0.3302309215068817, "Full-finetune/Step": 1001, "Full-finetune/Step Time": 6.87570714764297} {"Full-finetune/Learning Rate": 1.8639936860140856e-05, "Full-finetune/Loss": 0.8372925519943237, "Full-finetune/Loss (Raw)": 0.9468998908996582, "Full-finetune/Step": 1002, "Full-finetune/Step Time": 6.876164145767689} {"Full-finetune/Learning Rate": 1.8636798558424464e-05, "Full-finetune/Loss": 0.8386706113815308, "Full-finetune/Loss (Raw)": 0.9645431041717529, "Full-finetune/Step": 1003, "Full-finetune/Step Time": 6.8791300524026155} {"Full-finetune/Learning Rate": 1.8633656904935168e-05, "Full-finetune/Loss": 0.8395617008209229, "Full-finetune/Loss (Raw)": 0.9778708815574646, "Full-finetune/Step": 1004, "Full-finetune/Step Time": 6.879084974527359} {"Full-finetune/Learning Rate": 1.863051190089219e-05, "Full-finetune/Loss": 0.8397481441497803, "Full-finetune/Loss (Raw)": 0.9008845686912537, "Full-finetune/Step": 1005, "Full-finetune/Step Time": 6.872157227247953} {"Full-finetune/Learning Rate": 1.8627363547516032e-05, "Full-finetune/Loss": 0.838301420211792, "Full-finetune/Loss (Raw)": 0.695622444152832, "Full-finetune/Step": 1006, "Full-finetune/Step Time": 6.887046424672008} {"Full-finetune/Learning Rate": 1.8624211846028522e-05, "Full-finetune/Loss": 0.8384130001068115, "Full-finetune/Loss (Raw)": 0.8297087550163269, "Full-finetune/Step": 1007, "Full-finetune/Step Time": 6.868760261684656} {"Full-finetune/Learning Rate": 1.862105679765277e-05, "Full-finetune/Loss": 0.8388586640357971, "Full-finetune/Loss (Raw)": 0.9047447443008423, "Full-finetune/Step": 1008, "Full-finetune/Step Time": 6.867902608588338} {"Full-finetune/Learning Rate": 1.8617898403613183e-05, "Full-finetune/Loss": 0.836765468120575, "Full-finetune/Loss (Raw)": 0.41308850049972534, "Full-finetune/Step": 1009, "Full-finetune/Step Time": 6.872576730325818} {"Full-finetune/Learning Rate": 1.8614736665135476e-05, "Full-finetune/Loss": 0.8360344171524048, "Full-finetune/Loss (Raw)": 0.7780765891075134, "Full-finetune/Step": 1010, "Full-finetune/Step Time": 6.8749587293714285} {"Full-finetune/Learning Rate": 1.861157158344666e-05, "Full-finetune/Loss": 0.8347495794296265, "Full-finetune/Loss (Raw)": 0.81414794921875, "Full-finetune/Step": 1011, "Full-finetune/Step Time": 6.874326255172491} {"Full-finetune/Learning Rate": 1.8608403159775037e-05, "Full-finetune/Loss": 0.8342164754867554, "Full-finetune/Loss (Raw)": 0.9298110604286194, "Full-finetune/Step": 1012, "Full-finetune/Step Time": 6.880217297002673} {"Full-finetune/Learning Rate": 1.8605231395350213e-05, "Full-finetune/Loss": 0.8391900062561035, "Full-finetune/Loss (Raw)": 0.8603589534759521, "Full-finetune/Step": 1013, "Full-finetune/Step Time": 6.8605785593390465} {"Full-finetune/Learning Rate": 1.860205629140309e-05, "Full-finetune/Loss": 0.8400044441223145, "Full-finetune/Loss (Raw)": 0.979610025882721, "Full-finetune/Step": 1014, "Full-finetune/Step Time": 6.855934733524919} {"Full-finetune/Learning Rate": 1.8598877849165857e-05, "Full-finetune/Loss": 0.8393218517303467, "Full-finetune/Loss (Raw)": 0.30504029989242554, "Full-finetune/Step": 1015, "Full-finetune/Step Time": 6.849730679765344} {"Full-finetune/Learning Rate": 1.8595696069872013e-05, "Full-finetune/Loss": 0.838902473449707, "Full-finetune/Loss (Raw)": 0.9181560277938843, "Full-finetune/Step": 1016, "Full-finetune/Step Time": 6.848109060898423} {"Full-finetune/Learning Rate": 1.859251095475634e-05, "Full-finetune/Loss": 0.8394075632095337, "Full-finetune/Loss (Raw)": 0.9807249307632446, "Full-finetune/Step": 1017, "Full-finetune/Step Time": 6.849449794739485} {"Full-finetune/Learning Rate": 1.858932250505492e-05, "Full-finetune/Loss": 0.8390873074531555, "Full-finetune/Loss (Raw)": 0.8298999667167664, "Full-finetune/Step": 1018, "Full-finetune/Step Time": 6.8862391375005245} {"Full-finetune/Learning Rate": 1.8586130722005128e-05, "Full-finetune/Loss": 0.8387123942375183, "Full-finetune/Loss (Raw)": 0.8294403553009033, "Full-finetune/Step": 1019, "Full-finetune/Step Time": 6.883343186229467} {"Full-finetune/Learning Rate": 1.8582935606845636e-05, "Full-finetune/Loss": 0.839216947555542, "Full-finetune/Loss (Raw)": 0.8724236488342285, "Full-finetune/Step": 1020, "Full-finetune/Step Time": 6.879079112783074} {"Full-finetune/Learning Rate": 1.8579737160816397e-05, "Full-finetune/Loss": 0.8372489213943481, "Full-finetune/Loss (Raw)": 0.7283236384391785, "Full-finetune/Step": 1021, "Full-finetune/Step Time": 6.890674490481615} {"Full-finetune/Learning Rate": 1.8576535385158675e-05, "Full-finetune/Loss": 0.8367438316345215, "Full-finetune/Loss (Raw)": 0.8623982667922974, "Full-finetune/Step": 1022, "Full-finetune/Step Time": 6.896383613348007} {"Full-finetune/Learning Rate": 1.8573330281115008e-05, "Full-finetune/Loss": 0.8359013795852661, "Full-finetune/Loss (Raw)": 0.6812280416488647, "Full-finetune/Step": 1023, "Full-finetune/Step Time": 6.900112306699157} {"Full-finetune/Learning Rate": 1.8570121849929245e-05, "Full-finetune/Loss": 0.8347886800765991, "Full-finetune/Loss (Raw)": 0.788959264755249, "Full-finetune/Step": 1024, "Full-finetune/Step Time": 6.901612959802151} {"Full-finetune/Learning Rate": 1.8566910092846508e-05, "Full-finetune/Loss": 0.835784912109375, "Full-finetune/Loss (Raw)": 0.7954663038253784, "Full-finetune/Step": 1025, "Full-finetune/Step Time": 6.886350065469742} {"Full-finetune/Learning Rate": 1.8563695011113217e-05, "Full-finetune/Loss": 0.8397241830825806, "Full-finetune/Loss (Raw)": 0.8681130409240723, "Full-finetune/Step": 1026, "Full-finetune/Step Time": 6.866085002198815} {"Full-finetune/Learning Rate": 1.8560476605977085e-05, "Full-finetune/Loss": 0.8364928364753723, "Full-finetune/Loss (Raw)": 0.35923081636428833, "Full-finetune/Step": 1027, "Full-finetune/Step Time": 6.856920190155506} {"Full-finetune/Learning Rate": 1.8557254878687114e-05, "Full-finetune/Loss": 0.8361310958862305, "Full-finetune/Loss (Raw)": 0.9089019298553467, "Full-finetune/Step": 1028, "Full-finetune/Step Time": 6.850436305627227} {"Full-finetune/Learning Rate": 1.8554029830493587e-05, "Full-finetune/Loss": 0.8344090580940247, "Full-finetune/Loss (Raw)": 0.7858914732933044, "Full-finetune/Step": 1029, "Full-finetune/Step Time": 6.857955424115062} {"Full-finetune/Learning Rate": 1.855080146264809e-05, "Full-finetune/Loss": 0.8336263298988342, "Full-finetune/Loss (Raw)": 0.7887434959411621, "Full-finetune/Step": 1030, "Full-finetune/Step Time": 6.861981336027384} {"Full-finetune/Learning Rate": 1.854756977640348e-05, "Full-finetune/Loss": 0.8331928253173828, "Full-finetune/Loss (Raw)": 0.8437667489051819, "Full-finetune/Step": 1031, "Full-finetune/Step Time": 6.837786085903645} {"Full-finetune/Learning Rate": 1.8544334773013924e-05, "Full-finetune/Loss": 0.8295186758041382, "Full-finetune/Loss (Raw)": 0.3459361791610718, "Full-finetune/Step": 1032, "Full-finetune/Step Time": 6.861122081056237} {"Full-finetune/Learning Rate": 1.8541096453734852e-05, "Full-finetune/Loss": 0.8289498090744019, "Full-finetune/Loss (Raw)": 0.9016999006271362, "Full-finetune/Step": 1033, "Full-finetune/Step Time": 6.887668691575527} {"Full-finetune/Learning Rate": 1.8537854819822998e-05, "Full-finetune/Loss": 0.8283512592315674, "Full-finetune/Loss (Raw)": 0.7348871231079102, "Full-finetune/Step": 1034, "Full-finetune/Step Time": 6.905266428366303} {"Full-finetune/Learning Rate": 1.853460987253638e-05, "Full-finetune/Loss": 0.828102707862854, "Full-finetune/Loss (Raw)": 0.8964546918869019, "Full-finetune/Step": 1035, "Full-finetune/Step Time": 6.917337950319052} {"Full-finetune/Learning Rate": 1.8531361613134286e-05, "Full-finetune/Loss": 0.8276448249816895, "Full-finetune/Loss (Raw)": 0.8418017029762268, "Full-finetune/Step": 1036, "Full-finetune/Step Time": 6.921985553577542} {"Full-finetune/Learning Rate": 1.8528110042877316e-05, "Full-finetune/Loss": 0.8266705274581909, "Full-finetune/Loss (Raw)": 0.7142164707183838, "Full-finetune/Step": 1037, "Full-finetune/Step Time": 6.924684530124068} {"Full-finetune/Learning Rate": 1.8524855163027337e-05, "Full-finetune/Loss": 0.8282777070999146, "Full-finetune/Loss (Raw)": 1.065676212310791, "Full-finetune/Step": 1038, "Full-finetune/Step Time": 6.918428240343928} {"Full-finetune/Learning Rate": 1.85215969748475e-05, "Full-finetune/Loss": 0.8284231424331665, "Full-finetune/Loss (Raw)": 0.874729573726654, "Full-finetune/Step": 1039, "Full-finetune/Step Time": 6.907143227756023} {"Full-finetune/Learning Rate": 1.851833547960225e-05, "Full-finetune/Loss": 0.8263044953346252, "Full-finetune/Loss (Raw)": 0.715950608253479, "Full-finetune/Step": 1040, "Full-finetune/Step Time": 6.902754483744502} {"Full-finetune/Learning Rate": 1.8515070678557304e-05, "Full-finetune/Loss": 0.8293101787567139, "Full-finetune/Loss (Raw)": 1.0217739343643188, "Full-finetune/Step": 1041, "Full-finetune/Step Time": 6.885134842246771} {"Full-finetune/Learning Rate": 1.8511802572979672e-05, "Full-finetune/Loss": 0.8288861513137817, "Full-finetune/Loss (Raw)": 1.0038576126098633, "Full-finetune/Step": 1042, "Full-finetune/Step Time": 6.886598262935877} {"Full-finetune/Learning Rate": 1.8508531164137644e-05, "Full-finetune/Loss": 0.82452392578125, "Full-finetune/Loss (Raw)": 0.36622506380081177, "Full-finetune/Step": 1043, "Full-finetune/Step Time": 6.910489538684487} {"Full-finetune/Learning Rate": 1.8505256453300778e-05, "Full-finetune/Loss": 0.8221998810768127, "Full-finetune/Loss (Raw)": 0.6352422833442688, "Full-finetune/Step": 1044, "Full-finetune/Step Time": 6.910787746310234} {"Full-finetune/Learning Rate": 1.850197844173994e-05, "Full-finetune/Loss": 0.8204182982444763, "Full-finetune/Loss (Raw)": 0.814311683177948, "Full-finetune/Step": 1045, "Full-finetune/Step Time": 6.888252919539809} {"Full-finetune/Learning Rate": 1.8498697130727255e-05, "Full-finetune/Loss": 0.820481538772583, "Full-finetune/Loss (Raw)": 0.8572743535041809, "Full-finetune/Step": 1046, "Full-finetune/Step Time": 6.891196107491851} {"Full-finetune/Learning Rate": 1.8495412521536135e-05, "Full-finetune/Loss": 0.8228247165679932, "Full-finetune/Loss (Raw)": 0.9045254588127136, "Full-finetune/Step": 1047, "Full-finetune/Step Time": 6.867755303159356} {"Full-finetune/Learning Rate": 1.8492124615441276e-05, "Full-finetune/Loss": 0.8251219987869263, "Full-finetune/Loss (Raw)": 1.030910611152649, "Full-finetune/Step": 1048, "Full-finetune/Step Time": 6.859069503843784} {"Full-finetune/Learning Rate": 1.8488833413718646e-05, "Full-finetune/Loss": 0.8237079381942749, "Full-finetune/Loss (Raw)": 0.7614573836326599, "Full-finetune/Step": 1049, "Full-finetune/Step Time": 6.8575994949787855} {"Full-finetune/Learning Rate": 1.84855389176455e-05, "Full-finetune/Loss": 0.8230080604553223, "Full-finetune/Loss (Raw)": 0.7544208765029907, "Full-finetune/Step": 1050, "Full-finetune/Step Time": 6.870014438405633} {"Full-finetune/Learning Rate": 1.8482241128500366e-05, "Full-finetune/Loss": 0.8208780288696289, "Full-finetune/Loss (Raw)": 0.6772542595863342, "Full-finetune/Step": 1051, "Full-finetune/Step Time": 6.87493409961462} {"Full-finetune/Learning Rate": 1.847894004756305e-05, "Full-finetune/Loss": 0.8225698471069336, "Full-finetune/Loss (Raw)": 1.0239975452423096, "Full-finetune/Step": 1052, "Full-finetune/Step Time": 6.883673444390297} {"Full-finetune/Learning Rate": 1.8475635676114643e-05, "Full-finetune/Loss": 0.8233957290649414, "Full-finetune/Loss (Raw)": 0.8414106369018555, "Full-finetune/Step": 1053, "Full-finetune/Step Time": 6.871074371039867} {"Full-finetune/Learning Rate": 1.8472328015437503e-05, "Full-finetune/Loss": 0.825531005859375, "Full-finetune/Loss (Raw)": 0.9024531841278076, "Full-finetune/Step": 1054, "Full-finetune/Step Time": 6.866645187139511} {"Full-finetune/Learning Rate": 1.8469017066815265e-05, "Full-finetune/Loss": 0.8247008323669434, "Full-finetune/Loss (Raw)": 0.7708755731582642, "Full-finetune/Step": 1055, "Full-finetune/Step Time": 6.866824047639966} {"Full-finetune/Learning Rate": 1.8465702831532848e-05, "Full-finetune/Loss": 0.8256150484085083, "Full-finetune/Loss (Raw)": 1.033373236656189, "Full-finetune/Step": 1056, "Full-finetune/Step Time": 6.868333578109741} {"Full-finetune/Learning Rate": 1.8462385310876444e-05, "Full-finetune/Loss": 0.8253065347671509, "Full-finetune/Loss (Raw)": 0.819157063961029, "Full-finetune/Step": 1057, "Full-finetune/Step Time": 6.8622692953795195} {"Full-finetune/Learning Rate": 1.845906450613351e-05, "Full-finetune/Loss": 0.8248831033706665, "Full-finetune/Loss (Raw)": 0.7573375105857849, "Full-finetune/Step": 1058, "Full-finetune/Step Time": 6.8548304215073586} {"Full-finetune/Learning Rate": 1.8455740418592793e-05, "Full-finetune/Loss": 0.8238369226455688, "Full-finetune/Loss (Raw)": 0.7829996347427368, "Full-finetune/Step": 1059, "Full-finetune/Step Time": 6.872604129835963} {"Full-finetune/Learning Rate": 1.8452413049544304e-05, "Full-finetune/Loss": 0.8226637840270996, "Full-finetune/Loss (Raw)": 0.8051357269287109, "Full-finetune/Step": 1060, "Full-finetune/Step Time": 6.8701644949615} {"Full-finetune/Learning Rate": 1.844908240027933e-05, "Full-finetune/Loss": 0.8212285041809082, "Full-finetune/Loss (Raw)": 0.6648644208908081, "Full-finetune/Step": 1061, "Full-finetune/Step Time": 6.8501509465277195} {"Full-finetune/Learning Rate": 1.8445748472090432e-05, "Full-finetune/Loss": 0.8205285668373108, "Full-finetune/Loss (Raw)": 0.8551626801490784, "Full-finetune/Step": 1062, "Full-finetune/Step Time": 6.844441585242748} {"Full-finetune/Learning Rate": 1.844241126627144e-05, "Full-finetune/Loss": 0.8220785856246948, "Full-finetune/Loss (Raw)": 0.882559061050415, "Full-finetune/Step": 1063, "Full-finetune/Step Time": 6.852355809882283} {"Full-finetune/Learning Rate": 1.843907078411746e-05, "Full-finetune/Loss": 0.8246748447418213, "Full-finetune/Loss (Raw)": 1.119133472442627, "Full-finetune/Step": 1064, "Full-finetune/Step Time": 6.8393990360200405} {"Full-finetune/Learning Rate": 1.8435727026924864e-05, "Full-finetune/Loss": 0.8246324062347412, "Full-finetune/Loss (Raw)": 1.023905873298645, "Full-finetune/Step": 1065, "Full-finetune/Step Time": 6.8398880790919065} {"Full-finetune/Learning Rate": 1.8432379995991307e-05, "Full-finetune/Loss": 0.8226470947265625, "Full-finetune/Loss (Raw)": 0.7959214448928833, "Full-finetune/Step": 1066, "Full-finetune/Step Time": 6.833229383453727} {"Full-finetune/Learning Rate": 1.8429029692615702e-05, "Full-finetune/Loss": 0.8239318132400513, "Full-finetune/Loss (Raw)": 1.018088698387146, "Full-finetune/Step": 1067, "Full-finetune/Step Time": 6.840563977137208} {"Full-finetune/Learning Rate": 1.8425676118098236e-05, "Full-finetune/Loss": 0.8226912617683411, "Full-finetune/Loss (Raw)": 0.794437050819397, "Full-finetune/Step": 1068, "Full-finetune/Step Time": 6.843833204358816} {"Full-finetune/Learning Rate": 1.8422319273740364e-05, "Full-finetune/Loss": 0.8223966360092163, "Full-finetune/Loss (Raw)": 0.8551576733589172, "Full-finetune/Step": 1069, "Full-finetune/Step Time": 6.868834089487791} {"Full-finetune/Learning Rate": 1.8418959160844813e-05, "Full-finetune/Loss": 0.8239216208457947, "Full-finetune/Loss (Raw)": 0.8923144340515137, "Full-finetune/Step": 1070, "Full-finetune/Step Time": 6.857061672955751} {"Full-finetune/Learning Rate": 1.8415595780715583e-05, "Full-finetune/Loss": 0.8242901563644409, "Full-finetune/Loss (Raw)": 0.9263142347335815, "Full-finetune/Step": 1071, "Full-finetune/Step Time": 6.8541266936808825} {"Full-finetune/Learning Rate": 1.8412229134657926e-05, "Full-finetune/Loss": 0.8253412842750549, "Full-finetune/Loss (Raw)": 0.956734836101532, "Full-finetune/Step": 1072, "Full-finetune/Step Time": 6.863437332212925} {"Full-finetune/Learning Rate": 1.8408859223978378e-05, "Full-finetune/Loss": 0.8258481621742249, "Full-finetune/Loss (Raw)": 0.8543941378593445, "Full-finetune/Step": 1073, "Full-finetune/Step Time": 6.83545409142971} {"Full-finetune/Learning Rate": 1.840548604998474e-05, "Full-finetune/Loss": 0.8278582096099854, "Full-finetune/Loss (Raw)": 0.9773265719413757, "Full-finetune/Step": 1074, "Full-finetune/Step Time": 6.820649262517691} {"Full-finetune/Learning Rate": 1.840210961398606e-05, "Full-finetune/Loss": 0.828253984451294, "Full-finetune/Loss (Raw)": 0.8795438408851624, "Full-finetune/Step": 1075, "Full-finetune/Step Time": 6.815377676859498} {"Full-finetune/Learning Rate": 1.8398729917292683e-05, "Full-finetune/Loss": 0.8328278064727783, "Full-finetune/Loss (Raw)": 0.9736097455024719, "Full-finetune/Step": 1076, "Full-finetune/Step Time": 6.797534734010696} {"Full-finetune/Learning Rate": 1.8395346961216193e-05, "Full-finetune/Loss": 0.8324450254440308, "Full-finetune/Loss (Raw)": 0.9781067967414856, "Full-finetune/Step": 1077, "Full-finetune/Step Time": 6.801602890715003} {"Full-finetune/Learning Rate": 1.8391960747069453e-05, "Full-finetune/Loss": 0.8331401348114014, "Full-finetune/Loss (Raw)": 0.9483972787857056, "Full-finetune/Step": 1078, "Full-finetune/Step Time": 6.814780954271555} {"Full-finetune/Learning Rate": 1.8388571276166588e-05, "Full-finetune/Loss": 0.8306377530097961, "Full-finetune/Loss (Raw)": 0.7529881596565247, "Full-finetune/Step": 1079, "Full-finetune/Step Time": 6.818230615928769} {"Full-finetune/Learning Rate": 1.8385178549822982e-05, "Full-finetune/Loss": 0.830105721950531, "Full-finetune/Loss (Raw)": 0.731544017791748, "Full-finetune/Step": 1080, "Full-finetune/Step Time": 6.8182798735797405} {"Full-finetune/Learning Rate": 1.8381782569355288e-05, "Full-finetune/Loss": 0.8303820490837097, "Full-finetune/Loss (Raw)": 0.9226588606834412, "Full-finetune/Step": 1081, "Full-finetune/Step Time": 6.822706859558821} {"Full-finetune/Learning Rate": 1.837838333608142e-05, "Full-finetune/Loss": 0.8294099569320679, "Full-finetune/Loss (Raw)": 0.706307590007782, "Full-finetune/Step": 1082, "Full-finetune/Step Time": 6.852403612807393} {"Full-finetune/Learning Rate": 1.8374980851320555e-05, "Full-finetune/Loss": 0.8296604156494141, "Full-finetune/Loss (Raw)": 0.9185991287231445, "Full-finetune/Step": 1083, "Full-finetune/Step Time": 6.851617485284805} {"Full-finetune/Learning Rate": 1.8371575116393125e-05, "Full-finetune/Loss": 0.829740047454834, "Full-finetune/Loss (Raw)": 0.9361411929130554, "Full-finetune/Step": 1084, "Full-finetune/Step Time": 6.86602707952261} {"Full-finetune/Learning Rate": 1.8368166132620838e-05, "Full-finetune/Loss": 0.8303638696670532, "Full-finetune/Loss (Raw)": 0.9079687595367432, "Full-finetune/Step": 1085, "Full-finetune/Step Time": 6.85590890981257} {"Full-finetune/Learning Rate": 1.8364753901326647e-05, "Full-finetune/Loss": 0.831398606300354, "Full-finetune/Loss (Raw)": 0.9675421714782715, "Full-finetune/Step": 1086, "Full-finetune/Step Time": 6.84359166584909} {"Full-finetune/Learning Rate": 1.8361338423834776e-05, "Full-finetune/Loss": 0.8329333662986755, "Full-finetune/Loss (Raw)": 0.9506566524505615, "Full-finetune/Step": 1087, "Full-finetune/Step Time": 6.846792520955205} {"Full-finetune/Learning Rate": 1.8357919701470702e-05, "Full-finetune/Loss": 0.8311792612075806, "Full-finetune/Loss (Raw)": 0.6479461193084717, "Full-finetune/Step": 1088, "Full-finetune/Step Time": 6.853990757837892} {"Full-finetune/Learning Rate": 1.835449773556117e-05, "Full-finetune/Loss": 0.8321168422698975, "Full-finetune/Loss (Raw)": 0.8818625211715698, "Full-finetune/Step": 1089, "Full-finetune/Step Time": 6.8507081884890795} {"Full-finetune/Learning Rate": 1.8351072527434173e-05, "Full-finetune/Loss": 0.8320122957229614, "Full-finetune/Loss (Raw)": 0.9637721180915833, "Full-finetune/Step": 1090, "Full-finetune/Step Time": 6.860930774360895} {"Full-finetune/Learning Rate": 1.8347644078418968e-05, "Full-finetune/Loss": 0.831936240196228, "Full-finetune/Loss (Raw)": 0.8318392038345337, "Full-finetune/Step": 1091, "Full-finetune/Step Time": 6.859818024560809} {"Full-finetune/Learning Rate": 1.834421238984607e-05, "Full-finetune/Loss": 0.8326725363731384, "Full-finetune/Loss (Raw)": 0.9537763595581055, "Full-finetune/Step": 1092, "Full-finetune/Step Time": 6.859052088111639} {"Full-finetune/Learning Rate": 1.8340777463047253e-05, "Full-finetune/Loss": 0.8329525589942932, "Full-finetune/Loss (Raw)": 0.7782853245735168, "Full-finetune/Step": 1093, "Full-finetune/Step Time": 6.847127579152584} {"Full-finetune/Learning Rate": 1.833733929935554e-05, "Full-finetune/Loss": 0.8332948684692383, "Full-finetune/Loss (Raw)": 0.881854236125946, "Full-finetune/Step": 1094, "Full-finetune/Step Time": 6.840797159820795} {"Full-finetune/Learning Rate": 1.833389790010522e-05, "Full-finetune/Loss": 0.8345997333526611, "Full-finetune/Loss (Raw)": 0.9731069207191467, "Full-finetune/Step": 1095, "Full-finetune/Step Time": 6.835488440468907} {"Full-finetune/Learning Rate": 1.8330453266631828e-05, "Full-finetune/Loss": 0.8345882892608643, "Full-finetune/Loss (Raw)": 0.9340011477470398, "Full-finetune/Step": 1096, "Full-finetune/Step Time": 6.8322667349129915} {"Full-finetune/Learning Rate": 1.8327005400272165e-05, "Full-finetune/Loss": 0.8348658084869385, "Full-finetune/Loss (Raw)": 0.8450448513031006, "Full-finetune/Step": 1097, "Full-finetune/Step Time": 6.833010068163276} {"Full-finetune/Learning Rate": 1.8323554302364273e-05, "Full-finetune/Loss": 0.8371360301971436, "Full-finetune/Loss (Raw)": 0.8450562953948975, "Full-finetune/Step": 1098, "Full-finetune/Step Time": 6.841340949758887} {"Full-finetune/Learning Rate": 1.8320099974247462e-05, "Full-finetune/Loss": 0.8374788761138916, "Full-finetune/Loss (Raw)": 0.9147205948829651, "Full-finetune/Step": 1099, "Full-finetune/Step Time": 6.805053224787116} {"Full-finetune/Learning Rate": 1.831664241726229e-05, "Full-finetune/Loss": 0.8411049842834473, "Full-finetune/Loss (Raw)": 0.8386780619621277, "Full-finetune/Step": 1100, "Full-finetune/Step Time": 6.79234510101378} {"Full-finetune/Learning Rate": 1.831318163275056e-05, "Full-finetune/Loss": 0.8420828580856323, "Full-finetune/Loss (Raw)": 0.9109386205673218, "Full-finetune/Step": 1101, "Full-finetune/Step Time": 6.781824642792344} {"Full-finetune/Learning Rate": 1.8309717622055343e-05, "Full-finetune/Loss": 0.8413718342781067, "Full-finetune/Loss (Raw)": 0.7275345325469971, "Full-finetune/Step": 1102, "Full-finetune/Step Time": 6.768587972968817} {"Full-finetune/Learning Rate": 1.830625038652095e-05, "Full-finetune/Loss": 0.8412275314331055, "Full-finetune/Loss (Raw)": 0.9934394955635071, "Full-finetune/Step": 1103, "Full-finetune/Step Time": 6.755781307816505} {"Full-finetune/Learning Rate": 1.8302779927492945e-05, "Full-finetune/Loss": 0.8421661853790283, "Full-finetune/Loss (Raw)": 0.9718513488769531, "Full-finetune/Step": 1104, "Full-finetune/Step Time": 6.765630764886737} {"Full-finetune/Learning Rate": 1.829930624631815e-05, "Full-finetune/Loss": 0.8411858081817627, "Full-finetune/Loss (Raw)": 0.8546520471572876, "Full-finetune/Step": 1105, "Full-finetune/Step Time": 6.769252670928836} {"Full-finetune/Learning Rate": 1.829582934434463e-05, "Full-finetune/Loss": 0.8407285213470459, "Full-finetune/Loss (Raw)": 0.7782100439071655, "Full-finetune/Step": 1106, "Full-finetune/Step Time": 6.782671734690666} {"Full-finetune/Learning Rate": 1.829234922292171e-05, "Full-finetune/Loss": 0.8414535522460938, "Full-finetune/Loss (Raw)": 0.9388368725776672, "Full-finetune/Step": 1107, "Full-finetune/Step Time": 6.778027229011059} {"Full-finetune/Learning Rate": 1.8288865883399946e-05, "Full-finetune/Loss": 0.8413505554199219, "Full-finetune/Loss (Raw)": 1.0302764177322388, "Full-finetune/Step": 1108, "Full-finetune/Step Time": 6.779640709981322} {"Full-finetune/Learning Rate": 1.8285379327131157e-05, "Full-finetune/Loss": 0.8396233320236206, "Full-finetune/Loss (Raw)": 0.6293054223060608, "Full-finetune/Step": 1109, "Full-finetune/Step Time": 6.7916402611881495} {"Full-finetune/Learning Rate": 1.828188955546841e-05, "Full-finetune/Loss": 0.8392003774642944, "Full-finetune/Loss (Raw)": 0.8981291055679321, "Full-finetune/Step": 1110, "Full-finetune/Step Time": 6.790792206302285} {"Full-finetune/Learning Rate": 1.827839656976602e-05, "Full-finetune/Loss": 0.840325653553009, "Full-finetune/Loss (Raw)": 1.0509874820709229, "Full-finetune/Step": 1111, "Full-finetune/Step Time": 6.787061056122184} {"Full-finetune/Learning Rate": 1.8274900371379543e-05, "Full-finetune/Loss": 0.8406705260276794, "Full-finetune/Loss (Raw)": 0.8054591417312622, "Full-finetune/Step": 1112, "Full-finetune/Step Time": 6.775984920561314} {"Full-finetune/Learning Rate": 1.8271400961665784e-05, "Full-finetune/Loss": 0.8405811786651611, "Full-finetune/Loss (Raw)": 0.8688815832138062, "Full-finetune/Step": 1113, "Full-finetune/Step Time": 6.772838395088911} {"Full-finetune/Learning Rate": 1.8267898341982796e-05, "Full-finetune/Loss": 0.8405065536499023, "Full-finetune/Loss (Raw)": 0.7740877866744995, "Full-finetune/Step": 1114, "Full-finetune/Step Time": 6.796642700210214} {"Full-finetune/Learning Rate": 1.8264392513689882e-05, "Full-finetune/Loss": 0.840386152267456, "Full-finetune/Loss (Raw)": 0.8879024386405945, "Full-finetune/Step": 1115, "Full-finetune/Step Time": 6.794196518138051} {"Full-finetune/Learning Rate": 1.8260883478147578e-05, "Full-finetune/Loss": 0.8428083062171936, "Full-finetune/Loss (Raw)": 0.9839944839477539, "Full-finetune/Step": 1116, "Full-finetune/Step Time": 6.789718175306916} {"Full-finetune/Learning Rate": 1.8257371236717682e-05, "Full-finetune/Loss": 0.8417253494262695, "Full-finetune/Loss (Raw)": 0.8052724599838257, "Full-finetune/Step": 1117, "Full-finetune/Step Time": 6.788652824237943} {"Full-finetune/Learning Rate": 1.8253855790763215e-05, "Full-finetune/Loss": 0.8439241647720337, "Full-finetune/Loss (Raw)": 0.9031299948692322, "Full-finetune/Step": 1118, "Full-finetune/Step Time": 6.776798836886883} {"Full-finetune/Learning Rate": 1.8250337141648464e-05, "Full-finetune/Loss": 0.8410892486572266, "Full-finetune/Loss (Raw)": 0.5910934209823608, "Full-finetune/Step": 1119, "Full-finetune/Step Time": 6.7874024491757154} {"Full-finetune/Learning Rate": 1.8246815290738937e-05, "Full-finetune/Loss": 0.8410584926605225, "Full-finetune/Loss (Raw)": 0.8807615041732788, "Full-finetune/Step": 1120, "Full-finetune/Step Time": 6.791031531989574} {"Full-finetune/Learning Rate": 1.8243290239401402e-05, "Full-finetune/Loss": 0.8422881960868835, "Full-finetune/Loss (Raw)": 0.9892451763153076, "Full-finetune/Step": 1121, "Full-finetune/Step Time": 6.771021885797381} {"Full-finetune/Learning Rate": 1.8239761989003866e-05, "Full-finetune/Loss": 0.8440983295440674, "Full-finetune/Loss (Raw)": 0.9024726152420044, "Full-finetune/Step": 1122, "Full-finetune/Step Time": 6.778157791122794} {"Full-finetune/Learning Rate": 1.8236230540915567e-05, "Full-finetune/Loss": 0.8433120846748352, "Full-finetune/Loss (Raw)": 0.7750502228736877, "Full-finetune/Step": 1123, "Full-finetune/Step Time": 6.7962541654706} {"Full-finetune/Learning Rate": 1.8232695896506995e-05, "Full-finetune/Loss": 0.8456600308418274, "Full-finetune/Loss (Raw)": 1.0792183876037598, "Full-finetune/Step": 1124, "Full-finetune/Step Time": 6.793340476229787} {"Full-finetune/Learning Rate": 1.8229158057149875e-05, "Full-finetune/Loss": 0.8455296754837036, "Full-finetune/Loss (Raw)": 0.8403332233428955, "Full-finetune/Step": 1125, "Full-finetune/Step Time": 6.788935896009207} {"Full-finetune/Learning Rate": 1.8225617024217174e-05, "Full-finetune/Loss": 0.8466424942016602, "Full-finetune/Loss (Raw)": 0.9121355414390564, "Full-finetune/Step": 1126, "Full-finetune/Step Time": 6.770767016336322} {"Full-finetune/Learning Rate": 1.8222072799083096e-05, "Full-finetune/Loss": 0.8458276987075806, "Full-finetune/Loss (Raw)": 0.8593957424163818, "Full-finetune/Step": 1127, "Full-finetune/Step Time": 6.75980332493782} {"Full-finetune/Learning Rate": 1.821852538312309e-05, "Full-finetune/Loss": 0.8439884185791016, "Full-finetune/Loss (Raw)": 0.7799513936042786, "Full-finetune/Step": 1128, "Full-finetune/Step Time": 6.772370366379619} {"Full-finetune/Learning Rate": 1.8214974777713834e-05, "Full-finetune/Loss": 0.8489185571670532, "Full-finetune/Loss (Raw)": 0.9612831473350525, "Full-finetune/Step": 1129, "Full-finetune/Step Time": 6.748008431866765} {"Full-finetune/Learning Rate": 1.821142098423325e-05, "Full-finetune/Loss": 0.8467071652412415, "Full-finetune/Loss (Raw)": 0.6638451218605042, "Full-finetune/Step": 1130, "Full-finetune/Step Time": 6.756542935967445} {"Full-finetune/Learning Rate": 1.8207864004060497e-05, "Full-finetune/Loss": 0.8466731309890747, "Full-finetune/Loss (Raw)": 0.9601826667785645, "Full-finetune/Step": 1131, "Full-finetune/Step Time": 6.738797560334206} {"Full-finetune/Learning Rate": 1.820430383857597e-05, "Full-finetune/Loss": 0.8464542031288147, "Full-finetune/Loss (Raw)": 0.9498482942581177, "Full-finetune/Step": 1132, "Full-finetune/Step Time": 6.740436902269721} {"Full-finetune/Learning Rate": 1.8200740489161296e-05, "Full-finetune/Loss": 0.8462889194488525, "Full-finetune/Loss (Raw)": 0.87972491979599, "Full-finetune/Step": 1133, "Full-finetune/Step Time": 6.735758598893881} {"Full-finetune/Learning Rate": 1.819717395719935e-05, "Full-finetune/Loss": 0.8476475477218628, "Full-finetune/Loss (Raw)": 0.8695361018180847, "Full-finetune/Step": 1134, "Full-finetune/Step Time": 6.718263011425734} {"Full-finetune/Learning Rate": 1.819360424407422e-05, "Full-finetune/Loss": 0.8485875129699707, "Full-finetune/Loss (Raw)": 0.9500172734260559, "Full-finetune/Step": 1135, "Full-finetune/Step Time": 6.714027758687735} {"Full-finetune/Learning Rate": 1.8190031351171256e-05, "Full-finetune/Loss": 0.8481934070587158, "Full-finetune/Loss (Raw)": 0.8542966246604919, "Full-finetune/Step": 1136, "Full-finetune/Step Time": 6.711689442396164} {"Full-finetune/Learning Rate": 1.818645527987702e-05, "Full-finetune/Loss": 0.8525612950325012, "Full-finetune/Loss (Raw)": 0.972184419631958, "Full-finetune/Step": 1137, "Full-finetune/Step Time": 6.69397165812552} {"Full-finetune/Learning Rate": 1.8182876031579312e-05, "Full-finetune/Loss": 0.8533573150634766, "Full-finetune/Loss (Raw)": 0.8799651861190796, "Full-finetune/Step": 1138, "Full-finetune/Step Time": 6.703248843550682} {"Full-finetune/Learning Rate": 1.8179293607667177e-05, "Full-finetune/Loss": 0.8534767031669617, "Full-finetune/Loss (Raw)": 0.8294282555580139, "Full-finetune/Step": 1139, "Full-finetune/Step Time": 6.716634579002857} {"Full-finetune/Learning Rate": 1.817570800953088e-05, "Full-finetune/Loss": 0.8532836437225342, "Full-finetune/Loss (Raw)": 0.9051028490066528, "Full-finetune/Step": 1140, "Full-finetune/Step Time": 6.708205297589302} {"Full-finetune/Learning Rate": 1.8172119238561924e-05, "Full-finetune/Loss": 0.8532289266586304, "Full-finetune/Loss (Raw)": 0.8533550500869751, "Full-finetune/Step": 1141, "Full-finetune/Step Time": 6.714639386162162} {"Full-finetune/Learning Rate": 1.8168527296153037e-05, "Full-finetune/Loss": 0.8479007482528687, "Full-finetune/Loss (Raw)": 0.29760128259658813, "Full-finetune/Step": 1142, "Full-finetune/Step Time": 6.72586883418262} {"Full-finetune/Learning Rate": 1.8164932183698184e-05, "Full-finetune/Loss": 0.8521808385848999, "Full-finetune/Loss (Raw)": 0.8528872728347778, "Full-finetune/Step": 1143, "Full-finetune/Step Time": 6.71943873539567} {"Full-finetune/Learning Rate": 1.8161333902592554e-05, "Full-finetune/Loss": 0.8518052101135254, "Full-finetune/Loss (Raw)": 0.8700753450393677, "Full-finetune/Step": 1144, "Full-finetune/Step Time": 6.723229672759771} {"Full-finetune/Learning Rate": 1.8157732454232577e-05, "Full-finetune/Loss": 0.8508442640304565, "Full-finetune/Loss (Raw)": 0.8577330112457275, "Full-finetune/Step": 1145, "Full-finetune/Step Time": 6.733507812023163} {"Full-finetune/Learning Rate": 1.81541278400159e-05, "Full-finetune/Loss": 0.8517122268676758, "Full-finetune/Loss (Raw)": 0.9409927725791931, "Full-finetune/Step": 1146, "Full-finetune/Step Time": 6.700263710692525} {"Full-finetune/Learning Rate": 1.81505200613414e-05, "Full-finetune/Loss": 0.8505975604057312, "Full-finetune/Loss (Raw)": 0.6867626905441284, "Full-finetune/Step": 1147, "Full-finetune/Step Time": 6.703081810846925} {"Full-finetune/Learning Rate": 1.8146909119609196e-05, "Full-finetune/Loss": 0.8464640974998474, "Full-finetune/Loss (Raw)": 0.3433414101600647, "Full-finetune/Step": 1148, "Full-finetune/Step Time": 6.728521294891834} {"Full-finetune/Learning Rate": 1.8143295016220612e-05, "Full-finetune/Loss": 0.8490322828292847, "Full-finetune/Loss (Raw)": 1.0570546388626099, "Full-finetune/Step": 1149, "Full-finetune/Step Time": 6.728539332747459} {"Full-finetune/Learning Rate": 1.813967775257822e-05, "Full-finetune/Loss": 0.8484269380569458, "Full-finetune/Loss (Raw)": 0.7849092483520508, "Full-finetune/Step": 1150, "Full-finetune/Step Time": 6.718675438314676} {"Full-finetune/Learning Rate": 1.8136057330085805e-05, "Full-finetune/Loss": 0.8491895794868469, "Full-finetune/Loss (Raw)": 0.7788466215133667, "Full-finetune/Step": 1151, "Full-finetune/Step Time": 6.702686866745353} {"Full-finetune/Learning Rate": 1.8132433750148383e-05, "Full-finetune/Loss": 0.8495171070098877, "Full-finetune/Loss (Raw)": 0.8308930397033691, "Full-finetune/Step": 1152, "Full-finetune/Step Time": 6.719010079279542} {"Full-finetune/Learning Rate": 1.8128807014172197e-05, "Full-finetune/Loss": 0.8504175543785095, "Full-finetune/Loss (Raw)": 0.9107154607772827, "Full-finetune/Step": 1153, "Full-finetune/Step Time": 6.742072373628616} {"Full-finetune/Learning Rate": 1.812517712356471e-05, "Full-finetune/Loss": 0.8461625576019287, "Full-finetune/Loss (Raw)": 0.3234776556491852, "Full-finetune/Step": 1154, "Full-finetune/Step Time": 6.752590639516711} {"Full-finetune/Learning Rate": 1.812154407973461e-05, "Full-finetune/Loss": 0.8459776639938354, "Full-finetune/Loss (Raw)": 0.3355575203895569, "Full-finetune/Step": 1155, "Full-finetune/Step Time": 6.74017208814621} {"Full-finetune/Learning Rate": 1.8117907884091815e-05, "Full-finetune/Loss": 0.8467304706573486, "Full-finetune/Loss (Raw)": 1.0052603483200073, "Full-finetune/Step": 1156, "Full-finetune/Step Time": 6.73575715534389} {"Full-finetune/Learning Rate": 1.8114268538047457e-05, "Full-finetune/Loss": 0.8480523228645325, "Full-finetune/Loss (Raw)": 0.9550914764404297, "Full-finetune/Step": 1157, "Full-finetune/Step Time": 6.727297849953175} {"Full-finetune/Learning Rate": 1.81106260430139e-05, "Full-finetune/Loss": 0.8480038046836853, "Full-finetune/Loss (Raw)": 0.7825362682342529, "Full-finetune/Step": 1158, "Full-finetune/Step Time": 6.717341782525182} {"Full-finetune/Learning Rate": 1.810698040040472e-05, "Full-finetune/Loss": 0.8474924564361572, "Full-finetune/Loss (Raw)": 0.7783077359199524, "Full-finetune/Step": 1159, "Full-finetune/Step Time": 6.716262478381395} {"Full-finetune/Learning Rate": 1.810333161163472e-05, "Full-finetune/Loss": 0.8513671159744263, "Full-finetune/Loss (Raw)": 0.8418992161750793, "Full-finetune/Step": 1160, "Full-finetune/Step Time": 6.710083406418562} {"Full-finetune/Learning Rate": 1.809967967811993e-05, "Full-finetune/Loss": 0.85057532787323, "Full-finetune/Loss (Raw)": 0.8003512024879456, "Full-finetune/Step": 1161, "Full-finetune/Step Time": 6.702162262052298} {"Full-finetune/Learning Rate": 1.8096024601277586e-05, "Full-finetune/Loss": 0.8522518277168274, "Full-finetune/Loss (Raw)": 0.9494733214378357, "Full-finetune/Step": 1162, "Full-finetune/Step Time": 6.6890600156039} {"Full-finetune/Learning Rate": 1.8092366382526157e-05, "Full-finetune/Loss": 0.8500162959098816, "Full-finetune/Loss (Raw)": 0.6103094816207886, "Full-finetune/Step": 1163, "Full-finetune/Step Time": 6.6968426797539} {"Full-finetune/Learning Rate": 1.8088705023285324e-05, "Full-finetune/Loss": 0.8517557978630066, "Full-finetune/Loss (Raw)": 1.0644557476043701, "Full-finetune/Step": 1164, "Full-finetune/Step Time": 6.694579748436809} {"Full-finetune/Learning Rate": 1.8085040524975994e-05, "Full-finetune/Loss": 0.8489676713943481, "Full-finetune/Loss (Raw)": 0.35734301805496216, "Full-finetune/Step": 1165, "Full-finetune/Step Time": 6.701193666085601} {"Full-finetune/Learning Rate": 1.8081372889020282e-05, "Full-finetune/Loss": 0.8468855619430542, "Full-finetune/Loss (Raw)": 0.7991635203361511, "Full-finetune/Step": 1166, "Full-finetune/Step Time": 6.709151962772012} {"Full-finetune/Learning Rate": 1.8077702116841524e-05, "Full-finetune/Loss": 0.8449766039848328, "Full-finetune/Loss (Raw)": 0.6303765773773193, "Full-finetune/Step": 1167, "Full-finetune/Step Time": 6.723701259121299} {"Full-finetune/Learning Rate": 1.807402820986428e-05, "Full-finetune/Loss": 0.8455600738525391, "Full-finetune/Loss (Raw)": 0.7906404733657837, "Full-finetune/Step": 1168, "Full-finetune/Step Time": 6.722226811572909} {"Full-finetune/Learning Rate": 1.8070351169514324e-05, "Full-finetune/Loss": 0.8448325395584106, "Full-finetune/Loss (Raw)": 0.928650975227356, "Full-finetune/Step": 1169, "Full-finetune/Step Time": 6.723881559446454} {"Full-finetune/Learning Rate": 1.8066670997218633e-05, "Full-finetune/Loss": 0.8406277298927307, "Full-finetune/Loss (Raw)": 0.4656387269496918, "Full-finetune/Step": 1170, "Full-finetune/Step Time": 6.737395390868187} {"Full-finetune/Learning Rate": 1.806298769440542e-05, "Full-finetune/Loss": 0.8454409241676331, "Full-finetune/Loss (Raw)": 0.9823158383369446, "Full-finetune/Step": 1171, "Full-finetune/Step Time": 6.712643014267087} {"Full-finetune/Learning Rate": 1.8059301262504097e-05, "Full-finetune/Loss": 0.8475450873374939, "Full-finetune/Loss (Raw)": 0.9045747518539429, "Full-finetune/Step": 1172, "Full-finetune/Step Time": 6.707033855840564} {"Full-finetune/Learning Rate": 1.80556117029453e-05, "Full-finetune/Loss": 0.8480619192123413, "Full-finetune/Loss (Raw)": 0.8804649114608765, "Full-finetune/Step": 1173, "Full-finetune/Step Time": 6.690217984840274} {"Full-finetune/Learning Rate": 1.8051919017160875e-05, "Full-finetune/Loss": 0.8441314697265625, "Full-finetune/Loss (Raw)": 0.354181706905365, "Full-finetune/Step": 1174, "Full-finetune/Step Time": 6.6995487324893475} {"Full-finetune/Learning Rate": 1.804822320658388e-05, "Full-finetune/Loss": 0.8433118462562561, "Full-finetune/Loss (Raw)": 0.7996125817298889, "Full-finetune/Step": 1175, "Full-finetune/Step Time": 6.713235577568412} {"Full-finetune/Learning Rate": 1.8044524272648588e-05, "Full-finetune/Loss": 0.841449499130249, "Full-finetune/Loss (Raw)": 0.792522668838501, "Full-finetune/Step": 1176, "Full-finetune/Step Time": 6.708294667303562} {"Full-finetune/Learning Rate": 1.8040822216790475e-05, "Full-finetune/Loss": 0.8377549052238464, "Full-finetune/Loss (Raw)": 0.2885555028915405, "Full-finetune/Step": 1177, "Full-finetune/Step Time": 6.729284666478634} {"Full-finetune/Learning Rate": 1.803711704044625e-05, "Full-finetune/Loss": 0.834368109703064, "Full-finetune/Loss (Raw)": 0.3209069073200226, "Full-finetune/Step": 1178, "Full-finetune/Step Time": 6.732886228710413} {"Full-finetune/Learning Rate": 1.803340874505381e-05, "Full-finetune/Loss": 0.8370974659919739, "Full-finetune/Loss (Raw)": 1.026614785194397, "Full-finetune/Step": 1179, "Full-finetune/Step Time": 6.736381085589528} {"Full-finetune/Learning Rate": 1.8029697332052277e-05, "Full-finetune/Loss": 0.8352093696594238, "Full-finetune/Loss (Raw)": 0.782319188117981, "Full-finetune/Step": 1180, "Full-finetune/Step Time": 6.741757603362203} {"Full-finetune/Learning Rate": 1.8025982802881976e-05, "Full-finetune/Loss": 0.8363940715789795, "Full-finetune/Loss (Raw)": 0.9930522441864014, "Full-finetune/Step": 1181, "Full-finetune/Step Time": 6.7295434884727} {"Full-finetune/Learning Rate": 1.802226515898444e-05, "Full-finetune/Loss": 0.8337084054946899, "Full-finetune/Loss (Raw)": 0.5586938858032227, "Full-finetune/Step": 1182, "Full-finetune/Step Time": 6.730905773118138} {"Full-finetune/Learning Rate": 1.8018544401802422e-05, "Full-finetune/Loss": 0.8351683616638184, "Full-finetune/Loss (Raw)": 0.9577507972717285, "Full-finetune/Step": 1183, "Full-finetune/Step Time": 6.732918394729495} {"Full-finetune/Learning Rate": 1.801482053277987e-05, "Full-finetune/Loss": 0.8326551914215088, "Full-finetune/Loss (Raw)": 0.7116835713386536, "Full-finetune/Step": 1184, "Full-finetune/Step Time": 6.761939199641347} {"Full-finetune/Learning Rate": 1.8011093553361944e-05, "Full-finetune/Loss": 0.8332093954086304, "Full-finetune/Loss (Raw)": 0.8900934457778931, "Full-finetune/Step": 1185, "Full-finetune/Step Time": 6.765181438997388} {"Full-finetune/Learning Rate": 1.8007363464995015e-05, "Full-finetune/Loss": 0.8352528810501099, "Full-finetune/Loss (Raw)": 1.0189104080200195, "Full-finetune/Step": 1186, "Full-finetune/Step Time": 6.76591264270246} {"Full-finetune/Learning Rate": 1.800363026912665e-05, "Full-finetune/Loss": 0.8317946195602417, "Full-finetune/Loss (Raw)": 0.34034034609794617, "Full-finetune/Step": 1187, "Full-finetune/Step Time": 6.771110985428095} {"Full-finetune/Learning Rate": 1.7999893967205643e-05, "Full-finetune/Loss": 0.8327282667160034, "Full-finetune/Loss (Raw)": 0.9246456623077393, "Full-finetune/Step": 1188, "Full-finetune/Step Time": 6.770852794870734} {"Full-finetune/Learning Rate": 1.7996154560681963e-05, "Full-finetune/Loss": 0.8351467847824097, "Full-finetune/Loss (Raw)": 0.9744274616241455, "Full-finetune/Step": 1189, "Full-finetune/Step Time": 6.776786126196384} {"Full-finetune/Learning Rate": 1.7992412051006817e-05, "Full-finetune/Loss": 0.8353011012077332, "Full-finetune/Loss (Raw)": 0.8749198317527771, "Full-finetune/Step": 1190, "Full-finetune/Step Time": 6.774889597669244} {"Full-finetune/Learning Rate": 1.7988666439632593e-05, "Full-finetune/Loss": 0.8355816602706909, "Full-finetune/Loss (Raw)": 0.9184669852256775, "Full-finetune/Step": 1191, "Full-finetune/Step Time": 6.7694898750633} {"Full-finetune/Learning Rate": 1.7984917728012886e-05, "Full-finetune/Loss": 0.8343342542648315, "Full-finetune/Loss (Raw)": 0.9594658017158508, "Full-finetune/Step": 1192, "Full-finetune/Step Time": 6.777435952797532} {"Full-finetune/Learning Rate": 1.7981165917602502e-05, "Full-finetune/Loss": 0.8334569931030273, "Full-finetune/Loss (Raw)": 0.9116125106811523, "Full-finetune/Step": 1193, "Full-finetune/Step Time": 6.776811294257641} {"Full-finetune/Learning Rate": 1.7977411009857446e-05, "Full-finetune/Loss": 0.8344296813011169, "Full-finetune/Loss (Raw)": 0.9204268455505371, "Full-finetune/Step": 1194, "Full-finetune/Step Time": 6.790630409494042} {"Full-finetune/Learning Rate": 1.797365300623492e-05, "Full-finetune/Loss": 0.8334036469459534, "Full-finetune/Loss (Raw)": 0.8867560625076294, "Full-finetune/Step": 1195, "Full-finetune/Step Time": 6.7804904114454985} {"Full-finetune/Learning Rate": 1.7969891908193338e-05, "Full-finetune/Loss": 0.8341029286384583, "Full-finetune/Loss (Raw)": 0.8839497566223145, "Full-finetune/Step": 1196, "Full-finetune/Step Time": 6.779009081423283} {"Full-finetune/Learning Rate": 1.7966127717192305e-05, "Full-finetune/Loss": 0.8349679112434387, "Full-finetune/Loss (Raw)": 0.9658738970756531, "Full-finetune/Step": 1197, "Full-finetune/Step Time": 6.7470878306776285} {"Full-finetune/Learning Rate": 1.796236043469263e-05, "Full-finetune/Loss": 0.835073709487915, "Full-finetune/Loss (Raw)": 0.9058624505996704, "Full-finetune/Step": 1198, "Full-finetune/Step Time": 6.753214433789253} {"Full-finetune/Learning Rate": 1.7958590062156318e-05, "Full-finetune/Loss": 0.8352901935577393, "Full-finetune/Loss (Raw)": 0.954020619392395, "Full-finetune/Step": 1199, "Full-finetune/Step Time": 6.7498346995562315} {"Full-finetune/Learning Rate": 1.7954816601046587e-05, "Full-finetune/Loss": 0.8352645635604858, "Full-finetune/Loss (Raw)": 0.9534537196159363, "Full-finetune/Step": 1200, "Full-finetune/Step Time": 6.74755884706974} {"Full-finetune/Learning Rate": 1.7951040052827836e-05, "Full-finetune/Loss": 0.8362607955932617, "Full-finetune/Loss (Raw)": 0.9819114208221436, "Full-finetune/Step": 1201, "Full-finetune/Step Time": 6.771640822291374} {"Full-finetune/Learning Rate": 1.794726041896567e-05, "Full-finetune/Loss": 0.8370630741119385, "Full-finetune/Loss (Raw)": 1.0800155401229858, "Full-finetune/Step": 1202, "Full-finetune/Step Time": 6.786410121247172} {"Full-finetune/Learning Rate": 1.7943477700926895e-05, "Full-finetune/Loss": 0.8382018804550171, "Full-finetune/Loss (Raw)": 1.0253139734268188, "Full-finetune/Step": 1203, "Full-finetune/Step Time": 6.776608571410179} {"Full-finetune/Learning Rate": 1.7939691900179507e-05, "Full-finetune/Loss": 0.8380491733551025, "Full-finetune/Loss (Raw)": 0.9540600776672363, "Full-finetune/Step": 1204, "Full-finetune/Step Time": 6.784975901246071} {"Full-finetune/Learning Rate": 1.79359030181927e-05, "Full-finetune/Loss": 0.8366301655769348, "Full-finetune/Loss (Raw)": 0.7964749932289124, "Full-finetune/Step": 1205, "Full-finetune/Step Time": 6.812546417117119} {"Full-finetune/Learning Rate": 1.7932111056436868e-05, "Full-finetune/Loss": 0.8372998833656311, "Full-finetune/Loss (Raw)": 1.0341215133666992, "Full-finetune/Step": 1206, "Full-finetune/Step Time": 6.794307434931397} {"Full-finetune/Learning Rate": 1.79283160163836e-05, "Full-finetune/Loss": 0.8383467197418213, "Full-finetune/Loss (Raw)": 0.8869859576225281, "Full-finetune/Step": 1207, "Full-finetune/Step Time": 6.802246397361159} {"Full-finetune/Learning Rate": 1.792451789950567e-05, "Full-finetune/Loss": 0.8397351503372192, "Full-finetune/Loss (Raw)": 0.9092578887939453, "Full-finetune/Step": 1208, "Full-finetune/Step Time": 6.802863862365484} {"Full-finetune/Learning Rate": 1.7920716707277054e-05, "Full-finetune/Loss": 0.8400788307189941, "Full-finetune/Loss (Raw)": 0.9666484594345093, "Full-finetune/Step": 1209, "Full-finetune/Step Time": 6.8005499094724655} {"Full-finetune/Learning Rate": 1.7916912441172924e-05, "Full-finetune/Loss": 0.841162919998169, "Full-finetune/Loss (Raw)": 0.8450714945793152, "Full-finetune/Step": 1210, "Full-finetune/Step Time": 6.769695613533258} {"Full-finetune/Learning Rate": 1.7913105102669643e-05, "Full-finetune/Loss": 0.8408120274543762, "Full-finetune/Loss (Raw)": 0.8736854791641235, "Full-finetune/Step": 1211, "Full-finetune/Step Time": 6.7726289220154285} {"Full-finetune/Learning Rate": 1.790929469324476e-05, "Full-finetune/Loss": 0.8410342931747437, "Full-finetune/Loss (Raw)": 0.9645916819572449, "Full-finetune/Step": 1212, "Full-finetune/Step Time": 6.760878564789891} {"Full-finetune/Learning Rate": 1.7905481214377027e-05, "Full-finetune/Loss": 0.8406810164451599, "Full-finetune/Loss (Raw)": 0.8627504706382751, "Full-finetune/Step": 1213, "Full-finetune/Step Time": 6.760504480451345} {"Full-finetune/Learning Rate": 1.790166466754637e-05, "Full-finetune/Loss": 0.8391413688659668, "Full-finetune/Loss (Raw)": 0.7704687714576721, "Full-finetune/Step": 1214, "Full-finetune/Step Time": 6.774971600621939} {"Full-finetune/Learning Rate": 1.7897845054233927e-05, "Full-finetune/Loss": 0.8389235734939575, "Full-finetune/Loss (Raw)": 0.9227709770202637, "Full-finetune/Step": 1215, "Full-finetune/Step Time": 6.775680489838123} {"Full-finetune/Learning Rate": 1.7894022375922006e-05, "Full-finetune/Loss": 0.8365635871887207, "Full-finetune/Loss (Raw)": 0.34587693214416504, "Full-finetune/Step": 1216, "Full-finetune/Step Time": 6.785889502614737} {"Full-finetune/Learning Rate": 1.7890196634094122e-05, "Full-finetune/Loss": 0.8376582264900208, "Full-finetune/Loss (Raw)": 1.0219714641571045, "Full-finetune/Step": 1217, "Full-finetune/Step Time": 6.789586968719959} {"Full-finetune/Learning Rate": 1.7886367830234968e-05, "Full-finetune/Loss": 0.8376009464263916, "Full-finetune/Loss (Raw)": 0.9564476609230042, "Full-finetune/Step": 1218, "Full-finetune/Step Time": 6.775007706135511} {"Full-finetune/Learning Rate": 1.788253596583043e-05, "Full-finetune/Loss": 0.8334478139877319, "Full-finetune/Loss (Raw)": 0.3002295196056366, "Full-finetune/Step": 1219, "Full-finetune/Step Time": 6.7955763433128595} {"Full-finetune/Learning Rate": 1.787870104236757e-05, "Full-finetune/Loss": 0.8327224254608154, "Full-finetune/Loss (Raw)": 0.8609265089035034, "Full-finetune/Step": 1220, "Full-finetune/Step Time": 6.794979568570852} {"Full-finetune/Learning Rate": 1.7874863061334658e-05, "Full-finetune/Loss": 0.8332200646400452, "Full-finetune/Loss (Raw)": 0.8419864773750305, "Full-finetune/Step": 1221, "Full-finetune/Step Time": 6.805129872635007} {"Full-finetune/Learning Rate": 1.7871022024221133e-05, "Full-finetune/Loss": 0.8327932357788086, "Full-finetune/Loss (Raw)": 0.827216386795044, "Full-finetune/Step": 1222, "Full-finetune/Step Time": 6.816330414265394} {"Full-finetune/Learning Rate": 1.7867177932517634e-05, "Full-finetune/Loss": 0.8323101997375488, "Full-finetune/Loss (Raw)": 0.9112842082977295, "Full-finetune/Step": 1223, "Full-finetune/Step Time": 6.8070789240300655} {"Full-finetune/Learning Rate": 1.786333078771597e-05, "Full-finetune/Loss": 0.832134485244751, "Full-finetune/Loss (Raw)": 0.9115092754364014, "Full-finetune/Step": 1224, "Full-finetune/Step Time": 6.808100655674934} {"Full-finetune/Learning Rate": 1.785948059130915e-05, "Full-finetune/Loss": 0.8313838839530945, "Full-finetune/Loss (Raw)": 0.7489634156227112, "Full-finetune/Step": 1225, "Full-finetune/Step Time": 6.793487895280123} {"Full-finetune/Learning Rate": 1.785562734479135e-05, "Full-finetune/Loss": 0.8308996558189392, "Full-finetune/Loss (Raw)": 0.7830807566642761, "Full-finetune/Step": 1226, "Full-finetune/Step Time": 6.784426178783178} {"Full-finetune/Learning Rate": 1.785177104965795e-05, "Full-finetune/Loss": 0.8292272090911865, "Full-finetune/Loss (Raw)": 0.7006474137306213, "Full-finetune/Step": 1227, "Full-finetune/Step Time": 6.792998598888516} {"Full-finetune/Learning Rate": 1.7847911707405494e-05, "Full-finetune/Loss": 0.8288004398345947, "Full-finetune/Loss (Raw)": 0.7840436100959778, "Full-finetune/Step": 1228, "Full-finetune/Step Time": 6.79925418831408} {"Full-finetune/Learning Rate": 1.7844049319531725e-05, "Full-finetune/Loss": 0.8294818997383118, "Full-finetune/Loss (Raw)": 0.9981718063354492, "Full-finetune/Step": 1229, "Full-finetune/Step Time": 6.796064144000411} {"Full-finetune/Learning Rate": 1.7840183887535558e-05, "Full-finetune/Loss": 0.8269577622413635, "Full-finetune/Loss (Raw)": 0.404441773891449, "Full-finetune/Step": 1230, "Full-finetune/Step Time": 6.815750455483794} {"Full-finetune/Learning Rate": 1.7836315412917088e-05, "Full-finetune/Loss": 0.8269855976104736, "Full-finetune/Loss (Raw)": 0.99700927734375, "Full-finetune/Step": 1231, "Full-finetune/Step Time": 6.809698352590203} {"Full-finetune/Learning Rate": 1.78324438971776e-05, "Full-finetune/Loss": 0.8260735273361206, "Full-finetune/Loss (Raw)": 0.8551074266433716, "Full-finetune/Step": 1232, "Full-finetune/Step Time": 6.808347033336759} {"Full-finetune/Learning Rate": 1.782856934181955e-05, "Full-finetune/Loss": 0.826607882976532, "Full-finetune/Loss (Raw)": 0.9230455160140991, "Full-finetune/Step": 1233, "Full-finetune/Step Time": 6.794404258951545} {"Full-finetune/Learning Rate": 1.782469174834658e-05, "Full-finetune/Loss": 0.8261194825172424, "Full-finetune/Loss (Raw)": 0.7156929969787598, "Full-finetune/Step": 1234, "Full-finetune/Step Time": 6.802733873948455} {"Full-finetune/Learning Rate": 1.7820811118263503e-05, "Full-finetune/Loss": 0.8255933523178101, "Full-finetune/Loss (Raw)": 0.8714948296546936, "Full-finetune/Step": 1235, "Full-finetune/Step Time": 6.800869097933173} {"Full-finetune/Learning Rate": 1.7816927453076324e-05, "Full-finetune/Loss": 0.8252172470092773, "Full-finetune/Loss (Raw)": 0.9821348190307617, "Full-finetune/Step": 1236, "Full-finetune/Step Time": 6.796938732266426} {"Full-finetune/Learning Rate": 1.781304075429221e-05, "Full-finetune/Loss": 0.8279078006744385, "Full-finetune/Loss (Raw)": 0.97369384765625, "Full-finetune/Step": 1237, "Full-finetune/Step Time": 6.798636611551046} {"Full-finetune/Learning Rate": 1.7809151023419517e-05, "Full-finetune/Loss": 0.828752875328064, "Full-finetune/Loss (Raw)": 1.0062929391860962, "Full-finetune/Step": 1238, "Full-finetune/Step Time": 6.801070973277092} {"Full-finetune/Learning Rate": 1.7805258261967774e-05, "Full-finetune/Loss": 0.827536940574646, "Full-finetune/Loss (Raw)": 0.8953570127487183, "Full-finetune/Step": 1239, "Full-finetune/Step Time": 6.808143908157945} {"Full-finetune/Learning Rate": 1.780136247144768e-05, "Full-finetune/Loss": 0.8279706239700317, "Full-finetune/Loss (Raw)": 0.86097252368927, "Full-finetune/Step": 1240, "Full-finetune/Step Time": 6.80599925108254} {"Full-finetune/Learning Rate": 1.7797463653371125e-05, "Full-finetune/Loss": 0.8274974822998047, "Full-finetune/Loss (Raw)": 0.8083140850067139, "Full-finetune/Step": 1241, "Full-finetune/Step Time": 6.809877395629883} {"Full-finetune/Learning Rate": 1.7793561809251153e-05, "Full-finetune/Loss": 0.8284239768981934, "Full-finetune/Loss (Raw)": 0.8926845788955688, "Full-finetune/Step": 1242, "Full-finetune/Step Time": 6.7832333873957396} {"Full-finetune/Learning Rate": 1.7789656940602003e-05, "Full-finetune/Loss": 0.8287817239761353, "Full-finetune/Loss (Raw)": 0.9336892366409302, "Full-finetune/Step": 1243, "Full-finetune/Step Time": 6.776747789233923} {"Full-finetune/Learning Rate": 1.7785749048939076e-05, "Full-finetune/Loss": 0.8278535604476929, "Full-finetune/Loss (Raw)": 0.8651845455169678, "Full-finetune/Step": 1244, "Full-finetune/Step Time": 6.778927953913808} {"Full-finetune/Learning Rate": 1.7781838135778945e-05, "Full-finetune/Loss": 0.82756507396698, "Full-finetune/Loss (Raw)": 0.7683472037315369, "Full-finetune/Step": 1245, "Full-finetune/Step Time": 6.769073823466897} {"Full-finetune/Learning Rate": 1.777792420263936e-05, "Full-finetune/Loss": 0.8269739747047424, "Full-finetune/Loss (Raw)": 0.8274717926979065, "Full-finetune/Step": 1246, "Full-finetune/Step Time": 6.790615640580654} {"Full-finetune/Learning Rate": 1.7774007251039246e-05, "Full-finetune/Loss": 0.8299432396888733, "Full-finetune/Loss (Raw)": 0.971163272857666, "Full-finetune/Step": 1247, "Full-finetune/Step Time": 6.77556187659502} {"Full-finetune/Learning Rate": 1.777008728249869e-05, "Full-finetune/Loss": 0.828622579574585, "Full-finetune/Loss (Raw)": 0.7117074131965637, "Full-finetune/Step": 1248, "Full-finetune/Step Time": 6.779787829145789} {"Full-finetune/Learning Rate": 1.776616429853896e-05, "Full-finetune/Loss": 0.8272868394851685, "Full-finetune/Loss (Raw)": 0.8182805776596069, "Full-finetune/Step": 1249, "Full-finetune/Step Time": 6.7690923027694225} {"Full-finetune/Learning Rate": 1.7762238300682484e-05, "Full-finetune/Loss": 0.8273539543151855, "Full-finetune/Loss (Raw)": 0.9110579490661621, "Full-finetune/Step": 1250, "Full-finetune/Step Time": 6.748560592532158} {"Full-finetune/Learning Rate": 1.775830929045287e-05, "Full-finetune/Loss": 0.8283849954605103, "Full-finetune/Loss (Raw)": 0.907021164894104, "Full-finetune/Step": 1251, "Full-finetune/Step Time": 6.734472654759884} {"Full-finetune/Learning Rate": 1.7754377269374893e-05, "Full-finetune/Loss": 0.826002299785614, "Full-finetune/Loss (Raw)": 0.7742370367050171, "Full-finetune/Step": 1252, "Full-finetune/Step Time": 6.739230712875724} {"Full-finetune/Learning Rate": 1.7750442238974483e-05, "Full-finetune/Loss": 0.8256337642669678, "Full-finetune/Loss (Raw)": 0.7931667566299438, "Full-finetune/Step": 1253, "Full-finetune/Step Time": 6.758094813674688} {"Full-finetune/Learning Rate": 1.7746504200778756e-05, "Full-finetune/Loss": 0.8253178596496582, "Full-finetune/Loss (Raw)": 0.8716867566108704, "Full-finetune/Step": 1254, "Full-finetune/Step Time": 6.771579187363386} {"Full-finetune/Learning Rate": 1.7742563156315987e-05, "Full-finetune/Loss": 0.8262238502502441, "Full-finetune/Loss (Raw)": 0.9753689765930176, "Full-finetune/Step": 1255, "Full-finetune/Step Time": 6.772973587736487} {"Full-finetune/Learning Rate": 1.773861910711562e-05, "Full-finetune/Loss": 0.8272780776023865, "Full-finetune/Loss (Raw)": 0.9148932695388794, "Full-finetune/Step": 1256, "Full-finetune/Step Time": 6.768822556361556} {"Full-finetune/Learning Rate": 1.773467205470826e-05, "Full-finetune/Loss": 0.8243010640144348, "Full-finetune/Loss (Raw)": 0.5802292227745056, "Full-finetune/Step": 1257, "Full-finetune/Step Time": 6.794586515054107} {"Full-finetune/Learning Rate": 1.7730722000625683e-05, "Full-finetune/Loss": 0.8259665966033936, "Full-finetune/Loss (Raw)": 0.8770301342010498, "Full-finetune/Step": 1258, "Full-finetune/Step Time": 6.782614503055811} {"Full-finetune/Learning Rate": 1.7726768946400825e-05, "Full-finetune/Loss": 0.8244544863700867, "Full-finetune/Loss (Raw)": 0.766632080078125, "Full-finetune/Step": 1259, "Full-finetune/Step Time": 6.793649971485138} {"Full-finetune/Learning Rate": 1.772281289356779e-05, "Full-finetune/Loss": 0.8256217241287231, "Full-finetune/Loss (Raw)": 1.0992563962936401, "Full-finetune/Step": 1260, "Full-finetune/Step Time": 6.795413123443723} {"Full-finetune/Learning Rate": 1.771885384366185e-05, "Full-finetune/Loss": 0.8245904445648193, "Full-finetune/Loss (Raw)": 0.747715413570404, "Full-finetune/Step": 1261, "Full-finetune/Step Time": 6.793907914310694} {"Full-finetune/Learning Rate": 1.7714891798219432e-05, "Full-finetune/Loss": 0.8249192237854004, "Full-finetune/Loss (Raw)": 0.9116218686103821, "Full-finetune/Step": 1262, "Full-finetune/Step Time": 6.789076862856746} {"Full-finetune/Learning Rate": 1.7710926758778123e-05, "Full-finetune/Loss": 0.8247784376144409, "Full-finetune/Loss (Raw)": 0.9320042729377747, "Full-finetune/Step": 1263, "Full-finetune/Step Time": 6.784975638613105} {"Full-finetune/Learning Rate": 1.7706958726876685e-05, "Full-finetune/Loss": 0.8249471187591553, "Full-finetune/Loss (Raw)": 0.8758780360221863, "Full-finetune/Step": 1264, "Full-finetune/Step Time": 6.782567663118243} {"Full-finetune/Learning Rate": 1.770298770405503e-05, "Full-finetune/Loss": 0.820307731628418, "Full-finetune/Loss (Raw)": 0.37835004925727844, "Full-finetune/Step": 1265, "Full-finetune/Step Time": 6.800058865919709} {"Full-finetune/Learning Rate": 1.7699013691854238e-05, "Full-finetune/Loss": 0.8199815154075623, "Full-finetune/Loss (Raw)": 0.8382087349891663, "Full-finetune/Step": 1266, "Full-finetune/Step Time": 6.804401038214564} {"Full-finetune/Learning Rate": 1.769503669181654e-05, "Full-finetune/Loss": 0.8208618760108948, "Full-finetune/Loss (Raw)": 0.9421126842498779, "Full-finetune/Step": 1267, "Full-finetune/Step Time": 6.789257220923901} {"Full-finetune/Learning Rate": 1.7691056705485333e-05, "Full-finetune/Loss": 0.821492075920105, "Full-finetune/Loss (Raw)": 0.9857749938964844, "Full-finetune/Step": 1268, "Full-finetune/Step Time": 6.793308809399605} {"Full-finetune/Learning Rate": 1.7687073734405177e-05, "Full-finetune/Loss": 0.8212364912033081, "Full-finetune/Loss (Raw)": 0.8206332921981812, "Full-finetune/Step": 1269, "Full-finetune/Step Time": 6.794832302257419} {"Full-finetune/Learning Rate": 1.768308778012178e-05, "Full-finetune/Loss": 0.8262830972671509, "Full-finetune/Loss (Raw)": 0.9435712099075317, "Full-finetune/Step": 1270, "Full-finetune/Step Time": 6.785142311826348} {"Full-finetune/Learning Rate": 1.767909884418202e-05, "Full-finetune/Loss": 0.8273637294769287, "Full-finetune/Loss (Raw)": 0.9912017583847046, "Full-finetune/Step": 1271, "Full-finetune/Step Time": 6.7692662458866835} {"Full-finetune/Learning Rate": 1.7675106928133915e-05, "Full-finetune/Loss": 0.8261996507644653, "Full-finetune/Loss (Raw)": 0.7210753560066223, "Full-finetune/Step": 1272, "Full-finetune/Step Time": 6.777260737493634} {"Full-finetune/Learning Rate": 1.7671112033526655e-05, "Full-finetune/Loss": 0.8254801034927368, "Full-finetune/Loss (Raw)": 0.765632688999176, "Full-finetune/Step": 1273, "Full-finetune/Step Time": 6.766339056193829} {"Full-finetune/Learning Rate": 1.7667114161910586e-05, "Full-finetune/Loss": 0.8245373368263245, "Full-finetune/Loss (Raw)": 0.8203203082084656, "Full-finetune/Step": 1274, "Full-finetune/Step Time": 6.757435774430633} {"Full-finetune/Learning Rate": 1.7663113314837192e-05, "Full-finetune/Loss": 0.8272151947021484, "Full-finetune/Loss (Raw)": 1.0295301675796509, "Full-finetune/Step": 1275, "Full-finetune/Step Time": 6.749073192477226} {"Full-finetune/Learning Rate": 1.7659109493859134e-05, "Full-finetune/Loss": 0.8311713337898254, "Full-finetune/Loss (Raw)": 0.84972083568573, "Full-finetune/Step": 1276, "Full-finetune/Step Time": 6.724526224657893} {"Full-finetune/Learning Rate": 1.7655102700530212e-05, "Full-finetune/Loss": 0.8299182653427124, "Full-finetune/Loss (Raw)": 0.8966649770736694, "Full-finetune/Step": 1277, "Full-finetune/Step Time": 6.727374805137515} {"Full-finetune/Learning Rate": 1.7651092936405385e-05, "Full-finetune/Loss": 0.8285183906555176, "Full-finetune/Loss (Raw)": 0.6057193279266357, "Full-finetune/Step": 1278, "Full-finetune/Step Time": 6.733655426651239} {"Full-finetune/Learning Rate": 1.7647080203040765e-05, "Full-finetune/Loss": 0.8292561769485474, "Full-finetune/Loss (Raw)": 0.873285710811615, "Full-finetune/Step": 1279, "Full-finetune/Step Time": 6.735330492258072} {"Full-finetune/Learning Rate": 1.7643064501993614e-05, "Full-finetune/Loss": 0.8306213021278381, "Full-finetune/Loss (Raw)": 1.0056294202804565, "Full-finetune/Step": 1280, "Full-finetune/Step Time": 6.715021908283234} {"Full-finetune/Learning Rate": 1.763904583482235e-05, "Full-finetune/Loss": 0.8304795622825623, "Full-finetune/Loss (Raw)": 0.8925800323486328, "Full-finetune/Step": 1281, "Full-finetune/Step Time": 6.6899007223546505} {"Full-finetune/Learning Rate": 1.7635024203086532e-05, "Full-finetune/Loss": 0.8347346782684326, "Full-finetune/Loss (Raw)": 0.8681256175041199, "Full-finetune/Step": 1282, "Full-finetune/Step Time": 6.672630395740271} {"Full-finetune/Learning Rate": 1.7630999608346888e-05, "Full-finetune/Loss": 0.8375146389007568, "Full-finetune/Loss (Raw)": 0.6913917660713196, "Full-finetune/Step": 1283, "Full-finetune/Step Time": 6.666189383715391} {"Full-finetune/Learning Rate": 1.7626972052165275e-05, "Full-finetune/Loss": 0.836275577545166, "Full-finetune/Loss (Raw)": 0.8466613292694092, "Full-finetune/Step": 1284, "Full-finetune/Step Time": 6.669809024780989} {"Full-finetune/Learning Rate": 1.7622941536104715e-05, "Full-finetune/Loss": 0.8363896608352661, "Full-finetune/Loss (Raw)": 0.9696932435035706, "Full-finetune/Step": 1285, "Full-finetune/Step Time": 6.68033254891634} {"Full-finetune/Learning Rate": 1.7618908061729373e-05, "Full-finetune/Loss": 0.8368505835533142, "Full-finetune/Loss (Raw)": 0.8415377140045166, "Full-finetune/Step": 1286, "Full-finetune/Step Time": 6.695986580103636} {"Full-finetune/Learning Rate": 1.7614871630604554e-05, "Full-finetune/Loss": 0.8375994563102722, "Full-finetune/Loss (Raw)": 0.8741645216941833, "Full-finetune/Step": 1287, "Full-finetune/Step Time": 6.6954427640885115} {"Full-finetune/Learning Rate": 1.761083224429672e-05, "Full-finetune/Loss": 0.837455153465271, "Full-finetune/Loss (Raw)": 0.8234298229217529, "Full-finetune/Step": 1288, "Full-finetune/Step Time": 6.677173791453242} {"Full-finetune/Learning Rate": 1.760678990437349e-05, "Full-finetune/Loss": 0.8376500010490417, "Full-finetune/Loss (Raw)": 0.8252922296524048, "Full-finetune/Step": 1289, "Full-finetune/Step Time": 6.661296309903264} {"Full-finetune/Learning Rate": 1.76027446124036e-05, "Full-finetune/Loss": 0.8380101919174194, "Full-finetune/Loss (Raw)": 0.9955755472183228, "Full-finetune/Step": 1290, "Full-finetune/Step Time": 6.655515395104885} {"Full-finetune/Learning Rate": 1.759869636995696e-05, "Full-finetune/Loss": 0.8393830060958862, "Full-finetune/Loss (Raw)": 0.7860326170921326, "Full-finetune/Step": 1291, "Full-finetune/Step Time": 6.6526609268039465} {"Full-finetune/Learning Rate": 1.7594645178604614e-05, "Full-finetune/Loss": 0.8375992774963379, "Full-finetune/Loss (Raw)": 0.8361383676528931, "Full-finetune/Step": 1292, "Full-finetune/Step Time": 6.647145668044686} {"Full-finetune/Learning Rate": 1.7590591039918744e-05, "Full-finetune/Loss": 0.8418110013008118, "Full-finetune/Loss (Raw)": 0.8964354395866394, "Full-finetune/Step": 1293, "Full-finetune/Step Time": 6.6291966661810875} {"Full-finetune/Learning Rate": 1.7586533955472686e-05, "Full-finetune/Loss": 0.8428661823272705, "Full-finetune/Loss (Raw)": 0.9342265725135803, "Full-finetune/Step": 1294, "Full-finetune/Step Time": 6.632384542375803} {"Full-finetune/Learning Rate": 1.7582473926840916e-05, "Full-finetune/Loss": 0.8445011973381042, "Full-finetune/Loss (Raw)": 0.8396636843681335, "Full-finetune/Step": 1295, "Full-finetune/Step Time": 6.6301477793604136} {"Full-finetune/Learning Rate": 1.7578410955599046e-05, "Full-finetune/Loss": 0.844541072845459, "Full-finetune/Loss (Raw)": 0.7957447171211243, "Full-finetune/Step": 1296, "Full-finetune/Step Time": 6.634611876681447} {"Full-finetune/Learning Rate": 1.7574345043323843e-05, "Full-finetune/Loss": 0.8436567783355713, "Full-finetune/Loss (Raw)": 0.8154643774032593, "Full-finetune/Step": 1297, "Full-finetune/Step Time": 6.648236446082592} {"Full-finetune/Learning Rate": 1.7570276191593202e-05, "Full-finetune/Loss": 0.8457865118980408, "Full-finetune/Loss (Raw)": 0.7382404208183289, "Full-finetune/Step": 1298, "Full-finetune/Step Time": 6.625754313543439} {"Full-finetune/Learning Rate": 1.7566204401986172e-05, "Full-finetune/Loss": 0.8432849049568176, "Full-finetune/Loss (Raw)": 0.6621083617210388, "Full-finetune/Step": 1299, "Full-finetune/Step Time": 6.630000712350011} {"Full-finetune/Learning Rate": 1.7562129676082933e-05, "Full-finetune/Loss": 0.8425208330154419, "Full-finetune/Loss (Raw)": 0.8067789673805237, "Full-finetune/Step": 1300, "Full-finetune/Step Time": 6.626982422545552} {"Full-finetune/Learning Rate": 1.75580520154648e-05, "Full-finetune/Loss": 0.8422329425811768, "Full-finetune/Loss (Raw)": 0.8436093330383301, "Full-finetune/Step": 1301, "Full-finetune/Step Time": 6.644100673496723} {"Full-finetune/Learning Rate": 1.755397142171424e-05, "Full-finetune/Loss": 0.8460230827331543, "Full-finetune/Loss (Raw)": 0.8393176198005676, "Full-finetune/Step": 1302, "Full-finetune/Step Time": 6.646479116752744} {"Full-finetune/Learning Rate": 1.7549887896414853e-05, "Full-finetune/Loss": 0.8463137149810791, "Full-finetune/Loss (Raw)": 0.8368206024169922, "Full-finetune/Step": 1303, "Full-finetune/Step Time": 6.629278955981135} {"Full-finetune/Learning Rate": 1.7545801441151368e-05, "Full-finetune/Loss": 0.8473219275474548, "Full-finetune/Loss (Raw)": 0.9215723276138306, "Full-finetune/Step": 1304, "Full-finetune/Step Time": 6.634607695043087} {"Full-finetune/Learning Rate": 1.7541712057509666e-05, "Full-finetune/Loss": 0.8515180945396423, "Full-finetune/Loss (Raw)": 0.8256611824035645, "Full-finetune/Step": 1305, "Full-finetune/Step Time": 6.619273090735078} {"Full-finetune/Learning Rate": 1.7537619747076752e-05, "Full-finetune/Loss": 0.8553872108459473, "Full-finetune/Loss (Raw)": 0.8161569237709045, "Full-finetune/Step": 1306, "Full-finetune/Step Time": 6.616552459076047} {"Full-finetune/Learning Rate": 1.7533524511440777e-05, "Full-finetune/Loss": 0.8551402688026428, "Full-finetune/Loss (Raw)": 0.9950044751167297, "Full-finetune/Step": 1307, "Full-finetune/Step Time": 6.598968368023634} {"Full-finetune/Learning Rate": 1.7529426352191014e-05, "Full-finetune/Loss": 0.8569211959838867, "Full-finetune/Loss (Raw)": 1.010280728340149, "Full-finetune/Step": 1308, "Full-finetune/Step Time": 6.5816826820373535} {"Full-finetune/Learning Rate": 1.752532527091789e-05, "Full-finetune/Loss": 0.856023907661438, "Full-finetune/Loss (Raw)": 0.8781889081001282, "Full-finetune/Step": 1309, "Full-finetune/Step Time": 6.59929865039885} {"Full-finetune/Learning Rate": 1.7521221269212944e-05, "Full-finetune/Loss": 0.8581767082214355, "Full-finetune/Loss (Raw)": 0.834263265132904, "Full-finetune/Step": 1310, "Full-finetune/Step Time": 6.5973298996686935} {"Full-finetune/Learning Rate": 1.751711434866886e-05, "Full-finetune/Loss": 0.8577079772949219, "Full-finetune/Loss (Raw)": 0.897752583026886, "Full-finetune/Step": 1311, "Full-finetune/Step Time": 6.599600167945027} {"Full-finetune/Learning Rate": 1.751300451087946e-05, "Full-finetune/Loss": 0.8565887212753296, "Full-finetune/Loss (Raw)": 0.5684159398078918, "Full-finetune/Step": 1312, "Full-finetune/Step Time": 6.6027966234833} {"Full-finetune/Learning Rate": 1.7508891757439687e-05, "Full-finetune/Loss": 0.8564924001693726, "Full-finetune/Loss (Raw)": 0.8777603507041931, "Full-finetune/Step": 1313, "Full-finetune/Step Time": 6.609229741618037} {"Full-finetune/Learning Rate": 1.7504776089945626e-05, "Full-finetune/Loss": 0.8558322191238403, "Full-finetune/Loss (Raw)": 0.934417724609375, "Full-finetune/Step": 1314, "Full-finetune/Step Time": 6.616146953776479} {"Full-finetune/Learning Rate": 1.7500657509994478e-05, "Full-finetune/Loss": 0.860390305519104, "Full-finetune/Loss (Raw)": 0.9237709641456604, "Full-finetune/Step": 1315, "Full-finetune/Step Time": 6.598480666056275} {"Full-finetune/Learning Rate": 1.7496536019184588e-05, "Full-finetune/Loss": 0.8613675236701965, "Full-finetune/Loss (Raw)": 1.0497280359268188, "Full-finetune/Step": 1316, "Full-finetune/Step Time": 6.602090677246451} {"Full-finetune/Learning Rate": 1.749241161911543e-05, "Full-finetune/Loss": 0.8611504435539246, "Full-finetune/Loss (Raw)": 0.9466410875320435, "Full-finetune/Step": 1317, "Full-finetune/Step Time": 6.594055471941829} {"Full-finetune/Learning Rate": 1.7488284311387597e-05, "Full-finetune/Loss": 0.8609941005706787, "Full-finetune/Loss (Raw)": 0.8549086451530457, "Full-finetune/Step": 1318, "Full-finetune/Step Time": 6.594386784359813} {"Full-finetune/Learning Rate": 1.7484154097602822e-05, "Full-finetune/Loss": 0.86080002784729, "Full-finetune/Loss (Raw)": 0.8936247825622559, "Full-finetune/Step": 1319, "Full-finetune/Step Time": 6.591690666973591} {"Full-finetune/Learning Rate": 1.7480020979363956e-05, "Full-finetune/Loss": 0.8593383431434631, "Full-finetune/Loss (Raw)": 0.772367000579834, "Full-finetune/Step": 1320, "Full-finetune/Step Time": 6.59192206710577} {"Full-finetune/Learning Rate": 1.747588495827498e-05, "Full-finetune/Loss": 0.8593174815177917, "Full-finetune/Loss (Raw)": 0.9089407324790955, "Full-finetune/Step": 1321, "Full-finetune/Step Time": 6.59465735591948} {"Full-finetune/Learning Rate": 1.7471746035941007e-05, "Full-finetune/Loss": 0.8590686321258545, "Full-finetune/Loss (Raw)": 0.8885733485221863, "Full-finetune/Step": 1322, "Full-finetune/Step Time": 6.583670539781451} {"Full-finetune/Learning Rate": 1.7467604213968274e-05, "Full-finetune/Loss": 0.8594400882720947, "Full-finetune/Loss (Raw)": 0.9343035221099854, "Full-finetune/Step": 1323, "Full-finetune/Step Time": 6.5944829899817705} {"Full-finetune/Learning Rate": 1.746345949396414e-05, "Full-finetune/Loss": 0.860036313533783, "Full-finetune/Loss (Raw)": 0.96027010679245, "Full-finetune/Step": 1324, "Full-finetune/Step Time": 6.595694093033671} {"Full-finetune/Learning Rate": 1.7459311877537085e-05, "Full-finetune/Loss": 0.8601734638214111, "Full-finetune/Loss (Raw)": 0.9834255576133728, "Full-finetune/Step": 1325, "Full-finetune/Step Time": 6.612515868619084} {"Full-finetune/Learning Rate": 1.745516136629672e-05, "Full-finetune/Loss": 0.8605295419692993, "Full-finetune/Loss (Raw)": 0.9514408707618713, "Full-finetune/Step": 1326, "Full-finetune/Step Time": 6.605024565011263} {"Full-finetune/Learning Rate": 1.7451007961853778e-05, "Full-finetune/Loss": 0.8589027523994446, "Full-finetune/Loss (Raw)": 0.7457955479621887, "Full-finetune/Step": 1327, "Full-finetune/Step Time": 6.640957713127136} {"Full-finetune/Learning Rate": 1.7446851665820118e-05, "Full-finetune/Loss": 0.8596360683441162, "Full-finetune/Loss (Raw)": 1.04732084274292, "Full-finetune/Step": 1328, "Full-finetune/Step Time": 6.6354338247329} {"Full-finetune/Learning Rate": 1.744269247980871e-05, "Full-finetune/Loss": 0.8604437112808228, "Full-finetune/Loss (Raw)": 1.0852904319763184, "Full-finetune/Step": 1329, "Full-finetune/Step Time": 6.617393035441637} {"Full-finetune/Learning Rate": 1.7438530405433663e-05, "Full-finetune/Loss": 0.857339084148407, "Full-finetune/Loss (Raw)": 0.682621419429779, "Full-finetune/Step": 1330, "Full-finetune/Step Time": 6.598898423835635} {"Full-finetune/Learning Rate": 1.7434365444310185e-05, "Full-finetune/Loss": 0.8565748333930969, "Full-finetune/Loss (Raw)": 0.927487313747406, "Full-finetune/Step": 1331, "Full-finetune/Step Time": 6.5927655678242445} {"Full-finetune/Learning Rate": 1.7430197598054622e-05, "Full-finetune/Loss": 0.8549529314041138, "Full-finetune/Loss (Raw)": 0.7464579343795776, "Full-finetune/Step": 1332, "Full-finetune/Step Time": 6.595563232898712} {"Full-finetune/Learning Rate": 1.7426026868284438e-05, "Full-finetune/Loss": 0.8557116389274597, "Full-finetune/Loss (Raw)": 0.8935924172401428, "Full-finetune/Step": 1333, "Full-finetune/Step Time": 6.571877999231219} {"Full-finetune/Learning Rate": 1.7421853256618204e-05, "Full-finetune/Loss": 0.8548535108566284, "Full-finetune/Loss (Raw)": 0.9242812991142273, "Full-finetune/Step": 1334, "Full-finetune/Step Time": 6.57552040182054} {"Full-finetune/Learning Rate": 1.741767676467562e-05, "Full-finetune/Loss": 0.8549709916114807, "Full-finetune/Loss (Raw)": 0.9020230174064636, "Full-finetune/Step": 1335, "Full-finetune/Step Time": 6.567621933296323} {"Full-finetune/Learning Rate": 1.7413497394077502e-05, "Full-finetune/Loss": 0.8549219369888306, "Full-finetune/Loss (Raw)": 0.9029697179794312, "Full-finetune/Step": 1336, "Full-finetune/Step Time": 6.5632516127079725} {"Full-finetune/Learning Rate": 1.7409315146445783e-05, "Full-finetune/Loss": 0.8548117280006409, "Full-finetune/Loss (Raw)": 0.9525473713874817, "Full-finetune/Step": 1337, "Full-finetune/Step Time": 6.565524330362678} {"Full-finetune/Learning Rate": 1.7405130023403513e-05, "Full-finetune/Loss": 0.850662350654602, "Full-finetune/Loss (Raw)": 0.3139492869377136, "Full-finetune/Step": 1338, "Full-finetune/Step Time": 6.585956089198589} {"Full-finetune/Learning Rate": 1.740094202657485e-05, "Full-finetune/Loss": 0.8497222661972046, "Full-finetune/Loss (Raw)": 0.7533538341522217, "Full-finetune/Step": 1339, "Full-finetune/Step Time": 6.591602213680744} {"Full-finetune/Learning Rate": 1.7396751157585078e-05, "Full-finetune/Loss": 0.8488198518753052, "Full-finetune/Loss (Raw)": 0.8490861058235168, "Full-finetune/Step": 1340, "Full-finetune/Step Time": 6.5979632548987865} {"Full-finetune/Learning Rate": 1.739255741806059e-05, "Full-finetune/Loss": 0.848573625087738, "Full-finetune/Loss (Raw)": 0.8312349319458008, "Full-finetune/Step": 1341, "Full-finetune/Step Time": 6.598935263231397} {"Full-finetune/Learning Rate": 1.73883608096289e-05, "Full-finetune/Loss": 0.8498282432556152, "Full-finetune/Loss (Raw)": 0.9310539960861206, "Full-finetune/Step": 1342, "Full-finetune/Step Time": 6.605885159224272} {"Full-finetune/Learning Rate": 1.738416133391862e-05, "Full-finetune/Loss": 0.8488630056381226, "Full-finetune/Loss (Raw)": 0.7992265820503235, "Full-finetune/Step": 1343, "Full-finetune/Step Time": 6.627678090706468} {"Full-finetune/Learning Rate": 1.7379958992559494e-05, "Full-finetune/Loss": 0.8523164391517639, "Full-finetune/Loss (Raw)": 0.7879146933555603, "Full-finetune/Step": 1344, "Full-finetune/Step Time": 6.614695442840457} {"Full-finetune/Learning Rate": 1.7375753787182364e-05, "Full-finetune/Loss": 0.8520946502685547, "Full-finetune/Loss (Raw)": 0.9935813546180725, "Full-finetune/Step": 1345, "Full-finetune/Step Time": 6.614028876647353} {"Full-finetune/Learning Rate": 1.7371545719419188e-05, "Full-finetune/Loss": 0.8514738082885742, "Full-finetune/Loss (Raw)": 0.8769782185554504, "Full-finetune/Step": 1346, "Full-finetune/Step Time": 6.6160006262362} {"Full-finetune/Learning Rate": 1.7367334790903034e-05, "Full-finetune/Loss": 0.8565782904624939, "Full-finetune/Loss (Raw)": 0.9536060690879822, "Full-finetune/Step": 1347, "Full-finetune/Step Time": 6.6142947394400835} {"Full-finetune/Learning Rate": 1.736312100326808e-05, "Full-finetune/Loss": 0.8531731367111206, "Full-finetune/Loss (Raw)": 0.4250691831111908, "Full-finetune/Step": 1348, "Full-finetune/Step Time": 6.635404646396637} {"Full-finetune/Learning Rate": 1.7358904358149625e-05, "Full-finetune/Loss": 0.8539929389953613, "Full-finetune/Loss (Raw)": 0.9469197392463684, "Full-finetune/Step": 1349, "Full-finetune/Step Time": 6.615690365433693} {"Full-finetune/Learning Rate": 1.7354684857184056e-05, "Full-finetune/Loss": 0.8545767664909363, "Full-finetune/Loss (Raw)": 0.9019439816474915, "Full-finetune/Step": 1350, "Full-finetune/Step Time": 6.613892614841461} {"Full-finetune/Learning Rate": 1.735046250200888e-05, "Full-finetune/Loss": 0.854598343372345, "Full-finetune/Loss (Raw)": 0.9140488505363464, "Full-finetune/Step": 1351, "Full-finetune/Step Time": 6.617726471275091} {"Full-finetune/Learning Rate": 1.7346237294262717e-05, "Full-finetune/Loss": 0.850753903388977, "Full-finetune/Loss (Raw)": 0.41942059993743896, "Full-finetune/Step": 1352, "Full-finetune/Step Time": 6.635146426036954} {"Full-finetune/Learning Rate": 1.734200923558528e-05, "Full-finetune/Loss": 0.8515540361404419, "Full-finetune/Loss (Raw)": 0.8513820171356201, "Full-finetune/Step": 1353, "Full-finetune/Step Time": 6.634875770658255} {"Full-finetune/Learning Rate": 1.7337778327617397e-05, "Full-finetune/Loss": 0.8521826267242432, "Full-finetune/Loss (Raw)": 0.8635408282279968, "Full-finetune/Step": 1354, "Full-finetune/Step Time": 6.631466353312135} {"Full-finetune/Learning Rate": 1.733354457200101e-05, "Full-finetune/Loss": 0.8545650839805603, "Full-finetune/Loss (Raw)": 1.0056003332138062, "Full-finetune/Step": 1355, "Full-finetune/Step Time": 6.624327752739191} {"Full-finetune/Learning Rate": 1.7329307970379145e-05, "Full-finetune/Loss": 0.8562961220741272, "Full-finetune/Loss (Raw)": 1.0056124925613403, "Full-finetune/Step": 1356, "Full-finetune/Step Time": 6.61773906648159} {"Full-finetune/Learning Rate": 1.732506852439595e-05, "Full-finetune/Loss": 0.8552864789962769, "Full-finetune/Loss (Raw)": 0.868937075138092, "Full-finetune/Step": 1357, "Full-finetune/Step Time": 6.629908801987767} {"Full-finetune/Learning Rate": 1.7320826235696672e-05, "Full-finetune/Loss": 0.8592557907104492, "Full-finetune/Loss (Raw)": 0.9125196933746338, "Full-finetune/Step": 1358, "Full-finetune/Step Time": 6.610719297081232} {"Full-finetune/Learning Rate": 1.7316581105927658e-05, "Full-finetune/Loss": 0.8576852083206177, "Full-finetune/Loss (Raw)": 0.7959692478179932, "Full-finetune/Step": 1359, "Full-finetune/Step Time": 6.624846246093512} {"Full-finetune/Learning Rate": 1.731233313673636e-05, "Full-finetune/Loss": 0.8583186864852905, "Full-finetune/Loss (Raw)": 0.9361879825592041, "Full-finetune/Step": 1360, "Full-finetune/Step Time": 6.6176913902163506} {"Full-finetune/Learning Rate": 1.7308082329771335e-05, "Full-finetune/Loss": 0.8588829040527344, "Full-finetune/Loss (Raw)": 0.9952791333198547, "Full-finetune/Step": 1361, "Full-finetune/Step Time": 6.618837472051382} {"Full-finetune/Learning Rate": 1.7303828686682233e-05, "Full-finetune/Loss": 0.8600755929946899, "Full-finetune/Loss (Raw)": 0.8683475852012634, "Full-finetune/Step": 1362, "Full-finetune/Step Time": 6.602502699941397} {"Full-finetune/Learning Rate": 1.7299572209119813e-05, "Full-finetune/Loss": 0.8597882986068726, "Full-finetune/Loss (Raw)": 0.8347193598747253, "Full-finetune/Step": 1363, "Full-finetune/Step Time": 6.6034289337694645} {"Full-finetune/Learning Rate": 1.7295312898735933e-05, "Full-finetune/Loss": 0.8583858013153076, "Full-finetune/Loss (Raw)": 0.8026236891746521, "Full-finetune/Step": 1364, "Full-finetune/Step Time": 6.632328080013394} {"Full-finetune/Learning Rate": 1.7291050757183546e-05, "Full-finetune/Loss": 0.8567864894866943, "Full-finetune/Loss (Raw)": 0.7689772248268127, "Full-finetune/Step": 1365, "Full-finetune/Step Time": 6.634629771113396} {"Full-finetune/Learning Rate": 1.7286785786116707e-05, "Full-finetune/Loss": 0.8557876348495483, "Full-finetune/Loss (Raw)": 0.8784380555152893, "Full-finetune/Step": 1366, "Full-finetune/Step Time": 6.629538431763649} {"Full-finetune/Learning Rate": 1.7282517987190567e-05, "Full-finetune/Loss": 0.8550466299057007, "Full-finetune/Loss (Raw)": 0.8005075454711914, "Full-finetune/Step": 1367, "Full-finetune/Step Time": 6.649425990879536} {"Full-finetune/Learning Rate": 1.7278247362061372e-05, "Full-finetune/Loss": 0.8552137017250061, "Full-finetune/Loss (Raw)": 0.8823624849319458, "Full-finetune/Step": 1368, "Full-finetune/Step Time": 6.650220548734069} {"Full-finetune/Learning Rate": 1.7273973912386473e-05, "Full-finetune/Loss": 0.8565195202827454, "Full-finetune/Loss (Raw)": 0.9754626154899597, "Full-finetune/Step": 1369, "Full-finetune/Step Time": 6.660316541790962} {"Full-finetune/Learning Rate": 1.726969763982431e-05, "Full-finetune/Loss": 0.855469822883606, "Full-finetune/Loss (Raw)": 0.7583207488059998, "Full-finetune/Step": 1370, "Full-finetune/Step Time": 6.66178554110229} {"Full-finetune/Learning Rate": 1.7265418546034424e-05, "Full-finetune/Loss": 0.8551596403121948, "Full-finetune/Loss (Raw)": 0.8939864635467529, "Full-finetune/Step": 1371, "Full-finetune/Step Time": 6.6625612042844296} {"Full-finetune/Learning Rate": 1.7261136632677445e-05, "Full-finetune/Loss": 0.8513216376304626, "Full-finetune/Loss (Raw)": 0.3739131987094879, "Full-finetune/Step": 1372, "Full-finetune/Step Time": 6.688656562939286} {"Full-finetune/Learning Rate": 1.7256851901415102e-05, "Full-finetune/Loss": 0.8529129028320312, "Full-finetune/Loss (Raw)": 0.9720302820205688, "Full-finetune/Step": 1373, "Full-finetune/Step Time": 6.689149120822549} {"Full-finetune/Learning Rate": 1.725256435391021e-05, "Full-finetune/Loss": 0.8522977828979492, "Full-finetune/Loss (Raw)": 0.7487432360649109, "Full-finetune/Step": 1374, "Full-finetune/Step Time": 6.681204380467534} {"Full-finetune/Learning Rate": 1.7248273991826692e-05, "Full-finetune/Loss": 0.8520630598068237, "Full-finetune/Loss (Raw)": 0.9411106705665588, "Full-finetune/Step": 1375, "Full-finetune/Step Time": 6.679154509678483} {"Full-finetune/Learning Rate": 1.7243980816829543e-05, "Full-finetune/Loss": 0.8489607572555542, "Full-finetune/Loss (Raw)": 0.31461307406425476, "Full-finetune/Step": 1376, "Full-finetune/Step Time": 6.689497821033001} {"Full-finetune/Learning Rate": 1.723968483058487e-05, "Full-finetune/Loss": 0.8490729331970215, "Full-finetune/Loss (Raw)": 0.8326436281204224, "Full-finetune/Step": 1377, "Full-finetune/Step Time": 6.6989245638251305} {"Full-finetune/Learning Rate": 1.7235386034759853e-05, "Full-finetune/Loss": 0.8494294881820679, "Full-finetune/Loss (Raw)": 0.9566901326179504, "Full-finetune/Step": 1378, "Full-finetune/Step Time": 6.71789950504899} {"Full-finetune/Learning Rate": 1.723108443102278e-05, "Full-finetune/Loss": 0.8469845056533813, "Full-finetune/Loss (Raw)": 0.5940683484077454, "Full-finetune/Step": 1379, "Full-finetune/Step Time": 6.744103334844112} {"Full-finetune/Learning Rate": 1.722678002104301e-05, "Full-finetune/Loss": 0.8475668430328369, "Full-finetune/Loss (Raw)": 0.8487779498100281, "Full-finetune/Step": 1380, "Full-finetune/Step Time": 6.7346122451126575} {"Full-finetune/Learning Rate": 1.722247280649101e-05, "Full-finetune/Loss": 0.848595380783081, "Full-finetune/Loss (Raw)": 0.9248189926147461, "Full-finetune/Step": 1381, "Full-finetune/Step Time": 6.720405740663409} {"Full-finetune/Learning Rate": 1.7218162789038312e-05, "Full-finetune/Loss": 0.8485549688339233, "Full-finetune/Loss (Raw)": 0.86651611328125, "Full-finetune/Step": 1382, "Full-finetune/Step Time": 6.709917342290282} {"Full-finetune/Learning Rate": 1.7213849970357565e-05, "Full-finetune/Loss": 0.8468047380447388, "Full-finetune/Loss (Raw)": 0.751341700553894, "Full-finetune/Step": 1383, "Full-finetune/Step Time": 6.715045668184757} {"Full-finetune/Learning Rate": 1.7209534352122484e-05, "Full-finetune/Loss": 0.8463952541351318, "Full-finetune/Loss (Raw)": 0.8624820709228516, "Full-finetune/Step": 1384, "Full-finetune/Step Time": 6.7169362511485815} {"Full-finetune/Learning Rate": 1.720521593600787e-05, "Full-finetune/Loss": 0.8492496609687805, "Full-finetune/Loss (Raw)": 0.9455903768539429, "Full-finetune/Step": 1385, "Full-finetune/Step Time": 6.693940045312047} {"Full-finetune/Learning Rate": 1.7200894723689626e-05, "Full-finetune/Loss": 0.8490293025970459, "Full-finetune/Loss (Raw)": 0.8488202691078186, "Full-finetune/Step": 1386, "Full-finetune/Step Time": 6.6953258868306875} {"Full-finetune/Learning Rate": 1.7196570716844724e-05, "Full-finetune/Loss": 0.8488596677780151, "Full-finetune/Loss (Raw)": 0.7449234127998352, "Full-finetune/Step": 1387, "Full-finetune/Step Time": 6.690344266593456} {"Full-finetune/Learning Rate": 1.7192243917151228e-05, "Full-finetune/Loss": 0.8475798964500427, "Full-finetune/Loss (Raw)": 0.9354415535926819, "Full-finetune/Step": 1388, "Full-finetune/Step Time": 6.685867104679346} {"Full-finetune/Learning Rate": 1.7187914326288286e-05, "Full-finetune/Loss": 0.8485816717147827, "Full-finetune/Loss (Raw)": 0.8759452700614929, "Full-finetune/Step": 1389, "Full-finetune/Step Time": 6.6878718212246895} {"Full-finetune/Learning Rate": 1.718358194593612e-05, "Full-finetune/Loss": 0.8495984077453613, "Full-finetune/Loss (Raw)": 1.0417568683624268, "Full-finetune/Step": 1390, "Full-finetune/Step Time": 6.6968658193945885} {"Full-finetune/Learning Rate": 1.7179246777776053e-05, "Full-finetune/Loss": 0.848734974861145, "Full-finetune/Loss (Raw)": 0.821487307548523, "Full-finetune/Step": 1391, "Full-finetune/Step Time": 6.7128852885216475} {"Full-finetune/Learning Rate": 1.7174908823490475e-05, "Full-finetune/Loss": 0.8483253717422485, "Full-finetune/Loss (Raw)": 0.8234556913375854, "Full-finetune/Step": 1392, "Full-finetune/Step Time": 6.745361495763063} {"Full-finetune/Learning Rate": 1.717056808476286e-05, "Full-finetune/Loss": 0.8513538837432861, "Full-finetune/Loss (Raw)": 0.7659979462623596, "Full-finetune/Step": 1393, "Full-finetune/Step Time": 6.765043118968606} {"Full-finetune/Learning Rate": 1.716622456327776e-05, "Full-finetune/Loss": 0.8521872758865356, "Full-finetune/Loss (Raw)": 0.944878101348877, "Full-finetune/Step": 1394, "Full-finetune/Step Time": 6.752655370160937} {"Full-finetune/Learning Rate": 1.7161878260720826e-05, "Full-finetune/Loss": 0.8512635231018066, "Full-finetune/Loss (Raw)": 0.8238793611526489, "Full-finetune/Step": 1395, "Full-finetune/Step Time": 6.75593326240778} {"Full-finetune/Learning Rate": 1.7157529178778757e-05, "Full-finetune/Loss": 0.8484060764312744, "Full-finetune/Loss (Raw)": 0.6200209259986877, "Full-finetune/Step": 1396, "Full-finetune/Step Time": 6.764116508886218} {"Full-finetune/Learning Rate": 1.7153177319139352e-05, "Full-finetune/Loss": 0.8488320112228394, "Full-finetune/Loss (Raw)": 0.8751499652862549, "Full-finetune/Step": 1397, "Full-finetune/Step Time": 6.777877474203706} {"Full-finetune/Learning Rate": 1.7148822683491483e-05, "Full-finetune/Loss": 0.8482322692871094, "Full-finetune/Loss (Raw)": 0.8668086528778076, "Full-finetune/Step": 1398, "Full-finetune/Step Time": 6.768633421510458} {"Full-finetune/Learning Rate": 1.7144465273525105e-05, "Full-finetune/Loss": 0.8452531695365906, "Full-finetune/Loss (Raw)": 0.6098735928535461, "Full-finetune/Step": 1399, "Full-finetune/Step Time": 6.7855058163404465} {"Full-finetune/Learning Rate": 1.7140105090931232e-05, "Full-finetune/Loss": 0.8468406200408936, "Full-finetune/Loss (Raw)": 0.9242647290229797, "Full-finetune/Step": 1400, "Full-finetune/Step Time": 6.78153277002275} {"Full-finetune/Learning Rate": 1.7135742137401976e-05, "Full-finetune/Loss": 0.8472098112106323, "Full-finetune/Loss (Raw)": 0.8128930926322937, "Full-finetune/Step": 1401, "Full-finetune/Step Time": 6.779967254027724} {"Full-finetune/Learning Rate": 1.7131376414630506e-05, "Full-finetune/Loss": 0.8437495827674866, "Full-finetune/Loss (Raw)": 0.377407431602478, "Full-finetune/Step": 1402, "Full-finetune/Step Time": 6.800707429647446} {"Full-finetune/Learning Rate": 1.712700792431108e-05, "Full-finetune/Loss": 0.8421012163162231, "Full-finetune/Loss (Raw)": 0.8185385465621948, "Full-finetune/Step": 1403, "Full-finetune/Step Time": 6.80174320563674} {"Full-finetune/Learning Rate": 1.7122636668139022e-05, "Full-finetune/Loss": 0.8423914313316345, "Full-finetune/Loss (Raw)": 0.8868728876113892, "Full-finetune/Step": 1404, "Full-finetune/Step Time": 6.799107614904642} {"Full-finetune/Learning Rate": 1.711826264781073e-05, "Full-finetune/Loss": 0.8407930135726929, "Full-finetune/Loss (Raw)": 0.6920693516731262, "Full-finetune/Step": 1405, "Full-finetune/Step Time": 6.798123134300113} {"Full-finetune/Learning Rate": 1.711388586502368e-05, "Full-finetune/Loss": 0.8426856994628906, "Full-finetune/Loss (Raw)": 0.8479785919189453, "Full-finetune/Step": 1406, "Full-finetune/Step Time": 6.792170654982328} {"Full-finetune/Learning Rate": 1.710950632147641e-05, "Full-finetune/Loss": 0.838752031326294, "Full-finetune/Loss (Raw)": 0.36977851390838623, "Full-finetune/Step": 1407, "Full-finetune/Step Time": 6.8059178702533245} {"Full-finetune/Learning Rate": 1.710512401886854e-05, "Full-finetune/Loss": 0.8365765810012817, "Full-finetune/Loss (Raw)": 0.7271706461906433, "Full-finetune/Step": 1408, "Full-finetune/Step Time": 6.808771001175046} {"Full-finetune/Learning Rate": 1.7100738958900752e-05, "Full-finetune/Loss": 0.8367382287979126, "Full-finetune/Loss (Raw)": 0.9132640361785889, "Full-finetune/Step": 1409, "Full-finetune/Step Time": 6.806808710098267} {"Full-finetune/Learning Rate": 1.7096351143274804e-05, "Full-finetune/Loss": 0.8359375, "Full-finetune/Loss (Raw)": 0.7656423449516296, "Full-finetune/Step": 1410, "Full-finetune/Step Time": 6.835464347153902} {"Full-finetune/Learning Rate": 1.7091960573693523e-05, "Full-finetune/Loss": 0.837300181388855, "Full-finetune/Loss (Raw)": 0.8658110499382019, "Full-finetune/Step": 1411, "Full-finetune/Step Time": 6.824499540030956} {"Full-finetune/Learning Rate": 1.70875672518608e-05, "Full-finetune/Loss": 0.8358436226844788, "Full-finetune/Loss (Raw)": 0.6602256298065186, "Full-finetune/Step": 1412, "Full-finetune/Step Time": 6.8246777560561895} {"Full-finetune/Learning Rate": 1.7083171179481603e-05, "Full-finetune/Loss": 0.8353303670883179, "Full-finetune/Loss (Raw)": 0.903992772102356, "Full-finetune/Step": 1413, "Full-finetune/Step Time": 6.818238971754909} {"Full-finetune/Learning Rate": 1.7078772358261957e-05, "Full-finetune/Loss": 0.8366801738739014, "Full-finetune/Loss (Raw)": 1.0143147706985474, "Full-finetune/Step": 1414, "Full-finetune/Step Time": 6.808295909315348} {"Full-finetune/Learning Rate": 1.707437078990896e-05, "Full-finetune/Loss": 0.8365072011947632, "Full-finetune/Loss (Raw)": 0.8520234227180481, "Full-finetune/Step": 1415, "Full-finetune/Step Time": 6.812885884195566} {"Full-finetune/Learning Rate": 1.7069966476130773e-05, "Full-finetune/Loss": 0.837601900100708, "Full-finetune/Loss (Raw)": 0.9635452032089233, "Full-finetune/Step": 1416, "Full-finetune/Step Time": 6.8116865660995245} {"Full-finetune/Learning Rate": 1.706555941863663e-05, "Full-finetune/Loss": 0.8377221822738647, "Full-finetune/Loss (Raw)": 0.8406965136528015, "Full-finetune/Step": 1417, "Full-finetune/Step Time": 6.811536006629467} {"Full-finetune/Learning Rate": 1.7061149619136818e-05, "Full-finetune/Loss": 0.8355615139007568, "Full-finetune/Loss (Raw)": 0.7190039753913879, "Full-finetune/Step": 1418, "Full-finetune/Step Time": 6.819339778274298} {"Full-finetune/Learning Rate": 1.7056737079342694e-05, "Full-finetune/Loss": 0.8351737260818481, "Full-finetune/Loss (Raw)": 0.7364017963409424, "Full-finetune/Step": 1419, "Full-finetune/Step Time": 6.803746564313769} {"Full-finetune/Learning Rate": 1.7052321800966684e-05, "Full-finetune/Loss": 0.8357000350952148, "Full-finetune/Loss (Raw)": 0.9035058617591858, "Full-finetune/Step": 1420, "Full-finetune/Step Time": 6.804600840434432} {"Full-finetune/Learning Rate": 1.7047903785722268e-05, "Full-finetune/Loss": 0.8351033329963684, "Full-finetune/Loss (Raw)": 0.8200565576553345, "Full-finetune/Step": 1421, "Full-finetune/Step Time": 6.805075803771615} {"Full-finetune/Learning Rate": 1.704348303532399e-05, "Full-finetune/Loss": 0.8338863253593445, "Full-finetune/Loss (Raw)": 0.778448224067688, "Full-finetune/Step": 1422, "Full-finetune/Step Time": 6.801788955926895} {"Full-finetune/Learning Rate": 1.7039059551487457e-05, "Full-finetune/Loss": 0.8347516059875488, "Full-finetune/Loss (Raw)": 0.9504172801971436, "Full-finetune/Step": 1423, "Full-finetune/Step Time": 6.7934788931161165} {"Full-finetune/Learning Rate": 1.703463333592934e-05, "Full-finetune/Loss": 0.8346835970878601, "Full-finetune/Loss (Raw)": 0.7870423793792725, "Full-finetune/Step": 1424, "Full-finetune/Step Time": 6.787599366158247} {"Full-finetune/Learning Rate": 1.7030204390367368e-05, "Full-finetune/Loss": 0.8350297212600708, "Full-finetune/Loss (Raw)": 0.8597597479820251, "Full-finetune/Step": 1425, "Full-finetune/Step Time": 6.783074643462896} {"Full-finetune/Learning Rate": 1.7025772716520324e-05, "Full-finetune/Loss": 0.8353698253631592, "Full-finetune/Loss (Raw)": 0.78177809715271, "Full-finetune/Step": 1426, "Full-finetune/Step Time": 6.807294465601444} {"Full-finetune/Learning Rate": 1.702133831610805e-05, "Full-finetune/Loss": 0.8360908031463623, "Full-finetune/Loss (Raw)": 0.7543966770172119, "Full-finetune/Step": 1427, "Full-finetune/Step Time": 6.807082438841462} {"Full-finetune/Learning Rate": 1.701690119085146e-05, "Full-finetune/Loss": 0.835727334022522, "Full-finetune/Loss (Raw)": 0.7602523565292358, "Full-finetune/Step": 1428, "Full-finetune/Step Time": 6.8144850470125675} {"Full-finetune/Learning Rate": 1.701246134247251e-05, "Full-finetune/Loss": 0.8346813321113586, "Full-finetune/Loss (Raw)": 0.7097225189208984, "Full-finetune/Step": 1429, "Full-finetune/Step Time": 6.80570456571877} {"Full-finetune/Learning Rate": 1.700801877269422e-05, "Full-finetune/Loss": 0.8345316052436829, "Full-finetune/Loss (Raw)": 0.8201543688774109, "Full-finetune/Step": 1430, "Full-finetune/Step Time": 6.808156097307801} {"Full-finetune/Learning Rate": 1.7003573483240666e-05, "Full-finetune/Loss": 0.8338356614112854, "Full-finetune/Loss (Raw)": 0.7477327585220337, "Full-finetune/Step": 1431, "Full-finetune/Step Time": 6.819848395884037} {"Full-finetune/Learning Rate": 1.6999125475836973e-05, "Full-finetune/Loss": 0.8327864408493042, "Full-finetune/Loss (Raw)": 0.7872762084007263, "Full-finetune/Step": 1432, "Full-finetune/Step Time": 6.823534784838557} {"Full-finetune/Learning Rate": 1.6994674752209334e-05, "Full-finetune/Loss": 0.8337180614471436, "Full-finetune/Loss (Raw)": 0.9449127912521362, "Full-finetune/Step": 1433, "Full-finetune/Step Time": 6.824587859213352} {"Full-finetune/Learning Rate": 1.6990221314084976e-05, "Full-finetune/Loss": 0.830262303352356, "Full-finetune/Loss (Raw)": 0.37381425499916077, "Full-finetune/Step": 1434, "Full-finetune/Step Time": 6.828204175457358} {"Full-finetune/Learning Rate": 1.6985765163192204e-05, "Full-finetune/Loss": 0.8295438289642334, "Full-finetune/Loss (Raw)": 0.903041660785675, "Full-finetune/Step": 1435, "Full-finetune/Step Time": 6.835687913000584} {"Full-finetune/Learning Rate": 1.698130630126036e-05, "Full-finetune/Loss": 0.826494038105011, "Full-finetune/Loss (Raw)": 0.6199129819869995, "Full-finetune/Step": 1436, "Full-finetune/Step Time": 6.846404435113072} {"Full-finetune/Learning Rate": 1.697684473001983e-05, "Full-finetune/Loss": 0.8265018463134766, "Full-finetune/Loss (Raw)": 0.8791795969009399, "Full-finetune/Step": 1437, "Full-finetune/Step Time": 6.841006830334663} {"Full-finetune/Learning Rate": 1.6972380451202083e-05, "Full-finetune/Loss": 0.8268994092941284, "Full-finetune/Loss (Raw)": 0.8851509690284729, "Full-finetune/Step": 1438, "Full-finetune/Step Time": 6.836148303002119} {"Full-finetune/Learning Rate": 1.69679134665396e-05, "Full-finetune/Loss": 0.827307939529419, "Full-finetune/Loss (Raw)": 0.9500535130500793, "Full-finetune/Step": 1439, "Full-finetune/Step Time": 6.833298673853278} {"Full-finetune/Learning Rate": 1.696344377776594e-05, "Full-finetune/Loss": 0.8277241587638855, "Full-finetune/Loss (Raw)": 0.6216873526573181, "Full-finetune/Step": 1440, "Full-finetune/Step Time": 6.829976374283433} {"Full-finetune/Learning Rate": 1.69589713866157e-05, "Full-finetune/Loss": 0.8274956941604614, "Full-finetune/Loss (Raw)": 0.8485214710235596, "Full-finetune/Step": 1441, "Full-finetune/Step Time": 6.826959447935224} {"Full-finetune/Learning Rate": 1.6954496294824526e-05, "Full-finetune/Loss": 0.8266018033027649, "Full-finetune/Loss (Raw)": 0.8199905157089233, "Full-finetune/Step": 1442, "Full-finetune/Step Time": 6.82299598865211} {"Full-finetune/Learning Rate": 1.6950018504129112e-05, "Full-finetune/Loss": 0.8258824348449707, "Full-finetune/Loss (Raw)": 0.8316997289657593, "Full-finetune/Step": 1443, "Full-finetune/Step Time": 6.827051926404238} {"Full-finetune/Learning Rate": 1.6945538016267206e-05, "Full-finetune/Loss": 0.8238356113433838, "Full-finetune/Loss (Raw)": 0.7877289652824402, "Full-finetune/Step": 1444, "Full-finetune/Step Time": 6.8258059695363045} {"Full-finetune/Learning Rate": 1.6941054832977598e-05, "Full-finetune/Loss": 0.8230971097946167, "Full-finetune/Loss (Raw)": 0.8521115183830261, "Full-finetune/Step": 1445, "Full-finetune/Step Time": 6.828838430345058} {"Full-finetune/Learning Rate": 1.6936568956000123e-05, "Full-finetune/Loss": 0.8221715092658997, "Full-finetune/Loss (Raw)": 0.7364367246627808, "Full-finetune/Step": 1446, "Full-finetune/Step Time": 6.844738487154245} {"Full-finetune/Learning Rate": 1.693208038707566e-05, "Full-finetune/Loss": 0.8222571611404419, "Full-finetune/Loss (Raw)": 0.9045891165733337, "Full-finetune/Step": 1447, "Full-finetune/Step Time": 6.849859436973929} {"Full-finetune/Learning Rate": 1.6927589127946136e-05, "Full-finetune/Loss": 0.8233252763748169, "Full-finetune/Loss (Raw)": 0.9090811610221863, "Full-finetune/Step": 1448, "Full-finetune/Step Time": 6.841595413163304} {"Full-finetune/Learning Rate": 1.692309518035452e-05, "Full-finetune/Loss": 0.8219921588897705, "Full-finetune/Loss (Raw)": 0.7383034229278564, "Full-finetune/Step": 1449, "Full-finetune/Step Time": 6.845198908820748} {"Full-finetune/Learning Rate": 1.691859854604483e-05, "Full-finetune/Loss": 0.8207459449768066, "Full-finetune/Loss (Raw)": 0.729049801826477, "Full-finetune/Step": 1450, "Full-finetune/Step Time": 6.881322730332613} {"Full-finetune/Learning Rate": 1.6914099226762116e-05, "Full-finetune/Loss": 0.8200057148933411, "Full-finetune/Loss (Raw)": 0.8395628333091736, "Full-finetune/Step": 1451, "Full-finetune/Step Time": 6.87468191049993} {"Full-finetune/Learning Rate": 1.6909597224252478e-05, "Full-finetune/Loss": 0.8197417259216309, "Full-finetune/Loss (Raw)": 0.9264776110649109, "Full-finetune/Step": 1452, "Full-finetune/Step Time": 6.867161840200424} {"Full-finetune/Learning Rate": 1.6905092540263055e-05, "Full-finetune/Loss": 0.8182352781295776, "Full-finetune/Loss (Raw)": 0.7906047105789185, "Full-finetune/Step": 1453, "Full-finetune/Step Time": 6.863257523626089} {"Full-finetune/Learning Rate": 1.690058517654203e-05, "Full-finetune/Loss": 0.8190559148788452, "Full-finetune/Loss (Raw)": 1.0564855337142944, "Full-finetune/Step": 1454, "Full-finetune/Step Time": 6.866664653643966} {"Full-finetune/Learning Rate": 1.689607513483862e-05, "Full-finetune/Loss": 0.8205769062042236, "Full-finetune/Loss (Raw)": 0.9404724836349487, "Full-finetune/Step": 1455, "Full-finetune/Step Time": 6.835214331746101} {"Full-finetune/Learning Rate": 1.6891562416903083e-05, "Full-finetune/Loss": 0.8187629580497742, "Full-finetune/Loss (Raw)": 0.8151410222053528, "Full-finetune/Step": 1456, "Full-finetune/Step Time": 6.837864244356751} {"Full-finetune/Learning Rate": 1.688704702448672e-05, "Full-finetune/Loss": 0.8131662607192993, "Full-finetune/Loss (Raw)": 0.36890918016433716, "Full-finetune/Step": 1457, "Full-finetune/Step Time": 6.855100616812706} {"Full-finetune/Learning Rate": 1.6882528959341865e-05, "Full-finetune/Loss": 0.8145913481712341, "Full-finetune/Loss (Raw)": 0.8650298714637756, "Full-finetune/Step": 1458, "Full-finetune/Step Time": 6.854085957631469} {"Full-finetune/Learning Rate": 1.6878008223221895e-05, "Full-finetune/Loss": 0.8151025772094727, "Full-finetune/Loss (Raw)": 0.9929278492927551, "Full-finetune/Step": 1459, "Full-finetune/Step Time": 6.863282781094313} {"Full-finetune/Learning Rate": 1.687348481788121e-05, "Full-finetune/Loss": 0.8171144723892212, "Full-finetune/Loss (Raw)": 1.003982424736023, "Full-finetune/Step": 1460, "Full-finetune/Step Time": 6.853363409638405} {"Full-finetune/Learning Rate": 1.6868958745075262e-05, "Full-finetune/Loss": 0.8183590769767761, "Full-finetune/Loss (Raw)": 1.0529016256332397, "Full-finetune/Step": 1461, "Full-finetune/Step Time": 6.857588537037373} {"Full-finetune/Learning Rate": 1.6864430006560527e-05, "Full-finetune/Loss": 0.81822270154953, "Full-finetune/Loss (Raw)": 0.9068251848220825, "Full-finetune/Step": 1462, "Full-finetune/Step Time": 6.860638299956918} {"Full-finetune/Learning Rate": 1.685989860409453e-05, "Full-finetune/Loss": 0.8187100887298584, "Full-finetune/Loss (Raw)": 0.9644078016281128, "Full-finetune/Step": 1463, "Full-finetune/Step Time": 6.862215254455805} {"Full-finetune/Learning Rate": 1.6855364539435805e-05, "Full-finetune/Loss": 0.8179864287376404, "Full-finetune/Loss (Raw)": 0.8103391528129578, "Full-finetune/Step": 1464, "Full-finetune/Step Time": 6.866924338042736} {"Full-finetune/Learning Rate": 1.685082781434395e-05, "Full-finetune/Loss": 0.8172544240951538, "Full-finetune/Loss (Raw)": 0.8588569164276123, "Full-finetune/Step": 1465, "Full-finetune/Step Time": 6.860792072489858} {"Full-finetune/Learning Rate": 1.6846288430579565e-05, "Full-finetune/Loss": 0.8215166330337524, "Full-finetune/Loss (Raw)": 0.8594990372657776, "Full-finetune/Step": 1466, "Full-finetune/Step Time": 6.847178313881159} {"Full-finetune/Learning Rate": 1.6841746389904306e-05, "Full-finetune/Loss": 0.8222433924674988, "Full-finetune/Loss (Raw)": 0.8463885188102722, "Full-finetune/Step": 1467, "Full-finetune/Step Time": 6.865151587873697} {"Full-finetune/Learning Rate": 1.683720169408085e-05, "Full-finetune/Loss": 0.8227548599243164, "Full-finetune/Loss (Raw)": 0.9145610332489014, "Full-finetune/Step": 1468, "Full-finetune/Step Time": 6.857731597498059} {"Full-finetune/Learning Rate": 1.6832654344872893e-05, "Full-finetune/Loss": 0.8191996812820435, "Full-finetune/Loss (Raw)": 0.3761710524559021, "Full-finetune/Step": 1469, "Full-finetune/Step Time": 6.885003292933106} {"Full-finetune/Learning Rate": 1.6828104344045186e-05, "Full-finetune/Loss": 0.8182429671287537, "Full-finetune/Loss (Raw)": 0.808590829372406, "Full-finetune/Step": 1470, "Full-finetune/Step Time": 6.863293830305338} {"Full-finetune/Learning Rate": 1.682355169336349e-05, "Full-finetune/Loss": 0.8186800479888916, "Full-finetune/Loss (Raw)": 0.8551672101020813, "Full-finetune/Step": 1471, "Full-finetune/Step Time": 6.837325096130371} {"Full-finetune/Learning Rate": 1.6818996394594603e-05, "Full-finetune/Loss": 0.8185694217681885, "Full-finetune/Loss (Raw)": 0.7737582325935364, "Full-finetune/Step": 1472, "Full-finetune/Step Time": 6.830317920073867} {"Full-finetune/Learning Rate": 1.681443844950634e-05, "Full-finetune/Loss": 0.8155482411384583, "Full-finetune/Loss (Raw)": 0.6068709492683411, "Full-finetune/Step": 1473, "Full-finetune/Step Time": 6.836863521486521} {"Full-finetune/Learning Rate": 1.6809877859867557e-05, "Full-finetune/Loss": 0.8168237209320068, "Full-finetune/Loss (Raw)": 1.0402371883392334, "Full-finetune/Step": 1474, "Full-finetune/Step Time": 6.831585155799985} {"Full-finetune/Learning Rate": 1.680531462744813e-05, "Full-finetune/Loss": 0.8147674202919006, "Full-finetune/Loss (Raw)": 0.6904001832008362, "Full-finetune/Step": 1475, "Full-finetune/Step Time": 6.82432508841157} {"Full-finetune/Learning Rate": 1.680074875401896e-05, "Full-finetune/Loss": 0.8186644315719604, "Full-finetune/Loss (Raw)": 0.9238943457603455, "Full-finetune/Step": 1476, "Full-finetune/Step Time": 6.808810703456402} {"Full-finetune/Learning Rate": 1.679618024135197e-05, "Full-finetune/Loss": 0.8136534690856934, "Full-finetune/Loss (Raw)": 0.305510550737381, "Full-finetune/Step": 1477, "Full-finetune/Step Time": 6.832687301561236} {"Full-finetune/Learning Rate": 1.679160909122011e-05, "Full-finetune/Loss": 0.8146504759788513, "Full-finetune/Loss (Raw)": 1.029559850692749, "Full-finetune/Step": 1478, "Full-finetune/Step Time": 6.825182590633631} {"Full-finetune/Learning Rate": 1.6787035305397363e-05, "Full-finetune/Loss": 0.8134838342666626, "Full-finetune/Loss (Raw)": 0.7647175192832947, "Full-finetune/Step": 1479, "Full-finetune/Step Time": 6.839540412649512} {"Full-finetune/Learning Rate": 1.6782458885658716e-05, "Full-finetune/Loss": 0.8170462846755981, "Full-finetune/Loss (Raw)": 0.8754153251647949, "Full-finetune/Step": 1480, "Full-finetune/Step Time": 6.82142323628068} {"Full-finetune/Learning Rate": 1.6777879833780192e-05, "Full-finetune/Loss": 0.8174804449081421, "Full-finetune/Loss (Raw)": 0.9069494009017944, "Full-finetune/Step": 1481, "Full-finetune/Step Time": 6.837478131055832} {"Full-finetune/Learning Rate": 1.677329815153883e-05, "Full-finetune/Loss": 0.8171445727348328, "Full-finetune/Loss (Raw)": 0.8205522894859314, "Full-finetune/Step": 1482, "Full-finetune/Step Time": 6.829652706161141} {"Full-finetune/Learning Rate": 1.6768713840712692e-05, "Full-finetune/Loss": 0.8139824867248535, "Full-finetune/Loss (Raw)": 0.6008588075637817, "Full-finetune/Step": 1483, "Full-finetune/Step Time": 6.8546135146170855} {"Full-finetune/Learning Rate": 1.6764126903080865e-05, "Full-finetune/Loss": 0.813213586807251, "Full-finetune/Loss (Raw)": 0.9071895480155945, "Full-finetune/Step": 1484, "Full-finetune/Step Time": 6.850877992808819} {"Full-finetune/Learning Rate": 1.675953734042344e-05, "Full-finetune/Loss": 0.8126068711280823, "Full-finetune/Loss (Raw)": 0.7912790179252625, "Full-finetune/Step": 1485, "Full-finetune/Step Time": 6.839572258293629} {"Full-finetune/Learning Rate": 1.6754945154521548e-05, "Full-finetune/Loss": 0.8078000545501709, "Full-finetune/Loss (Raw)": 0.29724791646003723, "Full-finetune/Step": 1486, "Full-finetune/Step Time": 6.857727359980345} {"Full-finetune/Learning Rate": 1.6750350347157315e-05, "Full-finetune/Loss": 0.8094834685325623, "Full-finetune/Loss (Raw)": 1.0114480257034302, "Full-finetune/Step": 1487, "Full-finetune/Step Time": 6.862988019362092} {"Full-finetune/Learning Rate": 1.6745752920113907e-05, "Full-finetune/Loss": 0.8108758330345154, "Full-finetune/Loss (Raw)": 1.114406704902649, "Full-finetune/Step": 1488, "Full-finetune/Step Time": 6.8611375112086535} {"Full-finetune/Learning Rate": 1.6741152875175485e-05, "Full-finetune/Loss": 0.8081943988800049, "Full-finetune/Loss (Raw)": 0.6520612835884094, "Full-finetune/Step": 1489, "Full-finetune/Step Time": 6.874312225729227} {"Full-finetune/Learning Rate": 1.6736550214127247e-05, "Full-finetune/Loss": 0.8074836730957031, "Full-finetune/Loss (Raw)": 0.7773690819740295, "Full-finetune/Step": 1490, "Full-finetune/Step Time": 6.894558181986213} {"Full-finetune/Learning Rate": 1.673194493875539e-05, "Full-finetune/Loss": 0.8065679669380188, "Full-finetune/Loss (Raw)": 0.7175125479698181, "Full-finetune/Step": 1491, "Full-finetune/Step Time": 6.9075781889259815} {"Full-finetune/Learning Rate": 1.672733705084713e-05, "Full-finetune/Loss": 0.8076649308204651, "Full-finetune/Loss (Raw)": 0.9430374503135681, "Full-finetune/Step": 1492, "Full-finetune/Step Time": 6.878645172342658} {"Full-finetune/Learning Rate": 1.67227265521907e-05, "Full-finetune/Loss": 0.804190993309021, "Full-finetune/Loss (Raw)": 0.3243117034435272, "Full-finetune/Step": 1493, "Full-finetune/Step Time": 6.881566798314452} {"Full-finetune/Learning Rate": 1.671811344457535e-05, "Full-finetune/Loss": 0.8038550615310669, "Full-finetune/Loss (Raw)": 0.835438072681427, "Full-finetune/Step": 1494, "Full-finetune/Step Time": 6.895518466830254} {"Full-finetune/Learning Rate": 1.671349772979133e-05, "Full-finetune/Loss": 0.8043449521064758, "Full-finetune/Loss (Raw)": 0.8632182478904724, "Full-finetune/Step": 1495, "Full-finetune/Step Time": 6.880073262378573} {"Full-finetune/Learning Rate": 1.6708879409629908e-05, "Full-finetune/Loss": 0.8044942617416382, "Full-finetune/Loss (Raw)": 0.9014681577682495, "Full-finetune/Step": 1496, "Full-finetune/Step Time": 6.879673346877098} {"Full-finetune/Learning Rate": 1.670425848588337e-05, "Full-finetune/Loss": 0.8028925657272339, "Full-finetune/Loss (Raw)": 0.7704446911811829, "Full-finetune/Step": 1497, "Full-finetune/Step Time": 6.873285768553615} {"Full-finetune/Learning Rate": 1.6699634960345005e-05, "Full-finetune/Loss": 0.8046284914016724, "Full-finetune/Loss (Raw)": 0.9805170297622681, "Full-finetune/Step": 1498, "Full-finetune/Step Time": 6.876267232000828} {"Full-finetune/Learning Rate": 1.6695008834809107e-05, "Full-finetune/Loss": 0.8009626269340515, "Full-finetune/Loss (Raw)": 0.4247575104236603, "Full-finetune/Step": 1499, "Full-finetune/Step Time": 6.888448927551508} {"Full-finetune/Learning Rate": 1.669038011107099e-05, "Full-finetune/Loss": 0.8008109331130981, "Full-finetune/Loss (Raw)": 0.3544946610927582, "Full-finetune/Step": 1500, "Full-finetune/Step Time": 6.877691036090255} {"Full-finetune/Learning Rate": 1.6685748790926975e-05, "Full-finetune/Loss": 0.8008906841278076, "Full-finetune/Loss (Raw)": 0.9822380542755127, "Full-finetune/Step": 1501, "Full-finetune/Step Time": 6.909127967432141} {"Full-finetune/Learning Rate": 1.6681114876174377e-05, "Full-finetune/Loss": 0.8024499416351318, "Full-finetune/Loss (Raw)": 0.9483294486999512, "Full-finetune/Step": 1502, "Full-finetune/Step Time": 6.901724962517619} {"Full-finetune/Learning Rate": 1.6676478368611536e-05, "Full-finetune/Loss": 0.8008497953414917, "Full-finetune/Loss (Raw)": 0.7362903356552124, "Full-finetune/Step": 1503, "Full-finetune/Step Time": 6.9033868461847305} {"Full-finetune/Learning Rate": 1.667183927003779e-05, "Full-finetune/Loss": 0.8052880167961121, "Full-finetune/Loss (Raw)": 0.8827061057090759, "Full-finetune/Step": 1504, "Full-finetune/Step Time": 6.896979568526149} {"Full-finetune/Learning Rate": 1.6667197582253474e-05, "Full-finetune/Loss": 0.8055427074432373, "Full-finetune/Loss (Raw)": 0.8652452826499939, "Full-finetune/Step": 1505, "Full-finetune/Step Time": 6.881966447457671} {"Full-finetune/Learning Rate": 1.6662553307059947e-05, "Full-finetune/Loss": 0.8042721152305603, "Full-finetune/Loss (Raw)": 0.7940557599067688, "Full-finetune/Step": 1506, "Full-finetune/Step Time": 6.871047468855977} {"Full-finetune/Learning Rate": 1.6657906446259554e-05, "Full-finetune/Loss": 0.8069834113121033, "Full-finetune/Loss (Raw)": 0.9411119222640991, "Full-finetune/Step": 1507, "Full-finetune/Step Time": 6.839188067242503} {"Full-finetune/Learning Rate": 1.6653257001655652e-05, "Full-finetune/Loss": 0.8078458309173584, "Full-finetune/Loss (Raw)": 0.9591659903526306, "Full-finetune/Step": 1508, "Full-finetune/Step Time": 6.843137547373772} {"Full-finetune/Learning Rate": 1.664860497505261e-05, "Full-finetune/Loss": 0.8074198961257935, "Full-finetune/Loss (Raw)": 0.870301365852356, "Full-finetune/Step": 1509, "Full-finetune/Step Time": 6.8368606846779585} {"Full-finetune/Learning Rate": 1.664395036825577e-05, "Full-finetune/Loss": 0.8080369234085083, "Full-finetune/Loss (Raw)": 0.9454975128173828, "Full-finetune/Step": 1510, "Full-finetune/Step Time": 6.835461487993598} {"Full-finetune/Learning Rate": 1.6639293183071514e-05, "Full-finetune/Loss": 0.809674859046936, "Full-finetune/Loss (Raw)": 0.9610018730163574, "Full-finetune/Step": 1511, "Full-finetune/Step Time": 6.834654530510306} {"Full-finetune/Learning Rate": 1.6634633421307187e-05, "Full-finetune/Loss": 0.8089036345481873, "Full-finetune/Loss (Raw)": 0.7637626528739929, "Full-finetune/Step": 1512, "Full-finetune/Step Time": 6.838231241330504} {"Full-finetune/Learning Rate": 1.6629971084771165e-05, "Full-finetune/Loss": 0.8092113733291626, "Full-finetune/Loss (Raw)": 0.9849696755409241, "Full-finetune/Step": 1513, "Full-finetune/Step Time": 6.840113094076514} {"Full-finetune/Learning Rate": 1.66253061752728e-05, "Full-finetune/Loss": 0.8088704347610474, "Full-finetune/Loss (Raw)": 0.8051928877830505, "Full-finetune/Step": 1514, "Full-finetune/Step Time": 6.85909777879715} {"Full-finetune/Learning Rate": 1.662063869462246e-05, "Full-finetune/Loss": 0.8099356889724731, "Full-finetune/Loss (Raw)": 0.8812685608863831, "Full-finetune/Step": 1515, "Full-finetune/Step Time": 6.856592835858464} {"Full-finetune/Learning Rate": 1.6615968644631498e-05, "Full-finetune/Loss": 0.8095836043357849, "Full-finetune/Loss (Raw)": 0.8903762698173523, "Full-finetune/Step": 1516, "Full-finetune/Step Time": 6.859549345448613} {"Full-finetune/Learning Rate": 1.661129602711227e-05, "Full-finetune/Loss": 0.8088717460632324, "Full-finetune/Loss (Raw)": 0.7848289012908936, "Full-finetune/Step": 1517, "Full-finetune/Step Time": 6.859968610107899} {"Full-finetune/Learning Rate": 1.6606620843878128e-05, "Full-finetune/Loss": 0.808434784412384, "Full-finetune/Loss (Raw)": 0.9858236908912659, "Full-finetune/Step": 1518, "Full-finetune/Step Time": 6.853420324623585} {"Full-finetune/Learning Rate": 1.6601943096743426e-05, "Full-finetune/Loss": 0.8075399398803711, "Full-finetune/Loss (Raw)": 0.7069498896598816, "Full-finetune/Step": 1519, "Full-finetune/Step Time": 6.838899202644825} {"Full-finetune/Learning Rate": 1.6597262787523493e-05, "Full-finetune/Loss": 0.8042057752609253, "Full-finetune/Loss (Raw)": 0.3966839611530304, "Full-finetune/Step": 1520, "Full-finetune/Step Time": 6.822137011215091} {"Full-finetune/Learning Rate": 1.6592579918034678e-05, "Full-finetune/Loss": 0.80523681640625, "Full-finetune/Loss (Raw)": 0.8979673385620117, "Full-finetune/Step": 1521, "Full-finetune/Step Time": 6.7847619745880365} {"Full-finetune/Learning Rate": 1.65878944900943e-05, "Full-finetune/Loss": 0.8037389516830444, "Full-finetune/Loss (Raw)": 0.753155529499054, "Full-finetune/Step": 1522, "Full-finetune/Step Time": 6.795866660773754} {"Full-finetune/Learning Rate": 1.6583206505520695e-05, "Full-finetune/Loss": 0.8023713827133179, "Full-finetune/Loss (Raw)": 0.6488243937492371, "Full-finetune/Step": 1523, "Full-finetune/Step Time": 6.809661250561476} {"Full-finetune/Learning Rate": 1.6578515966133167e-05, "Full-finetune/Loss": 0.8031477332115173, "Full-finetune/Loss (Raw)": 0.719397783279419, "Full-finetune/Step": 1524, "Full-finetune/Step Time": 6.827204765751958} {"Full-finetune/Learning Rate": 1.6573822873752026e-05, "Full-finetune/Loss": 0.8018335700035095, "Full-finetune/Loss (Raw)": 0.7069361805915833, "Full-finetune/Step": 1525, "Full-finetune/Step Time": 6.8151556476950645} {"Full-finetune/Learning Rate": 1.6569127230198575e-05, "Full-finetune/Loss": 0.8025264143943787, "Full-finetune/Loss (Raw)": 0.9554897546768188, "Full-finetune/Step": 1526, "Full-finetune/Step Time": 6.8146112114191055} {"Full-finetune/Learning Rate": 1.6564429037295097e-05, "Full-finetune/Loss": 0.8043246269226074, "Full-finetune/Loss (Raw)": 0.8400503993034363, "Full-finetune/Step": 1527, "Full-finetune/Step Time": 6.799088958650827} {"Full-finetune/Learning Rate": 1.6559728296864868e-05, "Full-finetune/Loss": 0.800389289855957, "Full-finetune/Loss (Raw)": 0.42054861783981323, "Full-finetune/Step": 1528, "Full-finetune/Step Time": 6.8116962388157845} {"Full-finetune/Learning Rate": 1.6555025010732156e-05, "Full-finetune/Loss": 0.8016995191574097, "Full-finetune/Loss (Raw)": 0.9805953502655029, "Full-finetune/Step": 1529, "Full-finetune/Step Time": 6.803136562928557} {"Full-finetune/Learning Rate": 1.6550319180722213e-05, "Full-finetune/Loss": 0.8033514022827148, "Full-finetune/Loss (Raw)": 0.5888457894325256, "Full-finetune/Step": 1530, "Full-finetune/Step Time": 6.803476678207517} {"Full-finetune/Learning Rate": 1.6545610808661278e-05, "Full-finetune/Loss": 0.8040995597839355, "Full-finetune/Loss (Raw)": 0.9143043756484985, "Full-finetune/Step": 1531, "Full-finetune/Step Time": 6.80717764981091} {"Full-finetune/Learning Rate": 1.654089989637658e-05, "Full-finetune/Loss": 0.8039831519126892, "Full-finetune/Loss (Raw)": 0.8719738721847534, "Full-finetune/Step": 1532, "Full-finetune/Step Time": 6.815724456682801} {"Full-finetune/Learning Rate": 1.6536186445696337e-05, "Full-finetune/Loss": 0.8038793206214905, "Full-finetune/Loss (Raw)": 0.6787768602371216, "Full-finetune/Step": 1533, "Full-finetune/Step Time": 6.8092825673520565} {"Full-finetune/Learning Rate": 1.653147045844974e-05, "Full-finetune/Loss": 0.8026973009109497, "Full-finetune/Loss (Raw)": 0.6966779232025146, "Full-finetune/Step": 1534, "Full-finetune/Step Time": 6.8170051127672195} {"Full-finetune/Learning Rate": 1.6526751936466974e-05, "Full-finetune/Loss": 0.806174099445343, "Full-finetune/Loss (Raw)": 0.8148103952407837, "Full-finetune/Step": 1535, "Full-finetune/Step Time": 6.800531594082713} {"Full-finetune/Learning Rate": 1.6522030881579207e-05, "Full-finetune/Loss": 0.806693971157074, "Full-finetune/Loss (Raw)": 0.7937195301055908, "Full-finetune/Step": 1536, "Full-finetune/Step Time": 6.806766726076603} {"Full-finetune/Learning Rate": 1.6517307295618582e-05, "Full-finetune/Loss": 0.8060245513916016, "Full-finetune/Loss (Raw)": 0.827578604221344, "Full-finetune/Step": 1537, "Full-finetune/Step Time": 6.807197917252779} {"Full-finetune/Learning Rate": 1.6512581180418245e-05, "Full-finetune/Loss": 0.80341637134552, "Full-finetune/Loss (Raw)": 0.43179357051849365, "Full-finetune/Step": 1538, "Full-finetune/Step Time": 6.795712420716882} {"Full-finetune/Learning Rate": 1.650785253781229e-05, "Full-finetune/Loss": 0.8034970164299011, "Full-finetune/Loss (Raw)": 0.8761317729949951, "Full-finetune/Step": 1539, "Full-finetune/Step Time": 6.797276010736823} {"Full-finetune/Learning Rate": 1.6503121369635822e-05, "Full-finetune/Loss": 0.8049050569534302, "Full-finetune/Loss (Raw)": 0.8404554128646851, "Full-finetune/Step": 1540, "Full-finetune/Step Time": 6.797205934301019} {"Full-finetune/Learning Rate": 1.6498387677724917e-05, "Full-finetune/Loss": 0.8052237033843994, "Full-finetune/Loss (Raw)": 0.9447728395462036, "Full-finetune/Step": 1541, "Full-finetune/Step Time": 6.798484344035387} {"Full-finetune/Learning Rate": 1.6493651463916622e-05, "Full-finetune/Loss": 0.8024790287017822, "Full-finetune/Loss (Raw)": 0.6629956364631653, "Full-finetune/Step": 1542, "Full-finetune/Step Time": 6.805698458105326} {"Full-finetune/Learning Rate": 1.6488912730048973e-05, "Full-finetune/Loss": 0.8018865585327148, "Full-finetune/Loss (Raw)": 0.7761964797973633, "Full-finetune/Step": 1543, "Full-finetune/Step Time": 6.812296245247126} {"Full-finetune/Learning Rate": 1.6484171477960978e-05, "Full-finetune/Loss": 0.8014013767242432, "Full-finetune/Loss (Raw)": 0.9014358520507812, "Full-finetune/Step": 1544, "Full-finetune/Step Time": 6.820561952888966} {"Full-finetune/Learning Rate": 1.6479427709492622e-05, "Full-finetune/Loss": 0.8011601567268372, "Full-finetune/Loss (Raw)": 0.8098248839378357, "Full-finetune/Step": 1545, "Full-finetune/Step Time": 6.823390448465943} {"Full-finetune/Learning Rate": 1.6474681426484878e-05, "Full-finetune/Loss": 0.8030531406402588, "Full-finetune/Loss (Raw)": 0.9612995386123657, "Full-finetune/Step": 1546, "Full-finetune/Step Time": 6.821751015260816} {"Full-finetune/Learning Rate": 1.6469932630779677e-05, "Full-finetune/Loss": 0.8039514422416687, "Full-finetune/Loss (Raw)": 0.8513922095298767, "Full-finetune/Step": 1547, "Full-finetune/Step Time": 6.826398465782404} {"Full-finetune/Learning Rate": 1.6465181324219937e-05, "Full-finetune/Loss": 0.8035480976104736, "Full-finetune/Loss (Raw)": 0.8518718481063843, "Full-finetune/Step": 1548, "Full-finetune/Step Time": 6.835723934695125} {"Full-finetune/Learning Rate": 1.6460427508649546e-05, "Full-finetune/Loss": 0.8002765774726868, "Full-finetune/Loss (Raw)": 0.401305228471756, "Full-finetune/Step": 1549, "Full-finetune/Step Time": 6.854342978447676} {"Full-finetune/Learning Rate": 1.6455671185913367e-05, "Full-finetune/Loss": 0.8012455105781555, "Full-finetune/Loss (Raw)": 0.9024667143821716, "Full-finetune/Step": 1550, "Full-finetune/Step Time": 6.852127885445952} {"Full-finetune/Learning Rate": 1.645091235785724e-05, "Full-finetune/Loss": 0.799795925617218, "Full-finetune/Loss (Raw)": 0.7648747563362122, "Full-finetune/Step": 1551, "Full-finetune/Step Time": 6.8462495766580105} {"Full-finetune/Learning Rate": 1.644615102632797e-05, "Full-finetune/Loss": 0.8008860349655151, "Full-finetune/Loss (Raw)": 0.9265745282173157, "Full-finetune/Step": 1552, "Full-finetune/Step Time": 6.857202399522066} {"Full-finetune/Learning Rate": 1.6441387193173337e-05, "Full-finetune/Loss": 0.8002723455429077, "Full-finetune/Loss (Raw)": 0.7812169790267944, "Full-finetune/Step": 1553, "Full-finetune/Step Time": 6.868352189660072} {"Full-finetune/Learning Rate": 1.6436620860242093e-05, "Full-finetune/Loss": 0.8000631332397461, "Full-finetune/Loss (Raw)": 0.7549924254417419, "Full-finetune/Step": 1554, "Full-finetune/Step Time": 6.848066098988056} {"Full-finetune/Learning Rate": 1.6431852029383955e-05, "Full-finetune/Loss": 0.8013466596603394, "Full-finetune/Loss (Raw)": 0.9186897277832031, "Full-finetune/Step": 1555, "Full-finetune/Step Time": 6.85028413310647} {"Full-finetune/Learning Rate": 1.6427080702449616e-05, "Full-finetune/Loss": 0.8010153770446777, "Full-finetune/Loss (Raw)": 0.7178446650505066, "Full-finetune/Step": 1556, "Full-finetune/Step Time": 6.856140181422234} {"Full-finetune/Learning Rate": 1.6422306881290734e-05, "Full-finetune/Loss": 0.8016594648361206, "Full-finetune/Loss (Raw)": 0.7921607494354248, "Full-finetune/Step": 1557, "Full-finetune/Step Time": 6.8552327789366245} {"Full-finetune/Learning Rate": 1.641753056775994e-05, "Full-finetune/Loss": 0.8019146919250488, "Full-finetune/Loss (Raw)": 0.8528249263763428, "Full-finetune/Step": 1558, "Full-finetune/Step Time": 6.834377491846681} {"Full-finetune/Learning Rate": 1.641275176371082e-05, "Full-finetune/Loss": 0.8045536279678345, "Full-finetune/Loss (Raw)": 1.0855238437652588, "Full-finetune/Step": 1559, "Full-finetune/Step Time": 6.825123887509108} {"Full-finetune/Learning Rate": 1.6407970470997943e-05, "Full-finetune/Loss": 0.8054889440536499, "Full-finetune/Loss (Raw)": 0.9069961309432983, "Full-finetune/Step": 1560, "Full-finetune/Step Time": 6.8301433455199} {"Full-finetune/Learning Rate": 1.6403186691476828e-05, "Full-finetune/Loss": 0.8048679828643799, "Full-finetune/Loss (Raw)": 0.8654243350028992, "Full-finetune/Step": 1561, "Full-finetune/Step Time": 6.827598553150892} {"Full-finetune/Learning Rate": 1.639840042700397e-05, "Full-finetune/Loss": 0.8089281320571899, "Full-finetune/Loss (Raw)": 0.893519401550293, "Full-finetune/Step": 1562, "Full-finetune/Step Time": 6.818110942840576} {"Full-finetune/Learning Rate": 1.6393611679436828e-05, "Full-finetune/Loss": 0.8079896569252014, "Full-finetune/Loss (Raw)": 0.7829146981239319, "Full-finetune/Step": 1563, "Full-finetune/Step Time": 6.836210366338491} {"Full-finetune/Learning Rate": 1.6388820450633813e-05, "Full-finetune/Loss": 0.8092018365859985, "Full-finetune/Loss (Raw)": 0.7750675082206726, "Full-finetune/Step": 1564, "Full-finetune/Step Time": 6.822315353900194} {"Full-finetune/Learning Rate": 1.6384026742454315e-05, "Full-finetune/Loss": 0.808131217956543, "Full-finetune/Loss (Raw)": 0.7421427369117737, "Full-finetune/Step": 1565, "Full-finetune/Step Time": 6.811035577207804} {"Full-finetune/Learning Rate": 1.6379230556758676e-05, "Full-finetune/Loss": 0.8072620630264282, "Full-finetune/Loss (Raw)": 0.7738958597183228, "Full-finetune/Step": 1566, "Full-finetune/Step Time": 6.818557031452656} {"Full-finetune/Learning Rate": 1.63744318954082e-05, "Full-finetune/Loss": 0.806403636932373, "Full-finetune/Loss (Raw)": 0.8401812314987183, "Full-finetune/Step": 1567, "Full-finetune/Step Time": 6.824154334142804} {"Full-finetune/Learning Rate": 1.636963076026516e-05, "Full-finetune/Loss": 0.8080350756645203, "Full-finetune/Loss (Raw)": 0.8305070400238037, "Full-finetune/Step": 1568, "Full-finetune/Step Time": 6.796521574258804} {"Full-finetune/Learning Rate": 1.6364827153192773e-05, "Full-finetune/Loss": 0.8068781495094299, "Full-finetune/Loss (Raw)": 0.7004402279853821, "Full-finetune/Step": 1569, "Full-finetune/Step Time": 6.808635110035539} {"Full-finetune/Learning Rate": 1.6360021076055234e-05, "Full-finetune/Loss": 0.8079482316970825, "Full-finetune/Loss (Raw)": 0.9569528698921204, "Full-finetune/Step": 1570, "Full-finetune/Step Time": 6.8063667099922895} {"Full-finetune/Learning Rate": 1.6355212530717683e-05, "Full-finetune/Loss": 0.8083927631378174, "Full-finetune/Loss (Raw)": 0.8886008858680725, "Full-finetune/Step": 1571, "Full-finetune/Step Time": 6.801906416192651} {"Full-finetune/Learning Rate": 1.6350401519046226e-05, "Full-finetune/Loss": 0.8094528913497925, "Full-finetune/Loss (Raw)": 0.9234256744384766, "Full-finetune/Step": 1572, "Full-finetune/Step Time": 6.796056292951107} {"Full-finetune/Learning Rate": 1.634558804290792e-05, "Full-finetune/Loss": 0.80922532081604, "Full-finetune/Loss (Raw)": 0.8229804635047913, "Full-finetune/Step": 1573, "Full-finetune/Step Time": 6.821675134822726} {"Full-finetune/Learning Rate": 1.634077210417078e-05, "Full-finetune/Loss": 0.8090329170227051, "Full-finetune/Loss (Raw)": 0.7118186354637146, "Full-finetune/Step": 1574, "Full-finetune/Step Time": 6.805144842714071} {"Full-finetune/Learning Rate": 1.633595370470378e-05, "Full-finetune/Loss": 0.809590756893158, "Full-finetune/Loss (Raw)": 0.9759902954101562, "Full-finetune/Step": 1575, "Full-finetune/Step Time": 6.814830930903554} {"Full-finetune/Learning Rate": 1.6331132846376843e-05, "Full-finetune/Loss": 0.8091578483581543, "Full-finetune/Loss (Raw)": 0.8536736369132996, "Full-finetune/Step": 1576, "Full-finetune/Step Time": 6.818345746025443} {"Full-finetune/Learning Rate": 1.632630953106086e-05, "Full-finetune/Loss": 0.8102097511291504, "Full-finetune/Loss (Raw)": 0.8729420304298401, "Full-finetune/Step": 1577, "Full-finetune/Step Time": 6.8091684356331825} {"Full-finetune/Learning Rate": 1.6321483760627658e-05, "Full-finetune/Loss": 0.8114526867866516, "Full-finetune/Loss (Raw)": 0.8881476521492004, "Full-finetune/Step": 1578, "Full-finetune/Step Time": 6.767211761325598} {"Full-finetune/Learning Rate": 1.6316655536950017e-05, "Full-finetune/Loss": 0.810828685760498, "Full-finetune/Loss (Raw)": 0.7596868276596069, "Full-finetune/Step": 1579, "Full-finetune/Step Time": 6.772950848564506} {"Full-finetune/Learning Rate": 1.6311824861901693e-05, "Full-finetune/Loss": 0.8089929223060608, "Full-finetune/Loss (Raw)": 0.6914979219436646, "Full-finetune/Step": 1580, "Full-finetune/Step Time": 6.807579163461924} {"Full-finetune/Learning Rate": 1.6306991737357366e-05, "Full-finetune/Loss": 0.8085269927978516, "Full-finetune/Loss (Raw)": 0.7309702634811401, "Full-finetune/Step": 1581, "Full-finetune/Step Time": 6.802316457033157} {"Full-finetune/Learning Rate": 1.630215616519268e-05, "Full-finetune/Loss": 0.8067747950553894, "Full-finetune/Loss (Raw)": 0.8322023153305054, "Full-finetune/Step": 1582, "Full-finetune/Step Time": 6.802563082426786} {"Full-finetune/Learning Rate": 1.6297318147284223e-05, "Full-finetune/Loss": 0.8063235282897949, "Full-finetune/Loss (Raw)": 0.8827140927314758, "Full-finetune/Step": 1583, "Full-finetune/Step Time": 6.805602999404073} {"Full-finetune/Learning Rate": 1.6292477685509538e-05, "Full-finetune/Loss": 0.8064735531806946, "Full-finetune/Loss (Raw)": 0.8343416452407837, "Full-finetune/Step": 1584, "Full-finetune/Step Time": 6.807182237505913} {"Full-finetune/Learning Rate": 1.6287634781747113e-05, "Full-finetune/Loss": 0.8109807968139648, "Full-finetune/Loss (Raw)": 0.945830762386322, "Full-finetune/Step": 1585, "Full-finetune/Step Time": 6.788588559255004} {"Full-finetune/Learning Rate": 1.628278943787639e-05, "Full-finetune/Loss": 0.8123762607574463, "Full-finetune/Loss (Raw)": 1.0436536073684692, "Full-finetune/Step": 1586, "Full-finetune/Step Time": 6.830439459532499} {"Full-finetune/Learning Rate": 1.6277941655777744e-05, "Full-finetune/Loss": 0.8120735883712769, "Full-finetune/Loss (Raw)": 0.954182505607605, "Full-finetune/Step": 1587, "Full-finetune/Step Time": 6.822926430031657} {"Full-finetune/Learning Rate": 1.6273091437332506e-05, "Full-finetune/Loss": 0.8107571601867676, "Full-finetune/Loss (Raw)": 0.8354842662811279, "Full-finetune/Step": 1588, "Full-finetune/Step Time": 6.833860559388995} {"Full-finetune/Learning Rate": 1.6268238784422954e-05, "Full-finetune/Loss": 0.8091408014297485, "Full-finetune/Loss (Raw)": 0.8460087776184082, "Full-finetune/Step": 1589, "Full-finetune/Step Time": 6.83867022767663} {"Full-finetune/Learning Rate": 1.6263383698932307e-05, "Full-finetune/Loss": 0.8093817234039307, "Full-finetune/Loss (Raw)": 0.9376601576805115, "Full-finetune/Step": 1590, "Full-finetune/Step Time": 6.843958644196391} {"Full-finetune/Learning Rate": 1.6258526182744727e-05, "Full-finetune/Loss": 0.8067240715026855, "Full-finetune/Loss (Raw)": 0.624226450920105, "Full-finetune/Step": 1591, "Full-finetune/Step Time": 6.85916443169117} {"Full-finetune/Learning Rate": 1.6253666237745326e-05, "Full-finetune/Loss": 0.8058538436889648, "Full-finetune/Loss (Raw)": 0.6989574432373047, "Full-finetune/Step": 1592, "Full-finetune/Step Time": 6.861403113231063} {"Full-finetune/Learning Rate": 1.6248803865820152e-05, "Full-finetune/Loss": 0.8052290081977844, "Full-finetune/Loss (Raw)": 0.7788735032081604, "Full-finetune/Step": 1593, "Full-finetune/Step Time": 6.864576559513807} {"Full-finetune/Learning Rate": 1.624393906885619e-05, "Full-finetune/Loss": 0.80503910779953, "Full-finetune/Loss (Raw)": 0.8351966142654419, "Full-finetune/Step": 1594, "Full-finetune/Step Time": 6.87012610770762} {"Full-finetune/Learning Rate": 1.6239071848741385e-05, "Full-finetune/Loss": 0.8039571046829224, "Full-finetune/Loss (Raw)": 0.7078863978385925, "Full-finetune/Step": 1595, "Full-finetune/Step Time": 6.848154982551932} {"Full-finetune/Learning Rate": 1.6234202207364596e-05, "Full-finetune/Loss": 0.8033815622329712, "Full-finetune/Loss (Raw)": 0.8408905863761902, "Full-finetune/Step": 1596, "Full-finetune/Step Time": 6.8530867751687765} {"Full-finetune/Learning Rate": 1.6229330146615646e-05, "Full-finetune/Loss": 0.8061702251434326, "Full-finetune/Loss (Raw)": 0.7331237196922302, "Full-finetune/Step": 1597, "Full-finetune/Step Time": 6.831814700737596} {"Full-finetune/Learning Rate": 1.6224455668385283e-05, "Full-finetune/Loss": 0.8062914609909058, "Full-finetune/Loss (Raw)": 0.8241151571273804, "Full-finetune/Step": 1598, "Full-finetune/Step Time": 6.855188600718975} {"Full-finetune/Learning Rate": 1.62195787745652e-05, "Full-finetune/Loss": 0.8025361895561218, "Full-finetune/Loss (Raw)": 0.37448394298553467, "Full-finetune/Step": 1599, "Full-finetune/Step Time": 6.874976569786668} {"Full-finetune/Learning Rate": 1.6214699467048017e-05, "Full-finetune/Loss": 0.803563117980957, "Full-finetune/Loss (Raw)": 0.9052040576934814, "Full-finetune/Step": 1600, "Full-finetune/Step Time": 6.878779411315918} {"Full-finetune/Learning Rate": 1.6209817747727304e-05, "Full-finetune/Loss": 0.8018605709075928, "Full-finetune/Loss (Raw)": 0.3889394998550415, "Full-finetune/Step": 1601, "Full-finetune/Step Time": 6.891151558607817} {"Full-finetune/Learning Rate": 1.620493361849756e-05, "Full-finetune/Loss": 0.8014079332351685, "Full-finetune/Loss (Raw)": 0.9823137521743774, "Full-finetune/Step": 1602, "Full-finetune/Step Time": 6.900748046115041} {"Full-finetune/Learning Rate": 1.6200047081254223e-05, "Full-finetune/Loss": 0.8032875657081604, "Full-finetune/Loss (Raw)": 0.93098384141922, "Full-finetune/Step": 1603, "Full-finetune/Step Time": 6.905749993398786} {"Full-finetune/Learning Rate": 1.6195158137893656e-05, "Full-finetune/Loss": 0.8024412989616394, "Full-finetune/Loss (Raw)": 0.8155720233917236, "Full-finetune/Step": 1604, "Full-finetune/Step Time": 6.915937826037407} {"Full-finetune/Learning Rate": 1.6190266790313165e-05, "Full-finetune/Loss": 0.8051925301551819, "Full-finetune/Loss (Raw)": 0.6576708555221558, "Full-finetune/Step": 1605, "Full-finetune/Step Time": 6.915569677948952} {"Full-finetune/Learning Rate": 1.618537304041099e-05, "Full-finetune/Loss": 0.8021180629730225, "Full-finetune/Loss (Raw)": 0.636035144329071, "Full-finetune/Step": 1606, "Full-finetune/Step Time": 6.9456913359463215} {"Full-finetune/Learning Rate": 1.6180476890086297e-05, "Full-finetune/Loss": 0.8026787042617798, "Full-finetune/Loss (Raw)": 0.8364666700363159, "Full-finetune/Step": 1607, "Full-finetune/Step Time": 6.932565879076719} {"Full-finetune/Learning Rate": 1.6175578341239188e-05, "Full-finetune/Loss": 0.7988379001617432, "Full-finetune/Loss (Raw)": 0.3837980031967163, "Full-finetune/Step": 1608, "Full-finetune/Step Time": 6.950646733865142} {"Full-finetune/Learning Rate": 1.617067739577069e-05, "Full-finetune/Loss": 0.7986531853675842, "Full-finetune/Loss (Raw)": 0.8833040595054626, "Full-finetune/Step": 1609, "Full-finetune/Step Time": 6.934842539951205} {"Full-finetune/Learning Rate": 1.616577405558277e-05, "Full-finetune/Loss": 0.7990433573722839, "Full-finetune/Loss (Raw)": 0.8704981803894043, "Full-finetune/Step": 1610, "Full-finetune/Step Time": 6.935695184394717} {"Full-finetune/Learning Rate": 1.616086832257831e-05, "Full-finetune/Loss": 0.8001888990402222, "Full-finetune/Loss (Raw)": 0.7474890947341919, "Full-finetune/Step": 1611, "Full-finetune/Step Time": 6.926809960976243} {"Full-finetune/Learning Rate": 1.615596019866114e-05, "Full-finetune/Loss": 0.7994368672370911, "Full-finetune/Loss (Raw)": 0.810925304889679, "Full-finetune/Step": 1612, "Full-finetune/Step Time": 6.929341996088624} {"Full-finetune/Learning Rate": 1.6151049685736e-05, "Full-finetune/Loss": 0.798995852470398, "Full-finetune/Loss (Raw)": 0.7348271608352661, "Full-finetune/Step": 1613, "Full-finetune/Step Time": 6.940089371055365} {"Full-finetune/Learning Rate": 1.6146136785708564e-05, "Full-finetune/Loss": 0.8036901950836182, "Full-finetune/Loss (Raw)": 0.8981223106384277, "Full-finetune/Step": 1614, "Full-finetune/Step Time": 6.920248007401824} {"Full-finetune/Learning Rate": 1.6141221500485437e-05, "Full-finetune/Loss": 0.8032029867172241, "Full-finetune/Loss (Raw)": 0.9490832686424255, "Full-finetune/Step": 1615, "Full-finetune/Step Time": 6.903089612722397} {"Full-finetune/Learning Rate": 1.6136303831974146e-05, "Full-finetune/Loss": 0.8012086153030396, "Full-finetune/Loss (Raw)": 0.8591357469558716, "Full-finetune/Step": 1616, "Full-finetune/Step Time": 6.901709843426943} {"Full-finetune/Learning Rate": 1.6131383782083135e-05, "Full-finetune/Loss": 0.802428662776947, "Full-finetune/Loss (Raw)": 0.8082212209701538, "Full-finetune/Step": 1617, "Full-finetune/Step Time": 6.898481231182814} {"Full-finetune/Learning Rate": 1.6126461352721784e-05, "Full-finetune/Loss": 0.8028533458709717, "Full-finetune/Loss (Raw)": 0.8317286372184753, "Full-finetune/Step": 1618, "Full-finetune/Step Time": 6.8779616840183735} {"Full-finetune/Learning Rate": 1.612153654580039e-05, "Full-finetune/Loss": 0.8031707406044006, "Full-finetune/Loss (Raw)": 0.7581424117088318, "Full-finetune/Step": 1619, "Full-finetune/Step Time": 6.867741405963898} {"Full-finetune/Learning Rate": 1.6116609363230176e-05, "Full-finetune/Loss": 0.8043279051780701, "Full-finetune/Loss (Raw)": 1.0911548137664795, "Full-finetune/Step": 1620, "Full-finetune/Step Time": 6.8699493277817965} {"Full-finetune/Learning Rate": 1.6111679806923287e-05, "Full-finetune/Loss": 0.8078716397285461, "Full-finetune/Loss (Raw)": 0.7779130935668945, "Full-finetune/Step": 1621, "Full-finetune/Step Time": 6.857225539162755} {"Full-finetune/Learning Rate": 1.6106747878792784e-05, "Full-finetune/Loss": 0.8088991641998291, "Full-finetune/Loss (Raw)": 0.9669556021690369, "Full-finetune/Step": 1622, "Full-finetune/Step Time": 6.844899006187916} {"Full-finetune/Learning Rate": 1.610181358075265e-05, "Full-finetune/Loss": 0.810564398765564, "Full-finetune/Loss (Raw)": 1.0763736963272095, "Full-finetune/Step": 1623, "Full-finetune/Step Time": 6.839780984446406} {"Full-finetune/Learning Rate": 1.60968769147178e-05, "Full-finetune/Loss": 0.8103511333465576, "Full-finetune/Loss (Raw)": 0.8741627335548401, "Full-finetune/Step": 1624, "Full-finetune/Step Time": 6.841248041018844} {"Full-finetune/Learning Rate": 1.6091937882604047e-05, "Full-finetune/Loss": 0.8112069368362427, "Full-finetune/Loss (Raw)": 0.8799915909767151, "Full-finetune/Step": 1625, "Full-finetune/Step Time": 6.841047957539558} {"Full-finetune/Learning Rate": 1.608699648632814e-05, "Full-finetune/Loss": 0.8105543255805969, "Full-finetune/Loss (Raw)": 0.896980345249176, "Full-finetune/Step": 1626, "Full-finetune/Step Time": 6.831853536888957} {"Full-finetune/Learning Rate": 1.6082052727807732e-05, "Full-finetune/Loss": 0.8146284222602844, "Full-finetune/Loss (Raw)": 0.9462463855743408, "Full-finetune/Step": 1627, "Full-finetune/Step Time": 6.810554519295692} {"Full-finetune/Learning Rate": 1.60771066089614e-05, "Full-finetune/Loss": 0.8184344172477722, "Full-finetune/Loss (Raw)": 0.8416637778282166, "Full-finetune/Step": 1628, "Full-finetune/Step Time": 6.801400739699602} {"Full-finetune/Learning Rate": 1.6072158131708643e-05, "Full-finetune/Loss": 0.8168257474899292, "Full-finetune/Loss (Raw)": 0.7763253450393677, "Full-finetune/Step": 1629, "Full-finetune/Step Time": 6.772924982011318} {"Full-finetune/Learning Rate": 1.6067207297969864e-05, "Full-finetune/Loss": 0.8162188529968262, "Full-finetune/Loss (Raw)": 0.8706396818161011, "Full-finetune/Step": 1630, "Full-finetune/Step Time": 6.769978288561106} {"Full-finetune/Learning Rate": 1.6062254109666383e-05, "Full-finetune/Loss": 0.8171350955963135, "Full-finetune/Loss (Raw)": 0.8535764813423157, "Full-finetune/Step": 1631, "Full-finetune/Step Time": 6.773108936846256} {"Full-finetune/Learning Rate": 1.6057298568720436e-05, "Full-finetune/Loss": 0.8167564868927002, "Full-finetune/Loss (Raw)": 0.834243655204773, "Full-finetune/Step": 1632, "Full-finetune/Step Time": 6.763207858428359} {"Full-finetune/Learning Rate": 1.6052340677055175e-05, "Full-finetune/Loss": 0.8160886764526367, "Full-finetune/Loss (Raw)": 0.779758632183075, "Full-finetune/Step": 1633, "Full-finetune/Step Time": 6.764473112300038} {"Full-finetune/Learning Rate": 1.6047380436594663e-05, "Full-finetune/Loss": 0.8167054057121277, "Full-finetune/Loss (Raw)": 0.8730027675628662, "Full-finetune/Step": 1634, "Full-finetune/Step Time": 6.756681703031063} {"Full-finetune/Learning Rate": 1.6042417849263863e-05, "Full-finetune/Loss": 0.8156057596206665, "Full-finetune/Loss (Raw)": 0.8003564476966858, "Full-finetune/Step": 1635, "Full-finetune/Step Time": 6.77836905233562} {"Full-finetune/Learning Rate": 1.6037452916988665e-05, "Full-finetune/Loss": 0.8150854110717773, "Full-finetune/Loss (Raw)": 0.892564058303833, "Full-finetune/Step": 1636, "Full-finetune/Step Time": 6.774928115308285} {"Full-finetune/Learning Rate": 1.6032485641695862e-05, "Full-finetune/Loss": 0.8144218921661377, "Full-finetune/Loss (Raw)": 0.7853723168373108, "Full-finetune/Step": 1637, "Full-finetune/Step Time": 6.776218870654702} {"Full-finetune/Learning Rate": 1.602751602531316e-05, "Full-finetune/Loss": 0.8132722973823547, "Full-finetune/Loss (Raw)": 0.7983489036560059, "Full-finetune/Step": 1638, "Full-finetune/Step Time": 6.777870262041688} {"Full-finetune/Learning Rate": 1.602254406976916e-05, "Full-finetune/Loss": 0.8115242719650269, "Full-finetune/Loss (Raw)": 0.737259566783905, "Full-finetune/Step": 1639, "Full-finetune/Step Time": 6.774624690413475} {"Full-finetune/Learning Rate": 1.6017569776993388e-05, "Full-finetune/Loss": 0.8130413293838501, "Full-finetune/Loss (Raw)": 0.9579402804374695, "Full-finetune/Step": 1640, "Full-finetune/Step Time": 6.763271450996399} {"Full-finetune/Learning Rate": 1.601259314891627e-05, "Full-finetune/Loss": 0.81254643201828, "Full-finetune/Loss (Raw)": 0.9216246008872986, "Full-finetune/Step": 1641, "Full-finetune/Step Time": 6.760463338345289} {"Full-finetune/Learning Rate": 1.6007614187469137e-05, "Full-finetune/Loss": 0.8128973245620728, "Full-finetune/Loss (Raw)": 0.8501006364822388, "Full-finetune/Step": 1642, "Full-finetune/Step Time": 6.7397282887250185} {"Full-finetune/Learning Rate": 1.6002632894584227e-05, "Full-finetune/Loss": 0.8137123584747314, "Full-finetune/Loss (Raw)": 0.9855945706367493, "Full-finetune/Step": 1643, "Full-finetune/Step Time": 6.740506935864687} {"Full-finetune/Learning Rate": 1.599764927219468e-05, "Full-finetune/Loss": 0.8130457997322083, "Full-finetune/Loss (Raw)": 0.8050629496574402, "Full-finetune/Step": 1644, "Full-finetune/Step Time": 6.7644950821995735} {"Full-finetune/Learning Rate": 1.5992663322234548e-05, "Full-finetune/Loss": 0.813581645488739, "Full-finetune/Loss (Raw)": 0.853411853313446, "Full-finetune/Step": 1645, "Full-finetune/Step Time": 6.766094675287604} {"Full-finetune/Learning Rate": 1.5987675046638777e-05, "Full-finetune/Loss": 0.813073992729187, "Full-finetune/Loss (Raw)": 0.9208404421806335, "Full-finetune/Step": 1646, "Full-finetune/Step Time": 6.768953198567033} {"Full-finetune/Learning Rate": 1.5982684447343214e-05, "Full-finetune/Loss": 0.8136115074157715, "Full-finetune/Loss (Raw)": 0.7757523059844971, "Full-finetune/Step": 1647, "Full-finetune/Step Time": 6.780553407967091} {"Full-finetune/Learning Rate": 1.5977691526284623e-05, "Full-finetune/Loss": 0.8177875280380249, "Full-finetune/Loss (Raw)": 0.9312248229980469, "Full-finetune/Step": 1648, "Full-finetune/Step Time": 6.767075967043638} {"Full-finetune/Learning Rate": 1.5972696285400656e-05, "Full-finetune/Loss": 0.8172784447669983, "Full-finetune/Loss (Raw)": 0.8327997326850891, "Full-finetune/Step": 1649, "Full-finetune/Step Time": 6.778842503204942} {"Full-finetune/Learning Rate": 1.596769872662987e-05, "Full-finetune/Loss": 0.8184253573417664, "Full-finetune/Loss (Raw)": 0.8999599814414978, "Full-finetune/Step": 1650, "Full-finetune/Step Time": 6.766535507515073} {"Full-finetune/Learning Rate": 1.5962698851911715e-05, "Full-finetune/Loss": 0.8192484974861145, "Full-finetune/Loss (Raw)": 0.7541905045509338, "Full-finetune/Step": 1651, "Full-finetune/Step Time": 6.7677893210202456} {"Full-finetune/Learning Rate": 1.5957696663186547e-05, "Full-finetune/Loss": 0.8199815154075623, "Full-finetune/Loss (Raw)": 0.813221275806427, "Full-finetune/Step": 1652, "Full-finetune/Step Time": 6.771869149059057} {"Full-finetune/Learning Rate": 1.595269216239562e-05, "Full-finetune/Loss": 0.8210064768791199, "Full-finetune/Loss (Raw)": 0.8381299376487732, "Full-finetune/Step": 1653, "Full-finetune/Step Time": 6.7626481633633375} {"Full-finetune/Learning Rate": 1.594768535148108e-05, "Full-finetune/Loss": 0.8205828666687012, "Full-finetune/Loss (Raw)": 0.9012700915336609, "Full-finetune/Step": 1654, "Full-finetune/Step Time": 6.774855559691787} {"Full-finetune/Learning Rate": 1.5942676232385973e-05, "Full-finetune/Loss": 0.8170419931411743, "Full-finetune/Loss (Raw)": 0.3868199586868286, "Full-finetune/Step": 1655, "Full-finetune/Step Time": 6.791980231180787} {"Full-finetune/Learning Rate": 1.5937664807054242e-05, "Full-finetune/Loss": 0.8206882476806641, "Full-finetune/Loss (Raw)": 0.8872659802436829, "Full-finetune/Step": 1656, "Full-finetune/Step Time": 6.77525064535439} {"Full-finetune/Learning Rate": 1.593265107743072e-05, "Full-finetune/Loss": 0.8193601369857788, "Full-finetune/Loss (Raw)": 0.8105974197387695, "Full-finetune/Step": 1657, "Full-finetune/Step Time": 6.773109782487154} {"Full-finetune/Learning Rate": 1.5927635045461145e-05, "Full-finetune/Loss": 0.8217124342918396, "Full-finetune/Loss (Raw)": 0.8899350762367249, "Full-finetune/Step": 1658, "Full-finetune/Step Time": 6.757065441459417} {"Full-finetune/Learning Rate": 1.5922616713092135e-05, "Full-finetune/Loss": 0.8207830190658569, "Full-finetune/Loss (Raw)": 0.7953402400016785, "Full-finetune/Step": 1659, "Full-finetune/Step Time": 6.756393771618605} {"Full-finetune/Learning Rate": 1.5917596082271206e-05, "Full-finetune/Loss": 0.8208551406860352, "Full-finetune/Loss (Raw)": 0.8812114596366882, "Full-finetune/Step": 1660, "Full-finetune/Step Time": 6.753867015242577} {"Full-finetune/Learning Rate": 1.5912573154946768e-05, "Full-finetune/Loss": 0.8220446109771729, "Full-finetune/Loss (Raw)": 0.8310293555259705, "Full-finetune/Step": 1661, "Full-finetune/Step Time": 6.748378936201334} {"Full-finetune/Learning Rate": 1.5907547933068125e-05, "Full-finetune/Loss": 0.8240087628364563, "Full-finetune/Loss (Raw)": 0.9480866193771362, "Full-finetune/Step": 1662, "Full-finetune/Step Time": 6.747311037033796} {"Full-finetune/Learning Rate": 1.590252041858546e-05, "Full-finetune/Loss": 0.8221887946128845, "Full-finetune/Loss (Raw)": 0.5818518996238708, "Full-finetune/Step": 1663, "Full-finetune/Step Time": 6.766680208966136} {"Full-finetune/Learning Rate": 1.5897490613449864e-05, "Full-finetune/Loss": 0.8214435577392578, "Full-finetune/Loss (Raw)": 0.6983305215835571, "Full-finetune/Step": 1664, "Full-finetune/Step Time": 6.758866894990206} {"Full-finetune/Learning Rate": 1.5892458519613296e-05, "Full-finetune/Loss": 0.8226833343505859, "Full-finetune/Loss (Raw)": 0.9862668514251709, "Full-finetune/Step": 1665, "Full-finetune/Step Time": 6.75826495885849} {"Full-finetune/Learning Rate": 1.588742413902862e-05, "Full-finetune/Loss": 0.8257977962493896, "Full-finetune/Loss (Raw)": 0.8304433822631836, "Full-finetune/Step": 1666, "Full-finetune/Step Time": 6.7344387993216515} {"Full-finetune/Learning Rate": 1.5882387473649572e-05, "Full-finetune/Loss": 0.8259336948394775, "Full-finetune/Loss (Raw)": 0.8935282230377197, "Full-finetune/Step": 1667, "Full-finetune/Step Time": 6.731380753219128} {"Full-finetune/Learning Rate": 1.5877348525430793e-05, "Full-finetune/Loss": 0.8267182111740112, "Full-finetune/Loss (Raw)": 0.9408829808235168, "Full-finetune/Step": 1668, "Full-finetune/Step Time": 6.735694047063589} {"Full-finetune/Learning Rate": 1.5872307296327795e-05, "Full-finetune/Loss": 0.8261525630950928, "Full-finetune/Loss (Raw)": 0.8723615407943726, "Full-finetune/Step": 1669, "Full-finetune/Step Time": 6.731661960482597} {"Full-finetune/Learning Rate": 1.5867263788296984e-05, "Full-finetune/Loss": 0.8282483816146851, "Full-finetune/Loss (Raw)": 0.9312642216682434, "Full-finetune/Step": 1670, "Full-finetune/Step Time": 6.718510998412967} {"Full-finetune/Learning Rate": 1.5862218003295647e-05, "Full-finetune/Loss": 0.8284077048301697, "Full-finetune/Loss (Raw)": 0.7965931296348572, "Full-finetune/Step": 1671, "Full-finetune/Step Time": 6.715584201738238} {"Full-finetune/Learning Rate": 1.5857169943281948e-05, "Full-finetune/Loss": 0.8281134366989136, "Full-finetune/Loss (Raw)": 0.8637627363204956, "Full-finetune/Step": 1672, "Full-finetune/Step Time": 6.722139308229089} {"Full-finetune/Learning Rate": 1.585211961021495e-05, "Full-finetune/Loss": 0.8274150490760803, "Full-finetune/Loss (Raw)": 0.7204346656799316, "Full-finetune/Step": 1673, "Full-finetune/Step Time": 6.727339567616582} {"Full-finetune/Learning Rate": 1.5847067006054584e-05, "Full-finetune/Loss": 0.824498176574707, "Full-finetune/Loss (Raw)": 0.5879344344139099, "Full-finetune/Step": 1674, "Full-finetune/Step Time": 6.734190737828612} {"Full-finetune/Learning Rate": 1.584201213276167e-05, "Full-finetune/Loss": 0.8232599496841431, "Full-finetune/Loss (Raw)": 0.692898690700531, "Full-finetune/Step": 1675, "Full-finetune/Step Time": 6.738473322242498} {"Full-finetune/Learning Rate": 1.5836954992297897e-05, "Full-finetune/Loss": 0.8237944841384888, "Full-finetune/Loss (Raw)": 0.9202988743782043, "Full-finetune/Step": 1676, "Full-finetune/Step Time": 6.733302995562553} {"Full-finetune/Learning Rate": 1.583189558662585e-05, "Full-finetune/Loss": 0.8281508088111877, "Full-finetune/Loss (Raw)": 0.9589166641235352, "Full-finetune/Step": 1677, "Full-finetune/Step Time": 6.713996071368456} {"Full-finetune/Learning Rate": 1.5826833917708983e-05, "Full-finetune/Loss": 0.827184796333313, "Full-finetune/Loss (Raw)": 0.7788205742835999, "Full-finetune/Step": 1678, "Full-finetune/Step Time": 6.711835300549865} {"Full-finetune/Learning Rate": 1.5821769987511634e-05, "Full-finetune/Loss": 0.824205219745636, "Full-finetune/Loss (Raw)": 0.3834800124168396, "Full-finetune/Step": 1679, "Full-finetune/Step Time": 6.7313609048724174} {"Full-finetune/Learning Rate": 1.5816703797999015e-05, "Full-finetune/Loss": 0.8236759901046753, "Full-finetune/Loss (Raw)": 0.8588332533836365, "Full-finetune/Step": 1680, "Full-finetune/Step Time": 6.728025179356337} {"Full-finetune/Learning Rate": 1.5811635351137212e-05, "Full-finetune/Loss": 0.8243837356567383, "Full-finetune/Loss (Raw)": 0.871804416179657, "Full-finetune/Step": 1681, "Full-finetune/Step Time": 6.710027486085892} {"Full-finetune/Learning Rate": 1.580656464889319e-05, "Full-finetune/Loss": 0.8264962434768677, "Full-finetune/Loss (Raw)": 1.0253936052322388, "Full-finetune/Step": 1682, "Full-finetune/Step Time": 6.713323414325714} {"Full-finetune/Learning Rate": 1.5801491693234793e-05, "Full-finetune/Loss": 0.8248169422149658, "Full-finetune/Loss (Raw)": 0.7037431597709656, "Full-finetune/Step": 1683, "Full-finetune/Step Time": 6.720860902220011} {"Full-finetune/Learning Rate": 1.5796416486130735e-05, "Full-finetune/Loss": 0.8256534337997437, "Full-finetune/Loss (Raw)": 0.8249126076698303, "Full-finetune/Step": 1684, "Full-finetune/Step Time": 6.712501794099808} {"Full-finetune/Learning Rate": 1.5791339029550604e-05, "Full-finetune/Loss": 0.8253222703933716, "Full-finetune/Loss (Raw)": 0.7497785687446594, "Full-finetune/Step": 1685, "Full-finetune/Step Time": 6.716136809438467} {"Full-finetune/Learning Rate": 1.578625932546486e-05, "Full-finetune/Loss": 0.823511004447937, "Full-finetune/Loss (Raw)": 0.6209774613380432, "Full-finetune/Step": 1686, "Full-finetune/Step Time": 6.737774014472961} {"Full-finetune/Learning Rate": 1.578117737584484e-05, "Full-finetune/Loss": 0.8221632242202759, "Full-finetune/Loss (Raw)": 0.9130125045776367, "Full-finetune/Step": 1687, "Full-finetune/Step Time": 6.74083231203258} {"Full-finetune/Learning Rate": 1.577609318266275e-05, "Full-finetune/Loss": 0.8215264678001404, "Full-finetune/Loss (Raw)": 0.8254888653755188, "Full-finetune/Step": 1688, "Full-finetune/Step Time": 6.737437695264816} {"Full-finetune/Learning Rate": 1.5771006747891663e-05, "Full-finetune/Loss": 0.8171548843383789, "Full-finetune/Loss (Raw)": 0.3058643937110901, "Full-finetune/Step": 1689, "Full-finetune/Step Time": 6.752954337745905} {"Full-finetune/Learning Rate": 1.576591807350553e-05, "Full-finetune/Loss": 0.8175948858261108, "Full-finetune/Loss (Raw)": 0.9498421549797058, "Full-finetune/Step": 1690, "Full-finetune/Step Time": 6.743488760665059} {"Full-finetune/Learning Rate": 1.5760827161479158e-05, "Full-finetune/Loss": 0.8183778524398804, "Full-finetune/Loss (Raw)": 0.8831333518028259, "Full-finetune/Step": 1691, "Full-finetune/Step Time": 6.725304808467627} {"Full-finetune/Learning Rate": 1.5755734013788235e-05, "Full-finetune/Loss": 0.8180408477783203, "Full-finetune/Loss (Raw)": 0.731932520866394, "Full-finetune/Step": 1692, "Full-finetune/Step Time": 6.746047705411911} {"Full-finetune/Learning Rate": 1.5750638632409315e-05, "Full-finetune/Loss": 0.8173938393592834, "Full-finetune/Loss (Raw)": 0.6593272089958191, "Full-finetune/Step": 1693, "Full-finetune/Step Time": 6.763573240488768} {"Full-finetune/Learning Rate": 1.574554101931981e-05, "Full-finetune/Loss": 0.8160613775253296, "Full-finetune/Loss (Raw)": 0.6033387184143066, "Full-finetune/Step": 1694, "Full-finetune/Step Time": 6.76484370790422} {"Full-finetune/Learning Rate": 1.5740441176498015e-05, "Full-finetune/Loss": 0.8149975538253784, "Full-finetune/Loss (Raw)": 0.7040032148361206, "Full-finetune/Step": 1695, "Full-finetune/Step Time": 6.770116005092859} {"Full-finetune/Learning Rate": 1.5735339105923068e-05, "Full-finetune/Loss": 0.8152412176132202, "Full-finetune/Loss (Raw)": 0.8616989850997925, "Full-finetune/Step": 1696, "Full-finetune/Step Time": 6.767778478562832} {"Full-finetune/Learning Rate": 1.5730234809574986e-05, "Full-finetune/Loss": 0.816953182220459, "Full-finetune/Loss (Raw)": 0.9195748567581177, "Full-finetune/Step": 1697, "Full-finetune/Step Time": 6.753174478188157} {"Full-finetune/Learning Rate": 1.5725128289434647e-05, "Full-finetune/Loss": 0.816006064414978, "Full-finetune/Loss (Raw)": 0.8357171416282654, "Full-finetune/Step": 1698, "Full-finetune/Step Time": 6.754721516743302} {"Full-finetune/Learning Rate": 1.5720019547483795e-05, "Full-finetune/Loss": 0.8160830736160278, "Full-finetune/Loss (Raw)": 0.8984618186950684, "Full-finetune/Step": 1699, "Full-finetune/Step Time": 6.7524244375526905} {"Full-finetune/Learning Rate": 1.571490858570503e-05, "Full-finetune/Loss": 0.8157135248184204, "Full-finetune/Loss (Raw)": 0.8761220574378967, "Full-finetune/Step": 1700, "Full-finetune/Step Time": 6.760796325281262} {"Full-finetune/Learning Rate": 1.5709795406081818e-05, "Full-finetune/Loss": 0.8166155815124512, "Full-finetune/Loss (Raw)": 0.9384500980377197, "Full-finetune/Step": 1701, "Full-finetune/Step Time": 6.735404048115015} {"Full-finetune/Learning Rate": 1.570468001059848e-05, "Full-finetune/Loss": 0.8183244466781616, "Full-finetune/Loss (Raw)": 0.9305533170700073, "Full-finetune/Step": 1702, "Full-finetune/Step Time": 6.733966793864965} {"Full-finetune/Learning Rate": 1.5699562401240206e-05, "Full-finetune/Loss": 0.815781831741333, "Full-finetune/Loss (Raw)": 0.6505261659622192, "Full-finetune/Step": 1703, "Full-finetune/Step Time": 6.7401581555604935} {"Full-finetune/Learning Rate": 1.5694442579993042e-05, "Full-finetune/Loss": 0.8118239045143127, "Full-finetune/Loss (Raw)": 0.34706324338912964, "Full-finetune/Step": 1704, "Full-finetune/Step Time": 6.754019986838102} {"Full-finetune/Learning Rate": 1.5689320548843882e-05, "Full-finetune/Loss": 0.8116228580474854, "Full-finetune/Loss (Raw)": 0.8472127914428711, "Full-finetune/Step": 1705, "Full-finetune/Step Time": 6.766387157142162} {"Full-finetune/Learning Rate": 1.5684196309780495e-05, "Full-finetune/Loss": 0.811780571937561, "Full-finetune/Loss (Raw)": 0.908331036567688, "Full-finetune/Step": 1706, "Full-finetune/Step Time": 6.7687535881996155} {"Full-finetune/Learning Rate": 1.5679069864791493e-05, "Full-finetune/Loss": 0.8126915693283081, "Full-finetune/Loss (Raw)": 0.8762987852096558, "Full-finetune/Step": 1707, "Full-finetune/Step Time": 6.764470309019089} {"Full-finetune/Learning Rate": 1.567394121586635e-05, "Full-finetune/Loss": 0.8139610290527344, "Full-finetune/Loss (Raw)": 0.8539872765541077, "Full-finetune/Step": 1708, "Full-finetune/Step Time": 6.7442501448094845} {"Full-finetune/Learning Rate": 1.56688103649954e-05, "Full-finetune/Loss": 0.8158378601074219, "Full-finetune/Loss (Raw)": 0.9712086319923401, "Full-finetune/Step": 1709, "Full-finetune/Step Time": 6.741726806387305} {"Full-finetune/Learning Rate": 1.566367731416982e-05, "Full-finetune/Loss": 0.8158891201019287, "Full-finetune/Loss (Raw)": 0.8387579321861267, "Full-finetune/Step": 1710, "Full-finetune/Step Time": 6.750893173739314} {"Full-finetune/Learning Rate": 1.5658542065381644e-05, "Full-finetune/Loss": 0.8158056139945984, "Full-finetune/Loss (Raw)": 0.8720235824584961, "Full-finetune/Step": 1711, "Full-finetune/Step Time": 6.763531614094973} {"Full-finetune/Learning Rate": 1.565340462062377e-05, "Full-finetune/Loss": 0.8171930313110352, "Full-finetune/Loss (Raw)": 1.0119268894195557, "Full-finetune/Step": 1712, "Full-finetune/Step Time": 6.7738081105053425} {"Full-finetune/Learning Rate": 1.5648264981889936e-05, "Full-finetune/Loss": 0.8168917298316956, "Full-finetune/Loss (Raw)": 0.9072716236114502, "Full-finetune/Step": 1713, "Full-finetune/Step Time": 6.772557964548469} {"Full-finetune/Learning Rate": 1.5643123151174736e-05, "Full-finetune/Loss": 0.8157557249069214, "Full-finetune/Loss (Raw)": 0.898242175579071, "Full-finetune/Step": 1714, "Full-finetune/Step Time": 6.737707523629069} {"Full-finetune/Learning Rate": 1.5637979130473612e-05, "Full-finetune/Loss": 0.8132956027984619, "Full-finetune/Loss (Raw)": 0.6392801403999329, "Full-finetune/Step": 1715, "Full-finetune/Step Time": 6.756463436409831} {"Full-finetune/Learning Rate": 1.563283292178286e-05, "Full-finetune/Loss": 0.8135755062103271, "Full-finetune/Loss (Raw)": 0.8713147640228271, "Full-finetune/Step": 1716, "Full-finetune/Step Time": 6.744326056912541} {"Full-finetune/Learning Rate": 1.5627684527099624e-05, "Full-finetune/Loss": 0.8139395117759705, "Full-finetune/Loss (Raw)": 0.8926064968109131, "Full-finetune/Step": 1717, "Full-finetune/Step Time": 6.744138695299625} {"Full-finetune/Learning Rate": 1.5622533948421895e-05, "Full-finetune/Loss": 0.8137409687042236, "Full-finetune/Loss (Raw)": 0.9122505187988281, "Full-finetune/Step": 1718, "Full-finetune/Step Time": 6.734131997451186} {"Full-finetune/Learning Rate": 1.5617381187748507e-05, "Full-finetune/Loss": 0.8152740001678467, "Full-finetune/Loss (Raw)": 0.8204495906829834, "Full-finetune/Step": 1719, "Full-finetune/Step Time": 6.7203214559704065} {"Full-finetune/Learning Rate": 1.5612226247079155e-05, "Full-finetune/Loss": 0.8173096179962158, "Full-finetune/Loss (Raw)": 0.9595139622688293, "Full-finetune/Step": 1720, "Full-finetune/Step Time": 6.718474542722106} {"Full-finetune/Learning Rate": 1.5607069128414366e-05, "Full-finetune/Loss": 0.8183776140213013, "Full-finetune/Loss (Raw)": 0.9155759215354919, "Full-finetune/Step": 1721, "Full-finetune/Step Time": 6.718791687861085} {"Full-finetune/Learning Rate": 1.5601909833755514e-05, "Full-finetune/Loss": 0.8185769319534302, "Full-finetune/Loss (Raw)": 0.8607156872749329, "Full-finetune/Step": 1722, "Full-finetune/Step Time": 6.708969376981258} {"Full-finetune/Learning Rate": 1.559674836510482e-05, "Full-finetune/Loss": 0.8196136951446533, "Full-finetune/Loss (Raw)": 0.8405839800834656, "Full-finetune/Step": 1723, "Full-finetune/Step Time": 6.724487125873566} {"Full-finetune/Learning Rate": 1.5591584724465363e-05, "Full-finetune/Loss": 0.819303035736084, "Full-finetune/Loss (Raw)": 0.8011302351951599, "Full-finetune/Step": 1724, "Full-finetune/Step Time": 6.716849759221077} {"Full-finetune/Learning Rate": 1.5586418913841034e-05, "Full-finetune/Loss": 0.8201150894165039, "Full-finetune/Loss (Raw)": 0.8370656371116638, "Full-finetune/Step": 1725, "Full-finetune/Step Time": 6.7068461906164885} {"Full-finetune/Learning Rate": 1.558125093523659e-05, "Full-finetune/Loss": 0.8197799921035767, "Full-finetune/Loss (Raw)": 0.7812185883522034, "Full-finetune/Step": 1726, "Full-finetune/Step Time": 6.688992181792855} {"Full-finetune/Learning Rate": 1.5576080790657626e-05, "Full-finetune/Loss": 0.8235381245613098, "Full-finetune/Loss (Raw)": 0.855531632900238, "Full-finetune/Step": 1727, "Full-finetune/Step Time": 6.686891118064523} {"Full-finetune/Learning Rate": 1.5570908482110566e-05, "Full-finetune/Loss": 0.8239396214485168, "Full-finetune/Loss (Raw)": 0.9565941095352173, "Full-finetune/Step": 1728, "Full-finetune/Step Time": 6.683739459142089} {"Full-finetune/Learning Rate": 1.5565734011602693e-05, "Full-finetune/Loss": 0.8278175592422485, "Full-finetune/Loss (Raw)": 0.8853154182434082, "Full-finetune/Step": 1729, "Full-finetune/Step Time": 6.667611354961991} {"Full-finetune/Learning Rate": 1.556055738114211e-05, "Full-finetune/Loss": 0.8260177969932556, "Full-finetune/Loss (Raw)": 0.7519472241401672, "Full-finetune/Step": 1730, "Full-finetune/Step Time": 6.658922623842955} {"Full-finetune/Learning Rate": 1.555537859273777e-05, "Full-finetune/Loss": 0.8267706632614136, "Full-finetune/Loss (Raw)": 1.0273433923721313, "Full-finetune/Step": 1731, "Full-finetune/Step Time": 6.646032536402345} {"Full-finetune/Learning Rate": 1.5550197648399453e-05, "Full-finetune/Loss": 0.8277361989021301, "Full-finetune/Loss (Raw)": 0.9391613006591797, "Full-finetune/Step": 1732, "Full-finetune/Step Time": 6.6496517192572355} {"Full-finetune/Learning Rate": 1.554501455013779e-05, "Full-finetune/Loss": 0.8293878436088562, "Full-finetune/Loss (Raw)": 0.8690879344940186, "Full-finetune/Step": 1733, "Full-finetune/Step Time": 6.631224347278476} {"Full-finetune/Learning Rate": 1.5539829299964236e-05, "Full-finetune/Loss": 0.8314263820648193, "Full-finetune/Loss (Raw)": 0.8969699740409851, "Full-finetune/Step": 1734, "Full-finetune/Step Time": 6.615055834874511} {"Full-finetune/Learning Rate": 1.5534641899891084e-05, "Full-finetune/Loss": 0.8313679695129395, "Full-finetune/Loss (Raw)": 0.8289797902107239, "Full-finetune/Step": 1735, "Full-finetune/Step Time": 6.614762416109443} {"Full-finetune/Learning Rate": 1.5529452351931473e-05, "Full-finetune/Loss": 0.8351647853851318, "Full-finetune/Loss (Raw)": 0.8697940111160278, "Full-finetune/Step": 1736, "Full-finetune/Step Time": 6.595850743353367} {"Full-finetune/Learning Rate": 1.5524260658099352e-05, "Full-finetune/Loss": 0.8344210386276245, "Full-finetune/Loss (Raw)": 0.788105309009552, "Full-finetune/Step": 1737, "Full-finetune/Step Time": 6.5941942520439625} {"Full-finetune/Learning Rate": 1.551906682040952e-05, "Full-finetune/Loss": 0.8303630352020264, "Full-finetune/Loss (Raw)": 0.3510712683200836, "Full-finetune/Step": 1738, "Full-finetune/Step Time": 6.6097844541072845} {"Full-finetune/Learning Rate": 1.5513870840877608e-05, "Full-finetune/Loss": 0.8309836387634277, "Full-finetune/Loss (Raw)": 0.8269264101982117, "Full-finetune/Step": 1739, "Full-finetune/Step Time": 6.588342919945717} {"Full-finetune/Learning Rate": 1.5508672721520076e-05, "Full-finetune/Loss": 0.8305689096450806, "Full-finetune/Loss (Raw)": 0.757841944694519, "Full-finetune/Step": 1740, "Full-finetune/Step Time": 6.6035338044166565} {"Full-finetune/Learning Rate": 1.5503472464354207e-05, "Full-finetune/Loss": 0.8329697847366333, "Full-finetune/Loss (Raw)": 1.0421425104141235, "Full-finetune/Step": 1741, "Full-finetune/Step Time": 6.594321604818106} {"Full-finetune/Learning Rate": 1.5498270071398116e-05, "Full-finetune/Loss": 0.8314408659934998, "Full-finetune/Loss (Raw)": 0.7024185657501221, "Full-finetune/Step": 1742, "Full-finetune/Step Time": 6.602697219699621} {"Full-finetune/Learning Rate": 1.549306554467076e-05, "Full-finetune/Loss": 0.830653190612793, "Full-finetune/Loss (Raw)": 0.8482610583305359, "Full-finetune/Step": 1743, "Full-finetune/Step Time": 6.618056293576956} {"Full-finetune/Learning Rate": 1.5487858886191903e-05, "Full-finetune/Loss": 0.8304537534713745, "Full-finetune/Loss (Raw)": 0.8336095213890076, "Full-finetune/Step": 1744, "Full-finetune/Step Time": 6.629304995760322} {"Full-finetune/Learning Rate": 1.548265009798216e-05, "Full-finetune/Loss": 0.831059455871582, "Full-finetune/Loss (Raw)": 0.8857502937316895, "Full-finetune/Step": 1745, "Full-finetune/Step Time": 6.626051131635904} {"Full-finetune/Learning Rate": 1.547743918206295e-05, "Full-finetune/Loss": 0.8321943283081055, "Full-finetune/Loss (Raw)": 0.9769946932792664, "Full-finetune/Step": 1746, "Full-finetune/Step Time": 6.625559752807021} {"Full-finetune/Learning Rate": 1.5472226140456537e-05, "Full-finetune/Loss": 0.8296548128128052, "Full-finetune/Loss (Raw)": 0.43308085203170776, "Full-finetune/Step": 1747, "Full-finetune/Step Time": 6.642465092241764} {"Full-finetune/Learning Rate": 1.546701097518599e-05, "Full-finetune/Loss": 0.8265683054924011, "Full-finetune/Loss (Raw)": 0.6960817575454712, "Full-finetune/Step": 1748, "Full-finetune/Step Time": 6.65324742347002} {"Full-finetune/Learning Rate": 1.546179368827522e-05, "Full-finetune/Loss": 0.8273773789405823, "Full-finetune/Loss (Raw)": 0.8814763426780701, "Full-finetune/Step": 1749, "Full-finetune/Step Time": 6.6523255575448275} {"Full-finetune/Learning Rate": 1.545657428174895e-05, "Full-finetune/Loss": 0.8272231221199036, "Full-finetune/Loss (Raw)": 0.9472099542617798, "Full-finetune/Step": 1750, "Full-finetune/Step Time": 6.6704454850405455} {"Full-finetune/Learning Rate": 1.5451352757632734e-05, "Full-finetune/Loss": 0.8259519934654236, "Full-finetune/Loss (Raw)": 0.9136644005775452, "Full-finetune/Step": 1751, "Full-finetune/Step Time": 6.674126625061035} {"Full-finetune/Learning Rate": 1.544612911795294e-05, "Full-finetune/Loss": 0.827014684677124, "Full-finetune/Loss (Raw)": 1.0101886987686157, "Full-finetune/Step": 1752, "Full-finetune/Step Time": 6.673987049609423} {"Full-finetune/Learning Rate": 1.5440903364736763e-05, "Full-finetune/Loss": 0.8267897963523865, "Full-finetune/Loss (Raw)": 0.8512094616889954, "Full-finetune/Step": 1753, "Full-finetune/Step Time": 6.67203526198864} {"Full-finetune/Learning Rate": 1.5435675500012212e-05, "Full-finetune/Loss": 0.8269027471542358, "Full-finetune/Loss (Raw)": 0.9114305377006531, "Full-finetune/Step": 1754, "Full-finetune/Step Time": 6.680496580898762} {"Full-finetune/Learning Rate": 1.5430445525808123e-05, "Full-finetune/Loss": 0.8262927532196045, "Full-finetune/Loss (Raw)": 0.8681711554527283, "Full-finetune/Step": 1755, "Full-finetune/Step Time": 6.686980165541172} {"Full-finetune/Learning Rate": 1.5425213444154152e-05, "Full-finetune/Loss": 0.8273792862892151, "Full-finetune/Loss (Raw)": 0.9807381629943848, "Full-finetune/Step": 1756, "Full-finetune/Step Time": 6.6804793160408735} {"Full-finetune/Learning Rate": 1.5419979257080755e-05, "Full-finetune/Loss": 0.8241177797317505, "Full-finetune/Loss (Raw)": 0.3588544428348541, "Full-finetune/Step": 1757, "Full-finetune/Step Time": 6.69979608617723} {"Full-finetune/Learning Rate": 1.541474296661923e-05, "Full-finetune/Loss": 0.8232247829437256, "Full-finetune/Loss (Raw)": 0.7563382983207703, "Full-finetune/Step": 1758, "Full-finetune/Step Time": 6.704639179632068} {"Full-finetune/Learning Rate": 1.5409504574801667e-05, "Full-finetune/Loss": 0.8240340948104858, "Full-finetune/Loss (Raw)": 0.9571624994277954, "Full-finetune/Step": 1759, "Full-finetune/Step Time": 6.7103460393846035} {"Full-finetune/Learning Rate": 1.5404264083660993e-05, "Full-finetune/Loss": 0.8251044750213623, "Full-finetune/Loss (Raw)": 0.9712605476379395, "Full-finetune/Step": 1760, "Full-finetune/Step Time": 6.708515778183937} {"Full-finetune/Learning Rate": 1.539902149523094e-05, "Full-finetune/Loss": 0.8249247074127197, "Full-finetune/Loss (Raw)": 0.7567412257194519, "Full-finetune/Step": 1761, "Full-finetune/Step Time": 6.713822420686483} {"Full-finetune/Learning Rate": 1.5393776811546047e-05, "Full-finetune/Loss": 0.8240225315093994, "Full-finetune/Loss (Raw)": 0.7575258612632751, "Full-finetune/Step": 1762, "Full-finetune/Step Time": 6.7244745921343565} {"Full-finetune/Learning Rate": 1.538853003464168e-05, "Full-finetune/Loss": 0.8255000114440918, "Full-finetune/Loss (Raw)": 0.9894729852676392, "Full-finetune/Step": 1763, "Full-finetune/Step Time": 6.719861606135964} {"Full-finetune/Learning Rate": 1.538328116655401e-05, "Full-finetune/Loss": 0.8257754445075989, "Full-finetune/Loss (Raw)": 0.9278246164321899, "Full-finetune/Step": 1764, "Full-finetune/Step Time": 6.750591831281781} {"Full-finetune/Learning Rate": 1.5378030209320018e-05, "Full-finetune/Loss": 0.8257499933242798, "Full-finetune/Loss (Raw)": 0.7821121215820312, "Full-finetune/Step": 1765, "Full-finetune/Step Time": 6.773483676835895} {"Full-finetune/Learning Rate": 1.53727771649775e-05, "Full-finetune/Loss": 0.8266077637672424, "Full-finetune/Loss (Raw)": 0.9081462025642395, "Full-finetune/Step": 1766, "Full-finetune/Step Time": 6.775900328531861} {"Full-finetune/Learning Rate": 1.5367522035565055e-05, "Full-finetune/Loss": 0.826533317565918, "Full-finetune/Loss (Raw)": 0.7277284264564514, "Full-finetune/Step": 1767, "Full-finetune/Step Time": 6.786653760820627} {"Full-finetune/Learning Rate": 1.5362264823122107e-05, "Full-finetune/Loss": 0.8246172666549683, "Full-finetune/Loss (Raw)": 0.7126869559288025, "Full-finetune/Step": 1768, "Full-finetune/Step Time": 6.787589579820633} {"Full-finetune/Learning Rate": 1.5357005529688868e-05, "Full-finetune/Loss": 0.8228062391281128, "Full-finetune/Loss (Raw)": 0.6898089051246643, "Full-finetune/Step": 1769, "Full-finetune/Step Time": 6.802737081423402} {"Full-finetune/Learning Rate": 1.5351744157306366e-05, "Full-finetune/Loss": 0.8231717944145203, "Full-finetune/Loss (Raw)": 0.8968908190727234, "Full-finetune/Step": 1770, "Full-finetune/Step Time": 6.804132618010044} {"Full-finetune/Learning Rate": 1.5346480708016445e-05, "Full-finetune/Loss": 0.8218327760696411, "Full-finetune/Loss (Raw)": 0.8142070770263672, "Full-finetune/Step": 1771, "Full-finetune/Step Time": 6.803590856492519} {"Full-finetune/Learning Rate": 1.5341215183861738e-05, "Full-finetune/Loss": 0.8232876062393188, "Full-finetune/Loss (Raw)": 0.9912766218185425, "Full-finetune/Step": 1772, "Full-finetune/Step Time": 6.778212463483214} {"Full-finetune/Learning Rate": 1.53359475868857e-05, "Full-finetune/Loss": 0.8230654001235962, "Full-finetune/Loss (Raw)": 0.824967086315155, "Full-finetune/Step": 1773, "Full-finetune/Step Time": 6.787392886355519} {"Full-finetune/Learning Rate": 1.5330677919132577e-05, "Full-finetune/Loss": 0.8216872215270996, "Full-finetune/Loss (Raw)": 0.7444377541542053, "Full-finetune/Step": 1774, "Full-finetune/Step Time": 6.801325375214219} {"Full-finetune/Learning Rate": 1.5325406182647426e-05, "Full-finetune/Loss": 0.8230259418487549, "Full-finetune/Loss (Raw)": 0.9471086859703064, "Full-finetune/Step": 1775, "Full-finetune/Step Time": 6.789898777380586} {"Full-finetune/Learning Rate": 1.5320132379476107e-05, "Full-finetune/Loss": 0.8224227428436279, "Full-finetune/Loss (Raw)": 0.8540113568305969, "Full-finetune/Step": 1776, "Full-finetune/Step Time": 6.787707669660449} {"Full-finetune/Learning Rate": 1.531485651166528e-05, "Full-finetune/Loss": 0.8227553367614746, "Full-finetune/Loss (Raw)": 0.8753777742385864, "Full-finetune/Step": 1777, "Full-finetune/Step Time": 6.772492911666632} {"Full-finetune/Learning Rate": 1.5309578581262404e-05, "Full-finetune/Loss": 0.8222149014472961, "Full-finetune/Loss (Raw)": 0.8307839035987854, "Full-finetune/Step": 1778, "Full-finetune/Step Time": 6.785229267552495} {"Full-finetune/Learning Rate": 1.530429859031574e-05, "Full-finetune/Loss": 0.8244670629501343, "Full-finetune/Loss (Raw)": 1.0424578189849854, "Full-finetune/Step": 1779, "Full-finetune/Step Time": 6.7697602435946465} {"Full-finetune/Learning Rate": 1.5299016540874346e-05, "Full-finetune/Loss": 0.8244442939758301, "Full-finetune/Loss (Raw)": 0.8103159666061401, "Full-finetune/Step": 1780, "Full-finetune/Step Time": 6.740460770204663} {"Full-finetune/Learning Rate": 1.5293732434988095e-05, "Full-finetune/Loss": 0.8233145475387573, "Full-finetune/Loss (Raw)": 0.6935206055641174, "Full-finetune/Step": 1781, "Full-finetune/Step Time": 6.742678927257657} {"Full-finetune/Learning Rate": 1.5288446274707635e-05, "Full-finetune/Loss": 0.8230463862419128, "Full-finetune/Loss (Raw)": 0.8669466972351074, "Full-finetune/Step": 1782, "Full-finetune/Step Time": 6.730163102969527} {"Full-finetune/Learning Rate": 1.5283158062084423e-05, "Full-finetune/Loss": 0.8257319331169128, "Full-finetune/Loss (Raw)": 0.7305675745010376, "Full-finetune/Step": 1783, "Full-finetune/Step Time": 6.71275844797492} {"Full-finetune/Learning Rate": 1.5277867799170708e-05, "Full-finetune/Loss": 0.826676607131958, "Full-finetune/Loss (Raw)": 1.0081899166107178, "Full-finetune/Step": 1784, "Full-finetune/Step Time": 6.71755257062614} {"Full-finetune/Learning Rate": 1.527257548801955e-05, "Full-finetune/Loss": 0.8254172801971436, "Full-finetune/Loss (Raw)": 0.649397075176239, "Full-finetune/Step": 1785, "Full-finetune/Step Time": 6.730808014050126} {"Full-finetune/Learning Rate": 1.526728113068478e-05, "Full-finetune/Loss": 0.8250001072883606, "Full-finetune/Loss (Raw)": 0.8365364670753479, "Full-finetune/Step": 1786, "Full-finetune/Step Time": 6.728449326008558} {"Full-finetune/Learning Rate": 1.526198472922104e-05, "Full-finetune/Loss": 0.8242841958999634, "Full-finetune/Loss (Raw)": 0.7037051916122437, "Full-finetune/Step": 1787, "Full-finetune/Step Time": 6.733916150406003} {"Full-finetune/Learning Rate": 1.5256686285683753e-05, "Full-finetune/Loss": 0.8235607743263245, "Full-finetune/Loss (Raw)": 0.7886171936988831, "Full-finetune/Step": 1788, "Full-finetune/Step Time": 6.729017928242683} {"Full-finetune/Learning Rate": 1.5251385802129149e-05, "Full-finetune/Loss": 0.8193901777267456, "Full-finetune/Loss (Raw)": 0.29718634486198425, "Full-finetune/Step": 1789, "Full-finetune/Step Time": 6.753834439441562} {"Full-finetune/Learning Rate": 1.5246083280614241e-05, "Full-finetune/Loss": 0.8190810680389404, "Full-finetune/Loss (Raw)": 0.9085268974304199, "Full-finetune/Step": 1790, "Full-finetune/Step Time": 6.756255347281694} {"Full-finetune/Learning Rate": 1.5240778723196833e-05, "Full-finetune/Loss": 0.8221133351325989, "Full-finetune/Loss (Raw)": 0.9699786901473999, "Full-finetune/Step": 1791, "Full-finetune/Step Time": 6.7382469195872545} {"Full-finetune/Learning Rate": 1.523547213193552e-05, "Full-finetune/Loss": 0.8238195180892944, "Full-finetune/Loss (Raw)": 0.9167271852493286, "Full-finetune/Step": 1792, "Full-finetune/Step Time": 6.739119527861476} {"Full-finetune/Learning Rate": 1.5230163508889686e-05, "Full-finetune/Loss": 0.82172691822052, "Full-finetune/Loss (Raw)": 0.7184120416641235, "Full-finetune/Step": 1793, "Full-finetune/Step Time": 6.753124864771962} {"Full-finetune/Learning Rate": 1.5224852856119503e-05, "Full-finetune/Loss": 0.8225035667419434, "Full-finetune/Loss (Raw)": 0.9298505187034607, "Full-finetune/Step": 1794, "Full-finetune/Step Time": 6.758933335542679} {"Full-finetune/Learning Rate": 1.5219540175685938e-05, "Full-finetune/Loss": 0.8184258937835693, "Full-finetune/Loss (Raw)": 0.37158748507499695, "Full-finetune/Step": 1795, "Full-finetune/Step Time": 6.778701078146696} {"Full-finetune/Learning Rate": 1.5214225469650727e-05, "Full-finetune/Loss": 0.8174692988395691, "Full-finetune/Loss (Raw)": 0.8184419870376587, "Full-finetune/Step": 1796, "Full-finetune/Step Time": 6.771312937140465} {"Full-finetune/Learning Rate": 1.5208908740076416e-05, "Full-finetune/Loss": 0.8172774910926819, "Full-finetune/Loss (Raw)": 0.8478041291236877, "Full-finetune/Step": 1797, "Full-finetune/Step Time": 6.771102322265506} {"Full-finetune/Learning Rate": 1.5203589989026318e-05, "Full-finetune/Loss": 0.8168104887008667, "Full-finetune/Loss (Raw)": 0.8714912533760071, "Full-finetune/Step": 1798, "Full-finetune/Step Time": 6.774534195661545} {"Full-finetune/Learning Rate": 1.5198269218564535e-05, "Full-finetune/Loss": 0.8169523477554321, "Full-finetune/Loss (Raw)": 0.8147475123405457, "Full-finetune/Step": 1799, "Full-finetune/Step Time": 6.766389980912209} {"Full-finetune/Learning Rate": 1.5192946430755955e-05, "Full-finetune/Loss": 0.8165608048439026, "Full-finetune/Loss (Raw)": 0.8136475682258606, "Full-finetune/Step": 1800, "Full-finetune/Step Time": 6.759705172851682} {"Full-finetune/Learning Rate": 1.518762162766625e-05, "Full-finetune/Loss": 0.8179843425750732, "Full-finetune/Loss (Raw)": 0.9026477932929993, "Full-finetune/Step": 1801, "Full-finetune/Step Time": 6.763910077512264} {"Full-finetune/Learning Rate": 1.5182294811361871e-05, "Full-finetune/Loss": 0.8195226192474365, "Full-finetune/Loss (Raw)": 0.7848315238952637, "Full-finetune/Step": 1802, "Full-finetune/Step Time": 6.765939086675644} {"Full-finetune/Learning Rate": 1.5176965983910053e-05, "Full-finetune/Loss": 0.8207226991653442, "Full-finetune/Loss (Raw)": 0.8465059995651245, "Full-finetune/Step": 1803, "Full-finetune/Step Time": 6.778204983100295} {"Full-finetune/Learning Rate": 1.5171635147378804e-05, "Full-finetune/Loss": 0.8204441666603088, "Full-finetune/Loss (Raw)": 0.8846542835235596, "Full-finetune/Step": 1804, "Full-finetune/Step Time": 6.781438851729035} {"Full-finetune/Learning Rate": 1.5166302303836928e-05, "Full-finetune/Loss": 0.8172154426574707, "Full-finetune/Loss (Raw)": 0.5456392168998718, "Full-finetune/Step": 1805, "Full-finetune/Step Time": 6.799683284014463} {"Full-finetune/Learning Rate": 1.5160967455353985e-05, "Full-finetune/Loss": 0.8170312643051147, "Full-finetune/Loss (Raw)": 0.7552436590194702, "Full-finetune/Step": 1806, "Full-finetune/Step Time": 6.811593368649483} {"Full-finetune/Learning Rate": 1.5155630604000338e-05, "Full-finetune/Loss": 0.8210198283195496, "Full-finetune/Loss (Raw)": 0.8940173387527466, "Full-finetune/Step": 1807, "Full-finetune/Step Time": 6.793120369315147} {"Full-finetune/Learning Rate": 1.5150291751847106e-05, "Full-finetune/Loss": 0.820573091506958, "Full-finetune/Loss (Raw)": 0.8016502857208252, "Full-finetune/Step": 1808, "Full-finetune/Step Time": 6.782741356641054} {"Full-finetune/Learning Rate": 1.5144950900966198e-05, "Full-finetune/Loss": 0.8205962777137756, "Full-finetune/Loss (Raw)": 0.874772310256958, "Full-finetune/Step": 1809, "Full-finetune/Step Time": 6.781613223254681} {"Full-finetune/Learning Rate": 1.5139608053430288e-05, "Full-finetune/Loss": 0.8187291622161865, "Full-finetune/Loss (Raw)": 0.7863978147506714, "Full-finetune/Step": 1810, "Full-finetune/Step Time": 6.7832488510757685} {"Full-finetune/Learning Rate": 1.5134263211312837e-05, "Full-finetune/Loss": 0.8197947144508362, "Full-finetune/Loss (Raw)": 0.8401438593864441, "Full-finetune/Step": 1811, "Full-finetune/Step Time": 6.776585590094328} {"Full-finetune/Learning Rate": 1.5128916376688071e-05, "Full-finetune/Loss": 0.8190277814865112, "Full-finetune/Loss (Raw)": 0.7267472743988037, "Full-finetune/Step": 1812, "Full-finetune/Step Time": 6.782950419932604} {"Full-finetune/Learning Rate": 1.5123567551630993e-05, "Full-finetune/Loss": 0.8195980787277222, "Full-finetune/Loss (Raw)": 0.8227642774581909, "Full-finetune/Step": 1813, "Full-finetune/Step Time": 6.772549275308847} {"Full-finetune/Learning Rate": 1.511821673821738e-05, "Full-finetune/Loss": 0.8214374780654907, "Full-finetune/Loss (Raw)": 0.8564308285713196, "Full-finetune/Step": 1814, "Full-finetune/Step Time": 6.750178122892976} {"Full-finetune/Learning Rate": 1.5112863938523774e-05, "Full-finetune/Loss": 0.8207755088806152, "Full-finetune/Loss (Raw)": 0.8282738327980042, "Full-finetune/Step": 1815, "Full-finetune/Step Time": 6.748408678919077} {"Full-finetune/Learning Rate": 1.5107509154627491e-05, "Full-finetune/Loss": 0.8216795921325684, "Full-finetune/Loss (Raw)": 0.9412153959274292, "Full-finetune/Step": 1816, "Full-finetune/Step Time": 6.743541078642011} {"Full-finetune/Learning Rate": 1.5102152388606625e-05, "Full-finetune/Loss": 0.8259532451629639, "Full-finetune/Loss (Raw)": 0.8528866171836853, "Full-finetune/Step": 1817, "Full-finetune/Step Time": 6.726357910782099} {"Full-finetune/Learning Rate": 1.5096793642540027e-05, "Full-finetune/Loss": 0.8246039152145386, "Full-finetune/Loss (Raw)": 0.7771303057670593, "Full-finetune/Step": 1818, "Full-finetune/Step Time": 6.726870710030198} {"Full-finetune/Learning Rate": 1.5091432918507322e-05, "Full-finetune/Loss": 0.8246301412582397, "Full-finetune/Loss (Raw)": 0.8864930868148804, "Full-finetune/Step": 1819, "Full-finetune/Step Time": 6.7244043201208115} {"Full-finetune/Learning Rate": 1.5086070218588904e-05, "Full-finetune/Loss": 0.8246849775314331, "Full-finetune/Loss (Raw)": 0.7389467358589172, "Full-finetune/Step": 1820, "Full-finetune/Step Time": 6.702487520873547} {"Full-finetune/Learning Rate": 1.5080705544865932e-05, "Full-finetune/Loss": 0.8263234496116638, "Full-finetune/Loss (Raw)": 0.8690565228462219, "Full-finetune/Step": 1821, "Full-finetune/Step Time": 6.708713948726654} {"Full-finetune/Learning Rate": 1.5075338899420326e-05, "Full-finetune/Loss": 0.8300437331199646, "Full-finetune/Loss (Raw)": 1.0795358419418335, "Full-finetune/Step": 1822, "Full-finetune/Step Time": 6.700358506292105} {"Full-finetune/Learning Rate": 1.5069970284334785e-05, "Full-finetune/Loss": 0.8311952948570251, "Full-finetune/Loss (Raw)": 0.8514009714126587, "Full-finetune/Step": 1823, "Full-finetune/Step Time": 6.703127220273018} {"Full-finetune/Learning Rate": 1.506459970169276e-05, "Full-finetune/Loss": 0.8294332027435303, "Full-finetune/Loss (Raw)": 0.6361558437347412, "Full-finetune/Step": 1824, "Full-finetune/Step Time": 6.7064556907862425} {"Full-finetune/Learning Rate": 1.5059227153578466e-05, "Full-finetune/Loss": 0.8287530541419983, "Full-finetune/Loss (Raw)": 0.8325127363204956, "Full-finetune/Step": 1825, "Full-finetune/Step Time": 6.707810016348958} {"Full-finetune/Learning Rate": 1.505385264207689e-05, "Full-finetune/Loss": 0.8290965557098389, "Full-finetune/Loss (Raw)": 0.879681408405304, "Full-finetune/Step": 1826, "Full-finetune/Step Time": 6.708273807540536} {"Full-finetune/Learning Rate": 1.5048476169273767e-05, "Full-finetune/Loss": 0.828407883644104, "Full-finetune/Loss (Raw)": 0.8103121519088745, "Full-finetune/Step": 1827, "Full-finetune/Step Time": 6.74017146602273} {"Full-finetune/Learning Rate": 1.5043097737255607e-05, "Full-finetune/Loss": 0.8284719586372375, "Full-finetune/Loss (Raw)": 0.8843265175819397, "Full-finetune/Step": 1828, "Full-finetune/Step Time": 6.738514950498939} {"Full-finetune/Learning Rate": 1.5037717348109677e-05, "Full-finetune/Loss": 0.8292298316955566, "Full-finetune/Loss (Raw)": 1.0354607105255127, "Full-finetune/Step": 1829, "Full-finetune/Step Time": 6.752827387303114} {"Full-finetune/Learning Rate": 1.5032335003923994e-05, "Full-finetune/Loss": 0.8295766115188599, "Full-finetune/Loss (Raw)": 0.9749366044998169, "Full-finetune/Step": 1830, "Full-finetune/Step Time": 6.76459470950067} {"Full-finetune/Learning Rate": 1.5026950706787346e-05, "Full-finetune/Loss": 0.8309959173202515, "Full-finetune/Loss (Raw)": 0.8322001099586487, "Full-finetune/Step": 1831, "Full-finetune/Step Time": 6.75025893189013} {"Full-finetune/Learning Rate": 1.502156445878927e-05, "Full-finetune/Loss": 0.8358421921730042, "Full-finetune/Loss (Raw)": 0.967383861541748, "Full-finetune/Step": 1832, "Full-finetune/Step Time": 6.735588015988469} {"Full-finetune/Learning Rate": 1.5016176262020069e-05, "Full-finetune/Loss": 0.8349775671958923, "Full-finetune/Loss (Raw)": 0.7365387082099915, "Full-finetune/Step": 1833, "Full-finetune/Step Time": 6.7438893634825945} {"Full-finetune/Learning Rate": 1.5010786118570791e-05, "Full-finetune/Loss": 0.8354564905166626, "Full-finetune/Loss (Raw)": 0.9696376323699951, "Full-finetune/Step": 1834, "Full-finetune/Step Time": 6.742930736392736} {"Full-finetune/Learning Rate": 1.5005394030533246e-05, "Full-finetune/Loss": 0.8355396389961243, "Full-finetune/Loss (Raw)": 0.8869408965110779, "Full-finetune/Step": 1835, "Full-finetune/Step Time": 6.752391593530774} {"Full-finetune/Learning Rate": 1.5000000000000002e-05, "Full-finetune/Loss": 0.8358513116836548, "Full-finetune/Loss (Raw)": 0.8938828110694885, "Full-finetune/Step": 1836, "Full-finetune/Step Time": 6.747768081724644} {"Full-finetune/Learning Rate": 1.4994604029064372e-05, "Full-finetune/Loss": 0.834753692150116, "Full-finetune/Loss (Raw)": 0.8307091593742371, "Full-finetune/Step": 1837, "Full-finetune/Step Time": 6.749766455963254} {"Full-finetune/Learning Rate": 1.4989206119820432e-05, "Full-finetune/Loss": 0.8349075317382812, "Full-finetune/Loss (Raw)": 0.8584511280059814, "Full-finetune/Step": 1838, "Full-finetune/Step Time": 6.74254042096436} {"Full-finetune/Learning Rate": 1.4983806274363005e-05, "Full-finetune/Loss": 0.8350880146026611, "Full-finetune/Loss (Raw)": 0.8951244950294495, "Full-finetune/Step": 1839, "Full-finetune/Step Time": 6.735337818041444} {"Full-finetune/Learning Rate": 1.497840449478766e-05, "Full-finetune/Loss": 0.8337289094924927, "Full-finetune/Loss (Raw)": 0.8379644155502319, "Full-finetune/Step": 1840, "Full-finetune/Step Time": 6.734861150383949} {"Full-finetune/Learning Rate": 1.4973000783190728e-05, "Full-finetune/Loss": 0.8326600790023804, "Full-finetune/Loss (Raw)": 0.7704598903656006, "Full-finetune/Step": 1841, "Full-finetune/Step Time": 6.7376472894102335} {"Full-finetune/Learning Rate": 1.4967595141669278e-05, "Full-finetune/Loss": 0.8330208659172058, "Full-finetune/Loss (Raw)": 0.9444214105606079, "Full-finetune/Step": 1842, "Full-finetune/Step Time": 6.736053250730038} {"Full-finetune/Learning Rate": 1.4962187572321143e-05, "Full-finetune/Loss": 0.834719181060791, "Full-finetune/Loss (Raw)": 0.8566681146621704, "Full-finetune/Step": 1843, "Full-finetune/Step Time": 6.731366192921996} {"Full-finetune/Learning Rate": 1.4956778077244884e-05, "Full-finetune/Loss": 0.8343206644058228, "Full-finetune/Loss (Raw)": 0.8202962875366211, "Full-finetune/Step": 1844, "Full-finetune/Step Time": 6.742450408637524} {"Full-finetune/Learning Rate": 1.4951366658539832e-05, "Full-finetune/Loss": 0.8332083821296692, "Full-finetune/Loss (Raw)": 0.7502414584159851, "Full-finetune/Step": 1845, "Full-finetune/Step Time": 6.73702752776444} {"Full-finetune/Learning Rate": 1.4945953318306044e-05, "Full-finetune/Loss": 0.8335800170898438, "Full-finetune/Loss (Raw)": 0.9598207473754883, "Full-finetune/Step": 1846, "Full-finetune/Step Time": 6.738761829212308} {"Full-finetune/Learning Rate": 1.4940538058644332e-05, "Full-finetune/Loss": 0.8339320421218872, "Full-finetune/Loss (Raw)": 0.8655092716217041, "Full-finetune/Step": 1847, "Full-finetune/Step Time": 6.747233368456364} {"Full-finetune/Learning Rate": 1.4935120881656263e-05, "Full-finetune/Loss": 0.833233118057251, "Full-finetune/Loss (Raw)": 0.8700429797172546, "Full-finetune/Step": 1848, "Full-finetune/Step Time": 6.739697135984898} {"Full-finetune/Learning Rate": 1.4929701789444122e-05, "Full-finetune/Loss": 0.8336973786354065, "Full-finetune/Loss (Raw)": 0.9750056862831116, "Full-finetune/Step": 1849, "Full-finetune/Step Time": 6.73409603908658} {"Full-finetune/Learning Rate": 1.4924280784110965e-05, "Full-finetune/Loss": 0.8342959880828857, "Full-finetune/Loss (Raw)": 0.9373449683189392, "Full-finetune/Step": 1850, "Full-finetune/Step Time": 6.740281879901886} {"Full-finetune/Learning Rate": 1.4918857867760571e-05, "Full-finetune/Loss": 0.8328225016593933, "Full-finetune/Loss (Raw)": 0.6519694328308105, "Full-finetune/Step": 1851, "Full-finetune/Step Time": 6.7433488089591265} {"Full-finetune/Learning Rate": 1.4913433042497473e-05, "Full-finetune/Loss": 0.8335285186767578, "Full-finetune/Loss (Raw)": 0.8915033936500549, "Full-finetune/Step": 1852, "Full-finetune/Step Time": 6.744127858430147} {"Full-finetune/Learning Rate": 1.4908006310426942e-05, "Full-finetune/Loss": 0.8340290784835815, "Full-finetune/Loss (Raw)": 0.9011383652687073, "Full-finetune/Step": 1853, "Full-finetune/Step Time": 6.744320224970579} {"Full-finetune/Learning Rate": 1.4902577673654977e-05, "Full-finetune/Loss": 0.8349189758300781, "Full-finetune/Loss (Raw)": 0.8951240181922913, "Full-finetune/Step": 1854, "Full-finetune/Step Time": 6.737708942964673} {"Full-finetune/Learning Rate": 1.4897147134288334e-05, "Full-finetune/Loss": 0.8352832794189453, "Full-finetune/Loss (Raw)": 0.9021657705307007, "Full-finetune/Step": 1855, "Full-finetune/Step Time": 6.722774865105748} {"Full-finetune/Learning Rate": 1.4891714694434495e-05, "Full-finetune/Loss": 0.835555374622345, "Full-finetune/Loss (Raw)": 0.9914214015007019, "Full-finetune/Step": 1856, "Full-finetune/Step Time": 6.721868274733424} {"Full-finetune/Learning Rate": 1.4886280356201688e-05, "Full-finetune/Loss": 0.8344857096672058, "Full-finetune/Loss (Raw)": 0.7483972311019897, "Full-finetune/Step": 1857, "Full-finetune/Step Time": 6.756456647068262} {"Full-finetune/Learning Rate": 1.4880844121698872e-05, "Full-finetune/Loss": 0.8350487947463989, "Full-finetune/Loss (Raw)": 0.8240178227424622, "Full-finetune/Step": 1858, "Full-finetune/Step Time": 6.764464335516095} {"Full-finetune/Learning Rate": 1.487540599303574e-05, "Full-finetune/Loss": 0.8345758318901062, "Full-finetune/Loss (Raw)": 0.96680748462677, "Full-finetune/Step": 1859, "Full-finetune/Step Time": 6.75865657068789} {"Full-finetune/Learning Rate": 1.4869965972322728e-05, "Full-finetune/Loss": 0.8327999114990234, "Full-finetune/Loss (Raw)": 0.7118409872055054, "Full-finetune/Step": 1860, "Full-finetune/Step Time": 6.74699817225337} {"Full-finetune/Learning Rate": 1.4864524061670999e-05, "Full-finetune/Loss": 0.8321879506111145, "Full-finetune/Loss (Raw)": 0.7907589077949524, "Full-finetune/Step": 1861, "Full-finetune/Step Time": 6.74717054516077} {"Full-finetune/Learning Rate": 1.4859080263192456e-05, "Full-finetune/Loss": 0.8312511444091797, "Full-finetune/Loss (Raw)": 0.7770589590072632, "Full-finetune/Step": 1862, "Full-finetune/Step Time": 6.7314875312149525} {"Full-finetune/Learning Rate": 1.4853634578999728e-05, "Full-finetune/Loss": 0.8305369019508362, "Full-finetune/Loss (Raw)": 0.7375593781471252, "Full-finetune/Step": 1863, "Full-finetune/Step Time": 6.731097154319286} {"Full-finetune/Learning Rate": 1.4848187011206177e-05, "Full-finetune/Loss": 0.8295969367027283, "Full-finetune/Loss (Raw)": 0.7494726777076721, "Full-finetune/Step": 1864, "Full-finetune/Step Time": 6.7353151105344296} {"Full-finetune/Learning Rate": 1.4842737561925901e-05, "Full-finetune/Loss": 0.830464243888855, "Full-finetune/Loss (Raw)": 0.8991225957870483, "Full-finetune/Step": 1865, "Full-finetune/Step Time": 6.738674042746425} {"Full-finetune/Learning Rate": 1.4837286233273722e-05, "Full-finetune/Loss": 0.8350563049316406, "Full-finetune/Loss (Raw)": 0.9388588666915894, "Full-finetune/Step": 1866, "Full-finetune/Step Time": 6.7326964773237705} {"Full-finetune/Learning Rate": 1.48318330273652e-05, "Full-finetune/Loss": 0.8361832499504089, "Full-finetune/Loss (Raw)": 0.9711726307868958, "Full-finetune/Step": 1867, "Full-finetune/Step Time": 6.738940740004182} {"Full-finetune/Learning Rate": 1.4826377946316611e-05, "Full-finetune/Loss": 0.836092472076416, "Full-finetune/Loss (Raw)": 0.7462220191955566, "Full-finetune/Step": 1868, "Full-finetune/Step Time": 6.749819966033101} {"Full-finetune/Learning Rate": 1.4820920992244964e-05, "Full-finetune/Loss": 0.835313081741333, "Full-finetune/Loss (Raw)": 0.9423757791519165, "Full-finetune/Step": 1869, "Full-finetune/Step Time": 6.747788805514574} {"Full-finetune/Learning Rate": 1.481546216726801e-05, "Full-finetune/Loss": 0.8357910513877869, "Full-finetune/Loss (Raw)": 0.763598620891571, "Full-finetune/Step": 1870, "Full-finetune/Step Time": 6.74009482562542} {"Full-finetune/Learning Rate": 1.4810001473504194e-05, "Full-finetune/Loss": 0.835572361946106, "Full-finetune/Loss (Raw)": 0.8202798962593079, "Full-finetune/Step": 1871, "Full-finetune/Step Time": 6.753309370949864} {"Full-finetune/Learning Rate": 1.4804538913072719e-05, "Full-finetune/Loss": 0.8344948291778564, "Full-finetune/Loss (Raw)": 0.6956760287284851, "Full-finetune/Step": 1872, "Full-finetune/Step Time": 6.747971408069134} {"Full-finetune/Learning Rate": 1.479907448809349e-05, "Full-finetune/Loss": 0.8303785920143127, "Full-finetune/Loss (Raw)": 0.3588714301586151, "Full-finetune/Step": 1873, "Full-finetune/Step Time": 6.760371051728725} {"Full-finetune/Learning Rate": 1.4793608200687146e-05, "Full-finetune/Loss": 0.8298385739326477, "Full-finetune/Loss (Raw)": 0.9078772068023682, "Full-finetune/Step": 1874, "Full-finetune/Step Time": 6.772365922108293} {"Full-finetune/Learning Rate": 1.478814005297505e-05, "Full-finetune/Loss": 0.8318480253219604, "Full-finetune/Loss (Raw)": 0.6902945041656494, "Full-finetune/Step": 1875, "Full-finetune/Step Time": 6.764625642448664} {"Full-finetune/Learning Rate": 1.4782670047079275e-05, "Full-finetune/Loss": 0.8333296179771423, "Full-finetune/Loss (Raw)": 0.885719895362854, "Full-finetune/Step": 1876, "Full-finetune/Step Time": 6.751910507678986} {"Full-finetune/Learning Rate": 1.477719818512263e-05, "Full-finetune/Loss": 0.8334276676177979, "Full-finetune/Loss (Raw)": 0.8940247297286987, "Full-finetune/Step": 1877, "Full-finetune/Step Time": 6.7664636969566345} {"Full-finetune/Learning Rate": 1.4771724469228638e-05, "Full-finetune/Loss": 0.8312600255012512, "Full-finetune/Loss (Raw)": 0.6697530150413513, "Full-finetune/Step": 1878, "Full-finetune/Step Time": 6.759056106209755} {"Full-finetune/Learning Rate": 1.4766248901521539e-05, "Full-finetune/Loss": 0.8316042423248291, "Full-finetune/Loss (Raw)": 0.9577270150184631, "Full-finetune/Step": 1879, "Full-finetune/Step Time": 6.761160857975483} {"Full-finetune/Learning Rate": 1.4760771484126296e-05, "Full-finetune/Loss": 0.8286705613136292, "Full-finetune/Loss (Raw)": 0.6346790194511414, "Full-finetune/Step": 1880, "Full-finetune/Step Time": 6.782133145257831} {"Full-finetune/Learning Rate": 1.4755292219168581e-05, "Full-finetune/Loss": 0.8278349041938782, "Full-finetune/Loss (Raw)": 0.7442365884780884, "Full-finetune/Step": 1881, "Full-finetune/Step Time": 6.789521066471934} {"Full-finetune/Learning Rate": 1.4749811108774798e-05, "Full-finetune/Loss": 0.8275743722915649, "Full-finetune/Loss (Raw)": 0.8780844807624817, "Full-finetune/Step": 1882, "Full-finetune/Step Time": 6.785697089508176} {"Full-finetune/Learning Rate": 1.4744328155072058e-05, "Full-finetune/Loss": 0.8260515928268433, "Full-finetune/Loss (Raw)": 0.673254668712616, "Full-finetune/Step": 1883, "Full-finetune/Step Time": 6.793670866638422} {"Full-finetune/Learning Rate": 1.4738843360188184e-05, "Full-finetune/Loss": 0.821139395236969, "Full-finetune/Loss (Raw)": 0.3519769608974457, "Full-finetune/Step": 1884, "Full-finetune/Step Time": 6.81092588044703} {"Full-finetune/Learning Rate": 1.4733356726251722e-05, "Full-finetune/Loss": 0.8252376317977905, "Full-finetune/Loss (Raw)": 0.8834309577941895, "Full-finetune/Step": 1885, "Full-finetune/Step Time": 6.7940593753010035} {"Full-finetune/Learning Rate": 1.4727868255391924e-05, "Full-finetune/Loss": 0.827159583568573, "Full-finetune/Loss (Raw)": 1.0023471117019653, "Full-finetune/Step": 1886, "Full-finetune/Step Time": 6.798048989847302} {"Full-finetune/Learning Rate": 1.472237794973876e-05, "Full-finetune/Loss": 0.8254107236862183, "Full-finetune/Loss (Raw)": 0.7333114147186279, "Full-finetune/Step": 1887, "Full-finetune/Step Time": 6.792685676366091} {"Full-finetune/Learning Rate": 1.471688581142291e-05, "Full-finetune/Loss": 0.8232672214508057, "Full-finetune/Loss (Raw)": 0.6968950033187866, "Full-finetune/Step": 1888, "Full-finetune/Step Time": 6.797968177124858} {"Full-finetune/Learning Rate": 1.4711391842575765e-05, "Full-finetune/Loss": 0.8235378265380859, "Full-finetune/Loss (Raw)": 0.7913751006126404, "Full-finetune/Step": 1889, "Full-finetune/Step Time": 6.803887536749244} {"Full-finetune/Learning Rate": 1.4705896045329432e-05, "Full-finetune/Loss": 0.8239659667015076, "Full-finetune/Loss (Raw)": 0.8123307228088379, "Full-finetune/Step": 1890, "Full-finetune/Step Time": 6.797135215252638} {"Full-finetune/Learning Rate": 1.4700398421816714e-05, "Full-finetune/Loss": 0.8234158754348755, "Full-finetune/Loss (Raw)": 0.9190565347671509, "Full-finetune/Step": 1891, "Full-finetune/Step Time": 6.781685300171375} {"Full-finetune/Learning Rate": 1.469489897417114e-05, "Full-finetune/Loss": 0.8238556981086731, "Full-finetune/Loss (Raw)": 0.9841221570968628, "Full-finetune/Step": 1892, "Full-finetune/Step Time": 6.75222103856504} {"Full-finetune/Learning Rate": 1.468939770452693e-05, "Full-finetune/Loss": 0.8240988254547119, "Full-finetune/Loss (Raw)": 0.8132382035255432, "Full-finetune/Step": 1893, "Full-finetune/Step Time": 6.754438277333975} {"Full-finetune/Learning Rate": 1.4683894615019028e-05, "Full-finetune/Loss": 0.8228480219841003, "Full-finetune/Loss (Raw)": 0.7480380535125732, "Full-finetune/Step": 1894, "Full-finetune/Step Time": 6.746206106618047} {"Full-finetune/Learning Rate": 1.4678389707783072e-05, "Full-finetune/Loss": 0.8236598968505859, "Full-finetune/Loss (Raw)": 0.8316536545753479, "Full-finetune/Step": 1895, "Full-finetune/Step Time": 6.736334292218089} {"Full-finetune/Learning Rate": 1.4672882984955404e-05, "Full-finetune/Loss": 0.8247345089912415, "Full-finetune/Loss (Raw)": 0.8502383232116699, "Full-finetune/Step": 1896, "Full-finetune/Step Time": 6.739099197089672} {"Full-finetune/Learning Rate": 1.4667374448673081e-05, "Full-finetune/Loss": 0.8269857168197632, "Full-finetune/Loss (Raw)": 0.9779602289199829, "Full-finetune/Step": 1897, "Full-finetune/Step Time": 6.726089725270867} {"Full-finetune/Learning Rate": 1.4661864101073857e-05, "Full-finetune/Loss": 0.8267630338668823, "Full-finetune/Loss (Raw)": 0.868381679058075, "Full-finetune/Step": 1898, "Full-finetune/Step Time": 6.731481499969959} {"Full-finetune/Learning Rate": 1.465635194429619e-05, "Full-finetune/Loss": 0.8259634971618652, "Full-finetune/Loss (Raw)": 0.7118755578994751, "Full-finetune/Step": 1899, "Full-finetune/Step Time": 6.750708620995283} {"Full-finetune/Learning Rate": 1.4650837980479246e-05, "Full-finetune/Loss": 0.824730634689331, "Full-finetune/Loss (Raw)": 0.8334647417068481, "Full-finetune/Step": 1900, "Full-finetune/Step Time": 6.752935208380222} {"Full-finetune/Learning Rate": 1.4645322211762876e-05, "Full-finetune/Loss": 0.8245316743850708, "Full-finetune/Loss (Raw)": 0.7994963526725769, "Full-finetune/Step": 1901, "Full-finetune/Step Time": 6.748892722651362} {"Full-finetune/Learning Rate": 1.4639804640287652e-05, "Full-finetune/Loss": 0.8261419534683228, "Full-finetune/Loss (Raw)": 0.9505601525306702, "Full-finetune/Step": 1902, "Full-finetune/Step Time": 6.739368446171284} {"Full-finetune/Learning Rate": 1.4634285268194828e-05, "Full-finetune/Loss": 0.824643611907959, "Full-finetune/Loss (Raw)": 0.7553151845932007, "Full-finetune/Step": 1903, "Full-finetune/Step Time": 6.758679058402777} {"Full-finetune/Learning Rate": 1.462876409762637e-05, "Full-finetune/Loss": 0.8244373202323914, "Full-finetune/Loss (Raw)": 0.8276124000549316, "Full-finetune/Step": 1904, "Full-finetune/Step Time": 6.764544915407896} {"Full-finetune/Learning Rate": 1.4623241130724937e-05, "Full-finetune/Loss": 0.8201131820678711, "Full-finetune/Loss (Raw)": 0.32188549637794495, "Full-finetune/Step": 1905, "Full-finetune/Step Time": 6.78579549305141} {"Full-finetune/Learning Rate": 1.4617716369633876e-05, "Full-finetune/Loss": 0.8195390105247498, "Full-finetune/Loss (Raw)": 0.7572888135910034, "Full-finetune/Step": 1906, "Full-finetune/Step Time": 6.788256822153926} {"Full-finetune/Learning Rate": 1.461218981649725e-05, "Full-finetune/Loss": 0.8181297779083252, "Full-finetune/Loss (Raw)": 0.8620800971984863, "Full-finetune/Step": 1907, "Full-finetune/Step Time": 6.804836623370647} {"Full-finetune/Learning Rate": 1.4606661473459801e-05, "Full-finetune/Loss": 0.8179773092269897, "Full-finetune/Loss (Raw)": 0.7907907366752625, "Full-finetune/Step": 1908, "Full-finetune/Step Time": 6.803435415029526} {"Full-finetune/Learning Rate": 1.4601131342666973e-05, "Full-finetune/Loss": 0.8173127174377441, "Full-finetune/Loss (Raw)": 0.6084606647491455, "Full-finetune/Step": 1909, "Full-finetune/Step Time": 6.80466890335083} {"Full-finetune/Learning Rate": 1.45955994262649e-05, "Full-finetune/Loss": 0.817304253578186, "Full-finetune/Loss (Raw)": 0.8658588528633118, "Full-finetune/Step": 1910, "Full-finetune/Step Time": 6.807627713307738} {"Full-finetune/Learning Rate": 1.459006572640041e-05, "Full-finetune/Loss": 0.818740725517273, "Full-finetune/Loss (Raw)": 0.9144375920295715, "Full-finetune/Step": 1911, "Full-finetune/Step Time": 6.814055128023028} {"Full-finetune/Learning Rate": 1.4584530245221025e-05, "Full-finetune/Loss": 0.8172756433486938, "Full-finetune/Loss (Raw)": 0.8206648826599121, "Full-finetune/Step": 1912, "Full-finetune/Step Time": 6.80718102119863} {"Full-finetune/Learning Rate": 1.4578992984874956e-05, "Full-finetune/Loss": 0.8187263011932373, "Full-finetune/Loss (Raw)": 0.8350762724876404, "Full-finetune/Step": 1913, "Full-finetune/Step Time": 6.793768072500825} {"Full-finetune/Learning Rate": 1.457345394751111e-05, "Full-finetune/Loss": 0.8199582099914551, "Full-finetune/Loss (Raw)": 0.9942255020141602, "Full-finetune/Step": 1914, "Full-finetune/Step Time": 6.791867041960359} {"Full-finetune/Learning Rate": 1.4567913135279075e-05, "Full-finetune/Loss": 0.8217008709907532, "Full-finetune/Loss (Raw)": 0.9267640113830566, "Full-finetune/Step": 1915, "Full-finetune/Step Time": 6.814883979037404} {"Full-finetune/Learning Rate": 1.456237055032913e-05, "Full-finetune/Loss": 0.8219622373580933, "Full-finetune/Loss (Raw)": 0.8220719695091248, "Full-finetune/Step": 1916, "Full-finetune/Step Time": 6.815658014267683} {"Full-finetune/Learning Rate": 1.455682619481225e-05, "Full-finetune/Loss": 0.8256360292434692, "Full-finetune/Loss (Raw)": 0.7674235105514526, "Full-finetune/Step": 1917, "Full-finetune/Step Time": 6.791715687140822} {"Full-finetune/Learning Rate": 1.4551280070880089e-05, "Full-finetune/Loss": 0.8248553276062012, "Full-finetune/Loss (Raw)": 0.8086084127426147, "Full-finetune/Step": 1918, "Full-finetune/Step Time": 6.780632087960839} {"Full-finetune/Learning Rate": 1.4545732180684989e-05, "Full-finetune/Loss": 0.8238526582717896, "Full-finetune/Loss (Raw)": 0.8416346311569214, "Full-finetune/Step": 1919, "Full-finetune/Step Time": 6.7777663115412} {"Full-finetune/Learning Rate": 1.4540182526379976e-05, "Full-finetune/Loss": 0.8224794268608093, "Full-finetune/Loss (Raw)": 0.7409495115280151, "Full-finetune/Step": 1920, "Full-finetune/Step Time": 6.78764888830483} {"Full-finetune/Learning Rate": 1.4534631110118763e-05, "Full-finetune/Loss": 0.8243361711502075, "Full-finetune/Loss (Raw)": 0.9560777544975281, "Full-finetune/Step": 1921, "Full-finetune/Step Time": 6.772809904068708} {"Full-finetune/Learning Rate": 1.4529077934055754e-05, "Full-finetune/Loss": 0.819454550743103, "Full-finetune/Loss (Raw)": 0.3050011694431305, "Full-finetune/Step": 1922, "Full-finetune/Step Time": 6.79071275703609} {"Full-finetune/Learning Rate": 1.4523523000346012e-05, "Full-finetune/Loss": 0.8231992125511169, "Full-finetune/Loss (Raw)": 0.850908100605011, "Full-finetune/Step": 1923, "Full-finetune/Step Time": 6.773135870695114} {"Full-finetune/Learning Rate": 1.4517966311145313e-05, "Full-finetune/Loss": 0.8238959908485413, "Full-finetune/Loss (Raw)": 0.9076250791549683, "Full-finetune/Step": 1924, "Full-finetune/Step Time": 6.772493427619338} {"Full-finetune/Learning Rate": 1.4512407868610094e-05, "Full-finetune/Loss": 0.825212836265564, "Full-finetune/Loss (Raw)": 1.0163573026657104, "Full-finetune/Step": 1925, "Full-finetune/Step Time": 6.770350007340312} {"Full-finetune/Learning Rate": 1.450684767489748e-05, "Full-finetune/Loss": 0.8210092782974243, "Full-finetune/Loss (Raw)": 0.3334370255470276, "Full-finetune/Step": 1926, "Full-finetune/Step Time": 6.785114856436849} {"Full-finetune/Learning Rate": 1.4501285732165271e-05, "Full-finetune/Loss": 0.8177404999732971, "Full-finetune/Loss (Raw)": 0.39634835720062256, "Full-finetune/Step": 1927, "Full-finetune/Step Time": 6.805488316342235} {"Full-finetune/Learning Rate": 1.4495722042571946e-05, "Full-finetune/Loss": 0.8188004493713379, "Full-finetune/Loss (Raw)": 0.9493243098258972, "Full-finetune/Step": 1928, "Full-finetune/Step Time": 6.8045792151242495} {"Full-finetune/Learning Rate": 1.4490156608276674e-05, "Full-finetune/Loss": 0.817267656326294, "Full-finetune/Loss (Raw)": 0.706450343132019, "Full-finetune/Step": 1929, "Full-finetune/Step Time": 6.796870183199644} {"Full-finetune/Learning Rate": 1.4484589431439283e-05, "Full-finetune/Loss": 0.8161644339561462, "Full-finetune/Loss (Raw)": 0.6436123847961426, "Full-finetune/Step": 1930, "Full-finetune/Step Time": 6.783121405169368} {"Full-finetune/Learning Rate": 1.4479020514220285e-05, "Full-finetune/Loss": 0.8165087699890137, "Full-finetune/Loss (Raw)": 0.8905845880508423, "Full-finetune/Step": 1931, "Full-finetune/Step Time": 6.761505613103509} {"Full-finetune/Learning Rate": 1.4473449858780874e-05, "Full-finetune/Loss": 0.8147134780883789, "Full-finetune/Loss (Raw)": 0.654859185218811, "Full-finetune/Step": 1932, "Full-finetune/Step Time": 6.78444492444396} {"Full-finetune/Learning Rate": 1.4467877467282906e-05, "Full-finetune/Loss": 0.8174042105674744, "Full-finetune/Loss (Raw)": 0.8900485038757324, "Full-finetune/Step": 1933, "Full-finetune/Step Time": 6.768554696813226} {"Full-finetune/Learning Rate": 1.4462303341888925e-05, "Full-finetune/Loss": 0.8184846639633179, "Full-finetune/Loss (Raw)": 0.8935446739196777, "Full-finetune/Step": 1934, "Full-finetune/Step Time": 6.765938822180033} {"Full-finetune/Learning Rate": 1.4456727484762137e-05, "Full-finetune/Loss": 0.8189033269882202, "Full-finetune/Loss (Raw)": 0.9476096630096436, "Full-finetune/Step": 1935, "Full-finetune/Step Time": 6.782721783965826} {"Full-finetune/Learning Rate": 1.4451149898066418e-05, "Full-finetune/Loss": 0.8182647228240967, "Full-finetune/Loss (Raw)": 0.7198955416679382, "Full-finetune/Step": 1936, "Full-finetune/Step Time": 6.78977464325726} {"Full-finetune/Learning Rate": 1.4445570583966329e-05, "Full-finetune/Loss": 0.8181158900260925, "Full-finetune/Loss (Raw)": 0.8557281494140625, "Full-finetune/Step": 1937, "Full-finetune/Step Time": 6.788983242586255} {"Full-finetune/Learning Rate": 1.4439989544627085e-05, "Full-finetune/Loss": 0.8150987029075623, "Full-finetune/Loss (Raw)": 0.400200754404068, "Full-finetune/Step": 1938, "Full-finetune/Step Time": 6.801564157009125} {"Full-finetune/Learning Rate": 1.4434406782214584e-05, "Full-finetune/Loss": 0.8151357173919678, "Full-finetune/Loss (Raw)": 0.8448814749717712, "Full-finetune/Step": 1939, "Full-finetune/Step Time": 6.79729612544179} {"Full-finetune/Learning Rate": 1.4428822298895386e-05, "Full-finetune/Loss": 0.8131986856460571, "Full-finetune/Loss (Raw)": 0.47880375385284424, "Full-finetune/Step": 1940, "Full-finetune/Step Time": 6.798632329329848} {"Full-finetune/Learning Rate": 1.442323609683672e-05, "Full-finetune/Loss": 0.8130588531494141, "Full-finetune/Loss (Raw)": 0.8048669099807739, "Full-finetune/Step": 1941, "Full-finetune/Step Time": 6.798289205878973} {"Full-finetune/Learning Rate": 1.4417648178206481e-05, "Full-finetune/Loss": 0.8140591382980347, "Full-finetune/Loss (Raw)": 0.9844768643379211, "Full-finetune/Step": 1942, "Full-finetune/Step Time": 6.799961678683758} {"Full-finetune/Learning Rate": 1.4412058545173228e-05, "Full-finetune/Loss": 0.8149185180664062, "Full-finetune/Loss (Raw)": 0.9382673501968384, "Full-finetune/Step": 1943, "Full-finetune/Step Time": 6.79892935231328} {"Full-finetune/Learning Rate": 1.4406467199906194e-05, "Full-finetune/Loss": 0.8143447041511536, "Full-finetune/Loss (Raw)": 0.867764949798584, "Full-finetune/Step": 1944, "Full-finetune/Step Time": 6.804491991177201} {"Full-finetune/Learning Rate": 1.440087414457527e-05, "Full-finetune/Loss": 0.8106799125671387, "Full-finetune/Loss (Raw)": 0.3837865889072418, "Full-finetune/Step": 1945, "Full-finetune/Step Time": 6.822379531338811} {"Full-finetune/Learning Rate": 1.4395279381351008e-05, "Full-finetune/Loss": 0.8116968870162964, "Full-finetune/Loss (Raw)": 0.9073151350021362, "Full-finetune/Step": 1946, "Full-finetune/Step Time": 6.836522663012147} {"Full-finetune/Learning Rate": 1.438968291240463e-05, "Full-finetune/Loss": 0.812603235244751, "Full-finetune/Loss (Raw)": 1.0025041103363037, "Full-finetune/Step": 1947, "Full-finetune/Step Time": 6.833979234099388} {"Full-finetune/Learning Rate": 1.4384084739908016e-05, "Full-finetune/Loss": 0.8148927092552185, "Full-finetune/Loss (Raw)": 1.0319980382919312, "Full-finetune/Step": 1948, "Full-finetune/Step Time": 6.834551103413105} {"Full-finetune/Learning Rate": 1.4378484866033705e-05, "Full-finetune/Loss": 0.8156051635742188, "Full-finetune/Loss (Raw)": 0.9602472186088562, "Full-finetune/Step": 1949, "Full-finetune/Step Time": 6.812760816887021} {"Full-finetune/Learning Rate": 1.43728832929549e-05, "Full-finetune/Loss": 0.8148770332336426, "Full-finetune/Loss (Raw)": 0.9863461256027222, "Full-finetune/Step": 1950, "Full-finetune/Step Time": 6.820692270994186} {"Full-finetune/Learning Rate": 1.4367280022845462e-05, "Full-finetune/Loss": 0.8157554268836975, "Full-finetune/Loss (Raw)": 0.9638293385505676, "Full-finetune/Step": 1951, "Full-finetune/Step Time": 6.814629174768925} {"Full-finetune/Learning Rate": 1.4361675057879913e-05, "Full-finetune/Loss": 0.8183460235595703, "Full-finetune/Loss (Raw)": 0.9677459001541138, "Full-finetune/Step": 1952, "Full-finetune/Step Time": 6.810478590428829} {"Full-finetune/Learning Rate": 1.4356068400233429e-05, "Full-finetune/Loss": 0.8162829875946045, "Full-finetune/Loss (Raw)": 0.5684407949447632, "Full-finetune/Step": 1953, "Full-finetune/Step Time": 6.822530332952738} {"Full-finetune/Learning Rate": 1.435046005208184e-05, "Full-finetune/Loss": 0.8143017292022705, "Full-finetune/Loss (Raw)": 0.6260849833488464, "Full-finetune/Step": 1954, "Full-finetune/Step Time": 6.831651547923684} {"Full-finetune/Learning Rate": 1.4344850015601644e-05, "Full-finetune/Loss": 0.8137130737304688, "Full-finetune/Loss (Raw)": 0.734965980052948, "Full-finetune/Step": 1955, "Full-finetune/Step Time": 6.817537944763899} {"Full-finetune/Learning Rate": 1.4339238292969981e-05, "Full-finetune/Loss": 0.8125661611557007, "Full-finetune/Loss (Raw)": 0.7375184893608093, "Full-finetune/Step": 1956, "Full-finetune/Step Time": 6.812572598457336} {"Full-finetune/Learning Rate": 1.4333624886364655e-05, "Full-finetune/Loss": 0.8116610050201416, "Full-finetune/Loss (Raw)": 0.9196053743362427, "Full-finetune/Step": 1957, "Full-finetune/Step Time": 6.7954117357730865} {"Full-finetune/Learning Rate": 1.4328009797964115e-05, "Full-finetune/Loss": 0.8116878867149353, "Full-finetune/Loss (Raw)": 0.9783808588981628, "Full-finetune/Step": 1958, "Full-finetune/Step Time": 6.781511640176177} {"Full-finetune/Learning Rate": 1.432239302994747e-05, "Full-finetune/Loss": 0.8112292289733887, "Full-finetune/Loss (Raw)": 0.7734841704368591, "Full-finetune/Step": 1959, "Full-finetune/Step Time": 6.784220185130835} {"Full-finetune/Learning Rate": 1.431677458449448e-05, "Full-finetune/Loss": 0.8114712834358215, "Full-finetune/Loss (Raw)": 0.998369038105011, "Full-finetune/Step": 1960, "Full-finetune/Step Time": 6.789159858599305} {"Full-finetune/Learning Rate": 1.431115446378555e-05, "Full-finetune/Loss": 0.8113423585891724, "Full-finetune/Loss (Raw)": 0.7200372815132141, "Full-finetune/Step": 1961, "Full-finetune/Step Time": 6.777944000437856} {"Full-finetune/Learning Rate": 1.4305532670001743e-05, "Full-finetune/Loss": 0.8069489002227783, "Full-finetune/Loss (Raw)": 0.4072796106338501, "Full-finetune/Step": 1962, "Full-finetune/Step Time": 6.799523040652275} {"Full-finetune/Learning Rate": 1.4299909205324762e-05, "Full-finetune/Loss": 0.8030804991722107, "Full-finetune/Loss (Raw)": 0.391781210899353, "Full-finetune/Step": 1963, "Full-finetune/Step Time": 6.805537203326821} {"Full-finetune/Learning Rate": 1.4294284071936968e-05, "Full-finetune/Loss": 0.802421510219574, "Full-finetune/Loss (Raw)": 0.8095306754112244, "Full-finetune/Step": 1964, "Full-finetune/Step Time": 6.812586570158601} {"Full-finetune/Learning Rate": 1.4288657272021367e-05, "Full-finetune/Loss": 0.8010468482971191, "Full-finetune/Loss (Raw)": 0.6547585725784302, "Full-finetune/Step": 1965, "Full-finetune/Step Time": 6.811904342845082} {"Full-finetune/Learning Rate": 1.4283028807761603e-05, "Full-finetune/Loss": 0.8001997470855713, "Full-finetune/Loss (Raw)": 0.7500245571136475, "Full-finetune/Step": 1966, "Full-finetune/Step Time": 6.807478040456772} {"Full-finetune/Learning Rate": 1.4277398681341982e-05, "Full-finetune/Loss": 0.7991899251937866, "Full-finetune/Loss (Raw)": 0.7658542990684509, "Full-finetune/Step": 1967, "Full-finetune/Step Time": 6.7955270409584045} {"Full-finetune/Learning Rate": 1.4271766894947441e-05, "Full-finetune/Loss": 0.7997497916221619, "Full-finetune/Loss (Raw)": 0.909631609916687, "Full-finetune/Step": 1968, "Full-finetune/Step Time": 6.781763790175319} {"Full-finetune/Learning Rate": 1.4266133450763564e-05, "Full-finetune/Loss": 0.7972191572189331, "Full-finetune/Loss (Raw)": 0.44653934240341187, "Full-finetune/Step": 1969, "Full-finetune/Step Time": 6.798264991492033} {"Full-finetune/Learning Rate": 1.426049835097659e-05, "Full-finetune/Loss": 0.7960984706878662, "Full-finetune/Loss (Raw)": 0.8009711503982544, "Full-finetune/Step": 1970, "Full-finetune/Step Time": 6.794226111844182} {"Full-finetune/Learning Rate": 1.425486159777338e-05, "Full-finetune/Loss": 0.7925622463226318, "Full-finetune/Loss (Raw)": 0.4040331244468689, "Full-finetune/Step": 1971, "Full-finetune/Step Time": 6.798029752448201} {"Full-finetune/Learning Rate": 1.4249223193341456e-05, "Full-finetune/Loss": 0.7926856279373169, "Full-finetune/Loss (Raw)": 0.8360925912857056, "Full-finetune/Step": 1972, "Full-finetune/Step Time": 6.786329690366983} {"Full-finetune/Learning Rate": 1.4243583139868969e-05, "Full-finetune/Loss": 0.7930175065994263, "Full-finetune/Loss (Raw)": 0.792719304561615, "Full-finetune/Step": 1973, "Full-finetune/Step Time": 6.81340098939836} {"Full-finetune/Learning Rate": 1.423794143954471e-05, "Full-finetune/Loss": 0.7931751012802124, "Full-finetune/Loss (Raw)": 0.9799923896789551, "Full-finetune/Step": 1974, "Full-finetune/Step Time": 6.812792249023914} {"Full-finetune/Learning Rate": 1.4232298094558125e-05, "Full-finetune/Loss": 0.7931680679321289, "Full-finetune/Loss (Raw)": 0.8646020889282227, "Full-finetune/Step": 1975, "Full-finetune/Step Time": 6.802250221371651} {"Full-finetune/Learning Rate": 1.4226653107099273e-05, "Full-finetune/Loss": 0.793084979057312, "Full-finetune/Loss (Raw)": 0.8594160676002502, "Full-finetune/Step": 1976, "Full-finetune/Step Time": 6.8051880821585655} {"Full-finetune/Learning Rate": 1.422100647935887e-05, "Full-finetune/Loss": 0.7924278974533081, "Full-finetune/Loss (Raw)": 0.8908920288085938, "Full-finetune/Step": 1977, "Full-finetune/Step Time": 6.81345040909946} {"Full-finetune/Learning Rate": 1.421535821352826e-05, "Full-finetune/Loss": 0.7927405834197998, "Full-finetune/Loss (Raw)": 0.9773780107498169, "Full-finetune/Step": 1978, "Full-finetune/Step Time": 6.807179968804121} {"Full-finetune/Learning Rate": 1.4209708311799424e-05, "Full-finetune/Loss": 0.7906114459037781, "Full-finetune/Loss (Raw)": 0.37943413853645325, "Full-finetune/Step": 1979, "Full-finetune/Step Time": 6.80331508629024} {"Full-finetune/Learning Rate": 1.4204056776364985e-05, "Full-finetune/Loss": 0.7889179587364197, "Full-finetune/Loss (Raw)": 0.6747406721115112, "Full-finetune/Step": 1980, "Full-finetune/Step Time": 6.8175752107053995} {"Full-finetune/Learning Rate": 1.4198403609418184e-05, "Full-finetune/Loss": 0.7887240648269653, "Full-finetune/Loss (Raw)": 0.8763214349746704, "Full-finetune/Step": 1981, "Full-finetune/Step Time": 6.818887988105416} {"Full-finetune/Learning Rate": 1.419274881315291e-05, "Full-finetune/Loss": 0.7884987592697144, "Full-finetune/Loss (Raw)": 0.8662907481193542, "Full-finetune/Step": 1982, "Full-finetune/Step Time": 6.827254552394152} {"Full-finetune/Learning Rate": 1.418709238976368e-05, "Full-finetune/Loss": 0.7878744602203369, "Full-finetune/Loss (Raw)": 0.8222510814666748, "Full-finetune/Step": 1983, "Full-finetune/Step Time": 6.8252571653574705} {"Full-finetune/Learning Rate": 1.4181434341445634e-05, "Full-finetune/Loss": 0.7880396246910095, "Full-finetune/Loss (Raw)": 1.0125596523284912, "Full-finetune/Step": 1984, "Full-finetune/Step Time": 6.836798766627908} {"Full-finetune/Learning Rate": 1.4175774670394561e-05, "Full-finetune/Loss": 0.7896122932434082, "Full-finetune/Loss (Raw)": 0.9497004151344299, "Full-finetune/Step": 1985, "Full-finetune/Step Time": 6.799387581646442} {"Full-finetune/Learning Rate": 1.4170113378806862e-05, "Full-finetune/Loss": 0.7913259863853455, "Full-finetune/Loss (Raw)": 1.0433677434921265, "Full-finetune/Step": 1986, "Full-finetune/Step Time": 6.7906675562262535} {"Full-finetune/Learning Rate": 1.4164450468879578e-05, "Full-finetune/Loss": 0.7901518940925598, "Full-finetune/Loss (Raw)": 0.8165210485458374, "Full-finetune/Step": 1987, "Full-finetune/Step Time": 6.817779589444399} {"Full-finetune/Learning Rate": 1.4158785942810367e-05, "Full-finetune/Loss": 0.7909131050109863, "Full-finetune/Loss (Raw)": 0.8092835545539856, "Full-finetune/Step": 1988, "Full-finetune/Step Time": 6.827061768621206} {"Full-finetune/Learning Rate": 1.4153119802797526e-05, "Full-finetune/Loss": 0.791818380355835, "Full-finetune/Loss (Raw)": 0.9066298604011536, "Full-finetune/Step": 1989, "Full-finetune/Step Time": 6.829184807837009} {"Full-finetune/Learning Rate": 1.4147452051039974e-05, "Full-finetune/Loss": 0.7927137613296509, "Full-finetune/Loss (Raw)": 0.8916750550270081, "Full-finetune/Step": 1990, "Full-finetune/Step Time": 6.840223902836442} {"Full-finetune/Learning Rate": 1.4141782689737252e-05, "Full-finetune/Loss": 0.7925918102264404, "Full-finetune/Loss (Raw)": 0.7219404578208923, "Full-finetune/Step": 1991, "Full-finetune/Step Time": 6.845955589786172} {"Full-finetune/Learning Rate": 1.413611172108953e-05, "Full-finetune/Loss": 0.7935075759887695, "Full-finetune/Loss (Raw)": 0.8666878342628479, "Full-finetune/Step": 1992, "Full-finetune/Step Time": 6.8420567605644464} {"Full-finetune/Learning Rate": 1.41304391472976e-05, "Full-finetune/Loss": 0.792108952999115, "Full-finetune/Loss (Raw)": 0.7201042771339417, "Full-finetune/Step": 1993, "Full-finetune/Step Time": 6.846133420243859} {"Full-finetune/Learning Rate": 1.4124764970562874e-05, "Full-finetune/Loss": 0.7899341583251953, "Full-finetune/Loss (Raw)": 0.6604810953140259, "Full-finetune/Step": 1994, "Full-finetune/Step Time": 6.843400817364454} {"Full-finetune/Learning Rate": 1.4119089193087396e-05, "Full-finetune/Loss": 0.7879451513290405, "Full-finetune/Loss (Raw)": 0.7165829539299011, "Full-finetune/Step": 1995, "Full-finetune/Step Time": 6.847303863614798} {"Full-finetune/Learning Rate": 1.4113411817073818e-05, "Full-finetune/Loss": 0.787942111492157, "Full-finetune/Loss (Raw)": 0.7458372712135315, "Full-finetune/Step": 1996, "Full-finetune/Step Time": 6.826119789853692} {"Full-finetune/Learning Rate": 1.4107732844725424e-05, "Full-finetune/Loss": 0.7881221771240234, "Full-finetune/Loss (Raw)": 0.9654210805892944, "Full-finetune/Step": 1997, "Full-finetune/Step Time": 6.8283278699964285} {"Full-finetune/Learning Rate": 1.4102052278246107e-05, "Full-finetune/Loss": 0.7883895635604858, "Full-finetune/Loss (Raw)": 0.7978309392929077, "Full-finetune/Step": 1998, "Full-finetune/Step Time": 6.83941088244319} {"Full-finetune/Learning Rate": 1.4096370119840389e-05, "Full-finetune/Loss": 0.7852010726928711, "Full-finetune/Loss (Raw)": 0.41214659810066223, "Full-finetune/Step": 1999, "Full-finetune/Step Time": 6.827807083725929} {"Full-finetune/Learning Rate": 1.4090686371713403e-05, "Full-finetune/Loss": 0.7849148511886597, "Full-finetune/Loss (Raw)": 0.6590366363525391, "Full-finetune/Step": 2000, "Full-finetune/Step Time": 6.851186387240887} {"Full-finetune/Learning Rate": 1.4085001036070896e-05, "Full-finetune/Loss": 0.7888481616973877, "Full-finetune/Loss (Raw)": 0.86234450340271, "Full-finetune/Step": 2001, "Full-finetune/Step Time": 6.837832694873214} {"Full-finetune/Learning Rate": 1.4079314115119242e-05, "Full-finetune/Loss": 0.788414716720581, "Full-finetune/Loss (Raw)": 0.8523836731910706, "Full-finetune/Step": 2002, "Full-finetune/Step Time": 6.824957847595215} {"Full-finetune/Learning Rate": 1.4073625611065422e-05, "Full-finetune/Loss": 0.7891699075698853, "Full-finetune/Loss (Raw)": 0.7869626879692078, "Full-finetune/Step": 2003, "Full-finetune/Step Time": 6.8241846319288015} {"Full-finetune/Learning Rate": 1.4067935526117033e-05, "Full-finetune/Loss": 0.7885791063308716, "Full-finetune/Loss (Raw)": 0.8101009130477905, "Full-finetune/Step": 2004, "Full-finetune/Step Time": 6.829197369515896} {"Full-finetune/Learning Rate": 1.4062243862482286e-05, "Full-finetune/Loss": 0.7877253293991089, "Full-finetune/Loss (Raw)": 0.7847433090209961, "Full-finetune/Step": 2005, "Full-finetune/Step Time": 6.812768684700131} {"Full-finetune/Learning Rate": 1.4056550622370004e-05, "Full-finetune/Loss": 0.7888176441192627, "Full-finetune/Loss (Raw)": 0.809568464756012, "Full-finetune/Step": 2006, "Full-finetune/Step Time": 6.80269449390471} {"Full-finetune/Learning Rate": 1.4050855807989626e-05, "Full-finetune/Loss": 0.7896526455879211, "Full-finetune/Loss (Raw)": 1.0646083354949951, "Full-finetune/Step": 2007, "Full-finetune/Step Time": 6.792039107531309} {"Full-finetune/Learning Rate": 1.4045159421551191e-05, "Full-finetune/Loss": 0.7910451889038086, "Full-finetune/Loss (Raw)": 0.8129199147224426, "Full-finetune/Step": 2008, "Full-finetune/Step Time": 6.776791190728545} {"Full-finetune/Learning Rate": 1.4039461465265362e-05, "Full-finetune/Loss": 0.7914304733276367, "Full-finetune/Loss (Raw)": 0.7935581803321838, "Full-finetune/Step": 2009, "Full-finetune/Step Time": 6.776414534077048} {"Full-finetune/Learning Rate": 1.4033761941343403e-05, "Full-finetune/Loss": 0.791817307472229, "Full-finetune/Loss (Raw)": 0.9275931119918823, "Full-finetune/Step": 2010, "Full-finetune/Step Time": 6.776267766952515} {"Full-finetune/Learning Rate": 1.4028060851997183e-05, "Full-finetune/Loss": 0.7946151494979858, "Full-finetune/Loss (Raw)": 1.0313806533813477, "Full-finetune/Step": 2011, "Full-finetune/Step Time": 6.769979799166322} {"Full-finetune/Learning Rate": 1.4022358199439193e-05, "Full-finetune/Loss": 0.7984727621078491, "Full-finetune/Loss (Raw)": 0.8457504510879517, "Full-finetune/Step": 2012, "Full-finetune/Step Time": 6.7494584210217} {"Full-finetune/Learning Rate": 1.4016653985882512e-05, "Full-finetune/Loss": 0.798529863357544, "Full-finetune/Loss (Raw)": 0.8907420635223389, "Full-finetune/Step": 2013, "Full-finetune/Step Time": 6.765537453815341} {"Full-finetune/Learning Rate": 1.4010948213540838e-05, "Full-finetune/Loss": 0.79604172706604, "Full-finetune/Loss (Raw)": 0.6838594675064087, "Full-finetune/Step": 2014, "Full-finetune/Step Time": 6.7745629493147135} {"Full-finetune/Learning Rate": 1.4005240884628473e-05, "Full-finetune/Loss": 0.7933698892593384, "Full-finetune/Loss (Raw)": 0.3913223147392273, "Full-finetune/Step": 2015, "Full-finetune/Step Time": 6.79127736762166} {"Full-finetune/Learning Rate": 1.3999532001360309e-05, "Full-finetune/Loss": 0.7910481095314026, "Full-finetune/Loss (Raw)": 0.3997043967247009, "Full-finetune/Step": 2016, "Full-finetune/Step Time": 6.805568801239133} {"Full-finetune/Learning Rate": 1.3993821565951868e-05, "Full-finetune/Loss": 0.7903404235839844, "Full-finetune/Loss (Raw)": 0.7007961273193359, "Full-finetune/Step": 2017, "Full-finetune/Step Time": 6.810632629320025} {"Full-finetune/Learning Rate": 1.3988109580619244e-05, "Full-finetune/Loss": 0.7910146713256836, "Full-finetune/Loss (Raw)": 0.8986306190490723, "Full-finetune/Step": 2018, "Full-finetune/Step Time": 6.811771290376782} {"Full-finetune/Learning Rate": 1.3982396047579156e-05, "Full-finetune/Loss": 0.7899699211120605, "Full-finetune/Loss (Raw)": 0.7853262424468994, "Full-finetune/Step": 2019, "Full-finetune/Step Time": 6.818828329443932} {"Full-finetune/Learning Rate": 1.3976680969048912e-05, "Full-finetune/Loss": 0.7891597151756287, "Full-finetune/Loss (Raw)": 0.8804160356521606, "Full-finetune/Step": 2020, "Full-finetune/Step Time": 6.821460140869021} {"Full-finetune/Learning Rate": 1.3970964347246419e-05, "Full-finetune/Loss": 0.7889350652694702, "Full-finetune/Loss (Raw)": 0.7844899296760559, "Full-finetune/Step": 2021, "Full-finetune/Step Time": 6.806959662586451} {"Full-finetune/Learning Rate": 1.3965246184390193e-05, "Full-finetune/Loss": 0.7895509004592896, "Full-finetune/Loss (Raw)": 0.82685387134552, "Full-finetune/Step": 2022, "Full-finetune/Step Time": 6.813828187063336} {"Full-finetune/Learning Rate": 1.3959526482699335e-05, "Full-finetune/Loss": 0.7881020307540894, "Full-finetune/Loss (Raw)": 0.6462038159370422, "Full-finetune/Step": 2023, "Full-finetune/Step Time": 6.838126264512539} {"Full-finetune/Learning Rate": 1.3953805244393554e-05, "Full-finetune/Loss": 0.787639856338501, "Full-finetune/Loss (Raw)": 0.7910813093185425, "Full-finetune/Step": 2024, "Full-finetune/Step Time": 6.837472781538963} {"Full-finetune/Learning Rate": 1.394808247169315e-05, "Full-finetune/Loss": 0.7860448360443115, "Full-finetune/Loss (Raw)": 0.7738019227981567, "Full-finetune/Step": 2025, "Full-finetune/Step Time": 6.848916949704289} {"Full-finetune/Learning Rate": 1.3942358166819016e-05, "Full-finetune/Loss": 0.7863568067550659, "Full-finetune/Loss (Raw)": 0.9083040356636047, "Full-finetune/Step": 2026, "Full-finetune/Step Time": 6.83529644086957} {"Full-finetune/Learning Rate": 1.3936632331992648e-05, "Full-finetune/Loss": 0.7871289849281311, "Full-finetune/Loss (Raw)": 0.8107179403305054, "Full-finetune/Step": 2027, "Full-finetune/Step Time": 6.814924914389849} {"Full-finetune/Learning Rate": 1.3930904969436125e-05, "Full-finetune/Loss": 0.7873345613479614, "Full-finetune/Loss (Raw)": 0.8597776293754578, "Full-finetune/Step": 2028, "Full-finetune/Step Time": 6.829013602808118} {"Full-finetune/Learning Rate": 1.3925176081372129e-05, "Full-finetune/Loss": 0.7881788611412048, "Full-finetune/Loss (Raw)": 0.9075697660446167, "Full-finetune/Step": 2029, "Full-finetune/Step Time": 6.822577053681016} {"Full-finetune/Learning Rate": 1.3919445670023933e-05, "Full-finetune/Loss": 0.7834054827690125, "Full-finetune/Loss (Raw)": 0.33956271409988403, "Full-finetune/Step": 2030, "Full-finetune/Step Time": 6.834853725507855} {"Full-finetune/Learning Rate": 1.3913713737615387e-05, "Full-finetune/Loss": 0.7838438749313354, "Full-finetune/Loss (Raw)": 0.8114383816719055, "Full-finetune/Step": 2031, "Full-finetune/Step Time": 6.814316421747208} {"Full-finetune/Learning Rate": 1.3907980286370952e-05, "Full-finetune/Loss": 0.7848016023635864, "Full-finetune/Loss (Raw)": 0.9501961469650269, "Full-finetune/Step": 2032, "Full-finetune/Step Time": 6.809558182954788} {"Full-finetune/Learning Rate": 1.3902245318515661e-05, "Full-finetune/Loss": 0.7889732122421265, "Full-finetune/Loss (Raw)": 0.855855405330658, "Full-finetune/Step": 2033, "Full-finetune/Step Time": 6.794389925897121} {"Full-finetune/Learning Rate": 1.389650883627515e-05, "Full-finetune/Loss": 0.7906472086906433, "Full-finetune/Loss (Raw)": 0.9715561866760254, "Full-finetune/Step": 2034, "Full-finetune/Step Time": 6.782539084553719} {"Full-finetune/Learning Rate": 1.3890770841875632e-05, "Full-finetune/Loss": 0.7890796661376953, "Full-finetune/Loss (Raw)": 0.6614410877227783, "Full-finetune/Step": 2035, "Full-finetune/Step Time": 6.7910560965538025} {"Full-finetune/Learning Rate": 1.388503133754391e-05, "Full-finetune/Loss": 0.7897387742996216, "Full-finetune/Loss (Raw)": 0.875153124332428, "Full-finetune/Step": 2036, "Full-finetune/Step Time": 6.804302528500557} {"Full-finetune/Learning Rate": 1.3879290325507378e-05, "Full-finetune/Loss": 0.7914513945579529, "Full-finetune/Loss (Raw)": 0.8276760578155518, "Full-finetune/Step": 2037, "Full-finetune/Step Time": 6.819236077368259} {"Full-finetune/Learning Rate": 1.3873547807994e-05, "Full-finetune/Loss": 0.7899899482727051, "Full-finetune/Loss (Raw)": 0.6787850260734558, "Full-finetune/Step": 2038, "Full-finetune/Step Time": 6.821548022329807} {"Full-finetune/Learning Rate": 1.386780378723235e-05, "Full-finetune/Loss": 0.7903361320495605, "Full-finetune/Loss (Raw)": 0.9587580561637878, "Full-finetune/Step": 2039, "Full-finetune/Step Time": 6.815204838290811} {"Full-finetune/Learning Rate": 1.3862058265451561e-05, "Full-finetune/Loss": 0.7908047437667847, "Full-finetune/Loss (Raw)": 0.8806398510932922, "Full-finetune/Step": 2040, "Full-finetune/Step Time": 6.814356315881014} {"Full-finetune/Learning Rate": 1.385631124488136e-05, "Full-finetune/Loss": 0.7911771535873413, "Full-finetune/Loss (Raw)": 0.8827484846115112, "Full-finetune/Step": 2041, "Full-finetune/Step Time": 6.855923105031252} {"Full-finetune/Learning Rate": 1.385056272775205e-05, "Full-finetune/Loss": 0.7892763614654541, "Full-finetune/Loss (Raw)": 0.7509220242500305, "Full-finetune/Step": 2042, "Full-finetune/Step Time": 6.8568594846874475} {"Full-finetune/Learning Rate": 1.3844812716294523e-05, "Full-finetune/Loss": 0.7887675166130066, "Full-finetune/Loss (Raw)": 0.8616364002227783, "Full-finetune/Step": 2043, "Full-finetune/Step Time": 6.836678214371204} {"Full-finetune/Learning Rate": 1.3839061212740244e-05, "Full-finetune/Loss": 0.7891944050788879, "Full-finetune/Loss (Raw)": 0.8767136931419373, "Full-finetune/Step": 2044, "Full-finetune/Step Time": 6.84594801068306} {"Full-finetune/Learning Rate": 1.383330821932126e-05, "Full-finetune/Loss": 0.7901308536529541, "Full-finetune/Loss (Raw)": 0.8872824311256409, "Full-finetune/Step": 2045, "Full-finetune/Step Time": 6.866637608036399} {"Full-finetune/Learning Rate": 1.3827553738270196e-05, "Full-finetune/Loss": 0.7913852334022522, "Full-finetune/Loss (Raw)": 0.9691727161407471, "Full-finetune/Step": 2046, "Full-finetune/Step Time": 6.87609550729394} {"Full-finetune/Learning Rate": 1.382179777182025e-05, "Full-finetune/Loss": 0.7921061515808105, "Full-finetune/Loss (Raw)": 0.9339128732681274, "Full-finetune/Step": 2047, "Full-finetune/Step Time": 6.878602512180805} {"Full-finetune/Learning Rate": 1.3816040322205206e-05, "Full-finetune/Loss": 0.7919650077819824, "Full-finetune/Loss (Raw)": 0.7228884696960449, "Full-finetune/Step": 2048, "Full-finetune/Step Time": 6.867173057049513} {"Full-finetune/Learning Rate": 1.3810281391659414e-05, "Full-finetune/Loss": 0.7888223528862, "Full-finetune/Loss (Raw)": 0.5538091659545898, "Full-finetune/Step": 2049, "Full-finetune/Step Time": 6.880869645625353} {"Full-finetune/Learning Rate": 1.3804520982417802e-05, "Full-finetune/Loss": 0.7917926907539368, "Full-finetune/Loss (Raw)": 0.6852114200592041, "Full-finetune/Step": 2050, "Full-finetune/Step Time": 6.874096792191267} {"Full-finetune/Learning Rate": 1.3798759096715877e-05, "Full-finetune/Loss": 0.7928856611251831, "Full-finetune/Loss (Raw)": 0.9908076524734497, "Full-finetune/Step": 2051, "Full-finetune/Step Time": 6.877208702266216} {"Full-finetune/Learning Rate": 1.379299573678971e-05, "Full-finetune/Loss": 0.7931503057479858, "Full-finetune/Loss (Raw)": 0.9414926767349243, "Full-finetune/Step": 2052, "Full-finetune/Step Time": 6.888099912554026} {"Full-finetune/Learning Rate": 1.3787230904875947e-05, "Full-finetune/Loss": 0.7921754121780396, "Full-finetune/Loss (Raw)": 0.8915715217590332, "Full-finetune/Step": 2053, "Full-finetune/Step Time": 6.888779532164335} {"Full-finetune/Learning Rate": 1.3781464603211811e-05, "Full-finetune/Loss": 0.7970056533813477, "Full-finetune/Loss (Raw)": 0.9517103433609009, "Full-finetune/Step": 2054, "Full-finetune/Step Time": 6.871824756264687} {"Full-finetune/Learning Rate": 1.3775696834035088e-05, "Full-finetune/Loss": 0.800990104675293, "Full-finetune/Loss (Raw)": 0.9063629508018494, "Full-finetune/Step": 2055, "Full-finetune/Step Time": 6.867535283789039} {"Full-finetune/Learning Rate": 1.3769927599584141e-05, "Full-finetune/Loss": 0.8008253574371338, "Full-finetune/Loss (Raw)": 0.928234875202179, "Full-finetune/Step": 2056, "Full-finetune/Step Time": 6.856636803597212} {"Full-finetune/Learning Rate": 1.376415690209789e-05, "Full-finetune/Loss": 0.801180362701416, "Full-finetune/Loss (Raw)": 0.7518860101699829, "Full-finetune/Step": 2057, "Full-finetune/Step Time": 6.864028433337808} {"Full-finetune/Learning Rate": 1.3758384743815838e-05, "Full-finetune/Loss": 0.8021162748336792, "Full-finetune/Loss (Raw)": 0.763411819934845, "Full-finetune/Step": 2058, "Full-finetune/Step Time": 6.874403053894639} {"Full-finetune/Learning Rate": 1.3752611126978045e-05, "Full-finetune/Loss": 0.8012309074401855, "Full-finetune/Loss (Raw)": 0.7772653102874756, "Full-finetune/Step": 2059, "Full-finetune/Step Time": 6.87479211948812} {"Full-finetune/Learning Rate": 1.3746836053825133e-05, "Full-finetune/Loss": 0.8022562861442566, "Full-finetune/Loss (Raw)": 0.7861014008522034, "Full-finetune/Step": 2060, "Full-finetune/Step Time": 6.845143375918269} {"Full-finetune/Learning Rate": 1.3741059526598299e-05, "Full-finetune/Loss": 0.8025786876678467, "Full-finetune/Loss (Raw)": 0.9313075542449951, "Full-finetune/Step": 2061, "Full-finetune/Step Time": 6.843503037467599} {"Full-finetune/Learning Rate": 1.3735281547539304e-05, "Full-finetune/Loss": 0.8017507195472717, "Full-finetune/Loss (Raw)": 0.7875709533691406, "Full-finetune/Step": 2062, "Full-finetune/Step Time": 6.832132006064057} {"Full-finetune/Learning Rate": 1.3729502118890463e-05, "Full-finetune/Loss": 0.8015328645706177, "Full-finetune/Loss (Raw)": 0.9197248816490173, "Full-finetune/Step": 2063, "Full-finetune/Step Time": 6.813156824558973} {"Full-finetune/Learning Rate": 1.3723721242894663e-05, "Full-finetune/Loss": 0.8016781210899353, "Full-finetune/Loss (Raw)": 0.7384880185127258, "Full-finetune/Step": 2064, "Full-finetune/Step Time": 6.8279964979738} {"Full-finetune/Learning Rate": 1.3717938921795347e-05, "Full-finetune/Loss": 0.8013371229171753, "Full-finetune/Loss (Raw)": 0.8120801448822021, "Full-finetune/Step": 2065, "Full-finetune/Step Time": 6.835633305832744} {"Full-finetune/Learning Rate": 1.3712155157836522e-05, "Full-finetune/Loss": 0.8008212447166443, "Full-finetune/Loss (Raw)": 0.3341674506664276, "Full-finetune/Step": 2066, "Full-finetune/Step Time": 6.835901213809848} {"Full-finetune/Learning Rate": 1.3706369953262754e-05, "Full-finetune/Loss": 0.8006905913352966, "Full-finetune/Loss (Raw)": 0.8281595706939697, "Full-finetune/Step": 2067, "Full-finetune/Step Time": 6.84714531712234} {"Full-finetune/Learning Rate": 1.3700583310319171e-05, "Full-finetune/Loss": 0.8035494089126587, "Full-finetune/Loss (Raw)": 0.8447306752204895, "Full-finetune/Step": 2068, "Full-finetune/Step Time": 6.8359039686620235} {"Full-finetune/Learning Rate": 1.3694795231251453e-05, "Full-finetune/Loss": 0.8038367629051208, "Full-finetune/Loss (Raw)": 0.8416483402252197, "Full-finetune/Step": 2069, "Full-finetune/Step Time": 6.831115372478962} {"Full-finetune/Learning Rate": 1.368900571830584e-05, "Full-finetune/Loss": 0.7999863028526306, "Full-finetune/Loss (Raw)": 0.49161720275878906, "Full-finetune/Step": 2070, "Full-finetune/Step Time": 6.8431134931743145} {"Full-finetune/Learning Rate": 1.3683214773729123e-05, "Full-finetune/Loss": 0.7995961308479309, "Full-finetune/Loss (Raw)": 0.8883243799209595, "Full-finetune/Step": 2071, "Full-finetune/Step Time": 6.849407570436597} {"Full-finetune/Learning Rate": 1.3677422399768667e-05, "Full-finetune/Loss": 0.8002429008483887, "Full-finetune/Loss (Raw)": 0.9505605101585388, "Full-finetune/Step": 2072, "Full-finetune/Step Time": 6.84009656868875} {"Full-finetune/Learning Rate": 1.3671628598672373e-05, "Full-finetune/Loss": 0.8029754757881165, "Full-finetune/Loss (Raw)": 0.7335490584373474, "Full-finetune/Step": 2073, "Full-finetune/Step Time": 6.832213992252946} {"Full-finetune/Learning Rate": 1.3665833372688702e-05, "Full-finetune/Loss": 0.8032780885696411, "Full-finetune/Loss (Raw)": 0.9460490942001343, "Full-finetune/Step": 2074, "Full-finetune/Step Time": 6.821747036650777} {"Full-finetune/Learning Rate": 1.366003672406667e-05, "Full-finetune/Loss": 0.8015674352645874, "Full-finetune/Loss (Raw)": 0.7835407853126526, "Full-finetune/Step": 2075, "Full-finetune/Step Time": 6.8217412903904915} {"Full-finetune/Learning Rate": 1.3654238655055836e-05, "Full-finetune/Loss": 0.7988751530647278, "Full-finetune/Loss (Raw)": 0.6873886585235596, "Full-finetune/Step": 2076, "Full-finetune/Step Time": 6.834617791697383} {"Full-finetune/Learning Rate": 1.364843916790633e-05, "Full-finetune/Loss": 0.7975858449935913, "Full-finetune/Loss (Raw)": 0.7952160239219666, "Full-finetune/Step": 2077, "Full-finetune/Step Time": 6.834370771422982} {"Full-finetune/Learning Rate": 1.3642638264868808e-05, "Full-finetune/Loss": 0.795805811882019, "Full-finetune/Loss (Raw)": 0.7584973573684692, "Full-finetune/Step": 2078, "Full-finetune/Step Time": 6.8237561993300915} {"Full-finetune/Learning Rate": 1.3636835948194494e-05, "Full-finetune/Loss": 0.794403076171875, "Full-finetune/Loss (Raw)": 0.7842832803726196, "Full-finetune/Step": 2079, "Full-finetune/Step Time": 6.818350572139025} {"Full-finetune/Learning Rate": 1.3631032220135152e-05, "Full-finetune/Loss": 0.792431116104126, "Full-finetune/Loss (Raw)": 0.7153371572494507, "Full-finetune/Step": 2080, "Full-finetune/Step Time": 6.826015263795853} {"Full-finetune/Learning Rate": 1.3625227082943093e-05, "Full-finetune/Loss": 0.7943333983421326, "Full-finetune/Loss (Raw)": 0.8119336366653442, "Full-finetune/Step": 2081, "Full-finetune/Step Time": 6.825259802863002} {"Full-finetune/Learning Rate": 1.361942053887118e-05, "Full-finetune/Loss": 0.7956867218017578, "Full-finetune/Loss (Raw)": 0.7993077039718628, "Full-finetune/Step": 2082, "Full-finetune/Step Time": 6.812320051714778} {"Full-finetune/Learning Rate": 1.361361259017282e-05, "Full-finetune/Loss": 0.7968941926956177, "Full-finetune/Loss (Raw)": 0.8895230293273926, "Full-finetune/Step": 2083, "Full-finetune/Step Time": 6.794863605871797} {"Full-finetune/Learning Rate": 1.3607803239101965e-05, "Full-finetune/Loss": 0.7989031076431274, "Full-finetune/Loss (Raw)": 0.9946563243865967, "Full-finetune/Step": 2084, "Full-finetune/Step Time": 6.79002227820456} {"Full-finetune/Learning Rate": 1.360199248791311e-05, "Full-finetune/Loss": 0.7941452264785767, "Full-finetune/Loss (Raw)": 0.3105979859828949, "Full-finetune/Step": 2085, "Full-finetune/Step Time": 6.808742221444845} {"Full-finetune/Learning Rate": 1.359618033886129e-05, "Full-finetune/Loss": 0.793499767780304, "Full-finetune/Loss (Raw)": 0.8957598805427551, "Full-finetune/Step": 2086, "Full-finetune/Step Time": 6.813826911151409} {"Full-finetune/Learning Rate": 1.359036679420209e-05, "Full-finetune/Loss": 0.7949918508529663, "Full-finetune/Loss (Raw)": 0.9644759893417358, "Full-finetune/Step": 2087, "Full-finetune/Step Time": 6.803575681522489} {"Full-finetune/Learning Rate": 1.3584551856191635e-05, "Full-finetune/Loss": 0.7943376302719116, "Full-finetune/Loss (Raw)": 0.9146296381950378, "Full-finetune/Step": 2088, "Full-finetune/Step Time": 6.794615186750889} {"Full-finetune/Learning Rate": 1.3578735527086585e-05, "Full-finetune/Loss": 0.7954073548316956, "Full-finetune/Loss (Raw)": 0.8569543957710266, "Full-finetune/Step": 2089, "Full-finetune/Step Time": 6.789244303479791} {"Full-finetune/Learning Rate": 1.357291780914415e-05, "Full-finetune/Loss": 0.7942237854003906, "Full-finetune/Loss (Raw)": 0.25578054785728455, "Full-finetune/Step": 2090, "Full-finetune/Step Time": 6.789552543312311} {"Full-finetune/Learning Rate": 1.3567098704622064e-05, "Full-finetune/Loss": 0.797158420085907, "Full-finetune/Loss (Raw)": 0.7674224376678467, "Full-finetune/Step": 2091, "Full-finetune/Step Time": 6.7740601524710655} {"Full-finetune/Learning Rate": 1.3561278215778618e-05, "Full-finetune/Loss": 0.7976874113082886, "Full-finetune/Loss (Raw)": 0.87724369764328, "Full-finetune/Step": 2092, "Full-finetune/Step Time": 6.761229507625103} {"Full-finetune/Learning Rate": 1.355545634487262e-05, "Full-finetune/Loss": 0.7997497320175171, "Full-finetune/Loss (Raw)": 0.918738603591919, "Full-finetune/Step": 2093, "Full-finetune/Step Time": 6.758681109175086} {"Full-finetune/Learning Rate": 1.354963309416343e-05, "Full-finetune/Loss": 0.8015137910842896, "Full-finetune/Loss (Raw)": 0.9758176207542419, "Full-finetune/Step": 2094, "Full-finetune/Step Time": 6.759485449641943} {"Full-finetune/Learning Rate": 1.3543808465910938e-05, "Full-finetune/Loss": 0.8021283149719238, "Full-finetune/Loss (Raw)": 0.8445090651512146, "Full-finetune/Step": 2095, "Full-finetune/Step Time": 6.774072729051113} {"Full-finetune/Learning Rate": 1.3537982462375566e-05, "Full-finetune/Loss": 0.8014201521873474, "Full-finetune/Loss (Raw)": 0.8189900517463684, "Full-finetune/Step": 2096, "Full-finetune/Step Time": 6.776532037183642} {"Full-finetune/Learning Rate": 1.3532155085818276e-05, "Full-finetune/Loss": 0.8049423694610596, "Full-finetune/Loss (Raw)": 0.897390604019165, "Full-finetune/Step": 2097, "Full-finetune/Step Time": 6.767161114141345} {"Full-finetune/Learning Rate": 1.3526326338500553e-05, "Full-finetune/Loss": 0.8046985864639282, "Full-finetune/Loss (Raw)": 0.7697635889053345, "Full-finetune/Step": 2098, "Full-finetune/Step Time": 6.785664930939674} {"Full-finetune/Learning Rate": 1.3520496222684424e-05, "Full-finetune/Loss": 0.8043141961097717, "Full-finetune/Loss (Raw)": 0.3548315763473511, "Full-finetune/Step": 2099, "Full-finetune/Step Time": 6.78703286126256} {"Full-finetune/Learning Rate": 1.3514664740632446e-05, "Full-finetune/Loss": 0.8029663562774658, "Full-finetune/Loss (Raw)": 0.6635657548904419, "Full-finetune/Step": 2100, "Full-finetune/Step Time": 6.792641473934054} {"Full-finetune/Learning Rate": 1.3508831894607696e-05, "Full-finetune/Loss": 0.803973376750946, "Full-finetune/Loss (Raw)": 0.9216237664222717, "Full-finetune/Step": 2101, "Full-finetune/Step Time": 6.756826542317867} {"Full-finetune/Learning Rate": 1.3502997686873797e-05, "Full-finetune/Loss": 0.8025552034378052, "Full-finetune/Loss (Raw)": 0.7984617352485657, "Full-finetune/Step": 2102, "Full-finetune/Step Time": 6.759825706481934} {"Full-finetune/Learning Rate": 1.3497162119694883e-05, "Full-finetune/Loss": 0.7986850738525391, "Full-finetune/Loss (Raw)": 0.3692275583744049, "Full-finetune/Step": 2103, "Full-finetune/Step Time": 6.780625008046627} {"Full-finetune/Learning Rate": 1.3491325195335627e-05, "Full-finetune/Loss": 0.7982742786407471, "Full-finetune/Loss (Raw)": 0.8068288564682007, "Full-finetune/Step": 2104, "Full-finetune/Step Time": 6.78736050054431} {"Full-finetune/Learning Rate": 1.3485486916061228e-05, "Full-finetune/Loss": 0.7978777885437012, "Full-finetune/Loss (Raw)": 0.840145468711853, "Full-finetune/Step": 2105, "Full-finetune/Step Time": 6.79744609259069} {"Full-finetune/Learning Rate": 1.3479647284137398e-05, "Full-finetune/Loss": 0.7969646453857422, "Full-finetune/Loss (Raw)": 0.8604899048805237, "Full-finetune/Step": 2106, "Full-finetune/Step Time": 6.796300729736686} {"Full-finetune/Learning Rate": 1.3473806301830398e-05, "Full-finetune/Loss": 0.8008114099502563, "Full-finetune/Loss (Raw)": 0.8718262314796448, "Full-finetune/Step": 2107, "Full-finetune/Step Time": 6.776026492938399} {"Full-finetune/Learning Rate": 1.346796397140699e-05, "Full-finetune/Loss": 0.801598072052002, "Full-finetune/Loss (Raw)": 0.7754245400428772, "Full-finetune/Step": 2108, "Full-finetune/Step Time": 6.763184929266572} {"Full-finetune/Learning Rate": 1.3462120295134476e-05, "Full-finetune/Loss": 0.8016687035560608, "Full-finetune/Loss (Raw)": 0.8853694796562195, "Full-finetune/Step": 2109, "Full-finetune/Step Time": 6.765792841091752} {"Full-finetune/Learning Rate": 1.3456275275280661e-05, "Full-finetune/Loss": 0.8010702133178711, "Full-finetune/Loss (Raw)": 0.7896866798400879, "Full-finetune/Step": 2110, "Full-finetune/Step Time": 6.773633565753698} {"Full-finetune/Learning Rate": 1.3450428914113892e-05, "Full-finetune/Loss": 0.8008078336715698, "Full-finetune/Loss (Raw)": 0.788658618927002, "Full-finetune/Step": 2111, "Full-finetune/Step Time": 6.789048841223121} {"Full-finetune/Learning Rate": 1.3444581213903026e-05, "Full-finetune/Loss": 0.7964963912963867, "Full-finetune/Loss (Raw)": 0.46070384979248047, "Full-finetune/Step": 2112, "Full-finetune/Step Time": 6.797299966216087} {"Full-finetune/Learning Rate": 1.3438732176917437e-05, "Full-finetune/Loss": 0.7956010103225708, "Full-finetune/Loss (Raw)": 0.835085391998291, "Full-finetune/Step": 2113, "Full-finetune/Step Time": 6.795107692480087} {"Full-finetune/Learning Rate": 1.3432881805427032e-05, "Full-finetune/Loss": 0.7946032285690308, "Full-finetune/Loss (Raw)": 0.9156485199928284, "Full-finetune/Step": 2114, "Full-finetune/Step Time": 6.822600670158863} {"Full-finetune/Learning Rate": 1.3427030101702215e-05, "Full-finetune/Loss": 0.795315146446228, "Full-finetune/Loss (Raw)": 0.9076506495475769, "Full-finetune/Step": 2115, "Full-finetune/Step Time": 6.798800094053149} {"Full-finetune/Learning Rate": 1.3421177068013925e-05, "Full-finetune/Loss": 0.7922003269195557, "Full-finetune/Loss (Raw)": 0.4105875492095947, "Full-finetune/Step": 2116, "Full-finetune/Step Time": 6.803552130237222} {"Full-finetune/Learning Rate": 1.3415322706633606e-05, "Full-finetune/Loss": 0.7903919816017151, "Full-finetune/Loss (Raw)": 0.6751630306243896, "Full-finetune/Step": 2117, "Full-finetune/Step Time": 6.819176947697997} {"Full-finetune/Learning Rate": 1.3409467019833223e-05, "Full-finetune/Loss": 0.7893648147583008, "Full-finetune/Loss (Raw)": 0.7602035403251648, "Full-finetune/Step": 2118, "Full-finetune/Step Time": 6.8046982660889626} {"Full-finetune/Learning Rate": 1.3403610009885258e-05, "Full-finetune/Loss": 0.7896037697792053, "Full-finetune/Loss (Raw)": 0.7525202035903931, "Full-finetune/Step": 2119, "Full-finetune/Step Time": 6.807362345978618} {"Full-finetune/Learning Rate": 1.3397751679062692e-05, "Full-finetune/Loss": 0.7853862047195435, "Full-finetune/Loss (Raw)": 0.32683461904525757, "Full-finetune/Step": 2120, "Full-finetune/Step Time": 6.826156750321388} {"Full-finetune/Learning Rate": 1.3391892029639037e-05, "Full-finetune/Loss": 0.7864562273025513, "Full-finetune/Loss (Raw)": 0.8570689558982849, "Full-finetune/Step": 2121, "Full-finetune/Step Time": 6.817636851221323} {"Full-finetune/Learning Rate": 1.3386031063888309e-05, "Full-finetune/Loss": 0.788383424282074, "Full-finetune/Loss (Raw)": 0.9071648120880127, "Full-finetune/Step": 2122, "Full-finetune/Step Time": 6.810971295461059} {"Full-finetune/Learning Rate": 1.3380168784085028e-05, "Full-finetune/Loss": 0.789574384689331, "Full-finetune/Loss (Raw)": 0.8690246939659119, "Full-finetune/Step": 2123, "Full-finetune/Step Time": 6.802069418132305} {"Full-finetune/Learning Rate": 1.337430519250424e-05, "Full-finetune/Loss": 0.7905358076095581, "Full-finetune/Loss (Raw)": 0.8689041137695312, "Full-finetune/Step": 2124, "Full-finetune/Step Time": 6.798673750832677} {"Full-finetune/Learning Rate": 1.3368440291421475e-05, "Full-finetune/Loss": 0.7897698283195496, "Full-finetune/Loss (Raw)": 0.867367148399353, "Full-finetune/Step": 2125, "Full-finetune/Step Time": 6.810832463204861} {"Full-finetune/Learning Rate": 1.3362574083112804e-05, "Full-finetune/Loss": 0.7907281517982483, "Full-finetune/Loss (Raw)": 0.9205051064491272, "Full-finetune/Step": 2126, "Full-finetune/Step Time": 6.807884406298399} {"Full-finetune/Learning Rate": 1.3356706569854778e-05, "Full-finetune/Loss": 0.7942451238632202, "Full-finetune/Loss (Raw)": 0.8623190522193909, "Full-finetune/Step": 2127, "Full-finetune/Step Time": 6.790546951815486} {"Full-finetune/Learning Rate": 1.3350837753924466e-05, "Full-finetune/Loss": 0.791843593120575, "Full-finetune/Loss (Raw)": 0.3516368269920349, "Full-finetune/Step": 2128, "Full-finetune/Step Time": 6.788826365023851} {"Full-finetune/Learning Rate": 1.3344967637599445e-05, "Full-finetune/Loss": 0.7872710227966309, "Full-finetune/Loss (Raw)": 0.2770504653453827, "Full-finetune/Step": 2129, "Full-finetune/Step Time": 6.80225713737309} {"Full-finetune/Learning Rate": 1.3339096223157782e-05, "Full-finetune/Loss": 0.7873602509498596, "Full-finetune/Loss (Raw)": 0.8638100624084473, "Full-finetune/Step": 2130, "Full-finetune/Step Time": 6.801493627950549} {"Full-finetune/Learning Rate": 1.3333223512878068e-05, "Full-finetune/Loss": 0.7884542942047119, "Full-finetune/Loss (Raw)": 0.9269974231719971, "Full-finetune/Step": 2131, "Full-finetune/Step Time": 6.79113232344389} {"Full-finetune/Learning Rate": 1.3327349509039387e-05, "Full-finetune/Loss": 0.7883849740028381, "Full-finetune/Loss (Raw)": 0.8012320399284363, "Full-finetune/Step": 2132, "Full-finetune/Step Time": 6.794381571933627} {"Full-finetune/Learning Rate": 1.3321474213921317e-05, "Full-finetune/Loss": 0.7906796336174011, "Full-finetune/Loss (Raw)": 1.0784562826156616, "Full-finetune/Step": 2133, "Full-finetune/Step Time": 6.791199816390872} {"Full-finetune/Learning Rate": 1.3315597629803959e-05, "Full-finetune/Loss": 0.7902369499206543, "Full-finetune/Loss (Raw)": 0.7529025673866272, "Full-finetune/Step": 2134, "Full-finetune/Step Time": 6.801604492589831} {"Full-finetune/Learning Rate": 1.3309719758967885e-05, "Full-finetune/Loss": 0.7879042625427246, "Full-finetune/Loss (Raw)": 0.7660349607467651, "Full-finetune/Step": 2135, "Full-finetune/Step Time": 6.797251656651497} {"Full-finetune/Learning Rate": 1.3303840603694192e-05, "Full-finetune/Loss": 0.7882636785507202, "Full-finetune/Loss (Raw)": 0.8589189052581787, "Full-finetune/Step": 2136, "Full-finetune/Step Time": 6.789159031584859} {"Full-finetune/Learning Rate": 1.3297960166264462e-05, "Full-finetune/Loss": 0.7854006290435791, "Full-finetune/Loss (Raw)": 0.4270907938480377, "Full-finetune/Step": 2137, "Full-finetune/Step Time": 6.798602281138301} {"Full-finetune/Learning Rate": 1.3292078448960778e-05, "Full-finetune/Loss": 0.7849230766296387, "Full-finetune/Loss (Raw)": 0.8664576411247253, "Full-finetune/Step": 2138, "Full-finetune/Step Time": 6.795840058475733} {"Full-finetune/Learning Rate": 1.3286195454065726e-05, "Full-finetune/Loss": 0.782719612121582, "Full-finetune/Loss (Raw)": 0.7493429780006409, "Full-finetune/Step": 2139, "Full-finetune/Step Time": 6.809860737994313} {"Full-finetune/Learning Rate": 1.3280311183862371e-05, "Full-finetune/Loss": 0.783206582069397, "Full-finetune/Loss (Raw)": 0.9080849885940552, "Full-finetune/Step": 2140, "Full-finetune/Step Time": 6.812680389732122} {"Full-finetune/Learning Rate": 1.3274425640634287e-05, "Full-finetune/Loss": 0.7839552760124207, "Full-finetune/Loss (Raw)": 0.9865711331367493, "Full-finetune/Step": 2141, "Full-finetune/Step Time": 6.798516986891627} {"Full-finetune/Learning Rate": 1.3268538826665544e-05, "Full-finetune/Loss": 0.784813642501831, "Full-finetune/Loss (Raw)": 0.7937358617782593, "Full-finetune/Step": 2142, "Full-finetune/Step Time": 6.786517499014735} {"Full-finetune/Learning Rate": 1.326265074424069e-05, "Full-finetune/Loss": 0.7882533073425293, "Full-finetune/Loss (Raw)": 0.8315989971160889, "Full-finetune/Step": 2143, "Full-finetune/Step Time": 6.783186474815011} {"Full-finetune/Learning Rate": 1.3256761395644787e-05, "Full-finetune/Loss": 0.7914605140686035, "Full-finetune/Loss (Raw)": 0.8102245926856995, "Full-finetune/Step": 2144, "Full-finetune/Step Time": 6.774618472903967} {"Full-finetune/Learning Rate": 1.3250870783163363e-05, "Full-finetune/Loss": 0.7901993989944458, "Full-finetune/Loss (Raw)": 0.539373517036438, "Full-finetune/Step": 2145, "Full-finetune/Step Time": 6.774083754047751} {"Full-finetune/Learning Rate": 1.3244978909082457e-05, "Full-finetune/Loss": 0.7898463010787964, "Full-finetune/Loss (Raw)": 0.8534265756607056, "Full-finetune/Step": 2146, "Full-finetune/Step Time": 6.7883134093135595} {"Full-finetune/Learning Rate": 1.3239085775688591e-05, "Full-finetune/Loss": 0.7894174456596375, "Full-finetune/Loss (Raw)": 0.7304372787475586, "Full-finetune/Step": 2147, "Full-finetune/Step Time": 6.789285959675908} {"Full-finetune/Learning Rate": 1.3233191385268771e-05, "Full-finetune/Loss": 0.7901910543441772, "Full-finetune/Loss (Raw)": 0.9794414639472961, "Full-finetune/Step": 2148, "Full-finetune/Step Time": 6.7855358719825745} {"Full-finetune/Learning Rate": 1.3227295740110502e-05, "Full-finetune/Loss": 0.791064977645874, "Full-finetune/Loss (Raw)": 0.8963491916656494, "Full-finetune/Step": 2149, "Full-finetune/Step Time": 6.774859823286533} {"Full-finetune/Learning Rate": 1.3221398842501758e-05, "Full-finetune/Loss": 0.7908821105957031, "Full-finetune/Loss (Raw)": 0.803448498249054, "Full-finetune/Step": 2150, "Full-finetune/Step Time": 6.772024724632502} {"Full-finetune/Learning Rate": 1.321550069473102e-05, "Full-finetune/Loss": 0.7930880784988403, "Full-finetune/Loss (Raw)": 0.9285663366317749, "Full-finetune/Step": 2151, "Full-finetune/Step Time": 6.764481073245406} {"Full-finetune/Learning Rate": 1.3209601299087238e-05, "Full-finetune/Loss": 0.7927756905555725, "Full-finetune/Loss (Raw)": 0.7510979771614075, "Full-finetune/Step": 2152, "Full-finetune/Step Time": 6.77981430478394} {"Full-finetune/Learning Rate": 1.3203700657859855e-05, "Full-finetune/Loss": 0.793046772480011, "Full-finetune/Loss (Raw)": 0.8084995746612549, "Full-finetune/Step": 2153, "Full-finetune/Step Time": 6.769264807924628} {"Full-finetune/Learning Rate": 1.3197798773338793e-05, "Full-finetune/Loss": 0.7914155721664429, "Full-finetune/Loss (Raw)": 0.6995051503181458, "Full-finetune/Step": 2154, "Full-finetune/Step Time": 6.778004437685013} {"Full-finetune/Learning Rate": 1.3191895647814457e-05, "Full-finetune/Loss": 0.7915737628936768, "Full-finetune/Loss (Raw)": 0.8309687972068787, "Full-finetune/Step": 2155, "Full-finetune/Step Time": 6.784092443063855} {"Full-finetune/Learning Rate": 1.318599128357774e-05, "Full-finetune/Loss": 0.7901660203933716, "Full-finetune/Loss (Raw)": 0.6795858144760132, "Full-finetune/Step": 2156, "Full-finetune/Step Time": 6.778289360925555} {"Full-finetune/Learning Rate": 1.3180085682920005e-05, "Full-finetune/Loss": 0.7888643741607666, "Full-finetune/Loss (Raw)": 0.740961492061615, "Full-finetune/Step": 2157, "Full-finetune/Step Time": 6.786731343716383} {"Full-finetune/Learning Rate": 1.31741788481331e-05, "Full-finetune/Loss": 0.7932702302932739, "Full-finetune/Loss (Raw)": 0.9035063982009888, "Full-finetune/Step": 2158, "Full-finetune/Step Time": 6.76716891862452} {"Full-finetune/Learning Rate": 1.316827078150936e-05, "Full-finetune/Loss": 0.7936896085739136, "Full-finetune/Loss (Raw)": 0.8651235103607178, "Full-finetune/Step": 2159, "Full-finetune/Step Time": 6.791882302612066} {"Full-finetune/Learning Rate": 1.316236148534158e-05, "Full-finetune/Loss": 0.7926411032676697, "Full-finetune/Loss (Raw)": 0.8159886598587036, "Full-finetune/Step": 2160, "Full-finetune/Step Time": 6.786863444373012} {"Full-finetune/Learning Rate": 1.3156450961923051e-05, "Full-finetune/Loss": 0.7919426560401917, "Full-finetune/Loss (Raw)": 0.7664549946784973, "Full-finetune/Step": 2161, "Full-finetune/Step Time": 6.780724668875337} {"Full-finetune/Learning Rate": 1.3150539213547528e-05, "Full-finetune/Loss": 0.7901958227157593, "Full-finetune/Loss (Raw)": 0.747955858707428, "Full-finetune/Step": 2162, "Full-finetune/Step Time": 6.784085551276803} {"Full-finetune/Learning Rate": 1.3144626242509243e-05, "Full-finetune/Loss": 0.7912566661834717, "Full-finetune/Loss (Raw)": 0.7972369194030762, "Full-finetune/Step": 2163, "Full-finetune/Step Time": 6.768182680010796} {"Full-finetune/Learning Rate": 1.3138712051102908e-05, "Full-finetune/Loss": 0.7918980121612549, "Full-finetune/Loss (Raw)": 0.9572404623031616, "Full-finetune/Step": 2164, "Full-finetune/Step Time": 6.75370323471725} {"Full-finetune/Learning Rate": 1.3132796641623703e-05, "Full-finetune/Loss": 0.7918844223022461, "Full-finetune/Loss (Raw)": 0.8259366750717163, "Full-finetune/Step": 2165, "Full-finetune/Step Time": 6.7620405331254005} {"Full-finetune/Learning Rate": 1.3126880016367287e-05, "Full-finetune/Loss": 0.7936785221099854, "Full-finetune/Loss (Raw)": 0.9084364175796509, "Full-finetune/Step": 2166, "Full-finetune/Step Time": 6.7613261397928} {"Full-finetune/Learning Rate": 1.3120962177629783e-05, "Full-finetune/Loss": 0.7933582663536072, "Full-finetune/Loss (Raw)": 0.9177592992782593, "Full-finetune/Step": 2167, "Full-finetune/Step Time": 6.7607487216591835} {"Full-finetune/Learning Rate": 1.311504312770779e-05, "Full-finetune/Loss": 0.7927690744400024, "Full-finetune/Loss (Raw)": 0.8052210807800293, "Full-finetune/Step": 2168, "Full-finetune/Step Time": 6.759036643430591} {"Full-finetune/Learning Rate": 1.3109122868898374e-05, "Full-finetune/Loss": 0.792769730091095, "Full-finetune/Loss (Raw)": 0.8828323483467102, "Full-finetune/Step": 2169, "Full-finetune/Step Time": 6.7173646204173565} {"Full-finetune/Learning Rate": 1.310320140349907e-05, "Full-finetune/Loss": 0.7925044298171997, "Full-finetune/Loss (Raw)": 0.7169657349586487, "Full-finetune/Step": 2170, "Full-finetune/Step Time": 6.728421188890934} {"Full-finetune/Learning Rate": 1.3097278733807892e-05, "Full-finetune/Loss": 0.7913855314254761, "Full-finetune/Loss (Raw)": 0.7184207439422607, "Full-finetune/Step": 2171, "Full-finetune/Step Time": 6.727325143292546} {"Full-finetune/Learning Rate": 1.3091354862123304e-05, "Full-finetune/Loss": 0.7913128137588501, "Full-finetune/Loss (Raw)": 0.8674032688140869, "Full-finetune/Step": 2172, "Full-finetune/Step Time": 6.717113422229886} {"Full-finetune/Learning Rate": 1.3085429790744248e-05, "Full-finetune/Loss": 0.7890911102294922, "Full-finetune/Loss (Raw)": 0.6029016971588135, "Full-finetune/Step": 2173, "Full-finetune/Step Time": 6.711491411551833} {"Full-finetune/Learning Rate": 1.3079503521970127e-05, "Full-finetune/Loss": 0.7862805724143982, "Full-finetune/Loss (Raw)": 0.6094250082969666, "Full-finetune/Step": 2174, "Full-finetune/Step Time": 6.714088125154376} {"Full-finetune/Learning Rate": 1.3073576058100815e-05, "Full-finetune/Loss": 0.7849581241607666, "Full-finetune/Loss (Raw)": 0.7646398544311523, "Full-finetune/Step": 2175, "Full-finetune/Step Time": 6.729823440313339} {"Full-finetune/Learning Rate": 1.3067647401436636e-05, "Full-finetune/Loss": 0.7865087985992432, "Full-finetune/Loss (Raw)": 0.9213773012161255, "Full-finetune/Step": 2176, "Full-finetune/Step Time": 6.729681001976132} {"Full-finetune/Learning Rate": 1.3061717554278393e-05, "Full-finetune/Loss": 0.7892748117446899, "Full-finetune/Loss (Raw)": 0.9078602194786072, "Full-finetune/Step": 2177, "Full-finetune/Step Time": 6.719435468316078} {"Full-finetune/Learning Rate": 1.3055786518927342e-05, "Full-finetune/Loss": 0.789522647857666, "Full-finetune/Loss (Raw)": 0.7169275283813477, "Full-finetune/Step": 2178, "Full-finetune/Step Time": 6.707317491993308} {"Full-finetune/Learning Rate": 1.3049854297685206e-05, "Full-finetune/Loss": 0.7879747152328491, "Full-finetune/Loss (Raw)": 0.792673647403717, "Full-finetune/Step": 2179, "Full-finetune/Step Time": 6.717344436794519} {"Full-finetune/Learning Rate": 1.3043920892854155e-05, "Full-finetune/Loss": 0.7874883413314819, "Full-finetune/Loss (Raw)": 0.8792374730110168, "Full-finetune/Step": 2180, "Full-finetune/Step Time": 6.71153081022203} {"Full-finetune/Learning Rate": 1.3037986306736839e-05, "Full-finetune/Loss": 0.7875588536262512, "Full-finetune/Loss (Raw)": 0.9005972743034363, "Full-finetune/Step": 2181, "Full-finetune/Step Time": 6.710517195984721} {"Full-finetune/Learning Rate": 1.3032050541636343e-05, "Full-finetune/Loss": 0.7873918414115906, "Full-finetune/Loss (Raw)": 0.930338978767395, "Full-finetune/Step": 2182, "Full-finetune/Step Time": 6.714296882972121} {"Full-finetune/Learning Rate": 1.3026113599856229e-05, "Full-finetune/Loss": 0.7856184244155884, "Full-finetune/Loss (Raw)": 0.6793571710586548, "Full-finetune/Step": 2183, "Full-finetune/Step Time": 6.720038421452045} {"Full-finetune/Learning Rate": 1.302017548370051e-05, "Full-finetune/Loss": 0.783765971660614, "Full-finetune/Loss (Raw)": 0.6911234855651855, "Full-finetune/Step": 2184, "Full-finetune/Step Time": 6.735623283311725} {"Full-finetune/Learning Rate": 1.3014236195473649e-05, "Full-finetune/Loss": 0.7846881151199341, "Full-finetune/Loss (Raw)": 0.8699163198471069, "Full-finetune/Step": 2185, "Full-finetune/Step Time": 6.722919218242168} {"Full-finetune/Learning Rate": 1.3008295737480567e-05, "Full-finetune/Loss": 0.7851425409317017, "Full-finetune/Loss (Raw)": 0.821586012840271, "Full-finetune/Step": 2186, "Full-finetune/Step Time": 6.708788430318236} {"Full-finetune/Learning Rate": 1.300235411202664e-05, "Full-finetune/Loss": 0.7834427356719971, "Full-finetune/Loss (Raw)": 0.5596846342086792, "Full-finetune/Step": 2187, "Full-finetune/Step Time": 6.752999568358064} {"Full-finetune/Learning Rate": 1.2996411321417699e-05, "Full-finetune/Loss": 0.7834134101867676, "Full-finetune/Loss (Raw)": 0.7823541164398193, "Full-finetune/Step": 2188, "Full-finetune/Step Time": 6.786351019516587} {"Full-finetune/Learning Rate": 1.2990467367960027e-05, "Full-finetune/Loss": 0.7814358472824097, "Full-finetune/Loss (Raw)": 0.6781806945800781, "Full-finetune/Step": 2189, "Full-finetune/Step Time": 6.794324053451419} {"Full-finetune/Learning Rate": 1.298452225396035e-05, "Full-finetune/Loss": 0.7806592583656311, "Full-finetune/Loss (Raw)": 0.6881605386734009, "Full-finetune/Step": 2190, "Full-finetune/Step Time": 6.8037970662117} {"Full-finetune/Learning Rate": 1.2978575981725858e-05, "Full-finetune/Loss": 0.7797856330871582, "Full-finetune/Loss (Raw)": 0.8079104423522949, "Full-finetune/Step": 2191, "Full-finetune/Step Time": 6.819214405491948} {"Full-finetune/Learning Rate": 1.2972628553564178e-05, "Full-finetune/Loss": 0.7792673707008362, "Full-finetune/Loss (Raw)": 0.6721411943435669, "Full-finetune/Step": 2192, "Full-finetune/Step Time": 6.800898987799883} {"Full-finetune/Learning Rate": 1.2966679971783387e-05, "Full-finetune/Loss": 0.7799972295761108, "Full-finetune/Loss (Raw)": 0.9055007100105286, "Full-finetune/Step": 2193, "Full-finetune/Step Time": 6.796307509765029} {"Full-finetune/Learning Rate": 1.2960730238692023e-05, "Full-finetune/Loss": 0.7838408946990967, "Full-finetune/Loss (Raw)": 0.8261590600013733, "Full-finetune/Step": 2194, "Full-finetune/Step Time": 6.780682481825352} {"Full-finetune/Learning Rate": 1.2954779356599056e-05, "Full-finetune/Loss": 0.7844199538230896, "Full-finetune/Loss (Raw)": 0.902280330657959, "Full-finetune/Step": 2195, "Full-finetune/Step Time": 6.769401632249355} {"Full-finetune/Learning Rate": 1.2948827327813908e-05, "Full-finetune/Loss": 0.7837383151054382, "Full-finetune/Loss (Raw)": 0.7574828267097473, "Full-finetune/Step": 2196, "Full-finetune/Step Time": 6.7791453674435616} {"Full-finetune/Learning Rate": 1.2942874154646447e-05, "Full-finetune/Loss": 0.7835782170295715, "Full-finetune/Loss (Raw)": 0.8211576342582703, "Full-finetune/Step": 2197, "Full-finetune/Step Time": 6.781687676906586} {"Full-finetune/Learning Rate": 1.2936919839406978e-05, "Full-finetune/Loss": 0.7857882976531982, "Full-finetune/Loss (Raw)": 0.7745054364204407, "Full-finetune/Step": 2198, "Full-finetune/Step Time": 6.775270465761423} {"Full-finetune/Learning Rate": 1.2930964384406259e-05, "Full-finetune/Loss": 0.7849140167236328, "Full-finetune/Loss (Raw)": 0.7764120697975159, "Full-finetune/Step": 2199, "Full-finetune/Step Time": 6.776651231572032} {"Full-finetune/Learning Rate": 1.2925007791955487e-05, "Full-finetune/Loss": 0.7831735610961914, "Full-finetune/Loss (Raw)": 0.7277863621711731, "Full-finetune/Step": 2200, "Full-finetune/Step Time": 6.800399322062731} {"Full-finetune/Learning Rate": 1.2919050064366294e-05, "Full-finetune/Loss": 0.7802082300186157, "Full-finetune/Loss (Raw)": 0.3539833128452301, "Full-finetune/Step": 2201, "Full-finetune/Step Time": 6.80708141811192} {"Full-finetune/Learning Rate": 1.2913091203950764e-05, "Full-finetune/Loss": 0.7791190147399902, "Full-finetune/Loss (Raw)": 0.806634247303009, "Full-finetune/Step": 2202, "Full-finetune/Step Time": 6.798520935699344} {"Full-finetune/Learning Rate": 1.2907131213021404e-05, "Full-finetune/Loss": 0.779228925704956, "Full-finetune/Loss (Raw)": 0.7976114749908447, "Full-finetune/Step": 2203, "Full-finetune/Step Time": 6.799095010384917} {"Full-finetune/Learning Rate": 1.2901170093891182e-05, "Full-finetune/Loss": 0.77934730052948, "Full-finetune/Loss (Raw)": 0.7025349736213684, "Full-finetune/Step": 2204, "Full-finetune/Step Time": 6.796174393966794} {"Full-finetune/Learning Rate": 1.2895207848873488e-05, "Full-finetune/Loss": 0.7764406204223633, "Full-finetune/Loss (Raw)": 0.4231628477573395, "Full-finetune/Step": 2205, "Full-finetune/Step Time": 6.813687616959214} {"Full-finetune/Learning Rate": 1.288924448028215e-05, "Full-finetune/Loss": 0.775022566318512, "Full-finetune/Loss (Raw)": 0.5769824385643005, "Full-finetune/Step": 2206, "Full-finetune/Step Time": 6.8554560374468565} {"Full-finetune/Learning Rate": 1.288327999043144e-05, "Full-finetune/Loss": 0.7755030393600464, "Full-finetune/Loss (Raw)": 0.8457850813865662, "Full-finetune/Step": 2207, "Full-finetune/Step Time": 6.850553913041949} {"Full-finetune/Learning Rate": 1.2877314381636052e-05, "Full-finetune/Loss": 0.7759909629821777, "Full-finetune/Loss (Raw)": 0.7777856588363647, "Full-finetune/Step": 2208, "Full-finetune/Step Time": 6.854971881955862} {"Full-finetune/Learning Rate": 1.287134765621113e-05, "Full-finetune/Loss": 0.775780200958252, "Full-finetune/Loss (Raw)": 0.7849631309509277, "Full-finetune/Step": 2209, "Full-finetune/Step Time": 6.844514109194279} {"Full-finetune/Learning Rate": 1.2865379816472244e-05, "Full-finetune/Loss": 0.7726181745529175, "Full-finetune/Loss (Raw)": 0.3945714831352234, "Full-finetune/Step": 2210, "Full-finetune/Step Time": 6.861894009634852} {"Full-finetune/Learning Rate": 1.2859410864735389e-05, "Full-finetune/Loss": 0.7729558944702148, "Full-finetune/Loss (Raw)": 0.9327428936958313, "Full-finetune/Step": 2211, "Full-finetune/Step Time": 6.886336248368025} {"Full-finetune/Learning Rate": 1.2853440803317003e-05, "Full-finetune/Loss": 0.7697691321372986, "Full-finetune/Loss (Raw)": 0.5867562890052795, "Full-finetune/Step": 2212, "Full-finetune/Step Time": 6.909257836639881} {"Full-finetune/Learning Rate": 1.2847469634533952e-05, "Full-finetune/Loss": 0.7728059887886047, "Full-finetune/Loss (Raw)": 0.6993196606636047, "Full-finetune/Step": 2213, "Full-finetune/Step Time": 6.8972928542643785} {"Full-finetune/Learning Rate": 1.2841497360703528e-05, "Full-finetune/Loss": 0.770612895488739, "Full-finetune/Loss (Raw)": 0.6150368452072144, "Full-finetune/Step": 2214, "Full-finetune/Step Time": 6.913837872445583} {"Full-finetune/Learning Rate": 1.283552398414345e-05, "Full-finetune/Loss": 0.7698925137519836, "Full-finetune/Loss (Raw)": 0.8722651600837708, "Full-finetune/Step": 2215, "Full-finetune/Step Time": 6.913175655528903} {"Full-finetune/Learning Rate": 1.2829549507171877e-05, "Full-finetune/Loss": 0.7693773508071899, "Full-finetune/Loss (Raw)": 0.8486913442611694, "Full-finetune/Step": 2216, "Full-finetune/Step Time": 6.91520818322897} {"Full-finetune/Learning Rate": 1.2823573932107381e-05, "Full-finetune/Loss": 0.7700784802436829, "Full-finetune/Loss (Raw)": 0.9467052221298218, "Full-finetune/Step": 2217, "Full-finetune/Step Time": 6.91578190587461} {"Full-finetune/Learning Rate": 1.2817597261268965e-05, "Full-finetune/Loss": 0.772676944732666, "Full-finetune/Loss (Raw)": 0.5883740186691284, "Full-finetune/Step": 2218, "Full-finetune/Step Time": 6.902292396873236} {"Full-finetune/Learning Rate": 1.2811619496976066e-05, "Full-finetune/Loss": 0.7720894813537598, "Full-finetune/Loss (Raw)": 0.692236602306366, "Full-finetune/Step": 2219, "Full-finetune/Step Time": 6.931664424017072} {"Full-finetune/Learning Rate": 1.2805640641548529e-05, "Full-finetune/Loss": 0.7719942331314087, "Full-finetune/Loss (Raw)": 0.8650497794151306, "Full-finetune/Step": 2220, "Full-finetune/Step Time": 6.932133002206683} {"Full-finetune/Learning Rate": 1.2799660697306636e-05, "Full-finetune/Loss": 0.7704824209213257, "Full-finetune/Loss (Raw)": 0.7252201437950134, "Full-finetune/Step": 2221, "Full-finetune/Step Time": 6.9488242864608765} {"Full-finetune/Learning Rate": 1.2793679666571084e-05, "Full-finetune/Loss": 0.7699297666549683, "Full-finetune/Loss (Raw)": 0.9050824046134949, "Full-finetune/Step": 2222, "Full-finetune/Step Time": 6.957459708675742} {"Full-finetune/Learning Rate": 1.2787697551662994e-05, "Full-finetune/Loss": 0.7699660658836365, "Full-finetune/Loss (Raw)": 0.8491544723510742, "Full-finetune/Step": 2223, "Full-finetune/Step Time": 6.961610823869705} {"Full-finetune/Learning Rate": 1.2781714354903913e-05, "Full-finetune/Loss": 0.7701048851013184, "Full-finetune/Loss (Raw)": 0.836765468120575, "Full-finetune/Step": 2224, "Full-finetune/Step Time": 6.962185770273209} {"Full-finetune/Learning Rate": 1.2775730078615798e-05, "Full-finetune/Loss": 0.7690579891204834, "Full-finetune/Loss (Raw)": 0.7633851766586304, "Full-finetune/Step": 2225, "Full-finetune/Step Time": 6.962250927463174} {"Full-finetune/Learning Rate": 1.276974472512103e-05, "Full-finetune/Loss": 0.7696528434753418, "Full-finetune/Loss (Raw)": 0.845896303653717, "Full-finetune/Step": 2226, "Full-finetune/Step Time": 6.95180013589561} {"Full-finetune/Learning Rate": 1.276375829674241e-05, "Full-finetune/Loss": 0.7739813327789307, "Full-finetune/Loss (Raw)": 0.9088866710662842, "Full-finetune/Step": 2227, "Full-finetune/Step Time": 6.9370011650025845} {"Full-finetune/Learning Rate": 1.275777079580315e-05, "Full-finetune/Loss": 0.7747583389282227, "Full-finetune/Loss (Raw)": 0.7630231976509094, "Full-finetune/Step": 2228, "Full-finetune/Step Time": 6.934753214940429} {"Full-finetune/Learning Rate": 1.2751782224626891e-05, "Full-finetune/Loss": 0.7735427618026733, "Full-finetune/Loss (Raw)": 0.7660305500030518, "Full-finetune/Step": 2229, "Full-finetune/Step Time": 6.933982100337744} {"Full-finetune/Learning Rate": 1.274579258553767e-05, "Full-finetune/Loss": 0.7733250856399536, "Full-finetune/Loss (Raw)": 0.7705994248390198, "Full-finetune/Step": 2230, "Full-finetune/Step Time": 6.9343324061483145} {"Full-finetune/Learning Rate": 1.2739801880859954e-05, "Full-finetune/Loss": 0.7777073383331299, "Full-finetune/Loss (Raw)": 0.9301467537879944, "Full-finetune/Step": 2231, "Full-finetune/Step Time": 6.914672877639532} {"Full-finetune/Learning Rate": 1.2733810112918618e-05, "Full-finetune/Loss": 0.7789807319641113, "Full-finetune/Loss (Raw)": 0.969826340675354, "Full-finetune/Step": 2232, "Full-finetune/Step Time": 6.905899731442332} {"Full-finetune/Learning Rate": 1.2727817284038953e-05, "Full-finetune/Loss": 0.7779296040534973, "Full-finetune/Loss (Raw)": 0.7056037783622742, "Full-finetune/Step": 2233, "Full-finetune/Step Time": 6.903622608631849} {"Full-finetune/Learning Rate": 1.2721823396546655e-05, "Full-finetune/Loss": 0.7783489227294922, "Full-finetune/Loss (Raw)": 0.9141567349433899, "Full-finetune/Step": 2234, "Full-finetune/Step Time": 6.906686510890722} {"Full-finetune/Learning Rate": 1.2715828452767833e-05, "Full-finetune/Loss": 0.778862476348877, "Full-finetune/Loss (Raw)": 0.9375632405281067, "Full-finetune/Step": 2235, "Full-finetune/Step Time": 6.9184147249907255} {"Full-finetune/Learning Rate": 1.2709832455029017e-05, "Full-finetune/Loss": 0.7799477577209473, "Full-finetune/Loss (Raw)": 0.9143453240394592, "Full-finetune/Step": 2236, "Full-finetune/Step Time": 6.9195237793028355} {"Full-finetune/Learning Rate": 1.2703835405657124e-05, "Full-finetune/Loss": 0.7788920402526855, "Full-finetune/Loss (Raw)": 0.7502304315567017, "Full-finetune/Step": 2237, "Full-finetune/Step Time": 6.921007413417101} {"Full-finetune/Learning Rate": 1.2697837306979499e-05, "Full-finetune/Loss": 0.7778645753860474, "Full-finetune/Loss (Raw)": 0.6581746339797974, "Full-finetune/Step": 2238, "Full-finetune/Step Time": 6.9249623492360115} {"Full-finetune/Learning Rate": 1.2691838161323888e-05, "Full-finetune/Loss": 0.7803491950035095, "Full-finetune/Loss (Raw)": 1.1066956520080566, "Full-finetune/Step": 2239, "Full-finetune/Step Time": 6.910764418542385} {"Full-finetune/Learning Rate": 1.2685837971018438e-05, "Full-finetune/Loss": 0.7843573093414307, "Full-finetune/Loss (Raw)": 0.9737469553947449, "Full-finetune/Step": 2240, "Full-finetune/Step Time": 6.894010530784726} {"Full-finetune/Learning Rate": 1.2679836738391714e-05, "Full-finetune/Loss": 0.7852227687835693, "Full-finetune/Loss (Raw)": 0.9458624720573425, "Full-finetune/Step": 2241, "Full-finetune/Step Time": 6.90243424475193} {"Full-finetune/Learning Rate": 1.2673834465772662e-05, "Full-finetune/Loss": 0.7842233777046204, "Full-finetune/Loss (Raw)": 0.787720263004303, "Full-finetune/Step": 2242, "Full-finetune/Step Time": 6.875262608751655} {"Full-finetune/Learning Rate": 1.2667831155490662e-05, "Full-finetune/Loss": 0.783366858959198, "Full-finetune/Loss (Raw)": 0.7980179190635681, "Full-finetune/Step": 2243, "Full-finetune/Step Time": 6.877910319715738} {"Full-finetune/Learning Rate": 1.2661826809875474e-05, "Full-finetune/Loss": 0.7885757684707642, "Full-finetune/Loss (Raw)": 1.0773346424102783, "Full-finetune/Step": 2244, "Full-finetune/Step Time": 6.85759511962533} {"Full-finetune/Learning Rate": 1.265582143125727e-05, "Full-finetune/Loss": 0.790124237537384, "Full-finetune/Loss (Raw)": 0.8733579516410828, "Full-finetune/Step": 2245, "Full-finetune/Step Time": 6.839002503082156} {"Full-finetune/Learning Rate": 1.264981502196662e-05, "Full-finetune/Loss": 0.7916592359542847, "Full-finetune/Loss (Raw)": 0.9566901326179504, "Full-finetune/Step": 2246, "Full-finetune/Step Time": 6.852991135790944} {"Full-finetune/Learning Rate": 1.2643807584334491e-05, "Full-finetune/Loss": 0.7913463115692139, "Full-finetune/Loss (Raw)": 0.7124580144882202, "Full-finetune/Step": 2247, "Full-finetune/Step Time": 6.852845512330532} {"Full-finetune/Learning Rate": 1.2637799120692253e-05, "Full-finetune/Loss": 0.794309139251709, "Full-finetune/Loss (Raw)": 0.7060744166374207, "Full-finetune/Step": 2248, "Full-finetune/Step Time": 6.830944273620844} {"Full-finetune/Learning Rate": 1.2631789633371678e-05, "Full-finetune/Loss": 0.793688952922821, "Full-finetune/Loss (Raw)": 0.7776908874511719, "Full-finetune/Step": 2249, "Full-finetune/Step Time": 6.831625193357468} {"Full-finetune/Learning Rate": 1.2625779124704925e-05, "Full-finetune/Loss": 0.7927017211914062, "Full-finetune/Loss (Raw)": 0.7808031439781189, "Full-finetune/Step": 2250, "Full-finetune/Step Time": 6.853325409814715} {"Full-finetune/Learning Rate": 1.2619767597024561e-05, "Full-finetune/Loss": 0.79268479347229, "Full-finetune/Loss (Raw)": 0.8668494820594788, "Full-finetune/Step": 2251, "Full-finetune/Step Time": 6.8552504647523165} {"Full-finetune/Learning Rate": 1.2613755052663536e-05, "Full-finetune/Loss": 0.7883810997009277, "Full-finetune/Loss (Raw)": 0.31803804636001587, "Full-finetune/Step": 2252, "Full-finetune/Step Time": 6.869616938754916} {"Full-finetune/Learning Rate": 1.2607741493955208e-05, "Full-finetune/Loss": 0.7886943817138672, "Full-finetune/Loss (Raw)": 0.9074618816375732, "Full-finetune/Step": 2253, "Full-finetune/Step Time": 6.85248383320868} {"Full-finetune/Learning Rate": 1.2601726923233315e-05, "Full-finetune/Loss": 0.7887403964996338, "Full-finetune/Loss (Raw)": 0.9263998866081238, "Full-finetune/Step": 2254, "Full-finetune/Step Time": 6.84887901507318} {"Full-finetune/Learning Rate": 1.2595711342831998e-05, "Full-finetune/Loss": 0.7886420488357544, "Full-finetune/Loss (Raw)": 0.8497264385223389, "Full-finetune/Step": 2255, "Full-finetune/Step Time": 6.847432527691126} {"Full-finetune/Learning Rate": 1.2589694755085789e-05, "Full-finetune/Loss": 0.791844367980957, "Full-finetune/Loss (Raw)": 0.76153165102005, "Full-finetune/Step": 2256, "Full-finetune/Step Time": 6.823936762288213} {"Full-finetune/Learning Rate": 1.25836771623296e-05, "Full-finetune/Loss": 0.7961183786392212, "Full-finetune/Loss (Raw)": 0.8241268396377563, "Full-finetune/Step": 2257, "Full-finetune/Step Time": 6.8081589341163635} {"Full-finetune/Learning Rate": 1.257765856689875e-05, "Full-finetune/Loss": 0.794424295425415, "Full-finetune/Loss (Raw)": 0.6469647288322449, "Full-finetune/Step": 2258, "Full-finetune/Step Time": 6.808667620643973} {"Full-finetune/Learning Rate": 1.2571638971128933e-05, "Full-finetune/Loss": 0.7930530309677124, "Full-finetune/Loss (Raw)": 0.7514760494232178, "Full-finetune/Step": 2259, "Full-finetune/Step Time": 6.807115627452731} {"Full-finetune/Learning Rate": 1.2565618377356237e-05, "Full-finetune/Loss": 0.7928905487060547, "Full-finetune/Loss (Raw)": 0.7804418206214905, "Full-finetune/Step": 2260, "Full-finetune/Step Time": 6.81317781098187} {"Full-finetune/Learning Rate": 1.2559596787917144e-05, "Full-finetune/Loss": 0.7913703918457031, "Full-finetune/Loss (Raw)": 0.8838739395141602, "Full-finetune/Step": 2261, "Full-finetune/Step Time": 6.815356375649571} {"Full-finetune/Learning Rate": 1.2553574205148502e-05, "Full-finetune/Loss": 0.7932261228561401, "Full-finetune/Loss (Raw)": 0.9904352426528931, "Full-finetune/Step": 2262, "Full-finetune/Step Time": 6.810499437153339} {"Full-finetune/Learning Rate": 1.2547550631387571e-05, "Full-finetune/Loss": 0.7934442758560181, "Full-finetune/Loss (Raw)": 0.7939522862434387, "Full-finetune/Step": 2263, "Full-finetune/Step Time": 6.815557451918721} {"Full-finetune/Learning Rate": 1.2541526068971975e-05, "Full-finetune/Loss": 0.7936072945594788, "Full-finetune/Loss (Raw)": 0.8797875046730042, "Full-finetune/Step": 2264, "Full-finetune/Step Time": 6.830290840938687} {"Full-finetune/Learning Rate": 1.2535500520239727e-05, "Full-finetune/Loss": 0.796648383140564, "Full-finetune/Loss (Raw)": 0.816355288028717, "Full-finetune/Step": 2265, "Full-finetune/Step Time": 6.814353700727224} {"Full-finetune/Learning Rate": 1.2529473987529235e-05, "Full-finetune/Loss": 0.7940806150436401, "Full-finetune/Loss (Raw)": 0.5377781391143799, "Full-finetune/Step": 2266, "Full-finetune/Step Time": 6.82135128416121} {"Full-finetune/Learning Rate": 1.2523446473179267e-05, "Full-finetune/Loss": 0.7945401668548584, "Full-finetune/Loss (Raw)": 0.8081711530685425, "Full-finetune/Step": 2267, "Full-finetune/Step Time": 6.80237621255219} {"Full-finetune/Learning Rate": 1.2517417979528991e-05, "Full-finetune/Loss": 0.7933524250984192, "Full-finetune/Loss (Raw)": 0.7560506463050842, "Full-finetune/Step": 2268, "Full-finetune/Step Time": 6.800044637173414} {"Full-finetune/Learning Rate": 1.2511388508917946e-05, "Full-finetune/Loss": 0.7926063537597656, "Full-finetune/Loss (Raw)": 0.8910753726959229, "Full-finetune/Step": 2269, "Full-finetune/Step Time": 6.793304473161697} {"Full-finetune/Learning Rate": 1.250535806368605e-05, "Full-finetune/Loss": 0.7909077405929565, "Full-finetune/Loss (Raw)": 0.5763142704963684, "Full-finetune/Step": 2270, "Full-finetune/Step Time": 6.812650613486767} {"Full-finetune/Learning Rate": 1.2499326646173606e-05, "Full-finetune/Loss": 0.7912778854370117, "Full-finetune/Loss (Raw)": 0.8789769411087036, "Full-finetune/Step": 2271, "Full-finetune/Step Time": 6.793455757200718} {"Full-finetune/Learning Rate": 1.2493294258721282e-05, "Full-finetune/Loss": 0.7919537425041199, "Full-finetune/Loss (Raw)": 0.8967348337173462, "Full-finetune/Step": 2272, "Full-finetune/Step Time": 6.788171000778675} {"Full-finetune/Learning Rate": 1.2487260903670136e-05, "Full-finetune/Loss": 0.7940582036972046, "Full-finetune/Loss (Raw)": 0.8087444305419922, "Full-finetune/Step": 2273, "Full-finetune/Step Time": 6.7742960918694735} {"Full-finetune/Learning Rate": 1.2481226583361592e-05, "Full-finetune/Loss": 0.7934052348136902, "Full-finetune/Loss (Raw)": 0.7698454856872559, "Full-finetune/Step": 2274, "Full-finetune/Step Time": 6.78572766110301} {"Full-finetune/Learning Rate": 1.2475191300137452e-05, "Full-finetune/Loss": 0.7948712110519409, "Full-finetune/Loss (Raw)": 0.9180814623832703, "Full-finetune/Step": 2275, "Full-finetune/Step Time": 6.777755739167333} {"Full-finetune/Learning Rate": 1.2469155056339894e-05, "Full-finetune/Loss": 0.793885350227356, "Full-finetune/Loss (Raw)": 0.8532508015632629, "Full-finetune/Step": 2276, "Full-finetune/Step Time": 6.780519338324666} {"Full-finetune/Learning Rate": 1.2463117854311463e-05, "Full-finetune/Loss": 0.7922335863113403, "Full-finetune/Loss (Raw)": 0.6849266886711121, "Full-finetune/Step": 2277, "Full-finetune/Step Time": 6.795950457453728} {"Full-finetune/Learning Rate": 1.2457079696395082e-05, "Full-finetune/Loss": 0.7928289771080017, "Full-finetune/Loss (Raw)": 0.8796557784080505, "Full-finetune/Step": 2278, "Full-finetune/Step Time": 6.793800737708807} {"Full-finetune/Learning Rate": 1.2451040584934042e-05, "Full-finetune/Loss": 0.7922831773757935, "Full-finetune/Loss (Raw)": 0.8587095737457275, "Full-finetune/Step": 2279, "Full-finetune/Step Time": 6.774605201557279} {"Full-finetune/Learning Rate": 1.2445000522272005e-05, "Full-finetune/Loss": 0.7929873466491699, "Full-finetune/Loss (Raw)": 0.8412288427352905, "Full-finetune/Step": 2280, "Full-finetune/Step Time": 6.759794281795621} {"Full-finetune/Learning Rate": 1.2438959510752997e-05, "Full-finetune/Loss": 0.7930928468704224, "Full-finetune/Loss (Raw)": 0.8219975233078003, "Full-finetune/Step": 2281, "Full-finetune/Step Time": 6.761739203706384} {"Full-finetune/Learning Rate": 1.243291755272142e-05, "Full-finetune/Loss": 0.7939996123313904, "Full-finetune/Loss (Raw)": 0.8155725598335266, "Full-finetune/Step": 2282, "Full-finetune/Step Time": 6.755999991670251} {"Full-finetune/Learning Rate": 1.2426874650522039e-05, "Full-finetune/Loss": 0.794958233833313, "Full-finetune/Loss (Raw)": 0.9536796808242798, "Full-finetune/Step": 2283, "Full-finetune/Step Time": 6.7439924124628305} {"Full-finetune/Learning Rate": 1.2420830806499988e-05, "Full-finetune/Loss": 0.7946299910545349, "Full-finetune/Loss (Raw)": 0.6375637054443359, "Full-finetune/Step": 2284, "Full-finetune/Step Time": 6.758943885564804} {"Full-finetune/Learning Rate": 1.2414786023000765e-05, "Full-finetune/Loss": 0.7949899435043335, "Full-finetune/Loss (Raw)": 0.7870354056358337, "Full-finetune/Step": 2285, "Full-finetune/Step Time": 6.759602148085833} {"Full-finetune/Learning Rate": 1.240874030237023e-05, "Full-finetune/Loss": 0.7941266298294067, "Full-finetune/Loss (Raw)": 0.793004035949707, "Full-finetune/Step": 2286, "Full-finetune/Step Time": 6.769764453172684} {"Full-finetune/Learning Rate": 1.2402693646954607e-05, "Full-finetune/Loss": 0.7920866012573242, "Full-finetune/Loss (Raw)": 0.6040052771568298, "Full-finetune/Step": 2287, "Full-finetune/Step Time": 6.745820935815573} {"Full-finetune/Learning Rate": 1.2396646059100492e-05, "Full-finetune/Loss": 0.7928371429443359, "Full-finetune/Loss (Raw)": 0.9120550155639648, "Full-finetune/Step": 2288, "Full-finetune/Step Time": 6.750309845432639} {"Full-finetune/Learning Rate": 1.2390597541154832e-05, "Full-finetune/Loss": 0.7916728258132935, "Full-finetune/Loss (Raw)": 0.6174159646034241, "Full-finetune/Step": 2289, "Full-finetune/Step Time": 6.764164404943585} {"Full-finetune/Learning Rate": 1.238454809546494e-05, "Full-finetune/Loss": 0.7930667400360107, "Full-finetune/Loss (Raw)": 0.9263877868652344, "Full-finetune/Step": 2290, "Full-finetune/Step Time": 6.757601175457239} {"Full-finetune/Learning Rate": 1.2378497724378484e-05, "Full-finetune/Loss": 0.7928890585899353, "Full-finetune/Loss (Raw)": 0.774488091468811, "Full-finetune/Step": 2291, "Full-finetune/Step Time": 6.770896492525935} {"Full-finetune/Learning Rate": 1.2372446430243497e-05, "Full-finetune/Loss": 0.7912567853927612, "Full-finetune/Loss (Raw)": 0.7483096122741699, "Full-finetune/Step": 2292, "Full-finetune/Step Time": 6.779343253001571} {"Full-finetune/Learning Rate": 1.2366394215408369e-05, "Full-finetune/Loss": 0.7892618179321289, "Full-finetune/Loss (Raw)": 0.570583701133728, "Full-finetune/Step": 2293, "Full-finetune/Step Time": 6.764132214710116} {"Full-finetune/Learning Rate": 1.2360341082221847e-05, "Full-finetune/Loss": 0.7889664769172668, "Full-finetune/Loss (Raw)": 0.8706302642822266, "Full-finetune/Step": 2294, "Full-finetune/Step Time": 6.762364601716399} {"Full-finetune/Learning Rate": 1.2354287033033032e-05, "Full-finetune/Loss": 0.7879109382629395, "Full-finetune/Loss (Raw)": 0.7826513051986694, "Full-finetune/Step": 2295, "Full-finetune/Step Time": 6.790481388568878} {"Full-finetune/Learning Rate": 1.2348232070191383e-05, "Full-finetune/Loss": 0.7869861125946045, "Full-finetune/Loss (Raw)": 0.6868410706520081, "Full-finetune/Step": 2296, "Full-finetune/Step Time": 6.791133971884847} {"Full-finetune/Learning Rate": 1.2342176196046715e-05, "Full-finetune/Loss": 0.7863086462020874, "Full-finetune/Loss (Raw)": 0.7961118817329407, "Full-finetune/Step": 2297, "Full-finetune/Step Time": 6.793093591928482} {"Full-finetune/Learning Rate": 1.2336119412949193e-05, "Full-finetune/Loss": 0.7869438529014587, "Full-finetune/Loss (Raw)": 0.7982740998268127, "Full-finetune/Step": 2298, "Full-finetune/Step Time": 6.784147856757045} {"Full-finetune/Learning Rate": 1.2330061723249328e-05, "Full-finetune/Loss": 0.7882751226425171, "Full-finetune/Loss (Raw)": 0.8888282775878906, "Full-finetune/Step": 2299, "Full-finetune/Step Time": 6.78190684132278} {"Full-finetune/Learning Rate": 1.2324003129298006e-05, "Full-finetune/Loss": 0.7883601188659668, "Full-finetune/Loss (Raw)": 0.8782778978347778, "Full-finetune/Step": 2300, "Full-finetune/Step Time": 6.787509609013796} {"Full-finetune/Learning Rate": 1.2317943633446441e-05, "Full-finetune/Loss": 0.7896167039871216, "Full-finetune/Loss (Raw)": 0.7637426257133484, "Full-finetune/Step": 2301, "Full-finetune/Step Time": 6.773907760158181} {"Full-finetune/Learning Rate": 1.2311883238046204e-05, "Full-finetune/Loss": 0.7904788255691528, "Full-finetune/Loss (Raw)": 0.7197865843772888, "Full-finetune/Step": 2302, "Full-finetune/Step Time": 6.766787266358733} {"Full-finetune/Learning Rate": 1.2305821945449222e-05, "Full-finetune/Loss": 0.791245698928833, "Full-finetune/Loss (Raw)": 0.8627898693084717, "Full-finetune/Step": 2303, "Full-finetune/Step Time": 6.748426193371415} {"Full-finetune/Learning Rate": 1.2299759758007755e-05, "Full-finetune/Loss": 0.7890541553497314, "Full-finetune/Loss (Raw)": 0.6408672332763672, "Full-finetune/Step": 2304, "Full-finetune/Step Time": 6.756486274302006} {"Full-finetune/Learning Rate": 1.2293696678074428e-05, "Full-finetune/Loss": 0.7878177165985107, "Full-finetune/Loss (Raw)": 0.7495884895324707, "Full-finetune/Step": 2305, "Full-finetune/Step Time": 6.75160375982523} {"Full-finetune/Learning Rate": 1.22876327080022e-05, "Full-finetune/Loss": 0.7894846796989441, "Full-finetune/Loss (Raw)": 0.93030846118927, "Full-finetune/Step": 2306, "Full-finetune/Step Time": 6.754464738070965} {"Full-finetune/Learning Rate": 1.2281567850144383e-05, "Full-finetune/Loss": 0.7900681495666504, "Full-finetune/Loss (Raw)": 0.8673458695411682, "Full-finetune/Step": 2307, "Full-finetune/Step Time": 6.738455709069967} {"Full-finetune/Learning Rate": 1.2275502106854624e-05, "Full-finetune/Loss": 0.7873953580856323, "Full-finetune/Loss (Raw)": 0.5371265411376953, "Full-finetune/Step": 2308, "Full-finetune/Step Time": 6.740543179214001} {"Full-finetune/Learning Rate": 1.2269435480486923e-05, "Full-finetune/Loss": 0.7865245342254639, "Full-finetune/Loss (Raw)": 0.7891319394111633, "Full-finetune/Step": 2309, "Full-finetune/Step Time": 6.740374954417348} {"Full-finetune/Learning Rate": 1.226336797339562e-05, "Full-finetune/Loss": 0.7862259149551392, "Full-finetune/Loss (Raw)": 0.892112672328949, "Full-finetune/Step": 2310, "Full-finetune/Step Time": 6.734424773603678} {"Full-finetune/Learning Rate": 1.2257299587935394e-05, "Full-finetune/Loss": 0.7879779934883118, "Full-finetune/Loss (Raw)": 0.9036272764205933, "Full-finetune/Step": 2311, "Full-finetune/Step Time": 6.715020753443241} {"Full-finetune/Learning Rate": 1.2251230326461268e-05, "Full-finetune/Loss": 0.7881115078926086, "Full-finetune/Loss (Raw)": 0.708213210105896, "Full-finetune/Step": 2312, "Full-finetune/Step Time": 6.723259478807449} {"Full-finetune/Learning Rate": 1.2245160191328605e-05, "Full-finetune/Loss": 0.7875917553901672, "Full-finetune/Loss (Raw)": 0.803384006023407, "Full-finetune/Step": 2313, "Full-finetune/Step Time": 6.728066340088844} {"Full-finetune/Learning Rate": 1.2239089184893102e-05, "Full-finetune/Loss": 0.7870485186576843, "Full-finetune/Loss (Raw)": 0.7520531415939331, "Full-finetune/Step": 2314, "Full-finetune/Step Time": 6.735990097746253} {"Full-finetune/Learning Rate": 1.2233017309510804e-05, "Full-finetune/Loss": 0.7887476086616516, "Full-finetune/Loss (Raw)": 0.7771672010421753, "Full-finetune/Step": 2315, "Full-finetune/Step Time": 6.69145205616951} {"Full-finetune/Learning Rate": 1.2226944567538084e-05, "Full-finetune/Loss": 0.7898375988006592, "Full-finetune/Loss (Raw)": 0.9218792915344238, "Full-finetune/Step": 2316, "Full-finetune/Step Time": 6.656852448359132} {"Full-finetune/Learning Rate": 1.2220870961331654e-05, "Full-finetune/Loss": 0.790600061416626, "Full-finetune/Loss (Raw)": 0.7757791876792908, "Full-finetune/Step": 2317, "Full-finetune/Step Time": 6.652869233861566} {"Full-finetune/Learning Rate": 1.2214796493248564e-05, "Full-finetune/Loss": 0.7909656167030334, "Full-finetune/Loss (Raw)": 0.7349455952644348, "Full-finetune/Step": 2318, "Full-finetune/Step Time": 6.651504550129175} {"Full-finetune/Learning Rate": 1.2208721165646193e-05, "Full-finetune/Loss": 0.7920438051223755, "Full-finetune/Loss (Raw)": 0.9459189772605896, "Full-finetune/Step": 2319, "Full-finetune/Step Time": 6.64215874299407} {"Full-finetune/Learning Rate": 1.2202644980882258e-05, "Full-finetune/Loss": 0.7928856611251831, "Full-finetune/Loss (Raw)": 0.7798973917961121, "Full-finetune/Step": 2320, "Full-finetune/Step Time": 6.640419526025653} {"Full-finetune/Learning Rate": 1.2196567941314815e-05, "Full-finetune/Loss": 0.7921661138534546, "Full-finetune/Loss (Raw)": 0.813395082950592, "Full-finetune/Step": 2321, "Full-finetune/Step Time": 6.646941414102912} {"Full-finetune/Learning Rate": 1.2190490049302233e-05, "Full-finetune/Loss": 0.7922344207763672, "Full-finetune/Loss (Raw)": 0.8349087834358215, "Full-finetune/Step": 2322, "Full-finetune/Step Time": 6.647285144776106} {"Full-finetune/Learning Rate": 1.218441130720323e-05, "Full-finetune/Loss": 0.7905886769294739, "Full-finetune/Loss (Raw)": 0.6916185021400452, "Full-finetune/Step": 2323, "Full-finetune/Step Time": 6.660722970962524} {"Full-finetune/Learning Rate": 1.2178331717376848e-05, "Full-finetune/Loss": 0.7907710075378418, "Full-finetune/Loss (Raw)": 0.7808229327201843, "Full-finetune/Step": 2324, "Full-finetune/Step Time": 6.650306863710284} {"Full-finetune/Learning Rate": 1.217225128218245e-05, "Full-finetune/Loss": 0.7910766005516052, "Full-finetune/Loss (Raw)": 0.8602739572525024, "Full-finetune/Step": 2325, "Full-finetune/Step Time": 6.6560299545526505} {"Full-finetune/Learning Rate": 1.2166170003979742e-05, "Full-finetune/Loss": 0.788433849811554, "Full-finetune/Loss (Raw)": 0.43623244762420654, "Full-finetune/Step": 2326, "Full-finetune/Step Time": 6.668465878814459} {"Full-finetune/Learning Rate": 1.2160087885128745e-05, "Full-finetune/Loss": 0.7889251708984375, "Full-finetune/Loss (Raw)": 0.8393027782440186, "Full-finetune/Step": 2327, "Full-finetune/Step Time": 6.673566993325949} {"Full-finetune/Learning Rate": 1.2154004927989815e-05, "Full-finetune/Loss": 0.7890426516532898, "Full-finetune/Loss (Raw)": 0.7428233027458191, "Full-finetune/Step": 2328, "Full-finetune/Step Time": 6.656081868335605} {"Full-finetune/Learning Rate": 1.2147921134923624e-05, "Full-finetune/Loss": 0.7934922575950623, "Full-finetune/Loss (Raw)": 0.9235321879386902, "Full-finetune/Step": 2329, "Full-finetune/Step Time": 6.639400480315089} {"Full-finetune/Learning Rate": 1.2141836508291175e-05, "Full-finetune/Loss": 0.7927827835083008, "Full-finetune/Loss (Raw)": 0.7158181667327881, "Full-finetune/Step": 2330, "Full-finetune/Step Time": 6.651989109814167} {"Full-finetune/Learning Rate": 1.2135751050453793e-05, "Full-finetune/Loss": 0.7928752899169922, "Full-finetune/Loss (Raw)": 0.8094562292098999, "Full-finetune/Step": 2331, "Full-finetune/Step Time": 6.659434476867318} {"Full-finetune/Learning Rate": 1.2129664763773125e-05, "Full-finetune/Loss": 0.7952584028244019, "Full-finetune/Loss (Raw)": 1.0075745582580566, "Full-finetune/Step": 2332, "Full-finetune/Step Time": 6.665191676467657} {"Full-finetune/Learning Rate": 1.212357765061114e-05, "Full-finetune/Loss": 0.7987538576126099, "Full-finetune/Loss (Raw)": 0.8705812096595764, "Full-finetune/Step": 2333, "Full-finetune/Step Time": 6.6631321255117655} {"Full-finetune/Learning Rate": 1.211748971333013e-05, "Full-finetune/Loss": 0.8008711338043213, "Full-finetune/Loss (Raw)": 0.8479924201965332, "Full-finetune/Step": 2334, "Full-finetune/Step Time": 6.6445972714573145} {"Full-finetune/Learning Rate": 1.21114009542927e-05, "Full-finetune/Loss": 0.8007140755653381, "Full-finetune/Loss (Raw)": 0.82568359375, "Full-finetune/Step": 2335, "Full-finetune/Step Time": 6.6465536914765835} {"Full-finetune/Learning Rate": 1.2105311375861786e-05, "Full-finetune/Loss": 0.8010307550430298, "Full-finetune/Loss (Raw)": 0.8183221220970154, "Full-finetune/Step": 2336, "Full-finetune/Step Time": 6.649880051612854} {"Full-finetune/Learning Rate": 1.2099220980400625e-05, "Full-finetune/Loss": 0.8021596670150757, "Full-finetune/Loss (Raw)": 0.9294586777687073, "Full-finetune/Step": 2337, "Full-finetune/Step Time": 6.649789161980152} {"Full-finetune/Learning Rate": 1.2093129770272787e-05, "Full-finetune/Loss": 0.8057977557182312, "Full-finetune/Loss (Raw)": 0.8602509498596191, "Full-finetune/Step": 2338, "Full-finetune/Step Time": 6.631337091326714} {"Full-finetune/Learning Rate": 1.208703774784215e-05, "Full-finetune/Loss": 0.8042356967926025, "Full-finetune/Loss (Raw)": 0.7328017950057983, "Full-finetune/Step": 2339, "Full-finetune/Step Time": 6.625826507806778} {"Full-finetune/Learning Rate": 1.2080944915472908e-05, "Full-finetune/Loss": 0.8055576682090759, "Full-finetune/Loss (Raw)": 0.7559665441513062, "Full-finetune/Step": 2340, "Full-finetune/Step Time": 6.611089367419481} {"Full-finetune/Learning Rate": 1.2074851275529575e-05, "Full-finetune/Loss": 0.8070915937423706, "Full-finetune/Loss (Raw)": 0.8956610560417175, "Full-finetune/Step": 2341, "Full-finetune/Step Time": 6.636293798685074} {"Full-finetune/Learning Rate": 1.2068756830376966e-05, "Full-finetune/Loss": 0.8050744533538818, "Full-finetune/Loss (Raw)": 0.3568372428417206, "Full-finetune/Step": 2342, "Full-finetune/Step Time": 6.635403798893094} {"Full-finetune/Learning Rate": 1.2062661582380222e-05, "Full-finetune/Loss": 0.805467963218689, "Full-finetune/Loss (Raw)": 0.9226376414299011, "Full-finetune/Step": 2343, "Full-finetune/Step Time": 6.653105290606618} {"Full-finetune/Learning Rate": 1.2056565533904787e-05, "Full-finetune/Loss": 0.8048710227012634, "Full-finetune/Loss (Raw)": 0.772280216217041, "Full-finetune/Step": 2344, "Full-finetune/Step Time": 6.676192570477724} {"Full-finetune/Learning Rate": 1.2050468687316418e-05, "Full-finetune/Loss": 0.8054765462875366, "Full-finetune/Loss (Raw)": 1.0242128372192383, "Full-finetune/Step": 2345, "Full-finetune/Step Time": 6.670241599902511} {"Full-finetune/Learning Rate": 1.2044371044981188e-05, "Full-finetune/Loss": 0.8071459531784058, "Full-finetune/Loss (Raw)": 0.8020588755607605, "Full-finetune/Step": 2346, "Full-finetune/Step Time": 6.665530975908041} {"Full-finetune/Learning Rate": 1.2038272609265464e-05, "Full-finetune/Loss": 0.8082399368286133, "Full-finetune/Loss (Raw)": 0.8322715163230896, "Full-finetune/Step": 2347, "Full-finetune/Step Time": 6.6346261985599995} {"Full-finetune/Learning Rate": 1.2032173382535936e-05, "Full-finetune/Loss": 0.8081457614898682, "Full-finetune/Loss (Raw)": 0.8529942631721497, "Full-finetune/Step": 2348, "Full-finetune/Step Time": 6.635944217443466} {"Full-finetune/Learning Rate": 1.2026073367159597e-05, "Full-finetune/Loss": 0.8085987567901611, "Full-finetune/Loss (Raw)": 0.7832096815109253, "Full-finetune/Step": 2349, "Full-finetune/Step Time": 6.62706402130425} {"Full-finetune/Learning Rate": 1.2019972565503733e-05, "Full-finetune/Loss": 0.8079546093940735, "Full-finetune/Loss (Raw)": 0.8226243257522583, "Full-finetune/Step": 2350, "Full-finetune/Step Time": 6.619894398376346} {"Full-finetune/Learning Rate": 1.2013870979935957e-05, "Full-finetune/Loss": 0.808649480342865, "Full-finetune/Loss (Raw)": 0.9381016492843628, "Full-finetune/Step": 2351, "Full-finetune/Step Time": 6.606656931340694} {"Full-finetune/Learning Rate": 1.200776861282417e-05, "Full-finetune/Loss": 0.8086880445480347, "Full-finetune/Loss (Raw)": 0.84169602394104, "Full-finetune/Step": 2352, "Full-finetune/Step Time": 6.614502618089318} {"Full-finetune/Learning Rate": 1.2001665466536582e-05, "Full-finetune/Loss": 0.8092686533927917, "Full-finetune/Loss (Raw)": 0.8377067446708679, "Full-finetune/Step": 2353, "Full-finetune/Step Time": 6.608958575874567} {"Full-finetune/Learning Rate": 1.199556154344171e-05, "Full-finetune/Loss": 0.809207022190094, "Full-finetune/Loss (Raw)": 0.8380038142204285, "Full-finetune/Step": 2354, "Full-finetune/Step Time": 6.600267663598061} {"Full-finetune/Learning Rate": 1.1989456845908356e-05, "Full-finetune/Loss": 0.8081825971603394, "Full-finetune/Loss (Raw)": 0.7777580618858337, "Full-finetune/Step": 2355, "Full-finetune/Step Time": 6.607244135811925} {"Full-finetune/Learning Rate": 1.1983351376305648e-05, "Full-finetune/Loss": 0.8076274991035461, "Full-finetune/Loss (Raw)": 0.6919740438461304, "Full-finetune/Step": 2356, "Full-finetune/Step Time": 6.60857985727489} {"Full-finetune/Learning Rate": 1.197724513700299e-05, "Full-finetune/Loss": 0.808108925819397, "Full-finetune/Loss (Raw)": 0.8276505470275879, "Full-finetune/Step": 2357, "Full-finetune/Step Time": 6.61195077560842} {"Full-finetune/Learning Rate": 1.1971138130370097e-05, "Full-finetune/Loss": 0.809177815914154, "Full-finetune/Loss (Raw)": 0.9074211716651917, "Full-finetune/Step": 2358, "Full-finetune/Step Time": 6.608185162767768} {"Full-finetune/Learning Rate": 1.1965030358776975e-05, "Full-finetune/Loss": 0.804190456867218, "Full-finetune/Loss (Raw)": 0.2917638123035431, "Full-finetune/Step": 2359, "Full-finetune/Step Time": 6.6255873795598745} {"Full-finetune/Learning Rate": 1.1958921824593936e-05, "Full-finetune/Loss": 0.8035123944282532, "Full-finetune/Loss (Raw)": 0.8830349445343018, "Full-finetune/Step": 2360, "Full-finetune/Step Time": 6.624165648594499} {"Full-finetune/Learning Rate": 1.1952812530191586e-05, "Full-finetune/Loss": 0.8049341440200806, "Full-finetune/Loss (Raw)": 0.8875926733016968, "Full-finetune/Step": 2361, "Full-finetune/Step Time": 6.617773935198784} {"Full-finetune/Learning Rate": 1.1946702477940815e-05, "Full-finetune/Loss": 0.8042895793914795, "Full-finetune/Loss (Raw)": 0.8316513299942017, "Full-finetune/Step": 2362, "Full-finetune/Step Time": 6.610242258757353} {"Full-finetune/Learning Rate": 1.194059167021282e-05, "Full-finetune/Loss": 0.8012619018554688, "Full-finetune/Loss (Raw)": 0.5500233769416809, "Full-finetune/Step": 2363, "Full-finetune/Step Time": 6.6156347040086985} {"Full-finetune/Learning Rate": 1.1934480109379083e-05, "Full-finetune/Loss": 0.8000431656837463, "Full-finetune/Loss (Raw)": 0.7583406567573547, "Full-finetune/Step": 2364, "Full-finetune/Step Time": 6.612323984503746} {"Full-finetune/Learning Rate": 1.1928367797811384e-05, "Full-finetune/Loss": 0.8008970022201538, "Full-finetune/Loss (Raw)": 0.859521746635437, "Full-finetune/Step": 2365, "Full-finetune/Step Time": 6.6069792583584785} {"Full-finetune/Learning Rate": 1.1922254737881792e-05, "Full-finetune/Loss": 0.8002296090126038, "Full-finetune/Loss (Raw)": 0.5727460384368896, "Full-finetune/Step": 2366, "Full-finetune/Step Time": 6.602755976840854} {"Full-finetune/Learning Rate": 1.1916140931962661e-05, "Full-finetune/Loss": 0.7988878488540649, "Full-finetune/Loss (Raw)": 0.9349555373191833, "Full-finetune/Step": 2367, "Full-finetune/Step Time": 6.607385944575071} {"Full-finetune/Learning Rate": 1.191002638242665e-05, "Full-finetune/Loss": 0.7974066734313965, "Full-finetune/Loss (Raw)": 0.7841556668281555, "Full-finetune/Step": 2368, "Full-finetune/Step Time": 6.602856379002333} {"Full-finetune/Learning Rate": 1.1903911091646684e-05, "Full-finetune/Loss": 0.7975003719329834, "Full-finetune/Loss (Raw)": 0.9578484892845154, "Full-finetune/Step": 2369, "Full-finetune/Step Time": 6.598887629806995} {"Full-finetune/Learning Rate": 1.1897795061995998e-05, "Full-finetune/Loss": 0.797717809677124, "Full-finetune/Loss (Raw)": 0.8155580163002014, "Full-finetune/Step": 2370, "Full-finetune/Step Time": 6.600607104599476} {"Full-finetune/Learning Rate": 1.18916782958481e-05, "Full-finetune/Loss": 0.7986619472503662, "Full-finetune/Loss (Raw)": 0.9188628792762756, "Full-finetune/Step": 2371, "Full-finetune/Step Time": 6.599428394809365} {"Full-finetune/Learning Rate": 1.1885560795576782e-05, "Full-finetune/Loss": 0.7962710857391357, "Full-finetune/Loss (Raw)": 0.7713096141815186, "Full-finetune/Step": 2372, "Full-finetune/Step Time": 6.600797887891531} {"Full-finetune/Learning Rate": 1.1879442563556141e-05, "Full-finetune/Loss": 0.7966739535331726, "Full-finetune/Loss (Raw)": 0.9249224662780762, "Full-finetune/Step": 2373, "Full-finetune/Step Time": 6.621863175183535} {"Full-finetune/Learning Rate": 1.1873323602160526e-05, "Full-finetune/Loss": 0.7949143052101135, "Full-finetune/Loss (Raw)": 0.7314568161964417, "Full-finetune/Step": 2374, "Full-finetune/Step Time": 6.611905777826905} {"Full-finetune/Learning Rate": 1.1867203913764599e-05, "Full-finetune/Loss": 0.794337272644043, "Full-finetune/Loss (Raw)": 0.6385987997055054, "Full-finetune/Step": 2375, "Full-finetune/Step Time": 6.624301366508007} {"Full-finetune/Learning Rate": 1.1861083500743284e-05, "Full-finetune/Loss": 0.7958704233169556, "Full-finetune/Loss (Raw)": 0.9023179411888123, "Full-finetune/Step": 2376, "Full-finetune/Step Time": 6.628798678517342} {"Full-finetune/Learning Rate": 1.1854962365471798e-05, "Full-finetune/Loss": 0.7975468635559082, "Full-finetune/Loss (Raw)": 0.9922767877578735, "Full-finetune/Step": 2377, "Full-finetune/Step Time": 6.628746164962649} {"Full-finetune/Learning Rate": 1.1848840510325635e-05, "Full-finetune/Loss": 0.7985010147094727, "Full-finetune/Loss (Raw)": 0.9029338955879211, "Full-finetune/Step": 2378, "Full-finetune/Step Time": 6.607065377756953} {"Full-finetune/Learning Rate": 1.184271793768056e-05, "Full-finetune/Loss": 0.7984766960144043, "Full-finetune/Loss (Raw)": 0.8637400269508362, "Full-finetune/Step": 2379, "Full-finetune/Step Time": 6.6234319768846035} {"Full-finetune/Learning Rate": 1.1836594649912636e-05, "Full-finetune/Loss": 0.8017095327377319, "Full-finetune/Loss (Raw)": 0.7318395376205444, "Full-finetune/Step": 2380, "Full-finetune/Step Time": 6.603483207523823} {"Full-finetune/Learning Rate": 1.1830470649398183e-05, "Full-finetune/Loss": 0.8010734915733337, "Full-finetune/Loss (Raw)": 0.8260416984558105, "Full-finetune/Step": 2381, "Full-finetune/Step Time": 6.606463307514787} {"Full-finetune/Learning Rate": 1.1824345938513806e-05, "Full-finetune/Loss": 0.7990900278091431, "Full-finetune/Loss (Raw)": 0.6725238561630249, "Full-finetune/Step": 2382, "Full-finetune/Step Time": 6.617400158196688} {"Full-finetune/Learning Rate": 1.181822051963639e-05, "Full-finetune/Loss": 0.7968126535415649, "Full-finetune/Loss (Raw)": 0.5582235455513, "Full-finetune/Step": 2383, "Full-finetune/Step Time": 6.630903076380491} {"Full-finetune/Learning Rate": 1.1812094395143086e-05, "Full-finetune/Loss": 0.7983147501945496, "Full-finetune/Loss (Raw)": 0.953795850276947, "Full-finetune/Step": 2384, "Full-finetune/Step Time": 6.627269292250276} {"Full-finetune/Learning Rate": 1.1805967567411325e-05, "Full-finetune/Loss": 0.7981581687927246, "Full-finetune/Loss (Raw)": 0.8040766716003418, "Full-finetune/Step": 2385, "Full-finetune/Step Time": 6.632347581908107} {"Full-finetune/Learning Rate": 1.1799840038818813e-05, "Full-finetune/Loss": 0.8007182478904724, "Full-finetune/Loss (Raw)": 0.9746625423431396, "Full-finetune/Step": 2386, "Full-finetune/Step Time": 6.638740772381425} {"Full-finetune/Learning Rate": 1.1793711811743515e-05, "Full-finetune/Loss": 0.8012456893920898, "Full-finetune/Loss (Raw)": 0.8189830780029297, "Full-finetune/Step": 2387, "Full-finetune/Step Time": 6.651907572522759} {"Full-finetune/Learning Rate": 1.1787582888563689e-05, "Full-finetune/Loss": 0.8015835285186768, "Full-finetune/Loss (Raw)": 0.8236934542655945, "Full-finetune/Step": 2388, "Full-finetune/Step Time": 6.662029109895229} {"Full-finetune/Learning Rate": 1.1781453271657839e-05, "Full-finetune/Loss": 0.8021105527877808, "Full-finetune/Loss (Raw)": 0.9513294696807861, "Full-finetune/Step": 2389, "Full-finetune/Step Time": 6.661080487072468} {"Full-finetune/Learning Rate": 1.1775322963404757e-05, "Full-finetune/Loss": 0.8017556667327881, "Full-finetune/Loss (Raw)": 0.9450088739395142, "Full-finetune/Step": 2390, "Full-finetune/Step Time": 6.675050104036927} {"Full-finetune/Learning Rate": 1.176919196618349e-05, "Full-finetune/Loss": 0.8027105927467346, "Full-finetune/Loss (Raw)": 0.9161890149116516, "Full-finetune/Step": 2391, "Full-finetune/Step Time": 6.673987040296197} {"Full-finetune/Learning Rate": 1.1763060282373364e-05, "Full-finetune/Loss": 0.802489161491394, "Full-finetune/Loss (Raw)": 0.8514412045478821, "Full-finetune/Step": 2392, "Full-finetune/Step Time": 6.673518402501941} {"Full-finetune/Learning Rate": 1.1756927914353963e-05, "Full-finetune/Loss": 0.8033639788627625, "Full-finetune/Loss (Raw)": 0.9283291697502136, "Full-finetune/Step": 2393, "Full-finetune/Step Time": 6.685950189828873} {"Full-finetune/Learning Rate": 1.175079486450514e-05, "Full-finetune/Loss": 0.8022332787513733, "Full-finetune/Loss (Raw)": 0.39305099844932556, "Full-finetune/Step": 2394, "Full-finetune/Step Time": 6.7061929404735565} {"Full-finetune/Learning Rate": 1.1744661135207009e-05, "Full-finetune/Loss": 0.8027099370956421, "Full-finetune/Loss (Raw)": 0.8691848516464233, "Full-finetune/Step": 2395, "Full-finetune/Step Time": 6.711059492081404} {"Full-finetune/Learning Rate": 1.1738526728839956e-05, "Full-finetune/Loss": 0.8030465841293335, "Full-finetune/Loss (Raw)": 0.7991392612457275, "Full-finetune/Step": 2396, "Full-finetune/Step Time": 6.707776337862015} {"Full-finetune/Learning Rate": 1.1732391647784618e-05, "Full-finetune/Loss": 0.802747368812561, "Full-finetune/Loss (Raw)": 0.852778971195221, "Full-finetune/Step": 2397, "Full-finetune/Step Time": 6.705038970336318} {"Full-finetune/Learning Rate": 1.1726255894421908e-05, "Full-finetune/Loss": 0.8061763048171997, "Full-finetune/Loss (Raw)": 1.015223503112793, "Full-finetune/Step": 2398, "Full-finetune/Step Time": 6.68669749237597} {"Full-finetune/Learning Rate": 1.1720119471132985e-05, "Full-finetune/Loss": 0.8064413070678711, "Full-finetune/Loss (Raw)": 0.9128902554512024, "Full-finetune/Step": 2399, "Full-finetune/Step Time": 6.693322446197271} {"Full-finetune/Learning Rate": 1.1713982380299278e-05, "Full-finetune/Loss": 0.8051645755767822, "Full-finetune/Loss (Raw)": 0.7333165407180786, "Full-finetune/Step": 2400, "Full-finetune/Step Time": 6.684649595990777} {"Full-finetune/Learning Rate": 1.1707844624302471e-05, "Full-finetune/Loss": 0.8052011728286743, "Full-finetune/Loss (Raw)": 0.8134255409240723, "Full-finetune/Step": 2401, "Full-finetune/Step Time": 6.6883917190134525} {"Full-finetune/Learning Rate": 1.170170620552451e-05, "Full-finetune/Loss": 0.8048368692398071, "Full-finetune/Loss (Raw)": 0.7232182025909424, "Full-finetune/Step": 2402, "Full-finetune/Step Time": 6.6728004440665245} {"Full-finetune/Learning Rate": 1.1695567126347593e-05, "Full-finetune/Loss": 0.8042199611663818, "Full-finetune/Loss (Raw)": 0.8391172885894775, "Full-finetune/Step": 2403, "Full-finetune/Step Time": 6.6811074540019035} {"Full-finetune/Learning Rate": 1.1689427389154176e-05, "Full-finetune/Loss": 0.8043447732925415, "Full-finetune/Loss (Raw)": 0.8692181706428528, "Full-finetune/Step": 2404, "Full-finetune/Step Time": 6.679527800530195} {"Full-finetune/Learning Rate": 1.1683286996326975e-05, "Full-finetune/Loss": 0.805345892906189, "Full-finetune/Loss (Raw)": 0.8130768537521362, "Full-finetune/Step": 2405, "Full-finetune/Step Time": 6.665100479498506} {"Full-finetune/Learning Rate": 1.1677145950248954e-05, "Full-finetune/Loss": 0.805825412273407, "Full-finetune/Loss (Raw)": 0.9410353302955627, "Full-finetune/Step": 2406, "Full-finetune/Step Time": 6.667122986167669} {"Full-finetune/Learning Rate": 1.167100425330333e-05, "Full-finetune/Loss": 0.8036623001098633, "Full-finetune/Loss (Raw)": 0.5818277597427368, "Full-finetune/Step": 2407, "Full-finetune/Step Time": 6.689193120226264} {"Full-finetune/Learning Rate": 1.1664861907873583e-05, "Full-finetune/Loss": 0.8050413131713867, "Full-finetune/Loss (Raw)": 1.0177446603775024, "Full-finetune/Step": 2408, "Full-finetune/Step Time": 6.697778835892677} {"Full-finetune/Learning Rate": 1.165871891634343e-05, "Full-finetune/Loss": 0.8049811124801636, "Full-finetune/Loss (Raw)": 0.8142889142036438, "Full-finetune/Step": 2409, "Full-finetune/Step Time": 6.697981491684914} {"Full-finetune/Learning Rate": 1.165257528109685e-05, "Full-finetune/Loss": 0.8048021793365479, "Full-finetune/Loss (Raw)": 0.7926753163337708, "Full-finetune/Step": 2410, "Full-finetune/Step Time": 6.7072672713547945} {"Full-finetune/Learning Rate": 1.1646431004518068e-05, "Full-finetune/Loss": 0.8026244044303894, "Full-finetune/Loss (Raw)": 0.6749153137207031, "Full-finetune/Step": 2411, "Full-finetune/Step Time": 6.714725209400058} {"Full-finetune/Learning Rate": 1.1640286088991558e-05, "Full-finetune/Loss": 0.8036185503005981, "Full-finetune/Loss (Raw)": 0.7648120522499084, "Full-finetune/Step": 2412, "Full-finetune/Step Time": 6.693076292052865} {"Full-finetune/Learning Rate": 1.1634140536902039e-05, "Full-finetune/Loss": 0.8033081889152527, "Full-finetune/Loss (Raw)": 0.7473142147064209, "Full-finetune/Step": 2413, "Full-finetune/Step Time": 6.68304674141109} {"Full-finetune/Learning Rate": 1.1627994350634482e-05, "Full-finetune/Loss": 0.8040515184402466, "Full-finetune/Loss (Raw)": 0.8881513476371765, "Full-finetune/Step": 2414, "Full-finetune/Step Time": 6.679892685264349} {"Full-finetune/Learning Rate": 1.1621847532574101e-05, "Full-finetune/Loss": 0.8058016896247864, "Full-finetune/Loss (Raw)": 0.8280209898948669, "Full-finetune/Step": 2415, "Full-finetune/Step Time": 6.680053364485502} {"Full-finetune/Learning Rate": 1.1615700085106357e-05, "Full-finetune/Loss": 0.8048110008239746, "Full-finetune/Loss (Raw)": 0.7852523326873779, "Full-finetune/Step": 2416, "Full-finetune/Step Time": 6.677529154345393} {"Full-finetune/Learning Rate": 1.1609552010616953e-05, "Full-finetune/Loss": 0.8059455156326294, "Full-finetune/Loss (Raw)": 0.7626281976699829, "Full-finetune/Step": 2417, "Full-finetune/Step Time": 6.675443533807993} {"Full-finetune/Learning Rate": 1.1603403311491841e-05, "Full-finetune/Loss": 0.8021591901779175, "Full-finetune/Loss (Raw)": 0.441741406917572, "Full-finetune/Step": 2418, "Full-finetune/Step Time": 6.693043133243918} {"Full-finetune/Learning Rate": 1.1597253990117205e-05, "Full-finetune/Loss": 0.8022971749305725, "Full-finetune/Loss (Raw)": 0.792153000831604, "Full-finetune/Step": 2419, "Full-finetune/Step Time": 6.699927054345608} {"Full-finetune/Learning Rate": 1.1591104048879479e-05, "Full-finetune/Loss": 0.804223895072937, "Full-finetune/Loss (Raw)": 0.9949325919151306, "Full-finetune/Step": 2420, "Full-finetune/Step Time": 6.689600503072143} {"Full-finetune/Learning Rate": 1.1584953490165334e-05, "Full-finetune/Loss": 0.8049214482307434, "Full-finetune/Loss (Raw)": 0.6598668694496155, "Full-finetune/Step": 2421, "Full-finetune/Step Time": 6.699676621705294} {"Full-finetune/Learning Rate": 1.1578802316361685e-05, "Full-finetune/Loss": 0.803458034992218, "Full-finetune/Loss (Raw)": 0.6833125948905945, "Full-finetune/Step": 2422, "Full-finetune/Step Time": 6.709752060472965} {"Full-finetune/Learning Rate": 1.157265052985568e-05, "Full-finetune/Loss": 0.8019744157791138, "Full-finetune/Loss (Raw)": 0.5927425026893616, "Full-finetune/Step": 2423, "Full-finetune/Step Time": 6.692784925922751} {"Full-finetune/Learning Rate": 1.156649813303471e-05, "Full-finetune/Loss": 0.8035802841186523, "Full-finetune/Loss (Raw)": 0.8923935890197754, "Full-finetune/Step": 2424, "Full-finetune/Step Time": 6.693072412163019} {"Full-finetune/Learning Rate": 1.1560345128286396e-05, "Full-finetune/Loss": 0.8027598857879639, "Full-finetune/Loss (Raw)": 0.6911071538925171, "Full-finetune/Step": 2425, "Full-finetune/Step Time": 6.704163104295731} {"Full-finetune/Learning Rate": 1.1554191517998598e-05, "Full-finetune/Loss": 0.799403190612793, "Full-finetune/Loss (Raw)": 0.3686089515686035, "Full-finetune/Step": 2426, "Full-finetune/Step Time": 6.722263894975185} {"Full-finetune/Learning Rate": 1.1548037304559419e-05, "Full-finetune/Loss": 0.7991432547569275, "Full-finetune/Loss (Raw)": 0.855562150478363, "Full-finetune/Step": 2427, "Full-finetune/Step Time": 6.71392429061234} {"Full-finetune/Learning Rate": 1.1541882490357183e-05, "Full-finetune/Loss": 0.797824501991272, "Full-finetune/Loss (Raw)": 0.7094838619232178, "Full-finetune/Step": 2428, "Full-finetune/Step Time": 6.709024757146835} {"Full-finetune/Learning Rate": 1.1535727077780456e-05, "Full-finetune/Loss": 0.7985004782676697, "Full-finetune/Loss (Raw)": 0.8502620458602905, "Full-finetune/Step": 2429, "Full-finetune/Step Time": 6.721758125349879} {"Full-finetune/Learning Rate": 1.1529571069218033e-05, "Full-finetune/Loss": 0.7982950210571289, "Full-finetune/Loss (Raw)": 0.6934881210327148, "Full-finetune/Step": 2430, "Full-finetune/Step Time": 6.756516406312585} {"Full-finetune/Learning Rate": 1.152341446705894e-05, "Full-finetune/Loss": 0.798577070236206, "Full-finetune/Loss (Raw)": 0.898887038230896, "Full-finetune/Step": 2431, "Full-finetune/Step Time": 6.756105922162533} {"Full-finetune/Learning Rate": 1.1517257273692432e-05, "Full-finetune/Loss": 0.7998199462890625, "Full-finetune/Loss (Raw)": 0.7999553084373474, "Full-finetune/Step": 2432, "Full-finetune/Step Time": 6.759176092222333} {"Full-finetune/Learning Rate": 1.1511099491508003e-05, "Full-finetune/Loss": 0.7997163534164429, "Full-finetune/Loss (Raw)": 0.7363314032554626, "Full-finetune/Step": 2433, "Full-finetune/Step Time": 6.759392231702805} {"Full-finetune/Learning Rate": 1.1504941122895361e-05, "Full-finetune/Loss": 0.7990573644638062, "Full-finetune/Loss (Raw)": 0.8459568619728088, "Full-finetune/Step": 2434, "Full-finetune/Step Time": 6.758851727470756} {"Full-finetune/Learning Rate": 1.1498782170244449e-05, "Full-finetune/Loss": 0.7986364364624023, "Full-finetune/Loss (Raw)": 0.813477098941803, "Full-finetune/Step": 2435, "Full-finetune/Step Time": 6.768790107220411} {"Full-finetune/Learning Rate": 1.1492622635945438e-05, "Full-finetune/Loss": 0.8013511896133423, "Full-finetune/Loss (Raw)": 0.8846073746681213, "Full-finetune/Step": 2436, "Full-finetune/Step Time": 6.762639231979847} {"Full-finetune/Learning Rate": 1.1486462522388724e-05, "Full-finetune/Loss": 0.8011668920516968, "Full-finetune/Loss (Raw)": 0.7655396461486816, "Full-finetune/Step": 2437, "Full-finetune/Step Time": 6.7684352323412895} {"Full-finetune/Learning Rate": 1.1480301831964926e-05, "Full-finetune/Loss": 0.8013370037078857, "Full-finetune/Loss (Raw)": 0.9138878583908081, "Full-finetune/Step": 2438, "Full-finetune/Step Time": 6.772637467831373} {"Full-finetune/Learning Rate": 1.1474140567064889e-05, "Full-finetune/Loss": 0.8013327121734619, "Full-finetune/Loss (Raw)": 0.9030774235725403, "Full-finetune/Step": 2439, "Full-finetune/Step Time": 6.773094331845641} {"Full-finetune/Learning Rate": 1.1467978730079677e-05, "Full-finetune/Loss": 0.8028843402862549, "Full-finetune/Loss (Raw)": 0.906822681427002, "Full-finetune/Step": 2440, "Full-finetune/Step Time": 6.753366824239492} {"Full-finetune/Learning Rate": 1.1461816323400579e-05, "Full-finetune/Loss": 0.8037943840026855, "Full-finetune/Loss (Raw)": 0.9198711514472961, "Full-finetune/Step": 2441, "Full-finetune/Step Time": 6.749220412224531} {"Full-finetune/Learning Rate": 1.1455653349419105e-05, "Full-finetune/Loss": 0.8044500350952148, "Full-finetune/Loss (Raw)": 0.8359699249267578, "Full-finetune/Step": 2442, "Full-finetune/Step Time": 6.744853934273124} {"Full-finetune/Learning Rate": 1.1449489810526985e-05, "Full-finetune/Loss": 0.8056341409683228, "Full-finetune/Loss (Raw)": 0.9287407398223877, "Full-finetune/Step": 2443, "Full-finetune/Step Time": 6.760910691693425} {"Full-finetune/Learning Rate": 1.144332570911617e-05, "Full-finetune/Loss": 0.8051401376724243, "Full-finetune/Loss (Raw)": 0.8586509227752686, "Full-finetune/Step": 2444, "Full-finetune/Step Time": 6.767378743737936} {"Full-finetune/Learning Rate": 1.1437161047578826e-05, "Full-finetune/Loss": 0.8021247386932373, "Full-finetune/Loss (Raw)": 0.38980937004089355, "Full-finetune/Step": 2445, "Full-finetune/Step Time": 6.781836932525039} {"Full-finetune/Learning Rate": 1.1430995828307337e-05, "Full-finetune/Loss": 0.8032400608062744, "Full-finetune/Loss (Raw)": 0.8776997923851013, "Full-finetune/Step": 2446, "Full-finetune/Step Time": 6.772592045366764} {"Full-finetune/Learning Rate": 1.1424830053694303e-05, "Full-finetune/Loss": 0.8025333881378174, "Full-finetune/Loss (Raw)": 0.8554618954658508, "Full-finetune/Step": 2447, "Full-finetune/Step Time": 6.778224695473909} {"Full-finetune/Learning Rate": 1.1418663726132543e-05, "Full-finetune/Loss": 0.8035404086112976, "Full-finetune/Loss (Raw)": 0.9087954163551331, "Full-finetune/Step": 2448, "Full-finetune/Step Time": 6.778761122375727} {"Full-finetune/Learning Rate": 1.141249684801509e-05, "Full-finetune/Loss": 0.8028247356414795, "Full-finetune/Loss (Raw)": 0.7217958569526672, "Full-finetune/Step": 2449, "Full-finetune/Step Time": 6.7709309458732605} {"Full-finetune/Learning Rate": 1.140632942173519e-05, "Full-finetune/Loss": 0.8000826835632324, "Full-finetune/Loss (Raw)": 0.4839191138744354, "Full-finetune/Step": 2450, "Full-finetune/Step Time": 6.797348037362099} {"Full-finetune/Learning Rate": 1.1400161449686293e-05, "Full-finetune/Loss": 0.7971545457839966, "Full-finetune/Loss (Raw)": 0.31682726740837097, "Full-finetune/Step": 2451, "Full-finetune/Step Time": 6.803915768861771} {"Full-finetune/Learning Rate": 1.1393992934262073e-05, "Full-finetune/Loss": 0.7970705628395081, "Full-finetune/Loss (Raw)": 0.7700661420822144, "Full-finetune/Step": 2452, "Full-finetune/Step Time": 6.805202646180987} {"Full-finetune/Learning Rate": 1.1387823877856413e-05, "Full-finetune/Loss": 0.7965695858001709, "Full-finetune/Loss (Raw)": 0.7961486577987671, "Full-finetune/Step": 2453, "Full-finetune/Step Time": 6.822756372392178} {"Full-finetune/Learning Rate": 1.1381654282863399e-05, "Full-finetune/Loss": 0.7996153831481934, "Full-finetune/Loss (Raw)": 0.826087474822998, "Full-finetune/Step": 2454, "Full-finetune/Step Time": 6.814052287489176} {"Full-finetune/Learning Rate": 1.1375484151677334e-05, "Full-finetune/Loss": 0.7999246120452881, "Full-finetune/Loss (Raw)": 0.8788909316062927, "Full-finetune/Step": 2455, "Full-finetune/Step Time": 6.801399126648903} {"Full-finetune/Learning Rate": 1.1369313486692723e-05, "Full-finetune/Loss": 0.8009566068649292, "Full-finetune/Loss (Raw)": 0.8749148845672607, "Full-finetune/Step": 2456, "Full-finetune/Step Time": 6.791909785941243} {"Full-finetune/Learning Rate": 1.136314229030428e-05, "Full-finetune/Loss": 0.8004278540611267, "Full-finetune/Loss (Raw)": 0.855857789516449, "Full-finetune/Step": 2457, "Full-finetune/Step Time": 6.7890313267707825} {"Full-finetune/Learning Rate": 1.1356970564906928e-05, "Full-finetune/Loss": 0.8011857271194458, "Full-finetune/Loss (Raw)": 0.8128222823143005, "Full-finetune/Step": 2458, "Full-finetune/Step Time": 6.795417075976729} {"Full-finetune/Learning Rate": 1.1350798312895795e-05, "Full-finetune/Loss": 0.8009190559387207, "Full-finetune/Loss (Raw)": 0.7753285765647888, "Full-finetune/Step": 2459, "Full-finetune/Step Time": 6.789921868592501} {"Full-finetune/Learning Rate": 1.1344625536666208e-05, "Full-finetune/Loss": 0.7989513278007507, "Full-finetune/Loss (Raw)": 0.7557016015052795, "Full-finetune/Step": 2460, "Full-finetune/Step Time": 6.774018429219723} {"Full-finetune/Learning Rate": 1.13384522386137e-05, "Full-finetune/Loss": 0.7996393442153931, "Full-finetune/Loss (Raw)": 0.958654522895813, "Full-finetune/Step": 2461, "Full-finetune/Step Time": 6.771984765306115} {"Full-finetune/Learning Rate": 1.1332278421134007e-05, "Full-finetune/Loss": 0.7998139262199402, "Full-finetune/Loss (Raw)": 0.8703271746635437, "Full-finetune/Step": 2462, "Full-finetune/Step Time": 6.749669874086976} {"Full-finetune/Learning Rate": 1.1326104086623075e-05, "Full-finetune/Loss": 0.7995326519012451, "Full-finetune/Loss (Raw)": 0.7896871566772461, "Full-finetune/Step": 2463, "Full-finetune/Step Time": 6.750396121293306} {"Full-finetune/Learning Rate": 1.1319929237477033e-05, "Full-finetune/Loss": 0.8002188205718994, "Full-finetune/Loss (Raw)": 0.9061468839645386, "Full-finetune/Step": 2464, "Full-finetune/Step Time": 6.7354071866720915} {"Full-finetune/Learning Rate": 1.1313753876092223e-05, "Full-finetune/Loss": 0.7994163632392883, "Full-finetune/Loss (Raw)": 0.8267500400543213, "Full-finetune/Step": 2465, "Full-finetune/Step Time": 6.738247202709317} {"Full-finetune/Learning Rate": 1.1307578004865188e-05, "Full-finetune/Loss": 0.7986782193183899, "Full-finetune/Loss (Raw)": 0.7657619714736938, "Full-finetune/Step": 2466, "Full-finetune/Step Time": 6.740478632971644} {"Full-finetune/Learning Rate": 1.130140162619265e-05, "Full-finetune/Loss": 0.7993199825286865, "Full-finetune/Loss (Raw)": 0.8149559497833252, "Full-finetune/Step": 2467, "Full-finetune/Step Time": 6.720338383689523} {"Full-finetune/Learning Rate": 1.1295224742471555e-05, "Full-finetune/Loss": 0.8007906675338745, "Full-finetune/Loss (Raw)": 0.9442125558853149, "Full-finetune/Step": 2468, "Full-finetune/Step Time": 6.724789852276444} {"Full-finetune/Learning Rate": 1.128904735609902e-05, "Full-finetune/Loss": 0.8008559346199036, "Full-finetune/Loss (Raw)": 0.9040125012397766, "Full-finetune/Step": 2469, "Full-finetune/Step Time": 6.697672933340073} {"Full-finetune/Learning Rate": 1.1282869469472375e-05, "Full-finetune/Loss": 0.8040016889572144, "Full-finetune/Loss (Raw)": 0.7594889402389526, "Full-finetune/Step": 2470, "Full-finetune/Step Time": 6.6866103913635015} {"Full-finetune/Learning Rate": 1.1276691084989135e-05, "Full-finetune/Loss": 0.8038449287414551, "Full-finetune/Loss (Raw)": 0.9025753140449524, "Full-finetune/Step": 2471, "Full-finetune/Step Time": 6.670060936361551} {"Full-finetune/Learning Rate": 1.1270512205047008e-05, "Full-finetune/Loss": 0.8042927980422974, "Full-finetune/Loss (Raw)": 0.8296034336090088, "Full-finetune/Step": 2472, "Full-finetune/Step Time": 6.644810352474451} {"Full-finetune/Learning Rate": 1.1264332832043902e-05, "Full-finetune/Loss": 0.8031800985336304, "Full-finetune/Loss (Raw)": 0.8817951679229736, "Full-finetune/Step": 2473, "Full-finetune/Step Time": 6.651709521189332} {"Full-finetune/Learning Rate": 1.1258152968377907e-05, "Full-finetune/Loss": 0.8031162023544312, "Full-finetune/Loss (Raw)": 0.7938753366470337, "Full-finetune/Step": 2474, "Full-finetune/Step Time": 6.666642924770713} {"Full-finetune/Learning Rate": 1.125197261644731e-05, "Full-finetune/Loss": 0.8030133247375488, "Full-finetune/Loss (Raw)": 0.8191025853157043, "Full-finetune/Step": 2475, "Full-finetune/Step Time": 6.66627586260438} {"Full-finetune/Learning Rate": 1.1245791778650578e-05, "Full-finetune/Loss": 0.8029807806015015, "Full-finetune/Loss (Raw)": 0.8488374352455139, "Full-finetune/Step": 2476, "Full-finetune/Step Time": 6.663882711902261} {"Full-finetune/Learning Rate": 1.1239610457386381e-05, "Full-finetune/Loss": 0.8032962679862976, "Full-finetune/Loss (Raw)": 0.8235849142074585, "Full-finetune/Step": 2477, "Full-finetune/Step Time": 6.661443177610636} {"Full-finetune/Learning Rate": 1.1233428655053572e-05, "Full-finetune/Loss": 0.8033009171485901, "Full-finetune/Loss (Raw)": 0.82321697473526, "Full-finetune/Step": 2478, "Full-finetune/Step Time": 6.660916173830628} {"Full-finetune/Learning Rate": 1.1227246374051175e-05, "Full-finetune/Loss": 0.801507830619812, "Full-finetune/Loss (Raw)": 0.7085902094841003, "Full-finetune/Step": 2479, "Full-finetune/Step Time": 6.6609260533005} {"Full-finetune/Learning Rate": 1.1221063616778425e-05, "Full-finetune/Loss": 0.80050128698349, "Full-finetune/Loss (Raw)": 0.7128582000732422, "Full-finetune/Step": 2480, "Full-finetune/Step Time": 6.660068906843662} {"Full-finetune/Learning Rate": 1.1214880385634723e-05, "Full-finetune/Loss": 0.7968729734420776, "Full-finetune/Loss (Raw)": 0.3732878863811493, "Full-finetune/Step": 2481, "Full-finetune/Step Time": 6.675942288711667} {"Full-finetune/Learning Rate": 1.120869668301966e-05, "Full-finetune/Loss": 0.7983775734901428, "Full-finetune/Loss (Raw)": 1.030585765838623, "Full-finetune/Step": 2482, "Full-finetune/Step Time": 6.67378025315702} {"Full-finetune/Learning Rate": 1.1202512511333017e-05, "Full-finetune/Loss": 0.7983849048614502, "Full-finetune/Loss (Raw)": 0.7786911725997925, "Full-finetune/Step": 2483, "Full-finetune/Step Time": 6.669723117724061} {"Full-finetune/Learning Rate": 1.119632787297474e-05, "Full-finetune/Loss": 0.7986711263656616, "Full-finetune/Loss (Raw)": 0.7286210656166077, "Full-finetune/Step": 2484, "Full-finetune/Step Time": 6.6750618033111095} {"Full-finetune/Learning Rate": 1.1190142770344976e-05, "Full-finetune/Loss": 0.7988114953041077, "Full-finetune/Loss (Raw)": 0.8456102013587952, "Full-finetune/Step": 2485, "Full-finetune/Step Time": 6.677073244005442} {"Full-finetune/Learning Rate": 1.1183957205844037e-05, "Full-finetune/Loss": 0.7967966794967651, "Full-finetune/Loss (Raw)": 0.6495225429534912, "Full-finetune/Step": 2486, "Full-finetune/Step Time": 6.687610043212771} {"Full-finetune/Learning Rate": 1.1177771181872416e-05, "Full-finetune/Loss": 0.7969583868980408, "Full-finetune/Loss (Raw)": 0.3124712109565735, "Full-finetune/Step": 2487, "Full-finetune/Step Time": 6.686450557783246} {"Full-finetune/Learning Rate": 1.1171584700830803e-05, "Full-finetune/Loss": 0.7970837354660034, "Full-finetune/Loss (Raw)": 0.899070680141449, "Full-finetune/Step": 2488, "Full-finetune/Step Time": 6.686944281682372} {"Full-finetune/Learning Rate": 1.1165397765120035e-05, "Full-finetune/Loss": 0.7970250844955444, "Full-finetune/Loss (Raw)": 0.8800864219665527, "Full-finetune/Step": 2489, "Full-finetune/Step Time": 6.705420298501849} {"Full-finetune/Learning Rate": 1.115921037714115e-05, "Full-finetune/Loss": 0.7930067777633667, "Full-finetune/Loss (Raw)": 0.31730806827545166, "Full-finetune/Step": 2490, "Full-finetune/Step Time": 6.7288158889859915} {"Full-finetune/Learning Rate": 1.1153022539295345e-05, "Full-finetune/Loss": 0.7948685884475708, "Full-finetune/Loss (Raw)": 0.7883375883102417, "Full-finetune/Step": 2491, "Full-finetune/Step Time": 6.723004195839167} {"Full-finetune/Learning Rate": 1.1146834253984008e-05, "Full-finetune/Loss": 0.7946150898933411, "Full-finetune/Loss (Raw)": 0.7258987426757812, "Full-finetune/Step": 2492, "Full-finetune/Step Time": 6.724981460720301} {"Full-finetune/Learning Rate": 1.1140645523608684e-05, "Full-finetune/Loss": 0.7946103811264038, "Full-finetune/Loss (Raw)": 0.8589149117469788, "Full-finetune/Step": 2493, "Full-finetune/Step Time": 6.733368853107095} {"Full-finetune/Learning Rate": 1.1134456350571099e-05, "Full-finetune/Loss": 0.797367513179779, "Full-finetune/Loss (Raw)": 0.925660252571106, "Full-finetune/Step": 2494, "Full-finetune/Step Time": 6.723197270184755} {"Full-finetune/Learning Rate": 1.112826673727316e-05, "Full-finetune/Loss": 0.7968270778656006, "Full-finetune/Loss (Raw)": 0.8657755255699158, "Full-finetune/Step": 2495, "Full-finetune/Step Time": 6.717133484780788} {"Full-finetune/Learning Rate": 1.112207668611692e-05, "Full-finetune/Loss": 0.7966909408569336, "Full-finetune/Loss (Raw)": 0.7667313814163208, "Full-finetune/Step": 2496, "Full-finetune/Step Time": 6.749510003253818} {"Full-finetune/Learning Rate": 1.1115886199504631e-05, "Full-finetune/Loss": 0.7944849729537964, "Full-finetune/Loss (Raw)": 0.6754871606826782, "Full-finetune/Step": 2497, "Full-finetune/Step Time": 6.749027993530035} {"Full-finetune/Learning Rate": 1.110969527983869e-05, "Full-finetune/Loss": 0.7954497337341309, "Full-finetune/Loss (Raw)": 0.9390501379966736, "Full-finetune/Step": 2498, "Full-finetune/Step Time": 6.7607243321835995} {"Full-finetune/Learning Rate": 1.1103503929521677e-05, "Full-finetune/Loss": 0.7923064827919006, "Full-finetune/Loss (Raw)": 0.5165206789970398, "Full-finetune/Step": 2499, "Full-finetune/Step Time": 6.772835848852992} {"Full-finetune/Learning Rate": 1.1097312150956336e-05, "Full-finetune/Loss": 0.7930454015731812, "Full-finetune/Loss (Raw)": 0.8658989667892456, "Full-finetune/Step": 2500, "Full-finetune/Step Time": 6.773547574877739} {"Full-finetune/Learning Rate": 1.1091119946545568e-05, "Full-finetune/Loss": 0.7928249835968018, "Full-finetune/Loss (Raw)": 0.8966997265815735, "Full-finetune/Step": 2501, "Full-finetune/Step Time": 6.7547025959938765} {"Full-finetune/Learning Rate": 1.1084927318692453e-05, "Full-finetune/Loss": 0.7939262986183167, "Full-finetune/Loss (Raw)": 0.8724316358566284, "Full-finetune/Step": 2502, "Full-finetune/Step Time": 6.7653165850788355} {"Full-finetune/Learning Rate": 1.1078734269800227e-05, "Full-finetune/Loss": 0.7954152822494507, "Full-finetune/Loss (Raw)": 0.8291915655136108, "Full-finetune/Step": 2503, "Full-finetune/Step Time": 6.744785146787763} {"Full-finetune/Learning Rate": 1.1072540802272291e-05, "Full-finetune/Loss": 0.7948992848396301, "Full-finetune/Loss (Raw)": 0.8362681269645691, "Full-finetune/Step": 2504, "Full-finetune/Step Time": 6.749566083773971} {"Full-finetune/Learning Rate": 1.1066346918512211e-05, "Full-finetune/Loss": 0.7936620712280273, "Full-finetune/Loss (Raw)": 0.8339139819145203, "Full-finetune/Step": 2505, "Full-finetune/Step Time": 6.748471824452281} {"Full-finetune/Learning Rate": 1.1060152620923707e-05, "Full-finetune/Loss": 0.7928344011306763, "Full-finetune/Loss (Raw)": 0.7969925403594971, "Full-finetune/Step": 2506, "Full-finetune/Step Time": 6.752357626333833} {"Full-finetune/Learning Rate": 1.105395791191067e-05, "Full-finetune/Loss": 0.7932772636413574, "Full-finetune/Loss (Raw)": 0.9204164147377014, "Full-finetune/Step": 2507, "Full-finetune/Step Time": 6.739712305366993} {"Full-finetune/Learning Rate": 1.1047762793877146e-05, "Full-finetune/Loss": 0.7933034300804138, "Full-finetune/Loss (Raw)": 0.735197126865387, "Full-finetune/Step": 2508, "Full-finetune/Step Time": 6.7467599511146545} {"Full-finetune/Learning Rate": 1.1041567269227336e-05, "Full-finetune/Loss": 0.7931320667266846, "Full-finetune/Loss (Raw)": 0.8041041493415833, "Full-finetune/Step": 2509, "Full-finetune/Step Time": 6.749624989926815} {"Full-finetune/Learning Rate": 1.1035371340365606e-05, "Full-finetune/Loss": 0.795076847076416, "Full-finetune/Loss (Raw)": 0.9214608073234558, "Full-finetune/Step": 2510, "Full-finetune/Step Time": 6.733472935855389} {"Full-finetune/Learning Rate": 1.1029175009696468e-05, "Full-finetune/Loss": 0.797508180141449, "Full-finetune/Loss (Raw)": 0.8694267868995667, "Full-finetune/Step": 2511, "Full-finetune/Step Time": 6.729928964748979} {"Full-finetune/Learning Rate": 1.1022978279624606e-05, "Full-finetune/Loss": 0.795610785484314, "Full-finetune/Loss (Raw)": 0.7109354734420776, "Full-finetune/Step": 2512, "Full-finetune/Step Time": 6.739195004105568} {"Full-finetune/Learning Rate": 1.1016781152554846e-05, "Full-finetune/Loss": 0.7951003909111023, "Full-finetune/Loss (Raw)": 0.7387427687644958, "Full-finetune/Step": 2513, "Full-finetune/Step Time": 6.738391725346446} {"Full-finetune/Learning Rate": 1.1010583630892166e-05, "Full-finetune/Loss": 0.7941538095474243, "Full-finetune/Loss (Raw)": 0.8535035252571106, "Full-finetune/Step": 2514, "Full-finetune/Step Time": 6.743988798931241} {"Full-finetune/Learning Rate": 1.1004385717041716e-05, "Full-finetune/Loss": 0.7928044199943542, "Full-finetune/Loss (Raw)": 0.6462597846984863, "Full-finetune/Step": 2515, "Full-finetune/Step Time": 6.749678861349821} {"Full-finetune/Learning Rate": 1.0998187413408774e-05, "Full-finetune/Loss": 0.7925190329551697, "Full-finetune/Loss (Raw)": 0.7871658205986023, "Full-finetune/Step": 2516, "Full-finetune/Step Time": 6.726888215169311} {"Full-finetune/Learning Rate": 1.0991988722398786e-05, "Full-finetune/Loss": 0.7917317152023315, "Full-finetune/Loss (Raw)": 0.8505529165267944, "Full-finetune/Step": 2517, "Full-finetune/Step Time": 6.729877833276987} {"Full-finetune/Learning Rate": 1.0985789646417341e-05, "Full-finetune/Loss": 0.7902482151985168, "Full-finetune/Loss (Raw)": 0.7551218271255493, "Full-finetune/Step": 2518, "Full-finetune/Step Time": 6.725310338661075} {"Full-finetune/Learning Rate": 1.097959018787018e-05, "Full-finetune/Loss": 0.7892090082168579, "Full-finetune/Loss (Raw)": 0.7831589579582214, "Full-finetune/Step": 2519, "Full-finetune/Step Time": 6.729807874187827} {"Full-finetune/Learning Rate": 1.0973390349163195e-05, "Full-finetune/Loss": 0.7897918820381165, "Full-finetune/Loss (Raw)": 0.9260604977607727, "Full-finetune/Step": 2520, "Full-finetune/Step Time": 6.718909928575158} {"Full-finetune/Learning Rate": 1.0967190132702414e-05, "Full-finetune/Loss": 0.7856721878051758, "Full-finetune/Loss (Raw)": 0.40100884437561035, "Full-finetune/Step": 2521, "Full-finetune/Step Time": 6.72205731458962} {"Full-finetune/Learning Rate": 1.096098954089403e-05, "Full-finetune/Loss": 0.7889859080314636, "Full-finetune/Loss (Raw)": 0.817205011844635, "Full-finetune/Step": 2522, "Full-finetune/Step Time": 6.714441673830152} {"Full-finetune/Learning Rate": 1.0954788576144365e-05, "Full-finetune/Loss": 0.7868807315826416, "Full-finetune/Loss (Raw)": 0.5997141003608704, "Full-finetune/Step": 2523, "Full-finetune/Step Time": 6.715714987367392} {"Full-finetune/Learning Rate": 1.0948587240859893e-05, "Full-finetune/Loss": 0.7867711782455444, "Full-finetune/Loss (Raw)": 0.785121500492096, "Full-finetune/Step": 2524, "Full-finetune/Step Time": 6.715789278969169} {"Full-finetune/Learning Rate": 1.0942385537447236e-05, "Full-finetune/Loss": 0.7848325371742249, "Full-finetune/Loss (Raw)": 0.6046353578567505, "Full-finetune/Step": 2525, "Full-finetune/Step Time": 6.7292949836701155} {"Full-finetune/Learning Rate": 1.0936183468313147e-05, "Full-finetune/Loss": 0.7836108803749084, "Full-finetune/Loss (Raw)": 0.8588545918464661, "Full-finetune/Step": 2526, "Full-finetune/Step Time": 6.741930890828371} {"Full-finetune/Learning Rate": 1.0929981035864532e-05, "Full-finetune/Loss": 0.782967209815979, "Full-finetune/Loss (Raw)": 0.8304888606071472, "Full-finetune/Step": 2527, "Full-finetune/Step Time": 6.751384092494845} {"Full-finetune/Learning Rate": 1.0923778242508437e-05, "Full-finetune/Loss": 0.7845958471298218, "Full-finetune/Loss (Raw)": 0.9417921900749207, "Full-finetune/Step": 2528, "Full-finetune/Step Time": 6.758515821769834} {"Full-finetune/Learning Rate": 1.0917575090652038e-05, "Full-finetune/Loss": 0.7803165912628174, "Full-finetune/Loss (Raw)": 0.26567354798316956, "Full-finetune/Step": 2529, "Full-finetune/Step Time": 6.77452577650547} {"Full-finetune/Learning Rate": 1.091137158270266e-05, "Full-finetune/Loss": 0.7813827991485596, "Full-finetune/Loss (Raw)": 0.8596950769424438, "Full-finetune/Step": 2530, "Full-finetune/Step Time": 6.766128433868289} {"Full-finetune/Learning Rate": 1.0905167721067762e-05, "Full-finetune/Loss": 0.7807859182357788, "Full-finetune/Loss (Raw)": 0.7627215385437012, "Full-finetune/Step": 2531, "Full-finetune/Step Time": 6.7651553470641375} {"Full-finetune/Learning Rate": 1.0898963508154947e-05, "Full-finetune/Loss": 0.7802979946136475, "Full-finetune/Loss (Raw)": 0.8067612648010254, "Full-finetune/Step": 2532, "Full-finetune/Step Time": 6.782528173178434} {"Full-finetune/Learning Rate": 1.0892758946371943e-05, "Full-finetune/Loss": 0.7794461250305176, "Full-finetune/Loss (Raw)": 0.7040384411811829, "Full-finetune/Step": 2533, "Full-finetune/Step Time": 6.785065624862909} {"Full-finetune/Learning Rate": 1.0886554038126624e-05, "Full-finetune/Loss": 0.7750214338302612, "Full-finetune/Loss (Raw)": 0.37467435002326965, "Full-finetune/Step": 2534, "Full-finetune/Step Time": 6.802724350243807} {"Full-finetune/Learning Rate": 1.0880348785826991e-05, "Full-finetune/Loss": 0.7776609063148499, "Full-finetune/Loss (Raw)": 0.9196743369102478, "Full-finetune/Step": 2535, "Full-finetune/Step Time": 6.787019634619355} {"Full-finetune/Learning Rate": 1.087414319188118e-05, "Full-finetune/Loss": 0.7745543122291565, "Full-finetune/Loss (Raw)": 0.6201061010360718, "Full-finetune/Step": 2536, "Full-finetune/Step Time": 6.794817758724093} {"Full-finetune/Learning Rate": 1.0867937258697463e-05, "Full-finetune/Loss": 0.7740767002105713, "Full-finetune/Loss (Raw)": 0.7531506419181824, "Full-finetune/Step": 2537, "Full-finetune/Step Time": 6.801060542464256} {"Full-finetune/Learning Rate": 1.086173098868424e-05, "Full-finetune/Loss": 0.7747557163238525, "Full-finetune/Loss (Raw)": 0.8795939683914185, "Full-finetune/Step": 2538, "Full-finetune/Step Time": 6.804718868806958} {"Full-finetune/Learning Rate": 1.0855524384250048e-05, "Full-finetune/Loss": 0.7756829857826233, "Full-finetune/Loss (Raw)": 0.7936026453971863, "Full-finetune/Step": 2539, "Full-finetune/Step Time": 6.803500063717365} {"Full-finetune/Learning Rate": 1.0849317447803542e-05, "Full-finetune/Loss": 0.7763609886169434, "Full-finetune/Loss (Raw)": 0.8516026139259338, "Full-finetune/Step": 2540, "Full-finetune/Step Time": 6.802739264443517} {"Full-finetune/Learning Rate": 1.0843110181753513e-05, "Full-finetune/Loss": 0.7755353450775146, "Full-finetune/Loss (Raw)": 0.641630232334137, "Full-finetune/Step": 2541, "Full-finetune/Step Time": 6.819727659225464} {"Full-finetune/Learning Rate": 1.0836902588508888e-05, "Full-finetune/Loss": 0.7751103639602661, "Full-finetune/Loss (Raw)": 0.8337493538856506, "Full-finetune/Step": 2542, "Full-finetune/Step Time": 6.813475301489234} {"Full-finetune/Learning Rate": 1.0830694670478706e-05, "Full-finetune/Loss": 0.7752233147621155, "Full-finetune/Loss (Raw)": 0.8424767255783081, "Full-finetune/Step": 2543, "Full-finetune/Step Time": 6.807606551796198} {"Full-finetune/Learning Rate": 1.082448643007214e-05, "Full-finetune/Loss": 0.7740703821182251, "Full-finetune/Loss (Raw)": 0.6376776099205017, "Full-finetune/Step": 2544, "Full-finetune/Step Time": 6.818078281357884} {"Full-finetune/Learning Rate": 1.0818277869698488e-05, "Full-finetune/Loss": 0.7744238376617432, "Full-finetune/Loss (Raw)": 0.8078792691230774, "Full-finetune/Step": 2545, "Full-finetune/Step Time": 6.8117116298526525} {"Full-finetune/Learning Rate": 1.0812068991767171e-05, "Full-finetune/Loss": 0.773155152797699, "Full-finetune/Loss (Raw)": 0.2793460190296173, "Full-finetune/Step": 2546, "Full-finetune/Step Time": 6.811595434322953} {"Full-finetune/Learning Rate": 1.0805859798687727e-05, "Full-finetune/Loss": 0.7731722593307495, "Full-finetune/Loss (Raw)": 0.7943349480628967, "Full-finetune/Step": 2547, "Full-finetune/Step Time": 6.783371893689036} {"Full-finetune/Learning Rate": 1.0799650292869835e-05, "Full-finetune/Loss": 0.7728482484817505, "Full-finetune/Loss (Raw)": 0.9534710049629211, "Full-finetune/Step": 2548, "Full-finetune/Step Time": 6.786349916830659} {"Full-finetune/Learning Rate": 1.0793440476723274e-05, "Full-finetune/Loss": 0.7701904773712158, "Full-finetune/Loss (Raw)": 0.31965959072113037, "Full-finetune/Step": 2549, "Full-finetune/Step Time": 6.785178711637855} {"Full-finetune/Learning Rate": 1.0787230352657954e-05, "Full-finetune/Loss": 0.7711927890777588, "Full-finetune/Loss (Raw)": 0.8116142153739929, "Full-finetune/Step": 2550, "Full-finetune/Step Time": 6.785261865705252} {"Full-finetune/Learning Rate": 1.0781019923083905e-05, "Full-finetune/Loss": 0.7735614776611328, "Full-finetune/Loss (Raw)": 0.895929217338562, "Full-finetune/Step": 2551, "Full-finetune/Step Time": 6.7813411466777325} {"Full-finetune/Learning Rate": 1.077480919041127e-05, "Full-finetune/Loss": 0.7746797800064087, "Full-finetune/Loss (Raw)": 1.0355459451675415, "Full-finetune/Step": 2552, "Full-finetune/Step Time": 6.782348269596696} {"Full-finetune/Learning Rate": 1.0768598157050313e-05, "Full-finetune/Loss": 0.7749707102775574, "Full-finetune/Loss (Raw)": 0.7283426523208618, "Full-finetune/Step": 2553, "Full-finetune/Step Time": 6.782948778942227} {"Full-finetune/Learning Rate": 1.0762386825411422e-05, "Full-finetune/Loss": 0.7786135673522949, "Full-finetune/Loss (Raw)": 0.8348878026008606, "Full-finetune/Step": 2554, "Full-finetune/Step Time": 6.801256211474538} {"Full-finetune/Learning Rate": 1.0756175197905086e-05, "Full-finetune/Loss": 0.7744923830032349, "Full-finetune/Loss (Raw)": 0.32805734872817993, "Full-finetune/Step": 2555, "Full-finetune/Step Time": 6.829152036458254} {"Full-finetune/Learning Rate": 1.0749963276941919e-05, "Full-finetune/Loss": 0.7755674719810486, "Full-finetune/Loss (Raw)": 0.8470907807350159, "Full-finetune/Step": 2556, "Full-finetune/Step Time": 6.8286508191376925} {"Full-finetune/Learning Rate": 1.0743751064932648e-05, "Full-finetune/Loss": 0.7743180990219116, "Full-finetune/Loss (Raw)": 0.6903400421142578, "Full-finetune/Step": 2557, "Full-finetune/Step Time": 6.811435781419277} {"Full-finetune/Learning Rate": 1.0737538564288104e-05, "Full-finetune/Loss": 0.7752401828765869, "Full-finetune/Loss (Raw)": 0.8115189671516418, "Full-finetune/Step": 2558, "Full-finetune/Step Time": 6.770903144031763} {"Full-finetune/Learning Rate": 1.0731325777419246e-05, "Full-finetune/Loss": 0.7739375233650208, "Full-finetune/Loss (Raw)": 0.7321455478668213, "Full-finetune/Step": 2559, "Full-finetune/Step Time": 6.769052516669035} {"Full-finetune/Learning Rate": 1.0725112706737133e-05, "Full-finetune/Loss": 0.7722631692886353, "Full-finetune/Loss (Raw)": 0.5856454372406006, "Full-finetune/Step": 2560, "Full-finetune/Step Time": 6.777155049145222} {"Full-finetune/Learning Rate": 1.0718899354652931e-05, "Full-finetune/Loss": 0.7729673385620117, "Full-finetune/Loss (Raw)": 0.8264594674110413, "Full-finetune/Step": 2561, "Full-finetune/Step Time": 6.779944933950901} {"Full-finetune/Learning Rate": 1.071268572357793e-05, "Full-finetune/Loss": 0.7733628749847412, "Full-finetune/Loss (Raw)": 0.8965883255004883, "Full-finetune/Step": 2562, "Full-finetune/Step Time": 6.778307033702731} {"Full-finetune/Learning Rate": 1.0706471815923511e-05, "Full-finetune/Loss": 0.7703723907470703, "Full-finetune/Loss (Raw)": 0.4306912422180176, "Full-finetune/Step": 2563, "Full-finetune/Step Time": 6.775661384686828} {"Full-finetune/Learning Rate": 1.070025763410117e-05, "Full-finetune/Loss": 0.770086407661438, "Full-finetune/Loss (Raw)": 0.848006546497345, "Full-finetune/Step": 2564, "Full-finetune/Step Time": 6.777816021814942} {"Full-finetune/Learning Rate": 1.0694043180522515e-05, "Full-finetune/Loss": 0.771027147769928, "Full-finetune/Loss (Raw)": 0.8859489560127258, "Full-finetune/Step": 2565, "Full-finetune/Step Time": 6.774951299652457} {"Full-finetune/Learning Rate": 1.0687828457599254e-05, "Full-finetune/Loss": 0.7705099582672119, "Full-finetune/Loss (Raw)": 0.8476874232292175, "Full-finetune/Step": 2566, "Full-finetune/Step Time": 6.778248963877559} {"Full-finetune/Learning Rate": 1.0681613467743195e-05, "Full-finetune/Loss": 0.7691901922225952, "Full-finetune/Loss (Raw)": 0.7341556549072266, "Full-finetune/Step": 2567, "Full-finetune/Step Time": 6.782487731426954} {"Full-finetune/Learning Rate": 1.0675398213366257e-05, "Full-finetune/Loss": 0.7678419947624207, "Full-finetune/Loss (Raw)": 0.7342495918273926, "Full-finetune/Step": 2568, "Full-finetune/Step Time": 6.785995129495859} {"Full-finetune/Learning Rate": 1.0669182696880459e-05, "Full-finetune/Loss": 0.7686225175857544, "Full-finetune/Loss (Raw)": 1.019777774810791, "Full-finetune/Step": 2569, "Full-finetune/Step Time": 6.782983029261231} {"Full-finetune/Learning Rate": 1.0662966920697918e-05, "Full-finetune/Loss": 0.7683401107788086, "Full-finetune/Loss (Raw)": 0.7998218536376953, "Full-finetune/Step": 2570, "Full-finetune/Step Time": 6.7875617649406195} {"Full-finetune/Learning Rate": 1.0656750887230862e-05, "Full-finetune/Loss": 0.7691090106964111, "Full-finetune/Loss (Raw)": 1.0271618366241455, "Full-finetune/Step": 2571, "Full-finetune/Step Time": 6.774862417951226} {"Full-finetune/Learning Rate": 1.0650534598891608e-05, "Full-finetune/Loss": 0.7688264846801758, "Full-finetune/Loss (Raw)": 0.8224834203720093, "Full-finetune/Step": 2572, "Full-finetune/Step Time": 6.77237312681973} {"Full-finetune/Learning Rate": 1.0644318058092577e-05, "Full-finetune/Loss": 0.7720143795013428, "Full-finetune/Loss (Raw)": 0.7978545427322388, "Full-finetune/Step": 2573, "Full-finetune/Step Time": 6.761482967063785} {"Full-finetune/Learning Rate": 1.0638101267246283e-05, "Full-finetune/Loss": 0.771052360534668, "Full-finetune/Loss (Raw)": 0.7545725703239441, "Full-finetune/Step": 2574, "Full-finetune/Step Time": 6.783734057098627} {"Full-finetune/Learning Rate": 1.063188422876535e-05, "Full-finetune/Loss": 0.7699497938156128, "Full-finetune/Loss (Raw)": 0.7143297791481018, "Full-finetune/Step": 2575, "Full-finetune/Step Time": 6.77530949935317} {"Full-finetune/Learning Rate": 1.0625666945062484e-05, "Full-finetune/Loss": 0.769202470779419, "Full-finetune/Loss (Raw)": 0.8131359219551086, "Full-finetune/Step": 2576, "Full-finetune/Step Time": 6.777597591280937} {"Full-finetune/Learning Rate": 1.061944941855049e-05, "Full-finetune/Loss": 0.7703345417976379, "Full-finetune/Loss (Raw)": 0.8666989803314209, "Full-finetune/Step": 2577, "Full-finetune/Step Time": 6.782462770119309} {"Full-finetune/Learning Rate": 1.061323165164227e-05, "Full-finetune/Loss": 0.7736824750900269, "Full-finetune/Loss (Raw)": 0.9124528765678406, "Full-finetune/Step": 2578, "Full-finetune/Step Time": 6.753121130168438} {"Full-finetune/Learning Rate": 1.0607013646750818e-05, "Full-finetune/Loss": 0.7782913446426392, "Full-finetune/Loss (Raw)": 0.9067608118057251, "Full-finetune/Step": 2579, "Full-finetune/Step Time": 6.734400415793061} {"Full-finetune/Learning Rate": 1.0600795406289221e-05, "Full-finetune/Loss": 0.7769723534584045, "Full-finetune/Loss (Raw)": 0.6012402176856995, "Full-finetune/Step": 2580, "Full-finetune/Step Time": 6.754898477345705} {"Full-finetune/Learning Rate": 1.059457693267066e-05, "Full-finetune/Loss": 0.7779877781867981, "Full-finetune/Loss (Raw)": 0.9261221885681152, "Full-finetune/Step": 2581, "Full-finetune/Step Time": 6.732302024960518} {"Full-finetune/Learning Rate": 1.0588358228308395e-05, "Full-finetune/Loss": 0.7777963876724243, "Full-finetune/Loss (Raw)": 0.8015912175178528, "Full-finetune/Step": 2582, "Full-finetune/Step Time": 6.722041688859463} {"Full-finetune/Learning Rate": 1.0582139295615793e-05, "Full-finetune/Loss": 0.7764612436294556, "Full-finetune/Loss (Raw)": 0.7079945206642151, "Full-finetune/Step": 2583, "Full-finetune/Step Time": 6.730748750269413} {"Full-finetune/Learning Rate": 1.0575920137006288e-05, "Full-finetune/Loss": 0.7768978476524353, "Full-finetune/Loss (Raw)": 0.9307976365089417, "Full-finetune/Step": 2584, "Full-finetune/Step Time": 6.7313041761517525} {"Full-finetune/Learning Rate": 1.056970075489343e-05, "Full-finetune/Loss": 0.7753568291664124, "Full-finetune/Loss (Raw)": 0.6586042046546936, "Full-finetune/Step": 2585, "Full-finetune/Step Time": 6.734062621369958} {"Full-finetune/Learning Rate": 1.0563481151690827e-05, "Full-finetune/Loss": 0.7753018140792847, "Full-finetune/Loss (Raw)": 0.8057765364646912, "Full-finetune/Step": 2586, "Full-finetune/Step Time": 6.720440678298473} {"Full-finetune/Learning Rate": 1.055726132981219e-05, "Full-finetune/Loss": 0.7762131690979004, "Full-finetune/Loss (Raw)": 0.891989529132843, "Full-finetune/Step": 2587, "Full-finetune/Step Time": 6.721184518188238} {"Full-finetune/Learning Rate": 1.0551041291671311e-05, "Full-finetune/Loss": 0.7759007215499878, "Full-finetune/Loss (Raw)": 0.7157067060470581, "Full-finetune/Step": 2588, "Full-finetune/Step Time": 6.72932487167418} {"Full-finetune/Learning Rate": 1.0544821039682066e-05, "Full-finetune/Loss": 0.7751134037971497, "Full-finetune/Loss (Raw)": 0.8578765392303467, "Full-finetune/Step": 2589, "Full-finetune/Step Time": 6.733490064740181} {"Full-finetune/Learning Rate": 1.0538600576258413e-05, "Full-finetune/Loss": 0.7752288579940796, "Full-finetune/Loss (Raw)": 0.8851107954978943, "Full-finetune/Step": 2590, "Full-finetune/Step Time": 6.73665039613843} {"Full-finetune/Learning Rate": 1.0532379903814387e-05, "Full-finetune/Loss": 0.7747116088867188, "Full-finetune/Loss (Raw)": 0.7234770655632019, "Full-finetune/Step": 2591, "Full-finetune/Step Time": 6.774249734356999} {"Full-finetune/Learning Rate": 1.0526159024764118e-05, "Full-finetune/Loss": 0.774083137512207, "Full-finetune/Loss (Raw)": 0.825701892375946, "Full-finetune/Step": 2592, "Full-finetune/Step Time": 6.783708715811372} {"Full-finetune/Learning Rate": 1.0519937941521805e-05, "Full-finetune/Loss": 0.7730905413627625, "Full-finetune/Loss (Raw)": 0.6996954083442688, "Full-finetune/Step": 2593, "Full-finetune/Step Time": 6.8033884931355715} {"Full-finetune/Learning Rate": 1.0513716656501723e-05, "Full-finetune/Loss": 0.7726547122001648, "Full-finetune/Loss (Raw)": 0.7099745869636536, "Full-finetune/Step": 2594, "Full-finetune/Step Time": 6.814292864874005} {"Full-finetune/Learning Rate": 1.0507495172118242e-05, "Full-finetune/Loss": 0.7724250555038452, "Full-finetune/Loss (Raw)": 0.7855637669563293, "Full-finetune/Step": 2595, "Full-finetune/Step Time": 6.820726282894611} {"Full-finetune/Learning Rate": 1.0501273490785789e-05, "Full-finetune/Loss": 0.7707199454307556, "Full-finetune/Loss (Raw)": 0.7259606719017029, "Full-finetune/Step": 2596, "Full-finetune/Step Time": 6.813216784968972} {"Full-finetune/Learning Rate": 1.049505161491888e-05, "Full-finetune/Loss": 0.7706531286239624, "Full-finetune/Loss (Raw)": 0.8954547047615051, "Full-finetune/Step": 2597, "Full-finetune/Step Time": 6.816110854968429} {"Full-finetune/Learning Rate": 1.0488829546932106e-05, "Full-finetune/Loss": 0.7695297598838806, "Full-finetune/Loss (Raw)": 0.6157023906707764, "Full-finetune/Step": 2598, "Full-finetune/Step Time": 6.826937574893236} {"Full-finetune/Learning Rate": 1.0482607289240128e-05, "Full-finetune/Loss": 0.7691539525985718, "Full-finetune/Loss (Raw)": 0.8544690608978271, "Full-finetune/Step": 2599, "Full-finetune/Step Time": 6.832045130431652} {"Full-finetune/Learning Rate": 1.0476384844257686e-05, "Full-finetune/Loss": 0.7688829898834229, "Full-finetune/Loss (Raw)": 0.7949199080467224, "Full-finetune/Step": 2600, "Full-finetune/Step Time": 6.836798453703523} {"Full-finetune/Learning Rate": 1.0470162214399582e-05, "Full-finetune/Loss": 0.7681536674499512, "Full-finetune/Loss (Raw)": 0.7884445786476135, "Full-finetune/Step": 2601, "Full-finetune/Step Time": 6.843133505433798} {"Full-finetune/Learning Rate": 1.0463939402080706e-05, "Full-finetune/Loss": 0.7693906426429749, "Full-finetune/Loss (Raw)": 0.9522056579589844, "Full-finetune/Step": 2602, "Full-finetune/Step Time": 6.830328430980444} {"Full-finetune/Learning Rate": 1.0457716409716002e-05, "Full-finetune/Loss": 0.7700161337852478, "Full-finetune/Loss (Raw)": 0.8991668224334717, "Full-finetune/Step": 2603, "Full-finetune/Step Time": 6.828771635890007} {"Full-finetune/Learning Rate": 1.0451493239720496e-05, "Full-finetune/Loss": 0.7695736885070801, "Full-finetune/Loss (Raw)": 0.7922050356864929, "Full-finetune/Step": 2604, "Full-finetune/Step Time": 6.834947006776929} {"Full-finetune/Learning Rate": 1.0445269894509283e-05, "Full-finetune/Loss": 0.768863320350647, "Full-finetune/Loss (Raw)": 0.7326597571372986, "Full-finetune/Step": 2605, "Full-finetune/Step Time": 6.832543395459652} {"Full-finetune/Learning Rate": 1.043904637649751e-05, "Full-finetune/Loss": 0.7680264711380005, "Full-finetune/Loss (Raw)": 0.7160927653312683, "Full-finetune/Step": 2606, "Full-finetune/Step Time": 6.860892986878753} {"Full-finetune/Learning Rate": 1.0432822688100414e-05, "Full-finetune/Loss": 0.7688956260681152, "Full-finetune/Loss (Raw)": 0.8198440670967102, "Full-finetune/Step": 2607, "Full-finetune/Step Time": 6.880731724202633} {"Full-finetune/Learning Rate": 1.0426598831733283e-05, "Full-finetune/Loss": 0.7701718807220459, "Full-finetune/Loss (Raw)": 0.8762202262878418, "Full-finetune/Step": 2608, "Full-finetune/Step Time": 6.873324867337942} {"Full-finetune/Learning Rate": 1.0420374809811472e-05, "Full-finetune/Loss": 0.7741900086402893, "Full-finetune/Loss (Raw)": 0.8876051306724548, "Full-finetune/Step": 2609, "Full-finetune/Step Time": 6.857566058635712} {"Full-finetune/Learning Rate": 1.0414150624750408e-05, "Full-finetune/Loss": 0.7717673182487488, "Full-finetune/Loss (Raw)": 0.7204840779304504, "Full-finetune/Step": 2610, "Full-finetune/Step Time": 6.872756082564592} {"Full-finetune/Learning Rate": 1.0407926278965568e-05, "Full-finetune/Loss": 0.7710745334625244, "Full-finetune/Loss (Raw)": 0.6900209188461304, "Full-finetune/Step": 2611, "Full-finetune/Step Time": 6.873024569824338} {"Full-finetune/Learning Rate": 1.0401701774872508e-05, "Full-finetune/Loss": 0.7717297077178955, "Full-finetune/Loss (Raw)": 0.8124760985374451, "Full-finetune/Step": 2612, "Full-finetune/Step Time": 6.860301852226257} {"Full-finetune/Learning Rate": 1.0395477114886827e-05, "Full-finetune/Loss": 0.7726222276687622, "Full-finetune/Loss (Raw)": 0.9598554968833923, "Full-finetune/Step": 2613, "Full-finetune/Step Time": 6.857860084623098} {"Full-finetune/Learning Rate": 1.0389252301424197e-05, "Full-finetune/Loss": 0.7734760642051697, "Full-finetune/Loss (Raw)": 0.7588176727294922, "Full-finetune/Step": 2614, "Full-finetune/Step Time": 6.849860215559602} {"Full-finetune/Learning Rate": 1.0383027336900356e-05, "Full-finetune/Loss": 0.7779521942138672, "Full-finetune/Loss (Raw)": 0.8854135274887085, "Full-finetune/Step": 2615, "Full-finetune/Step Time": 6.840817546471953} {"Full-finetune/Learning Rate": 1.0376802223731077e-05, "Full-finetune/Loss": 0.7781082391738892, "Full-finetune/Loss (Raw)": 0.9190387725830078, "Full-finetune/Step": 2616, "Full-finetune/Step Time": 6.843096781522036} {"Full-finetune/Learning Rate": 1.0370576964332217e-05, "Full-finetune/Loss": 0.7743175029754639, "Full-finetune/Loss (Raw)": 0.39487364888191223, "Full-finetune/Step": 2617, "Full-finetune/Step Time": 6.837530929595232} {"Full-finetune/Learning Rate": 1.0364351561119667e-05, "Full-finetune/Loss": 0.7770620584487915, "Full-finetune/Loss (Raw)": 0.668610155582428, "Full-finetune/Step": 2618, "Full-finetune/Step Time": 6.845252599567175} {"Full-finetune/Learning Rate": 1.0358126016509392e-05, "Full-finetune/Loss": 0.7778569459915161, "Full-finetune/Loss (Raw)": 0.8900918364524841, "Full-finetune/Step": 2619, "Full-finetune/Step Time": 6.8382230047136545} {"Full-finetune/Learning Rate": 1.0351900332917401e-05, "Full-finetune/Loss": 0.7778267860412598, "Full-finetune/Loss (Raw)": 0.722029983997345, "Full-finetune/Step": 2620, "Full-finetune/Step Time": 6.83358533680439} {"Full-finetune/Learning Rate": 1.034567451275976e-05, "Full-finetune/Loss": 0.7771214246749878, "Full-finetune/Loss (Raw)": 0.7686324715614319, "Full-finetune/Step": 2621, "Full-finetune/Step Time": 6.8304756581783295} {"Full-finetune/Learning Rate": 1.0339448558452594e-05, "Full-finetune/Loss": 0.7768964171409607, "Full-finetune/Loss (Raw)": 0.896858811378479, "Full-finetune/Step": 2622, "Full-finetune/Step Time": 6.835183812305331} {"Full-finetune/Learning Rate": 1.0333222472412064e-05, "Full-finetune/Loss": 0.7762235403060913, "Full-finetune/Loss (Raw)": 0.7796421647071838, "Full-finetune/Step": 2623, "Full-finetune/Step Time": 6.854757884517312} {"Full-finetune/Learning Rate": 1.03269962570544e-05, "Full-finetune/Loss": 0.7767913937568665, "Full-finetune/Loss (Raw)": 0.8394214510917664, "Full-finetune/Step": 2624, "Full-finetune/Step Time": 6.832714585587382} {"Full-finetune/Learning Rate": 1.0320769914795874e-05, "Full-finetune/Loss": 0.7762593030929565, "Full-finetune/Loss (Raw)": 0.607371985912323, "Full-finetune/Step": 2625, "Full-finetune/Step Time": 6.845291685312986} {"Full-finetune/Learning Rate": 1.0314543448052806e-05, "Full-finetune/Loss": 0.771349310874939, "Full-finetune/Loss (Raw)": 0.3105824589729309, "Full-finetune/Step": 2626, "Full-finetune/Step Time": 6.8526116497814655} {"Full-finetune/Learning Rate": 1.0308316859241567e-05, "Full-finetune/Loss": 0.7734999060630798, "Full-finetune/Loss (Raw)": 0.7917923927307129, "Full-finetune/Step": 2627, "Full-finetune/Step Time": 6.835228046402335} {"Full-finetune/Learning Rate": 1.0302090150778572e-05, "Full-finetune/Loss": 0.773648738861084, "Full-finetune/Loss (Raw)": 0.8849475979804993, "Full-finetune/Step": 2628, "Full-finetune/Step Time": 6.834517907351255} {"Full-finetune/Learning Rate": 1.029586332508029e-05, "Full-finetune/Loss": 0.7707531452178955, "Full-finetune/Loss (Raw)": 0.5260708928108215, "Full-finetune/Step": 2629, "Full-finetune/Step Time": 6.849616350606084} {"Full-finetune/Learning Rate": 1.0289636384563226e-05, "Full-finetune/Loss": 0.7694045305252075, "Full-finetune/Loss (Raw)": 0.6998076438903809, "Full-finetune/Step": 2630, "Full-finetune/Step Time": 6.850350007414818} {"Full-finetune/Learning Rate": 1.0283409331643936e-05, "Full-finetune/Loss": 0.770051121711731, "Full-finetune/Loss (Raw)": 0.911956250667572, "Full-finetune/Step": 2631, "Full-finetune/Step Time": 6.847217841073871} {"Full-finetune/Learning Rate": 1.0277182168739019e-05, "Full-finetune/Loss": 0.7691165804862976, "Full-finetune/Loss (Raw)": 0.7166415452957153, "Full-finetune/Step": 2632, "Full-finetune/Step Time": 6.842152254655957} {"Full-finetune/Learning Rate": 1.0270954898265113e-05, "Full-finetune/Loss": 0.7693060636520386, "Full-finetune/Loss (Raw)": 0.8581713438034058, "Full-finetune/Step": 2633, "Full-finetune/Step Time": 6.84400574490428} {"Full-finetune/Learning Rate": 1.0264727522638899e-05, "Full-finetune/Loss": 0.7691757082939148, "Full-finetune/Loss (Raw)": 0.7803080677986145, "Full-finetune/Step": 2634, "Full-finetune/Step Time": 6.844989135861397} {"Full-finetune/Learning Rate": 1.0258500044277106e-05, "Full-finetune/Loss": 0.7680639028549194, "Full-finetune/Loss (Raw)": 0.7780998945236206, "Full-finetune/Step": 2635, "Full-finetune/Step Time": 6.8383803460747} {"Full-finetune/Learning Rate": 1.025227246559649e-05, "Full-finetune/Loss": 0.769885778427124, "Full-finetune/Loss (Raw)": 0.9684025049209595, "Full-finetune/Step": 2636, "Full-finetune/Step Time": 6.838054325431585} {"Full-finetune/Learning Rate": 1.0246044789013855e-05, "Full-finetune/Loss": 0.7695359587669373, "Full-finetune/Loss (Raw)": 0.7593228816986084, "Full-finetune/Step": 2637, "Full-finetune/Step Time": 6.841696495190263} {"Full-finetune/Learning Rate": 1.023981701694604e-05, "Full-finetune/Loss": 0.7694858312606812, "Full-finetune/Loss (Raw)": 0.91504967212677, "Full-finetune/Step": 2638, "Full-finetune/Step Time": 6.8628867007792} {"Full-finetune/Learning Rate": 1.0233589151809927e-05, "Full-finetune/Loss": 0.7687059640884399, "Full-finetune/Loss (Raw)": 0.769599974155426, "Full-finetune/Step": 2639, "Full-finetune/Step Time": 6.852157985791564} {"Full-finetune/Learning Rate": 1.0227361196022421e-05, "Full-finetune/Loss": 0.765839695930481, "Full-finetune/Loss (Raw)": 0.3440508544445038, "Full-finetune/Step": 2640, "Full-finetune/Step Time": 6.861093673855066} {"Full-finetune/Learning Rate": 1.0221133152000474e-05, "Full-finetune/Loss": 0.7662976980209351, "Full-finetune/Loss (Raw)": 0.797363817691803, "Full-finetune/Step": 2641, "Full-finetune/Step Time": 6.852428497746587} {"Full-finetune/Learning Rate": 1.021490502216107e-05, "Full-finetune/Loss": 0.7656856775283813, "Full-finetune/Loss (Raw)": 0.7751734256744385, "Full-finetune/Step": 2642, "Full-finetune/Step Time": 6.842101689428091} {"Full-finetune/Learning Rate": 1.020867680892122e-05, "Full-finetune/Loss": 0.7654699683189392, "Full-finetune/Loss (Raw)": 0.6186417937278748, "Full-finetune/Step": 2643, "Full-finetune/Step Time": 6.838991099968553} {"Full-finetune/Learning Rate": 1.0202448514697975e-05, "Full-finetune/Loss": 0.7644972801208496, "Full-finetune/Loss (Raw)": 0.6626654267311096, "Full-finetune/Step": 2644, "Full-finetune/Step Time": 6.871276443824172} {"Full-finetune/Learning Rate": 1.0196220141908417e-05, "Full-finetune/Loss": 0.7640478610992432, "Full-finetune/Loss (Raw)": 0.7930247187614441, "Full-finetune/Step": 2645, "Full-finetune/Step Time": 6.87400464899838} {"Full-finetune/Learning Rate": 1.018999169296965e-05, "Full-finetune/Loss": 0.764451265335083, "Full-finetune/Loss (Raw)": 0.8067634701728821, "Full-finetune/Step": 2646, "Full-finetune/Step Time": 6.859577048569918} {"Full-finetune/Learning Rate": 1.0183763170298818e-05, "Full-finetune/Loss": 0.7640906572341919, "Full-finetune/Loss (Raw)": 0.7369982600212097, "Full-finetune/Step": 2647, "Full-finetune/Step Time": 6.864634666591883} {"Full-finetune/Learning Rate": 1.0177534576313084e-05, "Full-finetune/Loss": 0.7631567716598511, "Full-finetune/Loss (Raw)": 0.8065220713615417, "Full-finetune/Step": 2648, "Full-finetune/Step Time": 6.875545779243112} {"Full-finetune/Learning Rate": 1.0171305913429648e-05, "Full-finetune/Loss": 0.7655838131904602, "Full-finetune/Loss (Raw)": 0.7116694450378418, "Full-finetune/Step": 2649, "Full-finetune/Step Time": 6.868541548028588} {"Full-finetune/Learning Rate": 1.0165077184065732e-05, "Full-finetune/Loss": 0.7647603750228882, "Full-finetune/Loss (Raw)": 0.7118081450462341, "Full-finetune/Step": 2650, "Full-finetune/Step Time": 6.8505093939602375} {"Full-finetune/Learning Rate": 1.0158848390638588e-05, "Full-finetune/Loss": 0.7662007808685303, "Full-finetune/Loss (Raw)": 0.7840803265571594, "Full-finetune/Step": 2651, "Full-finetune/Step Time": 6.845511021092534} {"Full-finetune/Learning Rate": 1.015261953556548e-05, "Full-finetune/Loss": 0.7669707536697388, "Full-finetune/Loss (Raw)": 0.8836826086044312, "Full-finetune/Step": 2652, "Full-finetune/Step Time": 6.8512459974735975} {"Full-finetune/Learning Rate": 1.0146390621263709e-05, "Full-finetune/Loss": 0.7677731513977051, "Full-finetune/Loss (Raw)": 0.7073425054550171, "Full-finetune/Step": 2653, "Full-finetune/Step Time": 6.862106163054705} {"Full-finetune/Learning Rate": 1.0140161650150598e-05, "Full-finetune/Loss": 0.7637134790420532, "Full-finetune/Loss (Raw)": 0.33921292424201965, "Full-finetune/Step": 2654, "Full-finetune/Step Time": 6.8627974428236485} {"Full-finetune/Learning Rate": 1.0133932624643487e-05, "Full-finetune/Loss": 0.7635848522186279, "Full-finetune/Loss (Raw)": 0.814022958278656, "Full-finetune/Step": 2655, "Full-finetune/Step Time": 6.861931964755058} {"Full-finetune/Learning Rate": 1.012770354715974e-05, "Full-finetune/Loss": 0.762485682964325, "Full-finetune/Loss (Raw)": 0.8011047840118408, "Full-finetune/Step": 2656, "Full-finetune/Step Time": 6.858763022348285} {"Full-finetune/Learning Rate": 1.012147442011674e-05, "Full-finetune/Loss": 0.7650078535079956, "Full-finetune/Loss (Raw)": 0.5885134339332581, "Full-finetune/Step": 2657, "Full-finetune/Step Time": 6.855394002050161} {"Full-finetune/Learning Rate": 1.0115245245931883e-05, "Full-finetune/Loss": 0.7626959681510925, "Full-finetune/Loss (Raw)": 0.5637718439102173, "Full-finetune/Step": 2658, "Full-finetune/Step Time": 6.873480228707194} {"Full-finetune/Learning Rate": 1.0109016027022602e-05, "Full-finetune/Loss": 0.7633312940597534, "Full-finetune/Loss (Raw)": 0.8440373539924622, "Full-finetune/Step": 2659, "Full-finetune/Step Time": 6.865042233839631} {"Full-finetune/Learning Rate": 1.0102786765806329e-05, "Full-finetune/Loss": 0.7639307379722595, "Full-finetune/Loss (Raw)": 0.8834946155548096, "Full-finetune/Step": 2660, "Full-finetune/Step Time": 6.8490046337246895} {"Full-finetune/Learning Rate": 1.0096557464700518e-05, "Full-finetune/Loss": 0.7664088606834412, "Full-finetune/Loss (Raw)": 1.0212364196777344, "Full-finetune/Step": 2661, "Full-finetune/Step Time": 6.853157076984644} {"Full-finetune/Learning Rate": 1.0090328126122642e-05, "Full-finetune/Loss": 0.7703377604484558, "Full-finetune/Loss (Raw)": 0.877576470375061, "Full-finetune/Step": 2662, "Full-finetune/Step Time": 6.830741930752993} {"Full-finetune/Learning Rate": 1.0084098752490179e-05, "Full-finetune/Loss": 0.7701079249382019, "Full-finetune/Loss (Raw)": 0.8902539610862732, "Full-finetune/Step": 2663, "Full-finetune/Step Time": 6.837404603138566} {"Full-finetune/Learning Rate": 1.0077869346220635e-05, "Full-finetune/Loss": 0.7686533331871033, "Full-finetune/Loss (Raw)": 0.4339198172092438, "Full-finetune/Step": 2664, "Full-finetune/Step Time": 6.838459676131606} {"Full-finetune/Learning Rate": 1.0071639909731519e-05, "Full-finetune/Loss": 0.7680109739303589, "Full-finetune/Loss (Raw)": 0.6709210276603699, "Full-finetune/Step": 2665, "Full-finetune/Step Time": 6.832302598282695} {"Full-finetune/Learning Rate": 1.0065410445440352e-05, "Full-finetune/Loss": 0.7678548097610474, "Full-finetune/Loss (Raw)": 0.8596170544624329, "Full-finetune/Step": 2666, "Full-finetune/Step Time": 6.828333407640457} {"Full-finetune/Learning Rate": 1.0059180955764666e-05, "Full-finetune/Loss": 0.767413854598999, "Full-finetune/Loss (Raw)": 0.7371528148651123, "Full-finetune/Step": 2667, "Full-finetune/Step Time": 6.822752024978399} {"Full-finetune/Learning Rate": 1.005295144312201e-05, "Full-finetune/Loss": 0.7670160531997681, "Full-finetune/Loss (Raw)": 0.8006929755210876, "Full-finetune/Step": 2668, "Full-finetune/Step Time": 6.819552946835756} {"Full-finetune/Learning Rate": 1.0046721909929928e-05, "Full-finetune/Loss": 0.7691874504089355, "Full-finetune/Loss (Raw)": 0.9195548892021179, "Full-finetune/Step": 2669, "Full-finetune/Step Time": 6.80259807780385} {"Full-finetune/Learning Rate": 1.0040492358605989e-05, "Full-finetune/Loss": 0.7692562341690063, "Full-finetune/Loss (Raw)": 0.8425657153129578, "Full-finetune/Step": 2670, "Full-finetune/Step Time": 6.7977043483406305} {"Full-finetune/Learning Rate": 1.0034262791567755e-05, "Full-finetune/Loss": 0.7675454616546631, "Full-finetune/Loss (Raw)": 0.6234873533248901, "Full-finetune/Step": 2671, "Full-finetune/Step Time": 6.8048127591609955} {"Full-finetune/Learning Rate": 1.0028033211232802e-05, "Full-finetune/Loss": 0.7669693231582642, "Full-finetune/Loss (Raw)": 0.5639377236366272, "Full-finetune/Step": 2672, "Full-finetune/Step Time": 6.819829469546676} {"Full-finetune/Learning Rate": 1.0021803620018706e-05, "Full-finetune/Loss": 0.7668670415878296, "Full-finetune/Loss (Raw)": 0.7947895526885986, "Full-finetune/Step": 2673, "Full-finetune/Step Time": 6.820524508133531} {"Full-finetune/Learning Rate": 1.0015574020343048e-05, "Full-finetune/Loss": 0.7696101665496826, "Full-finetune/Loss (Raw)": 0.6304654479026794, "Full-finetune/Step": 2674, "Full-finetune/Step Time": 6.812720039859414} {"Full-finetune/Learning Rate": 1.0009344414623418e-05, "Full-finetune/Loss": 0.7696006298065186, "Full-finetune/Loss (Raw)": 0.7931160926818848, "Full-finetune/Step": 2675, "Full-finetune/Step Time": 6.81749009154737} {"Full-finetune/Learning Rate": 1.0003114805277405e-05, "Full-finetune/Loss": 0.7682662606239319, "Full-finetune/Loss (Raw)": 0.7826719880104065, "Full-finetune/Step": 2676, "Full-finetune/Step Time": 6.831121211871505} {"Full-finetune/Learning Rate": 9.9968851947226e-06, "Full-finetune/Loss": 0.7726645469665527, "Full-finetune/Loss (Raw)": 0.8826355338096619, "Full-finetune/Step": 2677, "Full-finetune/Step Time": 6.810574248433113} {"Full-finetune/Learning Rate": 9.990655585376583e-06, "Full-finetune/Loss": 0.7725494503974915, "Full-finetune/Loss (Raw)": 0.7968828082084656, "Full-finetune/Step": 2678, "Full-finetune/Step Time": 6.799248119816184} {"Full-finetune/Learning Rate": 9.984425979656955e-06, "Full-finetune/Loss": 0.7730054259300232, "Full-finetune/Loss (Raw)": 0.9542943835258484, "Full-finetune/Step": 2679, "Full-finetune/Step Time": 6.808107929304242} {"Full-finetune/Learning Rate": 9.978196379981297e-06, "Full-finetune/Loss": 0.771719217300415, "Full-finetune/Loss (Raw)": 0.8709201216697693, "Full-finetune/Step": 2680, "Full-finetune/Step Time": 6.809671917930245} {"Full-finetune/Learning Rate": 9.971966788767198e-06, "Full-finetune/Loss": 0.7686457633972168, "Full-finetune/Loss (Raw)": 0.3349328637123108, "Full-finetune/Step": 2681, "Full-finetune/Step Time": 6.816427627578378} {"Full-finetune/Learning Rate": 9.96573720843225e-06, "Full-finetune/Loss": 0.7684601545333862, "Full-finetune/Loss (Raw)": 0.8111297488212585, "Full-finetune/Step": 2682, "Full-finetune/Step Time": 6.783971620723605} {"Full-finetune/Learning Rate": 9.959507641394015e-06, "Full-finetune/Loss": 0.7724266648292542, "Full-finetune/Loss (Raw)": 0.8357688784599304, "Full-finetune/Step": 2683, "Full-finetune/Step Time": 6.7536398228257895} {"Full-finetune/Learning Rate": 9.953278090070075e-06, "Full-finetune/Loss": 0.7719191312789917, "Full-finetune/Loss (Raw)": 0.7821298241615295, "Full-finetune/Step": 2684, "Full-finetune/Step Time": 6.753878811374307} {"Full-finetune/Learning Rate": 9.947048556877992e-06, "Full-finetune/Loss": 0.7731227278709412, "Full-finetune/Loss (Raw)": 0.8444002270698547, "Full-finetune/Step": 2685, "Full-finetune/Step Time": 6.757797623053193} {"Full-finetune/Learning Rate": 9.940819044235335e-06, "Full-finetune/Loss": 0.7724451422691345, "Full-finetune/Loss (Raw)": 0.7247855067253113, "Full-finetune/Step": 2686, "Full-finetune/Step Time": 6.760666711255908} {"Full-finetune/Learning Rate": 9.934589554559653e-06, "Full-finetune/Loss": 0.7728105783462524, "Full-finetune/Loss (Raw)": 0.7789173126220703, "Full-finetune/Step": 2687, "Full-finetune/Step Time": 6.762749399989843} {"Full-finetune/Learning Rate": 9.928360090268484e-06, "Full-finetune/Loss": 0.7748751640319824, "Full-finetune/Loss (Raw)": 0.849913477897644, "Full-finetune/Step": 2688, "Full-finetune/Step Time": 6.74442938528955} {"Full-finetune/Learning Rate": 9.922130653779368e-06, "Full-finetune/Loss": 0.7757214307785034, "Full-finetune/Loss (Raw)": 0.93478924036026, "Full-finetune/Step": 2689, "Full-finetune/Step Time": 6.752445222809911} {"Full-finetune/Learning Rate": 9.915901247509821e-06, "Full-finetune/Loss": 0.7715765833854675, "Full-finetune/Loss (Raw)": 0.36604538559913635, "Full-finetune/Step": 2690, "Full-finetune/Step Time": 6.7725874818861485} {"Full-finetune/Learning Rate": 9.909671873877363e-06, "Full-finetune/Loss": 0.7751245498657227, "Full-finetune/Loss (Raw)": 0.8848262429237366, "Full-finetune/Step": 2691, "Full-finetune/Step Time": 6.765838008373976} {"Full-finetune/Learning Rate": 9.903442535299487e-06, "Full-finetune/Loss": 0.7745695114135742, "Full-finetune/Loss (Raw)": 0.776962399482727, "Full-finetune/Step": 2692, "Full-finetune/Step Time": 6.76548127643764} {"Full-finetune/Learning Rate": 9.897213234193673e-06, "Full-finetune/Loss": 0.774225115776062, "Full-finetune/Loss (Raw)": 0.8418689370155334, "Full-finetune/Step": 2693, "Full-finetune/Step Time": 6.763639971613884} {"Full-finetune/Learning Rate": 9.890983972977401e-06, "Full-finetune/Loss": 0.7733917832374573, "Full-finetune/Loss (Raw)": 0.7410216927528381, "Full-finetune/Step": 2694, "Full-finetune/Step Time": 6.764758260920644} {"Full-finetune/Learning Rate": 9.884754754068116e-06, "Full-finetune/Loss": 0.7737224102020264, "Full-finetune/Loss (Raw)": 0.7764794826507568, "Full-finetune/Step": 2695, "Full-finetune/Step Time": 6.764653608202934} {"Full-finetune/Learning Rate": 9.878525579883264e-06, "Full-finetune/Loss": 0.7742352485656738, "Full-finetune/Loss (Raw)": 0.7998944520950317, "Full-finetune/Step": 2696, "Full-finetune/Step Time": 6.776154765859246} {"Full-finetune/Learning Rate": 9.872296452840266e-06, "Full-finetune/Loss": 0.7726092338562012, "Full-finetune/Loss (Raw)": 0.8116377592086792, "Full-finetune/Step": 2697, "Full-finetune/Step Time": 6.7797573041170835} {"Full-finetune/Learning Rate": 9.866067375356516e-06, "Full-finetune/Loss": 0.7719811201095581, "Full-finetune/Loss (Raw)": 0.7194329500198364, "Full-finetune/Step": 2698, "Full-finetune/Step Time": 6.7753662541508675} {"Full-finetune/Learning Rate": 9.859838349849404e-06, "Full-finetune/Loss": 0.7707654237747192, "Full-finetune/Loss (Raw)": 0.8715457916259766, "Full-finetune/Step": 2699, "Full-finetune/Step Time": 6.790432576090097} {"Full-finetune/Learning Rate": 9.853609378736293e-06, "Full-finetune/Loss": 0.7706042528152466, "Full-finetune/Loss (Raw)": 0.8018556833267212, "Full-finetune/Step": 2700, "Full-finetune/Step Time": 6.789950171485543} {"Full-finetune/Learning Rate": 9.847380464434525e-06, "Full-finetune/Loss": 0.7703843116760254, "Full-finetune/Loss (Raw)": 0.7697021961212158, "Full-finetune/Step": 2701, "Full-finetune/Step Time": 6.812147259712219} {"Full-finetune/Learning Rate": 9.841151609361419e-06, "Full-finetune/Loss": 0.7710968255996704, "Full-finetune/Loss (Raw)": 0.8457764387130737, "Full-finetune/Step": 2702, "Full-finetune/Step Time": 6.801439238712192} {"Full-finetune/Learning Rate": 9.83492281593427e-06, "Full-finetune/Loss": 0.7710821628570557, "Full-finetune/Loss (Raw)": 0.7124514579772949, "Full-finetune/Step": 2703, "Full-finetune/Step Time": 6.818784100934863} {"Full-finetune/Learning Rate": 9.828694086570353e-06, "Full-finetune/Loss": 0.7701563835144043, "Full-finetune/Loss (Raw)": 0.6946289539337158, "Full-finetune/Step": 2704, "Full-finetune/Step Time": 6.8311386071145535} {"Full-finetune/Learning Rate": 9.822465423686917e-06, "Full-finetune/Loss": 0.7693150043487549, "Full-finetune/Loss (Raw)": 0.7590076923370361, "Full-finetune/Step": 2705, "Full-finetune/Step Time": 6.8313936442136765} {"Full-finetune/Learning Rate": 9.816236829701187e-06, "Full-finetune/Loss": 0.7690613269805908, "Full-finetune/Loss (Raw)": 0.8799814581871033, "Full-finetune/Step": 2706, "Full-finetune/Step Time": 6.839441671967506} {"Full-finetune/Learning Rate": 9.810008307030356e-06, "Full-finetune/Loss": 0.76951003074646, "Full-finetune/Loss (Raw)": 0.9641914963722229, "Full-finetune/Step": 2707, "Full-finetune/Step Time": 6.835793998092413} {"Full-finetune/Learning Rate": 9.803779858091586e-06, "Full-finetune/Loss": 0.7719035148620605, "Full-finetune/Loss (Raw)": 0.9076066017150879, "Full-finetune/Step": 2708, "Full-finetune/Step Time": 6.8232776913791895} {"Full-finetune/Learning Rate": 9.797551485302027e-06, "Full-finetune/Loss": 0.7705866098403931, "Full-finetune/Loss (Raw)": 0.7575665712356567, "Full-finetune/Step": 2709, "Full-finetune/Step Time": 6.833566704764962} {"Full-finetune/Learning Rate": 9.791323191078781e-06, "Full-finetune/Loss": 0.7672253251075745, "Full-finetune/Loss (Raw)": 0.37134116888046265, "Full-finetune/Step": 2710, "Full-finetune/Step Time": 6.85339923389256} {"Full-finetune/Learning Rate": 9.785094977838935e-06, "Full-finetune/Loss": 0.768423318862915, "Full-finetune/Loss (Raw)": 0.8613436818122864, "Full-finetune/Step": 2711, "Full-finetune/Step Time": 6.8443319126963615} {"Full-finetune/Learning Rate": 9.77886684799953e-06, "Full-finetune/Loss": 0.7675307989120483, "Full-finetune/Loss (Raw)": 0.8165480494499207, "Full-finetune/Step": 2712, "Full-finetune/Step Time": 6.863303128629923} {"Full-finetune/Learning Rate": 9.77263880397758e-06, "Full-finetune/Loss": 0.7684800624847412, "Full-finetune/Loss (Raw)": 0.780116081237793, "Full-finetune/Step": 2713, "Full-finetune/Step Time": 6.870439141988754} {"Full-finetune/Learning Rate": 9.766410848190076e-06, "Full-finetune/Loss": 0.7691248059272766, "Full-finetune/Loss (Raw)": 0.8882988095283508, "Full-finetune/Step": 2714, "Full-finetune/Step Time": 6.870367132127285} {"Full-finetune/Learning Rate": 9.76018298305396e-06, "Full-finetune/Loss": 0.7678521871566772, "Full-finetune/Loss (Raw)": 0.7290988564491272, "Full-finetune/Step": 2715, "Full-finetune/Step Time": 6.86291229352355} {"Full-finetune/Learning Rate": 9.75395521098615e-06, "Full-finetune/Loss": 0.7684121131896973, "Full-finetune/Loss (Raw)": 0.7873696088790894, "Full-finetune/Step": 2716, "Full-finetune/Step Time": 6.856218693777919} {"Full-finetune/Learning Rate": 9.747727534403515e-06, "Full-finetune/Loss": 0.7683005332946777, "Full-finetune/Loss (Raw)": 0.8435940146446228, "Full-finetune/Step": 2717, "Full-finetune/Step Time": 6.837497737258673} {"Full-finetune/Learning Rate": 9.741499955722897e-06, "Full-finetune/Loss": 0.7672325372695923, "Full-finetune/Loss (Raw)": 0.7484144568443298, "Full-finetune/Step": 2718, "Full-finetune/Step Time": 6.837796214967966} {"Full-finetune/Learning Rate": 9.735272477361103e-06, "Full-finetune/Loss": 0.7679904699325562, "Full-finetune/Loss (Raw)": 0.8204962015151978, "Full-finetune/Step": 2719, "Full-finetune/Step Time": 6.8018919713795185} {"Full-finetune/Learning Rate": 9.729045101734889e-06, "Full-finetune/Loss": 0.7682462930679321, "Full-finetune/Loss (Raw)": 0.8584396839141846, "Full-finetune/Step": 2720, "Full-finetune/Step Time": 6.797153118997812} {"Full-finetune/Learning Rate": 9.722817831260985e-06, "Full-finetune/Loss": 0.768326461315155, "Full-finetune/Loss (Raw)": 0.7099555134773254, "Full-finetune/Step": 2721, "Full-finetune/Step Time": 6.788611063733697} {"Full-finetune/Learning Rate": 9.716590668356067e-06, "Full-finetune/Loss": 0.7691001892089844, "Full-finetune/Loss (Raw)": 0.8090150952339172, "Full-finetune/Step": 2722, "Full-finetune/Step Time": 6.7794321700930595} {"Full-finetune/Learning Rate": 9.710363615436777e-06, "Full-finetune/Loss": 0.7686142921447754, "Full-finetune/Loss (Raw)": 0.7233671545982361, "Full-finetune/Step": 2723, "Full-finetune/Step Time": 6.773759409785271} {"Full-finetune/Learning Rate": 9.704136674919712e-06, "Full-finetune/Loss": 0.769372820854187, "Full-finetune/Loss (Raw)": 0.8230490684509277, "Full-finetune/Step": 2724, "Full-finetune/Step Time": 6.776873866096139} {"Full-finetune/Learning Rate": 9.697909849221428e-06, "Full-finetune/Loss": 0.7686704397201538, "Full-finetune/Loss (Raw)": 0.8055499792098999, "Full-finetune/Step": 2725, "Full-finetune/Step Time": 6.770373398438096} {"Full-finetune/Learning Rate": 9.691683140758439e-06, "Full-finetune/Loss": 0.7701534032821655, "Full-finetune/Loss (Raw)": 0.8055277466773987, "Full-finetune/Step": 2726, "Full-finetune/Step Time": 6.76859737560153} {"Full-finetune/Learning Rate": 9.685456551947199e-06, "Full-finetune/Loss": 0.7696565985679626, "Full-finetune/Loss (Raw)": 0.7908718585968018, "Full-finetune/Step": 2727, "Full-finetune/Step Time": 6.771498588845134} {"Full-finetune/Learning Rate": 9.67923008520413e-06, "Full-finetune/Loss": 0.767716646194458, "Full-finetune/Loss (Raw)": 0.5466095209121704, "Full-finetune/Step": 2728, "Full-finetune/Step Time": 6.7701993975788355} {"Full-finetune/Learning Rate": 9.673003742945602e-06, "Full-finetune/Loss": 0.7647838592529297, "Full-finetune/Loss (Raw)": 0.4130483865737915, "Full-finetune/Step": 2729, "Full-finetune/Step Time": 6.779933365061879} {"Full-finetune/Learning Rate": 9.666777527587936e-06, "Full-finetune/Loss": 0.7622355222702026, "Full-finetune/Loss (Raw)": 0.6260098814964294, "Full-finetune/Step": 2730, "Full-finetune/Step Time": 6.782609172165394} {"Full-finetune/Learning Rate": 9.660551441547411e-06, "Full-finetune/Loss": 0.7614434957504272, "Full-finetune/Loss (Raw)": 0.7977989912033081, "Full-finetune/Step": 2731, "Full-finetune/Step Time": 6.780504949390888} {"Full-finetune/Learning Rate": 9.654325487240243e-06, "Full-finetune/Loss": 0.7616300582885742, "Full-finetune/Loss (Raw)": 0.81607985496521, "Full-finetune/Step": 2732, "Full-finetune/Step Time": 6.786282515153289} {"Full-finetune/Learning Rate": 9.6480996670826e-06, "Full-finetune/Loss": 0.7626470923423767, "Full-finetune/Loss (Raw)": 0.8628365993499756, "Full-finetune/Step": 2733, "Full-finetune/Step Time": 6.786910254508257} {"Full-finetune/Learning Rate": 9.64187398349061e-06, "Full-finetune/Loss": 0.7630080580711365, "Full-finetune/Loss (Raw)": 0.7623034715652466, "Full-finetune/Step": 2734, "Full-finetune/Step Time": 6.774190492928028} {"Full-finetune/Learning Rate": 9.635648438880334e-06, "Full-finetune/Loss": 0.7634327411651611, "Full-finetune/Loss (Raw)": 0.8742081522941589, "Full-finetune/Step": 2735, "Full-finetune/Step Time": 6.762646617367864} {"Full-finetune/Learning Rate": 9.629423035667788e-06, "Full-finetune/Loss": 0.7601485252380371, "Full-finetune/Loss (Raw)": 0.45583122968673706, "Full-finetune/Step": 2736, "Full-finetune/Step Time": 6.77963257022202} {"Full-finetune/Learning Rate": 9.623197776268926e-06, "Full-finetune/Loss": 0.7573503255844116, "Full-finetune/Loss (Raw)": 0.5294435620307922, "Full-finetune/Step": 2737, "Full-finetune/Step Time": 6.784234939143062} {"Full-finetune/Learning Rate": 9.616972663099648e-06, "Full-finetune/Loss": 0.7584080696105957, "Full-finetune/Loss (Raw)": 0.8558633327484131, "Full-finetune/Step": 2738, "Full-finetune/Step Time": 6.774976935237646} {"Full-finetune/Learning Rate": 9.610747698575801e-06, "Full-finetune/Loss": 0.7599507570266724, "Full-finetune/Loss (Raw)": 0.8874890804290771, "Full-finetune/Step": 2739, "Full-finetune/Step Time": 6.767086982727051} {"Full-finetune/Learning Rate": 9.60452288511318e-06, "Full-finetune/Loss": 0.7590078115463257, "Full-finetune/Loss (Raw)": 0.691781222820282, "Full-finetune/Step": 2740, "Full-finetune/Step Time": 6.776734804734588} {"Full-finetune/Learning Rate": 9.598298225127499e-06, "Full-finetune/Loss": 0.7584317326545715, "Full-finetune/Loss (Raw)": 0.8861166834831238, "Full-finetune/Step": 2741, "Full-finetune/Step Time": 6.787624994292855} {"Full-finetune/Learning Rate": 9.592073721034435e-06, "Full-finetune/Loss": 0.7586194276809692, "Full-finetune/Loss (Raw)": 0.7828457951545715, "Full-finetune/Step": 2742, "Full-finetune/Step Time": 6.793456017971039} {"Full-finetune/Learning Rate": 9.585849375249595e-06, "Full-finetune/Loss": 0.7586702108383179, "Full-finetune/Loss (Raw)": 0.8919119834899902, "Full-finetune/Step": 2743, "Full-finetune/Step Time": 6.785112090408802} {"Full-finetune/Learning Rate": 9.57962519018853e-06, "Full-finetune/Loss": 0.7578620314598083, "Full-finetune/Loss (Raw)": 0.8155913949012756, "Full-finetune/Step": 2744, "Full-finetune/Step Time": 6.780847918242216} {"Full-finetune/Learning Rate": 9.573401168266722e-06, "Full-finetune/Loss": 0.7617977261543274, "Full-finetune/Loss (Raw)": 0.8986462354660034, "Full-finetune/Step": 2745, "Full-finetune/Step Time": 6.762946719303727} {"Full-finetune/Learning Rate": 9.567177311899589e-06, "Full-finetune/Loss": 0.7629714012145996, "Full-finetune/Loss (Raw)": 0.8188346028327942, "Full-finetune/Step": 2746, "Full-finetune/Step Time": 6.748553020879626} {"Full-finetune/Learning Rate": 9.560953623502493e-06, "Full-finetune/Loss": 0.7623034119606018, "Full-finetune/Loss (Raw)": 0.8045879602432251, "Full-finetune/Step": 2747, "Full-finetune/Step Time": 6.764748493209481} {"Full-finetune/Learning Rate": 9.554730105490722e-06, "Full-finetune/Loss": 0.7639340162277222, "Full-finetune/Loss (Raw)": 0.9307532906532288, "Full-finetune/Step": 2748, "Full-finetune/Step Time": 6.766813423484564} {"Full-finetune/Learning Rate": 9.548506760279506e-06, "Full-finetune/Loss": 0.7646006345748901, "Full-finetune/Loss (Raw)": 0.8539531826972961, "Full-finetune/Step": 2749, "Full-finetune/Step Time": 6.763108134269714} {"Full-finetune/Learning Rate": 9.542283590284003e-06, "Full-finetune/Loss": 0.763718843460083, "Full-finetune/Loss (Raw)": 0.7839990854263306, "Full-finetune/Step": 2750, "Full-finetune/Step Time": 6.756226673722267} {"Full-finetune/Learning Rate": 9.5360605979193e-06, "Full-finetune/Loss": 0.7637341022491455, "Full-finetune/Loss (Raw)": 0.7815841436386108, "Full-finetune/Step": 2751, "Full-finetune/Step Time": 6.745275527238846} {"Full-finetune/Learning Rate": 9.52983778560042e-06, "Full-finetune/Loss": 0.7637068629264832, "Full-finetune/Loss (Raw)": 0.8359420299530029, "Full-finetune/Step": 2752, "Full-finetune/Step Time": 6.744866039603949} {"Full-finetune/Learning Rate": 9.523615155742317e-06, "Full-finetune/Loss": 0.7662042379379272, "Full-finetune/Loss (Raw)": 0.9270390272140503, "Full-finetune/Step": 2753, "Full-finetune/Step Time": 6.730974163860083} {"Full-finetune/Learning Rate": 9.517392710759872e-06, "Full-finetune/Loss": 0.7700519561767578, "Full-finetune/Loss (Raw)": 0.8030875325202942, "Full-finetune/Step": 2754, "Full-finetune/Step Time": 6.7101683262735605} {"Full-finetune/Learning Rate": 9.511170453067899e-06, "Full-finetune/Loss": 0.7666311264038086, "Full-finetune/Loss (Raw)": 0.353922039270401, "Full-finetune/Step": 2755, "Full-finetune/Step Time": 6.732480188831687} {"Full-finetune/Learning Rate": 9.504948385081121e-06, "Full-finetune/Loss": 0.7661193609237671, "Full-finetune/Loss (Raw)": 0.819446325302124, "Full-finetune/Step": 2756, "Full-finetune/Step Time": 6.74890842474997} {"Full-finetune/Learning Rate": 9.498726509214216e-06, "Full-finetune/Loss": 0.7671651840209961, "Full-finetune/Loss (Raw)": 0.659935474395752, "Full-finetune/Step": 2757, "Full-finetune/Step Time": 6.7648900002241135} {"Full-finetune/Learning Rate": 9.492504827881761e-06, "Full-finetune/Loss": 0.7685519456863403, "Full-finetune/Loss (Raw)": 0.8773150444030762, "Full-finetune/Step": 2758, "Full-finetune/Step Time": 6.7543846145272255} {"Full-finetune/Learning Rate": 9.486283343498277e-06, "Full-finetune/Loss": 0.7671216726303101, "Full-finetune/Loss (Raw)": 0.728879451751709, "Full-finetune/Step": 2759, "Full-finetune/Step Time": 6.755073459818959} {"Full-finetune/Learning Rate": 9.480062058478201e-06, "Full-finetune/Loss": 0.7666428685188293, "Full-finetune/Loss (Raw)": 0.655356764793396, "Full-finetune/Step": 2760, "Full-finetune/Step Time": 6.748917154967785} {"Full-finetune/Learning Rate": 9.473840975235883e-06, "Full-finetune/Loss": 0.7631970643997192, "Full-finetune/Loss (Raw)": 0.41711103916168213, "Full-finetune/Step": 2761, "Full-finetune/Step Time": 6.768557161092758} {"Full-finetune/Learning Rate": 9.467620096185616e-06, "Full-finetune/Loss": 0.7628858089447021, "Full-finetune/Loss (Raw)": 0.7404597997665405, "Full-finetune/Step": 2762, "Full-finetune/Step Time": 6.77751181460917} {"Full-finetune/Learning Rate": 9.46139942374159e-06, "Full-finetune/Loss": 0.7631638646125793, "Full-finetune/Loss (Raw)": 0.8136903643608093, "Full-finetune/Step": 2763, "Full-finetune/Step Time": 6.781767323613167} {"Full-finetune/Learning Rate": 9.455178960317936e-06, "Full-finetune/Loss": 0.7617285251617432, "Full-finetune/Loss (Raw)": 0.784680187702179, "Full-finetune/Step": 2764, "Full-finetune/Step Time": 6.782916244119406} {"Full-finetune/Learning Rate": 9.448958708328694e-06, "Full-finetune/Loss": 0.7584989070892334, "Full-finetune/Loss (Raw)": 0.3459375202655792, "Full-finetune/Step": 2765, "Full-finetune/Step Time": 6.795702775940299} {"Full-finetune/Learning Rate": 9.442738670187814e-06, "Full-finetune/Loss": 0.7577052116394043, "Full-finetune/Loss (Raw)": 0.8134525418281555, "Full-finetune/Step": 2766, "Full-finetune/Step Time": 6.780342997983098} {"Full-finetune/Learning Rate": 9.436518848309178e-06, "Full-finetune/Loss": 0.7581636905670166, "Full-finetune/Loss (Raw)": 0.8282829523086548, "Full-finetune/Step": 2767, "Full-finetune/Step Time": 6.794860286638141} {"Full-finetune/Learning Rate": 9.430299245106574e-06, "Full-finetune/Loss": 0.7621216773986816, "Full-finetune/Loss (Raw)": 0.8506774306297302, "Full-finetune/Step": 2768, "Full-finetune/Step Time": 6.778023341670632} {"Full-finetune/Learning Rate": 9.424079862993712e-06, "Full-finetune/Loss": 0.7625324726104736, "Full-finetune/Loss (Raw)": 0.8499433398246765, "Full-finetune/Step": 2769, "Full-finetune/Step Time": 6.787047263234854} {"Full-finetune/Learning Rate": 9.417860704384214e-06, "Full-finetune/Loss": 0.7606179714202881, "Full-finetune/Loss (Raw)": 0.530117392539978, "Full-finetune/Step": 2770, "Full-finetune/Step Time": 6.803520023822784} {"Full-finetune/Learning Rate": 9.411641771691608e-06, "Full-finetune/Loss": 0.7625683546066284, "Full-finetune/Loss (Raw)": 0.8682925701141357, "Full-finetune/Step": 2771, "Full-finetune/Step Time": 6.7972844541072845} {"Full-finetune/Learning Rate": 9.405423067329344e-06, "Full-finetune/Loss": 0.7640913724899292, "Full-finetune/Loss (Raw)": 0.8576054573059082, "Full-finetune/Step": 2772, "Full-finetune/Step Time": 6.767023665830493} {"Full-finetune/Learning Rate": 9.399204593710777e-06, "Full-finetune/Loss": 0.764892578125, "Full-finetune/Loss (Raw)": 0.8955851197242737, "Full-finetune/Step": 2773, "Full-finetune/Step Time": 6.760525586083531} {"Full-finetune/Learning Rate": 9.392986353249183e-06, "Full-finetune/Loss": 0.7611585855484009, "Full-finetune/Loss (Raw)": 0.328816682100296, "Full-finetune/Step": 2774, "Full-finetune/Step Time": 6.7800576370209455} {"Full-finetune/Learning Rate": 9.386768348357735e-06, "Full-finetune/Loss": 0.7622345089912415, "Full-finetune/Loss (Raw)": 0.8747082948684692, "Full-finetune/Step": 2775, "Full-finetune/Step Time": 6.77078191190958} {"Full-finetune/Learning Rate": 9.380550581449512e-06, "Full-finetune/Loss": 0.7618324160575867, "Full-finetune/Loss (Raw)": 0.7550594210624695, "Full-finetune/Step": 2776, "Full-finetune/Step Time": 6.763823272660375} {"Full-finetune/Learning Rate": 9.37433305493752e-06, "Full-finetune/Loss": 0.7625309228897095, "Full-finetune/Loss (Raw)": 0.8010705709457397, "Full-finetune/Step": 2777, "Full-finetune/Step Time": 6.751441134139895} {"Full-finetune/Learning Rate": 9.368115771234651e-06, "Full-finetune/Loss": 0.7635754346847534, "Full-finetune/Loss (Raw)": 0.8455043435096741, "Full-finetune/Step": 2778, "Full-finetune/Step Time": 6.752928655594587} {"Full-finetune/Learning Rate": 9.361898732753715e-06, "Full-finetune/Loss": 0.7630739808082581, "Full-finetune/Loss (Raw)": 0.7198983430862427, "Full-finetune/Step": 2779, "Full-finetune/Step Time": 6.7590846717357635} {"Full-finetune/Learning Rate": 9.355681941907428e-06, "Full-finetune/Loss": 0.7624702453613281, "Full-finetune/Loss (Raw)": 0.8064054250717163, "Full-finetune/Step": 2780, "Full-finetune/Step Time": 6.758778357878327} {"Full-finetune/Learning Rate": 9.349465401108393e-06, "Full-finetune/Loss": 0.7639778852462769, "Full-finetune/Loss (Raw)": 0.9003188610076904, "Full-finetune/Step": 2781, "Full-finetune/Step Time": 6.744102817028761} {"Full-finetune/Learning Rate": 9.34324911276914e-06, "Full-finetune/Loss": 0.7677451372146606, "Full-finetune/Loss (Raw)": 0.8214201927185059, "Full-finetune/Step": 2782, "Full-finetune/Step Time": 6.726854417473078} {"Full-finetune/Learning Rate": 9.337033079302082e-06, "Full-finetune/Loss": 0.7678592205047607, "Full-finetune/Loss (Raw)": 0.8286269903182983, "Full-finetune/Step": 2783, "Full-finetune/Step Time": 6.730836141854525} {"Full-finetune/Learning Rate": 9.330817303119545e-06, "Full-finetune/Loss": 0.7662676572799683, "Full-finetune/Loss (Raw)": 0.5973876118659973, "Full-finetune/Step": 2784, "Full-finetune/Step Time": 6.743345661088824} {"Full-finetune/Learning Rate": 9.324601786633747e-06, "Full-finetune/Loss": 0.7678189277648926, "Full-finetune/Loss (Raw)": 0.7870782613754272, "Full-finetune/Step": 2785, "Full-finetune/Step Time": 6.742618950083852} {"Full-finetune/Learning Rate": 9.318386532256807e-06, "Full-finetune/Loss": 0.7701184749603271, "Full-finetune/Loss (Raw)": 0.8581156134605408, "Full-finetune/Step": 2786, "Full-finetune/Step Time": 6.719498595222831} {"Full-finetune/Learning Rate": 9.312171542400749e-06, "Full-finetune/Loss": 0.7695484757423401, "Full-finetune/Loss (Raw)": 0.7710684537887573, "Full-finetune/Step": 2787, "Full-finetune/Step Time": 6.719668380916119} {"Full-finetune/Learning Rate": 9.305956819477485e-06, "Full-finetune/Loss": 0.7693995833396912, "Full-finetune/Loss (Raw)": 0.8644401431083679, "Full-finetune/Step": 2788, "Full-finetune/Step Time": 6.739300509914756} {"Full-finetune/Learning Rate": 9.299742365898831e-06, "Full-finetune/Loss": 0.7671964168548584, "Full-finetune/Loss (Raw)": 0.7392324209213257, "Full-finetune/Step": 2789, "Full-finetune/Step Time": 6.7516404036432505} {"Full-finetune/Learning Rate": 9.293528184076495e-06, "Full-finetune/Loss": 0.7664545178413391, "Full-finetune/Loss (Raw)": 0.7826114892959595, "Full-finetune/Step": 2790, "Full-finetune/Step Time": 6.755450813099742} {"Full-finetune/Learning Rate": 9.287314276422074e-06, "Full-finetune/Loss": 0.7642990946769714, "Full-finetune/Loss (Raw)": 0.6143603324890137, "Full-finetune/Step": 2791, "Full-finetune/Step Time": 6.764894049614668} {"Full-finetune/Learning Rate": 9.28110064534707e-06, "Full-finetune/Loss": 0.7671533823013306, "Full-finetune/Loss (Raw)": 0.7992706298828125, "Full-finetune/Step": 2792, "Full-finetune/Step Time": 6.760106418281794} {"Full-finetune/Learning Rate": 9.274887293262869e-06, "Full-finetune/Loss": 0.7691553235054016, "Full-finetune/Loss (Raw)": 0.927168607711792, "Full-finetune/Step": 2793, "Full-finetune/Step Time": 6.757959997281432} {"Full-finetune/Learning Rate": 9.268674222580757e-06, "Full-finetune/Loss": 0.7681715488433838, "Full-finetune/Loss (Raw)": 0.7336856126785278, "Full-finetune/Step": 2794, "Full-finetune/Step Time": 6.766549656167626} {"Full-finetune/Learning Rate": 9.262461435711898e-06, "Full-finetune/Loss": 0.7674708962440491, "Full-finetune/Loss (Raw)": 0.6474773287773132, "Full-finetune/Step": 2795, "Full-finetune/Step Time": 6.777301987633109} {"Full-finetune/Learning Rate": 9.256248935067356e-06, "Full-finetune/Loss": 0.7672439813613892, "Full-finetune/Loss (Raw)": 0.771645188331604, "Full-finetune/Step": 2796, "Full-finetune/Step Time": 6.803627070039511} {"Full-finetune/Learning Rate": 9.250036723058083e-06, "Full-finetune/Loss": 0.7646777033805847, "Full-finetune/Loss (Raw)": 0.5910743474960327, "Full-finetune/Step": 2797, "Full-finetune/Step Time": 6.816182337701321} {"Full-finetune/Learning Rate": 9.243824802094914e-06, "Full-finetune/Loss": 0.7610160112380981, "Full-finetune/Loss (Raw)": 0.3738710880279541, "Full-finetune/Step": 2798, "Full-finetune/Step Time": 6.839359659701586} {"Full-finetune/Learning Rate": 9.237613174588583e-06, "Full-finetune/Loss": 0.7614001035690308, "Full-finetune/Loss (Raw)": 0.672644317150116, "Full-finetune/Step": 2799, "Full-finetune/Step Time": 6.8363516964018345} {"Full-finetune/Learning Rate": 9.231401842949688e-06, "Full-finetune/Loss": 0.7618245482444763, "Full-finetune/Loss (Raw)": 0.6182688474655151, "Full-finetune/Step": 2800, "Full-finetune/Step Time": 6.8201235961169} {"Full-finetune/Learning Rate": 9.225190809588731e-06, "Full-finetune/Loss": 0.7625349760055542, "Full-finetune/Loss (Raw)": 0.8857261538505554, "Full-finetune/Step": 2801, "Full-finetune/Step Time": 6.823115568608046} {"Full-finetune/Learning Rate": 9.218980076916099e-06, "Full-finetune/Loss": 0.7643179893493652, "Full-finetune/Loss (Raw)": 0.8586874604225159, "Full-finetune/Step": 2802, "Full-finetune/Step Time": 6.831759415566921} {"Full-finetune/Learning Rate": 9.212769647342046e-06, "Full-finetune/Loss": 0.7639910578727722, "Full-finetune/Loss (Raw)": 0.7512710690498352, "Full-finetune/Step": 2803, "Full-finetune/Step Time": 6.830133343115449} {"Full-finetune/Learning Rate": 9.206559523276731e-06, "Full-finetune/Loss": 0.7643798589706421, "Full-finetune/Loss (Raw)": 0.8324462175369263, "Full-finetune/Step": 2804, "Full-finetune/Step Time": 6.813665872439742} {"Full-finetune/Learning Rate": 9.200349707130168e-06, "Full-finetune/Loss": 0.7651233673095703, "Full-finetune/Loss (Raw)": 0.9777989387512207, "Full-finetune/Step": 2805, "Full-finetune/Step Time": 6.812175219878554} {"Full-finetune/Learning Rate": 9.194140201312274e-06, "Full-finetune/Loss": 0.7646747827529907, "Full-finetune/Loss (Raw)": 0.7394633293151855, "Full-finetune/Step": 2806, "Full-finetune/Step Time": 6.818182772025466} {"Full-finetune/Learning Rate": 9.187931008232832e-06, "Full-finetune/Loss": 0.7633260488510132, "Full-finetune/Loss (Raw)": 0.7816586494445801, "Full-finetune/Step": 2807, "Full-finetune/Step Time": 6.805088296532631} {"Full-finetune/Learning Rate": 9.181722130301512e-06, "Full-finetune/Loss": 0.761145830154419, "Full-finetune/Loss (Raw)": 0.5918483138084412, "Full-finetune/Step": 2808, "Full-finetune/Step Time": 6.815817819908261} {"Full-finetune/Learning Rate": 9.175513569927865e-06, "Full-finetune/Loss": 0.761233925819397, "Full-finetune/Loss (Raw)": 0.3462146818637848, "Full-finetune/Step": 2809, "Full-finetune/Step Time": 6.8157675582915545} {"Full-finetune/Learning Rate": 9.169305329521296e-06, "Full-finetune/Loss": 0.760299563407898, "Full-finetune/Loss (Raw)": 0.6915247440338135, "Full-finetune/Step": 2810, "Full-finetune/Step Time": 6.813701489940286} {"Full-finetune/Learning Rate": 9.163097411491115e-06, "Full-finetune/Loss": 0.7603363394737244, "Full-finetune/Loss (Raw)": 0.8404822945594788, "Full-finetune/Step": 2811, "Full-finetune/Step Time": 6.816687421873212} {"Full-finetune/Learning Rate": 9.156889818246485e-06, "Full-finetune/Loss": 0.760280966758728, "Full-finetune/Loss (Raw)": 0.7750453948974609, "Full-finetune/Step": 2812, "Full-finetune/Step Time": 6.815916256979108} {"Full-finetune/Learning Rate": 9.150682552196461e-06, "Full-finetune/Loss": 0.7604352235794067, "Full-finetune/Loss (Raw)": 0.8641417026519775, "Full-finetune/Step": 2813, "Full-finetune/Step Time": 6.8147200010716915} {"Full-finetune/Learning Rate": 9.144475615749957e-06, "Full-finetune/Loss": 0.7574857473373413, "Full-finetune/Loss (Raw)": 0.34725385904312134, "Full-finetune/Step": 2814, "Full-finetune/Step Time": 6.831344053149223} {"Full-finetune/Learning Rate": 9.138269011315761e-06, "Full-finetune/Loss": 0.7586534023284912, "Full-finetune/Loss (Raw)": 0.9283662438392639, "Full-finetune/Step": 2815, "Full-finetune/Step Time": 6.833287492394447} {"Full-finetune/Learning Rate": 9.13206274130254e-06, "Full-finetune/Loss": 0.7584327459335327, "Full-finetune/Loss (Raw)": 0.8216721415519714, "Full-finetune/Step": 2816, "Full-finetune/Step Time": 6.830840051174164} {"Full-finetune/Learning Rate": 9.125856808118822e-06, "Full-finetune/Loss": 0.757330060005188, "Full-finetune/Loss (Raw)": 0.7936437129974365, "Full-finetune/Step": 2817, "Full-finetune/Step Time": 6.827519116923213} {"Full-finetune/Learning Rate": 9.119651214173012e-06, "Full-finetune/Loss": 0.7606140375137329, "Full-finetune/Loss (Raw)": 0.7864048480987549, "Full-finetune/Step": 2818, "Full-finetune/Step Time": 6.812781820073724} {"Full-finetune/Learning Rate": 9.11344596187338e-06, "Full-finetune/Loss": 0.7609632611274719, "Full-finetune/Loss (Raw)": 0.9295225739479065, "Full-finetune/Step": 2819, "Full-finetune/Step Time": 6.814679648727179} {"Full-finetune/Learning Rate": 9.107241053628058e-06, "Full-finetune/Loss": 0.7620460987091064, "Full-finetune/Loss (Raw)": 0.9155678153038025, "Full-finetune/Step": 2820, "Full-finetune/Step Time": 6.814074020832777} {"Full-finetune/Learning Rate": 9.101036491845056e-06, "Full-finetune/Loss": 0.7603516578674316, "Full-finetune/Loss (Raw)": 0.6249840259552002, "Full-finetune/Step": 2821, "Full-finetune/Step Time": 6.826426938176155} {"Full-finetune/Learning Rate": 9.094832278932238e-06, "Full-finetune/Loss": 0.7610845565795898, "Full-finetune/Loss (Raw)": 0.8348283171653748, "Full-finetune/Step": 2822, "Full-finetune/Step Time": 6.821885135024786} {"Full-finetune/Learning Rate": 9.088628417297346e-06, "Full-finetune/Loss": 0.7581526041030884, "Full-finetune/Loss (Raw)": 0.401183158159256, "Full-finetune/Step": 2823, "Full-finetune/Step Time": 6.8336782194674015} {"Full-finetune/Learning Rate": 9.082424909347969e-06, "Full-finetune/Loss": 0.756759762763977, "Full-finetune/Loss (Raw)": 0.6216112971305847, "Full-finetune/Step": 2824, "Full-finetune/Step Time": 6.820510223507881} {"Full-finetune/Learning Rate": 9.076221757491568e-06, "Full-finetune/Loss": 0.7559407353401184, "Full-finetune/Loss (Raw)": 0.7068062424659729, "Full-finetune/Step": 2825, "Full-finetune/Step Time": 6.819337978959084} {"Full-finetune/Learning Rate": 9.070018964135471e-06, "Full-finetune/Loss": 0.7555273771286011, "Full-finetune/Loss (Raw)": 0.6665260791778564, "Full-finetune/Step": 2826, "Full-finetune/Step Time": 6.821273313835263} {"Full-finetune/Learning Rate": 9.063816531686855e-06, "Full-finetune/Loss": 0.7551355361938477, "Full-finetune/Loss (Raw)": 0.8213886022567749, "Full-finetune/Step": 2827, "Full-finetune/Step Time": 6.803717123344541} {"Full-finetune/Learning Rate": 9.057614462552769e-06, "Full-finetune/Loss": 0.7563172578811646, "Full-finetune/Loss (Raw)": 0.9531206488609314, "Full-finetune/Step": 2828, "Full-finetune/Step Time": 6.803634498268366} {"Full-finetune/Learning Rate": 9.05141275914011e-06, "Full-finetune/Loss": 0.7568473815917969, "Full-finetune/Loss (Raw)": 0.8375511169433594, "Full-finetune/Step": 2829, "Full-finetune/Step Time": 6.785890486091375} {"Full-finetune/Learning Rate": 9.045211423855637e-06, "Full-finetune/Loss": 0.7571888566017151, "Full-finetune/Loss (Raw)": 0.88948655128479, "Full-finetune/Step": 2830, "Full-finetune/Step Time": 6.778221404179931} {"Full-finetune/Learning Rate": 9.039010459105974e-06, "Full-finetune/Loss": 0.759583592414856, "Full-finetune/Loss (Raw)": 1.0189745426177979, "Full-finetune/Step": 2831, "Full-finetune/Step Time": 6.761385187506676} {"Full-finetune/Learning Rate": 9.032809867297586e-06, "Full-finetune/Loss": 0.7614859938621521, "Full-finetune/Loss (Raw)": 0.9381343126296997, "Full-finetune/Step": 2832, "Full-finetune/Step Time": 6.756117546930909} {"Full-finetune/Learning Rate": 9.02660965083681e-06, "Full-finetune/Loss": 0.7617775201797485, "Full-finetune/Loss (Raw)": 0.7963295578956604, "Full-finetune/Step": 2833, "Full-finetune/Step Time": 6.7634387873113155} {"Full-finetune/Learning Rate": 9.020409812129824e-06, "Full-finetune/Loss": 0.757692277431488, "Full-finetune/Loss (Raw)": 0.3570704758167267, "Full-finetune/Step": 2834, "Full-finetune/Step Time": 6.774014342576265} {"Full-finetune/Learning Rate": 9.014210353582662e-06, "Full-finetune/Loss": 0.7565778493881226, "Full-finetune/Loss (Raw)": 0.8215456008911133, "Full-finetune/Step": 2835, "Full-finetune/Step Time": 6.77674550563097} {"Full-finetune/Learning Rate": 9.008011277601217e-06, "Full-finetune/Loss": 0.7544592022895813, "Full-finetune/Loss (Raw)": 0.6364145874977112, "Full-finetune/Step": 2836, "Full-finetune/Step Time": 6.76980085298419} {"Full-finetune/Learning Rate": 9.001812586591228e-06, "Full-finetune/Loss": 0.7551895380020142, "Full-finetune/Loss (Raw)": 0.8510503768920898, "Full-finetune/Step": 2837, "Full-finetune/Step Time": 6.757361559197307} {"Full-finetune/Learning Rate": 8.995614282958289e-06, "Full-finetune/Loss": 0.7578648924827576, "Full-finetune/Loss (Raw)": 0.7137866020202637, "Full-finetune/Step": 2838, "Full-finetune/Step Time": 6.734711838886142} {"Full-finetune/Learning Rate": 8.989416369107837e-06, "Full-finetune/Loss": 0.7566581964492798, "Full-finetune/Loss (Raw)": 0.7068800330162048, "Full-finetune/Step": 2839, "Full-finetune/Step Time": 6.7401791755110025} {"Full-finetune/Learning Rate": 8.983218847445157e-06, "Full-finetune/Loss": 0.7564949989318848, "Full-finetune/Loss (Raw)": 0.7956704497337341, "Full-finetune/Step": 2840, "Full-finetune/Step Time": 6.7240445502102375} {"Full-finetune/Learning Rate": 8.977021720375395e-06, "Full-finetune/Loss": 0.7576590776443481, "Full-finetune/Loss (Raw)": 0.9291113615036011, "Full-finetune/Step": 2841, "Full-finetune/Step Time": 6.7187273018062115} {"Full-finetune/Learning Rate": 8.970824990303532e-06, "Full-finetune/Loss": 0.7571742534637451, "Full-finetune/Loss (Raw)": 0.8262497782707214, "Full-finetune/Step": 2842, "Full-finetune/Step Time": 6.720881182700396} {"Full-finetune/Learning Rate": 8.9646286596344e-06, "Full-finetune/Loss": 0.756786048412323, "Full-finetune/Loss (Raw)": 0.6794004440307617, "Full-finetune/Step": 2843, "Full-finetune/Step Time": 6.7368693593889475} {"Full-finetune/Learning Rate": 8.958432730772667e-06, "Full-finetune/Loss": 0.757282018661499, "Full-finetune/Loss (Raw)": 0.8508533835411072, "Full-finetune/Step": 2844, "Full-finetune/Step Time": 6.737398561090231} {"Full-finetune/Learning Rate": 8.952237206122855e-06, "Full-finetune/Loss": 0.7569445371627808, "Full-finetune/Loss (Raw)": 0.8003984689712524, "Full-finetune/Step": 2845, "Full-finetune/Step Time": 6.749078553169966} {"Full-finetune/Learning Rate": 8.946042088089331e-06, "Full-finetune/Loss": 0.756955623626709, "Full-finetune/Loss (Raw)": 0.7498326897621155, "Full-finetune/Step": 2846, "Full-finetune/Step Time": 6.746959835290909} {"Full-finetune/Learning Rate": 8.939847379076293e-06, "Full-finetune/Loss": 0.7552491426467896, "Full-finetune/Loss (Raw)": 0.6020646095275879, "Full-finetune/Step": 2847, "Full-finetune/Step Time": 6.768571365624666} {"Full-finetune/Learning Rate": 8.933653081487794e-06, "Full-finetune/Loss": 0.7552551031112671, "Full-finetune/Loss (Raw)": 0.8592011332511902, "Full-finetune/Step": 2848, "Full-finetune/Step Time": 6.775001047179103} {"Full-finetune/Learning Rate": 8.927459197727712e-06, "Full-finetune/Loss": 0.7556908130645752, "Full-finetune/Loss (Raw)": 0.7657244801521301, "Full-finetune/Step": 2849, "Full-finetune/Step Time": 6.770626302808523} {"Full-finetune/Learning Rate": 8.921265730199775e-06, "Full-finetune/Loss": 0.7556673288345337, "Full-finetune/Loss (Raw)": 0.8060253262519836, "Full-finetune/Step": 2850, "Full-finetune/Step Time": 6.765318762511015} {"Full-finetune/Learning Rate": 8.91507268130755e-06, "Full-finetune/Loss": 0.7566580772399902, "Full-finetune/Loss (Raw)": 0.8501702547073364, "Full-finetune/Step": 2851, "Full-finetune/Step Time": 6.7726483307778835} {"Full-finetune/Learning Rate": 8.908880053454432e-06, "Full-finetune/Loss": 0.7566643953323364, "Full-finetune/Loss (Raw)": 0.8238564729690552, "Full-finetune/Step": 2852, "Full-finetune/Step Time": 6.773094229400158} {"Full-finetune/Learning Rate": 8.90268784904367e-06, "Full-finetune/Loss": 0.7562263011932373, "Full-finetune/Loss (Raw)": 0.7494766712188721, "Full-finetune/Step": 2853, "Full-finetune/Step Time": 6.773733522742987} {"Full-finetune/Learning Rate": 8.896496070478326e-06, "Full-finetune/Loss": 0.7567470073699951, "Full-finetune/Loss (Raw)": 0.8721819519996643, "Full-finetune/Step": 2854, "Full-finetune/Step Time": 6.766017612069845} {"Full-finetune/Learning Rate": 8.890304720161311e-06, "Full-finetune/Loss": 0.7566702365875244, "Full-finetune/Loss (Raw)": 0.7810390591621399, "Full-finetune/Step": 2855, "Full-finetune/Step Time": 6.780084660276771} {"Full-finetune/Learning Rate": 8.884113800495372e-06, "Full-finetune/Loss": 0.7584501504898071, "Full-finetune/Loss (Raw)": 0.7744452357292175, "Full-finetune/Step": 2856, "Full-finetune/Step Time": 6.793122353032231} {"Full-finetune/Learning Rate": 8.87792331388308e-06, "Full-finetune/Loss": 0.7618317604064941, "Full-finetune/Loss (Raw)": 0.8458959460258484, "Full-finetune/Step": 2857, "Full-finetune/Step Time": 6.776671856641769} {"Full-finetune/Learning Rate": 8.871733262726846e-06, "Full-finetune/Loss": 0.7625917196273804, "Full-finetune/Loss (Raw)": 0.7232853770256042, "Full-finetune/Step": 2858, "Full-finetune/Step Time": 6.768864449113607} {"Full-finetune/Learning Rate": 8.865543649428903e-06, "Full-finetune/Loss": 0.7626967430114746, "Full-finetune/Loss (Raw)": 0.8112335801124573, "Full-finetune/Step": 2859, "Full-finetune/Step Time": 6.775552595034242} {"Full-finetune/Learning Rate": 8.859354476391319e-06, "Full-finetune/Loss": 0.7616904973983765, "Full-finetune/Loss (Raw)": 0.687279999256134, "Full-finetune/Step": 2860, "Full-finetune/Step Time": 6.774904442951083} {"Full-finetune/Learning Rate": 8.853165746015997e-06, "Full-finetune/Loss": 0.7624844312667847, "Full-finetune/Loss (Raw)": 0.9644652009010315, "Full-finetune/Step": 2861, "Full-finetune/Step Time": 6.775111911818385} {"Full-finetune/Learning Rate": 8.846977460704656e-06, "Full-finetune/Loss": 0.7624640464782715, "Full-finetune/Loss (Raw)": 0.759691596031189, "Full-finetune/Step": 2862, "Full-finetune/Step Time": 6.7807093616575} {"Full-finetune/Learning Rate": 8.840789622858856e-06, "Full-finetune/Loss": 0.7617464065551758, "Full-finetune/Loss (Raw)": 0.782353401184082, "Full-finetune/Step": 2863, "Full-finetune/Step Time": 6.767554813995957} {"Full-finetune/Learning Rate": 8.834602234879968e-06, "Full-finetune/Loss": 0.7637536525726318, "Full-finetune/Loss (Raw)": 0.7127553224563599, "Full-finetune/Step": 2864, "Full-finetune/Step Time": 6.7473578825592995} {"Full-finetune/Learning Rate": 8.8284152991692e-06, "Full-finetune/Loss": 0.7665340900421143, "Full-finetune/Loss (Raw)": 0.8853369355201721, "Full-finetune/Step": 2865, "Full-finetune/Step Time": 6.739681446924806} {"Full-finetune/Learning Rate": 8.822228818127584e-06, "Full-finetune/Loss": 0.7628855109214783, "Full-finetune/Loss (Raw)": 0.3888522982597351, "Full-finetune/Step": 2866, "Full-finetune/Step Time": 6.754778869450092} {"Full-finetune/Learning Rate": 8.81604279415597e-06, "Full-finetune/Loss": 0.7625179290771484, "Full-finetune/Loss (Raw)": 0.8404356241226196, "Full-finetune/Step": 2867, "Full-finetune/Step Time": 6.758286086842418} {"Full-finetune/Learning Rate": 8.809857229655029e-06, "Full-finetune/Loss": 0.76438307762146, "Full-finetune/Loss (Raw)": 0.9305130839347839, "Full-finetune/Step": 2868, "Full-finetune/Step Time": 6.752770917490125} {"Full-finetune/Learning Rate": 8.803672127025264e-06, "Full-finetune/Loss": 0.7621067762374878, "Full-finetune/Loss (Raw)": 0.5947600603103638, "Full-finetune/Step": 2869, "Full-finetune/Step Time": 6.773860303685069} {"Full-finetune/Learning Rate": 8.797487488666986e-06, "Full-finetune/Loss": 0.7589170932769775, "Full-finetune/Loss (Raw)": 0.37456801533699036, "Full-finetune/Step": 2870, "Full-finetune/Step Time": 6.785947622731328} {"Full-finetune/Learning Rate": 8.791303316980342e-06, "Full-finetune/Loss": 0.7593269348144531, "Full-finetune/Loss (Raw)": 0.9443681836128235, "Full-finetune/Step": 2871, "Full-finetune/Step Time": 6.7855926267802715} {"Full-finetune/Learning Rate": 8.785119614365282e-06, "Full-finetune/Loss": 0.7601742744445801, "Full-finetune/Loss (Raw)": 0.9240446090698242, "Full-finetune/Step": 2872, "Full-finetune/Step Time": 6.785995235666633} {"Full-finetune/Learning Rate": 8.77893638322158e-06, "Full-finetune/Loss": 0.7597440481185913, "Full-finetune/Loss (Raw)": 0.8435782790184021, "Full-finetune/Step": 2873, "Full-finetune/Step Time": 6.788103122264147} {"Full-finetune/Learning Rate": 8.772753625948828e-06, "Full-finetune/Loss": 0.7561259269714355, "Full-finetune/Loss (Raw)": 0.35571974515914917, "Full-finetune/Step": 2874, "Full-finetune/Step Time": 6.79432937502861} {"Full-finetune/Learning Rate": 8.766571344946433e-06, "Full-finetune/Loss": 0.7566465139389038, "Full-finetune/Loss (Raw)": 0.8712265491485596, "Full-finetune/Step": 2875, "Full-finetune/Step Time": 6.775251053273678} {"Full-finetune/Learning Rate": 8.760389542613619e-06, "Full-finetune/Loss": 0.7556862235069275, "Full-finetune/Loss (Raw)": 0.807830274105072, "Full-finetune/Step": 2876, "Full-finetune/Step Time": 6.785239828750491} {"Full-finetune/Learning Rate": 8.754208221349427e-06, "Full-finetune/Loss": 0.7551857829093933, "Full-finetune/Loss (Raw)": 0.7898996472358704, "Full-finetune/Step": 2877, "Full-finetune/Step Time": 6.787978079169989} {"Full-finetune/Learning Rate": 8.748027383552696e-06, "Full-finetune/Loss": 0.7546508312225342, "Full-finetune/Loss (Raw)": 0.7155252695083618, "Full-finetune/Step": 2878, "Full-finetune/Step Time": 6.79412991926074} {"Full-finetune/Learning Rate": 8.741847031622096e-06, "Full-finetune/Loss": 0.7542234659194946, "Full-finetune/Loss (Raw)": 0.7268849611282349, "Full-finetune/Step": 2879, "Full-finetune/Step Time": 6.795778188854456} {"Full-finetune/Learning Rate": 8.7356671679561e-06, "Full-finetune/Loss": 0.7548537254333496, "Full-finetune/Loss (Raw)": 0.9166058301925659, "Full-finetune/Step": 2880, "Full-finetune/Step Time": 6.787448789924383} {"Full-finetune/Learning Rate": 8.729487794952992e-06, "Full-finetune/Loss": 0.7540687918663025, "Full-finetune/Loss (Raw)": 0.8265737295150757, "Full-finetune/Step": 2881, "Full-finetune/Step Time": 6.792997304350138} {"Full-finetune/Learning Rate": 8.72330891501087e-06, "Full-finetune/Loss": 0.7547556161880493, "Full-finetune/Loss (Raw)": 0.8909989595413208, "Full-finetune/Step": 2882, "Full-finetune/Step Time": 6.7943105939775705} {"Full-finetune/Learning Rate": 8.717130530527626e-06, "Full-finetune/Loss": 0.7592188119888306, "Full-finetune/Loss (Raw)": 0.9252104163169861, "Full-finetune/Step": 2883, "Full-finetune/Step Time": 6.778627684339881} {"Full-finetune/Learning Rate": 8.710952643900983e-06, "Full-finetune/Loss": 0.7584071159362793, "Full-finetune/Loss (Raw)": 0.7155506014823914, "Full-finetune/Step": 2884, "Full-finetune/Step Time": 6.78521073050797} {"Full-finetune/Learning Rate": 8.704775257528446e-06, "Full-finetune/Loss": 0.7600263357162476, "Full-finetune/Loss (Raw)": 0.8672015070915222, "Full-finetune/Step": 2885, "Full-finetune/Step Time": 6.753909062594175} {"Full-finetune/Learning Rate": 8.69859837380735e-06, "Full-finetune/Loss": 0.7577176094055176, "Full-finetune/Loss (Raw)": 0.5817908644676208, "Full-finetune/Step": 2886, "Full-finetune/Step Time": 6.777399644255638} {"Full-finetune/Learning Rate": 8.692421995134819e-06, "Full-finetune/Loss": 0.757300853729248, "Full-finetune/Loss (Raw)": 0.6755434274673462, "Full-finetune/Step": 2887, "Full-finetune/Step Time": 6.782820938155055} {"Full-finetune/Learning Rate": 8.686246123907778e-06, "Full-finetune/Loss": 0.7598875164985657, "Full-finetune/Loss (Raw)": 0.9864435791969299, "Full-finetune/Step": 2888, "Full-finetune/Step Time": 6.791333040222526} {"Full-finetune/Learning Rate": 8.680070762522969e-06, "Full-finetune/Loss": 0.7591938376426697, "Full-finetune/Loss (Raw)": 0.32831522822380066, "Full-finetune/Step": 2889, "Full-finetune/Step Time": 6.7906259167939425} {"Full-finetune/Learning Rate": 8.673895913376928e-06, "Full-finetune/Loss": 0.7592717409133911, "Full-finetune/Loss (Raw)": 0.7504324316978455, "Full-finetune/Step": 2890, "Full-finetune/Step Time": 6.78004421107471} {"Full-finetune/Learning Rate": 8.667721578865993e-06, "Full-finetune/Loss": 0.7588227987289429, "Full-finetune/Loss (Raw)": 0.756226122379303, "Full-finetune/Step": 2891, "Full-finetune/Step Time": 6.779597472399473} {"Full-finetune/Learning Rate": 8.661547761386307e-06, "Full-finetune/Loss": 0.7604135274887085, "Full-finetune/Loss (Raw)": 0.9883031249046326, "Full-finetune/Step": 2892, "Full-finetune/Step Time": 6.7887037973850965} {"Full-finetune/Learning Rate": 8.655374463333797e-06, "Full-finetune/Loss": 0.7638763189315796, "Full-finetune/Loss (Raw)": 0.7891676425933838, "Full-finetune/Step": 2893, "Full-finetune/Step Time": 6.76935132406652} {"Full-finetune/Learning Rate": 8.649201687104209e-06, "Full-finetune/Loss": 0.7645187377929688, "Full-finetune/Loss (Raw)": 0.8956795930862427, "Full-finetune/Step": 2894, "Full-finetune/Step Time": 6.768372738733888} {"Full-finetune/Learning Rate": 8.643029435093072e-06, "Full-finetune/Loss": 0.7644699811935425, "Full-finetune/Loss (Raw)": 0.8220452666282654, "Full-finetune/Step": 2895, "Full-finetune/Step Time": 6.755188023671508} {"Full-finetune/Learning Rate": 8.63685770969572e-06, "Full-finetune/Loss": 0.7646620273590088, "Full-finetune/Loss (Raw)": 0.8752582669258118, "Full-finetune/Step": 2896, "Full-finetune/Step Time": 6.757860749959946} {"Full-finetune/Learning Rate": 8.630686513307282e-06, "Full-finetune/Loss": 0.7649093866348267, "Full-finetune/Loss (Raw)": 0.8816027641296387, "Full-finetune/Step": 2897, "Full-finetune/Step Time": 6.752229543402791} {"Full-finetune/Learning Rate": 8.62451584832267e-06, "Full-finetune/Loss": 0.7672707438468933, "Full-finetune/Loss (Raw)": 0.8323727250099182, "Full-finetune/Step": 2898, "Full-finetune/Step Time": 6.7365081906318665} {"Full-finetune/Learning Rate": 8.618345717136604e-06, "Full-finetune/Loss": 0.7666987180709839, "Full-finetune/Loss (Raw)": 0.7950724363327026, "Full-finetune/Step": 2899, "Full-finetune/Step Time": 6.736934429034591} {"Full-finetune/Learning Rate": 8.612176122143589e-06, "Full-finetune/Loss": 0.7652578949928284, "Full-finetune/Loss (Raw)": 0.673183262348175, "Full-finetune/Step": 2900, "Full-finetune/Step Time": 6.741212038323283} {"Full-finetune/Learning Rate": 8.606007065737928e-06, "Full-finetune/Loss": 0.7636030912399292, "Full-finetune/Loss (Raw)": 0.6837663650512695, "Full-finetune/Step": 2901, "Full-finetune/Step Time": 6.750801770016551} {"Full-finetune/Learning Rate": 8.599838550313714e-06, "Full-finetune/Loss": 0.7671945095062256, "Full-finetune/Loss (Raw)": 0.788527250289917, "Full-finetune/Step": 2902, "Full-finetune/Step Time": 6.764634238556027} {"Full-finetune/Learning Rate": 8.593670578264814e-06, "Full-finetune/Loss": 0.7668946981430054, "Full-finetune/Loss (Raw)": 0.8363250494003296, "Full-finetune/Step": 2903, "Full-finetune/Step Time": 6.767534822225571} {"Full-finetune/Learning Rate": 8.587503151984911e-06, "Full-finetune/Loss": 0.767197847366333, "Full-finetune/Loss (Raw)": 0.793859601020813, "Full-finetune/Step": 2904, "Full-finetune/Step Time": 6.765295293182135} {"Full-finetune/Learning Rate": 8.581336273867455e-06, "Full-finetune/Loss": 0.7673167586326599, "Full-finetune/Loss (Raw)": 0.81629478931427, "Full-finetune/Step": 2905, "Full-finetune/Step Time": 6.767445703968406} {"Full-finetune/Learning Rate": 8.575169946305699e-06, "Full-finetune/Loss": 0.767580509185791, "Full-finetune/Loss (Raw)": 0.8792630434036255, "Full-finetune/Step": 2906, "Full-finetune/Step Time": 6.788917765021324} {"Full-finetune/Learning Rate": 8.569004171692667e-06, "Full-finetune/Loss": 0.7681745290756226, "Full-finetune/Loss (Raw)": 0.7959386110305786, "Full-finetune/Step": 2907, "Full-finetune/Step Time": 6.791225386783481} {"Full-finetune/Learning Rate": 8.562838952421177e-06, "Full-finetune/Loss": 0.7686179876327515, "Full-finetune/Loss (Raw)": 0.8631630539894104, "Full-finetune/Step": 2908, "Full-finetune/Step Time": 6.794029071927071} {"Full-finetune/Learning Rate": 8.556674290883833e-06, "Full-finetune/Loss": 0.7693431377410889, "Full-finetune/Loss (Raw)": 0.9931328296661377, "Full-finetune/Step": 2909, "Full-finetune/Step Time": 6.7878765519708395} {"Full-finetune/Learning Rate": 8.550510189473016e-06, "Full-finetune/Loss": 0.770035445690155, "Full-finetune/Loss (Raw)": 0.9100417494773865, "Full-finetune/Step": 2910, "Full-finetune/Step Time": 6.790087318047881} {"Full-finetune/Learning Rate": 8.544346650580899e-06, "Full-finetune/Loss": 0.770978569984436, "Full-finetune/Loss (Raw)": 0.9493504166603088, "Full-finetune/Step": 2911, "Full-finetune/Step Time": 6.7752560675144196} {"Full-finetune/Learning Rate": 8.538183676599426e-06, "Full-finetune/Loss": 0.772852897644043, "Full-finetune/Loss (Raw)": 0.8372970819473267, "Full-finetune/Step": 2912, "Full-finetune/Step Time": 6.767272036522627} {"Full-finetune/Learning Rate": 8.532021269920326e-06, "Full-finetune/Loss": 0.7731842994689941, "Full-finetune/Loss (Raw)": 0.8295064568519592, "Full-finetune/Step": 2913, "Full-finetune/Step Time": 6.74941031076014} {"Full-finetune/Learning Rate": 8.525859432935114e-06, "Full-finetune/Loss": 0.7712632417678833, "Full-finetune/Loss (Raw)": 0.6122116446495056, "Full-finetune/Step": 2914, "Full-finetune/Step Time": 6.77602095156908} {"Full-finetune/Learning Rate": 8.519698168035074e-06, "Full-finetune/Loss": 0.7697454690933228, "Full-finetune/Loss (Raw)": 0.5767995715141296, "Full-finetune/Step": 2915, "Full-finetune/Step Time": 6.787681745365262} {"Full-finetune/Learning Rate": 8.513537477611278e-06, "Full-finetune/Loss": 0.7697130441665649, "Full-finetune/Loss (Raw)": 0.8602926731109619, "Full-finetune/Step": 2916, "Full-finetune/Step Time": 6.775264386087656} {"Full-finetune/Learning Rate": 8.507377364054566e-06, "Full-finetune/Loss": 0.7711162567138672, "Full-finetune/Loss (Raw)": 0.9188326597213745, "Full-finetune/Step": 2917, "Full-finetune/Step Time": 6.759352860972285} {"Full-finetune/Learning Rate": 8.501217829755554e-06, "Full-finetune/Loss": 0.7705645561218262, "Full-finetune/Loss (Raw)": 0.7119987607002258, "Full-finetune/Step": 2918, "Full-finetune/Step Time": 6.764352101832628} {"Full-finetune/Learning Rate": 8.495058877104642e-06, "Full-finetune/Loss": 0.7723120450973511, "Full-finetune/Loss (Raw)": 0.8380428552627563, "Full-finetune/Step": 2919, "Full-finetune/Step Time": 6.742780098691583} {"Full-finetune/Learning Rate": 8.488900508491999e-06, "Full-finetune/Loss": 0.7687537670135498, "Full-finetune/Loss (Raw)": 0.34379759430885315, "Full-finetune/Step": 2920, "Full-finetune/Step Time": 6.747385231778026} {"Full-finetune/Learning Rate": 8.48274272630757e-06, "Full-finetune/Loss": 0.7677467465400696, "Full-finetune/Loss (Raw)": 0.7982833981513977, "Full-finetune/Step": 2921, "Full-finetune/Step Time": 6.7643646113574505} {"Full-finetune/Learning Rate": 8.476585532941064e-06, "Full-finetune/Loss": 0.7679311037063599, "Full-finetune/Loss (Raw)": 0.7572798728942871, "Full-finetune/Step": 2922, "Full-finetune/Step Time": 6.7570784240961075} {"Full-finetune/Learning Rate": 8.470428930781969e-06, "Full-finetune/Loss": 0.7685207724571228, "Full-finetune/Loss (Raw)": 0.7229593396186829, "Full-finetune/Step": 2923, "Full-finetune/Step Time": 6.778352107852697} {"Full-finetune/Learning Rate": 8.464272922219547e-06, "Full-finetune/Loss": 0.7693043947219849, "Full-finetune/Loss (Raw)": 0.8719400763511658, "Full-finetune/Step": 2924, "Full-finetune/Step Time": 6.752017676830292} {"Full-finetune/Learning Rate": 8.458117509642817e-06, "Full-finetune/Loss": 0.7717666625976562, "Full-finetune/Loss (Raw)": 0.9062529802322388, "Full-finetune/Step": 2925, "Full-finetune/Step Time": 6.74176368303597} {"Full-finetune/Learning Rate": 8.451962695440586e-06, "Full-finetune/Loss": 0.7750827074050903, "Full-finetune/Loss (Raw)": 0.7983224391937256, "Full-finetune/Step": 2926, "Full-finetune/Step Time": 6.749435517936945} {"Full-finetune/Learning Rate": 8.445808482001405e-06, "Full-finetune/Loss": 0.7741056084632874, "Full-finetune/Loss (Raw)": 0.5475703477859497, "Full-finetune/Step": 2927, "Full-finetune/Step Time": 6.758966675028205} {"Full-finetune/Learning Rate": 8.439654871713608e-06, "Full-finetune/Loss": 0.7755264639854431, "Full-finetune/Loss (Raw)": 0.8001418709754944, "Full-finetune/Step": 2928, "Full-finetune/Step Time": 6.768266793340445} {"Full-finetune/Learning Rate": 8.433501866965294e-06, "Full-finetune/Loss": 0.7752861380577087, "Full-finetune/Loss (Raw)": 0.8549656867980957, "Full-finetune/Step": 2929, "Full-finetune/Step Time": 6.758554253727198} {"Full-finetune/Learning Rate": 8.42734947014432e-06, "Full-finetune/Loss": 0.7753762602806091, "Full-finetune/Loss (Raw)": 0.8702202439308167, "Full-finetune/Step": 2930, "Full-finetune/Step Time": 6.741775635629892} {"Full-finetune/Learning Rate": 8.42119768363832e-06, "Full-finetune/Loss": 0.7763946056365967, "Full-finetune/Loss (Raw)": 0.8816184997558594, "Full-finetune/Step": 2931, "Full-finetune/Step Time": 6.745076648890972} {"Full-finetune/Learning Rate": 8.415046509834668e-06, "Full-finetune/Loss": 0.7766178846359253, "Full-finetune/Loss (Raw)": 0.8610333204269409, "Full-finetune/Step": 2932, "Full-finetune/Step Time": 6.748551541939378} {"Full-finetune/Learning Rate": 8.408895951120526e-06, "Full-finetune/Loss": 0.7752906084060669, "Full-finetune/Loss (Raw)": 0.8079001903533936, "Full-finetune/Step": 2933, "Full-finetune/Step Time": 6.760100467130542} {"Full-finetune/Learning Rate": 8.402746009882798e-06, "Full-finetune/Loss": 0.7756873965263367, "Full-finetune/Loss (Raw)": 0.7902534008026123, "Full-finetune/Step": 2934, "Full-finetune/Step Time": 6.754663804545999} {"Full-finetune/Learning Rate": 8.39659668850816e-06, "Full-finetune/Loss": 0.7759719491004944, "Full-finetune/Loss (Raw)": 0.818080723285675, "Full-finetune/Step": 2935, "Full-finetune/Step Time": 6.7603223863989115} {"Full-finetune/Learning Rate": 8.39044798938305e-06, "Full-finetune/Loss": 0.7780847549438477, "Full-finetune/Loss (Raw)": 0.8622814416885376, "Full-finetune/Step": 2936, "Full-finetune/Step Time": 6.766192842274904} {"Full-finetune/Learning Rate": 8.384299914893645e-06, "Full-finetune/Loss": 0.783109188079834, "Full-finetune/Loss (Raw)": 0.9893515110015869, "Full-finetune/Step": 2937, "Full-finetune/Step Time": 6.7493388913571835} {"Full-finetune/Learning Rate": 8.378152467425902e-06, "Full-finetune/Loss": 0.7843946814537048, "Full-finetune/Loss (Raw)": 0.8560693860054016, "Full-finetune/Step": 2938, "Full-finetune/Step Time": 6.74567237496376} {"Full-finetune/Learning Rate": 8.37200564936552e-06, "Full-finetune/Loss": 0.784329354763031, "Full-finetune/Loss (Raw)": 0.8321201205253601, "Full-finetune/Step": 2939, "Full-finetune/Step Time": 6.745075671002269} {"Full-finetune/Learning Rate": 8.365859463097963e-06, "Full-finetune/Loss": 0.7835399508476257, "Full-finetune/Loss (Raw)": 0.6740008592605591, "Full-finetune/Step": 2940, "Full-finetune/Step Time": 6.747600223869085} {"Full-finetune/Learning Rate": 8.359713911008447e-06, "Full-finetune/Loss": 0.7808837294578552, "Full-finetune/Loss (Raw)": 0.5241466760635376, "Full-finetune/Step": 2941, "Full-finetune/Step Time": 6.766129558905959} {"Full-finetune/Learning Rate": 8.353568995481934e-06, "Full-finetune/Loss": 0.7856196165084839, "Full-finetune/Loss (Raw)": 0.9534476399421692, "Full-finetune/Step": 2942, "Full-finetune/Step Time": 6.753090064972639} {"Full-finetune/Learning Rate": 8.347424718903152e-06, "Full-finetune/Loss": 0.7843093872070312, "Full-finetune/Loss (Raw)": 0.7606497406959534, "Full-finetune/Step": 2943, "Full-finetune/Step Time": 6.7582574132829905} {"Full-finetune/Learning Rate": 8.341281083656571e-06, "Full-finetune/Loss": 0.7842650413513184, "Full-finetune/Loss (Raw)": 0.8159963488578796, "Full-finetune/Step": 2944, "Full-finetune/Step Time": 6.7657552398741245} {"Full-finetune/Learning Rate": 8.33513809212642e-06, "Full-finetune/Loss": 0.7839360237121582, "Full-finetune/Loss (Raw)": 0.7515355348587036, "Full-finetune/Step": 2945, "Full-finetune/Step Time": 6.7748850248754025} {"Full-finetune/Learning Rate": 8.328995746696674e-06, "Full-finetune/Loss": 0.7839229106903076, "Full-finetune/Loss (Raw)": 0.7847246527671814, "Full-finetune/Step": 2946, "Full-finetune/Step Time": 6.76691410318017} {"Full-finetune/Learning Rate": 8.32285404975105e-06, "Full-finetune/Loss": 0.782679557800293, "Full-finetune/Loss (Raw)": 0.7703702449798584, "Full-finetune/Step": 2947, "Full-finetune/Step Time": 6.784932212904096} {"Full-finetune/Learning Rate": 8.316713003673028e-06, "Full-finetune/Loss": 0.7811213731765747, "Full-finetune/Loss (Raw)": 0.7161309123039246, "Full-finetune/Step": 2948, "Full-finetune/Step Time": 6.796054236590862} {"Full-finetune/Learning Rate": 8.310572610845824e-06, "Full-finetune/Loss": 0.7829025983810425, "Full-finetune/Loss (Raw)": 0.8529750108718872, "Full-finetune/Step": 2949, "Full-finetune/Step Time": 6.787004914134741} {"Full-finetune/Learning Rate": 8.304432873652412e-06, "Full-finetune/Loss": 0.7829927802085876, "Full-finetune/Loss (Raw)": 0.8463692665100098, "Full-finetune/Step": 2950, "Full-finetune/Step Time": 6.786733498796821} {"Full-finetune/Learning Rate": 8.298293794475495e-06, "Full-finetune/Loss": 0.7822116613388062, "Full-finetune/Loss (Raw)": 0.30119574069976807, "Full-finetune/Step": 2951, "Full-finetune/Step Time": 6.7873763758689165} {"Full-finetune/Learning Rate": 8.29215537569753e-06, "Full-finetune/Loss": 0.7840481996536255, "Full-finetune/Loss (Raw)": 0.8566929697990417, "Full-finetune/Step": 2952, "Full-finetune/Step Time": 6.785800203680992} {"Full-finetune/Learning Rate": 8.286017619700725e-06, "Full-finetune/Loss": 0.7856741547584534, "Full-finetune/Loss (Raw)": 0.9149256944656372, "Full-finetune/Step": 2953, "Full-finetune/Step Time": 6.784642672166228} {"Full-finetune/Learning Rate": 8.279880528867017e-06, "Full-finetune/Loss": 0.7860643267631531, "Full-finetune/Loss (Raw)": 0.7164698243141174, "Full-finetune/Step": 2954, "Full-finetune/Step Time": 6.790678469464183} {"Full-finetune/Learning Rate": 8.273744105578097e-06, "Full-finetune/Loss": 0.787326991558075, "Full-finetune/Loss (Raw)": 0.983010470867157, "Full-finetune/Step": 2955, "Full-finetune/Step Time": 6.797857321798801} {"Full-finetune/Learning Rate": 8.267608352215385e-06, "Full-finetune/Loss": 0.7862056493759155, "Full-finetune/Loss (Raw)": 0.8095954060554504, "Full-finetune/Step": 2956, "Full-finetune/Step Time": 6.794216254726052} {"Full-finetune/Learning Rate": 8.261473271160046e-06, "Full-finetune/Loss": 0.7857202887535095, "Full-finetune/Loss (Raw)": 0.7754181027412415, "Full-finetune/Step": 2957, "Full-finetune/Step Time": 6.783754445612431} {"Full-finetune/Learning Rate": 8.255338864792993e-06, "Full-finetune/Loss": 0.7851536273956299, "Full-finetune/Loss (Raw)": 0.8169569969177246, "Full-finetune/Step": 2958, "Full-finetune/Step Time": 6.787104031071067} {"Full-finetune/Learning Rate": 8.249205135494862e-06, "Full-finetune/Loss": 0.7796742916107178, "Full-finetune/Loss (Raw)": 0.31761056184768677, "Full-finetune/Step": 2959, "Full-finetune/Step Time": 6.802699130028486} {"Full-finetune/Learning Rate": 8.24307208564604e-06, "Full-finetune/Loss": 0.7780992984771729, "Full-finetune/Loss (Raw)": 0.7365414500236511, "Full-finetune/Step": 2960, "Full-finetune/Step Time": 6.801287380978465} {"Full-finetune/Learning Rate": 8.236939717626639e-06, "Full-finetune/Loss": 0.7779377102851868, "Full-finetune/Loss (Raw)": 0.7756478786468506, "Full-finetune/Step": 2961, "Full-finetune/Step Time": 6.786609133705497} {"Full-finetune/Learning Rate": 8.23080803381651e-06, "Full-finetune/Loss": 0.783004879951477, "Full-finetune/Loss (Raw)": 1.005663514137268, "Full-finetune/Step": 2962, "Full-finetune/Step Time": 6.776399014517665} {"Full-finetune/Learning Rate": 8.224677036595245e-06, "Full-finetune/Loss": 0.7832553386688232, "Full-finetune/Loss (Raw)": 0.8536084890365601, "Full-finetune/Step": 2963, "Full-finetune/Step Time": 6.7970492877066135} {"Full-finetune/Learning Rate": 8.218546728342161e-06, "Full-finetune/Loss": 0.7851424217224121, "Full-finetune/Loss (Raw)": 0.8779628872871399, "Full-finetune/Step": 2964, "Full-finetune/Step Time": 6.809968883171678} {"Full-finetune/Learning Rate": 8.212417111436315e-06, "Full-finetune/Loss": 0.7853949069976807, "Full-finetune/Loss (Raw)": 0.8833704590797424, "Full-finetune/Step": 2965, "Full-finetune/Step Time": 6.806191457435489} {"Full-finetune/Learning Rate": 8.206288188256486e-06, "Full-finetune/Loss": 0.7855172753334045, "Full-finetune/Loss (Raw)": 0.7294474840164185, "Full-finetune/Step": 2966, "Full-finetune/Step Time": 6.823400909081101} {"Full-finetune/Learning Rate": 8.20015996118119e-06, "Full-finetune/Loss": 0.7852784395217896, "Full-finetune/Loss (Raw)": 0.6763113141059875, "Full-finetune/Step": 2967, "Full-finetune/Step Time": 6.854760445654392} {"Full-finetune/Learning Rate": 8.194032432588677e-06, "Full-finetune/Loss": 0.7860463857650757, "Full-finetune/Loss (Raw)": 0.8939585089683533, "Full-finetune/Step": 2968, "Full-finetune/Step Time": 6.862355435267091} {"Full-finetune/Learning Rate": 8.187905604856916e-06, "Full-finetune/Loss": 0.7851083278656006, "Full-finetune/Loss (Raw)": 0.809047281742096, "Full-finetune/Step": 2969, "Full-finetune/Step Time": 6.858668047934771} {"Full-finetune/Learning Rate": 8.181779480363614e-06, "Full-finetune/Loss": 0.7847776412963867, "Full-finetune/Loss (Raw)": 0.7839187979698181, "Full-finetune/Step": 2970, "Full-finetune/Step Time": 6.8697499968111515} {"Full-finetune/Learning Rate": 8.175654061486197e-06, "Full-finetune/Loss": 0.7857636213302612, "Full-finetune/Loss (Raw)": 0.8056066632270813, "Full-finetune/Step": 2971, "Full-finetune/Step Time": 6.865850247442722} {"Full-finetune/Learning Rate": 8.16952935060182e-06, "Full-finetune/Loss": 0.7854512929916382, "Full-finetune/Loss (Raw)": 0.8108755946159363, "Full-finetune/Step": 2972, "Full-finetune/Step Time": 6.860971763730049} {"Full-finetune/Learning Rate": 8.163405350087366e-06, "Full-finetune/Loss": 0.7847476601600647, "Full-finetune/Loss (Raw)": 0.7103327512741089, "Full-finetune/Step": 2973, "Full-finetune/Step Time": 6.864178147166967} {"Full-finetune/Learning Rate": 8.157282062319437e-06, "Full-finetune/Loss": 0.785446286201477, "Full-finetune/Loss (Raw)": 0.8392531871795654, "Full-finetune/Step": 2974, "Full-finetune/Step Time": 6.865567719563842} {"Full-finetune/Learning Rate": 8.15115948967437e-06, "Full-finetune/Loss": 0.783804178237915, "Full-finetune/Loss (Raw)": 0.39187923073768616, "Full-finetune/Step": 2975, "Full-finetune/Step Time": 6.859711742028594} {"Full-finetune/Learning Rate": 8.145037634528205e-06, "Full-finetune/Loss": 0.7828894853591919, "Full-finetune/Loss (Raw)": 0.7421166896820068, "Full-finetune/Step": 2976, "Full-finetune/Step Time": 6.853967234492302} {"Full-finetune/Learning Rate": 8.138916499256718e-06, "Full-finetune/Loss": 0.782854437828064, "Full-finetune/Loss (Raw)": 0.7612398266792297, "Full-finetune/Step": 2977, "Full-finetune/Step Time": 6.851073049008846} {"Full-finetune/Learning Rate": 8.132796086235405e-06, "Full-finetune/Loss": 0.7838270664215088, "Full-finetune/Loss (Raw)": 0.930517315864563, "Full-finetune/Step": 2978, "Full-finetune/Step Time": 6.8518411591649055} {"Full-finetune/Learning Rate": 8.126676397839475e-06, "Full-finetune/Loss": 0.7836716175079346, "Full-finetune/Loss (Raw)": 0.8302738070487976, "Full-finetune/Step": 2979, "Full-finetune/Step Time": 6.850805412977934} {"Full-finetune/Learning Rate": 8.120557436443866e-06, "Full-finetune/Loss": 0.7830989360809326, "Full-finetune/Loss (Raw)": 0.7505561709403992, "Full-finetune/Step": 2980, "Full-finetune/Step Time": 6.852719709277153} {"Full-finetune/Learning Rate": 8.11443920442322e-06, "Full-finetune/Loss": 0.7828730940818787, "Full-finetune/Loss (Raw)": 0.7205743789672852, "Full-finetune/Step": 2981, "Full-finetune/Step Time": 6.878131361678243} {"Full-finetune/Learning Rate": 8.108321704151903e-06, "Full-finetune/Loss": 0.7819730043411255, "Full-finetune/Loss (Raw)": 0.7569678425788879, "Full-finetune/Step": 2982, "Full-finetune/Step Time": 6.8712741900235415} {"Full-finetune/Learning Rate": 8.102204938004004e-06, "Full-finetune/Loss": 0.7832274436950684, "Full-finetune/Loss (Raw)": 0.9416065216064453, "Full-finetune/Step": 2983, "Full-finetune/Step Time": 6.851294904947281} {"Full-finetune/Learning Rate": 8.096088908353316e-06, "Full-finetune/Loss": 0.7832649350166321, "Full-finetune/Loss (Raw)": 0.779244065284729, "Full-finetune/Step": 2984, "Full-finetune/Step Time": 6.850696632638574} {"Full-finetune/Learning Rate": 8.089973617573355e-06, "Full-finetune/Loss": 0.7831408977508545, "Full-finetune/Loss (Raw)": 0.8300140500068665, "Full-finetune/Step": 2985, "Full-finetune/Step Time": 6.849475095048547} {"Full-finetune/Learning Rate": 8.08385906803734e-06, "Full-finetune/Loss": 0.7800068855285645, "Full-finetune/Loss (Raw)": 0.3221404552459717, "Full-finetune/Step": 2986, "Full-finetune/Step Time": 6.870205560699105} {"Full-finetune/Learning Rate": 8.07774526211821e-06, "Full-finetune/Loss": 0.7798424959182739, "Full-finetune/Loss (Raw)": 0.7901877760887146, "Full-finetune/Step": 2987, "Full-finetune/Step Time": 6.882693467661738} {"Full-finetune/Learning Rate": 8.071632202188618e-06, "Full-finetune/Loss": 0.7812973260879517, "Full-finetune/Loss (Raw)": 0.873499870300293, "Full-finetune/Step": 2988, "Full-finetune/Step Time": 6.880983496084809} {"Full-finetune/Learning Rate": 8.065519890620922e-06, "Full-finetune/Loss": 0.7787514925003052, "Full-finetune/Loss (Raw)": 0.6386018991470337, "Full-finetune/Step": 2989, "Full-finetune/Step Time": 6.884028268978} {"Full-finetune/Learning Rate": 8.059408329787184e-06, "Full-finetune/Loss": 0.7800147533416748, "Full-finetune/Loss (Raw)": 0.921380877494812, "Full-finetune/Step": 2990, "Full-finetune/Step Time": 6.860285146161914} {"Full-finetune/Learning Rate": 8.053297522059189e-06, "Full-finetune/Loss": 0.7806388139724731, "Full-finetune/Loss (Raw)": 0.8622300624847412, "Full-finetune/Step": 2991, "Full-finetune/Step Time": 6.8645382802933455} {"Full-finetune/Learning Rate": 8.047187469808418e-06, "Full-finetune/Loss": 0.7804957032203674, "Full-finetune/Loss (Raw)": 0.6944440007209778, "Full-finetune/Step": 2992, "Full-finetune/Step Time": 6.875177746638656} {"Full-finetune/Learning Rate": 8.041078175406064e-06, "Full-finetune/Loss": 0.7807735204696655, "Full-finetune/Loss (Raw)": 0.9208935499191284, "Full-finetune/Step": 2993, "Full-finetune/Step Time": 6.870997196063399} {"Full-finetune/Learning Rate": 8.03496964122303e-06, "Full-finetune/Loss": 0.7849805355072021, "Full-finetune/Loss (Raw)": 0.9273515343666077, "Full-finetune/Step": 2994, "Full-finetune/Step Time": 6.848496433347464} {"Full-finetune/Learning Rate": 8.02886186962991e-06, "Full-finetune/Loss": 0.784889817237854, "Full-finetune/Loss (Raw)": 0.8288211822509766, "Full-finetune/Step": 2995, "Full-finetune/Step Time": 6.851241812109947} {"Full-finetune/Learning Rate": 8.022754862997016e-06, "Full-finetune/Loss": 0.7834678888320923, "Full-finetune/Loss (Raw)": 0.7485132813453674, "Full-finetune/Step": 2996, "Full-finetune/Step Time": 6.8659134320914745} {"Full-finetune/Learning Rate": 8.016648623694354e-06, "Full-finetune/Loss": 0.7845954298973083, "Full-finetune/Loss (Raw)": 0.7390869855880737, "Full-finetune/Step": 2997, "Full-finetune/Step Time": 6.835667030885816} {"Full-finetune/Learning Rate": 8.010543154091644e-06, "Full-finetune/Loss": 0.787445604801178, "Full-finetune/Loss (Raw)": 0.7393844723701477, "Full-finetune/Step": 2998, "Full-finetune/Step Time": 6.825619954615831} {"Full-finetune/Learning Rate": 8.004438456558297e-06, "Full-finetune/Loss": 0.7865797281265259, "Full-finetune/Loss (Raw)": 0.8335285186767578, "Full-finetune/Step": 2999, "Full-finetune/Step Time": 6.831468565389514} {"Full-finetune/Learning Rate": 7.99833453346342e-06, "Full-finetune/Loss": 0.7859519720077515, "Full-finetune/Loss (Raw)": 0.8437042832374573, "Full-finetune/Step": 3000, "Full-finetune/Step Time": 6.836425703018904} {"Full-finetune/Learning Rate": 7.992231387175832e-06, "Full-finetune/Loss": 0.7851912379264832, "Full-finetune/Loss (Raw)": 0.7462002635002136, "Full-finetune/Step": 3001, "Full-finetune/Step Time": 6.839159904047847} {"Full-finetune/Learning Rate": 7.986129020064044e-06, "Full-finetune/Loss": 0.7893414497375488, "Full-finetune/Loss (Raw)": 0.8869469165802002, "Full-finetune/Step": 3002, "Full-finetune/Step Time": 6.822863951325417} {"Full-finetune/Learning Rate": 7.980027434496267e-06, "Full-finetune/Loss": 0.7888304591178894, "Full-finetune/Loss (Raw)": 0.8058204054832458, "Full-finetune/Step": 3003, "Full-finetune/Step Time": 6.827856659889221} {"Full-finetune/Learning Rate": 7.97392663284041e-06, "Full-finetune/Loss": 0.7893151640892029, "Full-finetune/Loss (Raw)": 0.8698752522468567, "Full-finetune/Step": 3004, "Full-finetune/Step Time": 6.819551605731249} {"Full-finetune/Learning Rate": 7.967826617464065e-06, "Full-finetune/Loss": 0.7877646684646606, "Full-finetune/Loss (Raw)": 0.5914304256439209, "Full-finetune/Step": 3005, "Full-finetune/Step Time": 6.838036306202412} {"Full-finetune/Learning Rate": 7.961727390734538e-06, "Full-finetune/Loss": 0.7891148328781128, "Full-finetune/Loss (Raw)": 0.8883472084999084, "Full-finetune/Step": 3006, "Full-finetune/Step Time": 6.830636253580451} {"Full-finetune/Learning Rate": 7.955628955018813e-06, "Full-finetune/Loss": 0.788551390171051, "Full-finetune/Loss (Raw)": 0.6547600030899048, "Full-finetune/Step": 3007, "Full-finetune/Step Time": 6.821944732218981} {"Full-finetune/Learning Rate": 7.949531312683582e-06, "Full-finetune/Loss": 0.7881561517715454, "Full-finetune/Loss (Raw)": 0.8660224676132202, "Full-finetune/Step": 3008, "Full-finetune/Step Time": 6.823222270235419} {"Full-finetune/Learning Rate": 7.943434466095216e-06, "Full-finetune/Loss": 0.7889666557312012, "Full-finetune/Loss (Raw)": 0.9303094148635864, "Full-finetune/Step": 3009, "Full-finetune/Step Time": 6.816160812973976} {"Full-finetune/Learning Rate": 7.937338417619781e-06, "Full-finetune/Loss": 0.788147509098053, "Full-finetune/Loss (Raw)": 0.7861538529396057, "Full-finetune/Step": 3010, "Full-finetune/Step Time": 6.817341886460781} {"Full-finetune/Learning Rate": 7.931243169623037e-06, "Full-finetune/Loss": 0.7878237962722778, "Full-finetune/Loss (Raw)": 0.8837757706642151, "Full-finetune/Step": 3011, "Full-finetune/Step Time": 6.814236870035529} {"Full-finetune/Learning Rate": 7.925148724470428e-06, "Full-finetune/Loss": 0.7888883352279663, "Full-finetune/Loss (Raw)": 0.8518100380897522, "Full-finetune/Step": 3012, "Full-finetune/Step Time": 6.786427503451705} {"Full-finetune/Learning Rate": 7.919055084527094e-06, "Full-finetune/Loss": 0.7886606454849243, "Full-finetune/Loss (Raw)": 0.83806312084198, "Full-finetune/Step": 3013, "Full-finetune/Step Time": 6.78291355073452} {"Full-finetune/Learning Rate": 7.912962252157854e-06, "Full-finetune/Loss": 0.789423942565918, "Full-finetune/Loss (Raw)": 0.6794916987419128, "Full-finetune/Step": 3014, "Full-finetune/Step Time": 6.766410520300269} {"Full-finetune/Learning Rate": 7.906870229727216e-06, "Full-finetune/Loss": 0.7889041304588318, "Full-finetune/Loss (Raw)": 0.6090022325515747, "Full-finetune/Step": 3015, "Full-finetune/Step Time": 6.775419093668461} {"Full-finetune/Learning Rate": 7.900779019599378e-06, "Full-finetune/Loss": 0.7871941328048706, "Full-finetune/Loss (Raw)": 0.7675697803497314, "Full-finetune/Step": 3016, "Full-finetune/Step Time": 6.7786412220448256} {"Full-finetune/Learning Rate": 7.894688624138217e-06, "Full-finetune/Loss": 0.7900968790054321, "Full-finetune/Loss (Raw)": 0.6998627781867981, "Full-finetune/Step": 3017, "Full-finetune/Step Time": 6.774933991953731} {"Full-finetune/Learning Rate": 7.8885990457073e-06, "Full-finetune/Loss": 0.789981484413147, "Full-finetune/Loss (Raw)": 0.7356602549552917, "Full-finetune/Step": 3018, "Full-finetune/Step Time": 6.779547618702054} {"Full-finetune/Learning Rate": 7.882510286669875e-06, "Full-finetune/Loss": 0.790247917175293, "Full-finetune/Loss (Raw)": 0.790332019329071, "Full-finetune/Step": 3019, "Full-finetune/Step Time": 6.780257949605584} {"Full-finetune/Learning Rate": 7.876422349388861e-06, "Full-finetune/Loss": 0.7885108590126038, "Full-finetune/Loss (Raw)": 0.7659590244293213, "Full-finetune/Step": 3020, "Full-finetune/Step Time": 6.761248165741563} {"Full-finetune/Learning Rate": 7.870335236226878e-06, "Full-finetune/Loss": 0.7885684967041016, "Full-finetune/Loss (Raw)": 0.7965506315231323, "Full-finetune/Step": 3021, "Full-finetune/Step Time": 6.773929404094815} {"Full-finetune/Learning Rate": 7.864248949546209e-06, "Full-finetune/Loss": 0.7887051105499268, "Full-finetune/Loss (Raw)": 0.9131685495376587, "Full-finetune/Step": 3022, "Full-finetune/Step Time": 6.773846935480833} {"Full-finetune/Learning Rate": 7.858163491708827e-06, "Full-finetune/Loss": 0.7875787615776062, "Full-finetune/Loss (Raw)": 0.6778630614280701, "Full-finetune/Step": 3023, "Full-finetune/Step Time": 6.776727994903922} {"Full-finetune/Learning Rate": 7.85207886507638e-06, "Full-finetune/Loss": 0.7870168685913086, "Full-finetune/Loss (Raw)": 0.8033401370048523, "Full-finetune/Step": 3024, "Full-finetune/Step Time": 6.779965000227094} {"Full-finetune/Learning Rate": 7.845995072010188e-06, "Full-finetune/Loss": 0.7869046926498413, "Full-finetune/Loss (Raw)": 0.8672385811805725, "Full-finetune/Step": 3025, "Full-finetune/Step Time": 6.778597896918654} {"Full-finetune/Learning Rate": 7.839912114871256e-06, "Full-finetune/Loss": 0.7867164611816406, "Full-finetune/Loss (Raw)": 0.8082835078239441, "Full-finetune/Step": 3026, "Full-finetune/Step Time": 6.781927274540067} {"Full-finetune/Learning Rate": 7.83382999602026e-06, "Full-finetune/Loss": 0.7875592708587646, "Full-finetune/Loss (Raw)": 0.9029457569122314, "Full-finetune/Step": 3027, "Full-finetune/Step Time": 6.789775725454092} {"Full-finetune/Learning Rate": 7.827748717817552e-06, "Full-finetune/Loss": 0.7885341644287109, "Full-finetune/Loss (Raw)": 0.7979704737663269, "Full-finetune/Step": 3028, "Full-finetune/Step Time": 6.791888974606991} {"Full-finetune/Learning Rate": 7.821668282623159e-06, "Full-finetune/Loss": 0.7910500764846802, "Full-finetune/Loss (Raw)": 1.0058062076568604, "Full-finetune/Step": 3029, "Full-finetune/Step Time": 6.781435906887054} {"Full-finetune/Learning Rate": 7.815588692796771e-06, "Full-finetune/Loss": 0.7909913063049316, "Full-finetune/Loss (Raw)": 0.781014621257782, "Full-finetune/Step": 3030, "Full-finetune/Step Time": 6.762012304738164} {"Full-finetune/Learning Rate": 7.809509950697769e-06, "Full-finetune/Loss": 0.7910250425338745, "Full-finetune/Loss (Raw)": 0.8406331539154053, "Full-finetune/Step": 3031, "Full-finetune/Step Time": 6.758338252082467} {"Full-finetune/Learning Rate": 7.803432058685187e-06, "Full-finetune/Loss": 0.7911849021911621, "Full-finetune/Loss (Raw)": 0.8143298029899597, "Full-finetune/Step": 3032, "Full-finetune/Step Time": 6.762290956452489} {"Full-finetune/Learning Rate": 7.797355019117743e-06, "Full-finetune/Loss": 0.7914407253265381, "Full-finetune/Loss (Raw)": 0.849031388759613, "Full-finetune/Step": 3033, "Full-finetune/Step Time": 6.758731916546822} {"Full-finetune/Learning Rate": 7.79127883435381e-06, "Full-finetune/Loss": 0.7918888330459595, "Full-finetune/Loss (Raw)": 0.9366223812103271, "Full-finetune/Step": 3034, "Full-finetune/Step Time": 6.733560487627983} {"Full-finetune/Learning Rate": 7.78520350675144e-06, "Full-finetune/Loss": 0.7921956181526184, "Full-finetune/Loss (Raw)": 0.8352049589157104, "Full-finetune/Step": 3035, "Full-finetune/Step Time": 6.72484478354454} {"Full-finetune/Learning Rate": 7.779129038668347e-06, "Full-finetune/Loss": 0.7915326356887817, "Full-finetune/Loss (Raw)": 0.7783000469207764, "Full-finetune/Step": 3036, "Full-finetune/Step Time": 6.736462954431772} {"Full-finetune/Learning Rate": 7.773055432461916e-06, "Full-finetune/Loss": 0.7911678552627563, "Full-finetune/Loss (Raw)": 0.9464424252510071, "Full-finetune/Step": 3037, "Full-finetune/Step Time": 6.739183738827705} {"Full-finetune/Learning Rate": 7.766982690489198e-06, "Full-finetune/Loss": 0.790898323059082, "Full-finetune/Loss (Raw)": 0.8755483031272888, "Full-finetune/Step": 3038, "Full-finetune/Step Time": 6.736880872398615} {"Full-finetune/Learning Rate": 7.7609108151069e-06, "Full-finetune/Loss": 0.7891777753829956, "Full-finetune/Loss (Raw)": 0.7291175723075867, "Full-finetune/Step": 3039, "Full-finetune/Step Time": 6.737297672778368} {"Full-finetune/Learning Rate": 7.754839808671397e-06, "Full-finetune/Loss": 0.7891461253166199, "Full-finetune/Loss (Raw)": 0.8332435488700867, "Full-finetune/Step": 3040, "Full-finetune/Step Time": 6.729627069085836} {"Full-finetune/Learning Rate": 7.748769673538734e-06, "Full-finetune/Loss": 0.7884260416030884, "Full-finetune/Loss (Raw)": 0.7373315691947937, "Full-finetune/Step": 3041, "Full-finetune/Step Time": 6.735114309936762} {"Full-finetune/Learning Rate": 7.742700412064608e-06, "Full-finetune/Loss": 0.7900582551956177, "Full-finetune/Loss (Raw)": 0.8211395144462585, "Full-finetune/Step": 3042, "Full-finetune/Step Time": 6.710271617397666} {"Full-finetune/Learning Rate": 7.736632026604386e-06, "Full-finetune/Loss": 0.7879594564437866, "Full-finetune/Loss (Raw)": 0.30815234780311584, "Full-finetune/Step": 3043, "Full-finetune/Step Time": 6.718252485617995} {"Full-finetune/Learning Rate": 7.730564519513082e-06, "Full-finetune/Loss": 0.7864940762519836, "Full-finetune/Loss (Raw)": 0.6727271676063538, "Full-finetune/Step": 3044, "Full-finetune/Step Time": 6.726481311023235} {"Full-finetune/Learning Rate": 7.724497893145379e-06, "Full-finetune/Loss": 0.783841609954834, "Full-finetune/Loss (Raw)": 0.5793150663375854, "Full-finetune/Step": 3045, "Full-finetune/Step Time": 6.732128292322159} {"Full-finetune/Learning Rate": 7.718432149855622e-06, "Full-finetune/Loss": 0.785971999168396, "Full-finetune/Loss (Raw)": 0.984686553478241, "Full-finetune/Step": 3046, "Full-finetune/Step Time": 6.725950179621577} {"Full-finetune/Learning Rate": 7.7123672919978e-06, "Full-finetune/Loss": 0.7857578992843628, "Full-finetune/Loss (Raw)": 0.8106405735015869, "Full-finetune/Step": 3047, "Full-finetune/Step Time": 6.731978952884674} {"Full-finetune/Learning Rate": 7.706303321925577e-06, "Full-finetune/Loss": 0.7905300855636597, "Full-finetune/Loss (Raw)": 0.9546318650245667, "Full-finetune/Step": 3048, "Full-finetune/Step Time": 6.712687063962221} {"Full-finetune/Learning Rate": 7.700240241992247e-06, "Full-finetune/Loss": 0.7904160022735596, "Full-finetune/Loss (Raw)": 0.7836844325065613, "Full-finetune/Step": 3049, "Full-finetune/Step Time": 6.696321865543723} {"Full-finetune/Learning Rate": 7.694178054550782e-06, "Full-finetune/Loss": 0.7919083833694458, "Full-finetune/Loss (Raw)": 0.9483079314231873, "Full-finetune/Step": 3050, "Full-finetune/Step Time": 6.6868937481194735} {"Full-finetune/Learning Rate": 7.688116761953797e-06, "Full-finetune/Loss": 0.7934288382530212, "Full-finetune/Loss (Raw)": 0.9175726175308228, "Full-finetune/Step": 3051, "Full-finetune/Step Time": 6.666190423071384} {"Full-finetune/Learning Rate": 7.682056366553559e-06, "Full-finetune/Loss": 0.792704164981842, "Full-finetune/Loss (Raw)": 0.779188871383667, "Full-finetune/Step": 3052, "Full-finetune/Step Time": 6.669057372957468} {"Full-finetune/Learning Rate": 7.675996870701999e-06, "Full-finetune/Loss": 0.7926483750343323, "Full-finetune/Loss (Raw)": 0.8991074562072754, "Full-finetune/Step": 3053, "Full-finetune/Step Time": 6.6717601884156466} {"Full-finetune/Learning Rate": 7.669938276750673e-06, "Full-finetune/Loss": 0.7940186858177185, "Full-finetune/Loss (Raw)": 0.9737228155136108, "Full-finetune/Step": 3054, "Full-finetune/Step Time": 6.646498693153262} {"Full-finetune/Learning Rate": 7.663880587050812e-06, "Full-finetune/Loss": 0.7960901260375977, "Full-finetune/Loss (Raw)": 0.8127135038375854, "Full-finetune/Step": 3055, "Full-finetune/Step Time": 6.637669177725911} {"Full-finetune/Learning Rate": 7.657823803953288e-06, "Full-finetune/Loss": 0.7964603900909424, "Full-finetune/Loss (Raw)": 0.8475368618965149, "Full-finetune/Step": 3056, "Full-finetune/Step Time": 6.6161597073078156} {"Full-finetune/Learning Rate": 7.651767929808615e-06, "Full-finetune/Loss": 0.7952338457107544, "Full-finetune/Loss (Raw)": 0.697964608669281, "Full-finetune/Step": 3057, "Full-finetune/Step Time": 6.628110872581601} {"Full-finetune/Learning Rate": 7.645712966966973e-06, "Full-finetune/Loss": 0.7952706813812256, "Full-finetune/Loss (Raw)": 0.8749369978904724, "Full-finetune/Step": 3058, "Full-finetune/Step Time": 6.625170974060893} {"Full-finetune/Learning Rate": 7.639658917778156e-06, "Full-finetune/Loss": 0.7950938940048218, "Full-finetune/Loss (Raw)": 0.8589922785758972, "Full-finetune/Step": 3059, "Full-finetune/Step Time": 6.620784148573875} {"Full-finetune/Learning Rate": 7.633605784591633e-06, "Full-finetune/Loss": 0.795376181602478, "Full-finetune/Loss (Raw)": 0.8971686363220215, "Full-finetune/Step": 3060, "Full-finetune/Step Time": 6.6257198210805655} {"Full-finetune/Learning Rate": 7.627553569756505e-06, "Full-finetune/Loss": 0.7961215376853943, "Full-finetune/Loss (Raw)": 0.9033031463623047, "Full-finetune/Step": 3061, "Full-finetune/Step Time": 6.61654188297689} {"Full-finetune/Learning Rate": 7.621502275621518e-06, "Full-finetune/Loss": 0.7956252694129944, "Full-finetune/Loss (Raw)": 0.7267317175865173, "Full-finetune/Step": 3062, "Full-finetune/Step Time": 6.643591690808535} {"Full-finetune/Learning Rate": 7.615451904535066e-06, "Full-finetune/Loss": 0.7954940795898438, "Full-finetune/Loss (Raw)": 0.8012850284576416, "Full-finetune/Step": 3063, "Full-finetune/Step Time": 6.634339863434434} {"Full-finetune/Learning Rate": 7.609402458845171e-06, "Full-finetune/Loss": 0.7954555749893188, "Full-finetune/Loss (Raw)": 0.8573499321937561, "Full-finetune/Step": 3064, "Full-finetune/Step Time": 6.616637917235494} {"Full-finetune/Learning Rate": 7.60335394089951e-06, "Full-finetune/Loss": 0.7927574515342712, "Full-finetune/Loss (Raw)": 0.6439965963363647, "Full-finetune/Step": 3065, "Full-finetune/Step Time": 6.632272036746144} {"Full-finetune/Learning Rate": 7.597306353045393e-06, "Full-finetune/Loss": 0.7902783155441284, "Full-finetune/Loss (Raw)": 0.5387349128723145, "Full-finetune/Step": 3066, "Full-finetune/Step Time": 6.664663719013333} {"Full-finetune/Learning Rate": 7.5912596976297735e-06, "Full-finetune/Loss": 0.7902549505233765, "Full-finetune/Loss (Raw)": 0.8291312456130981, "Full-finetune/Step": 3067, "Full-finetune/Step Time": 6.664455762133002} {"Full-finetune/Learning Rate": 7.58521397699924e-06, "Full-finetune/Loss": 0.7909777164459229, "Full-finetune/Loss (Raw)": 0.766523003578186, "Full-finetune/Step": 3068, "Full-finetune/Step Time": 6.675264846533537} {"Full-finetune/Learning Rate": 7.579169193500014e-06, "Full-finetune/Loss": 0.7921267151832581, "Full-finetune/Loss (Raw)": 0.6712120175361633, "Full-finetune/Step": 3069, "Full-finetune/Step Time": 6.665467735379934} {"Full-finetune/Learning Rate": 7.573125349477964e-06, "Full-finetune/Loss": 0.7909583449363708, "Full-finetune/Loss (Raw)": 0.8038967251777649, "Full-finetune/Step": 3070, "Full-finetune/Step Time": 6.6629976741969585} {"Full-finetune/Learning Rate": 7.567082447278582e-06, "Full-finetune/Loss": 0.7925615310668945, "Full-finetune/Loss (Raw)": 0.9658566117286682, "Full-finetune/Step": 3071, "Full-finetune/Step Time": 6.653991451486945} {"Full-finetune/Learning Rate": 7.561040489247008e-06, "Full-finetune/Loss": 0.7923793792724609, "Full-finetune/Loss (Raw)": 0.7926904559135437, "Full-finetune/Step": 3072, "Full-finetune/Step Time": 6.655877333134413} {"Full-finetune/Learning Rate": 7.554999477728001e-06, "Full-finetune/Loss": 0.7928820252418518, "Full-finetune/Loss (Raw)": 0.8158713579177856, "Full-finetune/Step": 3073, "Full-finetune/Step Time": 6.655796281993389} {"Full-finetune/Learning Rate": 7.548959415065961e-06, "Full-finetune/Loss": 0.7929513454437256, "Full-finetune/Loss (Raw)": 0.7935965657234192, "Full-finetune/Step": 3074, "Full-finetune/Step Time": 6.657003290951252} {"Full-finetune/Learning Rate": 7.54292030360492e-06, "Full-finetune/Loss": 0.7891983985900879, "Full-finetune/Loss (Raw)": 0.28999418020248413, "Full-finetune/Step": 3075, "Full-finetune/Step Time": 6.658503795042634} {"Full-finetune/Learning Rate": 7.5368821456885375e-06, "Full-finetune/Loss": 0.7889918684959412, "Full-finetune/Loss (Raw)": 0.6896957755088806, "Full-finetune/Step": 3076, "Full-finetune/Step Time": 6.654474074020982} {"Full-finetune/Learning Rate": 7.530844943660111e-06, "Full-finetune/Loss": 0.7890238761901855, "Full-finetune/Loss (Raw)": 0.8570667505264282, "Full-finetune/Step": 3077, "Full-finetune/Step Time": 6.663819778710604} {"Full-finetune/Learning Rate": 7.524808699862552e-06, "Full-finetune/Loss": 0.7878371477127075, "Full-finetune/Loss (Raw)": 0.6944703459739685, "Full-finetune/Step": 3078, "Full-finetune/Step Time": 6.659945445135236} {"Full-finetune/Learning Rate": 7.518773416638412e-06, "Full-finetune/Loss": 0.790294349193573, "Full-finetune/Loss (Raw)": 0.6157194972038269, "Full-finetune/Step": 3079, "Full-finetune/Step Time": 6.663182742893696} {"Full-finetune/Learning Rate": 7.512739096329868e-06, "Full-finetune/Loss": 0.7890685796737671, "Full-finetune/Loss (Raw)": 0.6997941732406616, "Full-finetune/Step": 3080, "Full-finetune/Step Time": 6.666897563263774} {"Full-finetune/Learning Rate": 7.50670574127872e-06, "Full-finetune/Loss": 0.7877160906791687, "Full-finetune/Loss (Raw)": 0.7418054938316345, "Full-finetune/Step": 3081, "Full-finetune/Step Time": 6.679666416719556} {"Full-finetune/Learning Rate": 7.500673353826399e-06, "Full-finetune/Loss": 0.7885439395904541, "Full-finetune/Loss (Raw)": 0.8224339485168457, "Full-finetune/Step": 3082, "Full-finetune/Step Time": 6.672815699130297} {"Full-finetune/Learning Rate": 7.4946419363139535e-06, "Full-finetune/Loss": 0.7875622510910034, "Full-finetune/Loss (Raw)": 0.8573588132858276, "Full-finetune/Step": 3083, "Full-finetune/Step Time": 6.677473267540336} {"Full-finetune/Learning Rate": 7.488611491082056e-06, "Full-finetune/Loss": 0.7872579097747803, "Full-finetune/Loss (Raw)": 0.7706435918807983, "Full-finetune/Step": 3084, "Full-finetune/Step Time": 6.689521027728915} {"Full-finetune/Learning Rate": 7.482582020471012e-06, "Full-finetune/Loss": 0.7888092994689941, "Full-finetune/Loss (Raw)": 0.9739874601364136, "Full-finetune/Step": 3085, "Full-finetune/Step Time": 6.6854820884764194} {"Full-finetune/Learning Rate": 7.476553526820733e-06, "Full-finetune/Loss": 0.7889851927757263, "Full-finetune/Loss (Raw)": 0.8394733667373657, "Full-finetune/Step": 3086, "Full-finetune/Step Time": 6.684156326577067} {"Full-finetune/Learning Rate": 7.4705260124707705e-06, "Full-finetune/Loss": 0.7927281260490417, "Full-finetune/Loss (Raw)": 0.796705424785614, "Full-finetune/Step": 3087, "Full-finetune/Step Time": 6.6696738339960575} {"Full-finetune/Learning Rate": 7.464499479760275e-06, "Full-finetune/Loss": 0.7914443016052246, "Full-finetune/Loss (Raw)": 0.5722110271453857, "Full-finetune/Step": 3088, "Full-finetune/Step Time": 6.666930329054594} {"Full-finetune/Learning Rate": 7.458473931028029e-06, "Full-finetune/Loss": 0.7924181222915649, "Full-finetune/Loss (Raw)": 0.9002965092658997, "Full-finetune/Step": 3089, "Full-finetune/Step Time": 6.670774733647704} {"Full-finetune/Learning Rate": 7.452449368612433e-06, "Full-finetune/Loss": 0.7902615070343018, "Full-finetune/Loss (Raw)": 0.7296156287193298, "Full-finetune/Step": 3090, "Full-finetune/Step Time": 6.6624287981539965} {"Full-finetune/Learning Rate": 7.446425794851498e-06, "Full-finetune/Loss": 0.7893412113189697, "Full-finetune/Loss (Raw)": 0.7358131408691406, "Full-finetune/Step": 3091, "Full-finetune/Step Time": 6.655839718878269} {"Full-finetune/Learning Rate": 7.440403212082863e-06, "Full-finetune/Loss": 0.7847892642021179, "Full-finetune/Loss (Raw)": 0.29531222581863403, "Full-finetune/Step": 3092, "Full-finetune/Step Time": 6.660966258496046} {"Full-finetune/Learning Rate": 7.434381622643766e-06, "Full-finetune/Loss": 0.7842944860458374, "Full-finetune/Loss (Raw)": 0.8200398683547974, "Full-finetune/Step": 3093, "Full-finetune/Step Time": 6.667737508192658} {"Full-finetune/Learning Rate": 7.42836102887107e-06, "Full-finetune/Loss": 0.7852065563201904, "Full-finetune/Loss (Raw)": 0.8461880683898926, "Full-finetune/Step": 3094, "Full-finetune/Step Time": 6.652559939771891} {"Full-finetune/Learning Rate": 7.422341433101254e-06, "Full-finetune/Loss": 0.7860879898071289, "Full-finetune/Loss (Raw)": 0.7891327738761902, "Full-finetune/Step": 3095, "Full-finetune/Step Time": 6.6140919756144285} {"Full-finetune/Learning Rate": 7.4163228376704e-06, "Full-finetune/Loss": 0.7856196761131287, "Full-finetune/Loss (Raw)": 0.8340166211128235, "Full-finetune/Step": 3096, "Full-finetune/Step Time": 6.608697546645999} {"Full-finetune/Learning Rate": 7.410305244914216e-06, "Full-finetune/Loss": 0.7816624641418457, "Full-finetune/Loss (Raw)": 0.3025323152542114, "Full-finetune/Step": 3097, "Full-finetune/Step Time": 6.629029208794236} {"Full-finetune/Learning Rate": 7.404288657168006e-06, "Full-finetune/Loss": 0.7800939083099365, "Full-finetune/Loss (Raw)": 0.5831392407417297, "Full-finetune/Step": 3098, "Full-finetune/Step Time": 6.617451690137386} {"Full-finetune/Learning Rate": 7.398273076766687e-06, "Full-finetune/Loss": 0.7804087400436401, "Full-finetune/Loss (Raw)": 0.8459029793739319, "Full-finetune/Step": 3099, "Full-finetune/Step Time": 6.6207922752946615} {"Full-finetune/Learning Rate": 7.392258506044796e-06, "Full-finetune/Loss": 0.782046377658844, "Full-finetune/Loss (Raw)": 1.0204988718032837, "Full-finetune/Step": 3100, "Full-finetune/Step Time": 6.62269345857203} {"Full-finetune/Learning Rate": 7.386244947336463e-06, "Full-finetune/Loss": 0.7809468507766724, "Full-finetune/Loss (Raw)": 0.5695899128913879, "Full-finetune/Step": 3101, "Full-finetune/Step Time": 6.624229529872537} {"Full-finetune/Learning Rate": 7.380232402975443e-06, "Full-finetune/Loss": 0.7814359068870544, "Full-finetune/Loss (Raw)": 0.9018484354019165, "Full-finetune/Step": 3102, "Full-finetune/Step Time": 6.631353918462992} {"Full-finetune/Learning Rate": 7.3742208752950776e-06, "Full-finetune/Loss": 0.7857272028923035, "Full-finetune/Loss (Raw)": 0.9411697387695312, "Full-finetune/Step": 3103, "Full-finetune/Step Time": 6.624652387574315} {"Full-finetune/Learning Rate": 7.3682103666283245e-06, "Full-finetune/Loss": 0.7866349816322327, "Full-finetune/Loss (Raw)": 0.8583054542541504, "Full-finetune/Step": 3104, "Full-finetune/Step Time": 6.619214987382293} {"Full-finetune/Learning Rate": 7.362200879307748e-06, "Full-finetune/Loss": 0.7874032855033875, "Full-finetune/Loss (Raw)": 0.8595896363258362, "Full-finetune/Step": 3105, "Full-finetune/Step Time": 6.609478756785393} {"Full-finetune/Learning Rate": 7.3561924156655105e-06, "Full-finetune/Loss": 0.7857497930526733, "Full-finetune/Loss (Raw)": 0.718868613243103, "Full-finetune/Step": 3106, "Full-finetune/Step Time": 6.608560575172305} {"Full-finetune/Learning Rate": 7.350184978033386e-06, "Full-finetune/Loss": 0.7867844700813293, "Full-finetune/Loss (Raw)": 0.9627115726470947, "Full-finetune/Step": 3107, "Full-finetune/Step Time": 6.60209908336401} {"Full-finetune/Learning Rate": 7.344178568742734e-06, "Full-finetune/Loss": 0.7868586182594299, "Full-finetune/Loss (Raw)": 0.760047435760498, "Full-finetune/Step": 3108, "Full-finetune/Step Time": 6.595065115019679} {"Full-finetune/Learning Rate": 7.338173190124526e-06, "Full-finetune/Loss": 0.7872616052627563, "Full-finetune/Loss (Raw)": 0.7721620202064514, "Full-finetune/Step": 3109, "Full-finetune/Step Time": 6.570912962779403} {"Full-finetune/Learning Rate": 7.3321688445093395e-06, "Full-finetune/Loss": 0.7870898842811584, "Full-finetune/Loss (Raw)": 0.7349769473075867, "Full-finetune/Step": 3110, "Full-finetune/Step Time": 6.567474404349923} {"Full-finetune/Learning Rate": 7.326165534227341e-06, "Full-finetune/Loss": 0.785696268081665, "Full-finetune/Loss (Raw)": 0.7632287740707397, "Full-finetune/Step": 3111, "Full-finetune/Step Time": 6.57696270942688} {"Full-finetune/Learning Rate": 7.320163261608293e-06, "Full-finetune/Loss": 0.786555290222168, "Full-finetune/Loss (Raw)": 0.8892025947570801, "Full-finetune/Step": 3112, "Full-finetune/Step Time": 6.561557784676552} {"Full-finetune/Learning Rate": 7.314162028981564e-06, "Full-finetune/Loss": 0.7861335277557373, "Full-finetune/Loss (Raw)": 0.7760225534439087, "Full-finetune/Step": 3113, "Full-finetune/Step Time": 6.5748046189546585} {"Full-finetune/Learning Rate": 7.308161838676113e-06, "Full-finetune/Loss": 0.7903424501419067, "Full-finetune/Loss (Raw)": 0.8608837723731995, "Full-finetune/Step": 3114, "Full-finetune/Step Time": 6.561627479270101} {"Full-finetune/Learning Rate": 7.302162693020503e-06, "Full-finetune/Loss": 0.790271520614624, "Full-finetune/Loss (Raw)": 0.7811123132705688, "Full-finetune/Step": 3115, "Full-finetune/Step Time": 6.544020123779774} {"Full-finetune/Learning Rate": 7.2961645943428804e-06, "Full-finetune/Loss": 0.7879408597946167, "Full-finetune/Loss (Raw)": 0.5751777291297913, "Full-finetune/Step": 3116, "Full-finetune/Step Time": 6.56961802393198} {"Full-finetune/Learning Rate": 7.290167544970989e-06, "Full-finetune/Loss": 0.7895881533622742, "Full-finetune/Loss (Raw)": 0.849449872970581, "Full-finetune/Step": 3117, "Full-finetune/Step Time": 6.565457670018077} {"Full-finetune/Learning Rate": 7.284171547232168e-06, "Full-finetune/Loss": 0.7860704660415649, "Full-finetune/Loss (Raw)": 0.47111767530441284, "Full-finetune/Step": 3118, "Full-finetune/Step Time": 6.585903698578477} {"Full-finetune/Learning Rate": 7.278176603453347e-06, "Full-finetune/Loss": 0.7856608629226685, "Full-finetune/Loss (Raw)": 0.8098044991493225, "Full-finetune/Step": 3119, "Full-finetune/Step Time": 6.586222881451249} {"Full-finetune/Learning Rate": 7.272182715961049e-06, "Full-finetune/Loss": 0.786794126033783, "Full-finetune/Loss (Raw)": 0.8394947648048401, "Full-finetune/Step": 3120, "Full-finetune/Step Time": 6.580539980903268} {"Full-finetune/Learning Rate": 7.266189887081385e-06, "Full-finetune/Loss": 0.7843825817108154, "Full-finetune/Loss (Raw)": 0.6122167706489563, "Full-finetune/Step": 3121, "Full-finetune/Step Time": 6.591428060084581} {"Full-finetune/Learning Rate": 7.2601981191400484e-06, "Full-finetune/Loss": 0.7831604480743408, "Full-finetune/Loss (Raw)": 0.7709153294563293, "Full-finetune/Step": 3122, "Full-finetune/Step Time": 6.593483189120889} {"Full-finetune/Learning Rate": 7.254207414462333e-06, "Full-finetune/Loss": 0.7827925682067871, "Full-finetune/Loss (Raw)": 0.78173828125, "Full-finetune/Step": 3123, "Full-finetune/Step Time": 6.588504565879703} {"Full-finetune/Learning Rate": 7.248217775373112e-06, "Full-finetune/Loss": 0.7837967872619629, "Full-finetune/Loss (Raw)": 0.8770597577095032, "Full-finetune/Step": 3124, "Full-finetune/Step Time": 6.572405328974128} {"Full-finetune/Learning Rate": 7.242229204196849e-06, "Full-finetune/Loss": 0.783187747001648, "Full-finetune/Loss (Raw)": 0.6611306667327881, "Full-finetune/Step": 3125, "Full-finetune/Step Time": 6.572393046692014} {"Full-finetune/Learning Rate": 7.236241703257594e-06, "Full-finetune/Loss": 0.7841208577156067, "Full-finetune/Loss (Raw)": 0.8588157892227173, "Full-finetune/Step": 3126, "Full-finetune/Step Time": 6.56323734857142} {"Full-finetune/Learning Rate": 7.230255274878972e-06, "Full-finetune/Loss": 0.7849636673927307, "Full-finetune/Loss (Raw)": 0.9414041638374329, "Full-finetune/Step": 3127, "Full-finetune/Step Time": 6.559819210320711} {"Full-finetune/Learning Rate": 7.224269921384206e-06, "Full-finetune/Loss": 0.782396674156189, "Full-finetune/Loss (Raw)": 0.5151376724243164, "Full-finetune/Step": 3128, "Full-finetune/Step Time": 6.603047549724579} {"Full-finetune/Learning Rate": 7.218285645096088e-06, "Full-finetune/Loss": 0.7826092839241028, "Full-finetune/Loss (Raw)": 0.7734120488166809, "Full-finetune/Step": 3129, "Full-finetune/Step Time": 6.599760077893734} {"Full-finetune/Learning Rate": 7.2123024483370056e-06, "Full-finetune/Loss": 0.7812820672988892, "Full-finetune/Loss (Raw)": 0.7170590162277222, "Full-finetune/Step": 3130, "Full-finetune/Step Time": 6.614302651956677} {"Full-finetune/Learning Rate": 7.20632033342892e-06, "Full-finetune/Loss": 0.7808456420898438, "Full-finetune/Loss (Raw)": 0.7499584555625916, "Full-finetune/Step": 3131, "Full-finetune/Step Time": 6.617716282606125} {"Full-finetune/Learning Rate": 7.200339302693367e-06, "Full-finetune/Loss": 0.7772157192230225, "Full-finetune/Loss (Raw)": 0.4052450358867645, "Full-finetune/Step": 3132, "Full-finetune/Step Time": 6.636049872264266} {"Full-finetune/Learning Rate": 7.194359358451475e-06, "Full-finetune/Loss": 0.7789012789726257, "Full-finetune/Loss (Raw)": 0.8071811199188232, "Full-finetune/Step": 3133, "Full-finetune/Step Time": 6.627110261470079} {"Full-finetune/Learning Rate": 7.188380503023936e-06, "Full-finetune/Loss": 0.7771384716033936, "Full-finetune/Loss (Raw)": 0.662714421749115, "Full-finetune/Step": 3134, "Full-finetune/Step Time": 6.6414685901254416} {"Full-finetune/Learning Rate": 7.182402738731036e-06, "Full-finetune/Loss": 0.7788268327713013, "Full-finetune/Loss (Raw)": 0.8708651661872864, "Full-finetune/Step": 3135, "Full-finetune/Step Time": 6.6441097389906645} {"Full-finetune/Learning Rate": 7.176426067892623e-06, "Full-finetune/Loss": 0.7783941030502319, "Full-finetune/Loss (Raw)": 0.8106359243392944, "Full-finetune/Step": 3136, "Full-finetune/Step Time": 6.64508955180645} {"Full-finetune/Learning Rate": 7.170450492828126e-06, "Full-finetune/Loss": 0.7766901254653931, "Full-finetune/Loss (Raw)": 0.7121966481208801, "Full-finetune/Step": 3137, "Full-finetune/Step Time": 6.66114841401577} {"Full-finetune/Learning Rate": 7.164476015856552e-06, "Full-finetune/Loss": 0.7755275368690491, "Full-finetune/Loss (Raw)": 0.6373387575149536, "Full-finetune/Step": 3138, "Full-finetune/Step Time": 6.68894455768168} {"Full-finetune/Learning Rate": 7.158502639296475e-06, "Full-finetune/Loss": 0.7749298810958862, "Full-finetune/Loss (Raw)": 0.8072787523269653, "Full-finetune/Step": 3139, "Full-finetune/Step Time": 6.689740967005491} {"Full-finetune/Learning Rate": 7.152530365466051e-06, "Full-finetune/Loss": 0.7743624448776245, "Full-finetune/Loss (Raw)": 0.7791829705238342, "Full-finetune/Step": 3140, "Full-finetune/Step Time": 6.701049426570535} {"Full-finetune/Learning Rate": 7.146559196683001e-06, "Full-finetune/Loss": 0.7739173173904419, "Full-finetune/Loss (Raw)": 0.7810893654823303, "Full-finetune/Step": 3141, "Full-finetune/Step Time": 6.7020880207419395} {"Full-finetune/Learning Rate": 7.140589135264614e-06, "Full-finetune/Loss": 0.7743907570838928, "Full-finetune/Loss (Raw)": 0.7400849461555481, "Full-finetune/Step": 3142, "Full-finetune/Step Time": 6.70629439689219} {"Full-finetune/Learning Rate": 7.13462018352776e-06, "Full-finetune/Loss": 0.7737727761268616, "Full-finetune/Loss (Raw)": 0.5298998951911926, "Full-finetune/Step": 3143, "Full-finetune/Step Time": 6.70539903268218} {"Full-finetune/Learning Rate": 7.12865234378887e-06, "Full-finetune/Loss": 0.7749775052070618, "Full-finetune/Loss (Raw)": 0.9217796921730042, "Full-finetune/Step": 3144, "Full-finetune/Step Time": 6.69708289578557} {"Full-finetune/Learning Rate": 7.122685618363948e-06, "Full-finetune/Loss": 0.7765623331069946, "Full-finetune/Loss (Raw)": 0.9027162194252014, "Full-finetune/Step": 3145, "Full-finetune/Step Time": 6.6824958473443985} {"Full-finetune/Learning Rate": 7.116720009568565e-06, "Full-finetune/Loss": 0.7775726914405823, "Full-finetune/Loss (Raw)": 0.8649866580963135, "Full-finetune/Step": 3146, "Full-finetune/Step Time": 6.673428075388074} {"Full-finetune/Learning Rate": 7.110755519717851e-06, "Full-finetune/Loss": 0.7777146100997925, "Full-finetune/Loss (Raw)": 0.8085036873817444, "Full-finetune/Step": 3147, "Full-finetune/Step Time": 6.681084994226694} {"Full-finetune/Learning Rate": 7.104792151126515e-06, "Full-finetune/Loss": 0.7790534496307373, "Full-finetune/Loss (Raw)": 0.937329113483429, "Full-finetune/Step": 3148, "Full-finetune/Step Time": 6.701423402875662} {"Full-finetune/Learning Rate": 7.098829906108819e-06, "Full-finetune/Loss": 0.7760679125785828, "Full-finetune/Loss (Raw)": 0.41439956426620483, "Full-finetune/Step": 3149, "Full-finetune/Step Time": 6.707478128373623} {"Full-finetune/Learning Rate": 7.092868786978596e-06, "Full-finetune/Loss": 0.7750269770622253, "Full-finetune/Loss (Raw)": 0.7799255847930908, "Full-finetune/Step": 3150, "Full-finetune/Step Time": 6.704031331464648} {"Full-finetune/Learning Rate": 7.086908796049243e-06, "Full-finetune/Loss": 0.7763003706932068, "Full-finetune/Loss (Raw)": 0.8408608436584473, "Full-finetune/Step": 3151, "Full-finetune/Step Time": 6.705321529880166} {"Full-finetune/Learning Rate": 7.08094993563371e-06, "Full-finetune/Loss": 0.7762312889099121, "Full-finetune/Loss (Raw)": 0.7945042252540588, "Full-finetune/Step": 3152, "Full-finetune/Step Time": 6.700955925509334} {"Full-finetune/Learning Rate": 7.074992208044518e-06, "Full-finetune/Loss": 0.7760618925094604, "Full-finetune/Loss (Raw)": 0.8455439209938049, "Full-finetune/Step": 3153, "Full-finetune/Step Time": 6.7010175585746765} {"Full-finetune/Learning Rate": 7.069035615593743e-06, "Full-finetune/Loss": 0.7759343981742859, "Full-finetune/Loss (Raw)": 0.7919624447822571, "Full-finetune/Step": 3154, "Full-finetune/Step Time": 6.693056099116802} {"Full-finetune/Learning Rate": 7.063080160593026e-06, "Full-finetune/Loss": 0.7756408452987671, "Full-finetune/Loss (Raw)": 0.8653755187988281, "Full-finetune/Step": 3155, "Full-finetune/Step Time": 6.67696144990623} {"Full-finetune/Learning Rate": 7.0571258453535585e-06, "Full-finetune/Loss": 0.7753152847290039, "Full-finetune/Loss (Raw)": 0.7563007473945618, "Full-finetune/Step": 3156, "Full-finetune/Step Time": 6.67164340429008} {"Full-finetune/Learning Rate": 7.051172672186093e-06, "Full-finetune/Loss": 0.7747700214385986, "Full-finetune/Loss (Raw)": 0.9360167384147644, "Full-finetune/Step": 3157, "Full-finetune/Step Time": 6.678136672824621} {"Full-finetune/Learning Rate": 7.045220643400946e-06, "Full-finetune/Loss": 0.7708770036697388, "Full-finetune/Loss (Raw)": 0.28269705176353455, "Full-finetune/Step": 3158, "Full-finetune/Step Time": 6.6835403852164745} {"Full-finetune/Learning Rate": 7.039269761307977e-06, "Full-finetune/Loss": 0.7700651288032532, "Full-finetune/Loss (Raw)": 0.7367202043533325, "Full-finetune/Step": 3159, "Full-finetune/Step Time": 6.687248410657048} {"Full-finetune/Learning Rate": 7.0333200282166146e-06, "Full-finetune/Loss": 0.770142674446106, "Full-finetune/Loss (Raw)": 0.8242558836936951, "Full-finetune/Step": 3160, "Full-finetune/Step Time": 6.677611263468862} {"Full-finetune/Learning Rate": 7.027371446435829e-06, "Full-finetune/Loss": 0.770150899887085, "Full-finetune/Loss (Raw)": 0.8500869870185852, "Full-finetune/Step": 3161, "Full-finetune/Step Time": 6.696572605520487} {"Full-finetune/Learning Rate": 7.0214240182741455e-06, "Full-finetune/Loss": 0.7660131454467773, "Full-finetune/Loss (Raw)": 0.40698015689849854, "Full-finetune/Step": 3162, "Full-finetune/Step Time": 6.715499175712466} {"Full-finetune/Learning Rate": 7.015477746039652e-06, "Full-finetune/Loss": 0.7667114734649658, "Full-finetune/Loss (Raw)": 0.9246016144752502, "Full-finetune/Step": 3163, "Full-finetune/Step Time": 6.726154386997223} {"Full-finetune/Learning Rate": 7.009532632039975e-06, "Full-finetune/Loss": 0.7671536207199097, "Full-finetune/Loss (Raw)": 0.8348899483680725, "Full-finetune/Step": 3164, "Full-finetune/Step Time": 6.708028849214315} {"Full-finetune/Learning Rate": 7.003588678582303e-06, "Full-finetune/Loss": 0.7639208436012268, "Full-finetune/Loss (Raw)": 0.5326477289199829, "Full-finetune/Step": 3165, "Full-finetune/Step Time": 6.709644041955471} {"Full-finetune/Learning Rate": 6.9976458879733635e-06, "Full-finetune/Loss": 0.7631993889808655, "Full-finetune/Loss (Raw)": 0.7831960320472717, "Full-finetune/Step": 3166, "Full-finetune/Step Time": 6.710655819624662} {"Full-finetune/Learning Rate": 6.991704262519436e-06, "Full-finetune/Loss": 0.7637460231781006, "Full-finetune/Loss (Raw)": 0.799094021320343, "Full-finetune/Step": 3167, "Full-finetune/Step Time": 6.708280477672815} {"Full-finetune/Learning Rate": 6.985763804526354e-06, "Full-finetune/Loss": 0.7646661400794983, "Full-finetune/Loss (Raw)": 0.9510201215744019, "Full-finetune/Step": 3168, "Full-finetune/Step Time": 6.71408605389297} {"Full-finetune/Learning Rate": 6.979824516299491e-06, "Full-finetune/Loss": 0.7613287568092346, "Full-finetune/Loss (Raw)": 0.3101420998573303, "Full-finetune/Step": 3169, "Full-finetune/Step Time": 6.729054199531674} {"Full-finetune/Learning Rate": 6.973886400143772e-06, "Full-finetune/Loss": 0.7600765228271484, "Full-finetune/Loss (Raw)": 0.6608557105064392, "Full-finetune/Step": 3170, "Full-finetune/Step Time": 6.7312232200056314} {"Full-finetune/Learning Rate": 6.9679494583636595e-06, "Full-finetune/Loss": 0.763540506362915, "Full-finetune/Loss (Raw)": 0.7515411376953125, "Full-finetune/Step": 3171, "Full-finetune/Step Time": 6.714647242799401} {"Full-finetune/Learning Rate": 6.9620136932631655e-06, "Full-finetune/Loss": 0.7641660571098328, "Full-finetune/Loss (Raw)": 0.7527994513511658, "Full-finetune/Step": 3172, "Full-finetune/Step Time": 6.697189297527075} {"Full-finetune/Learning Rate": 6.956079107145845e-06, "Full-finetune/Loss": 0.7648482918739319, "Full-finetune/Loss (Raw)": 0.6666414141654968, "Full-finetune/Step": 3173, "Full-finetune/Step Time": 6.708579810336232} {"Full-finetune/Learning Rate": 6.950145702314795e-06, "Full-finetune/Loss": 0.7647319436073303, "Full-finetune/Loss (Raw)": 0.9697880148887634, "Full-finetune/Step": 3174, "Full-finetune/Step Time": 6.714504659175873} {"Full-finetune/Learning Rate": 6.9442134810726615e-06, "Full-finetune/Loss": 0.7644662857055664, "Full-finetune/Loss (Raw)": 0.7766386270523071, "Full-finetune/Step": 3175, "Full-finetune/Step Time": 6.709828030318022} {"Full-finetune/Learning Rate": 6.938282445721609e-06, "Full-finetune/Loss": 0.7644596695899963, "Full-finetune/Loss (Raw)": 0.9537853598594666, "Full-finetune/Step": 3176, "Full-finetune/Step Time": 6.712289333343506} {"Full-finetune/Learning Rate": 6.932352598563365e-06, "Full-finetune/Loss": 0.7643131613731384, "Full-finetune/Loss (Raw)": 0.7649351954460144, "Full-finetune/Step": 3177, "Full-finetune/Step Time": 6.7149330992251635} {"Full-finetune/Learning Rate": 6.92642394189919e-06, "Full-finetune/Loss": 0.7631950378417969, "Full-finetune/Loss (Raw)": 0.80519038438797, "Full-finetune/Step": 3178, "Full-finetune/Step Time": 6.720930470153689} {"Full-finetune/Learning Rate": 6.920496478029873e-06, "Full-finetune/Loss": 0.7632829546928406, "Full-finetune/Loss (Raw)": 0.9288204908370972, "Full-finetune/Step": 3179, "Full-finetune/Step Time": 6.7260752730071545} {"Full-finetune/Learning Rate": 6.914570209255758e-06, "Full-finetune/Loss": 0.7629724144935608, "Full-finetune/Loss (Raw)": 0.7394412755966187, "Full-finetune/Step": 3180, "Full-finetune/Step Time": 6.722826916724443} {"Full-finetune/Learning Rate": 6.908645137876699e-06, "Full-finetune/Loss": 0.76258385181427, "Full-finetune/Loss (Raw)": 0.8493661284446716, "Full-finetune/Step": 3181, "Full-finetune/Step Time": 6.718369193375111} {"Full-finetune/Learning Rate": 6.902721266192112e-06, "Full-finetune/Loss": 0.7614700198173523, "Full-finetune/Loss (Raw)": 0.8311538696289062, "Full-finetune/Step": 3182, "Full-finetune/Step Time": 6.721529688686132} {"Full-finetune/Learning Rate": 6.896798596500929e-06, "Full-finetune/Loss": 0.7606688737869263, "Full-finetune/Loss (Raw)": 0.7101732492446899, "Full-finetune/Step": 3183, "Full-finetune/Step Time": 6.720435705035925} {"Full-finetune/Learning Rate": 6.8908771311016276e-06, "Full-finetune/Loss": 0.7600077390670776, "Full-finetune/Loss (Raw)": 0.7629111409187317, "Full-finetune/Step": 3184, "Full-finetune/Step Time": 6.730939578264952} {"Full-finetune/Learning Rate": 6.884956872292216e-06, "Full-finetune/Loss": 0.7613489627838135, "Full-finetune/Loss (Raw)": 0.8696418404579163, "Full-finetune/Step": 3185, "Full-finetune/Step Time": 6.725439436733723} {"Full-finetune/Learning Rate": 6.87903782237022e-06, "Full-finetune/Loss": 0.7605763673782349, "Full-finetune/Loss (Raw)": 0.7760351896286011, "Full-finetune/Step": 3186, "Full-finetune/Step Time": 6.739793948829174} {"Full-finetune/Learning Rate": 6.8731199836327155e-06, "Full-finetune/Loss": 0.760672926902771, "Full-finetune/Loss (Raw)": 0.8713613748550415, "Full-finetune/Step": 3187, "Full-finetune/Step Time": 6.738687817007303} {"Full-finetune/Learning Rate": 6.867203358376295e-06, "Full-finetune/Loss": 0.7590717673301697, "Full-finetune/Loss (Raw)": 0.692216694355011, "Full-finetune/Step": 3188, "Full-finetune/Step Time": 6.74628484621644} {"Full-finetune/Learning Rate": 6.861287948897091e-06, "Full-finetune/Loss": 0.7578646540641785, "Full-finetune/Loss (Raw)": 0.7487890124320984, "Full-finetune/Step": 3189, "Full-finetune/Step Time": 6.743653066456318} {"Full-finetune/Learning Rate": 6.855373757490761e-06, "Full-finetune/Loss": 0.758662223815918, "Full-finetune/Loss (Raw)": 0.8288236260414124, "Full-finetune/Step": 3190, "Full-finetune/Step Time": 6.719458822160959} {"Full-finetune/Learning Rate": 6.849460786452476e-06, "Full-finetune/Loss": 0.7589278221130371, "Full-finetune/Loss (Raw)": 0.8352757096290588, "Full-finetune/Step": 3191, "Full-finetune/Step Time": 6.744470626115799} {"Full-finetune/Learning Rate": 6.843549038076951e-06, "Full-finetune/Loss": 0.7585644125938416, "Full-finetune/Loss (Raw)": 0.8108392953872681, "Full-finetune/Step": 3192, "Full-finetune/Step Time": 6.750227697193623} {"Full-finetune/Learning Rate": 6.83763851465842e-06, "Full-finetune/Loss": 0.7596982717514038, "Full-finetune/Loss (Raw)": 0.7891327738761902, "Full-finetune/Step": 3193, "Full-finetune/Step Time": 6.734522804617882} {"Full-finetune/Learning Rate": 6.831729218490645e-06, "Full-finetune/Loss": 0.7612141370773315, "Full-finetune/Loss (Raw)": 0.7327687740325928, "Full-finetune/Step": 3194, "Full-finetune/Step Time": 6.718925714492798} {"Full-finetune/Learning Rate": 6.825821151866903e-06, "Full-finetune/Loss": 0.7612067461013794, "Full-finetune/Loss (Raw)": 0.8281806707382202, "Full-finetune/Step": 3195, "Full-finetune/Step Time": 6.725084338337183} {"Full-finetune/Learning Rate": 6.819914317079999e-06, "Full-finetune/Loss": 0.7614941000938416, "Full-finetune/Loss (Raw)": 0.8033047318458557, "Full-finetune/Step": 3196, "Full-finetune/Step Time": 6.725443918257952} {"Full-finetune/Learning Rate": 6.814008716422265e-06, "Full-finetune/Loss": 0.7631224393844604, "Full-finetune/Loss (Raw)": 0.8796462416648865, "Full-finetune/Step": 3197, "Full-finetune/Step Time": 6.71697460860014} {"Full-finetune/Learning Rate": 6.808104352185544e-06, "Full-finetune/Loss": 0.7625076770782471, "Full-finetune/Loss (Raw)": 0.7251963019371033, "Full-finetune/Step": 3198, "Full-finetune/Step Time": 6.735281245782971} {"Full-finetune/Learning Rate": 6.8022012266612116e-06, "Full-finetune/Loss": 0.7612747550010681, "Full-finetune/Loss (Raw)": 0.8080450892448425, "Full-finetune/Step": 3199, "Full-finetune/Step Time": 6.735491581261158} {"Full-finetune/Learning Rate": 6.79629934214015e-06, "Full-finetune/Loss": 0.7631072998046875, "Full-finetune/Loss (Raw)": 1.0272619724273682, "Full-finetune/Step": 3200, "Full-finetune/Step Time": 6.725367764011025} {"Full-finetune/Learning Rate": 6.790398700912764e-06, "Full-finetune/Loss": 0.7615147829055786, "Full-finetune/Loss (Raw)": 0.6120256781578064, "Full-finetune/Step": 3201, "Full-finetune/Step Time": 6.716635420918465} {"Full-finetune/Learning Rate": 6.784499305268983e-06, "Full-finetune/Loss": 0.7614414691925049, "Full-finetune/Loss (Raw)": 0.7842057347297668, "Full-finetune/Step": 3202, "Full-finetune/Step Time": 6.71402345225215} {"Full-finetune/Learning Rate": 6.778601157498241e-06, "Full-finetune/Loss": 0.765300989151001, "Full-finetune/Loss (Raw)": 0.7840218544006348, "Full-finetune/Step": 3203, "Full-finetune/Step Time": 6.695469183847308} {"Full-finetune/Learning Rate": 6.772704259889503e-06, "Full-finetune/Loss": 0.7659214735031128, "Full-finetune/Loss (Raw)": 0.7691159248352051, "Full-finetune/Step": 3204, "Full-finetune/Step Time": 6.691887645050883} {"Full-finetune/Learning Rate": 6.76680861473123e-06, "Full-finetune/Loss": 0.7650031447410583, "Full-finetune/Loss (Raw)": 0.7395183444023132, "Full-finetune/Step": 3205, "Full-finetune/Step Time": 6.678182834759355} {"Full-finetune/Learning Rate": 6.7609142243114115e-06, "Full-finetune/Loss": 0.7647943496704102, "Full-finetune/Loss (Raw)": 0.6677424311637878, "Full-finetune/Step": 3206, "Full-finetune/Step Time": 6.6802454851567745} {"Full-finetune/Learning Rate": 6.755021090917545e-06, "Full-finetune/Loss": 0.7659827470779419, "Full-finetune/Loss (Raw)": 0.7678429484367371, "Full-finetune/Step": 3207, "Full-finetune/Step Time": 6.680782230570912} {"Full-finetune/Learning Rate": 6.7491292168366386e-06, "Full-finetune/Loss": 0.766965925693512, "Full-finetune/Loss (Raw)": 0.8256362080574036, "Full-finetune/Step": 3208, "Full-finetune/Step Time": 6.6744598764926195} {"Full-finetune/Learning Rate": 6.743238604355219e-06, "Full-finetune/Loss": 0.7673349976539612, "Full-finetune/Loss (Raw)": 0.7890456914901733, "Full-finetune/Step": 3209, "Full-finetune/Step Time": 6.668043199926615} {"Full-finetune/Learning Rate": 6.737349255759312e-06, "Full-finetune/Loss": 0.7664757966995239, "Full-finetune/Loss (Raw)": 0.7124594449996948, "Full-finetune/Step": 3210, "Full-finetune/Step Time": 6.667773334309459} {"Full-finetune/Learning Rate": 6.731461173334459e-06, "Full-finetune/Loss": 0.7660391330718994, "Full-finetune/Loss (Raw)": 0.8014643788337708, "Full-finetune/Step": 3211, "Full-finetune/Step Time": 6.662521120160818} {"Full-finetune/Learning Rate": 6.725574359365714e-06, "Full-finetune/Loss": 0.7631046772003174, "Full-finetune/Loss (Raw)": 0.39503514766693115, "Full-finetune/Step": 3212, "Full-finetune/Step Time": 6.673499118536711} {"Full-finetune/Learning Rate": 6.7196888161376305e-06, "Full-finetune/Loss": 0.7621413469314575, "Full-finetune/Loss (Raw)": 0.8506813049316406, "Full-finetune/Step": 3213, "Full-finetune/Step Time": 6.6728444546461105} {"Full-finetune/Learning Rate": 6.71380454593428e-06, "Full-finetune/Loss": 0.7612029910087585, "Full-finetune/Loss (Raw)": 0.7193602919578552, "Full-finetune/Step": 3214, "Full-finetune/Step Time": 6.685806525871158} {"Full-finetune/Learning Rate": 6.707921551039224e-06, "Full-finetune/Loss": 0.7600647211074829, "Full-finetune/Loss (Raw)": 0.6510039567947388, "Full-finetune/Step": 3215, "Full-finetune/Step Time": 6.695741057395935} {"Full-finetune/Learning Rate": 6.70203983373554e-06, "Full-finetune/Loss": 0.7606117725372314, "Full-finetune/Loss (Raw)": 0.6422365307807922, "Full-finetune/Step": 3216, "Full-finetune/Step Time": 6.7173437755554914} {"Full-finetune/Learning Rate": 6.69615939630581e-06, "Full-finetune/Loss": 0.7599583268165588, "Full-finetune/Loss (Raw)": 0.8166564702987671, "Full-finetune/Step": 3217, "Full-finetune/Step Time": 6.709205523133278} {"Full-finetune/Learning Rate": 6.690280241032117e-06, "Full-finetune/Loss": 0.7607380151748657, "Full-finetune/Loss (Raw)": 0.8294141292572021, "Full-finetune/Step": 3218, "Full-finetune/Step Time": 6.70818574167788} {"Full-finetune/Learning Rate": 6.684402370196048e-06, "Full-finetune/Loss": 0.760265052318573, "Full-finetune/Loss (Raw)": 0.6752737760543823, "Full-finetune/Step": 3219, "Full-finetune/Step Time": 6.693172659724951} {"Full-finetune/Learning Rate": 6.678525786078684e-06, "Full-finetune/Loss": 0.7654502391815186, "Full-finetune/Loss (Raw)": 0.9590193629264832, "Full-finetune/Step": 3220, "Full-finetune/Step Time": 6.673904951661825} {"Full-finetune/Learning Rate": 6.672650490960617e-06, "Full-finetune/Loss": 0.764965295791626, "Full-finetune/Loss (Raw)": 0.7579615712165833, "Full-finetune/Step": 3221, "Full-finetune/Step Time": 6.678717570379376} {"Full-finetune/Learning Rate": 6.666776487121934e-06, "Full-finetune/Loss": 0.7609225511550903, "Full-finetune/Loss (Raw)": 0.32871705293655396, "Full-finetune/Step": 3222, "Full-finetune/Step Time": 6.695130802690983} {"Full-finetune/Learning Rate": 6.660903776842218e-06, "Full-finetune/Loss": 0.7608107328414917, "Full-finetune/Loss (Raw)": 0.7748233675956726, "Full-finetune/Step": 3223, "Full-finetune/Step Time": 6.700450345873833} {"Full-finetune/Learning Rate": 6.655032362400562e-06, "Full-finetune/Loss": 0.7605046033859253, "Full-finetune/Loss (Raw)": 0.7948294878005981, "Full-finetune/Step": 3224, "Full-finetune/Step Time": 6.702601689845324} {"Full-finetune/Learning Rate": 6.649162246075538e-06, "Full-finetune/Loss": 0.7642654180526733, "Full-finetune/Loss (Raw)": 0.7839231491088867, "Full-finetune/Step": 3225, "Full-finetune/Step Time": 6.687246005982161} {"Full-finetune/Learning Rate": 6.6432934301452235e-06, "Full-finetune/Loss": 0.7659920454025269, "Full-finetune/Loss (Raw)": 0.8041403293609619, "Full-finetune/Step": 3226, "Full-finetune/Step Time": 6.686081113293767} {"Full-finetune/Learning Rate": 6.637425916887198e-06, "Full-finetune/Loss": 0.7647883892059326, "Full-finetune/Loss (Raw)": 0.6918361186981201, "Full-finetune/Step": 3227, "Full-finetune/Step Time": 6.687099674716592} {"Full-finetune/Learning Rate": 6.631559708578524e-06, "Full-finetune/Loss": 0.7628955841064453, "Full-finetune/Loss (Raw)": 0.7782214283943176, "Full-finetune/Step": 3228, "Full-finetune/Step Time": 6.685409123077989} {"Full-finetune/Learning Rate": 6.625694807495766e-06, "Full-finetune/Loss": 0.7654527425765991, "Full-finetune/Loss (Raw)": 0.8969111442565918, "Full-finetune/Step": 3229, "Full-finetune/Step Time": 6.6705494206398726} {"Full-finetune/Learning Rate": 6.619831215914974e-06, "Full-finetune/Loss": 0.7641512155532837, "Full-finetune/Loss (Raw)": 0.7352445721626282, "Full-finetune/Step": 3230, "Full-finetune/Step Time": 6.6731417793780565} {"Full-finetune/Learning Rate": 6.6139689361116945e-06, "Full-finetune/Loss": 0.7630175352096558, "Full-finetune/Loss (Raw)": 0.7960686087608337, "Full-finetune/Step": 3231, "Full-finetune/Step Time": 6.687598828226328} {"Full-finetune/Learning Rate": 6.608107970360964e-06, "Full-finetune/Loss": 0.763594388961792, "Full-finetune/Loss (Raw)": 0.9321407079696655, "Full-finetune/Step": 3232, "Full-finetune/Step Time": 6.690333569422364} {"Full-finetune/Learning Rate": 6.602248320937308e-06, "Full-finetune/Loss": 0.7647466063499451, "Full-finetune/Loss (Raw)": 1.007072925567627, "Full-finetune/Step": 3233, "Full-finetune/Step Time": 6.694750130176544} {"Full-finetune/Learning Rate": 6.596389990114748e-06, "Full-finetune/Loss": 0.7645934820175171, "Full-finetune/Loss (Raw)": 0.6992671489715576, "Full-finetune/Step": 3234, "Full-finetune/Step Time": 6.717466758564115} {"Full-finetune/Learning Rate": 6.5905329801667796e-06, "Full-finetune/Loss": 0.7642931938171387, "Full-finetune/Loss (Raw)": 0.9242745637893677, "Full-finetune/Step": 3235, "Full-finetune/Step Time": 6.723051169887185} {"Full-finetune/Learning Rate": 6.584677293366396e-06, "Full-finetune/Loss": 0.7632421255111694, "Full-finetune/Loss (Raw)": 0.6255103945732117, "Full-finetune/Step": 3236, "Full-finetune/Step Time": 6.729249047115445} {"Full-finetune/Learning Rate": 6.578822931986078e-06, "Full-finetune/Loss": 0.7640293836593628, "Full-finetune/Loss (Raw)": 0.8729258179664612, "Full-finetune/Step": 3237, "Full-finetune/Step Time": 6.7283855974674225} {"Full-finetune/Learning Rate": 6.57296989829779e-06, "Full-finetune/Loss": 0.7613484263420105, "Full-finetune/Loss (Raw)": 0.3918215334415436, "Full-finetune/Step": 3238, "Full-finetune/Step Time": 6.7497279811650515} {"Full-finetune/Learning Rate": 6.567118194572972e-06, "Full-finetune/Loss": 0.7629184722900391, "Full-finetune/Loss (Raw)": 0.964196503162384, "Full-finetune/Step": 3239, "Full-finetune/Step Time": 6.745529292151332} {"Full-finetune/Learning Rate": 6.5612678230825646e-06, "Full-finetune/Loss": 0.7632150650024414, "Full-finetune/Loss (Raw)": 0.9271647930145264, "Full-finetune/Step": 3240, "Full-finetune/Step Time": 6.747403360903263} {"Full-finetune/Learning Rate": 6.555418786096976e-06, "Full-finetune/Loss": 0.7640864849090576, "Full-finetune/Loss (Raw)": 0.8875613808631897, "Full-finetune/Step": 3241, "Full-finetune/Step Time": 6.747037723660469} {"Full-finetune/Learning Rate": 6.549571085886111e-06, "Full-finetune/Loss": 0.7646414041519165, "Full-finetune/Loss (Raw)": 0.9319168329238892, "Full-finetune/Step": 3242, "Full-finetune/Step Time": 6.744060566648841} {"Full-finetune/Learning Rate": 6.5437247247193445e-06, "Full-finetune/Loss": 0.7652133107185364, "Full-finetune/Loss (Raw)": 0.8543121814727783, "Full-finetune/Step": 3243, "Full-finetune/Step Time": 6.743405474349856} {"Full-finetune/Learning Rate": 6.537879704865531e-06, "Full-finetune/Loss": 0.7673433423042297, "Full-finetune/Loss (Raw)": 0.8478244543075562, "Full-finetune/Step": 3244, "Full-finetune/Step Time": 6.708934765309095} {"Full-finetune/Learning Rate": 6.532036028593012e-06, "Full-finetune/Loss": 0.7676219344139099, "Full-finetune/Loss (Raw)": 0.8851084113121033, "Full-finetune/Step": 3245, "Full-finetune/Step Time": 6.71527798101306} {"Full-finetune/Learning Rate": 6.526193698169603e-06, "Full-finetune/Loss": 0.7691880464553833, "Full-finetune/Loss (Raw)": 0.6715763807296753, "Full-finetune/Step": 3246, "Full-finetune/Step Time": 6.699438249692321} {"Full-finetune/Learning Rate": 6.520352715862601e-06, "Full-finetune/Loss": 0.7686631679534912, "Full-finetune/Loss (Raw)": 0.7426248788833618, "Full-finetune/Step": 3247, "Full-finetune/Step Time": 6.698928011581302} {"Full-finetune/Learning Rate": 6.514513083938779e-06, "Full-finetune/Loss": 0.7694607973098755, "Full-finetune/Loss (Raw)": 0.9415875673294067, "Full-finetune/Step": 3248, "Full-finetune/Step Time": 6.703338095918298} {"Full-finetune/Learning Rate": 6.508674804664374e-06, "Full-finetune/Loss": 0.7720391750335693, "Full-finetune/Loss (Raw)": 0.9422506093978882, "Full-finetune/Step": 3249, "Full-finetune/Step Time": 6.692808797582984} {"Full-finetune/Learning Rate": 6.50283788030512e-06, "Full-finetune/Loss": 0.7720005512237549, "Full-finetune/Loss (Raw)": 0.7659802436828613, "Full-finetune/Step": 3250, "Full-finetune/Step Time": 6.722143961116672} {"Full-finetune/Learning Rate": 6.497002313126204e-06, "Full-finetune/Loss": 0.7709597945213318, "Full-finetune/Loss (Raw)": 0.6485121846199036, "Full-finetune/Step": 3251, "Full-finetune/Step Time": 6.749692747369409} {"Full-finetune/Learning Rate": 6.491168105392303e-06, "Full-finetune/Loss": 0.7709981203079224, "Full-finetune/Loss (Raw)": 0.8819618821144104, "Full-finetune/Step": 3252, "Full-finetune/Step Time": 6.750826032832265} {"Full-finetune/Learning Rate": 6.485335259367558e-06, "Full-finetune/Loss": 0.7722931504249573, "Full-finetune/Loss (Raw)": 0.8268991708755493, "Full-finetune/Step": 3253, "Full-finetune/Step Time": 6.75300327129662} {"Full-finetune/Learning Rate": 6.4795037773155765e-06, "Full-finetune/Loss": 0.7723821997642517, "Full-finetune/Loss (Raw)": 0.8702154159545898, "Full-finetune/Step": 3254, "Full-finetune/Step Time": 6.763130474835634} {"Full-finetune/Learning Rate": 6.473673661499451e-06, "Full-finetune/Loss": 0.77188640832901, "Full-finetune/Loss (Raw)": 0.877943217754364, "Full-finetune/Step": 3255, "Full-finetune/Step Time": 6.773639764636755} {"Full-finetune/Learning Rate": 6.467844914181727e-06, "Full-finetune/Loss": 0.7747277021408081, "Full-finetune/Loss (Raw)": 0.8788284063339233, "Full-finetune/Step": 3256, "Full-finetune/Step Time": 6.742064731195569} {"Full-finetune/Learning Rate": 6.462017537624437e-06, "Full-finetune/Loss": 0.7736924886703491, "Full-finetune/Loss (Raw)": 0.6408975124359131, "Full-finetune/Step": 3257, "Full-finetune/Step Time": 6.751456655561924} {"Full-finetune/Learning Rate": 6.4561915340890665e-06, "Full-finetune/Loss": 0.7759348154067993, "Full-finetune/Loss (Raw)": 1.0040748119354248, "Full-finetune/Step": 3258, "Full-finetune/Step Time": 6.740326017141342} {"Full-finetune/Learning Rate": 6.450366905836573e-06, "Full-finetune/Loss": 0.7757023572921753, "Full-finetune/Loss (Raw)": 0.720198929309845, "Full-finetune/Step": 3259, "Full-finetune/Step Time": 6.742214320227504} {"Full-finetune/Learning Rate": 6.444543655127383e-06, "Full-finetune/Loss": 0.7789196968078613, "Full-finetune/Loss (Raw)": 0.8170700669288635, "Full-finetune/Step": 3260, "Full-finetune/Step Time": 6.740546345710754} {"Full-finetune/Learning Rate": 6.438721784221385e-06, "Full-finetune/Loss": 0.77836674451828, "Full-finetune/Loss (Raw)": 0.7364039421081543, "Full-finetune/Step": 3261, "Full-finetune/Step Time": 6.730858709663153} {"Full-finetune/Learning Rate": 6.432901295377936e-06, "Full-finetune/Loss": 0.7803854942321777, "Full-finetune/Loss (Raw)": 0.9211185574531555, "Full-finetune/Step": 3262, "Full-finetune/Step Time": 6.717121975496411} {"Full-finetune/Learning Rate": 6.427082190855855e-06, "Full-finetune/Loss": 0.7807795405387878, "Full-finetune/Loss (Raw)": 0.9212993383407593, "Full-finetune/Step": 3263, "Full-finetune/Step Time": 6.714770371094346} {"Full-finetune/Learning Rate": 6.4212644729134155e-06, "Full-finetune/Loss": 0.7800154685974121, "Full-finetune/Loss (Raw)": 0.712837815284729, "Full-finetune/Step": 3264, "Full-finetune/Step Time": 6.715595694258809} {"Full-finetune/Learning Rate": 6.415448143808367e-06, "Full-finetune/Loss": 0.7818578481674194, "Full-finetune/Loss (Raw)": 0.9480202198028564, "Full-finetune/Step": 3265, "Full-finetune/Step Time": 6.698294162750244} {"Full-finetune/Learning Rate": 6.409633205797911e-06, "Full-finetune/Loss": 0.7830999493598938, "Full-finetune/Loss (Raw)": 0.796326220035553, "Full-finetune/Step": 3266, "Full-finetune/Step Time": 6.672030633315444} {"Full-finetune/Learning Rate": 6.403819661138712e-06, "Full-finetune/Loss": 0.78255695104599, "Full-finetune/Loss (Raw)": 0.7377681732177734, "Full-finetune/Step": 3267, "Full-finetune/Step Time": 6.68553832359612} {"Full-finetune/Learning Rate": 6.398007512086897e-06, "Full-finetune/Loss": 0.783538818359375, "Full-finetune/Loss (Raw)": 0.9048613905906677, "Full-finetune/Step": 3268, "Full-finetune/Step Time": 6.678730731830001} {"Full-finetune/Learning Rate": 6.3921967608980375e-06, "Full-finetune/Loss": 0.7842361927032471, "Full-finetune/Loss (Raw)": 0.8703606128692627, "Full-finetune/Step": 3269, "Full-finetune/Step Time": 6.682116536423564} {"Full-finetune/Learning Rate": 6.386387409827182e-06, "Full-finetune/Loss": 0.7841827869415283, "Full-finetune/Loss (Raw)": 0.7332459688186646, "Full-finetune/Step": 3270, "Full-finetune/Step Time": 6.670816348865628} {"Full-finetune/Learning Rate": 6.38057946112882e-06, "Full-finetune/Loss": 0.7861860990524292, "Full-finetune/Loss (Raw)": 0.7863204479217529, "Full-finetune/Step": 3271, "Full-finetune/Step Time": 6.654974417760968} {"Full-finetune/Learning Rate": 6.374772917056908e-06, "Full-finetune/Loss": 0.7849530577659607, "Full-finetune/Loss (Raw)": 0.7639597058296204, "Full-finetune/Step": 3272, "Full-finetune/Step Time": 6.68330604955554} {"Full-finetune/Learning Rate": 6.368967779864854e-06, "Full-finetune/Loss": 0.7836220860481262, "Full-finetune/Loss (Raw)": 0.7323461174964905, "Full-finetune/Step": 3273, "Full-finetune/Step Time": 6.68848380073905} {"Full-finetune/Learning Rate": 6.3631640518055085e-06, "Full-finetune/Loss": 0.7793271541595459, "Full-finetune/Loss (Raw)": 0.3152306377887726, "Full-finetune/Step": 3274, "Full-finetune/Step Time": 6.707028470933437} {"Full-finetune/Learning Rate": 6.3573617351311945e-06, "Full-finetune/Loss": 0.7786439657211304, "Full-finetune/Loss (Raw)": 0.7210533618927002, "Full-finetune/Step": 3275, "Full-finetune/Step Time": 6.705149561166763} {"Full-finetune/Learning Rate": 6.351560832093673e-06, "Full-finetune/Loss": 0.7778552770614624, "Full-finetune/Loss (Raw)": 0.8363897204399109, "Full-finetune/Step": 3276, "Full-finetune/Step Time": 6.689582355320454} {"Full-finetune/Learning Rate": 6.3457613449441654e-06, "Full-finetune/Loss": 0.7810729742050171, "Full-finetune/Loss (Raw)": 0.8262544274330139, "Full-finetune/Step": 3277, "Full-finetune/Step Time": 6.669624721631408} {"Full-finetune/Learning Rate": 6.3399632759333364e-06, "Full-finetune/Loss": 0.7812628746032715, "Full-finetune/Loss (Raw)": 0.804239809513092, "Full-finetune/Step": 3278, "Full-finetune/Step Time": 6.6735434122383595} {"Full-finetune/Learning Rate": 6.3341666273113e-06, "Full-finetune/Loss": 0.7812259793281555, "Full-finetune/Loss (Raw)": 0.8361378908157349, "Full-finetune/Step": 3279, "Full-finetune/Step Time": 6.680357165634632} {"Full-finetune/Learning Rate": 6.328371401327629e-06, "Full-finetune/Loss": 0.7823140025138855, "Full-finetune/Loss (Raw)": 0.9337759017944336, "Full-finetune/Step": 3280, "Full-finetune/Step Time": 6.679759111255407} {"Full-finetune/Learning Rate": 6.322577600231332e-06, "Full-finetune/Loss": 0.7833507061004639, "Full-finetune/Loss (Raw)": 0.978238046169281, "Full-finetune/Step": 3281, "Full-finetune/Step Time": 6.6819109581410885} {"Full-finetune/Learning Rate": 6.316785226270878e-06, "Full-finetune/Loss": 0.7832850217819214, "Full-finetune/Loss (Raw)": 0.7835454940795898, "Full-finetune/Step": 3282, "Full-finetune/Step Time": 6.683235693722963} {"Full-finetune/Learning Rate": 6.310994281694167e-06, "Full-finetune/Loss": 0.7793777585029602, "Full-finetune/Loss (Raw)": 0.36525195837020874, "Full-finetune/Step": 3283, "Full-finetune/Step Time": 6.701470134779811} {"Full-finetune/Learning Rate": 6.305204768748551e-06, "Full-finetune/Loss": 0.7794579267501831, "Full-finetune/Loss (Raw)": 0.7665620446205139, "Full-finetune/Step": 3284, "Full-finetune/Step Time": 6.705408841371536} {"Full-finetune/Learning Rate": 6.299416689680831e-06, "Full-finetune/Loss": 0.7788522243499756, "Full-finetune/Loss (Raw)": 0.8584938645362854, "Full-finetune/Step": 3285, "Full-finetune/Step Time": 6.699135361239314} {"Full-finetune/Learning Rate": 6.293630046737245e-06, "Full-finetune/Loss": 0.7828962206840515, "Full-finetune/Loss (Raw)": 0.8003230094909668, "Full-finetune/Step": 3286, "Full-finetune/Step Time": 6.686806235462427} {"Full-finetune/Learning Rate": 6.28784484216348e-06, "Full-finetune/Loss": 0.7836856245994568, "Full-finetune/Loss (Raw)": 0.8377662301063538, "Full-finetune/Step": 3287, "Full-finetune/Step Time": 6.6939078848809} {"Full-finetune/Learning Rate": 6.282061078204657e-06, "Full-finetune/Loss": 0.7843666076660156, "Full-finetune/Loss (Raw)": 0.9114225506782532, "Full-finetune/Step": 3288, "Full-finetune/Step Time": 6.6995902974158525} {"Full-finetune/Learning Rate": 6.276278757105341e-06, "Full-finetune/Loss": 0.7835202813148499, "Full-finetune/Loss (Raw)": 0.7417529225349426, "Full-finetune/Step": 3289, "Full-finetune/Step Time": 6.6812368128448725} {"Full-finetune/Learning Rate": 6.270497881109541e-06, "Full-finetune/Loss": 0.7870615124702454, "Full-finetune/Loss (Raw)": 0.8602573871612549, "Full-finetune/Step": 3290, "Full-finetune/Step Time": 6.663338039070368} {"Full-finetune/Learning Rate": 6.264718452460699e-06, "Full-finetune/Loss": 0.7851574420928955, "Full-finetune/Loss (Raw)": 0.6808810830116272, "Full-finetune/Step": 3291, "Full-finetune/Step Time": 6.659736840054393} {"Full-finetune/Learning Rate": 6.258940473401705e-06, "Full-finetune/Loss": 0.7846341133117676, "Full-finetune/Loss (Raw)": 0.7679070830345154, "Full-finetune/Step": 3292, "Full-finetune/Step Time": 6.6710638999938965} {"Full-finetune/Learning Rate": 6.253163946174872e-06, "Full-finetune/Loss": 0.7868255376815796, "Full-finetune/Loss (Raw)": 0.8131417632102966, "Full-finetune/Step": 3293, "Full-finetune/Step Time": 6.66761876642704} {"Full-finetune/Learning Rate": 6.247388873021959e-06, "Full-finetune/Loss": 0.786281168460846, "Full-finetune/Loss (Raw)": 0.7135252952575684, "Full-finetune/Step": 3294, "Full-finetune/Step Time": 6.693996887654066} {"Full-finetune/Learning Rate": 6.2416152561841635e-06, "Full-finetune/Loss": 0.7861565351486206, "Full-finetune/Loss (Raw)": 0.7831450700759888, "Full-finetune/Step": 3295, "Full-finetune/Step Time": 6.6973804365843534} {"Full-finetune/Learning Rate": 6.2358430979021075e-06, "Full-finetune/Loss": 0.785308837890625, "Full-finetune/Loss (Raw)": 0.8425105214118958, "Full-finetune/Step": 3296, "Full-finetune/Step Time": 6.698983142152429} {"Full-finetune/Learning Rate": 6.230072400415863e-06, "Full-finetune/Loss": 0.788171648979187, "Full-finetune/Loss (Raw)": 0.6765817403793335, "Full-finetune/Step": 3297, "Full-finetune/Step Time": 6.701390711590648} {"Full-finetune/Learning Rate": 6.224303165964913e-06, "Full-finetune/Loss": 0.7900524139404297, "Full-finetune/Loss (Raw)": 0.9015900492668152, "Full-finetune/Step": 3298, "Full-finetune/Step Time": 6.699493171647191} {"Full-finetune/Learning Rate": 6.21853539678819e-06, "Full-finetune/Loss": 0.7871741056442261, "Full-finetune/Loss (Raw)": 0.3831181228160858, "Full-finetune/Step": 3299, "Full-finetune/Step Time": 6.717236617580056} {"Full-finetune/Learning Rate": 6.212769095124055e-06, "Full-finetune/Loss": 0.7880052328109741, "Full-finetune/Loss (Raw)": 0.859183132648468, "Full-finetune/Step": 3300, "Full-finetune/Step Time": 6.719428302720189} {"Full-finetune/Learning Rate": 6.207004263210292e-06, "Full-finetune/Loss": 0.7880405187606812, "Full-finetune/Loss (Raw)": 0.6711629033088684, "Full-finetune/Step": 3301, "Full-finetune/Step Time": 6.708984229713678} {"Full-finetune/Learning Rate": 6.2012409032841294e-06, "Full-finetune/Loss": 0.7875006198883057, "Full-finetune/Loss (Raw)": 0.9006772637367249, "Full-finetune/Step": 3302, "Full-finetune/Step Time": 6.707286210730672} {"Full-finetune/Learning Rate": 6.1954790175822e-06, "Full-finetune/Loss": 0.7875930666923523, "Full-finetune/Loss (Raw)": 0.7884780168533325, "Full-finetune/Step": 3303, "Full-finetune/Step Time": 6.706774443387985} {"Full-finetune/Learning Rate": 6.189718608340587e-06, "Full-finetune/Loss": 0.7859212160110474, "Full-finetune/Loss (Raw)": 0.7397855520248413, "Full-finetune/Step": 3304, "Full-finetune/Step Time": 6.716774012893438} {"Full-finetune/Learning Rate": 6.183959677794795e-06, "Full-finetune/Loss": 0.786758542060852, "Full-finetune/Loss (Raw)": 0.8721045851707458, "Full-finetune/Step": 3305, "Full-finetune/Step Time": 6.7244460098445415} {"Full-finetune/Learning Rate": 6.1782022281797485e-06, "Full-finetune/Loss": 0.7860192060470581, "Full-finetune/Loss (Raw)": 0.7105590105056763, "Full-finetune/Step": 3306, "Full-finetune/Step Time": 6.717113452032208} {"Full-finetune/Learning Rate": 6.17244626172981e-06, "Full-finetune/Loss": 0.7861654758453369, "Full-finetune/Loss (Raw)": 0.9475424885749817, "Full-finetune/Step": 3307, "Full-finetune/Step Time": 6.707604823634028} {"Full-finetune/Learning Rate": 6.166691780678743e-06, "Full-finetune/Loss": 0.7868403196334839, "Full-finetune/Loss (Raw)": 0.8258196115493774, "Full-finetune/Step": 3308, "Full-finetune/Step Time": 6.714027799665928} {"Full-finetune/Learning Rate": 6.1609387872597595e-06, "Full-finetune/Loss": 0.7870861291885376, "Full-finetune/Loss (Raw)": 0.8808336853981018, "Full-finetune/Step": 3309, "Full-finetune/Step Time": 6.734533075243235} {"Full-finetune/Learning Rate": 6.155187283705479e-06, "Full-finetune/Loss": 0.7863473892211914, "Full-finetune/Loss (Raw)": 0.736594557762146, "Full-finetune/Step": 3310, "Full-finetune/Step Time": 6.732228897511959} {"Full-finetune/Learning Rate": 6.14943727224795e-06, "Full-finetune/Loss": 0.7863552570343018, "Full-finetune/Loss (Raw)": 0.7111874222755432, "Full-finetune/Step": 3311, "Full-finetune/Step Time": 6.741038579493761} {"Full-finetune/Learning Rate": 6.1436887551186466e-06, "Full-finetune/Loss": 0.7864692807197571, "Full-finetune/Loss (Raw)": 0.777498722076416, "Full-finetune/Step": 3312, "Full-finetune/Step Time": 6.745962725952268} {"Full-finetune/Learning Rate": 6.137941734548443e-06, "Full-finetune/Loss": 0.7830226421356201, "Full-finetune/Loss (Raw)": 0.4284726083278656, "Full-finetune/Step": 3313, "Full-finetune/Step Time": 6.759497422724962} {"Full-finetune/Learning Rate": 6.132196212767653e-06, "Full-finetune/Loss": 0.7827038764953613, "Full-finetune/Loss (Raw)": 0.7352309823036194, "Full-finetune/Step": 3314, "Full-finetune/Step Time": 6.745747005566955} {"Full-finetune/Learning Rate": 6.126452192005999e-06, "Full-finetune/Loss": 0.7835973501205444, "Full-finetune/Loss (Raw)": 0.9857219457626343, "Full-finetune/Step": 3315, "Full-finetune/Step Time": 6.745628766715527} {"Full-finetune/Learning Rate": 6.120709674492627e-06, "Full-finetune/Loss": 0.7841459512710571, "Full-finetune/Loss (Raw)": 0.7624413371086121, "Full-finetune/Step": 3316, "Full-finetune/Step Time": 6.738594872877002} {"Full-finetune/Learning Rate": 6.114968662456093e-06, "Full-finetune/Loss": 0.7842012643814087, "Full-finetune/Loss (Raw)": 0.7558738589286804, "Full-finetune/Step": 3317, "Full-finetune/Step Time": 6.738972779363394} {"Full-finetune/Learning Rate": 6.10922915812437e-06, "Full-finetune/Loss": 0.7803325653076172, "Full-finetune/Loss (Raw)": 0.3336370289325714, "Full-finetune/Step": 3318, "Full-finetune/Step Time": 6.753065600991249} {"Full-finetune/Learning Rate": 6.103491163724853e-06, "Full-finetune/Loss": 0.7807879447937012, "Full-finetune/Loss (Raw)": 0.893557608127594, "Full-finetune/Step": 3319, "Full-finetune/Step Time": 6.735040193423629} {"Full-finetune/Learning Rate": 6.09775468148434e-06, "Full-finetune/Loss": 0.7803726196289062, "Full-finetune/Loss (Raw)": 0.7576807141304016, "Full-finetune/Step": 3320, "Full-finetune/Step Time": 6.7267425041645765} {"Full-finetune/Learning Rate": 6.092019713629053e-06, "Full-finetune/Loss": 0.7796825170516968, "Full-finetune/Loss (Raw)": 0.7007891535758972, "Full-finetune/Step": 3321, "Full-finetune/Step Time": 6.727288847789168} {"Full-finetune/Learning Rate": 6.086286262384617e-06, "Full-finetune/Loss": 0.7799239158630371, "Full-finetune/Loss (Raw)": 0.7636731266975403, "Full-finetune/Step": 3322, "Full-finetune/Step Time": 6.709782397374511} {"Full-finetune/Learning Rate": 6.080554329976071e-06, "Full-finetune/Loss": 0.7803627252578735, "Full-finetune/Loss (Raw)": 0.884351909160614, "Full-finetune/Step": 3323, "Full-finetune/Step Time": 6.717776691541076} {"Full-finetune/Learning Rate": 6.074823918627872e-06, "Full-finetune/Loss": 0.7800049185752869, "Full-finetune/Loss (Raw)": 0.7575034499168396, "Full-finetune/Step": 3324, "Full-finetune/Step Time": 6.72102408669889} {"Full-finetune/Learning Rate": 6.069095030563877e-06, "Full-finetune/Loss": 0.7784762978553772, "Full-finetune/Loss (Raw)": 0.6839770674705505, "Full-finetune/Step": 3325, "Full-finetune/Step Time": 6.721819009631872} {"Full-finetune/Learning Rate": 6.063367668007356e-06, "Full-finetune/Loss": 0.7796655893325806, "Full-finetune/Loss (Raw)": 0.8774277567863464, "Full-finetune/Step": 3326, "Full-finetune/Step Time": 6.703192848712206} {"Full-finetune/Learning Rate": 6.057641833180987e-06, "Full-finetune/Loss": 0.7778930068016052, "Full-finetune/Loss (Raw)": 0.5811606645584106, "Full-finetune/Step": 3327, "Full-finetune/Step Time": 6.716054918244481} {"Full-finetune/Learning Rate": 6.0519175283068534e-06, "Full-finetune/Loss": 0.777047336101532, "Full-finetune/Loss (Raw)": 0.9190133213996887, "Full-finetune/Step": 3328, "Full-finetune/Step Time": 6.720365123823285} {"Full-finetune/Learning Rate": 6.046194755606448e-06, "Full-finetune/Loss": 0.7786399126052856, "Full-finetune/Loss (Raw)": 0.815875232219696, "Full-finetune/Step": 3329, "Full-finetune/Step Time": 6.7237797155976295} {"Full-finetune/Learning Rate": 6.040473517300665e-06, "Full-finetune/Loss": 0.7779127359390259, "Full-finetune/Loss (Raw)": 0.6911299228668213, "Full-finetune/Step": 3330, "Full-finetune/Step Time": 6.73748960159719} {"Full-finetune/Learning Rate": 6.0347538156098104e-06, "Full-finetune/Loss": 0.7781412601470947, "Full-finetune/Loss (Raw)": 0.8132665157318115, "Full-finetune/Step": 3331, "Full-finetune/Step Time": 6.751233045011759} {"Full-finetune/Learning Rate": 6.0290356527535836e-06, "Full-finetune/Loss": 0.778343141078949, "Full-finetune/Loss (Raw)": 0.7949560284614563, "Full-finetune/Step": 3332, "Full-finetune/Step Time": 6.745351223275065} {"Full-finetune/Learning Rate": 6.023319030951091e-06, "Full-finetune/Loss": 0.7789559960365295, "Full-finetune/Loss (Raw)": 0.8179660439491272, "Full-finetune/Step": 3333, "Full-finetune/Step Time": 6.745319342240691} {"Full-finetune/Learning Rate": 6.017603952420846e-06, "Full-finetune/Loss": 0.7801699042320251, "Full-finetune/Loss (Raw)": 0.8231285214424133, "Full-finetune/Step": 3334, "Full-finetune/Step Time": 6.745787909254432} {"Full-finetune/Learning Rate": 6.011890419380756e-06, "Full-finetune/Loss": 0.7798994779586792, "Full-finetune/Loss (Raw)": 0.7332194447517395, "Full-finetune/Step": 3335, "Full-finetune/Step Time": 6.724694192409515} {"Full-finetune/Learning Rate": 6.0061784340481366e-06, "Full-finetune/Loss": 0.779421329498291, "Full-finetune/Loss (Raw)": 0.7644370198249817, "Full-finetune/Step": 3336, "Full-finetune/Step Time": 6.72395840100944} {"Full-finetune/Learning Rate": 6.000467998639692e-06, "Full-finetune/Loss": 0.7786004543304443, "Full-finetune/Loss (Raw)": 0.6839800477027893, "Full-finetune/Step": 3337, "Full-finetune/Step Time": 6.727300396189094} {"Full-finetune/Learning Rate": 5.994759115371531e-06, "Full-finetune/Loss": 0.779310941696167, "Full-finetune/Loss (Raw)": 0.8033944368362427, "Full-finetune/Step": 3338, "Full-finetune/Step Time": 6.731128511950374} {"Full-finetune/Learning Rate": 5.989051786459163e-06, "Full-finetune/Loss": 0.7797116041183472, "Full-finetune/Loss (Raw)": 0.852747917175293, "Full-finetune/Step": 3339, "Full-finetune/Step Time": 6.723779721185565} {"Full-finetune/Learning Rate": 5.98334601411749e-06, "Full-finetune/Loss": 0.7829830646514893, "Full-finetune/Loss (Raw)": 0.813784658908844, "Full-finetune/Step": 3340, "Full-finetune/Step Time": 6.707140382379293} {"Full-finetune/Learning Rate": 5.977641800560811e-06, "Full-finetune/Loss": 0.7838428020477295, "Full-finetune/Loss (Raw)": 0.9607221484184265, "Full-finetune/Step": 3341, "Full-finetune/Step Time": 6.713454166427255} {"Full-finetune/Learning Rate": 5.971939148002819e-06, "Full-finetune/Loss": 0.7850837111473083, "Full-finetune/Loss (Raw)": 0.8782044649124146, "Full-finetune/Step": 3342, "Full-finetune/Step Time": 6.693409921601415} {"Full-finetune/Learning Rate": 5.966238058656601e-06, "Full-finetune/Loss": 0.7866023182868958, "Full-finetune/Loss (Raw)": 0.8453855514526367, "Full-finetune/Step": 3343, "Full-finetune/Step Time": 6.680401409044862} {"Full-finetune/Learning Rate": 5.960538534734641e-06, "Full-finetune/Loss": 0.7864833474159241, "Full-finetune/Loss (Raw)": 0.6270087361335754, "Full-finetune/Step": 3344, "Full-finetune/Step Time": 6.660430861636996} {"Full-finetune/Learning Rate": 5.9548405784488095e-06, "Full-finetune/Loss": 0.782837986946106, "Full-finetune/Loss (Raw)": 0.35004115104675293, "Full-finetune/Step": 3345, "Full-finetune/Step Time": 6.684320542961359} {"Full-finetune/Learning Rate": 5.949144192010378e-06, "Full-finetune/Loss": 0.7832661867141724, "Full-finetune/Loss (Raw)": 0.88422691822052, "Full-finetune/Step": 3346, "Full-finetune/Step Time": 6.683065192773938} {"Full-finetune/Learning Rate": 5.94344937763e-06, "Full-finetune/Loss": 0.7833219766616821, "Full-finetune/Loss (Raw)": 0.6824234127998352, "Full-finetune/Step": 3347, "Full-finetune/Step Time": 6.683942053467035} {"Full-finetune/Learning Rate": 5.9377561375177164e-06, "Full-finetune/Loss": 0.7824902534484863, "Full-finetune/Loss (Raw)": 0.852552592754364, "Full-finetune/Step": 3348, "Full-finetune/Step Time": 6.688734760507941} {"Full-finetune/Learning Rate": 5.9320644738829706e-06, "Full-finetune/Loss": 0.7831974625587463, "Full-finetune/Loss (Raw)": 0.8484823107719421, "Full-finetune/Step": 3349, "Full-finetune/Step Time": 6.69530526176095} {"Full-finetune/Learning Rate": 5.926374388934579e-06, "Full-finetune/Loss": 0.7884301543235779, "Full-finetune/Loss (Raw)": 0.9985067248344421, "Full-finetune/Step": 3350, "Full-finetune/Step Time": 6.6843618005514145} {"Full-finetune/Learning Rate": 5.920685884880762e-06, "Full-finetune/Loss": 0.7881970405578613, "Full-finetune/Loss (Raw)": 0.7449897527694702, "Full-finetune/Step": 3351, "Full-finetune/Step Time": 6.690990224480629} {"Full-finetune/Learning Rate": 5.914998963929109e-06, "Full-finetune/Loss": 0.7885441184043884, "Full-finetune/Loss (Raw)": 0.8392490148544312, "Full-finetune/Step": 3352, "Full-finetune/Step Time": 6.694961508736014} {"Full-finetune/Learning Rate": 5.9093136282866014e-06, "Full-finetune/Loss": 0.7894854545593262, "Full-finetune/Loss (Raw)": 0.9044174551963806, "Full-finetune/Step": 3353, "Full-finetune/Step Time": 6.710289945825934} {"Full-finetune/Learning Rate": 5.903629880159614e-06, "Full-finetune/Loss": 0.7901328206062317, "Full-finetune/Loss (Raw)": 0.8870015740394592, "Full-finetune/Step": 3354, "Full-finetune/Step Time": 6.708626376464963} {"Full-finetune/Learning Rate": 5.897947721753894e-06, "Full-finetune/Loss": 0.7912706732749939, "Full-finetune/Loss (Raw)": 0.8374776244163513, "Full-finetune/Step": 3355, "Full-finetune/Step Time": 6.700623441487551} {"Full-finetune/Learning Rate": 5.89226715527458e-06, "Full-finetune/Loss": 0.7920234203338623, "Full-finetune/Loss (Raw)": 0.8745782971382141, "Full-finetune/Step": 3356, "Full-finetune/Step Time": 6.70193830691278} {"Full-finetune/Learning Rate": 5.886588182926185e-06, "Full-finetune/Loss": 0.7913031578063965, "Full-finetune/Loss (Raw)": 0.804715096950531, "Full-finetune/Step": 3357, "Full-finetune/Step Time": 6.702545924112201} {"Full-finetune/Learning Rate": 5.880910806912607e-06, "Full-finetune/Loss": 0.7914155721664429, "Full-finetune/Loss (Raw)": 0.7496346235275269, "Full-finetune/Step": 3358, "Full-finetune/Step Time": 6.707091273739934} {"Full-finetune/Learning Rate": 5.8752350294371274e-06, "Full-finetune/Loss": 0.7929837107658386, "Full-finetune/Loss (Raw)": 0.9967902898788452, "Full-finetune/Step": 3359, "Full-finetune/Step Time": 6.680317189544439} {"Full-finetune/Learning Rate": 5.8695608527024075e-06, "Full-finetune/Loss": 0.7926227450370789, "Full-finetune/Loss (Raw)": 0.885934054851532, "Full-finetune/Step": 3360, "Full-finetune/Step Time": 6.680782565847039} {"Full-finetune/Learning Rate": 5.863888278910475e-06, "Full-finetune/Loss": 0.7912766933441162, "Full-finetune/Loss (Raw)": 0.8347718119621277, "Full-finetune/Step": 3361, "Full-finetune/Step Time": 6.693854911252856} {"Full-finetune/Learning Rate": 5.8582173102627526e-06, "Full-finetune/Loss": 0.7914472818374634, "Full-finetune/Loss (Raw)": 0.7211107611656189, "Full-finetune/Step": 3362, "Full-finetune/Step Time": 6.687117008492351} {"Full-finetune/Learning Rate": 5.852547948960029e-06, "Full-finetune/Loss": 0.7911353707313538, "Full-finetune/Loss (Raw)": 0.8843527436256409, "Full-finetune/Step": 3363, "Full-finetune/Step Time": 6.686627635732293} {"Full-finetune/Learning Rate": 5.8468801972024755e-06, "Full-finetune/Loss": 0.7931199073791504, "Full-finetune/Loss (Raw)": 0.8795304298400879, "Full-finetune/Step": 3364, "Full-finetune/Step Time": 6.679401073604822} {"Full-finetune/Learning Rate": 5.841214057189638e-06, "Full-finetune/Loss": 0.7921921014785767, "Full-finetune/Loss (Raw)": 0.7541661262512207, "Full-finetune/Step": 3365, "Full-finetune/Step Time": 6.693185010924935} {"Full-finetune/Learning Rate": 5.8355495311204266e-06, "Full-finetune/Loss": 0.7944632768630981, "Full-finetune/Loss (Raw)": 0.6825264096260071, "Full-finetune/Step": 3366, "Full-finetune/Step Time": 6.685546958819032} {"Full-finetune/Learning Rate": 5.829886621193141e-06, "Full-finetune/Loss": 0.7924275994300842, "Full-finetune/Loss (Raw)": 0.7036360502243042, "Full-finetune/Step": 3367, "Full-finetune/Step Time": 6.691792033612728} {"Full-finetune/Learning Rate": 5.824225329605442e-06, "Full-finetune/Loss": 0.7885745763778687, "Full-finetune/Loss (Raw)": 0.4339701533317566, "Full-finetune/Step": 3368, "Full-finetune/Step Time": 6.7086481153965} {"Full-finetune/Learning Rate": 5.818565658554364e-06, "Full-finetune/Loss": 0.7881746888160706, "Full-finetune/Loss (Raw)": 0.8363797664642334, "Full-finetune/Step": 3369, "Full-finetune/Step Time": 6.697180546820164} {"Full-finetune/Learning Rate": 5.8129076102363266e-06, "Full-finetune/Loss": 0.7876508235931396, "Full-finetune/Loss (Raw)": 0.8648583889007568, "Full-finetune/Step": 3370, "Full-finetune/Step Time": 6.6948763113468885} {"Full-finetune/Learning Rate": 5.807251186847095e-06, "Full-finetune/Loss": 0.7854422926902771, "Full-finetune/Loss (Raw)": 0.5716260671615601, "Full-finetune/Step": 3371, "Full-finetune/Step Time": 6.716408798471093} {"Full-finetune/Learning Rate": 5.801596390581817e-06, "Full-finetune/Loss": 0.7844991087913513, "Full-finetune/Loss (Raw)": 0.7270938158035278, "Full-finetune/Step": 3372, "Full-finetune/Step Time": 6.727139396592975} {"Full-finetune/Learning Rate": 5.795943223635018e-06, "Full-finetune/Loss": 0.7841450572013855, "Full-finetune/Loss (Raw)": 0.8397913575172424, "Full-finetune/Step": 3373, "Full-finetune/Step Time": 6.731392487883568} {"Full-finetune/Learning Rate": 5.7902916882005755e-06, "Full-finetune/Loss": 0.7852482795715332, "Full-finetune/Loss (Raw)": 0.8127924203872681, "Full-finetune/Step": 3374, "Full-finetune/Step Time": 6.734218860045075} {"Full-finetune/Learning Rate": 5.784641786471742e-06, "Full-finetune/Loss": 0.7875912189483643, "Full-finetune/Loss (Raw)": 1.0425164699554443, "Full-finetune/Step": 3375, "Full-finetune/Step Time": 6.731669565662742} {"Full-finetune/Learning Rate": 5.778993520641132e-06, "Full-finetune/Loss": 0.7874237298965454, "Full-finetune/Loss (Raw)": 0.9201498031616211, "Full-finetune/Step": 3376, "Full-finetune/Step Time": 6.7239985931664705} {"Full-finetune/Learning Rate": 5.7733468929007294e-06, "Full-finetune/Loss": 0.7850745320320129, "Full-finetune/Loss (Raw)": 0.6415507793426514, "Full-finetune/Step": 3377, "Full-finetune/Step Time": 6.734093740582466} {"Full-finetune/Learning Rate": 5.7677019054418805e-06, "Full-finetune/Loss": 0.7860833406448364, "Full-finetune/Loss (Raw)": 0.8951082825660706, "Full-finetune/Step": 3378, "Full-finetune/Step Time": 6.719059385359287} {"Full-finetune/Learning Rate": 5.762058560455287e-06, "Full-finetune/Loss": 0.7858601808547974, "Full-finetune/Loss (Raw)": 0.6199515461921692, "Full-finetune/Step": 3379, "Full-finetune/Step Time": 6.6934996619820595} {"Full-finetune/Learning Rate": 5.756416860131036e-06, "Full-finetune/Loss": 0.7843822240829468, "Full-finetune/Loss (Raw)": 0.6927832961082458, "Full-finetune/Step": 3380, "Full-finetune/Step Time": 6.689802687615156} {"Full-finetune/Learning Rate": 5.750776806658549e-06, "Full-finetune/Loss": 0.7837463617324829, "Full-finetune/Loss (Raw)": 0.7455096244812012, "Full-finetune/Step": 3381, "Full-finetune/Step Time": 6.685076644644141} {"Full-finetune/Learning Rate": 5.745138402226621e-06, "Full-finetune/Loss": 0.7838781476020813, "Full-finetune/Loss (Raw)": 0.8870787620544434, "Full-finetune/Step": 3382, "Full-finetune/Step Time": 6.675766749307513} {"Full-finetune/Learning Rate": 5.739501649023413e-06, "Full-finetune/Loss": 0.7831205725669861, "Full-finetune/Loss (Raw)": 0.7809756398200989, "Full-finetune/Step": 3383, "Full-finetune/Step Time": 6.663063734769821} {"Full-finetune/Learning Rate": 5.7338665492364365e-06, "Full-finetune/Loss": 0.78312748670578, "Full-finetune/Loss (Raw)": 0.879714846611023, "Full-finetune/Step": 3384, "Full-finetune/Step Time": 6.648608323186636} {"Full-finetune/Learning Rate": 5.728233105052563e-06, "Full-finetune/Loss": 0.7832713723182678, "Full-finetune/Loss (Raw)": 0.6593137979507446, "Full-finetune/Step": 3385, "Full-finetune/Step Time": 6.638358803465962} {"Full-finetune/Learning Rate": 5.722601318658021e-06, "Full-finetune/Loss": 0.7815261483192444, "Full-finetune/Loss (Raw)": 0.7806851267814636, "Full-finetune/Step": 3386, "Full-finetune/Step Time": 6.629626987501979} {"Full-finetune/Learning Rate": 5.7169711922383984e-06, "Full-finetune/Loss": 0.781650185585022, "Full-finetune/Loss (Raw)": 0.7360811829566956, "Full-finetune/Step": 3387, "Full-finetune/Step Time": 6.618870034813881} {"Full-finetune/Learning Rate": 5.711342727978637e-06, "Full-finetune/Loss": 0.7812161445617676, "Full-finetune/Loss (Raw)": 0.7615053653717041, "Full-finetune/Step": 3388, "Full-finetune/Step Time": 6.601458631455898} {"Full-finetune/Learning Rate": 5.7057159280630316e-06, "Full-finetune/Loss": 0.781832754611969, "Full-finetune/Loss (Raw)": 0.8153367042541504, "Full-finetune/Step": 3389, "Full-finetune/Step Time": 6.606124863028526} {"Full-finetune/Learning Rate": 5.700090794675241e-06, "Full-finetune/Loss": 0.7810577154159546, "Full-finetune/Loss (Raw)": 0.8219057321548462, "Full-finetune/Step": 3390, "Full-finetune/Step Time": 6.610340192914009} {"Full-finetune/Learning Rate": 5.694467329998264e-06, "Full-finetune/Loss": 0.781462550163269, "Full-finetune/Loss (Raw)": 0.9731273055076599, "Full-finetune/Step": 3391, "Full-finetune/Step Time": 6.606854537501931} {"Full-finetune/Learning Rate": 5.68884553621445e-06, "Full-finetune/Loss": 0.7817950248718262, "Full-finetune/Loss (Raw)": 0.7553879618644714, "Full-finetune/Step": 3392, "Full-finetune/Step Time": 6.606911484152079} {"Full-finetune/Learning Rate": 5.683225415505521e-06, "Full-finetune/Loss": 0.7813209891319275, "Full-finetune/Loss (Raw)": 0.8873456716537476, "Full-finetune/Step": 3393, "Full-finetune/Step Time": 6.604131357744336} {"Full-finetune/Learning Rate": 5.67760697005253e-06, "Full-finetune/Loss": 0.780762791633606, "Full-finetune/Loss (Raw)": 0.7248708605766296, "Full-finetune/Step": 3394, "Full-finetune/Step Time": 6.624224100261927} {"Full-finetune/Learning Rate": 5.671990202035886e-06, "Full-finetune/Loss": 0.7818486094474792, "Full-finetune/Loss (Raw)": 0.8767591118812561, "Full-finetune/Step": 3395, "Full-finetune/Step Time": 6.608378326520324} {"Full-finetune/Learning Rate": 5.666375113635347e-06, "Full-finetune/Loss": 0.7799760699272156, "Full-finetune/Loss (Raw)": 0.6651743650436401, "Full-finetune/Step": 3396, "Full-finetune/Step Time": 6.608244031667709} {"Full-finetune/Learning Rate": 5.660761707030022e-06, "Full-finetune/Loss": 0.7790837287902832, "Full-finetune/Loss (Raw)": 0.756140947341919, "Full-finetune/Step": 3397, "Full-finetune/Step Time": 6.605953132733703} {"Full-finetune/Learning Rate": 5.655149984398359e-06, "Full-finetune/Loss": 0.779788076877594, "Full-finetune/Loss (Raw)": 0.8234030604362488, "Full-finetune/Step": 3398, "Full-finetune/Step Time": 6.605365911498666} {"Full-finetune/Learning Rate": 5.649539947918159e-06, "Full-finetune/Loss": 0.7796769142150879, "Full-finetune/Loss (Raw)": 0.7720965147018433, "Full-finetune/Step": 3399, "Full-finetune/Step Time": 6.614795571193099} {"Full-finetune/Learning Rate": 5.643931599766577e-06, "Full-finetune/Loss": 0.779744029045105, "Full-finetune/Loss (Raw)": 0.7725518345832825, "Full-finetune/Step": 3400, "Full-finetune/Step Time": 6.588539898395538} {"Full-finetune/Learning Rate": 5.638324942120091e-06, "Full-finetune/Loss": 0.7796424627304077, "Full-finetune/Loss (Raw)": 0.7193395495414734, "Full-finetune/Step": 3401, "Full-finetune/Step Time": 6.580912668257952} {"Full-finetune/Learning Rate": 5.632719977154537e-06, "Full-finetune/Loss": 0.7832205295562744, "Full-finetune/Loss (Raw)": 0.7732304930686951, "Full-finetune/Step": 3402, "Full-finetune/Step Time": 6.56211069971323} {"Full-finetune/Learning Rate": 5.6271167070451016e-06, "Full-finetune/Loss": 0.7834380865097046, "Full-finetune/Loss (Raw)": 0.7488998770713806, "Full-finetune/Step": 3403, "Full-finetune/Step Time": 6.557182729244232} {"Full-finetune/Learning Rate": 5.621515133966301e-06, "Full-finetune/Loss": 0.7828456163406372, "Full-finetune/Loss (Raw)": 0.760546863079071, "Full-finetune/Step": 3404, "Full-finetune/Step Time": 6.555110862478614} {"Full-finetune/Learning Rate": 5.615915260091987e-06, "Full-finetune/Loss": 0.7809860706329346, "Full-finetune/Loss (Raw)": 0.5882371068000793, "Full-finetune/Step": 3405, "Full-finetune/Step Time": 6.595502598211169} {"Full-finetune/Learning Rate": 5.610317087595372e-06, "Full-finetune/Loss": 0.7813167572021484, "Full-finetune/Loss (Raw)": 0.8465638160705566, "Full-finetune/Step": 3406, "Full-finetune/Step Time": 6.602955982089043} {"Full-finetune/Learning Rate": 5.604720618648993e-06, "Full-finetune/Loss": 0.7812852263450623, "Full-finetune/Loss (Raw)": 0.8321049809455872, "Full-finetune/Step": 3407, "Full-finetune/Step Time": 6.591311268508434} {"Full-finetune/Learning Rate": 5.599125855424734e-06, "Full-finetune/Loss": 0.780572772026062, "Full-finetune/Loss (Raw)": 0.8425803780555725, "Full-finetune/Step": 3408, "Full-finetune/Step Time": 6.5919907335191965} {"Full-finetune/Learning Rate": 5.593532800093808e-06, "Full-finetune/Loss": 0.7794598937034607, "Full-finetune/Loss (Raw)": 0.8357921838760376, "Full-finetune/Step": 3409, "Full-finetune/Step Time": 6.590033138170838} {"Full-finetune/Learning Rate": 5.5879414548267754e-06, "Full-finetune/Loss": 0.7787630558013916, "Full-finetune/Loss (Raw)": 0.6943468451499939, "Full-finetune/Step": 3410, "Full-finetune/Step Time": 6.59399376437068} {"Full-finetune/Learning Rate": 5.582351821793525e-06, "Full-finetune/Loss": 0.7831782698631287, "Full-finetune/Loss (Raw)": 0.9304004311561584, "Full-finetune/Step": 3411, "Full-finetune/Step Time": 6.575692495331168} {"Full-finetune/Learning Rate": 5.576763903163281e-06, "Full-finetune/Loss": 0.7837401628494263, "Full-finetune/Loss (Raw)": 0.83847975730896, "Full-finetune/Step": 3412, "Full-finetune/Step Time": 6.571390142664313} {"Full-finetune/Learning Rate": 5.571177701104614e-06, "Full-finetune/Loss": 0.7842327356338501, "Full-finetune/Loss (Raw)": 0.9215529561042786, "Full-finetune/Step": 3413, "Full-finetune/Step Time": 6.578901503235102} {"Full-finetune/Learning Rate": 5.56559321778542e-06, "Full-finetune/Loss": 0.7852119207382202, "Full-finetune/Loss (Raw)": 0.9256539940834045, "Full-finetune/Step": 3414, "Full-finetune/Step Time": 6.576515970751643} {"Full-finetune/Learning Rate": 5.560010455372915e-06, "Full-finetune/Loss": 0.7838670015335083, "Full-finetune/Loss (Raw)": 0.6656160354614258, "Full-finetune/Step": 3415, "Full-finetune/Step Time": 6.574093608185649} {"Full-finetune/Learning Rate": 5.5544294160336735e-06, "Full-finetune/Loss": 0.7800451517105103, "Full-finetune/Loss (Raw)": 0.4222222864627838, "Full-finetune/Step": 3416, "Full-finetune/Step Time": 6.590302461758256} {"Full-finetune/Learning Rate": 5.5488501019335824e-06, "Full-finetune/Loss": 0.7800055742263794, "Full-finetune/Loss (Raw)": 0.7366905212402344, "Full-finetune/Step": 3417, "Full-finetune/Step Time": 6.607282059267163} {"Full-finetune/Learning Rate": 5.5432725152378675e-06, "Full-finetune/Loss": 0.7796599268913269, "Full-finetune/Loss (Raw)": 0.8160129189491272, "Full-finetune/Step": 3418, "Full-finetune/Step Time": 6.618881568312645} {"Full-finetune/Learning Rate": 5.537696658111077e-06, "Full-finetune/Loss": 0.7806936502456665, "Full-finetune/Loss (Raw)": 0.8131993412971497, "Full-finetune/Step": 3419, "Full-finetune/Step Time": 6.610620833933353} {"Full-finetune/Learning Rate": 5.532122532717095e-06, "Full-finetune/Loss": 0.7787973880767822, "Full-finetune/Loss (Raw)": 0.5251815319061279, "Full-finetune/Step": 3420, "Full-finetune/Step Time": 6.635357705876231} {"Full-finetune/Learning Rate": 5.52655014121913e-06, "Full-finetune/Loss": 0.7791544198989868, "Full-finetune/Loss (Raw)": 0.8588483333587646, "Full-finetune/Step": 3421, "Full-finetune/Step Time": 6.63751608133316} {"Full-finetune/Learning Rate": 5.5209794857797135e-06, "Full-finetune/Loss": 0.7789678573608398, "Full-finetune/Loss (Raw)": 0.6896398067474365, "Full-finetune/Step": 3422, "Full-finetune/Step Time": 6.630939599126577} {"Full-finetune/Learning Rate": 5.51541056856072e-06, "Full-finetune/Loss": 0.7787436246871948, "Full-finetune/Loss (Raw)": 0.7544509172439575, "Full-finetune/Step": 3423, "Full-finetune/Step Time": 6.629586756229401} {"Full-finetune/Learning Rate": 5.509843391723332e-06, "Full-finetune/Loss": 0.7748618125915527, "Full-finetune/Loss (Raw)": 0.3456370532512665, "Full-finetune/Step": 3424, "Full-finetune/Step Time": 6.642088422551751} {"Full-finetune/Learning Rate": 5.504277957428053e-06, "Full-finetune/Loss": 0.7756094336509705, "Full-finetune/Loss (Raw)": 0.7722751498222351, "Full-finetune/Step": 3425, "Full-finetune/Step Time": 6.629298755899072} {"Full-finetune/Learning Rate": 5.498714267834731e-06, "Full-finetune/Loss": 0.7737456560134888, "Full-finetune/Loss (Raw)": 0.663021981716156, "Full-finetune/Step": 3426, "Full-finetune/Step Time": 6.630682116374373} {"Full-finetune/Learning Rate": 5.493152325102523e-06, "Full-finetune/Loss": 0.7772649526596069, "Full-finetune/Loss (Raw)": 0.8335922956466675, "Full-finetune/Step": 3427, "Full-finetune/Step Time": 6.616562090814114} {"Full-finetune/Learning Rate": 5.487592131389907e-06, "Full-finetune/Loss": 0.776447057723999, "Full-finetune/Loss (Raw)": 0.7544885277748108, "Full-finetune/Step": 3428, "Full-finetune/Step Time": 6.634210618212819} {"Full-finetune/Learning Rate": 5.482033688854689e-06, "Full-finetune/Loss": 0.7778286933898926, "Full-finetune/Loss (Raw)": 0.8480162620544434, "Full-finetune/Step": 3429, "Full-finetune/Step Time": 6.630752624943852} {"Full-finetune/Learning Rate": 5.47647699965399e-06, "Full-finetune/Loss": 0.7758963108062744, "Full-finetune/Loss (Raw)": 0.6533306241035461, "Full-finetune/Step": 3430, "Full-finetune/Step Time": 6.624634800478816} {"Full-finetune/Learning Rate": 5.470922065944253e-06, "Full-finetune/Loss": 0.7769811153411865, "Full-finetune/Loss (Raw)": 0.9273394346237183, "Full-finetune/Step": 3431, "Full-finetune/Step Time": 6.628909315913916} {"Full-finetune/Learning Rate": 5.465368889881235e-06, "Full-finetune/Loss": 0.7761836051940918, "Full-finetune/Loss (Raw)": 0.6376991271972656, "Full-finetune/Step": 3432, "Full-finetune/Step Time": 6.630289478227496} {"Full-finetune/Learning Rate": 5.459817473620024e-06, "Full-finetune/Loss": 0.7755683660507202, "Full-finetune/Loss (Raw)": 0.7933547496795654, "Full-finetune/Step": 3433, "Full-finetune/Step Time": 6.637122130021453} {"Full-finetune/Learning Rate": 5.454267819315016e-06, "Full-finetune/Loss": 0.7753905057907104, "Full-finetune/Loss (Raw)": 0.6877840757369995, "Full-finetune/Step": 3434, "Full-finetune/Step Time": 6.661740999668837} {"Full-finetune/Learning Rate": 5.448719929119916e-06, "Full-finetune/Loss": 0.7736896872520447, "Full-finetune/Loss (Raw)": 0.7298455238342285, "Full-finetune/Step": 3435, "Full-finetune/Step Time": 6.674937214702368} {"Full-finetune/Learning Rate": 5.44317380518775e-06, "Full-finetune/Loss": 0.772788405418396, "Full-finetune/Loss (Raw)": 0.7104605436325073, "Full-finetune/Step": 3436, "Full-finetune/Step Time": 6.668602341786027} {"Full-finetune/Learning Rate": 5.43762944967087e-06, "Full-finetune/Loss": 0.7721498608589172, "Full-finetune/Loss (Raw)": 0.7990975975990295, "Full-finetune/Step": 3437, "Full-finetune/Step Time": 6.647504396736622} {"Full-finetune/Learning Rate": 5.432086864720929e-06, "Full-finetune/Loss": 0.7719880938529968, "Full-finetune/Loss (Raw)": 0.715884804725647, "Full-finetune/Step": 3438, "Full-finetune/Step Time": 6.645613685250282} {"Full-finetune/Learning Rate": 5.426546052488892e-06, "Full-finetune/Loss": 0.7728209495544434, "Full-finetune/Loss (Raw)": 0.8177925944328308, "Full-finetune/Step": 3439, "Full-finetune/Step Time": 6.651012299582362} {"Full-finetune/Learning Rate": 5.421007015125046e-06, "Full-finetune/Loss": 0.7723077535629272, "Full-finetune/Loss (Raw)": 0.7118082642555237, "Full-finetune/Step": 3440, "Full-finetune/Step Time": 6.642644850537181} {"Full-finetune/Learning Rate": 5.415469754778979e-06, "Full-finetune/Loss": 0.7738105058670044, "Full-finetune/Loss (Raw)": 0.6208258867263794, "Full-finetune/Step": 3441, "Full-finetune/Step Time": 6.6463097259402275} {"Full-finetune/Learning Rate": 5.409934273599594e-06, "Full-finetune/Loss": 0.7737741470336914, "Full-finetune/Loss (Raw)": 0.7305827140808105, "Full-finetune/Step": 3442, "Full-finetune/Step Time": 6.653944903984666} {"Full-finetune/Learning Rate": 5.404400573735105e-06, "Full-finetune/Loss": 0.7716898918151855, "Full-finetune/Loss (Raw)": 0.7189281582832336, "Full-finetune/Step": 3443, "Full-finetune/Step Time": 6.663744663819671} {"Full-finetune/Learning Rate": 5.3988686573330316e-06, "Full-finetune/Loss": 0.772179365158081, "Full-finetune/Loss (Raw)": 0.8250954151153564, "Full-finetune/Step": 3444, "Full-finetune/Step Time": 6.656796783208847} {"Full-finetune/Learning Rate": 5.393338526540202e-06, "Full-finetune/Loss": 0.7707443237304688, "Full-finetune/Loss (Raw)": 0.572196364402771, "Full-finetune/Step": 3445, "Full-finetune/Step Time": 6.675580188632011} {"Full-finetune/Learning Rate": 5.387810183502749e-06, "Full-finetune/Loss": 0.7739472985267639, "Full-finetune/Loss (Raw)": 0.7436135411262512, "Full-finetune/Step": 3446, "Full-finetune/Step Time": 6.666548080742359} {"Full-finetune/Learning Rate": 5.382283630366123e-06, "Full-finetune/Loss": 0.7739991545677185, "Full-finetune/Loss (Raw)": 0.9001999497413635, "Full-finetune/Step": 3447, "Full-finetune/Step Time": 6.6616213377565145} {"Full-finetune/Learning Rate": 5.37675886927507e-06, "Full-finetune/Loss": 0.7738224267959595, "Full-finetune/Loss (Raw)": 0.735051691532135, "Full-finetune/Step": 3448, "Full-finetune/Step Time": 6.667498210445046} {"Full-finetune/Learning Rate": 5.371235902373632e-06, "Full-finetune/Loss": 0.775378942489624, "Full-finetune/Loss (Raw)": 0.9000313878059387, "Full-finetune/Step": 3449, "Full-finetune/Step Time": 6.66354082711041} {"Full-finetune/Learning Rate": 5.365714731805174e-06, "Full-finetune/Loss": 0.7754793167114258, "Full-finetune/Loss (Raw)": 0.776507556438446, "Full-finetune/Step": 3450, "Full-finetune/Step Time": 6.6839636992663145} {"Full-finetune/Learning Rate": 5.360195359712353e-06, "Full-finetune/Loss": 0.7747355699539185, "Full-finetune/Loss (Raw)": 0.7891653776168823, "Full-finetune/Step": 3451, "Full-finetune/Step Time": 6.667011709883809} {"Full-finetune/Learning Rate": 5.354677788237126e-06, "Full-finetune/Loss": 0.7756969928741455, "Full-finetune/Loss (Raw)": 0.8805667757987976, "Full-finetune/Step": 3452, "Full-finetune/Step Time": 6.651589319109917} {"Full-finetune/Learning Rate": 5.349162019520759e-06, "Full-finetune/Loss": 0.776570200920105, "Full-finetune/Loss (Raw)": 0.7957428693771362, "Full-finetune/Step": 3453, "Full-finetune/Step Time": 6.649547701701522} {"Full-finetune/Learning Rate": 5.343648055703812e-06, "Full-finetune/Loss": 0.7755679488182068, "Full-finetune/Loss (Raw)": 0.7491392493247986, "Full-finetune/Step": 3454, "Full-finetune/Step Time": 6.658330177888274} {"Full-finetune/Learning Rate": 5.338135898926147e-06, "Full-finetune/Loss": 0.7736777067184448, "Full-finetune/Loss (Raw)": 0.33921322226524353, "Full-finetune/Step": 3455, "Full-finetune/Step Time": 6.666751390323043} {"Full-finetune/Learning Rate": 5.33262555132692e-06, "Full-finetune/Loss": 0.7732160091400146, "Full-finetune/Loss (Raw)": 0.8599147200584412, "Full-finetune/Step": 3456, "Full-finetune/Step Time": 6.663154672831297} {"Full-finetune/Learning Rate": 5.327117015044599e-06, "Full-finetune/Loss": 0.7734546065330505, "Full-finetune/Loss (Raw)": 0.8464106321334839, "Full-finetune/Step": 3457, "Full-finetune/Step Time": 6.653927596285939} {"Full-finetune/Learning Rate": 5.321610292216937e-06, "Full-finetune/Loss": 0.7744241952896118, "Full-finetune/Loss (Raw)": 0.8152331113815308, "Full-finetune/Step": 3458, "Full-finetune/Step Time": 6.662594307214022} {"Full-finetune/Learning Rate": 5.316105384980974e-06, "Full-finetune/Loss": 0.774489164352417, "Full-finetune/Loss (Raw)": 0.8215888738632202, "Full-finetune/Step": 3459, "Full-finetune/Step Time": 6.65297519415617} {"Full-finetune/Learning Rate": 5.3106022954730704e-06, "Full-finetune/Loss": 0.7753075361251831, "Full-finetune/Loss (Raw)": 0.8997084498405457, "Full-finetune/Step": 3460, "Full-finetune/Step Time": 6.654792565852404} {"Full-finetune/Learning Rate": 5.3051010258288624e-06, "Full-finetune/Loss": 0.7715555429458618, "Full-finetune/Loss (Raw)": 0.3377048373222351, "Full-finetune/Step": 3461, "Full-finetune/Step Time": 6.674020491540432} {"Full-finetune/Learning Rate": 5.299601578183289e-06, "Full-finetune/Loss": 0.7713795304298401, "Full-finetune/Loss (Raw)": 0.8006031513214111, "Full-finetune/Step": 3462, "Full-finetune/Step Time": 6.670640826225281} {"Full-finetune/Learning Rate": 5.294103954670573e-06, "Full-finetune/Loss": 0.7716231942176819, "Full-finetune/Loss (Raw)": 0.764410674571991, "Full-finetune/Step": 3463, "Full-finetune/Step Time": 6.672893233597279} {"Full-finetune/Learning Rate": 5.288608157424238e-06, "Full-finetune/Loss": 0.7726831436157227, "Full-finetune/Loss (Raw)": 0.9001119136810303, "Full-finetune/Step": 3464, "Full-finetune/Step Time": 6.683881279081106} {"Full-finetune/Learning Rate": 5.283114188577094e-06, "Full-finetune/Loss": 0.7730064392089844, "Full-finetune/Loss (Raw)": 0.7253568768501282, "Full-finetune/Step": 3465, "Full-finetune/Step Time": 6.679098214954138} {"Full-finetune/Learning Rate": 5.277622050261242e-06, "Full-finetune/Loss": 0.7720547318458557, "Full-finetune/Loss (Raw)": 0.6815723776817322, "Full-finetune/Step": 3466, "Full-finetune/Step Time": 6.677238397300243} {"Full-finetune/Learning Rate": 5.272131744608078e-06, "Full-finetune/Loss": 0.7705265283584595, "Full-finetune/Loss (Raw)": 0.6571457982063293, "Full-finetune/Step": 3467, "Full-finetune/Step Time": 6.675798751413822} {"Full-finetune/Learning Rate": 5.2666432737482844e-06, "Full-finetune/Loss": 0.7691562175750732, "Full-finetune/Loss (Raw)": 0.6383820176124573, "Full-finetune/Step": 3468, "Full-finetune/Step Time": 6.683657938614488} {"Full-finetune/Learning Rate": 5.261156639811817e-06, "Full-finetune/Loss": 0.7672301530838013, "Full-finetune/Loss (Raw)": 0.7141817808151245, "Full-finetune/Step": 3469, "Full-finetune/Step Time": 6.691847071051598} {"Full-finetune/Learning Rate": 5.255671844927944e-06, "Full-finetune/Loss": 0.7663537263870239, "Full-finetune/Loss (Raw)": 0.7660292983055115, "Full-finetune/Step": 3470, "Full-finetune/Step Time": 6.699347984045744} {"Full-finetune/Learning Rate": 5.250188891225203e-06, "Full-finetune/Loss": 0.7664813995361328, "Full-finetune/Loss (Raw)": 0.8617268204689026, "Full-finetune/Step": 3471, "Full-finetune/Step Time": 6.705004807561636} {"Full-finetune/Learning Rate": 5.24470778083142e-06, "Full-finetune/Loss": 0.7673687934875488, "Full-finetune/Loss (Raw)": 0.7405993938446045, "Full-finetune/Step": 3472, "Full-finetune/Step Time": 6.705070059746504} {"Full-finetune/Learning Rate": 5.2392285158737085e-06, "Full-finetune/Loss": 0.7713586688041687, "Full-finetune/Loss (Raw)": 0.860734760761261, "Full-finetune/Step": 3473, "Full-finetune/Step Time": 6.7048789374530315} {"Full-finetune/Learning Rate": 5.233751098478465e-06, "Full-finetune/Loss": 0.7696417570114136, "Full-finetune/Loss (Raw)": 0.6644645929336548, "Full-finetune/Step": 3474, "Full-finetune/Step Time": 6.720457339659333} {"Full-finetune/Learning Rate": 5.228275530771366e-06, "Full-finetune/Loss": 0.7706507444381714, "Full-finetune/Loss (Raw)": 0.8115801811218262, "Full-finetune/Step": 3475, "Full-finetune/Step Time": 6.726681061089039} {"Full-finetune/Learning Rate": 5.22280181487737e-06, "Full-finetune/Loss": 0.7689142227172852, "Full-finetune/Loss (Raw)": 0.6302779316902161, "Full-finetune/Step": 3476, "Full-finetune/Step Time": 6.740449609234929} {"Full-finetune/Learning Rate": 5.217329952920727e-06, "Full-finetune/Loss": 0.7680631875991821, "Full-finetune/Loss (Raw)": 0.7395409941673279, "Full-finetune/Step": 3477, "Full-finetune/Step Time": 6.748103430494666} {"Full-finetune/Learning Rate": 5.2118599470249575e-06, "Full-finetune/Loss": 0.7676076889038086, "Full-finetune/Loss (Raw)": 0.9402003884315491, "Full-finetune/Step": 3478, "Full-finetune/Step Time": 6.740430183708668} {"Full-finetune/Learning Rate": 5.206391799312855e-06, "Full-finetune/Loss": 0.7697510719299316, "Full-finetune/Loss (Raw)": 1.0193487405776978, "Full-finetune/Step": 3479, "Full-finetune/Step Time": 6.727326788008213} {"Full-finetune/Learning Rate": 5.200925511906513e-06, "Full-finetune/Loss": 0.7697746157646179, "Full-finetune/Loss (Raw)": 0.8422642350196838, "Full-finetune/Step": 3480, "Full-finetune/Step Time": 6.718409152701497} {"Full-finetune/Learning Rate": 5.195461086927284e-06, "Full-finetune/Loss": 0.7693331837654114, "Full-finetune/Loss (Raw)": 0.847912609577179, "Full-finetune/Step": 3481, "Full-finetune/Step Time": 6.695618877187371} {"Full-finetune/Learning Rate": 5.189998526495808e-06, "Full-finetune/Loss": 0.7683707475662231, "Full-finetune/Loss (Raw)": 0.7638120055198669, "Full-finetune/Step": 3482, "Full-finetune/Step Time": 6.694892914965749} {"Full-finetune/Learning Rate": 5.184537832731996e-06, "Full-finetune/Loss": 0.7676138877868652, "Full-finetune/Loss (Raw)": 0.7405994534492493, "Full-finetune/Step": 3483, "Full-finetune/Step Time": 6.728639578446746} {"Full-finetune/Learning Rate": 5.1790790077550366e-06, "Full-finetune/Loss": 0.7666394710540771, "Full-finetune/Loss (Raw)": 0.7498534917831421, "Full-finetune/Step": 3484, "Full-finetune/Step Time": 6.744897613301873} {"Full-finetune/Learning Rate": 5.173622053683395e-06, "Full-finetune/Loss": 0.7676575183868408, "Full-finetune/Loss (Raw)": 0.9350187182426453, "Full-finetune/Step": 3485, "Full-finetune/Step Time": 6.741497576236725} {"Full-finetune/Learning Rate": 5.168166972634803e-06, "Full-finetune/Loss": 0.7681251764297485, "Full-finetune/Loss (Raw)": 0.8094931840896606, "Full-finetune/Step": 3486, "Full-finetune/Step Time": 6.734025277197361} {"Full-finetune/Learning Rate": 5.1627137667262815e-06, "Full-finetune/Loss": 0.7659595608711243, "Full-finetune/Loss (Raw)": 0.7195954918861389, "Full-finetune/Step": 3487, "Full-finetune/Step Time": 6.732149409130216} {"Full-finetune/Learning Rate": 5.1572624380741044e-06, "Full-finetune/Loss": 0.7643458843231201, "Full-finetune/Loss (Raw)": 0.6793875098228455, "Full-finetune/Step": 3488, "Full-finetune/Step Time": 6.731254063546658} {"Full-finetune/Learning Rate": 5.151812988793825e-06, "Full-finetune/Loss": 0.7646380662918091, "Full-finetune/Loss (Raw)": 0.8721683025360107, "Full-finetune/Step": 3489, "Full-finetune/Step Time": 6.7179635763168335} {"Full-finetune/Learning Rate": 5.146365421000275e-06, "Full-finetune/Loss": 0.7645934820175171, "Full-finetune/Loss (Raw)": 0.7154088616371155, "Full-finetune/Step": 3490, "Full-finetune/Step Time": 6.704421324655414} {"Full-finetune/Learning Rate": 5.140919736807546e-06, "Full-finetune/Loss": 0.7647523283958435, "Full-finetune/Loss (Raw)": 0.9046842455863953, "Full-finetune/Step": 3491, "Full-finetune/Step Time": 6.6993227787315845} {"Full-finetune/Learning Rate": 5.135475938329002e-06, "Full-finetune/Loss": 0.7641048431396484, "Full-finetune/Loss (Raw)": 0.7966431379318237, "Full-finetune/Step": 3492, "Full-finetune/Step Time": 6.708402501419187} {"Full-finetune/Learning Rate": 5.1300340276772756e-06, "Full-finetune/Loss": 0.7620933055877686, "Full-finetune/Loss (Raw)": 0.49669912457466125, "Full-finetune/Step": 3493, "Full-finetune/Step Time": 6.699762092903256} {"Full-finetune/Learning Rate": 5.124594006964263e-06, "Full-finetune/Loss": 0.7639949917793274, "Full-finetune/Loss (Raw)": 0.9259335398674011, "Full-finetune/Step": 3494, "Full-finetune/Step Time": 6.686851482838392} {"Full-finetune/Learning Rate": 5.1191558783011315e-06, "Full-finetune/Loss": 0.7651205062866211, "Full-finetune/Loss (Raw)": 0.847709059715271, "Full-finetune/Step": 3495, "Full-finetune/Step Time": 6.676405666396022} {"Full-finetune/Learning Rate": 5.113719643798312e-06, "Full-finetune/Loss": 0.7684448957443237, "Full-finetune/Loss (Raw)": 0.8594883680343628, "Full-finetune/Step": 3496, "Full-finetune/Step Time": 6.6657329220324755} {"Full-finetune/Learning Rate": 5.108285305565508e-06, "Full-finetune/Loss": 0.7667800784111023, "Full-finetune/Loss (Raw)": 0.6232843995094299, "Full-finetune/Step": 3497, "Full-finetune/Step Time": 6.674051471054554} {"Full-finetune/Learning Rate": 5.1028528657116715e-06, "Full-finetune/Loss": 0.7668372988700867, "Full-finetune/Loss (Raw)": 0.872183084487915, "Full-finetune/Step": 3498, "Full-finetune/Step Time": 6.677433447912335} {"Full-finetune/Learning Rate": 5.097422326345024e-06, "Full-finetune/Loss": 0.7685266733169556, "Full-finetune/Loss (Raw)": 0.7878665924072266, "Full-finetune/Step": 3499, "Full-finetune/Step Time": 6.663158889859915} {"Full-finetune/Learning Rate": 5.091993689573062e-06, "Full-finetune/Loss": 0.7698746919631958, "Full-finetune/Loss (Raw)": 0.8996394276618958, "Full-finetune/Step": 3500, "Full-finetune/Step Time": 6.653034957125783} {"Full-finetune/Learning Rate": 5.086566957502527e-06, "Full-finetune/Loss": 0.7700549364089966, "Full-finetune/Loss (Raw)": 0.8628592491149902, "Full-finetune/Step": 3501, "Full-finetune/Step Time": 6.639293424785137} {"Full-finetune/Learning Rate": 5.081142132239429e-06, "Full-finetune/Loss": 0.7710893154144287, "Full-finetune/Loss (Raw)": 0.9451978802680969, "Full-finetune/Step": 3502, "Full-finetune/Step Time": 6.635035561397672} {"Full-finetune/Learning Rate": 5.075719215889039e-06, "Full-finetune/Loss": 0.7697309255599976, "Full-finetune/Loss (Raw)": 0.8686339259147644, "Full-finetune/Step": 3503, "Full-finetune/Step Time": 6.635128125548363} {"Full-finetune/Learning Rate": 5.070298210555881e-06, "Full-finetune/Loss": 0.7684396505355835, "Full-finetune/Loss (Raw)": 0.7548763751983643, "Full-finetune/Step": 3504, "Full-finetune/Step Time": 6.636218853294849} {"Full-finetune/Learning Rate": 5.064879118343744e-06, "Full-finetune/Loss": 0.7695547342300415, "Full-finetune/Loss (Raw)": 0.7842787504196167, "Full-finetune/Step": 3505, "Full-finetune/Step Time": 6.6330003924667835} {"Full-finetune/Learning Rate": 5.059461941355665e-06, "Full-finetune/Loss": 0.7683655023574829, "Full-finetune/Loss (Raw)": 0.7428891658782959, "Full-finetune/Step": 3506, "Full-finetune/Step Time": 6.629945972934365} {"Full-finetune/Learning Rate": 5.05404668169396e-06, "Full-finetune/Loss": 0.768151581287384, "Full-finetune/Loss (Raw)": 0.5925683379173279, "Full-finetune/Step": 3507, "Full-finetune/Step Time": 6.6447634268552065} {"Full-finetune/Learning Rate": 5.048633341460174e-06, "Full-finetune/Loss": 0.7689193487167358, "Full-finetune/Loss (Raw)": 0.7910609245300293, "Full-finetune/Step": 3508, "Full-finetune/Step Time": 6.646018758416176} {"Full-finetune/Learning Rate": 5.043221922755115e-06, "Full-finetune/Loss": 0.7689906358718872, "Full-finetune/Loss (Raw)": 0.754629909992218, "Full-finetune/Step": 3509, "Full-finetune/Step Time": 6.65943574346602} {"Full-finetune/Learning Rate": 5.03781242767886e-06, "Full-finetune/Loss": 0.7677967548370361, "Full-finetune/Loss (Raw)": 0.7342644929885864, "Full-finetune/Step": 3510, "Full-finetune/Step Time": 6.6588912680745125} {"Full-finetune/Learning Rate": 5.032404858330721e-06, "Full-finetune/Loss": 0.7672741413116455, "Full-finetune/Loss (Raw)": 0.7140809297561646, "Full-finetune/Step": 3511, "Full-finetune/Step Time": 6.6669293865561485} {"Full-finetune/Learning Rate": 5.026999216809275e-06, "Full-finetune/Loss": 0.7664488554000854, "Full-finetune/Loss (Raw)": 0.7740710377693176, "Full-finetune/Step": 3512, "Full-finetune/Step Time": 6.6653796043246984} {"Full-finetune/Learning Rate": 5.021595505212342e-06, "Full-finetune/Loss": 0.7679420709609985, "Full-finetune/Loss (Raw)": 0.8504502773284912, "Full-finetune/Step": 3513, "Full-finetune/Step Time": 6.665404587984085} {"Full-finetune/Learning Rate": 5.016193725637e-06, "Full-finetune/Loss": 0.7675909996032715, "Full-finetune/Loss (Raw)": 0.7357470989227295, "Full-finetune/Step": 3514, "Full-finetune/Step Time": 6.671134755015373} {"Full-finetune/Learning Rate": 5.0107938801795695e-06, "Full-finetune/Loss": 0.7680294513702393, "Full-finetune/Loss (Raw)": 0.7921960353851318, "Full-finetune/Step": 3515, "Full-finetune/Step Time": 6.678085641935468} {"Full-finetune/Learning Rate": 5.005395970935627e-06, "Full-finetune/Loss": 0.7682851552963257, "Full-finetune/Loss (Raw)": 0.7942439317703247, "Full-finetune/Step": 3516, "Full-finetune/Step Time": 6.679341658949852} {"Full-finetune/Learning Rate": 5.000000000000003e-06, "Full-finetune/Loss": 0.7684423327445984, "Full-finetune/Loss (Raw)": 0.8354498147964478, "Full-finetune/Step": 3517, "Full-finetune/Step Time": 6.676849499344826} {"Full-finetune/Learning Rate": 4.994605969466758e-06, "Full-finetune/Loss": 0.7669711112976074, "Full-finetune/Loss (Raw)": 0.6335943341255188, "Full-finetune/Step": 3518, "Full-finetune/Step Time": 6.7029558550566435} {"Full-finetune/Learning Rate": 4.989213881429211e-06, "Full-finetune/Loss": 0.7646948099136353, "Full-finetune/Loss (Raw)": 0.6817659735679626, "Full-finetune/Step": 3519, "Full-finetune/Step Time": 6.727273847907782} {"Full-finetune/Learning Rate": 4.983823737979933e-06, "Full-finetune/Loss": 0.7646779417991638, "Full-finetune/Loss (Raw)": 0.7532236576080322, "Full-finetune/Step": 3520, "Full-finetune/Step Time": 6.7294273022562265} {"Full-finetune/Learning Rate": 4.97843554121073e-06, "Full-finetune/Loss": 0.7646466493606567, "Full-finetune/Loss (Raw)": 0.8833425045013428, "Full-finetune/Step": 3521, "Full-finetune/Step Time": 6.730291239917278} {"Full-finetune/Learning Rate": 4.973049293212655e-06, "Full-finetune/Loss": 0.7639515399932861, "Full-finetune/Loss (Raw)": 0.6358982920646667, "Full-finetune/Step": 3522, "Full-finetune/Step Time": 6.726790893822908} {"Full-finetune/Learning Rate": 4.967664996076007e-06, "Full-finetune/Loss": 0.7619606256484985, "Full-finetune/Loss (Raw)": 0.6219173073768616, "Full-finetune/Step": 3523, "Full-finetune/Step Time": 6.752123534679413} {"Full-finetune/Learning Rate": 4.962282651890325e-06, "Full-finetune/Loss": 0.7620143890380859, "Full-finetune/Loss (Raw)": 0.6720632910728455, "Full-finetune/Step": 3524, "Full-finetune/Step Time": 6.761896466836333} {"Full-finetune/Learning Rate": 4.9569022627443944e-06, "Full-finetune/Loss": 0.763799786567688, "Full-finetune/Loss (Raw)": 0.984665036201477, "Full-finetune/Step": 3525, "Full-finetune/Step Time": 6.765632279217243} {"Full-finetune/Learning Rate": 4.951523830726236e-06, "Full-finetune/Loss": 0.762497067451477, "Full-finetune/Loss (Raw)": 0.6566567420959473, "Full-finetune/Step": 3526, "Full-finetune/Step Time": 6.774328511208296} {"Full-finetune/Learning Rate": 4.946147357923116e-06, "Full-finetune/Loss": 0.7626755237579346, "Full-finetune/Loss (Raw)": 0.7949368357658386, "Full-finetune/Step": 3527, "Full-finetune/Step Time": 6.772986721247435} {"Full-finetune/Learning Rate": 4.940772846421538e-06, "Full-finetune/Loss": 0.7627347111701965, "Full-finetune/Loss (Raw)": 0.7801293730735779, "Full-finetune/Step": 3528, "Full-finetune/Step Time": 6.773155948147178} {"Full-finetune/Learning Rate": 4.935400298307241e-06, "Full-finetune/Loss": 0.7620232105255127, "Full-finetune/Loss (Raw)": 0.6282640099525452, "Full-finetune/Step": 3529, "Full-finetune/Step Time": 6.783503605052829} {"Full-finetune/Learning Rate": 4.930029715665215e-06, "Full-finetune/Loss": 0.7619595527648926, "Full-finetune/Loss (Raw)": 0.7650931477546692, "Full-finetune/Step": 3530, "Full-finetune/Step Time": 6.785895671695471} {"Full-finetune/Learning Rate": 4.9246611005796776e-06, "Full-finetune/Loss": 0.7627975344657898, "Full-finetune/Loss (Raw)": 0.8561518788337708, "Full-finetune/Step": 3531, "Full-finetune/Step Time": 6.78540800511837} {"Full-finetune/Learning Rate": 4.919294455134071e-06, "Full-finetune/Loss": 0.762092649936676, "Full-finetune/Loss (Raw)": 0.6703221201896667, "Full-finetune/Step": 3532, "Full-finetune/Step Time": 6.797685950994492} {"Full-finetune/Learning Rate": 4.913929781411099e-06, "Full-finetune/Loss": 0.759993314743042, "Full-finetune/Loss (Raw)": 0.3195193409919739, "Full-finetune/Step": 3533, "Full-finetune/Step Time": 6.77849405631423} {"Full-finetune/Learning Rate": 4.90856708149268e-06, "Full-finetune/Loss": 0.7598546147346497, "Full-finetune/Loss (Raw)": 0.8288218379020691, "Full-finetune/Step": 3534, "Full-finetune/Step Time": 6.786309398710728} {"Full-finetune/Learning Rate": 4.903206357459976e-06, "Full-finetune/Loss": 0.7559391260147095, "Full-finetune/Loss (Raw)": 0.33091822266578674, "Full-finetune/Step": 3535, "Full-finetune/Step Time": 6.804920768365264} {"Full-finetune/Learning Rate": 4.897847611393378e-06, "Full-finetune/Loss": 0.7553700804710388, "Full-finetune/Loss (Raw)": 0.7697346210479736, "Full-finetune/Step": 3536, "Full-finetune/Step Time": 6.802143730223179} {"Full-finetune/Learning Rate": 4.892490845372511e-06, "Full-finetune/Loss": 0.7563645839691162, "Full-finetune/Loss (Raw)": 0.9630916714668274, "Full-finetune/Step": 3537, "Full-finetune/Step Time": 6.81009410135448} {"Full-finetune/Learning Rate": 4.8871360614762295e-06, "Full-finetune/Loss": 0.7580331563949585, "Full-finetune/Loss (Raw)": 0.9079259037971497, "Full-finetune/Step": 3538, "Full-finetune/Step Time": 6.811877416446805} {"Full-finetune/Learning Rate": 4.881783261782621e-06, "Full-finetune/Loss": 0.7576549649238586, "Full-finetune/Loss (Raw)": 0.8819915056228638, "Full-finetune/Step": 3539, "Full-finetune/Step Time": 6.815002351999283} {"Full-finetune/Learning Rate": 4.876432448369006e-06, "Full-finetune/Loss": 0.7575162649154663, "Full-finetune/Loss (Raw)": 0.8207290172576904, "Full-finetune/Step": 3540, "Full-finetune/Step Time": 6.829281760379672} {"Full-finetune/Learning Rate": 4.871083623311933e-06, "Full-finetune/Loss": 0.7566640377044678, "Full-finetune/Loss (Raw)": 0.8124576807022095, "Full-finetune/Step": 3541, "Full-finetune/Step Time": 6.819427199661732} {"Full-finetune/Learning Rate": 4.865736788687164e-06, "Full-finetune/Loss": 0.7547784447669983, "Full-finetune/Loss (Raw)": 0.6843110918998718, "Full-finetune/Step": 3542, "Full-finetune/Step Time": 6.838434072211385} {"Full-finetune/Learning Rate": 4.860391946569714e-06, "Full-finetune/Loss": 0.7555375099182129, "Full-finetune/Loss (Raw)": 0.7627747058868408, "Full-finetune/Step": 3543, "Full-finetune/Step Time": 6.850575469434261} {"Full-finetune/Learning Rate": 4.855049099033806e-06, "Full-finetune/Loss": 0.7588158249855042, "Full-finetune/Loss (Raw)": 0.8418452143669128, "Full-finetune/Step": 3544, "Full-finetune/Step Time": 6.831013802438974} {"Full-finetune/Learning Rate": 4.849708248152897e-06, "Full-finetune/Loss": 0.7563185691833496, "Full-finetune/Loss (Raw)": 0.4170371890068054, "Full-finetune/Step": 3545, "Full-finetune/Step Time": 6.833850771188736} {"Full-finetune/Learning Rate": 4.8443693959996655e-06, "Full-finetune/Loss": 0.7556167840957642, "Full-finetune/Loss (Raw)": 0.7261949181556702, "Full-finetune/Step": 3546, "Full-finetune/Step Time": 6.82996896840632} {"Full-finetune/Learning Rate": 4.839032544646016e-06, "Full-finetune/Loss": 0.7563991546630859, "Full-finetune/Loss (Raw)": 0.9133340716362, "Full-finetune/Step": 3547, "Full-finetune/Step Time": 6.826830560341477} {"Full-finetune/Learning Rate": 4.833697696163077e-06, "Full-finetune/Loss": 0.7582127451896667, "Full-finetune/Loss (Raw)": 0.7573204636573792, "Full-finetune/Step": 3548, "Full-finetune/Step Time": 6.803986053913832} {"Full-finetune/Learning Rate": 4.828364852621195e-06, "Full-finetune/Loss": 0.7587406635284424, "Full-finetune/Loss (Raw)": 0.92641681432724, "Full-finetune/Step": 3549, "Full-finetune/Step Time": 6.802550479769707} {"Full-finetune/Learning Rate": 4.823034016089949e-06, "Full-finetune/Loss": 0.7560014724731445, "Full-finetune/Loss (Raw)": 0.33902984857559204, "Full-finetune/Step": 3550, "Full-finetune/Step Time": 6.800144638866186} {"Full-finetune/Learning Rate": 4.8177051886381345e-06, "Full-finetune/Loss": 0.7555137872695923, "Full-finetune/Loss (Raw)": 0.6920244693756104, "Full-finetune/Step": 3551, "Full-finetune/Step Time": 6.817378418520093} {"Full-finetune/Learning Rate": 4.812378372333751e-06, "Full-finetune/Loss": 0.7592383623123169, "Full-finetune/Loss (Raw)": 0.8223828673362732, "Full-finetune/Step": 3552, "Full-finetune/Step Time": 6.795826900750399} {"Full-finetune/Learning Rate": 4.807053569244047e-06, "Full-finetune/Loss": 0.7581712603569031, "Full-finetune/Loss (Raw)": 0.6356861591339111, "Full-finetune/Step": 3553, "Full-finetune/Step Time": 6.802867215126753} {"Full-finetune/Learning Rate": 4.801730781435469e-06, "Full-finetune/Loss": 0.7600958347320557, "Full-finetune/Loss (Raw)": 0.9093735218048096, "Full-finetune/Step": 3554, "Full-finetune/Step Time": 6.805515486747026} {"Full-finetune/Learning Rate": 4.796410010973686e-06, "Full-finetune/Loss": 0.760854959487915, "Full-finetune/Loss (Raw)": 0.9307523965835571, "Full-finetune/Step": 3555, "Full-finetune/Step Time": 6.802953999489546} {"Full-finetune/Learning Rate": 4.791091259923587e-06, "Full-finetune/Loss": 0.7576095461845398, "Full-finetune/Loss (Raw)": 0.3390781879425049, "Full-finetune/Step": 3556, "Full-finetune/Step Time": 6.802929615601897} {"Full-finetune/Learning Rate": 4.785774530349275e-06, "Full-finetune/Loss": 0.75859534740448, "Full-finetune/Loss (Raw)": 0.9741950631141663, "Full-finetune/Step": 3557, "Full-finetune/Step Time": 6.801241358742118} {"Full-finetune/Learning Rate": 4.7804598243140664e-06, "Full-finetune/Loss": 0.7597347497940063, "Full-finetune/Loss (Raw)": 0.7991799116134644, "Full-finetune/Step": 3558, "Full-finetune/Step Time": 6.802244555205107} {"Full-finetune/Learning Rate": 4.775147143880496e-06, "Full-finetune/Loss": 0.75910484790802, "Full-finetune/Loss (Raw)": 0.8467104434967041, "Full-finetune/Step": 3559, "Full-finetune/Step Time": 6.800637507811189} {"Full-finetune/Learning Rate": 4.769836491110314e-06, "Full-finetune/Loss": 0.7610477209091187, "Full-finetune/Loss (Raw)": 0.8863856792449951, "Full-finetune/Step": 3560, "Full-finetune/Step Time": 6.784530032426119} {"Full-finetune/Learning Rate": 4.764527868064484e-06, "Full-finetune/Loss": 0.7623471021652222, "Full-finetune/Loss (Raw)": 0.9596746563911438, "Full-finetune/Step": 3561, "Full-finetune/Step Time": 6.768109867349267} {"Full-finetune/Learning Rate": 4.759221276803172e-06, "Full-finetune/Loss": 0.7618930339813232, "Full-finetune/Loss (Raw)": 0.6296648383140564, "Full-finetune/Step": 3562, "Full-finetune/Step Time": 6.743463518097997} {"Full-finetune/Learning Rate": 4.75391671938576e-06, "Full-finetune/Loss": 0.761443018913269, "Full-finetune/Loss (Raw)": 0.6722507476806641, "Full-finetune/Step": 3563, "Full-finetune/Step Time": 6.729512467980385} {"Full-finetune/Learning Rate": 4.748614197870852e-06, "Full-finetune/Loss": 0.7619284391403198, "Full-finetune/Loss (Raw)": 0.7725927233695984, "Full-finetune/Step": 3564, "Full-finetune/Step Time": 6.732725227251649} {"Full-finetune/Learning Rate": 4.743313714316249e-06, "Full-finetune/Loss": 0.7616307735443115, "Full-finetune/Loss (Raw)": 0.7609931230545044, "Full-finetune/Step": 3565, "Full-finetune/Step Time": 6.735372485592961} {"Full-finetune/Learning Rate": 4.738015270778965e-06, "Full-finetune/Loss": 0.7629945278167725, "Full-finetune/Loss (Raw)": 0.8904417753219604, "Full-finetune/Step": 3566, "Full-finetune/Step Time": 6.734600618481636} {"Full-finetune/Learning Rate": 4.7327188693152235e-06, "Full-finetune/Loss": 0.7628616690635681, "Full-finetune/Loss (Raw)": 0.8007848262786865, "Full-finetune/Step": 3567, "Full-finetune/Step Time": 6.738638469949365} {"Full-finetune/Learning Rate": 4.727424511980453e-06, "Full-finetune/Loss": 0.7636322975158691, "Full-finetune/Loss (Raw)": 0.810457170009613, "Full-finetune/Step": 3568, "Full-finetune/Step Time": 6.7436267249286175} {"Full-finetune/Learning Rate": 4.722132200829291e-06, "Full-finetune/Loss": 0.7646243572235107, "Full-finetune/Loss (Raw)": 0.7478029727935791, "Full-finetune/Step": 3569, "Full-finetune/Step Time": 6.7311953492462635} {"Full-finetune/Learning Rate": 4.716841937915582e-06, "Full-finetune/Loss": 0.7647988200187683, "Full-finetune/Loss (Raw)": 0.7529171109199524, "Full-finetune/Step": 3570, "Full-finetune/Step Time": 6.72510802000761} {"Full-finetune/Learning Rate": 4.71155372529237e-06, "Full-finetune/Loss": 0.765520453453064, "Full-finetune/Loss (Raw)": 0.8112924695014954, "Full-finetune/Step": 3571, "Full-finetune/Step Time": 6.717546423897147} {"Full-finetune/Learning Rate": 4.706267565011909e-06, "Full-finetune/Loss": 0.7659969329833984, "Full-finetune/Loss (Raw)": 0.8860897421836853, "Full-finetune/Step": 3572, "Full-finetune/Step Time": 6.718780290335417} {"Full-finetune/Learning Rate": 4.700983459125652e-06, "Full-finetune/Loss": 0.7683325409889221, "Full-finetune/Loss (Raw)": 0.8711573481559753, "Full-finetune/Step": 3573, "Full-finetune/Step Time": 6.700645675882697} {"Full-finetune/Learning Rate": 4.695701409684264e-06, "Full-finetune/Loss": 0.7695202827453613, "Full-finetune/Loss (Raw)": 0.8956469297409058, "Full-finetune/Step": 3574, "Full-finetune/Step Time": 6.69882557541132} {"Full-finetune/Learning Rate": 4.690421418737604e-06, "Full-finetune/Loss": 0.7686271667480469, "Full-finetune/Loss (Raw)": 0.7858780026435852, "Full-finetune/Step": 3575, "Full-finetune/Step Time": 6.700075117871165} {"Full-finetune/Learning Rate": 4.685143488334723e-06, "Full-finetune/Loss": 0.7698183059692383, "Full-finetune/Loss (Raw)": 0.8875090479850769, "Full-finetune/Step": 3576, "Full-finetune/Step Time": 6.697896171361208} {"Full-finetune/Learning Rate": 4.679867620523895e-06, "Full-finetune/Loss": 0.7690197229385376, "Full-finetune/Loss (Raw)": 0.7978196144104004, "Full-finetune/Step": 3577, "Full-finetune/Step Time": 6.716207671910524} {"Full-finetune/Learning Rate": 4.674593817352575e-06, "Full-finetune/Loss": 0.7696526646614075, "Full-finetune/Loss (Raw)": 0.8575206398963928, "Full-finetune/Step": 3578, "Full-finetune/Step Time": 6.701008630916476} {"Full-finetune/Learning Rate": 4.669322080867427e-06, "Full-finetune/Loss": 0.7699940204620361, "Full-finetune/Loss (Raw)": 0.8328632712364197, "Full-finetune/Step": 3579, "Full-finetune/Step Time": 6.701912231743336} {"Full-finetune/Learning Rate": 4.664052413114305e-06, "Full-finetune/Loss": 0.7696465253829956, "Full-finetune/Loss (Raw)": 0.8360815644264221, "Full-finetune/Step": 3580, "Full-finetune/Step Time": 6.70947028696537} {"Full-finetune/Learning Rate": 4.658784816138266e-06, "Full-finetune/Loss": 0.7702289819717407, "Full-finetune/Loss (Raw)": 0.8702932000160217, "Full-finetune/Step": 3581, "Full-finetune/Step Time": 6.7195413783192635} {"Full-finetune/Learning Rate": 4.653519291983561e-06, "Full-finetune/Loss": 0.7698192596435547, "Full-finetune/Loss (Raw)": 0.6967042684555054, "Full-finetune/Step": 3582, "Full-finetune/Step Time": 6.7211623303592205} {"Full-finetune/Learning Rate": 4.648255842693635e-06, "Full-finetune/Loss": 0.772948682308197, "Full-finetune/Loss (Raw)": 0.7397739887237549, "Full-finetune/Step": 3583, "Full-finetune/Step Time": 6.703498279675841} {"Full-finetune/Learning Rate": 4.642994470311136e-06, "Full-finetune/Loss": 0.7725733518600464, "Full-finetune/Loss (Raw)": 0.811872661113739, "Full-finetune/Step": 3584, "Full-finetune/Step Time": 6.705346092581749} {"Full-finetune/Learning Rate": 4.6377351768779e-06, "Full-finetune/Loss": 0.7733070254325867, "Full-finetune/Loss (Raw)": 0.9403219223022461, "Full-finetune/Step": 3585, "Full-finetune/Step Time": 6.705099586397409} {"Full-finetune/Learning Rate": 4.632477964434944e-06, "Full-finetune/Loss": 0.7721112966537476, "Full-finetune/Loss (Raw)": 0.662173330783844, "Full-finetune/Step": 3586, "Full-finetune/Step Time": 6.702266527339816} {"Full-finetune/Learning Rate": 4.6272228350225026e-06, "Full-finetune/Loss": 0.7714707255363464, "Full-finetune/Loss (Raw)": 0.7396020293235779, "Full-finetune/Step": 3587, "Full-finetune/Step Time": 6.704724816605449} {"Full-finetune/Learning Rate": 4.621969790679984e-06, "Full-finetune/Loss": 0.7695251703262329, "Full-finetune/Loss (Raw)": 0.6506801843643188, "Full-finetune/Step": 3588, "Full-finetune/Step Time": 6.705238156020641} {"Full-finetune/Learning Rate": 4.6167188334459936e-06, "Full-finetune/Loss": 0.7728928923606873, "Full-finetune/Loss (Raw)": 0.7687704563140869, "Full-finetune/Step": 3589, "Full-finetune/Step Time": 6.704511418938637} {"Full-finetune/Learning Rate": 4.611469965358323e-06, "Full-finetune/Loss": 0.7733428478240967, "Full-finetune/Loss (Raw)": 0.8581945896148682, "Full-finetune/Step": 3590, "Full-finetune/Step Time": 6.7077708169817924} {"Full-finetune/Learning Rate": 4.606223188453956e-06, "Full-finetune/Loss": 0.773000955581665, "Full-finetune/Loss (Raw)": 0.720645546913147, "Full-finetune/Step": 3591, "Full-finetune/Step Time": 6.716080337762833} {"Full-finetune/Learning Rate": 4.6009785047690666e-06, "Full-finetune/Loss": 0.772042989730835, "Full-finetune/Loss (Raw)": 0.7775010466575623, "Full-finetune/Step": 3592, "Full-finetune/Step Time": 6.721398802474141} {"Full-finetune/Learning Rate": 4.595735916339008e-06, "Full-finetune/Loss": 0.7735008001327515, "Full-finetune/Loss (Raw)": 0.911953330039978, "Full-finetune/Step": 3593, "Full-finetune/Step Time": 6.717238342389464} {"Full-finetune/Learning Rate": 4.590495425198335e-06, "Full-finetune/Loss": 0.7724305391311646, "Full-finetune/Loss (Raw)": 0.54458087682724, "Full-finetune/Step": 3594, "Full-finetune/Step Time": 6.723504533991218} {"Full-finetune/Learning Rate": 4.585257033380779e-06, "Full-finetune/Loss": 0.7737212181091309, "Full-finetune/Loss (Raw)": 0.8223543167114258, "Full-finetune/Step": 3595, "Full-finetune/Step Time": 6.734547728672624} {"Full-finetune/Learning Rate": 4.580020742919247e-06, "Full-finetune/Loss": 0.7762680053710938, "Full-finetune/Loss (Raw)": 0.964371383190155, "Full-finetune/Step": 3596, "Full-finetune/Step Time": 6.720477439463139} {"Full-finetune/Learning Rate": 4.5747865558458524e-06, "Full-finetune/Loss": 0.7726273536682129, "Full-finetune/Loss (Raw)": 0.24817411601543427, "Full-finetune/Step": 3597, "Full-finetune/Step Time": 6.727808699011803} {"Full-finetune/Learning Rate": 4.569554474191878e-06, "Full-finetune/Loss": 0.7724018692970276, "Full-finetune/Loss (Raw)": 0.7371729016304016, "Full-finetune/Step": 3598, "Full-finetune/Step Time": 6.741469364613295} {"Full-finetune/Learning Rate": 4.56432449998779e-06, "Full-finetune/Loss": 0.7710349559783936, "Full-finetune/Loss (Raw)": 0.6867566108703613, "Full-finetune/Step": 3599, "Full-finetune/Step Time": 6.733712203800678} {"Full-finetune/Learning Rate": 4.559096635263242e-06, "Full-finetune/Loss": 0.7686490416526794, "Full-finetune/Loss (Raw)": 0.43520790338516235, "Full-finetune/Step": 3600, "Full-finetune/Step Time": 6.744734248146415} {"Full-finetune/Learning Rate": 4.553870882047064e-06, "Full-finetune/Loss": 0.7684828042984009, "Full-finetune/Loss (Raw)": 0.8394473791122437, "Full-finetune/Step": 3601, "Full-finetune/Step Time": 6.72757282666862} {"Full-finetune/Learning Rate": 4.548647242367271e-06, "Full-finetune/Loss": 0.7694185972213745, "Full-finetune/Loss (Raw)": 0.784252405166626, "Full-finetune/Step": 3602, "Full-finetune/Step Time": 6.711986133828759} {"Full-finetune/Learning Rate": 4.543425718251051e-06, "Full-finetune/Loss": 0.7692905068397522, "Full-finetune/Loss (Raw)": 0.7951821088790894, "Full-finetune/Step": 3603, "Full-finetune/Step Time": 6.710841912776232} {"Full-finetune/Learning Rate": 4.538206311724782e-06, "Full-finetune/Loss": 0.7708145976066589, "Full-finetune/Loss (Raw)": 0.8253605961799622, "Full-finetune/Step": 3604, "Full-finetune/Step Time": 6.697389714419842} {"Full-finetune/Learning Rate": 4.532989024814015e-06, "Full-finetune/Loss": 0.7700309157371521, "Full-finetune/Loss (Raw)": 0.639229953289032, "Full-finetune/Step": 3605, "Full-finetune/Step Time": 6.68407173268497} {"Full-finetune/Learning Rate": 4.527773859543466e-06, "Full-finetune/Loss": 0.7683457732200623, "Full-finetune/Loss (Raw)": 0.7245039939880371, "Full-finetune/Step": 3606, "Full-finetune/Step Time": 6.696401339024305} {"Full-finetune/Learning Rate": 4.52256081793705e-06, "Full-finetune/Loss": 0.7666588425636292, "Full-finetune/Loss (Raw)": 0.8034185767173767, "Full-finetune/Step": 3607, "Full-finetune/Step Time": 6.7002195585519075} {"Full-finetune/Learning Rate": 4.517349902017841e-06, "Full-finetune/Loss": 0.7649986743927002, "Full-finetune/Loss (Raw)": 0.6297667026519775, "Full-finetune/Step": 3608, "Full-finetune/Step Time": 6.727902734652162} {"Full-finetune/Learning Rate": 4.512141113808097e-06, "Full-finetune/Loss": 0.764245867729187, "Full-finetune/Loss (Raw)": 0.7515461444854736, "Full-finetune/Step": 3609, "Full-finetune/Step Time": 6.729419682174921} {"Full-finetune/Learning Rate": 4.5069344553292436e-06, "Full-finetune/Loss": 0.7635810375213623, "Full-finetune/Loss (Raw)": 0.678720235824585, "Full-finetune/Step": 3610, "Full-finetune/Step Time": 6.729397898539901} {"Full-finetune/Learning Rate": 4.501729928601887e-06, "Full-finetune/Loss": 0.7603868246078491, "Full-finetune/Loss (Raw)": 0.3317328691482544, "Full-finetune/Step": 3611, "Full-finetune/Step Time": 6.710616547614336} {"Full-finetune/Learning Rate": 4.4965275356458e-06, "Full-finetune/Loss": 0.7606444358825684, "Full-finetune/Loss (Raw)": 0.7828381061553955, "Full-finetune/Step": 3612, "Full-finetune/Step Time": 6.709286021068692} {"Full-finetune/Learning Rate": 4.491327278479924e-06, "Full-finetune/Loss": 0.7586740255355835, "Full-finetune/Loss (Raw)": 0.6827977299690247, "Full-finetune/Step": 3613, "Full-finetune/Step Time": 6.7107949536293745} {"Full-finetune/Learning Rate": 4.4861291591223934e-06, "Full-finetune/Loss": 0.7584700584411621, "Full-finetune/Loss (Raw)": 0.7833897471427917, "Full-finetune/Step": 3614, "Full-finetune/Step Time": 6.705512324348092} {"Full-finetune/Learning Rate": 4.4809331795904835e-06, "Full-finetune/Loss": 0.7593523263931274, "Full-finetune/Loss (Raw)": 0.8325234651565552, "Full-finetune/Step": 3615, "Full-finetune/Step Time": 6.711237125098705} {"Full-finetune/Learning Rate": 4.47573934190065e-06, "Full-finetune/Loss": 0.7594050765037537, "Full-finetune/Loss (Raw)": 0.6861422657966614, "Full-finetune/Step": 3616, "Full-finetune/Step Time": 6.7154777105897665} {"Full-finetune/Learning Rate": 4.470547648068532e-06, "Full-finetune/Loss": 0.7582029104232788, "Full-finetune/Loss (Raw)": 0.7182866334915161, "Full-finetune/Step": 3617, "Full-finetune/Step Time": 6.7245420552790165} {"Full-finetune/Learning Rate": 4.465358100108916e-06, "Full-finetune/Loss": 0.7578662633895874, "Full-finetune/Loss (Raw)": 0.6723234057426453, "Full-finetune/Step": 3618, "Full-finetune/Step Time": 6.733682546764612} {"Full-finetune/Learning Rate": 4.460170700035769e-06, "Full-finetune/Loss": 0.756697952747345, "Full-finetune/Loss (Raw)": 0.7551421523094177, "Full-finetune/Step": 3619, "Full-finetune/Step Time": 6.7327934969216585} {"Full-finetune/Learning Rate": 4.454985449862215e-06, "Full-finetune/Loss": 0.7566173076629639, "Full-finetune/Loss (Raw)": 0.7863214015960693, "Full-finetune/Step": 3620, "Full-finetune/Step Time": 6.723512368276715} {"Full-finetune/Learning Rate": 4.449802351600551e-06, "Full-finetune/Loss": 0.7584244012832642, "Full-finetune/Loss (Raw)": 0.7280045747756958, "Full-finetune/Step": 3621, "Full-finetune/Step Time": 6.718270713463426} {"Full-finetune/Learning Rate": 4.444621407262237e-06, "Full-finetune/Loss": 0.7573176622390747, "Full-finetune/Loss (Raw)": 0.7842732667922974, "Full-finetune/Step": 3622, "Full-finetune/Step Time": 6.717600770294666} {"Full-finetune/Learning Rate": 4.439442618857891e-06, "Full-finetune/Loss": 0.7571722269058228, "Full-finetune/Loss (Raw)": 0.8290918469429016, "Full-finetune/Step": 3623, "Full-finetune/Step Time": 6.719473654404283} {"Full-finetune/Learning Rate": 4.434265988397312e-06, "Full-finetune/Loss": 0.7573856115341187, "Full-finetune/Loss (Raw)": 0.8868021368980408, "Full-finetune/Step": 3624, "Full-finetune/Step Time": 6.713913977146149} {"Full-finetune/Learning Rate": 4.4290915178894355e-06, "Full-finetune/Loss": 0.7593947649002075, "Full-finetune/Loss (Raw)": 0.8804558515548706, "Full-finetune/Step": 3625, "Full-finetune/Step Time": 6.705746615305543} {"Full-finetune/Learning Rate": 4.423919209342376e-06, "Full-finetune/Loss": 0.7577976584434509, "Full-finetune/Loss (Raw)": 0.6677534580230713, "Full-finetune/Step": 3626, "Full-finetune/Step Time": 6.70281857252121} {"Full-finetune/Learning Rate": 4.41874906476341e-06, "Full-finetune/Loss": 0.7583146691322327, "Full-finetune/Loss (Raw)": 0.8540384769439697, "Full-finetune/Step": 3627, "Full-finetune/Step Time": 6.717937085777521} {"Full-finetune/Learning Rate": 4.413581086158969e-06, "Full-finetune/Loss": 0.7575571537017822, "Full-finetune/Loss (Raw)": 0.8026832938194275, "Full-finetune/Step": 3628, "Full-finetune/Step Time": 6.724728401750326} {"Full-finetune/Learning Rate": 4.408415275534641e-06, "Full-finetune/Loss": 0.7567660808563232, "Full-finetune/Loss (Raw)": 0.7616038918495178, "Full-finetune/Step": 3629, "Full-finetune/Step Time": 6.731795800849795} {"Full-finetune/Learning Rate": 4.4032516348951795e-06, "Full-finetune/Loss": 0.7548823356628418, "Full-finetune/Loss (Raw)": 0.7040696740150452, "Full-finetune/Step": 3630, "Full-finetune/Step Time": 6.732589842751622} {"Full-finetune/Learning Rate": 4.3980901662444905e-06, "Full-finetune/Loss": 0.7530471086502075, "Full-finetune/Loss (Raw)": 0.633728563785553, "Full-finetune/Step": 3631, "Full-finetune/Step Time": 6.74699779972434} {"Full-finetune/Learning Rate": 4.39293087158564e-06, "Full-finetune/Loss": 0.7540535926818848, "Full-finetune/Loss (Raw)": 0.8837077021598816, "Full-finetune/Step": 3632, "Full-finetune/Step Time": 6.750012429431081} {"Full-finetune/Learning Rate": 4.387773752920845e-06, "Full-finetune/Loss": 0.7547891139984131, "Full-finetune/Loss (Raw)": 0.8784229159355164, "Full-finetune/Step": 3633, "Full-finetune/Step Time": 6.744529468938708} {"Full-finetune/Learning Rate": 4.382618812251495e-06, "Full-finetune/Loss": 0.7550662755966187, "Full-finetune/Loss (Raw)": 0.7783691883087158, "Full-finetune/Step": 3634, "Full-finetune/Step Time": 6.73772587813437} {"Full-finetune/Learning Rate": 4.377466051578111e-06, "Full-finetune/Loss": 0.7556571364402771, "Full-finetune/Loss (Raw)": 0.6682001352310181, "Full-finetune/Step": 3635, "Full-finetune/Step Time": 6.722161104902625} {"Full-finetune/Learning Rate": 4.372315472900377e-06, "Full-finetune/Loss": 0.7559112906455994, "Full-finetune/Loss (Raw)": 0.8235912322998047, "Full-finetune/Step": 3636, "Full-finetune/Step Time": 6.721538307145238} {"Full-finetune/Learning Rate": 4.367167078217141e-06, "Full-finetune/Loss": 0.7566743493080139, "Full-finetune/Loss (Raw)": 0.852300226688385, "Full-finetune/Step": 3637, "Full-finetune/Step Time": 6.717465879395604} {"Full-finetune/Learning Rate": 4.36202086952639e-06, "Full-finetune/Loss": 0.7574149966239929, "Full-finetune/Loss (Raw)": 0.8290643095970154, "Full-finetune/Step": 3638, "Full-finetune/Step Time": 6.715359140187502} {"Full-finetune/Learning Rate": 4.356876848825266e-06, "Full-finetune/Loss": 0.7582145929336548, "Full-finetune/Loss (Raw)": 0.8164319396018982, "Full-finetune/Step": 3639, "Full-finetune/Step Time": 6.704504678025842} {"Full-finetune/Learning Rate": 4.351735018110066e-06, "Full-finetune/Loss": 0.7545220851898193, "Full-finetune/Loss (Raw)": 0.3014260232448578, "Full-finetune/Step": 3640, "Full-finetune/Step Time": 6.723624147474766} {"Full-finetune/Learning Rate": 4.346595379376232e-06, "Full-finetune/Loss": 0.7535679340362549, "Full-finetune/Loss (Raw)": 0.7283214926719666, "Full-finetune/Step": 3641, "Full-finetune/Step Time": 6.726813681423664} {"Full-finetune/Learning Rate": 4.341457934618357e-06, "Full-finetune/Loss": 0.7541474103927612, "Full-finetune/Loss (Raw)": 0.8099214434623718, "Full-finetune/Step": 3642, "Full-finetune/Step Time": 6.729501321911812} {"Full-finetune/Learning Rate": 4.336322685830181e-06, "Full-finetune/Loss": 0.7544985413551331, "Full-finetune/Loss (Raw)": 0.8371404409408569, "Full-finetune/Step": 3643, "Full-finetune/Step Time": 6.722797667607665} {"Full-finetune/Learning Rate": 4.331189635004604e-06, "Full-finetune/Loss": 0.7543677091598511, "Full-finetune/Loss (Raw)": 0.7775039076805115, "Full-finetune/Step": 3644, "Full-finetune/Step Time": 6.720224840566516} {"Full-finetune/Learning Rate": 4.326058784133652e-06, "Full-finetune/Loss": 0.7537858486175537, "Full-finetune/Loss (Raw)": 0.7609624862670898, "Full-finetune/Step": 3645, "Full-finetune/Step Time": 6.719190644100308} {"Full-finetune/Learning Rate": 4.3209301352085075e-06, "Full-finetune/Loss": 0.75547856092453, "Full-finetune/Loss (Raw)": 0.8502622842788696, "Full-finetune/Step": 3646, "Full-finetune/Step Time": 6.703874198719859} {"Full-finetune/Learning Rate": 4.315803690219507e-06, "Full-finetune/Loss": 0.7567042708396912, "Full-finetune/Loss (Raw)": 0.8386643528938293, "Full-finetune/Step": 3647, "Full-finetune/Step Time": 6.681702198460698} {"Full-finetune/Learning Rate": 4.310679451156122e-06, "Full-finetune/Loss": 0.7577768564224243, "Full-finetune/Loss (Raw)": 0.8905121684074402, "Full-finetune/Step": 3648, "Full-finetune/Step Time": 6.683210097253323} {"Full-finetune/Learning Rate": 4.305557420006962e-06, "Full-finetune/Loss": 0.7577669024467468, "Full-finetune/Loss (Raw)": 0.8820672631263733, "Full-finetune/Step": 3649, "Full-finetune/Step Time": 6.698112241923809} {"Full-finetune/Learning Rate": 4.300437598759794e-06, "Full-finetune/Loss": 0.760189414024353, "Full-finetune/Loss (Raw)": 0.9459851384162903, "Full-finetune/Step": 3650, "Full-finetune/Step Time": 6.677822522819042} {"Full-finetune/Learning Rate": 4.295319989401522e-06, "Full-finetune/Loss": 0.7604734897613525, "Full-finetune/Loss (Raw)": 0.6582770943641663, "Full-finetune/Step": 3651, "Full-finetune/Step Time": 6.67704856954515} {"Full-finetune/Learning Rate": 4.2902045939181855e-06, "Full-finetune/Loss": 0.7616075277328491, "Full-finetune/Loss (Raw)": 0.8172101378440857, "Full-finetune/Step": 3652, "Full-finetune/Step Time": 6.669281298294663} {"Full-finetune/Learning Rate": 4.285091414294973e-06, "Full-finetune/Loss": 0.7608444094657898, "Full-finetune/Loss (Raw)": 0.8869956731796265, "Full-finetune/Step": 3653, "Full-finetune/Step Time": 6.666676364839077} {"Full-finetune/Learning Rate": 4.2799804525162085e-06, "Full-finetune/Loss": 0.7616463899612427, "Full-finetune/Loss (Raw)": 0.7593076825141907, "Full-finetune/Step": 3654, "Full-finetune/Step Time": 6.685377229005098} {"Full-finetune/Learning Rate": 4.274871710565356e-06, "Full-finetune/Loss": 0.7627195119857788, "Full-finetune/Loss (Raw)": 0.9322988390922546, "Full-finetune/Step": 3655, "Full-finetune/Step Time": 6.679297031834722} {"Full-finetune/Learning Rate": 4.269765190425015e-06, "Full-finetune/Loss": 0.7619942426681519, "Full-finetune/Loss (Raw)": 0.687290608882904, "Full-finetune/Step": 3656, "Full-finetune/Step Time": 6.683160996064544} {"Full-finetune/Learning Rate": 4.264660894076934e-06, "Full-finetune/Loss": 0.7634263038635254, "Full-finetune/Loss (Raw)": 0.8115614056587219, "Full-finetune/Step": 3657, "Full-finetune/Step Time": 6.677756166085601} {"Full-finetune/Learning Rate": 4.25955882350199e-06, "Full-finetune/Loss": 0.7634087800979614, "Full-finetune/Loss (Raw)": 0.7628588080406189, "Full-finetune/Step": 3658, "Full-finetune/Step Time": 6.692800952121615} {"Full-finetune/Learning Rate": 4.254458980680188e-06, "Full-finetune/Loss": 0.7630146145820618, "Full-finetune/Loss (Raw)": 0.8056989908218384, "Full-finetune/Step": 3659, "Full-finetune/Step Time": 6.696122728288174} {"Full-finetune/Learning Rate": 4.2493613675906865e-06, "Full-finetune/Loss": 0.7648345232009888, "Full-finetune/Loss (Raw)": 0.9032635688781738, "Full-finetune/Step": 3660, "Full-finetune/Step Time": 6.683095199987292} {"Full-finetune/Learning Rate": 4.244265986211766e-06, "Full-finetune/Loss": 0.7686692476272583, "Full-finetune/Loss (Raw)": 0.8103644251823425, "Full-finetune/Step": 3661, "Full-finetune/Step Time": 6.663189159706235} {"Full-finetune/Learning Rate": 4.239172838520846e-06, "Full-finetune/Loss": 0.7693147659301758, "Full-finetune/Loss (Raw)": 0.9114452004432678, "Full-finetune/Step": 3662, "Full-finetune/Step Time": 6.642712639644742} {"Full-finetune/Learning Rate": 4.2340819264944755e-06, "Full-finetune/Loss": 0.7744749784469604, "Full-finetune/Loss (Raw)": 0.9914358258247375, "Full-finetune/Step": 3663, "Full-finetune/Step Time": 6.622181996703148} {"Full-finetune/Learning Rate": 4.22899325210834e-06, "Full-finetune/Loss": 0.7741786241531372, "Full-finetune/Loss (Raw)": 0.7318019270896912, "Full-finetune/Step": 3664, "Full-finetune/Step Time": 6.63439229875803} {"Full-finetune/Learning Rate": 4.223906817337253e-06, "Full-finetune/Loss": 0.7730798721313477, "Full-finetune/Loss (Raw)": 0.8224474191665649, "Full-finetune/Step": 3665, "Full-finetune/Step Time": 6.625824311748147} {"Full-finetune/Learning Rate": 4.218822624155159e-06, "Full-finetune/Loss": 0.7723835706710815, "Full-finetune/Loss (Raw)": 0.8187952041625977, "Full-finetune/Step": 3666, "Full-finetune/Step Time": 6.621064629405737} {"Full-finetune/Learning Rate": 4.213740674535141e-06, "Full-finetune/Loss": 0.768710732460022, "Full-finetune/Loss (Raw)": 0.41187742352485657, "Full-finetune/Step": 3667, "Full-finetune/Step Time": 6.637598626315594} {"Full-finetune/Learning Rate": 4.2086609704494015e-06, "Full-finetune/Loss": 0.7680960297584534, "Full-finetune/Loss (Raw)": 0.7420431971549988, "Full-finetune/Step": 3668, "Full-finetune/Step Time": 6.617600746452808} {"Full-finetune/Learning Rate": 4.203583513869267e-06, "Full-finetune/Loss": 0.7674517631530762, "Full-finetune/Loss (Raw)": 0.729993462562561, "Full-finetune/Step": 3669, "Full-finetune/Step Time": 6.622959233820438} {"Full-finetune/Learning Rate": 4.198508306765209e-06, "Full-finetune/Loss": 0.7684528827667236, "Full-finetune/Loss (Raw)": 0.8124514818191528, "Full-finetune/Step": 3670, "Full-finetune/Step Time": 6.599353186786175} {"Full-finetune/Learning Rate": 4.193435351106811e-06, "Full-finetune/Loss": 0.7694534063339233, "Full-finetune/Loss (Raw)": 0.8908392190933228, "Full-finetune/Step": 3671, "Full-finetune/Step Time": 6.581645535305142} {"Full-finetune/Learning Rate": 4.188364648862791e-06, "Full-finetune/Loss": 0.7685168385505676, "Full-finetune/Loss (Raw)": 0.7219693064689636, "Full-finetune/Step": 3672, "Full-finetune/Step Time": 6.589813910424709} {"Full-finetune/Learning Rate": 4.183296202000988e-06, "Full-finetune/Loss": 0.7694687843322754, "Full-finetune/Loss (Raw)": 0.5388783812522888, "Full-finetune/Step": 3673, "Full-finetune/Step Time": 6.575715279206634} {"Full-finetune/Learning Rate": 4.178230012488368e-06, "Full-finetune/Loss": 0.7699745297431946, "Full-finetune/Loss (Raw)": 0.7909358143806458, "Full-finetune/Step": 3674, "Full-finetune/Step Time": 6.567561198025942} {"Full-finetune/Learning Rate": 4.173166082291019e-06, "Full-finetune/Loss": 0.7657414674758911, "Full-finetune/Loss (Raw)": 0.37150147557258606, "Full-finetune/Step": 3675, "Full-finetune/Step Time": 6.591404477134347} {"Full-finetune/Learning Rate": 4.16810441337415e-06, "Full-finetune/Loss": 0.7662138938903809, "Full-finetune/Loss (Raw)": 0.8177925944328308, "Full-finetune/Step": 3676, "Full-finetune/Step Time": 6.595337750390172} {"Full-finetune/Learning Rate": 4.163045007702105e-06, "Full-finetune/Loss": 0.7661160230636597, "Full-finetune/Loss (Raw)": 0.9138885736465454, "Full-finetune/Step": 3677, "Full-finetune/Step Time": 6.59533803537488} {"Full-finetune/Learning Rate": 4.157987867238338e-06, "Full-finetune/Loss": 0.7677897214889526, "Full-finetune/Loss (Raw)": 0.5532518029212952, "Full-finetune/Step": 3678, "Full-finetune/Step Time": 6.578116061165929} {"Full-finetune/Learning Rate": 4.152932993945418e-06, "Full-finetune/Loss": 0.7682695984840393, "Full-finetune/Loss (Raw)": 0.7534617781639099, "Full-finetune/Step": 3679, "Full-finetune/Step Time": 6.566549189388752} {"Full-finetune/Learning Rate": 4.147880389785051e-06, "Full-finetune/Loss": 0.7686107158660889, "Full-finetune/Loss (Raw)": 0.8660394549369812, "Full-finetune/Step": 3680, "Full-finetune/Step Time": 6.572848554700613} {"Full-finetune/Learning Rate": 4.142830056718052e-06, "Full-finetune/Loss": 0.7700631022453308, "Full-finetune/Loss (Raw)": 0.8216006755828857, "Full-finetune/Step": 3681, "Full-finetune/Step Time": 6.554449621587992} {"Full-finetune/Learning Rate": 4.137781996704356e-06, "Full-finetune/Loss": 0.7710242867469788, "Full-finetune/Loss (Raw)": 1.0323988199234009, "Full-finetune/Step": 3682, "Full-finetune/Step Time": 6.552258018404245} {"Full-finetune/Learning Rate": 4.1327362117030174e-06, "Full-finetune/Loss": 0.7700749039649963, "Full-finetune/Loss (Raw)": 0.8092350363731384, "Full-finetune/Step": 3683, "Full-finetune/Step Time": 6.5527889132499695} {"Full-finetune/Learning Rate": 4.127692703672207e-06, "Full-finetune/Loss": 0.7718566060066223, "Full-finetune/Loss (Raw)": 0.5671355724334717, "Full-finetune/Step": 3684, "Full-finetune/Step Time": 6.553657673299313} {"Full-finetune/Learning Rate": 4.1226514745692115e-06, "Full-finetune/Loss": 0.7703068852424622, "Full-finetune/Loss (Raw)": 0.7758283615112305, "Full-finetune/Step": 3685, "Full-finetune/Step Time": 6.55007435195148} {"Full-finetune/Learning Rate": 4.117612526350429e-06, "Full-finetune/Loss": 0.7705687880516052, "Full-finetune/Loss (Raw)": 0.8327001929283142, "Full-finetune/Step": 3686, "Full-finetune/Step Time": 6.550533276051283} {"Full-finetune/Learning Rate": 4.112575860971384e-06, "Full-finetune/Loss": 0.7704379558563232, "Full-finetune/Loss (Raw)": 0.8299685120582581, "Full-finetune/Step": 3687, "Full-finetune/Step Time": 6.5488543175160885} {"Full-finetune/Learning Rate": 4.107541480386708e-06, "Full-finetune/Loss": 0.7682948708534241, "Full-finetune/Loss (Raw)": 0.6120738983154297, "Full-finetune/Step": 3688, "Full-finetune/Step Time": 6.558380527421832} {"Full-finetune/Learning Rate": 4.102509386550141e-06, "Full-finetune/Loss": 0.767597496509552, "Full-finetune/Loss (Raw)": 0.8704060316085815, "Full-finetune/Step": 3689, "Full-finetune/Step Time": 6.558432539924979} {"Full-finetune/Learning Rate": 4.0974795814145384e-06, "Full-finetune/Loss": 0.7692975997924805, "Full-finetune/Loss (Raw)": 0.8472834229469299, "Full-finetune/Step": 3690, "Full-finetune/Step Time": 6.562163833528757} {"Full-finetune/Learning Rate": 4.092452066931877e-06, "Full-finetune/Loss": 0.7663829326629639, "Full-finetune/Loss (Raw)": 0.2991713285446167, "Full-finetune/Step": 3691, "Full-finetune/Step Time": 6.580514846369624} {"Full-finetune/Learning Rate": 4.087426845053236e-06, "Full-finetune/Loss": 0.7671710252761841, "Full-finetune/Loss (Raw)": 0.8734702467918396, "Full-finetune/Step": 3692, "Full-finetune/Step Time": 6.574371622875333} {"Full-finetune/Learning Rate": 4.082403917728796e-06, "Full-finetune/Loss": 0.7676199674606323, "Full-finetune/Loss (Raw)": 0.8184566497802734, "Full-finetune/Step": 3693, "Full-finetune/Step Time": 6.574105864390731} {"Full-finetune/Learning Rate": 4.077383286907869e-06, "Full-finetune/Loss": 0.7657556533813477, "Full-finetune/Loss (Raw)": 0.6518065929412842, "Full-finetune/Step": 3694, "Full-finetune/Step Time": 6.598340732976794} {"Full-finetune/Learning Rate": 4.072364954538858e-06, "Full-finetune/Loss": 0.7674816846847534, "Full-finetune/Loss (Raw)": 1.0217210054397583, "Full-finetune/Step": 3695, "Full-finetune/Step Time": 6.577429028227925} {"Full-finetune/Learning Rate": 4.067348922569281e-06, "Full-finetune/Loss": 0.7672548890113831, "Full-finetune/Loss (Raw)": 0.7814254760742188, "Full-finetune/Step": 3696, "Full-finetune/Step Time": 6.570467561483383} {"Full-finetune/Learning Rate": 4.062335192945762e-06, "Full-finetune/Loss": 0.76551353931427, "Full-finetune/Loss (Raw)": 0.524911642074585, "Full-finetune/Step": 3697, "Full-finetune/Step Time": 6.58633947186172} {"Full-finetune/Learning Rate": 4.057323767614032e-06, "Full-finetune/Loss": 0.7660123109817505, "Full-finetune/Loss (Raw)": 0.8167622089385986, "Full-finetune/Step": 3698, "Full-finetune/Step Time": 6.603483570739627} {"Full-finetune/Learning Rate": 4.052314648518925e-06, "Full-finetune/Loss": 0.7659486532211304, "Full-finetune/Loss (Raw)": 0.803142249584198, "Full-finetune/Step": 3699, "Full-finetune/Step Time": 6.6010337714105844} {"Full-finetune/Learning Rate": 4.047307837604383e-06, "Full-finetune/Loss": 0.765458345413208, "Full-finetune/Loss (Raw)": 0.8233259320259094, "Full-finetune/Step": 3700, "Full-finetune/Step Time": 6.602437464520335} {"Full-finetune/Learning Rate": 4.0423033368134545e-06, "Full-finetune/Loss": 0.7635717391967773, "Full-finetune/Loss (Raw)": 0.6296688318252563, "Full-finetune/Step": 3701, "Full-finetune/Step Time": 6.6101849135011435} {"Full-finetune/Learning Rate": 4.037301148088292e-06, "Full-finetune/Loss": 0.7630045413970947, "Full-finetune/Loss (Raw)": 0.8230533599853516, "Full-finetune/Step": 3702, "Full-finetune/Step Time": 6.5989078264683485} {"Full-finetune/Learning Rate": 4.032301273370132e-06, "Full-finetune/Loss": 0.7635084390640259, "Full-finetune/Loss (Raw)": 0.8503708839416504, "Full-finetune/Step": 3703, "Full-finetune/Step Time": 6.596110463142395} {"Full-finetune/Learning Rate": 4.027303714599345e-06, "Full-finetune/Loss": 0.7629389762878418, "Full-finetune/Loss (Raw)": 0.8146204352378845, "Full-finetune/Step": 3704, "Full-finetune/Step Time": 6.611487716436386} {"Full-finetune/Learning Rate": 4.022308473715379e-06, "Full-finetune/Loss": 0.7615182399749756, "Full-finetune/Loss (Raw)": 0.6159643530845642, "Full-finetune/Step": 3705, "Full-finetune/Step Time": 6.592943497002125} {"Full-finetune/Learning Rate": 4.017315552656788e-06, "Full-finetune/Loss": 0.7608753442764282, "Full-finetune/Loss (Raw)": 0.7752277851104736, "Full-finetune/Step": 3706, "Full-finetune/Step Time": 6.594678001478314} {"Full-finetune/Learning Rate": 4.01232495336123e-06, "Full-finetune/Loss": 0.7601857781410217, "Full-finetune/Loss (Raw)": 0.7446005344390869, "Full-finetune/Step": 3707, "Full-finetune/Step Time": 6.629178136587143} {"Full-finetune/Learning Rate": 4.0073366777654574e-06, "Full-finetune/Loss": 0.7586424946784973, "Full-finetune/Loss (Raw)": 0.638543426990509, "Full-finetune/Step": 3708, "Full-finetune/Step Time": 6.639945209026337} {"Full-finetune/Learning Rate": 4.002350727805324e-06, "Full-finetune/Loss": 0.7590830326080322, "Full-finetune/Loss (Raw)": 0.9266769289970398, "Full-finetune/Step": 3709, "Full-finetune/Step Time": 6.63022000901401} {"Full-finetune/Learning Rate": 3.997367105415775e-06, "Full-finetune/Loss": 0.7609304189682007, "Full-finetune/Loss (Raw)": 0.9331755042076111, "Full-finetune/Step": 3710, "Full-finetune/Step Time": 6.627022758126259} {"Full-finetune/Learning Rate": 3.992385812530864e-06, "Full-finetune/Loss": 0.7602433562278748, "Full-finetune/Loss (Raw)": 0.6518269181251526, "Full-finetune/Step": 3711, "Full-finetune/Step Time": 6.637931453064084} {"Full-finetune/Learning Rate": 3.987406851083735e-06, "Full-finetune/Loss": 0.7608959674835205, "Full-finetune/Loss (Raw)": 0.8954142332077026, "Full-finetune/Step": 3712, "Full-finetune/Step Time": 6.636998040601611} {"Full-finetune/Learning Rate": 3.982430223006614e-06, "Full-finetune/Loss": 0.7557279467582703, "Full-finetune/Loss (Raw)": 0.27880483865737915, "Full-finetune/Step": 3713, "Full-finetune/Step Time": 6.654422665014863} {"Full-finetune/Learning Rate": 3.977455930230842e-06, "Full-finetune/Loss": 0.7567387819290161, "Full-finetune/Loss (Raw)": 0.7915665507316589, "Full-finetune/Step": 3714, "Full-finetune/Step Time": 6.647998843342066} {"Full-finetune/Learning Rate": 3.972483974686845e-06, "Full-finetune/Loss": 0.7574173212051392, "Full-finetune/Loss (Raw)": 0.8264552354812622, "Full-finetune/Step": 3715, "Full-finetune/Step Time": 6.641743183135986} {"Full-finetune/Learning Rate": 3.967514358304139e-06, "Full-finetune/Loss": 0.7577121257781982, "Full-finetune/Loss (Raw)": 0.6884192228317261, "Full-finetune/Step": 3716, "Full-finetune/Step Time": 6.664554258808494} {"Full-finetune/Learning Rate": 3.962547083011338e-06, "Full-finetune/Loss": 0.7569516897201538, "Full-finetune/Loss (Raw)": 0.6714285016059875, "Full-finetune/Step": 3717, "Full-finetune/Step Time": 6.66401850618422} {"Full-finetune/Learning Rate": 3.957582150736141e-06, "Full-finetune/Loss": 0.7550321817398071, "Full-finetune/Loss (Raw)": 0.6125023365020752, "Full-finetune/Step": 3718, "Full-finetune/Step Time": 6.668390387669206} {"Full-finetune/Learning Rate": 3.952619563405343e-06, "Full-finetune/Loss": 0.7541936635971069, "Full-finetune/Loss (Raw)": 0.6133059859275818, "Full-finetune/Step": 3719, "Full-finetune/Step Time": 6.669028203934431} {"Full-finetune/Learning Rate": 3.9476593229448245e-06, "Full-finetune/Loss": 0.7545284032821655, "Full-finetune/Loss (Raw)": 0.8203539848327637, "Full-finetune/Step": 3720, "Full-finetune/Step Time": 6.662568377330899} {"Full-finetune/Learning Rate": 3.942701431279564e-06, "Full-finetune/Loss": 0.7543879151344299, "Full-finetune/Loss (Raw)": 0.893965482711792, "Full-finetune/Step": 3721, "Full-finetune/Step Time": 6.663072843104601} {"Full-finetune/Learning Rate": 3.937745890333623e-06, "Full-finetune/Loss": 0.7566689252853394, "Full-finetune/Loss (Raw)": 0.8365529179573059, "Full-finetune/Step": 3722, "Full-finetune/Step Time": 6.6604127530008554} {"Full-finetune/Learning Rate": 3.932792702030139e-06, "Full-finetune/Loss": 0.7576285600662231, "Full-finetune/Loss (Raw)": 0.9451882839202881, "Full-finetune/Step": 3723, "Full-finetune/Step Time": 6.6579041592776775} {"Full-finetune/Learning Rate": 3.92784186829136e-06, "Full-finetune/Loss": 0.7559865117073059, "Full-finetune/Loss (Raw)": 0.7541879415512085, "Full-finetune/Step": 3724, "Full-finetune/Step Time": 6.658798836171627} {"Full-finetune/Learning Rate": 3.9228933910386014e-06, "Full-finetune/Loss": 0.7609710693359375, "Full-finetune/Loss (Raw)": 0.8861948251724243, "Full-finetune/Step": 3725, "Full-finetune/Step Time": 6.643654892221093} {"Full-finetune/Learning Rate": 3.917947272192273e-06, "Full-finetune/Loss": 0.7581743597984314, "Full-finetune/Loss (Raw)": 0.37919822335243225, "Full-finetune/Step": 3726, "Full-finetune/Step Time": 6.644040351733565} {"Full-finetune/Learning Rate": 3.913003513671866e-06, "Full-finetune/Loss": 0.758563220500946, "Full-finetune/Loss (Raw)": 0.7365288734436035, "Full-finetune/Step": 3727, "Full-finetune/Step Time": 6.648730428889394} {"Full-finetune/Learning Rate": 3.908062117395956e-06, "Full-finetune/Loss": 0.7594796419143677, "Full-finetune/Loss (Raw)": 0.5525137782096863, "Full-finetune/Step": 3728, "Full-finetune/Step Time": 6.638182522729039} {"Full-finetune/Learning Rate": 3.903123085282204e-06, "Full-finetune/Loss": 0.7593196630477905, "Full-finetune/Loss (Raw)": 0.8189623951911926, "Full-finetune/Step": 3729, "Full-finetune/Step Time": 6.646912490949035} {"Full-finetune/Learning Rate": 3.898186419247347e-06, "Full-finetune/Loss": 0.7597002983093262, "Full-finetune/Loss (Raw)": 0.8329871296882629, "Full-finetune/Step": 3730, "Full-finetune/Step Time": 6.675734667107463} {"Full-finetune/Learning Rate": 3.893252121207221e-06, "Full-finetune/Loss": 0.759967565536499, "Full-finetune/Loss (Raw)": 0.8293870687484741, "Full-finetune/Step": 3731, "Full-finetune/Step Time": 6.675617149099708} {"Full-finetune/Learning Rate": 3.888320193076719e-06, "Full-finetune/Loss": 0.7600988745689392, "Full-finetune/Loss (Raw)": 0.8421663641929626, "Full-finetune/Step": 3732, "Full-finetune/Step Time": 6.674093188717961} {"Full-finetune/Learning Rate": 3.8833906367698245e-06, "Full-finetune/Loss": 0.7611179351806641, "Full-finetune/Loss (Raw)": 0.7696648240089417, "Full-finetune/Step": 3733, "Full-finetune/Step Time": 6.681248625740409} {"Full-finetune/Learning Rate": 3.878463454199613e-06, "Full-finetune/Loss": 0.7624689340591431, "Full-finetune/Loss (Raw)": 0.8974409103393555, "Full-finetune/Step": 3734, "Full-finetune/Step Time": 6.674349632114172} {"Full-finetune/Learning Rate": 3.87353864727822e-06, "Full-finetune/Loss": 0.7611456513404846, "Full-finetune/Loss (Raw)": 0.6340320110321045, "Full-finetune/Step": 3735, "Full-finetune/Step Time": 6.6756715178489685} {"Full-finetune/Learning Rate": 3.8686162179168695e-06, "Full-finetune/Loss": 0.7640216946601868, "Full-finetune/Loss (Raw)": 0.9979043006896973, "Full-finetune/Step": 3736, "Full-finetune/Step Time": 6.645977774634957} {"Full-finetune/Learning Rate": 3.863696168025859e-06, "Full-finetune/Loss": 0.764153242111206, "Full-finetune/Loss (Raw)": 0.7683717608451843, "Full-finetune/Step": 3737, "Full-finetune/Step Time": 6.66407835111022} {"Full-finetune/Learning Rate": 3.858778499514565e-06, "Full-finetune/Loss": 0.7642390727996826, "Full-finetune/Loss (Raw)": 0.6897202730178833, "Full-finetune/Step": 3738, "Full-finetune/Step Time": 6.673111060634255} {"Full-finetune/Learning Rate": 3.853863214291439e-06, "Full-finetune/Loss": 0.7672932147979736, "Full-finetune/Loss (Raw)": 0.7226640582084656, "Full-finetune/Step": 3739, "Full-finetune/Step Time": 6.653768420219421} {"Full-finetune/Learning Rate": 3.848950314264001e-06, "Full-finetune/Loss": 0.7671422362327576, "Full-finetune/Loss (Raw)": 0.7635034322738647, "Full-finetune/Step": 3740, "Full-finetune/Step Time": 6.636696979403496} {"Full-finetune/Learning Rate": 3.8440398013388655e-06, "Full-finetune/Loss": 0.7688080072402954, "Full-finetune/Loss (Raw)": 0.8960162997245789, "Full-finetune/Step": 3741, "Full-finetune/Step Time": 6.636183746159077} {"Full-finetune/Learning Rate": 3.839131677421694e-06, "Full-finetune/Loss": 0.7691202163696289, "Full-finetune/Loss (Raw)": 0.8233540654182434, "Full-finetune/Step": 3742, "Full-finetune/Step Time": 6.6322838421911} {"Full-finetune/Learning Rate": 3.834225944417235e-06, "Full-finetune/Loss": 0.7690329551696777, "Full-finetune/Loss (Raw)": 0.8213618397712708, "Full-finetune/Step": 3743, "Full-finetune/Step Time": 6.6647396963089705} {"Full-finetune/Learning Rate": 3.829322604229313e-06, "Full-finetune/Loss": 0.7664602994918823, "Full-finetune/Loss (Raw)": 0.35683515667915344, "Full-finetune/Step": 3744, "Full-finetune/Step Time": 6.680376783013344} {"Full-finetune/Learning Rate": 3.824421658760815e-06, "Full-finetune/Loss": 0.7633531093597412, "Full-finetune/Loss (Raw)": 0.3205677568912506, "Full-finetune/Step": 3745, "Full-finetune/Step Time": 6.687232431024313} {"Full-finetune/Learning Rate": 3.819523109913706e-06, "Full-finetune/Loss": 0.7635046243667603, "Full-finetune/Loss (Raw)": 0.6917219161987305, "Full-finetune/Step": 3746, "Full-finetune/Step Time": 6.677849596366286} {"Full-finetune/Learning Rate": 3.814626959589012e-06, "Full-finetune/Loss": 0.7623463869094849, "Full-finetune/Loss (Raw)": 0.606890082359314, "Full-finetune/Step": 3747, "Full-finetune/Step Time": 6.697719627991319} {"Full-finetune/Learning Rate": 3.8097332096868368e-06, "Full-finetune/Loss": 0.762658953666687, "Full-finetune/Loss (Raw)": 0.826321005821228, "Full-finetune/Step": 3748, "Full-finetune/Step Time": 6.70829757489264} {"Full-finetune/Learning Rate": 3.8048418621063475e-06, "Full-finetune/Loss": 0.7618206739425659, "Full-finetune/Loss (Raw)": 0.6206989884376526, "Full-finetune/Step": 3749, "Full-finetune/Step Time": 6.715142024680972} {"Full-finetune/Learning Rate": 3.7999529187457775e-06, "Full-finetune/Loss": 0.762654185295105, "Full-finetune/Loss (Raw)": 0.8909652233123779, "Full-finetune/Step": 3750, "Full-finetune/Step Time": 6.7193354945629835} {"Full-finetune/Learning Rate": 3.7950663815024424e-06, "Full-finetune/Loss": 0.7637771964073181, "Full-finetune/Loss (Raw)": 0.9728456139564514, "Full-finetune/Step": 3751, "Full-finetune/Step Time": 6.725711466744542} {"Full-finetune/Learning Rate": 3.790182252272698e-06, "Full-finetune/Loss": 0.762953519821167, "Full-finetune/Loss (Raw)": 0.7813634872436523, "Full-finetune/Step": 3752, "Full-finetune/Step Time": 6.728516537696123} {"Full-finetune/Learning Rate": 3.785300532951983e-06, "Full-finetune/Loss": 0.7615817189216614, "Full-finetune/Loss (Raw)": 0.7048713564872742, "Full-finetune/Step": 3753, "Full-finetune/Step Time": 6.7528108805418015} {"Full-finetune/Learning Rate": 3.780421225434803e-06, "Full-finetune/Loss": 0.7625375390052795, "Full-finetune/Loss (Raw)": 0.790098249912262, "Full-finetune/Step": 3754, "Full-finetune/Step Time": 6.75596989877522} {"Full-finetune/Learning Rate": 3.7755443316147177e-06, "Full-finetune/Loss": 0.7618526816368103, "Full-finetune/Loss (Raw)": 0.7663784027099609, "Full-finetune/Step": 3755, "Full-finetune/Step Time": 6.7430934477597475} {"Full-finetune/Learning Rate": 3.7706698533843556e-06, "Full-finetune/Loss": 0.760265588760376, "Full-finetune/Loss (Raw)": 0.5995326638221741, "Full-finetune/Step": 3756, "Full-finetune/Step Time": 6.744324441999197} {"Full-finetune/Learning Rate": 3.765797792635406e-06, "Full-finetune/Loss": 0.7614166736602783, "Full-finetune/Loss (Raw)": 0.9089438319206238, "Full-finetune/Step": 3757, "Full-finetune/Step Time": 6.747320497408509} {"Full-finetune/Learning Rate": 3.7609281512586203e-06, "Full-finetune/Loss": 0.7609899044036865, "Full-finetune/Loss (Raw)": 0.6494393348693848, "Full-finetune/Step": 3758, "Full-finetune/Step Time": 6.760742072016001} {"Full-finetune/Learning Rate": 3.756060931143811e-06, "Full-finetune/Loss": 0.7625713348388672, "Full-finetune/Loss (Raw)": 0.8361600637435913, "Full-finetune/Step": 3759, "Full-finetune/Step Time": 6.745218543335795} {"Full-finetune/Learning Rate": 3.7511961341798487e-06, "Full-finetune/Loss": 0.7612372636795044, "Full-finetune/Loss (Raw)": 0.7129436135292053, "Full-finetune/Step": 3760, "Full-finetune/Step Time": 6.760292042046785} {"Full-finetune/Learning Rate": 3.746333762254677e-06, "Full-finetune/Loss": 0.7594547271728516, "Full-finetune/Loss (Raw)": 0.6502541899681091, "Full-finetune/Step": 3761, "Full-finetune/Step Time": 6.780951477587223} {"Full-finetune/Learning Rate": 3.7414738172552744e-06, "Full-finetune/Loss": 0.7594701051712036, "Full-finetune/Loss (Raw)": 0.7803391814231873, "Full-finetune/Step": 3762, "Full-finetune/Step Time": 6.786380203440785} {"Full-finetune/Learning Rate": 3.7366163010676937e-06, "Full-finetune/Loss": 0.7611942887306213, "Full-finetune/Loss (Raw)": 0.8888974189758301, "Full-finetune/Step": 3763, "Full-finetune/Step Time": 6.7859941851347685} {"Full-finetune/Learning Rate": 3.7317612155770467e-06, "Full-finetune/Loss": 0.7604301571846008, "Full-finetune/Loss (Raw)": 0.7257844805717468, "Full-finetune/Step": 3764, "Full-finetune/Step Time": 6.785736221820116} {"Full-finetune/Learning Rate": 3.726908562667496e-06, "Full-finetune/Loss": 0.7585437297821045, "Full-finetune/Loss (Raw)": 0.6108319759368896, "Full-finetune/Step": 3765, "Full-finetune/Step Time": 6.783682195469737} {"Full-finetune/Learning Rate": 3.72205834422226e-06, "Full-finetune/Loss": 0.7590024471282959, "Full-finetune/Loss (Raw)": 0.887782871723175, "Full-finetune/Step": 3766, "Full-finetune/Step Time": 6.786878861486912} {"Full-finetune/Learning Rate": 3.717210562123613e-06, "Full-finetune/Loss": 0.7591020464897156, "Full-finetune/Loss (Raw)": 0.8291836977005005, "Full-finetune/Step": 3767, "Full-finetune/Step Time": 6.789564788341522} {"Full-finetune/Learning Rate": 3.712365218252887e-06, "Full-finetune/Loss": 0.762129545211792, "Full-finetune/Loss (Raw)": 0.6889418363571167, "Full-finetune/Step": 3768, "Full-finetune/Step Time": 6.779635043814778} {"Full-finetune/Learning Rate": 3.7075223144904638e-06, "Full-finetune/Loss": 0.758304238319397, "Full-finetune/Loss (Raw)": 0.23867864906787872, "Full-finetune/Step": 3769, "Full-finetune/Step Time": 6.794756405055523} {"Full-finetune/Learning Rate": 3.702681852715777e-06, "Full-finetune/Loss": 0.7593876123428345, "Full-finetune/Loss (Raw)": 0.9486020803451538, "Full-finetune/Step": 3770, "Full-finetune/Step Time": 6.785943850874901} {"Full-finetune/Learning Rate": 3.6978438348073253e-06, "Full-finetune/Loss": 0.7602344155311584, "Full-finetune/Loss (Raw)": 0.9455267190933228, "Full-finetune/Step": 3771, "Full-finetune/Step Time": 6.797462539747357} {"Full-finetune/Learning Rate": 3.6930082626426377e-06, "Full-finetune/Loss": 0.7608196139335632, "Full-finetune/Loss (Raw)": 0.8524104356765747, "Full-finetune/Step": 3772, "Full-finetune/Step Time": 6.803411673754454} {"Full-finetune/Learning Rate": 3.6881751380983066e-06, "Full-finetune/Loss": 0.7575114369392395, "Full-finetune/Loss (Raw)": 0.33751827478408813, "Full-finetune/Step": 3773, "Full-finetune/Step Time": 6.830105572938919} {"Full-finetune/Learning Rate": 3.6833444630499804e-06, "Full-finetune/Loss": 0.757552981376648, "Full-finetune/Loss (Raw)": 0.8555793166160583, "Full-finetune/Step": 3774, "Full-finetune/Step Time": 6.831457637250423} {"Full-finetune/Learning Rate": 3.6785162393723482e-06, "Full-finetune/Loss": 0.7578803300857544, "Full-finetune/Loss (Raw)": 0.8805654644966125, "Full-finetune/Step": 3775, "Full-finetune/Step Time": 6.836094260215759} {"Full-finetune/Learning Rate": 3.6736904689391417e-06, "Full-finetune/Loss": 0.757683515548706, "Full-finetune/Loss (Raw)": 0.8653196692466736, "Full-finetune/Step": 3776, "Full-finetune/Step Time": 6.838166028261185} {"Full-finetune/Learning Rate": 3.6688671536231557e-06, "Full-finetune/Loss": 0.7528378963470459, "Full-finetune/Loss (Raw)": 0.26182472705841064, "Full-finetune/Step": 3777, "Full-finetune/Step Time": 6.8457113187760115} {"Full-finetune/Learning Rate": 3.6640462952962217e-06, "Full-finetune/Loss": 0.7518905997276306, "Full-finetune/Loss (Raw)": 0.824732780456543, "Full-finetune/Step": 3778, "Full-finetune/Step Time": 6.853717666119337} {"Full-finetune/Learning Rate": 3.6592278958292225e-06, "Full-finetune/Loss": 0.7519584894180298, "Full-finetune/Loss (Raw)": 0.6669676899909973, "Full-finetune/Step": 3779, "Full-finetune/Step Time": 6.842181421816349} {"Full-finetune/Learning Rate": 3.6544119570920845e-06, "Full-finetune/Loss": 0.7513598203659058, "Full-finetune/Loss (Raw)": 0.7405800223350525, "Full-finetune/Step": 3780, "Full-finetune/Step Time": 6.843430068343878} {"Full-finetune/Learning Rate": 3.6495984809537775e-06, "Full-finetune/Loss": 0.7510838508605957, "Full-finetune/Loss (Raw)": 0.8516696095466614, "Full-finetune/Step": 3781, "Full-finetune/Step Time": 6.839977638795972} {"Full-finetune/Learning Rate": 3.6447874692823195e-06, "Full-finetune/Loss": 0.7509193420410156, "Full-finetune/Loss (Raw)": 0.7382564544677734, "Full-finetune/Step": 3782, "Full-finetune/Step Time": 6.813239175826311} {"Full-finetune/Learning Rate": 3.639978923944766e-06, "Full-finetune/Loss": 0.748975932598114, "Full-finetune/Loss (Raw)": 0.6835359334945679, "Full-finetune/Step": 3783, "Full-finetune/Step Time": 6.8149951454252005} {"Full-finetune/Learning Rate": 3.6351728468072265e-06, "Full-finetune/Loss": 0.749118983745575, "Full-finetune/Loss (Raw)": 0.7056024670600891, "Full-finetune/Step": 3784, "Full-finetune/Step Time": 6.820429801940918} {"Full-finetune/Learning Rate": 3.6303692397348455e-06, "Full-finetune/Loss": 0.7489646673202515, "Full-finetune/Loss (Raw)": 0.7918075919151306, "Full-finetune/Step": 3785, "Full-finetune/Step Time": 6.818370403721929} {"Full-finetune/Learning Rate": 3.6255681045918e-06, "Full-finetune/Loss": 0.7502278089523315, "Full-finetune/Loss (Raw)": 0.9245479702949524, "Full-finetune/Step": 3786, "Full-finetune/Step Time": 6.802243934944272} {"Full-finetune/Learning Rate": 3.6207694432413255e-06, "Full-finetune/Loss": 0.7504419684410095, "Full-finetune/Loss (Raw)": 0.8331051468849182, "Full-finetune/Step": 3787, "Full-finetune/Step Time": 6.799925858154893} {"Full-finetune/Learning Rate": 3.6159732575456862e-06, "Full-finetune/Loss": 0.7492510080337524, "Full-finetune/Loss (Raw)": 0.750821053981781, "Full-finetune/Step": 3788, "Full-finetune/Step Time": 6.805408535525203} {"Full-finetune/Learning Rate": 3.6111795493661885e-06, "Full-finetune/Loss": 0.7479037642478943, "Full-finetune/Loss (Raw)": 0.6379148364067078, "Full-finetune/Step": 3789, "Full-finetune/Step Time": 6.823906950652599} {"Full-finetune/Learning Rate": 3.606388320563177e-06, "Full-finetune/Loss": 0.7475013136863708, "Full-finetune/Loss (Raw)": 0.8599345088005066, "Full-finetune/Step": 3790, "Full-finetune/Step Time": 6.826210459694266} {"Full-finetune/Learning Rate": 3.6015995729960316e-06, "Full-finetune/Loss": 0.7462218999862671, "Full-finetune/Loss (Raw)": 0.8276692628860474, "Full-finetune/Step": 3791, "Full-finetune/Step Time": 6.825856998562813} {"Full-finetune/Learning Rate": 3.596813308523176e-06, "Full-finetune/Loss": 0.7430996298789978, "Full-finetune/Loss (Raw)": 0.3321515619754791, "Full-finetune/Step": 3792, "Full-finetune/Step Time": 6.832233740016818} {"Full-finetune/Learning Rate": 3.592029529002059e-06, "Full-finetune/Loss": 0.7430298328399658, "Full-finetune/Loss (Raw)": 0.8135067820549011, "Full-finetune/Step": 3793, "Full-finetune/Step Time": 6.850929316133261} {"Full-finetune/Learning Rate": 3.5872482362891802e-06, "Full-finetune/Loss": 0.7429256439208984, "Full-finetune/Loss (Raw)": 0.8054695725440979, "Full-finetune/Step": 3794, "Full-finetune/Step Time": 6.850205779075623} {"Full-finetune/Learning Rate": 3.5824694322400653e-06, "Full-finetune/Loss": 0.7450199127197266, "Full-finetune/Loss (Raw)": 0.6799418330192566, "Full-finetune/Step": 3795, "Full-finetune/Step Time": 6.843930508941412} {"Full-finetune/Learning Rate": 3.5776931187092667e-06, "Full-finetune/Loss": 0.7457979917526245, "Full-finetune/Loss (Raw)": 0.8416309952735901, "Full-finetune/Step": 3796, "Full-finetune/Step Time": 6.848820498213172} {"Full-finetune/Learning Rate": 3.5729192975503856e-06, "Full-finetune/Loss": 0.744745135307312, "Full-finetune/Loss (Raw)": 0.5952358841896057, "Full-finetune/Step": 3797, "Full-finetune/Step Time": 6.851815005764365} {"Full-finetune/Learning Rate": 3.5681479706160483e-06, "Full-finetune/Loss": 0.7440783381462097, "Full-finetune/Loss (Raw)": 0.7270994186401367, "Full-finetune/Step": 3798, "Full-finetune/Step Time": 6.848361603915691} {"Full-finetune/Learning Rate": 3.563379139757911e-06, "Full-finetune/Loss": 0.7416695356369019, "Full-finetune/Loss (Raw)": 0.5825097560882568, "Full-finetune/Step": 3799, "Full-finetune/Step Time": 6.857384622097015} {"Full-finetune/Learning Rate": 3.558612806826666e-06, "Full-finetune/Loss": 0.7426047325134277, "Full-finetune/Loss (Raw)": 0.8416715264320374, "Full-finetune/Step": 3800, "Full-finetune/Step Time": 6.853014573454857} {"Full-finetune/Learning Rate": 3.553848973672033e-06, "Full-finetune/Loss": 0.7444823980331421, "Full-finetune/Loss (Raw)": 0.7792255282402039, "Full-finetune/Step": 3801, "Full-finetune/Step Time": 6.852273318916559} {"Full-finetune/Learning Rate": 3.549087642142762e-06, "Full-finetune/Loss": 0.7452043294906616, "Full-finetune/Loss (Raw)": 0.8833458423614502, "Full-finetune/Step": 3802, "Full-finetune/Step Time": 6.8529680501669645} {"Full-finetune/Learning Rate": 3.544328814086632e-06, "Full-finetune/Loss": 0.7492812871932983, "Full-finetune/Loss (Raw)": 0.8933545351028442, "Full-finetune/Step": 3803, "Full-finetune/Step Time": 6.829627903178334} {"Full-finetune/Learning Rate": 3.5395724913504546e-06, "Full-finetune/Loss": 0.7493494749069214, "Full-finetune/Loss (Raw)": 0.8265153765678406, "Full-finetune/Step": 3804, "Full-finetune/Step Time": 6.813177788630128} {"Full-finetune/Learning Rate": 3.5348186757800683e-06, "Full-finetune/Loss": 0.746994137763977, "Full-finetune/Loss (Raw)": 0.612403929233551, "Full-finetune/Step": 3805, "Full-finetune/Step Time": 6.829399228096008} {"Full-finetune/Learning Rate": 3.530067369220326e-06, "Full-finetune/Loss": 0.7487569451332092, "Full-finetune/Loss (Raw)": 0.7788942456245422, "Full-finetune/Step": 3806, "Full-finetune/Step Time": 6.841142527759075} {"Full-finetune/Learning Rate": 3.525318573515125e-06, "Full-finetune/Loss": 0.7485682368278503, "Full-finetune/Loss (Raw)": 0.7293000221252441, "Full-finetune/Step": 3807, "Full-finetune/Step Time": 6.842995574697852} {"Full-finetune/Learning Rate": 3.520572290507378e-06, "Full-finetune/Loss": 0.7466714978218079, "Full-finetune/Loss (Raw)": 0.6232636570930481, "Full-finetune/Step": 3808, "Full-finetune/Step Time": 6.849225560203195} {"Full-finetune/Learning Rate": 3.5158285220390256e-06, "Full-finetune/Loss": 0.7460708618164062, "Full-finetune/Loss (Raw)": 0.7447132468223572, "Full-finetune/Step": 3809, "Full-finetune/Step Time": 6.8631391897797585} {"Full-finetune/Learning Rate": 3.5110872699510313e-06, "Full-finetune/Loss": 0.7447737455368042, "Full-finetune/Loss (Raw)": 0.8663758635520935, "Full-finetune/Step": 3810, "Full-finetune/Step Time": 6.859471457079053} {"Full-finetune/Learning Rate": 3.5063485360833816e-06, "Full-finetune/Loss": 0.7440454959869385, "Full-finetune/Loss (Raw)": 0.7160183191299438, "Full-finetune/Step": 3811, "Full-finetune/Step Time": 6.864498924463987} {"Full-finetune/Learning Rate": 3.5016123222750863e-06, "Full-finetune/Loss": 0.7451364994049072, "Full-finetune/Loss (Raw)": 0.7067814469337463, "Full-finetune/Step": 3812, "Full-finetune/Step Time": 6.858120104297996} {"Full-finetune/Learning Rate": 3.4968786303641764e-06, "Full-finetune/Loss": 0.7451757192611694, "Full-finetune/Loss (Raw)": 0.7808483242988586, "Full-finetune/Step": 3813, "Full-finetune/Step Time": 6.855404892936349} {"Full-finetune/Learning Rate": 3.492147462187714e-06, "Full-finetune/Loss": 0.7442800402641296, "Full-finetune/Loss (Raw)": 0.718052089214325, "Full-finetune/Step": 3814, "Full-finetune/Step Time": 6.853083491325378} {"Full-finetune/Learning Rate": 3.4874188195817626e-06, "Full-finetune/Loss": 0.7442036271095276, "Full-finetune/Loss (Raw)": 0.8201860785484314, "Full-finetune/Step": 3815, "Full-finetune/Step Time": 6.890115523710847} {"Full-finetune/Learning Rate": 3.4826927043814197e-06, "Full-finetune/Loss": 0.7458699345588684, "Full-finetune/Loss (Raw)": 0.8253677487373352, "Full-finetune/Step": 3816, "Full-finetune/Step Time": 6.895290249958634} {"Full-finetune/Learning Rate": 3.4779691184207954e-06, "Full-finetune/Loss": 0.7447974681854248, "Full-finetune/Loss (Raw)": 0.7331249117851257, "Full-finetune/Step": 3817, "Full-finetune/Step Time": 6.8914450984448195} {"Full-finetune/Learning Rate": 3.473248063533028e-06, "Full-finetune/Loss": 0.7440353631973267, "Full-finetune/Loss (Raw)": 0.7497418522834778, "Full-finetune/Step": 3818, "Full-finetune/Step Time": 6.884003719314933} {"Full-finetune/Learning Rate": 3.4685295415502663e-06, "Full-finetune/Loss": 0.7474836111068726, "Full-finetune/Loss (Raw)": 0.7405412197113037, "Full-finetune/Step": 3819, "Full-finetune/Step Time": 6.866769976913929} {"Full-finetune/Learning Rate": 3.4638135543036656e-06, "Full-finetune/Loss": 0.7457269430160522, "Full-finetune/Loss (Raw)": 0.6486150026321411, "Full-finetune/Step": 3820, "Full-finetune/Step Time": 6.867194473743439} {"Full-finetune/Learning Rate": 3.4591001036234206e-06, "Full-finetune/Loss": 0.7446144819259644, "Full-finetune/Loss (Raw)": 0.6760674715042114, "Full-finetune/Step": 3821, "Full-finetune/Step Time": 6.872261743992567} {"Full-finetune/Learning Rate": 3.4543891913387253e-06, "Full-finetune/Loss": 0.7449905276298523, "Full-finetune/Loss (Raw)": 0.6999393701553345, "Full-finetune/Step": 3822, "Full-finetune/Step Time": 6.851052453741431} {"Full-finetune/Learning Rate": 3.449680819277792e-06, "Full-finetune/Loss": 0.7440857291221619, "Full-finetune/Loss (Raw)": 0.9059023857116699, "Full-finetune/Step": 3823, "Full-finetune/Step Time": 6.853532118722796} {"Full-finetune/Learning Rate": 3.4449749892678486e-06, "Full-finetune/Loss": 0.7444294095039368, "Full-finetune/Loss (Raw)": 0.8254192471504211, "Full-finetune/Step": 3824, "Full-finetune/Step Time": 6.852342527359724} {"Full-finetune/Learning Rate": 3.4402717031351363e-06, "Full-finetune/Loss": 0.745384156703949, "Full-finetune/Loss (Raw)": 0.6471157073974609, "Full-finetune/Step": 3825, "Full-finetune/Step Time": 6.830956580117345} {"Full-finetune/Learning Rate": 3.4355709627049073e-06, "Full-finetune/Loss": 0.7443539500236511, "Full-finetune/Loss (Raw)": 0.6849040389060974, "Full-finetune/Step": 3826, "Full-finetune/Step Time": 6.816909147426486} {"Full-finetune/Learning Rate": 3.4308727698014243e-06, "Full-finetune/Loss": 0.7441582083702087, "Full-finetune/Loss (Raw)": 0.778076171875, "Full-finetune/Step": 3827, "Full-finetune/Step Time": 6.8543049190193415} {"Full-finetune/Learning Rate": 3.4261771262479724e-06, "Full-finetune/Loss": 0.7442178130149841, "Full-finetune/Loss (Raw)": 0.8309634327888489, "Full-finetune/Step": 3828, "Full-finetune/Step Time": 6.858067195862532} {"Full-finetune/Learning Rate": 3.4214840338668376e-06, "Full-finetune/Loss": 0.7414469718933105, "Full-finetune/Loss (Raw)": 0.2749957740306854, "Full-finetune/Step": 3829, "Full-finetune/Step Time": 6.8701854608953} {"Full-finetune/Learning Rate": 3.416793494479308e-06, "Full-finetune/Loss": 0.741204023361206, "Full-finetune/Loss (Raw)": 0.7919607758522034, "Full-finetune/Step": 3830, "Full-finetune/Step Time": 6.8799715749919415} {"Full-finetune/Learning Rate": 3.412105509905701e-06, "Full-finetune/Loss": 0.7403849363327026, "Full-finetune/Loss (Raw)": 0.7455229163169861, "Full-finetune/Step": 3831, "Full-finetune/Step Time": 6.886820575222373} {"Full-finetune/Learning Rate": 3.407420081965327e-06, "Full-finetune/Loss": 0.741697371006012, "Full-finetune/Loss (Raw)": 0.9826152920722961, "Full-finetune/Step": 3832, "Full-finetune/Step Time": 6.873992521315813} {"Full-finetune/Learning Rate": 3.402737212476509e-06, "Full-finetune/Loss": 0.7435184717178345, "Full-finetune/Loss (Raw)": 0.8490626215934753, "Full-finetune/Step": 3833, "Full-finetune/Step Time": 6.906610779464245} {"Full-finetune/Learning Rate": 3.398056903256579e-06, "Full-finetune/Loss": 0.7443821430206299, "Full-finetune/Loss (Raw)": 0.8857771754264832, "Full-finetune/Step": 3834, "Full-finetune/Step Time": 6.90057741291821} {"Full-finetune/Learning Rate": 3.393379156121873e-06, "Full-finetune/Loss": 0.7452661991119385, "Full-finetune/Loss (Raw)": 0.8577583432197571, "Full-finetune/Step": 3835, "Full-finetune/Step Time": 6.872171422466636} {"Full-finetune/Learning Rate": 3.3887039728877336e-06, "Full-finetune/Loss": 0.7459716200828552, "Full-finetune/Loss (Raw)": 0.7288433909416199, "Full-finetune/Step": 3836, "Full-finetune/Step Time": 6.8503239918500185} {"Full-finetune/Learning Rate": 3.3840313553685034e-06, "Full-finetune/Loss": 0.744570255279541, "Full-finetune/Loss (Raw)": 0.7472991347312927, "Full-finetune/Step": 3837, "Full-finetune/Step Time": 6.855479691177607} {"Full-finetune/Learning Rate": 3.379361305377542e-06, "Full-finetune/Loss": 0.7429868578910828, "Full-finetune/Loss (Raw)": 0.7304999232292175, "Full-finetune/Step": 3838, "Full-finetune/Step Time": 6.843521922826767} {"Full-finetune/Learning Rate": 3.374693824727204e-06, "Full-finetune/Loss": 0.7441071271896362, "Full-finetune/Loss (Raw)": 0.7952191829681396, "Full-finetune/Step": 3839, "Full-finetune/Step Time": 6.858179941773415} {"Full-finetune/Learning Rate": 3.3700289152288377e-06, "Full-finetune/Loss": 0.7429471611976624, "Full-finetune/Loss (Raw)": 0.7469417452812195, "Full-finetune/Step": 3840, "Full-finetune/Step Time": 6.858386667445302} {"Full-finetune/Learning Rate": 3.3653665786928138e-06, "Full-finetune/Loss": 0.748185932636261, "Full-finetune/Loss (Raw)": 0.949364185333252, "Full-finetune/Step": 3841, "Full-finetune/Step Time": 6.840130653232336} {"Full-finetune/Learning Rate": 3.360706816928491e-06, "Full-finetune/Loss": 0.747905969619751, "Full-finetune/Loss (Raw)": 0.7557335495948792, "Full-finetune/Step": 3842, "Full-finetune/Step Time": 6.831459935754538} {"Full-finetune/Learning Rate": 3.3560496317442305e-06, "Full-finetune/Loss": 0.7462180256843567, "Full-finetune/Loss (Raw)": 0.610394299030304, "Full-finetune/Step": 3843, "Full-finetune/Step Time": 6.840146718546748} {"Full-finetune/Learning Rate": 3.351395024947395e-06, "Full-finetune/Loss": 0.7468032836914062, "Full-finetune/Loss (Raw)": 0.7633358240127563, "Full-finetune/Step": 3844, "Full-finetune/Step Time": 6.822414146736264} {"Full-finetune/Learning Rate": 3.3467429983443477e-06, "Full-finetune/Loss": 0.7475409507751465, "Full-finetune/Loss (Raw)": 0.7658481597900391, "Full-finetune/Step": 3845, "Full-finetune/Step Time": 6.805399436503649} {"Full-finetune/Learning Rate": 3.34209355374045e-06, "Full-finetune/Loss": 0.7476603984832764, "Full-finetune/Loss (Raw)": 0.6278000473976135, "Full-finetune/Step": 3846, "Full-finetune/Step Time": 6.800988104194403} {"Full-finetune/Learning Rate": 3.337446692940055e-06, "Full-finetune/Loss": 0.749744176864624, "Full-finetune/Loss (Raw)": 0.880024254322052, "Full-finetune/Step": 3847, "Full-finetune/Step Time": 6.78889668546617} {"Full-finetune/Learning Rate": 3.332802417746527e-06, "Full-finetune/Loss": 0.7458807229995728, "Full-finetune/Loss (Raw)": 0.3258287012577057, "Full-finetune/Step": 3848, "Full-finetune/Step Time": 6.797524552792311} {"Full-finetune/Learning Rate": 3.3281607299622175e-06, "Full-finetune/Loss": 0.7458863854408264, "Full-finetune/Loss (Raw)": 0.8946933150291443, "Full-finetune/Step": 3849, "Full-finetune/Step Time": 6.8130023293197155} {"Full-finetune/Learning Rate": 3.3235216313884657e-06, "Full-finetune/Loss": 0.7431776523590088, "Full-finetune/Loss (Raw)": 0.4898372292518616, "Full-finetune/Step": 3850, "Full-finetune/Step Time": 6.820904860273004} {"Full-finetune/Learning Rate": 3.3188851238256246e-06, "Full-finetune/Loss": 0.7408465147018433, "Full-finetune/Loss (Raw)": 0.6467952132225037, "Full-finetune/Step": 3851, "Full-finetune/Step Time": 6.8133794236928225} {"Full-finetune/Learning Rate": 3.3142512090730283e-06, "Full-finetune/Loss": 0.7419228553771973, "Full-finetune/Loss (Raw)": 0.8919637799263, "Full-finetune/Step": 3852, "Full-finetune/Step Time": 6.8144979905337095} {"Full-finetune/Learning Rate": 3.309619888929011e-06, "Full-finetune/Loss": 0.7385315299034119, "Full-finetune/Loss (Raw)": 0.4521029591560364, "Full-finetune/Step": 3853, "Full-finetune/Step Time": 6.8283028937876225} {"Full-finetune/Learning Rate": 3.304991165190895e-06, "Full-finetune/Loss": 0.7418270707130432, "Full-finetune/Loss (Raw)": 0.801027238368988, "Full-finetune/Step": 3854, "Full-finetune/Step Time": 6.814717041328549} {"Full-finetune/Learning Rate": 3.300365039655e-06, "Full-finetune/Loss": 0.7400569915771484, "Full-finetune/Loss (Raw)": 0.5099667906761169, "Full-finetune/Step": 3855, "Full-finetune/Step Time": 6.825102740898728} {"Full-finetune/Learning Rate": 3.2957415141166327e-06, "Full-finetune/Loss": 0.7427521347999573, "Full-finetune/Loss (Raw)": 0.8974872827529907, "Full-finetune/Step": 3856, "Full-finetune/Step Time": 6.817619357258081} {"Full-finetune/Learning Rate": 3.2911205903700916e-06, "Full-finetune/Loss": 0.7391471862792969, "Full-finetune/Loss (Raw)": 0.3575209975242615, "Full-finetune/Step": 3857, "Full-finetune/Step Time": 6.825601955875754} {"Full-finetune/Learning Rate": 3.2865022702086756e-06, "Full-finetune/Loss": 0.7352008819580078, "Full-finetune/Loss (Raw)": 0.327873557806015, "Full-finetune/Step": 3858, "Full-finetune/Step Time": 6.81912194006145} {"Full-finetune/Learning Rate": 3.281886555424656e-06, "Full-finetune/Loss": 0.7361637353897095, "Full-finetune/Loss (Raw)": 0.9526204466819763, "Full-finetune/Step": 3859, "Full-finetune/Step Time": 6.811442829668522} {"Full-finetune/Learning Rate": 3.277273447809299e-06, "Full-finetune/Loss": 0.7358805537223816, "Full-finetune/Loss (Raw)": 0.8059275150299072, "Full-finetune/Step": 3860, "Full-finetune/Step Time": 6.805256171151996} {"Full-finetune/Learning Rate": 3.2726629491528714e-06, "Full-finetune/Loss": 0.7356197834014893, "Full-finetune/Loss (Raw)": 0.7362809181213379, "Full-finetune/Step": 3861, "Full-finetune/Step Time": 6.790532277897} {"Full-finetune/Learning Rate": 3.268055061244614e-06, "Full-finetune/Loss": 0.7349978685379028, "Full-finetune/Loss (Raw)": 0.8178393840789795, "Full-finetune/Step": 3862, "Full-finetune/Step Time": 6.789336934685707} {"Full-finetune/Learning Rate": 3.2634497858727553e-06, "Full-finetune/Loss": 0.7351944446563721, "Full-finetune/Loss (Raw)": 0.6591950058937073, "Full-finetune/Step": 3863, "Full-finetune/Step Time": 6.79832024499774} {"Full-finetune/Learning Rate": 3.2588471248245157e-06, "Full-finetune/Loss": 0.7337051033973694, "Full-finetune/Loss (Raw)": 0.8072659969329834, "Full-finetune/Step": 3864, "Full-finetune/Step Time": 6.800936084240675} {"Full-finetune/Learning Rate": 3.254247079886097e-06, "Full-finetune/Loss": 0.7332732677459717, "Full-finetune/Loss (Raw)": 0.7130924463272095, "Full-finetune/Step": 3865, "Full-finetune/Step Time": 6.818448279052973} {"Full-finetune/Learning Rate": 3.2496496528426867e-06, "Full-finetune/Loss": 0.734992504119873, "Full-finetune/Loss (Raw)": 0.909785270690918, "Full-finetune/Step": 3866, "Full-finetune/Step Time": 6.810326188802719} {"Full-finetune/Learning Rate": 3.245054845478454e-06, "Full-finetune/Loss": 0.7369664907455444, "Full-finetune/Loss (Raw)": 0.9753339886665344, "Full-finetune/Step": 3867, "Full-finetune/Step Time": 6.810870129615068} {"Full-finetune/Learning Rate": 3.240462659576562e-06, "Full-finetune/Loss": 0.7375614643096924, "Full-finetune/Loss (Raw)": 0.8396701812744141, "Full-finetune/Step": 3868, "Full-finetune/Step Time": 6.814593391492963} {"Full-finetune/Learning Rate": 3.23587309691914e-06, "Full-finetune/Loss": 0.7361992001533508, "Full-finetune/Loss (Raw)": 0.7216381430625916, "Full-finetune/Step": 3869, "Full-finetune/Step Time": 6.826468667015433} {"Full-finetune/Learning Rate": 3.231286159287308e-06, "Full-finetune/Loss": 0.7350272536277771, "Full-finetune/Loss (Raw)": 0.6733422875404358, "Full-finetune/Step": 3870, "Full-finetune/Step Time": 6.850448643788695} {"Full-finetune/Learning Rate": 3.2267018484611725e-06, "Full-finetune/Loss": 0.7348166704177856, "Full-finetune/Loss (Raw)": 0.7944068908691406, "Full-finetune/Step": 3871, "Full-finetune/Step Time": 6.8350043799728155} {"Full-finetune/Learning Rate": 3.222120166219812e-06, "Full-finetune/Loss": 0.7350715398788452, "Full-finetune/Loss (Raw)": 0.38945868611335754, "Full-finetune/Step": 3872, "Full-finetune/Step Time": 6.850322039797902} {"Full-finetune/Learning Rate": 3.217541114341288e-06, "Full-finetune/Loss": 0.7376669645309448, "Full-finetune/Loss (Raw)": 0.6527801752090454, "Full-finetune/Step": 3873, "Full-finetune/Step Time": 6.839980915188789} {"Full-finetune/Learning Rate": 3.2129646946026407e-06, "Full-finetune/Loss": 0.7383420467376709, "Full-finetune/Loss (Raw)": 0.7781378030776978, "Full-finetune/Step": 3874, "Full-finetune/Step Time": 6.8396126963198185} {"Full-finetune/Learning Rate": 3.2083909087798905e-06, "Full-finetune/Loss": 0.7395850419998169, "Full-finetune/Loss (Raw)": 0.765994131565094, "Full-finetune/Step": 3875, "Full-finetune/Step Time": 6.821508405730128} {"Full-finetune/Learning Rate": 3.2038197586480336e-06, "Full-finetune/Loss": 0.7394118309020996, "Full-finetune/Loss (Raw)": 0.8041529655456543, "Full-finetune/Step": 3876, "Full-finetune/Step Time": 6.808099489659071} {"Full-finetune/Learning Rate": 3.199251245981041e-06, "Full-finetune/Loss": 0.7399171590805054, "Full-finetune/Loss (Raw)": 0.6853753924369812, "Full-finetune/Step": 3877, "Full-finetune/Step Time": 6.815238017588854} {"Full-finetune/Learning Rate": 3.1946853725518724e-06, "Full-finetune/Loss": 0.7365931272506714, "Full-finetune/Loss (Raw)": 0.46548697352409363, "Full-finetune/Step": 3878, "Full-finetune/Step Time": 6.832780480384827} {"Full-finetune/Learning Rate": 3.1901221401324446e-06, "Full-finetune/Loss": 0.7343552112579346, "Full-finetune/Loss (Raw)": 0.6863925457000732, "Full-finetune/Step": 3879, "Full-finetune/Step Time": 6.857817197218537} {"Full-finetune/Learning Rate": 3.18556155049366e-06, "Full-finetune/Loss": 0.734557032585144, "Full-finetune/Loss (Raw)": 0.8071976900100708, "Full-finetune/Step": 3880, "Full-finetune/Step Time": 6.85414769873023} {"Full-finetune/Learning Rate": 3.1810036054054005e-06, "Full-finetune/Loss": 0.7354772090911865, "Full-finetune/Loss (Raw)": 0.8226494789123535, "Full-finetune/Step": 3881, "Full-finetune/Step Time": 6.835913069546223} {"Full-finetune/Learning Rate": 3.1764483066365117e-06, "Full-finetune/Loss": 0.735676646232605, "Full-finetune/Loss (Raw)": 0.8156381249427795, "Full-finetune/Step": 3882, "Full-finetune/Step Time": 6.839456591755152} {"Full-finetune/Learning Rate": 3.1718956559548154e-06, "Full-finetune/Loss": 0.7365796566009521, "Full-finetune/Loss (Raw)": 0.8819595575332642, "Full-finetune/Step": 3883, "Full-finetune/Step Time": 6.832250772044063} {"Full-finetune/Learning Rate": 3.1673456551271086e-06, "Full-finetune/Loss": 0.73747318983078, "Full-finetune/Loss (Raw)": 0.7139060497283936, "Full-finetune/Step": 3884, "Full-finetune/Step Time": 6.8250144850462675} {"Full-finetune/Learning Rate": 3.162798305919157e-06, "Full-finetune/Loss": 0.7344452142715454, "Full-finetune/Loss (Raw)": 0.5213640928268433, "Full-finetune/Step": 3885, "Full-finetune/Step Time": 6.830216448754072} {"Full-finetune/Learning Rate": 3.1582536100956973e-06, "Full-finetune/Loss": 0.7346670627593994, "Full-finetune/Loss (Raw)": 0.6778355240821838, "Full-finetune/Step": 3886, "Full-finetune/Step Time": 6.8274105452001095} {"Full-finetune/Learning Rate": 3.1537115694204345e-06, "Full-finetune/Loss": 0.7336736917495728, "Full-finetune/Loss (Raw)": 0.70900559425354, "Full-finetune/Step": 3887, "Full-finetune/Step Time": 6.828251929953694} {"Full-finetune/Learning Rate": 3.1491721856560555e-06, "Full-finetune/Loss": 0.7341760396957397, "Full-finetune/Loss (Raw)": 0.7772419452667236, "Full-finetune/Step": 3888, "Full-finetune/Step Time": 6.820706553757191} {"Full-finetune/Learning Rate": 3.144635460564197e-06, "Full-finetune/Loss": 0.7351651787757874, "Full-finetune/Loss (Raw)": 0.7768681049346924, "Full-finetune/Step": 3889, "Full-finetune/Step Time": 6.8019566256552935} {"Full-finetune/Learning Rate": 3.1401013959054726e-06, "Full-finetune/Loss": 0.7351593375205994, "Full-finetune/Loss (Raw)": 0.779590368270874, "Full-finetune/Step": 3890, "Full-finetune/Step Time": 6.794188156723976} {"Full-finetune/Learning Rate": 3.1355699934394724e-06, "Full-finetune/Loss": 0.7335784435272217, "Full-finetune/Loss (Raw)": 0.6865438222885132, "Full-finetune/Step": 3891, "Full-finetune/Step Time": 6.809655774384737} {"Full-finetune/Learning Rate": 3.1310412549247403e-06, "Full-finetune/Loss": 0.7341263890266418, "Full-finetune/Loss (Raw)": 0.7959239482879639, "Full-finetune/Step": 3892, "Full-finetune/Step Time": 6.812995603308082} {"Full-finetune/Learning Rate": 3.1265151821187933e-06, "Full-finetune/Loss": 0.732213020324707, "Full-finetune/Loss (Raw)": 0.365917444229126, "Full-finetune/Step": 3893, "Full-finetune/Step Time": 6.822559904307127} {"Full-finetune/Learning Rate": 3.121991776778109e-06, "Full-finetune/Loss": 0.7316336631774902, "Full-finetune/Loss (Raw)": 0.8136283159255981, "Full-finetune/Step": 3894, "Full-finetune/Step Time": 6.820759780704975} {"Full-finetune/Learning Rate": 3.1174710406581355e-06, "Full-finetune/Loss": 0.731410026550293, "Full-finetune/Loss (Raw)": 0.8005501627922058, "Full-finetune/Step": 3895, "Full-finetune/Step Time": 6.819442814216018} {"Full-finetune/Learning Rate": 3.1129529755132815e-06, "Full-finetune/Loss": 0.7321860194206238, "Full-finetune/Loss (Raw)": 0.7882716655731201, "Full-finetune/Step": 3896, "Full-finetune/Step Time": 6.807640166953206} {"Full-finetune/Learning Rate": 3.108437583096918e-06, "Full-finetune/Loss": 0.7362076044082642, "Full-finetune/Loss (Raw)": 0.7534435391426086, "Full-finetune/Step": 3897, "Full-finetune/Step Time": 6.788833219558001} {"Full-finetune/Learning Rate": 3.103924865161383e-06, "Full-finetune/Loss": 0.7345505356788635, "Full-finetune/Loss (Raw)": 0.7364968061447144, "Full-finetune/Step": 3898, "Full-finetune/Step Time": 6.8050557896494865} {"Full-finetune/Learning Rate": 3.0994148234579734e-06, "Full-finetune/Loss": 0.7341804504394531, "Full-finetune/Loss (Raw)": 0.8981574773788452, "Full-finetune/Step": 3899, "Full-finetune/Step Time": 6.7985069416463375} {"Full-finetune/Learning Rate": 3.0949074597369444e-06, "Full-finetune/Loss": 0.7335096597671509, "Full-finetune/Loss (Raw)": 0.7665449976921082, "Full-finetune/Step": 3900, "Full-finetune/Step Time": 6.8081098180264235} {"Full-finetune/Learning Rate": 3.090402775747523e-06, "Full-finetune/Loss": 0.7376009821891785, "Full-finetune/Loss (Raw)": 0.8612101674079895, "Full-finetune/Step": 3901, "Full-finetune/Step Time": 6.779153943061829} {"Full-finetune/Learning Rate": 3.0859007732378897e-06, "Full-finetune/Loss": 0.7381885051727295, "Full-finetune/Loss (Raw)": 0.9307801723480225, "Full-finetune/Step": 3902, "Full-finetune/Step Time": 6.7642619870603085} {"Full-finetune/Learning Rate": 3.0814014539551727e-06, "Full-finetune/Loss": 0.7382253408432007, "Full-finetune/Loss (Raw)": 0.8852832317352295, "Full-finetune/Step": 3903, "Full-finetune/Step Time": 6.758458841592073} {"Full-finetune/Learning Rate": 3.076904819645481e-06, "Full-finetune/Loss": 0.7374407052993774, "Full-finetune/Loss (Raw)": 0.7648804783821106, "Full-finetune/Step": 3904, "Full-finetune/Step Time": 6.762307794764638} {"Full-finetune/Learning Rate": 3.072410872053867e-06, "Full-finetune/Loss": 0.7402594089508057, "Full-finetune/Loss (Raw)": 0.6226282119750977, "Full-finetune/Step": 3905, "Full-finetune/Step Time": 6.75748848170042} {"Full-finetune/Learning Rate": 3.067919612924343e-06, "Full-finetune/Loss": 0.739829957485199, "Full-finetune/Loss (Raw)": 0.7697581052780151, "Full-finetune/Step": 3906, "Full-finetune/Step Time": 6.789868338033557} {"Full-finetune/Learning Rate": 3.0634310439998803e-06, "Full-finetune/Loss": 0.742769718170166, "Full-finetune/Loss (Raw)": 1.0432597398757935, "Full-finetune/Step": 3907, "Full-finetune/Step Time": 6.776152180507779} {"Full-finetune/Learning Rate": 3.0589451670224037e-06, "Full-finetune/Loss": 0.7413529753684998, "Full-finetune/Loss (Raw)": 0.5592369437217712, "Full-finetune/Step": 3908, "Full-finetune/Step Time": 6.782949833199382} {"Full-finetune/Learning Rate": 3.054461983732795e-06, "Full-finetune/Loss": 0.7398598790168762, "Full-finetune/Loss (Raw)": 0.6605514287948608, "Full-finetune/Step": 3909, "Full-finetune/Step Time": 6.789574621245265} {"Full-finetune/Learning Rate": 3.0499814958708883e-06, "Full-finetune/Loss": 0.7407844066619873, "Full-finetune/Loss (Raw)": 0.856603741645813, "Full-finetune/Step": 3910, "Full-finetune/Step Time": 6.7902880776673555} {"Full-finetune/Learning Rate": 3.045503705175478e-06, "Full-finetune/Loss": 0.7427214980125427, "Full-finetune/Loss (Raw)": 0.9314761757850647, "Full-finetune/Step": 3911, "Full-finetune/Step Time": 6.787061583250761} {"Full-finetune/Learning Rate": 3.041028613384307e-06, "Full-finetune/Loss": 0.7426050901412964, "Full-finetune/Loss (Raw)": 0.6907051205635071, "Full-finetune/Step": 3912, "Full-finetune/Step Time": 6.790641475468874} {"Full-finetune/Learning Rate": 3.036556222234063e-06, "Full-finetune/Loss": 0.7424930334091187, "Full-finetune/Loss (Raw)": 0.7774602770805359, "Full-finetune/Step": 3913, "Full-finetune/Step Time": 6.794687332585454} {"Full-finetune/Learning Rate": 3.032086533460402e-06, "Full-finetune/Loss": 0.7410295605659485, "Full-finetune/Loss (Raw)": 0.7372256517410278, "Full-finetune/Step": 3914, "Full-finetune/Step Time": 6.7971763629466295} {"Full-finetune/Learning Rate": 3.027619548797921e-06, "Full-finetune/Loss": 0.7410565614700317, "Full-finetune/Loss (Raw)": 0.8365548849105835, "Full-finetune/Step": 3915, "Full-finetune/Step Time": 6.794451005756855} {"Full-finetune/Learning Rate": 3.023155269980169e-06, "Full-finetune/Loss": 0.7416958808898926, "Full-finetune/Loss (Raw)": 0.8326619863510132, "Full-finetune/Step": 3916, "Full-finetune/Step Time": 6.795088170096278} {"Full-finetune/Learning Rate": 3.0186936987396442e-06, "Full-finetune/Loss": 0.7424218654632568, "Full-finetune/Loss (Raw)": 0.7308388352394104, "Full-finetune/Step": 3917, "Full-finetune/Step Time": 6.796009810641408} {"Full-finetune/Learning Rate": 3.014234836807798e-06, "Full-finetune/Loss": 0.7425804734230042, "Full-finetune/Loss (Raw)": 0.8802374601364136, "Full-finetune/Step": 3918, "Full-finetune/Step Time": 6.794894536957145} {"Full-finetune/Learning Rate": 3.0097786859150247e-06, "Full-finetune/Loss": 0.7419722080230713, "Full-finetune/Loss (Raw)": 0.7498066425323486, "Full-finetune/Step": 3919, "Full-finetune/Step Time": 6.8059387151151896} {"Full-finetune/Learning Rate": 3.005325247790668e-06, "Full-finetune/Loss": 0.7455295920372009, "Full-finetune/Loss (Raw)": 0.7874993085861206, "Full-finetune/Step": 3920, "Full-finetune/Step Time": 6.822450118139386} {"Full-finetune/Learning Rate": 3.0008745241630266e-06, "Full-finetune/Loss": 0.7438327670097351, "Full-finetune/Loss (Raw)": 0.5963136553764343, "Full-finetune/Step": 3921, "Full-finetune/Step Time": 6.8320367112755775} {"Full-finetune/Learning Rate": 2.9964265167593386e-06, "Full-finetune/Loss": 0.7442808151245117, "Full-finetune/Loss (Raw)": 0.8628157377243042, "Full-finetune/Step": 3922, "Full-finetune/Step Time": 6.835796570405364} {"Full-finetune/Learning Rate": 2.9919812273057815e-06, "Full-finetune/Loss": 0.742890477180481, "Full-finetune/Loss (Raw)": 0.5019768476486206, "Full-finetune/Step": 3923, "Full-finetune/Step Time": 6.836607132107019} {"Full-finetune/Learning Rate": 2.987538657527491e-06, "Full-finetune/Loss": 0.7428672313690186, "Full-finetune/Loss (Raw)": 0.8386675715446472, "Full-finetune/Step": 3924, "Full-finetune/Step Time": 6.841346895322204} {"Full-finetune/Learning Rate": 2.9830988091485426e-06, "Full-finetune/Loss": 0.7446792125701904, "Full-finetune/Loss (Raw)": 0.8271673917770386, "Full-finetune/Step": 3925, "Full-finetune/Step Time": 6.8376432955265045} {"Full-finetune/Learning Rate": 2.9786616838919515e-06, "Full-finetune/Loss": 0.7444317936897278, "Full-finetune/Loss (Raw)": 0.695430338382721, "Full-finetune/Step": 3926, "Full-finetune/Step Time": 6.843323336914182} {"Full-finetune/Learning Rate": 2.9742272834796813e-06, "Full-finetune/Loss": 0.7456536889076233, "Full-finetune/Loss (Raw)": 0.738906741142273, "Full-finetune/Step": 3927, "Full-finetune/Step Time": 6.851550513878465} {"Full-finetune/Learning Rate": 2.969795609632636e-06, "Full-finetune/Loss": 0.745792031288147, "Full-finetune/Loss (Raw)": 0.8593833446502686, "Full-finetune/Step": 3928, "Full-finetune/Step Time": 6.85258187353611} {"Full-finetune/Learning Rate": 2.9653666640706614e-06, "Full-finetune/Loss": 0.7462575435638428, "Full-finetune/Loss (Raw)": 0.8388137221336365, "Full-finetune/Step": 3929, "Full-finetune/Step Time": 6.8504090141505} {"Full-finetune/Learning Rate": 2.9609404485125414e-06, "Full-finetune/Loss": 0.7448660135269165, "Full-finetune/Loss (Raw)": 0.705227255821228, "Full-finetune/Step": 3930, "Full-finetune/Step Time": 6.866953141987324} {"Full-finetune/Learning Rate": 2.9565169646760108e-06, "Full-finetune/Loss": 0.7448770999908447, "Full-finetune/Loss (Raw)": 0.8947746157646179, "Full-finetune/Step": 3931, "Full-finetune/Step Time": 6.878584919497371} {"Full-finetune/Learning Rate": 2.9520962142777367e-06, "Full-finetune/Loss": 0.7438329458236694, "Full-finetune/Loss (Raw)": 0.6928642988204956, "Full-finetune/Step": 3932, "Full-finetune/Step Time": 6.904352821409702} {"Full-finetune/Learning Rate": 2.947678199033317e-06, "Full-finetune/Loss": 0.7431674003601074, "Full-finetune/Loss (Raw)": 0.527208149433136, "Full-finetune/Step": 3933, "Full-finetune/Step Time": 6.91314153932035} {"Full-finetune/Learning Rate": 2.943262920657306e-06, "Full-finetune/Loss": 0.7426089644432068, "Full-finetune/Loss (Raw)": 0.7074161171913147, "Full-finetune/Step": 3934, "Full-finetune/Step Time": 6.900350470095873} {"Full-finetune/Learning Rate": 2.938850380863184e-06, "Full-finetune/Loss": 0.742835521697998, "Full-finetune/Loss (Raw)": 0.7583003640174866, "Full-finetune/Step": 3935, "Full-finetune/Step Time": 6.90352888405323} {"Full-finetune/Learning Rate": 2.9344405813633724e-06, "Full-finetune/Loss": 0.7448505163192749, "Full-finetune/Loss (Raw)": 0.8811820149421692, "Full-finetune/Step": 3936, "Full-finetune/Step Time": 6.896170238032937} {"Full-finetune/Learning Rate": 2.930033523869228e-06, "Full-finetune/Loss": 0.7454250454902649, "Full-finetune/Loss (Raw)": 0.8182496428489685, "Full-finetune/Step": 3937, "Full-finetune/Step Time": 6.890587756410241} {"Full-finetune/Learning Rate": 2.925629210091043e-06, "Full-finetune/Loss": 0.7445197701454163, "Full-finetune/Loss (Raw)": 0.7505026459693909, "Full-finetune/Step": 3938, "Full-finetune/Step Time": 6.890705427154899} {"Full-finetune/Learning Rate": 2.9212276417380468e-06, "Full-finetune/Loss": 0.745259165763855, "Full-finetune/Loss (Raw)": 0.8106675148010254, "Full-finetune/Step": 3939, "Full-finetune/Step Time": 6.892628867179155} {"Full-finetune/Learning Rate": 2.9168288205183983e-06, "Full-finetune/Loss": 0.7461768388748169, "Full-finetune/Loss (Raw)": 0.8242419958114624, "Full-finetune/Step": 3940, "Full-finetune/Step Time": 6.880501663312316} {"Full-finetune/Learning Rate": 2.9124327481392023e-06, "Full-finetune/Loss": 0.7466517686843872, "Full-finetune/Loss (Raw)": 0.8416317701339722, "Full-finetune/Step": 3941, "Full-finetune/Step Time": 6.884733024984598} {"Full-finetune/Learning Rate": 2.9080394263064815e-06, "Full-finetune/Loss": 0.7477676272392273, "Full-finetune/Loss (Raw)": 0.8608885407447815, "Full-finetune/Step": 3942, "Full-finetune/Step Time": 6.891269579529762} {"Full-finetune/Learning Rate": 2.9036488567252006e-06, "Full-finetune/Loss": 0.7461288571357727, "Full-finetune/Loss (Raw)": 0.6104177236557007, "Full-finetune/Step": 3943, "Full-finetune/Step Time": 6.878407336771488} {"Full-finetune/Learning Rate": 2.8992610410992506e-06, "Full-finetune/Loss": 0.7462500333786011, "Full-finetune/Loss (Raw)": 0.8408787250518799, "Full-finetune/Step": 3944, "Full-finetune/Step Time": 6.86831521242857} {"Full-finetune/Learning Rate": 2.894875981131463e-06, "Full-finetune/Loss": 0.7481521368026733, "Full-finetune/Loss (Raw)": 0.9765962362289429, "Full-finetune/Step": 3945, "Full-finetune/Step Time": 6.8909764140844345} {"Full-finetune/Learning Rate": 2.890493678523595e-06, "Full-finetune/Loss": 0.7482485771179199, "Full-finetune/Loss (Raw)": 0.762089729309082, "Full-finetune/Step": 3946, "Full-finetune/Step Time": 6.905941367149353} {"Full-finetune/Learning Rate": 2.8861141349763224e-06, "Full-finetune/Loss": 0.7486619353294373, "Full-finetune/Loss (Raw)": 0.7934489846229553, "Full-finetune/Step": 3947, "Full-finetune/Step Time": 6.923006422817707} {"Full-finetune/Learning Rate": 2.881737352189271e-06, "Full-finetune/Loss": 0.7463757395744324, "Full-finetune/Loss (Raw)": 0.35598254203796387, "Full-finetune/Step": 3948, "Full-finetune/Step Time": 6.9434805158525705} {"Full-finetune/Learning Rate": 2.8773633318609796e-06, "Full-finetune/Loss": 0.7478516697883606, "Full-finetune/Loss (Raw)": 0.8649852275848389, "Full-finetune/Step": 3949, "Full-finetune/Step Time": 6.940304607152939} {"Full-finetune/Learning Rate": 2.872992075688922e-06, "Full-finetune/Loss": 0.7491822242736816, "Full-finetune/Loss (Raw)": 0.8702520728111267, "Full-finetune/Step": 3950, "Full-finetune/Step Time": 6.9369866624474525} {"Full-finetune/Learning Rate": 2.868623585369497e-06, "Full-finetune/Loss": 0.7489657402038574, "Full-finetune/Loss (Raw)": 0.8781901001930237, "Full-finetune/Step": 3951, "Full-finetune/Step Time": 6.941073400899768} {"Full-finetune/Learning Rate": 2.864257862598029e-06, "Full-finetune/Loss": 0.7477309703826904, "Full-finetune/Loss (Raw)": 0.6673729419708252, "Full-finetune/Step": 3952, "Full-finetune/Step Time": 6.949337102472782} {"Full-finetune/Learning Rate": 2.8598949090687723e-06, "Full-finetune/Loss": 0.748573899269104, "Full-finetune/Loss (Raw)": 0.755009114742279, "Full-finetune/Step": 3953, "Full-finetune/Step Time": 6.94715934433043} {"Full-finetune/Learning Rate": 2.8555347264748988e-06, "Full-finetune/Loss": 0.7489933967590332, "Full-finetune/Loss (Raw)": 0.7386030554771423, "Full-finetune/Step": 3954, "Full-finetune/Step Time": 6.951170559972525} {"Full-finetune/Learning Rate": 2.8511773165085164e-06, "Full-finetune/Loss": 0.748060405254364, "Full-finetune/Loss (Raw)": 0.6586471199989319, "Full-finetune/Step": 3955, "Full-finetune/Step Time": 6.9090959671884775} {"Full-finetune/Learning Rate": 2.8468226808606525e-06, "Full-finetune/Loss": 0.7485837340354919, "Full-finetune/Loss (Raw)": 0.8979485630989075, "Full-finetune/Step": 3956, "Full-finetune/Step Time": 6.908835418522358} {"Full-finetune/Learning Rate": 2.842470821221246e-06, "Full-finetune/Loss": 0.7528181076049805, "Full-finetune/Loss (Raw)": 0.8169925212860107, "Full-finetune/Step": 3957, "Full-finetune/Step Time": 6.890688745304942} {"Full-finetune/Learning Rate": 2.8381217392791784e-06, "Full-finetune/Loss": 0.752302885055542, "Full-finetune/Loss (Raw)": 0.7260196805000305, "Full-finetune/Step": 3958, "Full-finetune/Step Time": 6.8869339954108} {"Full-finetune/Learning Rate": 2.833775436722238e-06, "Full-finetune/Loss": 0.7514731287956238, "Full-finetune/Loss (Raw)": 0.6393044590950012, "Full-finetune/Step": 3959, "Full-finetune/Step Time": 6.899579482153058} {"Full-finetune/Learning Rate": 2.829431915237144e-06, "Full-finetune/Loss": 0.7489689588546753, "Full-finetune/Loss (Raw)": 0.662081778049469, "Full-finetune/Step": 3960, "Full-finetune/Step Time": 6.90286260843277} {"Full-finetune/Learning Rate": 2.825091176509529e-06, "Full-finetune/Loss": 0.7485320568084717, "Full-finetune/Loss (Raw)": 0.7931479811668396, "Full-finetune/Step": 3961, "Full-finetune/Step Time": 6.875847350805998} {"Full-finetune/Learning Rate": 2.8207532222239497e-06, "Full-finetune/Loss": 0.746631383895874, "Full-finetune/Loss (Raw)": 0.6424881815910339, "Full-finetune/Step": 3962, "Full-finetune/Step Time": 6.883600642904639} {"Full-finetune/Learning Rate": 2.816418054063883e-06, "Full-finetune/Loss": 0.7464958429336548, "Full-finetune/Loss (Raw)": 0.840410053730011, "Full-finetune/Step": 3963, "Full-finetune/Step Time": 6.888308709487319} {"Full-finetune/Learning Rate": 2.8120856737117187e-06, "Full-finetune/Loss": 0.747089684009552, "Full-finetune/Loss (Raw)": 0.8048565983772278, "Full-finetune/Step": 3964, "Full-finetune/Step Time": 6.89688809029758} {"Full-finetune/Learning Rate": 2.807756082848775e-06, "Full-finetune/Loss": 0.747403621673584, "Full-finetune/Loss (Raw)": 0.7874824404716492, "Full-finetune/Step": 3965, "Full-finetune/Step Time": 6.908602986484766} {"Full-finetune/Learning Rate": 2.803429283155281e-06, "Full-finetune/Loss": 0.7446624040603638, "Full-finetune/Loss (Raw)": 0.3796217143535614, "Full-finetune/Step": 3966, "Full-finetune/Step Time": 6.931411335244775} {"Full-finetune/Learning Rate": 2.7991052763103767e-06, "Full-finetune/Loss": 0.7445969581604004, "Full-finetune/Loss (Raw)": 0.7868347764015198, "Full-finetune/Step": 3967, "Full-finetune/Step Time": 6.9043026845902205} {"Full-finetune/Learning Rate": 2.7947840639921308e-06, "Full-finetune/Loss": 0.745220422744751, "Full-finetune/Loss (Raw)": 0.8267592787742615, "Full-finetune/Step": 3968, "Full-finetune/Step Time": 6.9027893748134375} {"Full-finetune/Learning Rate": 2.7904656478775196e-06, "Full-finetune/Loss": 0.7438966035842896, "Full-finetune/Loss (Raw)": 0.7799151539802551, "Full-finetune/Step": 3969, "Full-finetune/Step Time": 6.9277488477528095} {"Full-finetune/Learning Rate": 2.7861500296424372e-06, "Full-finetune/Loss": 0.7446293234825134, "Full-finetune/Loss (Raw)": 0.8495181202888489, "Full-finetune/Step": 3970, "Full-finetune/Step Time": 6.929151061922312} {"Full-finetune/Learning Rate": 2.781837210961689e-06, "Full-finetune/Loss": 0.7469218969345093, "Full-finetune/Loss (Raw)": 0.9038422107696533, "Full-finetune/Step": 3971, "Full-finetune/Step Time": 6.920848464593291} {"Full-finetune/Learning Rate": 2.7775271935089964e-06, "Full-finetune/Loss": 0.746967077255249, "Full-finetune/Loss (Raw)": 0.7691165804862976, "Full-finetune/Step": 3972, "Full-finetune/Step Time": 6.917840955778956} {"Full-finetune/Learning Rate": 2.7732199789569937e-06, "Full-finetune/Loss": 0.7469797730445862, "Full-finetune/Loss (Raw)": 0.767476499080658, "Full-finetune/Step": 3973, "Full-finetune/Step Time": 6.915043933317065} {"Full-finetune/Learning Rate": 2.768915568977222e-06, "Full-finetune/Loss": 0.7478143572807312, "Full-finetune/Loss (Raw)": 0.7346269488334656, "Full-finetune/Step": 3974, "Full-finetune/Step Time": 6.918116649612784} {"Full-finetune/Learning Rate": 2.7646139652401473e-06, "Full-finetune/Loss": 0.7480658292770386, "Full-finetune/Loss (Raw)": 0.9122040867805481, "Full-finetune/Step": 3975, "Full-finetune/Step Time": 6.915785972028971} {"Full-finetune/Learning Rate": 2.7603151694151354e-06, "Full-finetune/Loss": 0.7512073516845703, "Full-finetune/Loss (Raw)": 0.7279449105262756, "Full-finetune/Step": 3976, "Full-finetune/Step Time": 6.9090267941355705} {"Full-finetune/Learning Rate": 2.7560191831704584e-06, "Full-finetune/Loss": 0.7490200996398926, "Full-finetune/Loss (Raw)": 0.6147357821464539, "Full-finetune/Step": 3977, "Full-finetune/Step Time": 6.903716692700982} {"Full-finetune/Learning Rate": 2.751726008173312e-06, "Full-finetune/Loss": 0.7488776445388794, "Full-finetune/Loss (Raw)": 0.47159919142723083, "Full-finetune/Step": 3978, "Full-finetune/Step Time": 6.894918754696846} {"Full-finetune/Learning Rate": 2.747435646089791e-06, "Full-finetune/Loss": 0.7502482533454895, "Full-finetune/Loss (Raw)": 0.822234570980072, "Full-finetune/Step": 3979, "Full-finetune/Step Time": 6.8986050970852375} {"Full-finetune/Learning Rate": 2.7431480985849023e-06, "Full-finetune/Loss": 0.7477884888648987, "Full-finetune/Loss (Raw)": 0.5771152377128601, "Full-finetune/Step": 3980, "Full-finetune/Step Time": 6.900383917614818} {"Full-finetune/Learning Rate": 2.7388633673225586e-06, "Full-finetune/Loss": 0.750944972038269, "Full-finetune/Loss (Raw)": 0.856124222278595, "Full-finetune/Step": 3981, "Full-finetune/Step Time": 6.88306100666523} {"Full-finetune/Learning Rate": 2.734581453965579e-06, "Full-finetune/Loss": 0.7508187890052795, "Full-finetune/Loss (Raw)": 0.7848745584487915, "Full-finetune/Step": 3982, "Full-finetune/Step Time": 6.881979743018746} {"Full-finetune/Learning Rate": 2.730302360175693e-06, "Full-finetune/Loss": 0.752916693687439, "Full-finetune/Loss (Raw)": 0.7785009145736694, "Full-finetune/Step": 3983, "Full-finetune/Step Time": 6.865715941414237} {"Full-finetune/Learning Rate": 2.726026087613528e-06, "Full-finetune/Loss": 0.7485547065734863, "Full-finetune/Loss (Raw)": 0.33915314078330994, "Full-finetune/Step": 3984, "Full-finetune/Step Time": 6.8848265036940575} {"Full-finetune/Learning Rate": 2.7217526379386327e-06, "Full-finetune/Loss": 0.7522922158241272, "Full-finetune/Loss (Raw)": 0.8359267115592957, "Full-finetune/Step": 3985, "Full-finetune/Step Time": 6.87876882404089} {"Full-finetune/Learning Rate": 2.7174820128094393e-06, "Full-finetune/Loss": 0.7571463584899902, "Full-finetune/Loss (Raw)": 0.9492008090019226, "Full-finetune/Step": 3986, "Full-finetune/Step Time": 6.857625871896744} {"Full-finetune/Learning Rate": 2.713214213883295e-06, "Full-finetune/Loss": 0.7552486658096313, "Full-finetune/Loss (Raw)": 0.7097218632698059, "Full-finetune/Step": 3987, "Full-finetune/Step Time": 6.875339327380061} {"Full-finetune/Learning Rate": 2.7089492428164556e-06, "Full-finetune/Loss": 0.7554100751876831, "Full-finetune/Loss (Raw)": 0.8265772461891174, "Full-finetune/Step": 3988, "Full-finetune/Step Time": 6.878698633983731} {"Full-finetune/Learning Rate": 2.7046871012640687e-06, "Full-finetune/Loss": 0.7564237117767334, "Full-finetune/Loss (Raw)": 0.8660372495651245, "Full-finetune/Step": 3989, "Full-finetune/Step Time": 6.877461759373546} {"Full-finetune/Learning Rate": 2.7004277908801877e-06, "Full-finetune/Loss": 0.756208062171936, "Full-finetune/Loss (Raw)": 0.7902324795722961, "Full-finetune/Step": 3990, "Full-finetune/Step Time": 6.881915610283613} {"Full-finetune/Learning Rate": 2.6961713133177705e-06, "Full-finetune/Loss": 0.7577430009841919, "Full-finetune/Loss (Raw)": 0.8556638956069946, "Full-finetune/Step": 3991, "Full-finetune/Step Time": 6.874061970040202} {"Full-finetune/Learning Rate": 2.6919176702286696e-06, "Full-finetune/Loss": 0.7565597295761108, "Full-finetune/Loss (Raw)": 0.6558102369308472, "Full-finetune/Step": 3992, "Full-finetune/Step Time": 6.8915979862213135} {"Full-finetune/Learning Rate": 2.687666863263644e-06, "Full-finetune/Loss": 0.7573484182357788, "Full-finetune/Loss (Raw)": 0.8140462040901184, "Full-finetune/Step": 3993, "Full-finetune/Step Time": 6.858074270188808} {"Full-finetune/Learning Rate": 2.683418894072345e-06, "Full-finetune/Loss": 0.7555987238883972, "Full-finetune/Loss (Raw)": 0.6858187317848206, "Full-finetune/Step": 3994, "Full-finetune/Step Time": 6.87037349306047} {"Full-finetune/Learning Rate": 2.6791737643033333e-06, "Full-finetune/Loss": 0.7537673711776733, "Full-finetune/Loss (Raw)": 0.7409271001815796, "Full-finetune/Step": 3995, "Full-finetune/Step Time": 6.8703019469976425} {"Full-finetune/Learning Rate": 2.6749314756040547e-06, "Full-finetune/Loss": 0.7527116537094116, "Full-finetune/Loss (Raw)": 0.7045398950576782, "Full-finetune/Step": 3996, "Full-finetune/Step Time": 6.868305945768952} {"Full-finetune/Learning Rate": 2.6706920296208573e-06, "Full-finetune/Loss": 0.7524219155311584, "Full-finetune/Loss (Raw)": 0.6845476031303406, "Full-finetune/Step": 3997, "Full-finetune/Step Time": 6.856249378994107} {"Full-finetune/Learning Rate": 2.666455427998994e-06, "Full-finetune/Loss": 0.754006564617157, "Full-finetune/Loss (Raw)": 0.8761729598045349, "Full-finetune/Step": 3998, "Full-finetune/Step Time": 6.839968936517835} {"Full-finetune/Learning Rate": 2.6622216723826035e-06, "Full-finetune/Loss": 0.7537729740142822, "Full-finetune/Loss (Raw)": 0.7645151019096375, "Full-finetune/Step": 3999, "Full-finetune/Step Time": 6.834627894684672} {"Full-finetune/Learning Rate": 2.6579907644147227e-06, "Full-finetune/Loss": 0.756815493106842, "Full-finetune/Loss (Raw)": 0.7788975238800049, "Full-finetune/Step": 4000, "Full-finetune/Step Time": 6.804715149104595} {"Full-finetune/Learning Rate": 2.653762705737287e-06, "Full-finetune/Loss": 0.7574414014816284, "Full-finetune/Loss (Raw)": 0.7328919768333435, "Full-finetune/Step": 4001, "Full-finetune/Step Time": 6.816018313169479} {"Full-finetune/Learning Rate": 2.6495374979911215e-06, "Full-finetune/Loss": 0.756722092628479, "Full-finetune/Loss (Raw)": 0.6860722899436951, "Full-finetune/Step": 4002, "Full-finetune/Step Time": 6.826378570869565} {"Full-finetune/Learning Rate": 2.6453151428159472e-06, "Full-finetune/Loss": 0.7565380930900574, "Full-finetune/Loss (Raw)": 0.7424439191818237, "Full-finetune/Step": 4003, "Full-finetune/Step Time": 6.838338006287813} {"Full-finetune/Learning Rate": 2.641095641850375e-06, "Full-finetune/Loss": 0.7567535638809204, "Full-finetune/Loss (Raw)": 0.8317307233810425, "Full-finetune/Step": 4004, "Full-finetune/Step Time": 6.842859353870153} {"Full-finetune/Learning Rate": 2.6368789967319196e-06, "Full-finetune/Loss": 0.7574714422225952, "Full-finetune/Loss (Raw)": 0.7772665619850159, "Full-finetune/Step": 4005, "Full-finetune/Step Time": 6.827912453562021} {"Full-finetune/Learning Rate": 2.6326652090969697e-06, "Full-finetune/Loss": 0.7612612247467041, "Full-finetune/Loss (Raw)": 0.9505754709243774, "Full-finetune/Step": 4006, "Full-finetune/Step Time": 6.81708307005465} {"Full-finetune/Learning Rate": 2.6284542805808144e-06, "Full-finetune/Loss": 0.758678674697876, "Full-finetune/Loss (Raw)": 0.3558277487754822, "Full-finetune/Step": 4007, "Full-finetune/Step Time": 6.800245705991983} {"Full-finetune/Learning Rate": 2.624246212817638e-06, "Full-finetune/Loss": 0.7575695514678955, "Full-finetune/Loss (Raw)": 0.6652300357818604, "Full-finetune/Step": 4008, "Full-finetune/Step Time": 6.799018399789929} {"Full-finetune/Learning Rate": 2.620041007440508e-06, "Full-finetune/Loss": 0.7573928236961365, "Full-finetune/Loss (Raw)": 0.8000279068946838, "Full-finetune/Step": 4009, "Full-finetune/Step Time": 6.805395118892193} {"Full-finetune/Learning Rate": 2.6158386660813807e-06, "Full-finetune/Loss": 0.7563304901123047, "Full-finetune/Loss (Raw)": 0.6796491146087646, "Full-finetune/Step": 4010, "Full-finetune/Step Time": 6.823065700009465} {"Full-finetune/Learning Rate": 2.6116391903711035e-06, "Full-finetune/Loss": 0.7558926343917847, "Full-finetune/Loss (Raw)": 0.8259196281433105, "Full-finetune/Step": 4011, "Full-finetune/Step Time": 6.829397577792406} {"Full-finetune/Learning Rate": 2.607442581939411e-06, "Full-finetune/Loss": 0.7546290159225464, "Full-finetune/Loss (Raw)": 0.5521662831306458, "Full-finetune/Step": 4012, "Full-finetune/Step Time": 6.846946265548468} {"Full-finetune/Learning Rate": 2.603248842414925e-06, "Full-finetune/Loss": 0.756159782409668, "Full-finetune/Loss (Raw)": 0.7173062562942505, "Full-finetune/Step": 4013, "Full-finetune/Step Time": 6.841369664296508} {"Full-finetune/Learning Rate": 2.599057973425151e-06, "Full-finetune/Loss": 0.7565099000930786, "Full-finetune/Loss (Raw)": 0.7226393818855286, "Full-finetune/Step": 4014, "Full-finetune/Step Time": 6.856482297182083} {"Full-finetune/Learning Rate": 2.5948699765964915e-06, "Full-finetune/Loss": 0.7570233941078186, "Full-finetune/Loss (Raw)": 0.7747414708137512, "Full-finetune/Step": 4015, "Full-finetune/Step Time": 6.858300231397152} {"Full-finetune/Learning Rate": 2.5906848535542196e-06, "Full-finetune/Loss": 0.7571739554405212, "Full-finetune/Loss (Raw)": 0.7965124249458313, "Full-finetune/Step": 4016, "Full-finetune/Step Time": 6.849878519773483} {"Full-finetune/Learning Rate": 2.5865026059224974e-06, "Full-finetune/Loss": 0.7575478553771973, "Full-finetune/Loss (Raw)": 0.8247299790382385, "Full-finetune/Step": 4017, "Full-finetune/Step Time": 6.8519506230950356} {"Full-finetune/Learning Rate": 2.58232323532438e-06, "Full-finetune/Loss": 0.7539650201797485, "Full-finetune/Loss (Raw)": 0.320976197719574, "Full-finetune/Step": 4018, "Full-finetune/Step Time": 6.871899651363492} {"Full-finetune/Learning Rate": 2.5781467433817973e-06, "Full-finetune/Loss": 0.7558008432388306, "Full-finetune/Loss (Raw)": 0.9215400218963623, "Full-finetune/Step": 4019, "Full-finetune/Step Time": 6.852474234998226} {"Full-finetune/Learning Rate": 2.573973131715565e-06, "Full-finetune/Loss": 0.7564713954925537, "Full-finetune/Loss (Raw)": 0.8817571997642517, "Full-finetune/Step": 4020, "Full-finetune/Step Time": 6.851108280941844} {"Full-finetune/Learning Rate": 2.569802401945378e-06, "Full-finetune/Loss": 0.7597665190696716, "Full-finetune/Loss (Raw)": 0.7876890301704407, "Full-finetune/Step": 4021, "Full-finetune/Step Time": 6.843068782240152} {"Full-finetune/Learning Rate": 2.565634555689818e-06, "Full-finetune/Loss": 0.7592962980270386, "Full-finetune/Loss (Raw)": 0.7534353733062744, "Full-finetune/Step": 4022, "Full-finetune/Step Time": 6.846595732495189} {"Full-finetune/Learning Rate": 2.5614695945663415e-06, "Full-finetune/Loss": 0.7593976259231567, "Full-finetune/Loss (Raw)": 0.8135299682617188, "Full-finetune/Step": 4023, "Full-finetune/Step Time": 6.84991760738194} {"Full-finetune/Learning Rate": 2.557307520191291e-06, "Full-finetune/Loss": 0.7600229978561401, "Full-finetune/Loss (Raw)": 0.8683148622512817, "Full-finetune/Step": 4024, "Full-finetune/Step Time": 6.856244998052716} {"Full-finetune/Learning Rate": 2.5531483341798856e-06, "Full-finetune/Loss": 0.7598893046379089, "Full-finetune/Loss (Raw)": 0.7363290786743164, "Full-finetune/Step": 4025, "Full-finetune/Step Time": 6.856549611315131} {"Full-finetune/Learning Rate": 2.548992038146224e-06, "Full-finetune/Loss": 0.7607486248016357, "Full-finetune/Loss (Raw)": 0.8464885354042053, "Full-finetune/Step": 4026, "Full-finetune/Step Time": 6.844453984871507} {"Full-finetune/Learning Rate": 2.5448386337032817e-06, "Full-finetune/Loss": 0.7607941031455994, "Full-finetune/Loss (Raw)": 0.9039772748947144, "Full-finetune/Step": 4027, "Full-finetune/Step Time": 6.840781789273024} {"Full-finetune/Learning Rate": 2.5406881224629175e-06, "Full-finetune/Loss": 0.7605389952659607, "Full-finetune/Loss (Raw)": 0.7338951230049133, "Full-finetune/Step": 4028, "Full-finetune/Step Time": 6.826607834547758} {"Full-finetune/Learning Rate": 2.5365405060358663e-06, "Full-finetune/Loss": 0.7603561282157898, "Full-finetune/Loss (Raw)": 0.8378024101257324, "Full-finetune/Step": 4029, "Full-finetune/Step Time": 6.827110404148698} {"Full-finetune/Learning Rate": 2.532395786031726e-06, "Full-finetune/Loss": 0.75611412525177, "Full-finetune/Loss (Raw)": 0.3878038227558136, "Full-finetune/Step": 4030, "Full-finetune/Step Time": 6.842835275456309} {"Full-finetune/Learning Rate": 2.528253964058992e-06, "Full-finetune/Loss": 0.754977822303772, "Full-finetune/Loss (Raw)": 0.7398431301116943, "Full-finetune/Step": 4031, "Full-finetune/Step Time": 6.843902062624693} {"Full-finetune/Learning Rate": 2.5241150417250216e-06, "Full-finetune/Loss": 0.7548417448997498, "Full-finetune/Loss (Raw)": 0.7474530339241028, "Full-finetune/Step": 4032, "Full-finetune/Step Time": 6.837648700922728} {"Full-finetune/Learning Rate": 2.5199790206360486e-06, "Full-finetune/Loss": 0.7566744089126587, "Full-finetune/Loss (Raw)": 0.8572191596031189, "Full-finetune/Step": 4033, "Full-finetune/Step Time": 6.826219318434596} {"Full-finetune/Learning Rate": 2.5158459023971826e-06, "Full-finetune/Loss": 0.756685733795166, "Full-finetune/Loss (Raw)": 0.7711980938911438, "Full-finetune/Step": 4034, "Full-finetune/Step Time": 6.787781178951263} {"Full-finetune/Learning Rate": 2.511715688612405e-06, "Full-finetune/Loss": 0.7536701560020447, "Full-finetune/Loss (Raw)": 0.6572694182395935, "Full-finetune/Step": 4035, "Full-finetune/Step Time": 6.794811554253101} {"Full-finetune/Learning Rate": 2.5075883808845736e-06, "Full-finetune/Loss": 0.7570222020149231, "Full-finetune/Loss (Raw)": 0.9882979393005371, "Full-finetune/Step": 4036, "Full-finetune/Step Time": 6.781677452847362} {"Full-finetune/Learning Rate": 2.5034639808154115e-06, "Full-finetune/Loss": 0.7572187185287476, "Full-finetune/Loss (Raw)": 0.6857061386108398, "Full-finetune/Step": 4037, "Full-finetune/Step Time": 6.78821568749845} {"Full-finetune/Learning Rate": 2.4993424900055228e-06, "Full-finetune/Loss": 0.7533010244369507, "Full-finetune/Loss (Raw)": 0.3551306426525116, "Full-finetune/Step": 4038, "Full-finetune/Step Time": 6.804634751752019} {"Full-finetune/Learning Rate": 2.4952239100543808e-06, "Full-finetune/Loss": 0.7520009279251099, "Full-finetune/Loss (Raw)": 0.765078067779541, "Full-finetune/Step": 4039, "Full-finetune/Step Time": 6.825301580131054} {"Full-finetune/Learning Rate": 2.491108242560313e-06, "Full-finetune/Loss": 0.7532705664634705, "Full-finetune/Loss (Raw)": 0.8532112240791321, "Full-finetune/Step": 4040, "Full-finetune/Step Time": 6.814436413347721} {"Full-finetune/Learning Rate": 2.486995489120542e-06, "Full-finetune/Loss": 0.7526983618736267, "Full-finetune/Loss (Raw)": 0.7042186856269836, "Full-finetune/Step": 4041, "Full-finetune/Step Time": 6.808777000755072} {"Full-finetune/Learning Rate": 2.4828856513311405e-06, "Full-finetune/Loss": 0.752963125705719, "Full-finetune/Loss (Raw)": 0.7711102962493896, "Full-finetune/Step": 4042, "Full-finetune/Step Time": 6.822736971080303} {"Full-finetune/Learning Rate": 2.4787787307870605e-06, "Full-finetune/Loss": 0.7529738545417786, "Full-finetune/Loss (Raw)": 0.8379318118095398, "Full-finetune/Step": 4043, "Full-finetune/Step Time": 6.8359689842909575} {"Full-finetune/Learning Rate": 2.474674729082115e-06, "Full-finetune/Loss": 0.7526019811630249, "Full-finetune/Loss (Raw)": 0.7850601077079773, "Full-finetune/Step": 4044, "Full-finetune/Step Time": 6.828277081251144} {"Full-finetune/Learning Rate": 2.470573647808987e-06, "Full-finetune/Loss": 0.7491521835327148, "Full-finetune/Loss (Raw)": 0.2892717123031616, "Full-finetune/Step": 4045, "Full-finetune/Step Time": 6.837411556392908} {"Full-finetune/Learning Rate": 2.466475488559227e-06, "Full-finetune/Loss": 0.7478299140930176, "Full-finetune/Loss (Raw)": 0.71098393201828, "Full-finetune/Step": 4046, "Full-finetune/Step Time": 6.83455516025424} {"Full-finetune/Learning Rate": 2.4623802529232476e-06, "Full-finetune/Loss": 0.7477506399154663, "Full-finetune/Loss (Raw)": 0.7396585941314697, "Full-finetune/Step": 4047, "Full-finetune/Step Time": 6.837121607735753} {"Full-finetune/Learning Rate": 2.458287942490335e-06, "Full-finetune/Loss": 0.7444251775741577, "Full-finetune/Loss (Raw)": 0.36184102296829224, "Full-finetune/Step": 4048, "Full-finetune/Step Time": 6.8211835864931345} {"Full-finetune/Learning Rate": 2.454198558848635e-06, "Full-finetune/Loss": 0.7448325753211975, "Full-finetune/Loss (Raw)": 0.6484639644622803, "Full-finetune/Step": 4049, "Full-finetune/Step Time": 6.804431583732367} {"Full-finetune/Learning Rate": 2.4501121035851494e-06, "Full-finetune/Loss": 0.7438890337944031, "Full-finetune/Loss (Raw)": 0.7420331239700317, "Full-finetune/Step": 4050, "Full-finetune/Step Time": 6.802575135603547} {"Full-finetune/Learning Rate": 2.4460285782857606e-06, "Full-finetune/Loss": 0.74552321434021, "Full-finetune/Loss (Raw)": 0.711156964302063, "Full-finetune/Step": 4051, "Full-finetune/Step Time": 6.793753484264016} {"Full-finetune/Learning Rate": 2.441947984535201e-06, "Full-finetune/Loss": 0.7447804808616638, "Full-finetune/Loss (Raw)": 0.7435974478721619, "Full-finetune/Step": 4052, "Full-finetune/Step Time": 6.813806407153606} {"Full-finetune/Learning Rate": 2.4378703239170707e-06, "Full-finetune/Loss": 0.741202712059021, "Full-finetune/Loss (Raw)": 0.3692225515842438, "Full-finetune/Step": 4053, "Full-finetune/Step Time": 6.830480037257075} {"Full-finetune/Learning Rate": 2.4337955980138293e-06, "Full-finetune/Loss": 0.740604043006897, "Full-finetune/Loss (Raw)": 0.6187857389450073, "Full-finetune/Step": 4054, "Full-finetune/Step Time": 6.839277558028698} {"Full-finetune/Learning Rate": 2.4297238084067988e-06, "Full-finetune/Loss": 0.7409456968307495, "Full-finetune/Loss (Raw)": 0.7826454639434814, "Full-finetune/Step": 4055, "Full-finetune/Step Time": 6.821154272183776} {"Full-finetune/Learning Rate": 2.425654956676161e-06, "Full-finetune/Loss": 0.7386462688446045, "Full-finetune/Loss (Raw)": 0.5650540590286255, "Full-finetune/Step": 4056, "Full-finetune/Step Time": 6.83677251636982} {"Full-finetune/Learning Rate": 2.421589044400955e-06, "Full-finetune/Loss": 0.738906979560852, "Full-finetune/Loss (Raw)": 0.8721878528594971, "Full-finetune/Step": 4057, "Full-finetune/Step Time": 6.833024935796857} {"Full-finetune/Learning Rate": 2.4175260731590878e-06, "Full-finetune/Loss": 0.739149808883667, "Full-finetune/Loss (Raw)": 0.736309289932251, "Full-finetune/Step": 4058, "Full-finetune/Step Time": 6.813998429104686} {"Full-finetune/Learning Rate": 2.413466044527318e-06, "Full-finetune/Loss": 0.7376559972763062, "Full-finetune/Loss (Raw)": 0.7035654783248901, "Full-finetune/Step": 4059, "Full-finetune/Step Time": 6.817485569044948} {"Full-finetune/Learning Rate": 2.4094089600812576e-06, "Full-finetune/Loss": 0.7357711791992188, "Full-finetune/Loss (Raw)": 0.4516054689884186, "Full-finetune/Step": 4060, "Full-finetune/Step Time": 6.819287534803152} {"Full-finetune/Learning Rate": 2.405354821395388e-06, "Full-finetune/Loss": 0.7363548278808594, "Full-finetune/Loss (Raw)": 0.6019173860549927, "Full-finetune/Step": 4061, "Full-finetune/Step Time": 6.811273455619812} {"Full-finetune/Learning Rate": 2.4013036300430403e-06, "Full-finetune/Loss": 0.7371993660926819, "Full-finetune/Loss (Raw)": 0.8155166506767273, "Full-finetune/Step": 4062, "Full-finetune/Step Time": 6.813582157716155} {"Full-finetune/Learning Rate": 2.3972553875964035e-06, "Full-finetune/Loss": 0.7340133190155029, "Full-finetune/Loss (Raw)": 0.3504851758480072, "Full-finetune/Step": 4063, "Full-finetune/Step Time": 6.820462424308062} {"Full-finetune/Learning Rate": 2.393210095626515e-06, "Full-finetune/Loss": 0.7300900220870972, "Full-finetune/Loss (Raw)": 0.3790079653263092, "Full-finetune/Step": 4064, "Full-finetune/Step Time": 6.839361142367125} {"Full-finetune/Learning Rate": 2.38916775570328e-06, "Full-finetune/Loss": 0.7285775542259216, "Full-finetune/Loss (Raw)": 0.6246500611305237, "Full-finetune/Step": 4065, "Full-finetune/Step Time": 6.8447809889912605} {"Full-finetune/Learning Rate": 2.3851283693954506e-06, "Full-finetune/Loss": 0.7289276123046875, "Full-finetune/Loss (Raw)": 0.7953083515167236, "Full-finetune/Step": 4066, "Full-finetune/Step Time": 6.84862862713635} {"Full-finetune/Learning Rate": 2.3810919382706297e-06, "Full-finetune/Loss": 0.7293121814727783, "Full-finetune/Loss (Raw)": 0.8598923683166504, "Full-finetune/Step": 4067, "Full-finetune/Step Time": 6.856131058186293} {"Full-finetune/Learning Rate": 2.3770584638952874e-06, "Full-finetune/Loss": 0.729185938835144, "Full-finetune/Loss (Raw)": 0.8080762624740601, "Full-finetune/Step": 4068, "Full-finetune/Step Time": 6.868439864367247} {"Full-finetune/Learning Rate": 2.3730279478347275e-06, "Full-finetune/Loss": 0.7293225526809692, "Full-finetune/Loss (Raw)": 0.8591228127479553, "Full-finetune/Step": 4069, "Full-finetune/Step Time": 6.880586078390479} {"Full-finetune/Learning Rate": 2.3690003916531157e-06, "Full-finetune/Loss": 0.7284823060035706, "Full-finetune/Loss (Raw)": 0.7533397078514099, "Full-finetune/Step": 4070, "Full-finetune/Step Time": 6.874864837154746} {"Full-finetune/Learning Rate": 2.3649757969134667e-06, "Full-finetune/Loss": 0.7293500900268555, "Full-finetune/Loss (Raw)": 0.7214946150779724, "Full-finetune/Step": 4071, "Full-finetune/Step Time": 6.879869628697634} {"Full-finetune/Learning Rate": 2.3609541651776537e-06, "Full-finetune/Loss": 0.727973222732544, "Full-finetune/Loss (Raw)": 0.6646429896354675, "Full-finetune/Step": 4072, "Full-finetune/Step Time": 6.888609996065497} {"Full-finetune/Learning Rate": 2.356935498006391e-06, "Full-finetune/Loss": 0.726323127746582, "Full-finetune/Loss (Raw)": 0.7653822898864746, "Full-finetune/Step": 4073, "Full-finetune/Step Time": 6.871024599298835} {"Full-finetune/Learning Rate": 2.3529197969592375e-06, "Full-finetune/Loss": 0.7272933125495911, "Full-finetune/Loss (Raw)": 0.8862715363502502, "Full-finetune/Step": 4074, "Full-finetune/Step Time": 6.85763162560761} {"Full-finetune/Learning Rate": 2.3489070635946175e-06, "Full-finetune/Loss": 0.7267714738845825, "Full-finetune/Loss (Raw)": 0.7266564965248108, "Full-finetune/Step": 4075, "Full-finetune/Step Time": 6.835781684145331} {"Full-finetune/Learning Rate": 2.3448972994697906e-06, "Full-finetune/Loss": 0.7284356355667114, "Full-finetune/Loss (Raw)": 0.5689897537231445, "Full-finetune/Step": 4076, "Full-finetune/Step Time": 6.83563463576138} {"Full-finetune/Learning Rate": 2.340890506140869e-06, "Full-finetune/Loss": 0.7278894186019897, "Full-finetune/Loss (Raw)": 0.795068621635437, "Full-finetune/Step": 4077, "Full-finetune/Step Time": 6.848675003275275} {"Full-finetune/Learning Rate": 2.3368866851628102e-06, "Full-finetune/Loss": 0.7268011569976807, "Full-finetune/Loss (Raw)": 0.730962336063385, "Full-finetune/Step": 4078, "Full-finetune/Step Time": 6.851597247645259} {"Full-finetune/Learning Rate": 2.3328858380894194e-06, "Full-finetune/Loss": 0.7265760898590088, "Full-finetune/Loss (Raw)": 0.8493759632110596, "Full-finetune/Step": 4079, "Full-finetune/Step Time": 6.8625699784606695} {"Full-finetune/Learning Rate": 2.328887966473348e-06, "Full-finetune/Loss": 0.7266207933425903, "Full-finetune/Loss (Raw)": 0.6730949878692627, "Full-finetune/Step": 4080, "Full-finetune/Step Time": 6.862810904160142} {"Full-finetune/Learning Rate": 2.324893071866087e-06, "Full-finetune/Loss": 0.7262885570526123, "Full-finetune/Loss (Raw)": 0.7124890089035034, "Full-finetune/Step": 4081, "Full-finetune/Step Time": 6.883520681411028} {"Full-finetune/Learning Rate": 2.320901155817983e-06, "Full-finetune/Loss": 0.7260931730270386, "Full-finetune/Loss (Raw)": 0.7135891318321228, "Full-finetune/Step": 4082, "Full-finetune/Step Time": 6.880672093480825} {"Full-finetune/Learning Rate": 2.316912219878222e-06, "Full-finetune/Loss": 0.727629542350769, "Full-finetune/Loss (Raw)": 0.8553019165992737, "Full-finetune/Step": 4083, "Full-finetune/Step Time": 6.883082799613476} {"Full-finetune/Learning Rate": 2.312926265594825e-06, "Full-finetune/Loss": 0.7242095470428467, "Full-finetune/Loss (Raw)": 0.46018412709236145, "Full-finetune/Step": 4084, "Full-finetune/Step Time": 6.896417060866952} {"Full-finetune/Learning Rate": 2.308943294514667e-06, "Full-finetune/Loss": 0.7223966717720032, "Full-finetune/Loss (Raw)": 0.5849504470825195, "Full-finetune/Step": 4085, "Full-finetune/Step Time": 6.907622113823891} {"Full-finetune/Learning Rate": 2.3049633081834634e-06, "Full-finetune/Loss": 0.7221027612686157, "Full-finetune/Loss (Raw)": 0.6884012818336487, "Full-finetune/Step": 4086, "Full-finetune/Step Time": 6.914628865197301} {"Full-finetune/Learning Rate": 2.3009863081457663e-06, "Full-finetune/Loss": 0.7239508628845215, "Full-finetune/Loss (Raw)": 0.8758555054664612, "Full-finetune/Step": 4087, "Full-finetune/Step Time": 6.902479637414217} {"Full-finetune/Learning Rate": 2.2970122959449716e-06, "Full-finetune/Loss": 0.7251390218734741, "Full-finetune/Loss (Raw)": 0.814176082611084, "Full-finetune/Step": 4088, "Full-finetune/Step Time": 6.897752853110433} {"Full-finetune/Learning Rate": 2.2930412731233174e-06, "Full-finetune/Loss": 0.7250198125839233, "Full-finetune/Loss (Raw)": 0.7778798937797546, "Full-finetune/Step": 4089, "Full-finetune/Step Time": 6.898739529773593} {"Full-finetune/Learning Rate": 2.2890732412218795e-06, "Full-finetune/Loss": 0.7261578440666199, "Full-finetune/Loss (Raw)": 0.7881561517715454, "Full-finetune/Step": 4090, "Full-finetune/Step Time": 6.890548914670944} {"Full-finetune/Learning Rate": 2.2851082017805704e-06, "Full-finetune/Loss": 0.7254940271377563, "Full-finetune/Loss (Raw)": 0.7554455995559692, "Full-finetune/Step": 4091, "Full-finetune/Step Time": 6.9026133716106415} {"Full-finetune/Learning Rate": 2.2811461563381497e-06, "Full-finetune/Loss": 0.725019097328186, "Full-finetune/Loss (Raw)": 0.7440633177757263, "Full-finetune/Step": 4092, "Full-finetune/Step Time": 6.904024597257376} {"Full-finetune/Learning Rate": 2.2771871064322117e-06, "Full-finetune/Loss": 0.725825309753418, "Full-finetune/Loss (Raw)": 0.8906838297843933, "Full-finetune/Step": 4093, "Full-finetune/Step Time": 6.889077674597502} {"Full-finetune/Learning Rate": 2.2732310535991775e-06, "Full-finetune/Loss": 0.7304561138153076, "Full-finetune/Loss (Raw)": 0.9723620414733887, "Full-finetune/Step": 4094, "Full-finetune/Step Time": 6.870942328125238} {"Full-finetune/Learning Rate": 2.2692779993743207e-06, "Full-finetune/Loss": 0.729600191116333, "Full-finetune/Loss (Raw)": 0.6772751808166504, "Full-finetune/Step": 4095, "Full-finetune/Step Time": 6.877898842096329} {"Full-finetune/Learning Rate": 2.265327945291742e-06, "Full-finetune/Loss": 0.7302642464637756, "Full-finetune/Loss (Raw)": 0.9117608070373535, "Full-finetune/Step": 4096, "Full-finetune/Step Time": 6.881810130551457} {"Full-finetune/Learning Rate": 2.2613808928843827e-06, "Full-finetune/Loss": 0.7307497262954712, "Full-finetune/Loss (Raw)": 0.8420581221580505, "Full-finetune/Step": 4097, "Full-finetune/Step Time": 6.876688765361905} {"Full-finetune/Learning Rate": 2.2574368436840144e-06, "Full-finetune/Loss": 0.7287867665290833, "Full-finetune/Loss (Raw)": 0.598253607749939, "Full-finetune/Step": 4098, "Full-finetune/Step Time": 6.883791871368885} {"Full-finetune/Learning Rate": 2.2534957992212457e-06, "Full-finetune/Loss": 0.7279029488563538, "Full-finetune/Loss (Raw)": 0.7907145619392395, "Full-finetune/Step": 4099, "Full-finetune/Step Time": 6.896618137136102} {"Full-finetune/Learning Rate": 2.2495577610255203e-06, "Full-finetune/Loss": 0.729025661945343, "Full-finetune/Loss (Raw)": 0.912821888923645, "Full-finetune/Step": 4100, "Full-finetune/Step Time": 6.895871261134744} {"Full-finetune/Learning Rate": 2.24562273062511e-06, "Full-finetune/Loss": 0.7289992570877075, "Full-finetune/Loss (Raw)": 0.764096736907959, "Full-finetune/Step": 4101, "Full-finetune/Step Time": 6.915932698175311} {"Full-finetune/Learning Rate": 2.2416907095471296e-06, "Full-finetune/Loss": 0.7291508913040161, "Full-finetune/Loss (Raw)": 0.7540433406829834, "Full-finetune/Step": 4102, "Full-finetune/Step Time": 6.91206824593246} {"Full-finetune/Learning Rate": 2.237761699317519e-06, "Full-finetune/Loss": 0.7282295227050781, "Full-finetune/Loss (Raw)": 0.7942630052566528, "Full-finetune/Step": 4103, "Full-finetune/Step Time": 6.914372943341732} {"Full-finetune/Learning Rate": 2.2338357014610425e-06, "Full-finetune/Loss": 0.7289496064186096, "Full-finetune/Loss (Raw)": 0.820115327835083, "Full-finetune/Step": 4104, "Full-finetune/Step Time": 6.901523757725954} {"Full-finetune/Learning Rate": 2.2299127175013113e-06, "Full-finetune/Loss": 0.7292300462722778, "Full-finetune/Loss (Raw)": 0.6506249904632568, "Full-finetune/Step": 4105, "Full-finetune/Step Time": 6.894724076613784} {"Full-finetune/Learning Rate": 2.2259927489607568e-06, "Full-finetune/Loss": 0.7313266396522522, "Full-finetune/Loss (Raw)": 0.7399737238883972, "Full-finetune/Step": 4106, "Full-finetune/Step Time": 6.892239291220903} {"Full-finetune/Learning Rate": 2.222075797360641e-06, "Full-finetune/Loss": 0.7306506633758545, "Full-finetune/Loss (Raw)": 0.7357075214385986, "Full-finetune/Step": 4107, "Full-finetune/Step Time": 6.893455097451806} {"Full-finetune/Learning Rate": 2.2181618642210577e-06, "Full-finetune/Loss": 0.7326390147209167, "Full-finetune/Loss (Raw)": 0.8316237330436707, "Full-finetune/Step": 4108, "Full-finetune/Step Time": 6.8917419239878654} {"Full-finetune/Learning Rate": 2.2142509510609277e-06, "Full-finetune/Loss": 0.7316297292709351, "Full-finetune/Loss (Raw)": 0.726942241191864, "Full-finetune/Step": 4109, "Full-finetune/Step Time": 6.899200119078159} {"Full-finetune/Learning Rate": 2.210343059397999e-06, "Full-finetune/Loss": 0.7314358949661255, "Full-finetune/Loss (Raw)": 0.760055422782898, "Full-finetune/Step": 4110, "Full-finetune/Step Time": 6.905959729105234} {"Full-finetune/Learning Rate": 2.206438190748846e-06, "Full-finetune/Loss": 0.7325252890586853, "Full-finetune/Loss (Raw)": 0.9179394841194153, "Full-finetune/Step": 4111, "Full-finetune/Step Time": 6.911910191178322} {"Full-finetune/Learning Rate": 2.2025363466288796e-06, "Full-finetune/Loss": 0.7344591617584229, "Full-finetune/Loss (Raw)": 0.5866984724998474, "Full-finetune/Step": 4112, "Full-finetune/Step Time": 6.9051120188087225} {"Full-finetune/Learning Rate": 2.1986375285523233e-06, "Full-finetune/Loss": 0.7328959703445435, "Full-finetune/Loss (Raw)": 0.6358370780944824, "Full-finetune/Step": 4113, "Full-finetune/Step Time": 6.892598107457161} {"Full-finetune/Learning Rate": 2.194741738032229e-06, "Full-finetune/Loss": 0.731731116771698, "Full-finetune/Loss (Raw)": 0.8001014590263367, "Full-finetune/Step": 4114, "Full-finetune/Step Time": 6.8941648211330175} {"Full-finetune/Learning Rate": 2.1908489765804853e-06, "Full-finetune/Loss": 0.7325579524040222, "Full-finetune/Loss (Raw)": 0.8155536651611328, "Full-finetune/Step": 4115, "Full-finetune/Step Time": 6.87911462597549} {"Full-finetune/Learning Rate": 2.1869592457077924e-06, "Full-finetune/Loss": 0.7301589250564575, "Full-finetune/Loss (Raw)": 0.5195016860961914, "Full-finetune/Step": 4116, "Full-finetune/Step Time": 6.893573148176074} {"Full-finetune/Learning Rate": 2.183072546923679e-06, "Full-finetune/Loss": 0.728295087814331, "Full-finetune/Loss (Raw)": 0.6274608969688416, "Full-finetune/Step": 4117, "Full-finetune/Step Time": 6.9123882707208395} {"Full-finetune/Learning Rate": 2.179188881736498e-06, "Full-finetune/Loss": 0.729496955871582, "Full-finetune/Loss (Raw)": 0.9440723061561584, "Full-finetune/Step": 4118, "Full-finetune/Step Time": 6.914199450984597} {"Full-finetune/Learning Rate": 2.1753082516534242e-06, "Full-finetune/Loss": 0.7299339771270752, "Full-finetune/Loss (Raw)": 0.9116045236587524, "Full-finetune/Step": 4119, "Full-finetune/Step Time": 6.9084795862436295} {"Full-finetune/Learning Rate": 2.1714306581804533e-06, "Full-finetune/Loss": 0.7301178574562073, "Full-finetune/Loss (Raw)": 0.6793481111526489, "Full-finetune/Step": 4120, "Full-finetune/Step Time": 6.9031667578965425} {"Full-finetune/Learning Rate": 2.1675561028224012e-06, "Full-finetune/Loss": 0.7300592660903931, "Full-finetune/Loss (Raw)": 0.8065398335456848, "Full-finetune/Step": 4121, "Full-finetune/Step Time": 6.91822974011302} {"Full-finetune/Learning Rate": 2.163684587082915e-06, "Full-finetune/Loss": 0.7301497459411621, "Full-finetune/Loss (Raw)": 0.6974130272865295, "Full-finetune/Step": 4122, "Full-finetune/Step Time": 6.916470143944025} {"Full-finetune/Learning Rate": 2.159816112464447e-06, "Full-finetune/Loss": 0.7315888404846191, "Full-finetune/Loss (Raw)": 0.9251300692558289, "Full-finetune/Step": 4123, "Full-finetune/Step Time": 6.917135624215007} {"Full-finetune/Learning Rate": 2.1559506804682762e-06, "Full-finetune/Loss": 0.7304297685623169, "Full-finetune/Loss (Raw)": 0.5561751127243042, "Full-finetune/Step": 4124, "Full-finetune/Step Time": 6.918549105525017} {"Full-finetune/Learning Rate": 2.1520882925945074e-06, "Full-finetune/Loss": 0.7312934398651123, "Full-finetune/Loss (Raw)": 0.7950916290283203, "Full-finetune/Step": 4125, "Full-finetune/Step Time": 6.92169133014977} {"Full-finetune/Learning Rate": 2.1482289503420537e-06, "Full-finetune/Loss": 0.7309343814849854, "Full-finetune/Loss (Raw)": 0.8302145004272461, "Full-finetune/Step": 4126, "Full-finetune/Step Time": 6.915222084149718} {"Full-finetune/Learning Rate": 2.144372655208653e-06, "Full-finetune/Loss": 0.7312682867050171, "Full-finetune/Loss (Raw)": 0.8072550296783447, "Full-finetune/Step": 4127, "Full-finetune/Step Time": 6.89521093852818} {"Full-finetune/Learning Rate": 2.1405194086908555e-06, "Full-finetune/Loss": 0.7310469150543213, "Full-finetune/Loss (Raw)": 0.7505650520324707, "Full-finetune/Step": 4128, "Full-finetune/Step Time": 6.890535295009613} {"Full-finetune/Learning Rate": 2.1366692122840317e-06, "Full-finetune/Loss": 0.7314136028289795, "Full-finetune/Loss (Raw)": 0.7798200249671936, "Full-finetune/Step": 4129, "Full-finetune/Step Time": 6.870578125119209} {"Full-finetune/Learning Rate": 2.1328220674823686e-06, "Full-finetune/Loss": 0.7320621013641357, "Full-finetune/Loss (Raw)": 0.7690933346748352, "Full-finetune/Step": 4130, "Full-finetune/Step Time": 6.8606626987457275} {"Full-finetune/Learning Rate": 2.1289779757788655e-06, "Full-finetune/Loss": 0.7323793172836304, "Full-finetune/Loss (Raw)": 0.7830362915992737, "Full-finetune/Step": 4131, "Full-finetune/Step Time": 6.853457733988762} {"Full-finetune/Learning Rate": 2.1251369386653454e-06, "Full-finetune/Loss": 0.7321701049804688, "Full-finetune/Loss (Raw)": 0.8049531579017639, "Full-finetune/Step": 4132, "Full-finetune/Step Time": 6.854354467242956} {"Full-finetune/Learning Rate": 2.121298957632434e-06, "Full-finetune/Loss": 0.7316639423370361, "Full-finetune/Loss (Raw)": 0.7124814987182617, "Full-finetune/Step": 4133, "Full-finetune/Step Time": 6.861760338768363} {"Full-finetune/Learning Rate": 2.117464034169575e-06, "Full-finetune/Loss": 0.7300492525100708, "Full-finetune/Loss (Raw)": 0.743891716003418, "Full-finetune/Step": 4134, "Full-finetune/Step Time": 6.867211546748877} {"Full-finetune/Learning Rate": 2.113632169765033e-06, "Full-finetune/Loss": 0.732681393623352, "Full-finetune/Loss (Raw)": 0.6927490830421448, "Full-finetune/Step": 4135, "Full-finetune/Step Time": 6.849499173462391} {"Full-finetune/Learning Rate": 2.1098033659058792e-06, "Full-finetune/Loss": 0.7332773208618164, "Full-finetune/Loss (Raw)": 0.741499662399292, "Full-finetune/Step": 4136, "Full-finetune/Step Time": 6.8490352761000395} {"Full-finetune/Learning Rate": 2.105977624077995e-06, "Full-finetune/Loss": 0.7324355840682983, "Full-finetune/Loss (Raw)": 0.6922917366027832, "Full-finetune/Step": 4137, "Full-finetune/Step Time": 6.8363356590271} {"Full-finetune/Learning Rate": 2.102154945766076e-06, "Full-finetune/Loss": 0.7338119149208069, "Full-finetune/Loss (Raw)": 0.8558197617530823, "Full-finetune/Step": 4138, "Full-finetune/Step Time": 6.812310790643096} {"Full-finetune/Learning Rate": 2.0983353324536316e-06, "Full-finetune/Loss": 0.7329139709472656, "Full-finetune/Loss (Raw)": 0.710983157157898, "Full-finetune/Step": 4139, "Full-finetune/Step Time": 6.802106602117419} {"Full-finetune/Learning Rate": 2.0945187856229778e-06, "Full-finetune/Loss": 0.7342071533203125, "Full-finetune/Loss (Raw)": 0.7176981568336487, "Full-finetune/Step": 4140, "Full-finetune/Step Time": 6.792222112417221} {"Full-finetune/Learning Rate": 2.0907053067552384e-06, "Full-finetune/Loss": 0.7315980792045593, "Full-finetune/Loss (Raw)": 0.3833365738391876, "Full-finetune/Step": 4141, "Full-finetune/Step Time": 6.800939988344908} {"Full-finetune/Learning Rate": 2.0868948973303593e-06, "Full-finetune/Loss": 0.7314945459365845, "Full-finetune/Loss (Raw)": 0.7093870639801025, "Full-finetune/Step": 4142, "Full-finetune/Step Time": 6.778001483529806} {"Full-finetune/Learning Rate": 2.0830875588270773e-06, "Full-finetune/Loss": 0.7310546636581421, "Full-finetune/Loss (Raw)": 0.7184405326843262, "Full-finetune/Step": 4143, "Full-finetune/Step Time": 6.774259088560939} {"Full-finetune/Learning Rate": 2.0792832927229465e-06, "Full-finetune/Loss": 0.7270489931106567, "Full-finetune/Loss (Raw)": 0.28378522396087646, "Full-finetune/Step": 4144, "Full-finetune/Step Time": 6.788860829547048} {"Full-finetune/Learning Rate": 2.0754821004943337e-06, "Full-finetune/Loss": 0.7257564663887024, "Full-finetune/Loss (Raw)": 0.6592816114425659, "Full-finetune/Step": 4145, "Full-finetune/Step Time": 6.797510232776403} {"Full-finetune/Learning Rate": 2.071683983616406e-06, "Full-finetune/Loss": 0.729712963104248, "Full-finetune/Loss (Raw)": 0.8274169564247131, "Full-finetune/Step": 4146, "Full-finetune/Step Time": 6.774262145161629} {"Full-finetune/Learning Rate": 2.0678889435631333e-06, "Full-finetune/Loss": 0.7286084890365601, "Full-finetune/Loss (Raw)": 0.7801547646522522, "Full-finetune/Step": 4147, "Full-finetune/Step Time": 6.780002947896719} {"Full-finetune/Learning Rate": 2.064096981807302e-06, "Full-finetune/Loss": 0.7282772660255432, "Full-finetune/Loss (Raw)": 0.8393710851669312, "Full-finetune/Step": 4148, "Full-finetune/Step Time": 6.780457194894552} {"Full-finetune/Learning Rate": 2.060308099820496e-06, "Full-finetune/Loss": 0.7280620336532593, "Full-finetune/Loss (Raw)": 0.7601375579833984, "Full-finetune/Step": 4149, "Full-finetune/Step Time": 6.769812675192952} {"Full-finetune/Learning Rate": 2.056522299073108e-06, "Full-finetune/Loss": 0.727143406867981, "Full-finetune/Loss (Raw)": 0.6358558535575867, "Full-finetune/Step": 4150, "Full-finetune/Step Time": 6.79456620849669} {"Full-finetune/Learning Rate": 2.052739581034332e-06, "Full-finetune/Loss": 0.7268131971359253, "Full-finetune/Loss (Raw)": 0.771253228187561, "Full-finetune/Step": 4151, "Full-finetune/Step Time": 6.799382772296667} {"Full-finetune/Learning Rate": 2.0489599471721678e-06, "Full-finetune/Loss": 0.7260156869888306, "Full-finetune/Loss (Raw)": 0.7662307620048523, "Full-finetune/Step": 4152, "Full-finetune/Step Time": 6.804108204320073} {"Full-finetune/Learning Rate": 2.0451833989534165e-06, "Full-finetune/Loss": 0.7259156703948975, "Full-finetune/Loss (Raw)": 0.7235308885574341, "Full-finetune/Step": 4153, "Full-finetune/Step Time": 6.8015154749155045} {"Full-finetune/Learning Rate": 2.0414099378436812e-06, "Full-finetune/Loss": 0.7255048751831055, "Full-finetune/Loss (Raw)": 0.7939116954803467, "Full-finetune/Step": 4154, "Full-finetune/Step Time": 6.805761961266398} {"Full-finetune/Learning Rate": 2.0376395653073735e-06, "Full-finetune/Loss": 0.7241491079330444, "Full-finetune/Loss (Raw)": 0.7304379343986511, "Full-finetune/Step": 4155, "Full-finetune/Step Time": 6.807885590940714} {"Full-finetune/Learning Rate": 2.0338722828077007e-06, "Full-finetune/Loss": 0.7237544059753418, "Full-finetune/Loss (Raw)": 0.6833807826042175, "Full-finetune/Step": 4156, "Full-finetune/Step Time": 6.807278800755739} {"Full-finetune/Learning Rate": 2.030108091806664e-06, "Full-finetune/Loss": 0.7240956425666809, "Full-finetune/Loss (Raw)": 0.8814689517021179, "Full-finetune/Step": 4157, "Full-finetune/Step Time": 6.80836090259254} {"Full-finetune/Learning Rate": 2.0263469937650813e-06, "Full-finetune/Loss": 0.7271312475204468, "Full-finetune/Loss (Raw)": 0.7763699293136597, "Full-finetune/Step": 4158, "Full-finetune/Step Time": 6.799580607563257} {"Full-finetune/Learning Rate": 2.0225889901425565e-06, "Full-finetune/Loss": 0.7280230522155762, "Full-finetune/Loss (Raw)": 0.853984534740448, "Full-finetune/Step": 4159, "Full-finetune/Step Time": 6.799411837011576} {"Full-finetune/Learning Rate": 2.0188340823975005e-06, "Full-finetune/Loss": 0.7291539907455444, "Full-finetune/Loss (Raw)": 0.8922189474105835, "Full-finetune/Step": 4160, "Full-finetune/Step Time": 6.813734786584973} {"Full-finetune/Learning Rate": 2.0150822719871167e-06, "Full-finetune/Loss": 0.7287061810493469, "Full-finetune/Loss (Raw)": 0.7998932600021362, "Full-finetune/Step": 4161, "Full-finetune/Step Time": 6.811257887631655} {"Full-finetune/Learning Rate": 2.011333560367411e-06, "Full-finetune/Loss": 0.7297892570495605, "Full-finetune/Loss (Raw)": 0.9098362922668457, "Full-finetune/Step": 4162, "Full-finetune/Step Time": 6.812368921935558} {"Full-finetune/Learning Rate": 2.007587948993185e-06, "Full-finetune/Loss": 0.7294982075691223, "Full-finetune/Loss (Raw)": 0.6200106739997864, "Full-finetune/Step": 4163, "Full-finetune/Step Time": 6.823134858161211} {"Full-finetune/Learning Rate": 2.003845439318035e-06, "Full-finetune/Loss": 0.7254551649093628, "Full-finetune/Loss (Raw)": 0.47079402208328247, "Full-finetune/Step": 4164, "Full-finetune/Step Time": 6.835302514955401} {"Full-finetune/Learning Rate": 2.000106032794361e-06, "Full-finetune/Loss": 0.7270305156707764, "Full-finetune/Loss (Raw)": 0.8873412013053894, "Full-finetune/Step": 4165, "Full-finetune/Step Time": 6.828322960063815} {"Full-finetune/Learning Rate": 1.996369730873353e-06, "Full-finetune/Loss": 0.7311103343963623, "Full-finetune/Loss (Raw)": 0.8773556351661682, "Full-finetune/Step": 4166, "Full-finetune/Step Time": 6.809045193716884} {"Full-finetune/Learning Rate": 1.99263653500499e-06, "Full-finetune/Loss": 0.7307577729225159, "Full-finetune/Loss (Raw)": 0.7199535369873047, "Full-finetune/Step": 4167, "Full-finetune/Step Time": 6.793037511408329} {"Full-finetune/Learning Rate": 1.9889064466380593e-06, "Full-finetune/Loss": 0.7288637161254883, "Full-finetune/Loss (Raw)": 0.6107701659202576, "Full-finetune/Step": 4168, "Full-finetune/Step Time": 6.791113218292594} {"Full-finetune/Learning Rate": 1.985179467220133e-06, "Full-finetune/Loss": 0.7261784076690674, "Full-finetune/Loss (Raw)": 0.3604983389377594, "Full-finetune/Step": 4169, "Full-finetune/Step Time": 6.810268761590123} {"Full-finetune/Learning Rate": 1.9814555981975803e-06, "Full-finetune/Loss": 0.7251995801925659, "Full-finetune/Loss (Raw)": 0.6458157896995544, "Full-finetune/Step": 4170, "Full-finetune/Step Time": 6.801346285268664} {"Full-finetune/Learning Rate": 1.9777348410155606e-06, "Full-finetune/Loss": 0.725009560585022, "Full-finetune/Loss (Raw)": 0.813616156578064, "Full-finetune/Step": 4171, "Full-finetune/Step Time": 6.792898694053292} {"Full-finetune/Learning Rate": 1.9740171971180278e-06, "Full-finetune/Loss": 0.7247440218925476, "Full-finetune/Loss (Raw)": 0.7510724067687988, "Full-finetune/Step": 4172, "Full-finetune/Step Time": 6.812622647732496} {"Full-finetune/Learning Rate": 1.9703026679477253e-06, "Full-finetune/Loss": 0.7282017469406128, "Full-finetune/Loss (Raw)": 0.7318546175956726, "Full-finetune/Step": 4173, "Full-finetune/Step Time": 6.789357205852866} {"Full-finetune/Learning Rate": 1.9665912549461898e-06, "Full-finetune/Loss": 0.7253628969192505, "Full-finetune/Loss (Raw)": 0.34761229157447815, "Full-finetune/Step": 4174, "Full-finetune/Step Time": 6.808719921857119} {"Full-finetune/Learning Rate": 1.962882959553751e-06, "Full-finetune/Loss": 0.7250983715057373, "Full-finetune/Loss (Raw)": 0.7058041095733643, "Full-finetune/Step": 4175, "Full-finetune/Step Time": 6.7979861702769995} {"Full-finetune/Learning Rate": 1.959177783209527e-06, "Full-finetune/Loss": 0.7280909419059753, "Full-finetune/Loss (Raw)": 0.7448854446411133, "Full-finetune/Step": 4176, "Full-finetune/Step Time": 6.8138691727072} {"Full-finetune/Learning Rate": 1.955475727351417e-06, "Full-finetune/Loss": 0.7292037010192871, "Full-finetune/Loss (Raw)": 0.7908910512924194, "Full-finetune/Step": 4177, "Full-finetune/Step Time": 6.832876360043883} {"Full-finetune/Learning Rate": 1.9517767934161224e-06, "Full-finetune/Loss": 0.7300530672073364, "Full-finetune/Loss (Raw)": 0.850760817527771, "Full-finetune/Step": 4178, "Full-finetune/Step Time": 6.8352831192314625} {"Full-finetune/Learning Rate": 1.9480809828391266e-06, "Full-finetune/Loss": 0.7302786111831665, "Full-finetune/Loss (Raw)": 0.7400197386741638, "Full-finetune/Step": 4179, "Full-finetune/Step Time": 6.848257170990109} {"Full-finetune/Learning Rate": 1.9443882970547003e-06, "Full-finetune/Loss": 0.731036901473999, "Full-finetune/Loss (Raw)": 0.8406615853309631, "Full-finetune/Step": 4180, "Full-finetune/Step Time": 6.828190248459578} {"Full-finetune/Learning Rate": 1.940698737495904e-06, "Full-finetune/Loss": 0.7340741753578186, "Full-finetune/Loss (Raw)": 0.7579938173294067, "Full-finetune/Step": 4181, "Full-finetune/Step Time": 6.813227443024516} {"Full-finetune/Learning Rate": 1.937012305594583e-06, "Full-finetune/Loss": 0.7334434986114502, "Full-finetune/Loss (Raw)": 0.5380618572235107, "Full-finetune/Step": 4182, "Full-finetune/Step Time": 6.813315419480205} {"Full-finetune/Learning Rate": 1.93332900278137e-06, "Full-finetune/Loss": 0.7337916493415833, "Full-finetune/Loss (Raw)": 0.8272110223770142, "Full-finetune/Step": 4183, "Full-finetune/Step Time": 6.812494609504938} {"Full-finetune/Learning Rate": 1.9296488304856785e-06, "Full-finetune/Loss": 0.7353031635284424, "Full-finetune/Loss (Raw)": 0.7585257291793823, "Full-finetune/Step": 4184, "Full-finetune/Step Time": 6.790300976485014} {"Full-finetune/Learning Rate": 1.92597179013572e-06, "Full-finetune/Loss": 0.7352045774459839, "Full-finetune/Loss (Raw)": 0.8595679402351379, "Full-finetune/Step": 4185, "Full-finetune/Step Time": 6.793395418673754} {"Full-finetune/Learning Rate": 1.9222978831584793e-06, "Full-finetune/Loss": 0.7363106608390808, "Full-finetune/Loss (Raw)": 0.8778864741325378, "Full-finetune/Step": 4186, "Full-finetune/Step Time": 6.807475769892335} {"Full-finetune/Learning Rate": 1.9186271109797215e-06, "Full-finetune/Loss": 0.7363841533660889, "Full-finetune/Loss (Raw)": 0.7129708528518677, "Full-finetune/Step": 4187, "Full-finetune/Step Time": 6.794893126934767} {"Full-finetune/Learning Rate": 1.9149594750240087e-06, "Full-finetune/Loss": 0.7374959588050842, "Full-finetune/Loss (Raw)": 0.5939211845397949, "Full-finetune/Step": 4188, "Full-finetune/Step Time": 6.7755167707800865} {"Full-finetune/Learning Rate": 1.911294976714676e-06, "Full-finetune/Loss": 0.7386482357978821, "Full-finetune/Loss (Raw)": 0.7494056820869446, "Full-finetune/Step": 4189, "Full-finetune/Step Time": 6.758344018831849} {"Full-finetune/Learning Rate": 1.9076336174738476e-06, "Full-finetune/Loss": 0.7364906668663025, "Full-finetune/Loss (Raw)": 0.5393446087837219, "Full-finetune/Step": 4190, "Full-finetune/Step Time": 6.759277233853936} {"Full-finetune/Learning Rate": 1.9039753987224164e-06, "Full-finetune/Loss": 0.7397801876068115, "Full-finetune/Loss (Raw)": 0.7715542912483215, "Full-finetune/Step": 4191, "Full-finetune/Step Time": 6.745949417352676} {"Full-finetune/Learning Rate": 1.9003203218800748e-06, "Full-finetune/Loss": 0.743967592716217, "Full-finetune/Loss (Raw)": 0.9149916768074036, "Full-finetune/Step": 4192, "Full-finetune/Step Time": 6.725366689264774} {"Full-finetune/Learning Rate": 1.8966683883652826e-06, "Full-finetune/Loss": 0.7414329051971436, "Full-finetune/Loss (Raw)": 0.3002089858055115, "Full-finetune/Step": 4193, "Full-finetune/Step Time": 6.735145537182689} {"Full-finetune/Learning Rate": 1.8930195995952827e-06, "Full-finetune/Loss": 0.7416441440582275, "Full-finetune/Loss (Raw)": 0.8223506808280945, "Full-finetune/Step": 4194, "Full-finetune/Step Time": 6.73564862459898} {"Full-finetune/Learning Rate": 1.8893739569861058e-06, "Full-finetune/Loss": 0.7415874004364014, "Full-finetune/Loss (Raw)": 0.8526228070259094, "Full-finetune/Step": 4195, "Full-finetune/Step Time": 6.728288406506181} {"Full-finetune/Learning Rate": 1.8857314619525469e-06, "Full-finetune/Loss": 0.7410507202148438, "Full-finetune/Loss (Raw)": 0.7393796443939209, "Full-finetune/Step": 4196, "Full-finetune/Step Time": 6.7149356715381145} {"Full-finetune/Learning Rate": 1.8820921159081896e-06, "Full-finetune/Loss": 0.7378733158111572, "Full-finetune/Loss (Raw)": 0.45241808891296387, "Full-finetune/Step": 4197, "Full-finetune/Step Time": 6.7248202208429575} {"Full-finetune/Learning Rate": 1.8784559202653907e-06, "Full-finetune/Loss": 0.7387230396270752, "Full-finetune/Loss (Raw)": 0.8621097803115845, "Full-finetune/Step": 4198, "Full-finetune/Step Time": 6.724452808499336} {"Full-finetune/Learning Rate": 1.8748228764352915e-06, "Full-finetune/Loss": 0.7403290867805481, "Full-finetune/Loss (Raw)": 0.9270662069320679, "Full-finetune/Step": 4199, "Full-finetune/Step Time": 6.695800516754389} {"Full-finetune/Learning Rate": 1.8711929858278066e-06, "Full-finetune/Loss": 0.7414196729660034, "Full-finetune/Loss (Raw)": 0.8042434453964233, "Full-finetune/Step": 4200, "Full-finetune/Step Time": 6.693059640005231} {"Full-finetune/Learning Rate": 1.8675662498516167e-06, "Full-finetune/Loss": 0.7409705519676208, "Full-finetune/Loss (Raw)": 0.7078872323036194, "Full-finetune/Step": 4201, "Full-finetune/Step Time": 6.704163724556565} {"Full-finetune/Learning Rate": 1.863942669914196e-06, "Full-finetune/Loss": 0.7401052117347717, "Full-finetune/Loss (Raw)": 0.7755069732666016, "Full-finetune/Step": 4202, "Full-finetune/Step Time": 6.7078039944171906} {"Full-finetune/Learning Rate": 1.8603222474217819e-06, "Full-finetune/Loss": 0.7400664687156677, "Full-finetune/Loss (Raw)": 0.7216969728469849, "Full-finetune/Step": 4203, "Full-finetune/Step Time": 6.70992636680603} {"Full-finetune/Learning Rate": 1.8567049837793894e-06, "Full-finetune/Loss": 0.741182804107666, "Full-finetune/Loss (Raw)": 0.7118822932243347, "Full-finetune/Step": 4204, "Full-finetune/Step Time": 6.690610455349088} {"Full-finetune/Learning Rate": 1.8530908803908088e-06, "Full-finetune/Loss": 0.7412469387054443, "Full-finetune/Loss (Raw)": 0.8032765984535217, "Full-finetune/Step": 4205, "Full-finetune/Step Time": 6.672585954889655} {"Full-finetune/Learning Rate": 1.8494799386586015e-06, "Full-finetune/Loss": 0.7410948872566223, "Full-finetune/Loss (Raw)": 0.7114971280097961, "Full-finetune/Step": 4206, "Full-finetune/Step Time": 6.671584723517299} {"Full-finetune/Learning Rate": 1.8458721599841056e-06, "Full-finetune/Loss": 0.7407200336456299, "Full-finetune/Loss (Raw)": 0.8013938069343567, "Full-finetune/Step": 4207, "Full-finetune/Step Time": 6.6651625242084265} {"Full-finetune/Learning Rate": 1.8422675457674254e-06, "Full-finetune/Loss": 0.7414326071739197, "Full-finetune/Loss (Raw)": 0.7643072009086609, "Full-finetune/Step": 4208, "Full-finetune/Step Time": 6.654971173033118} {"Full-finetune/Learning Rate": 1.8386660974074466e-06, "Full-finetune/Loss": 0.7431809902191162, "Full-finetune/Loss (Raw)": 0.9362836480140686, "Full-finetune/Step": 4209, "Full-finetune/Step Time": 6.634771743789315} {"Full-finetune/Learning Rate": 1.8350678163018221e-06, "Full-finetune/Loss": 0.7436240911483765, "Full-finetune/Loss (Raw)": 0.7703070640563965, "Full-finetune/Step": 4210, "Full-finetune/Step Time": 6.630145084112883} {"Full-finetune/Learning Rate": 1.831472703846966e-06, "Full-finetune/Loss": 0.7434056997299194, "Full-finetune/Loss (Raw)": 0.8273465633392334, "Full-finetune/Step": 4211, "Full-finetune/Step Time": 6.635434107854962} {"Full-finetune/Learning Rate": 1.827880761438079e-06, "Full-finetune/Loss": 0.7450048923492432, "Full-finetune/Loss (Raw)": 0.6648852229118347, "Full-finetune/Step": 4212, "Full-finetune/Step Time": 6.626322966068983} {"Full-finetune/Learning Rate": 1.8242919904691214e-06, "Full-finetune/Loss": 0.7452486753463745, "Full-finetune/Loss (Raw)": 0.6161503195762634, "Full-finetune/Step": 4213, "Full-finetune/Step Time": 6.625113490968943} {"Full-finetune/Learning Rate": 1.820706392332824e-06, "Full-finetune/Loss": 0.7459311485290527, "Full-finetune/Loss (Raw)": 0.7757583856582642, "Full-finetune/Step": 4214, "Full-finetune/Step Time": 6.615574894472957} {"Full-finetune/Learning Rate": 1.8171239684206898e-06, "Full-finetune/Loss": 0.7445827126502991, "Full-finetune/Loss (Raw)": 0.7032523155212402, "Full-finetune/Step": 4215, "Full-finetune/Step Time": 6.641192747280002} {"Full-finetune/Learning Rate": 1.8135447201229861e-06, "Full-finetune/Loss": 0.7445487380027771, "Full-finetune/Loss (Raw)": 0.809831976890564, "Full-finetune/Step": 4216, "Full-finetune/Step Time": 6.646573759615421} {"Full-finetune/Learning Rate": 1.8099686488287483e-06, "Full-finetune/Loss": 0.7449378371238708, "Full-finetune/Loss (Raw)": 0.8276829123497009, "Full-finetune/Step": 4217, "Full-finetune/Step Time": 6.643244640901685} {"Full-finetune/Learning Rate": 1.8063957559257794e-06, "Full-finetune/Loss": 0.7447608113288879, "Full-finetune/Loss (Raw)": 0.7654947638511658, "Full-finetune/Step": 4218, "Full-finetune/Step Time": 6.642969915643334} {"Full-finetune/Learning Rate": 1.8028260428006538e-06, "Full-finetune/Loss": 0.7432960867881775, "Full-finetune/Loss (Raw)": 0.5679630637168884, "Full-finetune/Step": 4219, "Full-finetune/Step Time": 6.625732086598873} {"Full-finetune/Learning Rate": 1.7992595108387068e-06, "Full-finetune/Loss": 0.7438668608665466, "Full-finetune/Loss (Raw)": 0.8171229958534241, "Full-finetune/Step": 4220, "Full-finetune/Step Time": 6.615025958046317} {"Full-finetune/Learning Rate": 1.795696161424032e-06, "Full-finetune/Loss": 0.7438998222351074, "Full-finetune/Loss (Raw)": 0.8949017524719238, "Full-finetune/Step": 4221, "Full-finetune/Step Time": 6.616461122408509} {"Full-finetune/Learning Rate": 1.7921359959395046e-06, "Full-finetune/Loss": 0.7426617741584778, "Full-finetune/Loss (Raw)": 0.8138930201530457, "Full-finetune/Step": 4222, "Full-finetune/Step Time": 6.620764423161745} {"Full-finetune/Learning Rate": 1.7885790157667526e-06, "Full-finetune/Loss": 0.7440689206123352, "Full-finetune/Loss (Raw)": 0.8573861122131348, "Full-finetune/Step": 4223, "Full-finetune/Step Time": 6.611629808321595} {"Full-finetune/Learning Rate": 1.7850252222861697e-06, "Full-finetune/Loss": 0.7424949407577515, "Full-finetune/Loss (Raw)": 0.7102972269058228, "Full-finetune/Step": 4224, "Full-finetune/Step Time": 6.616421798244119} {"Full-finetune/Learning Rate": 1.7814746168769138e-06, "Full-finetune/Loss": 0.7412716746330261, "Full-finetune/Loss (Raw)": 0.6854761838912964, "Full-finetune/Step": 4225, "Full-finetune/Step Time": 6.608894707635045} {"Full-finetune/Learning Rate": 1.7779272009169068e-06, "Full-finetune/Loss": 0.7434391379356384, "Full-finetune/Loss (Raw)": 0.875690758228302, "Full-finetune/Step": 4226, "Full-finetune/Step Time": 6.602679315954447} {"Full-finetune/Learning Rate": 1.77438297578283e-06, "Full-finetune/Loss": 0.744916558265686, "Full-finetune/Loss (Raw)": 0.9798228144645691, "Full-finetune/Step": 4227, "Full-finetune/Step Time": 6.60185182467103} {"Full-finetune/Learning Rate": 1.7708419428501256e-06, "Full-finetune/Loss": 0.7438328862190247, "Full-finetune/Loss (Raw)": 0.7741152048110962, "Full-finetune/Step": 4228, "Full-finetune/Step Time": 6.603688381612301} {"Full-finetune/Learning Rate": 1.7673041034930083e-06, "Full-finetune/Loss": 0.7444746494293213, "Full-finetune/Loss (Raw)": 0.8462346196174622, "Full-finetune/Step": 4229, "Full-finetune/Step Time": 6.58673313818872} {"Full-finetune/Learning Rate": 1.7637694590844357e-06, "Full-finetune/Loss": 0.7406493425369263, "Full-finetune/Loss (Raw)": 0.2644117474555969, "Full-finetune/Step": 4230, "Full-finetune/Step Time": 6.600076362490654} {"Full-finetune/Learning Rate": 1.7602380109961348e-06, "Full-finetune/Loss": 0.7388171553611755, "Full-finetune/Loss (Raw)": 0.5597345232963562, "Full-finetune/Step": 4231, "Full-finetune/Step Time": 6.637754300609231} {"Full-finetune/Learning Rate": 1.7567097605985972e-06, "Full-finetune/Loss": 0.7384871244430542, "Full-finetune/Loss (Raw)": 0.7778751850128174, "Full-finetune/Step": 4232, "Full-finetune/Step Time": 6.646115865558386} {"Full-finetune/Learning Rate": 1.7531847092610644e-06, "Full-finetune/Loss": 0.7384117245674133, "Full-finetune/Loss (Raw)": 0.6409791707992554, "Full-finetune/Step": 4233, "Full-finetune/Step Time": 6.6522191017866135} {"Full-finetune/Learning Rate": 1.7496628583515395e-06, "Full-finetune/Loss": 0.7400825023651123, "Full-finetune/Loss (Raw)": 0.9538320302963257, "Full-finetune/Step": 4234, "Full-finetune/Step Time": 6.655519913882017} {"Full-finetune/Learning Rate": 1.7461442092367864e-06, "Full-finetune/Loss": 0.7406050562858582, "Full-finetune/Loss (Raw)": 0.8025896549224854, "Full-finetune/Step": 4235, "Full-finetune/Step Time": 6.65436284057796} {"Full-finetune/Learning Rate": 1.7426287632823213e-06, "Full-finetune/Loss": 0.7389960885047913, "Full-finetune/Loss (Raw)": 0.6256827712059021, "Full-finetune/Step": 4236, "Full-finetune/Step Time": 6.663349479436874} {"Full-finetune/Learning Rate": 1.7391165218524232e-06, "Full-finetune/Loss": 0.7403569221496582, "Full-finetune/Loss (Raw)": 0.901123046875, "Full-finetune/Step": 4237, "Full-finetune/Step Time": 6.655796317383647} {"Full-finetune/Learning Rate": 1.735607486310119e-06, "Full-finetune/Loss": 0.7411164045333862, "Full-finetune/Loss (Raw)": 0.8572766780853271, "Full-finetune/Step": 4238, "Full-finetune/Step Time": 6.654575245454907} {"Full-finetune/Learning Rate": 1.7321016580172068e-06, "Full-finetune/Loss": 0.7403197288513184, "Full-finetune/Loss (Raw)": 0.8159557580947876, "Full-finetune/Step": 4239, "Full-finetune/Step Time": 6.6501228883862495} {"Full-finetune/Learning Rate": 1.728599038334221e-06, "Full-finetune/Loss": 0.7416538000106812, "Full-finetune/Loss (Raw)": 0.7574668526649475, "Full-finetune/Step": 4240, "Full-finetune/Step Time": 6.639542555436492} {"Full-finetune/Learning Rate": 1.7250996286204602e-06, "Full-finetune/Loss": 0.7428037524223328, "Full-finetune/Loss (Raw)": 0.7830324769020081, "Full-finetune/Step": 4241, "Full-finetune/Step Time": 6.640732709318399} {"Full-finetune/Learning Rate": 1.7216034302339824e-06, "Full-finetune/Loss": 0.7431287169456482, "Full-finetune/Loss (Raw)": 0.8416917324066162, "Full-finetune/Step": 4242, "Full-finetune/Step Time": 6.6388875264674425} {"Full-finetune/Learning Rate": 1.718110444531591e-06, "Full-finetune/Loss": 0.7425534129142761, "Full-finetune/Loss (Raw)": 0.7419111132621765, "Full-finetune/Step": 4243, "Full-finetune/Step Time": 6.659714866429567} {"Full-finetune/Learning Rate": 1.7146206728688465e-06, "Full-finetune/Loss": 0.7448539137840271, "Full-finetune/Loss (Raw)": 0.8139729499816895, "Full-finetune/Step": 4244, "Full-finetune/Step Time": 6.643773080781102} {"Full-finetune/Learning Rate": 1.7111341166000594e-06, "Full-finetune/Loss": 0.7461364269256592, "Full-finetune/Loss (Raw)": 0.7916205525398254, "Full-finetune/Step": 4245, "Full-finetune/Step Time": 6.636615524068475} {"Full-finetune/Learning Rate": 1.7076507770782957e-06, "Full-finetune/Loss": 0.74437016248703, "Full-finetune/Loss (Raw)": 0.7179925441741943, "Full-finetune/Step": 4246, "Full-finetune/Step Time": 6.661498079076409} {"Full-finetune/Learning Rate": 1.7041706556553717e-06, "Full-finetune/Loss": 0.743708610534668, "Full-finetune/Loss (Raw)": 0.8269147276878357, "Full-finetune/Step": 4247, "Full-finetune/Step Time": 6.663251673802733} {"Full-finetune/Learning Rate": 1.7006937536818503e-06, "Full-finetune/Loss": 0.7405974864959717, "Full-finetune/Loss (Raw)": 0.2811335623264313, "Full-finetune/Step": 4248, "Full-finetune/Step Time": 6.669229215011001} {"Full-finetune/Learning Rate": 1.6972200725070587e-06, "Full-finetune/Loss": 0.740890622138977, "Full-finetune/Loss (Raw)": 0.8440653085708618, "Full-finetune/Step": 4249, "Full-finetune/Step Time": 6.652269694954157} {"Full-finetune/Learning Rate": 1.6937496134790554e-06, "Full-finetune/Loss": 0.7399527430534363, "Full-finetune/Loss (Raw)": 0.5773597955703735, "Full-finetune/Step": 4250, "Full-finetune/Step Time": 6.648590378463268} {"Full-finetune/Learning Rate": 1.6902823779446586e-06, "Full-finetune/Loss": 0.7379679083824158, "Full-finetune/Loss (Raw)": 0.671067476272583, "Full-finetune/Step": 4251, "Full-finetune/Step Time": 6.648226885125041} {"Full-finetune/Learning Rate": 1.686818367249441e-06, "Full-finetune/Loss": 0.7412890791893005, "Full-finetune/Loss (Raw)": 0.9812905192375183, "Full-finetune/Step": 4252, "Full-finetune/Step Time": 6.649975990876555} {"Full-finetune/Learning Rate": 1.6833575827377135e-06, "Full-finetune/Loss": 0.7392431497573853, "Full-finetune/Loss (Raw)": 0.5332121849060059, "Full-finetune/Step": 4253, "Full-finetune/Step Time": 6.669972866773605} {"Full-finetune/Learning Rate": 1.6799000257525388e-06, "Full-finetune/Loss": 0.7365126609802246, "Full-finetune/Loss (Raw)": 0.48071274161338806, "Full-finetune/Step": 4254, "Full-finetune/Step Time": 6.68044657073915} {"Full-finetune/Learning Rate": 1.6764456976357279e-06, "Full-finetune/Loss": 0.7355270385742188, "Full-finetune/Loss (Raw)": 0.6810861229896545, "Full-finetune/Step": 4255, "Full-finetune/Step Time": 6.686535427346826} {"Full-finetune/Learning Rate": 1.6729945997278386e-06, "Full-finetune/Loss": 0.7359017729759216, "Full-finetune/Loss (Raw)": 0.7985346913337708, "Full-finetune/Step": 4256, "Full-finetune/Step Time": 6.7020688354969025} {"Full-finetune/Learning Rate": 1.6695467333681748e-06, "Full-finetune/Loss": 0.7362563610076904, "Full-finetune/Loss (Raw)": 0.8252118229866028, "Full-finetune/Step": 4257, "Full-finetune/Step Time": 6.7067961525171995} {"Full-finetune/Learning Rate": 1.6661020998947818e-06, "Full-finetune/Loss": 0.7350276708602905, "Full-finetune/Loss (Raw)": 0.6118196845054626, "Full-finetune/Step": 4258, "Full-finetune/Step Time": 6.7071056086570024} {"Full-finetune/Learning Rate": 1.6626607006444628e-06, "Full-finetune/Loss": 0.7358978390693665, "Full-finetune/Loss (Raw)": 0.8944135904312134, "Full-finetune/Step": 4259, "Full-finetune/Step Time": 6.710974924266338} {"Full-finetune/Learning Rate": 1.6592225369527515e-06, "Full-finetune/Loss": 0.7354706525802612, "Full-finetune/Loss (Raw)": 0.7502768635749817, "Full-finetune/Step": 4260, "Full-finetune/Step Time": 6.707646440714598} {"Full-finetune/Learning Rate": 1.6557876101539305e-06, "Full-finetune/Loss": 0.736160397529602, "Full-finetune/Loss (Raw)": 0.8007711172103882, "Full-finetune/Step": 4261, "Full-finetune/Step Time": 6.70149827003479} {"Full-finetune/Learning Rate": 1.6523559215810336e-06, "Full-finetune/Loss": 0.7361708879470825, "Full-finetune/Loss (Raw)": 0.7452355623245239, "Full-finetune/Step": 4262, "Full-finetune/Step Time": 6.6917203441262245} {"Full-finetune/Learning Rate": 1.64892747256583e-06, "Full-finetune/Loss": 0.7381061911582947, "Full-finetune/Loss (Raw)": 0.9404621720314026, "Full-finetune/Step": 4263, "Full-finetune/Step Time": 6.689525201916695} {"Full-finetune/Learning Rate": 1.645502264438833e-06, "Full-finetune/Loss": 0.7372023463249207, "Full-finetune/Loss (Raw)": 0.6258098483085632, "Full-finetune/Step": 4264, "Full-finetune/Step Time": 6.70063872076571} {"Full-finetune/Learning Rate": 1.6420802985292995e-06, "Full-finetune/Loss": 0.7372560501098633, "Full-finetune/Loss (Raw)": 0.6991598010063171, "Full-finetune/Step": 4265, "Full-finetune/Step Time": 6.707388384267688} {"Full-finetune/Learning Rate": 1.638661576165227e-06, "Full-finetune/Loss": 0.7376832962036133, "Full-finetune/Loss (Raw)": 0.9105141162872314, "Full-finetune/Step": 4266, "Full-finetune/Step Time": 6.706526288762689} {"Full-finetune/Learning Rate": 1.6352460986733564e-06, "Full-finetune/Loss": 0.7370904088020325, "Full-finetune/Loss (Raw)": 0.6350922584533691, "Full-finetune/Step": 4267, "Full-finetune/Step Time": 6.719830449670553} {"Full-finetune/Learning Rate": 1.6318338673791655e-06, "Full-finetune/Loss": 0.7370178699493408, "Full-finetune/Loss (Raw)": 0.7084174752235413, "Full-finetune/Step": 4268, "Full-finetune/Step Time": 6.710040779784322} {"Full-finetune/Learning Rate": 1.6284248836068772e-06, "Full-finetune/Loss": 0.7382164001464844, "Full-finetune/Loss (Raw)": 0.5367417931556702, "Full-finetune/Step": 4269, "Full-finetune/Step Time": 6.736187554895878} {"Full-finetune/Learning Rate": 1.6250191486794497e-06, "Full-finetune/Loss": 0.7387545108795166, "Full-finetune/Loss (Raw)": 0.7782651782035828, "Full-finetune/Step": 4270, "Full-finetune/Step Time": 6.736518682911992} {"Full-finetune/Learning Rate": 1.6216166639185804e-06, "Full-finetune/Loss": 0.7356865406036377, "Full-finetune/Loss (Raw)": 0.32573431730270386, "Full-finetune/Step": 4271, "Full-finetune/Step Time": 6.755674220621586} {"Full-finetune/Learning Rate": 1.618217430644713e-06, "Full-finetune/Loss": 0.7398614883422852, "Full-finetune/Loss (Raw)": 0.8181880116462708, "Full-finetune/Step": 4272, "Full-finetune/Step Time": 6.738542668521404} {"Full-finetune/Learning Rate": 1.6148214501770221e-06, "Full-finetune/Loss": 0.7399860620498657, "Full-finetune/Loss (Raw)": 0.6752265691757202, "Full-finetune/Step": 4273, "Full-finetune/Step Time": 6.726326389238238} {"Full-finetune/Learning Rate": 1.6114287238334148e-06, "Full-finetune/Loss": 0.7393696308135986, "Full-finetune/Loss (Raw)": 0.7485141158103943, "Full-finetune/Step": 4274, "Full-finetune/Step Time": 6.731935841962695} {"Full-finetune/Learning Rate": 1.6080392529305489e-06, "Full-finetune/Loss": 0.7380762100219727, "Full-finetune/Loss (Raw)": 0.614596426486969, "Full-finetune/Step": 4275, "Full-finetune/Step Time": 6.752655161544681} {"Full-finetune/Learning Rate": 1.60465303878381e-06, "Full-finetune/Loss": 0.7378960251808167, "Full-finetune/Loss (Raw)": 0.8163108229637146, "Full-finetune/Step": 4276, "Full-finetune/Step Time": 6.753606297075748} {"Full-finetune/Learning Rate": 1.6012700827073213e-06, "Full-finetune/Loss": 0.7374342679977417, "Full-finetune/Loss (Raw)": 0.7010276317596436, "Full-finetune/Step": 4277, "Full-finetune/Step Time": 6.775109458714724} {"Full-finetune/Learning Rate": 1.5978903860139416e-06, "Full-finetune/Loss": 0.7392028570175171, "Full-finetune/Loss (Raw)": 0.8622358441352844, "Full-finetune/Step": 4278, "Full-finetune/Step Time": 6.749085167422891} {"Full-finetune/Learning Rate": 1.5945139500152662e-06, "Full-finetune/Loss": 0.738699197769165, "Full-finetune/Loss (Raw)": 0.7067829370498657, "Full-finetune/Step": 4279, "Full-finetune/Step Time": 6.745825447142124} {"Full-finetune/Learning Rate": 1.5911407760216235e-06, "Full-finetune/Loss": 0.7392443418502808, "Full-finetune/Loss (Raw)": 0.8360163569450378, "Full-finetune/Step": 4280, "Full-finetune/Step Time": 6.739322671666741} {"Full-finetune/Learning Rate": 1.5877708653420742e-06, "Full-finetune/Loss": 0.7406642436981201, "Full-finetune/Loss (Raw)": 0.9052694439888, "Full-finetune/Step": 4281, "Full-finetune/Step Time": 6.744295632466674} {"Full-finetune/Learning Rate": 1.58440421928442e-06, "Full-finetune/Loss": 0.7409687638282776, "Full-finetune/Loss (Raw)": 0.8328955769538879, "Full-finetune/Step": 4282, "Full-finetune/Step Time": 6.7415530402213335} {"Full-finetune/Learning Rate": 1.581040839155189e-06, "Full-finetune/Loss": 0.7412489652633667, "Full-finetune/Loss (Raw)": 0.7663058638572693, "Full-finetune/Step": 4283, "Full-finetune/Step Time": 6.755698522552848} {"Full-finetune/Learning Rate": 1.5776807262596371e-06, "Full-finetune/Loss": 0.7422035932540894, "Full-finetune/Loss (Raw)": 0.8055702447891235, "Full-finetune/Step": 4284, "Full-finetune/Step Time": 6.764158803969622} {"Full-finetune/Learning Rate": 1.574323881901767e-06, "Full-finetune/Loss": 0.7399762868881226, "Full-finetune/Loss (Raw)": 0.5963733792304993, "Full-finetune/Step": 4285, "Full-finetune/Step Time": 6.797718765214086} {"Full-finetune/Learning Rate": 1.5709703073843008e-06, "Full-finetune/Loss": 0.739815354347229, "Full-finetune/Loss (Raw)": 0.7557776570320129, "Full-finetune/Step": 4286, "Full-finetune/Step Time": 6.78875370696187} {"Full-finetune/Learning Rate": 1.5676200040086941e-06, "Full-finetune/Loss": 0.7395104765892029, "Full-finetune/Loss (Raw)": 0.8149510622024536, "Full-finetune/Step": 4287, "Full-finetune/Step Time": 6.790913311764598} {"Full-finetune/Learning Rate": 1.564272973075136e-06, "Full-finetune/Loss": 0.7395120859146118, "Full-finetune/Loss (Raw)": 0.8924299478530884, "Full-finetune/Step": 4288, "Full-finetune/Step Time": 6.783970341086388} {"Full-finetune/Learning Rate": 1.560929215882544e-06, "Full-finetune/Loss": 0.7389686107635498, "Full-finetune/Loss (Raw)": 0.7303227186203003, "Full-finetune/Step": 4289, "Full-finetune/Step Time": 6.784896047785878} {"Full-finetune/Learning Rate": 1.5575887337285644e-06, "Full-finetune/Loss": 0.7387040853500366, "Full-finetune/Loss (Raw)": 0.8759796023368835, "Full-finetune/Step": 4290, "Full-finetune/Step Time": 6.786157304421067} {"Full-finetune/Learning Rate": 1.5542515279095704e-06, "Full-finetune/Loss": 0.7407243251800537, "Full-finetune/Loss (Raw)": 0.8786032795906067, "Full-finetune/Step": 4291, "Full-finetune/Step Time": 6.769937248900533} {"Full-finetune/Learning Rate": 1.5509175997206705e-06, "Full-finetune/Loss": 0.7435926198959351, "Full-finetune/Loss (Raw)": 0.8379439115524292, "Full-finetune/Step": 4292, "Full-finetune/Step Time": 6.775441521778703} {"Full-finetune/Learning Rate": 1.5475869504556996e-06, "Full-finetune/Loss": 0.7430564165115356, "Full-finetune/Loss (Raw)": 0.8186936378479004, "Full-finetune/Step": 4293, "Full-finetune/Step Time": 6.782665455713868} {"Full-finetune/Learning Rate": 1.5442595814072081e-06, "Full-finetune/Loss": 0.7420996427536011, "Full-finetune/Loss (Raw)": 0.7548975944519043, "Full-finetune/Step": 4294, "Full-finetune/Step Time": 6.805086938664317} {"Full-finetune/Learning Rate": 1.540935493866491e-06, "Full-finetune/Loss": 0.7387944459915161, "Full-finetune/Loss (Raw)": 0.2968812584877014, "Full-finetune/Step": 4295, "Full-finetune/Step Time": 6.82082461565733} {"Full-finetune/Learning Rate": 1.53761468912356e-06, "Full-finetune/Loss": 0.7412067651748657, "Full-finetune/Loss (Raw)": 0.9195528030395508, "Full-finetune/Step": 4296, "Full-finetune/Step Time": 6.817624581977725} {"Full-finetune/Learning Rate": 1.5342971684671537e-06, "Full-finetune/Loss": 0.7449822425842285, "Full-finetune/Loss (Raw)": 0.8437488079071045, "Full-finetune/Step": 4297, "Full-finetune/Step Time": 6.801406377926469} {"Full-finetune/Learning Rate": 1.530982933184737e-06, "Full-finetune/Loss": 0.7445628046989441, "Full-finetune/Loss (Raw)": 0.5921327471733093, "Full-finetune/Step": 4298, "Full-finetune/Step Time": 6.795683171600103} {"Full-finetune/Learning Rate": 1.527671984562501e-06, "Full-finetune/Loss": 0.7444858551025391, "Full-finetune/Loss (Raw)": 0.8037644624710083, "Full-finetune/Step": 4299, "Full-finetune/Step Time": 6.801632940769196} {"Full-finetune/Learning Rate": 1.524364323885359e-06, "Full-finetune/Loss": 0.7454996109008789, "Full-finetune/Loss (Raw)": 0.8808442950248718, "Full-finetune/Step": 4300, "Full-finetune/Step Time": 6.786318263038993} {"Full-finetune/Learning Rate": 1.5210599524369484e-06, "Full-finetune/Loss": 0.7425791025161743, "Full-finetune/Loss (Raw)": 0.35801586508750916, "Full-finetune/Step": 4301, "Full-finetune/Step Time": 6.798825042322278} {"Full-finetune/Learning Rate": 1.517758871499635e-06, "Full-finetune/Loss": 0.7467941641807556, "Full-finetune/Loss (Raw)": 0.8871468901634216, "Full-finetune/Step": 4302, "Full-finetune/Step Time": 6.784139698371291} {"Full-finetune/Learning Rate": 1.5144610823545035e-06, "Full-finetune/Loss": 0.7483824491500854, "Full-finetune/Loss (Raw)": 0.9090998768806458, "Full-finetune/Step": 4303, "Full-finetune/Step Time": 6.783466283231974} {"Full-finetune/Learning Rate": 1.511166586281355e-06, "Full-finetune/Loss": 0.7451344728469849, "Full-finetune/Loss (Raw)": 0.3291509449481964, "Full-finetune/Step": 4304, "Full-finetune/Step Time": 6.7672443222254515} {"Full-finetune/Learning Rate": 1.507875384558727e-06, "Full-finetune/Loss": 0.7440502643585205, "Full-finetune/Loss (Raw)": 0.6521056294441223, "Full-finetune/Step": 4305, "Full-finetune/Step Time": 6.749347178265452} {"Full-finetune/Learning Rate": 1.504587478463867e-06, "Full-finetune/Loss": 0.7429021000862122, "Full-finetune/Loss (Raw)": 0.7037971019744873, "Full-finetune/Step": 4306, "Full-finetune/Step Time": 6.754512021318078} {"Full-finetune/Learning Rate": 1.5013028692727483e-06, "Full-finetune/Loss": 0.7415997982025146, "Full-finetune/Loss (Raw)": 0.5733277797698975, "Full-finetune/Step": 4307, "Full-finetune/Step Time": 6.74314558506012} {"Full-finetune/Learning Rate": 1.4980215582600621e-06, "Full-finetune/Loss": 0.7403738498687744, "Full-finetune/Loss (Raw)": 0.6837374567985535, "Full-finetune/Step": 4308, "Full-finetune/Step Time": 6.7426522467285395} {"Full-finetune/Learning Rate": 1.4947435466992222e-06, "Full-finetune/Loss": 0.7401430606842041, "Full-finetune/Loss (Raw)": 0.7284512519836426, "Full-finetune/Step": 4309, "Full-finetune/Step Time": 6.746672939509153} {"Full-finetune/Learning Rate": 1.4914688358623608e-06, "Full-finetune/Loss": 0.7386294603347778, "Full-finetune/Loss (Raw)": 0.3443273603916168, "Full-finetune/Step": 4310, "Full-finetune/Step Time": 6.754459237679839} {"Full-finetune/Learning Rate": 1.488197427020327e-06, "Full-finetune/Loss": 0.738274097442627, "Full-finetune/Loss (Raw)": 0.7817186117172241, "Full-finetune/Step": 4311, "Full-finetune/Step Time": 6.760474171489477} {"Full-finetune/Learning Rate": 1.4849293214426975e-06, "Full-finetune/Loss": 0.7389963865280151, "Full-finetune/Loss (Raw)": 0.8509857654571533, "Full-finetune/Step": 4312, "Full-finetune/Step Time": 6.7672527730464935} {"Full-finetune/Learning Rate": 1.481664520397753e-06, "Full-finetune/Loss": 0.7392350435256958, "Full-finetune/Loss (Raw)": 0.8901123404502869, "Full-finetune/Step": 4313, "Full-finetune/Step Time": 6.776389656588435} {"Full-finetune/Learning Rate": 1.4784030251524994e-06, "Full-finetune/Loss": 0.7390486001968384, "Full-finetune/Loss (Raw)": 0.8540241718292236, "Full-finetune/Step": 4314, "Full-finetune/Step Time": 6.765310447663069} {"Full-finetune/Learning Rate": 1.4751448369726652e-06, "Full-finetune/Loss": 0.7393561601638794, "Full-finetune/Loss (Raw)": 0.7523329854011536, "Full-finetune/Step": 4315, "Full-finetune/Step Time": 6.762756304815412} {"Full-finetune/Learning Rate": 1.4718899571226842e-06, "Full-finetune/Loss": 0.739912748336792, "Full-finetune/Loss (Raw)": 0.6651647090911865, "Full-finetune/Step": 4316, "Full-finetune/Step Time": 6.765396028757095} {"Full-finetune/Learning Rate": 1.468638386865716e-06, "Full-finetune/Loss": 0.7400698065757751, "Full-finetune/Loss (Raw)": 0.7695127129554749, "Full-finetune/Step": 4317, "Full-finetune/Step Time": 6.763245467096567} {"Full-finetune/Learning Rate": 1.465390127463625e-06, "Full-finetune/Loss": 0.7405771613121033, "Full-finetune/Loss (Raw)": 0.6042805314064026, "Full-finetune/Step": 4318, "Full-finetune/Step Time": 6.766407983377576} {"Full-finetune/Learning Rate": 1.4621451801770038e-06, "Full-finetune/Loss": 0.7391321659088135, "Full-finetune/Loss (Raw)": 0.5865945816040039, "Full-finetune/Step": 4319, "Full-finetune/Step Time": 6.770991280674934} {"Full-finetune/Learning Rate": 1.4589035462651502e-06, "Full-finetune/Loss": 0.7377448081970215, "Full-finetune/Loss (Raw)": 0.7374163866043091, "Full-finetune/Step": 4320, "Full-finetune/Step Time": 6.7745703887194395} {"Full-finetune/Learning Rate": 1.4556652269860772e-06, "Full-finetune/Loss": 0.7400018572807312, "Full-finetune/Loss (Raw)": 0.5891117453575134, "Full-finetune/Step": 4321, "Full-finetune/Step Time": 6.76741598546505} {"Full-finetune/Learning Rate": 1.4524302235965203e-06, "Full-finetune/Loss": 0.7403882145881653, "Full-finetune/Loss (Raw)": 0.8717964291572571, "Full-finetune/Step": 4322, "Full-finetune/Step Time": 6.769400782883167} {"Full-finetune/Learning Rate": 1.4491985373519146e-06, "Full-finetune/Loss": 0.738300085067749, "Full-finetune/Loss (Raw)": 0.5853431820869446, "Full-finetune/Step": 4323, "Full-finetune/Step Time": 6.765028536319733} {"Full-finetune/Learning Rate": 1.4459701695064155e-06, "Full-finetune/Loss": 0.7383999824523926, "Full-finetune/Loss (Raw)": 0.752169132232666, "Full-finetune/Step": 4324, "Full-finetune/Step Time": 6.764144970104098} {"Full-finetune/Learning Rate": 1.4427451213128873e-06, "Full-finetune/Loss": 0.738878607749939, "Full-finetune/Loss (Raw)": 0.5136919021606445, "Full-finetune/Step": 4325, "Full-finetune/Step Time": 6.752756534144282} {"Full-finetune/Learning Rate": 1.4395233940229147e-06, "Full-finetune/Loss": 0.7371658086776733, "Full-finetune/Loss (Raw)": 0.6428593993186951, "Full-finetune/Step": 4326, "Full-finetune/Step Time": 6.771147763356566} {"Full-finetune/Learning Rate": 1.4363049888867853e-06, "Full-finetune/Loss": 0.7339367866516113, "Full-finetune/Loss (Raw)": 0.5137571096420288, "Full-finetune/Step": 4327, "Full-finetune/Step Time": 6.786974826827645} {"Full-finetune/Learning Rate": 1.4330899071534942e-06, "Full-finetune/Loss": 0.7334336042404175, "Full-finetune/Loss (Raw)": 0.7398349046707153, "Full-finetune/Step": 4328, "Full-finetune/Step Time": 6.7903991639614105} {"Full-finetune/Learning Rate": 1.4298781500707558e-06, "Full-finetune/Loss": 0.7340453267097473, "Full-finetune/Loss (Raw)": 0.7861911058425903, "Full-finetune/Step": 4329, "Full-finetune/Step Time": 6.779256341978908} {"Full-finetune/Learning Rate": 1.426669718884991e-06, "Full-finetune/Loss": 0.7345651388168335, "Full-finetune/Loss (Raw)": 0.8420365452766418, "Full-finetune/Step": 4330, "Full-finetune/Step Time": 6.777980595827103} {"Full-finetune/Learning Rate": 1.4234646148413277e-06, "Full-finetune/Loss": 0.7354280948638916, "Full-finetune/Loss (Raw)": 0.8321616649627686, "Full-finetune/Step": 4331, "Full-finetune/Step Time": 6.777365883812308} {"Full-finetune/Learning Rate": 1.420262839183605e-06, "Full-finetune/Loss": 0.7360454797744751, "Full-finetune/Loss (Raw)": 0.7909099459648132, "Full-finetune/Step": 4332, "Full-finetune/Step Time": 6.779960226267576} {"Full-finetune/Learning Rate": 1.4170643931543693e-06, "Full-finetune/Loss": 0.7363212704658508, "Full-finetune/Loss (Raw)": 0.8385761976242065, "Full-finetune/Step": 4333, "Full-finetune/Step Time": 6.7812668811529875} {"Full-finetune/Learning Rate": 1.4138692779948749e-06, "Full-finetune/Loss": 0.7376706600189209, "Full-finetune/Loss (Raw)": 0.8842069506645203, "Full-finetune/Step": 4334, "Full-finetune/Step Time": 6.778445681557059} {"Full-finetune/Learning Rate": 1.4106774949450808e-06, "Full-finetune/Loss": 0.7376524209976196, "Full-finetune/Loss (Raw)": 0.7990652322769165, "Full-finetune/Step": 4335, "Full-finetune/Step Time": 6.774074975401163} {"Full-finetune/Learning Rate": 1.4074890452436607e-06, "Full-finetune/Loss": 0.7386277318000793, "Full-finetune/Loss (Raw)": 0.8891475796699524, "Full-finetune/Step": 4336, "Full-finetune/Step Time": 6.7892677038908005} {"Full-finetune/Learning Rate": 1.4043039301279904e-06, "Full-finetune/Loss": 0.7354846000671387, "Full-finetune/Loss (Raw)": 0.5339749455451965, "Full-finetune/Step": 4337, "Full-finetune/Step Time": 6.811037531122565} {"Full-finetune/Learning Rate": 1.4011221508341433e-06, "Full-finetune/Loss": 0.7356257438659668, "Full-finetune/Loss (Raw)": 0.7883583307266235, "Full-finetune/Step": 4338, "Full-finetune/Step Time": 6.810864234343171} {"Full-finetune/Learning Rate": 1.3979437085969127e-06, "Full-finetune/Loss": 0.7349535226821899, "Full-finetune/Loss (Raw)": 0.7413113117218018, "Full-finetune/Step": 4339, "Full-finetune/Step Time": 6.810886532068253} {"Full-finetune/Learning Rate": 1.3947686046497878e-06, "Full-finetune/Loss": 0.7351218461990356, "Full-finetune/Loss (Raw)": 0.6864251494407654, "Full-finetune/Step": 4340, "Full-finetune/Step Time": 6.824512807652354} {"Full-finetune/Learning Rate": 1.3915968402249647e-06, "Full-finetune/Loss": 0.7374566197395325, "Full-finetune/Loss (Raw)": 0.9150075316429138, "Full-finetune/Step": 4341, "Full-finetune/Step Time": 6.825881792232394} {"Full-finetune/Learning Rate": 1.3884284165533423e-06, "Full-finetune/Loss": 0.7367688417434692, "Full-finetune/Loss (Raw)": 0.6877190470695496, "Full-finetune/Step": 4342, "Full-finetune/Step Time": 6.865870859473944} {"Full-finetune/Learning Rate": 1.3852633348645262e-06, "Full-finetune/Loss": 0.7365742921829224, "Full-finetune/Loss (Raw)": 0.6783462762832642, "Full-finetune/Step": 4343, "Full-finetune/Step Time": 6.829202298074961} {"Full-finetune/Learning Rate": 1.38210159638682e-06, "Full-finetune/Loss": 0.7364444732666016, "Full-finetune/Loss (Raw)": 0.7932190895080566, "Full-finetune/Step": 4344, "Full-finetune/Step Time": 6.8281201627105474} {"Full-finetune/Learning Rate": 1.3789432023472315e-06, "Full-finetune/Loss": 0.7357885837554932, "Full-finetune/Loss (Raw)": 0.7437336444854736, "Full-finetune/Step": 4345, "Full-finetune/Step Time": 6.836578018963337} {"Full-finetune/Learning Rate": 1.3757881539714768e-06, "Full-finetune/Loss": 0.7359275817871094, "Full-finetune/Loss (Raw)": 0.7832847833633423, "Full-finetune/Step": 4346, "Full-finetune/Step Time": 6.839765580371022} {"Full-finetune/Learning Rate": 1.3726364524839687e-06, "Full-finetune/Loss": 0.7382975816726685, "Full-finetune/Loss (Raw)": 0.8713158965110779, "Full-finetune/Step": 4347, "Full-finetune/Step Time": 6.832363476976752} {"Full-finetune/Learning Rate": 1.369488099107814e-06, "Full-finetune/Loss": 0.7382032871246338, "Full-finetune/Loss (Raw)": 0.805061399936676, "Full-finetune/Step": 4348, "Full-finetune/Step Time": 6.838276538997889} {"Full-finetune/Learning Rate": 1.3663430950648326e-06, "Full-finetune/Loss": 0.7380257844924927, "Full-finetune/Loss (Raw)": 0.8721799254417419, "Full-finetune/Step": 4349, "Full-finetune/Step Time": 6.835181046277285} {"Full-finetune/Learning Rate": 1.363201441575539e-06, "Full-finetune/Loss": 0.735835075378418, "Full-finetune/Loss (Raw)": 0.5334736108779907, "Full-finetune/Step": 4350, "Full-finetune/Step Time": 6.845919108018279} {"Full-finetune/Learning Rate": 1.360063139859147e-06, "Full-finetune/Loss": 0.7353927493095398, "Full-finetune/Loss (Raw)": 0.8007740378379822, "Full-finetune/Step": 4351, "Full-finetune/Step Time": 6.846155816689134} {"Full-finetune/Learning Rate": 1.3569281911335686e-06, "Full-finetune/Loss": 0.736024022102356, "Full-finetune/Loss (Raw)": 0.7910947203636169, "Full-finetune/Step": 4352, "Full-finetune/Step Time": 6.838324531912804} {"Full-finetune/Learning Rate": 1.3537965966154177e-06, "Full-finetune/Loss": 0.7371277809143066, "Full-finetune/Loss (Raw)": 0.8267655372619629, "Full-finetune/Step": 4353, "Full-finetune/Step Time": 6.826021984219551} {"Full-finetune/Learning Rate": 1.3506683575200053e-06, "Full-finetune/Loss": 0.7358708381652832, "Full-finetune/Loss (Raw)": 0.7147939801216125, "Full-finetune/Step": 4354, "Full-finetune/Step Time": 6.824617015197873} {"Full-finetune/Learning Rate": 1.347543475061337e-06, "Full-finetune/Loss": 0.7344835996627808, "Full-finetune/Loss (Raw)": 0.8022642135620117, "Full-finetune/Step": 4355, "Full-finetune/Step Time": 6.811086600646377} {"Full-finetune/Learning Rate": 1.344421950452126e-06, "Full-finetune/Loss": 0.7347142696380615, "Full-finetune/Loss (Raw)": 0.8036355376243591, "Full-finetune/Step": 4356, "Full-finetune/Step Time": 6.8091285061091185} {"Full-finetune/Learning Rate": 1.341303784903767e-06, "Full-finetune/Loss": 0.7347768545150757, "Full-finetune/Loss (Raw)": 0.8542481660842896, "Full-finetune/Step": 4357, "Full-finetune/Step Time": 6.809151077643037} {"Full-finetune/Learning Rate": 1.3381889796263602e-06, "Full-finetune/Loss": 0.7390613555908203, "Full-finetune/Loss (Raw)": 0.8128306865692139, "Full-finetune/Step": 4358, "Full-finetune/Step Time": 6.800982177257538} {"Full-finetune/Learning Rate": 1.335077535828706e-06, "Full-finetune/Loss": 0.7406401634216309, "Full-finetune/Loss (Raw)": 0.7618228197097778, "Full-finetune/Step": 4359, "Full-finetune/Step Time": 6.762340612709522} {"Full-finetune/Learning Rate": 1.3319694547182916e-06, "Full-finetune/Loss": 0.7400888204574585, "Full-finetune/Loss (Raw)": 0.70730060338974, "Full-finetune/Step": 4360, "Full-finetune/Step Time": 6.754670398309827} {"Full-finetune/Learning Rate": 1.328864737501302e-06, "Full-finetune/Loss": 0.7428457736968994, "Full-finetune/Loss (Raw)": 0.9938726425170898, "Full-finetune/Step": 4361, "Full-finetune/Step Time": 6.763141050934792} {"Full-finetune/Learning Rate": 1.325763385382618e-06, "Full-finetune/Loss": 0.741408109664917, "Full-finetune/Loss (Raw)": 0.7698063850402832, "Full-finetune/Step": 4362, "Full-finetune/Step Time": 6.7656570468097925} {"Full-finetune/Learning Rate": 1.3226653995658144e-06, "Full-finetune/Loss": 0.7409851551055908, "Full-finetune/Loss (Raw)": 0.7484545111656189, "Full-finetune/Step": 4363, "Full-finetune/Step Time": 6.762459892779589} {"Full-finetune/Learning Rate": 1.319570781253159e-06, "Full-finetune/Loss": 0.7415428757667542, "Full-finetune/Loss (Raw)": 0.6970683336257935, "Full-finetune/Step": 4364, "Full-finetune/Step Time": 6.773883180692792} {"Full-finetune/Learning Rate": 1.3164795316456091e-06, "Full-finetune/Loss": 0.7397790551185608, "Full-finetune/Loss (Raw)": 0.675360381603241, "Full-finetune/Step": 4365, "Full-finetune/Step Time": 6.7885082848370075} {"Full-finetune/Learning Rate": 1.313391651942827e-06, "Full-finetune/Loss": 0.7396832704544067, "Full-finetune/Loss (Raw)": 0.8450139760971069, "Full-finetune/Step": 4366, "Full-finetune/Step Time": 6.777558632194996} {"Full-finetune/Learning Rate": 1.3103071433431501e-06, "Full-finetune/Loss": 0.7388948798179626, "Full-finetune/Loss (Raw)": 0.7150388360023499, "Full-finetune/Step": 4367, "Full-finetune/Step Time": 6.783713011071086} {"Full-finetune/Learning Rate": 1.307226007043617e-06, "Full-finetune/Loss": 0.7393983602523804, "Full-finetune/Loss (Raw)": 0.8219149708747864, "Full-finetune/Step": 4368, "Full-finetune/Step Time": 6.779476394876838} {"Full-finetune/Learning Rate": 1.30414824423996e-06, "Full-finetune/Loss": 0.7390190362930298, "Full-finetune/Loss (Raw)": 0.7344777584075928, "Full-finetune/Step": 4369, "Full-finetune/Step Time": 6.786343760788441} {"Full-finetune/Learning Rate": 1.301073856126598e-06, "Full-finetune/Loss": 0.739068865776062, "Full-finetune/Loss (Raw)": 0.8480625748634338, "Full-finetune/Step": 4370, "Full-finetune/Step Time": 6.789135502651334} {"Full-finetune/Learning Rate": 1.2980028438966396e-06, "Full-finetune/Loss": 0.7401351928710938, "Full-finetune/Loss (Raw)": 0.8784079551696777, "Full-finetune/Step": 4371, "Full-finetune/Step Time": 6.767284853383899} {"Full-finetune/Learning Rate": 1.2949352087418864e-06, "Full-finetune/Loss": 0.735621452331543, "Full-finetune/Loss (Raw)": 0.23621498048305511, "Full-finetune/Step": 4372, "Full-finetune/Step Time": 6.787084084004164} {"Full-finetune/Learning Rate": 1.291870951852826e-06, "Full-finetune/Loss": 0.7349424362182617, "Full-finetune/Loss (Raw)": 0.7047008872032166, "Full-finetune/Step": 4373, "Full-finetune/Step Time": 6.784015785902739} {"Full-finetune/Learning Rate": 1.288810074418637e-06, "Full-finetune/Loss": 0.735335111618042, "Full-finetune/Loss (Raw)": 0.7682594060897827, "Full-finetune/Step": 4374, "Full-finetune/Step Time": 6.750525813549757} {"Full-finetune/Learning Rate": 1.2857525776271852e-06, "Full-finetune/Loss": 0.7346211075782776, "Full-finetune/Loss (Raw)": 0.7355204820632935, "Full-finetune/Step": 4375, "Full-finetune/Step Time": 6.759326938539743} {"Full-finetune/Learning Rate": 1.2826984626650297e-06, "Full-finetune/Loss": 0.7381243705749512, "Full-finetune/Loss (Raw)": 0.7295517921447754, "Full-finetune/Step": 4376, "Full-finetune/Step Time": 6.755190458148718} {"Full-finetune/Learning Rate": 1.2796477307174082e-06, "Full-finetune/Loss": 0.7376464605331421, "Full-finetune/Loss (Raw)": 0.7828863263130188, "Full-finetune/Step": 4377, "Full-finetune/Step Time": 6.756535232067108} {"Full-finetune/Learning Rate": 1.2766003829682504e-06, "Full-finetune/Loss": 0.7388518452644348, "Full-finetune/Loss (Raw)": 0.7316526174545288, "Full-finetune/Step": 4378, "Full-finetune/Step Time": 6.766992015764117} {"Full-finetune/Learning Rate": 1.273556420600175e-06, "Full-finetune/Loss": 0.7383307218551636, "Full-finetune/Loss (Raw)": 0.6043682098388672, "Full-finetune/Step": 4379, "Full-finetune/Step Time": 6.778393194079399} {"Full-finetune/Learning Rate": 1.2705158447944843e-06, "Full-finetune/Loss": 0.7374932765960693, "Full-finetune/Loss (Raw)": 0.8740898370742798, "Full-finetune/Step": 4380, "Full-finetune/Step Time": 6.782044114544988} {"Full-finetune/Learning Rate": 1.2674786567311648e-06, "Full-finetune/Loss": 0.7397563457489014, "Full-finetune/Loss (Raw)": 0.8228947520256042, "Full-finetune/Step": 4381, "Full-finetune/Step Time": 6.779668493196368} {"Full-finetune/Learning Rate": 1.2644448575888913e-06, "Full-finetune/Loss": 0.7428357005119324, "Full-finetune/Loss (Raw)": 0.8748682141304016, "Full-finetune/Step": 4382, "Full-finetune/Step Time": 6.774452164769173} {"Full-finetune/Learning Rate": 1.2614144485450208e-06, "Full-finetune/Loss": 0.7422640323638916, "Full-finetune/Loss (Raw)": 0.6079090237617493, "Full-finetune/Step": 4383, "Full-finetune/Step Time": 6.789310520514846} {"Full-finetune/Learning Rate": 1.2583874307755961e-06, "Full-finetune/Loss": 0.7420501708984375, "Full-finetune/Loss (Raw)": 0.7711657881736755, "Full-finetune/Step": 4384, "Full-finetune/Step Time": 6.7759622018784285} {"Full-finetune/Learning Rate": 1.2553638054553418e-06, "Full-finetune/Loss": 0.7415786981582642, "Full-finetune/Loss (Raw)": 0.7648595571517944, "Full-finetune/Step": 4385, "Full-finetune/Step Time": 6.768762443214655} {"Full-finetune/Learning Rate": 1.252343573757674e-06, "Full-finetune/Loss": 0.7417185306549072, "Full-finetune/Loss (Raw)": 0.6297183632850647, "Full-finetune/Step": 4386, "Full-finetune/Step Time": 6.787039930000901} {"Full-finetune/Learning Rate": 1.2493267368546802e-06, "Full-finetune/Loss": 0.7421494722366333, "Full-finetune/Loss (Raw)": 0.9495707154273987, "Full-finetune/Step": 4387, "Full-finetune/Step Time": 6.775202939286828} {"Full-finetune/Learning Rate": 1.2463132959171343e-06, "Full-finetune/Loss": 0.7426217794418335, "Full-finetune/Loss (Raw)": 0.8107314705848694, "Full-finetune/Step": 4388, "Full-finetune/Step Time": 6.7807756960392} {"Full-finetune/Learning Rate": 1.2433032521145006e-06, "Full-finetune/Loss": 0.7425459027290344, "Full-finetune/Loss (Raw)": 0.7910618782043457, "Full-finetune/Step": 4389, "Full-finetune/Step Time": 6.779418170452118} {"Full-finetune/Learning Rate": 1.2402966066149135e-06, "Full-finetune/Loss": 0.7426561117172241, "Full-finetune/Loss (Raw)": 0.7593448162078857, "Full-finetune/Step": 4390, "Full-finetune/Step Time": 6.779040666297078} {"Full-finetune/Learning Rate": 1.2372933605851944e-06, "Full-finetune/Loss": 0.7412472367286682, "Full-finetune/Loss (Raw)": 0.7601272463798523, "Full-finetune/Step": 4391, "Full-finetune/Step Time": 6.7875327952206135} {"Full-finetune/Learning Rate": 1.2342935151908453e-06, "Full-finetune/Loss": 0.7390689849853516, "Full-finetune/Loss (Raw)": 0.34698575735092163, "Full-finetune/Step": 4392, "Full-finetune/Step Time": 6.809073762968183} {"Full-finetune/Learning Rate": 1.231297071596046e-06, "Full-finetune/Loss": 0.7384953498840332, "Full-finetune/Loss (Raw)": 0.6257436275482178, "Full-finetune/Step": 4393, "Full-finetune/Step Time": 6.817715236917138} {"Full-finetune/Learning Rate": 1.2283040309636596e-06, "Full-finetune/Loss": 0.7370376586914062, "Full-finetune/Loss (Raw)": 0.7239279747009277, "Full-finetune/Step": 4394, "Full-finetune/Step Time": 6.827687758952379} {"Full-finetune/Learning Rate": 1.2253143944552258e-06, "Full-finetune/Loss": 0.7381294965744019, "Full-finetune/Loss (Raw)": 0.7748517990112305, "Full-finetune/Step": 4395, "Full-finetune/Step Time": 6.818306701257825} {"Full-finetune/Learning Rate": 1.2223281632309636e-06, "Full-finetune/Loss": 0.7390130162239075, "Full-finetune/Loss (Raw)": 0.8214983940124512, "Full-finetune/Step": 4396, "Full-finetune/Step Time": 6.83678637072444} {"Full-finetune/Learning Rate": 1.2193453384497722e-06, "Full-finetune/Loss": 0.7380402684211731, "Full-finetune/Loss (Raw)": 0.4122316539287567, "Full-finetune/Step": 4397, "Full-finetune/Step Time": 6.812621988356113} {"Full-finetune/Learning Rate": 1.2163659212692246e-06, "Full-finetune/Loss": 0.7378686666488647, "Full-finetune/Loss (Raw)": 0.7562996745109558, "Full-finetune/Step": 4398, "Full-finetune/Step Time": 6.8242208026349545} {"Full-finetune/Learning Rate": 1.2133899128455796e-06, "Full-finetune/Loss": 0.7408057451248169, "Full-finetune/Loss (Raw)": 0.7016841769218445, "Full-finetune/Step": 4399, "Full-finetune/Step Time": 6.818552056327462} {"Full-finetune/Learning Rate": 1.2104173143337672e-06, "Full-finetune/Loss": 0.7404078245162964, "Full-finetune/Loss (Raw)": 0.7672531604766846, "Full-finetune/Step": 4400, "Full-finetune/Step Time": 6.82572628185153} {"Full-finetune/Learning Rate": 1.2074481268873894e-06, "Full-finetune/Loss": 0.7376651763916016, "Full-finetune/Loss (Raw)": 0.3241644501686096, "Full-finetune/Step": 4401, "Full-finetune/Step Time": 6.845018578693271} {"Full-finetune/Learning Rate": 1.2044823516587345e-06, "Full-finetune/Loss": 0.7367219924926758, "Full-finetune/Loss (Raw)": 0.6277866959571838, "Full-finetune/Step": 4402, "Full-finetune/Step Time": 6.862788289785385} {"Full-finetune/Learning Rate": 1.2015199897987616e-06, "Full-finetune/Loss": 0.7383949756622314, "Full-finetune/Loss (Raw)": 0.828740656375885, "Full-finetune/Step": 4403, "Full-finetune/Step Time": 6.836966259405017} {"Full-finetune/Learning Rate": 1.198561042457105e-06, "Full-finetune/Loss": 0.7393795847892761, "Full-finetune/Loss (Raw)": 0.9423387050628662, "Full-finetune/Step": 4404, "Full-finetune/Step Time": 6.838187590241432} {"Full-finetune/Learning Rate": 1.195605510782073e-06, "Full-finetune/Loss": 0.7396353483200073, "Full-finetune/Loss (Raw)": 0.7337724566459656, "Full-finetune/Step": 4405, "Full-finetune/Step Time": 6.827976364642382} {"Full-finetune/Learning Rate": 1.192653395920652e-06, "Full-finetune/Loss": 0.7377599477767944, "Full-finetune/Loss (Raw)": 0.622177004814148, "Full-finetune/Step": 4406, "Full-finetune/Step Time": 6.825164904817939} {"Full-finetune/Learning Rate": 1.189704699018499e-06, "Full-finetune/Loss": 0.7373777627944946, "Full-finetune/Loss (Raw)": 0.6578630805015564, "Full-finetune/Step": 4407, "Full-finetune/Step Time": 6.823549505323172} {"Full-finetune/Learning Rate": 1.186759421219943e-06, "Full-finetune/Loss": 0.7381277084350586, "Full-finetune/Loss (Raw)": 0.9320135712623596, "Full-finetune/Step": 4408, "Full-finetune/Step Time": 6.822434628382325} {"Full-finetune/Learning Rate": 1.1838175636679938e-06, "Full-finetune/Loss": 0.7363308668136597, "Full-finetune/Loss (Raw)": 0.6752707958221436, "Full-finetune/Step": 4409, "Full-finetune/Step Time": 6.821275567635894} {"Full-finetune/Learning Rate": 1.1808791275043297e-06, "Full-finetune/Loss": 0.7360353469848633, "Full-finetune/Loss (Raw)": 0.7950636148452759, "Full-finetune/Step": 4410, "Full-finetune/Step Time": 6.818373564630747} {"Full-finetune/Learning Rate": 1.1779441138692926e-06, "Full-finetune/Loss": 0.736051619052887, "Full-finetune/Loss (Raw)": 0.7683961391448975, "Full-finetune/Step": 4411, "Full-finetune/Step Time": 6.802092362195253} {"Full-finetune/Learning Rate": 1.1750125239019118e-06, "Full-finetune/Loss": 0.7355167865753174, "Full-finetune/Loss (Raw)": 0.7371086478233337, "Full-finetune/Step": 4412, "Full-finetune/Step Time": 6.793090900406241} {"Full-finetune/Learning Rate": 1.1720843587398756e-06, "Full-finetune/Loss": 0.7385549545288086, "Full-finetune/Loss (Raw)": 0.9852614998817444, "Full-finetune/Step": 4413, "Full-finetune/Step Time": 6.756158361211419} {"Full-finetune/Learning Rate": 1.1691596195195498e-06, "Full-finetune/Loss": 0.7383872270584106, "Full-finetune/Loss (Raw)": 0.7343103289604187, "Full-finetune/Step": 4414, "Full-finetune/Step Time": 6.7553641982376575} {"Full-finetune/Learning Rate": 1.1662383073759686e-06, "Full-finetune/Loss": 0.7387295961380005, "Full-finetune/Loss (Raw)": 0.858767032623291, "Full-finetune/Step": 4415, "Full-finetune/Step Time": 6.760640945285559} {"Full-finetune/Learning Rate": 1.1633204234428352e-06, "Full-finetune/Loss": 0.7370381951332092, "Full-finetune/Loss (Raw)": 0.6759377121925354, "Full-finetune/Step": 4416, "Full-finetune/Step Time": 6.761734638363123} {"Full-finetune/Learning Rate": 1.1604059688525238e-06, "Full-finetune/Loss": 0.7382606267929077, "Full-finetune/Loss (Raw)": 0.8867905735969543, "Full-finetune/Step": 4417, "Full-finetune/Step Time": 6.762869523838162} {"Full-finetune/Learning Rate": 1.157494944736075e-06, "Full-finetune/Loss": 0.7374610900878906, "Full-finetune/Loss (Raw)": 0.7736381888389587, "Full-finetune/Step": 4418, "Full-finetune/Step Time": 6.7619694620370865} {"Full-finetune/Learning Rate": 1.1545873522232055e-06, "Full-finetune/Loss": 0.7371610999107361, "Full-finetune/Loss (Raw)": 0.8402106761932373, "Full-finetune/Step": 4419, "Full-finetune/Step Time": 6.767412610352039} {"Full-finetune/Learning Rate": 1.1516831924422945e-06, "Full-finetune/Loss": 0.7359470129013062, "Full-finetune/Loss (Raw)": 0.6825339198112488, "Full-finetune/Step": 4420, "Full-finetune/Step Time": 6.768683020025492} {"Full-finetune/Learning Rate": 1.1487824665203828e-06, "Full-finetune/Loss": 0.7353450059890747, "Full-finetune/Loss (Raw)": 0.7416388988494873, "Full-finetune/Step": 4421, "Full-finetune/Step Time": 6.766379456967115} {"Full-finetune/Learning Rate": 1.1458851755831934e-06, "Full-finetune/Loss": 0.7354134321212769, "Full-finetune/Loss (Raw)": 0.763658881187439, "Full-finetune/Step": 4422, "Full-finetune/Step Time": 6.749316560104489} {"Full-finetune/Learning Rate": 1.1429913207551046e-06, "Full-finetune/Loss": 0.7378062605857849, "Full-finetune/Loss (Raw)": 0.6031589508056641, "Full-finetune/Step": 4423, "Full-finetune/Step Time": 6.735064793378115} {"Full-finetune/Learning Rate": 1.1401009031591658e-06, "Full-finetune/Loss": 0.7331920862197876, "Full-finetune/Loss (Raw)": 0.3289370536804199, "Full-finetune/Step": 4424, "Full-finetune/Step Time": 6.757491447031498} {"Full-finetune/Learning Rate": 1.137213923917092e-06, "Full-finetune/Loss": 0.7313473224639893, "Full-finetune/Loss (Raw)": 0.6076183319091797, "Full-finetune/Step": 4425, "Full-finetune/Step Time": 6.773927487432957} {"Full-finetune/Learning Rate": 1.1343303841492626e-06, "Full-finetune/Loss": 0.7332415580749512, "Full-finetune/Loss (Raw)": 0.8345949649810791, "Full-finetune/Step": 4426, "Full-finetune/Step Time": 6.770387943834066} {"Full-finetune/Learning Rate": 1.1314502849747244e-06, "Full-finetune/Loss": 0.731637716293335, "Full-finetune/Loss (Raw)": 0.5984737873077393, "Full-finetune/Step": 4427, "Full-finetune/Step Time": 6.779943224042654} {"Full-finetune/Learning Rate": 1.1285736275111836e-06, "Full-finetune/Loss": 0.7309462428092957, "Full-finetune/Loss (Raw)": 0.7923433184623718, "Full-finetune/Step": 4428, "Full-finetune/Step Time": 6.7856379970908165} {"Full-finetune/Learning Rate": 1.1257004128750205e-06, "Full-finetune/Loss": 0.7341524958610535, "Full-finetune/Loss (Raw)": 0.7684110999107361, "Full-finetune/Step": 4429, "Full-finetune/Step Time": 6.76864523999393} {"Full-finetune/Learning Rate": 1.122830642181273e-06, "Full-finetune/Loss": 0.7319618463516235, "Full-finetune/Loss (Raw)": 0.6067437529563904, "Full-finetune/Step": 4430, "Full-finetune/Step Time": 6.806235374882817} {"Full-finetune/Learning Rate": 1.119964316543637e-06, "Full-finetune/Loss": 0.7307322025299072, "Full-finetune/Loss (Raw)": 0.7517024874687195, "Full-finetune/Step": 4431, "Full-finetune/Step Time": 6.814216066151857} {"Full-finetune/Learning Rate": 1.1171014370744837e-06, "Full-finetune/Loss": 0.7346219420433044, "Full-finetune/Loss (Raw)": 0.8270424008369446, "Full-finetune/Step": 4432, "Full-finetune/Step Time": 6.8025492783635855} {"Full-finetune/Learning Rate": 1.114242004884839e-06, "Full-finetune/Loss": 0.7340877056121826, "Full-finetune/Loss (Raw)": 0.5837287902832031, "Full-finetune/Step": 4433, "Full-finetune/Step Time": 6.806582907214761} {"Full-finetune/Learning Rate": 1.111386021084394e-06, "Full-finetune/Loss": 0.7352889776229858, "Full-finetune/Loss (Raw)": 0.8575564622879028, "Full-finetune/Step": 4434, "Full-finetune/Step Time": 6.802161293104291} {"Full-finetune/Learning Rate": 1.1085334867814946e-06, "Full-finetune/Loss": 0.7369999885559082, "Full-finetune/Loss (Raw)": 0.7923333644866943, "Full-finetune/Step": 4435, "Full-finetune/Step Time": 6.797073548659682} {"Full-finetune/Learning Rate": 1.1056844030831603e-06, "Full-finetune/Loss": 0.7364603281021118, "Full-finetune/Loss (Raw)": 0.6146590709686279, "Full-finetune/Step": 4436, "Full-finetune/Step Time": 6.8097924049943686} {"Full-finetune/Learning Rate": 1.1028387710950616e-06, "Full-finetune/Loss": 0.736356258392334, "Full-finetune/Loss (Raw)": 0.7151334285736084, "Full-finetune/Step": 4437, "Full-finetune/Step Time": 6.810964768752456} {"Full-finetune/Learning Rate": 1.0999965919215327e-06, "Full-finetune/Loss": 0.7399650812149048, "Full-finetune/Loss (Raw)": 0.8062530159950256, "Full-finetune/Step": 4438, "Full-finetune/Step Time": 6.79437081515789} {"Full-finetune/Learning Rate": 1.0971578666655713e-06, "Full-finetune/Loss": 0.7410796880722046, "Full-finetune/Loss (Raw)": 0.9243940114974976, "Full-finetune/Step": 4439, "Full-finetune/Step Time": 6.801547491922975} {"Full-finetune/Learning Rate": 1.0943225964288272e-06, "Full-finetune/Loss": 0.7411920428276062, "Full-finetune/Loss (Raw)": 0.8653661012649536, "Full-finetune/Step": 4440, "Full-finetune/Step Time": 6.800598591566086} {"Full-finetune/Learning Rate": 1.091490782311614e-06, "Full-finetune/Loss": 0.7410783767700195, "Full-finetune/Loss (Raw)": 0.8755597472190857, "Full-finetune/Step": 4441, "Full-finetune/Step Time": 6.795504437759519} {"Full-finetune/Learning Rate": 1.088662425412903e-06, "Full-finetune/Loss": 0.7402921915054321, "Full-finetune/Loss (Raw)": 0.753392219543457, "Full-finetune/Step": 4442, "Full-finetune/Step Time": 6.8105206079781055} {"Full-finetune/Learning Rate": 1.0858375268303267e-06, "Full-finetune/Loss": 0.740630567073822, "Full-finetune/Loss (Raw)": 0.7956463098526001, "Full-finetune/Step": 4443, "Full-finetune/Step Time": 6.8112203404307365} {"Full-finetune/Learning Rate": 1.0830160876601737e-06, "Full-finetune/Loss": 0.7408633232116699, "Full-finetune/Loss (Raw)": 0.6949582695960999, "Full-finetune/Step": 4444, "Full-finetune/Step Time": 6.802257979288697} {"Full-finetune/Learning Rate": 1.0801981089973844e-06, "Full-finetune/Loss": 0.7402326464653015, "Full-finetune/Loss (Raw)": 0.6887857913970947, "Full-finetune/Step": 4445, "Full-finetune/Step Time": 6.805273689329624} {"Full-finetune/Learning Rate": 1.0773835919355669e-06, "Full-finetune/Loss": 0.7422654628753662, "Full-finetune/Loss (Raw)": 0.8644806742668152, "Full-finetune/Step": 4446, "Full-finetune/Step Time": 6.807745194062591} {"Full-finetune/Learning Rate": 1.0745725375669768e-06, "Full-finetune/Loss": 0.7436676621437073, "Full-finetune/Loss (Raw)": 0.7660766243934631, "Full-finetune/Step": 4447, "Full-finetune/Step Time": 6.798716867342591} {"Full-finetune/Learning Rate": 1.0717649469825298e-06, "Full-finetune/Loss": 0.7439548373222351, "Full-finetune/Loss (Raw)": 0.7741761803627014, "Full-finetune/Step": 4448, "Full-finetune/Step Time": 6.797699591144919} {"Full-finetune/Learning Rate": 1.0689608212718005e-06, "Full-finetune/Loss": 0.7462859153747559, "Full-finetune/Loss (Raw)": 0.8874809145927429, "Full-finetune/Step": 4449, "Full-finetune/Step Time": 6.785383004695177} {"Full-finetune/Learning Rate": 1.0661601615230122e-06, "Full-finetune/Loss": 0.7448980808258057, "Full-finetune/Loss (Raw)": 0.6941618323326111, "Full-finetune/Step": 4450, "Full-finetune/Step Time": 6.779633713886142} {"Full-finetune/Learning Rate": 1.0633629688230452e-06, "Full-finetune/Loss": 0.7451586127281189, "Full-finetune/Loss (Raw)": 0.6186904907226562, "Full-finetune/Step": 4451, "Full-finetune/Step Time": 6.785530287772417} {"Full-finetune/Learning Rate": 1.0605692442574356e-06, "Full-finetune/Loss": 0.7419651746749878, "Full-finetune/Loss (Raw)": 0.34340551495552063, "Full-finetune/Step": 4452, "Full-finetune/Step Time": 6.813771991059184} {"Full-finetune/Learning Rate": 1.0577789889103763e-06, "Full-finetune/Loss": 0.743426501750946, "Full-finetune/Loss (Raw)": 0.7007416486740112, "Full-finetune/Step": 4453, "Full-finetune/Step Time": 6.80641170963645} {"Full-finetune/Learning Rate": 1.054992203864712e-06, "Full-finetune/Loss": 0.7440599203109741, "Full-finetune/Loss (Raw)": 0.7239404320716858, "Full-finetune/Step": 4454, "Full-finetune/Step Time": 6.804426791146398} {"Full-finetune/Learning Rate": 1.0522088902019324e-06, "Full-finetune/Loss": 0.7449174523353577, "Full-finetune/Loss (Raw)": 0.6235193610191345, "Full-finetune/Step": 4455, "Full-finetune/Step Time": 6.802165746688843} {"Full-finetune/Learning Rate": 1.049429049002193e-06, "Full-finetune/Loss": 0.7448314428329468, "Full-finetune/Loss (Raw)": 0.7288257479667664, "Full-finetune/Step": 4456, "Full-finetune/Step Time": 6.804568627849221} {"Full-finetune/Learning Rate": 1.0466526813442957e-06, "Full-finetune/Loss": 0.7437583208084106, "Full-finetune/Loss (Raw)": 0.6488367915153503, "Full-finetune/Step": 4457, "Full-finetune/Step Time": 6.815929824486375} {"Full-finetune/Learning Rate": 1.0438797883056927e-06, "Full-finetune/Loss": 0.7425181865692139, "Full-finetune/Loss (Raw)": 0.6832966208457947, "Full-finetune/Step": 4458, "Full-finetune/Step Time": 6.830088069662452} {"Full-finetune/Learning Rate": 1.0411103709624903e-06, "Full-finetune/Loss": 0.7414639592170715, "Full-finetune/Loss (Raw)": 0.6972171664237976, "Full-finetune/Step": 4459, "Full-finetune/Step Time": 6.835966357961297} {"Full-finetune/Learning Rate": 1.0383444303894453e-06, "Full-finetune/Loss": 0.7420629262924194, "Full-finetune/Loss (Raw)": 0.8675808906555176, "Full-finetune/Step": 4460, "Full-finetune/Step Time": 6.835507465526462} {"Full-finetune/Learning Rate": 1.0355819676599655e-06, "Full-finetune/Loss": 0.7408808469772339, "Full-finetune/Loss (Raw)": 0.6872649192810059, "Full-finetune/Step": 4461, "Full-finetune/Step Time": 6.83495401032269} {"Full-finetune/Learning Rate": 1.0328229838461069e-06, "Full-finetune/Loss": 0.7399418354034424, "Full-finetune/Loss (Raw)": 0.7640169262886047, "Full-finetune/Step": 4462, "Full-finetune/Step Time": 6.848154243081808} {"Full-finetune/Learning Rate": 1.0300674800185795e-06, "Full-finetune/Loss": 0.7377797961235046, "Full-finetune/Loss (Raw)": 0.5223193764686584, "Full-finetune/Step": 4463, "Full-finetune/Step Time": 6.857317589223385} {"Full-finetune/Learning Rate": 1.0273154572467436e-06, "Full-finetune/Loss": 0.7367287874221802, "Full-finetune/Loss (Raw)": 0.7546212077140808, "Full-finetune/Step": 4464, "Full-finetune/Step Time": 6.860891254618764} {"Full-finetune/Learning Rate": 1.0245669165985973e-06, "Full-finetune/Loss": 0.7381391525268555, "Full-finetune/Loss (Raw)": 0.7145017385482788, "Full-finetune/Step": 4465, "Full-finetune/Step Time": 6.838181424885988} {"Full-finetune/Learning Rate": 1.0218218591408013e-06, "Full-finetune/Loss": 0.7377936840057373, "Full-finetune/Loss (Raw)": 0.7441447973251343, "Full-finetune/Step": 4466, "Full-finetune/Step Time": 6.836821345612407} {"Full-finetune/Learning Rate": 1.0190802859386585e-06, "Full-finetune/Loss": 0.7384108304977417, "Full-finetune/Loss (Raw)": 0.8202961683273315, "Full-finetune/Step": 4467, "Full-finetune/Step Time": 6.831579660996795} {"Full-finetune/Learning Rate": 1.0163421980561184e-06, "Full-finetune/Loss": 0.7388641834259033, "Full-finetune/Loss (Raw)": 0.7444573044776917, "Full-finetune/Step": 4468, "Full-finetune/Step Time": 6.808856623247266} {"Full-finetune/Learning Rate": 1.0136075965557812e-06, "Full-finetune/Loss": 0.7376617789268494, "Full-finetune/Loss (Raw)": 0.7610981464385986, "Full-finetune/Step": 4469, "Full-finetune/Step Time": 6.798690581694245} {"Full-finetune/Learning Rate": 1.0108764824988903e-06, "Full-finetune/Loss": 0.7382875680923462, "Full-finetune/Loss (Raw)": 0.7678235173225403, "Full-finetune/Step": 4470, "Full-finetune/Step Time": 6.760266864672303} {"Full-finetune/Learning Rate": 1.008148856945339e-06, "Full-finetune/Loss": 0.7377488017082214, "Full-finetune/Loss (Raw)": 0.6093800067901611, "Full-finetune/Step": 4471, "Full-finetune/Step Time": 6.773797694593668} {"Full-finetune/Learning Rate": 1.0054247209536628e-06, "Full-finetune/Loss": 0.7377982139587402, "Full-finetune/Loss (Raw)": 0.7995492219924927, "Full-finetune/Step": 4472, "Full-finetune/Step Time": 6.7644082326442} {"Full-finetune/Learning Rate": 1.0027040755810513e-06, "Full-finetune/Loss": 0.7396565675735474, "Full-finetune/Loss (Raw)": 0.9816075563430786, "Full-finetune/Step": 4473, "Full-finetune/Step Time": 6.753836818039417} {"Full-finetune/Learning Rate": 9.999869218833313e-07, "Full-finetune/Loss": 0.7399773597717285, "Full-finetune/Loss (Raw)": 0.8243429064750671, "Full-finetune/Step": 4474, "Full-finetune/Step Time": 6.752877106890082} {"Full-finetune/Learning Rate": 9.972732609149738e-07, "Full-finetune/Loss": 0.7384332418441772, "Full-finetune/Loss (Raw)": 0.6736621260643005, "Full-finetune/Step": 4475, "Full-finetune/Step Time": 6.774845220148563} {"Full-finetune/Learning Rate": 9.945630937291006e-07, "Full-finetune/Loss": 0.7387665510177612, "Full-finetune/Loss (Raw)": 0.8477340936660767, "Full-finetune/Step": 4476, "Full-finetune/Step Time": 6.777178533375263} {"Full-finetune/Learning Rate": 9.918564213774762e-07, "Full-finetune/Loss": 0.7374637722969055, "Full-finetune/Loss (Raw)": 0.7054201364517212, "Full-finetune/Step": 4477, "Full-finetune/Step Time": 6.777762819081545} {"Full-finetune/Learning Rate": 9.891532449105045e-07, "Full-finetune/Loss": 0.7399317026138306, "Full-finetune/Loss (Raw)": 0.8493623733520508, "Full-finetune/Step": 4478, "Full-finetune/Step Time": 6.761126456782222} {"Full-finetune/Learning Rate": 9.864535653772367e-07, "Full-finetune/Loss": 0.7398681044578552, "Full-finetune/Loss (Raw)": 0.7926353812217712, "Full-finetune/Step": 4479, "Full-finetune/Step Time": 6.771040722727776} {"Full-finetune/Learning Rate": 9.837573838253655e-07, "Full-finetune/Loss": 0.7387763857841492, "Full-finetune/Loss (Raw)": 0.6513601541519165, "Full-finetune/Step": 4480, "Full-finetune/Step Time": 6.776340000331402} {"Full-finetune/Learning Rate": 9.810647013012265e-07, "Full-finetune/Loss": 0.7378277778625488, "Full-finetune/Loss (Raw)": 0.7053410410881042, "Full-finetune/Step": 4481, "Full-finetune/Step Time": 6.779392970725894} {"Full-finetune/Learning Rate": 9.783755188497944e-07, "Full-finetune/Loss": 0.7376929521560669, "Full-finetune/Loss (Raw)": 0.6975399255752563, "Full-finetune/Step": 4482, "Full-finetune/Step Time": 6.794256364926696} {"Full-finetune/Learning Rate": 9.75689837514696e-07, "Full-finetune/Loss": 0.7376177906990051, "Full-finetune/Loss (Raw)": 0.7926437854766846, "Full-finetune/Step": 4483, "Full-finetune/Step Time": 6.791955199092627} {"Full-finetune/Learning Rate": 9.730076583381841e-07, "Full-finetune/Loss": 0.7381764650344849, "Full-finetune/Loss (Raw)": 0.8751447200775146, "Full-finetune/Step": 4484, "Full-finetune/Step Time": 6.80839179456234} {"Full-finetune/Learning Rate": 9.703289823611606e-07, "Full-finetune/Loss": 0.7373825311660767, "Full-finetune/Loss (Raw)": 0.7526169419288635, "Full-finetune/Step": 4485, "Full-finetune/Step Time": 6.809342380613089} {"Full-finetune/Learning Rate": 9.676538106231725e-07, "Full-finetune/Loss": 0.7367468476295471, "Full-finetune/Loss (Raw)": 0.7314718961715698, "Full-finetune/Step": 4486, "Full-finetune/Step Time": 6.806008245795965} {"Full-finetune/Learning Rate": 9.649821441623986e-07, "Full-finetune/Loss": 0.7332943081855774, "Full-finetune/Loss (Raw)": 0.31989145278930664, "Full-finetune/Step": 4487, "Full-finetune/Step Time": 6.825845282524824} {"Full-finetune/Learning Rate": 9.623139840156604e-07, "Full-finetune/Loss": 0.7339062690734863, "Full-finetune/Loss (Raw)": 0.7856310606002808, "Full-finetune/Step": 4488, "Full-finetune/Step Time": 6.832892956212163} {"Full-finetune/Learning Rate": 9.596493312184197e-07, "Full-finetune/Loss": 0.7298380136489868, "Full-finetune/Loss (Raw)": 0.473139226436615, "Full-finetune/Step": 4489, "Full-finetune/Step Time": 6.823719706386328} {"Full-finetune/Learning Rate": 9.569881868047747e-07, "Full-finetune/Loss": 0.7289528250694275, "Full-finetune/Loss (Raw)": 0.6565032601356506, "Full-finetune/Step": 4490, "Full-finetune/Step Time": 6.828103521838784} {"Full-finetune/Learning Rate": 9.543305518074652e-07, "Full-finetune/Loss": 0.7288473844528198, "Full-finetune/Loss (Raw)": 0.7349578738212585, "Full-finetune/Step": 4491, "Full-finetune/Step Time": 6.829062322154641} {"Full-finetune/Learning Rate": 9.516764272578638e-07, "Full-finetune/Loss": 0.7297471165657043, "Full-finetune/Loss (Raw)": 0.8122383952140808, "Full-finetune/Step": 4492, "Full-finetune/Step Time": 6.812336266040802} {"Full-finetune/Learning Rate": 9.49025814185992e-07, "Full-finetune/Loss": 0.7301070690155029, "Full-finetune/Loss (Raw)": 0.7214321494102478, "Full-finetune/Step": 4493, "Full-finetune/Step Time": 6.807981893420219} {"Full-finetune/Learning Rate": 9.463787136204938e-07, "Full-finetune/Loss": 0.7280855178833008, "Full-finetune/Loss (Raw)": 0.5862574577331543, "Full-finetune/Step": 4494, "Full-finetune/Step Time": 6.81365286372602} {"Full-finetune/Learning Rate": 9.437351265886585e-07, "Full-finetune/Loss": 0.7285223007202148, "Full-finetune/Loss (Raw)": 0.7709423303604126, "Full-finetune/Step": 4495, "Full-finetune/Step Time": 6.814189435914159} {"Full-finetune/Learning Rate": 9.410950541164143e-07, "Full-finetune/Loss": 0.7275222539901733, "Full-finetune/Loss (Raw)": 0.6939085721969604, "Full-finetune/Step": 4496, "Full-finetune/Step Time": 6.8223488591611385} {"Full-finetune/Learning Rate": 9.384584972283184e-07, "Full-finetune/Loss": 0.7278473973274231, "Full-finetune/Loss (Raw)": 0.7760935425758362, "Full-finetune/Step": 4497, "Full-finetune/Step Time": 6.825124446302652} {"Full-finetune/Learning Rate": 9.358254569475689e-07, "Full-finetune/Loss": 0.7265010476112366, "Full-finetune/Loss (Raw)": 0.6757307052612305, "Full-finetune/Step": 4498, "Full-finetune/Step Time": 6.830346290022135} {"Full-finetune/Learning Rate": 9.331959342959951e-07, "Full-finetune/Loss": 0.726393461227417, "Full-finetune/Loss (Raw)": 0.864641547203064, "Full-finetune/Step": 4499, "Full-finetune/Step Time": 6.830873237922788} {"Full-finetune/Learning Rate": 9.305699302940662e-07, "Full-finetune/Loss": 0.7300132513046265, "Full-finetune/Loss (Raw)": 0.6995472311973572, "Full-finetune/Step": 4500, "Full-finetune/Step Time": 6.819761458784342} {"Full-finetune/Learning Rate": 9.279474459608806e-07, "Full-finetune/Loss": 0.7313343286514282, "Full-finetune/Loss (Raw)": 0.8737940192222595, "Full-finetune/Step": 4501, "Full-finetune/Step Time": 6.82870583422482} {"Full-finetune/Learning Rate": 9.253284823141728e-07, "Full-finetune/Loss": 0.7304404973983765, "Full-finetune/Loss (Raw)": 0.6538574695587158, "Full-finetune/Step": 4502, "Full-finetune/Step Time": 6.833765113726258} {"Full-finetune/Learning Rate": 9.227130403703178e-07, "Full-finetune/Loss": 0.7313310503959656, "Full-finetune/Loss (Raw)": 0.8495048880577087, "Full-finetune/Step": 4503, "Full-finetune/Step Time": 6.8235934022814035} {"Full-finetune/Learning Rate": 9.201011211443101e-07, "Full-finetune/Loss": 0.7315536737442017, "Full-finetune/Loss (Raw)": 0.7580521106719971, "Full-finetune/Step": 4504, "Full-finetune/Step Time": 6.824634701013565} {"Full-finetune/Learning Rate": 9.174927256497846e-07, "Full-finetune/Loss": 0.7312649488449097, "Full-finetune/Loss (Raw)": 0.7459222674369812, "Full-finetune/Step": 4505, "Full-finetune/Step Time": 6.824171286076307} {"Full-finetune/Learning Rate": 9.148878548990137e-07, "Full-finetune/Loss": 0.7329715490341187, "Full-finetune/Loss (Raw)": 0.9501037001609802, "Full-finetune/Step": 4506, "Full-finetune/Step Time": 6.803008070215583} {"Full-finetune/Learning Rate": 9.122865099028944e-07, "Full-finetune/Loss": 0.7306669354438782, "Full-finetune/Loss (Raw)": 0.30938267707824707, "Full-finetune/Step": 4507, "Full-finetune/Step Time": 6.808052258566022} {"Full-finetune/Learning Rate": 9.09688691670958e-07, "Full-finetune/Loss": 0.7296879887580872, "Full-finetune/Loss (Raw)": 0.7487805485725403, "Full-finetune/Step": 4508, "Full-finetune/Step Time": 6.8010049238801} {"Full-finetune/Learning Rate": 9.070944012113669e-07, "Full-finetune/Loss": 0.7288026809692383, "Full-finetune/Loss (Raw)": 0.7095754146575928, "Full-finetune/Step": 4509, "Full-finetune/Step Time": 6.7897900473326445} {"Full-finetune/Learning Rate": 9.045036395309148e-07, "Full-finetune/Loss": 0.7285430431365967, "Full-finetune/Loss (Raw)": 0.8416392207145691, "Full-finetune/Step": 4510, "Full-finetune/Step Time": 6.785280676558614} {"Full-finetune/Learning Rate": 9.019164076350262e-07, "Full-finetune/Loss": 0.731134295463562, "Full-finetune/Loss (Raw)": 0.9395833015441895, "Full-finetune/Step": 4511, "Full-finetune/Step Time": 6.782172080129385} {"Full-finetune/Learning Rate": 8.993327065277524e-07, "Full-finetune/Loss": 0.727839469909668, "Full-finetune/Loss (Raw)": 0.34942692518234253, "Full-finetune/Step": 4512, "Full-finetune/Step Time": 6.7956782057881355} {"Full-finetune/Learning Rate": 8.967525372117825e-07, "Full-finetune/Loss": 0.7278881072998047, "Full-finetune/Loss (Raw)": 0.7710832357406616, "Full-finetune/Step": 4513, "Full-finetune/Step Time": 6.8013810608536005} {"Full-finetune/Learning Rate": 8.941759006884265e-07, "Full-finetune/Loss": 0.7281079292297363, "Full-finetune/Loss (Raw)": 0.6578555107116699, "Full-finetune/Step": 4514, "Full-finetune/Step Time": 6.782563952729106} {"Full-finetune/Learning Rate": 8.916027979576247e-07, "Full-finetune/Loss": 0.726627767086029, "Full-finetune/Loss (Raw)": 0.7601165771484375, "Full-finetune/Step": 4515, "Full-finetune/Step Time": 6.785803573206067} {"Full-finetune/Learning Rate": 8.890332300179516e-07, "Full-finetune/Loss": 0.7250417470932007, "Full-finetune/Loss (Raw)": 0.6077200174331665, "Full-finetune/Step": 4516, "Full-finetune/Step Time": 6.7800559643656015} {"Full-finetune/Learning Rate": 8.864671978666084e-07, "Full-finetune/Loss": 0.7239891290664673, "Full-finetune/Loss (Raw)": 0.6563199758529663, "Full-finetune/Step": 4517, "Full-finetune/Step Time": 6.792662752792239} {"Full-finetune/Learning Rate": 8.839047024994152e-07, "Full-finetune/Loss": 0.725204348564148, "Full-finetune/Loss (Raw)": 0.9149029850959778, "Full-finetune/Step": 4518, "Full-finetune/Step Time": 6.787757208570838} {"Full-finetune/Learning Rate": 8.813457449108309e-07, "Full-finetune/Loss": 0.7261343598365784, "Full-finetune/Loss (Raw)": 0.8791612386703491, "Full-finetune/Step": 4519, "Full-finetune/Step Time": 6.791187820956111} {"Full-finetune/Learning Rate": 8.787903260939368e-07, "Full-finetune/Loss": 0.7301186323165894, "Full-finetune/Loss (Raw)": 0.8569784164428711, "Full-finetune/Step": 4520, "Full-finetune/Step Time": 6.760790018364787} {"Full-finetune/Learning Rate": 8.762384470404417e-07, "Full-finetune/Loss": 0.7322176694869995, "Full-finetune/Loss (Raw)": 0.8944188356399536, "Full-finetune/Step": 4521, "Full-finetune/Step Time": 6.747811734676361} {"Full-finetune/Learning Rate": 8.736901087406779e-07, "Full-finetune/Loss": 0.7321508526802063, "Full-finetune/Loss (Raw)": 0.7153714299201965, "Full-finetune/Step": 4522, "Full-finetune/Step Time": 6.744701558724046} {"Full-finetune/Learning Rate": 8.711453121836066e-07, "Full-finetune/Loss": 0.7322403788566589, "Full-finetune/Loss (Raw)": 0.7863157987594604, "Full-finetune/Step": 4523, "Full-finetune/Step Time": 6.748603427782655} {"Full-finetune/Learning Rate": 8.686040583568134e-07, "Full-finetune/Loss": 0.732111930847168, "Full-finetune/Loss (Raw)": 0.8050580024719238, "Full-finetune/Step": 4524, "Full-finetune/Step Time": 6.733357205986977} {"Full-finetune/Learning Rate": 8.660663482465093e-07, "Full-finetune/Loss": 0.7349303960800171, "Full-finetune/Loss (Raw)": 0.7729892134666443, "Full-finetune/Step": 4525, "Full-finetune/Step Time": 6.717387184500694} {"Full-finetune/Learning Rate": 8.63532182837531e-07, "Full-finetune/Loss": 0.7333822250366211, "Full-finetune/Loss (Raw)": 0.5581418871879578, "Full-finetune/Step": 4526, "Full-finetune/Step Time": 6.703635808080435} {"Full-finetune/Learning Rate": 8.610015631133395e-07, "Full-finetune/Loss": 0.7312973141670227, "Full-finetune/Loss (Raw)": 0.43480876088142395, "Full-finetune/Step": 4527, "Full-finetune/Step Time": 6.7119639571756124} {"Full-finetune/Learning Rate": 8.584744900560149e-07, "Full-finetune/Loss": 0.7308993339538574, "Full-finetune/Loss (Raw)": 0.7163037061691284, "Full-finetune/Step": 4528, "Full-finetune/Step Time": 6.703226504847407} {"Full-finetune/Learning Rate": 8.559509646462693e-07, "Full-finetune/Loss": 0.7345848083496094, "Full-finetune/Loss (Raw)": 0.7959074974060059, "Full-finetune/Step": 4529, "Full-finetune/Step Time": 6.687714349478483} {"Full-finetune/Learning Rate": 8.534309878634317e-07, "Full-finetune/Loss": 0.7364745140075684, "Full-finetune/Loss (Raw)": 0.8696680665016174, "Full-finetune/Step": 4530, "Full-finetune/Step Time": 6.671928063035011} {"Full-finetune/Learning Rate": 8.509145606854552e-07, "Full-finetune/Loss": 0.736987829208374, "Full-finetune/Loss (Raw)": 0.8944509029388428, "Full-finetune/Step": 4531, "Full-finetune/Step Time": 6.67840252071619} {"Full-finetune/Learning Rate": 8.484016840889176e-07, "Full-finetune/Loss": 0.7343724370002747, "Full-finetune/Loss (Raw)": 0.6075728535652161, "Full-finetune/Step": 4532, "Full-finetune/Step Time": 6.6879688911139965} {"Full-finetune/Learning Rate": 8.458923590490165e-07, "Full-finetune/Loss": 0.7348929643630981, "Full-finetune/Loss (Raw)": 0.8003999590873718, "Full-finetune/Step": 4533, "Full-finetune/Step Time": 6.680905239656568} {"Full-finetune/Learning Rate": 8.433865865395718e-07, "Full-finetune/Loss": 0.7326194047927856, "Full-finetune/Loss (Raw)": 0.33116063475608826, "Full-finetune/Step": 4534, "Full-finetune/Step Time": 6.699450850486755} {"Full-finetune/Learning Rate": 8.408843675330225e-07, "Full-finetune/Loss": 0.7324925065040588, "Full-finetune/Loss (Raw)": 0.6416198015213013, "Full-finetune/Step": 4535, "Full-finetune/Step Time": 6.707743600010872} {"Full-finetune/Learning Rate": 8.383857030004361e-07, "Full-finetune/Loss": 0.7312268614768982, "Full-finetune/Loss (Raw)": 0.7700067162513733, "Full-finetune/Step": 4536, "Full-finetune/Step Time": 6.7177539467811584} {"Full-finetune/Learning Rate": 8.358905939114948e-07, "Full-finetune/Loss": 0.7321233749389648, "Full-finetune/Loss (Raw)": 0.790033757686615, "Full-finetune/Step": 4537, "Full-finetune/Step Time": 6.715652793645859} {"Full-finetune/Learning Rate": 8.333990412344961e-07, "Full-finetune/Loss": 0.7324141263961792, "Full-finetune/Loss (Raw)": 0.8322687745094299, "Full-finetune/Step": 4538, "Full-finetune/Step Time": 6.715330675244331} {"Full-finetune/Learning Rate": 8.30911045936369e-07, "Full-finetune/Loss": 0.731549859046936, "Full-finetune/Loss (Raw)": 0.6577791571617126, "Full-finetune/Step": 4539, "Full-finetune/Step Time": 6.7222431022673845} {"Full-finetune/Learning Rate": 8.284266089826531e-07, "Full-finetune/Loss": 0.7281496524810791, "Full-finetune/Loss (Raw)": 0.3018738031387329, "Full-finetune/Step": 4540, "Full-finetune/Step Time": 6.741817306727171} {"Full-finetune/Learning Rate": 8.259457313375097e-07, "Full-finetune/Loss": 0.7258302569389343, "Full-finetune/Loss (Raw)": 0.68837970495224, "Full-finetune/Step": 4541, "Full-finetune/Step Time": 6.763665830716491} {"Full-finetune/Learning Rate": 8.234684139637205e-07, "Full-finetune/Loss": 0.7250841856002808, "Full-finetune/Loss (Raw)": 0.6388131976127625, "Full-finetune/Step": 4542, "Full-finetune/Step Time": 6.765232253819704} {"Full-finetune/Learning Rate": 8.209946578226836e-07, "Full-finetune/Loss": 0.7244194746017456, "Full-finetune/Loss (Raw)": 0.7736909985542297, "Full-finetune/Step": 4543, "Full-finetune/Step Time": 6.759520316496491} {"Full-finetune/Learning Rate": 8.185244638744139e-07, "Full-finetune/Loss": 0.725920557975769, "Full-finetune/Loss (Raw)": 0.8680683970451355, "Full-finetune/Step": 4544, "Full-finetune/Step Time": 6.750644708052278} {"Full-finetune/Learning Rate": 8.160578330775459e-07, "Full-finetune/Loss": 0.7248727083206177, "Full-finetune/Loss (Raw)": 0.7526718974113464, "Full-finetune/Step": 4545, "Full-finetune/Step Time": 6.761313304305077} {"Full-finetune/Learning Rate": 8.135947663893329e-07, "Full-finetune/Loss": 0.7255160808563232, "Full-finetune/Loss (Raw)": 0.8559882640838623, "Full-finetune/Step": 4546, "Full-finetune/Step Time": 6.761066701263189} {"Full-finetune/Learning Rate": 8.111352647656423e-07, "Full-finetune/Loss": 0.7254860401153564, "Full-finetune/Loss (Raw)": 0.836364209651947, "Full-finetune/Step": 4547, "Full-finetune/Step Time": 6.7541369665414095} {"Full-finetune/Learning Rate": 8.086793291609562e-07, "Full-finetune/Loss": 0.7245551347732544, "Full-finetune/Loss (Raw)": 0.5633739233016968, "Full-finetune/Step": 4548, "Full-finetune/Step Time": 6.7768206391483545} {"Full-finetune/Learning Rate": 8.062269605283779e-07, "Full-finetune/Loss": 0.7233419418334961, "Full-finetune/Loss (Raw)": 0.58635413646698, "Full-finetune/Step": 4549, "Full-finetune/Step Time": 6.777246223762631} {"Full-finetune/Learning Rate": 8.037781598196225e-07, "Full-finetune/Loss": 0.7243466973304749, "Full-finetune/Loss (Raw)": 0.8922659158706665, "Full-finetune/Step": 4550, "Full-finetune/Step Time": 6.774123068898916} {"Full-finetune/Learning Rate": 8.013329279850235e-07, "Full-finetune/Loss": 0.7260728478431702, "Full-finetune/Loss (Raw)": 0.8241108059883118, "Full-finetune/Step": 4551, "Full-finetune/Step Time": 6.772017884999514} {"Full-finetune/Learning Rate": 7.988912659735249e-07, "Full-finetune/Loss": 0.7281762957572937, "Full-finetune/Loss (Raw)": 0.5981746315956116, "Full-finetune/Step": 4552, "Full-finetune/Step Time": 6.763120209798217} {"Full-finetune/Learning Rate": 7.964531747326898e-07, "Full-finetune/Loss": 0.7296807765960693, "Full-finetune/Loss (Raw)": 0.8001949787139893, "Full-finetune/Step": 4553, "Full-finetune/Step Time": 6.7429533414542675} {"Full-finetune/Learning Rate": 7.940186552086937e-07, "Full-finetune/Loss": 0.7301487922668457, "Full-finetune/Loss (Raw)": 0.8944920301437378, "Full-finetune/Step": 4554, "Full-finetune/Step Time": 6.741005590185523} {"Full-finetune/Learning Rate": 7.915877083463242e-07, "Full-finetune/Loss": 0.7317452430725098, "Full-finetune/Loss (Raw)": 0.8028321266174316, "Full-finetune/Step": 4555, "Full-finetune/Step Time": 6.740961782634258} {"Full-finetune/Learning Rate": 7.891603350889888e-07, "Full-finetune/Loss": 0.7328912019729614, "Full-finetune/Loss (Raw)": 0.9390212297439575, "Full-finetune/Step": 4556, "Full-finetune/Step Time": 6.748048782348633} {"Full-finetune/Learning Rate": 7.867365363787005e-07, "Full-finetune/Loss": 0.7321546077728271, "Full-finetune/Loss (Raw)": 0.6741223931312561, "Full-finetune/Step": 4557, "Full-finetune/Step Time": 6.749725358560681} {"Full-finetune/Learning Rate": 7.843163131560871e-07, "Full-finetune/Loss": 0.7318727374076843, "Full-finetune/Loss (Raw)": 0.5706644058227539, "Full-finetune/Step": 4558, "Full-finetune/Step Time": 6.72489332780242} {"Full-finetune/Learning Rate": 7.818996663603917e-07, "Full-finetune/Loss": 0.7331017255783081, "Full-finetune/Loss (Raw)": 0.9090188145637512, "Full-finetune/Step": 4559, "Full-finetune/Step Time": 6.7256786450743675} {"Full-finetune/Learning Rate": 7.794865969294685e-07, "Full-finetune/Loss": 0.7323390245437622, "Full-finetune/Loss (Raw)": 0.7294152975082397, "Full-finetune/Step": 4560, "Full-finetune/Step Time": 6.719530405476689} {"Full-finetune/Learning Rate": 7.770771057997828e-07, "Full-finetune/Loss": 0.7339868545532227, "Full-finetune/Loss (Raw)": 0.7946475148200989, "Full-finetune/Step": 4561, "Full-finetune/Step Time": 6.7094827108085155} {"Full-finetune/Learning Rate": 7.746711939064066e-07, "Full-finetune/Loss": 0.7338404655456543, "Full-finetune/Loss (Raw)": 0.8388212323188782, "Full-finetune/Step": 4562, "Full-finetune/Step Time": 6.708278110250831} {"Full-finetune/Learning Rate": 7.722688621830333e-07, "Full-finetune/Loss": 0.7299981117248535, "Full-finetune/Loss (Raw)": 0.30050864815711975, "Full-finetune/Step": 4563, "Full-finetune/Step Time": 6.725029043853283} {"Full-finetune/Learning Rate": 7.698701115619578e-07, "Full-finetune/Loss": 0.7310011386871338, "Full-finetune/Loss (Raw)": 0.743049681186676, "Full-finetune/Step": 4564, "Full-finetune/Step Time": 6.7088264785707} {"Full-finetune/Learning Rate": 7.674749429740868e-07, "Full-finetune/Loss": 0.7307990789413452, "Full-finetune/Loss (Raw)": 0.6892716288566589, "Full-finetune/Step": 4565, "Full-finetune/Step Time": 6.702963154762983} {"Full-finetune/Learning Rate": 7.650833573489436e-07, "Full-finetune/Loss": 0.7304916381835938, "Full-finetune/Loss (Raw)": 0.7668984532356262, "Full-finetune/Step": 4566, "Full-finetune/Step Time": 6.715328091755509} {"Full-finetune/Learning Rate": 7.626953556146521e-07, "Full-finetune/Loss": 0.7300982475280762, "Full-finetune/Loss (Raw)": 0.8740432262420654, "Full-finetune/Step": 4567, "Full-finetune/Step Time": 6.702499456703663} {"Full-finetune/Learning Rate": 7.603109386979501e-07, "Full-finetune/Loss": 0.7296305894851685, "Full-finetune/Loss (Raw)": 0.8055046796798706, "Full-finetune/Step": 4568, "Full-finetune/Step Time": 6.699341373518109} {"Full-finetune/Learning Rate": 7.579301075241808e-07, "Full-finetune/Loss": 0.7293692827224731, "Full-finetune/Loss (Raw)": 0.8421081304550171, "Full-finetune/Step": 4569, "Full-finetune/Step Time": 6.697219479829073} {"Full-finetune/Learning Rate": 7.555528630173014e-07, "Full-finetune/Loss": 0.7299938201904297, "Full-finetune/Loss (Raw)": 0.8333364725112915, "Full-finetune/Step": 4570, "Full-finetune/Step Time": 6.683654373511672} {"Full-finetune/Learning Rate": 7.531792060998766e-07, "Full-finetune/Loss": 0.7286335229873657, "Full-finetune/Loss (Raw)": 0.6215240955352783, "Full-finetune/Step": 4571, "Full-finetune/Step Time": 6.700459938496351} {"Full-finetune/Learning Rate": 7.508091376930682e-07, "Full-finetune/Loss": 0.728884756565094, "Full-finetune/Loss (Raw)": 0.7271203994750977, "Full-finetune/Step": 4572, "Full-finetune/Step Time": 6.726514032110572} {"Full-finetune/Learning Rate": 7.484426587166615e-07, "Full-finetune/Loss": 0.7287514209747314, "Full-finetune/Loss (Raw)": 0.6717222929000854, "Full-finetune/Step": 4573, "Full-finetune/Step Time": 6.740422626957297} {"Full-finetune/Learning Rate": 7.460797700890365e-07, "Full-finetune/Loss": 0.7282469868659973, "Full-finetune/Loss (Raw)": 0.7999083399772644, "Full-finetune/Step": 4574, "Full-finetune/Step Time": 6.738977747038007} {"Full-finetune/Learning Rate": 7.437204727271852e-07, "Full-finetune/Loss": 0.7278327941894531, "Full-finetune/Loss (Raw)": 0.7130618691444397, "Full-finetune/Step": 4575, "Full-finetune/Step Time": 6.752389699220657} {"Full-finetune/Learning Rate": 7.41364767546705e-07, "Full-finetune/Loss": 0.727107048034668, "Full-finetune/Loss (Raw)": 0.6812795400619507, "Full-finetune/Step": 4576, "Full-finetune/Step Time": 6.759114816784859} {"Full-finetune/Learning Rate": 7.390126554617982e-07, "Full-finetune/Loss": 0.7271779775619507, "Full-finetune/Loss (Raw)": 0.8965645432472229, "Full-finetune/Step": 4577, "Full-finetune/Step Time": 6.7614174373447895} {"Full-finetune/Learning Rate": 7.366641373852745e-07, "Full-finetune/Loss": 0.7282797694206238, "Full-finetune/Loss (Raw)": 0.8351839780807495, "Full-finetune/Step": 4578, "Full-finetune/Step Time": 6.764629350975156} {"Full-finetune/Learning Rate": 7.343192142285471e-07, "Full-finetune/Loss": 0.726669192314148, "Full-finetune/Loss (Raw)": 0.41253548860549927, "Full-finetune/Step": 4579, "Full-finetune/Step Time": 6.771396975964308} {"Full-finetune/Learning Rate": 7.319778869016358e-07, "Full-finetune/Loss": 0.7260395884513855, "Full-finetune/Loss (Raw)": 0.26281818747520447, "Full-finetune/Step": 4580, "Full-finetune/Step Time": 6.761868020519614} {"Full-finetune/Learning Rate": 7.296401563131661e-07, "Full-finetune/Loss": 0.7256313562393188, "Full-finetune/Loss (Raw)": 0.6484873294830322, "Full-finetune/Step": 4581, "Full-finetune/Step Time": 6.769928261637688} {"Full-finetune/Learning Rate": 7.273060233703599e-07, "Full-finetune/Loss": 0.7257256507873535, "Full-finetune/Loss (Raw)": 0.7360160946846008, "Full-finetune/Step": 4582, "Full-finetune/Step Time": 6.763172369450331} {"Full-finetune/Learning Rate": 7.249754889790539e-07, "Full-finetune/Loss": 0.7277151346206665, "Full-finetune/Loss (Raw)": 0.8781712055206299, "Full-finetune/Step": 4583, "Full-finetune/Step Time": 6.748911049216986} {"Full-finetune/Learning Rate": 7.2264855404368e-07, "Full-finetune/Loss": 0.7274829149246216, "Full-finetune/Loss (Raw)": 0.6990999579429626, "Full-finetune/Step": 4584, "Full-finetune/Step Time": 6.7382302191108465} {"Full-finetune/Learning Rate": 7.203252194672783e-07, "Full-finetune/Loss": 0.7273355722427368, "Full-finetune/Loss (Raw)": 0.6299829483032227, "Full-finetune/Step": 4585, "Full-finetune/Step Time": 6.7261770106852055} {"Full-finetune/Learning Rate": 7.180054861514885e-07, "Full-finetune/Loss": 0.7272582054138184, "Full-finetune/Loss (Raw)": 0.6733881235122681, "Full-finetune/Step": 4586, "Full-finetune/Step Time": 6.717604028061032} {"Full-finetune/Learning Rate": 7.156893549965538e-07, "Full-finetune/Loss": 0.7286132574081421, "Full-finetune/Loss (Raw)": 0.8706679344177246, "Full-finetune/Step": 4587, "Full-finetune/Step Time": 6.712808795273304} {"Full-finetune/Learning Rate": 7.133768269013186e-07, "Full-finetune/Loss": 0.7284038662910461, "Full-finetune/Loss (Raw)": 0.8407761454582214, "Full-finetune/Step": 4588, "Full-finetune/Step Time": 6.73603131249547} {"Full-finetune/Learning Rate": 7.110679027632295e-07, "Full-finetune/Loss": 0.7289272546768188, "Full-finetune/Loss (Raw)": 0.7542587518692017, "Full-finetune/Step": 4589, "Full-finetune/Step Time": 6.7360779251903296} {"Full-finetune/Learning Rate": 7.087625834783385e-07, "Full-finetune/Loss": 0.7285017967224121, "Full-finetune/Loss (Raw)": 0.7095559239387512, "Full-finetune/Step": 4590, "Full-finetune/Step Time": 6.725548751652241} {"Full-finetune/Learning Rate": 7.064608699412944e-07, "Full-finetune/Loss": 0.7308349609375, "Full-finetune/Loss (Raw)": 0.8209629654884338, "Full-finetune/Step": 4591, "Full-finetune/Step Time": 6.709268284961581} {"Full-finetune/Learning Rate": 7.041627630453418e-07, "Full-finetune/Loss": 0.7271531224250793, "Full-finetune/Loss (Raw)": 0.2833458185195923, "Full-finetune/Step": 4592, "Full-finetune/Step Time": 6.709049094468355} {"Full-finetune/Learning Rate": 7.018682636823371e-07, "Full-finetune/Loss": 0.7280729413032532, "Full-finetune/Loss (Raw)": 0.8322372436523438, "Full-finetune/Step": 4593, "Full-finetune/Step Time": 6.714042764157057} {"Full-finetune/Learning Rate": 6.99577372742728e-07, "Full-finetune/Loss": 0.7254327535629272, "Full-finetune/Loss (Raw)": 0.4061986207962036, "Full-finetune/Step": 4594, "Full-finetune/Step Time": 6.731717320159078} {"Full-finetune/Learning Rate": 6.972900911155656e-07, "Full-finetune/Loss": 0.7252383828163147, "Full-finetune/Loss (Raw)": 0.7954251766204834, "Full-finetune/Step": 4595, "Full-finetune/Step Time": 6.7336610946804285} {"Full-finetune/Learning Rate": 6.950064196884987e-07, "Full-finetune/Loss": 0.7252769470214844, "Full-finetune/Loss (Raw)": 0.7493916749954224, "Full-finetune/Step": 4596, "Full-finetune/Step Time": 6.741033706814051} {"Full-finetune/Learning Rate": 6.927263593477751e-07, "Full-finetune/Loss": 0.7248460054397583, "Full-finetune/Loss (Raw)": 0.7059297561645508, "Full-finetune/Step": 4597, "Full-finetune/Step Time": 6.74296186119318} {"Full-finetune/Learning Rate": 6.904499109782426e-07, "Full-finetune/Loss": 0.7248622179031372, "Full-finetune/Loss (Raw)": 0.7699063420295715, "Full-finetune/Step": 4598, "Full-finetune/Step Time": 6.740882754325867} {"Full-finetune/Learning Rate": 6.881770754633444e-07, "Full-finetune/Loss": 0.7256346940994263, "Full-finetune/Loss (Raw)": 0.7082548141479492, "Full-finetune/Step": 4599, "Full-finetune/Step Time": 6.734482251107693} {"Full-finetune/Learning Rate": 6.859078536851283e-07, "Full-finetune/Loss": 0.7253917455673218, "Full-finetune/Loss (Raw)": 0.768447756767273, "Full-finetune/Step": 4600, "Full-finetune/Step Time": 6.738072495907545} {"Full-finetune/Learning Rate": 6.836422465242298e-07, "Full-finetune/Loss": 0.7229197025299072, "Full-finetune/Loss (Raw)": 0.665191650390625, "Full-finetune/Step": 4601, "Full-finetune/Step Time": 6.7429560255259275} {"Full-finetune/Learning Rate": 6.81380254859888e-07, "Full-finetune/Loss": 0.7241159081459045, "Full-finetune/Loss (Raw)": 0.9774568676948547, "Full-finetune/Step": 4602, "Full-finetune/Step Time": 6.743790669366717} {"Full-finetune/Learning Rate": 6.791218795699406e-07, "Full-finetune/Loss": 0.723929762840271, "Full-finetune/Loss (Raw)": 0.6498379707336426, "Full-finetune/Step": 4603, "Full-finetune/Step Time": 6.735572958365083} {"Full-finetune/Learning Rate": 6.768671215308165e-07, "Full-finetune/Loss": 0.7236617803573608, "Full-finetune/Loss (Raw)": 0.8134335875511169, "Full-finetune/Step": 4604, "Full-finetune/Step Time": 6.728625528514385} {"Full-finetune/Learning Rate": 6.746159816175435e-07, "Full-finetune/Loss": 0.7206778526306152, "Full-finetune/Loss (Raw)": 0.3234732151031494, "Full-finetune/Step": 4605, "Full-finetune/Step Time": 6.746068125590682} {"Full-finetune/Learning Rate": 6.723684607037451e-07, "Full-finetune/Loss": 0.7204592227935791, "Full-finetune/Loss (Raw)": 0.8213748335838318, "Full-finetune/Step": 4606, "Full-finetune/Step Time": 6.753675207495689} {"Full-finetune/Learning Rate": 6.701245596616402e-07, "Full-finetune/Loss": 0.7199947237968445, "Full-finetune/Loss (Raw)": 0.7331840991973877, "Full-finetune/Step": 4607, "Full-finetune/Step Time": 6.744547059759498} {"Full-finetune/Learning Rate": 6.678842793620433e-07, "Full-finetune/Loss": 0.720880389213562, "Full-finetune/Loss (Raw)": 0.764722466468811, "Full-finetune/Step": 4608, "Full-finetune/Step Time": 6.739758083596826} {"Full-finetune/Learning Rate": 6.656476206743623e-07, "Full-finetune/Loss": 0.7227937579154968, "Full-finetune/Loss (Raw)": 0.9502493143081665, "Full-finetune/Step": 4609, "Full-finetune/Step Time": 6.737235391512513} {"Full-finetune/Learning Rate": 6.634145844666051e-07, "Full-finetune/Loss": 0.722979724407196, "Full-finetune/Loss (Raw)": 0.721346378326416, "Full-finetune/Step": 4610, "Full-finetune/Step Time": 6.719079118221998} {"Full-finetune/Learning Rate": 6.611851716053641e-07, "Full-finetune/Loss": 0.7189927101135254, "Full-finetune/Loss (Raw)": 0.2823134958744049, "Full-finetune/Step": 4611, "Full-finetune/Step Time": 6.736521136015654} {"Full-finetune/Learning Rate": 6.589593829558316e-07, "Full-finetune/Loss": 0.7182576060295105, "Full-finetune/Loss (Raw)": 0.7810468077659607, "Full-finetune/Step": 4612, "Full-finetune/Step Time": 6.717053635045886} {"Full-finetune/Learning Rate": 6.567372193817967e-07, "Full-finetune/Loss": 0.7172906398773193, "Full-finetune/Loss (Raw)": 0.6288370490074158, "Full-finetune/Step": 4613, "Full-finetune/Step Time": 6.7408241499215364} {"Full-finetune/Learning Rate": 6.545186817456339e-07, "Full-finetune/Loss": 0.717036783695221, "Full-finetune/Loss (Raw)": 0.6989867687225342, "Full-finetune/Step": 4614, "Full-finetune/Step Time": 6.74733324162662} {"Full-finetune/Learning Rate": 6.523037709083158e-07, "Full-finetune/Loss": 0.7214827537536621, "Full-finetune/Loss (Raw)": 0.8889703750610352, "Full-finetune/Step": 4615, "Full-finetune/Step Time": 6.727143639698625} {"Full-finetune/Learning Rate": 6.500924877294057e-07, "Full-finetune/Loss": 0.7211184501647949, "Full-finetune/Loss (Raw)": 0.7390009164810181, "Full-finetune/Step": 4616, "Full-finetune/Step Time": 6.71816716901958} {"Full-finetune/Learning Rate": 6.478848330670607e-07, "Full-finetune/Loss": 0.7225993871688843, "Full-finetune/Loss (Raw)": 0.6627048850059509, "Full-finetune/Step": 4617, "Full-finetune/Step Time": 6.709344206377864} {"Full-finetune/Learning Rate": 6.456808077780263e-07, "Full-finetune/Loss": 0.7240074276924133, "Full-finetune/Loss (Raw)": 0.8367302417755127, "Full-finetune/Step": 4618, "Full-finetune/Step Time": 6.71039698459208} {"Full-finetune/Learning Rate": 6.434804127176409e-07, "Full-finetune/Loss": 0.7251802682876587, "Full-finetune/Loss (Raw)": 0.8850887417793274, "Full-finetune/Step": 4619, "Full-finetune/Step Time": 6.711649347096682} {"Full-finetune/Learning Rate": 6.4128364873984e-07, "Full-finetune/Loss": 0.7244576215744019, "Full-finetune/Loss (Raw)": 0.7197380065917969, "Full-finetune/Step": 4620, "Full-finetune/Step Time": 6.71490940824151} {"Full-finetune/Learning Rate": 6.390905166971406e-07, "Full-finetune/Loss": 0.7256395816802979, "Full-finetune/Loss (Raw)": 0.8727121353149414, "Full-finetune/Step": 4621, "Full-finetune/Step Time": 6.7047572415322065} {"Full-finetune/Learning Rate": 6.369010174406531e-07, "Full-finetune/Loss": 0.7274004817008972, "Full-finetune/Loss (Raw)": 0.8116551041603088, "Full-finetune/Step": 4622, "Full-finetune/Step Time": 6.711906671524048} {"Full-finetune/Learning Rate": 6.347151518200834e-07, "Full-finetune/Loss": 0.7280948758125305, "Full-finetune/Loss (Raw)": 0.8598251342773438, "Full-finetune/Step": 4623, "Full-finetune/Step Time": 6.708415212109685} {"Full-finetune/Learning Rate": 6.325329206837217e-07, "Full-finetune/Loss": 0.7283667325973511, "Full-finetune/Loss (Raw)": 0.728710949420929, "Full-finetune/Step": 4624, "Full-finetune/Step Time": 6.700258268043399} {"Full-finetune/Learning Rate": 6.303543248784483e-07, "Full-finetune/Loss": 0.728857696056366, "Full-finetune/Loss (Raw)": 0.8389284610748291, "Full-finetune/Step": 4625, "Full-finetune/Step Time": 6.700883937999606} {"Full-finetune/Learning Rate": 6.281793652497359e-07, "Full-finetune/Loss": 0.7262528538703918, "Full-finetune/Loss (Raw)": 0.3423186242580414, "Full-finetune/Step": 4626, "Full-finetune/Step Time": 6.713724719360471} {"Full-finetune/Learning Rate": 6.260080426416415e-07, "Full-finetune/Loss": 0.725406289100647, "Full-finetune/Loss (Raw)": 0.7562797665596008, "Full-finetune/Step": 4627, "Full-finetune/Step Time": 6.72297590970993} {"Full-finetune/Learning Rate": 6.238403578968144e-07, "Full-finetune/Loss": 0.7250564098358154, "Full-finetune/Loss (Raw)": 0.6547666788101196, "Full-finetune/Step": 4628, "Full-finetune/Step Time": 6.725936716422439} {"Full-finetune/Learning Rate": 6.216763118564883e-07, "Full-finetune/Loss": 0.7240025401115417, "Full-finetune/Loss (Raw)": 0.7388970851898193, "Full-finetune/Step": 4629, "Full-finetune/Step Time": 6.723749710246921} {"Full-finetune/Learning Rate": 6.195159053604926e-07, "Full-finetune/Loss": 0.7241361141204834, "Full-finetune/Loss (Raw)": 0.6709544062614441, "Full-finetune/Step": 4630, "Full-finetune/Step Time": 6.731917085126042} {"Full-finetune/Learning Rate": 6.173591392472334e-07, "Full-finetune/Loss": 0.7219028472900391, "Full-finetune/Loss (Raw)": 0.5636391043663025, "Full-finetune/Step": 4631, "Full-finetune/Step Time": 6.750589467585087} {"Full-finetune/Learning Rate": 6.152060143537109e-07, "Full-finetune/Loss": 0.7180477380752563, "Full-finetune/Loss (Raw)": 0.26460468769073486, "Full-finetune/Step": 4632, "Full-finetune/Step Time": 6.752955378964543} {"Full-finetune/Learning Rate": 6.130565315155124e-07, "Full-finetune/Loss": 0.7166796922683716, "Full-finetune/Loss (Raw)": 0.570814847946167, "Full-finetune/Step": 4633, "Full-finetune/Step Time": 6.775041125714779} {"Full-finetune/Learning Rate": 6.109106915668106e-07, "Full-finetune/Loss": 0.7159546613693237, "Full-finetune/Loss (Raw)": 0.8572998046875, "Full-finetune/Step": 4634, "Full-finetune/Step Time": 6.782644547522068} {"Full-finetune/Learning Rate": 6.087684953403616e-07, "Full-finetune/Loss": 0.7178981304168701, "Full-finetune/Loss (Raw)": 0.5581388473510742, "Full-finetune/Step": 4635, "Full-finetune/Step Time": 6.7934958059340715} {"Full-finetune/Learning Rate": 6.066299436675117e-07, "Full-finetune/Loss": 0.7181829214096069, "Full-finetune/Loss (Raw)": 0.7852376103401184, "Full-finetune/Step": 4636, "Full-finetune/Step Time": 6.79574822075665} {"Full-finetune/Learning Rate": 6.04495037378191e-07, "Full-finetune/Loss": 0.7192648649215698, "Full-finetune/Loss (Raw)": 0.8480718731880188, "Full-finetune/Step": 4637, "Full-finetune/Step Time": 6.789532259106636} {"Full-finetune/Learning Rate": 6.023637773009139e-07, "Full-finetune/Loss": 0.7204310894012451, "Full-finetune/Loss (Raw)": 0.9909065961837769, "Full-finetune/Step": 4638, "Full-finetune/Step Time": 6.793938871473074} {"Full-finetune/Learning Rate": 6.002361642627807e-07, "Full-finetune/Loss": 0.7177248597145081, "Full-finetune/Loss (Raw)": 0.5931854844093323, "Full-finetune/Step": 4639, "Full-finetune/Step Time": 6.807885069400072} {"Full-finetune/Learning Rate": 5.981121990894789e-07, "Full-finetune/Loss": 0.721693754196167, "Full-finetune/Loss (Raw)": 0.8574556112289429, "Full-finetune/Step": 4640, "Full-finetune/Step Time": 6.7961566764861345} {"Full-finetune/Learning Rate": 5.959918826052757e-07, "Full-finetune/Loss": 0.7218137383460999, "Full-finetune/Loss (Raw)": 0.786429226398468, "Full-finetune/Step": 4641, "Full-finetune/Step Time": 6.79353273101151} {"Full-finetune/Learning Rate": 5.938752156330241e-07, "Full-finetune/Loss": 0.7228844165802002, "Full-finetune/Loss (Raw)": 0.7949089407920837, "Full-finetune/Step": 4642, "Full-finetune/Step Time": 6.795078845694661} {"Full-finetune/Learning Rate": 5.917621989941624e-07, "Full-finetune/Loss": 0.7237615585327148, "Full-finetune/Loss (Raw)": 0.8723900318145752, "Full-finetune/Step": 4643, "Full-finetune/Step Time": 6.7921585235744715} {"Full-finetune/Learning Rate": 5.896528335087137e-07, "Full-finetune/Loss": 0.7218970060348511, "Full-finetune/Loss (Raw)": 0.3690636456012726, "Full-finetune/Step": 4644, "Full-finetune/Step Time": 6.811613751575351} {"Full-finetune/Learning Rate": 5.875471199952754e-07, "Full-finetune/Loss": 0.723129391670227, "Full-finetune/Loss (Raw)": 0.8140600919723511, "Full-finetune/Step": 4645, "Full-finetune/Step Time": 6.79937619715929} {"Full-finetune/Learning Rate": 5.854450592710382e-07, "Full-finetune/Loss": 0.7207733392715454, "Full-finetune/Loss (Raw)": 0.6133209466934204, "Full-finetune/Step": 4646, "Full-finetune/Step Time": 6.812748974189162} {"Full-finetune/Learning Rate": 5.833466521517695e-07, "Full-finetune/Loss": 0.7200966477394104, "Full-finetune/Loss (Raw)": 0.7925460934638977, "Full-finetune/Step": 4647, "Full-finetune/Step Time": 6.8074547983706} {"Full-finetune/Learning Rate": 5.812518994518213e-07, "Full-finetune/Loss": 0.71909099817276, "Full-finetune/Loss (Raw)": 0.7282606363296509, "Full-finetune/Step": 4648, "Full-finetune/Step Time": 6.811950387433171} {"Full-finetune/Learning Rate": 5.791608019841244e-07, "Full-finetune/Loss": 0.7187029123306274, "Full-finetune/Loss (Raw)": 0.8447415828704834, "Full-finetune/Step": 4649, "Full-finetune/Step Time": 6.809088239446282} {"Full-finetune/Learning Rate": 5.770733605601953e-07, "Full-finetune/Loss": 0.7180384993553162, "Full-finetune/Loss (Raw)": 0.6303303241729736, "Full-finetune/Step": 4650, "Full-finetune/Step Time": 6.817358698695898} {"Full-finetune/Learning Rate": 5.74989575990127e-07, "Full-finetune/Loss": 0.718051016330719, "Full-finetune/Loss (Raw)": 0.7879148721694946, "Full-finetune/Step": 4651, "Full-finetune/Step Time": 6.810852982103825} {"Full-finetune/Learning Rate": 5.729094490825948e-07, "Full-finetune/Loss": 0.7176931500434875, "Full-finetune/Loss (Raw)": 0.7592521905899048, "Full-finetune/Step": 4652, "Full-finetune/Step Time": 6.809202920645475} {"Full-finetune/Learning Rate": 5.708329806448587e-07, "Full-finetune/Loss": 0.7139718532562256, "Full-finetune/Loss (Raw)": 0.2966669797897339, "Full-finetune/Step": 4653, "Full-finetune/Step Time": 6.825553713366389} {"Full-finetune/Learning Rate": 5.687601714827551e-07, "Full-finetune/Loss": 0.7153213024139404, "Full-finetune/Loss (Raw)": 0.7308654189109802, "Full-finetune/Step": 4654, "Full-finetune/Step Time": 6.830757105723023} {"Full-finetune/Learning Rate": 5.666910224006971e-07, "Full-finetune/Loss": 0.7167536020278931, "Full-finetune/Loss (Raw)": 0.6181446313858032, "Full-finetune/Step": 4655, "Full-finetune/Step Time": 6.81554445810616} {"Full-finetune/Learning Rate": 5.646255342016848e-07, "Full-finetune/Loss": 0.7145085334777832, "Full-finetune/Loss (Raw)": 0.42893800139427185, "Full-finetune/Step": 4656, "Full-finetune/Step Time": 6.8454804215580225} {"Full-finetune/Learning Rate": 5.625637076872914e-07, "Full-finetune/Loss": 0.7140052318572998, "Full-finetune/Loss (Raw)": 0.7314744591712952, "Full-finetune/Step": 4657, "Full-finetune/Step Time": 6.8432827685028315} {"Full-finetune/Learning Rate": 5.605055436576746e-07, "Full-finetune/Loss": 0.7137194275856018, "Full-finetune/Loss (Raw)": 0.8330939412117004, "Full-finetune/Step": 4658, "Full-finetune/Step Time": 6.838785840198398} {"Full-finetune/Learning Rate": 5.584510429115641e-07, "Full-finetune/Loss": 0.7134059071540833, "Full-finetune/Loss (Raw)": 0.8543224930763245, "Full-finetune/Step": 4659, "Full-finetune/Step Time": 6.836572881788015} {"Full-finetune/Learning Rate": 5.564002062462737e-07, "Full-finetune/Loss": 0.7151689529418945, "Full-finetune/Loss (Raw)": 0.8332439661026001, "Full-finetune/Step": 4660, "Full-finetune/Step Time": 6.843141032382846} {"Full-finetune/Learning Rate": 5.54353034457693e-07, "Full-finetune/Loss": 0.7141183614730835, "Full-finetune/Loss (Raw)": 0.6659143567085266, "Full-finetune/Step": 4661, "Full-finetune/Step Time": 6.84512173011899} {"Full-finetune/Learning Rate": 5.523095283402868e-07, "Full-finetune/Loss": 0.7180819511413574, "Full-finetune/Loss (Raw)": 0.8384981751441956, "Full-finetune/Step": 4662, "Full-finetune/Step Time": 6.826192574575543} {"Full-finetune/Learning Rate": 5.502696886871039e-07, "Full-finetune/Loss": 0.7194000482559204, "Full-finetune/Loss (Raw)": 0.8103407025337219, "Full-finetune/Step": 4663, "Full-finetune/Step Time": 6.815190194174647} {"Full-finetune/Learning Rate": 5.482335162897657e-07, "Full-finetune/Loss": 0.7194450497627258, "Full-finetune/Loss (Raw)": 0.7757728695869446, "Full-finetune/Step": 4664, "Full-finetune/Step Time": 6.803159981966019} {"Full-finetune/Learning Rate": 5.462010119384665e-07, "Full-finetune/Loss": 0.7186698913574219, "Full-finetune/Loss (Raw)": 0.690804660320282, "Full-finetune/Step": 4665, "Full-finetune/Step Time": 6.803444126620889} {"Full-finetune/Learning Rate": 5.441721764219853e-07, "Full-finetune/Loss": 0.7166029810905457, "Full-finetune/Loss (Raw)": 0.5677090287208557, "Full-finetune/Step": 4666, "Full-finetune/Step Time": 6.821716628968716} {"Full-finetune/Learning Rate": 5.42147010527675e-07, "Full-finetune/Loss": 0.7179248929023743, "Full-finetune/Loss (Raw)": 0.8269895315170288, "Full-finetune/Step": 4667, "Full-finetune/Step Time": 6.809647353366017} {"Full-finetune/Learning Rate": 5.401255150414598e-07, "Full-finetune/Loss": 0.7212669849395752, "Full-finetune/Loss (Raw)": 0.7296515703201294, "Full-finetune/Step": 4668, "Full-finetune/Step Time": 6.800927933305502} {"Full-finetune/Learning Rate": 5.381076907478433e-07, "Full-finetune/Loss": 0.7185986042022705, "Full-finetune/Loss (Raw)": 0.3468283712863922, "Full-finetune/Step": 4669, "Full-finetune/Step Time": 6.799590468406677} {"Full-finetune/Learning Rate": 5.360935384299049e-07, "Full-finetune/Loss": 0.7198142409324646, "Full-finetune/Loss (Raw)": 0.7944204211235046, "Full-finetune/Step": 4670, "Full-finetune/Step Time": 6.79832549393177} {"Full-finetune/Learning Rate": 5.34083058869297e-07, "Full-finetune/Loss": 0.7192484140396118, "Full-finetune/Loss (Raw)": 0.7012600302696228, "Full-finetune/Step": 4671, "Full-finetune/Step Time": 6.793532425537705} {"Full-finetune/Learning Rate": 5.320762528462453e-07, "Full-finetune/Loss": 0.718862771987915, "Full-finetune/Loss (Raw)": 0.8187007308006287, "Full-finetune/Step": 4672, "Full-finetune/Step Time": 6.807630022987723} {"Full-finetune/Learning Rate": 5.30073121139556e-07, "Full-finetune/Loss": 0.7191272377967834, "Full-finetune/Loss (Raw)": 0.7865297198295593, "Full-finetune/Step": 4673, "Full-finetune/Step Time": 6.797059044241905} {"Full-finetune/Learning Rate": 5.28073664526606e-07, "Full-finetune/Loss": 0.7191327214241028, "Full-finetune/Loss (Raw)": 0.8566904664039612, "Full-finetune/Step": 4674, "Full-finetune/Step Time": 6.8201940059661865} {"Full-finetune/Learning Rate": 5.260778837833391e-07, "Full-finetune/Loss": 0.7191063761711121, "Full-finetune/Loss (Raw)": 0.8329941630363464, "Full-finetune/Step": 4675, "Full-finetune/Step Time": 6.822477288544178} {"Full-finetune/Learning Rate": 5.240857796842846e-07, "Full-finetune/Loss": 0.7204257249832153, "Full-finetune/Loss (Raw)": 0.7322462797164917, "Full-finetune/Step": 4676, "Full-finetune/Step Time": 6.793995464220643} {"Full-finetune/Learning Rate": 5.220973530025375e-07, "Full-finetune/Loss": 0.7224004864692688, "Full-finetune/Loss (Raw)": 0.8391278982162476, "Full-finetune/Step": 4677, "Full-finetune/Step Time": 6.7842960730195045} {"Full-finetune/Learning Rate": 5.201126045097671e-07, "Full-finetune/Loss": 0.7213440537452698, "Full-finetune/Loss (Raw)": 0.7570422887802124, "Full-finetune/Step": 4678, "Full-finetune/Step Time": 6.808823259547353} {"Full-finetune/Learning Rate": 5.181315349762162e-07, "Full-finetune/Loss": 0.7197530269622803, "Full-finetune/Loss (Raw)": 0.6204560399055481, "Full-finetune/Step": 4679, "Full-finetune/Step Time": 6.808409990742803} {"Full-finetune/Learning Rate": 5.161541451706975e-07, "Full-finetune/Loss": 0.7219604253768921, "Full-finetune/Loss (Raw)": 0.8807277083396912, "Full-finetune/Step": 4680, "Full-finetune/Step Time": 6.811008673161268} {"Full-finetune/Learning Rate": 5.141804358605995e-07, "Full-finetune/Loss": 0.721528172492981, "Full-finetune/Loss (Raw)": 0.7448585033416748, "Full-finetune/Step": 4681, "Full-finetune/Step Time": 6.827656801789999} {"Full-finetune/Learning Rate": 5.122104078118773e-07, "Full-finetune/Loss": 0.7201871871948242, "Full-finetune/Loss (Raw)": 0.7228482961654663, "Full-finetune/Step": 4682, "Full-finetune/Step Time": 6.838610149919987} {"Full-finetune/Learning Rate": 5.102440617890658e-07, "Full-finetune/Loss": 0.7199484705924988, "Full-finetune/Loss (Raw)": 0.7722799777984619, "Full-finetune/Step": 4683, "Full-finetune/Step Time": 6.823186673223972} {"Full-finetune/Learning Rate": 5.082813985552604e-07, "Full-finetune/Loss": 0.7194300293922424, "Full-finetune/Loss (Raw)": 0.8726574778556824, "Full-finetune/Step": 4684, "Full-finetune/Step Time": 6.821796404197812} {"Full-finetune/Learning Rate": 5.063224188721327e-07, "Full-finetune/Loss": 0.7208069562911987, "Full-finetune/Loss (Raw)": 0.8503739833831787, "Full-finetune/Step": 4685, "Full-finetune/Step Time": 6.824759494513273} {"Full-finetune/Learning Rate": 5.043671234999271e-07, "Full-finetune/Loss": 0.7214215993881226, "Full-finetune/Loss (Raw)": 0.649338960647583, "Full-finetune/Step": 4686, "Full-finetune/Step Time": 6.822520732879639} {"Full-finetune/Learning Rate": 5.02415513197454e-07, "Full-finetune/Loss": 0.7204947471618652, "Full-finetune/Loss (Raw)": 0.7903807163238525, "Full-finetune/Step": 4687, "Full-finetune/Step Time": 6.813639920204878} {"Full-finetune/Learning Rate": 5.004675887220978e-07, "Full-finetune/Loss": 0.7228026390075684, "Full-finetune/Loss (Raw)": 1.0248184204101562, "Full-finetune/Step": 4688, "Full-finetune/Step Time": 6.811866290867329} {"Full-finetune/Learning Rate": 4.985233508298037e-07, "Full-finetune/Loss": 0.7234025001525879, "Full-finetune/Loss (Raw)": 0.8714379072189331, "Full-finetune/Step": 4689, "Full-finetune/Step Time": 6.802868394181132} {"Full-finetune/Learning Rate": 4.965828002750994e-07, "Full-finetune/Loss": 0.7218618392944336, "Full-finetune/Loss (Raw)": 0.6416139602661133, "Full-finetune/Step": 4690, "Full-finetune/Step Time": 6.826538980007172} {"Full-finetune/Learning Rate": 4.946459378110701e-07, "Full-finetune/Loss": 0.7264793515205383, "Full-finetune/Loss (Raw)": 0.8915498852729797, "Full-finetune/Step": 4691, "Full-finetune/Step Time": 6.809561226516962} {"Full-finetune/Learning Rate": 4.927127641893759e-07, "Full-finetune/Loss": 0.7279784083366394, "Full-finetune/Loss (Raw)": 0.9349275231361389, "Full-finetune/Step": 4692, "Full-finetune/Step Time": 6.820359606295824} {"Full-finetune/Learning Rate": 4.907832801602452e-07, "Full-finetune/Loss": 0.7286316156387329, "Full-finetune/Loss (Raw)": 0.7728877663612366, "Full-finetune/Step": 4693, "Full-finetune/Step Time": 6.830993067473173} {"Full-finetune/Learning Rate": 4.888574864724715e-07, "Full-finetune/Loss": 0.7295123338699341, "Full-finetune/Loss (Raw)": 0.8796309232711792, "Full-finetune/Step": 4694, "Full-finetune/Step Time": 6.8148877415806055} {"Full-finetune/Learning Rate": 4.869353838734169e-07, "Full-finetune/Loss": 0.7289634943008423, "Full-finetune/Loss (Raw)": 0.8037862181663513, "Full-finetune/Step": 4695, "Full-finetune/Step Time": 6.819920903071761} {"Full-finetune/Learning Rate": 4.850169731090127e-07, "Full-finetune/Loss": 0.727916955947876, "Full-finetune/Loss (Raw)": 0.6715525388717651, "Full-finetune/Step": 4696, "Full-finetune/Step Time": 6.830358674749732} {"Full-finetune/Learning Rate": 4.831022549237574e-07, "Full-finetune/Loss": 0.7272427678108215, "Full-finetune/Loss (Raw)": 0.7558099031448364, "Full-finetune/Step": 4697, "Full-finetune/Step Time": 6.825137222185731} {"Full-finetune/Learning Rate": 4.811912300607169e-07, "Full-finetune/Loss": 0.7274343967437744, "Full-finetune/Loss (Raw)": 0.8578574061393738, "Full-finetune/Step": 4698, "Full-finetune/Step Time": 6.829467747360468} {"Full-finetune/Learning Rate": 4.792838992615179e-07, "Full-finetune/Loss": 0.7294607162475586, "Full-finetune/Loss (Raw)": 0.880893886089325, "Full-finetune/Step": 4699, "Full-finetune/Step Time": 6.824444379657507} {"Full-finetune/Learning Rate": 4.773802632663627e-07, "Full-finetune/Loss": 0.7298436760902405, "Full-finetune/Loss (Raw)": 0.776142418384552, "Full-finetune/Step": 4700, "Full-finetune/Step Time": 6.799410965293646} {"Full-finetune/Learning Rate": 4.7548032281401367e-07, "Full-finetune/Loss": 0.7309547662734985, "Full-finetune/Loss (Raw)": 0.81394362449646, "Full-finetune/Step": 4701, "Full-finetune/Step Time": 6.788314465433359} {"Full-finetune/Learning Rate": 4.735840786418011e-07, "Full-finetune/Loss": 0.7305346727371216, "Full-finetune/Loss (Raw)": 0.7461352944374084, "Full-finetune/Step": 4702, "Full-finetune/Step Time": 6.780266048386693} {"Full-finetune/Learning Rate": 4.716915314856196e-07, "Full-finetune/Loss": 0.7319310903549194, "Full-finetune/Loss (Raw)": 0.8918035626411438, "Full-finetune/Step": 4703, "Full-finetune/Step Time": 6.763255724683404} {"Full-finetune/Learning Rate": 4.698026820799306e-07, "Full-finetune/Loss": 0.7317894101142883, "Full-finetune/Loss (Raw)": 0.6631495356559753, "Full-finetune/Step": 4704, "Full-finetune/Step Time": 6.758166896179318} {"Full-finetune/Learning Rate": 4.6791753115775884e-07, "Full-finetune/Loss": 0.7316305041313171, "Full-finetune/Loss (Raw)": 0.8762187361717224, "Full-finetune/Step": 4705, "Full-finetune/Step Time": 6.759446585550904} {"Full-finetune/Learning Rate": 4.660360794506946e-07, "Full-finetune/Loss": 0.7307212352752686, "Full-finetune/Loss (Raw)": 0.7187938094139099, "Full-finetune/Step": 4706, "Full-finetune/Step Time": 6.753011789172888} {"Full-finetune/Learning Rate": 4.641583276888939e-07, "Full-finetune/Loss": 0.7328363656997681, "Full-finetune/Loss (Raw)": 0.6832760572433472, "Full-finetune/Step": 4707, "Full-finetune/Step Time": 6.736684603616595} {"Full-finetune/Learning Rate": 4.622842766010749e-07, "Full-finetune/Loss": 0.7361249923706055, "Full-finetune/Loss (Raw)": 0.6837664246559143, "Full-finetune/Step": 4708, "Full-finetune/Step Time": 6.718202020972967} {"Full-finetune/Learning Rate": 4.604139269145191e-07, "Full-finetune/Loss": 0.7362494468688965, "Full-finetune/Loss (Raw)": 0.6644195914268494, "Full-finetune/Step": 4709, "Full-finetune/Step Time": 6.723023658618331} {"Full-finetune/Learning Rate": 4.585472793550738e-07, "Full-finetune/Loss": 0.7378501296043396, "Full-finetune/Loss (Raw)": 0.9409023523330688, "Full-finetune/Step": 4710, "Full-finetune/Step Time": 6.7135827746242285} {"Full-finetune/Learning Rate": 4.5668433464714835e-07, "Full-finetune/Loss": 0.736993134021759, "Full-finetune/Loss (Raw)": 0.7684730291366577, "Full-finetune/Step": 4711, "Full-finetune/Step Time": 6.714547263458371} {"Full-finetune/Learning Rate": 4.548250935137144e-07, "Full-finetune/Loss": 0.7370314598083496, "Full-finetune/Loss (Raw)": 0.7040044665336609, "Full-finetune/Step": 4712, "Full-finetune/Step Time": 6.72792648896575} {"Full-finetune/Learning Rate": 4.5296955667630926e-07, "Full-finetune/Loss": 0.7386384010314941, "Full-finetune/Loss (Raw)": 0.8356765508651733, "Full-finetune/Step": 4713, "Full-finetune/Step Time": 6.731134183704853} {"Full-finetune/Learning Rate": 4.51117724855028e-07, "Full-finetune/Loss": 0.7392110824584961, "Full-finetune/Loss (Raw)": 0.7466892004013062, "Full-finetune/Step": 4714, "Full-finetune/Step Time": 6.734250048175454} {"Full-finetune/Learning Rate": 4.492695987685314e-07, "Full-finetune/Loss": 0.7385572791099548, "Full-finetune/Loss (Raw)": 0.7869795560836792, "Full-finetune/Step": 4715, "Full-finetune/Step Time": 6.73701805062592} {"Full-finetune/Learning Rate": 4.474251791340412e-07, "Full-finetune/Loss": 0.737788200378418, "Full-finetune/Loss (Raw)": 0.7423272132873535, "Full-finetune/Step": 4716, "Full-finetune/Step Time": 6.7140266969799995} {"Full-finetune/Learning Rate": 4.4558446666734147e-07, "Full-finetune/Loss": 0.7382218837738037, "Full-finetune/Loss (Raw)": 0.8097751140594482, "Full-finetune/Step": 4717, "Full-finetune/Step Time": 6.711557501927018} {"Full-finetune/Learning Rate": 4.437474620827764e-07, "Full-finetune/Loss": 0.7370482683181763, "Full-finetune/Loss (Raw)": 0.5593400001525879, "Full-finetune/Step": 4718, "Full-finetune/Step Time": 6.725675126537681} {"Full-finetune/Learning Rate": 4.419141660932491e-07, "Full-finetune/Loss": 0.7356722354888916, "Full-finetune/Loss (Raw)": 0.6448268890380859, "Full-finetune/Step": 4719, "Full-finetune/Step Time": 6.7257131934165955} {"Full-finetune/Learning Rate": 4.4008457941022933e-07, "Full-finetune/Loss": 0.7371380925178528, "Full-finetune/Loss (Raw)": 0.4709751009941101, "Full-finetune/Step": 4720, "Full-finetune/Step Time": 6.742776531726122} {"Full-finetune/Learning Rate": 4.382587027437435e-07, "Full-finetune/Loss": 0.7352915406227112, "Full-finetune/Loss (Raw)": 0.5958731770515442, "Full-finetune/Step": 4721, "Full-finetune/Step Time": 6.746861910447478} {"Full-finetune/Learning Rate": 4.364365368023771e-07, "Full-finetune/Loss": 0.7374585866928101, "Full-finetune/Loss (Raw)": 0.6835858225822449, "Full-finetune/Step": 4722, "Full-finetune/Step Time": 6.730750992894173} {"Full-finetune/Learning Rate": 4.3461808229327773e-07, "Full-finetune/Loss": 0.7372823357582092, "Full-finetune/Loss (Raw)": 0.7728622555732727, "Full-finetune/Step": 4723, "Full-finetune/Step Time": 6.72936219163239} {"Full-finetune/Learning Rate": 4.3280333992215206e-07, "Full-finetune/Loss": 0.7363548278808594, "Full-finetune/Loss (Raw)": 0.6306750178337097, "Full-finetune/Step": 4724, "Full-finetune/Step Time": 6.75095945969224} {"Full-finetune/Learning Rate": 4.3099231039326785e-07, "Full-finetune/Loss": 0.7363667488098145, "Full-finetune/Loss (Raw)": 0.707450807094574, "Full-finetune/Step": 4725, "Full-finetune/Step Time": 6.7536312751472} {"Full-finetune/Learning Rate": 4.291849944094462e-07, "Full-finetune/Loss": 0.7356754541397095, "Full-finetune/Loss (Raw)": 0.6814199686050415, "Full-finetune/Step": 4726, "Full-finetune/Step Time": 6.766792930662632} {"Full-finetune/Learning Rate": 4.273813926720771e-07, "Full-finetune/Loss": 0.7356963753700256, "Full-finetune/Loss (Raw)": 0.7109329700469971, "Full-finetune/Step": 4727, "Full-finetune/Step Time": 6.774440262466669} {"Full-finetune/Learning Rate": 4.2558150588109747e-07, "Full-finetune/Loss": 0.7352311611175537, "Full-finetune/Loss (Raw)": 0.7088959813117981, "Full-finetune/Step": 4728, "Full-finetune/Step Time": 6.777279499918222} {"Full-finetune/Learning Rate": 4.237853347350107e-07, "Full-finetune/Loss": 0.7379993200302124, "Full-finetune/Loss (Raw)": 1.0195204019546509, "Full-finetune/Step": 4729, "Full-finetune/Step Time": 6.773902494460344} {"Full-finetune/Learning Rate": 4.219928799308759e-07, "Full-finetune/Loss": 0.7364298701286316, "Full-finetune/Loss (Raw)": 0.7765695452690125, "Full-finetune/Step": 4730, "Full-finetune/Step Time": 6.769714646041393} {"Full-finetune/Learning Rate": 4.2020414216431106e-07, "Full-finetune/Loss": 0.7362567186355591, "Full-finetune/Loss (Raw)": 0.6276721358299255, "Full-finetune/Step": 4731, "Full-finetune/Step Time": 6.768771894276142} {"Full-finetune/Learning Rate": 4.184191221294875e-07, "Full-finetune/Loss": 0.7360734343528748, "Full-finetune/Loss (Raw)": 0.7899748682975769, "Full-finetune/Step": 4732, "Full-finetune/Step Time": 6.77902140840888} {"Full-finetune/Learning Rate": 4.16637820519139e-07, "Full-finetune/Loss": 0.740172266960144, "Full-finetune/Loss (Raw)": 0.8481239080429077, "Full-finetune/Step": 4733, "Full-finetune/Step Time": 6.756094604730606} {"Full-finetune/Learning Rate": 4.1486023802455253e-07, "Full-finetune/Loss": 0.7390784025192261, "Full-finetune/Loss (Raw)": 0.6813595294952393, "Full-finetune/Step": 4734, "Full-finetune/Step Time": 6.762596894055605} {"Full-finetune/Learning Rate": 4.1308637533557294e-07, "Full-finetune/Loss": 0.7400546073913574, "Full-finetune/Loss (Raw)": 0.8581411242485046, "Full-finetune/Step": 4735, "Full-finetune/Step Time": 6.763733945786953} {"Full-finetune/Learning Rate": 4.1131623314060175e-07, "Full-finetune/Loss": 0.7386407852172852, "Full-finetune/Loss (Raw)": 0.5837540626525879, "Full-finetune/Step": 4736, "Full-finetune/Step Time": 6.773648517206311} {"Full-finetune/Learning Rate": 4.095498121265995e-07, "Full-finetune/Loss": 0.7365280985832214, "Full-finetune/Loss (Raw)": 0.6798219680786133, "Full-finetune/Step": 4737, "Full-finetune/Step Time": 6.783617235720158} {"Full-finetune/Learning Rate": 4.077871129790767e-07, "Full-finetune/Loss": 0.7374905347824097, "Full-finetune/Loss (Raw)": 0.8445436358451843, "Full-finetune/Step": 4738, "Full-finetune/Step Time": 6.793370332568884} {"Full-finetune/Learning Rate": 4.060281363821017e-07, "Full-finetune/Loss": 0.7407896518707275, "Full-finetune/Loss (Raw)": 0.704595685005188, "Full-finetune/Step": 4739, "Full-finetune/Step Time": 6.778693011030555} {"Full-finetune/Learning Rate": 4.042728830183018e-07, "Full-finetune/Loss": 0.7399213910102844, "Full-finetune/Loss (Raw)": 0.669908881187439, "Full-finetune/Step": 4740, "Full-finetune/Step Time": 6.791724184527993} {"Full-finetune/Learning Rate": 4.025213535688544e-07, "Full-finetune/Loss": 0.7392469644546509, "Full-finetune/Loss (Raw)": 0.5425056219100952, "Full-finetune/Step": 4741, "Full-finetune/Step Time": 6.774964492768049} {"Full-finetune/Learning Rate": 4.007735487134956e-07, "Full-finetune/Loss": 0.7389991879463196, "Full-finetune/Loss (Raw)": 0.6672726273536682, "Full-finetune/Step": 4742, "Full-finetune/Step Time": 6.794262696057558} {"Full-finetune/Learning Rate": 3.99029469130513e-07, "Full-finetune/Loss": 0.7371543645858765, "Full-finetune/Loss (Raw)": 0.6528322696685791, "Full-finetune/Step": 4743, "Full-finetune/Step Time": 6.810899551957846} {"Full-finetune/Learning Rate": 3.972891154967506e-07, "Full-finetune/Loss": 0.7386725544929504, "Full-finetune/Loss (Raw)": 0.9333342909812927, "Full-finetune/Step": 4744, "Full-finetune/Step Time": 6.812822535634041} {"Full-finetune/Learning Rate": 3.95552488487605e-07, "Full-finetune/Loss": 0.7389158010482788, "Full-finetune/Loss (Raw)": 0.6938403248786926, "Full-finetune/Step": 4745, "Full-finetune/Step Time": 6.832327712327242} {"Full-finetune/Learning Rate": 3.9381958877702684e-07, "Full-finetune/Loss": 0.7378116846084595, "Full-finetune/Loss (Raw)": 0.6954019069671631, "Full-finetune/Step": 4746, "Full-finetune/Step Time": 6.846315730363131} {"Full-finetune/Learning Rate": 3.920904170375239e-07, "Full-finetune/Loss": 0.7379552125930786, "Full-finetune/Loss (Raw)": 0.9034615159034729, "Full-finetune/Step": 4747, "Full-finetune/Step Time": 6.84628314524889} {"Full-finetune/Learning Rate": 3.903649739401494e-07, "Full-finetune/Loss": 0.7388836145401001, "Full-finetune/Loss (Raw)": 0.8385777473449707, "Full-finetune/Step": 4748, "Full-finetune/Step Time": 6.842259569093585} {"Full-finetune/Learning Rate": 3.8864326015451536e-07, "Full-finetune/Loss": 0.7382410168647766, "Full-finetune/Loss (Raw)": 0.7904556393623352, "Full-finetune/Step": 4749, "Full-finetune/Step Time": 6.8389250207692385} {"Full-finetune/Learning Rate": 3.8692527634878853e-07, "Full-finetune/Loss": 0.7375913262367249, "Full-finetune/Loss (Raw)": 0.7284942865371704, "Full-finetune/Step": 4750, "Full-finetune/Step Time": 6.8310875203460455} {"Full-finetune/Learning Rate": 3.8521102318968106e-07, "Full-finetune/Loss": 0.7367091178894043, "Full-finetune/Loss (Raw)": 0.7469062209129333, "Full-finetune/Step": 4751, "Full-finetune/Step Time": 6.84682871773839} {"Full-finetune/Learning Rate": 3.835005013424631e-07, "Full-finetune/Loss": 0.7374739646911621, "Full-finetune/Loss (Raw)": 0.8266072273254395, "Full-finetune/Step": 4752, "Full-finetune/Step Time": 6.85132341645658} {"Full-finetune/Learning Rate": 3.8179371147095354e-07, "Full-finetune/Loss": 0.7363617420196533, "Full-finetune/Loss (Raw)": 0.6965668201446533, "Full-finetune/Step": 4753, "Full-finetune/Step Time": 6.843445183709264} {"Full-finetune/Learning Rate": 3.80090654237526e-07, "Full-finetune/Loss": 0.7398936152458191, "Full-finetune/Loss (Raw)": 0.7943994998931885, "Full-finetune/Step": 4754, "Full-finetune/Step Time": 6.83063012547791} {"Full-finetune/Learning Rate": 3.7839133030310174e-07, "Full-finetune/Loss": 0.7398975491523743, "Full-finetune/Loss (Raw)": 0.7567809224128723, "Full-finetune/Step": 4755, "Full-finetune/Step Time": 6.830895094200969} {"Full-finetune/Learning Rate": 3.766957403271554e-07, "Full-finetune/Loss": 0.7407156229019165, "Full-finetune/Loss (Raw)": 0.7594848871231079, "Full-finetune/Step": 4756, "Full-finetune/Step Time": 6.824737513437867} {"Full-finetune/Learning Rate": 3.750038849677162e-07, "Full-finetune/Loss": 0.7409517168998718, "Full-finetune/Loss (Raw)": 0.7691094875335693, "Full-finetune/Step": 4757, "Full-finetune/Step Time": 6.812788736075163} {"Full-finetune/Learning Rate": 3.7331576488135456e-07, "Full-finetune/Loss": 0.7415360808372498, "Full-finetune/Loss (Raw)": 0.7457499504089355, "Full-finetune/Step": 4758, "Full-finetune/Step Time": 6.804131839424372} {"Full-finetune/Learning Rate": 3.716313807231986e-07, "Full-finetune/Loss": 0.7424955368041992, "Full-finetune/Loss (Raw)": 0.6864482164382935, "Full-finetune/Step": 4759, "Full-finetune/Step Time": 6.789443820714951} {"Full-finetune/Learning Rate": 3.699507331469276e-07, "Full-finetune/Loss": 0.7464601993560791, "Full-finetune/Loss (Raw)": 0.7720919251441956, "Full-finetune/Step": 4760, "Full-finetune/Step Time": 6.773544907569885} {"Full-finetune/Learning Rate": 3.682738228047655e-07, "Full-finetune/Loss": 0.7466399669647217, "Full-finetune/Loss (Raw)": 0.5938257575035095, "Full-finetune/Step": 4761, "Full-finetune/Step Time": 6.76700565032661} {"Full-finetune/Learning Rate": 3.666006503474895e-07, "Full-finetune/Loss": 0.7455548048019409, "Full-finetune/Loss (Raw)": 0.718392014503479, "Full-finetune/Step": 4762, "Full-finetune/Step Time": 6.765614802017808} {"Full-finetune/Learning Rate": 3.6493121642442454e-07, "Full-finetune/Loss": 0.7471708059310913, "Full-finetune/Loss (Raw)": 0.7649837136268616, "Full-finetune/Step": 4763, "Full-finetune/Step Time": 6.739795316010714} {"Full-finetune/Learning Rate": 3.6326552168344574e-07, "Full-finetune/Loss": 0.7463207244873047, "Full-finetune/Loss (Raw)": 0.6764335036277771, "Full-finetune/Step": 4764, "Full-finetune/Step Time": 6.743843797594309} {"Full-finetune/Learning Rate": 3.616035667709761e-07, "Full-finetune/Loss": 0.7447497844696045, "Full-finetune/Loss (Raw)": 0.6469905376434326, "Full-finetune/Step": 4765, "Full-finetune/Step Time": 6.743631577119231} {"Full-finetune/Learning Rate": 3.5994535233198844e-07, "Full-finetune/Loss": 0.7442022562026978, "Full-finetune/Loss (Raw)": 0.9208205342292786, "Full-finetune/Step": 4766, "Full-finetune/Step Time": 6.74572928994894} {"Full-finetune/Learning Rate": 3.582908790100037e-07, "Full-finetune/Loss": 0.7459720969200134, "Full-finetune/Loss (Raw)": 0.8197287321090698, "Full-finetune/Step": 4767, "Full-finetune/Step Time": 6.715920580551028} {"Full-finetune/Learning Rate": 3.566401474470904e-07, "Full-finetune/Loss": 0.7450364828109741, "Full-finetune/Loss (Raw)": 0.7376933097839355, "Full-finetune/Step": 4768, "Full-finetune/Step Time": 6.720508543774486} {"Full-finetune/Learning Rate": 3.5499315828386393e-07, "Full-finetune/Loss": 0.7447500824928284, "Full-finetune/Loss (Raw)": 0.7497727274894714, "Full-finetune/Step": 4769, "Full-finetune/Step Time": 6.719197550788522} {"Full-finetune/Learning Rate": 3.533499121594919e-07, "Full-finetune/Loss": 0.7421560883522034, "Full-finetune/Loss (Raw)": 0.4628777801990509, "Full-finetune/Step": 4770, "Full-finetune/Step Time": 6.7225303035229445} {"Full-finetune/Learning Rate": 3.5171040971168414e-07, "Full-finetune/Loss": 0.7423292994499207, "Full-finetune/Loss (Raw)": 0.8945627808570862, "Full-finetune/Step": 4771, "Full-finetune/Step Time": 6.725948723033071} {"Full-finetune/Learning Rate": 3.500746515766973e-07, "Full-finetune/Loss": 0.7448232769966125, "Full-finetune/Loss (Raw)": 0.6882922053337097, "Full-finetune/Step": 4772, "Full-finetune/Step Time": 6.7205326817929745} {"Full-finetune/Learning Rate": 3.4844263838934023e-07, "Full-finetune/Loss": 0.7427297234535217, "Full-finetune/Loss (Raw)": 0.5460802316665649, "Full-finetune/Step": 4773, "Full-finetune/Step Time": 6.73127100430429} {"Full-finetune/Learning Rate": 3.468143707829641e-07, "Full-finetune/Loss": 0.7441151142120361, "Full-finetune/Loss (Raw)": 0.7906529307365417, "Full-finetune/Step": 4774, "Full-finetune/Step Time": 6.722008401528001} {"Full-finetune/Learning Rate": 3.45189849389469e-07, "Full-finetune/Loss": 0.7446863651275635, "Full-finetune/Loss (Raw)": 0.8656640648841858, "Full-finetune/Step": 4775, "Full-finetune/Step Time": 6.718171734362841} {"Full-finetune/Learning Rate": 3.4356907483929835e-07, "Full-finetune/Loss": 0.7442829608917236, "Full-finetune/Loss (Raw)": 0.6766273975372314, "Full-finetune/Step": 4776, "Full-finetune/Step Time": 6.731047682464123} {"Full-finetune/Learning Rate": 3.419520477614435e-07, "Full-finetune/Loss": 0.7436081171035767, "Full-finetune/Loss (Raw)": 0.7583605051040649, "Full-finetune/Step": 4777, "Full-finetune/Step Time": 6.731998508796096} {"Full-finetune/Learning Rate": 3.403387687834425e-07, "Full-finetune/Loss": 0.7408912777900696, "Full-finetune/Loss (Raw)": 0.28257784247398376, "Full-finetune/Step": 4778, "Full-finetune/Step Time": 6.7354949321597815} {"Full-finetune/Learning Rate": 3.3872923853137453e-07, "Full-finetune/Loss": 0.7418931722640991, "Full-finetune/Loss (Raw)": 0.9161526560783386, "Full-finetune/Step": 4779, "Full-finetune/Step Time": 6.736693495884538} {"Full-finetune/Learning Rate": 3.371234576298699e-07, "Full-finetune/Loss": 0.7414020895957947, "Full-finetune/Loss (Raw)": 0.6963963508605957, "Full-finetune/Step": 4780, "Full-finetune/Step Time": 6.741442274302244} {"Full-finetune/Learning Rate": 3.355214267021012e-07, "Full-finetune/Loss": 0.7441511154174805, "Full-finetune/Loss (Raw)": 0.648546040058136, "Full-finetune/Step": 4781, "Full-finetune/Step Time": 6.7309354320168495} {"Full-finetune/Learning Rate": 3.3392314636978117e-07, "Full-finetune/Loss": 0.7435494661331177, "Full-finetune/Loss (Raw)": 0.6538511514663696, "Full-finetune/Step": 4782, "Full-finetune/Step Time": 6.732384011149406} {"Full-finetune/Learning Rate": 3.323286172531748e-07, "Full-finetune/Loss": 0.741551399230957, "Full-finetune/Loss (Raw)": 0.36239317059516907, "Full-finetune/Step": 4783, "Full-finetune/Step Time": 6.745707863941789} {"Full-finetune/Learning Rate": 3.30737839971087e-07, "Full-finetune/Loss": 0.7443050146102905, "Full-finetune/Loss (Raw)": 0.7814053297042847, "Full-finetune/Step": 4784, "Full-finetune/Step Time": 6.716937530785799} {"Full-finetune/Learning Rate": 3.2915081514086624e-07, "Full-finetune/Loss": 0.7460236549377441, "Full-finetune/Loss (Raw)": 0.9514572620391846, "Full-finetune/Step": 4785, "Full-finetune/Step Time": 6.718597067520022} {"Full-finetune/Learning Rate": 3.2756754337840757e-07, "Full-finetune/Loss": 0.7458829879760742, "Full-finetune/Loss (Raw)": 0.8150844573974609, "Full-finetune/Step": 4786, "Full-finetune/Step Time": 6.721543239429593} {"Full-finetune/Learning Rate": 3.2598802529814734e-07, "Full-finetune/Loss": 0.74508136510849, "Full-finetune/Loss (Raw)": 0.7517183423042297, "Full-finetune/Step": 4787, "Full-finetune/Step Time": 6.717304183170199} {"Full-finetune/Learning Rate": 3.2441226151306403e-07, "Full-finetune/Loss": 0.7434903979301453, "Full-finetune/Loss (Raw)": 0.6296022534370422, "Full-finetune/Step": 4788, "Full-finetune/Step Time": 6.727121224626899} {"Full-finetune/Learning Rate": 3.228402526346819e-07, "Full-finetune/Loss": 0.7429275512695312, "Full-finetune/Loss (Raw)": 0.5938658714294434, "Full-finetune/Step": 4789, "Full-finetune/Step Time": 6.727278573438525} {"Full-finetune/Learning Rate": 3.212719992730684e-07, "Full-finetune/Loss": 0.7427121996879578, "Full-finetune/Loss (Raw)": 0.810937762260437, "Full-finetune/Step": 4790, "Full-finetune/Step Time": 6.743388678878546} {"Full-finetune/Learning Rate": 3.197075020368312e-07, "Full-finetune/Loss": 0.7386998534202576, "Full-finetune/Loss (Raw)": 0.29675835371017456, "Full-finetune/Step": 4791, "Full-finetune/Step Time": 6.763138826936483} {"Full-finetune/Learning Rate": 3.1814676153311907e-07, "Full-finetune/Loss": 0.7401720881462097, "Full-finetune/Loss (Raw)": 0.9642176032066345, "Full-finetune/Step": 4792, "Full-finetune/Step Time": 6.7889171447604895} {"Full-finetune/Learning Rate": 3.165897783676275e-07, "Full-finetune/Loss": 0.7412578463554382, "Full-finetune/Loss (Raw)": 0.8297774195671082, "Full-finetune/Step": 4793, "Full-finetune/Step Time": 6.787489579990506} {"Full-finetune/Learning Rate": 3.1503655314458983e-07, "Full-finetune/Loss": 0.7421949505805969, "Full-finetune/Loss (Raw)": 0.6876649856567383, "Full-finetune/Step": 4794, "Full-finetune/Step Time": 6.7701383754611015} {"Full-finetune/Learning Rate": 3.134870864667827e-07, "Full-finetune/Loss": 0.741125226020813, "Full-finetune/Loss (Raw)": 0.6900659799575806, "Full-finetune/Step": 4795, "Full-finetune/Step Time": 6.8019969668239355} {"Full-finetune/Learning Rate": 3.1194137893552523e-07, "Full-finetune/Loss": 0.7420470118522644, "Full-finetune/Loss (Raw)": 0.847633421421051, "Full-finetune/Step": 4796, "Full-finetune/Step Time": 6.796445459127426} {"Full-finetune/Learning Rate": 3.1039943115067417e-07, "Full-finetune/Loss": 0.7456084489822388, "Full-finetune/Loss (Raw)": 0.8026961088180542, "Full-finetune/Step": 4797, "Full-finetune/Step Time": 6.778954787179828} {"Full-finetune/Learning Rate": 3.088612437106309e-07, "Full-finetune/Loss": 0.7441420555114746, "Full-finetune/Loss (Raw)": 0.6067215204238892, "Full-finetune/Step": 4798, "Full-finetune/Step Time": 6.80596923828125} {"Full-finetune/Learning Rate": 3.0732681721233446e-07, "Full-finetune/Loss": 0.7452127933502197, "Full-finetune/Loss (Raw)": 0.8383174538612366, "Full-finetune/Step": 4799, "Full-finetune/Step Time": 6.811334513127804} {"Full-finetune/Learning Rate": 3.057961522512676e-07, "Full-finetune/Loss": 0.7462193965911865, "Full-finetune/Loss (Raw)": 0.9475468397140503, "Full-finetune/Step": 4800, "Full-finetune/Step Time": 6.79539056122303} {"Full-finetune/Learning Rate": 3.0426924942145166e-07, "Full-finetune/Loss": 0.7467739582061768, "Full-finetune/Loss (Raw)": 0.8575047850608826, "Full-finetune/Step": 4801, "Full-finetune/Step Time": 6.788353499025106} {"Full-finetune/Learning Rate": 3.027461093154449e-07, "Full-finetune/Loss": 0.7462548017501831, "Full-finetune/Loss (Raw)": 0.7902459502220154, "Full-finetune/Step": 4802, "Full-finetune/Step Time": 6.763146219775081} {"Full-finetune/Learning Rate": 3.012267325243512e-07, "Full-finetune/Loss": 0.7463998794555664, "Full-finetune/Loss (Raw)": 0.851557195186615, "Full-finetune/Step": 4803, "Full-finetune/Step Time": 6.768578216433525} {"Full-finetune/Learning Rate": 2.9971111963780994e-07, "Full-finetune/Loss": 0.7470338344573975, "Full-finetune/Loss (Raw)": 0.8133981823921204, "Full-finetune/Step": 4804, "Full-finetune/Step Time": 6.760870352387428} {"Full-finetune/Learning Rate": 2.981992712440007e-07, "Full-finetune/Loss": 0.7471376657485962, "Full-finetune/Loss (Raw)": 0.8524185419082642, "Full-finetune/Step": 4805, "Full-finetune/Step Time": 6.767176017165184} {"Full-finetune/Learning Rate": 2.96691187929643e-07, "Full-finetune/Loss": 0.7473307847976685, "Full-finetune/Loss (Raw)": 0.7817666530609131, "Full-finetune/Step": 4806, "Full-finetune/Step Time": 6.74888670258224} {"Full-finetune/Learning Rate": 2.9518687027999427e-07, "Full-finetune/Loss": 0.7484608888626099, "Full-finetune/Loss (Raw)": 0.7651090025901794, "Full-finetune/Step": 4807, "Full-finetune/Step Time": 6.751102836802602} {"Full-finetune/Learning Rate": 2.936863188788497e-07, "Full-finetune/Loss": 0.7487071752548218, "Full-finetune/Loss (Raw)": 0.9122443199157715, "Full-finetune/Step": 4808, "Full-finetune/Step Time": 6.737473571673036} {"Full-finetune/Learning Rate": 2.921895343085446e-07, "Full-finetune/Loss": 0.7472911477088928, "Full-finetune/Loss (Raw)": 0.5636087656021118, "Full-finetune/Step": 4809, "Full-finetune/Step Time": 6.727082882076502} {"Full-finetune/Learning Rate": 2.9069651714995426e-07, "Full-finetune/Loss": 0.7474190592765808, "Full-finetune/Loss (Raw)": 0.7392240762710571, "Full-finetune/Step": 4810, "Full-finetune/Step Time": 6.718562640249729} {"Full-finetune/Learning Rate": 2.8920726798248645e-07, "Full-finetune/Loss": 0.747521162033081, "Full-finetune/Loss (Raw)": 0.7853435277938843, "Full-finetune/Step": 4811, "Full-finetune/Step Time": 6.735536923632026} {"Full-finetune/Learning Rate": 2.8772178738408985e-07, "Full-finetune/Loss": 0.7468574047088623, "Full-finetune/Loss (Raw)": 0.7876946330070496, "Full-finetune/Step": 4812, "Full-finetune/Step Time": 6.725055752322078} {"Full-finetune/Learning Rate": 2.862400759312522e-07, "Full-finetune/Loss": 0.7438731789588928, "Full-finetune/Loss (Raw)": 0.4683936834335327, "Full-finetune/Step": 4813, "Full-finetune/Step Time": 6.739987527951598} {"Full-finetune/Learning Rate": 2.847621341989959e-07, "Full-finetune/Loss": 0.745154619216919, "Full-finetune/Loss (Raw)": 0.81336510181427, "Full-finetune/Step": 4814, "Full-finetune/Step Time": 6.7316588424146175} {"Full-finetune/Learning Rate": 2.832879627608831e-07, "Full-finetune/Loss": 0.7458801865577698, "Full-finetune/Loss (Raw)": 0.8832565546035767, "Full-finetune/Step": 4815, "Full-finetune/Step Time": 6.729715725407004} {"Full-finetune/Learning Rate": 2.8181756218900626e-07, "Full-finetune/Loss": 0.7431355714797974, "Full-finetune/Loss (Raw)": 0.673511803150177, "Full-finetune/Step": 4816, "Full-finetune/Step Time": 6.74669661000371} {"Full-finetune/Learning Rate": 2.803509330540033e-07, "Full-finetune/Loss": 0.7427750825881958, "Full-finetune/Loss (Raw)": 0.8252859115600586, "Full-finetune/Step": 4817, "Full-finetune/Step Time": 6.752303127199411} {"Full-finetune/Learning Rate": 2.788880759250423e-07, "Full-finetune/Loss": 0.7443104386329651, "Full-finetune/Loss (Raw)": 0.8381444215774536, "Full-finetune/Step": 4818, "Full-finetune/Step Time": 6.734424753114581} {"Full-finetune/Learning Rate": 2.7742899136983026e-07, "Full-finetune/Loss": 0.7441538572311401, "Full-finetune/Loss (Raw)": 0.8715113401412964, "Full-finetune/Step": 4819, "Full-finetune/Step Time": 6.734152587130666} {"Full-finetune/Learning Rate": 2.759736799546109e-07, "Full-finetune/Loss": 0.7435740828514099, "Full-finetune/Loss (Raw)": 0.8607072234153748, "Full-finetune/Step": 4820, "Full-finetune/Step Time": 6.726386938244104} {"Full-finetune/Learning Rate": 2.745221422441602e-07, "Full-finetune/Loss": 0.7444263100624084, "Full-finetune/Loss (Raw)": 0.8819760084152222, "Full-finetune/Step": 4821, "Full-finetune/Step Time": 6.714643597602844} {"Full-finetune/Learning Rate": 2.73074378801792e-07, "Full-finetune/Loss": 0.7440081834793091, "Full-finetune/Loss (Raw)": 0.8261142373085022, "Full-finetune/Step": 4822, "Full-finetune/Step Time": 6.723809376358986} {"Full-finetune/Learning Rate": 2.7163039018935357e-07, "Full-finetune/Loss": 0.7444413900375366, "Full-finetune/Loss (Raw)": 0.8592331409454346, "Full-finetune/Step": 4823, "Full-finetune/Step Time": 6.7219787035137415} {"Full-finetune/Learning Rate": 2.701901769672322e-07, "Full-finetune/Loss": 0.7414023876190186, "Full-finetune/Loss (Raw)": 0.282558798789978, "Full-finetune/Step": 4824, "Full-finetune/Step Time": 6.727288259193301} {"Full-finetune/Learning Rate": 2.687537396943451e-07, "Full-finetune/Loss": 0.7412815093994141, "Full-finetune/Loss (Raw)": 0.7403438687324524, "Full-finetune/Step": 4825, "Full-finetune/Step Time": 6.7324844263494015} {"Full-finetune/Learning Rate": 2.673210789281433e-07, "Full-finetune/Loss": 0.7405768632888794, "Full-finetune/Loss (Raw)": 0.7676620483398438, "Full-finetune/Step": 4826, "Full-finetune/Step Time": 6.731981603428721} {"Full-finetune/Learning Rate": 2.658921952246163e-07, "Full-finetune/Loss": 0.740488588809967, "Full-finetune/Loss (Raw)": 0.8695933818817139, "Full-finetune/Step": 4827, "Full-finetune/Step Time": 6.723452169448137} {"Full-finetune/Learning Rate": 2.6446708913828725e-07, "Full-finetune/Loss": 0.7411584258079529, "Full-finetune/Loss (Raw)": 0.8618761897087097, "Full-finetune/Step": 4828, "Full-finetune/Step Time": 6.730499150231481} {"Full-finetune/Learning Rate": 2.6304576122221035e-07, "Full-finetune/Loss": 0.7408329248428345, "Full-finetune/Loss (Raw)": 0.772275984287262, "Full-finetune/Step": 4829, "Full-finetune/Step Time": 6.738323410972953} {"Full-finetune/Learning Rate": 2.616282120279745e-07, "Full-finetune/Loss": 0.7407604455947876, "Full-finetune/Loss (Raw)": 0.7368628978729248, "Full-finetune/Step": 4830, "Full-finetune/Step Time": 6.736277852207422} {"Full-finetune/Learning Rate": 2.602144421057051e-07, "Full-finetune/Loss": 0.7365075349807739, "Full-finetune/Loss (Raw)": 0.34743666648864746, "Full-finetune/Step": 4831, "Full-finetune/Step Time": 6.758966786786914} {"Full-finetune/Learning Rate": 2.5880445200405667e-07, "Full-finetune/Loss": 0.7364820241928101, "Full-finetune/Loss (Raw)": 0.6598758101463318, "Full-finetune/Step": 4832, "Full-finetune/Step Time": 6.782349655404687} {"Full-finetune/Learning Rate": 2.573982422702193e-07, "Full-finetune/Loss": 0.7356874942779541, "Full-finetune/Loss (Raw)": 0.7745215892791748, "Full-finetune/Step": 4833, "Full-finetune/Step Time": 6.79612367041409} {"Full-finetune/Learning Rate": 2.559958134499163e-07, "Full-finetune/Loss": 0.7371742725372314, "Full-finetune/Loss (Raw)": 0.9090994596481323, "Full-finetune/Step": 4834, "Full-finetune/Step Time": 6.800172382965684} {"Full-finetune/Learning Rate": 2.545971660874036e-07, "Full-finetune/Loss": 0.73842453956604, "Full-finetune/Loss (Raw)": 0.8433163166046143, "Full-finetune/Step": 4835, "Full-finetune/Step Time": 6.797107798978686} {"Full-finetune/Learning Rate": 2.532023007254658e-07, "Full-finetune/Loss": 0.7400525212287903, "Full-finetune/Loss (Raw)": 0.8921431303024292, "Full-finetune/Step": 4836, "Full-finetune/Step Time": 6.795552222058177} {"Full-finetune/Learning Rate": 2.518112179054266e-07, "Full-finetune/Loss": 0.7408919334411621, "Full-finetune/Loss (Raw)": 0.7718586325645447, "Full-finetune/Step": 4837, "Full-finetune/Step Time": 6.777049267664552} {"Full-finetune/Learning Rate": 2.504239181671353e-07, "Full-finetune/Loss": 0.7403203845024109, "Full-finetune/Loss (Raw)": 0.8677492141723633, "Full-finetune/Step": 4838, "Full-finetune/Step Time": 6.778340891003609} {"Full-finetune/Learning Rate": 2.490404020489767e-07, "Full-finetune/Loss": 0.739655613899231, "Full-finetune/Loss (Raw)": 0.6833879947662354, "Full-finetune/Step": 4839, "Full-finetune/Step Time": 6.779403368011117} {"Full-finetune/Learning Rate": 2.476606700878681e-07, "Full-finetune/Loss": 0.7401950359344482, "Full-finetune/Loss (Raw)": 0.7730444073677063, "Full-finetune/Step": 4840, "Full-finetune/Step Time": 6.76979560777545} {"Full-finetune/Learning Rate": 2.4628472281925443e-07, "Full-finetune/Loss": 0.7392534017562866, "Full-finetune/Loss (Raw)": 0.7151511907577515, "Full-finetune/Step": 4841, "Full-finetune/Step Time": 6.7753072418272495} {"Full-finetune/Learning Rate": 2.449125607771141e-07, "Full-finetune/Loss": 0.7384502291679382, "Full-finetune/Loss (Raw)": 0.6438802480697632, "Full-finetune/Step": 4842, "Full-finetune/Step Time": 6.7859171107411385} {"Full-finetune/Learning Rate": 2.435441844939557e-07, "Full-finetune/Loss": 0.7396436333656311, "Full-finetune/Loss (Raw)": 0.9397411346435547, "Full-finetune/Step": 4843, "Full-finetune/Step Time": 6.783671095967293} {"Full-finetune/Learning Rate": 2.4217959450082207e-07, "Full-finetune/Loss": 0.7391023635864258, "Full-finetune/Loss (Raw)": 0.6730377674102783, "Full-finetune/Step": 4844, "Full-finetune/Step Time": 6.803963596001267} {"Full-finetune/Learning Rate": 2.408187913272841e-07, "Full-finetune/Loss": 0.7396321296691895, "Full-finetune/Loss (Raw)": 0.8775920271873474, "Full-finetune/Step": 4845, "Full-finetune/Step Time": 6.805717915296555} {"Full-finetune/Learning Rate": 2.3946177550143835e-07, "Full-finetune/Loss": 0.7414677143096924, "Full-finetune/Loss (Raw)": 0.7942917943000793, "Full-finetune/Step": 4846, "Full-finetune/Step Time": 6.817215453833342} {"Full-finetune/Learning Rate": 2.3810854754992008e-07, "Full-finetune/Loss": 0.7388988733291626, "Full-finetune/Loss (Raw)": 0.31601086258888245, "Full-finetune/Step": 4847, "Full-finetune/Step Time": 6.8374833185225725} {"Full-finetune/Learning Rate": 2.3675910799789036e-07, "Full-finetune/Loss": 0.7404345870018005, "Full-finetune/Loss (Raw)": 0.6675481796264648, "Full-finetune/Step": 4848, "Full-finetune/Step Time": 6.800757084041834} {"Full-finetune/Learning Rate": 2.354134573690392e-07, "Full-finetune/Loss": 0.7410455942153931, "Full-finetune/Loss (Raw)": 0.6740798354148865, "Full-finetune/Step": 4849, "Full-finetune/Step Time": 6.816142704337835} {"Full-finetune/Learning Rate": 2.3407159618558772e-07, "Full-finetune/Loss": 0.7424800395965576, "Full-finetune/Loss (Raw)": 0.8671965599060059, "Full-finetune/Step": 4850, "Full-finetune/Step Time": 6.824682069942355} {"Full-finetune/Learning Rate": 2.3273352496828605e-07, "Full-finetune/Loss": 0.7431667447090149, "Full-finetune/Loss (Raw)": 0.8607643842697144, "Full-finetune/Step": 4851, "Full-finetune/Step Time": 6.841189805418253} {"Full-finetune/Learning Rate": 2.3139924423641325e-07, "Full-finetune/Loss": 0.7434625625610352, "Full-finetune/Loss (Raw)": 0.6685367822647095, "Full-finetune/Step": 4852, "Full-finetune/Step Time": 6.833352820947766} {"Full-finetune/Learning Rate": 2.3006875450777733e-07, "Full-finetune/Loss": 0.7443764209747314, "Full-finetune/Loss (Raw)": 0.8244218826293945, "Full-finetune/Step": 4853, "Full-finetune/Step Time": 6.839729903265834} {"Full-finetune/Learning Rate": 2.287420562987175e-07, "Full-finetune/Loss": 0.7431336641311646, "Full-finetune/Loss (Raw)": 0.5223540663719177, "Full-finetune/Step": 4854, "Full-finetune/Step Time": 6.841905131936073} {"Full-finetune/Learning Rate": 2.2741915012409744e-07, "Full-finetune/Loss": 0.7437052726745605, "Full-finetune/Loss (Raw)": 0.7840990424156189, "Full-finetune/Step": 4855, "Full-finetune/Step Time": 6.8425448928028345} {"Full-finetune/Learning Rate": 2.2610003649731093e-07, "Full-finetune/Loss": 0.7444698810577393, "Full-finetune/Loss (Raw)": 0.8067584037780762, "Full-finetune/Step": 4856, "Full-finetune/Step Time": 6.847348002716899} {"Full-finetune/Learning Rate": 2.2478471593028073e-07, "Full-finetune/Loss": 0.7433782815933228, "Full-finetune/Loss (Raw)": 0.8798025250434875, "Full-finetune/Step": 4857, "Full-finetune/Step Time": 6.845671245828271} {"Full-finetune/Learning Rate": 2.234731889334585e-07, "Full-finetune/Loss": 0.7447761297225952, "Full-finetune/Loss (Raw)": 0.9554873108863831, "Full-finetune/Step": 4858, "Full-finetune/Step Time": 6.855226369574666} {"Full-finetune/Learning Rate": 2.221654560158204e-07, "Full-finetune/Loss": 0.7460013628005981, "Full-finetune/Loss (Raw)": 0.7845078706741333, "Full-finetune/Step": 4859, "Full-finetune/Step Time": 6.84124238230288} {"Full-finetune/Learning Rate": 2.2086151768487273e-07, "Full-finetune/Loss": 0.7453765273094177, "Full-finetune/Loss (Raw)": 0.7099936604499817, "Full-finetune/Step": 4860, "Full-finetune/Step Time": 6.829675829038024} {"Full-finetune/Learning Rate": 2.195613744466485e-07, "Full-finetune/Loss": 0.7443957328796387, "Full-finetune/Loss (Raw)": 0.7225814461708069, "Full-finetune/Step": 4861, "Full-finetune/Step Time": 6.843990046530962} {"Full-finetune/Learning Rate": 2.182650268057085e-07, "Full-finetune/Loss": 0.7462487816810608, "Full-finetune/Loss (Raw)": 0.9185584187507629, "Full-finetune/Step": 4862, "Full-finetune/Step Time": 6.828527489677072} {"Full-finetune/Learning Rate": 2.1697247526513698e-07, "Full-finetune/Loss": 0.7467901706695557, "Full-finetune/Loss (Raw)": 0.9274311661720276, "Full-finetune/Step": 4863, "Full-finetune/Step Time": 6.833407636731863} {"Full-finetune/Learning Rate": 2.1568372032655384e-07, "Full-finetune/Loss": 0.7480795979499817, "Full-finetune/Loss (Raw)": 0.7488043904304504, "Full-finetune/Step": 4864, "Full-finetune/Step Time": 6.837375385686755} {"Full-finetune/Learning Rate": 2.143987624900945e-07, "Full-finetune/Loss": 0.7492510676383972, "Full-finetune/Loss (Raw)": 0.8297697305679321, "Full-finetune/Step": 4865, "Full-finetune/Step Time": 6.8309937082231045} {"Full-finetune/Learning Rate": 2.1311760225442678e-07, "Full-finetune/Loss": 0.7483464479446411, "Full-finetune/Loss (Raw)": 0.7287501096725464, "Full-finetune/Step": 4866, "Full-finetune/Step Time": 6.82256880402565} {"Full-finetune/Learning Rate": 2.118402401167452e-07, "Full-finetune/Loss": 0.7455234527587891, "Full-finetune/Loss (Raw)": 0.3432578444480896, "Full-finetune/Step": 4867, "Full-finetune/Step Time": 6.841227527707815} {"Full-finetune/Learning Rate": 2.1056667657276876e-07, "Full-finetune/Loss": 0.745722234249115, "Full-finetune/Loss (Raw)": 0.6953466534614563, "Full-finetune/Step": 4868, "Full-finetune/Step Time": 6.830944431945682} {"Full-finetune/Learning Rate": 2.0929691211674319e-07, "Full-finetune/Loss": 0.7464350461959839, "Full-finetune/Loss (Raw)": 0.6337506771087646, "Full-finetune/Step": 4869, "Full-finetune/Step Time": 6.834326596930623} {"Full-finetune/Learning Rate": 2.0803094724143879e-07, "Full-finetune/Loss": 0.7466850280761719, "Full-finetune/Loss (Raw)": 0.6992675065994263, "Full-finetune/Step": 4870, "Full-finetune/Step Time": 6.810884278267622} {"Full-finetune/Learning Rate": 2.0676878243815145e-07, "Full-finetune/Loss": 0.7477935552597046, "Full-finetune/Loss (Raw)": 0.7947292923927307, "Full-finetune/Step": 4871, "Full-finetune/Step Time": 6.804136233404279} {"Full-finetune/Learning Rate": 2.055104181967027e-07, "Full-finetune/Loss": 0.7466294765472412, "Full-finetune/Loss (Raw)": 0.7843250036239624, "Full-finetune/Step": 4872, "Full-finetune/Step Time": 6.803693214431405} {"Full-finetune/Learning Rate": 2.0425585500543854e-07, "Full-finetune/Loss": 0.7465299367904663, "Full-finetune/Loss (Raw)": 0.6811050176620483, "Full-finetune/Step": 4873, "Full-finetune/Step Time": 6.800209056586027} {"Full-finetune/Learning Rate": 2.0300509335123286e-07, "Full-finetune/Loss": 0.7454925775527954, "Full-finetune/Loss (Raw)": 0.562615692615509, "Full-finetune/Step": 4874, "Full-finetune/Step Time": 6.783839790150523} {"Full-finetune/Learning Rate": 2.0175813371948072e-07, "Full-finetune/Loss": 0.7441420555114746, "Full-finetune/Loss (Raw)": 0.7305948138237, "Full-finetune/Step": 4875, "Full-finetune/Step Time": 6.792687956243753} {"Full-finetune/Learning Rate": 2.0051497659409947e-07, "Full-finetune/Loss": 0.7444907426834106, "Full-finetune/Loss (Raw)": 0.8832061290740967, "Full-finetune/Step": 4876, "Full-finetune/Step Time": 6.784409765154123} {"Full-finetune/Learning Rate": 1.9927562245753874e-07, "Full-finetune/Loss": 0.7451590299606323, "Full-finetune/Loss (Raw)": 0.876002311706543, "Full-finetune/Step": 4877, "Full-finetune/Step Time": 6.785933600738645} {"Full-finetune/Learning Rate": 1.9804007179076602e-07, "Full-finetune/Loss": 0.7450739145278931, "Full-finetune/Loss (Raw)": 0.7175984382629395, "Full-finetune/Step": 4878, "Full-finetune/Step Time": 6.786898357793689} {"Full-finetune/Learning Rate": 1.968083250732744e-07, "Full-finetune/Loss": 0.745823323726654, "Full-finetune/Loss (Raw)": 0.8428277969360352, "Full-finetune/Step": 4879, "Full-finetune/Step Time": 6.768220445141196} {"Full-finetune/Learning Rate": 1.9558038278308044e-07, "Full-finetune/Loss": 0.746185302734375, "Full-finetune/Loss (Raw)": 0.8729395270347595, "Full-finetune/Step": 4880, "Full-finetune/Step Time": 6.763868218287826} {"Full-finetune/Learning Rate": 1.9435624539672515e-07, "Full-finetune/Loss": 0.7483114004135132, "Full-finetune/Loss (Raw)": 0.9687146544456482, "Full-finetune/Step": 4881, "Full-finetune/Step Time": 6.757991841062903} {"Full-finetune/Learning Rate": 1.9313591338927185e-07, "Full-finetune/Loss": 0.7473627924919128, "Full-finetune/Loss (Raw)": 0.6729776263237, "Full-finetune/Step": 4882, "Full-finetune/Step Time": 6.7596124187111855} {"Full-finetune/Learning Rate": 1.9191938723430614e-07, "Full-finetune/Loss": 0.7466951012611389, "Full-finetune/Loss (Raw)": 0.6713085770606995, "Full-finetune/Step": 4883, "Full-finetune/Step Time": 6.750513568520546} {"Full-finetune/Learning Rate": 1.9070666740394151e-07, "Full-finetune/Loss": 0.7474602460861206, "Full-finetune/Loss (Raw)": 0.8574265837669373, "Full-finetune/Step": 4884, "Full-finetune/Step Time": 6.752510724589229} {"Full-finetune/Learning Rate": 1.8949775436880924e-07, "Full-finetune/Loss": 0.7471755743026733, "Full-finetune/Loss (Raw)": 0.732677161693573, "Full-finetune/Step": 4885, "Full-finetune/Step Time": 6.756111826747656} {"Full-finetune/Learning Rate": 1.8829264859806296e-07, "Full-finetune/Loss": 0.7480606436729431, "Full-finetune/Loss (Raw)": 0.8590293526649475, "Full-finetune/Step": 4886, "Full-finetune/Step Time": 6.76128663867712} {"Full-finetune/Learning Rate": 1.8709135055938298e-07, "Full-finetune/Loss": 0.7491394281387329, "Full-finetune/Loss (Raw)": 0.8245382905006409, "Full-finetune/Step": 4887, "Full-finetune/Step Time": 6.777952738106251} {"Full-finetune/Learning Rate": 1.8589386071896975e-07, "Full-finetune/Loss": 0.7494907379150391, "Full-finetune/Loss (Raw)": 0.8170580863952637, "Full-finetune/Step": 4888, "Full-finetune/Step Time": 6.787719698622823} {"Full-finetune/Learning Rate": 1.8470017954154262e-07, "Full-finetune/Loss": 0.7510087490081787, "Full-finetune/Loss (Raw)": 0.7881278395652771, "Full-finetune/Step": 4889, "Full-finetune/Step Time": 6.777121411636472} {"Full-finetune/Learning Rate": 1.8351030749034992e-07, "Full-finetune/Loss": 0.7507792115211487, "Full-finetune/Loss (Raw)": 0.689015805721283, "Full-finetune/Step": 4890, "Full-finetune/Step Time": 6.79536497592926} {"Full-finetune/Learning Rate": 1.8232424502715672e-07, "Full-finetune/Loss": 0.7504355907440186, "Full-finetune/Loss (Raw)": 0.7209954857826233, "Full-finetune/Step": 4891, "Full-finetune/Step Time": 6.793183034285903} {"Full-finetune/Learning Rate": 1.811419926122493e-07, "Full-finetune/Loss": 0.7511706352233887, "Full-finetune/Loss (Raw)": 0.7705175280570984, "Full-finetune/Step": 4892, "Full-finetune/Step Time": 6.789015136659145} {"Full-finetune/Learning Rate": 1.7996355070443727e-07, "Full-finetune/Loss": 0.7530056238174438, "Full-finetune/Loss (Raw)": 0.881878674030304, "Full-finetune/Step": 4893, "Full-finetune/Step Time": 6.789325309917331} {"Full-finetune/Learning Rate": 1.787889197610515e-07, "Full-finetune/Loss": 0.7514737248420715, "Full-finetune/Loss (Raw)": 0.7247288823127747, "Full-finetune/Step": 4894, "Full-finetune/Step Time": 6.794763846322894} {"Full-finetune/Learning Rate": 1.776181002379429e-07, "Full-finetune/Loss": 0.7501758337020874, "Full-finetune/Loss (Raw)": 0.6536030173301697, "Full-finetune/Step": 4895, "Full-finetune/Step Time": 6.79753365367651} {"Full-finetune/Learning Rate": 1.7645109258948245e-07, "Full-finetune/Loss": 0.7510688304901123, "Full-finetune/Loss (Raw)": 0.851999044418335, "Full-finetune/Step": 4896, "Full-finetune/Step Time": 6.79016001150012} {"Full-finetune/Learning Rate": 1.7528789726856566e-07, "Full-finetune/Loss": 0.7500463128089905, "Full-finetune/Loss (Raw)": 0.6188914775848389, "Full-finetune/Step": 4897, "Full-finetune/Step Time": 6.796720432117581} {"Full-finetune/Learning Rate": 1.7412851472660585e-07, "Full-finetune/Loss": 0.75169837474823, "Full-finetune/Loss (Raw)": 0.6743353605270386, "Full-finetune/Step": 4898, "Full-finetune/Step Time": 6.798935942351818} {"Full-finetune/Learning Rate": 1.7297294541353317e-07, "Full-finetune/Loss": 0.7514415979385376, "Full-finetune/Loss (Raw)": 0.8616946339607239, "Full-finetune/Step": 4899, "Full-finetune/Step Time": 6.796467389911413} {"Full-finetune/Learning Rate": 1.7182118977780548e-07, "Full-finetune/Loss": 0.7521999478340149, "Full-finetune/Loss (Raw)": 0.7853650450706482, "Full-finetune/Step": 4900, "Full-finetune/Step Time": 6.7834992073476315} {"Full-finetune/Learning Rate": 1.706732482663942e-07, "Full-finetune/Loss": 0.7537410259246826, "Full-finetune/Loss (Raw)": 0.7433335185050964, "Full-finetune/Step": 4901, "Full-finetune/Step Time": 6.7713776379823685} {"Full-finetune/Learning Rate": 1.6952912132479404e-07, "Full-finetune/Loss": 0.7534348964691162, "Full-finetune/Loss (Raw)": 0.7514678239822388, "Full-finetune/Step": 4902, "Full-finetune/Step Time": 6.771108113229275} {"Full-finetune/Learning Rate": 1.6838880939701875e-07, "Full-finetune/Loss": 0.7522553205490112, "Full-finetune/Loss (Raw)": 0.714678168296814, "Full-finetune/Step": 4903, "Full-finetune/Step Time": 6.780536942183971} {"Full-finetune/Learning Rate": 1.6725231292559985e-07, "Full-finetune/Loss": 0.753063440322876, "Full-finetune/Loss (Raw)": 0.7800691723823547, "Full-finetune/Step": 4904, "Full-finetune/Step Time": 6.775668002665043} {"Full-finetune/Learning Rate": 1.661196323515901e-07, "Full-finetune/Loss": 0.753314733505249, "Full-finetune/Loss (Raw)": 0.7905334234237671, "Full-finetune/Step": 4905, "Full-finetune/Step Time": 6.779313787817955} {"Full-finetune/Learning Rate": 1.6499076811456015e-07, "Full-finetune/Loss": 0.7567087411880493, "Full-finetune/Loss (Raw)": 0.7170009613037109, "Full-finetune/Step": 4906, "Full-finetune/Step Time": 6.763185761868954} {"Full-finetune/Learning Rate": 1.6386572065260065e-07, "Full-finetune/Loss": 0.7542071342468262, "Full-finetune/Loss (Raw)": 0.5959463715553284, "Full-finetune/Step": 4907, "Full-finetune/Step Time": 6.770206812769175} {"Full-finetune/Learning Rate": 1.6274449040232233e-07, "Full-finetune/Loss": 0.7547081708908081, "Full-finetune/Loss (Raw)": 0.7605358362197876, "Full-finetune/Step": 4908, "Full-finetune/Step Time": 6.7816462479531765} {"Full-finetune/Learning Rate": 1.6162707779884933e-07, "Full-finetune/Loss": 0.755608320236206, "Full-finetune/Loss (Raw)": 0.7637664079666138, "Full-finetune/Step": 4909, "Full-finetune/Step Time": 6.777579288929701} {"Full-finetune/Learning Rate": 1.6051348327583038e-07, "Full-finetune/Loss": 0.7568836212158203, "Full-finetune/Loss (Raw)": 0.8170835971832275, "Full-finetune/Step": 4910, "Full-finetune/Step Time": 6.766738969832659} {"Full-finetune/Learning Rate": 1.5940370726542864e-07, "Full-finetune/Loss": 0.7600083351135254, "Full-finetune/Loss (Raw)": 0.7623630166053772, "Full-finetune/Step": 4911, "Full-finetune/Step Time": 6.747452022507787} {"Full-finetune/Learning Rate": 1.5829775019832628e-07, "Full-finetune/Loss": 0.7598163485527039, "Full-finetune/Loss (Raw)": 0.7568289637565613, "Full-finetune/Step": 4912, "Full-finetune/Step Time": 6.753905000165105} {"Full-finetune/Learning Rate": 1.571956125037244e-07, "Full-finetune/Loss": 0.7586320638656616, "Full-finetune/Loss (Raw)": 0.799863338470459, "Full-finetune/Step": 4913, "Full-finetune/Step Time": 6.762173868715763} {"Full-finetune/Learning Rate": 1.5609729460934087e-07, "Full-finetune/Loss": 0.7553939819335938, "Full-finetune/Loss (Raw)": 0.4006084203720093, "Full-finetune/Step": 4914, "Full-finetune/Step Time": 6.777008814737201} {"Full-finetune/Learning Rate": 1.550027969414114e-07, "Full-finetune/Loss": 0.7546415328979492, "Full-finetune/Loss (Raw)": 0.6554126739501953, "Full-finetune/Step": 4915, "Full-finetune/Step Time": 6.790023311972618} {"Full-finetune/Learning Rate": 1.5391211992468736e-07, "Full-finetune/Loss": 0.7556345462799072, "Full-finetune/Loss (Raw)": 0.7567099928855896, "Full-finetune/Step": 4916, "Full-finetune/Step Time": 6.764144418761134} {"Full-finetune/Learning Rate": 1.5282526398244236e-07, "Full-finetune/Loss": 0.7541576623916626, "Full-finetune/Loss (Raw)": 0.4048146605491638, "Full-finetune/Step": 4917, "Full-finetune/Step Time": 6.777953457087278} {"Full-finetune/Learning Rate": 1.5174222953646344e-07, "Full-finetune/Loss": 0.7540040016174316, "Full-finetune/Loss (Raw)": 0.7912707328796387, "Full-finetune/Step": 4918, "Full-finetune/Step Time": 6.762231824919581} {"Full-finetune/Learning Rate": 1.5066301700705334e-07, "Full-finetune/Loss": 0.7576549649238586, "Full-finetune/Loss (Raw)": 0.76408451795578, "Full-finetune/Step": 4919, "Full-finetune/Step Time": 6.744356734678149} {"Full-finetune/Learning Rate": 1.4958762681303362e-07, "Full-finetune/Loss": 0.7569600343704224, "Full-finetune/Loss (Raw)": 0.8752679228782654, "Full-finetune/Step": 4920, "Full-finetune/Step Time": 6.728848960250616} {"Full-finetune/Learning Rate": 1.4851605937174384e-07, "Full-finetune/Loss": 0.7563483715057373, "Full-finetune/Loss (Raw)": 0.7514790296554565, "Full-finetune/Step": 4921, "Full-finetune/Step Time": 6.741242341697216} {"Full-finetune/Learning Rate": 1.474483150990369e-07, "Full-finetune/Loss": 0.7562217712402344, "Full-finetune/Loss (Raw)": 0.6714690327644348, "Full-finetune/Step": 4922, "Full-finetune/Step Time": 6.742021504789591} {"Full-finetune/Learning Rate": 1.4638439440928354e-07, "Full-finetune/Loss": 0.7565637826919556, "Full-finetune/Loss (Raw)": 0.7338429093360901, "Full-finetune/Step": 4923, "Full-finetune/Step Time": 6.716182628646493} {"Full-finetune/Learning Rate": 1.4532429771537237e-07, "Full-finetune/Loss": 0.7556283473968506, "Full-finetune/Loss (Raw)": 0.7278984189033508, "Full-finetune/Step": 4924, "Full-finetune/Step Time": 6.717261224985123} {"Full-finetune/Learning Rate": 1.4426802542870433e-07, "Full-finetune/Loss": 0.7550320625305176, "Full-finetune/Loss (Raw)": 0.7263655066490173, "Full-finetune/Step": 4925, "Full-finetune/Step Time": 6.71708713658154} {"Full-finetune/Learning Rate": 1.4321557795919705e-07, "Full-finetune/Loss": 0.7559638023376465, "Full-finetune/Loss (Raw)": 0.7259857654571533, "Full-finetune/Step": 4926, "Full-finetune/Step Time": 6.6903002597391605} {"Full-finetune/Learning Rate": 1.4216695571528828e-07, "Full-finetune/Loss": 0.7553501129150391, "Full-finetune/Loss (Raw)": 0.7597711682319641, "Full-finetune/Step": 4927, "Full-finetune/Step Time": 6.687937889248133} {"Full-finetune/Learning Rate": 1.411221591039269e-07, "Full-finetune/Loss": 0.752280592918396, "Full-finetune/Loss (Raw)": 0.5546421408653259, "Full-finetune/Step": 4928, "Full-finetune/Step Time": 6.710455557331443} {"Full-finetune/Learning Rate": 1.4008118853057529e-07, "Full-finetune/Loss": 0.7512408494949341, "Full-finetune/Loss (Raw)": 0.72441166639328, "Full-finetune/Step": 4929, "Full-finetune/Step Time": 6.71517744101584} {"Full-finetune/Learning Rate": 1.3904404439921582e-07, "Full-finetune/Loss": 0.7511756420135498, "Full-finetune/Loss (Raw)": 0.7819042205810547, "Full-finetune/Step": 4930, "Full-finetune/Step Time": 6.7137580290436745} {"Full-finetune/Learning Rate": 1.3801072711234541e-07, "Full-finetune/Loss": 0.7510469555854797, "Full-finetune/Loss (Raw)": 0.8350872993469238, "Full-finetune/Step": 4931, "Full-finetune/Step Time": 6.711426878347993} {"Full-finetune/Learning Rate": 1.369812370709711e-07, "Full-finetune/Loss": 0.7512484788894653, "Full-finetune/Loss (Raw)": 0.8391917943954468, "Full-finetune/Step": 4932, "Full-finetune/Step Time": 6.709041370078921} {"Full-finetune/Learning Rate": 1.3595557467461994e-07, "Full-finetune/Loss": 0.7500693798065186, "Full-finetune/Loss (Raw)": 0.7014986872673035, "Full-finetune/Step": 4933, "Full-finetune/Step Time": 6.719671478495002} {"Full-finetune/Learning Rate": 1.3493374032133134e-07, "Full-finetune/Loss": 0.7505080699920654, "Full-finetune/Loss (Raw)": 0.8379148244857788, "Full-finetune/Step": 4934, "Full-finetune/Step Time": 6.715055523440242} {"Full-finetune/Learning Rate": 1.3391573440765915e-07, "Full-finetune/Loss": 0.7511316537857056, "Full-finetune/Loss (Raw)": 0.8449311852455139, "Full-finetune/Step": 4935, "Full-finetune/Step Time": 6.713435091078281} {"Full-finetune/Learning Rate": 1.329015573286696e-07, "Full-finetune/Loss": 0.7493711113929749, "Full-finetune/Loss (Raw)": 0.6868957281112671, "Full-finetune/Step": 4936, "Full-finetune/Step Time": 6.724463101476431} {"Full-finetune/Learning Rate": 1.3189120947794897e-07, "Full-finetune/Loss": 0.7520343065261841, "Full-finetune/Loss (Raw)": 0.9044891595840454, "Full-finetune/Step": 4937, "Full-finetune/Step Time": 6.716877831146121} {"Full-finetune/Learning Rate": 1.308846912475914e-07, "Full-finetune/Loss": 0.7524970769882202, "Full-finetune/Loss (Raw)": 0.7984626889228821, "Full-finetune/Step": 4938, "Full-finetune/Step Time": 6.728031480684876} {"Full-finetune/Learning Rate": 1.2988200302820552e-07, "Full-finetune/Loss": 0.7489726543426514, "Full-finetune/Loss (Raw)": 0.3342161178588867, "Full-finetune/Step": 4939, "Full-finetune/Step Time": 6.724811192601919} {"Full-finetune/Learning Rate": 1.2888314520891676e-07, "Full-finetune/Loss": 0.7476376295089722, "Full-finetune/Loss (Raw)": 0.6168113350868225, "Full-finetune/Step": 4940, "Full-finetune/Step Time": 6.724358292296529} {"Full-finetune/Learning Rate": 1.2788811817736168e-07, "Full-finetune/Loss": 0.7491714954376221, "Full-finetune/Loss (Raw)": 0.6647359132766724, "Full-finetune/Step": 4941, "Full-finetune/Step Time": 6.705834520980716} {"Full-finetune/Learning Rate": 1.2689692231969364e-07, "Full-finetune/Loss": 0.7483052611351013, "Full-finetune/Loss (Raw)": 0.7024832963943481, "Full-finetune/Step": 4942, "Full-finetune/Step Time": 6.712384227663279} {"Full-finetune/Learning Rate": 1.2590955802057047e-07, "Full-finetune/Loss": 0.7467524409294128, "Full-finetune/Loss (Raw)": 0.6844963431358337, "Full-finetune/Step": 4943, "Full-finetune/Step Time": 6.723622815683484} {"Full-finetune/Learning Rate": 1.2492602566317457e-07, "Full-finetune/Loss": 0.747753918170929, "Full-finetune/Loss (Raw)": 0.801694393157959, "Full-finetune/Step": 4944, "Full-finetune/Step Time": 6.7094864416867495} {"Full-finetune/Learning Rate": 1.2394632562919283e-07, "Full-finetune/Loss": 0.7481650114059448, "Full-finetune/Loss (Raw)": 0.877911388874054, "Full-finetune/Step": 4945, "Full-finetune/Step Time": 6.708658758550882} {"Full-finetune/Learning Rate": 1.2297045829882892e-07, "Full-finetune/Loss": 0.7472089529037476, "Full-finetune/Loss (Raw)": 0.7157700061798096, "Full-finetune/Step": 4946, "Full-finetune/Step Time": 6.7086243238300085} {"Full-finetune/Learning Rate": 1.2199842405079766e-07, "Full-finetune/Loss": 0.746367871761322, "Full-finetune/Loss (Raw)": 0.7638523578643799, "Full-finetune/Step": 4947, "Full-finetune/Step Time": 6.721205050125718} {"Full-finetune/Learning Rate": 1.2103022326232505e-07, "Full-finetune/Loss": 0.7454241514205933, "Full-finetune/Loss (Raw)": 0.7399057149887085, "Full-finetune/Step": 4948, "Full-finetune/Step Time": 6.7177002392709255} {"Full-finetune/Learning Rate": 1.2006585630915391e-07, "Full-finetune/Loss": 0.7440955638885498, "Full-finetune/Loss (Raw)": 0.7119189500808716, "Full-finetune/Step": 4949, "Full-finetune/Step Time": 6.716036152094603} {"Full-finetune/Learning Rate": 1.1910532356553261e-07, "Full-finetune/Loss": 0.7427933812141418, "Full-finetune/Loss (Raw)": 0.6594401597976685, "Full-finetune/Step": 4950, "Full-finetune/Step Time": 6.722150221467018} {"Full-finetune/Learning Rate": 1.1814862540422744e-07, "Full-finetune/Loss": 0.7426130771636963, "Full-finetune/Loss (Raw)": 0.8361479640007019, "Full-finetune/Step": 4951, "Full-finetune/Step Time": 6.721023702993989} {"Full-finetune/Learning Rate": 1.1719576219651585e-07, "Full-finetune/Loss": 0.7466167211532593, "Full-finetune/Loss (Raw)": 0.7950278520584106, "Full-finetune/Step": 4952, "Full-finetune/Step Time": 6.711597329005599} {"Full-finetune/Learning Rate": 1.1624673431218092e-07, "Full-finetune/Loss": 0.7461539506912231, "Full-finetune/Loss (Raw)": 0.6811072826385498, "Full-finetune/Step": 4953, "Full-finetune/Step Time": 6.712213976308703} {"Full-finetune/Learning Rate": 1.1530154211952583e-07, "Full-finetune/Loss": 0.7463406324386597, "Full-finetune/Loss (Raw)": 0.7915580868721008, "Full-finetune/Step": 4954, "Full-finetune/Step Time": 6.746095294132829} {"Full-finetune/Learning Rate": 1.1436018598535937e-07, "Full-finetune/Loss": 0.7457070350646973, "Full-finetune/Loss (Raw)": 0.7884978652000427, "Full-finetune/Step": 4955, "Full-finetune/Step Time": 6.748222693800926} {"Full-finetune/Learning Rate": 1.1342266627500375e-07, "Full-finetune/Loss": 0.7453551292419434, "Full-finetune/Loss (Raw)": 0.8168224692344666, "Full-finetune/Step": 4956, "Full-finetune/Step Time": 6.735490804538131} {"Full-finetune/Learning Rate": 1.1248898335229241e-07, "Full-finetune/Loss": 0.7458738088607788, "Full-finetune/Loss (Raw)": 0.838671863079071, "Full-finetune/Step": 4957, "Full-finetune/Step Time": 6.725084446370602} {"Full-finetune/Learning Rate": 1.1155913757956881e-07, "Full-finetune/Loss": 0.745406985282898, "Full-finetune/Loss (Raw)": 0.6771080493927002, "Full-finetune/Step": 4958, "Full-finetune/Step Time": 6.741791725158691} {"Full-finetune/Learning Rate": 1.1063312931768877e-07, "Full-finetune/Loss": 0.7460839748382568, "Full-finetune/Loss (Raw)": 0.4340917468070984, "Full-finetune/Step": 4959, "Full-finetune/Step Time": 6.742022702470422} {"Full-finetune/Learning Rate": 1.0971095892601702e-07, "Full-finetune/Loss": 0.7467027902603149, "Full-finetune/Loss (Raw)": 0.73907870054245, "Full-finetune/Step": 4960, "Full-finetune/Step Time": 6.715251915156841} {"Full-finetune/Learning Rate": 1.0879262676243174e-07, "Full-finetune/Loss": 0.7464319467544556, "Full-finetune/Loss (Raw)": 0.7398677468299866, "Full-finetune/Step": 4961, "Full-finetune/Step Time": 6.703155178576708} {"Full-finetune/Learning Rate": 1.0787813318331786e-07, "Full-finetune/Loss": 0.7456477284431458, "Full-finetune/Loss (Raw)": 0.8087140321731567, "Full-finetune/Step": 4962, "Full-finetune/Step Time": 6.701940657570958} {"Full-finetune/Learning Rate": 1.0696747854357259e-07, "Full-finetune/Loss": 0.744916558265686, "Full-finetune/Loss (Raw)": 0.7497246265411377, "Full-finetune/Step": 4963, "Full-finetune/Step Time": 6.7167229894548655} {"Full-finetune/Learning Rate": 1.0606066319660435e-07, "Full-finetune/Loss": 0.7446982860565186, "Full-finetune/Loss (Raw)": 0.8642090559005737, "Full-finetune/Step": 4964, "Full-finetune/Step Time": 6.729923602193594} {"Full-finetune/Learning Rate": 1.0515768749432942e-07, "Full-finetune/Loss": 0.7457126975059509, "Full-finetune/Loss (Raw)": 0.9016970992088318, "Full-finetune/Step": 4965, "Full-finetune/Step Time": 6.731133811175823} {"Full-finetune/Learning Rate": 1.0425855178717636e-07, "Full-finetune/Loss": 0.7446610927581787, "Full-finetune/Loss (Raw)": 0.7331441044807434, "Full-finetune/Step": 4966, "Full-finetune/Step Time": 6.734434613958001} {"Full-finetune/Learning Rate": 1.0336325642408052e-07, "Full-finetune/Loss": 0.7460737228393555, "Full-finetune/Loss (Raw)": 0.8642110228538513, "Full-finetune/Step": 4967, "Full-finetune/Step Time": 6.732496494427323} {"Full-finetune/Learning Rate": 1.024718017524895e-07, "Full-finetune/Loss": 0.7460969686508179, "Full-finetune/Loss (Raw)": 0.7760077714920044, "Full-finetune/Step": 4968, "Full-finetune/Step Time": 6.7283488642424345} {"Full-finetune/Learning Rate": 1.015841881183588e-07, "Full-finetune/Loss": 0.7461939454078674, "Full-finetune/Loss (Raw)": 0.7275724411010742, "Full-finetune/Step": 4969, "Full-finetune/Step Time": 6.742104293778539} {"Full-finetune/Learning Rate": 1.0070041586615398e-07, "Full-finetune/Loss": 0.7473785877227783, "Full-finetune/Loss (Raw)": 0.795511782169342, "Full-finetune/Step": 4970, "Full-finetune/Step Time": 6.7238418739289045} {"Full-finetune/Learning Rate": 9.98204853388518e-08, "Full-finetune/Loss": 0.7470718622207642, "Full-finetune/Loss (Raw)": 0.9004843235015869, "Full-finetune/Step": 4971, "Full-finetune/Step Time": 6.734323559328914} {"Full-finetune/Learning Rate": 9.894439687793466e-08, "Full-finetune/Loss": 0.7477248311042786, "Full-finetune/Loss (Raw)": 0.7566120028495789, "Full-finetune/Step": 4972, "Full-finetune/Step Time": 6.727765487506986} {"Full-finetune/Learning Rate": 9.807215082339395e-08, "Full-finetune/Loss": 0.7481393814086914, "Full-finetune/Loss (Raw)": 0.9306540489196777, "Full-finetune/Step": 4973, "Full-finetune/Step Time": 6.728251708671451} {"Full-finetune/Learning Rate": 9.720374751373329e-08, "Full-finetune/Loss": 0.7442730665206909, "Full-finetune/Loss (Raw)": 0.29940274357795715, "Full-finetune/Step": 4974, "Full-finetune/Step Time": 6.719620933756232} {"Full-finetune/Learning Rate": 9.633918728596203e-08, "Full-finetune/Loss": 0.7471771240234375, "Full-finetune/Loss (Raw)": 0.6877297163009644, "Full-finetune/Step": 4975, "Full-finetune/Step Time": 6.714256474748254} {"Full-finetune/Learning Rate": 9.547847047559955e-08, "Full-finetune/Loss": 0.7490055561065674, "Full-finetune/Loss (Raw)": 0.9015896320343018, "Full-finetune/Step": 4976, "Full-finetune/Step Time": 6.717443305999041} {"Full-finetune/Learning Rate": 9.462159741667309e-08, "Full-finetune/Loss": 0.7490378618240356, "Full-finetune/Loss (Raw)": 0.6782236099243164, "Full-finetune/Step": 4977, "Full-finetune/Step Time": 6.716205939650536} {"Full-finetune/Learning Rate": 9.376856844171889e-08, "Full-finetune/Loss": 0.7479556798934937, "Full-finetune/Loss (Raw)": 0.7286685109138489, "Full-finetune/Step": 4978, "Full-finetune/Step Time": 6.706454396247864} {"Full-finetune/Learning Rate": 9.291938388178102e-08, "Full-finetune/Loss": 0.7463706135749817, "Full-finetune/Loss (Raw)": 0.6578772664070129, "Full-finetune/Step": 4979, "Full-finetune/Step Time": 6.6975378673523664} {"Full-finetune/Learning Rate": 9.207404406640919e-08, "Full-finetune/Loss": 0.7462588548660278, "Full-finetune/Loss (Raw)": 0.6542373895645142, "Full-finetune/Step": 4980, "Full-finetune/Step Time": 6.691260777413845} {"Full-finetune/Learning Rate": 9.123254932366655e-08, "Full-finetune/Loss": 0.7453840970993042, "Full-finetune/Loss (Raw)": 0.712448239326477, "Full-finetune/Step": 4981, "Full-finetune/Step Time": 6.682760506868362} {"Full-finetune/Learning Rate": 9.039489998011853e-08, "Full-finetune/Loss": 0.7480830550193787, "Full-finetune/Loss (Raw)": 0.8678191900253296, "Full-finetune/Step": 4982, "Full-finetune/Step Time": 6.667715756222606} {"Full-finetune/Learning Rate": 8.956109636084065e-08, "Full-finetune/Loss": 0.7451508045196533, "Full-finetune/Loss (Raw)": 0.40877610445022583, "Full-finetune/Step": 4983, "Full-finetune/Step Time": 6.674663262441754} {"Full-finetune/Learning Rate": 8.873113878941631e-08, "Full-finetune/Loss": 0.7437900900840759, "Full-finetune/Loss (Raw)": 0.6325826048851013, "Full-finetune/Step": 4984, "Full-finetune/Step Time": 6.675828415900469} {"Full-finetune/Learning Rate": 8.790502758793562e-08, "Full-finetune/Loss": 0.743780255317688, "Full-finetune/Loss (Raw)": 0.8785461783409119, "Full-finetune/Step": 4985, "Full-finetune/Step Time": 6.673106862232089} {"Full-finetune/Learning Rate": 8.70827630769977e-08, "Full-finetune/Loss": 0.7410068511962891, "Full-finetune/Loss (Raw)": 0.6004933714866638, "Full-finetune/Step": 4986, "Full-finetune/Step Time": 6.665673602372408} {"Full-finetune/Learning Rate": 8.626434557570507e-08, "Full-finetune/Loss": 0.7411675453186035, "Full-finetune/Loss (Raw)": 0.8050734996795654, "Full-finetune/Step": 4987, "Full-finetune/Step Time": 6.673499984666705} {"Full-finetune/Learning Rate": 8.544977540167032e-08, "Full-finetune/Loss": 0.7422068119049072, "Full-finetune/Loss (Raw)": 0.8430150151252747, "Full-finetune/Step": 4988, "Full-finetune/Step Time": 6.682331867516041} {"Full-finetune/Learning Rate": 8.463905287101282e-08, "Full-finetune/Loss": 0.7428835034370422, "Full-finetune/Loss (Raw)": 0.8092020153999329, "Full-finetune/Step": 4989, "Full-finetune/Step Time": 6.6742589846253395} {"Full-finetune/Learning Rate": 8.383217829835755e-08, "Full-finetune/Loss": 0.7417514324188232, "Full-finetune/Loss (Raw)": 0.7736542820930481, "Full-finetune/Step": 4990, "Full-finetune/Step Time": 6.677490316331387} {"Full-finetune/Learning Rate": 8.302915199683737e-08, "Full-finetune/Loss": 0.7404432892799377, "Full-finetune/Loss (Raw)": 0.7599861025810242, "Full-finetune/Step": 4991, "Full-finetune/Step Time": 6.671505084261298} {"Full-finetune/Learning Rate": 8.222997427809076e-08, "Full-finetune/Loss": 0.7417190074920654, "Full-finetune/Loss (Raw)": 0.9120928049087524, "Full-finetune/Step": 4992, "Full-finetune/Step Time": 6.673765299841762} {"Full-finetune/Learning Rate": 8.143464545226298e-08, "Full-finetune/Loss": 0.7391695976257324, "Full-finetune/Loss (Raw)": 0.5034482479095459, "Full-finetune/Step": 4993, "Full-finetune/Step Time": 6.688648249953985} {"Full-finetune/Learning Rate": 8.064316582800491e-08, "Full-finetune/Loss": 0.7396010160446167, "Full-finetune/Loss (Raw)": 0.7839715480804443, "Full-finetune/Step": 4994, "Full-finetune/Step Time": 6.697190713137388} {"Full-finetune/Learning Rate": 7.98555357124764e-08, "Full-finetune/Loss": 0.7413493990898132, "Full-finetune/Loss (Raw)": 0.5670524835586548, "Full-finetune/Step": 4995, "Full-finetune/Step Time": 6.681676948443055} {"Full-finetune/Learning Rate": 7.907175541133849e-08, "Full-finetune/Loss": 0.7429265975952148, "Full-finetune/Loss (Raw)": 0.8972367644309998, "Full-finetune/Step": 4996, "Full-finetune/Step Time": 6.684014018625021} {"Full-finetune/Learning Rate": 7.829182522876344e-08, "Full-finetune/Loss": 0.7445451021194458, "Full-finetune/Loss (Raw)": 0.8409116268157959, "Full-finetune/Step": 4997, "Full-finetune/Step Time": 6.670129166916013} {"Full-finetune/Learning Rate": 7.75157454674258e-08, "Full-finetune/Loss": 0.7470475435256958, "Full-finetune/Loss (Raw)": 1.0195757150650024, "Full-finetune/Step": 4998, "Full-finetune/Step Time": 6.668406521901488} {"Full-finetune/Learning Rate": 7.674351642850797e-08, "Full-finetune/Loss": 0.7477049231529236, "Full-finetune/Loss (Raw)": 0.8788828253746033, "Full-finetune/Step": 4999, "Full-finetune/Step Time": 6.660221643745899} {"Full-finetune/Learning Rate": 7.597513841169469e-08, "Full-finetune/Loss": 0.7442892789840698, "Full-finetune/Loss (Raw)": 0.3471203148365021, "Full-finetune/Step": 5000, "Full-finetune/Step Time": 6.680446140468121} {"Full-finetune/Learning Rate": 7.521061171518184e-08, "Full-finetune/Loss": 0.7452328205108643, "Full-finetune/Loss (Raw)": 0.8018749952316284, "Full-finetune/Step": 5001, "Full-finetune/Step Time": 6.663623755797744} {"Full-finetune/Learning Rate": 7.444993663566325e-08, "Full-finetune/Loss": 0.7449285984039307, "Full-finetune/Loss (Raw)": 0.5236794948577881, "Full-finetune/Step": 5002, "Full-finetune/Step Time": 6.666123306378722} {"Full-finetune/Learning Rate": 7.369311346834496e-08, "Full-finetune/Loss": 0.7446703910827637, "Full-finetune/Loss (Raw)": 0.6975465416908264, "Full-finetune/Step": 5003, "Full-finetune/Step Time": 6.653949528932571} {"Full-finetune/Learning Rate": 7.294014250693538e-08, "Full-finetune/Loss": 0.7425051927566528, "Full-finetune/Loss (Raw)": 0.606061577796936, "Full-finetune/Step": 5004, "Full-finetune/Step Time": 6.669024121016264} {"Full-finetune/Learning Rate": 7.21910240436463e-08, "Full-finetune/Loss": 0.7416462302207947, "Full-finetune/Loss (Raw)": 0.7660486698150635, "Full-finetune/Step": 5005, "Full-finetune/Step Time": 6.681480819359422} {"Full-finetune/Learning Rate": 7.144575836919632e-08, "Full-finetune/Loss": 0.7421646118164062, "Full-finetune/Loss (Raw)": 0.7839544415473938, "Full-finetune/Step": 5006, "Full-finetune/Step Time": 6.673843640834093} {"Full-finetune/Learning Rate": 7.07043457728096e-08, "Full-finetune/Loss": 0.7399085760116577, "Full-finetune/Loss (Raw)": 0.554052472114563, "Full-finetune/Step": 5007, "Full-finetune/Step Time": 6.68416784517467} {"Full-finetune/Learning Rate": 6.996678654221267e-08, "Full-finetune/Loss": 0.738493800163269, "Full-finetune/Loss (Raw)": 0.6918466091156006, "Full-finetune/Step": 5008, "Full-finetune/Step Time": 6.691992059350014} {"Full-finetune/Learning Rate": 6.923308096363879e-08, "Full-finetune/Loss": 0.7381359338760376, "Full-finetune/Loss (Raw)": 0.9229032397270203, "Full-finetune/Step": 5009, "Full-finetune/Step Time": 6.694146707653999} {"Full-finetune/Learning Rate": 6.850322932182352e-08, "Full-finetune/Loss": 0.7390439510345459, "Full-finetune/Loss (Raw)": 0.789214551448822, "Full-finetune/Step": 5010, "Full-finetune/Step Time": 6.685662316158414} {"Full-finetune/Learning Rate": 6.777723190000918e-08, "Full-finetune/Loss": 0.7396836876869202, "Full-finetune/Loss (Raw)": 0.7531896829605103, "Full-finetune/Step": 5011, "Full-finetune/Step Time": 6.686358939856291} {"Full-finetune/Learning Rate": 6.705508897994151e-08, "Full-finetune/Loss": 0.7389611005783081, "Full-finetune/Loss (Raw)": 0.764943540096283, "Full-finetune/Step": 5012, "Full-finetune/Step Time": 6.684538060799241} {"Full-finetune/Learning Rate": 6.633680084186856e-08, "Full-finetune/Loss": 0.7382732629776001, "Full-finetune/Loss (Raw)": 0.644622266292572, "Full-finetune/Step": 5013, "Full-finetune/Step Time": 6.683539701625705} {"Full-finetune/Learning Rate": 6.562236776454512e-08, "Full-finetune/Loss": 0.7371089458465576, "Full-finetune/Loss (Raw)": 0.7099965214729309, "Full-finetune/Step": 5014, "Full-finetune/Step Time": 6.674531241878867} {"Full-finetune/Learning Rate": 6.491179002522829e-08, "Full-finetune/Loss": 0.7360670566558838, "Full-finetune/Loss (Raw)": 0.6911804676055908, "Full-finetune/Step": 5015, "Full-finetune/Step Time": 6.653985120356083} {"Full-finetune/Learning Rate": 6.420506789967973e-08, "Full-finetune/Loss": 0.7353780269622803, "Full-finetune/Loss (Raw)": 0.728862464427948, "Full-finetune/Step": 5016, "Full-finetune/Step Time": 6.669511314481497} {"Full-finetune/Learning Rate": 6.350220166216337e-08, "Full-finetune/Loss": 0.7342888712882996, "Full-finetune/Loss (Raw)": 0.6487162113189697, "Full-finetune/Step": 5017, "Full-finetune/Step Time": 6.669121935963631} {"Full-finetune/Learning Rate": 6.280319158544989e-08, "Full-finetune/Loss": 0.7340911626815796, "Full-finetune/Loss (Raw)": 0.6637132167816162, "Full-finetune/Step": 5018, "Full-finetune/Step Time": 6.667986279353499} {"Full-finetune/Learning Rate": 6.21080379408101e-08, "Full-finetune/Loss": 0.7341462969779968, "Full-finetune/Loss (Raw)": 0.7280507683753967, "Full-finetune/Step": 5019, "Full-finetune/Step Time": 6.666790101677179} {"Full-finetune/Learning Rate": 6.14167409980193e-08, "Full-finetune/Loss": 0.7307947278022766, "Full-finetune/Loss (Raw)": 0.34151893854141235, "Full-finetune/Step": 5020, "Full-finetune/Step Time": 6.693854887038469} {"Full-finetune/Learning Rate": 6.072930102535734e-08, "Full-finetune/Loss": 0.7305011749267578, "Full-finetune/Loss (Raw)": 0.8442952632904053, "Full-finetune/Step": 5021, "Full-finetune/Step Time": 6.6924764867872} {"Full-finetune/Learning Rate": 6.004571828960525e-08, "Full-finetune/Loss": 0.7311097383499146, "Full-finetune/Loss (Raw)": 0.8026283979415894, "Full-finetune/Step": 5022, "Full-finetune/Step Time": 6.675047254189849} {"Full-finetune/Learning Rate": 5.936599305604862e-08, "Full-finetune/Loss": 0.7318556308746338, "Full-finetune/Loss (Raw)": 0.7490770816802979, "Full-finetune/Step": 5023, "Full-finetune/Step Time": 6.681538473814726} {"Full-finetune/Learning Rate": 5.869012558847642e-08, "Full-finetune/Loss": 0.7310509085655212, "Full-finetune/Loss (Raw)": 0.7489956021308899, "Full-finetune/Step": 5024, "Full-finetune/Step Time": 6.685239622369409} {"Full-finetune/Learning Rate": 5.801811614917885e-08, "Full-finetune/Loss": 0.7320502400398254, "Full-finetune/Loss (Raw)": 0.7468039393424988, "Full-finetune/Step": 5025, "Full-finetune/Step Time": 6.689978007227182} {"Full-finetune/Learning Rate": 5.73499649989484e-08, "Full-finetune/Loss": 0.7332922220230103, "Full-finetune/Loss (Raw)": 0.8333154320716858, "Full-finetune/Step": 5026, "Full-finetune/Step Time": 6.681659637019038} {"Full-finetune/Learning Rate": 5.6685672397083226e-08, "Full-finetune/Loss": 0.733073353767395, "Full-finetune/Loss (Raw)": 0.8336719870567322, "Full-finetune/Step": 5027, "Full-finetune/Step Time": 6.695282567292452} {"Full-finetune/Learning Rate": 5.602523860138154e-08, "Full-finetune/Loss": 0.7339355945587158, "Full-finetune/Loss (Raw)": 0.8957347869873047, "Full-finetune/Step": 5028, "Full-finetune/Step Time": 6.697233967483044} {"Full-finetune/Learning Rate": 5.536866386814499e-08, "Full-finetune/Loss": 0.7345303297042847, "Full-finetune/Loss (Raw)": 0.8194629549980164, "Full-finetune/Step": 5029, "Full-finetune/Step Time": 6.698747675865889} {"Full-finetune/Learning Rate": 5.471594845217865e-08, "Full-finetune/Loss": 0.7345283031463623, "Full-finetune/Loss (Raw)": 0.7512106895446777, "Full-finetune/Step": 5030, "Full-finetune/Step Time": 6.70188475959003} {"Full-finetune/Learning Rate": 5.4067092606785445e-08, "Full-finetune/Loss": 0.734825611114502, "Full-finetune/Loss (Raw)": 0.7527204751968384, "Full-finetune/Step": 5031, "Full-finetune/Step Time": 6.693902490660548} {"Full-finetune/Learning Rate": 5.342209658377728e-08, "Full-finetune/Loss": 0.7351803779602051, "Full-finetune/Loss (Raw)": 0.8254937529563904, "Full-finetune/Step": 5032, "Full-finetune/Step Time": 6.68132458627224} {"Full-finetune/Learning Rate": 5.278096063346172e-08, "Full-finetune/Loss": 0.7350736856460571, "Full-finetune/Loss (Raw)": 0.7768686413764954, "Full-finetune/Step": 5033, "Full-finetune/Step Time": 6.681265350431204} {"Full-finetune/Learning Rate": 5.214368500465305e-08, "Full-finetune/Loss": 0.7357462048530579, "Full-finetune/Loss (Raw)": 0.8030890822410583, "Full-finetune/Step": 5034, "Full-finetune/Step Time": 6.687770836055279} {"Full-finetune/Learning Rate": 5.151026994466457e-08, "Full-finetune/Loss": 0.7366466522216797, "Full-finetune/Loss (Raw)": 0.7112060189247131, "Full-finetune/Step": 5035, "Full-finetune/Step Time": 6.685844596475363} {"Full-finetune/Learning Rate": 5.088071569931185e-08, "Full-finetune/Loss": 0.7365186810493469, "Full-finetune/Loss (Raw)": 0.7441540956497192, "Full-finetune/Step": 5036, "Full-finetune/Step Time": 6.666193462908268} {"Full-finetune/Learning Rate": 5.025502251291392e-08, "Full-finetune/Loss": 0.7376677393913269, "Full-finetune/Loss (Raw)": 0.9108405113220215, "Full-finetune/Step": 5037, "Full-finetune/Step Time": 6.6617179568856955} {"Full-finetune/Learning Rate": 4.963319062828875e-08, "Full-finetune/Loss": 0.7382471561431885, "Full-finetune/Loss (Raw)": 0.8912468552589417, "Full-finetune/Step": 5038, "Full-finetune/Step Time": 6.670756779611111} {"Full-finetune/Learning Rate": 4.901522028675776e-08, "Full-finetune/Loss": 0.7397810220718384, "Full-finetune/Loss (Raw)": 0.9587014317512512, "Full-finetune/Step": 5039, "Full-finetune/Step Time": 6.675886608660221} {"Full-finetune/Learning Rate": 4.8401111728143545e-08, "Full-finetune/Loss": 0.7381961345672607, "Full-finetune/Loss (Raw)": 0.553966760635376, "Full-finetune/Step": 5040, "Full-finetune/Step Time": 6.679846720770001} {"Full-finetune/Learning Rate": 4.779086519076992e-08, "Full-finetune/Loss": 0.7391319274902344, "Full-finetune/Loss (Raw)": 0.9196411967277527, "Full-finetune/Step": 5041, "Full-finetune/Step Time": 6.668424105271697} {"Full-finetune/Learning Rate": 4.7184480911459665e-08, "Full-finetune/Loss": 0.7428895235061646, "Full-finetune/Loss (Raw)": 0.8815813660621643, "Full-finetune/Step": 5042, "Full-finetune/Step Time": 6.6639304887503386} {"Full-finetune/Learning Rate": 4.65819591255412e-08, "Full-finetune/Loss": 0.7440866231918335, "Full-finetune/Loss (Raw)": 0.8086346387863159, "Full-finetune/Step": 5043, "Full-finetune/Step Time": 6.655896930024028} {"Full-finetune/Learning Rate": 4.5983300066839706e-08, "Full-finetune/Loss": 0.7443594932556152, "Full-finetune/Loss (Raw)": 0.7916427850723267, "Full-finetune/Step": 5044, "Full-finetune/Step Time": 6.65960050560534} {"Full-finetune/Learning Rate": 4.538850396768379e-08, "Full-finetune/Loss": 0.7434254884719849, "Full-finetune/Loss (Raw)": 0.285258948802948, "Full-finetune/Step": 5045, "Full-finetune/Step Time": 6.658623928204179} {"Full-finetune/Learning Rate": 4.479757105890104e-08, "Full-finetune/Loss": 0.7397827506065369, "Full-finetune/Loss (Raw)": 0.3250063955783844, "Full-finetune/Step": 5046, "Full-finetune/Step Time": 6.677223660051823} {"Full-finetune/Learning Rate": 4.4210501569823536e-08, "Full-finetune/Loss": 0.7399406433105469, "Full-finetune/Loss (Raw)": 0.7842879295349121, "Full-finetune/Step": 5047, "Full-finetune/Step Time": 6.677757179364562} {"Full-finetune/Learning Rate": 4.362729572827906e-08, "Full-finetune/Loss": 0.7401432394981384, "Full-finetune/Loss (Raw)": 0.9012060165405273, "Full-finetune/Step": 5048, "Full-finetune/Step Time": 6.6689623557031155} {"Full-finetune/Learning Rate": 4.304795376059989e-08, "Full-finetune/Loss": 0.7399005889892578, "Full-finetune/Loss (Raw)": 0.7204148769378662, "Full-finetune/Step": 5049, "Full-finetune/Step Time": 6.662076788023114} {"Full-finetune/Learning Rate": 4.2472475891617295e-08, "Full-finetune/Loss": 0.7402916550636292, "Full-finetune/Loss (Raw)": 0.7215322852134705, "Full-finetune/Step": 5050, "Full-finetune/Step Time": 6.67365163192153} {"Full-finetune/Learning Rate": 4.1900862344661506e-08, "Full-finetune/Loss": 0.7393971681594849, "Full-finetune/Loss (Raw)": 0.6193442940711975, "Full-finetune/Step": 5051, "Full-finetune/Step Time": 6.689044140279293} {"Full-finetune/Learning Rate": 4.133311334156509e-08, "Full-finetune/Loss": 0.7365677356719971, "Full-finetune/Loss (Raw)": 0.3657340705394745, "Full-finetune/Step": 5052, "Full-finetune/Step Time": 6.702251480892301} {"Full-finetune/Learning Rate": 4.076922910266179e-08, "Full-finetune/Loss": 0.7355458736419678, "Full-finetune/Loss (Raw)": 0.5955653786659241, "Full-finetune/Step": 5053, "Full-finetune/Step Time": 6.710955869406462} {"Full-finetune/Learning Rate": 4.020920984678323e-08, "Full-finetune/Loss": 0.7367439866065979, "Full-finetune/Loss (Raw)": 0.8793460726737976, "Full-finetune/Step": 5054, "Full-finetune/Step Time": 6.71865008212626} {"Full-finetune/Learning Rate": 3.965305579126111e-08, "Full-finetune/Loss": 0.736621618270874, "Full-finetune/Loss (Raw)": 0.7441009879112244, "Full-finetune/Step": 5055, "Full-finetune/Step Time": 6.718352731317282} {"Full-finetune/Learning Rate": 3.9100767151928345e-08, "Full-finetune/Loss": 0.73857581615448, "Full-finetune/Loss (Raw)": 0.8047900199890137, "Full-finetune/Step": 5056, "Full-finetune/Step Time": 6.6937333177775145} {"Full-finetune/Learning Rate": 3.855234414311904e-08, "Full-finetune/Loss": 0.7386459112167358, "Full-finetune/Loss (Raw)": 0.7333805561065674, "Full-finetune/Step": 5057, "Full-finetune/Step Time": 6.697703113779426} {"Full-finetune/Learning Rate": 3.800778697766294e-08, "Full-finetune/Loss": 0.7386330962181091, "Full-finetune/Loss (Raw)": 0.7802590131759644, "Full-finetune/Step": 5058, "Full-finetune/Step Time": 6.702202392742038} {"Full-finetune/Learning Rate": 3.746709586689323e-08, "Full-finetune/Loss": 0.7389587163925171, "Full-finetune/Loss (Raw)": 0.8767722249031067, "Full-finetune/Step": 5059, "Full-finetune/Step Time": 6.699781626462936} {"Full-finetune/Learning Rate": 3.693027102064206e-08, "Full-finetune/Loss": 0.7395205497741699, "Full-finetune/Loss (Raw)": 0.911105751991272, "Full-finetune/Step": 5060, "Full-finetune/Step Time": 6.700847037136555} {"Full-finetune/Learning Rate": 3.639731264724056e-08, "Full-finetune/Loss": 0.7406367063522339, "Full-finetune/Loss (Raw)": 0.8443666696548462, "Full-finetune/Step": 5061, "Full-finetune/Step Time": 6.6833264622837305} {"Full-finetune/Learning Rate": 3.586822095351772e-08, "Full-finetune/Loss": 0.7388893365859985, "Full-finetune/Loss (Raw)": 0.6142504215240479, "Full-finetune/Step": 5062, "Full-finetune/Step Time": 6.6885681208223104} {"Full-finetune/Learning Rate": 3.5342996144805966e-08, "Full-finetune/Loss": 0.7391690015792847, "Full-finetune/Loss (Raw)": 0.8807284235954285, "Full-finetune/Step": 5063, "Full-finetune/Step Time": 6.686427891254425} {"Full-finetune/Learning Rate": 3.482163842493447e-08, "Full-finetune/Loss": 0.7385802268981934, "Full-finetune/Loss (Raw)": 0.6115245819091797, "Full-finetune/Step": 5064, "Full-finetune/Step Time": 6.682267293334007} {"Full-finetune/Learning Rate": 3.4304147996230275e-08, "Full-finetune/Loss": 0.7382628917694092, "Full-finetune/Loss (Raw)": 0.8638787269592285, "Full-finetune/Step": 5065, "Full-finetune/Step Time": 6.690290503203869} {"Full-finetune/Learning Rate": 3.379052505952274e-08, "Full-finetune/Loss": 0.7388091087341309, "Full-finetune/Loss (Raw)": 0.8683804273605347, "Full-finetune/Step": 5066, "Full-finetune/Step Time": 6.682270584627986} {"Full-finetune/Learning Rate": 3.328076981413908e-08, "Full-finetune/Loss": 0.7419570684432983, "Full-finetune/Loss (Raw)": 0.7371507287025452, "Full-finetune/Step": 5067, "Full-finetune/Step Time": 6.677552687004209} {"Full-finetune/Learning Rate": 3.2774882457904386e-08, "Full-finetune/Loss": 0.7433624267578125, "Full-finetune/Loss (Raw)": 0.796700119972229, "Full-finetune/Step": 5068, "Full-finetune/Step Time": 6.681644093245268} {"Full-finetune/Learning Rate": 3.227286318714384e-08, "Full-finetune/Loss": 0.7436535358428955, "Full-finetune/Loss (Raw)": 0.7019951343536377, "Full-finetune/Step": 5069, "Full-finetune/Step Time": 6.683606643229723} {"Full-finetune/Learning Rate": 3.177471219668271e-08, "Full-finetune/Loss": 0.7438310384750366, "Full-finetune/Loss (Raw)": 0.7252084016799927, "Full-finetune/Step": 5070, "Full-finetune/Step Time": 6.6809511967003345} {"Full-finetune/Learning Rate": 3.1280429679841905e-08, "Full-finetune/Loss": 0.7441195249557495, "Full-finetune/Loss (Raw)": 0.7214114665985107, "Full-finetune/Step": 5071, "Full-finetune/Step Time": 6.687873052433133} {"Full-finetune/Learning Rate": 3.079001582844354e-08, "Full-finetune/Loss": 0.7452877759933472, "Full-finetune/Loss (Raw)": 0.9512413144111633, "Full-finetune/Step": 5072, "Full-finetune/Step Time": 6.690780151635408} {"Full-finetune/Learning Rate": 3.0303470832806494e-08, "Full-finetune/Loss": 0.7449194192886353, "Full-finetune/Loss (Raw)": 0.8307603001594543, "Full-finetune/Step": 5073, "Full-finetune/Step Time": 6.694950228556991} {"Full-finetune/Learning Rate": 2.9820794881751934e-08, "Full-finetune/Loss": 0.7461536526679993, "Full-finetune/Loss (Raw)": 0.8737505078315735, "Full-finetune/Step": 5074, "Full-finetune/Step Time": 6.690716879442334} {"Full-finetune/Learning Rate": 2.9341988162595593e-08, "Full-finetune/Loss": 0.7430728673934937, "Full-finetune/Loss (Raw)": 0.3695175349712372, "Full-finetune/Step": 5075, "Full-finetune/Step Time": 6.696271013468504} {"Full-finetune/Learning Rate": 2.886705086115216e-08, "Full-finetune/Loss": 0.743424654006958, "Full-finetune/Loss (Raw)": 0.7849313020706177, "Full-finetune/Step": 5076, "Full-finetune/Step Time": 6.695925194770098} {"Full-finetune/Learning Rate": 2.8395983161736418e-08, "Full-finetune/Loss": 0.7437525987625122, "Full-finetune/Loss (Raw)": 0.7538887858390808, "Full-finetune/Step": 5077, "Full-finetune/Step Time": 6.717359077185392} {"Full-finetune/Learning Rate": 2.7928785247161027e-08, "Full-finetune/Loss": 0.7441045641899109, "Full-finetune/Loss (Raw)": 0.70449298620224, "Full-finetune/Step": 5078, "Full-finetune/Step Time": 6.7010160982608795} {"Full-finetune/Learning Rate": 2.7465457298736508e-08, "Full-finetune/Loss": 0.7444412112236023, "Full-finetune/Loss (Raw)": 0.8792431950569153, "Full-finetune/Step": 5079, "Full-finetune/Step Time": 6.700969897210598} {"Full-finetune/Learning Rate": 2.700599949626903e-08, "Full-finetune/Loss": 0.7447835206985474, "Full-finetune/Loss (Raw)": 0.8388346433639526, "Full-finetune/Step": 5080, "Full-finetune/Step Time": 6.692925591021776} {"Full-finetune/Learning Rate": 2.6550412018067072e-08, "Full-finetune/Loss": 0.7441903352737427, "Full-finetune/Loss (Raw)": 0.6051896214485168, "Full-finetune/Step": 5081, "Full-finetune/Step Time": 6.6890586372464895} {"Full-finetune/Learning Rate": 2.6098695040935874e-08, "Full-finetune/Loss": 0.7406659126281738, "Full-finetune/Loss (Raw)": 0.3404288589954376, "Full-finetune/Step": 5082, "Full-finetune/Step Time": 6.66826993227005} {"Full-finetune/Learning Rate": 2.5650848740177425e-08, "Full-finetune/Loss": 0.7401026487350464, "Full-finetune/Loss (Raw)": 0.7164059281349182, "Full-finetune/Step": 5083, "Full-finetune/Step Time": 6.672542599961162} {"Full-finetune/Learning Rate": 2.5206873289590484e-08, "Full-finetune/Loss": 0.7392013072967529, "Full-finetune/Loss (Raw)": 0.7014429569244385, "Full-finetune/Step": 5084, "Full-finetune/Step Time": 6.692247508093715} {"Full-finetune/Learning Rate": 2.4766768861475e-08, "Full-finetune/Loss": 0.7383942604064941, "Full-finetune/Loss (Raw)": 0.7353725433349609, "Full-finetune/Step": 5085, "Full-finetune/Step Time": 6.694488998502493} {"Full-finetune/Learning Rate": 2.4330535626627684e-08, "Full-finetune/Loss": 0.7401849031448364, "Full-finetune/Loss (Raw)": 0.9063068628311157, "Full-finetune/Step": 5086, "Full-finetune/Step Time": 6.681972146034241} {"Full-finetune/Learning Rate": 2.389817375433978e-08, "Full-finetune/Loss": 0.7427821159362793, "Full-finetune/Loss (Raw)": 0.7665318250656128, "Full-finetune/Step": 5087, "Full-finetune/Step Time": 6.695242764428258} {"Full-finetune/Learning Rate": 2.3469683412403745e-08, "Full-finetune/Loss": 0.7443946599960327, "Full-finetune/Loss (Raw)": 0.9454898834228516, "Full-finetune/Step": 5088, "Full-finetune/Step Time": 6.69447741471231} {"Full-finetune/Learning Rate": 2.304506476710877e-08, "Full-finetune/Loss": 0.7451947331428528, "Full-finetune/Loss (Raw)": 0.8422776460647583, "Full-finetune/Step": 5089, "Full-finetune/Step Time": 6.692772351205349} {"Full-finetune/Learning Rate": 2.262431798323972e-08, "Full-finetune/Loss": 0.7444618940353394, "Full-finetune/Loss (Raw)": 0.7149151563644409, "Full-finetune/Step": 5090, "Full-finetune/Step Time": 6.694963157176971} {"Full-finetune/Learning Rate": 2.2207443224081528e-08, "Full-finetune/Loss": 0.7450328469276428, "Full-finetune/Loss (Raw)": 0.8228022456169128, "Full-finetune/Step": 5091, "Full-finetune/Step Time": 6.7018179800361395} {"Full-finetune/Learning Rate": 2.1794440651414782e-08, "Full-finetune/Loss": 0.7407390475273132, "Full-finetune/Loss (Raw)": 0.3146018981933594, "Full-finetune/Step": 5092, "Full-finetune/Step Time": 6.706524681299925} {"Full-finetune/Learning Rate": 2.1385310425517945e-08, "Full-finetune/Loss": 0.740021824836731, "Full-finetune/Loss (Raw)": 0.8098878860473633, "Full-finetune/Step": 5093, "Full-finetune/Step Time": 6.707475550472736} {"Full-finetune/Learning Rate": 2.0980052705165123e-08, "Full-finetune/Loss": 0.7389092445373535, "Full-finetune/Loss (Raw)": 0.5907312035560608, "Full-finetune/Step": 5094, "Full-finetune/Step Time": 6.7162707801908255} {"Full-finetune/Learning Rate": 2.05786676476305e-08, "Full-finetune/Loss": 0.7365989685058594, "Full-finetune/Loss (Raw)": 0.56850266456604, "Full-finetune/Step": 5095, "Full-finetune/Step Time": 6.722891030833125} {"Full-finetune/Learning Rate": 2.0181155408682816e-08, "Full-finetune/Loss": 0.7358078360557556, "Full-finetune/Loss (Raw)": 0.6747423410415649, "Full-finetune/Step": 5096, "Full-finetune/Step Time": 6.7493813671171665} {"Full-finetune/Learning Rate": 1.978751614258978e-08, "Full-finetune/Loss": 0.7337197065353394, "Full-finetune/Loss (Raw)": 0.4602903425693512, "Full-finetune/Step": 5097, "Full-finetune/Step Time": 6.72886067442596} {"Full-finetune/Learning Rate": 1.9397750002113634e-08, "Full-finetune/Loss": 0.7324931621551514, "Full-finetune/Loss (Raw)": 0.6385142207145691, "Full-finetune/Step": 5098, "Full-finetune/Step Time": 6.730523252859712} {"Full-finetune/Learning Rate": 1.901185713851672e-08, "Full-finetune/Loss": 0.7309383153915405, "Full-finetune/Loss (Raw)": 0.7014693021774292, "Full-finetune/Step": 5099, "Full-finetune/Step Time": 6.718167310580611} {"Full-finetune/Learning Rate": 1.8629837701554797e-08, "Full-finetune/Loss": 0.7301650047302246, "Full-finetune/Loss (Raw)": 0.6576252579689026, "Full-finetune/Step": 5100, "Full-finetune/Step Time": 6.704546075314283} {"Full-finetune/Learning Rate": 1.825169183948372e-08, "Full-finetune/Loss": 0.7284331321716309, "Full-finetune/Loss (Raw)": 0.7089676260948181, "Full-finetune/Step": 5101, "Full-finetune/Step Time": 6.705670662224293} {"Full-finetune/Learning Rate": 1.7877419699053876e-08, "Full-finetune/Loss": 0.7318053245544434, "Full-finetune/Loss (Raw)": 0.731049120426178, "Full-finetune/Step": 5102, "Full-finetune/Step Time": 6.689281992614269} {"Full-finetune/Learning Rate": 1.7507021425512417e-08, "Full-finetune/Loss": 0.7332584857940674, "Full-finetune/Loss (Raw)": 0.8737353086471558, "Full-finetune/Step": 5103, "Full-finetune/Step Time": 6.674394000321627} {"Full-finetune/Learning Rate": 1.7140497162605464e-08, "Full-finetune/Loss": 0.7301592826843262, "Full-finetune/Loss (Raw)": 0.5048840641975403, "Full-finetune/Step": 5104, "Full-finetune/Step Time": 6.6763402707874775} {"Full-finetune/Learning Rate": 1.677784705257146e-08, "Full-finetune/Loss": 0.731330156326294, "Full-finetune/Loss (Raw)": 0.8280990719795227, "Full-finetune/Step": 5105, "Full-finetune/Step Time": 6.655424416065216} {"Full-finetune/Learning Rate": 1.6419071236148943e-08, "Full-finetune/Loss": 0.7329080104827881, "Full-finetune/Loss (Raw)": 0.9306458234786987, "Full-finetune/Step": 5106, "Full-finetune/Step Time": 6.661625683307648} {"Full-finetune/Learning Rate": 1.6064169852572088e-08, "Full-finetune/Loss": 0.7343850135803223, "Full-finetune/Loss (Raw)": 0.8469244241714478, "Full-finetune/Step": 5107, "Full-finetune/Step Time": 6.660152776166797} {"Full-finetune/Learning Rate": 1.5713143039571833e-08, "Full-finetune/Loss": 0.7352346181869507, "Full-finetune/Loss (Raw)": 0.7629878520965576, "Full-finetune/Step": 5108, "Full-finetune/Step Time": 6.644012516364455} {"Full-finetune/Learning Rate": 1.5365990933373653e-08, "Full-finetune/Loss": 0.7365725040435791, "Full-finetune/Loss (Raw)": 0.8836930394172668, "Full-finetune/Step": 5109, "Full-finetune/Step Time": 6.646761802956462} {"Full-finetune/Learning Rate": 1.5022713668699785e-08, "Full-finetune/Loss": 0.7355601191520691, "Full-finetune/Loss (Raw)": 0.7382407784461975, "Full-finetune/Step": 5110, "Full-finetune/Step Time": 6.658504882827401} {"Full-finetune/Learning Rate": 1.4683311378771437e-08, "Full-finetune/Loss": 0.7373903393745422, "Full-finetune/Loss (Raw)": 0.6430377960205078, "Full-finetune/Step": 5111, "Full-finetune/Step Time": 6.665459789335728} {"Full-finetune/Learning Rate": 1.434778419530325e-08, "Full-finetune/Loss": 0.7351326942443848, "Full-finetune/Loss (Raw)": 0.343606561422348, "Full-finetune/Step": 5112, "Full-finetune/Step Time": 6.673496253788471} {"Full-finetune/Learning Rate": 1.401613224850551e-08, "Full-finetune/Loss": 0.7304951548576355, "Full-finetune/Loss (Raw)": 0.2849411368370056, "Full-finetune/Step": 5113, "Full-finetune/Step Time": 6.697235314175487} {"Full-finetune/Learning Rate": 1.3688355667087483e-08, "Full-finetune/Loss": 0.7315866351127625, "Full-finetune/Loss (Raw)": 0.7402059435844421, "Full-finetune/Step": 5114, "Full-finetune/Step Time": 6.698373841121793} {"Full-finetune/Learning Rate": 1.3364454578252972e-08, "Full-finetune/Loss": 0.7308844327926636, "Full-finetune/Loss (Raw)": 0.7151834964752197, "Full-finetune/Step": 5115, "Full-finetune/Step Time": 6.69009274430573} {"Full-finetune/Learning Rate": 1.3044429107700319e-08, "Full-finetune/Loss": 0.7262846827507019, "Full-finetune/Loss (Raw)": 0.2542543113231659, "Full-finetune/Step": 5116, "Full-finetune/Step Time": 6.7017748188227415} {"Full-finetune/Learning Rate": 1.272827937962573e-08, "Full-finetune/Loss": 0.727403998374939, "Full-finetune/Loss (Raw)": 0.9524697661399841, "Full-finetune/Step": 5117, "Full-finetune/Step Time": 6.703381035476923} {"Full-finetune/Learning Rate": 1.2416005516722174e-08, "Full-finetune/Loss": 0.7275825142860413, "Full-finetune/Loss (Raw)": 0.7965110540390015, "Full-finetune/Step": 5118, "Full-finetune/Step Time": 6.705238683149219} {"Full-finetune/Learning Rate": 1.2107607640174934e-08, "Full-finetune/Loss": 0.7285379767417908, "Full-finetune/Loss (Raw)": 0.8822771906852722, "Full-finetune/Step": 5119, "Full-finetune/Step Time": 6.70533468015492} {"Full-finetune/Learning Rate": 1.1803085869667164e-08, "Full-finetune/Loss": 0.7240495681762695, "Full-finetune/Loss (Raw)": 0.3375850021839142, "Full-finetune/Step": 5120, "Full-finetune/Step Time": 6.707028545439243} {"Full-finetune/Learning Rate": 1.1502440323379882e-08, "Full-finetune/Loss": 0.7257974147796631, "Full-finetune/Loss (Raw)": 0.7271703481674194, "Full-finetune/Step": 5121, "Full-finetune/Step Time": 6.691996062174439} {"Full-finetune/Learning Rate": 1.1205671117985318e-08, "Full-finetune/Loss": 0.7250913381576538, "Full-finetune/Loss (Raw)": 0.6935949921607971, "Full-finetune/Step": 5122, "Full-finetune/Step Time": 6.682016734033823} {"Full-finetune/Learning Rate": 1.0912778368655786e-08, "Full-finetune/Loss": 0.7269373536109924, "Full-finetune/Loss (Raw)": 0.8033393621444702, "Full-finetune/Step": 5123, "Full-finetune/Step Time": 6.684032207354903} {"Full-finetune/Learning Rate": 1.0623762189057029e-08, "Full-finetune/Loss": 0.7267910838127136, "Full-finetune/Loss (Raw)": 0.8785171508789062, "Full-finetune/Step": 5124, "Full-finetune/Step Time": 6.694883806630969} {"Full-finetune/Learning Rate": 1.0338622691349332e-08, "Full-finetune/Loss": 0.7268843054771423, "Full-finetune/Loss (Raw)": 0.8528395295143127, "Full-finetune/Step": 5125, "Full-finetune/Step Time": 6.698449898511171} {"Full-finetune/Learning Rate": 1.005735998619084e-08, "Full-finetune/Loss": 0.7219082117080688, "Full-finetune/Loss (Raw)": 0.38263997435569763, "Full-finetune/Step": 5126, "Full-finetune/Step Time": 6.714586958289146} {"Full-finetune/Learning Rate": 9.779974182733131e-09, "Full-finetune/Loss": 0.7202713489532471, "Full-finetune/Loss (Raw)": 0.6693586111068726, "Full-finetune/Step": 5127, "Full-finetune/Step Time": 6.72717772051692} {"Full-finetune/Learning Rate": 9.506465388624541e-09, "Full-finetune/Loss": 0.7235547304153442, "Full-finetune/Loss (Raw)": 0.7674006223678589, "Full-finetune/Step": 5128, "Full-finetune/Step Time": 6.711918568238616} {"Full-finetune/Learning Rate": 9.236833710010163e-09, "Full-finetune/Loss": 0.7195411920547485, "Full-finetune/Loss (Raw)": 0.28813326358795166, "Full-finetune/Step": 5129, "Full-finetune/Step Time": 6.730213329195976} {"Full-finetune/Learning Rate": 8.971079251526293e-09, "Full-finetune/Loss": 0.7214105129241943, "Full-finetune/Loss (Raw)": 0.7629618048667908, "Full-finetune/Step": 5130, "Full-finetune/Step Time": 6.734625671058893} {"Full-finetune/Learning Rate": 8.709202116308214e-09, "Full-finetune/Loss": 0.7205718755722046, "Full-finetune/Loss (Raw)": 0.5901921391487122, "Full-finetune/Step": 5131, "Full-finetune/Step Time": 6.739359335973859} {"Full-finetune/Learning Rate": 8.451202405985736e-09, "Full-finetune/Loss": 0.7204427123069763, "Full-finetune/Loss (Raw)": 0.5895328521728516, "Full-finetune/Step": 5132, "Full-finetune/Step Time": 6.732999783009291} {"Full-finetune/Learning Rate": 8.197080220683217e-09, "Full-finetune/Loss": 0.7201672792434692, "Full-finetune/Loss (Raw)": 0.7307947874069214, "Full-finetune/Step": 5133, "Full-finetune/Step Time": 6.722801852971315} {"Full-finetune/Learning Rate": 7.946835659020657e-09, "Full-finetune/Loss": 0.7203686237335205, "Full-finetune/Loss (Raw)": 0.809729814529419, "Full-finetune/Step": 5134, "Full-finetune/Step Time": 6.725993553176522} {"Full-finetune/Learning Rate": 7.700468818111483e-09, "Full-finetune/Loss": 0.720936119556427, "Full-finetune/Loss (Raw)": 0.6266833543777466, "Full-finetune/Step": 5135, "Full-finetune/Step Time": 6.719566237181425} {"Full-finetune/Learning Rate": 7.457979793568105e-09, "Full-finetune/Loss": 0.7226452827453613, "Full-finetune/Loss (Raw)": 0.9106217622756958, "Full-finetune/Step": 5136, "Full-finetune/Step Time": 6.723790863528848} {"Full-finetune/Learning Rate": 7.219368679495242e-09, "Full-finetune/Loss": 0.7214428782463074, "Full-finetune/Loss (Raw)": 0.7689919471740723, "Full-finetune/Step": 5137, "Full-finetune/Step Time": 6.726799054071307} {"Full-finetune/Learning Rate": 6.984635568492159e-09, "Full-finetune/Loss": 0.721016526222229, "Full-finetune/Loss (Raw)": 0.7346505522727966, "Full-finetune/Step": 5138, "Full-finetune/Step Time": 6.739290421828628} {"Full-finetune/Learning Rate": 6.753780551654876e-09, "Full-finetune/Loss": 0.7177611589431763, "Full-finetune/Loss (Raw)": 0.33649542927742004, "Full-finetune/Step": 5139, "Full-finetune/Step Time": 6.756299363449216} {"Full-finetune/Learning Rate": 6.526803718572838e-09, "Full-finetune/Loss": 0.7179615497589111, "Full-finetune/Loss (Raw)": 0.79059237241745, "Full-finetune/Step": 5140, "Full-finetune/Step Time": 6.7505697552114725} {"Full-finetune/Learning Rate": 6.3037051573333615e-09, "Full-finetune/Loss": 0.7197757959365845, "Full-finetune/Loss (Raw)": 0.8768439292907715, "Full-finetune/Step": 5141, "Full-finetune/Step Time": 6.757562721148133} {"Full-finetune/Learning Rate": 6.0844849545149685e-09, "Full-finetune/Loss": 0.7195746898651123, "Full-finetune/Loss (Raw)": 0.6842618584632874, "Full-finetune/Step": 5142, "Full-finetune/Step Time": 6.760520454496145} {"Full-finetune/Learning Rate": 5.869143195192939e-09, "Full-finetune/Loss": 0.7210835814476013, "Full-finetune/Loss (Raw)": 0.8843131065368652, "Full-finetune/Step": 5143, "Full-finetune/Step Time": 6.76261923648417} {"Full-finetune/Learning Rate": 5.657679962938201e-09, "Full-finetune/Loss": 0.7198289036750793, "Full-finetune/Loss (Raw)": 0.5682677030563354, "Full-finetune/Step": 5144, "Full-finetune/Step Time": 6.766558080911636} {"Full-finetune/Learning Rate": 5.4500953398139985e-09, "Full-finetune/Loss": 0.7206504344940186, "Full-finetune/Loss (Raw)": 0.753875195980072, "Full-finetune/Step": 5145, "Full-finetune/Step Time": 6.776765396818519} {"Full-finetune/Learning Rate": 5.246389406381447e-09, "Full-finetune/Loss": 0.7223601341247559, "Full-finetune/Loss (Raw)": 0.8825567960739136, "Full-finetune/Step": 5146, "Full-finetune/Step Time": 6.761303875595331} {"Full-finetune/Learning Rate": 5.046562241693975e-09, "Full-finetune/Loss": 0.7228087186813354, "Full-finetune/Loss (Raw)": 0.7854631543159485, "Full-finetune/Step": 5147, "Full-finetune/Step Time": 6.762918997555971} {"Full-finetune/Learning Rate": 4.850613923300662e-09, "Full-finetune/Loss": 0.7240970134735107, "Full-finetune/Loss (Raw)": 0.5064267516136169, "Full-finetune/Step": 5148, "Full-finetune/Step Time": 6.739273017272353} {"Full-finetune/Learning Rate": 4.658544527244013e-09, "Full-finetune/Loss": 0.7234220504760742, "Full-finetune/Loss (Raw)": 0.7578960657119751, "Full-finetune/Step": 5149, "Full-finetune/Step Time": 6.754543319344521} {"Full-finetune/Learning Rate": 4.470354128065513e-09, "Full-finetune/Loss": 0.7231124639511108, "Full-finetune/Loss (Raw)": 0.7629969120025635, "Full-finetune/Step": 5150, "Full-finetune/Step Time": 6.761001881211996} {"Full-finetune/Learning Rate": 4.286042798794521e-09, "Full-finetune/Loss": 0.7228110432624817, "Full-finetune/Loss (Raw)": 0.7104983925819397, "Full-finetune/Step": 5151, "Full-finetune/Step Time": 6.757484244182706} {"Full-finetune/Learning Rate": 4.105610610961597e-09, "Full-finetune/Loss": 0.7224870920181274, "Full-finetune/Loss (Raw)": 0.707530677318573, "Full-finetune/Step": 5152, "Full-finetune/Step Time": 6.7582970801740885} {"Full-finetune/Learning Rate": 3.929057634587397e-09, "Full-finetune/Loss": 0.7198886275291443, "Full-finetune/Loss (Raw)": 0.41420021653175354, "Full-finetune/Step": 5153, "Full-finetune/Step Time": 6.764368902891874} {"Full-finetune/Learning Rate": 3.756383938189334e-09, "Full-finetune/Loss": 0.7162477970123291, "Full-finetune/Loss (Raw)": 0.3672845661640167, "Full-finetune/Step": 5154, "Full-finetune/Step Time": 6.783116187900305} {"Full-finetune/Learning Rate": 3.587589588778251e-09, "Full-finetune/Loss": 0.7152348160743713, "Full-finetune/Loss (Raw)": 0.7040121555328369, "Full-finetune/Step": 5155, "Full-finetune/Step Time": 6.772777728736401} {"Full-finetune/Learning Rate": 3.4226746518606356e-09, "Full-finetune/Loss": 0.714802622795105, "Full-finetune/Loss (Raw)": 0.8404110670089722, "Full-finetune/Step": 5156, "Full-finetune/Step Time": 6.7852926682680845} {"Full-finetune/Learning Rate": 3.2616391914364056e-09, "Full-finetune/Loss": 0.7144469022750854, "Full-finetune/Loss (Raw)": 0.7739337086677551, "Full-finetune/Step": 5157, "Full-finetune/Step Time": 6.784712478518486} {"Full-finetune/Learning Rate": 3.1044832699989035e-09, "Full-finetune/Loss": 0.7145538330078125, "Full-finetune/Loss (Raw)": 0.7649059295654297, "Full-finetune/Step": 5158, "Full-finetune/Step Time": 6.780540000647306} {"Full-finetune/Learning Rate": 2.9512069485393426e-09, "Full-finetune/Loss": 0.7155600786209106, "Full-finetune/Loss (Raw)": 0.8815187215805054, "Full-finetune/Step": 5159, "Full-finetune/Step Time": 6.783543154597282} {"Full-finetune/Learning Rate": 2.801810286540141e-09, "Full-finetune/Loss": 0.7161063551902771, "Full-finetune/Loss (Raw)": 0.8954112529754639, "Full-finetune/Step": 5160, "Full-finetune/Step Time": 6.781949190422893} {"Full-finetune/Learning Rate": 2.656293341980476e-09, "Full-finetune/Loss": 0.7163934111595154, "Full-finetune/Loss (Raw)": 0.813610851764679, "Full-finetune/Step": 5161, "Full-finetune/Step Time": 6.792529175058007} {"Full-finetune/Learning Rate": 2.5146561713307315e-09, "Full-finetune/Loss": 0.7154660820960999, "Full-finetune/Loss (Raw)": 0.6843929290771484, "Full-finetune/Step": 5162, "Full-finetune/Step Time": 6.788129495456815} {"Full-finetune/Learning Rate": 2.3768988295580497e-09, "Full-finetune/Loss": 0.7161672115325928, "Full-finetune/Loss (Raw)": 0.8009517788887024, "Full-finetune/Step": 5163, "Full-finetune/Step Time": 6.783680768683553} {"Full-finetune/Learning Rate": 2.2430213701252203e-09, "Full-finetune/Loss": 0.7167410850524902, "Full-finetune/Loss (Raw)": 0.8176102638244629, "Full-finetune/Step": 5164, "Full-finetune/Step Time": 6.797395154833794} {"Full-finetune/Learning Rate": 2.1130238449851292e-09, "Full-finetune/Loss": 0.7140117883682251, "Full-finetune/Loss (Raw)": 0.5614887475967407, "Full-finetune/Step": 5165, "Full-finetune/Step Time": 6.807160506024957} {"Full-finetune/Learning Rate": 1.986906304588532e-09, "Full-finetune/Loss": 0.7127847671508789, "Full-finetune/Loss (Raw)": 0.7341923117637634, "Full-finetune/Step": 5166, "Full-finetune/Step Time": 6.813688579946756} {"Full-finetune/Learning Rate": 1.8646687978784992e-09, "Full-finetune/Loss": 0.7103380560874939, "Full-finetune/Loss (Raw)": 0.6455206274986267, "Full-finetune/Step": 5167, "Full-finetune/Step Time": 6.807212652638555} {"Full-finetune/Learning Rate": 1.7463113722937518e-09, "Full-finetune/Loss": 0.7127994298934937, "Full-finetune/Loss (Raw)": 0.8690149188041687, "Full-finetune/Step": 5168, "Full-finetune/Step Time": 6.798756843432784} {"Full-finetune/Learning Rate": 1.631834073765326e-09, "Full-finetune/Loss": 0.7122877836227417, "Full-finetune/Loss (Raw)": 0.8541572093963623, "Full-finetune/Step": 5169, "Full-finetune/Step Time": 6.8000989481806755} {"Full-finetune/Learning Rate": 1.5212369467210164e-09, "Full-finetune/Loss": 0.7103496789932251, "Full-finetune/Loss (Raw)": 0.6334981322288513, "Full-finetune/Step": 5170, "Full-finetune/Step Time": 6.797151470556855} {"Full-finetune/Learning Rate": 1.4145200340809352e-09, "Full-finetune/Loss": 0.7114275693893433, "Full-finetune/Loss (Raw)": 0.9466145634651184, "Full-finetune/Step": 5171, "Full-finetune/Step Time": 6.792747305706143} {"Full-finetune/Learning Rate": 1.3116833772597315e-09, "Full-finetune/Loss": 0.7110037207603455, "Full-finetune/Loss (Raw)": 0.7373859882354736, "Full-finetune/Step": 5172, "Full-finetune/Step Time": 6.788832399994135} {"Full-finetune/Learning Rate": 1.2127270161654824e-09, "Full-finetune/Loss": 0.7142841219902039, "Full-finetune/Loss (Raw)": 0.7051520943641663, "Full-finetune/Step": 5173, "Full-finetune/Step Time": 6.770474165678024} {"Full-finetune/Learning Rate": 1.1176509892030229e-09, "Full-finetune/Loss": 0.719305694103241, "Full-finetune/Loss (Raw)": 0.9677644371986389, "Full-finetune/Step": 5174, "Full-finetune/Step Time": 6.751726560294628} {"Full-finetune/Learning Rate": 1.0264553332683946e-09, "Full-finetune/Loss": 0.7188574075698853, "Full-finetune/Loss (Raw)": 0.7269101142883301, "Full-finetune/Step": 5175, "Full-finetune/Step Time": 6.758353408426046} {"Full-finetune/Learning Rate": 9.39140083752177e-10, "Full-finetune/Loss": 0.7142876982688904, "Full-finetune/Loss (Raw)": 0.3162822127342224, "Full-finetune/Step": 5176, "Full-finetune/Step Time": 6.77561991289258} {"Full-finetune/Learning Rate": 8.557052745405969e-10, "Full-finetune/Loss": 0.7151610851287842, "Full-finetune/Loss (Raw)": 0.8322024345397949, "Full-finetune/Step": 5177, "Full-finetune/Step Time": 6.769398951902986} {"Full-finetune/Learning Rate": 7.761509380133092e-10, "Full-finetune/Loss": 0.7146140336990356, "Full-finetune/Loss (Raw)": 0.651518702507019, "Full-finetune/Step": 5178, "Full-finetune/Step Time": 6.754301825538278} {"Full-finetune/Learning Rate": 7.004771050433956e-10, "Full-finetune/Loss": 0.7150797843933105, "Full-finetune/Loss (Raw)": 0.6789596080780029, "Full-finetune/Step": 5179, "Full-finetune/Step Time": 6.749676149338484} {"Full-finetune/Learning Rate": 6.286838049984755e-10, "Full-finetune/Loss": 0.7169123888015747, "Full-finetune/Loss (Raw)": 0.6003101468086243, "Full-finetune/Step": 5180, "Full-finetune/Step Time": 6.7403048649430275} {"Full-finetune/Learning Rate": 5.607710657407061e-10, "Full-finetune/Loss": 0.7185388803482056, "Full-finetune/Loss (Raw)": 0.8037508130073547, "Full-finetune/Step": 5181, "Full-finetune/Step Time": 6.745574312284589} {"Full-finetune/Learning Rate": 4.967389136245615e-10, "Full-finetune/Loss": 0.7163488864898682, "Full-finetune/Loss (Raw)": 0.5990326404571533, "Full-finetune/Step": 5182, "Full-finetune/Step Time": 6.748310225084424} {"Full-finetune/Learning Rate": 4.3658737350016354e-10, "Full-finetune/Loss": 0.7170150279998779, "Full-finetune/Loss (Raw)": 0.8293637633323669, "Full-finetune/Step": 5183, "Full-finetune/Step Time": 6.753505673259497} {"Full-finetune/Learning Rate": 3.8031646871106166e-10, "Full-finetune/Loss": 0.7158575654029846, "Full-finetune/Loss (Raw)": 0.6566346287727356, "Full-finetune/Step": 5184, "Full-finetune/Step Time": 6.763208566233516} {"Full-finetune/Learning Rate": 3.279262210953427e-10, "Full-finetune/Loss": 0.716610312461853, "Full-finetune/Loss (Raw)": 0.8297275304794312, "Full-finetune/Step": 5185, "Full-finetune/Step Time": 6.773828061297536} {"Full-finetune/Learning Rate": 2.794166509845209e-10, "Full-finetune/Loss": 0.7134051322937012, "Full-finetune/Loss (Raw)": 0.3700040578842163, "Full-finetune/Step": 5186, "Full-finetune/Step Time": 6.789492052048445} {"Full-finetune/Learning Rate": 2.3478777720353785e-10, "Full-finetune/Loss": 0.7114734649658203, "Full-finetune/Loss (Raw)": 0.6295140981674194, "Full-finetune/Step": 5187, "Full-finetune/Step Time": 6.807293904945254} {"Full-finetune/Learning Rate": 1.940396170718728e-10, "Full-finetune/Loss": 0.7096347808837891, "Full-finetune/Loss (Raw)": 0.675752580165863, "Full-finetune/Step": 5188, "Full-finetune/Step Time": 6.808090224862099} {"Full-finetune/Learning Rate": 1.5717218640465272e-10, "Full-finetune/Loss": 0.7075951099395752, "Full-finetune/Loss (Raw)": 0.5832914710044861, "Full-finetune/Step": 5189, "Full-finetune/Step Time": 6.830557545647025} {"Full-finetune/Learning Rate": 1.2418549950821145e-10, "Full-finetune/Loss": 0.7073980569839478, "Full-finetune/Loss (Raw)": 0.5890231132507324, "Full-finetune/Step": 5190, "Full-finetune/Step Time": 6.82763971015811} {"Full-finetune/Learning Rate": 9.507956918453076e-11, "Full-finetune/Loss": 0.7053499221801758, "Full-finetune/Loss (Raw)": 0.6185694336891174, "Full-finetune/Step": 5191, "Full-finetune/Step Time": 6.838544791564345} {"Full-finetune/Learning Rate": 6.985440672790945e-11, "Full-finetune/Loss": 0.7061767578125, "Full-finetune/Loss (Raw)": 0.7173683047294617, "Full-finetune/Step": 5192, "Full-finetune/Step Time": 6.8337688613682985} {"Full-finetune/Learning Rate": 4.851002192940435e-11, "Full-finetune/Loss": 0.7045490741729736, "Full-finetune/Loss (Raw)": 0.6555178165435791, "Full-finetune/Step": 5193, "Full-finetune/Step Time": 6.843903556466103} {"Full-finetune/Learning Rate": 3.1046423071279254e-11, "Full-finetune/Loss": 0.7003294229507446, "Full-finetune/Loss (Raw)": 0.32826969027519226, "Full-finetune/Step": 5194, "Full-finetune/Step Time": 6.860497998073697} {"Full-finetune/Learning Rate": 1.7463616930335493e-11, "Full-finetune/Loss": 0.7001593112945557, "Full-finetune/Loss (Raw)": 0.7153821587562561, "Full-finetune/Step": 5195, "Full-finetune/Step Time": 6.848202357068658} {"Full-finetune/Learning Rate": 7.761608780132434e-12, "Full-finetune/Loss": 0.6994156837463379, "Full-finetune/Loss (Raw)": 0.701519787311554, "Full-finetune/Step": 5196, "Full-finetune/Step Time": 6.8431984055787325} {"Full-finetune/Learning Rate": 1.9404023832159115e-12, "Full-finetune/Loss": 0.7002208232879639, "Full-finetune/Loss (Raw)": 0.805050790309906, "Full-finetune/Step": 5197, "Full-finetune/Step Time": 6.834853954613209} {"Full-finetune/Learning Rate": 0.0, "Full-finetune/Loss": 0.7000993490219116, "Full-finetune/Loss (Raw)": 0.7096576690673828, "Full-finetune/Step": 5198, "Full-finetune/Step Time": 6.830334419384599}