{"Finetune/Learning Rate": 7.692307692307692e-08, "Finetune/Loss": 9.865138053894043, "Finetune/Loss (Raw)": 9.865138053894043, "Finetune/Step": 1, "Finetune/Step Time": 14.660694122314453} {"Finetune/Learning Rate": 1.5384615384615385e-07, "Finetune/Loss": 9.978597640991211, "Finetune/Loss (Raw)": 10.092057228088379, "Finetune/Step": 2, "Finetune/Step Time": 11.290221691131592} {"Finetune/Learning Rate": 2.3076923076923078e-07, "Finetune/Loss": 9.961700439453125, "Finetune/Loss (Raw)": 9.927906036376953, "Finetune/Step": 3, "Finetune/Step Time": 10.139443079630533} {"Finetune/Learning Rate": 3.076923076923077e-07, "Finetune/Loss": 10.036373138427734, "Finetune/Loss (Raw)": 10.260393142700195, "Finetune/Step": 4, "Finetune/Step Time": 9.728033483028412} {"Finetune/Learning Rate": 3.8461538461538463e-07, "Finetune/Loss": 10.038104057312012, "Finetune/Loss (Raw)": 10.045024871826172, "Finetune/Step": 5, "Finetune/Step Time": 9.330220127105713} {"Finetune/Learning Rate": 4.6153846153846156e-07, "Finetune/Loss": 9.96912956237793, "Finetune/Loss (Raw)": 9.624249458312988, "Finetune/Step": 6, "Finetune/Step Time": 9.067095081011454} {"Finetune/Learning Rate": 5.384615384615384e-07, "Finetune/Loss": 9.875020980834961, "Finetune/Loss (Raw)": 9.310371398925781, "Finetune/Step": 7, "Finetune/Step Time": 8.877002579825264} {"Finetune/Learning Rate": 6.153846153846154e-07, "Finetune/Loss": 9.776061058044434, "Finetune/Loss (Raw)": 9.083349227905273, "Finetune/Step": 8, "Finetune/Step Time": 8.824377685785294} {"Finetune/Learning Rate": 6.923076923076922e-07, "Finetune/Loss": 9.628030776977539, "Finetune/Loss (Raw)": 8.44378662109375, "Finetune/Step": 9, "Finetune/Step Time": 8.730186409420437} {"Finetune/Learning Rate": 7.692307692307693e-07, "Finetune/Loss": 9.53133487701416, "Finetune/Loss (Raw)": 8.6610689163208, "Finetune/Step": 10, "Finetune/Step Time": 8.51972563266754} {"Finetune/Learning Rate": 8.461538461538461e-07, "Finetune/Loss": 9.39122486114502, "Finetune/Loss (Raw)": 7.9901299476623535, "Finetune/Step": 11, "Finetune/Step Time": 8.454294378107244} {"Finetune/Learning Rate": 9.230769230769231e-07, "Finetune/Loss": 9.183758735656738, "Finetune/Loss (Raw)": 6.901623249053955, "Finetune/Step": 12, "Finetune/Step Time": 8.4759747783343} {"Finetune/Learning Rate": 1e-06, "Finetune/Loss": 8.985602378845215, "Finetune/Loss (Raw)": 6.607728481292725, "Finetune/Step": 13, "Finetune/Step Time": 8.417969850393442} {"Finetune/Learning Rate": 1.0769230769230769e-06, "Finetune/Loss": 8.700939178466797, "Finetune/Loss (Raw)": 5.000319957733154, "Finetune/Step": 14, "Finetune/Step Time": 8.392841850008283} {"Finetune/Learning Rate": 1.1538461538461536e-06, "Finetune/Loss": 8.454697608947754, "Finetune/Loss (Raw)": 5.007307052612305, "Finetune/Step": 15, "Finetune/Step Time": 8.35947790145874} {"Finetune/Learning Rate": 1.2307692307692308e-06, "Finetune/Loss": 8.160318374633789, "Finetune/Loss (Raw)": 3.744636058807373, "Finetune/Step": 16, "Finetune/Step Time": 8.404550224542618} {"Finetune/Learning Rate": 1.3076923076923077e-06, "Finetune/Loss": 7.856196880340576, "Finetune/Loss (Raw)": 2.9902467727661133, "Finetune/Step": 17, "Finetune/Step Time": 8.371050245621625} {"Finetune/Learning Rate": 1.3846153846153844e-06, "Finetune/Loss": 7.581020832061768, "Finetune/Loss (Raw)": 2.9030404090881348, "Finetune/Step": 18, "Finetune/Step Time": 8.338023132748074} {"Finetune/Learning Rate": 1.4615384615384614e-06, "Finetune/Loss": 7.3379902839660645, "Finetune/Loss (Raw)": 2.9634459018707275, "Finetune/Step": 19, "Finetune/Step Time": 8.24712814782795} {"Finetune/Learning Rate": 1.5384615384615385e-06, "Finetune/Loss": 7.09036111831665, "Finetune/Loss (Raw)": 2.385401487350464, "Finetune/Step": 20, "Finetune/Step Time": 8.305135345458984} {"Finetune/Learning Rate": 1.6153846153846154e-06, "Finetune/Loss": 6.856446743011475, "Finetune/Loss (Raw)": 2.1781554222106934, "Finetune/Step": 21, "Finetune/Step Time": 8.276204234077817} {"Finetune/Learning Rate": 1.6923076923076922e-06, "Finetune/Loss": 6.629848480224609, "Finetune/Loss (Raw)": 1.8712804317474365, "Finetune/Step": 22, "Finetune/Step Time": 8.25478463823145} {"Finetune/Learning Rate": 1.769230769230769e-06, "Finetune/Loss": 6.413041114807129, "Finetune/Loss (Raw)": 1.643276572227478, "Finetune/Step": 23, "Finetune/Step Time": 8.23861314939416} {"Finetune/Learning Rate": 1.8461538461538462e-06, "Finetune/Loss": 6.216305732727051, "Finetune/Loss (Raw)": 1.691400170326233, "Finetune/Step": 24, "Finetune/Step Time": 8.297311584154764} {"Finetune/Learning Rate": 1.923076923076923e-06, "Finetune/Loss": 6.052402973175049, "Finetune/Loss (Raw)": 2.1187381744384766, "Finetune/Step": 25, "Finetune/Step Time": 8.233297653198242} {"Finetune/Learning Rate": 2e-06, "Finetune/Loss": 5.895357608795166, "Finetune/Loss (Raw)": 1.9692203998565674, "Finetune/Step": 26, "Finetune/Step Time": 8.215580894396854} {"Finetune/Learning Rate": 1.9999932336646454e-06, "Finetune/Loss": 5.726846694946289, "Finetune/Loss (Raw)": 1.3455783128738403, "Finetune/Step": 27, "Finetune/Step Time": 8.210080650117662} {"Finetune/Learning Rate": 1.9999729347501482e-06, "Finetune/Loss": 5.574076175689697, "Finetune/Loss (Raw)": 1.4492627382278442, "Finetune/Step": 28, "Finetune/Step Time": 8.240609739507947} {"Finetune/Learning Rate": 1.999939103531207e-06, "Finetune/Loss": 5.43409538269043, "Finetune/Loss (Raw)": 1.5146280527114868, "Finetune/Step": 29, "Finetune/Step Time": 8.236932351671417} {"Finetune/Learning Rate": 1.9998917404656485e-06, "Finetune/Loss": 5.2987236976623535, "Finetune/Loss (Raw)": 1.3729479312896729, "Finetune/Step": 30, "Finetune/Step Time": 8.192907094955444} {"Finetune/Learning Rate": 1.9998308461944218e-06, "Finetune/Loss": 5.158546447753906, "Finetune/Loss (Raw)": 0.9532352685928345, "Finetune/Step": 31, "Finetune/Step Time": 8.200238212462395} {"Finetune/Learning Rate": 1.9997564215415883e-06, "Finetune/Loss": 5.033377647399902, "Finetune/Loss (Raw)": 1.153144359588623, "Finetune/Step": 32, "Finetune/Step Time": 8.230717562139034} {"Finetune/Learning Rate": 1.999668467514313e-06, "Finetune/Loss": 4.760508060455322, "Finetune/Loss (Raw)": 1.1333155632019043, "Finetune/Step": 33, "Finetune/Step Time": 8.222517533735795} {"Finetune/Learning Rate": 1.9995669853028485e-06, "Finetune/Loss": 4.477713584899902, "Finetune/Loss (Raw)": 1.0426304340362549, "Finetune/Step": 34, "Finetune/Step Time": 8.213778958601111} {"Finetune/Learning Rate": 1.99945197628052e-06, "Finetune/Loss": 4.209099292755127, "Finetune/Loss (Raw)": 1.3322415351867676, "Finetune/Step": 35, "Finetune/Step Time": 8.202072286605835} {"Finetune/Learning Rate": 1.9993234420037072e-06, "Finetune/Loss": 3.9312500953674316, "Finetune/Loss (Raw)": 1.3692221641540527, "Finetune/Step": 36, "Finetune/Step Time": 8.239714894029829} {"Finetune/Learning Rate": 1.9991813842118214e-06, "Finetune/Loss": 3.6502485275268555, "Finetune/Loss (Raw)": 1.0529708862304688, "Finetune/Step": 37, "Finetune/Step Time": 8.191374559660215} {"Finetune/Learning Rate": 1.9990258048272846e-06, "Finetune/Loss": 3.3839759826660156, "Finetune/Loss (Raw)": 1.1035234928131104, "Finetune/Step": 38, "Finetune/Step Time": 8.18368451218856} {"Finetune/Learning Rate": 1.998856705955501e-06, "Finetune/Loss": 3.1312644481658936, "Finetune/Loss (Raw)": 1.223606824874878, "Finetune/Step": 39, "Finetune/Step Time": 8.145404534462171} {"Finetune/Learning Rate": 1.9986740898848305e-06, "Finetune/Loss": 2.8757028579711914, "Finetune/Loss (Raw)": 0.9053840637207031, "Finetune/Step": 40, "Finetune/Step Time": 8.165298014879227} {"Finetune/Learning Rate": 1.9984779590865555e-06, "Finetune/Loss": 2.641507863998413, "Finetune/Loss (Raw)": 0.949539303779602, "Finetune/Step": 41, "Finetune/Step Time": 8.160166106572966} {"Finetune/Learning Rate": 1.9982683162148497e-06, "Finetune/Loss": 2.3987655639648438, "Finetune/Loss (Raw)": 0.8933203220367432, "Finetune/Step": 42, "Finetune/Step Time": 8.152945467403956} {"Finetune/Learning Rate": 1.998045164106742e-06, "Finetune/Loss": 2.1663949489593506, "Finetune/Loss (Raw)": 0.5542664527893066, "Finetune/Step": 43, "Finetune/Step Time": 8.14549213231996} {"Finetune/Learning Rate": 1.9978085057820744e-06, "Finetune/Loss": 1.9763292074203491, "Finetune/Loss (Raw)": 0.8195223808288574, "Finetune/Step": 44, "Finetune/Step Time": 8.155563874678178} {"Finetune/Learning Rate": 1.997558344443468e-06, "Finetune/Loss": 1.7960071563720703, "Finetune/Loss (Raw)": 0.837417483329773, "Finetune/Step": 45, "Finetune/Step Time": 8.153450478447809} {"Finetune/Learning Rate": 1.997294683476273e-06, "Finetune/Loss": 1.6671693325042725, "Finetune/Loss (Raw)": 0.877512514591217, "Finetune/Step": 46, "Finetune/Step Time": 8.147091860356538} {"Finetune/Learning Rate": 1.9970175264485263e-06, "Finetune/Loss": 1.545576810836792, "Finetune/Loss (Raw)": 1.116349697113037, "Finetune/Step": 47, "Finetune/Step Time": 8.142031177561334} {"Finetune/Learning Rate": 1.9967268771109036e-06, "Finetune/Loss": 1.4600415229797363, "Finetune/Loss (Raw)": 1.0075080394744873, "Finetune/Step": 48, "Finetune/Step Time": 8.16036100188891} {"Finetune/Learning Rate": 1.9964227393966656e-06, "Finetune/Loss": 1.4084546566009521, "Finetune/Loss (Raw)": 1.3394618034362793, "Finetune/Step": 49, "Finetune/Step Time": 8.13175019439386} {"Finetune/Learning Rate": 1.9961051174216078e-06, "Finetune/Loss": 1.3488855361938477, "Finetune/Loss (Raw)": 0.9968328475952148, "Finetune/Step": 50, "Finetune/Step Time": 8.095413012504578} {"Finetune/Learning Rate": 1.9957740154840047e-06, "Finetune/Loss": 1.2896502017974854, "Finetune/Loss (Raw)": 1.067909836769104, "Finetune/Step": 51, "Finetune/Step Time": 8.092968370400223} {"Finetune/Learning Rate": 1.9954294380645497e-06, "Finetune/Loss": 1.2408299446105957, "Finetune/Loss (Raw)": 0.823157548904419, "Finetune/Step": 52, "Finetune/Step Time": 8.102976445968334} {"Finetune/Learning Rate": 1.9950713898262947e-06, "Finetune/Loss": 1.2049344778060913, "Finetune/Loss (Raw)": 1.0294996500015259, "Finetune/Step": 53, "Finetune/Step Time": 8.101315255435008} {"Finetune/Learning Rate": 1.994699875614589e-06, "Finetune/Loss": 1.168423056602478, "Finetune/Loss (Raw)": 0.7029151320457458, "Finetune/Step": 54, "Finetune/Step Time": 8.097389141718546} {"Finetune/Learning Rate": 1.9943149004570123e-06, "Finetune/Loss": 1.1338075399398804, "Finetune/Loss (Raw)": 0.5355775356292725, "Finetune/Step": 55, "Finetune/Step Time": 8.0934907653115} {"Finetune/Learning Rate": 1.9939164695633066e-06, "Finetune/Loss": 1.1065033674240112, "Finetune/Loss (Raw)": 0.8176673650741577, "Finetune/Step": 56, "Finetune/Step Time": 8.105527222156525} {"Finetune/Learning Rate": 1.9935045883253057e-06, "Finetune/Loss": 1.0699050426483154, "Finetune/Loss (Raw)": 0.9475914239883423, "Finetune/Step": 57, "Finetune/Step Time": 8.109982360873307} {"Finetune/Learning Rate": 1.9930792623168636e-06, "Finetune/Loss": 1.026103138923645, "Finetune/Loss (Raw)": 0.567560076713562, "Finetune/Step": 58, "Finetune/Step Time": 8.103559740658465} {"Finetune/Learning Rate": 1.9926404972937756e-06, "Finetune/Loss": 1.0081753730773926, "Finetune/Loss (Raw)": 0.7718905806541443, "Finetune/Step": 59, "Finetune/Step Time": 8.077576398849487} {"Finetune/Learning Rate": 1.9921882991937056e-06, "Finetune/Loss": 0.984332799911499, "Finetune/Loss (Raw)": 0.6862999200820923, "Finetune/Step": 60, "Finetune/Step Time": 8.099455746014913} {"Finetune/Learning Rate": 1.9917226741361015e-06, "Finetune/Loss": 0.9570143222808838, "Finetune/Loss (Raw)": 0.640434980392456, "Finetune/Step": 61, "Finetune/Step Time": 8.10193756760144} {"Finetune/Learning Rate": 1.9912436284221133e-06, "Finetune/Loss": 0.9471430778503418, "Finetune/Loss (Raw)": 1.0570694208145142, "Finetune/Step": 62, "Finetune/Step Time": 8.098249631543313} {"Finetune/Learning Rate": 1.9907511685345087e-06, "Finetune/Loss": 0.9438138008117676, "Finetune/Loss (Raw)": 0.8466969728469849, "Finetune/Step": 63, "Finetune/Step Time": 8.077731427692232} {"Finetune/Learning Rate": 1.990245301137586e-06, "Finetune/Loss": 0.9359328746795654, "Finetune/Loss (Raw)": 0.9009562730789185, "Finetune/Step": 64, "Finetune/Step Time": 8.090345375239849} {"Finetune/Learning Rate": 1.9897260330770818e-06, "Finetune/Loss": 0.9189454317092896, "Finetune/Loss (Raw)": 0.589718222618103, "Finetune/Step": 65, "Finetune/Step Time": 8.097115817436805} {"Finetune/Learning Rate": 1.9891933713800795e-06, "Finetune/Loss": 0.9191099405288696, "Finetune/Loss (Raw)": 1.0478938817977905, "Finetune/Step": 66, "Finetune/Step Time": 8.092240503340056} {"Finetune/Learning Rate": 1.988647323254915e-06, "Finetune/Loss": 0.9033946990966797, "Finetune/Loss (Raw)": 0.829352855682373, "Finetune/Step": 67, "Finetune/Step Time": 8.09047442763599} {"Finetune/Learning Rate": 1.988087896091077e-06, "Finetune/Loss": 0.8905056715011597, "Finetune/Loss (Raw)": 0.9567732810974121, "Finetune/Step": 68, "Finetune/Step Time": 8.108650372308844} {"Finetune/Learning Rate": 1.9875150974591097e-06, "Finetune/Loss": 0.8826954960823059, "Finetune/Loss (Raw)": 0.8030451536178589, "Finetune/Step": 69, "Finetune/Step Time": 8.114156937253648} {"Finetune/Learning Rate": 1.986928935110508e-06, "Finetune/Loss": 0.8760511875152588, "Finetune/Loss (Raw)": 0.8909059762954712, "Finetune/Step": 70, "Finetune/Step Time": 8.11115096637181} {"Finetune/Learning Rate": 1.9863294169776144e-06, "Finetune/Loss": 0.8687433004379272, "Finetune/Loss (Raw)": 0.9897531867027283, "Finetune/Step": 71, "Finetune/Step Time": 8.107634527582517} {"Finetune/Learning Rate": 1.98571655117351e-06, "Finetune/Loss": 0.8632872700691223, "Finetune/Loss (Raw)": 0.7307913303375244, "Finetune/Step": 72, "Finetune/Step Time": 8.11926234430737} {"Finetune/Learning Rate": 1.9850903459919064e-06, "Finetune/Loss": 0.8661879301071167, "Finetune/Loss (Raw)": 1.042359709739685, "Finetune/Step": 73, "Finetune/Step Time": 8.107033020829501} {"Finetune/Learning Rate": 1.984450809907031e-06, "Finetune/Loss": 0.8624250292778015, "Finetune/Loss (Raw)": 0.77290940284729, "Finetune/Step": 74, "Finetune/Step Time": 8.10406757689811} {"Finetune/Learning Rate": 1.9837979515735165e-06, "Finetune/Loss": 0.864813506603241, "Finetune/Loss (Raw)": 0.6306957006454468, "Finetune/Step": 75, "Finetune/Step Time": 8.10263692220052} {"Finetune/Learning Rate": 1.9831317798262784e-06, "Finetune/Loss": 0.86402428150177, "Finetune/Loss (Raw)": 0.7942678332328796, "Finetune/Step": 76, "Finetune/Step Time": 8.106886355500473} {"Finetune/Learning Rate": 1.9824523036804008e-06, "Finetune/Loss": 0.8639849424362183, "Finetune/Loss (Raw)": 0.8361599445343018, "Finetune/Step": 77, "Finetune/Step Time": 8.114500027198297} {"Finetune/Learning Rate": 1.9817595323310094e-06, "Finetune/Loss": 0.8555475473403931, "Finetune/Loss (Raw)": 0.6075143814086914, "Finetune/Step": 78, "Finetune/Step Time": 8.109805947695023} {"Finetune/Learning Rate": 1.981053475153152e-06, "Finetune/Loss": 0.8513253331184387, "Finetune/Loss (Raw)": 0.9812397956848145, "Finetune/Step": 79, "Finetune/Step Time": 8.10484205921994} {"Finetune/Learning Rate": 1.980334141701667e-06, "Finetune/Loss": 0.845012366771698, "Finetune/Loss (Raw)": 0.8054937720298767, "Finetune/Step": 80, "Finetune/Step Time": 8.11869510114193} {"Finetune/Learning Rate": 1.9796015417110575e-06, "Finetune/Loss": 0.8292620182037354, "Finetune/Loss (Raw)": 0.8354504108428955, "Finetune/Step": 81, "Finetune/Step Time": 8.125411171972015} {"Finetune/Learning Rate": 1.9788556850953576e-06, "Finetune/Loss": 0.82494056224823, "Finetune/Loss (Raw)": 0.8585481643676758, "Finetune/Step": 82, "Finetune/Step Time": 8.121067837971014} {"Finetune/Learning Rate": 1.9780965819479996e-06, "Finetune/Loss": 0.8181912302970886, "Finetune/Loss (Raw)": 0.8519296646118164, "Finetune/Step": 83, "Finetune/Step Time": 8.117911218160605} {"Finetune/Learning Rate": 1.977324242541677e-06, "Finetune/Loss": 0.8122221231460571, "Finetune/Loss (Raw)": 0.6321468353271484, "Finetune/Step": 84, "Finetune/Step Time": 8.130197862784067} {"Finetune/Learning Rate": 1.9765386773282033e-06, "Finetune/Loss": 0.8053423166275024, "Finetune/Loss (Raw)": 0.8093468546867371, "Finetune/Step": 85, "Finetune/Step Time": 8.133183897242827} {"Finetune/Learning Rate": 1.975739896938375e-06, "Finetune/Loss": 0.8027232885360718, "Finetune/Loss (Raw)": 0.6191050410270691, "Finetune/Step": 86, "Finetune/Step Time": 8.131129641865575} {"Finetune/Learning Rate": 1.9749279121818236e-06, "Finetune/Loss": 0.8046040534973145, "Finetune/Loss (Raw)": 0.5957619547843933, "Finetune/Step": 87, "Finetune/Step Time": 8.115280688494101} {"Finetune/Learning Rate": 1.9741027340468712e-06, "Finetune/Loss": 0.7973116636276245, "Finetune/Loss (Raw)": 0.584309995174408, "Finetune/Step": 88, "Finetune/Step Time": 8.123132434758274} {"Finetune/Learning Rate": 1.9732643737003824e-06, "Finetune/Loss": 0.7917964458465576, "Finetune/Loss (Raw)": 0.7711040377616882, "Finetune/Step": 89, "Finetune/Step Time": 8.133957878927166} {"Finetune/Learning Rate": 1.9724128424876116e-06, "Finetune/Loss": 0.7937757968902588, "Finetune/Loss (Raw)": 0.6308996081352234, "Finetune/Step": 90, "Finetune/Step Time": 8.134311278661093} {"Finetune/Learning Rate": 1.971548151932049e-06, "Finetune/Loss": 0.7875382900238037, "Finetune/Loss (Raw)": 0.5722923278808594, "Finetune/Step": 91, "Finetune/Step Time": 8.124911758925888} {"Finetune/Learning Rate": 1.9706703137352693e-06, "Finetune/Loss": 0.7862656712532043, "Finetune/Loss (Raw)": 0.645574152469635, "Finetune/Step": 92, "Finetune/Step Time": 8.131606068300163} {"Finetune/Learning Rate": 1.9697793397767668e-06, "Finetune/Loss": 0.7912427186965942, "Finetune/Loss (Raw)": 0.7996997833251953, "Finetune/Step": 93, "Finetune/Step Time": 8.142247687103929} {"Finetune/Learning Rate": 1.9688752421137977e-06, "Finetune/Loss": 0.7746778726577759, "Finetune/Loss (Raw)": 0.5269953012466431, "Finetune/Step": 94, "Finetune/Step Time": 8.137293757276332} {"Finetune/Learning Rate": 1.9679580329812193e-06, "Finetune/Loss": 0.772078812122345, "Finetune/Loss (Raw)": 0.76352858543396, "Finetune/Step": 95, "Finetune/Step Time": 8.134923091687654} {"Finetune/Learning Rate": 1.9670277247913204e-06, "Finetune/Loss": 0.7701733112335205, "Finetune/Loss (Raw)": 0.8399784564971924, "Finetune/Step": 96, "Finetune/Step Time": 8.140672760705153} {"Finetune/Learning Rate": 1.966084330133655e-06, "Finetune/Loss": 0.7755440473556519, "Finetune/Loss (Raw)": 0.7615828514099121, "Finetune/Step": 97, "Finetune/Step Time": 8.148265005386982} {"Finetune/Learning Rate": 1.9651278617748727e-06, "Finetune/Loss": 0.7698299288749695, "Finetune/Loss (Raw)": 0.8650422096252441, "Finetune/Step": 98, "Finetune/Step Time": 8.14530020344014} {"Finetune/Learning Rate": 1.964158332658545e-06, "Finetune/Loss": 0.7692362666130066, "Finetune/Loss (Raw)": 0.8103560209274292, "Finetune/Step": 99, "Finetune/Step Time": 8.140406353305085} {"Finetune/Learning Rate": 1.96317575590499e-06, "Finetune/Loss": 0.7623845338821411, "Finetune/Loss (Raw)": 0.7375152707099915, "Finetune/Step": 100, "Finetune/Step Time": 8.145412719249725} {"Finetune/Learning Rate": 1.962180144811095e-06, "Finetune/Loss": 0.7622607350349426, "Finetune/Loss (Raw)": 0.7990851402282715, "Finetune/Step": 101, "Finetune/Step Time": 8.15237817433801} {"Finetune/Learning Rate": 1.9611715128501377e-06, "Finetune/Loss": 0.751060962677002, "Finetune/Loss (Raw)": 0.532513439655304, "Finetune/Step": 102, "Finetune/Step Time": 8.147959405300664} {"Finetune/Learning Rate": 1.9601498736716015e-06, "Finetune/Loss": 0.7448062300682068, "Finetune/Loss (Raw)": 0.7896014451980591, "Finetune/Step": 103, "Finetune/Step Time": 8.14514685371547} {"Finetune/Learning Rate": 1.959115241100994e-06, "Finetune/Loss": 0.749428391456604, "Finetune/Loss (Raw)": 0.8786987662315369, "Finetune/Step": 104, "Finetune/Step Time": 8.150016259688597} {"Finetune/Learning Rate": 1.9580676291396564e-06, "Finetune/Loss": 0.736178457736969, "Finetune/Loss (Raw)": 0.6183630228042603, "Finetune/Step": 105, "Finetune/Step Time": 8.15801769438244} {"Finetune/Learning Rate": 1.9570070519645765e-06, "Finetune/Loss": 0.7307526469230652, "Finetune/Loss (Raw)": 0.5992834568023682, "Finetune/Step": 106, "Finetune/Step Time": 8.155282681843019} {"Finetune/Learning Rate": 1.9559335239281964e-06, "Finetune/Loss": 0.7414824962615967, "Finetune/Loss (Raw)": 0.9740495681762695, "Finetune/Step": 107, "Finetune/Step Time": 8.1520814717373} {"Finetune/Learning Rate": 1.9548470595582163e-06, "Finetune/Loss": 0.7416486144065857, "Finetune/Loss (Raw)": 0.7995845675468445, "Finetune/Step": 108, "Finetune/Step Time": 8.158625589476692} {"Finetune/Learning Rate": 1.9537476735574024e-06, "Finetune/Loss": 0.7438761591911316, "Finetune/Loss (Raw)": 0.907441258430481, "Finetune/Step": 109, "Finetune/Step Time": 8.15709911355185} {"Finetune/Learning Rate": 1.9526353808033826e-06, "Finetune/Loss": 0.7581198215484619, "Finetune/Loss (Raw)": 1.063312292098999, "Finetune/Step": 110, "Finetune/Step Time": 8.153300512920726} {"Finetune/Learning Rate": 1.951510196348448e-06, "Finetune/Loss": 0.7500084638595581, "Finetune/Loss (Raw)": 0.721677303314209, "Finetune/Step": 111, "Finetune/Step Time": 8.149805700456774} {"Finetune/Learning Rate": 1.95037213541935e-06, "Finetune/Loss": 0.7441349029541016, "Finetune/Loss (Raw)": 0.617538332939148, "Finetune/Step": 112, "Finetune/Step Time": 8.15369054036481} {"Finetune/Learning Rate": 1.9492212134170927e-06, "Finetune/Loss": 0.7389544248580933, "Finetune/Loss (Raw)": 0.6696748733520508, "Finetune/Step": 113, "Finetune/Step Time": 8.164067432943698} {"Finetune/Learning Rate": 1.948057445916724e-06, "Finetune/Loss": 0.7344619035720825, "Finetune/Loss (Raw)": 0.7147866487503052, "Finetune/Step": 114, "Finetune/Step Time": 8.164654901153163} {"Finetune/Learning Rate": 1.946880848667126e-06, "Finetune/Loss": 0.7249537110328674, "Finetune/Loss (Raw)": 0.5476685762405396, "Finetune/Step": 115, "Finetune/Step Time": 8.162369062589562} {"Finetune/Learning Rate": 1.945691437590802e-06, "Finetune/Loss": 0.7235547304153442, "Finetune/Loss (Raw)": 0.5873792171478271, "Finetune/Step": 116, "Finetune/Step Time": 8.170009249243243} {"Finetune/Learning Rate": 1.944489228783661e-06, "Finetune/Loss": 0.719789981842041, "Finetune/Loss (Raw)": 0.6888762712478638, "Finetune/Step": 117, "Finetune/Step Time": 8.175941043429905} {"Finetune/Learning Rate": 1.9432742385147987e-06, "Finetune/Loss": 0.7203906774520874, "Finetune/Loss (Raw)": 0.6383252143859863, "Finetune/Step": 118, "Finetune/Step Time": 8.172768669613337} {"Finetune/Learning Rate": 1.942046483226278e-06, "Finetune/Loss": 0.7280589938163757, "Finetune/Loss (Raw)": 0.8411493897438049, "Finetune/Step": 119, "Finetune/Step Time": 8.168605850524262} {"Finetune/Learning Rate": 1.940805979532907e-06, "Finetune/Loss": 0.7396230697631836, "Finetune/Loss (Raw)": 0.9543601274490356, "Finetune/Step": 120, "Finetune/Step Time": 8.159381914138795} {"Finetune/Learning Rate": 1.939552744222014e-06, "Finetune/Loss": 0.7435191869735718, "Finetune/Loss (Raw)": 0.8957815766334534, "Finetune/Step": 121, "Finetune/Step Time": 8.16651033567003} {"Finetune/Learning Rate": 1.938286794253219e-06, "Finetune/Loss": 0.7560069561004639, "Finetune/Loss (Raw)": 1.030505895614624, "Finetune/Step": 122, "Finetune/Step Time": 8.15405963287979} {"Finetune/Learning Rate": 1.9370081467582075e-06, "Finetune/Loss": 0.7645430564880371, "Finetune/Loss (Raw)": 0.8454493880271912, "Finetune/Step": 123, "Finetune/Step Time": 8.141553211987503} {"Finetune/Learning Rate": 1.9357168190404938e-06, "Finetune/Loss": 0.7584219574928284, "Finetune/Loss (Raw)": 0.4496978521347046, "Finetune/Step": 124, "Finetune/Step Time": 8.1481388192023} {"Finetune/Learning Rate": 1.9344128285751904e-06, "Finetune/Loss": 0.7554245591163635, "Finetune/Loss (Raw)": 0.7037830948829651, "Finetune/Step": 125, "Finetune/Step Time": 8.154271131515502} {"Finetune/Learning Rate": 1.9330961930087725e-06, "Finetune/Loss": 0.7549006342887878, "Finetune/Loss (Raw)": 0.5102306008338928, "Finetune/Step": 126, "Finetune/Step Time": 8.152476473460121} {"Finetune/Learning Rate": 1.931766930158834e-06, "Finetune/Loss": 0.7424267530441284, "Finetune/Loss (Raw)": 0.36436453461647034, "Finetune/Step": 127, "Finetune/Step Time": 8.149017377162544} {"Finetune/Learning Rate": 1.930425058013852e-06, "Finetune/Loss": 0.7446653246879578, "Finetune/Loss (Raw)": 0.9116120338439941, "Finetune/Step": 128, "Finetune/Step Time": 8.152294974774122} {"Finetune/Learning Rate": 1.9290705947329407e-06, "Finetune/Loss": 0.7428208589553833, "Finetune/Loss (Raw)": 0.702559769153595, "Finetune/Step": 129, "Finetune/Step Time": 8.10907126031816} {"Finetune/Learning Rate": 1.9277035586456053e-06, "Finetune/Loss": 0.7353521585464478, "Finetune/Loss (Raw)": 0.626044511795044, "Finetune/Step": 130, "Finetune/Step Time": 8.100122321397066} {"Finetune/Learning Rate": 1.926323968251495e-06, "Finetune/Loss": 0.7314519882202148, "Finetune/Loss (Raw)": 0.6855503916740417, "Finetune/Step": 131, "Finetune/Step Time": 8.100322686135769} {"Finetune/Learning Rate": 1.924931842220152e-06, "Finetune/Loss": 0.7292096614837646, "Finetune/Loss (Raw)": 0.6657595634460449, "Finetune/Step": 132, "Finetune/Step Time": 8.10139375180006} {"Finetune/Learning Rate": 1.9235271993907604e-06, "Finetune/Loss": 0.7232733964920044, "Finetune/Loss (Raw)": 0.6091256737709045, "Finetune/Step": 133, "Finetune/Step Time": 8.111682575196028} {"Finetune/Learning Rate": 1.922110058771888e-06, "Finetune/Loss": 0.735271692276001, "Finetune/Loss (Raw)": 0.9164590835571289, "Finetune/Step": 134, "Finetune/Step Time": 8.112690281122923} {"Finetune/Learning Rate": 1.920680439541233e-06, "Finetune/Loss": 0.73537677526474, "Finetune/Loss (Raw)": 0.7929632067680359, "Finetune/Step": 135, "Finetune/Step Time": 8.10419625788927} {"Finetune/Learning Rate": 1.9192383610453615e-06, "Finetune/Loss": 0.728008508682251, "Finetune/Loss (Raw)": 0.6429150104522705, "Finetune/Step": 136, "Finetune/Step Time": 8.103712106123567} {"Finetune/Learning Rate": 1.9177838427994463e-06, "Finetune/Loss": 0.7292001247406006, "Finetune/Loss (Raw)": 0.656494140625, "Finetune/Step": 137, "Finetune/Step Time": 8.11459356546402} {"Finetune/Learning Rate": 1.9163169044870047e-06, "Finetune/Loss": 0.7343157529830933, "Finetune/Loss (Raw)": 0.7629834413528442, "Finetune/Step": 138, "Finetune/Step Time": 8.123914670199156} {"Finetune/Learning Rate": 1.914837565959629e-06, "Finetune/Loss": 0.7272433638572693, "Finetune/Loss (Raw)": 0.7477329969406128, "Finetune/Step": 139, "Finetune/Step Time": 8.128167875111103} {"Finetune/Learning Rate": 1.913345847236721e-06, "Finetune/Loss": 0.7242938280105591, "Finetune/Loss (Raw)": 0.7051993608474731, "Finetune/Step": 140, "Finetune/Step Time": 8.117826532572508} {"Finetune/Learning Rate": 1.911841768505219e-06, "Finetune/Loss": 0.7232804298400879, "Finetune/Loss (Raw)": 0.8750138878822327, "Finetune/Step": 141, "Finetune/Step Time": 8.129113510251045} {"Finetune/Learning Rate": 1.9103253501193253e-06, "Finetune/Loss": 0.7170553803443909, "Finetune/Loss (Raw)": 0.8641109466552734, "Finetune/Step": 142, "Finetune/Step Time": 8.120137955993414} {"Finetune/Learning Rate": 1.90879661260023e-06, "Finetune/Loss": 0.7107381820678711, "Finetune/Loss (Raw)": 0.519526481628418, "Finetune/Step": 143, "Finetune/Step Time": 8.12320695631206} {"Finetune/Learning Rate": 1.9072555766358345e-06, "Finetune/Loss": 0.7180532217025757, "Finetune/Loss (Raw)": 0.8516191244125366, "Finetune/Step": 144, "Finetune/Step Time": 8.118682146072388} {"Finetune/Learning Rate": 1.9057022630804714e-06, "Finetune/Loss": 0.7247540950775146, "Finetune/Loss (Raw)": 0.8841038942337036, "Finetune/Step": 145, "Finetune/Step Time": 8.12665930390358} {"Finetune/Learning Rate": 1.9041366929546216e-06, "Finetune/Loss": 0.7304012775421143, "Finetune/Loss (Raw)": 0.8954966068267822, "Finetune/Step": 146, "Finetune/Step Time": 8.117461638525128} {"Finetune/Learning Rate": 1.90255888744463e-06, "Finetune/Loss": 0.7307177782058716, "Finetune/Loss (Raw)": 0.5577958822250366, "Finetune/Step": 147, "Finetune/Step Time": 8.12968523800373} {"Finetune/Learning Rate": 1.9009688679024189e-06, "Finetune/Loss": 0.742587149143219, "Finetune/Loss (Raw)": 0.967198371887207, "Finetune/Step": 148, "Finetune/Step Time": 8.110598336905241} {"Finetune/Learning Rate": 1.8993666558451996e-06, "Finetune/Loss": 0.7417466044425964, "Finetune/Loss (Raw)": 0.661979079246521, "Finetune/Step": 149, "Finetune/Step Time": 8.122831042855978} {"Finetune/Learning Rate": 1.8977522729551797e-06, "Finetune/Loss": 0.7410972118377686, "Finetune/Loss (Raw)": 0.617545485496521, "Finetune/Step": 150, "Finetune/Step Time": 8.122217820957303} {"Finetune/Learning Rate": 1.8961257410792717e-06, "Finetune/Loss": 0.7347741723060608, "Finetune/Loss (Raw)": 0.6388112306594849, "Finetune/Step": 151, "Finetune/Step Time": 8.125153601169586} {"Finetune/Learning Rate": 1.8944870822287954e-06, "Finetune/Loss": 0.72802734375, "Finetune/Loss (Raw)": 0.7384614944458008, "Finetune/Step": 152, "Finetune/Step Time": 8.115594569593668} {"Finetune/Learning Rate": 1.892836318579182e-06, "Finetune/Loss": 0.7245137095451355, "Finetune/Loss (Raw)": 0.7833454012870789, "Finetune/Step": 153, "Finetune/Step Time": 8.135310163721442} {"Finetune/Learning Rate": 1.891173472469672e-06, "Finetune/Loss": 0.7156688570976257, "Finetune/Loss (Raw)": 0.7474710941314697, "Finetune/Step": 154, "Finetune/Step Time": 8.137505451217294} {"Finetune/Learning Rate": 1.8894985664030142e-06, "Finetune/Loss": 0.7119573950767517, "Finetune/Loss (Raw)": 0.7266814708709717, "Finetune/Step": 155, "Finetune/Step Time": 8.137968104332685} {"Finetune/Learning Rate": 1.8878116230451613e-06, "Finetune/Loss": 0.7186722159385681, "Finetune/Loss (Raw)": 0.6645724177360535, "Finetune/Step": 156, "Finetune/Step Time": 8.131628323346376} {"Finetune/Learning Rate": 1.886112665224962e-06, "Finetune/Loss": 0.7162966728210449, "Finetune/Loss (Raw)": 0.6277649998664856, "Finetune/Step": 157, "Finetune/Step Time": 8.139532936736941} {"Finetune/Learning Rate": 1.8844017159338529e-06, "Finetune/Loss": 0.7238640785217285, "Finetune/Loss (Raw)": 0.7523888349533081, "Finetune/Step": 158, "Finetune/Step Time": 8.147205978631973} {"Finetune/Learning Rate": 1.8826787983255471e-06, "Finetune/Loss": 0.7407703399658203, "Finetune/Loss (Raw)": 0.905363142490387, "Finetune/Step": 159, "Finetune/Step Time": 8.144672702997923} {"Finetune/Learning Rate": 1.8809439357157222e-06, "Finetune/Loss": 0.7365674376487732, "Finetune/Loss (Raw)": 0.7771205306053162, "Finetune/Step": 160, "Finetune/Step Time": 8.138436686247587} {"Finetune/Learning Rate": 1.8791971515817019e-06, "Finetune/Loss": 0.7326788902282715, "Finetune/Loss (Raw)": 0.578126072883606, "Finetune/Step": 161, "Finetune/Step Time": 8.144944850355387} {"Finetune/Learning Rate": 1.8774384695621405e-06, "Finetune/Loss": 0.7385411858558655, "Finetune/Loss (Raw)": 0.8136380314826965, "Finetune/Step": 162, "Finetune/Step Time": 8.145868776366115} {"Finetune/Learning Rate": 1.8756679134567035e-06, "Finetune/Loss": 0.7397851943969727, "Finetune/Loss (Raw)": 0.7253584861755371, "Finetune/Step": 163, "Finetune/Step Time": 8.147338543087244} {"Finetune/Learning Rate": 1.8738855072257428e-06, "Finetune/Loss": 0.7464828491210938, "Finetune/Loss (Raw)": 0.8800842761993408, "Finetune/Step": 164, "Finetune/Step Time": 8.13625955954194} {"Finetune/Learning Rate": 1.8720912749899754e-06, "Finetune/Loss": 0.7505017518997192, "Finetune/Loss (Raw)": 0.7377313375473022, "Finetune/Step": 165, "Finetune/Step Time": 8.15655691921711} {"Finetune/Learning Rate": 1.8702852410301553e-06, "Finetune/Loss": 0.7488179206848145, "Finetune/Loss (Raw)": 0.8625748157501221, "Finetune/Step": 166, "Finetune/Step Time": 8.159106513485312} {"Finetune/Learning Rate": 1.868467429786745e-06, "Finetune/Loss": 0.7406893968582153, "Finetune/Loss (Raw)": 0.5328530073165894, "Finetune/Step": 167, "Finetune/Step Time": 8.167778799310327} {"Finetune/Learning Rate": 1.866637865859586e-06, "Finetune/Loss": 0.7444413900375366, "Finetune/Loss (Raw)": 0.7629777789115906, "Finetune/Step": 168, "Finetune/Step Time": 8.165093410760164} {"Finetune/Learning Rate": 1.8647965740075644e-06, "Finetune/Loss": 0.7491466403007507, "Finetune/Loss (Raw)": 0.8070607781410217, "Finetune/Step": 169, "Finetune/Step Time": 8.172305949032307} {"Finetune/Learning Rate": 1.8629435791482763e-06, "Finetune/Loss": 0.7514162063598633, "Finetune/Loss (Raw)": 0.8356103301048279, "Finetune/Step": 170, "Finetune/Step Time": 8.176159251481295} {"Finetune/Learning Rate": 1.861078906357691e-06, "Finetune/Loss": 0.752625584602356, "Finetune/Loss (Raw)": 0.7864335775375366, "Finetune/Step": 171, "Finetune/Step Time": 8.178320977836847} {"Finetune/Learning Rate": 1.8592025808698113e-06, "Finetune/Loss": 0.7558410167694092, "Finetune/Loss (Raw)": 0.8080942630767822, "Finetune/Step": 172, "Finetune/Step Time": 8.174599807709455} {"Finetune/Learning Rate": 1.8573146280763324e-06, "Finetune/Loss": 0.7521925568580627, "Finetune/Loss (Raw)": 0.7582612037658691, "Finetune/Step": 173, "Finetune/Step Time": 8.184572972357273} {"Finetune/Learning Rate": 1.8554150735262971e-06, "Finetune/Loss": 0.7480905055999756, "Finetune/Loss (Raw)": 0.7328474521636963, "Finetune/Step": 174, "Finetune/Step Time": 8.187999900430441} {"Finetune/Learning Rate": 1.8535039429257528e-06, "Finetune/Loss": 0.751968264579773, "Finetune/Loss (Raw)": 0.6436123847961426, "Finetune/Step": 175, "Finetune/Step Time": 8.190631423145533} {"Finetune/Learning Rate": 1.8515812621373995e-06, "Finetune/Loss": 0.7519350051879883, "Finetune/Loss (Raw)": 0.8505551815032959, "Finetune/Step": 176, "Finetune/Step Time": 8.18467452377081} {"Finetune/Learning Rate": 1.8496470571802441e-06, "Finetune/Loss": 0.7485690116882324, "Finetune/Loss (Raw)": 0.7763920426368713, "Finetune/Step": 177, "Finetune/Step Time": 8.20068888925016} {"Finetune/Learning Rate": 1.8477013542292443e-06, "Finetune/Loss": 0.742199718952179, "Finetune/Loss (Raw)": 0.6916806101799011, "Finetune/Step": 178, "Finetune/Step Time": 8.21746757440269} {"Finetune/Learning Rate": 1.8457441796149584e-06, "Finetune/Loss": 0.7461390495300293, "Finetune/Loss (Raw)": 0.6838520765304565, "Finetune/Step": 179, "Finetune/Step Time": 8.218134259805083} {"Finetune/Learning Rate": 1.8437755598231854e-06, "Finetune/Loss": 0.7347394227981567, "Finetune/Loss (Raw)": 0.6024124026298523, "Finetune/Step": 180, "Finetune/Step Time": 8.220284044742584} {"Finetune/Learning Rate": 1.841795521494609e-06, "Finetune/Loss": 0.7383739948272705, "Finetune/Loss (Raw)": 0.778285026550293, "Finetune/Step": 181, "Finetune/Step Time": 8.21342265419662} {"Finetune/Learning Rate": 1.839804091424436e-06, "Finetune/Loss": 0.7400475144386292, "Finetune/Loss (Raw)": 0.6710984110832214, "Finetune/Step": 182, "Finetune/Step Time": 8.217505667358637} {"Finetune/Learning Rate": 1.8378012965620333e-06, "Finetune/Loss": 0.7369861602783203, "Finetune/Loss (Raw)": 0.5408456325531006, "Finetune/Step": 183, "Finetune/Step Time": 8.217663384974003} {"Finetune/Learning Rate": 1.8357871640105645e-06, "Finetune/Loss": 0.7427244782447815, "Finetune/Loss (Raw)": 0.9220883250236511, "Finetune/Step": 184, "Finetune/Step Time": 8.214239202439785} {"Finetune/Learning Rate": 1.8337617210266223e-06, "Finetune/Loss": 0.7376034259796143, "Finetune/Loss (Raw)": 0.6194739937782288, "Finetune/Step": 185, "Finetune/Step Time": 8.217092180624604} {"Finetune/Learning Rate": 1.8317249950198596e-06, "Finetune/Loss": 0.7323201894760132, "Finetune/Loss (Raw)": 0.5784069299697876, "Finetune/Step": 186, "Finetune/Step Time": 8.223856594413519} {"Finetune/Learning Rate": 1.8296770135526187e-06, "Finetune/Loss": 0.7330161929130554, "Finetune/Loss (Raw)": 0.7489522695541382, "Finetune/Step": 187, "Finetune/Step Time": 8.236478589475155} {"Finetune/Learning Rate": 1.8276178043395584e-06, "Finetune/Loss": 0.729059636592865, "Finetune/Loss (Raw)": 0.5379623174667358, "Finetune/Step": 188, "Finetune/Step Time": 8.230481281876564} {"Finetune/Learning Rate": 1.825547395247279e-06, "Finetune/Loss": 0.7463459968566895, "Finetune/Loss (Raw)": 1.1809312105178833, "Finetune/Step": 189, "Finetune/Step Time": 8.226396191865206} {"Finetune/Learning Rate": 1.8234658142939453e-06, "Finetune/Loss": 0.7467281222343445, "Finetune/Loss (Raw)": 0.7646147012710571, "Finetune/Step": 190, "Finetune/Step Time": 8.231104861944914} {"Finetune/Learning Rate": 1.821373089648906e-06, "Finetune/Loss": 0.7427999973297119, "Finetune/Loss (Raw)": 0.7796639800071716, "Finetune/Step": 191, "Finetune/Step Time": 8.239301869645715} {"Finetune/Learning Rate": 1.8192692496323154e-06, "Finetune/Loss": 0.7384656071662903, "Finetune/Loss (Raw)": 0.6384196877479553, "Finetune/Step": 192, "Finetune/Step Time": 8.238349562510848} {"Finetune/Learning Rate": 1.8171543227147472e-06, "Finetune/Loss": 0.7424736022949219, "Finetune/Loss (Raw)": 0.7063843011856079, "Finetune/Step": 193, "Finetune/Step Time": 8.225359365344048} {"Finetune/Learning Rate": 1.8150283375168112e-06, "Finetune/Loss": 0.7400912046432495, "Finetune/Loss (Raw)": 0.7374001145362854, "Finetune/Step": 194, "Finetune/Step Time": 8.234932765364647} {"Finetune/Learning Rate": 1.812891322808765e-06, "Finetune/Loss": 0.738048791885376, "Finetune/Loss (Raw)": 0.6600022912025452, "Finetune/Step": 195, "Finetune/Step Time": 8.234945721924305} {"Finetune/Learning Rate": 1.8107433075101251e-06, "Finetune/Loss": 0.7379904389381409, "Finetune/Loss (Raw)": 0.8782154321670532, "Finetune/Step": 196, "Finetune/Step Time": 8.227682089433074} {"Finetune/Learning Rate": 1.8085843206892748e-06, "Finetune/Loss": 0.734855055809021, "Finetune/Loss (Raw)": 0.6373993158340454, "Finetune/Step": 197, "Finetune/Step Time": 8.228883858770132} {"Finetune/Learning Rate": 1.8064143915630721e-06, "Finetune/Loss": 0.7263481020927429, "Finetune/Loss (Raw)": 0.5903528928756714, "Finetune/Step": 198, "Finetune/Step Time": 8.234011318534613} {"Finetune/Learning Rate": 1.8042335494964533e-06, "Finetune/Loss": 0.7409375905990601, "Finetune/Loss (Raw)": 0.9997148513793945, "Finetune/Step": 199, "Finetune/Step Time": 8.234588388353586} {"Finetune/Learning Rate": 1.8020418240020358e-06, "Finetune/Loss": 0.735733151435852, "Finetune/Loss (Raw)": 0.5964370965957642, "Finetune/Step": 200, "Finetune/Step Time": 8.233554596081376} {"Finetune/Learning Rate": 1.7998392447397195e-06, "Finetune/Loss": 0.7322739362716675, "Finetune/Loss (Raw)": 0.6963669657707214, "Finetune/Step": 201, "Finetune/Step Time": 8.240076538175344} {"Finetune/Learning Rate": 1.7976258415162833e-06, "Finetune/Loss": 0.7169126272201538, "Finetune/Loss (Raw)": 0.34404700994491577, "Finetune/Step": 202, "Finetune/Step Time": 8.23892386816442} {"Finetune/Learning Rate": 1.7954016442849853e-06, "Finetune/Loss": 0.7150916457176208, "Finetune/Loss (Raw)": 0.7281608581542969, "Finetune/Step": 203, "Finetune/Step Time": 8.237633844837546} {"Finetune/Learning Rate": 1.7931666831451535e-06, "Finetune/Loss": 0.7133442759513855, "Finetune/Loss (Raw)": 0.7521803379058838, "Finetune/Step": 204, "Finetune/Step Time": 8.237342722713947} {"Finetune/Learning Rate": 1.7909209883417812e-06, "Finetune/Loss": 0.715347170829773, "Finetune/Loss (Raw)": 0.8223538398742676, "Finetune/Step": 205, "Finetune/Step Time": 8.23551925830543} {"Finetune/Learning Rate": 1.7886645902651164e-06, "Finetune/Loss": 0.7199630737304688, "Finetune/Loss (Raw)": 0.8805556893348694, "Finetune/Step": 206, "Finetune/Step Time": 8.24155642464757} {"Finetune/Learning Rate": 1.7863975194502522e-06, "Finetune/Loss": 0.7225880026817322, "Finetune/Loss (Raw)": 0.7276099920272827, "Finetune/Step": 207, "Finetune/Step Time": 8.24134910851717} {"Finetune/Learning Rate": 1.7841198065767105e-06, "Finetune/Loss": 0.7176876068115234, "Finetune/Loss (Raw)": 0.6937423944473267, "Finetune/Step": 208, "Finetune/Step Time": 8.236577570438385} {"Finetune/Learning Rate": 1.7818314824680298e-06, "Finetune/Loss": 0.7165228724479675, "Finetune/Loss (Raw)": 0.7391218543052673, "Finetune/Step": 209, "Finetune/Step Time": 8.23305120691657} {"Finetune/Learning Rate": 1.7795325780913469e-06, "Finetune/Loss": 0.7151067852973938, "Finetune/Loss (Raw)": 0.646365225315094, "Finetune/Step": 210, "Finetune/Step Time": 8.241420902311802} {"Finetune/Learning Rate": 1.7772231245569777e-06, "Finetune/Loss": 0.714853048324585, "Finetune/Loss (Raw)": 0.6757323741912842, "Finetune/Step": 211, "Finetune/Step Time": 8.241460610181093} {"Finetune/Learning Rate": 1.7749031531179962e-06, "Finetune/Loss": 0.7153056859970093, "Finetune/Loss (Raw)": 0.6168981790542603, "Finetune/Step": 212, "Finetune/Step Time": 8.237747482955456} {"Finetune/Learning Rate": 1.772572695169812e-06, "Finetune/Loss": 0.7202032804489136, "Finetune/Loss (Raw)": 0.9350075721740723, "Finetune/Step": 213, "Finetune/Step Time": 8.236372541636229} {"Finetune/Learning Rate": 1.7702317822497454e-06, "Finetune/Loss": 0.7191460132598877, "Finetune/Loss (Raw)": 0.637264609336853, "Finetune/Step": 214, "Finetune/Step Time": 8.233595931902528} {"Finetune/Learning Rate": 1.7678804460366e-06, "Finetune/Loss": 0.7183898091316223, "Finetune/Loss (Raw)": 0.5166471600532532, "Finetune/Step": 215, "Finetune/Step Time": 8.2424539308995} {"Finetune/Learning Rate": 1.7655187183502342e-06, "Finetune/Loss": 0.7159522771835327, "Finetune/Loss (Raw)": 0.8440881967544556, "Finetune/Step": 216, "Finetune/Step Time": 8.23068481683731} {"Finetune/Learning Rate": 1.7631466311511314e-06, "Finetune/Loss": 0.722637414932251, "Finetune/Loss (Raw)": 0.8333979845046997, "Finetune/Step": 217, "Finetune/Step Time": 8.22191659733653} {"Finetune/Learning Rate": 1.7607642165399663e-06, "Finetune/Loss": 0.719668984413147, "Finetune/Loss (Raw)": 0.4834175407886505, "Finetune/Step": 218, "Finetune/Step Time": 8.228177482262254} {"Finetune/Learning Rate": 1.7583715067571716e-06, "Finetune/Loss": 0.7240577936172485, "Finetune/Loss (Raw)": 0.8893941044807434, "Finetune/Step": 219, "Finetune/Step Time": 8.223600158467889} {"Finetune/Learning Rate": 1.7559685341825009e-06, "Finetune/Loss": 0.7273392677307129, "Finetune/Loss (Raw)": 0.642969012260437, "Finetune/Step": 220, "Finetune/Step Time": 8.213178757578135} {"Finetune/Learning Rate": 1.7535553313345904e-06, "Finetune/Loss": 0.7059352993965149, "Finetune/Loss (Raw)": 0.49600425362586975, "Finetune/Step": 221, "Finetune/Step Time": 8.224925827234983} {"Finetune/Learning Rate": 1.7511319308705197e-06, "Finetune/Loss": 0.7106304168701172, "Finetune/Loss (Raw)": 0.9148595929145813, "Finetune/Step": 222, "Finetune/Step Time": 8.224968582391739} {"Finetune/Learning Rate": 1.7486983655853698e-06, "Finetune/Loss": 0.7116391062736511, "Finetune/Loss (Raw)": 0.8119412064552307, "Finetune/Step": 223, "Finetune/Step Time": 8.224092854186893} {"Finetune/Learning Rate": 1.7462546684117779e-06, "Finetune/Loss": 0.7045779824256897, "Finetune/Loss (Raw)": 0.4124630093574524, "Finetune/Step": 224, "Finetune/Step Time": 8.216138618066907} {"Finetune/Learning Rate": 1.7438008724194928e-06, "Finetune/Loss": 0.7099413871765137, "Finetune/Loss (Raw)": 0.8780146837234497, "Finetune/Step": 225, "Finetune/Step Time": 8.212607927620411} {"Finetune/Learning Rate": 1.7413370108149287e-06, "Finetune/Loss": 0.7061430215835571, "Finetune/Loss (Raw)": 0.6158514022827148, "Finetune/Step": 226, "Finetune/Step Time": 8.214491048827767} {"Finetune/Learning Rate": 1.7388631169407123e-06, "Finetune/Loss": 0.6997050642967224, "Finetune/Loss (Raw)": 0.45398783683776855, "Finetune/Step": 227, "Finetune/Step Time": 8.217708257958293} {"Finetune/Learning Rate": 1.7363792242752351e-06, "Finetune/Loss": 0.6905880570411682, "Finetune/Loss (Raw)": 0.5864713191986084, "Finetune/Step": 228, "Finetune/Step Time": 8.217063447460532} {"Finetune/Learning Rate": 1.733885366432199e-06, "Finetune/Loss": 0.6894593238830566, "Finetune/Loss (Raw)": 0.6012790203094482, "Finetune/Step": 229, "Finetune/Step Time": 8.221099400892854} {"Finetune/Learning Rate": 1.7313815771601608e-06, "Finetune/Loss": 0.6900476217269897, "Finetune/Loss (Raw)": 0.6091784238815308, "Finetune/Step": 230, "Finetune/Step Time": 8.217105608433485} {"Finetune/Learning Rate": 1.7288678903420762e-06, "Finetune/Loss": 0.6826992630958557, "Finetune/Loss (Raw)": 0.7645690441131592, "Finetune/Step": 231, "Finetune/Step Time": 8.222638016566634} {"Finetune/Learning Rate": 1.7263443399948407e-06, "Finetune/Loss": 0.6893703937530518, "Finetune/Loss (Raw)": 0.8099119663238525, "Finetune/Step": 232, "Finetune/Step Time": 8.219022195786238} {"Finetune/Learning Rate": 1.723810960268831e-06, "Finetune/Loss": 0.6903643608093262, "Finetune/Loss (Raw)": 0.7281734943389893, "Finetune/Step": 233, "Finetune/Step Time": 8.218884075060487} {"Finetune/Learning Rate": 1.72126778544744e-06, "Finetune/Loss": 0.6986916065216064, "Finetune/Loss (Raw)": 0.6105203628540039, "Finetune/Step": 234, "Finetune/Step Time": 8.218180857598782} {"Finetune/Learning Rate": 1.7187148499466158e-06, "Finetune/Loss": 0.7000617980957031, "Finetune/Loss (Raw)": 0.7720062732696533, "Finetune/Step": 235, "Finetune/Step Time": 8.220927309244871} {"Finetune/Learning Rate": 1.7161521883143932e-06, "Finetune/Loss": 0.6927201151847839, "Finetune/Loss (Raw)": 0.5172455310821533, "Finetune/Step": 236, "Finetune/Step Time": 8.218430001288652} {"Finetune/Learning Rate": 1.7135798352304288e-06, "Finetune/Loss": 0.6903230547904968, "Finetune/Loss (Raw)": 0.7456501722335815, "Finetune/Step": 237, "Finetune/Step Time": 8.220463503152132} {"Finetune/Learning Rate": 1.7109978255055292e-06, "Finetune/Loss": 0.686388373374939, "Finetune/Loss (Raw)": 0.7546454668045044, "Finetune/Step": 238, "Finetune/Step Time": 8.220822215080261} {"Finetune/Learning Rate": 1.7084061940811824e-06, "Finetune/Loss": 0.6774868965148926, "Finetune/Loss (Raw)": 0.4427635073661804, "Finetune/Step": 239, "Finetune/Step Time": 8.225940007716417} {"Finetune/Learning Rate": 1.7058049760290828e-06, "Finetune/Loss": 0.6770272254943848, "Finetune/Loss (Raw)": 0.6790297031402588, "Finetune/Step": 240, "Finetune/Step Time": 8.22200015373528} {"Finetune/Learning Rate": 1.7031942065506574e-06, "Finetune/Loss": 0.6747690439224243, "Finetune/Loss (Raw)": 0.6668626070022583, "Finetune/Step": 241, "Finetune/Step Time": 8.211970193311572} {"Finetune/Learning Rate": 1.7005739209765904e-06, "Finetune/Loss": 0.6781421303749084, "Finetune/Loss (Raw)": 0.7543028593063354, "Finetune/Step": 242, "Finetune/Step Time": 8.198791513219476} {"Finetune/Learning Rate": 1.6979441547663433e-06, "Finetune/Loss": 0.6738342046737671, "Finetune/Loss (Raw)": 0.5378786325454712, "Finetune/Step": 243, "Finetune/Step Time": 8.204445518553257} {"Finetune/Learning Rate": 1.6953049435076767e-06, "Finetune/Loss": 0.678647518157959, "Finetune/Loss (Raw)": 0.7709237933158875, "Finetune/Step": 244, "Finetune/Step Time": 8.194263383746147} {"Finetune/Learning Rate": 1.692656322916167e-06, "Finetune/Loss": 0.6660218834877014, "Finetune/Loss (Raw)": 0.5309868454933167, "Finetune/Step": 245, "Finetune/Step Time": 8.187900079414248} {"Finetune/Learning Rate": 1.6899983288347247e-06, "Finetune/Loss": 0.673303484916687, "Finetune/Loss (Raw)": 0.8702768683433533, "Finetune/Step": 246, "Finetune/Step Time": 8.180267505347729} {"Finetune/Learning Rate": 1.6873309972331082e-06, "Finetune/Loss": 0.6745977997779846, "Finetune/Loss (Raw)": 0.558064341545105, "Finetune/Step": 247, "Finetune/Step Time": 8.190600933507085} {"Finetune/Learning Rate": 1.684654364207438e-06, "Finetune/Loss": 0.6663388609886169, "Finetune/Loss (Raw)": 0.5798025131225586, "Finetune/Step": 248, "Finetune/Step Time": 8.199034564197063} {"Finetune/Learning Rate": 1.6819684659797075e-06, "Finetune/Loss": 0.6590651273727417, "Finetune/Loss (Raw)": 0.6006399393081665, "Finetune/Step": 249, "Finetune/Step Time": 8.20359281823039} {"Finetune/Learning Rate": 1.6792733388972931e-06, "Finetune/Loss": 0.666793704032898, "Finetune/Loss (Raw)": 0.7307294607162476, "Finetune/Step": 250, "Finetune/Step Time": 8.214663559570909} {"Finetune/Learning Rate": 1.6765690194324615e-06, "Finetune/Loss": 0.663303792476654, "Finetune/Loss (Raw)": 0.777717649936676, "Finetune/Step": 251, "Finetune/Step Time": 8.2332533467561} {"Finetune/Learning Rate": 1.6738555441818782e-06, "Finetune/Loss": 0.6592702865600586, "Finetune/Loss (Raw)": 0.5138977766036987, "Finetune/Step": 252, "Finetune/Step Time": 8.215701222419739} {"Finetune/Learning Rate": 1.67113294986611e-06, "Finetune/Loss": 0.6656836867332458, "Finetune/Loss (Raw)": 0.7012330293655396, "Finetune/Step": 253, "Finetune/Step Time": 8.208479469642043} {"Finetune/Learning Rate": 1.6684012733291289e-06, "Finetune/Loss": 0.6552008986473083, "Finetune/Loss (Raw)": 0.5794099569320679, "Finetune/Step": 254, "Finetune/Step Time": 8.208647929131985} {"Finetune/Learning Rate": 1.6656605515378146e-06, "Finetune/Loss": 0.6549873352050781, "Finetune/Loss (Raw)": 0.8051059246063232, "Finetune/Step": 255, "Finetune/Step Time": 8.215565368533134} {"Finetune/Learning Rate": 1.6629108215814523e-06, "Finetune/Loss": 0.664789080619812, "Finetune/Loss (Raw)": 0.7261197566986084, "Finetune/Step": 256, "Finetune/Step Time": 8.208769192919135} {"Finetune/Learning Rate": 1.6601521206712316e-06, "Finetune/Loss": 0.6634975075721741, "Finetune/Loss (Raw)": 0.8366852402687073, "Finetune/Step": 257, "Finetune/Step Time": 8.208143236115575} {"Finetune/Learning Rate": 1.6573844861397444e-06, "Finetune/Loss": 0.666907012462616, "Finetune/Loss (Raw)": 0.7249550223350525, "Finetune/Step": 258, "Finetune/Step Time": 8.214850183576345} {"Finetune/Learning Rate": 1.6546079554404764e-06, "Finetune/Loss": 0.6724696755409241, "Finetune/Loss (Raw)": 0.6319937705993652, "Finetune/Step": 259, "Finetune/Step Time": 8.218301760032773} {"Finetune/Learning Rate": 1.6518225661473042e-06, "Finetune/Loss": 0.6742480397224426, "Finetune/Loss (Raw)": 0.6433791518211365, "Finetune/Step": 260, "Finetune/Step Time": 8.215660052374005} {"Finetune/Learning Rate": 1.6490283559539836e-06, "Finetune/Loss": 0.6736900806427002, "Finetune/Loss (Raw)": 0.5834246873855591, "Finetune/Step": 261, "Finetune/Step Time": 8.217009229585528} {"Finetune/Learning Rate": 1.6462253626736412e-06, "Finetune/Loss": 0.6780363321304321, "Finetune/Loss (Raw)": 0.7482554316520691, "Finetune/Step": 262, "Finetune/Step Time": 8.217529559507966} {"Finetune/Learning Rate": 1.6434136242382611e-06, "Finetune/Loss": 0.6721709966659546, "Finetune/Loss (Raw)": 0.5768792033195496, "Finetune/Step": 263, "Finetune/Step Time": 8.220732102170587} {"Finetune/Learning Rate": 1.6405931786981752e-06, "Finetune/Loss": 0.6617582440376282, "Finetune/Loss (Raw)": 0.4767047166824341, "Finetune/Step": 264, "Finetune/Step Time": 8.21050250530243} {"Finetune/Learning Rate": 1.637764064221543e-06, "Finetune/Loss": 0.6584570407867432, "Finetune/Loss (Raw)": 0.6225340366363525, "Finetune/Step": 265, "Finetune/Step Time": 8.209130266681314} {"Finetune/Learning Rate": 1.63492631909384e-06, "Finetune/Loss": 0.6547315120697021, "Finetune/Loss (Raw)": 0.4913027286529541, "Finetune/Step": 266, "Finetune/Step Time": 8.210684588178992} {"Finetune/Learning Rate": 1.6320799817173356e-06, "Finetune/Loss": 0.6411423087120056, "Finetune/Loss (Raw)": 0.33715322613716125, "Finetune/Step": 267, "Finetune/Step Time": 8.213788909837604} {"Finetune/Learning Rate": 1.6292250906105769e-06, "Finetune/Loss": 0.6410590410232544, "Finetune/Loss (Raw)": 0.5145804286003113, "Finetune/Step": 268, "Finetune/Step Time": 8.21546139381826} {"Finetune/Learning Rate": 1.6263616844078651e-06, "Finetune/Loss": 0.6423385143280029, "Finetune/Loss (Raw)": 0.7865951061248779, "Finetune/Step": 269, "Finetune/Step Time": 8.215663082897663} {"Finetune/Learning Rate": 1.6234898018587336e-06, "Finetune/Loss": 0.6350007057189941, "Finetune/Loss (Raw)": 0.5198345184326172, "Finetune/Step": 270, "Finetune/Step Time": 8.22196388617158} {"Finetune/Learning Rate": 1.6206094818274228e-06, "Finetune/Loss": 0.6340144872665405, "Finetune/Loss (Raw)": 0.4112033247947693, "Finetune/Step": 271, "Finetune/Step Time": 8.224049353972077} {"Finetune/Learning Rate": 1.6177207632923556e-06, "Finetune/Loss": 0.6295524835586548, "Finetune/Loss (Raw)": 0.5362470149993896, "Finetune/Step": 272, "Finetune/Step Time": 8.217443600296974} {"Finetune/Learning Rate": 1.6148236853456085e-06, "Finetune/Loss": 0.6317451000213623, "Finetune/Loss (Raw)": 0.7370251417160034, "Finetune/Step": 273, "Finetune/Step Time": 8.222385052591562} {"Finetune/Learning Rate": 1.6119182871923833e-06, "Finetune/Loss": 0.6272639036178589, "Finetune/Loss (Raw)": 0.6109045147895813, "Finetune/Step": 274, "Finetune/Step Time": 8.233561845496297} {"Finetune/Learning Rate": 1.6090046081504766e-06, "Finetune/Loss": 0.6289491653442383, "Finetune/Loss (Raw)": 0.5918078422546387, "Finetune/Step": 275, "Finetune/Step Time": 8.237091498449445} {"Finetune/Learning Rate": 1.6060826876497477e-06, "Finetune/Loss": 0.6262859106063843, "Finetune/Loss (Raw)": 0.6856992840766907, "Finetune/Step": 276, "Finetune/Step Time": 8.243941510096192} {"Finetune/Learning Rate": 1.6031525652315843e-06, "Finetune/Loss": 0.622409462928772, "Finetune/Loss (Raw)": 0.40694040060043335, "Finetune/Step": 277, "Finetune/Step Time": 8.242366364225745} {"Finetune/Learning Rate": 1.6002142805483684e-06, "Finetune/Loss": 0.6092771291732788, "Finetune/Loss (Raw)": 0.45004209876060486, "Finetune/Step": 278, "Finetune/Step Time": 8.246095886453986} {"Finetune/Learning Rate": 1.5972678733629386e-06, "Finetune/Loss": 0.6070301532745361, "Finetune/Loss (Raw)": 0.4861607849597931, "Finetune/Step": 279, "Finetune/Step Time": 8.249266773462296} {"Finetune/Learning Rate": 1.5943133835480533e-06, "Finetune/Loss": 0.6098250150680542, "Finetune/Loss (Raw)": 0.669238805770874, "Finetune/Step": 280, "Finetune/Step Time": 8.235404344275594} {"Finetune/Learning Rate": 1.5913508510858508e-06, "Finetune/Loss": 0.6188188195228577, "Finetune/Loss (Raw)": 0.8884420394897461, "Finetune/Step": 281, "Finetune/Step Time": 8.237579429522157} {"Finetune/Learning Rate": 1.5883803160673068e-06, "Finetune/Loss": 0.6109426617622375, "Finetune/Loss (Raw)": 0.4786924123764038, "Finetune/Step": 282, "Finetune/Step Time": 8.236711006611586} {"Finetune/Learning Rate": 1.5854018186916938e-06, "Finetune/Loss": 0.6079537272453308, "Finetune/Loss (Raw)": 0.682072103023529, "Finetune/Step": 283, "Finetune/Step Time": 8.243474464863539} {"Finetune/Learning Rate": 1.5824153992660358e-06, "Finetune/Loss": 0.6112866997718811, "Finetune/Loss (Raw)": 0.6205520629882812, "Finetune/Step": 284, "Finetune/Step Time": 8.240037579089403} {"Finetune/Learning Rate": 1.5794210982045635e-06, "Finetune/Loss": 0.6026301383972168, "Finetune/Loss (Raw)": 0.4242229759693146, "Finetune/Step": 285, "Finetune/Step Time": 8.241248462349176} {"Finetune/Learning Rate": 1.5764189560281674e-06, "Finetune/Loss": 0.607843816280365, "Finetune/Loss (Raw)": 0.7462479472160339, "Finetune/Step": 286, "Finetune/Step Time": 8.229700226336718} {"Finetune/Learning Rate": 1.573409013363849e-06, "Finetune/Loss": 0.6066193580627441, "Finetune/Loss (Raw)": 0.765924334526062, "Finetune/Step": 287, "Finetune/Step Time": 8.23453607968986} {"Finetune/Learning Rate": 1.5703913109441712e-06, "Finetune/Loss": 0.5987279415130615, "Finetune/Loss (Raw)": 0.4735930263996124, "Finetune/Step": 288, "Finetune/Step Time": 8.231039859354496} {"Finetune/Learning Rate": 1.5673658896067067e-06, "Finetune/Loss": 0.6000238656997681, "Finetune/Loss (Raw)": 0.8781557679176331, "Finetune/Step": 289, "Finetune/Step Time": 8.232533007860184} {"Finetune/Learning Rate": 1.5643327902934867e-06, "Finetune/Loss": 0.5914379358291626, "Finetune/Loss (Raw)": 0.45020434260368347, "Finetune/Step": 290, "Finetune/Step Time": 8.232704110443592} {"Finetune/Learning Rate": 1.5612920540504452e-06, "Finetune/Loss": 0.5910717248916626, "Finetune/Loss (Raw)": 0.6202751994132996, "Finetune/Step": 291, "Finetune/Step Time": 8.239120103418827} {"Finetune/Learning Rate": 1.5582437220268645e-06, "Finetune/Loss": 0.5859724283218384, "Finetune/Loss (Raw)": 0.4802022874355316, "Finetune/Step": 292, "Finetune/Step Time": 8.239243926480412} {"Finetune/Learning Rate": 1.5551878354748185e-06, "Finetune/Loss": 0.5916406512260437, "Finetune/Loss (Raw)": 0.764808177947998, "Finetune/Step": 293, "Finetune/Step Time": 8.241679348051548} {"Finetune/Learning Rate": 1.5521244357486132e-06, "Finetune/Loss": 0.5875035524368286, "Finetune/Loss (Raw)": 0.6158686876296997, "Finetune/Step": 294, "Finetune/Step Time": 8.241852261126041} {"Finetune/Learning Rate": 1.5490535643042284e-06, "Finetune/Loss": 0.5876559019088745, "Finetune/Loss (Raw)": 0.5817544460296631, "Finetune/Step": 295, "Finetune/Step Time": 8.252083403989673} {"Finetune/Learning Rate": 1.5459752626987562e-06, "Finetune/Loss": 0.5924941301345825, "Finetune/Loss (Raw)": 0.631525993347168, "Finetune/Step": 296, "Finetune/Step Time": 8.247899688780308} {"Finetune/Learning Rate": 1.5428895725898383e-06, "Finetune/Loss": 0.5873022675514221, "Finetune/Loss (Raw)": 0.45639634132385254, "Finetune/Step": 297, "Finetune/Step Time": 8.248388711363077} {"Finetune/Learning Rate": 1.5397965357351034e-06, "Finetune/Loss": 0.5936338305473328, "Finetune/Loss (Raw)": 0.6939111948013306, "Finetune/Step": 298, "Finetune/Step Time": 8.250023076310754} {"Finetune/Learning Rate": 1.5366961939916006e-06, "Finetune/Loss": 0.6083956360816956, "Finetune/Loss (Raw)": 0.8095324039459229, "Finetune/Step": 299, "Finetune/Step Time": 8.254106774926186} {"Finetune/Learning Rate": 1.5335885893152333e-06, "Finetune/Loss": 0.6149575710296631, "Finetune/Loss (Raw)": 0.7245610356330872, "Finetune/Step": 300, "Finetune/Step Time": 8.25250007212162} {"Finetune/Learning Rate": 1.5304737637601926e-06, "Finetune/Loss": 0.6109316349029541, "Finetune/Loss (Raw)": 0.6577668190002441, "Finetune/Step": 301, "Finetune/Step Time": 8.250673048198223} {"Finetune/Learning Rate": 1.5273517594783875e-06, "Finetune/Loss": 0.609856128692627, "Finetune/Loss (Raw)": 0.48541688919067383, "Finetune/Step": 302, "Finetune/Step Time": 8.248989447951317} {"Finetune/Learning Rate": 1.5242226187188733e-06, "Finetune/Loss": 0.6215323209762573, "Finetune/Loss (Raw)": 0.7848411202430725, "Finetune/Step": 303, "Finetune/Step Time": 8.250467857345939} {"Finetune/Learning Rate": 1.5210863838272818e-06, "Finetune/Loss": 0.6243193745613098, "Finetune/Loss (Raw)": 0.6254329085350037, "Finetune/Step": 304, "Finetune/Step Time": 8.249635120853782} {"Finetune/Learning Rate": 1.5179430972452468e-06, "Finetune/Loss": 0.6153388023376465, "Finetune/Loss (Raw)": 0.4496474266052246, "Finetune/Step": 305, "Finetune/Step Time": 8.250309649854898} {"Finetune/Learning Rate": 1.5147928015098307e-06, "Finetune/Loss": 0.6190809011459351, "Finetune/Loss (Raw)": 0.7306502461433411, "Finetune/Step": 306, "Finetune/Step Time": 8.248871682211757} {"Finetune/Learning Rate": 1.5116355392529485e-06, "Finetune/Loss": 0.6201831102371216, "Finetune/Loss (Raw)": 0.6270795464515686, "Finetune/Step": 307, "Finetune/Step Time": 8.255950134247541} {"Finetune/Learning Rate": 1.5084713532007904e-06, "Finetune/Loss": 0.6183590888977051, "Finetune/Loss (Raw)": 0.6273305416107178, "Finetune/Step": 308, "Finetune/Step Time": 8.247870247811079} {"Finetune/Learning Rate": 1.5053002861732443e-06, "Finetune/Loss": 0.6253807544708252, "Finetune/Loss (Raw)": 0.6316333413124084, "Finetune/Step": 309, "Finetune/Step Time": 8.261579617857933} {"Finetune/Learning Rate": 1.5021223810833165e-06, "Finetune/Loss": 0.6358621120452881, "Finetune/Loss (Raw)": 0.7854472994804382, "Finetune/Step": 310, "Finetune/Step Time": 8.260334772989154} {"Finetune/Learning Rate": 1.4989376809365494e-06, "Finetune/Loss": 0.6380155682563782, "Finetune/Loss (Raw)": 0.5550707578659058, "Finetune/Step": 311, "Finetune/Step Time": 8.266726607456803} {"Finetune/Learning Rate": 1.4957462288304418e-06, "Finetune/Loss": 0.6325434446334839, "Finetune/Loss (Raw)": 0.49413084983825684, "Finetune/Step": 312, "Finetune/Step Time": 8.262875882908702} {"Finetune/Learning Rate": 1.4925480679538644e-06, "Finetune/Loss": 0.6192367672920227, "Finetune/Loss (Raw)": 0.462628036737442, "Finetune/Step": 313, "Finetune/Step Time": 8.26078781299293} {"Finetune/Learning Rate": 1.489343241586475e-06, "Finetune/Loss": 0.6216601133346558, "Finetune/Loss (Raw)": 0.5562398433685303, "Finetune/Step": 314, "Finetune/Step Time": 8.260475086048245} {"Finetune/Learning Rate": 1.4861317930981333e-06, "Finetune/Loss": 0.6168132424354553, "Finetune/Loss (Raw)": 0.5269725918769836, "Finetune/Step": 315, "Finetune/Step Time": 8.266457490622997} {"Finetune/Learning Rate": 1.4829137659483142e-06, "Finetune/Loss": 0.619225263595581, "Finetune/Loss (Raw)": 0.6977347135543823, "Finetune/Step": 316, "Finetune/Step Time": 8.260891243815422} {"Finetune/Learning Rate": 1.47968920368552e-06, "Finetune/Loss": 0.6179523468017578, "Finetune/Loss (Raw)": 0.3834901452064514, "Finetune/Step": 317, "Finetune/Step Time": 8.267824715003371} {"Finetune/Learning Rate": 1.4764581499466892e-06, "Finetune/Loss": 0.6134445667266846, "Finetune/Loss (Raw)": 0.6019992828369141, "Finetune/Step": 318, "Finetune/Step Time": 8.269760571420193} {"Finetune/Learning Rate": 1.4732206484566089e-06, "Finetune/Loss": 0.6042500734329224, "Finetune/Loss (Raw)": 0.4717017412185669, "Finetune/Step": 319, "Finetune/Step Time": 8.277317879721522} {"Finetune/Learning Rate": 1.46997674302732e-06, "Finetune/Loss": 0.6078135967254639, "Finetune/Loss (Raw)": 0.5876243114471436, "Finetune/Step": 320, "Finetune/Step Time": 8.271461511030793} {"Finetune/Learning Rate": 1.4667264775575267e-06, "Finetune/Loss": 0.5925869941711426, "Finetune/Loss (Raw)": 0.39090490341186523, "Finetune/Step": 321, "Finetune/Step Time": 8.281856883317232} {"Finetune/Learning Rate": 1.4634698960320017e-06, "Finetune/Loss": 0.5972726345062256, "Finetune/Loss (Raw)": 0.6001442670822144, "Finetune/Step": 322, "Finetune/Step Time": 8.271885493770242} {"Finetune/Learning Rate": 1.46020704252099e-06, "Finetune/Loss": 0.5970953702926636, "Finetune/Loss (Raw)": 0.6146036386489868, "Finetune/Step": 323, "Finetune/Step Time": 8.275404799729586} {"Finetune/Learning Rate": 1.4569379611796135e-06, "Finetune/Loss": 0.6007739305496216, "Finetune/Loss (Raw)": 0.5979160666465759, "Finetune/Step": 324, "Finetune/Step Time": 8.272974843159318} {"Finetune/Learning Rate": 1.4536626962472743e-06, "Finetune/Loss": 0.5957345962524414, "Finetune/Loss (Raw)": 0.60355144739151, "Finetune/Step": 325, "Finetune/Step Time": 8.269252168014646} {"Finetune/Learning Rate": 1.4503812920470533e-06, "Finetune/Loss": 0.5983239412307739, "Finetune/Loss (Raw)": 0.6987257599830627, "Finetune/Step": 326, "Finetune/Step Time": 8.271031925454736} {"Finetune/Learning Rate": 1.447093792985114e-06, "Finetune/Loss": 0.5914102792739868, "Finetune/Loss (Raw)": 0.36051610112190247, "Finetune/Step": 327, "Finetune/Step Time": 8.275448629632592} {"Finetune/Learning Rate": 1.4438002435500977e-06, "Finetune/Loss": 0.5940062999725342, "Finetune/Loss (Raw)": 0.7146002054214478, "Finetune/Step": 328, "Finetune/Step Time": 8.270387491211295} {"Finetune/Learning Rate": 1.4405006883125248e-06, "Finetune/Loss": 0.6099476218223572, "Finetune/Loss (Raw)": 0.9665191173553467, "Finetune/Step": 329, "Finetune/Step Time": 8.263527370989323} {"Finetune/Learning Rate": 1.4371951719241904e-06, "Finetune/Loss": 0.6140360832214355, "Finetune/Loss (Raw)": 0.8247416019439697, "Finetune/Step": 330, "Finetune/Step Time": 8.269595503807068} {"Finetune/Learning Rate": 1.433883739117558e-06, "Finetune/Loss": 0.6066181659698486, "Finetune/Loss (Raw)": 0.5721586346626282, "Finetune/Step": 331, "Finetune/Step Time": 8.275024149566889} {"Finetune/Learning Rate": 1.4305664347051584e-06, "Finetune/Loss": 0.5916957855224609, "Finetune/Loss (Raw)": 0.24704599380493164, "Finetune/Step": 332, "Finetune/Step Time": 8.273811265826225} {"Finetune/Learning Rate": 1.4272433035789796e-06, "Finetune/Loss": 0.594577431678772, "Finetune/Loss (Raw)": 0.7499802708625793, "Finetune/Step": 333, "Finetune/Step Time": 8.268118681386113} {"Finetune/Learning Rate": 1.4239143907098608e-06, "Finetune/Loss": 0.5953695774078369, "Finetune/Loss (Raw)": 0.51076340675354, "Finetune/Step": 334, "Finetune/Step Time": 8.274836329743266} {"Finetune/Learning Rate": 1.4205797411468834e-06, "Finetune/Loss": 0.5944970846176147, "Finetune/Loss (Raw)": 0.7569212913513184, "Finetune/Step": 335, "Finetune/Step Time": 8.2803422100842} {"Finetune/Learning Rate": 1.4172394000167623e-06, "Finetune/Loss": 0.5899540185928345, "Finetune/Loss (Raw)": 0.48005789518356323, "Finetune/Step": 336, "Finetune/Step Time": 8.274205951020122} {"Finetune/Learning Rate": 1.4138934125232338e-06, "Finetune/Loss": 0.596733808517456, "Finetune/Loss (Raw)": 0.6665995121002197, "Finetune/Step": 337, "Finetune/Step Time": 8.274107040837407} {"Finetune/Learning Rate": 1.410541823946445e-06, "Finetune/Loss": 0.5894007682800293, "Finetune/Loss (Raw)": 0.49599283933639526, "Finetune/Step": 338, "Finetune/Step Time": 8.275667745620012} {"Finetune/Learning Rate": 1.4071846796423403e-06, "Finetune/Loss": 0.5856136083602905, "Finetune/Loss (Raw)": 0.5058910846710205, "Finetune/Step": 339, "Finetune/Step Time": 8.278166748583317} {"Finetune/Learning Rate": 1.4038220250420486e-06, "Finetune/Loss": 0.5856126546859741, "Finetune/Loss (Raw)": 0.627299964427948, "Finetune/Step": 340, "Finetune/Step Time": 8.273583484813571} {"Finetune/Learning Rate": 1.4004539056512664e-06, "Finetune/Loss": 0.5899782180786133, "Finetune/Loss (Raw)": 0.7713313698768616, "Finetune/Step": 341, "Finetune/Step Time": 8.259013561531901} {"Finetune/Learning Rate": 1.3970803670496452e-06, "Finetune/Loss": 0.5809580087661743, "Finetune/Loss (Raw)": 0.49679994583129883, "Finetune/Step": 342, "Finetune/Step Time": 8.262681672349572} {"Finetune/Learning Rate": 1.3937014548901714e-06, "Finetune/Loss": 0.5867119431495667, "Finetune/Loss (Raw)": 0.7391970157623291, "Finetune/Step": 343, "Finetune/Step Time": 8.265034150332212} {"Finetune/Learning Rate": 1.390317214898551e-06, "Finetune/Loss": 0.58747398853302, "Finetune/Loss (Raw)": 0.5185142755508423, "Finetune/Step": 344, "Finetune/Step Time": 8.273461982607841} {"Finetune/Learning Rate": 1.386927692872589e-06, "Finetune/Loss": 0.5913121700286865, "Finetune/Loss (Raw)": 0.5854501128196716, "Finetune/Step": 345, "Finetune/Step Time": 8.274682154878974} {"Finetune/Learning Rate": 1.3835329346815714e-06, "Finetune/Loss": 0.6008738875389099, "Finetune/Loss (Raw)": 0.8622146844863892, "Finetune/Step": 346, "Finetune/Step Time": 8.274644169956446} {"Finetune/Learning Rate": 1.3801329862656428e-06, "Finetune/Loss": 0.6099209785461426, "Finetune/Loss (Raw)": 0.8164809942245483, "Finetune/Step": 347, "Finetune/Step Time": 8.286306634545326} {"Finetune/Learning Rate": 1.376727893635185e-06, "Finetune/Loss": 0.6143853664398193, "Finetune/Loss (Raw)": 0.8405938148498535, "Finetune/Step": 348, "Finetune/Step Time": 8.29314604960382} {"Finetune/Learning Rate": 1.3733177028701958e-06, "Finetune/Loss": 0.6287169456481934, "Finetune/Loss (Raw)": 0.8420994281768799, "Finetune/Step": 349, "Finetune/Step Time": 8.27071531303227} {"Finetune/Learning Rate": 1.369902460119664e-06, "Finetune/Loss": 0.6285111308097839, "Finetune/Loss (Raw)": 0.5954145789146423, "Finetune/Step": 350, "Finetune/Step Time": 8.284844532608986} {"Finetune/Learning Rate": 1.3664822116009448e-06, "Finetune/Loss": 0.6331342458724976, "Finetune/Loss (Raw)": 0.6196413636207581, "Finetune/Step": 351, "Finetune/Step Time": 8.276892947033048} {"Finetune/Learning Rate": 1.3630570035991351e-06, "Finetune/Loss": 0.6356652975082397, "Finetune/Loss (Raw)": 0.6686176061630249, "Finetune/Step": 352, "Finetune/Step Time": 8.282237682491541} {"Finetune/Learning Rate": 1.359626882466447e-06, "Finetune/Loss": 0.6463245153427124, "Finetune/Loss (Raw)": 0.732001006603241, "Finetune/Step": 353, "Finetune/Step Time": 8.268488809466362} {"Finetune/Learning Rate": 1.3561918946215804e-06, "Finetune/Loss": 0.6479730606079102, "Finetune/Loss (Raw)": 0.6528966426849365, "Finetune/Step": 354, "Finetune/Step Time": 8.277665017172694} {"Finetune/Learning Rate": 1.3527520865490949e-06, "Finetune/Loss": 0.6515235900878906, "Finetune/Loss (Raw)": 0.728222131729126, "Finetune/Step": 355, "Finetune/Step Time": 8.267876207828522} {"Finetune/Learning Rate": 1.3493075047987799e-06, "Finetune/Loss": 0.651990532875061, "Finetune/Loss (Raw)": 0.6128564476966858, "Finetune/Step": 356, "Finetune/Step Time": 8.264573672786355} {"Finetune/Learning Rate": 1.3458581959850262e-06, "Finetune/Loss": 0.6515002250671387, "Finetune/Loss (Raw)": 0.5878646373748779, "Finetune/Step": 357, "Finetune/Step Time": 8.252947205677629} {"Finetune/Learning Rate": 1.3424042067861942e-06, "Finetune/Loss": 0.6521344780921936, "Finetune/Loss (Raw)": 0.7190194725990295, "Finetune/Step": 358, "Finetune/Step Time": 8.268965447321534} {"Finetune/Learning Rate": 1.3389455839439825e-06, "Finetune/Loss": 0.668251633644104, "Finetune/Loss (Raw)": 0.8762645721435547, "Finetune/Step": 359, "Finetune/Step Time": 8.257272195070982} {"Finetune/Learning Rate": 1.3354823742627947e-06, "Finetune/Loss": 0.6639536619186401, "Finetune/Loss (Raw)": 0.5770638585090637, "Finetune/Step": 360, "Finetune/Step Time": 8.257598539814353} {"Finetune/Learning Rate": 1.3320146246091073e-06, "Finetune/Loss": 0.6611751317977905, "Finetune/Loss (Raw)": 0.8776092529296875, "Finetune/Step": 361, "Finetune/Step Time": 8.2347616776824} {"Finetune/Learning Rate": 1.3285423819108348e-06, "Finetune/Loss": 0.6545203924179077, "Finetune/Loss (Raw)": 0.6117883920669556, "Finetune/Step": 362, "Finetune/Step Time": 8.245363406836987} {"Finetune/Learning Rate": 1.3250656931566937e-06, "Finetune/Loss": 0.6565032601356506, "Finetune/Loss (Raw)": 0.6356102228164673, "Finetune/Step": 363, "Finetune/Step Time": 8.245635487139225} {"Finetune/Learning Rate": 1.3215846053955681e-06, "Finetune/Loss": 0.6641097068786621, "Finetune/Loss (Raw)": 0.4904526472091675, "Finetune/Step": 364, "Finetune/Step Time": 8.244865886867046} {"Finetune/Learning Rate": 1.318099165735873e-06, "Finetune/Loss": 0.6537470817565918, "Finetune/Loss (Raw)": 0.41837644577026367, "Finetune/Step": 365, "Finetune/Step Time": 8.245272291824222} {"Finetune/Learning Rate": 1.3146094213449146e-06, "Finetune/Loss": 0.6558437347412109, "Finetune/Loss (Raw)": 0.577856183052063, "Finetune/Step": 366, "Finetune/Step Time": 8.255215782672167} {"Finetune/Learning Rate": 1.3111154194482555e-06, "Finetune/Loss": 0.6513071656227112, "Finetune/Loss (Raw)": 0.6117510795593262, "Finetune/Step": 367, "Finetune/Step Time": 8.252753984183073} {"Finetune/Learning Rate": 1.3076172073290723e-06, "Finetune/Loss": 0.6512618064880371, "Finetune/Loss (Raw)": 0.4786064624786377, "Finetune/Step": 368, "Finetune/Step Time": 8.253516972064972} {"Finetune/Learning Rate": 1.304114832327518e-06, "Finetune/Loss": 0.6483334898948669, "Finetune/Loss (Raw)": 0.5728938579559326, "Finetune/Step": 369, "Finetune/Step Time": 8.254995491355658} {"Finetune/Learning Rate": 1.3006083418400798e-06, "Finetune/Loss": 0.6562089920043945, "Finetune/Loss (Raw)": 0.7480068206787109, "Finetune/Step": 370, "Finetune/Step Time": 8.273751178756356} {"Finetune/Learning Rate": 1.2970977833189392e-06, "Finetune/Loss": 0.6572293043136597, "Finetune/Loss (Raw)": 0.5385423898696899, "Finetune/Step": 371, "Finetune/Step Time": 8.269189218059182} {"Finetune/Learning Rate": 1.2935832042713286e-06, "Finetune/Loss": 0.6566015481948853, "Finetune/Loss (Raw)": 0.6072101593017578, "Finetune/Step": 372, "Finetune/Step Time": 8.27289243787527} {"Finetune/Learning Rate": 1.2900646522588887e-06, "Finetune/Loss": 0.6464792490005493, "Finetune/Loss (Raw)": 0.44741880893707275, "Finetune/Step": 373, "Finetune/Step Time": 8.270370312035084} {"Finetune/Learning Rate": 1.2865421748970254e-06, "Finetune/Loss": 0.653746485710144, "Finetune/Loss (Raw)": 0.7293506264686584, "Finetune/Step": 374, "Finetune/Step Time": 8.289883214980364} {"Finetune/Learning Rate": 1.2830158198542653e-06, "Finetune/Loss": 0.6523761749267578, "Finetune/Loss (Raw)": 0.6953480243682861, "Finetune/Step": 375, "Finetune/Step Time": 8.283259706571698} {"Finetune/Learning Rate": 1.2794856348516094e-06, "Finetune/Loss": 0.6573168039321899, "Finetune/Loss (Raw)": 0.6766132116317749, "Finetune/Step": 376, "Finetune/Step Time": 8.28427897207439} {"Finetune/Learning Rate": 1.2759516676618892e-06, "Finetune/Loss": 0.659633994102478, "Finetune/Loss (Raw)": 0.659602701663971, "Finetune/Step": 377, "Finetune/Step Time": 8.273506313562393} {"Finetune/Learning Rate": 1.2724139661091187e-06, "Finetune/Loss": 0.6515295505523682, "Finetune/Loss (Raw)": 0.602872908115387, "Finetune/Step": 378, "Finetune/Step Time": 8.270012255758047} {"Finetune/Learning Rate": 1.2688725780678485e-06, "Finetune/Loss": 0.6480716466903687, "Finetune/Loss (Raw)": 0.7058272361755371, "Finetune/Step": 379, "Finetune/Step Time": 8.265755906701088} {"Finetune/Learning Rate": 1.2653275514625163e-06, "Finetune/Loss": 0.6459954977035522, "Finetune/Loss (Raw)": 0.7741550207138062, "Finetune/Step": 380, "Finetune/Step Time": 8.270213248208165} {"Finetune/Learning Rate": 1.2617789342668003e-06, "Finetune/Loss": 0.6386021971702576, "Finetune/Loss (Raw)": 0.6055153012275696, "Finetune/Step": 381, "Finetune/Step Time": 8.25908200442791} {"Finetune/Learning Rate": 1.2582267745029684e-06, "Finetune/Loss": 0.638108491897583, "Finetune/Loss (Raw)": 0.5796173810958862, "Finetune/Step": 382, "Finetune/Step Time": 8.269456546753645} {"Finetune/Learning Rate": 1.2546711202412285e-06, "Finetune/Loss": 0.6448140144348145, "Finetune/Loss (Raw)": 0.8342177867889404, "Finetune/Step": 383, "Finetune/Step Time": 8.26572342403233} {"Finetune/Learning Rate": 1.2511120195990796e-06, "Finetune/Loss": 0.6418009996414185, "Finetune/Loss (Raw)": 0.5721985101699829, "Finetune/Step": 384, "Finetune/Step Time": 8.27063375711441} {"Finetune/Learning Rate": 1.247549520740658e-06, "Finetune/Loss": 0.6370537877082825, "Finetune/Loss (Raw)": 0.580091118812561, "Finetune/Step": 385, "Finetune/Step Time": 8.261324640363455} {"Finetune/Learning Rate": 1.2439836718760885e-06, "Finetune/Loss": 0.6353474855422974, "Finetune/Loss (Raw)": 0.5982964038848877, "Finetune/Step": 386, "Finetune/Step Time": 8.273992486298084} {"Finetune/Learning Rate": 1.2404145212608288e-06, "Finetune/Loss": 0.6364976167678833, "Finetune/Loss (Raw)": 0.7650250196456909, "Finetune/Step": 387, "Finetune/Step Time": 8.263847514986992} {"Finetune/Learning Rate": 1.2368421171950191e-06, "Finetune/Loss": 0.6381202936172485, "Finetune/Loss (Raw)": 0.664782702922821, "Finetune/Step": 388, "Finetune/Step Time": 8.264969171956182} {"Finetune/Learning Rate": 1.2332665080228277e-06, "Finetune/Loss": 0.6367518305778503, "Finetune/Loss (Raw)": 0.5440729856491089, "Finetune/Step": 389, "Finetune/Step Time": 8.243817027658224} {"Finetune/Learning Rate": 1.2296877421317956e-06, "Finetune/Loss": 0.6355535984039307, "Finetune/Loss (Raw)": 0.680676281452179, "Finetune/Step": 390, "Finetune/Step Time": 8.252237107604742} {"Finetune/Learning Rate": 1.2261058679521832e-06, "Finetune/Loss": 0.6241719126701355, "Finetune/Loss (Raw)": 0.5120516419410706, "Finetune/Step": 391, "Finetune/Step Time": 8.266054732725024} {"Finetune/Learning Rate": 1.2225209339563143e-06, "Finetune/Loss": 0.6171822547912598, "Finetune/Loss (Raw)": 0.35339561104774475, "Finetune/Step": 392, "Finetune/Step Time": 8.277787033468485} {"Finetune/Learning Rate": 1.2189329886579207e-06, "Finetune/Loss": 0.6144852042198181, "Finetune/Loss (Raw)": 0.7913020253181458, "Finetune/Step": 393, "Finetune/Step Time": 8.26743389852345} {"Finetune/Learning Rate": 1.2153420806114839e-06, "Finetune/Loss": 0.6130729913711548, "Finetune/Loss (Raw)": 0.5665990114212036, "Finetune/Step": 394, "Finetune/Step Time": 8.275158079341054} {"Finetune/Learning Rate": 1.2117482584115802e-06, "Finetune/Loss": 0.610605001449585, "Finetune/Loss (Raw)": 0.5566345453262329, "Finetune/Step": 395, "Finetune/Step Time": 8.269831467419863} {"Finetune/Learning Rate": 1.2081515706922224e-06, "Finetune/Loss": 0.6141884922981262, "Finetune/Loss (Raw)": 0.6051236391067505, "Finetune/Step": 396, "Finetune/Step Time": 8.27787908911705} {"Finetune/Learning Rate": 1.204552066126201e-06, "Finetune/Loss": 0.6202771663665771, "Finetune/Loss (Raw)": 0.6132125854492188, "Finetune/Step": 397, "Finetune/Step Time": 8.267361834645271} {"Finetune/Learning Rate": 1.2009497934244255e-06, "Finetune/Loss": 0.6271025538444519, "Finetune/Loss (Raw)": 0.7962691783905029, "Finetune/Step": 398, "Finetune/Step Time": 8.276233930140734} {"Finetune/Learning Rate": 1.1973448013352666e-06, "Finetune/Loss": 0.6344858407974243, "Finetune/Loss (Raw)": 0.8480173349380493, "Finetune/Step": 399, "Finetune/Step Time": 8.27758022211492} {"Finetune/Learning Rate": 1.1937371386438953e-06, "Finetune/Loss": 0.6360624432563782, "Finetune/Loss (Raw)": 0.5290576815605164, "Finetune/Step": 400, "Finetune/Step Time": 8.280862184241414} {"Finetune/Learning Rate": 1.1901268541716223e-06, "Finetune/Loss": 0.640167236328125, "Finetune/Loss (Raw)": 0.704247236251831, "Finetune/Step": 401, "Finetune/Step Time": 8.259521812200546} {"Finetune/Learning Rate": 1.1865139967752388e-06, "Finetune/Loss": 0.6386705636978149, "Finetune/Loss (Raw)": 0.7001122236251831, "Finetune/Step": 402, "Finetune/Step Time": 8.25364868156612} {"Finetune/Learning Rate": 1.1828986153463546e-06, "Finetune/Loss": 0.6351354122161865, "Finetune/Loss (Raw)": 0.42541825771331787, "Finetune/Step": 403, "Finetune/Step Time": 8.248123185709119} {"Finetune/Learning Rate": 1.1792807588107356e-06, "Finetune/Loss": 0.6307356357574463, "Finetune/Loss (Raw)": 0.46641862392425537, "Finetune/Step": 404, "Finetune/Step Time": 8.256658028811216} {"Finetune/Learning Rate": 1.1756604761276432e-06, "Finetune/Loss": 0.6387262344360352, "Finetune/Loss (Raw)": 0.7031169533729553, "Finetune/Step": 405, "Finetune/Step Time": 8.247783094644547} {"Finetune/Learning Rate": 1.1720378162891706e-06, "Finetune/Loss": 0.6366531848907471, "Finetune/Loss (Raw)": 0.6630139350891113, "Finetune/Step": 406, "Finetune/Step Time": 8.252171320840716} {"Finetune/Learning Rate": 1.168412828319581e-06, "Finetune/Loss": 0.6279836297035217, "Finetune/Loss (Raw)": 0.4179202914237976, "Finetune/Step": 407, "Finetune/Step Time": 8.253486031666398} {"Finetune/Learning Rate": 1.1647855612746423e-06, "Finetune/Loss": 0.6223418712615967, "Finetune/Loss (Raw)": 0.4960789680480957, "Finetune/Step": 408, "Finetune/Step Time": 8.264905277639627} {"Finetune/Learning Rate": 1.161156064240965e-06, "Finetune/Loss": 0.6299872398376465, "Finetune/Loss (Raw)": 0.9042545557022095, "Finetune/Step": 409, "Finetune/Step Time": 8.252373669296503} {"Finetune/Learning Rate": 1.157524386335338e-06, "Finetune/Loss": 0.6282296776771545, "Finetune/Loss (Raw)": 0.5466301441192627, "Finetune/Step": 410, "Finetune/Step Time": 8.25745777413249} {"Finetune/Learning Rate": 1.1538905767040618e-06, "Finetune/Loss": 0.6263099908828735, "Finetune/Loss (Raw)": 0.6443963646888733, "Finetune/Step": 411, "Finetune/Step Time": 8.252091152593493} {"Finetune/Learning Rate": 1.1502546845222858e-06, "Finetune/Loss": 0.6199332475662231, "Finetune/Loss (Raw)": 0.570099413394928, "Finetune/Step": 412, "Finetune/Step Time": 8.259166706353426} {"Finetune/Learning Rate": 1.1466167589933418e-06, "Finetune/Loss": 0.6257153749465942, "Finetune/Loss (Raw)": 0.7905451655387878, "Finetune/Step": 413, "Finetune/Step Time": 8.246897568926215} {"Finetune/Learning Rate": 1.142976849348078e-06, "Finetune/Loss": 0.625879168510437, "Finetune/Loss (Raw)": 0.5848570466041565, "Finetune/Step": 414, "Finetune/Step Time": 8.263457711786032} {"Finetune/Learning Rate": 1.1393350048441926e-06, "Finetune/Loss": 0.6275038719177246, "Finetune/Loss (Raw)": 0.8862085938453674, "Finetune/Step": 415, "Finetune/Step Time": 8.262184254825115} {"Finetune/Learning Rate": 1.1356912747655684e-06, "Finetune/Loss": 0.6302433013916016, "Finetune/Loss (Raw)": 0.6598597168922424, "Finetune/Step": 416, "Finetune/Step Time": 8.265200773254037} {"Finetune/Learning Rate": 1.132045708421605e-06, "Finetune/Loss": 0.6385177373886108, "Finetune/Loss (Raw)": 0.8448743224143982, "Finetune/Step": 417, "Finetune/Step Time": 8.256350370123982} {"Finetune/Learning Rate": 1.128398355146551e-06, "Finetune/Loss": 0.635964035987854, "Finetune/Loss (Raw)": 0.5165787935256958, "Finetune/Step": 418, "Finetune/Step Time": 8.264470145106316} {"Finetune/Learning Rate": 1.124749264298837e-06, "Finetune/Loss": 0.6328761577606201, "Finetune/Loss (Raw)": 0.666211724281311, "Finetune/Step": 419, "Finetune/Step Time": 8.260790495201945} {"Finetune/Learning Rate": 1.1210984852604083e-06, "Finetune/Loss": 0.6314404010772705, "Finetune/Loss (Raw)": 0.6188391447067261, "Finetune/Step": 420, "Finetune/Step Time": 8.264527581632137} {"Finetune/Learning Rate": 1.117446067436055e-06, "Finetune/Loss": 0.6329562067985535, "Finetune/Loss (Raw)": 0.5925776958465576, "Finetune/Step": 421, "Finetune/Step Time": 8.252044092863798} {"Finetune/Learning Rate": 1.1137920602527447e-06, "Finetune/Loss": 0.6349536180496216, "Finetune/Loss (Raw)": 0.7445922493934631, "Finetune/Step": 422, "Finetune/Step Time": 8.243183707818389} {"Finetune/Learning Rate": 1.110136513158954e-06, "Finetune/Loss": 0.6413317918777466, "Finetune/Loss (Raw)": 0.7161535024642944, "Finetune/Step": 423, "Finetune/Step Time": 8.23476385511458} {"Finetune/Learning Rate": 1.1064794756239976e-06, "Finetune/Loss": 0.64731764793396, "Finetune/Loss (Raw)": 0.5449428558349609, "Finetune/Step": 424, "Finetune/Step Time": 8.238023752346635} {"Finetune/Learning Rate": 1.1028209971373603e-06, "Finetune/Loss": 0.6458497643470764, "Finetune/Loss (Raw)": 0.7443310022354126, "Finetune/Step": 425, "Finetune/Step Time": 8.229516034945846} {"Finetune/Learning Rate": 1.0991611272080268e-06, "Finetune/Loss": 0.6509504914283752, "Finetune/Loss (Raw)": 0.7298218011856079, "Finetune/Step": 426, "Finetune/Step Time": 8.226060966029763} {"Finetune/Learning Rate": 1.0954999153638118e-06, "Finetune/Loss": 0.6576856970787048, "Finetune/Loss (Raw)": 0.7721615433692932, "Finetune/Step": 427, "Finetune/Step Time": 8.228979839012027} {"Finetune/Learning Rate": 1.0918374111506892e-06, "Finetune/Loss": 0.6590461134910583, "Finetune/Loss (Raw)": 0.648656964302063, "Finetune/Step": 428, "Finetune/Step Time": 8.233147380873561} {"Finetune/Learning Rate": 1.0881736641321227e-06, "Finetune/Loss": 0.6584206223487854, "Finetune/Loss (Raw)": 0.5931961536407471, "Finetune/Step": 429, "Finetune/Step Time": 8.225984793156385} {"Finetune/Learning Rate": 1.0845087238883943e-06, "Finetune/Loss": 0.6522035598754883, "Finetune/Loss (Raw)": 0.5973235368728638, "Finetune/Step": 430, "Finetune/Step Time": 8.230592912063003} {"Finetune/Learning Rate": 1.0808426400159335e-06, "Finetune/Loss": 0.6424784660339355, "Finetune/Loss (Raw)": 0.5368146896362305, "Finetune/Step": 431, "Finetune/Step Time": 8.232535511255264} {"Finetune/Learning Rate": 1.0771754621266464e-06, "Finetune/Loss": 0.6438357830047607, "Finetune/Loss (Raw)": 0.5724923610687256, "Finetune/Step": 432, "Finetune/Step Time": 8.23405464924872} {"Finetune/Learning Rate": 1.0735072398472433e-06, "Finetune/Loss": 0.6400271654129028, "Finetune/Loss (Raw)": 0.5823716521263123, "Finetune/Step": 433, "Finetune/Step Time": 8.227550249546766} {"Finetune/Learning Rate": 1.0698380228185684e-06, "Finetune/Loss": 0.6421873569488525, "Finetune/Loss (Raw)": 0.7692368030548096, "Finetune/Step": 434, "Finetune/Step Time": 8.231791166588664} {"Finetune/Learning Rate": 1.066167860694928e-06, "Finetune/Loss": 0.6472954154014587, "Finetune/Loss (Raw)": 0.5888758897781372, "Finetune/Step": 435, "Finetune/Step Time": 8.230115085840225} {"Finetune/Learning Rate": 1.0624968031434172e-06, "Finetune/Loss": 0.6574999094009399, "Finetune/Loss (Raw)": 0.792963445186615, "Finetune/Step": 436, "Finetune/Step Time": 8.234470365568995} {"Finetune/Learning Rate": 1.058824899843249e-06, "Finetune/Loss": 0.65472412109375, "Finetune/Loss (Raw)": 0.6142922043800354, "Finetune/Step": 437, "Finetune/Step Time": 8.225829843431711} {"Finetune/Learning Rate": 1.055152200485082e-06, "Finetune/Loss": 0.6587070226669312, "Finetune/Loss (Raw)": 0.7904649972915649, "Finetune/Step": 438, "Finetune/Step Time": 8.22860618494451} {"Finetune/Learning Rate": 1.0514787547703466e-06, "Finetune/Loss": 0.661663293838501, "Finetune/Loss (Raw)": 0.5125219821929932, "Finetune/Step": 439, "Finetune/Step Time": 8.230016116052866} {"Finetune/Learning Rate": 1.0478046124105744e-06, "Finetune/Loss": 0.662384033203125, "Finetune/Loss (Raw)": 0.5191425681114197, "Finetune/Step": 440, "Finetune/Step Time": 8.235413700342178} {"Finetune/Learning Rate": 1.0441298231267241e-06, "Finetune/Loss": 0.6548092365264893, "Finetune/Loss (Raw)": 0.6618607044219971, "Finetune/Step": 441, "Finetune/Step Time": 8.243945606052876} {"Finetune/Learning Rate": 1.0404544366485093e-06, "Finetune/Loss": 0.6539057493209839, "Finetune/Loss (Raw)": 0.517719566822052, "Finetune/Step": 442, "Finetune/Step Time": 8.251740276813507} {"Finetune/Learning Rate": 1.0367785027137243e-06, "Finetune/Loss": 0.6521528363227844, "Finetune/Loss (Raw)": 0.5883023142814636, "Finetune/Step": 443, "Finetune/Step Time": 8.2504553347826} {"Finetune/Learning Rate": 1.0331020710675728e-06, "Finetune/Loss": 0.6513197422027588, "Finetune/Loss (Raw)": 0.5434401035308838, "Finetune/Step": 444, "Finetune/Step Time": 8.251113072037697} {"Finetune/Learning Rate": 1.0294251914619943e-06, "Finetune/Loss": 0.6409310102462769, "Finetune/Loss (Raw)": 0.45810747146606445, "Finetune/Step": 445, "Finetune/Step Time": 8.25133085437119} {"Finetune/Learning Rate": 1.0257479136549886e-06, "Finetune/Loss": 0.6419024467468262, "Finetune/Loss (Raw)": 0.6159411072731018, "Finetune/Step": 446, "Finetune/Step Time": 8.252628663554788} {"Finetune/Learning Rate": 1.022070287409946e-06, "Finetune/Loss": 0.6357274055480957, "Finetune/Loss (Raw)": 0.6886078119277954, "Finetune/Step": 447, "Finetune/Step Time": 8.250157110393047} {"Finetune/Learning Rate": 1.018392362494972e-06, "Finetune/Loss": 0.6311939358711243, "Finetune/Loss (Raw)": 0.5147894620895386, "Finetune/Step": 448, "Finetune/Step Time": 8.248562004417181} {"Finetune/Learning Rate": 1.0147141886822122e-06, "Finetune/Loss": 0.6246950626373291, "Finetune/Loss (Raw)": 0.6369085311889648, "Finetune/Step": 449, "Finetune/Step Time": 8.252582728862762} {"Finetune/Learning Rate": 1.0110358157471823e-06, "Finetune/Loss": 0.6220688223838806, "Finetune/Loss (Raw)": 0.43254080414772034, "Finetune/Step": 450, "Finetune/Step Time": 8.260057961568236} {"Finetune/Learning Rate": 1.0073572934680919e-06, "Finetune/Loss": 0.6166802644729614, "Finetune/Loss (Raw)": 0.4937768578529358, "Finetune/Step": 451, "Finetune/Step Time": 8.256333572790027} {"Finetune/Learning Rate": 1.003678671625172e-06, "Finetune/Loss": 0.62004554271698, "Finetune/Loss (Raw)": 0.7265303134918213, "Finetune/Step": 452, "Finetune/Step Time": 8.257348233833909} {"Finetune/Learning Rate": 1e-06, "Finetune/Loss": 0.6205949187278748, "Finetune/Loss (Raw)": 0.6101561784744263, "Finetune/Step": 453, "Finetune/Step Time": 8.260625399649143} {"Finetune/Learning Rate": 9.963213283748281e-07, "Finetune/Loss": 0.6133934259414673, "Finetune/Loss (Raw)": 0.5141457319259644, "Finetune/Step": 454, "Finetune/Step Time": 8.261997267603874} {"Finetune/Learning Rate": 9.92642706531908e-07, "Finetune/Loss": 0.6031798720359802, "Finetune/Loss (Raw)": 0.38931789994239807, "Finetune/Step": 455, "Finetune/Step Time": 8.260920248925686} {"Finetune/Learning Rate": 9.889641842528176e-07, "Finetune/Loss": 0.6074199080467224, "Finetune/Loss (Raw)": 0.6806249022483826, "Finetune/Step": 456, "Finetune/Step Time": 8.257688026875257} {"Finetune/Learning Rate": 9.85285811317788e-07, "Finetune/Loss": 0.5962210297584534, "Finetune/Loss (Raw)": 0.38596707582473755, "Finetune/Step": 457, "Finetune/Step Time": 8.270863937214017} {"Finetune/Learning Rate": 9.816076375050283e-07, "Finetune/Loss": 0.5856749415397644, "Finetune/Loss (Raw)": 0.3923463225364685, "Finetune/Step": 458, "Finetune/Step Time": 8.271519457921386} {"Finetune/Learning Rate": 9.77929712590054e-07, "Finetune/Loss": 0.5809522867202759, "Finetune/Loss (Raw)": 0.6210357546806335, "Finetune/Step": 459, "Finetune/Step Time": 8.272252997383475} {"Finetune/Learning Rate": 9.742520863450115e-07, "Finetune/Loss": 0.5804948210716248, "Finetune/Loss (Raw)": 0.6340187788009644, "Finetune/Step": 460, "Finetune/Step Time": 8.269182888790965} {"Finetune/Learning Rate": 9.705748085380059e-07, "Finetune/Loss": 0.579422116279602, "Finetune/Loss (Raw)": 0.5588700771331787, "Finetune/Step": 461, "Finetune/Step Time": 8.273907497525215} {"Finetune/Learning Rate": 9.668979289324271e-07, "Finetune/Loss": 0.5778698921203613, "Finetune/Loss (Raw)": 0.5476502180099487, "Finetune/Step": 462, "Finetune/Step Time": 8.270765060558915} {"Finetune/Learning Rate": 9.632214972862759e-07, "Finetune/Loss": 0.5760120153427124, "Finetune/Loss (Raw)": 0.47736257314682007, "Finetune/Step": 463, "Finetune/Step Time": 8.26987661793828} {"Finetune/Learning Rate": 9.595455633514908e-07, "Finetune/Loss": 0.581368088722229, "Finetune/Loss (Raw)": 0.7438879013061523, "Finetune/Step": 464, "Finetune/Step Time": 8.260644365102053} {"Finetune/Learning Rate": 9.558701768732758e-07, "Finetune/Loss": 0.58762127161026, "Finetune/Loss (Raw)": 0.7824748158454895, "Finetune/Step": 465, "Finetune/Step Time": 8.262955792248249} {"Finetune/Learning Rate": 9.521953875894255e-07, "Finetune/Loss": 0.5826552510261536, "Finetune/Loss (Raw)": 0.6103223562240601, "Finetune/Step": 466, "Finetune/Step Time": 8.260741973295808} {"Finetune/Learning Rate": 9.485212452296534e-07, "Finetune/Loss": 0.5803333520889282, "Finetune/Loss (Raw)": 0.5145756602287292, "Finetune/Step": 467, "Finetune/Step Time": 8.263882542029023} {"Finetune/Learning Rate": 9.448477995149181e-07, "Finetune/Loss": 0.5696244239807129, "Finetune/Loss (Raw)": 0.45027777552604675, "Finetune/Step": 468, "Finetune/Step Time": 8.262203188613057} {"Finetune/Learning Rate": 9.41175100156751e-07, "Finetune/Loss": 0.5738898515701294, "Finetune/Loss (Raw)": 0.750786304473877, "Finetune/Step": 469, "Finetune/Step Time": 8.27861800417304} {"Finetune/Learning Rate": 9.375031968565829e-07, "Finetune/Loss": 0.5646210312843323, "Finetune/Loss (Raw)": 0.4938617944717407, "Finetune/Step": 470, "Finetune/Step Time": 8.286257853731513} {"Finetune/Learning Rate": 9.338321393050719e-07, "Finetune/Loss": 0.5596054792404175, "Finetune/Loss (Raw)": 0.3520256578922272, "Finetune/Step": 471, "Finetune/Step Time": 8.28607115894556} {"Finetune/Learning Rate": 9.301619771814315e-07, "Finetune/Loss": 0.556736946105957, "Finetune/Loss (Raw)": 0.4273498058319092, "Finetune/Step": 472, "Finetune/Step Time": 8.284356500953436} {"Finetune/Learning Rate": 9.264927601527568e-07, "Finetune/Loss": 0.5523493885993958, "Finetune/Loss (Raw)": 0.521457850933075, "Finetune/Step": 473, "Finetune/Step Time": 8.277731725946069} {"Finetune/Learning Rate": 9.228245378733536e-07, "Finetune/Loss": 0.5537993311882019, "Finetune/Loss (Raw)": 0.5641178488731384, "Finetune/Step": 474, "Finetune/Step Time": 8.279118658974767} {"Finetune/Learning Rate": 9.191573599840661e-07, "Finetune/Loss": 0.5505632162094116, "Finetune/Loss (Raw)": 0.48474740982055664, "Finetune/Step": 475, "Finetune/Step Time": 8.279820714145899} {"Finetune/Learning Rate": 9.154912761116055e-07, "Finetune/Loss": 0.5497899651527405, "Finetune/Loss (Raw)": 0.5186957716941833, "Finetune/Step": 476, "Finetune/Step Time": 8.275784393772483} {"Finetune/Learning Rate": 9.118263358678772e-07, "Finetune/Loss": 0.5521950721740723, "Finetune/Loss (Raw)": 0.5350710153579712, "Finetune/Step": 477, "Finetune/Step Time": 8.27952866256237} {"Finetune/Learning Rate": 9.081625888493106e-07, "Finetune/Loss": 0.5528886914253235, "Finetune/Loss (Raw)": 0.6381365060806274, "Finetune/Step": 478, "Finetune/Step Time": 8.27418515086174} {"Finetune/Learning Rate": 9.045000846361883e-07, "Finetune/Loss": 0.5487607717514038, "Finetune/Loss (Raw)": 0.5565152168273926, "Finetune/Step": 479, "Finetune/Step Time": 8.28587744385004} {"Finetune/Learning Rate": 9.00838872791973e-07, "Finetune/Loss": 0.5465717911720276, "Finetune/Loss (Raw)": 0.44474148750305176, "Finetune/Step": 480, "Finetune/Step Time": 8.284975538030267} {"Finetune/Learning Rate": 8.971790028626394e-07, "Finetune/Loss": 0.5425082445144653, "Finetune/Loss (Raw)": 0.5068745613098145, "Finetune/Step": 481, "Finetune/Step Time": 8.299614937976003} {"Finetune/Learning Rate": 8.935205243760021e-07, "Finetune/Loss": 0.5413834452629089, "Finetune/Loss (Raw)": 0.3965466320514679, "Finetune/Step": 482, "Finetune/Step Time": 8.298208981752396} {"Finetune/Learning Rate": 8.89863486841046e-07, "Finetune/Loss": 0.5454421639442444, "Finetune/Loss (Raw)": 0.6236573457717896, "Finetune/Step": 483, "Finetune/Step Time": 8.308152126148343} {"Finetune/Learning Rate": 8.862079397472552e-07, "Finetune/Loss": 0.5433338284492493, "Finetune/Loss (Raw)": 0.6590635776519775, "Finetune/Step": 484, "Finetune/Step Time": 8.308168552815914} {"Finetune/Learning Rate": 8.825539325639451e-07, "Finetune/Loss": 0.5332594513893127, "Finetune/Loss (Raw)": 0.28777557611465454, "Finetune/Step": 485, "Finetune/Step Time": 8.310950329527259} {"Finetune/Learning Rate": 8.789015147395918e-07, "Finetune/Loss": 0.5304272174835205, "Finetune/Loss (Raw)": 0.42351287603378296, "Finetune/Step": 486, "Finetune/Step Time": 8.308415595442057} {"Finetune/Learning Rate": 8.752507357011629e-07, "Finetune/Loss": 0.5346905589103699, "Finetune/Loss (Raw)": 0.5257471203804016, "Finetune/Step": 487, "Finetune/Step Time": 8.322709910571575} {"Finetune/Learning Rate": 8.716016448534489e-07, "Finetune/Loss": 0.5272058248519897, "Finetune/Loss (Raw)": 0.4411134123802185, "Finetune/Step": 488, "Finetune/Step Time": 8.323886726051569} {"Finetune/Learning Rate": 8.679542915783948e-07, "Finetune/Loss": 0.5367838740348816, "Finetune/Loss (Raw)": 0.6924644112586975, "Finetune/Step": 489, "Finetune/Step Time": 8.343021741136909} {"Finetune/Learning Rate": 8.643087252344312e-07, "Finetune/Loss": 0.5437455177307129, "Finetune/Loss (Raw)": 0.615118145942688, "Finetune/Step": 490, "Finetune/Step Time": 8.339495765045285} {"Finetune/Learning Rate": 8.606649951558071e-07, "Finetune/Loss": 0.5399590134620667, "Finetune/Loss (Raw)": 0.4998692274093628, "Finetune/Step": 491, "Finetune/Step Time": 8.343626031652093} {"Finetune/Learning Rate": 8.570231506519219e-07, "Finetune/Loss": 0.5413339734077454, "Finetune/Loss (Raw)": 0.6780160665512085, "Finetune/Step": 492, "Finetune/Step Time": 8.338157447054982} {"Finetune/Learning Rate": 8.533832410066581e-07, "Finetune/Loss": 0.5389467477798462, "Finetune/Loss (Raw)": 0.48248058557510376, "Finetune/Step": 493, "Finetune/Step Time": 8.336081879213452} {"Finetune/Learning Rate": 8.49745315477714e-07, "Finetune/Loss": 0.5388675928115845, "Finetune/Loss (Raw)": 0.5451158881187439, "Finetune/Step": 494, "Finetune/Step Time": 8.335848059505224} {"Finetune/Learning Rate": 8.461094232959381e-07, "Finetune/Loss": 0.5438902378082275, "Finetune/Loss (Raw)": 0.6380869150161743, "Finetune/Step": 495, "Finetune/Step Time": 8.328229561448097} {"Finetune/Learning Rate": 8.424756136646622e-07, "Finetune/Loss": 0.535010576248169, "Finetune/Loss (Raw)": 0.45973968505859375, "Finetune/Step": 496, "Finetune/Step Time": 8.328264644369483} {"Finetune/Learning Rate": 8.38843935759035e-07, "Finetune/Loss": 0.5311355590820312, "Finetune/Loss (Raw)": 0.6584734916687012, "Finetune/Step": 497, "Finetune/Step Time": 8.317808743566275} {"Finetune/Learning Rate": 8.352144387253582e-07, "Finetune/Loss": 0.5284730195999146, "Finetune/Loss (Raw)": 0.5251213312149048, "Finetune/Step": 498, "Finetune/Step Time": 8.31678687222302} {"Finetune/Learning Rate": 8.315871716804193e-07, "Finetune/Loss": 0.5344496965408325, "Finetune/Loss (Raw)": 0.7058284878730774, "Finetune/Step": 499, "Finetune/Step Time": 8.322967318817973} {"Finetune/Learning Rate": 8.279621837108294e-07, "Finetune/Loss": 0.5385503768920898, "Finetune/Loss (Raw)": 0.5814995765686035, "Finetune/Step": 500, "Finetune/Step Time": 8.320044254884124} {"Finetune/Learning Rate": 8.24339523872357e-07, "Finetune/Loss": 0.530063271522522, "Finetune/Loss (Raw)": 0.47919970750808716, "Finetune/Step": 501, "Finetune/Step Time": 8.314149042591453} {"Finetune/Learning Rate": 8.207192411892645e-07, "Finetune/Loss": 0.5341697335243225, "Finetune/Loss (Raw)": 0.6252694129943848, "Finetune/Step": 502, "Finetune/Step Time": 8.310489855706692} {"Finetune/Learning Rate": 8.171013846536454e-07, "Finetune/Loss": 0.5387723445892334, "Finetune/Loss (Raw)": 0.4993094205856323, "Finetune/Step": 503, "Finetune/Step Time": 8.312724171206355} {"Finetune/Learning Rate": 8.134860032247612e-07, "Finetune/Loss": 0.5495314598083496, "Finetune/Loss (Raw)": 0.7716392874717712, "Finetune/Step": 504, "Finetune/Step Time": 8.310382716357708} {"Finetune/Learning Rate": 8.098731458283779e-07, "Finetune/Loss": 0.5500634908676147, "Finetune/Loss (Raw)": 0.538483738899231, "Finetune/Step": 505, "Finetune/Step Time": 8.309786947444081} {"Finetune/Learning Rate": 8.06262861356105e-07, "Finetune/Loss": 0.552280843257904, "Finetune/Loss (Raw)": 0.6350739598274231, "Finetune/Step": 506, "Finetune/Step Time": 8.317642832174897} {"Finetune/Learning Rate": 8.026551986647334e-07, "Finetune/Loss": 0.550383448600769, "Finetune/Loss (Raw)": 0.4240296483039856, "Finetune/Step": 507, "Finetune/Step Time": 8.31672266870737} {"Finetune/Learning Rate": 7.990502065755748e-07, "Finetune/Loss": 0.5480238795280457, "Finetune/Loss (Raw)": 0.44318947196006775, "Finetune/Step": 508, "Finetune/Step Time": 8.322995889931917} {"Finetune/Learning Rate": 7.954479338737994e-07, "Finetune/Loss": 0.5446785092353821, "Finetune/Loss (Raw)": 0.42801928520202637, "Finetune/Step": 509, "Finetune/Step Time": 8.334955800324678} {"Finetune/Learning Rate": 7.918484293077776e-07, "Finetune/Loss": 0.5461719036102295, "Finetune/Loss (Raw)": 0.685924768447876, "Finetune/Step": 510, "Finetune/Step Time": 8.329546004533768} {"Finetune/Learning Rate": 7.8825174158842e-07, "Finetune/Loss": 0.5502729415893555, "Finetune/Loss (Raw)": 0.6877486705780029, "Finetune/Step": 511, "Finetune/Step Time": 8.333741644397378} {"Finetune/Learning Rate": 7.846579193885164e-07, "Finetune/Loss": 0.5554705858230591, "Finetune/Loss (Raw)": 0.6110678315162659, "Finetune/Step": 512, "Finetune/Step Time": 8.330479944124818} {"Finetune/Learning Rate": 7.810670113420797e-07, "Finetune/Loss": 0.5582756996154785, "Finetune/Loss (Raw)": 0.5966354608535767, "Finetune/Step": 513, "Finetune/Step Time": 8.3345926720649} {"Finetune/Learning Rate": 7.774790660436857e-07, "Finetune/Loss": 0.5616116523742676, "Finetune/Loss (Raw)": 0.5032970309257507, "Finetune/Step": 514, "Finetune/Step Time": 8.326806344091892} {"Finetune/Learning Rate": 7.738941320478169e-07, "Finetune/Loss": 0.5533002018928528, "Finetune/Loss (Raw)": 0.3576918840408325, "Finetune/Step": 515, "Finetune/Step Time": 8.342790730297565} {"Finetune/Learning Rate": 7.703122578682045e-07, "Finetune/Loss": 0.5456091165542603, "Finetune/Loss (Raw)": 0.4129503071308136, "Finetune/Step": 516, "Finetune/Step Time": 8.33944489620626} {"Finetune/Learning Rate": 7.667334919771723e-07, "Finetune/Loss": 0.5572496652603149, "Finetune/Loss (Raw)": 0.660273551940918, "Finetune/Step": 517, "Finetune/Step Time": 8.352306535467505} {"Finetune/Learning Rate": 7.631578828049808e-07, "Finetune/Loss": 0.5641331672668457, "Finetune/Loss (Raw)": 0.6437825560569763, "Finetune/Step": 518, "Finetune/Step Time": 8.349085299298167} {"Finetune/Learning Rate": 7.595854787391712e-07, "Finetune/Loss": 0.5669863224029541, "Finetune/Loss (Raw)": 0.6170499920845032, "Finetune/Step": 519, "Finetune/Step Time": 8.350216090679169} {"Finetune/Learning Rate": 7.560163281239115e-07, "Finetune/Loss": 0.5687286257743835, "Finetune/Loss (Raw)": 0.49686604738235474, "Finetune/Step": 520, "Finetune/Step Time": 8.344498379155993} {"Finetune/Learning Rate": 7.524504792593418e-07, "Finetune/Loss": 0.5621106624603271, "Finetune/Loss (Raw)": 0.48068952560424805, "Finetune/Step": 521, "Finetune/Step Time": 8.349603367969394} {"Finetune/Learning Rate": 7.488879804009204e-07, "Finetune/Loss": 0.5550142526626587, "Finetune/Loss (Raw)": 0.38803333044052124, "Finetune/Step": 522, "Finetune/Step Time": 8.343548193573952} {"Finetune/Learning Rate": 7.453288797587713e-07, "Finetune/Loss": 0.5638364553451538, "Finetune/Loss (Raw)": 0.7821810245513916, "Finetune/Step": 523, "Finetune/Step Time": 8.351520279422402} {"Finetune/Learning Rate": 7.417732254970316e-07, "Finetune/Loss": 0.5589340925216675, "Finetune/Loss (Raw)": 0.5211392641067505, "Finetune/Step": 524, "Finetune/Step Time": 8.344392282888293} {"Finetune/Learning Rate": 7.382210657331997e-07, "Finetune/Loss": 0.5611717700958252, "Finetune/Loss (Raw)": 0.5540878772735596, "Finetune/Step": 525, "Finetune/Step Time": 8.34572895988822} {"Finetune/Learning Rate": 7.346724485374835e-07, "Finetune/Loss": 0.5660703182220459, "Finetune/Loss (Raw)": 0.7018696069717407, "Finetune/Step": 526, "Finetune/Step Time": 8.343409983441234} {"Finetune/Learning Rate": 7.311274219321515e-07, "Finetune/Loss": 0.5596774816513062, "Finetune/Loss (Raw)": 0.4335139989852905, "Finetune/Step": 527, "Finetune/Step Time": 8.347329949960113} {"Finetune/Learning Rate": 7.275860338908814e-07, "Finetune/Loss": 0.5590056777000427, "Finetune/Loss (Raw)": 0.43824315071105957, "Finetune/Step": 528, "Finetune/Step Time": 8.345975356176496} {"Finetune/Learning Rate": 7.24048332338111e-07, "Finetune/Loss": 0.5536854267120361, "Finetune/Loss (Raw)": 0.4882239103317261, "Finetune/Step": 529, "Finetune/Step Time": 8.360911183059216} {"Finetune/Learning Rate": 7.205143651483906e-07, "Finetune/Loss": 0.556377649307251, "Finetune/Loss (Raw)": 0.6112726926803589, "Finetune/Step": 530, "Finetune/Step Time": 8.370106741786003} {"Finetune/Learning Rate": 7.169841801457345e-07, "Finetune/Loss": 0.5476377010345459, "Finetune/Loss (Raw)": 0.4261508584022522, "Finetune/Step": 531, "Finetune/Step Time": 8.38327263109386} {"Finetune/Learning Rate": 7.134578251029744e-07, "Finetune/Loss": 0.5486646294593811, "Finetune/Loss (Raw)": 0.6143611073493958, "Finetune/Step": 532, "Finetune/Step Time": 8.377403475344181} {"Finetune/Learning Rate": 7.099353477411112e-07, "Finetune/Loss": 0.5454484224319458, "Finetune/Loss (Raw)": 0.3762791156768799, "Finetune/Step": 533, "Finetune/Step Time": 8.379047168418765} {"Finetune/Learning Rate": 7.064167957286713e-07, "Finetune/Loss": 0.549249529838562, "Finetune/Loss (Raw)": 0.7469061613082886, "Finetune/Step": 534, "Finetune/Step Time": 8.379066290333867} {"Finetune/Learning Rate": 7.029022166810608e-07, "Finetune/Loss": 0.546907901763916, "Finetune/Loss (Raw)": 0.42437678575515747, "Finetune/Step": 535, "Finetune/Step Time": 8.381148602813482} {"Finetune/Learning Rate": 6.993916581599202e-07, "Finetune/Loss": 0.5408473014831543, "Finetune/Loss (Raw)": 0.5776993036270142, "Finetune/Step": 536, "Finetune/Step Time": 8.37838831730187} {"Finetune/Learning Rate": 6.958851676724822e-07, "Finetune/Loss": 0.5354907512664795, "Finetune/Loss (Raw)": 0.36707478761672974, "Finetune/Step": 537, "Finetune/Step Time": 8.36758209578693} {"Finetune/Learning Rate": 6.923827926709276e-07, "Finetune/Loss": 0.5271867513656616, "Finetune/Loss (Raw)": 0.3693474531173706, "Finetune/Step": 538, "Finetune/Step Time": 8.368433199822903} {"Finetune/Learning Rate": 6.888845805517447e-07, "Finetune/Loss": 0.5279525518417358, "Finetune/Loss (Raw)": 0.44853490591049194, "Finetune/Step": 539, "Finetune/Step Time": 8.374392068013549} {"Finetune/Learning Rate": 6.853905786550854e-07, "Finetune/Loss": 0.5331371426582336, "Finetune/Loss (Raw)": 0.6090960502624512, "Finetune/Step": 540, "Finetune/Step Time": 8.368003372102976} {"Finetune/Learning Rate": 6.819008342641273e-07, "Finetune/Loss": 0.5366674661636353, "Finetune/Loss (Raw)": 0.5409900546073914, "Finetune/Step": 541, "Finetune/Step Time": 8.368681266903877} {"Finetune/Learning Rate": 6.78415394604432e-07, "Finetune/Loss": 0.5297398567199707, "Finetune/Loss (Raw)": 0.4642414450645447, "Finetune/Step": 542, "Finetune/Step Time": 8.371933970600367} {"Finetune/Learning Rate": 6.749343068433065e-07, "Finetune/Loss": 0.5281941890716553, "Finetune/Loss (Raw)": 0.6382855772972107, "Finetune/Step": 543, "Finetune/Step Time": 8.373805299401283} {"Finetune/Learning Rate": 6.714576180891652e-07, "Finetune/Loss": 0.5221086740493774, "Finetune/Loss (Raw)": 0.4163326323032379, "Finetune/Step": 544, "Finetune/Step Time": 8.372549088671803} {"Finetune/Learning Rate": 6.679853753908926e-07, "Finetune/Loss": 0.5214840769767761, "Finetune/Loss (Raw)": 0.576648473739624, "Finetune/Step": 545, "Finetune/Step Time": 8.374690731987357} {"Finetune/Learning Rate": 6.645176257372054e-07, "Finetune/Loss": 0.5241678953170776, "Finetune/Loss (Raw)": 0.589178204536438, "Finetune/Step": 546, "Finetune/Step Time": 8.371096849441528} {"Finetune/Learning Rate": 6.610544160560176e-07, "Finetune/Loss": 0.5310385227203369, "Finetune/Loss (Raw)": 0.5775535702705383, "Finetune/Step": 547, "Finetune/Step Time": 8.373712258413434} {"Finetune/Learning Rate": 6.575957932138057e-07, "Finetune/Loss": 0.5340479612350464, "Finetune/Loss (Raw)": 0.5092527866363525, "Finetune/Step": 548, "Finetune/Step Time": 8.368665799498558} {"Finetune/Learning Rate": 6.541418040149739e-07, "Finetune/Loss": 0.5264758467674255, "Finetune/Loss (Raw)": 0.41796448826789856, "Finetune/Step": 549, "Finetune/Step Time": 8.374616062268615} {"Finetune/Learning Rate": 6.506924952012202e-07, "Finetune/Loss": 0.5231429934501648, "Finetune/Loss (Raw)": 0.5371323823928833, "Finetune/Step": 550, "Finetune/Step Time": 8.388060865923762} {"Finetune/Learning Rate": 6.472479134509052e-07, "Finetune/Loss": 0.5162891149520874, "Finetune/Loss (Raw)": 0.39772626757621765, "Finetune/Step": 551, "Finetune/Step Time": 8.396295811980963} {"Finetune/Learning Rate": 6.438081053784195e-07, "Finetune/Loss": 0.5188237428665161, "Finetune/Loss (Raw)": 0.5779727697372437, "Finetune/Step": 552, "Finetune/Step Time": 8.393978003412485} {"Finetune/Learning Rate": 6.40373117533553e-07, "Finetune/Loss": 0.5257651209831238, "Finetune/Loss (Raw)": 0.702813982963562, "Finetune/Step": 553, "Finetune/Step Time": 8.394250011071563} {"Finetune/Learning Rate": 6.369429964008649e-07, "Finetune/Loss": 0.5320202112197876, "Finetune/Loss (Raw)": 0.5881966352462769, "Finetune/Step": 554, "Finetune/Step Time": 8.39605613425374} {"Finetune/Learning Rate": 6.335177883990552e-07, "Finetune/Loss": 0.5256351232528687, "Finetune/Loss (Raw)": 0.5778579115867615, "Finetune/Step": 555, "Finetune/Step Time": 8.3970121499151} {"Finetune/Learning Rate": 6.300975398803361e-07, "Finetune/Loss": 0.5325769186019897, "Finetune/Loss (Raw)": 0.7432752251625061, "Finetune/Step": 556, "Finetune/Step Time": 8.379424599930644} {"Finetune/Learning Rate": 6.26682297129804e-07, "Finetune/Loss": 0.5287914872169495, "Finetune/Loss (Raw)": 0.4329557418823242, "Finetune/Step": 557, "Finetune/Step Time": 8.379423327744007} {"Finetune/Learning Rate": 6.232721063648147e-07, "Finetune/Loss": 0.5191252827644348, "Finetune/Loss (Raw)": 0.3925497233867645, "Finetune/Step": 558, "Finetune/Step Time": 8.379413271322846} {"Finetune/Learning Rate": 6.198670137343573e-07, "Finetune/Loss": 0.5179949402809143, "Finetune/Loss (Raw)": 0.3973434567451477, "Finetune/Step": 559, "Finetune/Step Time": 8.377387575805187} {"Finetune/Learning Rate": 6.164670653184284e-07, "Finetune/Loss": 0.5247922539710999, "Finetune/Loss (Raw)": 0.6557573080062866, "Finetune/Step": 560, "Finetune/Step Time": 8.37533606402576} {"Finetune/Learning Rate": 6.130723071274106e-07, "Finetune/Loss": 0.5228114128112793, "Finetune/Loss (Raw)": 0.4248366355895996, "Finetune/Step": 561, "Finetune/Step Time": 8.373040461912751} {"Finetune/Learning Rate": 6.09682785101449e-07, "Finetune/Loss": 0.5202571749687195, "Finetune/Loss (Raw)": 0.5295379161834717, "Finetune/Step": 562, "Finetune/Step Time": 8.374575931578875} {"Finetune/Learning Rate": 6.062985451098286e-07, "Finetune/Loss": 0.5216213464736938, "Finetune/Loss (Raw)": 0.4698048233985901, "Finetune/Step": 563, "Finetune/Step Time": 8.37301630526781} {"Finetune/Learning Rate": 6.029196329503547e-07, "Finetune/Loss": 0.5252275466918945, "Finetune/Loss (Raw)": 0.7297582626342773, "Finetune/Step": 564, "Finetune/Step Time": 8.360770987346768} {"Finetune/Learning Rate": 5.995460943487334e-07, "Finetune/Loss": 0.5350785255432129, "Finetune/Loss (Raw)": 0.6915113925933838, "Finetune/Step": 565, "Finetune/Step Time": 8.363747466355562} {"Finetune/Learning Rate": 5.961779749579515e-07, "Finetune/Loss": 0.530637264251709, "Finetune/Loss (Raw)": 0.6047857403755188, "Finetune/Step": 566, "Finetune/Step Time": 8.364938605576754} {"Finetune/Learning Rate": 5.928153203576595e-07, "Finetune/Loss": 0.5313167572021484, "Finetune/Loss (Raw)": 0.4461202919483185, "Finetune/Step": 567, "Finetune/Step Time": 8.363749215379357} {"Finetune/Learning Rate": 5.894581760535549e-07, "Finetune/Loss": 0.5294469594955444, "Finetune/Loss (Raw)": 0.5178666710853577, "Finetune/Step": 568, "Finetune/Step Time": 8.361235216259956} {"Finetune/Learning Rate": 5.861065874767661e-07, "Finetune/Loss": 0.5399486422538757, "Finetune/Loss (Raw)": 0.7031269073486328, "Finetune/Step": 569, "Finetune/Step Time": 8.348345497623086} {"Finetune/Learning Rate": 5.827605999832375e-07, "Finetune/Loss": 0.5468181371688843, "Finetune/Loss (Raw)": 0.5891706943511963, "Finetune/Step": 570, "Finetune/Step Time": 8.342931404709816} {"Finetune/Learning Rate": 5.794202588531166e-07, "Finetune/Loss": 0.548895001411438, "Finetune/Loss (Raw)": 0.5149953961372375, "Finetune/Step": 571, "Finetune/Step Time": 8.338869217783213} {"Finetune/Learning Rate": 5.760856092901394e-07, "Finetune/Loss": 0.5420686602592468, "Finetune/Loss (Raw)": 0.3906540274620056, "Finetune/Step": 572, "Finetune/Step Time": 8.339482609182596} {"Finetune/Learning Rate": 5.727566964210202e-07, "Finetune/Loss": 0.545730710029602, "Finetune/Loss (Raw)": 0.6581748723983765, "Finetune/Step": 573, "Finetune/Step Time": 8.333968637511134} {"Finetune/Learning Rate": 5.694335652948415e-07, "Finetune/Loss": 0.5488846302032471, "Finetune/Loss (Raw)": 0.5651683807373047, "Finetune/Step": 574, "Finetune/Step Time": 8.324928432703018} {"Finetune/Learning Rate": 5.661162608824419e-07, "Finetune/Loss": 0.5534048080444336, "Finetune/Loss (Raw)": 0.7829313278198242, "Finetune/Step": 575, "Finetune/Step Time": 8.324236646294594} {"Finetune/Learning Rate": 5.628048280758095e-07, "Finetune/Loss": 0.5633429288864136, "Finetune/Loss (Raw)": 0.7343502640724182, "Finetune/Step": 576, "Finetune/Step Time": 8.32567629404366} {"Finetune/Learning Rate": 5.594993116874749e-07, "Finetune/Loss": 0.5565583109855652, "Finetune/Loss (Raw)": 0.35954228043556213, "Finetune/Step": 577, "Finetune/Step Time": 8.319653639569879} {"Finetune/Learning Rate": 5.561997564499023e-07, "Finetune/Loss": 0.5525857210159302, "Finetune/Loss (Raw)": 0.4620548486709595, "Finetune/Step": 578, "Finetune/Step Time": 8.311710635200143} {"Finetune/Learning Rate": 5.529062070148859e-07, "Finetune/Loss": 0.5451415777206421, "Finetune/Loss (Raw)": 0.33934253454208374, "Finetune/Step": 579, "Finetune/Step Time": 8.31493010185659} {"Finetune/Learning Rate": 5.496187079529464e-07, "Finetune/Loss": 0.5482041835784912, "Finetune/Loss (Raw)": 0.6072532534599304, "Finetune/Step": 580, "Finetune/Step Time": 8.318087585270405} {"Finetune/Learning Rate": 5.46337303752726e-07, "Finetune/Loss": 0.5561789870262146, "Finetune/Loss (Raw)": 0.673159122467041, "Finetune/Step": 581, "Finetune/Step Time": 8.314368423074484} {"Finetune/Learning Rate": 5.430620388203866e-07, "Finetune/Loss": 0.5558865070343018, "Finetune/Loss (Raw)": 0.5277732610702515, "Finetune/Step": 582, "Finetune/Step Time": 8.315145201981068} {"Finetune/Learning Rate": 5.397929574790104e-07, "Finetune/Loss": 0.5556349754333496, "Finetune/Loss (Raw)": 0.3896789848804474, "Finetune/Step": 583, "Finetune/Step Time": 8.316507045179605} {"Finetune/Learning Rate": 5.365301039679984e-07, "Finetune/Loss": 0.5555466413497925, "Finetune/Loss (Raw)": 0.5751434564590454, "Finetune/Step": 584, "Finetune/Step Time": 8.321638882160187} {"Finetune/Learning Rate": 5.332735224424734e-07, "Finetune/Loss": 0.5471370220184326, "Finetune/Loss (Raw)": 0.43370625376701355, "Finetune/Step": 585, "Finetune/Step Time": 8.314531523734331} {"Finetune/Learning Rate": 5.300232569726803e-07, "Finetune/Loss": 0.5450361967086792, "Finetune/Loss (Raw)": 0.5209710597991943, "Finetune/Step": 586, "Finetune/Step Time": 8.314824050292373} {"Finetune/Learning Rate": 5.267793515433912e-07, "Finetune/Loss": 0.5465739965438843, "Finetune/Loss (Raw)": 0.627068042755127, "Finetune/Step": 587, "Finetune/Step Time": 8.316832728683949} {"Finetune/Learning Rate": 5.235418500533109e-07, "Finetune/Loss": 0.5396832227706909, "Finetune/Loss (Raw)": 0.5227707028388977, "Finetune/Step": 588, "Finetune/Step Time": 8.319935349747539} {"Finetune/Learning Rate": 5.203107963144804e-07, "Finetune/Loss": 0.5452530384063721, "Finetune/Loss (Raw)": 0.6111888289451599, "Finetune/Step": 589, "Finetune/Step Time": 8.309966204687953} {"Finetune/Learning Rate": 5.170862340516858e-07, "Finetune/Loss": 0.5499493479728699, "Finetune/Loss (Raw)": 0.5428320169448853, "Finetune/Step": 590, "Finetune/Step Time": 8.308490831404924} {"Finetune/Learning Rate": 5.138682069018669e-07, "Finetune/Loss": 0.558122992515564, "Finetune/Loss (Raw)": 0.658900797367096, "Finetune/Step": 591, "Finetune/Step Time": 8.310957968235016} {"Finetune/Learning Rate": 5.106567584135251e-07, "Finetune/Loss": 0.5590943098068237, "Finetune/Loss (Raw)": 0.6868391036987305, "Finetune/Step": 592, "Finetune/Step Time": 8.325682608410716} {"Finetune/Learning Rate": 5.074519320461357e-07, "Finetune/Loss": 0.5630652904510498, "Finetune/Loss (Raw)": 0.5519067645072937, "Finetune/Step": 593, "Finetune/Step Time": 8.321094933897257} {"Finetune/Learning Rate": 5.042537711695583e-07, "Finetune/Loss": 0.5623278021812439, "Finetune/Loss (Raw)": 0.5059400200843811, "Finetune/Step": 594, "Finetune/Step Time": 8.322293322533369} {"Finetune/Learning Rate": 5.010623190634507e-07, "Finetune/Loss": 0.5635894536972046, "Finetune/Loss (Raw)": 0.5101783871650696, "Finetune/Step": 595, "Finetune/Step Time": 8.320961000397801} {"Finetune/Learning Rate": 4.978776189166839e-07, "Finetune/Loss": 0.5552474856376648, "Finetune/Loss (Raw)": 0.46281421184539795, "Finetune/Step": 596, "Finetune/Step Time": 8.324716236442327} {"Finetune/Learning Rate": 4.946997138267561e-07, "Finetune/Loss": 0.5491765737533569, "Finetune/Loss (Raw)": 0.4972403049468994, "Finetune/Step": 597, "Finetune/Step Time": 8.322135793045163} {"Finetune/Learning Rate": 4.915286467992097e-07, "Finetune/Loss": 0.551352858543396, "Finetune/Loss (Raw)": 0.6744298338890076, "Finetune/Step": 598, "Finetune/Step Time": 8.31998129747808} {"Finetune/Learning Rate": 4.883644607470517e-07, "Finetune/Loss": 0.5470731854438782, "Finetune/Loss (Raw)": 0.3091697096824646, "Finetune/Step": 599, "Finetune/Step Time": 8.322240591049194} {"Finetune/Learning Rate": 4.852071984901696e-07, "Finetune/Loss": 0.5456486344337463, "Finetune/Loss (Raw)": 0.47228002548217773, "Finetune/Step": 600, "Finetune/Step Time": 8.324567805975676} {"Finetune/Learning Rate": 4.820569027547533e-07, "Finetune/Loss": 0.5407305359840393, "Finetune/Loss (Raw)": 0.5457478761672974, "Finetune/Step": 601, "Finetune/Step Time": 8.328713595867157} {"Finetune/Learning Rate": 4.789136161727184e-07, "Finetune/Loss": 0.5377331972122192, "Finetune/Loss (Raw)": 0.4932549297809601, "Finetune/Step": 602, "Finetune/Step Time": 8.317004205659032} {"Finetune/Learning Rate": 4.7577738128112697e-07, "Finetune/Loss": 0.5401453971862793, "Finetune/Loss (Raw)": 0.5921869277954102, "Finetune/Step": 603, "Finetune/Step Time": 8.305700397118926} {"Finetune/Learning Rate": 4.7264824052161243e-07, "Finetune/Loss": 0.5434533357620239, "Finetune/Loss (Raw)": 0.4965066909790039, "Finetune/Step": 604, "Finetune/Step Time": 8.308139553293586} {"Finetune/Learning Rate": 4.6952623623980736e-07, "Finetune/Loss": 0.5397113561630249, "Finetune/Loss (Raw)": 0.5384323596954346, "Finetune/Step": 605, "Finetune/Step Time": 8.306985192000866} {"Finetune/Learning Rate": 4.664114106847666e-07, "Finetune/Loss": 0.5337201952934265, "Finetune/Loss (Raw)": 0.3734516501426697, "Finetune/Step": 606, "Finetune/Step Time": 8.30649784579873} {"Finetune/Learning Rate": 4.6330380600839956e-07, "Finetune/Loss": 0.5294575691223145, "Finetune/Loss (Raw)": 0.6465276479721069, "Finetune/Step": 607, "Finetune/Step Time": 8.30766418389976} {"Finetune/Learning Rate": 4.6020346426489677e-07, "Finetune/Loss": 0.5279605388641357, "Finetune/Loss (Raw)": 0.6864449381828308, "Finetune/Step": 608, "Finetune/Step Time": 8.30939924903214} {"Finetune/Learning Rate": 4.5711042741016147e-07, "Finetune/Loss": 0.532565712928772, "Finetune/Loss (Raw)": 0.5069094896316528, "Finetune/Step": 609, "Finetune/Step Time": 8.304205399006605} {"Finetune/Learning Rate": 4.540247373012439e-07, "Finetune/Loss": 0.5366933941841125, "Finetune/Loss (Raw)": 0.5941404104232788, "Finetune/Step": 610, "Finetune/Step Time": 8.302259255200624} {"Finetune/Learning Rate": 4.5094643569577185e-07, "Finetune/Loss": 0.5460551381111145, "Finetune/Loss (Raw)": 0.6389173865318298, "Finetune/Step": 611, "Finetune/Step Time": 8.301684655249119} {"Finetune/Learning Rate": 4.4787556425138674e-07, "Finetune/Loss": 0.5428253412246704, "Finetune/Loss (Raw)": 0.5039008855819702, "Finetune/Step": 612, "Finetune/Step Time": 8.296958647668362} {"Finetune/Learning Rate": 4.4481216452518154e-07, "Finetune/Loss": 0.5385921001434326, "Finetune/Loss (Raw)": 0.5376946926116943, "Finetune/Step": 613, "Finetune/Step Time": 8.283465454354882} {"Finetune/Learning Rate": 4.417562779731354e-07, "Finetune/Loss": 0.5326421856880188, "Finetune/Loss (Raw)": 0.33737635612487793, "Finetune/Step": 614, "Finetune/Step Time": 8.282165441662073} {"Finetune/Learning Rate": 4.3870794594955464e-07, "Finetune/Loss": 0.5395115613937378, "Finetune/Loss (Raw)": 0.6094971299171448, "Finetune/Step": 615, "Finetune/Step Time": 8.27672104537487} {"Finetune/Learning Rate": 4.356672097065134e-07, "Finetune/Loss": 0.5373699069023132, "Finetune/Loss (Raw)": 0.5066120624542236, "Finetune/Step": 616, "Finetune/Step Time": 8.27913599461317} {"Finetune/Learning Rate": 4.3263411039329345e-07, "Finetune/Loss": 0.5331211090087891, "Finetune/Loss (Raw)": 0.29774391651153564, "Finetune/Step": 617, "Finetune/Step Time": 8.275354901328683} {"Finetune/Learning Rate": 4.296086890558289e-07, "Finetune/Loss": 0.5319308638572693, "Finetune/Loss (Raw)": 0.4828830361366272, "Finetune/Step": 618, "Finetune/Step Time": 8.274210289120674} {"Finetune/Learning Rate": 4.26590986636151e-07, "Finetune/Loss": 0.5278881788253784, "Finetune/Loss (Raw)": 0.497703492641449, "Finetune/Step": 619, "Finetune/Step Time": 8.269098222255707} {"Finetune/Learning Rate": 4.2358104397183257e-07, "Finetune/Loss": 0.5322997570037842, "Finetune/Loss (Raw)": 0.663939356803894, "Finetune/Step": 620, "Finetune/Step Time": 8.27540585771203} {"Finetune/Learning Rate": 4.205789017954363e-07, "Finetune/Loss": 0.527165412902832, "Finetune/Loss (Raw)": 0.44688960909843445, "Finetune/Step": 621, "Finetune/Step Time": 8.273714438080788} {"Finetune/Learning Rate": 4.175846007339643e-07, "Finetune/Loss": 0.5256209969520569, "Finetune/Loss (Raw)": 0.49341195821762085, "Finetune/Step": 622, "Finetune/Step Time": 8.262986114248633} {"Finetune/Learning Rate": 4.1459818130830616e-07, "Finetune/Loss": 0.5226724147796631, "Finetune/Loss (Raw)": 0.5645468831062317, "Finetune/Step": 623, "Finetune/Step Time": 8.270471984520555} {"Finetune/Learning Rate": 4.116196839326932e-07, "Finetune/Loss": 0.5172016620635986, "Finetune/Loss (Raw)": 0.5117740631103516, "Finetune/Step": 624, "Finetune/Step Time": 8.269429247826338} {"Finetune/Learning Rate": 4.086491489141494e-07, "Finetune/Loss": 0.517922043800354, "Finetune/Loss (Raw)": 0.574958086013794, "Finetune/Step": 625, "Finetune/Step Time": 8.276022853329778} {"Finetune/Learning Rate": 4.056866164519465e-07, "Finetune/Loss": 0.5195438861846924, "Finetune/Loss (Raw)": 0.5578400492668152, "Finetune/Step": 626, "Finetune/Step Time": 8.266029564663768} {"Finetune/Learning Rate": 4.0273212663706146e-07, "Finetune/Loss": 0.5213897228240967, "Finetune/Loss (Raw)": 0.5692455768585205, "Finetune/Step": 627, "Finetune/Step Time": 8.249949358403683} {"Finetune/Learning Rate": 3.9978571945163187e-07, "Finetune/Loss": 0.5164872407913208, "Finetune/Loss (Raw)": 0.3059343695640564, "Finetune/Step": 628, "Finetune/Step Time": 8.256957871839404} {"Finetune/Learning Rate": 3.9684743476841555e-07, "Finetune/Loss": 0.5169044733047485, "Finetune/Loss (Raw)": 0.5105917453765869, "Finetune/Step": 629, "Finetune/Step Time": 8.257525119930506} {"Finetune/Learning Rate": 3.9391731235025227e-07, "Finetune/Loss": 0.5067298412322998, "Finetune/Loss (Raw)": 0.34884005784988403, "Finetune/Step": 630, "Finetune/Step Time": 8.246633859351277} {"Finetune/Learning Rate": 3.9099539184952333e-07, "Finetune/Loss": 0.5060752630233765, "Finetune/Loss (Raw)": 0.2882236838340759, "Finetune/Step": 631, "Finetune/Step Time": 8.246334599331021} {"Finetune/Learning Rate": 3.8808171280761657e-07, "Finetune/Loss": 0.5067206621170044, "Finetune/Loss (Raw)": 0.49293315410614014, "Finetune/Step": 632, "Finetune/Step Time": 8.251604650169611} {"Finetune/Learning Rate": 3.851763146543916e-07, "Finetune/Loss": 0.5104818940162659, "Finetune/Loss (Raw)": 0.6661067008972168, "Finetune/Step": 633, "Finetune/Step Time": 8.23848425783217} {"Finetune/Learning Rate": 3.822792367076446e-07, "Finetune/Loss": 0.5096858143806458, "Finetune/Loss (Raw)": 0.4677817225456238, "Finetune/Step": 634, "Finetune/Step Time": 8.240239737555385} {"Finetune/Learning Rate": 3.793905181725772e-07, "Finetune/Loss": 0.4969560503959656, "Finetune/Loss (Raw)": 0.18483400344848633, "Finetune/Step": 635, "Finetune/Step Time": 8.239155665040016} {"Finetune/Learning Rate": 3.765101981412665e-07, "Finetune/Loss": 0.5019855499267578, "Finetune/Loss (Raw)": 0.6574516296386719, "Finetune/Step": 636, "Finetune/Step Time": 8.24243300408125} {"Finetune/Learning Rate": 3.73638315592135e-07, "Finetune/Loss": 0.5009574890136719, "Finetune/Loss (Raw)": 0.5055341124534607, "Finetune/Step": 637, "Finetune/Step Time": 8.243898015469313} {"Finetune/Learning Rate": 3.70774909389423e-07, "Finetune/Loss": 0.5092203617095947, "Finetune/Loss (Raw)": 0.6378625631332397, "Finetune/Step": 638, "Finetune/Step Time": 8.245446655899286} {"Finetune/Learning Rate": 3.679200182826645e-07, "Finetune/Loss": 0.5002419948577881, "Finetune/Loss (Raw)": 0.359220027923584, "Finetune/Step": 639, "Finetune/Step Time": 8.243626214563847} {"Finetune/Learning Rate": 3.6507368090616006e-07, "Finetune/Loss": 0.49534302949905396, "Finetune/Loss (Raw)": 0.5296787619590759, "Finetune/Step": 640, "Finetune/Step Time": 8.248841520398855} {"Finetune/Learning Rate": 3.622359357784569e-07, "Finetune/Loss": 0.49902331829071045, "Finetune/Loss (Raw)": 0.6246786117553711, "Finetune/Step": 641, "Finetune/Step Time": 8.245410541072488} {"Finetune/Learning Rate": 3.5940682130182486e-07, "Finetune/Loss": 0.498426616191864, "Finetune/Loss (Raw)": 0.5750458240509033, "Finetune/Step": 642, "Finetune/Step Time": 8.237708140164614} {"Finetune/Learning Rate": 3.5658637576173845e-07, "Finetune/Loss": 0.49992480874061584, "Finetune/Loss (Raw)": 0.6868606209754944, "Finetune/Step": 643, "Finetune/Step Time": 8.231156079098582} {"Finetune/Learning Rate": 3.5377463732635895e-07, "Finetune/Loss": 0.49541807174682617, "Finetune/Loss (Raw)": 0.3596850037574768, "Finetune/Step": 644, "Finetune/Step Time": 8.23342852666974} {"Finetune/Learning Rate": 3.509716440460163e-07, "Finetune/Loss": 0.4993836581707001, "Finetune/Loss (Raw)": 0.6645931005477905, "Finetune/Step": 645, "Finetune/Step Time": 8.22019542939961} {"Finetune/Learning Rate": 3.4817743385269535e-07, "Finetune/Loss": 0.5020940899848938, "Finetune/Loss (Raw)": 0.42410948872566223, "Finetune/Step": 646, "Finetune/Step Time": 8.221884440630674} {"Finetune/Learning Rate": 3.453920445595233e-07, "Finetune/Loss": 0.4980165660381317, "Finetune/Loss (Raw)": 0.4790174663066864, "Finetune/Step": 647, "Finetune/Step Time": 8.211020385846496} {"Finetune/Learning Rate": 3.426155138602558e-07, "Finetune/Loss": 0.49678850173950195, "Finetune/Loss (Raw)": 0.4673140048980713, "Finetune/Step": 648, "Finetune/Step Time": 8.217494761571288} {"Finetune/Learning Rate": 3.398478793287681e-07, "Finetune/Loss": 0.507292628288269, "Finetune/Loss (Raw)": 0.6338764429092407, "Finetune/Step": 649, "Finetune/Step Time": 8.214572684839368} {"Finetune/Learning Rate": 3.3708917841854777e-07, "Finetune/Loss": 0.5069860219955444, "Finetune/Loss (Raw)": 0.47307032346725464, "Finetune/Step": 650, "Finetune/Step Time": 8.21842877753079} {"Finetune/Learning Rate": 3.343394484621854e-07, "Finetune/Loss": 0.5089740753173828, "Finetune/Loss (Raw)": 0.5613225102424622, "Finetune/Step": 651, "Finetune/Step Time": 8.210931783542037} {"Finetune/Learning Rate": 3.3159872667087076e-07, "Finetune/Loss": 0.504582941532135, "Finetune/Loss (Raw)": 0.5234217047691345, "Finetune/Step": 652, "Finetune/Step Time": 8.220149541273713} {"Finetune/Learning Rate": 3.288670501338899e-07, "Finetune/Loss": 0.5028582811355591, "Finetune/Loss (Raw)": 0.3917011022567749, "Finetune/Step": 653, "Finetune/Step Time": 8.221522584557533} {"Finetune/Learning Rate": 3.261444558181218e-07, "Finetune/Loss": 0.5058507919311523, "Finetune/Loss (Raw)": 0.5891727209091187, "Finetune/Step": 654, "Finetune/Step Time": 8.21879006177187} {"Finetune/Learning Rate": 3.2343098056753816e-07, "Finetune/Loss": 0.5079330205917358, "Finetune/Loss (Raw)": 0.631177544593811, "Finetune/Step": 655, "Finetune/Step Time": 8.21283758804202} {"Finetune/Learning Rate": 3.2072666110270687e-07, "Finetune/Loss": 0.5137085914611816, "Finetune/Loss (Raw)": 0.6965910196304321, "Finetune/Step": 656, "Finetune/Step Time": 8.218798918649554} {"Finetune/Learning Rate": 3.1803153402029205e-07, "Finetune/Loss": 0.5128712058067322, "Finetune/Loss (Raw)": 0.5481630563735962, "Finetune/Step": 657, "Finetune/Step Time": 8.21494516916573} {"Finetune/Learning Rate": 3.1534563579256166e-07, "Finetune/Loss": 0.5045182704925537, "Finetune/Loss (Raw)": 0.29054540395736694, "Finetune/Step": 658, "Finetune/Step Time": 8.215702768415213} {"Finetune/Learning Rate": 3.126690027668918e-07, "Finetune/Loss": 0.5000544786453247, "Finetune/Loss (Raw)": 0.4264044165611267, "Finetune/Step": 659, "Finetune/Step Time": 8.208429342135787} {"Finetune/Learning Rate": 3.100016711652752e-07, "Finetune/Loss": 0.504601240158081, "Finetune/Loss (Raw)": 0.4514305591583252, "Finetune/Step": 660, "Finetune/Step Time": 8.21028696745634} {"Finetune/Learning Rate": 3.073436770838329e-07, "Finetune/Loss": 0.5027679204940796, "Finetune/Loss (Raw)": 0.4519270956516266, "Finetune/Step": 661, "Finetune/Step Time": 8.223989171907306} {"Finetune/Learning Rate": 3.046950564923233e-07, "Finetune/Loss": 0.5103476047515869, "Finetune/Loss (Raw)": 0.591388463973999, "Finetune/Step": 662, "Finetune/Step Time": 8.221908748149872} {"Finetune/Learning Rate": 3.020558452336562e-07, "Finetune/Loss": 0.5159671306610107, "Finetune/Loss (Raw)": 0.4680500626564026, "Finetune/Step": 663, "Finetune/Step Time": 8.21150828152895} {"Finetune/Learning Rate": 2.9942607902340944e-07, "Finetune/Loss": 0.5164834856987, "Finetune/Loss (Raw)": 0.5094554424285889, "Finetune/Step": 664, "Finetune/Step Time": 8.212374415248632} {"Finetune/Learning Rate": 2.968057934493425e-07, "Finetune/Loss": 0.513717532157898, "Finetune/Loss (Raw)": 0.5775968432426453, "Finetune/Step": 665, "Finetune/Step Time": 8.229007670655847} {"Finetune/Learning Rate": 2.941950239709171e-07, "Finetune/Loss": 0.514220118522644, "Finetune/Loss (Raw)": 0.483864426612854, "Finetune/Step": 666, "Finetune/Step Time": 8.229868462309241} {"Finetune/Learning Rate": 2.915938059188178e-07, "Finetune/Loss": 0.5209416747093201, "Finetune/Loss (Raw)": 0.39992353320121765, "Finetune/Step": 667, "Finetune/Step Time": 8.224602485075593} {"Finetune/Learning Rate": 2.8900217449447073e-07, "Finetune/Loss": 0.5140461325645447, "Finetune/Loss (Raw)": 0.43679386377334595, "Finetune/Step": 668, "Finetune/Step Time": 8.224046051502228} {"Finetune/Learning Rate": 2.864201647695714e-07, "Finetune/Loss": 0.5123769044876099, "Finetune/Loss (Raw)": 0.45211926102638245, "Finetune/Step": 669, "Finetune/Step Time": 8.230557020753622} {"Finetune/Learning Rate": 2.838478116856069e-07, "Finetune/Loss": 0.5120682120323181, "Finetune/Loss (Raw)": 0.6279834508895874, "Finetune/Step": 670, "Finetune/Step Time": 8.225143942981958} {"Finetune/Learning Rate": 2.812851500533843e-07, "Finetune/Loss": 0.5158766508102417, "Finetune/Loss (Raw)": 0.4810901880264282, "Finetune/Step": 671, "Finetune/Step Time": 8.221386767923832} {"Finetune/Learning Rate": 2.7873221455256003e-07, "Finetune/Loss": 0.5078751444816589, "Finetune/Loss (Raw)": 0.2736321985721588, "Finetune/Step": 672, "Finetune/Step Time": 8.221263149753213} {"Finetune/Learning Rate": 2.7618903973116926e-07, "Finetune/Loss": 0.5073752403259277, "Finetune/Loss (Raw)": 0.6086806058883667, "Finetune/Step": 673, "Finetune/Step Time": 8.21725843474269} {"Finetune/Learning Rate": 2.736556600051593e-07, "Finetune/Loss": 0.49834781885147095, "Finetune/Loss (Raw)": 0.28616824746131897, "Finetune/Step": 674, "Finetune/Step Time": 8.217052618041635} {"Finetune/Learning Rate": 2.711321096579241e-07, "Finetune/Loss": 0.48392194509506226, "Finetune/Loss (Raw)": 0.22523270547389984, "Finetune/Step": 675, "Finetune/Step Time": 8.212683867663145} {"Finetune/Learning Rate": 2.686184228398395e-07, "Finetune/Loss": 0.4864746034145355, "Finetune/Loss (Raw)": 0.44137102365493774, "Finetune/Step": 676, "Finetune/Step Time": 8.214132007211447} {"Finetune/Learning Rate": 2.6611463356780093e-07, "Finetune/Loss": 0.4841887354850769, "Finetune/Loss (Raw)": 0.591444730758667, "Finetune/Step": 677, "Finetune/Step Time": 8.213763613253832} {"Finetune/Learning Rate": 2.6362077572476494e-07, "Finetune/Loss": 0.48853886127471924, "Finetune/Loss (Raw)": 0.5633131265640259, "Finetune/Step": 678, "Finetune/Step Time": 8.210540615022182} {"Finetune/Learning Rate": 2.611368830592877e-07, "Finetune/Loss": 0.48885464668273926, "Finetune/Loss (Raw)": 0.489122599363327, "Finetune/Step": 679, "Finetune/Step Time": 8.207799911499023} {"Finetune/Learning Rate": 2.5866298918507157e-07, "Finetune/Loss": 0.49059972167015076, "Finetune/Loss (Raw)": 0.523155927658081, "Finetune/Step": 680, "Finetune/Step Time": 8.204986015334725} {"Finetune/Learning Rate": 2.561991275805072e-07, "Finetune/Loss": 0.4871780574321747, "Finetune/Loss (Raw)": 0.524384617805481, "Finetune/Step": 681, "Finetune/Step Time": 8.21272348985076} {"Finetune/Learning Rate": 2.537453315882222e-07, "Finetune/Loss": 0.48634567856788635, "Finetune/Loss (Raw)": 0.44643306732177734, "Finetune/Step": 682, "Finetune/Step Time": 8.213495522737503} {"Finetune/Learning Rate": 2.513016344146303e-07, "Finetune/Loss": 0.4810183346271515, "Finetune/Loss (Raw)": 0.3908478319644928, "Finetune/Step": 683, "Finetune/Step Time": 8.208796007558703} {"Finetune/Learning Rate": 2.4886806912948033e-07, "Finetune/Loss": 0.4794929623603821, "Finetune/Loss (Raw)": 0.47460854053497314, "Finetune/Step": 684, "Finetune/Step Time": 8.217704808339477} {"Finetune/Learning Rate": 2.4644466866540957e-07, "Finetune/Loss": 0.48219892382621765, "Finetune/Loss (Raw)": 0.47829389572143555, "Finetune/Step": 685, "Finetune/Step Time": 8.219274019822478} {"Finetune/Learning Rate": 2.440314658174992e-07, "Finetune/Loss": 0.47811126708984375, "Finetune/Loss (Raw)": 0.4583669900894165, "Finetune/Step": 686, "Finetune/Step Time": 8.217759342864156} {"Finetune/Learning Rate": 2.4162849324282853e-07, "Finetune/Loss": 0.47507309913635254, "Finetune/Loss (Raw)": 0.5339555144309998, "Finetune/Step": 687, "Finetune/Step Time": 8.220146518200636} {"Finetune/Learning Rate": 2.3923578346003357e-07, "Finetune/Loss": 0.4719434380531311, "Finetune/Loss (Raw)": 0.596442461013794, "Finetune/Step": 688, "Finetune/Step Time": 8.222236528992653} {"Finetune/Learning Rate": 2.3685336884886865e-07, "Finetune/Loss": 0.4687420129776001, "Finetune/Loss (Raw)": 0.44571763277053833, "Finetune/Step": 689, "Finetune/Step Time": 8.228867493569851} {"Finetune/Learning Rate": 2.344812816497659e-07, "Finetune/Loss": 0.4670864939689636, "Finetune/Loss (Raw)": 0.23756885528564453, "Finetune/Step": 690, "Finetune/Step Time": 8.223947240039706} {"Finetune/Learning Rate": 2.3211955396339998e-07, "Finetune/Loss": 0.459225058555603, "Finetune/Loss (Raw)": 0.1748388558626175, "Finetune/Step": 691, "Finetune/Step Time": 8.22298500686884} {"Finetune/Learning Rate": 2.2976821775025458e-07, "Finetune/Loss": 0.4669884741306305, "Finetune/Loss (Raw)": 0.6998598575592041, "Finetune/Step": 692, "Finetune/Step Time": 8.23314605653286} {"Finetune/Learning Rate": 2.27427304830188e-07, "Finetune/Loss": 0.4651643633842468, "Finetune/Loss (Raw)": 0.39355573058128357, "Finetune/Step": 693, "Finetune/Step Time": 8.23782648332417} {"Finetune/Learning Rate": 2.250968468820038e-07, "Finetune/Loss": 0.45940321683883667, "Finetune/Loss (Raw)": 0.4070315659046173, "Finetune/Step": 694, "Finetune/Step Time": 8.235362300649285} {"Finetune/Learning Rate": 2.2277687544302248e-07, "Finetune/Loss": 0.45652398467063904, "Finetune/Loss (Raw)": 0.3759145140647888, "Finetune/Step": 695, "Finetune/Step Time": 8.23318818025291} {"Finetune/Learning Rate": 2.204674219086531e-07, "Finetune/Loss": 0.4547576308250427, "Finetune/Loss (Raw)": 0.45293134450912476, "Finetune/Step": 696, "Finetune/Step Time": 8.232473943382502} {"Finetune/Learning Rate": 2.181685175319702e-07, "Finetune/Loss": 0.44768762588500977, "Finetune/Loss (Raw)": 0.3513575792312622, "Finetune/Step": 697, "Finetune/Step Time": 8.228443775326014} {"Finetune/Learning Rate": 2.1588019342328966e-07, "Finetune/Loss": 0.45380663871765137, "Finetune/Loss (Raw)": 0.6796718835830688, "Finetune/Step": 698, "Finetune/Step Time": 8.22476595826447} {"Finetune/Learning Rate": 2.1360248054974784e-07, "Finetune/Loss": 0.4548926055431366, "Finetune/Loss (Raw)": 0.43467554450035095, "Finetune/Step": 699, "Finetune/Step Time": 8.22501708008349} {"Finetune/Learning Rate": 2.1133540973488338e-07, "Finetune/Loss": 0.4548181891441345, "Finetune/Loss (Raw)": 0.43441128730773926, "Finetune/Step": 700, "Finetune/Step Time": 8.22489994391799} {"Finetune/Learning Rate": 2.0907901165821906e-07, "Finetune/Loss": 0.451925665140152, "Finetune/Loss (Raw)": 0.35955846309661865, "Finetune/Step": 701, "Finetune/Step Time": 8.2273690700531} {"Finetune/Learning Rate": 2.068333168548465e-07, "Finetune/Loss": 0.4501837491989136, "Finetune/Loss (Raw)": 0.5722428560256958, "Finetune/Step": 702, "Finetune/Step Time": 8.234095817431808} {"Finetune/Learning Rate": 2.0459835571501482e-07, "Finetune/Loss": 0.44986385107040405, "Finetune/Loss (Raw)": 0.4708532691001892, "Finetune/Step": 703, "Finetune/Step Time": 8.23223340511322} {"Finetune/Learning Rate": 2.0237415848371664e-07, "Finetune/Loss": 0.4544259011745453, "Finetune/Loss (Raw)": 0.41961753368377686, "Finetune/Step": 704, "Finetune/Step Time": 8.236570689827204} {"Finetune/Learning Rate": 2.0016075526028065e-07, "Finetune/Loss": 0.4552956819534302, "Finetune/Loss (Raw)": 0.6365131139755249, "Finetune/Step": 705, "Finetune/Step Time": 8.24315414018929} {"Finetune/Learning Rate": 1.9795817599796416e-07, "Finetune/Loss": 0.4616260528564453, "Finetune/Loss (Raw)": 0.4887404441833496, "Finetune/Step": 706, "Finetune/Step Time": 8.247865559533238} {"Finetune/Learning Rate": 1.957664505035468e-07, "Finetune/Loss": 0.4760374128818512, "Finetune/Loss (Raw)": 0.686396598815918, "Finetune/Step": 707, "Finetune/Step Time": 8.246522096917033} {"Finetune/Learning Rate": 1.9358560843692784e-07, "Finetune/Loss": 0.4823299050331116, "Finetune/Loss (Raw)": 0.6427305936813354, "Finetune/Step": 708, "Finetune/Step Time": 8.243212424218655} {"Finetune/Learning Rate": 1.9141567931072522e-07, "Finetune/Loss": 0.4771655201911926, "Finetune/Loss (Raw)": 0.42618513107299805, "Finetune/Step": 709, "Finetune/Step Time": 8.248615542426705} {"Finetune/Learning Rate": 1.8925669248987508e-07, "Finetune/Loss": 0.47323375940322876, "Finetune/Loss (Raw)": 0.4374958574771881, "Finetune/Step": 710, "Finetune/Step Time": 8.243092976510525} {"Finetune/Learning Rate": 1.871086771912348e-07, "Finetune/Loss": 0.47067344188690186, "Finetune/Loss (Raw)": 0.40719282627105713, "Finetune/Step": 711, "Finetune/Step Time": 8.240001939237118} {"Finetune/Learning Rate": 1.8497166248318874e-07, "Finetune/Loss": 0.464697003364563, "Finetune/Loss (Raw)": 0.33190950751304626, "Finetune/Step": 712, "Finetune/Step Time": 8.240705540403724} {"Finetune/Learning Rate": 1.8284567728525257e-07, "Finetune/Loss": 0.4584384560585022, "Finetune/Loss (Raw)": 0.3241111934185028, "Finetune/Step": 713, "Finetune/Step Time": 8.246419301256537} {"Finetune/Learning Rate": 1.8073075036768459e-07, "Finetune/Loss": 0.45920318365097046, "Finetune/Loss (Raw)": 0.47090375423431396, "Finetune/Step": 714, "Finetune/Step Time": 8.23013542406261} {"Finetune/Learning Rate": 1.78626910351094e-07, "Finetune/Loss": 0.45780259370803833, "Finetune/Loss (Raw)": 0.3460298478603363, "Finetune/Step": 715, "Finetune/Step Time": 8.226184971630573} {"Finetune/Learning Rate": 1.765341857060547e-07, "Finetune/Loss": 0.4630092978477478, "Finetune/Loss (Raw)": 0.6412231922149658, "Finetune/Step": 716, "Finetune/Step Time": 8.214238127693534} {"Finetune/Learning Rate": 1.7445260475272073e-07, "Finetune/Loss": 0.4644228219985962, "Finetune/Loss (Raw)": 0.5235264301300049, "Finetune/Step": 717, "Finetune/Step Time": 8.226265596225858} {"Finetune/Learning Rate": 1.7238219566044144e-07, "Finetune/Loss": 0.46186167001724243, "Finetune/Loss (Raw)": 0.37641045451164246, "Finetune/Step": 718, "Finetune/Step Time": 8.222414206713438} {"Finetune/Learning Rate": 1.7032298644738108e-07, "Finetune/Loss": 0.4617343544960022, "Finetune/Loss (Raw)": 0.5298808813095093, "Finetune/Step": 719, "Finetune/Step Time": 8.210768362507224} {"Finetune/Learning Rate": 1.6827500498014024e-07, "Finetune/Loss": 0.4574926793575287, "Finetune/Loss (Raw)": 0.4607093930244446, "Finetune/Step": 720, "Finetune/Step Time": 8.19920831732452} {"Finetune/Learning Rate": 1.662382789733776e-07, "Finetune/Loss": 0.4597262740135193, "Finetune/Loss (Raw)": 0.5171921253204346, "Finetune/Step": 721, "Finetune/Step Time": 8.20565582625568} {"Finetune/Learning Rate": 1.6421283598943525e-07, "Finetune/Loss": 0.46557867527008057, "Finetune/Loss (Raw)": 0.42484617233276367, "Finetune/Step": 722, "Finetune/Step Time": 8.202447146177292} {"Finetune/Learning Rate": 1.621987034379666e-07, "Finetune/Loss": 0.4748958349227905, "Finetune/Loss (Raw)": 0.47298794984817505, "Finetune/Step": 723, "Finetune/Step Time": 8.203017421066761} {"Finetune/Learning Rate": 1.601959085755641e-07, "Finetune/Loss": 0.465138703584671, "Finetune/Loss (Raw)": 0.3876311182975769, "Finetune/Step": 724, "Finetune/Step Time": 8.203670939430594} {"Finetune/Learning Rate": 1.5820447850539075e-07, "Finetune/Loss": 0.4670618176460266, "Finetune/Loss (Raw)": 0.455095112323761, "Finetune/Step": 725, "Finetune/Step Time": 8.208265967667103} {"Finetune/Learning Rate": 1.5622444017681436e-07, "Finetune/Loss": 0.4697716236114502, "Finetune/Loss (Raw)": 0.49374574422836304, "Finetune/Step": 726, "Finetune/Step Time": 8.202389981597662} {"Finetune/Learning Rate": 1.542558203850416e-07, "Finetune/Loss": 0.4769960641860962, "Finetune/Loss (Raw)": 0.6070969104766846, "Finetune/Step": 727, "Finetune/Step Time": 8.201148688793182} {"Finetune/Learning Rate": 1.5229864577075548e-07, "Finetune/Loss": 0.4859362244606018, "Finetune/Loss (Raw)": 0.7390159368515015, "Finetune/Step": 728, "Finetune/Step Time": 8.201156178489327} {"Finetune/Learning Rate": 1.5035294281975597e-07, "Finetune/Loss": 0.4928450882434845, "Finetune/Loss (Raw)": 0.5724420547485352, "Finetune/Step": 729, "Finetune/Step Time": 8.207849340513349} {"Finetune/Learning Rate": 1.4841873786260017e-07, "Finetune/Loss": 0.4856604039669037, "Finetune/Loss (Raw)": 0.4497615694999695, "Finetune/Step": 730, "Finetune/Step Time": 8.202583337202668} {"Finetune/Learning Rate": 1.4649605707424706e-07, "Finetune/Loss": 0.48320573568344116, "Finetune/Loss (Raw)": 0.35612666606903076, "Finetune/Step": 731, "Finetune/Step Time": 8.206991421058774} {"Finetune/Learning Rate": 1.4458492647370258e-07, "Finetune/Loss": 0.48824381828308105, "Finetune/Loss (Raw)": 0.595629870891571, "Finetune/Step": 732, "Finetune/Step Time": 8.207549231126904} {"Finetune/Learning Rate": 1.426853719236676e-07, "Finetune/Loss": 0.49535036087036133, "Finetune/Loss (Raw)": 0.586967945098877, "Finetune/Step": 733, "Finetune/Step Time": 8.212569415569305} {"Finetune/Learning Rate": 1.4079741913018862e-07, "Finetune/Loss": 0.4938738942146301, "Finetune/Loss (Raw)": 0.5249958038330078, "Finetune/Step": 734, "Finetune/Step Time": 8.209086967632174} {"Finetune/Learning Rate": 1.3892109364230908e-07, "Finetune/Loss": 0.49139758944511414, "Finetune/Loss (Raw)": 0.39161139726638794, "Finetune/Step": 735, "Finetune/Step Time": 8.207228649407625} {"Finetune/Learning Rate": 1.3705642085172365e-07, "Finetune/Loss": 0.49561941623687744, "Finetune/Loss (Raw)": 0.5547173023223877, "Finetune/Step": 736, "Finetune/Step Time": 8.192445589229465} {"Finetune/Learning Rate": 1.352034259924355e-07, "Finetune/Loss": 0.489141047000885, "Finetune/Loss (Raw)": 0.42920371890068054, "Finetune/Step": 737, "Finetune/Step Time": 8.198311023414135} {"Finetune/Learning Rate": 1.3336213414041385e-07, "Finetune/Loss": 0.485382616519928, "Finetune/Loss (Raw)": 0.36847126483917236, "Finetune/Step": 738, "Finetune/Step Time": 8.193595174700022} {"Finetune/Learning Rate": 1.315325702132548e-07, "Finetune/Loss": 0.4808560609817505, "Finetune/Loss (Raw)": 0.5415461659431458, "Finetune/Step": 739, "Finetune/Step Time": 8.19452346675098} {"Finetune/Learning Rate": 1.2971475896984475e-07, "Finetune/Loss": 0.47755658626556396, "Finetune/Loss (Raw)": 0.5371484756469727, "Finetune/Step": 740, "Finetune/Step Time": 8.20343174599111} {"Finetune/Learning Rate": 1.279087250100247e-07, "Finetune/Loss": 0.48923617601394653, "Finetune/Loss (Raw)": 0.7999305129051208, "Finetune/Step": 741, "Finetune/Step Time": 8.217053532600403} {"Finetune/Learning Rate": 1.2611449277425712e-07, "Finetune/Loss": 0.4900434613227844, "Finetune/Loss (Raw)": 0.46332991123199463, "Finetune/Step": 742, "Finetune/Step Time": 8.21554071456194} {"Finetune/Learning Rate": 1.2433208654329651e-07, "Finetune/Loss": 0.4907895028591156, "Finetune/Loss (Raw)": 0.4310652017593384, "Finetune/Step": 743, "Finetune/Step Time": 8.212867241352797} {"Finetune/Learning Rate": 1.225615304378591e-07, "Finetune/Loss": 0.49347764253616333, "Finetune/Loss (Raw)": 0.41793113946914673, "Finetune/Step": 744, "Finetune/Step Time": 8.212531451135874} {"Finetune/Learning Rate": 1.2080284841829801e-07, "Finetune/Loss": 0.49908971786499023, "Finetune/Loss (Raw)": 0.503696620464325, "Finetune/Step": 745, "Finetune/Step Time": 8.217588152736425} {"Finetune/Learning Rate": 1.1905606428427773e-07, "Finetune/Loss": 0.49321845173835754, "Finetune/Loss (Raw)": 0.2830231189727783, "Finetune/Step": 746, "Finetune/Step Time": 8.215429270640016} {"Finetune/Learning Rate": 1.1732120167445247e-07, "Finetune/Loss": 0.4976850152015686, "Finetune/Loss (Raw)": 0.48896074295043945, "Finetune/Step": 747, "Finetune/Step Time": 8.215041188523173} {"Finetune/Learning Rate": 1.1559828406614713e-07, "Finetune/Loss": 0.4932042956352234, "Finetune/Loss (Raw)": 0.4978407919406891, "Finetune/Step": 748, "Finetune/Step Time": 8.21543494425714} {"Finetune/Learning Rate": 1.1388733477503808e-07, "Finetune/Loss": 0.4896036684513092, "Finetune/Loss (Raw)": 0.4083055257797241, "Finetune/Step": 749, "Finetune/Step Time": 8.219939282163978} {"Finetune/Learning Rate": 1.1218837695483851e-07, "Finetune/Loss": 0.49589434266090393, "Finetune/Loss (Raw)": 0.577711284160614, "Finetune/Step": 750, "Finetune/Step Time": 8.221815794706345} {"Finetune/Learning Rate": 1.105014335969855e-07, "Finetune/Loss": 0.49687695503234863, "Finetune/Loss (Raw)": 0.5613255500793457, "Finetune/Step": 751, "Finetune/Step Time": 8.223054522648454} {"Finetune/Learning Rate": 1.0882652753032795e-07, "Finetune/Loss": 0.49773502349853516, "Finetune/Loss (Raw)": 0.4881671667098999, "Finetune/Step": 752, "Finetune/Step Time": 8.217142593115568} {"Finetune/Learning Rate": 1.07163681420818e-07, "Finetune/Loss": 0.49794110655784607, "Finetune/Loss (Raw)": 0.5237871408462524, "Finetune/Step": 753, "Finetune/Step Time": 8.212412666529417} {"Finetune/Learning Rate": 1.0551291777120463e-07, "Finetune/Loss": 0.5024509429931641, "Finetune/Loss (Raw)": 0.5691612958908081, "Finetune/Step": 754, "Finetune/Step Time": 8.220906063914299} {"Finetune/Learning Rate": 1.0387425892072832e-07, "Finetune/Loss": 0.5035966634750366, "Finetune/Loss (Raw)": 0.5096509456634521, "Finetune/Step": 755, "Finetune/Step Time": 8.236627619713545} {"Finetune/Learning Rate": 1.0224772704482032e-07, "Finetune/Loss": 0.5091097950935364, "Finetune/Loss (Raw)": 0.5640504360198975, "Finetune/Step": 756, "Finetune/Step Time": 8.234491929411888} {"Finetune/Learning Rate": 1.0063334415480051e-07, "Finetune/Loss": 0.5157208442687988, "Finetune/Loss (Raw)": 0.6666486263275146, "Finetune/Step": 757, "Finetune/Step Time": 8.247724778950214} {"Finetune/Learning Rate": 9.903113209758096e-08, "Finetune/Loss": 0.5117827653884888, "Finetune/Loss (Raw)": 0.3677274286746979, "Finetune/Step": 758, "Finetune/Step Time": 8.253811245784163} {"Finetune/Learning Rate": 9.744111255537002e-08, "Finetune/Loss": 0.5085450410842896, "Finetune/Loss (Raw)": 0.5034877061843872, "Finetune/Step": 759, "Finetune/Step Time": 8.255410438403487} {"Finetune/Learning Rate": 9.586330704537848e-08, "Finetune/Loss": 0.5017160177230835, "Finetune/Loss (Raw)": 0.5204882621765137, "Finetune/Step": 760, "Finetune/Step Time": 8.256172649562359} {"Finetune/Learning Rate": 9.429773691952858e-08, "Finetune/Loss": 0.49787014722824097, "Finetune/Loss (Raw)": 0.44937485456466675, "Finetune/Step": 761, "Finetune/Step Time": 8.270900294184685} {"Finetune/Learning Rate": 9.274442336416565e-08, "Finetune/Loss": 0.4950363039970398, "Finetune/Loss (Raw)": 0.35907799005508423, "Finetune/Step": 762, "Finetune/Step Time": 8.266749523580074} {"Finetune/Learning Rate": 9.120338739977029e-08, "Finetune/Loss": 0.4944266080856323, "Finetune/Loss (Raw)": 0.33661672472953796, "Finetune/Step": 763, "Finetune/Step Time": 8.265392046421766} {"Finetune/Learning Rate": 8.967464988067475e-08, "Finetune/Loss": 0.4885804057121277, "Finetune/Loss (Raw)": 0.4085506796836853, "Finetune/Step": 764, "Finetune/Step Time": 8.267804631963372} {"Finetune/Learning Rate": 8.815823149478075e-08, "Finetune/Loss": 0.4792185127735138, "Finetune/Loss (Raw)": 0.2873886227607727, "Finetune/Step": 765, "Finetune/Step Time": 8.269289579242468} {"Finetune/Learning Rate": 8.66541527632787e-08, "Finetune/Loss": 0.4813975691795349, "Finetune/Loss (Raw)": 0.5947256684303284, "Finetune/Step": 766, "Finetune/Step Time": 8.253943908959627} {"Finetune/Learning Rate": 8.51624340403707e-08, "Finetune/Loss": 0.48074930906295776, "Finetune/Loss (Raw)": 0.37086743116378784, "Finetune/Step": 767, "Finetune/Step Time": 8.255700269713998} {"Finetune/Learning Rate": 8.368309551299535e-08, "Finetune/Loss": 0.47662127017974854, "Finetune/Loss (Raw)": 0.4226193130016327, "Finetune/Step": 768, "Finetune/Step Time": 8.247733164578676} {"Finetune/Learning Rate": 8.221615720055353e-08, "Finetune/Loss": 0.4818105697631836, "Finetune/Loss (Raw)": 0.5952619314193726, "Finetune/Step": 769, "Finetune/Step Time": 8.251916317269206} {"Finetune/Learning Rate": 8.076163895463861e-08, "Finetune/Loss": 0.48248231410980225, "Finetune/Loss (Raw)": 0.3899666965007782, "Finetune/Step": 770, "Finetune/Step Time": 8.259624043479562} {"Finetune/Learning Rate": 7.931956045876687e-08, "Finetune/Loss": 0.48141276836395264, "Finetune/Loss (Raw)": 0.5073209404945374, "Finetune/Step": 771, "Finetune/Step Time": 8.263192655518651} {"Finetune/Learning Rate": 7.788994122811177e-08, "Finetune/Loss": 0.48107093572616577, "Finetune/Loss (Raw)": 0.5262089967727661, "Finetune/Step": 772, "Finetune/Step Time": 8.262796465307474} {"Finetune/Learning Rate": 7.647280060923966e-08, "Finetune/Loss": 0.4743120074272156, "Finetune/Loss (Raw)": 0.5836449265480042, "Finetune/Step": 773, "Finetune/Step Time": 8.269398057833314} {"Finetune/Learning Rate": 7.506815777984788e-08, "Finetune/Loss": 0.4736061096191406, "Finetune/Loss (Raw)": 0.44074195623397827, "Finetune/Step": 774, "Finetune/Step Time": 8.254377817735076} {"Finetune/Learning Rate": 7.367603174850501e-08, "Finetune/Loss": 0.47860604524612427, "Finetune/Loss (Raw)": 0.5910627245903015, "Finetune/Step": 775, "Finetune/Step Time": 8.262244675308466} {"Finetune/Learning Rate": 7.229644135439472e-08, "Finetune/Loss": 0.48229843378067017, "Finetune/Loss (Raw)": 0.5360870361328125, "Finetune/Step": 776, "Finetune/Step Time": 8.260060373693705} {"Finetune/Learning Rate": 7.092940526705926e-08, "Finetune/Loss": 0.4831291735172272, "Finetune/Loss (Raw)": 0.5302805304527283, "Finetune/Step": 777, "Finetune/Step Time": 8.250195370987058} {"Finetune/Learning Rate": 6.957494198614777e-08, "Finetune/Loss": 0.487271785736084, "Finetune/Loss (Raw)": 0.41558730602264404, "Finetune/Step": 778, "Finetune/Step Time": 8.247723925858736} {"Finetune/Learning Rate": 6.823306984116595e-08, "Finetune/Loss": 0.49356168508529663, "Finetune/Loss (Raw)": 0.6902366876602173, "Finetune/Step": 779, "Finetune/Step Time": 8.248097939416766} {"Finetune/Learning Rate": 6.690380699122767e-08, "Finetune/Loss": 0.4928348660469055, "Finetune/Loss (Raw)": 0.474582701921463, "Finetune/Step": 780, "Finetune/Step Time": 8.244429910555482} {"Finetune/Learning Rate": 6.558717142480918e-08, "Finetune/Loss": 0.4950956702232361, "Finetune/Loss (Raw)": 0.48065149784088135, "Finetune/Step": 781, "Finetune/Step Time": 8.241180181503296} {"Finetune/Learning Rate": 6.428318095950647e-08, "Finetune/Loss": 0.48972517251968384, "Finetune/Loss (Raw)": 0.4058552384376526, "Finetune/Step": 782, "Finetune/Step Time": 8.245320454239845} {"Finetune/Learning Rate": 6.299185324179268e-08, "Finetune/Loss": 0.4839443862438202, "Finetune/Loss (Raw)": 0.3763408362865448, "Finetune/Step": 783, "Finetune/Step Time": 8.247568564489484} {"Finetune/Learning Rate": 6.171320574678062e-08, "Finetune/Loss": 0.48245924711227417, "Finetune/Loss (Raw)": 0.4406425952911377, "Finetune/Step": 784, "Finetune/Step Time": 8.245103461667895} {"Finetune/Learning Rate": 6.044725577798615e-08, "Finetune/Loss": 0.481707364320755, "Finetune/Loss (Raw)": 0.49972671270370483, "Finetune/Step": 785, "Finetune/Step Time": 8.244635237380862} {"Finetune/Learning Rate": 5.919402046709288e-08, "Finetune/Loss": 0.47635191679000854, "Finetune/Loss (Raw)": 0.3977867364883423, "Finetune/Step": 786, "Finetune/Step Time": 8.244947239756584} {"Finetune/Learning Rate": 5.7953516773721956e-08, "Finetune/Loss": 0.4792554974555969, "Finetune/Loss (Raw)": 0.6025664806365967, "Finetune/Step": 787, "Finetune/Step Time": 8.242482133209705} {"Finetune/Learning Rate": 5.6725761485201365e-08, "Finetune/Loss": 0.4774760603904724, "Finetune/Loss (Raw)": 0.5071084499359131, "Finetune/Step": 788, "Finetune/Step Time": 8.243132079020143} {"Finetune/Learning Rate": 5.5510771216338736e-08, "Finetune/Loss": 0.47247204184532166, "Finetune/Loss (Raw)": 0.5065193176269531, "Finetune/Step": 789, "Finetune/Step Time": 8.230287224054337} {"Finetune/Learning Rate": 5.430856240919779e-08, "Finetune/Loss": 0.4740738272666931, "Finetune/Loss (Raw)": 0.41898512840270996, "Finetune/Step": 790, "Finetune/Step Time": 8.22934740409255} {"Finetune/Learning Rate": 5.311915133287415e-08, "Finetune/Loss": 0.47169122099876404, "Finetune/Loss (Raw)": 0.42724430561065674, "Finetune/Step": 791, "Finetune/Step Time": 8.237079517915845} {"Finetune/Learning Rate": 5.194255408327619e-08, "Finetune/Loss": 0.4762084484100342, "Finetune/Loss (Raw)": 0.6650394201278687, "Finetune/Step": 792, "Finetune/Step Time": 8.241331798955798} {"Finetune/Learning Rate": 5.077878658290724e-08, "Finetune/Loss": 0.4776965379714966, "Finetune/Loss (Raw)": 0.4969936013221741, "Finetune/Step": 793, "Finetune/Step Time": 8.227530313655734} {"Finetune/Learning Rate": 4.962786458064972e-08, "Finetune/Loss": 0.4771706461906433, "Finetune/Loss (Raw)": 0.3422502279281616, "Finetune/Step": 794, "Finetune/Step Time": 8.227124504745007} {"Finetune/Learning Rate": 4.848980365155175e-08, "Finetune/Loss": 0.49215662479400635, "Finetune/Loss (Raw)": 0.8161677122116089, "Finetune/Step": 795, "Finetune/Step Time": 8.217270413413644} {"Finetune/Learning Rate": 4.736461919661749e-08, "Finetune/Loss": 0.49389907717704773, "Finetune/Loss (Raw)": 0.4643082618713379, "Finetune/Step": 796, "Finetune/Step Time": 8.213214000687003} {"Finetune/Learning Rate": 4.625232644259758e-08, "Finetune/Loss": 0.5091369152069092, "Finetune/Loss (Raw)": 0.7750016450881958, "Finetune/Step": 797, "Finetune/Step Time": 8.210380885750055} {"Finetune/Learning Rate": 4.51529404417833e-08, "Finetune/Loss": 0.504656970500946, "Finetune/Loss (Raw)": 0.45136523246765137, "Finetune/Step": 798, "Finetune/Step Time": 8.208243865519762} {"Finetune/Learning Rate": 4.40664760718038e-08, "Finetune/Loss": 0.5089479088783264, "Finetune/Loss (Raw)": 0.5081787109375, "Finetune/Step": 799, "Finetune/Step Time": 8.210927534848452} {"Finetune/Learning Rate": 4.2992948035423305e-08, "Finetune/Loss": 0.509466290473938, "Finetune/Loss (Raw)": 0.43920695781707764, "Finetune/Step": 800, "Finetune/Step Time": 8.212385876104236} {"Finetune/Learning Rate": 4.1932370860343514e-08, "Finetune/Loss": 0.502199649810791, "Finetune/Loss (Raw)": 0.36272865533828735, "Finetune/Step": 801, "Finetune/Step Time": 8.217161988839507} {"Finetune/Learning Rate": 4.0884758899006e-08, "Finetune/Loss": 0.50467848777771, "Finetune/Loss (Raw)": 0.46928954124450684, "Finetune/Step": 802, "Finetune/Step Time": 8.216899391263723} {"Finetune/Learning Rate": 3.985012632839824e-08, "Finetune/Loss": 0.5081347823143005, "Finetune/Loss (Raw)": 0.6179227828979492, "Finetune/Step": 803, "Finetune/Step Time": 8.216463051736355} {"Finetune/Learning Rate": 3.8828487149862424e-08, "Finetune/Loss": 0.5068284273147583, "Finetune/Loss (Raw)": 0.48440444469451904, "Finetune/Step": 804, "Finetune/Step Time": 8.220568653196096} {"Finetune/Learning Rate": 3.781985518890496e-08, "Finetune/Loss": 0.5069479942321777, "Finetune/Loss (Raw)": 0.5874717831611633, "Finetune/Step": 805, "Finetune/Step Time": 8.208791675046086} {"Finetune/Learning Rate": 3.682424409501006e-08, "Finetune/Loss": 0.5098456144332886, "Finetune/Loss (Raw)": 0.5334672927856445, "Finetune/Step": 806, "Finetune/Step Time": 8.20798677764833} {"Finetune/Learning Rate": 3.5841667341454883e-08, "Finetune/Loss": 0.5063552260398865, "Finetune/Loss (Raw)": 0.47936832904815674, "Finetune/Step": 807, "Finetune/Step Time": 8.208364345133305} {"Finetune/Learning Rate": 3.487213822512714e-08, "Finetune/Loss": 0.5043436288833618, "Finetune/Loss (Raw)": 0.47171616554260254, "Finetune/Step": 808, "Finetune/Step Time": 8.213120451197028} {"Finetune/Learning Rate": 3.391566986634486e-08, "Finetune/Loss": 0.502490222454071, "Finetune/Loss (Raw)": 0.4709722101688385, "Finetune/Step": 809, "Finetune/Step Time": 8.206962391734123} {"Finetune/Learning Rate": 3.297227520867962e-08, "Finetune/Loss": 0.5043805241584778, "Finetune/Loss (Raw)": 0.47607699036598206, "Finetune/Step": 810, "Finetune/Step Time": 8.209227494895458} {"Finetune/Learning Rate": 3.20419670187807e-08, "Finetune/Loss": 0.4970998764038086, "Finetune/Loss (Raw)": 0.45725536346435547, "Finetune/Step": 811, "Finetune/Step Time": 8.205937091261148} {"Finetune/Learning Rate": 3.112475788620217e-08, "Finetune/Loss": 0.49190783500671387, "Finetune/Loss (Raw)": 0.3084378242492676, "Finetune/Step": 812, "Finetune/Step Time": 8.2154181599617} {"Finetune/Learning Rate": 3.022066022323355e-08, "Finetune/Loss": 0.4914732575416565, "Finetune/Loss (Raw)": 0.46674492955207825, "Finetune/Step": 813, "Finetune/Step Time": 8.213634008541703} {"Finetune/Learning Rate": 2.9329686264730646e-08, "Finetune/Loss": 0.4934089183807373, "Finetune/Loss (Raw)": 0.4677963852882385, "Finetune/Step": 814, "Finetune/Step Time": 8.213402595371008} {"Finetune/Learning Rate": 2.8451848067950535e-08, "Finetune/Loss": 0.4978242814540863, "Finetune/Loss (Raw)": 0.5176327228546143, "Finetune/Step": 815, "Finetune/Step Time": 8.215341698378325} {"Finetune/Learning Rate": 2.7587157512388714e-08, "Finetune/Loss": 0.5041627883911133, "Finetune/Loss (Raw)": 0.6434741020202637, "Finetune/Step": 816, "Finetune/Step Time": 8.216733621433377} {"Finetune/Learning Rate": 2.6735626299617452e-08, "Finetune/Loss": 0.5049294233322144, "Finetune/Loss (Raw)": 0.5242598056793213, "Finetune/Step": 817, "Finetune/Step Time": 8.212694542482495} {"Finetune/Learning Rate": 2.5897265953128577e-08, "Finetune/Loss": 0.5147011280059814, "Finetune/Loss (Raw)": 0.7104817628860474, "Finetune/Step": 818, "Finetune/Step Time": 8.212837345898151} {"Finetune/Learning Rate": 2.507208781817638e-08, "Finetune/Loss": 0.5143786668777466, "Finetune/Loss (Raw)": 0.5922492146492004, "Finetune/Step": 819, "Finetune/Step Time": 8.204259388148785} {"Finetune/Learning Rate": 2.426010306162485e-08, "Finetune/Loss": 0.5073811411857605, "Finetune/Loss (Raw)": 0.2831851840019226, "Finetune/Step": 820, "Finetune/Step Time": 8.206302342936397} {"Finetune/Learning Rate": 2.3461322671796456e-08, "Finetune/Loss": 0.507904589176178, "Finetune/Loss (Raw)": 0.523269772529602, "Finetune/Step": 821, "Finetune/Step Time": 8.19890115968883} {"Finetune/Learning Rate": 2.2675757458323065e-08, "Finetune/Loss": 0.511327862739563, "Finetune/Loss (Raw)": 0.528531551361084, "Finetune/Step": 822, "Finetune/Step Time": 8.200744863599539} {"Finetune/Learning Rate": 2.190341805199991e-08, "Finetune/Loss": 0.5196588635444641, "Finetune/Loss (Raw)": 0.6938350200653076, "Finetune/Step": 823, "Finetune/Step Time": 8.19958864338696} {"Finetune/Learning Rate": 2.114431490464219e-08, "Finetune/Loss": 0.5080147981643677, "Finetune/Loss (Raw)": 0.29242947697639465, "Finetune/Step": 824, "Finetune/Step Time": 8.202224487438798} {"Finetune/Learning Rate": 2.039845828894249e-08, "Finetune/Loss": 0.502947211265564, "Finetune/Loss (Raw)": 0.33483099937438965, "Finetune/Step": 825, "Finetune/Step Time": 8.21018029563129} {"Finetune/Learning Rate": 1.9665858298333004e-08, "Finetune/Loss": 0.5109093189239502, "Finetune/Loss (Raw)": 0.5970368385314941, "Finetune/Step": 826, "Finetune/Step Time": 8.201501125469804} {"Finetune/Learning Rate": 1.8946524846848e-08, "Finetune/Loss": 0.4991220235824585, "Finetune/Loss (Raw)": 0.4389733672142029, "Finetune/Step": 827, "Finetune/Step Time": 8.205599384382367} {"Finetune/Learning Rate": 1.8240467668990456e-08, "Finetune/Loss": 0.5032386779785156, "Finetune/Loss (Raw)": 0.5960429310798645, "Finetune/Step": 828, "Finetune/Step Time": 8.208264589309692} {"Finetune/Learning Rate": 1.7547696319599294e-08, "Finetune/Loss": 0.49100613594055176, "Finetune/Loss (Raw)": 0.3835597634315491, "Finetune/Step": 829, "Finetune/Step Time": 8.211081329733133} {"Finetune/Learning Rate": 1.686822017372147e-08, "Finetune/Loss": 0.4921236038208008, "Finetune/Loss (Raw)": 0.48712342977523804, "Finetune/Step": 830, "Finetune/Step Time": 8.2047089766711} {"Finetune/Learning Rate": 1.620204842648365e-08, "Finetune/Loss": 0.4886814057826996, "Finetune/Loss (Raw)": 0.3980288505554199, "Finetune/Step": 831, "Finetune/Step Time": 8.207793213427067} {"Finetune/Learning Rate": 1.5549190092968735e-08, "Finetune/Loss": 0.4875599443912506, "Finetune/Loss (Raw)": 0.40332090854644775, "Finetune/Step": 832, "Finetune/Step Time": 8.209062557667494} {"Finetune/Learning Rate": 1.4909654008093742e-08, "Finetune/Loss": 0.48746457695961, "Finetune/Loss (Raw)": 0.3596762716770172, "Finetune/Step": 833, "Finetune/Step Time": 8.203022502362728} {"Finetune/Learning Rate": 1.4283448826489796e-08, "Finetune/Loss": 0.4879339933395386, "Finetune/Loss (Raw)": 0.48431211709976196, "Finetune/Step": 834, "Finetune/Step Time": 8.203666182234883} {"Finetune/Learning Rate": 1.3670583022385329e-08, "Finetune/Loss": 0.4837394952774048, "Finetune/Loss (Raw)": 0.48369771242141724, "Finetune/Step": 835, "Finetune/Step Time": 8.206923166289926} {"Finetune/Learning Rate": 1.3071064889491723e-08, "Finetune/Loss": 0.48631855845451355, "Finetune/Loss (Raw)": 0.5669344663619995, "Finetune/Step": 836, "Finetune/Step Time": 8.208121195435524} {"Finetune/Learning Rate": 1.2484902540890075e-08, "Finetune/Loss": 0.48332542181015015, "Finetune/Loss (Raw)": 0.4916912913322449, "Finetune/Step": 837, "Finetune/Step Time": 8.206490514799953} {"Finetune/Learning Rate": 1.1912103908922944e-08, "Finetune/Loss": 0.48043906688690186, "Finetune/Loss (Raw)": 0.4411047101020813, "Finetune/Step": 838, "Finetune/Step Time": 8.204540455713868} {"Finetune/Learning Rate": 1.1352676745085e-08, "Finetune/Loss": 0.48118340969085693, "Finetune/Loss (Raw)": 0.503186821937561, "Finetune/Step": 839, "Finetune/Step Time": 8.207894694060087} {"Finetune/Learning Rate": 1.0806628619920322e-08, "Finetune/Loss": 0.482453316450119, "Finetune/Loss (Raw)": 0.512352705001831, "Finetune/Step": 840, "Finetune/Step Time": 8.206949688494205} {"Finetune/Learning Rate": 1.0273966922918153e-08, "Finetune/Loss": 0.48803848028182983, "Finetune/Loss (Raw)": 0.6496974229812622, "Finetune/Step": 841, "Finetune/Step Time": 8.205636203289032} {"Finetune/Learning Rate": 9.754698862413757e-09, "Finetune/Loss": 0.4869323968887329, "Finetune/Loss (Raw)": 0.4406835436820984, "Finetune/Step": 842, "Finetune/Step Time": 8.221349835395813} {"Finetune/Learning Rate": 9.248831465491047e-09, "Finetune/Loss": 0.49189233779907227, "Finetune/Loss (Raw)": 0.6159725189208984, "Finetune/Step": 843, "Finetune/Step Time": 8.221531035378575} {"Finetune/Learning Rate": 8.75637157788689e-09, "Finetune/Loss": 0.5004274845123291, "Finetune/Loss (Raw)": 0.5815622806549072, "Finetune/Step": 844, "Finetune/Step Time": 8.236955197528005} {"Finetune/Learning Rate": 8.27732586389851e-09, "Finetune/Loss": 0.5022778511047363, "Finetune/Loss (Raw)": 0.525958240032196, "Finetune/Step": 845, "Finetune/Step Time": 8.2403548322618} {"Finetune/Learning Rate": 7.81170080629412e-09, "Finetune/Loss": 0.5115762948989868, "Finetune/Loss (Raw)": 0.7653457522392273, "Finetune/Step": 846, "Finetune/Step Time": 8.241246884688735} {"Finetune/Learning Rate": 7.359502706224096e-09, "Finetune/Loss": 0.5119650363922119, "Finetune/Loss (Raw)": 0.5300738215446472, "Finetune/Step": 847, "Finetune/Step Time": 8.238796254619956} {"Finetune/Learning Rate": 6.9207376831366125e-09, "Finetune/Loss": 0.5097517967224121, "Finetune/Loss (Raw)": 0.5726501941680908, "Finetune/Step": 848, "Finetune/Step Time": 8.248000988736749} {"Finetune/Learning Rate": 6.495411674694029e-09, "Finetune/Loss": 0.5022613406181335, "Finetune/Loss (Raw)": 0.28456467390060425, "Finetune/Step": 849, "Finetune/Step Time": 8.246418733149767} {"Finetune/Learning Rate": 6.083530436693407e-09, "Finetune/Loss": 0.49839070439338684, "Finetune/Loss (Raw)": 0.5866209268569946, "Finetune/Step": 850, "Finetune/Step Time": 8.238309381529689} {"Finetune/Learning Rate": 5.68509954298757e-09, "Finetune/Loss": 0.49805939197540283, "Finetune/Loss (Raw)": 0.5816481709480286, "Finetune/Step": 851, "Finetune/Step Time": 8.236817333847284} {"Finetune/Learning Rate": 5.300124385410942e-09, "Finetune/Loss": 0.5076366662979126, "Finetune/Loss (Raw)": 0.5896576046943665, "Finetune/Step": 852, "Finetune/Step Time": 8.233460307121277} {"Finetune/Learning Rate": 4.928610173705494e-09, "Finetune/Loss": 0.5057846307754517, "Finetune/Loss (Raw)": 0.4640045166015625, "Finetune/Step": 853, "Finetune/Step Time": 8.2276072204113} {"Finetune/Learning Rate": 4.570561935450467e-09, "Finetune/Loss": 0.5051233768463135, "Finetune/Loss (Raw)": 0.5073712468147278, "Finetune/Step": 854, "Finetune/Step Time": 8.23331324569881} {"Finetune/Learning Rate": 4.225984515995096e-09, "Finetune/Loss": 0.5017882585525513, "Finetune/Loss (Raw)": 0.5871099233627319, "Finetune/Step": 855, "Finetune/Step Time": 8.23470215126872} {"Finetune/Learning Rate": 3.894882578391878e-09, "Finetune/Loss": 0.5075423121452332, "Finetune/Loss (Raw)": 0.47655946016311646, "Finetune/Step": 856, "Finetune/Step Time": 8.231591129675508} {"Finetune/Learning Rate": 3.57726060333452e-09, "Finetune/Loss": 0.5144922137260437, "Finetune/Loss (Raw)": 0.5572287440299988, "Finetune/Step": 857, "Finetune/Step Time": 8.220938524231315} {"Finetune/Learning Rate": 3.2731228890965358e-09, "Finetune/Loss": 0.5067514181137085, "Finetune/Loss (Raw)": 0.3493308424949646, "Finetune/Step": 858, "Finetune/Step Time": 8.234756043180823} {"Finetune/Learning Rate": 2.982473551473297e-09, "Finetune/Loss": 0.508776843547821, "Finetune/Loss (Raw)": 0.5037867426872253, "Finetune/Step": 859, "Finetune/Step Time": 8.241670435294509} {"Finetune/Learning Rate": 2.705316523726853e-09, "Finetune/Loss": 0.5000834465026855, "Finetune/Loss (Raw)": 0.31785324215888977, "Finetune/Step": 860, "Finetune/Step Time": 8.242638491094112} {"Finetune/Learning Rate": 2.441655556531863e-09, "Finetune/Loss": 0.5021644830703735, "Finetune/Loss (Raw)": 0.45015543699264526, "Finetune/Step": 861, "Finetune/Step Time": 8.244946891441941} {"Finetune/Learning Rate": 2.191494217925305e-09, "Finetune/Loss": 0.5039900541305542, "Finetune/Loss (Raw)": 0.5455400943756104, "Finetune/Step": 862, "Finetune/Step Time": 8.24387489259243} {"Finetune/Learning Rate": 1.9548358932582888e-09, "Finetune/Loss": 0.5039212107658386, "Finetune/Loss (Raw)": 0.39582568407058716, "Finetune/Step": 863, "Finetune/Step Time": 8.246979039162397} {"Finetune/Learning Rate": 1.7316837851499844e-09, "Finetune/Loss": 0.5074023008346558, "Finetune/Loss (Raw)": 0.5147161483764648, "Finetune/Step": 864, "Finetune/Step Time": 8.261756161227822} {"Finetune/Learning Rate": 1.5220409134444334e-09, "Finetune/Loss": 0.510027289390564, "Finetune/Loss (Raw)": 0.44367504119873047, "Finetune/Step": 865, "Finetune/Step Time": 8.258302018046379} {"Finetune/Learning Rate": 1.3259101151694707e-09, "Finetune/Loss": 0.5068385004997253, "Finetune/Loss (Raw)": 0.38227301836013794, "Finetune/Step": 866, "Finetune/Step Time": 8.25982991605997} {"Finetune/Learning Rate": 1.1432940444987548e-09, "Finetune/Loss": 0.5092265605926514, "Finetune/Loss (Raw)": 0.5601142048835754, "Finetune/Step": 867, "Finetune/Step Time": 8.2656554505229} {"Finetune/Learning Rate": 9.74195172715242e-10, "Finetune/Loss": 0.5084606409072876, "Finetune/Loss (Raw)": 0.5424255132675171, "Finetune/Step": 868, "Finetune/Step Time": 8.259043153375387} {"Finetune/Learning Rate": 8.186157881784339e-10, "Finetune/Loss": 0.5069960951805115, "Finetune/Loss (Raw)": 0.44482582807540894, "Finetune/Step": 869, "Finetune/Step Time": 8.264174614101648} {"Finetune/Learning Rate": 6.765579962928481e-10, "Finetune/Loss": 0.5092530250549316, "Finetune/Loss (Raw)": 0.5133262872695923, "Finetune/Step": 870, "Finetune/Step Time": 8.261784477159381} {"Finetune/Learning Rate": 5.480237194799287e-10, "Finetune/Loss": 0.5082311630249023, "Finetune/Loss (Raw)": 0.4704878032207489, "Finetune/Step": 871, "Finetune/Step Time": 8.265619702637196} {"Finetune/Learning Rate": 4.330146971515125e-10, "Finetune/Loss": 0.50864577293396, "Finetune/Loss (Raw)": 0.5256202816963196, "Finetune/Step": 872, "Finetune/Step Time": 8.26339827477932} {"Finetune/Learning Rate": 3.3153248568695835e-10, "Finetune/Loss": 0.5070329904556274, "Finetune/Loss (Raw)": 0.5980875492095947, "Finetune/Step": 873, "Finetune/Step Time": 8.25958744995296} {"Finetune/Learning Rate": 2.4357845841149746e-10, "Finetune/Loss": 0.5068725347518921, "Finetune/Loss (Raw)": 0.43555015325546265, "Finetune/Step": 874, "Finetune/Step Time": 8.260683357715607} {"Finetune/Learning Rate": 1.691538055782482e-10, "Finetune/Loss": 0.4972653090953827, "Finetune/Loss (Raw)": 0.3085401654243469, "Finetune/Step": 875, "Finetune/Step Time": 8.263432033360004} {"Finetune/Learning Rate": 1.0825953435122937e-10, "Finetune/Loss": 0.4937065541744232, "Finetune/Loss (Raw)": 0.46768277883529663, "Finetune/Step": 876, "Finetune/Step Time": 8.261020194739103} {"Finetune/Learning Rate": 6.089646879281485e-11, "Finetune/Loss": 0.49946922063827515, "Finetune/Loss (Raw)": 0.7103620171546936, "Finetune/Step": 877, "Finetune/Step Time": 8.266378350555897} {"Finetune/Learning Rate": 2.706524985174319e-11, "Finetune/Loss": 0.4926163852214813, "Finetune/Loss (Raw)": 0.5460571646690369, "Finetune/Step": 878, "Finetune/Step Time": 8.269975000992417} {"Finetune/Learning Rate": 6.766335354568831e-12, "Finetune/Loss": 0.4914758503437042, "Finetune/Loss (Raw)": 0.4935757517814636, "Finetune/Step": 879, "Finetune/Step Time": 8.270850433036685} {"Finetune/Learning Rate": 0.0, "Finetune/Loss": 0.4937971234321594, "Finetune/Loss (Raw)": 0.6469314098358154, "Finetune/Step": 880, "Finetune/Step Time": 8.277488490566611}