{ "best_metric": null, "best_model_checkpoint": null, "epoch": 2.8823843082998257, "global_step": 200000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 1.9999956764235376e-05, "loss": 1.0119, "step": 10 }, { "epoch": 0.0, "learning_rate": 1.9999908724496906e-05, "loss": 0.5547, "step": 20 }, { "epoch": 0.0, "learning_rate": 1.9999860684758435e-05, "loss": 0.4887, "step": 30 }, { "epoch": 0.0, "learning_rate": 1.9999812645019964e-05, "loss": 0.4381, "step": 40 }, { "epoch": 0.0, "learning_rate": 1.999976460528149e-05, "loss": 0.374, "step": 50 }, { "epoch": 0.0, "learning_rate": 1.999971656554302e-05, "loss": 0.3704, "step": 60 }, { "epoch": 0.0, "learning_rate": 1.999966852580455e-05, "loss": 0.3445, "step": 70 }, { "epoch": 0.0, "learning_rate": 1.9999620486066074e-05, "loss": 0.3367, "step": 80 }, { "epoch": 0.0, "learning_rate": 1.9999572446327604e-05, "loss": 0.328, "step": 90 }, { "epoch": 0.0, "learning_rate": 1.9999524406589133e-05, "loss": 0.3112, "step": 100 }, { "epoch": 0.0, "learning_rate": 1.9999476366850662e-05, "loss": 0.294, "step": 110 }, { "epoch": 0.0, "learning_rate": 1.9999428327112188e-05, "loss": 0.279, "step": 120 }, { "epoch": 0.0, "learning_rate": 1.9999380287373717e-05, "loss": 0.2838, "step": 130 }, { "epoch": 0.0, "learning_rate": 1.9999332247635247e-05, "loss": 0.279, "step": 140 }, { "epoch": 0.0, "learning_rate": 1.9999284207896773e-05, "loss": 0.2581, "step": 150 }, { "epoch": 0.0, "learning_rate": 1.9999236168158302e-05, "loss": 0.2651, "step": 160 }, { "epoch": 0.0, "learning_rate": 1.999918812841983e-05, "loss": 0.2498, "step": 170 }, { "epoch": 0.0, "learning_rate": 1.999914008868136e-05, "loss": 0.2378, "step": 180 }, { "epoch": 0.0, "learning_rate": 1.9999092048942886e-05, "loss": 0.237, "step": 190 }, { "epoch": 0.0, "learning_rate": 1.9999044009204415e-05, "loss": 0.2462, "step": 200 }, { "epoch": 0.0, "learning_rate": 1.9998995969465945e-05, "loss": 0.2412, "step": 210 }, { "epoch": 0.0, "learning_rate": 1.9998947929727474e-05, "loss": 0.2202, "step": 220 }, { "epoch": 0.0, "learning_rate": 1.9998899889989e-05, "loss": 0.2176, "step": 230 }, { "epoch": 0.0, "learning_rate": 1.999885185025053e-05, "loss": 0.2145, "step": 240 }, { "epoch": 0.0, "learning_rate": 1.999880381051206e-05, "loss": 0.1972, "step": 250 }, { "epoch": 0.0, "learning_rate": 1.9998755770773584e-05, "loss": 0.2118, "step": 260 }, { "epoch": 0.0, "learning_rate": 1.9998707731035114e-05, "loss": 0.2123, "step": 270 }, { "epoch": 0.0, "learning_rate": 1.9998659691296643e-05, "loss": 0.1982, "step": 280 }, { "epoch": 0.0, "learning_rate": 1.9998611651558172e-05, "loss": 0.2082, "step": 290 }, { "epoch": 0.0, "learning_rate": 1.9998563611819698e-05, "loss": 0.1963, "step": 300 }, { "epoch": 0.0, "learning_rate": 1.9998515572081227e-05, "loss": 0.177, "step": 310 }, { "epoch": 0.0, "learning_rate": 1.9998467532342757e-05, "loss": 0.1931, "step": 320 }, { "epoch": 0.0, "learning_rate": 1.9998419492604282e-05, "loss": 0.1811, "step": 330 }, { "epoch": 0.0, "learning_rate": 1.999837145286581e-05, "loss": 0.182, "step": 340 }, { "epoch": 0.01, "learning_rate": 1.999832341312734e-05, "loss": 0.1795, "step": 350 }, { "epoch": 0.01, "learning_rate": 1.999827537338887e-05, "loss": 0.1669, "step": 360 }, { "epoch": 0.01, "learning_rate": 1.9998227333650396e-05, "loss": 0.1752, "step": 370 }, { "epoch": 0.01, "learning_rate": 1.9998179293911925e-05, "loss": 0.182, "step": 380 }, { "epoch": 0.01, "learning_rate": 1.9998131254173455e-05, "loss": 0.1644, "step": 390 }, { "epoch": 0.01, "learning_rate": 1.9998083214434984e-05, "loss": 0.1659, "step": 400 }, { "epoch": 0.01, "learning_rate": 1.999803517469651e-05, "loss": 0.1618, "step": 410 }, { "epoch": 0.01, "learning_rate": 1.999798713495804e-05, "loss": 0.1606, "step": 420 }, { "epoch": 0.01, "learning_rate": 1.999793909521957e-05, "loss": 0.1658, "step": 430 }, { "epoch": 0.01, "learning_rate": 1.9997891055481094e-05, "loss": 0.1701, "step": 440 }, { "epoch": 0.01, "learning_rate": 1.9997843015742623e-05, "loss": 0.1586, "step": 450 }, { "epoch": 0.01, "learning_rate": 1.9997794976004153e-05, "loss": 0.1506, "step": 460 }, { "epoch": 0.01, "learning_rate": 1.9997746936265682e-05, "loss": 0.1644, "step": 470 }, { "epoch": 0.01, "learning_rate": 1.9997698896527208e-05, "loss": 0.1466, "step": 480 }, { "epoch": 0.01, "learning_rate": 1.9997650856788737e-05, "loss": 0.1512, "step": 490 }, { "epoch": 0.01, "learning_rate": 1.9997602817050266e-05, "loss": 0.1576, "step": 500 }, { "epoch": 0.01, "learning_rate": 1.9997554777311792e-05, "loss": 0.1502, "step": 510 }, { "epoch": 0.01, "learning_rate": 1.999750673757332e-05, "loss": 0.1619, "step": 520 }, { "epoch": 0.01, "learning_rate": 1.999745869783485e-05, "loss": 0.1455, "step": 530 }, { "epoch": 0.01, "learning_rate": 1.999741065809638e-05, "loss": 0.1399, "step": 540 }, { "epoch": 0.01, "learning_rate": 1.9997362618357906e-05, "loss": 0.1423, "step": 550 }, { "epoch": 0.01, "learning_rate": 1.9997314578619435e-05, "loss": 0.1413, "step": 560 }, { "epoch": 0.01, "learning_rate": 1.9997266538880965e-05, "loss": 0.149, "step": 570 }, { "epoch": 0.01, "learning_rate": 1.9997218499142494e-05, "loss": 0.1356, "step": 580 }, { "epoch": 0.01, "learning_rate": 1.999717045940402e-05, "loss": 0.141, "step": 590 }, { "epoch": 0.01, "learning_rate": 1.999712241966555e-05, "loss": 0.137, "step": 600 }, { "epoch": 0.01, "learning_rate": 1.9997074379927078e-05, "loss": 0.142, "step": 610 }, { "epoch": 0.01, "learning_rate": 1.9997026340188604e-05, "loss": 0.1388, "step": 620 }, { "epoch": 0.01, "learning_rate": 1.9996978300450133e-05, "loss": 0.1413, "step": 630 }, { "epoch": 0.01, "learning_rate": 1.9996930260711663e-05, "loss": 0.1419, "step": 640 }, { "epoch": 0.01, "learning_rate": 1.9996882220973192e-05, "loss": 0.1461, "step": 650 }, { "epoch": 0.01, "learning_rate": 1.9996834181234718e-05, "loss": 0.1357, "step": 660 }, { "epoch": 0.01, "learning_rate": 1.9996786141496247e-05, "loss": 0.1354, "step": 670 }, { "epoch": 0.01, "learning_rate": 1.9996738101757776e-05, "loss": 0.1363, "step": 680 }, { "epoch": 0.01, "learning_rate": 1.9996690062019302e-05, "loss": 0.1374, "step": 690 }, { "epoch": 0.01, "learning_rate": 1.999664202228083e-05, "loss": 0.1385, "step": 700 }, { "epoch": 0.01, "learning_rate": 1.999659398254236e-05, "loss": 0.1491, "step": 710 }, { "epoch": 0.01, "learning_rate": 1.999654594280389e-05, "loss": 0.126, "step": 720 }, { "epoch": 0.01, "learning_rate": 1.9996497903065416e-05, "loss": 0.1295, "step": 730 }, { "epoch": 0.01, "learning_rate": 1.9996449863326945e-05, "loss": 0.1405, "step": 740 }, { "epoch": 0.01, "learning_rate": 1.9996401823588474e-05, "loss": 0.1267, "step": 750 }, { "epoch": 0.01, "learning_rate": 1.9996353783850004e-05, "loss": 0.1265, "step": 760 }, { "epoch": 0.01, "learning_rate": 1.999630574411153e-05, "loss": 0.121, "step": 770 }, { "epoch": 0.01, "learning_rate": 1.999625770437306e-05, "loss": 0.124, "step": 780 }, { "epoch": 0.01, "learning_rate": 1.9996209664634588e-05, "loss": 0.1277, "step": 790 }, { "epoch": 0.01, "learning_rate": 1.9996161624896114e-05, "loss": 0.1166, "step": 800 }, { "epoch": 0.01, "learning_rate": 1.9996113585157643e-05, "loss": 0.1203, "step": 810 }, { "epoch": 0.01, "learning_rate": 1.9996065545419173e-05, "loss": 0.1244, "step": 820 }, { "epoch": 0.01, "learning_rate": 1.9996017505680702e-05, "loss": 0.1293, "step": 830 }, { "epoch": 0.01, "learning_rate": 1.9995969465942228e-05, "loss": 0.1309, "step": 840 }, { "epoch": 0.01, "learning_rate": 1.9995921426203757e-05, "loss": 0.1197, "step": 850 }, { "epoch": 0.01, "learning_rate": 1.9995873386465286e-05, "loss": 0.131, "step": 860 }, { "epoch": 0.01, "learning_rate": 1.9995825346726812e-05, "loss": 0.133, "step": 870 }, { "epoch": 0.01, "learning_rate": 1.999577730698834e-05, "loss": 0.114, "step": 880 }, { "epoch": 0.01, "learning_rate": 1.999572926724987e-05, "loss": 0.1241, "step": 890 }, { "epoch": 0.01, "learning_rate": 1.99956812275114e-05, "loss": 0.1213, "step": 900 }, { "epoch": 0.01, "learning_rate": 1.9995633187772926e-05, "loss": 0.1275, "step": 910 }, { "epoch": 0.01, "learning_rate": 1.9995585148034455e-05, "loss": 0.1218, "step": 920 }, { "epoch": 0.01, "learning_rate": 1.9995537108295984e-05, "loss": 0.1239, "step": 930 }, { "epoch": 0.01, "learning_rate": 1.9995489068557514e-05, "loss": 0.1247, "step": 940 }, { "epoch": 0.01, "learning_rate": 1.999544102881904e-05, "loss": 0.1091, "step": 950 }, { "epoch": 0.01, "learning_rate": 1.999539298908057e-05, "loss": 0.1174, "step": 960 }, { "epoch": 0.01, "learning_rate": 1.9995344949342098e-05, "loss": 0.1211, "step": 970 }, { "epoch": 0.01, "learning_rate": 1.9995296909603624e-05, "loss": 0.1151, "step": 980 }, { "epoch": 0.01, "learning_rate": 1.9995248869865153e-05, "loss": 0.1269, "step": 990 }, { "epoch": 0.01, "learning_rate": 1.9995200830126683e-05, "loss": 0.118, "step": 1000 }, { "epoch": 0.01, "learning_rate": 1.9995152790388212e-05, "loss": 0.116, "step": 1010 }, { "epoch": 0.01, "learning_rate": 1.9995104750649738e-05, "loss": 0.1079, "step": 1020 }, { "epoch": 0.01, "learning_rate": 1.9995056710911267e-05, "loss": 0.1105, "step": 1030 }, { "epoch": 0.01, "learning_rate": 1.9995008671172796e-05, "loss": 0.1084, "step": 1040 }, { "epoch": 0.02, "learning_rate": 1.9994960631434322e-05, "loss": 0.1122, "step": 1050 }, { "epoch": 0.02, "learning_rate": 1.999491259169585e-05, "loss": 0.1102, "step": 1060 }, { "epoch": 0.02, "learning_rate": 1.999486455195738e-05, "loss": 0.117, "step": 1070 }, { "epoch": 0.02, "learning_rate": 1.999481651221891e-05, "loss": 0.1096, "step": 1080 }, { "epoch": 0.02, "learning_rate": 1.9994768472480436e-05, "loss": 0.1154, "step": 1090 }, { "epoch": 0.02, "learning_rate": 1.9994720432741965e-05, "loss": 0.11, "step": 1100 }, { "epoch": 0.02, "learning_rate": 1.9994672393003494e-05, "loss": 0.1084, "step": 1110 }, { "epoch": 0.02, "learning_rate": 1.9994624353265024e-05, "loss": 0.103, "step": 1120 }, { "epoch": 0.02, "learning_rate": 1.999457631352655e-05, "loss": 0.1033, "step": 1130 }, { "epoch": 0.02, "learning_rate": 1.999452827378808e-05, "loss": 0.1185, "step": 1140 }, { "epoch": 0.02, "learning_rate": 1.9994480234049608e-05, "loss": 0.1157, "step": 1150 }, { "epoch": 0.02, "learning_rate": 1.9994432194311134e-05, "loss": 0.1047, "step": 1160 }, { "epoch": 0.02, "learning_rate": 1.9994384154572663e-05, "loss": 0.1023, "step": 1170 }, { "epoch": 0.02, "learning_rate": 1.9994336114834192e-05, "loss": 0.115, "step": 1180 }, { "epoch": 0.02, "learning_rate": 1.9994288075095722e-05, "loss": 0.1172, "step": 1190 }, { "epoch": 0.02, "learning_rate": 1.9994240035357248e-05, "loss": 0.1033, "step": 1200 }, { "epoch": 0.02, "learning_rate": 1.9994191995618777e-05, "loss": 0.1044, "step": 1210 }, { "epoch": 0.02, "learning_rate": 1.9994143955880306e-05, "loss": 0.1042, "step": 1220 }, { "epoch": 0.02, "learning_rate": 1.9994095916141832e-05, "loss": 0.1156, "step": 1230 }, { "epoch": 0.02, "learning_rate": 1.999404787640336e-05, "loss": 0.1081, "step": 1240 }, { "epoch": 0.02, "learning_rate": 1.999399983666489e-05, "loss": 0.0975, "step": 1250 }, { "epoch": 0.02, "learning_rate": 1.999395179692642e-05, "loss": 0.0989, "step": 1260 }, { "epoch": 0.02, "learning_rate": 1.9993903757187946e-05, "loss": 0.105, "step": 1270 }, { "epoch": 0.02, "learning_rate": 1.9993855717449475e-05, "loss": 0.1129, "step": 1280 }, { "epoch": 0.02, "learning_rate": 1.9993807677711004e-05, "loss": 0.0925, "step": 1290 }, { "epoch": 0.02, "learning_rate": 1.9993759637972533e-05, "loss": 0.1051, "step": 1300 }, { "epoch": 0.02, "learning_rate": 1.999371159823406e-05, "loss": 0.117, "step": 1310 }, { "epoch": 0.02, "learning_rate": 1.999366355849559e-05, "loss": 0.1076, "step": 1320 }, { "epoch": 0.02, "learning_rate": 1.9993615518757118e-05, "loss": 0.1056, "step": 1330 }, { "epoch": 0.02, "learning_rate": 1.9993567479018644e-05, "loss": 0.1068, "step": 1340 }, { "epoch": 0.02, "learning_rate": 1.9993519439280173e-05, "loss": 0.1155, "step": 1350 }, { "epoch": 0.02, "learning_rate": 1.9993471399541702e-05, "loss": 0.0998, "step": 1360 }, { "epoch": 0.02, "learning_rate": 1.999342335980323e-05, "loss": 0.1004, "step": 1370 }, { "epoch": 0.02, "learning_rate": 1.9993375320064757e-05, "loss": 0.1006, "step": 1380 }, { "epoch": 0.02, "learning_rate": 1.9993327280326287e-05, "loss": 0.0929, "step": 1390 }, { "epoch": 0.02, "learning_rate": 1.9993279240587816e-05, "loss": 0.1018, "step": 1400 }, { "epoch": 0.02, "learning_rate": 1.9993231200849342e-05, "loss": 0.0979, "step": 1410 }, { "epoch": 0.02, "learning_rate": 1.999318316111087e-05, "loss": 0.1063, "step": 1420 }, { "epoch": 0.02, "learning_rate": 1.99931351213724e-05, "loss": 0.1032, "step": 1430 }, { "epoch": 0.02, "learning_rate": 1.999308708163393e-05, "loss": 0.094, "step": 1440 }, { "epoch": 0.02, "learning_rate": 1.9993039041895456e-05, "loss": 0.1073, "step": 1450 }, { "epoch": 0.02, "learning_rate": 1.9992991002156985e-05, "loss": 0.0988, "step": 1460 }, { "epoch": 0.02, "learning_rate": 1.9992942962418514e-05, "loss": 0.1095, "step": 1470 }, { "epoch": 0.02, "learning_rate": 1.9992894922680043e-05, "loss": 0.1055, "step": 1480 }, { "epoch": 0.02, "learning_rate": 1.999284688294157e-05, "loss": 0.0908, "step": 1490 }, { "epoch": 0.02, "learning_rate": 1.99927988432031e-05, "loss": 0.0924, "step": 1500 }, { "epoch": 0.02, "learning_rate": 1.9992750803464628e-05, "loss": 0.0949, "step": 1510 }, { "epoch": 0.02, "learning_rate": 1.9992702763726154e-05, "loss": 0.097, "step": 1520 }, { "epoch": 0.02, "learning_rate": 1.9992654723987683e-05, "loss": 0.0939, "step": 1530 }, { "epoch": 0.02, "learning_rate": 1.9992606684249212e-05, "loss": 0.0922, "step": 1540 }, { "epoch": 0.02, "learning_rate": 1.999255864451074e-05, "loss": 0.092, "step": 1550 }, { "epoch": 0.02, "learning_rate": 1.9992510604772267e-05, "loss": 0.0963, "step": 1560 }, { "epoch": 0.02, "learning_rate": 1.9992462565033797e-05, "loss": 0.0912, "step": 1570 }, { "epoch": 0.02, "learning_rate": 1.9992414525295326e-05, "loss": 0.0963, "step": 1580 }, { "epoch": 0.02, "learning_rate": 1.9992366485556852e-05, "loss": 0.0883, "step": 1590 }, { "epoch": 0.02, "learning_rate": 1.999231844581838e-05, "loss": 0.1008, "step": 1600 }, { "epoch": 0.02, "learning_rate": 1.999227040607991e-05, "loss": 0.0844, "step": 1610 }, { "epoch": 0.02, "learning_rate": 1.999222236634144e-05, "loss": 0.09, "step": 1620 }, { "epoch": 0.02, "learning_rate": 1.9992174326602966e-05, "loss": 0.0904, "step": 1630 }, { "epoch": 0.02, "learning_rate": 1.9992126286864495e-05, "loss": 0.1015, "step": 1640 }, { "epoch": 0.02, "learning_rate": 1.9992078247126024e-05, "loss": 0.1012, "step": 1650 }, { "epoch": 0.02, "learning_rate": 1.999203020738755e-05, "loss": 0.0849, "step": 1660 }, { "epoch": 0.02, "learning_rate": 1.999198216764908e-05, "loss": 0.0955, "step": 1670 }, { "epoch": 0.02, "learning_rate": 1.999193412791061e-05, "loss": 0.0961, "step": 1680 }, { "epoch": 0.02, "learning_rate": 1.9991886088172138e-05, "loss": 0.0949, "step": 1690 }, { "epoch": 0.02, "learning_rate": 1.9991838048433664e-05, "loss": 0.0878, "step": 1700 }, { "epoch": 0.02, "learning_rate": 1.9991790008695193e-05, "loss": 0.1, "step": 1710 }, { "epoch": 0.02, "learning_rate": 1.9991741968956722e-05, "loss": 0.0926, "step": 1720 }, { "epoch": 0.02, "learning_rate": 1.999169392921825e-05, "loss": 0.0911, "step": 1730 }, { "epoch": 0.03, "learning_rate": 1.9991645889479777e-05, "loss": 0.099, "step": 1740 }, { "epoch": 0.03, "learning_rate": 1.9991597849741307e-05, "loss": 0.0947, "step": 1750 }, { "epoch": 0.03, "learning_rate": 1.9991549810002836e-05, "loss": 0.0949, "step": 1760 }, { "epoch": 0.03, "learning_rate": 1.9991501770264362e-05, "loss": 0.0981, "step": 1770 }, { "epoch": 0.03, "learning_rate": 1.999145373052589e-05, "loss": 0.0919, "step": 1780 }, { "epoch": 0.03, "learning_rate": 1.999140569078742e-05, "loss": 0.0926, "step": 1790 }, { "epoch": 0.03, "learning_rate": 1.999135765104895e-05, "loss": 0.0852, "step": 1800 }, { "epoch": 0.03, "learning_rate": 1.999130961131048e-05, "loss": 0.0913, "step": 1810 }, { "epoch": 0.03, "learning_rate": 1.9991261571572008e-05, "loss": 0.0868, "step": 1820 }, { "epoch": 0.03, "learning_rate": 1.9991213531833534e-05, "loss": 0.0932, "step": 1830 }, { "epoch": 0.03, "learning_rate": 1.9991165492095063e-05, "loss": 0.0954, "step": 1840 }, { "epoch": 0.03, "learning_rate": 1.9991117452356593e-05, "loss": 0.092, "step": 1850 }, { "epoch": 0.03, "learning_rate": 1.9991069412618122e-05, "loss": 0.0874, "step": 1860 }, { "epoch": 0.03, "learning_rate": 1.9991021372879648e-05, "loss": 0.0942, "step": 1870 }, { "epoch": 0.03, "learning_rate": 1.9990973333141177e-05, "loss": 0.0858, "step": 1880 }, { "epoch": 0.03, "learning_rate": 1.9990925293402706e-05, "loss": 0.0915, "step": 1890 }, { "epoch": 0.03, "learning_rate": 1.9990877253664232e-05, "loss": 0.0853, "step": 1900 }, { "epoch": 0.03, "learning_rate": 1.999082921392576e-05, "loss": 0.0848, "step": 1910 }, { "epoch": 0.03, "learning_rate": 1.999078117418729e-05, "loss": 0.0869, "step": 1920 }, { "epoch": 0.03, "learning_rate": 1.999073313444882e-05, "loss": 0.0881, "step": 1930 }, { "epoch": 0.03, "learning_rate": 1.9990685094710346e-05, "loss": 0.0914, "step": 1940 }, { "epoch": 0.03, "learning_rate": 1.9990637054971875e-05, "loss": 0.0862, "step": 1950 }, { "epoch": 0.03, "learning_rate": 1.9990589015233404e-05, "loss": 0.0851, "step": 1960 }, { "epoch": 0.03, "learning_rate": 1.9990540975494934e-05, "loss": 0.0813, "step": 1970 }, { "epoch": 0.03, "learning_rate": 1.999049293575646e-05, "loss": 0.0733, "step": 1980 }, { "epoch": 0.03, "learning_rate": 1.999044489601799e-05, "loss": 0.0935, "step": 1990 }, { "epoch": 0.03, "learning_rate": 1.9990396856279518e-05, "loss": 0.0975, "step": 2000 }, { "epoch": 0.03, "learning_rate": 1.9990348816541044e-05, "loss": 0.0877, "step": 2010 }, { "epoch": 0.03, "learning_rate": 1.9990300776802573e-05, "loss": 0.0968, "step": 2020 }, { "epoch": 0.03, "learning_rate": 1.9990252737064102e-05, "loss": 0.0858, "step": 2030 }, { "epoch": 0.03, "learning_rate": 1.9990204697325632e-05, "loss": 0.0851, "step": 2040 }, { "epoch": 0.03, "learning_rate": 1.9990156657587158e-05, "loss": 0.0803, "step": 2050 }, { "epoch": 0.03, "learning_rate": 1.9990108617848687e-05, "loss": 0.0874, "step": 2060 }, { "epoch": 0.03, "learning_rate": 1.9990060578110216e-05, "loss": 0.0882, "step": 2070 }, { "epoch": 0.03, "learning_rate": 1.9990012538371742e-05, "loss": 0.0789, "step": 2080 }, { "epoch": 0.03, "learning_rate": 1.998996449863327e-05, "loss": 0.0842, "step": 2090 }, { "epoch": 0.03, "learning_rate": 1.99899164588948e-05, "loss": 0.0806, "step": 2100 }, { "epoch": 0.03, "learning_rate": 1.998986841915633e-05, "loss": 0.08, "step": 2110 }, { "epoch": 0.03, "learning_rate": 1.9989820379417856e-05, "loss": 0.0834, "step": 2120 }, { "epoch": 0.03, "learning_rate": 1.9989772339679385e-05, "loss": 0.0851, "step": 2130 }, { "epoch": 0.03, "learning_rate": 1.9989724299940914e-05, "loss": 0.0844, "step": 2140 }, { "epoch": 0.03, "learning_rate": 1.9989676260202443e-05, "loss": 0.0804, "step": 2150 }, { "epoch": 0.03, "learning_rate": 1.998962822046397e-05, "loss": 0.0792, "step": 2160 }, { "epoch": 0.03, "learning_rate": 1.99895801807255e-05, "loss": 0.0747, "step": 2170 }, { "epoch": 0.03, "learning_rate": 1.9989532140987028e-05, "loss": 0.0795, "step": 2180 }, { "epoch": 0.03, "learning_rate": 1.9989484101248554e-05, "loss": 0.0721, "step": 2190 }, { "epoch": 0.03, "learning_rate": 1.9989436061510083e-05, "loss": 0.0859, "step": 2200 }, { "epoch": 0.03, "learning_rate": 1.9989388021771612e-05, "loss": 0.0844, "step": 2210 }, { "epoch": 0.03, "learning_rate": 1.998933998203314e-05, "loss": 0.0813, "step": 2220 }, { "epoch": 0.03, "learning_rate": 1.9989291942294667e-05, "loss": 0.0885, "step": 2230 }, { "epoch": 0.03, "learning_rate": 1.9989243902556197e-05, "loss": 0.0873, "step": 2240 }, { "epoch": 0.03, "learning_rate": 1.9989195862817726e-05, "loss": 0.0803, "step": 2250 }, { "epoch": 0.03, "learning_rate": 1.9989147823079252e-05, "loss": 0.0779, "step": 2260 }, { "epoch": 0.03, "learning_rate": 1.998909978334078e-05, "loss": 0.0899, "step": 2270 }, { "epoch": 0.03, "learning_rate": 1.998905174360231e-05, "loss": 0.0789, "step": 2280 }, { "epoch": 0.03, "learning_rate": 1.998900370386384e-05, "loss": 0.0929, "step": 2290 }, { "epoch": 0.03, "learning_rate": 1.9988955664125366e-05, "loss": 0.0861, "step": 2300 }, { "epoch": 0.03, "learning_rate": 1.9988907624386895e-05, "loss": 0.0717, "step": 2310 }, { "epoch": 0.03, "learning_rate": 1.9988859584648424e-05, "loss": 0.0856, "step": 2320 }, { "epoch": 0.03, "learning_rate": 1.9988811544909953e-05, "loss": 0.075, "step": 2330 }, { "epoch": 0.03, "learning_rate": 1.998876350517148e-05, "loss": 0.0906, "step": 2340 }, { "epoch": 0.03, "learning_rate": 1.998871546543301e-05, "loss": 0.0801, "step": 2350 }, { "epoch": 0.03, "learning_rate": 1.9988667425694538e-05, "loss": 0.0752, "step": 2360 }, { "epoch": 0.03, "learning_rate": 1.9988619385956064e-05, "loss": 0.0732, "step": 2370 }, { "epoch": 0.03, "learning_rate": 1.9988571346217593e-05, "loss": 0.073, "step": 2380 }, { "epoch": 0.03, "learning_rate": 1.9988523306479122e-05, "loss": 0.0783, "step": 2390 }, { "epoch": 0.03, "learning_rate": 1.998847526674065e-05, "loss": 0.0744, "step": 2400 }, { "epoch": 0.03, "learning_rate": 1.9988427227002177e-05, "loss": 0.0792, "step": 2410 }, { "epoch": 0.03, "learning_rate": 1.9988379187263707e-05, "loss": 0.0863, "step": 2420 }, { "epoch": 0.04, "learning_rate": 1.9988331147525236e-05, "loss": 0.0776, "step": 2430 }, { "epoch": 0.04, "learning_rate": 1.9988283107786762e-05, "loss": 0.0765, "step": 2440 }, { "epoch": 0.04, "learning_rate": 1.998823506804829e-05, "loss": 0.0743, "step": 2450 }, { "epoch": 0.04, "learning_rate": 1.998818702830982e-05, "loss": 0.0788, "step": 2460 }, { "epoch": 0.04, "learning_rate": 1.998813898857135e-05, "loss": 0.0747, "step": 2470 }, { "epoch": 0.04, "learning_rate": 1.9988090948832876e-05, "loss": 0.0801, "step": 2480 }, { "epoch": 0.04, "learning_rate": 1.9988042909094405e-05, "loss": 0.0736, "step": 2490 }, { "epoch": 0.04, "learning_rate": 1.9987994869355934e-05, "loss": 0.0783, "step": 2500 }, { "epoch": 0.04, "learning_rate": 1.9987946829617463e-05, "loss": 0.0763, "step": 2510 }, { "epoch": 0.04, "learning_rate": 1.998789878987899e-05, "loss": 0.0783, "step": 2520 }, { "epoch": 0.04, "learning_rate": 1.998785075014052e-05, "loss": 0.0867, "step": 2530 }, { "epoch": 0.04, "learning_rate": 1.9987802710402048e-05, "loss": 0.0722, "step": 2540 }, { "epoch": 0.04, "learning_rate": 1.9987754670663574e-05, "loss": 0.0727, "step": 2550 }, { "epoch": 0.04, "learning_rate": 1.9987706630925103e-05, "loss": 0.0746, "step": 2560 }, { "epoch": 0.04, "learning_rate": 1.9987658591186632e-05, "loss": 0.0809, "step": 2570 }, { "epoch": 0.04, "learning_rate": 1.998761055144816e-05, "loss": 0.0802, "step": 2580 }, { "epoch": 0.04, "learning_rate": 1.9987562511709687e-05, "loss": 0.0796, "step": 2590 }, { "epoch": 0.04, "learning_rate": 1.9987514471971217e-05, "loss": 0.0827, "step": 2600 }, { "epoch": 0.04, "learning_rate": 1.9987466432232746e-05, "loss": 0.085, "step": 2610 }, { "epoch": 0.04, "learning_rate": 1.9987418392494272e-05, "loss": 0.0726, "step": 2620 }, { "epoch": 0.04, "learning_rate": 1.99873703527558e-05, "loss": 0.0782, "step": 2630 }, { "epoch": 0.04, "learning_rate": 1.998732231301733e-05, "loss": 0.0826, "step": 2640 }, { "epoch": 0.04, "learning_rate": 1.998727427327886e-05, "loss": 0.074, "step": 2650 }, { "epoch": 0.04, "learning_rate": 1.9987226233540385e-05, "loss": 0.0737, "step": 2660 }, { "epoch": 0.04, "learning_rate": 1.9987178193801915e-05, "loss": 0.0787, "step": 2670 }, { "epoch": 0.04, "learning_rate": 1.9987130154063444e-05, "loss": 0.0734, "step": 2680 }, { "epoch": 0.04, "learning_rate": 1.9987082114324973e-05, "loss": 0.0648, "step": 2690 }, { "epoch": 0.04, "learning_rate": 1.99870340745865e-05, "loss": 0.0752, "step": 2700 }, { "epoch": 0.04, "learning_rate": 1.998698603484803e-05, "loss": 0.0712, "step": 2710 }, { "epoch": 0.04, "learning_rate": 1.9986937995109558e-05, "loss": 0.0642, "step": 2720 }, { "epoch": 0.04, "learning_rate": 1.9986889955371084e-05, "loss": 0.0724, "step": 2730 }, { "epoch": 0.04, "learning_rate": 1.9986841915632613e-05, "loss": 0.0683, "step": 2740 }, { "epoch": 0.04, "learning_rate": 1.9986793875894142e-05, "loss": 0.0712, "step": 2750 }, { "epoch": 0.04, "learning_rate": 1.998674583615567e-05, "loss": 0.069, "step": 2760 }, { "epoch": 0.04, "learning_rate": 1.9986697796417197e-05, "loss": 0.0701, "step": 2770 }, { "epoch": 0.04, "learning_rate": 1.9986649756678727e-05, "loss": 0.0737, "step": 2780 }, { "epoch": 0.04, "learning_rate": 1.9986601716940256e-05, "loss": 0.0756, "step": 2790 }, { "epoch": 0.04, "learning_rate": 1.998655367720178e-05, "loss": 0.088, "step": 2800 }, { "epoch": 0.04, "learning_rate": 1.998650563746331e-05, "loss": 0.0657, "step": 2810 }, { "epoch": 0.04, "learning_rate": 1.998645759772484e-05, "loss": 0.0743, "step": 2820 }, { "epoch": 0.04, "learning_rate": 1.998640955798637e-05, "loss": 0.0728, "step": 2830 }, { "epoch": 0.04, "learning_rate": 1.9986361518247895e-05, "loss": 0.0715, "step": 2840 }, { "epoch": 0.04, "learning_rate": 1.9986313478509425e-05, "loss": 0.075, "step": 2850 }, { "epoch": 0.04, "learning_rate": 1.9986265438770954e-05, "loss": 0.0736, "step": 2860 }, { "epoch": 0.04, "learning_rate": 1.9986217399032483e-05, "loss": 0.0653, "step": 2870 }, { "epoch": 0.04, "learning_rate": 1.998616935929401e-05, "loss": 0.0654, "step": 2880 }, { "epoch": 0.04, "learning_rate": 1.998612131955554e-05, "loss": 0.0771, "step": 2890 }, { "epoch": 0.04, "learning_rate": 1.9986073279817068e-05, "loss": 0.058, "step": 2900 }, { "epoch": 0.04, "learning_rate": 1.9986025240078593e-05, "loss": 0.0688, "step": 2910 }, { "epoch": 0.04, "learning_rate": 1.9985977200340123e-05, "loss": 0.0753, "step": 2920 }, { "epoch": 0.04, "learning_rate": 1.9985929160601652e-05, "loss": 0.0743, "step": 2930 }, { "epoch": 0.04, "learning_rate": 1.998588112086318e-05, "loss": 0.0647, "step": 2940 }, { "epoch": 0.04, "learning_rate": 1.9985833081124707e-05, "loss": 0.0616, "step": 2950 }, { "epoch": 0.04, "learning_rate": 1.9985785041386236e-05, "loss": 0.0753, "step": 2960 }, { "epoch": 0.04, "learning_rate": 1.9985737001647766e-05, "loss": 0.0712, "step": 2970 }, { "epoch": 0.04, "learning_rate": 1.998568896190929e-05, "loss": 0.0682, "step": 2980 }, { "epoch": 0.04, "learning_rate": 1.998564092217082e-05, "loss": 0.0679, "step": 2990 }, { "epoch": 0.04, "learning_rate": 1.998559288243235e-05, "loss": 0.0764, "step": 3000 }, { "epoch": 0.04, "learning_rate": 1.998554484269388e-05, "loss": 0.0644, "step": 3010 }, { "epoch": 0.04, "learning_rate": 1.9985496802955405e-05, "loss": 0.0593, "step": 3020 }, { "epoch": 0.04, "learning_rate": 1.9985448763216935e-05, "loss": 0.0652, "step": 3030 }, { "epoch": 0.04, "learning_rate": 1.9985400723478464e-05, "loss": 0.0677, "step": 3040 }, { "epoch": 0.04, "learning_rate": 1.998535268373999e-05, "loss": 0.0658, "step": 3050 }, { "epoch": 0.04, "learning_rate": 1.998530464400152e-05, "loss": 0.0669, "step": 3060 }, { "epoch": 0.04, "learning_rate": 1.9985256604263048e-05, "loss": 0.0674, "step": 3070 }, { "epoch": 0.04, "learning_rate": 1.9985208564524577e-05, "loss": 0.0722, "step": 3080 }, { "epoch": 0.04, "learning_rate": 1.9985160524786103e-05, "loss": 0.0668, "step": 3090 }, { "epoch": 0.04, "learning_rate": 1.9985112485047633e-05, "loss": 0.0759, "step": 3100 }, { "epoch": 0.04, "learning_rate": 1.9985064445309162e-05, "loss": 0.0736, "step": 3110 }, { "epoch": 0.04, "learning_rate": 1.998501640557069e-05, "loss": 0.0766, "step": 3120 }, { "epoch": 0.05, "learning_rate": 1.9984968365832217e-05, "loss": 0.0764, "step": 3130 }, { "epoch": 0.05, "learning_rate": 1.9984920326093746e-05, "loss": 0.0701, "step": 3140 }, { "epoch": 0.05, "learning_rate": 1.9984872286355276e-05, "loss": 0.0764, "step": 3150 }, { "epoch": 0.05, "learning_rate": 1.99848242466168e-05, "loss": 0.0708, "step": 3160 }, { "epoch": 0.05, "learning_rate": 1.998477620687833e-05, "loss": 0.0749, "step": 3170 }, { "epoch": 0.05, "learning_rate": 1.998472816713986e-05, "loss": 0.0758, "step": 3180 }, { "epoch": 0.05, "learning_rate": 1.998468012740139e-05, "loss": 0.0694, "step": 3190 }, { "epoch": 0.05, "learning_rate": 1.9984632087662915e-05, "loss": 0.0718, "step": 3200 }, { "epoch": 0.05, "learning_rate": 1.9984584047924444e-05, "loss": 0.0747, "step": 3210 }, { "epoch": 0.05, "learning_rate": 1.9984536008185974e-05, "loss": 0.0613, "step": 3220 }, { "epoch": 0.05, "learning_rate": 1.99844879684475e-05, "loss": 0.0575, "step": 3230 }, { "epoch": 0.05, "learning_rate": 1.998443992870903e-05, "loss": 0.0625, "step": 3240 }, { "epoch": 0.05, "learning_rate": 1.9984391888970558e-05, "loss": 0.0616, "step": 3250 }, { "epoch": 0.05, "learning_rate": 1.9984343849232087e-05, "loss": 0.071, "step": 3260 }, { "epoch": 0.05, "learning_rate": 1.9984295809493613e-05, "loss": 0.0646, "step": 3270 }, { "epoch": 0.05, "learning_rate": 1.9984247769755143e-05, "loss": 0.064, "step": 3280 }, { "epoch": 0.05, "learning_rate": 1.9984199730016672e-05, "loss": 0.0683, "step": 3290 }, { "epoch": 0.05, "learning_rate": 1.99841516902782e-05, "loss": 0.0686, "step": 3300 }, { "epoch": 0.05, "learning_rate": 1.9984103650539727e-05, "loss": 0.0715, "step": 3310 }, { "epoch": 0.05, "learning_rate": 1.9984055610801256e-05, "loss": 0.0574, "step": 3320 }, { "epoch": 0.05, "learning_rate": 1.9984007571062786e-05, "loss": 0.068, "step": 3330 }, { "epoch": 0.05, "learning_rate": 1.998395953132431e-05, "loss": 0.0644, "step": 3340 }, { "epoch": 0.05, "learning_rate": 1.998391149158584e-05, "loss": 0.0634, "step": 3350 }, { "epoch": 0.05, "learning_rate": 1.998386345184737e-05, "loss": 0.0646, "step": 3360 }, { "epoch": 0.05, "learning_rate": 1.99838154121089e-05, "loss": 0.0602, "step": 3370 }, { "epoch": 0.05, "learning_rate": 1.9983767372370425e-05, "loss": 0.0685, "step": 3380 }, { "epoch": 0.05, "learning_rate": 1.9983719332631954e-05, "loss": 0.0589, "step": 3390 }, { "epoch": 0.05, "learning_rate": 1.9983671292893484e-05, "loss": 0.0703, "step": 3400 }, { "epoch": 0.05, "learning_rate": 1.998362325315501e-05, "loss": 0.0633, "step": 3410 }, { "epoch": 0.05, "learning_rate": 1.998357521341654e-05, "loss": 0.0676, "step": 3420 }, { "epoch": 0.05, "learning_rate": 1.9983527173678068e-05, "loss": 0.065, "step": 3430 }, { "epoch": 0.05, "learning_rate": 1.9983479133939597e-05, "loss": 0.0658, "step": 3440 }, { "epoch": 0.05, "learning_rate": 1.9983431094201123e-05, "loss": 0.0694, "step": 3450 }, { "epoch": 0.05, "learning_rate": 1.9983383054462652e-05, "loss": 0.0647, "step": 3460 }, { "epoch": 0.05, "learning_rate": 1.9983335014724182e-05, "loss": 0.0721, "step": 3470 }, { "epoch": 0.05, "learning_rate": 1.998328697498571e-05, "loss": 0.0626, "step": 3480 }, { "epoch": 0.05, "learning_rate": 1.9983238935247237e-05, "loss": 0.058, "step": 3490 }, { "epoch": 0.05, "learning_rate": 1.9983190895508766e-05, "loss": 0.0653, "step": 3500 }, { "epoch": 0.05, "learning_rate": 1.9983142855770295e-05, "loss": 0.0698, "step": 3510 }, { "epoch": 0.05, "learning_rate": 1.998309481603182e-05, "loss": 0.0687, "step": 3520 }, { "epoch": 0.05, "learning_rate": 1.998304677629335e-05, "loss": 0.0709, "step": 3530 }, { "epoch": 0.05, "learning_rate": 1.998299873655488e-05, "loss": 0.0729, "step": 3540 }, { "epoch": 0.05, "learning_rate": 1.998295069681641e-05, "loss": 0.0632, "step": 3550 }, { "epoch": 0.05, "learning_rate": 1.9982902657077935e-05, "loss": 0.0803, "step": 3560 }, { "epoch": 0.05, "learning_rate": 1.9982854617339464e-05, "loss": 0.0678, "step": 3570 }, { "epoch": 0.05, "learning_rate": 1.9982806577600994e-05, "loss": 0.0627, "step": 3580 }, { "epoch": 0.05, "learning_rate": 1.998275853786252e-05, "loss": 0.064, "step": 3590 }, { "epoch": 0.05, "learning_rate": 1.998271049812405e-05, "loss": 0.0764, "step": 3600 }, { "epoch": 0.05, "learning_rate": 1.9982662458385578e-05, "loss": 0.065, "step": 3610 }, { "epoch": 0.05, "learning_rate": 1.9982614418647107e-05, "loss": 0.0621, "step": 3620 }, { "epoch": 0.05, "learning_rate": 1.9982566378908633e-05, "loss": 0.0664, "step": 3630 }, { "epoch": 0.05, "learning_rate": 1.9982518339170162e-05, "loss": 0.064, "step": 3640 }, { "epoch": 0.05, "learning_rate": 1.998247029943169e-05, "loss": 0.0676, "step": 3650 }, { "epoch": 0.05, "learning_rate": 1.998242225969322e-05, "loss": 0.0579, "step": 3660 }, { "epoch": 0.05, "learning_rate": 1.9982374219954747e-05, "loss": 0.0542, "step": 3670 }, { "epoch": 0.05, "learning_rate": 1.9982326180216276e-05, "loss": 0.0571, "step": 3680 }, { "epoch": 0.05, "learning_rate": 1.9982278140477805e-05, "loss": 0.0676, "step": 3690 }, { "epoch": 0.05, "learning_rate": 1.998223010073933e-05, "loss": 0.0692, "step": 3700 }, { "epoch": 0.05, "learning_rate": 1.998218206100086e-05, "loss": 0.0666, "step": 3710 }, { "epoch": 0.05, "learning_rate": 1.998213402126239e-05, "loss": 0.0583, "step": 3720 }, { "epoch": 0.05, "learning_rate": 1.998208598152392e-05, "loss": 0.0654, "step": 3730 }, { "epoch": 0.05, "learning_rate": 1.9982037941785445e-05, "loss": 0.0656, "step": 3740 }, { "epoch": 0.05, "learning_rate": 1.9981989902046974e-05, "loss": 0.0686, "step": 3750 }, { "epoch": 0.05, "learning_rate": 1.9981941862308503e-05, "loss": 0.0697, "step": 3760 }, { "epoch": 0.05, "learning_rate": 1.998189382257003e-05, "loss": 0.064, "step": 3770 }, { "epoch": 0.05, "learning_rate": 1.998184578283156e-05, "loss": 0.0662, "step": 3780 }, { "epoch": 0.05, "learning_rate": 1.9981797743093088e-05, "loss": 0.0612, "step": 3790 }, { "epoch": 0.05, "learning_rate": 1.9981749703354617e-05, "loss": 0.0714, "step": 3800 }, { "epoch": 0.05, "learning_rate": 1.9981701663616143e-05, "loss": 0.0663, "step": 3810 }, { "epoch": 0.06, "learning_rate": 1.9981653623877672e-05, "loss": 0.0666, "step": 3820 }, { "epoch": 0.06, "learning_rate": 1.99816055841392e-05, "loss": 0.0666, "step": 3830 }, { "epoch": 0.06, "learning_rate": 1.998155754440073e-05, "loss": 0.0649, "step": 3840 }, { "epoch": 0.06, "learning_rate": 1.9981509504662257e-05, "loss": 0.0685, "step": 3850 }, { "epoch": 0.06, "learning_rate": 1.9981461464923786e-05, "loss": 0.0612, "step": 3860 }, { "epoch": 0.06, "learning_rate": 1.9981413425185315e-05, "loss": 0.0579, "step": 3870 }, { "epoch": 0.06, "learning_rate": 1.998136538544684e-05, "loss": 0.0651, "step": 3880 }, { "epoch": 0.06, "learning_rate": 1.998131734570837e-05, "loss": 0.0526, "step": 3890 }, { "epoch": 0.06, "learning_rate": 1.99812693059699e-05, "loss": 0.0697, "step": 3900 }, { "epoch": 0.06, "learning_rate": 1.998122126623143e-05, "loss": 0.0682, "step": 3910 }, { "epoch": 0.06, "learning_rate": 1.9981173226492955e-05, "loss": 0.0614, "step": 3920 }, { "epoch": 0.06, "learning_rate": 1.9981125186754484e-05, "loss": 0.0614, "step": 3930 }, { "epoch": 0.06, "learning_rate": 1.9981077147016013e-05, "loss": 0.0504, "step": 3940 }, { "epoch": 0.06, "learning_rate": 1.998102910727754e-05, "loss": 0.0563, "step": 3950 }, { "epoch": 0.06, "learning_rate": 1.998098106753907e-05, "loss": 0.0621, "step": 3960 }, { "epoch": 0.06, "learning_rate": 1.9980933027800598e-05, "loss": 0.055, "step": 3970 }, { "epoch": 0.06, "learning_rate": 1.9980884988062127e-05, "loss": 0.0556, "step": 3980 }, { "epoch": 0.06, "learning_rate": 1.9980836948323653e-05, "loss": 0.0649, "step": 3990 }, { "epoch": 0.06, "learning_rate": 1.9980788908585182e-05, "loss": 0.063, "step": 4000 }, { "epoch": 0.06, "learning_rate": 1.998074086884671e-05, "loss": 0.0658, "step": 4010 }, { "epoch": 0.06, "learning_rate": 1.998069282910824e-05, "loss": 0.0626, "step": 4020 }, { "epoch": 0.06, "learning_rate": 1.9980644789369767e-05, "loss": 0.0612, "step": 4030 }, { "epoch": 0.06, "learning_rate": 1.9980596749631296e-05, "loss": 0.056, "step": 4040 }, { "epoch": 0.06, "learning_rate": 1.9980548709892825e-05, "loss": 0.0626, "step": 4050 }, { "epoch": 0.06, "learning_rate": 1.998050067015435e-05, "loss": 0.0567, "step": 4060 }, { "epoch": 0.06, "learning_rate": 1.998045263041588e-05, "loss": 0.0656, "step": 4070 }, { "epoch": 0.06, "learning_rate": 1.998040459067741e-05, "loss": 0.054, "step": 4080 }, { "epoch": 0.06, "learning_rate": 1.998035655093894e-05, "loss": 0.0657, "step": 4090 }, { "epoch": 0.06, "learning_rate": 1.9980308511200465e-05, "loss": 0.0664, "step": 4100 }, { "epoch": 0.06, "learning_rate": 1.9980260471461994e-05, "loss": 0.0675, "step": 4110 }, { "epoch": 0.06, "learning_rate": 1.9980212431723523e-05, "loss": 0.062, "step": 4120 }, { "epoch": 0.06, "learning_rate": 1.998016439198505e-05, "loss": 0.053, "step": 4130 }, { "epoch": 0.06, "learning_rate": 1.998011635224658e-05, "loss": 0.0583, "step": 4140 }, { "epoch": 0.06, "learning_rate": 1.9980068312508108e-05, "loss": 0.0536, "step": 4150 }, { "epoch": 0.06, "learning_rate": 1.9980020272769637e-05, "loss": 0.064, "step": 4160 }, { "epoch": 0.06, "learning_rate": 1.9979972233031163e-05, "loss": 0.057, "step": 4170 }, { "epoch": 0.06, "learning_rate": 1.9979924193292692e-05, "loss": 0.062, "step": 4180 }, { "epoch": 0.06, "learning_rate": 1.997987615355422e-05, "loss": 0.0606, "step": 4190 }, { "epoch": 0.06, "learning_rate": 1.997982811381575e-05, "loss": 0.0527, "step": 4200 }, { "epoch": 0.06, "learning_rate": 1.9979780074077277e-05, "loss": 0.0577, "step": 4210 }, { "epoch": 0.06, "learning_rate": 1.9979732034338806e-05, "loss": 0.0548, "step": 4220 }, { "epoch": 0.06, "learning_rate": 1.9979683994600335e-05, "loss": 0.0536, "step": 4230 }, { "epoch": 0.06, "learning_rate": 1.997963595486186e-05, "loss": 0.0575, "step": 4240 }, { "epoch": 0.06, "learning_rate": 1.997958791512339e-05, "loss": 0.0577, "step": 4250 }, { "epoch": 0.06, "learning_rate": 1.997953987538492e-05, "loss": 0.0554, "step": 4260 }, { "epoch": 0.06, "learning_rate": 1.997949183564645e-05, "loss": 0.0569, "step": 4270 }, { "epoch": 0.06, "learning_rate": 1.9979443795907975e-05, "loss": 0.0634, "step": 4280 }, { "epoch": 0.06, "learning_rate": 1.9979395756169504e-05, "loss": 0.0582, "step": 4290 }, { "epoch": 0.06, "learning_rate": 1.9979347716431033e-05, "loss": 0.0589, "step": 4300 }, { "epoch": 0.06, "learning_rate": 1.997929967669256e-05, "loss": 0.0601, "step": 4310 }, { "epoch": 0.06, "learning_rate": 1.997925163695409e-05, "loss": 0.054, "step": 4320 }, { "epoch": 0.06, "learning_rate": 1.9979203597215618e-05, "loss": 0.0581, "step": 4330 }, { "epoch": 0.06, "learning_rate": 1.9979155557477147e-05, "loss": 0.0753, "step": 4340 }, { "epoch": 0.06, "learning_rate": 1.9979107517738673e-05, "loss": 0.0696, "step": 4350 }, { "epoch": 0.06, "learning_rate": 1.9979059478000205e-05, "loss": 0.0651, "step": 4360 }, { "epoch": 0.06, "learning_rate": 1.997901143826173e-05, "loss": 0.0585, "step": 4370 }, { "epoch": 0.06, "learning_rate": 1.997896339852326e-05, "loss": 0.0659, "step": 4380 }, { "epoch": 0.06, "learning_rate": 1.997891535878479e-05, "loss": 0.064, "step": 4390 }, { "epoch": 0.06, "learning_rate": 1.997886731904632e-05, "loss": 0.0696, "step": 4400 }, { "epoch": 0.06, "learning_rate": 1.9978819279307845e-05, "loss": 0.0572, "step": 4410 }, { "epoch": 0.06, "learning_rate": 1.9978771239569374e-05, "loss": 0.0525, "step": 4420 }, { "epoch": 0.06, "learning_rate": 1.9978723199830904e-05, "loss": 0.0565, "step": 4430 }, { "epoch": 0.06, "learning_rate": 1.9978675160092433e-05, "loss": 0.0559, "step": 4440 }, { "epoch": 0.06, "learning_rate": 1.997862712035396e-05, "loss": 0.0615, "step": 4450 }, { "epoch": 0.06, "learning_rate": 1.9978579080615488e-05, "loss": 0.0638, "step": 4460 }, { "epoch": 0.06, "learning_rate": 1.9978531040877017e-05, "loss": 0.0624, "step": 4470 }, { "epoch": 0.06, "learning_rate": 1.9978483001138543e-05, "loss": 0.053, "step": 4480 }, { "epoch": 0.06, "learning_rate": 1.9978434961400072e-05, "loss": 0.0482, "step": 4490 }, { "epoch": 0.06, "learning_rate": 1.99783869216616e-05, "loss": 0.0562, "step": 4500 }, { "epoch": 0.06, "learning_rate": 1.997833888192313e-05, "loss": 0.0558, "step": 4510 }, { "epoch": 0.07, "learning_rate": 1.9978290842184657e-05, "loss": 0.0481, "step": 4520 }, { "epoch": 0.07, "learning_rate": 1.9978242802446186e-05, "loss": 0.0557, "step": 4530 }, { "epoch": 0.07, "learning_rate": 1.9978194762707715e-05, "loss": 0.059, "step": 4540 }, { "epoch": 0.07, "learning_rate": 1.997814672296924e-05, "loss": 0.0578, "step": 4550 }, { "epoch": 0.07, "learning_rate": 1.997809868323077e-05, "loss": 0.0562, "step": 4560 }, { "epoch": 0.07, "learning_rate": 1.99780506434923e-05, "loss": 0.056, "step": 4570 }, { "epoch": 0.07, "learning_rate": 1.997800260375383e-05, "loss": 0.0553, "step": 4580 }, { "epoch": 0.07, "learning_rate": 1.9977954564015355e-05, "loss": 0.0585, "step": 4590 }, { "epoch": 0.07, "learning_rate": 1.9977906524276884e-05, "loss": 0.0534, "step": 4600 }, { "epoch": 0.07, "learning_rate": 1.9977858484538413e-05, "loss": 0.0532, "step": 4610 }, { "epoch": 0.07, "learning_rate": 1.997781044479994e-05, "loss": 0.0582, "step": 4620 }, { "epoch": 0.07, "learning_rate": 1.997776240506147e-05, "loss": 0.063, "step": 4630 }, { "epoch": 0.07, "learning_rate": 1.9977714365322998e-05, "loss": 0.058, "step": 4640 }, { "epoch": 0.07, "learning_rate": 1.9977666325584527e-05, "loss": 0.062, "step": 4650 }, { "epoch": 0.07, "learning_rate": 1.9977618285846053e-05, "loss": 0.0618, "step": 4660 }, { "epoch": 0.07, "learning_rate": 1.9977570246107582e-05, "loss": 0.0612, "step": 4670 }, { "epoch": 0.07, "learning_rate": 1.997752220636911e-05, "loss": 0.0475, "step": 4680 }, { "epoch": 0.07, "learning_rate": 1.997747416663064e-05, "loss": 0.0631, "step": 4690 }, { "epoch": 0.07, "learning_rate": 1.9977426126892167e-05, "loss": 0.0588, "step": 4700 }, { "epoch": 0.07, "learning_rate": 1.9977378087153696e-05, "loss": 0.0639, "step": 4710 }, { "epoch": 0.07, "learning_rate": 1.9977330047415225e-05, "loss": 0.0517, "step": 4720 }, { "epoch": 0.07, "learning_rate": 1.997728200767675e-05, "loss": 0.0451, "step": 4730 }, { "epoch": 0.07, "learning_rate": 1.997723396793828e-05, "loss": 0.0506, "step": 4740 }, { "epoch": 0.07, "learning_rate": 1.997718592819981e-05, "loss": 0.0548, "step": 4750 }, { "epoch": 0.07, "learning_rate": 1.997713788846134e-05, "loss": 0.0586, "step": 4760 }, { "epoch": 0.07, "learning_rate": 1.9977089848722865e-05, "loss": 0.0528, "step": 4770 }, { "epoch": 0.07, "learning_rate": 1.9977041808984394e-05, "loss": 0.0564, "step": 4780 }, { "epoch": 0.07, "learning_rate": 1.9976993769245923e-05, "loss": 0.0496, "step": 4790 }, { "epoch": 0.07, "learning_rate": 1.997694572950745e-05, "loss": 0.0547, "step": 4800 }, { "epoch": 0.07, "learning_rate": 1.997689768976898e-05, "loss": 0.0568, "step": 4810 }, { "epoch": 0.07, "learning_rate": 1.9976849650030508e-05, "loss": 0.0575, "step": 4820 }, { "epoch": 0.07, "learning_rate": 1.9976801610292037e-05, "loss": 0.0668, "step": 4830 }, { "epoch": 0.07, "learning_rate": 1.9976753570553563e-05, "loss": 0.0633, "step": 4840 }, { "epoch": 0.07, "learning_rate": 1.9976705530815092e-05, "loss": 0.0522, "step": 4850 }, { "epoch": 0.07, "learning_rate": 1.997665749107662e-05, "loss": 0.0492, "step": 4860 }, { "epoch": 0.07, "learning_rate": 1.997660945133815e-05, "loss": 0.0626, "step": 4870 }, { "epoch": 0.07, "learning_rate": 1.9976561411599677e-05, "loss": 0.0522, "step": 4880 }, { "epoch": 0.07, "learning_rate": 1.9976513371861206e-05, "loss": 0.0573, "step": 4890 }, { "epoch": 0.07, "learning_rate": 1.9976465332122735e-05, "loss": 0.0586, "step": 4900 }, { "epoch": 0.07, "learning_rate": 1.997641729238426e-05, "loss": 0.0611, "step": 4910 }, { "epoch": 0.07, "learning_rate": 1.997636925264579e-05, "loss": 0.0599, "step": 4920 }, { "epoch": 0.07, "learning_rate": 1.997632121290732e-05, "loss": 0.0555, "step": 4930 }, { "epoch": 0.07, "learning_rate": 1.997627317316885e-05, "loss": 0.0523, "step": 4940 }, { "epoch": 0.07, "learning_rate": 1.9976225133430375e-05, "loss": 0.0577, "step": 4950 }, { "epoch": 0.07, "learning_rate": 1.9976177093691904e-05, "loss": 0.0465, "step": 4960 }, { "epoch": 0.07, "learning_rate": 1.9976129053953433e-05, "loss": 0.0589, "step": 4970 }, { "epoch": 0.07, "learning_rate": 1.997608101421496e-05, "loss": 0.0622, "step": 4980 }, { "epoch": 0.07, "learning_rate": 1.997603297447649e-05, "loss": 0.0654, "step": 4990 }, { "epoch": 0.07, "learning_rate": 1.9975984934738018e-05, "loss": 0.05, "step": 5000 }, { "epoch": 0.07, "learning_rate": 1.9975936894999547e-05, "loss": 0.0524, "step": 5010 }, { "epoch": 0.07, "learning_rate": 1.9975888855261073e-05, "loss": 0.0544, "step": 5020 }, { "epoch": 0.07, "learning_rate": 1.9975840815522602e-05, "loss": 0.0508, "step": 5030 }, { "epoch": 0.07, "learning_rate": 1.997579277578413e-05, "loss": 0.0563, "step": 5040 }, { "epoch": 0.07, "learning_rate": 1.997574473604566e-05, "loss": 0.0604, "step": 5050 }, { "epoch": 0.07, "learning_rate": 1.9975696696307187e-05, "loss": 0.0568, "step": 5060 }, { "epoch": 0.07, "learning_rate": 1.9975648656568716e-05, "loss": 0.0589, "step": 5070 }, { "epoch": 0.07, "learning_rate": 1.9975600616830245e-05, "loss": 0.0493, "step": 5080 }, { "epoch": 0.07, "learning_rate": 1.997555257709177e-05, "loss": 0.0477, "step": 5090 }, { "epoch": 0.07, "learning_rate": 1.99755045373533e-05, "loss": 0.0531, "step": 5100 }, { "epoch": 0.07, "learning_rate": 1.997545649761483e-05, "loss": 0.0584, "step": 5110 }, { "epoch": 0.07, "learning_rate": 1.997540845787636e-05, "loss": 0.0457, "step": 5120 }, { "epoch": 0.07, "learning_rate": 1.9975360418137885e-05, "loss": 0.0541, "step": 5130 }, { "epoch": 0.07, "learning_rate": 1.9975312378399414e-05, "loss": 0.0469, "step": 5140 }, { "epoch": 0.07, "learning_rate": 1.9975264338660943e-05, "loss": 0.0593, "step": 5150 }, { "epoch": 0.07, "learning_rate": 1.997521629892247e-05, "loss": 0.0527, "step": 5160 }, { "epoch": 0.07, "learning_rate": 1.9975168259184e-05, "loss": 0.0573, "step": 5170 }, { "epoch": 0.07, "learning_rate": 1.9975120219445528e-05, "loss": 0.0562, "step": 5180 }, { "epoch": 0.07, "learning_rate": 1.9975072179707057e-05, "loss": 0.0562, "step": 5190 }, { "epoch": 0.07, "learning_rate": 1.9975024139968583e-05, "loss": 0.0537, "step": 5200 }, { "epoch": 0.08, "learning_rate": 1.9974976100230112e-05, "loss": 0.054, "step": 5210 }, { "epoch": 0.08, "learning_rate": 1.997492806049164e-05, "loss": 0.0531, "step": 5220 }, { "epoch": 0.08, "learning_rate": 1.997488002075317e-05, "loss": 0.0584, "step": 5230 }, { "epoch": 0.08, "learning_rate": 1.9974831981014696e-05, "loss": 0.0542, "step": 5240 }, { "epoch": 0.08, "learning_rate": 1.9974783941276226e-05, "loss": 0.0541, "step": 5250 }, { "epoch": 0.08, "learning_rate": 1.9974735901537755e-05, "loss": 0.0481, "step": 5260 }, { "epoch": 0.08, "learning_rate": 1.997468786179928e-05, "loss": 0.0572, "step": 5270 }, { "epoch": 0.08, "learning_rate": 1.997463982206081e-05, "loss": 0.0489, "step": 5280 }, { "epoch": 0.08, "learning_rate": 1.997459178232234e-05, "loss": 0.0593, "step": 5290 }, { "epoch": 0.08, "learning_rate": 1.997454374258387e-05, "loss": 0.0523, "step": 5300 }, { "epoch": 0.08, "learning_rate": 1.9974495702845395e-05, "loss": 0.0537, "step": 5310 }, { "epoch": 0.08, "learning_rate": 1.9974447663106924e-05, "loss": 0.0496, "step": 5320 }, { "epoch": 0.08, "learning_rate": 1.9974399623368453e-05, "loss": 0.0532, "step": 5330 }, { "epoch": 0.08, "learning_rate": 1.997435158362998e-05, "loss": 0.06, "step": 5340 }, { "epoch": 0.08, "learning_rate": 1.9974303543891508e-05, "loss": 0.0558, "step": 5350 }, { "epoch": 0.08, "learning_rate": 1.9974255504153038e-05, "loss": 0.0551, "step": 5360 }, { "epoch": 0.08, "learning_rate": 1.9974207464414567e-05, "loss": 0.0479, "step": 5370 }, { "epoch": 0.08, "learning_rate": 1.9974159424676093e-05, "loss": 0.0519, "step": 5380 }, { "epoch": 0.08, "learning_rate": 1.9974111384937622e-05, "loss": 0.0583, "step": 5390 }, { "epoch": 0.08, "learning_rate": 1.997406334519915e-05, "loss": 0.0559, "step": 5400 }, { "epoch": 0.08, "learning_rate": 1.997401530546068e-05, "loss": 0.0487, "step": 5410 }, { "epoch": 0.08, "learning_rate": 1.9973967265722206e-05, "loss": 0.0474, "step": 5420 }, { "epoch": 0.08, "learning_rate": 1.9973919225983736e-05, "loss": 0.0575, "step": 5430 }, { "epoch": 0.08, "learning_rate": 1.9973871186245265e-05, "loss": 0.0562, "step": 5440 }, { "epoch": 0.08, "learning_rate": 1.997382314650679e-05, "loss": 0.0477, "step": 5450 }, { "epoch": 0.08, "learning_rate": 1.997377510676832e-05, "loss": 0.0542, "step": 5460 }, { "epoch": 0.08, "learning_rate": 1.997372706702985e-05, "loss": 0.0696, "step": 5470 }, { "epoch": 0.08, "learning_rate": 1.997367902729138e-05, "loss": 0.0496, "step": 5480 }, { "epoch": 0.08, "learning_rate": 1.9973630987552904e-05, "loss": 0.0574, "step": 5490 }, { "epoch": 0.08, "learning_rate": 1.9973582947814434e-05, "loss": 0.0507, "step": 5500 }, { "epoch": 0.08, "learning_rate": 1.9973534908075963e-05, "loss": 0.0557, "step": 5510 }, { "epoch": 0.08, "learning_rate": 1.997348686833749e-05, "loss": 0.0507, "step": 5520 }, { "epoch": 0.08, "learning_rate": 1.9973438828599018e-05, "loss": 0.0516, "step": 5530 }, { "epoch": 0.08, "learning_rate": 1.9973390788860547e-05, "loss": 0.0497, "step": 5540 }, { "epoch": 0.08, "learning_rate": 1.9973342749122077e-05, "loss": 0.056, "step": 5550 }, { "epoch": 0.08, "learning_rate": 1.9973294709383603e-05, "loss": 0.0487, "step": 5560 }, { "epoch": 0.08, "learning_rate": 1.9973246669645132e-05, "loss": 0.0487, "step": 5570 }, { "epoch": 0.08, "learning_rate": 1.997319862990666e-05, "loss": 0.0473, "step": 5580 }, { "epoch": 0.08, "learning_rate": 1.997315059016819e-05, "loss": 0.0504, "step": 5590 }, { "epoch": 0.08, "learning_rate": 1.9973102550429716e-05, "loss": 0.051, "step": 5600 }, { "epoch": 0.08, "learning_rate": 1.9973054510691246e-05, "loss": 0.052, "step": 5610 }, { "epoch": 0.08, "learning_rate": 1.9973006470952775e-05, "loss": 0.0567, "step": 5620 }, { "epoch": 0.08, "learning_rate": 1.99729584312143e-05, "loss": 0.0458, "step": 5630 }, { "epoch": 0.08, "learning_rate": 1.997291039147583e-05, "loss": 0.0565, "step": 5640 }, { "epoch": 0.08, "learning_rate": 1.997286235173736e-05, "loss": 0.0568, "step": 5650 }, { "epoch": 0.08, "learning_rate": 1.997281431199889e-05, "loss": 0.0459, "step": 5660 }, { "epoch": 0.08, "learning_rate": 1.9972766272260414e-05, "loss": 0.0536, "step": 5670 }, { "epoch": 0.08, "learning_rate": 1.9972718232521944e-05, "loss": 0.0568, "step": 5680 }, { "epoch": 0.08, "learning_rate": 1.9972670192783473e-05, "loss": 0.0608, "step": 5690 }, { "epoch": 0.08, "learning_rate": 1.9972622153045e-05, "loss": 0.0505, "step": 5700 }, { "epoch": 0.08, "learning_rate": 1.9972574113306528e-05, "loss": 0.042, "step": 5710 }, { "epoch": 0.08, "learning_rate": 1.9972526073568057e-05, "loss": 0.0417, "step": 5720 }, { "epoch": 0.08, "learning_rate": 1.9972478033829587e-05, "loss": 0.05, "step": 5730 }, { "epoch": 0.08, "learning_rate": 1.9972429994091113e-05, "loss": 0.0432, "step": 5740 }, { "epoch": 0.08, "learning_rate": 1.9972381954352642e-05, "loss": 0.041, "step": 5750 }, { "epoch": 0.08, "learning_rate": 1.997233391461417e-05, "loss": 0.0657, "step": 5760 }, { "epoch": 0.08, "learning_rate": 1.99722858748757e-05, "loss": 0.0502, "step": 5770 }, { "epoch": 0.08, "learning_rate": 1.9972237835137226e-05, "loss": 0.0515, "step": 5780 }, { "epoch": 0.08, "learning_rate": 1.9972189795398755e-05, "loss": 0.0487, "step": 5790 }, { "epoch": 0.08, "learning_rate": 1.9972141755660285e-05, "loss": 0.0561, "step": 5800 }, { "epoch": 0.08, "learning_rate": 1.997209371592181e-05, "loss": 0.046, "step": 5810 }, { "epoch": 0.08, "learning_rate": 1.997204567618334e-05, "loss": 0.0466, "step": 5820 }, { "epoch": 0.08, "learning_rate": 1.997199763644487e-05, "loss": 0.0511, "step": 5830 }, { "epoch": 0.08, "learning_rate": 1.99719495967064e-05, "loss": 0.0585, "step": 5840 }, { "epoch": 0.08, "learning_rate": 1.9971901556967924e-05, "loss": 0.0512, "step": 5850 }, { "epoch": 0.08, "learning_rate": 1.9971853517229454e-05, "loss": 0.0563, "step": 5860 }, { "epoch": 0.08, "learning_rate": 1.9971805477490983e-05, "loss": 0.0491, "step": 5870 }, { "epoch": 0.08, "learning_rate": 1.997175743775251e-05, "loss": 0.0507, "step": 5880 }, { "epoch": 0.08, "learning_rate": 1.9971709398014038e-05, "loss": 0.0406, "step": 5890 }, { "epoch": 0.09, "learning_rate": 1.9971661358275567e-05, "loss": 0.0632, "step": 5900 }, { "epoch": 0.09, "learning_rate": 1.9971613318537097e-05, "loss": 0.0485, "step": 5910 }, { "epoch": 0.09, "learning_rate": 1.9971565278798622e-05, "loss": 0.0404, "step": 5920 }, { "epoch": 0.09, "learning_rate": 1.9971517239060152e-05, "loss": 0.0485, "step": 5930 }, { "epoch": 0.09, "learning_rate": 1.997146919932168e-05, "loss": 0.0594, "step": 5940 }, { "epoch": 0.09, "learning_rate": 1.997142115958321e-05, "loss": 0.0534, "step": 5950 }, { "epoch": 0.09, "learning_rate": 1.9971373119844736e-05, "loss": 0.0448, "step": 5960 }, { "epoch": 0.09, "learning_rate": 1.9971325080106265e-05, "loss": 0.0442, "step": 5970 }, { "epoch": 0.09, "learning_rate": 1.9971277040367795e-05, "loss": 0.0471, "step": 5980 }, { "epoch": 0.09, "learning_rate": 1.997122900062932e-05, "loss": 0.0494, "step": 5990 }, { "epoch": 0.09, "learning_rate": 1.997118096089085e-05, "loss": 0.0588, "step": 6000 }, { "epoch": 0.09, "learning_rate": 1.997113292115238e-05, "loss": 0.0425, "step": 6010 }, { "epoch": 0.09, "learning_rate": 1.997108488141391e-05, "loss": 0.0469, "step": 6020 }, { "epoch": 0.09, "learning_rate": 1.9971036841675434e-05, "loss": 0.0537, "step": 6030 }, { "epoch": 0.09, "learning_rate": 1.9970988801936964e-05, "loss": 0.0436, "step": 6040 }, { "epoch": 0.09, "learning_rate": 1.9970940762198493e-05, "loss": 0.0605, "step": 6050 }, { "epoch": 0.09, "learning_rate": 1.997089272246002e-05, "loss": 0.0514, "step": 6060 }, { "epoch": 0.09, "learning_rate": 1.9970844682721548e-05, "loss": 0.047, "step": 6070 }, { "epoch": 0.09, "learning_rate": 1.9970796642983077e-05, "loss": 0.0664, "step": 6080 }, { "epoch": 0.09, "learning_rate": 1.9970748603244606e-05, "loss": 0.0542, "step": 6090 }, { "epoch": 0.09, "learning_rate": 1.9970700563506132e-05, "loss": 0.0481, "step": 6100 }, { "epoch": 0.09, "learning_rate": 1.997065252376766e-05, "loss": 0.0444, "step": 6110 }, { "epoch": 0.09, "learning_rate": 1.997060448402919e-05, "loss": 0.0446, "step": 6120 }, { "epoch": 0.09, "learning_rate": 1.997055644429072e-05, "loss": 0.0471, "step": 6130 }, { "epoch": 0.09, "learning_rate": 1.9970508404552246e-05, "loss": 0.0514, "step": 6140 }, { "epoch": 0.09, "learning_rate": 1.9970460364813775e-05, "loss": 0.0555, "step": 6150 }, { "epoch": 0.09, "learning_rate": 1.9970412325075305e-05, "loss": 0.0489, "step": 6160 }, { "epoch": 0.09, "learning_rate": 1.997036428533683e-05, "loss": 0.0492, "step": 6170 }, { "epoch": 0.09, "learning_rate": 1.997031624559836e-05, "loss": 0.0506, "step": 6180 }, { "epoch": 0.09, "learning_rate": 1.997026820585989e-05, "loss": 0.0496, "step": 6190 }, { "epoch": 0.09, "learning_rate": 1.9970220166121418e-05, "loss": 0.0425, "step": 6200 }, { "epoch": 0.09, "learning_rate": 1.9970172126382944e-05, "loss": 0.053, "step": 6210 }, { "epoch": 0.09, "learning_rate": 1.9970124086644473e-05, "loss": 0.051, "step": 6220 }, { "epoch": 0.09, "learning_rate": 1.9970076046906003e-05, "loss": 0.05, "step": 6230 }, { "epoch": 0.09, "learning_rate": 1.997002800716753e-05, "loss": 0.0429, "step": 6240 }, { "epoch": 0.09, "learning_rate": 1.9969979967429058e-05, "loss": 0.0474, "step": 6250 }, { "epoch": 0.09, "learning_rate": 1.9969931927690587e-05, "loss": 0.044, "step": 6260 }, { "epoch": 0.09, "learning_rate": 1.9969883887952116e-05, "loss": 0.0501, "step": 6270 }, { "epoch": 0.09, "learning_rate": 1.9969835848213642e-05, "loss": 0.0462, "step": 6280 }, { "epoch": 0.09, "learning_rate": 1.996979261244902e-05, "loss": 0.0448, "step": 6290 }, { "epoch": 0.09, "learning_rate": 1.9969744572710546e-05, "loss": 0.0505, "step": 6300 }, { "epoch": 0.09, "learning_rate": 1.9969696532972075e-05, "loss": 0.0444, "step": 6310 }, { "epoch": 0.09, "learning_rate": 1.9969648493233605e-05, "loss": 0.0462, "step": 6320 }, { "epoch": 0.09, "learning_rate": 1.9969600453495134e-05, "loss": 0.0447, "step": 6330 }, { "epoch": 0.09, "learning_rate": 1.996955241375666e-05, "loss": 0.044, "step": 6340 }, { "epoch": 0.09, "learning_rate": 1.996950437401819e-05, "loss": 0.0509, "step": 6350 }, { "epoch": 0.09, "learning_rate": 1.996945633427972e-05, "loss": 0.0543, "step": 6360 }, { "epoch": 0.09, "learning_rate": 1.9969408294541244e-05, "loss": 0.051, "step": 6370 }, { "epoch": 0.09, "learning_rate": 1.9969360254802774e-05, "loss": 0.0424, "step": 6380 }, { "epoch": 0.09, "learning_rate": 1.9969312215064303e-05, "loss": 0.041, "step": 6390 }, { "epoch": 0.09, "learning_rate": 1.9969264175325832e-05, "loss": 0.0449, "step": 6400 }, { "epoch": 0.09, "learning_rate": 1.9969216135587358e-05, "loss": 0.0462, "step": 6410 }, { "epoch": 0.09, "learning_rate": 1.9969168095848887e-05, "loss": 0.0427, "step": 6420 }, { "epoch": 0.09, "learning_rate": 1.9969120056110417e-05, "loss": 0.0518, "step": 6430 }, { "epoch": 0.09, "learning_rate": 1.9969072016371946e-05, "loss": 0.0437, "step": 6440 }, { "epoch": 0.09, "learning_rate": 1.996902397663347e-05, "loss": 0.0428, "step": 6450 }, { "epoch": 0.09, "learning_rate": 1.9968975936895e-05, "loss": 0.0564, "step": 6460 }, { "epoch": 0.09, "learning_rate": 1.996892789715653e-05, "loss": 0.0461, "step": 6470 }, { "epoch": 0.09, "learning_rate": 1.9968879857418056e-05, "loss": 0.0488, "step": 6480 }, { "epoch": 0.09, "learning_rate": 1.9968831817679585e-05, "loss": 0.0444, "step": 6490 }, { "epoch": 0.09, "learning_rate": 1.9968783777941115e-05, "loss": 0.0509, "step": 6500 }, { "epoch": 0.09, "learning_rate": 1.9968735738202644e-05, "loss": 0.0517, "step": 6510 }, { "epoch": 0.09, "learning_rate": 1.996868769846417e-05, "loss": 0.0446, "step": 6520 }, { "epoch": 0.09, "learning_rate": 1.99686396587257e-05, "loss": 0.0414, "step": 6530 }, { "epoch": 0.09, "learning_rate": 1.996859161898723e-05, "loss": 0.0485, "step": 6540 }, { "epoch": 0.09, "learning_rate": 1.9968543579248754e-05, "loss": 0.0524, "step": 6550 }, { "epoch": 0.09, "learning_rate": 1.9968495539510283e-05, "loss": 0.0501, "step": 6560 }, { "epoch": 0.09, "learning_rate": 1.9968447499771813e-05, "loss": 0.0487, "step": 6570 }, { "epoch": 0.09, "learning_rate": 1.9968399460033342e-05, "loss": 0.0457, "step": 6580 }, { "epoch": 0.09, "learning_rate": 1.9968351420294868e-05, "loss": 0.0546, "step": 6590 }, { "epoch": 0.1, "learning_rate": 1.9968303380556397e-05, "loss": 0.0521, "step": 6600 }, { "epoch": 0.1, "learning_rate": 1.9968255340817926e-05, "loss": 0.0442, "step": 6610 }, { "epoch": 0.1, "learning_rate": 1.9968207301079456e-05, "loss": 0.0516, "step": 6620 }, { "epoch": 0.1, "learning_rate": 1.996815926134098e-05, "loss": 0.0448, "step": 6630 }, { "epoch": 0.1, "learning_rate": 1.996811122160251e-05, "loss": 0.0498, "step": 6640 }, { "epoch": 0.1, "learning_rate": 1.996806318186404e-05, "loss": 0.0415, "step": 6650 }, { "epoch": 0.1, "learning_rate": 1.9968015142125566e-05, "loss": 0.0555, "step": 6660 }, { "epoch": 0.1, "learning_rate": 1.9967967102387095e-05, "loss": 0.0499, "step": 6670 }, { "epoch": 0.1, "learning_rate": 1.9967919062648625e-05, "loss": 0.0481, "step": 6680 }, { "epoch": 0.1, "learning_rate": 1.9967871022910154e-05, "loss": 0.0443, "step": 6690 }, { "epoch": 0.1, "learning_rate": 1.996782298317168e-05, "loss": 0.0433, "step": 6700 }, { "epoch": 0.1, "learning_rate": 1.996777494343321e-05, "loss": 0.0612, "step": 6710 }, { "epoch": 0.1, "learning_rate": 1.9967726903694738e-05, "loss": 0.051, "step": 6720 }, { "epoch": 0.1, "learning_rate": 1.9967678863956264e-05, "loss": 0.0422, "step": 6730 }, { "epoch": 0.1, "learning_rate": 1.9967630824217793e-05, "loss": 0.0419, "step": 6740 }, { "epoch": 0.1, "learning_rate": 1.9967582784479323e-05, "loss": 0.0437, "step": 6750 }, { "epoch": 0.1, "learning_rate": 1.9967534744740852e-05, "loss": 0.0589, "step": 6760 }, { "epoch": 0.1, "learning_rate": 1.9967486705002378e-05, "loss": 0.0416, "step": 6770 }, { "epoch": 0.1, "learning_rate": 1.9967438665263907e-05, "loss": 0.0452, "step": 6780 }, { "epoch": 0.1, "learning_rate": 1.9967390625525436e-05, "loss": 0.0441, "step": 6790 }, { "epoch": 0.1, "learning_rate": 1.9967342585786966e-05, "loss": 0.0534, "step": 6800 }, { "epoch": 0.1, "learning_rate": 1.996729454604849e-05, "loss": 0.0483, "step": 6810 }, { "epoch": 0.1, "learning_rate": 1.996724650631002e-05, "loss": 0.0471, "step": 6820 }, { "epoch": 0.1, "learning_rate": 1.996719846657155e-05, "loss": 0.045, "step": 6830 }, { "epoch": 0.1, "learning_rate": 1.9967150426833076e-05, "loss": 0.0399, "step": 6840 }, { "epoch": 0.1, "learning_rate": 1.9967102387094605e-05, "loss": 0.044, "step": 6850 }, { "epoch": 0.1, "learning_rate": 1.9967054347356134e-05, "loss": 0.0435, "step": 6860 }, { "epoch": 0.1, "learning_rate": 1.9967006307617664e-05, "loss": 0.0397, "step": 6870 }, { "epoch": 0.1, "learning_rate": 1.996695826787919e-05, "loss": 0.045, "step": 6880 }, { "epoch": 0.1, "learning_rate": 1.996691022814072e-05, "loss": 0.0432, "step": 6890 }, { "epoch": 0.1, "learning_rate": 1.9966862188402248e-05, "loss": 0.0482, "step": 6900 }, { "epoch": 0.1, "learning_rate": 1.9966814148663774e-05, "loss": 0.0412, "step": 6910 }, { "epoch": 0.1, "learning_rate": 1.9966766108925303e-05, "loss": 0.0557, "step": 6920 }, { "epoch": 0.1, "learning_rate": 1.9966718069186833e-05, "loss": 0.0487, "step": 6930 }, { "epoch": 0.1, "learning_rate": 1.9966670029448362e-05, "loss": 0.0367, "step": 6940 }, { "epoch": 0.1, "learning_rate": 1.9966621989709888e-05, "loss": 0.0468, "step": 6950 }, { "epoch": 0.1, "learning_rate": 1.9966573949971417e-05, "loss": 0.0492, "step": 6960 }, { "epoch": 0.1, "learning_rate": 1.9966525910232946e-05, "loss": 0.0416, "step": 6970 }, { "epoch": 0.1, "learning_rate": 1.9966477870494476e-05, "loss": 0.049, "step": 6980 }, { "epoch": 0.1, "learning_rate": 1.9966429830756e-05, "loss": 0.0469, "step": 6990 }, { "epoch": 0.1, "learning_rate": 1.996638179101753e-05, "loss": 0.0433, "step": 7000 }, { "epoch": 0.1, "learning_rate": 1.996633375127906e-05, "loss": 0.0456, "step": 7010 }, { "epoch": 0.1, "learning_rate": 1.9966285711540586e-05, "loss": 0.045, "step": 7020 }, { "epoch": 0.1, "learning_rate": 1.9966237671802115e-05, "loss": 0.0491, "step": 7030 }, { "epoch": 0.1, "learning_rate": 1.9966189632063644e-05, "loss": 0.0439, "step": 7040 }, { "epoch": 0.1, "learning_rate": 1.9966141592325174e-05, "loss": 0.0424, "step": 7050 }, { "epoch": 0.1, "learning_rate": 1.99660935525867e-05, "loss": 0.0514, "step": 7060 }, { "epoch": 0.1, "learning_rate": 1.996604551284823e-05, "loss": 0.0394, "step": 7070 }, { "epoch": 0.1, "learning_rate": 1.9965997473109758e-05, "loss": 0.0393, "step": 7080 }, { "epoch": 0.1, "learning_rate": 1.9965949433371284e-05, "loss": 0.0475, "step": 7090 }, { "epoch": 0.1, "learning_rate": 1.9965901393632813e-05, "loss": 0.0492, "step": 7100 }, { "epoch": 0.1, "learning_rate": 1.9965853353894343e-05, "loss": 0.0449, "step": 7110 }, { "epoch": 0.1, "learning_rate": 1.9965805314155872e-05, "loss": 0.0393, "step": 7120 }, { "epoch": 0.1, "learning_rate": 1.9965757274417398e-05, "loss": 0.0469, "step": 7130 }, { "epoch": 0.1, "learning_rate": 1.9965709234678927e-05, "loss": 0.0465, "step": 7140 }, { "epoch": 0.1, "learning_rate": 1.9965661194940456e-05, "loss": 0.0542, "step": 7150 }, { "epoch": 0.1, "learning_rate": 1.9965613155201985e-05, "loss": 0.0456, "step": 7160 }, { "epoch": 0.1, "learning_rate": 1.996556511546351e-05, "loss": 0.0498, "step": 7170 }, { "epoch": 0.1, "learning_rate": 1.996551707572504e-05, "loss": 0.0513, "step": 7180 }, { "epoch": 0.1, "learning_rate": 1.996546903598657e-05, "loss": 0.043, "step": 7190 }, { "epoch": 0.1, "learning_rate": 1.9965420996248096e-05, "loss": 0.0432, "step": 7200 }, { "epoch": 0.1, "learning_rate": 1.9965372956509625e-05, "loss": 0.0541, "step": 7210 }, { "epoch": 0.1, "learning_rate": 1.9965324916771154e-05, "loss": 0.0506, "step": 7220 }, { "epoch": 0.1, "learning_rate": 1.9965276877032684e-05, "loss": 0.0481, "step": 7230 }, { "epoch": 0.1, "learning_rate": 1.996522883729421e-05, "loss": 0.0442, "step": 7240 }, { "epoch": 0.1, "learning_rate": 1.996518079755574e-05, "loss": 0.0476, "step": 7250 }, { "epoch": 0.1, "learning_rate": 1.9965132757817268e-05, "loss": 0.0409, "step": 7260 }, { "epoch": 0.1, "learning_rate": 1.9965084718078794e-05, "loss": 0.044, "step": 7270 }, { "epoch": 0.1, "learning_rate": 1.9965036678340323e-05, "loss": 0.0565, "step": 7280 }, { "epoch": 0.11, "learning_rate": 1.9964988638601852e-05, "loss": 0.0496, "step": 7290 }, { "epoch": 0.11, "learning_rate": 1.996494059886338e-05, "loss": 0.051, "step": 7300 }, { "epoch": 0.11, "learning_rate": 1.9964892559124908e-05, "loss": 0.0415, "step": 7310 }, { "epoch": 0.11, "learning_rate": 1.9964844519386437e-05, "loss": 0.0451, "step": 7320 }, { "epoch": 0.11, "learning_rate": 1.9964796479647966e-05, "loss": 0.0418, "step": 7330 }, { "epoch": 0.11, "learning_rate": 1.9964748439909495e-05, "loss": 0.0414, "step": 7340 }, { "epoch": 0.11, "learning_rate": 1.996470040017102e-05, "loss": 0.0397, "step": 7350 }, { "epoch": 0.11, "learning_rate": 1.996465236043255e-05, "loss": 0.0422, "step": 7360 }, { "epoch": 0.11, "learning_rate": 1.996460432069408e-05, "loss": 0.0431, "step": 7370 }, { "epoch": 0.11, "learning_rate": 1.9964556280955606e-05, "loss": 0.0442, "step": 7380 }, { "epoch": 0.11, "learning_rate": 1.9964508241217135e-05, "loss": 0.0445, "step": 7390 }, { "epoch": 0.11, "learning_rate": 1.9964460201478664e-05, "loss": 0.0502, "step": 7400 }, { "epoch": 0.11, "learning_rate": 1.9964412161740193e-05, "loss": 0.0482, "step": 7410 }, { "epoch": 0.11, "learning_rate": 1.996436412200172e-05, "loss": 0.0429, "step": 7420 }, { "epoch": 0.11, "learning_rate": 1.996431608226325e-05, "loss": 0.0532, "step": 7430 }, { "epoch": 0.11, "learning_rate": 1.9964268042524778e-05, "loss": 0.0401, "step": 7440 }, { "epoch": 0.11, "learning_rate": 1.9964220002786307e-05, "loss": 0.0354, "step": 7450 }, { "epoch": 0.11, "learning_rate": 1.9964171963047836e-05, "loss": 0.038, "step": 7460 }, { "epoch": 0.11, "learning_rate": 1.9964123923309366e-05, "loss": 0.0425, "step": 7470 }, { "epoch": 0.11, "learning_rate": 1.996407588357089e-05, "loss": 0.054, "step": 7480 }, { "epoch": 0.11, "learning_rate": 1.996402784383242e-05, "loss": 0.0407, "step": 7490 }, { "epoch": 0.11, "learning_rate": 1.996397980409395e-05, "loss": 0.0421, "step": 7500 }, { "epoch": 0.11, "learning_rate": 1.9963931764355476e-05, "loss": 0.0517, "step": 7510 }, { "epoch": 0.11, "learning_rate": 1.9963883724617005e-05, "loss": 0.0491, "step": 7520 }, { "epoch": 0.11, "learning_rate": 1.9963835684878535e-05, "loss": 0.0425, "step": 7530 }, { "epoch": 0.11, "learning_rate": 1.9963787645140064e-05, "loss": 0.0374, "step": 7540 }, { "epoch": 0.11, "learning_rate": 1.996373960540159e-05, "loss": 0.0467, "step": 7550 }, { "epoch": 0.11, "learning_rate": 1.996369156566312e-05, "loss": 0.0467, "step": 7560 }, { "epoch": 0.11, "learning_rate": 1.9963643525924648e-05, "loss": 0.0496, "step": 7570 }, { "epoch": 0.11, "learning_rate": 1.9963595486186174e-05, "loss": 0.0522, "step": 7580 }, { "epoch": 0.11, "learning_rate": 1.9963547446447703e-05, "loss": 0.0439, "step": 7590 }, { "epoch": 0.11, "learning_rate": 1.9963499406709233e-05, "loss": 0.0417, "step": 7600 }, { "epoch": 0.11, "learning_rate": 1.9963451366970762e-05, "loss": 0.0456, "step": 7610 }, { "epoch": 0.11, "learning_rate": 1.9963403327232288e-05, "loss": 0.0461, "step": 7620 }, { "epoch": 0.11, "learning_rate": 1.9963355287493817e-05, "loss": 0.0454, "step": 7630 }, { "epoch": 0.11, "learning_rate": 1.9963307247755346e-05, "loss": 0.0557, "step": 7640 }, { "epoch": 0.11, "learning_rate": 1.9963259208016876e-05, "loss": 0.0447, "step": 7650 }, { "epoch": 0.11, "learning_rate": 1.99632111682784e-05, "loss": 0.0451, "step": 7660 }, { "epoch": 0.11, "learning_rate": 1.996316312853993e-05, "loss": 0.0338, "step": 7670 }, { "epoch": 0.11, "learning_rate": 1.996311508880146e-05, "loss": 0.0426, "step": 7680 }, { "epoch": 0.11, "learning_rate": 1.9963067049062986e-05, "loss": 0.0508, "step": 7690 }, { "epoch": 0.11, "learning_rate": 1.9963019009324515e-05, "loss": 0.0413, "step": 7700 }, { "epoch": 0.11, "learning_rate": 1.9962970969586044e-05, "loss": 0.0433, "step": 7710 }, { "epoch": 0.11, "learning_rate": 1.9962922929847574e-05, "loss": 0.048, "step": 7720 }, { "epoch": 0.11, "learning_rate": 1.99628748901091e-05, "loss": 0.0504, "step": 7730 }, { "epoch": 0.11, "learning_rate": 1.996282685037063e-05, "loss": 0.0401, "step": 7740 }, { "epoch": 0.11, "learning_rate": 1.9962778810632158e-05, "loss": 0.0398, "step": 7750 }, { "epoch": 0.11, "learning_rate": 1.9962730770893684e-05, "loss": 0.0437, "step": 7760 }, { "epoch": 0.11, "learning_rate": 1.9962682731155213e-05, "loss": 0.0541, "step": 7770 }, { "epoch": 0.11, "learning_rate": 1.9962634691416743e-05, "loss": 0.0475, "step": 7780 }, { "epoch": 0.11, "learning_rate": 1.9962586651678272e-05, "loss": 0.046, "step": 7790 }, { "epoch": 0.11, "learning_rate": 1.9962538611939798e-05, "loss": 0.0426, "step": 7800 }, { "epoch": 0.11, "learning_rate": 1.9962490572201327e-05, "loss": 0.0422, "step": 7810 }, { "epoch": 0.11, "learning_rate": 1.9962442532462856e-05, "loss": 0.0392, "step": 7820 }, { "epoch": 0.11, "learning_rate": 1.9962394492724386e-05, "loss": 0.0428, "step": 7830 }, { "epoch": 0.11, "learning_rate": 1.996234645298591e-05, "loss": 0.0395, "step": 7840 }, { "epoch": 0.11, "learning_rate": 1.996229841324744e-05, "loss": 0.055, "step": 7850 }, { "epoch": 0.11, "learning_rate": 1.996225037350897e-05, "loss": 0.0427, "step": 7860 }, { "epoch": 0.11, "learning_rate": 1.9962202333770496e-05, "loss": 0.044, "step": 7870 }, { "epoch": 0.11, "learning_rate": 1.9962154294032025e-05, "loss": 0.0369, "step": 7880 }, { "epoch": 0.11, "learning_rate": 1.9962106254293554e-05, "loss": 0.0486, "step": 7890 }, { "epoch": 0.11, "learning_rate": 1.9962058214555084e-05, "loss": 0.0445, "step": 7900 }, { "epoch": 0.11, "learning_rate": 1.996201017481661e-05, "loss": 0.0426, "step": 7910 }, { "epoch": 0.11, "learning_rate": 1.996196213507814e-05, "loss": 0.0466, "step": 7920 }, { "epoch": 0.11, "learning_rate": 1.9961914095339668e-05, "loss": 0.0526, "step": 7930 }, { "epoch": 0.11, "learning_rate": 1.9961866055601194e-05, "loss": 0.0444, "step": 7940 }, { "epoch": 0.11, "learning_rate": 1.9961818015862723e-05, "loss": 0.0438, "step": 7950 }, { "epoch": 0.11, "learning_rate": 1.9961769976124253e-05, "loss": 0.0434, "step": 7960 }, { "epoch": 0.11, "learning_rate": 1.9961721936385782e-05, "loss": 0.0478, "step": 7970 }, { "epoch": 0.12, "learning_rate": 1.9961673896647308e-05, "loss": 0.0366, "step": 7980 }, { "epoch": 0.12, "learning_rate": 1.9961625856908837e-05, "loss": 0.043, "step": 7990 }, { "epoch": 0.12, "learning_rate": 1.9961577817170366e-05, "loss": 0.0416, "step": 8000 }, { "epoch": 0.12, "learning_rate": 1.9961529777431895e-05, "loss": 0.0388, "step": 8010 }, { "epoch": 0.12, "learning_rate": 1.996148173769342e-05, "loss": 0.0423, "step": 8020 }, { "epoch": 0.12, "learning_rate": 1.996143369795495e-05, "loss": 0.0425, "step": 8030 }, { "epoch": 0.12, "learning_rate": 1.996138565821648e-05, "loss": 0.0483, "step": 8040 }, { "epoch": 0.12, "learning_rate": 1.9961337618478006e-05, "loss": 0.0497, "step": 8050 }, { "epoch": 0.12, "learning_rate": 1.9961289578739535e-05, "loss": 0.0394, "step": 8060 }, { "epoch": 0.12, "learning_rate": 1.9961241539001064e-05, "loss": 0.0461, "step": 8070 }, { "epoch": 0.12, "learning_rate": 1.9961193499262594e-05, "loss": 0.0401, "step": 8080 }, { "epoch": 0.12, "learning_rate": 1.996114545952412e-05, "loss": 0.0447, "step": 8090 }, { "epoch": 0.12, "learning_rate": 1.996109741978565e-05, "loss": 0.0402, "step": 8100 }, { "epoch": 0.12, "learning_rate": 1.9961049380047178e-05, "loss": 0.0508, "step": 8110 }, { "epoch": 0.12, "learning_rate": 1.9961001340308704e-05, "loss": 0.0549, "step": 8120 }, { "epoch": 0.12, "learning_rate": 1.9960953300570233e-05, "loss": 0.0408, "step": 8130 }, { "epoch": 0.12, "learning_rate": 1.9960905260831762e-05, "loss": 0.0425, "step": 8140 }, { "epoch": 0.12, "learning_rate": 1.996085722109329e-05, "loss": 0.0511, "step": 8150 }, { "epoch": 0.12, "learning_rate": 1.9960809181354818e-05, "loss": 0.0448, "step": 8160 }, { "epoch": 0.12, "learning_rate": 1.9960761141616347e-05, "loss": 0.0363, "step": 8170 }, { "epoch": 0.12, "learning_rate": 1.9960713101877876e-05, "loss": 0.0381, "step": 8180 }, { "epoch": 0.12, "learning_rate": 1.9960665062139405e-05, "loss": 0.0415, "step": 8190 }, { "epoch": 0.12, "learning_rate": 1.996061702240093e-05, "loss": 0.0524, "step": 8200 }, { "epoch": 0.12, "learning_rate": 1.996056898266246e-05, "loss": 0.0385, "step": 8210 }, { "epoch": 0.12, "learning_rate": 1.996052094292399e-05, "loss": 0.0407, "step": 8220 }, { "epoch": 0.12, "learning_rate": 1.9960472903185516e-05, "loss": 0.0479, "step": 8230 }, { "epoch": 0.12, "learning_rate": 1.9960424863447045e-05, "loss": 0.0437, "step": 8240 }, { "epoch": 0.12, "learning_rate": 1.9960376823708574e-05, "loss": 0.0442, "step": 8250 }, { "epoch": 0.12, "learning_rate": 1.9960328783970103e-05, "loss": 0.0432, "step": 8260 }, { "epoch": 0.12, "learning_rate": 1.996028074423163e-05, "loss": 0.0479, "step": 8270 }, { "epoch": 0.12, "learning_rate": 1.996023270449316e-05, "loss": 0.0445, "step": 8280 }, { "epoch": 0.12, "learning_rate": 1.9960184664754688e-05, "loss": 0.0353, "step": 8290 }, { "epoch": 0.12, "learning_rate": 1.9960136625016214e-05, "loss": 0.0427, "step": 8300 }, { "epoch": 0.12, "learning_rate": 1.9960088585277743e-05, "loss": 0.045, "step": 8310 }, { "epoch": 0.12, "learning_rate": 1.9960040545539272e-05, "loss": 0.0514, "step": 8320 }, { "epoch": 0.12, "learning_rate": 1.99599925058008e-05, "loss": 0.0409, "step": 8330 }, { "epoch": 0.12, "learning_rate": 1.9959944466062327e-05, "loss": 0.0408, "step": 8340 }, { "epoch": 0.12, "learning_rate": 1.9959896426323857e-05, "loss": 0.0421, "step": 8350 }, { "epoch": 0.12, "learning_rate": 1.9959848386585386e-05, "loss": 0.0452, "step": 8360 }, { "epoch": 0.12, "learning_rate": 1.9959800346846915e-05, "loss": 0.0477, "step": 8370 }, { "epoch": 0.12, "learning_rate": 1.995975230710844e-05, "loss": 0.0444, "step": 8380 }, { "epoch": 0.12, "learning_rate": 1.995970426736997e-05, "loss": 0.0442, "step": 8390 }, { "epoch": 0.12, "learning_rate": 1.99596562276315e-05, "loss": 0.0408, "step": 8400 }, { "epoch": 0.12, "learning_rate": 1.9959608187893026e-05, "loss": 0.0459, "step": 8410 }, { "epoch": 0.12, "learning_rate": 1.9959560148154555e-05, "loss": 0.0411, "step": 8420 }, { "epoch": 0.12, "learning_rate": 1.9959512108416084e-05, "loss": 0.0498, "step": 8430 }, { "epoch": 0.12, "learning_rate": 1.9959464068677613e-05, "loss": 0.039, "step": 8440 }, { "epoch": 0.12, "learning_rate": 1.995941602893914e-05, "loss": 0.0347, "step": 8450 }, { "epoch": 0.12, "learning_rate": 1.995936798920067e-05, "loss": 0.0432, "step": 8460 }, { "epoch": 0.12, "learning_rate": 1.9959319949462198e-05, "loss": 0.046, "step": 8470 }, { "epoch": 0.12, "learning_rate": 1.9959271909723724e-05, "loss": 0.0435, "step": 8480 }, { "epoch": 0.12, "learning_rate": 1.9959223869985253e-05, "loss": 0.0349, "step": 8490 }, { "epoch": 0.12, "learning_rate": 1.9959175830246782e-05, "loss": 0.0446, "step": 8500 }, { "epoch": 0.12, "learning_rate": 1.995912779050831e-05, "loss": 0.0397, "step": 8510 }, { "epoch": 0.12, "learning_rate": 1.9959079750769837e-05, "loss": 0.0368, "step": 8520 }, { "epoch": 0.12, "learning_rate": 1.9959031711031367e-05, "loss": 0.0359, "step": 8530 }, { "epoch": 0.12, "learning_rate": 1.9958983671292896e-05, "loss": 0.0403, "step": 8540 }, { "epoch": 0.12, "learning_rate": 1.9958935631554425e-05, "loss": 0.0395, "step": 8550 }, { "epoch": 0.12, "learning_rate": 1.995888759181595e-05, "loss": 0.0476, "step": 8560 }, { "epoch": 0.12, "learning_rate": 1.995883955207748e-05, "loss": 0.043, "step": 8570 }, { "epoch": 0.12, "learning_rate": 1.995879151233901e-05, "loss": 0.0383, "step": 8580 }, { "epoch": 0.12, "learning_rate": 1.9958743472600536e-05, "loss": 0.0438, "step": 8590 }, { "epoch": 0.12, "learning_rate": 1.9958695432862065e-05, "loss": 0.0433, "step": 8600 }, { "epoch": 0.12, "learning_rate": 1.9958647393123594e-05, "loss": 0.0385, "step": 8610 }, { "epoch": 0.12, "learning_rate": 1.9958599353385123e-05, "loss": 0.0391, "step": 8620 }, { "epoch": 0.12, "learning_rate": 1.995855131364665e-05, "loss": 0.0447, "step": 8630 }, { "epoch": 0.12, "learning_rate": 1.995850327390818e-05, "loss": 0.0401, "step": 8640 }, { "epoch": 0.12, "learning_rate": 1.9958455234169708e-05, "loss": 0.0377, "step": 8650 }, { "epoch": 0.12, "learning_rate": 1.9958407194431234e-05, "loss": 0.0411, "step": 8660 }, { "epoch": 0.12, "learning_rate": 1.9958359154692763e-05, "loss": 0.0423, "step": 8670 }, { "epoch": 0.13, "learning_rate": 1.9958311114954292e-05, "loss": 0.0352, "step": 8680 }, { "epoch": 0.13, "learning_rate": 1.995826307521582e-05, "loss": 0.0338, "step": 8690 }, { "epoch": 0.13, "learning_rate": 1.9958215035477347e-05, "loss": 0.0465, "step": 8700 }, { "epoch": 0.13, "learning_rate": 1.9958166995738877e-05, "loss": 0.0409, "step": 8710 }, { "epoch": 0.13, "learning_rate": 1.9958118956000406e-05, "loss": 0.0457, "step": 8720 }, { "epoch": 0.13, "learning_rate": 1.9958070916261935e-05, "loss": 0.0362, "step": 8730 }, { "epoch": 0.13, "learning_rate": 1.995802287652346e-05, "loss": 0.0379, "step": 8740 }, { "epoch": 0.13, "learning_rate": 1.995797483678499e-05, "loss": 0.0332, "step": 8750 }, { "epoch": 0.13, "learning_rate": 1.995792679704652e-05, "loss": 0.0459, "step": 8760 }, { "epoch": 0.13, "learning_rate": 1.9957878757308045e-05, "loss": 0.0331, "step": 8770 }, { "epoch": 0.13, "learning_rate": 1.9957830717569575e-05, "loss": 0.0431, "step": 8780 }, { "epoch": 0.13, "learning_rate": 1.9957782677831104e-05, "loss": 0.038, "step": 8790 }, { "epoch": 0.13, "learning_rate": 1.9957734638092633e-05, "loss": 0.0493, "step": 8800 }, { "epoch": 0.13, "learning_rate": 1.995768659835416e-05, "loss": 0.0391, "step": 8810 }, { "epoch": 0.13, "learning_rate": 1.995763855861569e-05, "loss": 0.038, "step": 8820 }, { "epoch": 0.13, "learning_rate": 1.9957590518877218e-05, "loss": 0.0407, "step": 8830 }, { "epoch": 0.13, "learning_rate": 1.9957542479138744e-05, "loss": 0.0413, "step": 8840 }, { "epoch": 0.13, "learning_rate": 1.9957494439400273e-05, "loss": 0.0458, "step": 8850 }, { "epoch": 0.13, "learning_rate": 1.9957446399661802e-05, "loss": 0.0401, "step": 8860 }, { "epoch": 0.13, "learning_rate": 1.995739835992333e-05, "loss": 0.045, "step": 8870 }, { "epoch": 0.13, "learning_rate": 1.9957350320184857e-05, "loss": 0.0501, "step": 8880 }, { "epoch": 0.13, "learning_rate": 1.9957302280446386e-05, "loss": 0.0392, "step": 8890 }, { "epoch": 0.13, "learning_rate": 1.9957254240707916e-05, "loss": 0.0405, "step": 8900 }, { "epoch": 0.13, "learning_rate": 1.9957206200969445e-05, "loss": 0.0369, "step": 8910 }, { "epoch": 0.13, "learning_rate": 1.995715816123097e-05, "loss": 0.0368, "step": 8920 }, { "epoch": 0.13, "learning_rate": 1.99571101214925e-05, "loss": 0.0409, "step": 8930 }, { "epoch": 0.13, "learning_rate": 1.995706208175403e-05, "loss": 0.0451, "step": 8940 }, { "epoch": 0.13, "learning_rate": 1.9957014042015555e-05, "loss": 0.0412, "step": 8950 }, { "epoch": 0.13, "learning_rate": 1.9956966002277085e-05, "loss": 0.036, "step": 8960 }, { "epoch": 0.13, "learning_rate": 1.9956917962538614e-05, "loss": 0.0414, "step": 8970 }, { "epoch": 0.13, "learning_rate": 1.9956869922800143e-05, "loss": 0.042, "step": 8980 }, { "epoch": 0.13, "learning_rate": 1.995682188306167e-05, "loss": 0.0406, "step": 8990 }, { "epoch": 0.13, "learning_rate": 1.9956773843323198e-05, "loss": 0.042, "step": 9000 }, { "epoch": 0.13, "learning_rate": 1.9956725803584728e-05, "loss": 0.0486, "step": 9010 }, { "epoch": 0.13, "learning_rate": 1.9956677763846253e-05, "loss": 0.0418, "step": 9020 }, { "epoch": 0.13, "learning_rate": 1.9956629724107783e-05, "loss": 0.0431, "step": 9030 }, { "epoch": 0.13, "learning_rate": 1.9956581684369312e-05, "loss": 0.0377, "step": 9040 }, { "epoch": 0.13, "learning_rate": 1.995653364463084e-05, "loss": 0.0403, "step": 9050 }, { "epoch": 0.13, "learning_rate": 1.9956485604892367e-05, "loss": 0.0447, "step": 9060 }, { "epoch": 0.13, "learning_rate": 1.9956437565153896e-05, "loss": 0.0449, "step": 9070 }, { "epoch": 0.13, "learning_rate": 1.9956389525415426e-05, "loss": 0.0344, "step": 9080 }, { "epoch": 0.13, "learning_rate": 1.9956341485676955e-05, "loss": 0.0404, "step": 9090 }, { "epoch": 0.13, "learning_rate": 1.995629824991233e-05, "loss": 0.0409, "step": 9100 }, { "epoch": 0.13, "learning_rate": 1.995625021017386e-05, "loss": 0.0363, "step": 9110 }, { "epoch": 0.13, "learning_rate": 1.9956202170435385e-05, "loss": 0.0358, "step": 9120 }, { "epoch": 0.13, "learning_rate": 1.9956154130696914e-05, "loss": 0.0489, "step": 9130 }, { "epoch": 0.13, "learning_rate": 1.9956106090958443e-05, "loss": 0.0407, "step": 9140 }, { "epoch": 0.13, "learning_rate": 1.995605805121997e-05, "loss": 0.0374, "step": 9150 }, { "epoch": 0.13, "learning_rate": 1.99560100114815e-05, "loss": 0.0385, "step": 9160 }, { "epoch": 0.13, "learning_rate": 1.9955961971743028e-05, "loss": 0.037, "step": 9170 }, { "epoch": 0.13, "learning_rate": 1.9955913932004557e-05, "loss": 0.0413, "step": 9180 }, { "epoch": 0.13, "learning_rate": 1.9955865892266083e-05, "loss": 0.0393, "step": 9190 }, { "epoch": 0.13, "learning_rate": 1.9955817852527612e-05, "loss": 0.0405, "step": 9200 }, { "epoch": 0.13, "learning_rate": 1.995576981278914e-05, "loss": 0.0468, "step": 9210 }, { "epoch": 0.13, "learning_rate": 1.995572177305067e-05, "loss": 0.0381, "step": 9220 }, { "epoch": 0.13, "learning_rate": 1.9955673733312197e-05, "loss": 0.0403, "step": 9230 }, { "epoch": 0.13, "learning_rate": 1.9955625693573726e-05, "loss": 0.0412, "step": 9240 }, { "epoch": 0.13, "learning_rate": 1.9955577653835255e-05, "loss": 0.0403, "step": 9250 }, { "epoch": 0.13, "learning_rate": 1.995552961409678e-05, "loss": 0.0368, "step": 9260 }, { "epoch": 0.13, "learning_rate": 1.995548157435831e-05, "loss": 0.0504, "step": 9270 }, { "epoch": 0.13, "learning_rate": 1.995543353461984e-05, "loss": 0.0404, "step": 9280 }, { "epoch": 0.13, "learning_rate": 1.995538549488137e-05, "loss": 0.0357, "step": 9290 }, { "epoch": 0.13, "learning_rate": 1.9955337455142895e-05, "loss": 0.0374, "step": 9300 }, { "epoch": 0.13, "learning_rate": 1.9955289415404424e-05, "loss": 0.0325, "step": 9310 }, { "epoch": 0.13, "learning_rate": 1.9955241375665953e-05, "loss": 0.0378, "step": 9320 }, { "epoch": 0.13, "learning_rate": 1.995519333592748e-05, "loss": 0.0473, "step": 9330 }, { "epoch": 0.13, "learning_rate": 1.995514529618901e-05, "loss": 0.0405, "step": 9340 }, { "epoch": 0.13, "learning_rate": 1.9955097256450538e-05, "loss": 0.041, "step": 9350 }, { "epoch": 0.13, "learning_rate": 1.9955049216712067e-05, "loss": 0.0404, "step": 9360 }, { "epoch": 0.14, "learning_rate": 1.9955001176973593e-05, "loss": 0.0355, "step": 9370 }, { "epoch": 0.14, "learning_rate": 1.9954953137235122e-05, "loss": 0.0373, "step": 9380 }, { "epoch": 0.14, "learning_rate": 1.995490509749665e-05, "loss": 0.0339, "step": 9390 }, { "epoch": 0.14, "learning_rate": 1.995485705775818e-05, "loss": 0.0362, "step": 9400 }, { "epoch": 0.14, "learning_rate": 1.9954809018019706e-05, "loss": 0.0511, "step": 9410 }, { "epoch": 0.14, "learning_rate": 1.9954760978281236e-05, "loss": 0.0361, "step": 9420 }, { "epoch": 0.14, "learning_rate": 1.9954712938542765e-05, "loss": 0.0442, "step": 9430 }, { "epoch": 0.14, "learning_rate": 1.995466489880429e-05, "loss": 0.0384, "step": 9440 }, { "epoch": 0.14, "learning_rate": 1.995461685906582e-05, "loss": 0.0372, "step": 9450 }, { "epoch": 0.14, "learning_rate": 1.995456881932735e-05, "loss": 0.0455, "step": 9460 }, { "epoch": 0.14, "learning_rate": 1.995452077958888e-05, "loss": 0.0366, "step": 9470 }, { "epoch": 0.14, "learning_rate": 1.9954472739850405e-05, "loss": 0.0411, "step": 9480 }, { "epoch": 0.14, "learning_rate": 1.9954424700111934e-05, "loss": 0.0447, "step": 9490 }, { "epoch": 0.14, "learning_rate": 1.9954376660373463e-05, "loss": 0.0458, "step": 9500 }, { "epoch": 0.14, "learning_rate": 1.995432862063499e-05, "loss": 0.0373, "step": 9510 }, { "epoch": 0.14, "learning_rate": 1.9954280580896518e-05, "loss": 0.0407, "step": 9520 }, { "epoch": 0.14, "learning_rate": 1.9954232541158048e-05, "loss": 0.0417, "step": 9530 }, { "epoch": 0.14, "learning_rate": 1.9954184501419577e-05, "loss": 0.0409, "step": 9540 }, { "epoch": 0.14, "learning_rate": 1.9954136461681103e-05, "loss": 0.0417, "step": 9550 }, { "epoch": 0.14, "learning_rate": 1.9954088421942632e-05, "loss": 0.0463, "step": 9560 }, { "epoch": 0.14, "learning_rate": 1.995404038220416e-05, "loss": 0.039, "step": 9570 }, { "epoch": 0.14, "learning_rate": 1.995399234246569e-05, "loss": 0.0364, "step": 9580 }, { "epoch": 0.14, "learning_rate": 1.9953944302727216e-05, "loss": 0.0365, "step": 9590 }, { "epoch": 0.14, "learning_rate": 1.9953896262988746e-05, "loss": 0.0381, "step": 9600 }, { "epoch": 0.14, "learning_rate": 1.9953848223250275e-05, "loss": 0.0366, "step": 9610 }, { "epoch": 0.14, "learning_rate": 1.99538001835118e-05, "loss": 0.0432, "step": 9620 }, { "epoch": 0.14, "learning_rate": 1.995375214377333e-05, "loss": 0.0373, "step": 9630 }, { "epoch": 0.14, "learning_rate": 1.995370410403486e-05, "loss": 0.0332, "step": 9640 }, { "epoch": 0.14, "learning_rate": 1.995365606429639e-05, "loss": 0.0389, "step": 9650 }, { "epoch": 0.14, "learning_rate": 1.9953608024557914e-05, "loss": 0.0426, "step": 9660 }, { "epoch": 0.14, "learning_rate": 1.9953559984819444e-05, "loss": 0.0382, "step": 9670 }, { "epoch": 0.14, "learning_rate": 1.9953511945080973e-05, "loss": 0.0342, "step": 9680 }, { "epoch": 0.14, "learning_rate": 1.99534639053425e-05, "loss": 0.0372, "step": 9690 }, { "epoch": 0.14, "learning_rate": 1.9953415865604028e-05, "loss": 0.0373, "step": 9700 }, { "epoch": 0.14, "learning_rate": 1.9953367825865557e-05, "loss": 0.0424, "step": 9710 }, { "epoch": 0.14, "learning_rate": 1.9953319786127087e-05, "loss": 0.0437, "step": 9720 }, { "epoch": 0.14, "learning_rate": 1.9953271746388613e-05, "loss": 0.0403, "step": 9730 }, { "epoch": 0.14, "learning_rate": 1.9953223706650142e-05, "loss": 0.0422, "step": 9740 }, { "epoch": 0.14, "learning_rate": 1.995317566691167e-05, "loss": 0.0395, "step": 9750 }, { "epoch": 0.14, "learning_rate": 1.99531276271732e-05, "loss": 0.0366, "step": 9760 }, { "epoch": 0.14, "learning_rate": 1.9953079587434726e-05, "loss": 0.0396, "step": 9770 }, { "epoch": 0.14, "learning_rate": 1.9953031547696256e-05, "loss": 0.0406, "step": 9780 }, { "epoch": 0.14, "learning_rate": 1.9952983507957785e-05, "loss": 0.0416, "step": 9790 }, { "epoch": 0.14, "learning_rate": 1.995293546821931e-05, "loss": 0.0351, "step": 9800 }, { "epoch": 0.14, "learning_rate": 1.995288742848084e-05, "loss": 0.0507, "step": 9810 }, { "epoch": 0.14, "learning_rate": 1.995283938874237e-05, "loss": 0.0338, "step": 9820 }, { "epoch": 0.14, "learning_rate": 1.99527913490039e-05, "loss": 0.0462, "step": 9830 }, { "epoch": 0.14, "learning_rate": 1.9952743309265424e-05, "loss": 0.0434, "step": 9840 }, { "epoch": 0.14, "learning_rate": 1.9952695269526954e-05, "loss": 0.0372, "step": 9850 }, { "epoch": 0.14, "learning_rate": 1.9952647229788483e-05, "loss": 0.0418, "step": 9860 }, { "epoch": 0.14, "learning_rate": 1.995259919005001e-05, "loss": 0.0332, "step": 9870 }, { "epoch": 0.14, "learning_rate": 1.9952551150311538e-05, "loss": 0.0385, "step": 9880 }, { "epoch": 0.14, "learning_rate": 1.9952503110573067e-05, "loss": 0.0375, "step": 9890 }, { "epoch": 0.14, "learning_rate": 1.9952455070834597e-05, "loss": 0.0393, "step": 9900 }, { "epoch": 0.14, "learning_rate": 1.9952407031096123e-05, "loss": 0.041, "step": 9910 }, { "epoch": 0.14, "learning_rate": 1.9952358991357652e-05, "loss": 0.0381, "step": 9920 }, { "epoch": 0.14, "learning_rate": 1.995231095161918e-05, "loss": 0.033, "step": 9930 }, { "epoch": 0.14, "learning_rate": 1.995226291188071e-05, "loss": 0.046, "step": 9940 }, { "epoch": 0.14, "learning_rate": 1.9952214872142236e-05, "loss": 0.0372, "step": 9950 }, { "epoch": 0.14, "learning_rate": 1.9952166832403765e-05, "loss": 0.0368, "step": 9960 }, { "epoch": 0.14, "learning_rate": 1.9952118792665295e-05, "loss": 0.0387, "step": 9970 }, { "epoch": 0.14, "learning_rate": 1.995207075292682e-05, "loss": 0.0472, "step": 9980 }, { "epoch": 0.14, "learning_rate": 1.995202271318835e-05, "loss": 0.0386, "step": 9990 }, { "epoch": 0.14, "learning_rate": 1.995197467344988e-05, "loss": 0.0333, "step": 10000 }, { "epoch": 0.14, "learning_rate": 1.995192663371141e-05, "loss": 0.0411, "step": 10010 }, { "epoch": 0.14, "learning_rate": 1.9951878593972934e-05, "loss": 0.0378, "step": 10020 }, { "epoch": 0.14, "learning_rate": 1.9951830554234464e-05, "loss": 0.0461, "step": 10030 }, { "epoch": 0.14, "learning_rate": 1.9951782514495993e-05, "loss": 0.0416, "step": 10040 }, { "epoch": 0.14, "learning_rate": 1.995173447475752e-05, "loss": 0.0481, "step": 10050 }, { "epoch": 0.14, "learning_rate": 1.9951686435019048e-05, "loss": 0.0439, "step": 10060 }, { "epoch": 0.15, "learning_rate": 1.9951638395280577e-05, "loss": 0.0345, "step": 10070 }, { "epoch": 0.15, "learning_rate": 1.9951590355542107e-05, "loss": 0.0425, "step": 10080 }, { "epoch": 0.15, "learning_rate": 1.9951542315803632e-05, "loss": 0.0345, "step": 10090 }, { "epoch": 0.15, "learning_rate": 1.9951494276065162e-05, "loss": 0.0333, "step": 10100 }, { "epoch": 0.15, "learning_rate": 1.995144623632669e-05, "loss": 0.034, "step": 10110 }, { "epoch": 0.15, "learning_rate": 1.995139819658822e-05, "loss": 0.0418, "step": 10120 }, { "epoch": 0.15, "learning_rate": 1.9951350156849746e-05, "loss": 0.0348, "step": 10130 }, { "epoch": 0.15, "learning_rate": 1.9951302117111275e-05, "loss": 0.0391, "step": 10140 }, { "epoch": 0.15, "learning_rate": 1.9951254077372805e-05, "loss": 0.039, "step": 10150 }, { "epoch": 0.15, "learning_rate": 1.995120603763433e-05, "loss": 0.0368, "step": 10160 }, { "epoch": 0.15, "learning_rate": 1.995115799789586e-05, "loss": 0.0335, "step": 10170 }, { "epoch": 0.15, "learning_rate": 1.995110995815739e-05, "loss": 0.0325, "step": 10180 }, { "epoch": 0.15, "learning_rate": 1.995106191841892e-05, "loss": 0.0346, "step": 10190 }, { "epoch": 0.15, "learning_rate": 1.9951013878680444e-05, "loss": 0.0363, "step": 10200 }, { "epoch": 0.15, "learning_rate": 1.9950965838941974e-05, "loss": 0.04, "step": 10210 }, { "epoch": 0.15, "learning_rate": 1.9950917799203503e-05, "loss": 0.0407, "step": 10220 }, { "epoch": 0.15, "learning_rate": 1.995086975946503e-05, "loss": 0.0375, "step": 10230 }, { "epoch": 0.15, "learning_rate": 1.9950821719726558e-05, "loss": 0.0392, "step": 10240 }, { "epoch": 0.15, "learning_rate": 1.9950773679988087e-05, "loss": 0.0288, "step": 10250 }, { "epoch": 0.15, "learning_rate": 1.9950725640249616e-05, "loss": 0.0356, "step": 10260 }, { "epoch": 0.15, "learning_rate": 1.9950677600511142e-05, "loss": 0.0522, "step": 10270 }, { "epoch": 0.15, "learning_rate": 1.995062956077267e-05, "loss": 0.039, "step": 10280 }, { "epoch": 0.15, "learning_rate": 1.99505815210342e-05, "loss": 0.0373, "step": 10290 }, { "epoch": 0.15, "learning_rate": 1.995053348129573e-05, "loss": 0.0329, "step": 10300 }, { "epoch": 0.15, "learning_rate": 1.9950485441557256e-05, "loss": 0.0397, "step": 10310 }, { "epoch": 0.15, "learning_rate": 1.9950437401818785e-05, "loss": 0.0361, "step": 10320 }, { "epoch": 0.15, "learning_rate": 1.9950389362080315e-05, "loss": 0.0427, "step": 10330 }, { "epoch": 0.15, "learning_rate": 1.995034132234184e-05, "loss": 0.0359, "step": 10340 }, { "epoch": 0.15, "learning_rate": 1.995029328260337e-05, "loss": 0.0366, "step": 10350 }, { "epoch": 0.15, "learning_rate": 1.99502452428649e-05, "loss": 0.0371, "step": 10360 }, { "epoch": 0.15, "learning_rate": 1.9950197203126428e-05, "loss": 0.037, "step": 10370 }, { "epoch": 0.15, "learning_rate": 1.9950149163387954e-05, "loss": 0.0372, "step": 10380 }, { "epoch": 0.15, "learning_rate": 1.9950101123649483e-05, "loss": 0.0374, "step": 10390 }, { "epoch": 0.15, "learning_rate": 1.9950053083911013e-05, "loss": 0.0432, "step": 10400 }, { "epoch": 0.15, "learning_rate": 1.995000504417254e-05, "loss": 0.0376, "step": 10410 }, { "epoch": 0.15, "learning_rate": 1.9949957004434068e-05, "loss": 0.0347, "step": 10420 }, { "epoch": 0.15, "learning_rate": 1.9949908964695597e-05, "loss": 0.0429, "step": 10430 }, { "epoch": 0.15, "learning_rate": 1.9949860924957126e-05, "loss": 0.04, "step": 10440 }, { "epoch": 0.15, "learning_rate": 1.9949812885218652e-05, "loss": 0.0395, "step": 10450 }, { "epoch": 0.15, "learning_rate": 1.994976484548018e-05, "loss": 0.0384, "step": 10460 }, { "epoch": 0.15, "learning_rate": 1.994971680574171e-05, "loss": 0.0374, "step": 10470 }, { "epoch": 0.15, "learning_rate": 1.994966876600324e-05, "loss": 0.0426, "step": 10480 }, { "epoch": 0.15, "learning_rate": 1.9949620726264766e-05, "loss": 0.0335, "step": 10490 }, { "epoch": 0.15, "learning_rate": 1.9949572686526295e-05, "loss": 0.0344, "step": 10500 }, { "epoch": 0.15, "learning_rate": 1.9949524646787824e-05, "loss": 0.0397, "step": 10510 }, { "epoch": 0.15, "learning_rate": 1.9949476607049354e-05, "loss": 0.0481, "step": 10520 }, { "epoch": 0.15, "learning_rate": 1.9949428567310883e-05, "loss": 0.0426, "step": 10530 }, { "epoch": 0.15, "learning_rate": 1.9949380527572412e-05, "loss": 0.0368, "step": 10540 }, { "epoch": 0.15, "learning_rate": 1.9949332487833938e-05, "loss": 0.0357, "step": 10550 }, { "epoch": 0.15, "learning_rate": 1.9949284448095467e-05, "loss": 0.0379, "step": 10560 }, { "epoch": 0.15, "learning_rate": 1.9949236408356997e-05, "loss": 0.0353, "step": 10570 }, { "epoch": 0.15, "learning_rate": 1.9949188368618523e-05, "loss": 0.0379, "step": 10580 }, { "epoch": 0.15, "learning_rate": 1.9949140328880052e-05, "loss": 0.0453, "step": 10590 }, { "epoch": 0.15, "learning_rate": 1.994909228914158e-05, "loss": 0.0351, "step": 10600 }, { "epoch": 0.15, "learning_rate": 1.994904424940311e-05, "loss": 0.0378, "step": 10610 }, { "epoch": 0.15, "learning_rate": 1.9948996209664636e-05, "loss": 0.037, "step": 10620 }, { "epoch": 0.15, "learning_rate": 1.9948948169926166e-05, "loss": 0.0377, "step": 10630 }, { "epoch": 0.15, "learning_rate": 1.9948900130187695e-05, "loss": 0.0414, "step": 10640 }, { "epoch": 0.15, "learning_rate": 1.994885209044922e-05, "loss": 0.0476, "step": 10650 }, { "epoch": 0.15, "learning_rate": 1.994880405071075e-05, "loss": 0.0301, "step": 10660 }, { "epoch": 0.15, "learning_rate": 1.994875601097228e-05, "loss": 0.0385, "step": 10670 }, { "epoch": 0.15, "learning_rate": 1.994870797123381e-05, "loss": 0.0371, "step": 10680 }, { "epoch": 0.15, "learning_rate": 1.9948659931495334e-05, "loss": 0.0408, "step": 10690 }, { "epoch": 0.15, "learning_rate": 1.9948611891756864e-05, "loss": 0.0384, "step": 10700 }, { "epoch": 0.15, "learning_rate": 1.9948563852018393e-05, "loss": 0.0321, "step": 10710 }, { "epoch": 0.15, "learning_rate": 1.994851581227992e-05, "loss": 0.035, "step": 10720 }, { "epoch": 0.15, "learning_rate": 1.9948467772541448e-05, "loss": 0.0408, "step": 10730 }, { "epoch": 0.15, "learning_rate": 1.9948419732802977e-05, "loss": 0.0352, "step": 10740 }, { "epoch": 0.15, "learning_rate": 1.9948371693064507e-05, "loss": 0.041, "step": 10750 }, { "epoch": 0.16, "learning_rate": 1.9948323653326033e-05, "loss": 0.0406, "step": 10760 }, { "epoch": 0.16, "learning_rate": 1.9948275613587562e-05, "loss": 0.0326, "step": 10770 }, { "epoch": 0.16, "learning_rate": 1.994822757384909e-05, "loss": 0.037, "step": 10780 }, { "epoch": 0.16, "learning_rate": 1.994817953411062e-05, "loss": 0.041, "step": 10790 }, { "epoch": 0.16, "learning_rate": 1.9948131494372146e-05, "loss": 0.0379, "step": 10800 }, { "epoch": 0.16, "learning_rate": 1.9948083454633675e-05, "loss": 0.052, "step": 10810 }, { "epoch": 0.16, "learning_rate": 1.9948035414895205e-05, "loss": 0.0443, "step": 10820 }, { "epoch": 0.16, "learning_rate": 1.994798737515673e-05, "loss": 0.0359, "step": 10830 }, { "epoch": 0.16, "learning_rate": 1.994793933541826e-05, "loss": 0.0461, "step": 10840 }, { "epoch": 0.16, "learning_rate": 1.994789129567979e-05, "loss": 0.0324, "step": 10850 }, { "epoch": 0.16, "learning_rate": 1.994784325594132e-05, "loss": 0.0394, "step": 10860 }, { "epoch": 0.16, "learning_rate": 1.9947795216202844e-05, "loss": 0.0474, "step": 10870 }, { "epoch": 0.16, "learning_rate": 1.9947747176464374e-05, "loss": 0.0341, "step": 10880 }, { "epoch": 0.16, "learning_rate": 1.9947699136725903e-05, "loss": 0.0293, "step": 10890 }, { "epoch": 0.16, "learning_rate": 1.994765109698743e-05, "loss": 0.0353, "step": 10900 }, { "epoch": 0.16, "learning_rate": 1.9947603057248958e-05, "loss": 0.0389, "step": 10910 }, { "epoch": 0.16, "learning_rate": 1.9947555017510487e-05, "loss": 0.0385, "step": 10920 }, { "epoch": 0.16, "learning_rate": 1.9947506977772017e-05, "loss": 0.0386, "step": 10930 }, { "epoch": 0.16, "learning_rate": 1.9947458938033542e-05, "loss": 0.0347, "step": 10940 }, { "epoch": 0.16, "learning_rate": 1.9947410898295072e-05, "loss": 0.0394, "step": 10950 }, { "epoch": 0.16, "learning_rate": 1.99473628585566e-05, "loss": 0.0398, "step": 10960 }, { "epoch": 0.16, "learning_rate": 1.994731481881813e-05, "loss": 0.033, "step": 10970 }, { "epoch": 0.16, "learning_rate": 1.9947266779079656e-05, "loss": 0.0292, "step": 10980 }, { "epoch": 0.16, "learning_rate": 1.9947218739341185e-05, "loss": 0.0347, "step": 10990 }, { "epoch": 0.16, "learning_rate": 1.9947170699602715e-05, "loss": 0.0402, "step": 11000 }, { "epoch": 0.16, "learning_rate": 1.994712265986424e-05, "loss": 0.0319, "step": 11010 }, { "epoch": 0.16, "learning_rate": 1.994707462012577e-05, "loss": 0.0309, "step": 11020 }, { "epoch": 0.16, "learning_rate": 1.99470265803873e-05, "loss": 0.0364, "step": 11030 }, { "epoch": 0.16, "learning_rate": 1.994697854064883e-05, "loss": 0.0413, "step": 11040 }, { "epoch": 0.16, "learning_rate": 1.9946930500910354e-05, "loss": 0.0392, "step": 11050 }, { "epoch": 0.16, "learning_rate": 1.9946882461171884e-05, "loss": 0.0379, "step": 11060 }, { "epoch": 0.16, "learning_rate": 1.9946834421433413e-05, "loss": 0.0356, "step": 11070 }, { "epoch": 0.16, "learning_rate": 1.994678638169494e-05, "loss": 0.0373, "step": 11080 }, { "epoch": 0.16, "learning_rate": 1.9946738341956468e-05, "loss": 0.0287, "step": 11090 }, { "epoch": 0.16, "learning_rate": 1.9946690302217997e-05, "loss": 0.0387, "step": 11100 }, { "epoch": 0.16, "learning_rate": 1.9946642262479526e-05, "loss": 0.0418, "step": 11110 }, { "epoch": 0.16, "learning_rate": 1.9946594222741052e-05, "loss": 0.0359, "step": 11120 }, { "epoch": 0.16, "learning_rate": 1.994654618300258e-05, "loss": 0.0369, "step": 11130 }, { "epoch": 0.16, "learning_rate": 1.994649814326411e-05, "loss": 0.0378, "step": 11140 }, { "epoch": 0.16, "learning_rate": 1.994645010352564e-05, "loss": 0.0371, "step": 11150 }, { "epoch": 0.16, "learning_rate": 1.9946402063787166e-05, "loss": 0.0288, "step": 11160 }, { "epoch": 0.16, "learning_rate": 1.9946354024048695e-05, "loss": 0.0386, "step": 11170 }, { "epoch": 0.16, "learning_rate": 1.9946305984310225e-05, "loss": 0.0333, "step": 11180 }, { "epoch": 0.16, "learning_rate": 1.994625794457175e-05, "loss": 0.044, "step": 11190 }, { "epoch": 0.16, "learning_rate": 1.994620990483328e-05, "loss": 0.0448, "step": 11200 }, { "epoch": 0.16, "learning_rate": 1.994616186509481e-05, "loss": 0.0385, "step": 11210 }, { "epoch": 0.16, "learning_rate": 1.9946113825356338e-05, "loss": 0.0346, "step": 11220 }, { "epoch": 0.16, "learning_rate": 1.9946065785617864e-05, "loss": 0.0468, "step": 11230 }, { "epoch": 0.16, "learning_rate": 1.9946017745879393e-05, "loss": 0.0406, "step": 11240 }, { "epoch": 0.16, "learning_rate": 1.9945969706140923e-05, "loss": 0.0362, "step": 11250 }, { "epoch": 0.16, "learning_rate": 1.994592166640245e-05, "loss": 0.031, "step": 11260 }, { "epoch": 0.16, "learning_rate": 1.9945873626663978e-05, "loss": 0.0385, "step": 11270 }, { "epoch": 0.16, "learning_rate": 1.9945825586925507e-05, "loss": 0.036, "step": 11280 }, { "epoch": 0.16, "learning_rate": 1.9945777547187036e-05, "loss": 0.037, "step": 11290 }, { "epoch": 0.16, "learning_rate": 1.9945729507448562e-05, "loss": 0.0311, "step": 11300 }, { "epoch": 0.16, "learning_rate": 1.994568146771009e-05, "loss": 0.0387, "step": 11310 }, { "epoch": 0.16, "learning_rate": 1.994563342797162e-05, "loss": 0.0373, "step": 11320 }, { "epoch": 0.16, "learning_rate": 1.994558538823315e-05, "loss": 0.0416, "step": 11330 }, { "epoch": 0.16, "learning_rate": 1.9945537348494676e-05, "loss": 0.0295, "step": 11340 }, { "epoch": 0.16, "learning_rate": 1.9945489308756205e-05, "loss": 0.0388, "step": 11350 }, { "epoch": 0.16, "learning_rate": 1.9945441269017734e-05, "loss": 0.0408, "step": 11360 }, { "epoch": 0.16, "learning_rate": 1.994539322927926e-05, "loss": 0.0435, "step": 11370 }, { "epoch": 0.16, "learning_rate": 1.994534518954079e-05, "loss": 0.0402, "step": 11380 }, { "epoch": 0.16, "learning_rate": 1.994529714980232e-05, "loss": 0.0294, "step": 11390 }, { "epoch": 0.16, "learning_rate": 1.9945249110063848e-05, "loss": 0.0466, "step": 11400 }, { "epoch": 0.16, "learning_rate": 1.9945201070325374e-05, "loss": 0.0317, "step": 11410 }, { "epoch": 0.16, "learning_rate": 1.9945153030586903e-05, "loss": 0.0395, "step": 11420 }, { "epoch": 0.16, "learning_rate": 1.9945104990848433e-05, "loss": 0.0416, "step": 11430 }, { "epoch": 0.16, "learning_rate": 1.994505695110996e-05, "loss": 0.033, "step": 11440 }, { "epoch": 0.17, "learning_rate": 1.9945008911371488e-05, "loss": 0.0355, "step": 11450 }, { "epoch": 0.17, "learning_rate": 1.9944960871633017e-05, "loss": 0.0574, "step": 11460 }, { "epoch": 0.17, "learning_rate": 1.9944912831894546e-05, "loss": 0.0338, "step": 11470 }, { "epoch": 0.17, "learning_rate": 1.9944864792156072e-05, "loss": 0.0383, "step": 11480 }, { "epoch": 0.17, "learning_rate": 1.99448167524176e-05, "loss": 0.0423, "step": 11490 }, { "epoch": 0.17, "learning_rate": 1.994476871267913e-05, "loss": 0.0452, "step": 11500 }, { "epoch": 0.17, "learning_rate": 1.994472067294066e-05, "loss": 0.0365, "step": 11510 }, { "epoch": 0.17, "learning_rate": 1.9944672633202186e-05, "loss": 0.0337, "step": 11520 }, { "epoch": 0.17, "learning_rate": 1.9944624593463715e-05, "loss": 0.0388, "step": 11530 }, { "epoch": 0.17, "learning_rate": 1.9944576553725244e-05, "loss": 0.0304, "step": 11540 }, { "epoch": 0.17, "learning_rate": 1.994452851398677e-05, "loss": 0.041, "step": 11550 }, { "epoch": 0.17, "learning_rate": 1.99444804742483e-05, "loss": 0.0346, "step": 11560 }, { "epoch": 0.17, "learning_rate": 1.994443243450983e-05, "loss": 0.0407, "step": 11570 }, { "epoch": 0.17, "learning_rate": 1.9944384394771358e-05, "loss": 0.0355, "step": 11580 }, { "epoch": 0.17, "learning_rate": 1.9944336355032884e-05, "loss": 0.0432, "step": 11590 }, { "epoch": 0.17, "learning_rate": 1.9944288315294413e-05, "loss": 0.0407, "step": 11600 }, { "epoch": 0.17, "learning_rate": 1.9944240275555943e-05, "loss": 0.0387, "step": 11610 }, { "epoch": 0.17, "learning_rate": 1.994419223581747e-05, "loss": 0.036, "step": 11620 }, { "epoch": 0.17, "learning_rate": 1.9944149000052846e-05, "loss": 0.0318, "step": 11630 }, { "epoch": 0.17, "learning_rate": 1.9944100960314376e-05, "loss": 0.0349, "step": 11640 }, { "epoch": 0.17, "learning_rate": 1.99440529205759e-05, "loss": 0.0417, "step": 11650 }, { "epoch": 0.17, "learning_rate": 1.994400488083743e-05, "loss": 0.0344, "step": 11660 }, { "epoch": 0.17, "learning_rate": 1.994395684109896e-05, "loss": 0.0352, "step": 11670 }, { "epoch": 0.17, "learning_rate": 1.9943908801360486e-05, "loss": 0.0338, "step": 11680 }, { "epoch": 0.17, "learning_rate": 1.9943860761622015e-05, "loss": 0.0336, "step": 11690 }, { "epoch": 0.17, "learning_rate": 1.9943812721883545e-05, "loss": 0.0316, "step": 11700 }, { "epoch": 0.17, "learning_rate": 1.9943764682145074e-05, "loss": 0.0452, "step": 11710 }, { "epoch": 0.17, "learning_rate": 1.99437166424066e-05, "loss": 0.0367, "step": 11720 }, { "epoch": 0.17, "learning_rate": 1.994366860266813e-05, "loss": 0.0391, "step": 11730 }, { "epoch": 0.17, "learning_rate": 1.9943620562929658e-05, "loss": 0.0379, "step": 11740 }, { "epoch": 0.17, "learning_rate": 1.9943572523191188e-05, "loss": 0.032, "step": 11750 }, { "epoch": 0.17, "learning_rate": 1.9943524483452713e-05, "loss": 0.039, "step": 11760 }, { "epoch": 0.17, "learning_rate": 1.9943476443714243e-05, "loss": 0.0346, "step": 11770 }, { "epoch": 0.17, "learning_rate": 1.9943428403975772e-05, "loss": 0.031, "step": 11780 }, { "epoch": 0.17, "learning_rate": 1.9943380364237298e-05, "loss": 0.0324, "step": 11790 }, { "epoch": 0.17, "learning_rate": 1.9943332324498827e-05, "loss": 0.0357, "step": 11800 }, { "epoch": 0.17, "learning_rate": 1.9943284284760356e-05, "loss": 0.0351, "step": 11810 }, { "epoch": 0.17, "learning_rate": 1.9943236245021886e-05, "loss": 0.0351, "step": 11820 }, { "epoch": 0.17, "learning_rate": 1.994318820528341e-05, "loss": 0.041, "step": 11830 }, { "epoch": 0.17, "learning_rate": 1.994314016554494e-05, "loss": 0.0386, "step": 11840 }, { "epoch": 0.17, "learning_rate": 1.994309212580647e-05, "loss": 0.0348, "step": 11850 }, { "epoch": 0.17, "learning_rate": 1.9943044086067996e-05, "loss": 0.0314, "step": 11860 }, { "epoch": 0.17, "learning_rate": 1.9942996046329525e-05, "loss": 0.0375, "step": 11870 }, { "epoch": 0.17, "learning_rate": 1.9942948006591054e-05, "loss": 0.0328, "step": 11880 }, { "epoch": 0.17, "learning_rate": 1.9942899966852584e-05, "loss": 0.0401, "step": 11890 }, { "epoch": 0.17, "learning_rate": 1.994285192711411e-05, "loss": 0.0387, "step": 11900 }, { "epoch": 0.17, "learning_rate": 1.994280388737564e-05, "loss": 0.0325, "step": 11910 }, { "epoch": 0.17, "learning_rate": 1.9942755847637168e-05, "loss": 0.034, "step": 11920 }, { "epoch": 0.17, "learning_rate": 1.9942707807898697e-05, "loss": 0.0271, "step": 11930 }, { "epoch": 0.17, "learning_rate": 1.9942659768160223e-05, "loss": 0.0348, "step": 11940 }, { "epoch": 0.17, "learning_rate": 1.9942611728421753e-05, "loss": 0.0367, "step": 11950 }, { "epoch": 0.17, "learning_rate": 1.9942563688683282e-05, "loss": 0.036, "step": 11960 }, { "epoch": 0.17, "learning_rate": 1.9942515648944808e-05, "loss": 0.0322, "step": 11970 }, { "epoch": 0.17, "learning_rate": 1.9942467609206337e-05, "loss": 0.0318, "step": 11980 }, { "epoch": 0.17, "learning_rate": 1.9942419569467866e-05, "loss": 0.0334, "step": 11990 }, { "epoch": 0.17, "learning_rate": 1.9942371529729396e-05, "loss": 0.0426, "step": 12000 }, { "epoch": 0.17, "learning_rate": 1.994232348999092e-05, "loss": 0.038, "step": 12010 }, { "epoch": 0.17, "learning_rate": 1.994227545025245e-05, "loss": 0.038, "step": 12020 }, { "epoch": 0.17, "learning_rate": 1.994222741051398e-05, "loss": 0.0379, "step": 12030 }, { "epoch": 0.17, "learning_rate": 1.9942179370775506e-05, "loss": 0.0396, "step": 12040 }, { "epoch": 0.17, "learning_rate": 1.9942131331037035e-05, "loss": 0.0324, "step": 12050 }, { "epoch": 0.17, "learning_rate": 1.9942083291298564e-05, "loss": 0.0323, "step": 12060 }, { "epoch": 0.17, "learning_rate": 1.9942035251560094e-05, "loss": 0.0439, "step": 12070 }, { "epoch": 0.17, "learning_rate": 1.994198721182162e-05, "loss": 0.0373, "step": 12080 }, { "epoch": 0.17, "learning_rate": 1.994193917208315e-05, "loss": 0.0356, "step": 12090 }, { "epoch": 0.17, "learning_rate": 1.9941891132344678e-05, "loss": 0.0304, "step": 12100 }, { "epoch": 0.17, "learning_rate": 1.9941843092606207e-05, "loss": 0.0384, "step": 12110 }, { "epoch": 0.17, "learning_rate": 1.9941795052867733e-05, "loss": 0.0407, "step": 12120 }, { "epoch": 0.17, "learning_rate": 1.9941747013129262e-05, "loss": 0.035, "step": 12130 }, { "epoch": 0.17, "learning_rate": 1.9941698973390792e-05, "loss": 0.035, "step": 12140 }, { "epoch": 0.18, "learning_rate": 1.9941650933652318e-05, "loss": 0.031, "step": 12150 }, { "epoch": 0.18, "learning_rate": 1.9941602893913847e-05, "loss": 0.0382, "step": 12160 }, { "epoch": 0.18, "learning_rate": 1.9941554854175376e-05, "loss": 0.0312, "step": 12170 }, { "epoch": 0.18, "learning_rate": 1.9941506814436905e-05, "loss": 0.0407, "step": 12180 }, { "epoch": 0.18, "learning_rate": 1.994145877469843e-05, "loss": 0.04, "step": 12190 }, { "epoch": 0.18, "learning_rate": 1.994141073495996e-05, "loss": 0.0396, "step": 12200 }, { "epoch": 0.18, "learning_rate": 1.994136269522149e-05, "loss": 0.0364, "step": 12210 }, { "epoch": 0.18, "learning_rate": 1.9941314655483016e-05, "loss": 0.0314, "step": 12220 }, { "epoch": 0.18, "learning_rate": 1.9941266615744545e-05, "loss": 0.0347, "step": 12230 }, { "epoch": 0.18, "learning_rate": 1.9941218576006074e-05, "loss": 0.0358, "step": 12240 }, { "epoch": 0.18, "learning_rate": 1.9941170536267604e-05, "loss": 0.036, "step": 12250 }, { "epoch": 0.18, "learning_rate": 1.994112249652913e-05, "loss": 0.0383, "step": 12260 }, { "epoch": 0.18, "learning_rate": 1.994107445679066e-05, "loss": 0.0305, "step": 12270 }, { "epoch": 0.18, "learning_rate": 1.9941026417052188e-05, "loss": 0.0269, "step": 12280 }, { "epoch": 0.18, "learning_rate": 1.9940978377313714e-05, "loss": 0.0315, "step": 12290 }, { "epoch": 0.18, "learning_rate": 1.9940930337575243e-05, "loss": 0.0429, "step": 12300 }, { "epoch": 0.18, "learning_rate": 1.9940882297836772e-05, "loss": 0.0358, "step": 12310 }, { "epoch": 0.18, "learning_rate": 1.99408342580983e-05, "loss": 0.0396, "step": 12320 }, { "epoch": 0.18, "learning_rate": 1.9940786218359828e-05, "loss": 0.0327, "step": 12330 }, { "epoch": 0.18, "learning_rate": 1.9940738178621357e-05, "loss": 0.0355, "step": 12340 }, { "epoch": 0.18, "learning_rate": 1.9940690138882886e-05, "loss": 0.0341, "step": 12350 }, { "epoch": 0.18, "learning_rate": 1.9940642099144415e-05, "loss": 0.0331, "step": 12360 }, { "epoch": 0.18, "learning_rate": 1.994059405940594e-05, "loss": 0.0393, "step": 12370 }, { "epoch": 0.18, "learning_rate": 1.994054601966747e-05, "loss": 0.0347, "step": 12380 }, { "epoch": 0.18, "learning_rate": 1.9940497979929e-05, "loss": 0.0423, "step": 12390 }, { "epoch": 0.18, "learning_rate": 1.9940449940190526e-05, "loss": 0.0383, "step": 12400 }, { "epoch": 0.18, "learning_rate": 1.9940401900452055e-05, "loss": 0.0343, "step": 12410 }, { "epoch": 0.18, "learning_rate": 1.9940353860713584e-05, "loss": 0.0442, "step": 12420 }, { "epoch": 0.18, "learning_rate": 1.9940305820975113e-05, "loss": 0.0459, "step": 12430 }, { "epoch": 0.18, "learning_rate": 1.994025778123664e-05, "loss": 0.0339, "step": 12440 }, { "epoch": 0.18, "learning_rate": 1.994020974149817e-05, "loss": 0.042, "step": 12450 }, { "epoch": 0.18, "learning_rate": 1.9940161701759698e-05, "loss": 0.0409, "step": 12460 }, { "epoch": 0.18, "learning_rate": 1.9940113662021224e-05, "loss": 0.0346, "step": 12470 }, { "epoch": 0.18, "learning_rate": 1.9940065622282753e-05, "loss": 0.0361, "step": 12480 }, { "epoch": 0.18, "learning_rate": 1.9940017582544282e-05, "loss": 0.0351, "step": 12490 }, { "epoch": 0.18, "learning_rate": 1.993996954280581e-05, "loss": 0.0334, "step": 12500 }, { "epoch": 0.18, "learning_rate": 1.9939921503067337e-05, "loss": 0.0356, "step": 12510 }, { "epoch": 0.18, "learning_rate": 1.9939873463328867e-05, "loss": 0.0345, "step": 12520 }, { "epoch": 0.18, "learning_rate": 1.9939825423590396e-05, "loss": 0.0335, "step": 12530 }, { "epoch": 0.18, "learning_rate": 1.9939777383851925e-05, "loss": 0.034, "step": 12540 }, { "epoch": 0.18, "learning_rate": 1.993972934411345e-05, "loss": 0.0353, "step": 12550 }, { "epoch": 0.18, "learning_rate": 1.993968130437498e-05, "loss": 0.0315, "step": 12560 }, { "epoch": 0.18, "learning_rate": 1.993963326463651e-05, "loss": 0.0358, "step": 12570 }, { "epoch": 0.18, "learning_rate": 1.9939585224898036e-05, "loss": 0.0343, "step": 12580 }, { "epoch": 0.18, "learning_rate": 1.9939537185159565e-05, "loss": 0.0364, "step": 12590 }, { "epoch": 0.18, "learning_rate": 1.9939489145421094e-05, "loss": 0.039, "step": 12600 }, { "epoch": 0.18, "learning_rate": 1.9939441105682623e-05, "loss": 0.0471, "step": 12610 }, { "epoch": 0.18, "learning_rate": 1.993939306594415e-05, "loss": 0.0384, "step": 12620 }, { "epoch": 0.18, "learning_rate": 1.993934502620568e-05, "loss": 0.034, "step": 12630 }, { "epoch": 0.18, "learning_rate": 1.9939296986467208e-05, "loss": 0.0381, "step": 12640 }, { "epoch": 0.18, "learning_rate": 1.9939248946728734e-05, "loss": 0.0415, "step": 12650 }, { "epoch": 0.18, "learning_rate": 1.9939200906990263e-05, "loss": 0.0341, "step": 12660 }, { "epoch": 0.18, "learning_rate": 1.9939152867251792e-05, "loss": 0.0349, "step": 12670 }, { "epoch": 0.18, "learning_rate": 1.993910482751332e-05, "loss": 0.0404, "step": 12680 }, { "epoch": 0.18, "learning_rate": 1.9939056787774847e-05, "loss": 0.0423, "step": 12690 }, { "epoch": 0.18, "learning_rate": 1.9939008748036377e-05, "loss": 0.0445, "step": 12700 }, { "epoch": 0.18, "learning_rate": 1.9938960708297906e-05, "loss": 0.0426, "step": 12710 }, { "epoch": 0.18, "learning_rate": 1.9938912668559435e-05, "loss": 0.0461, "step": 12720 }, { "epoch": 0.18, "learning_rate": 1.993886462882096e-05, "loss": 0.0323, "step": 12730 }, { "epoch": 0.18, "learning_rate": 1.993881658908249e-05, "loss": 0.0333, "step": 12740 }, { "epoch": 0.18, "learning_rate": 1.993876854934402e-05, "loss": 0.0337, "step": 12750 }, { "epoch": 0.18, "learning_rate": 1.9938720509605546e-05, "loss": 0.0357, "step": 12760 }, { "epoch": 0.18, "learning_rate": 1.9938672469867075e-05, "loss": 0.0402, "step": 12770 }, { "epoch": 0.18, "learning_rate": 1.9938624430128604e-05, "loss": 0.0388, "step": 12780 }, { "epoch": 0.18, "learning_rate": 1.9938576390390133e-05, "loss": 0.0316, "step": 12790 }, { "epoch": 0.18, "learning_rate": 1.993852835065166e-05, "loss": 0.0336, "step": 12800 }, { "epoch": 0.18, "learning_rate": 1.993848031091319e-05, "loss": 0.0385, "step": 12810 }, { "epoch": 0.18, "learning_rate": 1.9938432271174718e-05, "loss": 0.0356, "step": 12820 }, { "epoch": 0.18, "learning_rate": 1.9938384231436244e-05, "loss": 0.0342, "step": 12830 }, { "epoch": 0.19, "learning_rate": 1.9938336191697773e-05, "loss": 0.0376, "step": 12840 }, { "epoch": 0.19, "learning_rate": 1.9938288151959302e-05, "loss": 0.0311, "step": 12850 }, { "epoch": 0.19, "learning_rate": 1.993824011222083e-05, "loss": 0.0286, "step": 12860 }, { "epoch": 0.19, "learning_rate": 1.9938192072482357e-05, "loss": 0.0336, "step": 12870 }, { "epoch": 0.19, "learning_rate": 1.9938144032743887e-05, "loss": 0.0334, "step": 12880 }, { "epoch": 0.19, "learning_rate": 1.9938095993005416e-05, "loss": 0.0339, "step": 12890 }, { "epoch": 0.19, "learning_rate": 1.9938047953266945e-05, "loss": 0.0341, "step": 12900 }, { "epoch": 0.19, "learning_rate": 1.993799991352847e-05, "loss": 0.0345, "step": 12910 }, { "epoch": 0.19, "learning_rate": 1.993795187379e-05, "loss": 0.0367, "step": 12920 }, { "epoch": 0.19, "learning_rate": 1.993790383405153e-05, "loss": 0.0278, "step": 12930 }, { "epoch": 0.19, "learning_rate": 1.9937855794313055e-05, "loss": 0.0344, "step": 12940 }, { "epoch": 0.19, "learning_rate": 1.9937807754574585e-05, "loss": 0.0307, "step": 12950 }, { "epoch": 0.19, "learning_rate": 1.9937759714836114e-05, "loss": 0.035, "step": 12960 }, { "epoch": 0.19, "learning_rate": 1.9937711675097643e-05, "loss": 0.0333, "step": 12970 }, { "epoch": 0.19, "learning_rate": 1.993766363535917e-05, "loss": 0.0318, "step": 12980 }, { "epoch": 0.19, "learning_rate": 1.99376155956207e-05, "loss": 0.0314, "step": 12990 }, { "epoch": 0.19, "learning_rate": 1.9937567555882228e-05, "loss": 0.0343, "step": 13000 }, { "epoch": 0.19, "learning_rate": 1.9937519516143754e-05, "loss": 0.0396, "step": 13010 }, { "epoch": 0.19, "learning_rate": 1.9937471476405283e-05, "loss": 0.0428, "step": 13020 }, { "epoch": 0.19, "learning_rate": 1.9937423436666812e-05, "loss": 0.0353, "step": 13030 }, { "epoch": 0.19, "learning_rate": 1.993737539692834e-05, "loss": 0.0355, "step": 13040 }, { "epoch": 0.19, "learning_rate": 1.9937327357189867e-05, "loss": 0.0361, "step": 13050 }, { "epoch": 0.19, "learning_rate": 1.9937279317451396e-05, "loss": 0.0323, "step": 13060 }, { "epoch": 0.19, "learning_rate": 1.9937231277712926e-05, "loss": 0.0311, "step": 13070 }, { "epoch": 0.19, "learning_rate": 1.9937183237974455e-05, "loss": 0.0308, "step": 13080 }, { "epoch": 0.19, "learning_rate": 1.993713519823598e-05, "loss": 0.037, "step": 13090 }, { "epoch": 0.19, "learning_rate": 1.993708715849751e-05, "loss": 0.0316, "step": 13100 }, { "epoch": 0.19, "learning_rate": 1.993703911875904e-05, "loss": 0.0357, "step": 13110 }, { "epoch": 0.19, "learning_rate": 1.9936991079020565e-05, "loss": 0.0345, "step": 13120 }, { "epoch": 0.19, "learning_rate": 1.9936943039282095e-05, "loss": 0.0391, "step": 13130 }, { "epoch": 0.19, "learning_rate": 1.9936894999543624e-05, "loss": 0.032, "step": 13140 }, { "epoch": 0.19, "learning_rate": 1.9936846959805153e-05, "loss": 0.0345, "step": 13150 }, { "epoch": 0.19, "learning_rate": 1.993679892006668e-05, "loss": 0.0286, "step": 13160 }, { "epoch": 0.19, "learning_rate": 1.9936750880328208e-05, "loss": 0.0291, "step": 13170 }, { "epoch": 0.19, "learning_rate": 1.9936702840589738e-05, "loss": 0.0391, "step": 13180 }, { "epoch": 0.19, "learning_rate": 1.9936654800851263e-05, "loss": 0.0357, "step": 13190 }, { "epoch": 0.19, "learning_rate": 1.9936606761112793e-05, "loss": 0.0316, "step": 13200 }, { "epoch": 0.19, "learning_rate": 1.9936558721374322e-05, "loss": 0.0367, "step": 13210 }, { "epoch": 0.19, "learning_rate": 1.993651068163585e-05, "loss": 0.0315, "step": 13220 }, { "epoch": 0.19, "learning_rate": 1.9936462641897377e-05, "loss": 0.0353, "step": 13230 }, { "epoch": 0.19, "learning_rate": 1.9936414602158906e-05, "loss": 0.0324, "step": 13240 }, { "epoch": 0.19, "learning_rate": 1.9936366562420436e-05, "loss": 0.0418, "step": 13250 }, { "epoch": 0.19, "learning_rate": 1.9936318522681965e-05, "loss": 0.0397, "step": 13260 }, { "epoch": 0.19, "learning_rate": 1.993627048294349e-05, "loss": 0.0363, "step": 13270 }, { "epoch": 0.19, "learning_rate": 1.993622244320502e-05, "loss": 0.0353, "step": 13280 }, { "epoch": 0.19, "learning_rate": 1.993617440346655e-05, "loss": 0.0363, "step": 13290 }, { "epoch": 0.19, "learning_rate": 1.9936126363728075e-05, "loss": 0.0331, "step": 13300 }, { "epoch": 0.19, "learning_rate": 1.9936078323989605e-05, "loss": 0.0271, "step": 13310 }, { "epoch": 0.19, "learning_rate": 1.9936030284251134e-05, "loss": 0.0362, "step": 13320 }, { "epoch": 0.19, "learning_rate": 1.9935982244512663e-05, "loss": 0.0409, "step": 13330 }, { "epoch": 0.19, "learning_rate": 1.993593420477419e-05, "loss": 0.0343, "step": 13340 }, { "epoch": 0.19, "learning_rate": 1.9935886165035718e-05, "loss": 0.0436, "step": 13350 }, { "epoch": 0.19, "learning_rate": 1.9935838125297247e-05, "loss": 0.0305, "step": 13360 }, { "epoch": 0.19, "learning_rate": 1.9935790085558773e-05, "loss": 0.0389, "step": 13370 }, { "epoch": 0.19, "learning_rate": 1.9935742045820303e-05, "loss": 0.0308, "step": 13380 }, { "epoch": 0.19, "learning_rate": 1.993569881005568e-05, "loss": 0.0349, "step": 13390 }, { "epoch": 0.19, "learning_rate": 1.9935650770317207e-05, "loss": 0.0342, "step": 13400 }, { "epoch": 0.19, "learning_rate": 1.9935602730578736e-05, "loss": 0.0348, "step": 13410 }, { "epoch": 0.19, "learning_rate": 1.9935554690840265e-05, "loss": 0.0333, "step": 13420 }, { "epoch": 0.19, "learning_rate": 1.993550665110179e-05, "loss": 0.0356, "step": 13430 }, { "epoch": 0.19, "learning_rate": 1.993545861136332e-05, "loss": 0.0336, "step": 13440 }, { "epoch": 0.19, "learning_rate": 1.993541057162485e-05, "loss": 0.0307, "step": 13450 }, { "epoch": 0.19, "learning_rate": 1.993536253188638e-05, "loss": 0.0388, "step": 13460 }, { "epoch": 0.19, "learning_rate": 1.9935314492147905e-05, "loss": 0.031, "step": 13470 }, { "epoch": 0.19, "learning_rate": 1.9935266452409434e-05, "loss": 0.0343, "step": 13480 }, { "epoch": 0.19, "learning_rate": 1.9935218412670963e-05, "loss": 0.0275, "step": 13490 }, { "epoch": 0.19, "learning_rate": 1.9935170372932492e-05, "loss": 0.0328, "step": 13500 }, { "epoch": 0.19, "learning_rate": 1.993512233319402e-05, "loss": 0.0356, "step": 13510 }, { "epoch": 0.19, "learning_rate": 1.9935074293455548e-05, "loss": 0.0377, "step": 13520 }, { "epoch": 0.19, "learning_rate": 1.9935026253717077e-05, "loss": 0.0309, "step": 13530 }, { "epoch": 0.2, "learning_rate": 1.9934978213978603e-05, "loss": 0.0271, "step": 13540 }, { "epoch": 0.2, "learning_rate": 1.9934930174240132e-05, "loss": 0.0362, "step": 13550 }, { "epoch": 0.2, "learning_rate": 1.993488213450166e-05, "loss": 0.0386, "step": 13560 }, { "epoch": 0.2, "learning_rate": 1.993483409476319e-05, "loss": 0.0301, "step": 13570 }, { "epoch": 0.2, "learning_rate": 1.9934786055024716e-05, "loss": 0.0328, "step": 13580 }, { "epoch": 0.2, "learning_rate": 1.9934738015286246e-05, "loss": 0.0291, "step": 13590 }, { "epoch": 0.2, "learning_rate": 1.9934689975547775e-05, "loss": 0.0338, "step": 13600 }, { "epoch": 0.2, "learning_rate": 1.99346419358093e-05, "loss": 0.0378, "step": 13610 }, { "epoch": 0.2, "learning_rate": 1.993459389607083e-05, "loss": 0.0385, "step": 13620 }, { "epoch": 0.2, "learning_rate": 1.993454585633236e-05, "loss": 0.0425, "step": 13630 }, { "epoch": 0.2, "learning_rate": 1.993449781659389e-05, "loss": 0.0315, "step": 13640 }, { "epoch": 0.2, "learning_rate": 1.9934449776855415e-05, "loss": 0.0335, "step": 13650 }, { "epoch": 0.2, "learning_rate": 1.9934401737116944e-05, "loss": 0.0359, "step": 13660 }, { "epoch": 0.2, "learning_rate": 1.9934353697378473e-05, "loss": 0.0384, "step": 13670 }, { "epoch": 0.2, "learning_rate": 1.9934305657640002e-05, "loss": 0.0382, "step": 13680 }, { "epoch": 0.2, "learning_rate": 1.9934257617901528e-05, "loss": 0.0254, "step": 13690 }, { "epoch": 0.2, "learning_rate": 1.9934209578163058e-05, "loss": 0.0351, "step": 13700 }, { "epoch": 0.2, "learning_rate": 1.9934161538424587e-05, "loss": 0.0293, "step": 13710 }, { "epoch": 0.2, "learning_rate": 1.9934113498686113e-05, "loss": 0.0325, "step": 13720 }, { "epoch": 0.2, "learning_rate": 1.9934065458947642e-05, "loss": 0.0371, "step": 13730 }, { "epoch": 0.2, "learning_rate": 1.993401741920917e-05, "loss": 0.0387, "step": 13740 }, { "epoch": 0.2, "learning_rate": 1.99339693794707e-05, "loss": 0.034, "step": 13750 }, { "epoch": 0.2, "learning_rate": 1.9933921339732226e-05, "loss": 0.0365, "step": 13760 }, { "epoch": 0.2, "learning_rate": 1.9933873299993756e-05, "loss": 0.0343, "step": 13770 }, { "epoch": 0.2, "learning_rate": 1.9933825260255285e-05, "loss": 0.0319, "step": 13780 }, { "epoch": 0.2, "learning_rate": 1.993377722051681e-05, "loss": 0.0349, "step": 13790 }, { "epoch": 0.2, "learning_rate": 1.993372918077834e-05, "loss": 0.0388, "step": 13800 }, { "epoch": 0.2, "learning_rate": 1.993368114103987e-05, "loss": 0.0328, "step": 13810 }, { "epoch": 0.2, "learning_rate": 1.99336331013014e-05, "loss": 0.0345, "step": 13820 }, { "epoch": 0.2, "learning_rate": 1.9933585061562924e-05, "loss": 0.04, "step": 13830 }, { "epoch": 0.2, "learning_rate": 1.9933537021824454e-05, "loss": 0.0338, "step": 13840 }, { "epoch": 0.2, "learning_rate": 1.9933488982085983e-05, "loss": 0.0374, "step": 13850 }, { "epoch": 0.2, "learning_rate": 1.993344094234751e-05, "loss": 0.0358, "step": 13860 }, { "epoch": 0.2, "learning_rate": 1.9933392902609038e-05, "loss": 0.0329, "step": 13870 }, { "epoch": 0.2, "learning_rate": 1.9933344862870567e-05, "loss": 0.0282, "step": 13880 }, { "epoch": 0.2, "learning_rate": 1.9933296823132097e-05, "loss": 0.0333, "step": 13890 }, { "epoch": 0.2, "learning_rate": 1.9933248783393623e-05, "loss": 0.0296, "step": 13900 }, { "epoch": 0.2, "learning_rate": 1.9933200743655152e-05, "loss": 0.038, "step": 13910 }, { "epoch": 0.2, "learning_rate": 1.993315270391668e-05, "loss": 0.0318, "step": 13920 }, { "epoch": 0.2, "learning_rate": 1.993310466417821e-05, "loss": 0.0346, "step": 13930 }, { "epoch": 0.2, "learning_rate": 1.9933056624439736e-05, "loss": 0.0346, "step": 13940 }, { "epoch": 0.2, "learning_rate": 1.9933008584701266e-05, "loss": 0.028, "step": 13950 }, { "epoch": 0.2, "learning_rate": 1.9932960544962795e-05, "loss": 0.0325, "step": 13960 }, { "epoch": 0.2, "learning_rate": 1.993291250522432e-05, "loss": 0.0297, "step": 13970 }, { "epoch": 0.2, "learning_rate": 1.993286446548585e-05, "loss": 0.0361, "step": 13980 }, { "epoch": 0.2, "learning_rate": 1.993281642574738e-05, "loss": 0.0318, "step": 13990 }, { "epoch": 0.2, "learning_rate": 1.993276838600891e-05, "loss": 0.0335, "step": 14000 }, { "epoch": 0.2, "learning_rate": 1.9932720346270434e-05, "loss": 0.0355, "step": 14010 }, { "epoch": 0.2, "learning_rate": 1.9932672306531964e-05, "loss": 0.0337, "step": 14020 }, { "epoch": 0.2, "learning_rate": 1.9932624266793493e-05, "loss": 0.0278, "step": 14030 }, { "epoch": 0.2, "learning_rate": 1.993257622705502e-05, "loss": 0.0386, "step": 14040 }, { "epoch": 0.2, "learning_rate": 1.9932528187316548e-05, "loss": 0.0393, "step": 14050 }, { "epoch": 0.2, "learning_rate": 1.9932480147578077e-05, "loss": 0.0321, "step": 14060 }, { "epoch": 0.2, "learning_rate": 1.9932432107839607e-05, "loss": 0.0269, "step": 14070 }, { "epoch": 0.2, "learning_rate": 1.9932384068101133e-05, "loss": 0.0273, "step": 14080 }, { "epoch": 0.2, "learning_rate": 1.9932336028362662e-05, "loss": 0.0335, "step": 14090 }, { "epoch": 0.2, "learning_rate": 1.993228798862419e-05, "loss": 0.0387, "step": 14100 }, { "epoch": 0.2, "learning_rate": 1.993223994888572e-05, "loss": 0.0391, "step": 14110 }, { "epoch": 0.2, "learning_rate": 1.993219190914725e-05, "loss": 0.0342, "step": 14120 }, { "epoch": 0.2, "learning_rate": 1.993214386940878e-05, "loss": 0.0326, "step": 14130 }, { "epoch": 0.2, "learning_rate": 1.9932095829670305e-05, "loss": 0.0237, "step": 14140 }, { "epoch": 0.2, "learning_rate": 1.9932047789931834e-05, "loss": 0.0319, "step": 14150 }, { "epoch": 0.2, "learning_rate": 1.9931999750193363e-05, "loss": 0.0314, "step": 14160 }, { "epoch": 0.2, "learning_rate": 1.9931951710454893e-05, "loss": 0.0299, "step": 14170 }, { "epoch": 0.2, "learning_rate": 1.9931908474690264e-05, "loss": 0.0358, "step": 14180 }, { "epoch": 0.2, "learning_rate": 1.9931860434951793e-05, "loss": 0.0324, "step": 14190 }, { "epoch": 0.2, "learning_rate": 1.9931812395213322e-05, "loss": 0.0269, "step": 14200 }, { "epoch": 0.2, "learning_rate": 1.9931764355474848e-05, "loss": 0.0304, "step": 14210 }, { "epoch": 0.2, "learning_rate": 1.9931716315736378e-05, "loss": 0.0336, "step": 14220 }, { "epoch": 0.21, "learning_rate": 1.9931668275997907e-05, "loss": 0.027, "step": 14230 }, { "epoch": 0.21, "learning_rate": 1.9931620236259436e-05, "loss": 0.0328, "step": 14240 }, { "epoch": 0.21, "learning_rate": 1.9931572196520962e-05, "loss": 0.0388, "step": 14250 }, { "epoch": 0.21, "learning_rate": 1.993152415678249e-05, "loss": 0.0282, "step": 14260 }, { "epoch": 0.21, "learning_rate": 1.993147611704402e-05, "loss": 0.0332, "step": 14270 }, { "epoch": 0.21, "learning_rate": 1.9931428077305546e-05, "loss": 0.0266, "step": 14280 }, { "epoch": 0.21, "learning_rate": 1.9931380037567076e-05, "loss": 0.0287, "step": 14290 }, { "epoch": 0.21, "learning_rate": 1.9931331997828605e-05, "loss": 0.0313, "step": 14300 }, { "epoch": 0.21, "learning_rate": 1.9931283958090134e-05, "loss": 0.0357, "step": 14310 }, { "epoch": 0.21, "learning_rate": 1.993123591835166e-05, "loss": 0.0299, "step": 14320 }, { "epoch": 0.21, "learning_rate": 1.993118787861319e-05, "loss": 0.0308, "step": 14330 }, { "epoch": 0.21, "learning_rate": 1.993113983887472e-05, "loss": 0.0344, "step": 14340 }, { "epoch": 0.21, "learning_rate": 1.9931091799136248e-05, "loss": 0.0298, "step": 14350 }, { "epoch": 0.21, "learning_rate": 1.9931043759397774e-05, "loss": 0.039, "step": 14360 }, { "epoch": 0.21, "learning_rate": 1.9930995719659303e-05, "loss": 0.0315, "step": 14370 }, { "epoch": 0.21, "learning_rate": 1.9930947679920832e-05, "loss": 0.0345, "step": 14380 }, { "epoch": 0.21, "learning_rate": 1.9930899640182358e-05, "loss": 0.0411, "step": 14390 }, { "epoch": 0.21, "learning_rate": 1.9930851600443887e-05, "loss": 0.0367, "step": 14400 }, { "epoch": 0.21, "learning_rate": 1.9930803560705417e-05, "loss": 0.0352, "step": 14410 }, { "epoch": 0.21, "learning_rate": 1.9930755520966946e-05, "loss": 0.0301, "step": 14420 }, { "epoch": 0.21, "learning_rate": 1.9930707481228472e-05, "loss": 0.0354, "step": 14430 }, { "epoch": 0.21, "learning_rate": 1.993065944149e-05, "loss": 0.0337, "step": 14440 }, { "epoch": 0.21, "learning_rate": 1.993061140175153e-05, "loss": 0.0335, "step": 14450 }, { "epoch": 0.21, "learning_rate": 1.9930563362013056e-05, "loss": 0.0268, "step": 14460 }, { "epoch": 0.21, "learning_rate": 1.9930515322274586e-05, "loss": 0.0318, "step": 14470 }, { "epoch": 0.21, "learning_rate": 1.9930467282536115e-05, "loss": 0.0334, "step": 14480 }, { "epoch": 0.21, "learning_rate": 1.9930419242797644e-05, "loss": 0.028, "step": 14490 }, { "epoch": 0.21, "learning_rate": 1.993037120305917e-05, "loss": 0.036, "step": 14500 }, { "epoch": 0.21, "learning_rate": 1.99303231633207e-05, "loss": 0.0408, "step": 14510 }, { "epoch": 0.21, "learning_rate": 1.993027512358223e-05, "loss": 0.033, "step": 14520 }, { "epoch": 0.21, "learning_rate": 1.9930227083843758e-05, "loss": 0.0311, "step": 14530 }, { "epoch": 0.21, "learning_rate": 1.9930179044105284e-05, "loss": 0.0376, "step": 14540 }, { "epoch": 0.21, "learning_rate": 1.9930131004366813e-05, "loss": 0.0324, "step": 14550 }, { "epoch": 0.21, "learning_rate": 1.9930082964628342e-05, "loss": 0.0409, "step": 14560 }, { "epoch": 0.21, "learning_rate": 1.9930034924889868e-05, "loss": 0.031, "step": 14570 }, { "epoch": 0.21, "learning_rate": 1.9929986885151397e-05, "loss": 0.0375, "step": 14580 }, { "epoch": 0.21, "learning_rate": 1.9929938845412927e-05, "loss": 0.0304, "step": 14590 }, { "epoch": 0.21, "learning_rate": 1.9929890805674456e-05, "loss": 0.0364, "step": 14600 }, { "epoch": 0.21, "learning_rate": 1.9929842765935982e-05, "loss": 0.0361, "step": 14610 }, { "epoch": 0.21, "learning_rate": 1.9929794726197514e-05, "loss": 0.0318, "step": 14620 }, { "epoch": 0.21, "learning_rate": 1.992974668645904e-05, "loss": 0.0339, "step": 14630 }, { "epoch": 0.21, "learning_rate": 1.992969864672057e-05, "loss": 0.0322, "step": 14640 }, { "epoch": 0.21, "learning_rate": 1.99296506069821e-05, "loss": 0.0349, "step": 14650 }, { "epoch": 0.21, "learning_rate": 1.9929602567243628e-05, "loss": 0.0296, "step": 14660 }, { "epoch": 0.21, "learning_rate": 1.9929554527505154e-05, "loss": 0.0341, "step": 14670 }, { "epoch": 0.21, "learning_rate": 1.9929506487766683e-05, "loss": 0.0317, "step": 14680 }, { "epoch": 0.21, "learning_rate": 1.9929458448028213e-05, "loss": 0.0318, "step": 14690 }, { "epoch": 0.21, "learning_rate": 1.992941040828974e-05, "loss": 0.0381, "step": 14700 }, { "epoch": 0.21, "learning_rate": 1.9929362368551268e-05, "loss": 0.0317, "step": 14710 }, { "epoch": 0.21, "learning_rate": 1.9929314328812797e-05, "loss": 0.0236, "step": 14720 }, { "epoch": 0.21, "learning_rate": 1.9929266289074326e-05, "loss": 0.0282, "step": 14730 }, { "epoch": 0.21, "learning_rate": 1.9929218249335852e-05, "loss": 0.026, "step": 14740 }, { "epoch": 0.21, "learning_rate": 1.992917020959738e-05, "loss": 0.0308, "step": 14750 }, { "epoch": 0.21, "learning_rate": 1.992912216985891e-05, "loss": 0.0286, "step": 14760 }, { "epoch": 0.21, "learning_rate": 1.992907413012044e-05, "loss": 0.0329, "step": 14770 }, { "epoch": 0.21, "learning_rate": 1.9929026090381966e-05, "loss": 0.0291, "step": 14780 }, { "epoch": 0.21, "learning_rate": 1.9928978050643495e-05, "loss": 0.0342, "step": 14790 }, { "epoch": 0.21, "learning_rate": 1.9928930010905024e-05, "loss": 0.0334, "step": 14800 }, { "epoch": 0.21, "learning_rate": 1.992888197116655e-05, "loss": 0.0287, "step": 14810 }, { "epoch": 0.21, "learning_rate": 1.992883393142808e-05, "loss": 0.0287, "step": 14820 }, { "epoch": 0.21, "learning_rate": 1.992878589168961e-05, "loss": 0.032, "step": 14830 }, { "epoch": 0.21, "learning_rate": 1.9928737851951138e-05, "loss": 0.0296, "step": 14840 }, { "epoch": 0.21, "learning_rate": 1.9928689812212664e-05, "loss": 0.0333, "step": 14850 }, { "epoch": 0.21, "learning_rate": 1.9928641772474193e-05, "loss": 0.0356, "step": 14860 }, { "epoch": 0.21, "learning_rate": 1.9928593732735722e-05, "loss": 0.0375, "step": 14870 }, { "epoch": 0.21, "learning_rate": 1.992854569299725e-05, "loss": 0.0398, "step": 14880 }, { "epoch": 0.21, "learning_rate": 1.9928497653258778e-05, "loss": 0.0251, "step": 14890 }, { "epoch": 0.21, "learning_rate": 1.9928449613520307e-05, "loss": 0.025, "step": 14900 }, { "epoch": 0.21, "learning_rate": 1.9928401573781836e-05, "loss": 0.0369, "step": 14910 }, { "epoch": 0.22, "learning_rate": 1.9928353534043362e-05, "loss": 0.0268, "step": 14920 }, { "epoch": 0.22, "learning_rate": 1.992830549430489e-05, "loss": 0.0306, "step": 14930 }, { "epoch": 0.22, "learning_rate": 1.992825745456642e-05, "loss": 0.0358, "step": 14940 }, { "epoch": 0.22, "learning_rate": 1.9928209414827946e-05, "loss": 0.0396, "step": 14950 }, { "epoch": 0.22, "learning_rate": 1.9928161375089476e-05, "loss": 0.0326, "step": 14960 }, { "epoch": 0.22, "learning_rate": 1.9928113335351005e-05, "loss": 0.0307, "step": 14970 }, { "epoch": 0.22, "learning_rate": 1.9928065295612534e-05, "loss": 0.0299, "step": 14980 }, { "epoch": 0.22, "learning_rate": 1.992801725587406e-05, "loss": 0.0364, "step": 14990 }, { "epoch": 0.22, "learning_rate": 1.992796921613559e-05, "loss": 0.0341, "step": 15000 }, { "epoch": 0.22, "learning_rate": 1.992792117639712e-05, "loss": 0.0248, "step": 15010 }, { "epoch": 0.22, "learning_rate": 1.9927873136658648e-05, "loss": 0.032, "step": 15020 }, { "epoch": 0.22, "learning_rate": 1.9927825096920174e-05, "loss": 0.0328, "step": 15030 }, { "epoch": 0.22, "learning_rate": 1.9927777057181703e-05, "loss": 0.033, "step": 15040 }, { "epoch": 0.22, "learning_rate": 1.9927729017443232e-05, "loss": 0.0314, "step": 15050 }, { "epoch": 0.22, "learning_rate": 1.9927680977704758e-05, "loss": 0.0293, "step": 15060 }, { "epoch": 0.22, "learning_rate": 1.9927632937966288e-05, "loss": 0.0284, "step": 15070 }, { "epoch": 0.22, "learning_rate": 1.9927584898227817e-05, "loss": 0.0245, "step": 15080 }, { "epoch": 0.22, "learning_rate": 1.9927536858489346e-05, "loss": 0.0317, "step": 15090 }, { "epoch": 0.22, "learning_rate": 1.9927488818750872e-05, "loss": 0.0331, "step": 15100 }, { "epoch": 0.22, "learning_rate": 1.99274407790124e-05, "loss": 0.0312, "step": 15110 }, { "epoch": 0.22, "learning_rate": 1.992739273927393e-05, "loss": 0.0345, "step": 15120 }, { "epoch": 0.22, "learning_rate": 1.9927344699535456e-05, "loss": 0.0285, "step": 15130 }, { "epoch": 0.22, "learning_rate": 1.9927296659796986e-05, "loss": 0.0355, "step": 15140 }, { "epoch": 0.22, "learning_rate": 1.9927248620058515e-05, "loss": 0.0341, "step": 15150 }, { "epoch": 0.22, "learning_rate": 1.9927200580320044e-05, "loss": 0.0315, "step": 15160 }, { "epoch": 0.22, "learning_rate": 1.992715254058157e-05, "loss": 0.0318, "step": 15170 }, { "epoch": 0.22, "learning_rate": 1.99271045008431e-05, "loss": 0.0347, "step": 15180 }, { "epoch": 0.22, "learning_rate": 1.992705646110463e-05, "loss": 0.0329, "step": 15190 }, { "epoch": 0.22, "learning_rate": 1.9927008421366158e-05, "loss": 0.0322, "step": 15200 }, { "epoch": 0.22, "learning_rate": 1.9926960381627684e-05, "loss": 0.0315, "step": 15210 }, { "epoch": 0.22, "learning_rate": 1.9926912341889213e-05, "loss": 0.0392, "step": 15220 }, { "epoch": 0.22, "learning_rate": 1.9926864302150742e-05, "loss": 0.0314, "step": 15230 }, { "epoch": 0.22, "learning_rate": 1.9926816262412268e-05, "loss": 0.0336, "step": 15240 }, { "epoch": 0.22, "learning_rate": 1.9926768222673797e-05, "loss": 0.029, "step": 15250 }, { "epoch": 0.22, "learning_rate": 1.9926720182935327e-05, "loss": 0.0327, "step": 15260 }, { "epoch": 0.22, "learning_rate": 1.9926672143196856e-05, "loss": 0.0305, "step": 15270 }, { "epoch": 0.22, "learning_rate": 1.9926624103458382e-05, "loss": 0.0348, "step": 15280 }, { "epoch": 0.22, "learning_rate": 1.992657606371991e-05, "loss": 0.0361, "step": 15290 }, { "epoch": 0.22, "learning_rate": 1.992652802398144e-05, "loss": 0.0327, "step": 15300 }, { "epoch": 0.22, "learning_rate": 1.9926479984242966e-05, "loss": 0.0311, "step": 15310 }, { "epoch": 0.22, "learning_rate": 1.9926431944504496e-05, "loss": 0.0319, "step": 15320 }, { "epoch": 0.22, "learning_rate": 1.9926383904766025e-05, "loss": 0.0298, "step": 15330 }, { "epoch": 0.22, "learning_rate": 1.9926335865027554e-05, "loss": 0.0321, "step": 15340 }, { "epoch": 0.22, "learning_rate": 1.992628782528908e-05, "loss": 0.0326, "step": 15350 }, { "epoch": 0.22, "learning_rate": 1.992623978555061e-05, "loss": 0.0311, "step": 15360 }, { "epoch": 0.22, "learning_rate": 1.992619174581214e-05, "loss": 0.0241, "step": 15370 }, { "epoch": 0.22, "learning_rate": 1.9926143706073668e-05, "loss": 0.0334, "step": 15380 }, { "epoch": 0.22, "learning_rate": 1.9926095666335194e-05, "loss": 0.0313, "step": 15390 }, { "epoch": 0.22, "learning_rate": 1.9926047626596723e-05, "loss": 0.0334, "step": 15400 }, { "epoch": 0.22, "learning_rate": 1.9925999586858252e-05, "loss": 0.0324, "step": 15410 }, { "epoch": 0.22, "learning_rate": 1.9925951547119778e-05, "loss": 0.0286, "step": 15420 }, { "epoch": 0.22, "learning_rate": 1.9925903507381307e-05, "loss": 0.0253, "step": 15430 }, { "epoch": 0.22, "learning_rate": 1.9925855467642837e-05, "loss": 0.0363, "step": 15440 }, { "epoch": 0.22, "learning_rate": 1.9925807427904366e-05, "loss": 0.0316, "step": 15450 }, { "epoch": 0.22, "learning_rate": 1.9925759388165892e-05, "loss": 0.036, "step": 15460 }, { "epoch": 0.22, "learning_rate": 1.992571134842742e-05, "loss": 0.0314, "step": 15470 }, { "epoch": 0.22, "learning_rate": 1.992566330868895e-05, "loss": 0.0343, "step": 15480 }, { "epoch": 0.22, "learning_rate": 1.9925615268950476e-05, "loss": 0.028, "step": 15490 }, { "epoch": 0.22, "learning_rate": 1.9925567229212005e-05, "loss": 0.0242, "step": 15500 }, { "epoch": 0.22, "learning_rate": 1.9925519189473535e-05, "loss": 0.0269, "step": 15510 }, { "epoch": 0.22, "learning_rate": 1.9925471149735064e-05, "loss": 0.0306, "step": 15520 }, { "epoch": 0.22, "learning_rate": 1.992542310999659e-05, "loss": 0.0412, "step": 15530 }, { "epoch": 0.22, "learning_rate": 1.992537507025812e-05, "loss": 0.0319, "step": 15540 }, { "epoch": 0.22, "learning_rate": 1.992532703051965e-05, "loss": 0.0333, "step": 15550 }, { "epoch": 0.22, "learning_rate": 1.9925278990781178e-05, "loss": 0.0256, "step": 15560 }, { "epoch": 0.22, "learning_rate": 1.9925230951042704e-05, "loss": 0.024, "step": 15570 }, { "epoch": 0.22, "learning_rate": 1.9925182911304233e-05, "loss": 0.0313, "step": 15580 }, { "epoch": 0.22, "learning_rate": 1.9925134871565762e-05, "loss": 0.0319, "step": 15590 }, { "epoch": 0.22, "learning_rate": 1.9925086831827288e-05, "loss": 0.0278, "step": 15600 }, { "epoch": 0.22, "learning_rate": 1.9925038792088817e-05, "loss": 0.0322, "step": 15610 }, { "epoch": 0.23, "learning_rate": 1.9924990752350347e-05, "loss": 0.0261, "step": 15620 }, { "epoch": 0.23, "learning_rate": 1.9924942712611876e-05, "loss": 0.0298, "step": 15630 }, { "epoch": 0.23, "learning_rate": 1.99248946728734e-05, "loss": 0.0351, "step": 15640 }, { "epoch": 0.23, "learning_rate": 1.992484663313493e-05, "loss": 0.0317, "step": 15650 }, { "epoch": 0.23, "learning_rate": 1.992479859339646e-05, "loss": 0.0334, "step": 15660 }, { "epoch": 0.23, "learning_rate": 1.9924750553657986e-05, "loss": 0.0345, "step": 15670 }, { "epoch": 0.23, "learning_rate": 1.9924702513919515e-05, "loss": 0.0302, "step": 15680 }, { "epoch": 0.23, "learning_rate": 1.9924654474181045e-05, "loss": 0.0379, "step": 15690 }, { "epoch": 0.23, "learning_rate": 1.9924606434442574e-05, "loss": 0.0268, "step": 15700 }, { "epoch": 0.23, "learning_rate": 1.99245583947041e-05, "loss": 0.0314, "step": 15710 }, { "epoch": 0.23, "learning_rate": 1.992451035496563e-05, "loss": 0.0271, "step": 15720 }, { "epoch": 0.23, "learning_rate": 1.992446231522716e-05, "loss": 0.0325, "step": 15730 }, { "epoch": 0.23, "learning_rate": 1.9924414275488688e-05, "loss": 0.0387, "step": 15740 }, { "epoch": 0.23, "learning_rate": 1.9924366235750213e-05, "loss": 0.0308, "step": 15750 }, { "epoch": 0.23, "learning_rate": 1.9924318196011743e-05, "loss": 0.0337, "step": 15760 }, { "epoch": 0.23, "learning_rate": 1.9924270156273272e-05, "loss": 0.0289, "step": 15770 }, { "epoch": 0.23, "learning_rate": 1.9924222116534798e-05, "loss": 0.032, "step": 15780 }, { "epoch": 0.23, "learning_rate": 1.9924174076796327e-05, "loss": 0.0344, "step": 15790 }, { "epoch": 0.23, "learning_rate": 1.9924126037057856e-05, "loss": 0.0264, "step": 15800 }, { "epoch": 0.23, "learning_rate": 1.9924077997319386e-05, "loss": 0.038, "step": 15810 }, { "epoch": 0.23, "learning_rate": 1.992402995758091e-05, "loss": 0.0322, "step": 15820 }, { "epoch": 0.23, "learning_rate": 1.992398191784244e-05, "loss": 0.0225, "step": 15830 }, { "epoch": 0.23, "learning_rate": 1.992393387810397e-05, "loss": 0.0276, "step": 15840 }, { "epoch": 0.23, "learning_rate": 1.9923885838365496e-05, "loss": 0.0261, "step": 15850 }, { "epoch": 0.23, "learning_rate": 1.9923837798627025e-05, "loss": 0.0333, "step": 15860 }, { "epoch": 0.23, "learning_rate": 1.9923789758888555e-05, "loss": 0.031, "step": 15870 }, { "epoch": 0.23, "learning_rate": 1.9923741719150084e-05, "loss": 0.0308, "step": 15880 }, { "epoch": 0.23, "learning_rate": 1.992369367941161e-05, "loss": 0.0286, "step": 15890 }, { "epoch": 0.23, "learning_rate": 1.992364563967314e-05, "loss": 0.0304, "step": 15900 }, { "epoch": 0.23, "learning_rate": 1.9923597599934668e-05, "loss": 0.0294, "step": 15910 }, { "epoch": 0.23, "learning_rate": 1.9923549560196198e-05, "loss": 0.0283, "step": 15920 }, { "epoch": 0.23, "learning_rate": 1.9923501520457723e-05, "loss": 0.0248, "step": 15930 }, { "epoch": 0.23, "learning_rate": 1.9923453480719253e-05, "loss": 0.0395, "step": 15940 }, { "epoch": 0.23, "learning_rate": 1.9923405440980782e-05, "loss": 0.0324, "step": 15950 }, { "epoch": 0.23, "learning_rate": 1.9923357401242308e-05, "loss": 0.0374, "step": 15960 }, { "epoch": 0.23, "learning_rate": 1.9923309361503837e-05, "loss": 0.0311, "step": 15970 }, { "epoch": 0.23, "learning_rate": 1.9923261321765366e-05, "loss": 0.037, "step": 15980 }, { "epoch": 0.23, "learning_rate": 1.9923213282026896e-05, "loss": 0.0244, "step": 15990 }, { "epoch": 0.23, "learning_rate": 1.992316524228842e-05, "loss": 0.0337, "step": 16000 }, { "epoch": 0.23, "learning_rate": 1.992311720254995e-05, "loss": 0.0309, "step": 16010 }, { "epoch": 0.23, "learning_rate": 1.992306916281148e-05, "loss": 0.0293, "step": 16020 }, { "epoch": 0.23, "learning_rate": 1.9923021123073006e-05, "loss": 0.0271, "step": 16030 }, { "epoch": 0.23, "learning_rate": 1.9922973083334535e-05, "loss": 0.0303, "step": 16040 }, { "epoch": 0.23, "learning_rate": 1.9922925043596064e-05, "loss": 0.0325, "step": 16050 }, { "epoch": 0.23, "learning_rate": 1.9922877003857594e-05, "loss": 0.0309, "step": 16060 }, { "epoch": 0.23, "learning_rate": 1.992282896411912e-05, "loss": 0.0302, "step": 16070 }, { "epoch": 0.23, "learning_rate": 1.992278092438065e-05, "loss": 0.0312, "step": 16080 }, { "epoch": 0.23, "learning_rate": 1.9922732884642178e-05, "loss": 0.0295, "step": 16090 }, { "epoch": 0.23, "learning_rate": 1.9922684844903707e-05, "loss": 0.0274, "step": 16100 }, { "epoch": 0.23, "learning_rate": 1.9922636805165233e-05, "loss": 0.0263, "step": 16110 }, { "epoch": 0.23, "learning_rate": 1.9922588765426763e-05, "loss": 0.0237, "step": 16120 }, { "epoch": 0.23, "learning_rate": 1.9922540725688292e-05, "loss": 0.0357, "step": 16130 }, { "epoch": 0.23, "learning_rate": 1.9922492685949818e-05, "loss": 0.0332, "step": 16140 }, { "epoch": 0.23, "learning_rate": 1.9922444646211347e-05, "loss": 0.0302, "step": 16150 }, { "epoch": 0.23, "learning_rate": 1.9922396606472876e-05, "loss": 0.0376, "step": 16160 }, { "epoch": 0.23, "learning_rate": 1.9922348566734406e-05, "loss": 0.0334, "step": 16170 }, { "epoch": 0.23, "learning_rate": 1.992230052699593e-05, "loss": 0.0327, "step": 16180 }, { "epoch": 0.23, "learning_rate": 1.992225248725746e-05, "loss": 0.0351, "step": 16190 }, { "epoch": 0.23, "learning_rate": 1.992220444751899e-05, "loss": 0.0282, "step": 16200 }, { "epoch": 0.23, "learning_rate": 1.9922156407780516e-05, "loss": 0.0357, "step": 16210 }, { "epoch": 0.23, "learning_rate": 1.9922108368042045e-05, "loss": 0.0353, "step": 16220 }, { "epoch": 0.23, "learning_rate": 1.9922060328303574e-05, "loss": 0.025, "step": 16230 }, { "epoch": 0.23, "learning_rate": 1.9922012288565104e-05, "loss": 0.0307, "step": 16240 }, { "epoch": 0.23, "learning_rate": 1.992196424882663e-05, "loss": 0.0348, "step": 16250 }, { "epoch": 0.23, "learning_rate": 1.992191620908816e-05, "loss": 0.0324, "step": 16260 }, { "epoch": 0.23, "learning_rate": 1.9921868169349688e-05, "loss": 0.031, "step": 16270 }, { "epoch": 0.23, "learning_rate": 1.9921820129611217e-05, "loss": 0.0279, "step": 16280 }, { "epoch": 0.23, "learning_rate": 1.9921772089872743e-05, "loss": 0.0316, "step": 16290 }, { "epoch": 0.23, "learning_rate": 1.9921724050134272e-05, "loss": 0.0273, "step": 16300 }, { "epoch": 0.24, "learning_rate": 1.9921676010395802e-05, "loss": 0.0279, "step": 16310 }, { "epoch": 0.24, "learning_rate": 1.9921627970657328e-05, "loss": 0.0292, "step": 16320 }, { "epoch": 0.24, "learning_rate": 1.9921579930918857e-05, "loss": 0.033, "step": 16330 }, { "epoch": 0.24, "learning_rate": 1.9921531891180386e-05, "loss": 0.0326, "step": 16340 }, { "epoch": 0.24, "learning_rate": 1.9921483851441915e-05, "loss": 0.0294, "step": 16350 }, { "epoch": 0.24, "learning_rate": 1.992143581170344e-05, "loss": 0.0406, "step": 16360 }, { "epoch": 0.24, "learning_rate": 1.992138777196497e-05, "loss": 0.0352, "step": 16370 }, { "epoch": 0.24, "learning_rate": 1.99213397322265e-05, "loss": 0.0297, "step": 16380 }, { "epoch": 0.24, "learning_rate": 1.9921291692488026e-05, "loss": 0.0262, "step": 16390 }, { "epoch": 0.24, "learning_rate": 1.9921243652749555e-05, "loss": 0.0256, "step": 16400 }, { "epoch": 0.24, "learning_rate": 1.9921195613011084e-05, "loss": 0.0305, "step": 16410 }, { "epoch": 0.24, "learning_rate": 1.9921147573272614e-05, "loss": 0.0333, "step": 16420 }, { "epoch": 0.24, "learning_rate": 1.992109953353414e-05, "loss": 0.0362, "step": 16430 }, { "epoch": 0.24, "learning_rate": 1.992105149379567e-05, "loss": 0.0266, "step": 16440 }, { "epoch": 0.24, "learning_rate": 1.9921003454057198e-05, "loss": 0.0262, "step": 16450 }, { "epoch": 0.24, "learning_rate": 1.9920955414318727e-05, "loss": 0.0285, "step": 16460 }, { "epoch": 0.24, "learning_rate": 1.9920907374580253e-05, "loss": 0.0387, "step": 16470 }, { "epoch": 0.24, "learning_rate": 1.9920859334841782e-05, "loss": 0.026, "step": 16480 }, { "epoch": 0.24, "learning_rate": 1.992081129510331e-05, "loss": 0.0274, "step": 16490 }, { "epoch": 0.24, "learning_rate": 1.9920763255364838e-05, "loss": 0.0341, "step": 16500 }, { "epoch": 0.24, "learning_rate": 1.9920715215626367e-05, "loss": 0.0311, "step": 16510 }, { "epoch": 0.24, "learning_rate": 1.9920667175887896e-05, "loss": 0.0203, "step": 16520 }, { "epoch": 0.24, "learning_rate": 1.9920619136149425e-05, "loss": 0.0282, "step": 16530 }, { "epoch": 0.24, "learning_rate": 1.992057109641095e-05, "loss": 0.0387, "step": 16540 }, { "epoch": 0.24, "learning_rate": 1.992052305667248e-05, "loss": 0.0341, "step": 16550 }, { "epoch": 0.24, "learning_rate": 1.992047501693401e-05, "loss": 0.0393, "step": 16560 }, { "epoch": 0.24, "learning_rate": 1.9920426977195536e-05, "loss": 0.0312, "step": 16570 }, { "epoch": 0.24, "learning_rate": 1.9920378937457065e-05, "loss": 0.0326, "step": 16580 }, { "epoch": 0.24, "learning_rate": 1.9920330897718594e-05, "loss": 0.034, "step": 16590 }, { "epoch": 0.24, "learning_rate": 1.9920282857980123e-05, "loss": 0.0301, "step": 16600 }, { "epoch": 0.24, "learning_rate": 1.992023481824165e-05, "loss": 0.0267, "step": 16610 }, { "epoch": 0.24, "learning_rate": 1.992018677850318e-05, "loss": 0.0352, "step": 16620 }, { "epoch": 0.24, "learning_rate": 1.9920138738764708e-05, "loss": 0.0292, "step": 16630 }, { "epoch": 0.24, "learning_rate": 1.9920090699026237e-05, "loss": 0.0323, "step": 16640 }, { "epoch": 0.24, "learning_rate": 1.9920042659287763e-05, "loss": 0.0302, "step": 16650 }, { "epoch": 0.24, "learning_rate": 1.9919994619549292e-05, "loss": 0.0283, "step": 16660 }, { "epoch": 0.24, "learning_rate": 1.991994657981082e-05, "loss": 0.0326, "step": 16670 }, { "epoch": 0.24, "learning_rate": 1.9919898540072347e-05, "loss": 0.029, "step": 16680 }, { "epoch": 0.24, "learning_rate": 1.9919850500333877e-05, "loss": 0.033, "step": 16690 }, { "epoch": 0.24, "learning_rate": 1.9919802460595406e-05, "loss": 0.0325, "step": 16700 }, { "epoch": 0.24, "learning_rate": 1.9919754420856935e-05, "loss": 0.0265, "step": 16710 }, { "epoch": 0.24, "learning_rate": 1.991970638111846e-05, "loss": 0.03, "step": 16720 }, { "epoch": 0.24, "learning_rate": 1.991965834137999e-05, "loss": 0.0306, "step": 16730 }, { "epoch": 0.24, "learning_rate": 1.991961030164152e-05, "loss": 0.0319, "step": 16740 }, { "epoch": 0.24, "learning_rate": 1.9919562261903046e-05, "loss": 0.0272, "step": 16750 }, { "epoch": 0.24, "learning_rate": 1.9919514222164575e-05, "loss": 0.0341, "step": 16760 }, { "epoch": 0.24, "learning_rate": 1.9919466182426104e-05, "loss": 0.0299, "step": 16770 }, { "epoch": 0.24, "learning_rate": 1.9919418142687633e-05, "loss": 0.0348, "step": 16780 }, { "epoch": 0.24, "learning_rate": 1.991937010294916e-05, "loss": 0.0254, "step": 16790 }, { "epoch": 0.24, "learning_rate": 1.991932206321069e-05, "loss": 0.0266, "step": 16800 }, { "epoch": 0.24, "learning_rate": 1.9919274023472218e-05, "loss": 0.0325, "step": 16810 }, { "epoch": 0.24, "learning_rate": 1.9919225983733744e-05, "loss": 0.0252, "step": 16820 }, { "epoch": 0.24, "learning_rate": 1.9919177943995273e-05, "loss": 0.0297, "step": 16830 }, { "epoch": 0.24, "learning_rate": 1.9919129904256802e-05, "loss": 0.0291, "step": 16840 }, { "epoch": 0.24, "learning_rate": 1.991908186451833e-05, "loss": 0.0252, "step": 16850 }, { "epoch": 0.24, "learning_rate": 1.9919033824779857e-05, "loss": 0.0322, "step": 16860 }, { "epoch": 0.24, "learning_rate": 1.9918985785041387e-05, "loss": 0.0353, "step": 16870 }, { "epoch": 0.24, "learning_rate": 1.9918937745302916e-05, "loss": 0.0327, "step": 16880 }, { "epoch": 0.24, "learning_rate": 1.9918889705564445e-05, "loss": 0.0227, "step": 16890 }, { "epoch": 0.24, "learning_rate": 1.991884166582597e-05, "loss": 0.0257, "step": 16900 }, { "epoch": 0.24, "learning_rate": 1.99187936260875e-05, "loss": 0.0331, "step": 16910 }, { "epoch": 0.24, "learning_rate": 1.991874558634903e-05, "loss": 0.032, "step": 16920 }, { "epoch": 0.24, "learning_rate": 1.9918697546610556e-05, "loss": 0.031, "step": 16930 }, { "epoch": 0.24, "learning_rate": 1.9918649506872085e-05, "loss": 0.0328, "step": 16940 }, { "epoch": 0.24, "learning_rate": 1.9918601467133614e-05, "loss": 0.0287, "step": 16950 }, { "epoch": 0.24, "learning_rate": 1.9918553427395143e-05, "loss": 0.0299, "step": 16960 }, { "epoch": 0.24, "learning_rate": 1.991850538765667e-05, "loss": 0.0279, "step": 16970 }, { "epoch": 0.24, "learning_rate": 1.99184573479182e-05, "loss": 0.0315, "step": 16980 }, { "epoch": 0.24, "learning_rate": 1.9918409308179728e-05, "loss": 0.0315, "step": 16990 }, { "epoch": 0.25, "learning_rate": 1.9918361268441254e-05, "loss": 0.0242, "step": 17000 }, { "epoch": 0.25, "learning_rate": 1.9918313228702783e-05, "loss": 0.027, "step": 17010 }, { "epoch": 0.25, "learning_rate": 1.9918265188964312e-05, "loss": 0.0273, "step": 17020 }, { "epoch": 0.25, "learning_rate": 1.991821714922584e-05, "loss": 0.0286, "step": 17030 }, { "epoch": 0.25, "learning_rate": 1.9918169109487367e-05, "loss": 0.0307, "step": 17040 }, { "epoch": 0.25, "learning_rate": 1.9918121069748897e-05, "loss": 0.0316, "step": 17050 }, { "epoch": 0.25, "learning_rate": 1.9918073030010426e-05, "loss": 0.0245, "step": 17060 }, { "epoch": 0.25, "learning_rate": 1.9918024990271955e-05, "loss": 0.0326, "step": 17070 }, { "epoch": 0.25, "learning_rate": 1.991797695053348e-05, "loss": 0.0299, "step": 17080 }, { "epoch": 0.25, "learning_rate": 1.991792891079501e-05, "loss": 0.0251, "step": 17090 }, { "epoch": 0.25, "learning_rate": 1.991788087105654e-05, "loss": 0.0278, "step": 17100 }, { "epoch": 0.25, "learning_rate": 1.9917832831318065e-05, "loss": 0.0208, "step": 17110 }, { "epoch": 0.25, "learning_rate": 1.9917784791579595e-05, "loss": 0.029, "step": 17120 }, { "epoch": 0.25, "learning_rate": 1.9917736751841124e-05, "loss": 0.0321, "step": 17130 }, { "epoch": 0.25, "learning_rate": 1.9917688712102653e-05, "loss": 0.0284, "step": 17140 }, { "epoch": 0.25, "learning_rate": 1.991764067236418e-05, "loss": 0.0258, "step": 17150 }, { "epoch": 0.25, "learning_rate": 1.991759263262571e-05, "loss": 0.028, "step": 17160 }, { "epoch": 0.25, "learning_rate": 1.9917544592887238e-05, "loss": 0.0287, "step": 17170 }, { "epoch": 0.25, "learning_rate": 1.9917496553148764e-05, "loss": 0.0276, "step": 17180 }, { "epoch": 0.25, "learning_rate": 1.9917448513410296e-05, "loss": 0.0332, "step": 17190 }, { "epoch": 0.25, "learning_rate": 1.9917400473671825e-05, "loss": 0.0313, "step": 17200 }, { "epoch": 0.25, "learning_rate": 1.991735243393335e-05, "loss": 0.0309, "step": 17210 }, { "epoch": 0.25, "learning_rate": 1.991730439419488e-05, "loss": 0.0254, "step": 17220 }, { "epoch": 0.25, "learning_rate": 1.991725635445641e-05, "loss": 0.0276, "step": 17230 }, { "epoch": 0.25, "learning_rate": 1.9917208314717936e-05, "loss": 0.0315, "step": 17240 }, { "epoch": 0.25, "learning_rate": 1.9917160274979465e-05, "loss": 0.0229, "step": 17250 }, { "epoch": 0.25, "learning_rate": 1.9917112235240994e-05, "loss": 0.0288, "step": 17260 }, { "epoch": 0.25, "learning_rate": 1.9917064195502524e-05, "loss": 0.0291, "step": 17270 }, { "epoch": 0.25, "learning_rate": 1.991701615576405e-05, "loss": 0.0296, "step": 17280 }, { "epoch": 0.25, "learning_rate": 1.991696811602558e-05, "loss": 0.0287, "step": 17290 }, { "epoch": 0.25, "learning_rate": 1.9916920076287108e-05, "loss": 0.0283, "step": 17300 }, { "epoch": 0.25, "learning_rate": 1.9916872036548637e-05, "loss": 0.0326, "step": 17310 }, { "epoch": 0.25, "learning_rate": 1.9916823996810163e-05, "loss": 0.0283, "step": 17320 }, { "epoch": 0.25, "learning_rate": 1.9916775957071692e-05, "loss": 0.0373, "step": 17330 }, { "epoch": 0.25, "learning_rate": 1.991672791733322e-05, "loss": 0.0256, "step": 17340 }, { "epoch": 0.25, "learning_rate": 1.9916679877594748e-05, "loss": 0.0312, "step": 17350 }, { "epoch": 0.25, "learning_rate": 1.9916631837856277e-05, "loss": 0.0338, "step": 17360 }, { "epoch": 0.25, "learning_rate": 1.9916583798117806e-05, "loss": 0.0265, "step": 17370 }, { "epoch": 0.25, "learning_rate": 1.9916535758379335e-05, "loss": 0.0259, "step": 17380 }, { "epoch": 0.25, "learning_rate": 1.991648771864086e-05, "loss": 0.0282, "step": 17390 }, { "epoch": 0.25, "learning_rate": 1.991643967890239e-05, "loss": 0.0276, "step": 17400 }, { "epoch": 0.25, "learning_rate": 1.991639163916392e-05, "loss": 0.0279, "step": 17410 }, { "epoch": 0.25, "learning_rate": 1.9916343599425446e-05, "loss": 0.0333, "step": 17420 }, { "epoch": 0.25, "learning_rate": 1.9916295559686975e-05, "loss": 0.0386, "step": 17430 }, { "epoch": 0.25, "learning_rate": 1.9916247519948504e-05, "loss": 0.0276, "step": 17440 }, { "epoch": 0.25, "learning_rate": 1.9916199480210033e-05, "loss": 0.0279, "step": 17450 }, { "epoch": 0.25, "learning_rate": 1.991615144047156e-05, "loss": 0.0269, "step": 17460 }, { "epoch": 0.25, "learning_rate": 1.991610340073309e-05, "loss": 0.0331, "step": 17470 }, { "epoch": 0.25, "learning_rate": 1.9916055360994618e-05, "loss": 0.0291, "step": 17480 }, { "epoch": 0.25, "learning_rate": 1.9916007321256147e-05, "loss": 0.0339, "step": 17490 }, { "epoch": 0.25, "learning_rate": 1.9915959281517673e-05, "loss": 0.0358, "step": 17500 }, { "epoch": 0.25, "learning_rate": 1.9915911241779202e-05, "loss": 0.0287, "step": 17510 }, { "epoch": 0.25, "learning_rate": 1.991586320204073e-05, "loss": 0.0296, "step": 17520 }, { "epoch": 0.25, "learning_rate": 1.9915815162302257e-05, "loss": 0.0299, "step": 17530 }, { "epoch": 0.25, "learning_rate": 1.9915767122563787e-05, "loss": 0.0287, "step": 17540 }, { "epoch": 0.25, "learning_rate": 1.9915719082825316e-05, "loss": 0.0357, "step": 17550 }, { "epoch": 0.25, "learning_rate": 1.9915671043086845e-05, "loss": 0.0307, "step": 17560 }, { "epoch": 0.25, "learning_rate": 1.991562300334837e-05, "loss": 0.0239, "step": 17570 }, { "epoch": 0.25, "learning_rate": 1.99155749636099e-05, "loss": 0.0304, "step": 17580 }, { "epoch": 0.25, "learning_rate": 1.991552692387143e-05, "loss": 0.0313, "step": 17590 }, { "epoch": 0.25, "learning_rate": 1.9915478884132956e-05, "loss": 0.0216, "step": 17600 }, { "epoch": 0.25, "learning_rate": 1.9915430844394485e-05, "loss": 0.032, "step": 17610 }, { "epoch": 0.25, "learning_rate": 1.9915382804656014e-05, "loss": 0.0393, "step": 17620 }, { "epoch": 0.25, "learning_rate": 1.9915334764917543e-05, "loss": 0.03, "step": 17630 }, { "epoch": 0.25, "learning_rate": 1.991528672517907e-05, "loss": 0.0188, "step": 17640 }, { "epoch": 0.25, "learning_rate": 1.99152386854406e-05, "loss": 0.0334, "step": 17650 }, { "epoch": 0.25, "learning_rate": 1.9915190645702128e-05, "loss": 0.031, "step": 17660 }, { "epoch": 0.25, "learning_rate": 1.9915142605963657e-05, "loss": 0.0269, "step": 17670 }, { "epoch": 0.25, "learning_rate": 1.9915094566225183e-05, "loss": 0.0273, "step": 17680 }, { "epoch": 0.25, "learning_rate": 1.9915046526486712e-05, "loss": 0.0305, "step": 17690 }, { "epoch": 0.26, "learning_rate": 1.991499848674824e-05, "loss": 0.0329, "step": 17700 }, { "epoch": 0.26, "learning_rate": 1.9914950447009767e-05, "loss": 0.0255, "step": 17710 }, { "epoch": 0.26, "learning_rate": 1.9914902407271297e-05, "loss": 0.0329, "step": 17720 }, { "epoch": 0.26, "learning_rate": 1.9914854367532826e-05, "loss": 0.0273, "step": 17730 }, { "epoch": 0.26, "learning_rate": 1.9914806327794355e-05, "loss": 0.0326, "step": 17740 }, { "epoch": 0.26, "learning_rate": 1.991475828805588e-05, "loss": 0.0419, "step": 17750 }, { "epoch": 0.26, "learning_rate": 1.991471024831741e-05, "loss": 0.0326, "step": 17760 }, { "epoch": 0.26, "learning_rate": 1.991466220857894e-05, "loss": 0.0281, "step": 17770 }, { "epoch": 0.26, "learning_rate": 1.9914614168840466e-05, "loss": 0.0288, "step": 17780 }, { "epoch": 0.26, "learning_rate": 1.9914566129101995e-05, "loss": 0.0299, "step": 17790 }, { "epoch": 0.26, "learning_rate": 1.9914518089363524e-05, "loss": 0.0236, "step": 17800 }, { "epoch": 0.26, "learning_rate": 1.9914470049625053e-05, "loss": 0.0286, "step": 17810 }, { "epoch": 0.26, "learning_rate": 1.991442200988658e-05, "loss": 0.0296, "step": 17820 }, { "epoch": 0.26, "learning_rate": 1.991437397014811e-05, "loss": 0.0238, "step": 17830 }, { "epoch": 0.26, "learning_rate": 1.9914325930409638e-05, "loss": 0.0328, "step": 17840 }, { "epoch": 0.26, "learning_rate": 1.9914277890671167e-05, "loss": 0.0303, "step": 17850 }, { "epoch": 0.26, "learning_rate": 1.9914229850932693e-05, "loss": 0.0299, "step": 17860 }, { "epoch": 0.26, "learning_rate": 1.9914181811194222e-05, "loss": 0.0372, "step": 17870 }, { "epoch": 0.26, "learning_rate": 1.991413377145575e-05, "loss": 0.0352, "step": 17880 }, { "epoch": 0.26, "learning_rate": 1.9914085731717277e-05, "loss": 0.0257, "step": 17890 }, { "epoch": 0.26, "learning_rate": 1.9914037691978807e-05, "loss": 0.0322, "step": 17900 }, { "epoch": 0.26, "learning_rate": 1.9913989652240336e-05, "loss": 0.0375, "step": 17910 }, { "epoch": 0.26, "learning_rate": 1.9913941612501865e-05, "loss": 0.0231, "step": 17920 }, { "epoch": 0.26, "learning_rate": 1.991389357276339e-05, "loss": 0.0307, "step": 17930 }, { "epoch": 0.26, "learning_rate": 1.991384553302492e-05, "loss": 0.0319, "step": 17940 }, { "epoch": 0.26, "learning_rate": 1.991379749328645e-05, "loss": 0.0271, "step": 17950 }, { "epoch": 0.26, "learning_rate": 1.9913749453547975e-05, "loss": 0.0266, "step": 17960 }, { "epoch": 0.26, "learning_rate": 1.9913701413809505e-05, "loss": 0.0274, "step": 17970 }, { "epoch": 0.26, "learning_rate": 1.9913653374071034e-05, "loss": 0.0295, "step": 17980 }, { "epoch": 0.26, "learning_rate": 1.9913605334332563e-05, "loss": 0.0256, "step": 17990 }, { "epoch": 0.26, "learning_rate": 1.991355729459409e-05, "loss": 0.0242, "step": 18000 }, { "epoch": 0.26, "learning_rate": 1.991350925485562e-05, "loss": 0.0246, "step": 18010 }, { "epoch": 0.26, "learning_rate": 1.9913461215117148e-05, "loss": 0.0294, "step": 18020 }, { "epoch": 0.26, "learning_rate": 1.9913413175378677e-05, "loss": 0.0244, "step": 18030 }, { "epoch": 0.26, "learning_rate": 1.9913365135640203e-05, "loss": 0.0291, "step": 18040 }, { "epoch": 0.26, "learning_rate": 1.9913317095901732e-05, "loss": 0.0259, "step": 18050 }, { "epoch": 0.26, "learning_rate": 1.991326905616326e-05, "loss": 0.0321, "step": 18060 }, { "epoch": 0.26, "learning_rate": 1.9913221016424787e-05, "loss": 0.0305, "step": 18070 }, { "epoch": 0.26, "learning_rate": 1.9913172976686316e-05, "loss": 0.0283, "step": 18080 }, { "epoch": 0.26, "learning_rate": 1.9913124936947846e-05, "loss": 0.0247, "step": 18090 }, { "epoch": 0.26, "learning_rate": 1.9913076897209375e-05, "loss": 0.0285, "step": 18100 }, { "epoch": 0.26, "learning_rate": 1.99130288574709e-05, "loss": 0.0343, "step": 18110 }, { "epoch": 0.26, "learning_rate": 1.991298081773243e-05, "loss": 0.0237, "step": 18120 }, { "epoch": 0.26, "learning_rate": 1.991293277799396e-05, "loss": 0.0283, "step": 18130 }, { "epoch": 0.26, "learning_rate": 1.9912884738255485e-05, "loss": 0.0262, "step": 18140 }, { "epoch": 0.26, "learning_rate": 1.9912836698517015e-05, "loss": 0.032, "step": 18150 }, { "epoch": 0.26, "learning_rate": 1.9912788658778544e-05, "loss": 0.0257, "step": 18160 }, { "epoch": 0.26, "learning_rate": 1.9912740619040073e-05, "loss": 0.0281, "step": 18170 }, { "epoch": 0.26, "learning_rate": 1.99126925793016e-05, "loss": 0.0312, "step": 18180 }, { "epoch": 0.26, "learning_rate": 1.9912644539563128e-05, "loss": 0.0322, "step": 18190 }, { "epoch": 0.26, "learning_rate": 1.9912596499824658e-05, "loss": 0.028, "step": 18200 }, { "epoch": 0.26, "learning_rate": 1.9912548460086183e-05, "loss": 0.0238, "step": 18210 }, { "epoch": 0.26, "learning_rate": 1.9912500420347713e-05, "loss": 0.0253, "step": 18220 }, { "epoch": 0.26, "learning_rate": 1.9912452380609242e-05, "loss": 0.0272, "step": 18230 }, { "epoch": 0.26, "learning_rate": 1.991240434087077e-05, "loss": 0.0266, "step": 18240 }, { "epoch": 0.26, "learning_rate": 1.9912356301132297e-05, "loss": 0.0322, "step": 18250 }, { "epoch": 0.26, "learning_rate": 1.9912308261393826e-05, "loss": 0.0274, "step": 18260 }, { "epoch": 0.26, "learning_rate": 1.9912260221655356e-05, "loss": 0.0292, "step": 18270 }, { "epoch": 0.26, "learning_rate": 1.9912212181916885e-05, "loss": 0.029, "step": 18280 }, { "epoch": 0.26, "learning_rate": 1.991216414217841e-05, "loss": 0.0327, "step": 18290 }, { "epoch": 0.26, "learning_rate": 1.991211610243994e-05, "loss": 0.0256, "step": 18300 }, { "epoch": 0.26, "learning_rate": 1.991206806270147e-05, "loss": 0.0283, "step": 18310 }, { "epoch": 0.26, "learning_rate": 1.9912020022962995e-05, "loss": 0.0333, "step": 18320 }, { "epoch": 0.26, "learning_rate": 1.9911971983224525e-05, "loss": 0.0269, "step": 18330 }, { "epoch": 0.26, "learning_rate": 1.9911923943486054e-05, "loss": 0.0298, "step": 18340 }, { "epoch": 0.26, "learning_rate": 1.9911875903747583e-05, "loss": 0.0335, "step": 18350 }, { "epoch": 0.26, "learning_rate": 1.991182786400911e-05, "loss": 0.0243, "step": 18360 }, { "epoch": 0.26, "learning_rate": 1.9911779824270638e-05, "loss": 0.0258, "step": 18370 }, { "epoch": 0.26, "learning_rate": 1.9911731784532167e-05, "loss": 0.0313, "step": 18380 }, { "epoch": 0.27, "learning_rate": 1.9911683744793693e-05, "loss": 0.0267, "step": 18390 }, { "epoch": 0.27, "learning_rate": 1.9911635705055223e-05, "loss": 0.0356, "step": 18400 }, { "epoch": 0.27, "learning_rate": 1.9911587665316752e-05, "loss": 0.0307, "step": 18410 }, { "epoch": 0.27, "learning_rate": 1.991153962557828e-05, "loss": 0.026, "step": 18420 }, { "epoch": 0.27, "learning_rate": 1.9911491585839807e-05, "loss": 0.0298, "step": 18430 }, { "epoch": 0.27, "learning_rate": 1.9911443546101336e-05, "loss": 0.0236, "step": 18440 }, { "epoch": 0.27, "learning_rate": 1.9911395506362866e-05, "loss": 0.0328, "step": 18450 }, { "epoch": 0.27, "learning_rate": 1.9911347466624395e-05, "loss": 0.0295, "step": 18460 }, { "epoch": 0.27, "learning_rate": 1.991129942688592e-05, "loss": 0.0346, "step": 18470 }, { "epoch": 0.27, "learning_rate": 1.991125138714745e-05, "loss": 0.0377, "step": 18480 }, { "epoch": 0.27, "learning_rate": 1.991120334740898e-05, "loss": 0.0322, "step": 18490 }, { "epoch": 0.27, "learning_rate": 1.9911155307670505e-05, "loss": 0.0299, "step": 18500 }, { "epoch": 0.27, "learning_rate": 1.9911107267932034e-05, "loss": 0.0333, "step": 18510 }, { "epoch": 0.27, "learning_rate": 1.9911059228193564e-05, "loss": 0.0292, "step": 18520 }, { "epoch": 0.27, "learning_rate": 1.9911011188455093e-05, "loss": 0.0224, "step": 18530 }, { "epoch": 0.27, "learning_rate": 1.991096314871662e-05, "loss": 0.0281, "step": 18540 }, { "epoch": 0.27, "learning_rate": 1.9910915108978148e-05, "loss": 0.0337, "step": 18550 }, { "epoch": 0.27, "learning_rate": 1.9910867069239677e-05, "loss": 0.0273, "step": 18560 }, { "epoch": 0.27, "learning_rate": 1.9910819029501203e-05, "loss": 0.0322, "step": 18570 }, { "epoch": 0.27, "learning_rate": 1.9910770989762733e-05, "loss": 0.0332, "step": 18580 }, { "epoch": 0.27, "learning_rate": 1.9910722950024262e-05, "loss": 0.0262, "step": 18590 }, { "epoch": 0.27, "learning_rate": 1.991067491028579e-05, "loss": 0.0305, "step": 18600 }, { "epoch": 0.27, "learning_rate": 1.9910626870547317e-05, "loss": 0.0303, "step": 18610 }, { "epoch": 0.27, "learning_rate": 1.9910578830808846e-05, "loss": 0.0322, "step": 18620 }, { "epoch": 0.27, "learning_rate": 1.9910530791070376e-05, "loss": 0.0261, "step": 18630 }, { "epoch": 0.27, "learning_rate": 1.9910482751331905e-05, "loss": 0.0266, "step": 18640 }, { "epoch": 0.27, "learning_rate": 1.991043471159343e-05, "loss": 0.0379, "step": 18650 }, { "epoch": 0.27, "learning_rate": 1.991038667185496e-05, "loss": 0.0318, "step": 18660 }, { "epoch": 0.27, "learning_rate": 1.991033863211649e-05, "loss": 0.0282, "step": 18670 }, { "epoch": 0.27, "learning_rate": 1.9910290592378015e-05, "loss": 0.0354, "step": 18680 }, { "epoch": 0.27, "learning_rate": 1.9910242552639544e-05, "loss": 0.0373, "step": 18690 }, { "epoch": 0.27, "learning_rate": 1.9910194512901074e-05, "loss": 0.0338, "step": 18700 }, { "epoch": 0.27, "learning_rate": 1.9910146473162603e-05, "loss": 0.0359, "step": 18710 }, { "epoch": 0.27, "learning_rate": 1.991009843342413e-05, "loss": 0.0255, "step": 18720 }, { "epoch": 0.27, "learning_rate": 1.9910050393685658e-05, "loss": 0.0282, "step": 18730 }, { "epoch": 0.27, "learning_rate": 1.9910002353947187e-05, "loss": 0.0292, "step": 18740 }, { "epoch": 0.27, "learning_rate": 1.9909954314208713e-05, "loss": 0.0261, "step": 18750 }, { "epoch": 0.27, "learning_rate": 1.9909906274470242e-05, "loss": 0.0317, "step": 18760 }, { "epoch": 0.27, "learning_rate": 1.9909858234731772e-05, "loss": 0.0246, "step": 18770 }, { "epoch": 0.27, "learning_rate": 1.99098101949933e-05, "loss": 0.0232, "step": 18780 }, { "epoch": 0.27, "learning_rate": 1.9909762155254827e-05, "loss": 0.029, "step": 18790 }, { "epoch": 0.27, "learning_rate": 1.9909714115516356e-05, "loss": 0.032, "step": 18800 }, { "epoch": 0.27, "learning_rate": 1.9909666075777885e-05, "loss": 0.0312, "step": 18810 }, { "epoch": 0.27, "learning_rate": 1.9909618036039415e-05, "loss": 0.0308, "step": 18820 }, { "epoch": 0.27, "learning_rate": 1.990956999630094e-05, "loss": 0.0273, "step": 18830 }, { "epoch": 0.27, "learning_rate": 1.990952195656247e-05, "loss": 0.0287, "step": 18840 }, { "epoch": 0.27, "learning_rate": 1.9909473916824e-05, "loss": 0.0214, "step": 18850 }, { "epoch": 0.27, "learning_rate": 1.9909425877085525e-05, "loss": 0.0237, "step": 18860 }, { "epoch": 0.27, "learning_rate": 1.9909377837347054e-05, "loss": 0.0314, "step": 18870 }, { "epoch": 0.27, "learning_rate": 1.9909329797608584e-05, "loss": 0.0331, "step": 18880 }, { "epoch": 0.27, "learning_rate": 1.9909281757870113e-05, "loss": 0.029, "step": 18890 }, { "epoch": 0.27, "learning_rate": 1.990923371813164e-05, "loss": 0.0358, "step": 18900 }, { "epoch": 0.27, "learning_rate": 1.9909185678393168e-05, "loss": 0.0256, "step": 18910 }, { "epoch": 0.27, "learning_rate": 1.9909137638654697e-05, "loss": 0.0295, "step": 18920 }, { "epoch": 0.27, "learning_rate": 1.9909089598916223e-05, "loss": 0.0312, "step": 18930 }, { "epoch": 0.27, "learning_rate": 1.9909041559177752e-05, "loss": 0.0277, "step": 18940 }, { "epoch": 0.27, "learning_rate": 1.990899351943928e-05, "loss": 0.0313, "step": 18950 }, { "epoch": 0.27, "learning_rate": 1.990894547970081e-05, "loss": 0.0326, "step": 18960 }, { "epoch": 0.27, "learning_rate": 1.9908897439962337e-05, "loss": 0.0246, "step": 18970 }, { "epoch": 0.27, "learning_rate": 1.9908849400223866e-05, "loss": 0.0326, "step": 18980 }, { "epoch": 0.27, "learning_rate": 1.9908801360485395e-05, "loss": 0.0278, "step": 18990 }, { "epoch": 0.27, "learning_rate": 1.9908753320746925e-05, "loss": 0.0225, "step": 19000 }, { "epoch": 0.27, "learning_rate": 1.990870528100845e-05, "loss": 0.0258, "step": 19010 }, { "epoch": 0.27, "learning_rate": 1.990865724126998e-05, "loss": 0.0286, "step": 19020 }, { "epoch": 0.27, "learning_rate": 1.990860920153151e-05, "loss": 0.0253, "step": 19030 }, { "epoch": 0.27, "learning_rate": 1.9908561161793035e-05, "loss": 0.0413, "step": 19040 }, { "epoch": 0.27, "learning_rate": 1.9908513122054564e-05, "loss": 0.0256, "step": 19050 }, { "epoch": 0.27, "learning_rate": 1.9908465082316093e-05, "loss": 0.0301, "step": 19060 }, { "epoch": 0.27, "learning_rate": 1.9908417042577623e-05, "loss": 0.0253, "step": 19070 }, { "epoch": 0.27, "learning_rate": 1.990836900283915e-05, "loss": 0.0315, "step": 19080 }, { "epoch": 0.28, "learning_rate": 1.9908320963100678e-05, "loss": 0.0289, "step": 19090 }, { "epoch": 0.28, "learning_rate": 1.9908272923362207e-05, "loss": 0.0264, "step": 19100 }, { "epoch": 0.28, "learning_rate": 1.9908224883623733e-05, "loss": 0.0373, "step": 19110 }, { "epoch": 0.28, "learning_rate": 1.9908176843885262e-05, "loss": 0.0318, "step": 19120 }, { "epoch": 0.28, "learning_rate": 1.990812880414679e-05, "loss": 0.0246, "step": 19130 }, { "epoch": 0.28, "learning_rate": 1.990808076440832e-05, "loss": 0.0256, "step": 19140 }, { "epoch": 0.28, "learning_rate": 1.9908032724669847e-05, "loss": 0.034, "step": 19150 }, { "epoch": 0.28, "learning_rate": 1.9907984684931376e-05, "loss": 0.027, "step": 19160 }, { "epoch": 0.28, "learning_rate": 1.9907936645192905e-05, "loss": 0.0269, "step": 19170 }, { "epoch": 0.28, "learning_rate": 1.9907888605454435e-05, "loss": 0.0262, "step": 19180 }, { "epoch": 0.28, "learning_rate": 1.990784056571596e-05, "loss": 0.0289, "step": 19190 }, { "epoch": 0.28, "learning_rate": 1.990779252597749e-05, "loss": 0.0281, "step": 19200 }, { "epoch": 0.28, "learning_rate": 1.990774448623902e-05, "loss": 0.0243, "step": 19210 }, { "epoch": 0.28, "learning_rate": 1.9907696446500545e-05, "loss": 0.0208, "step": 19220 }, { "epoch": 0.28, "learning_rate": 1.9907648406762074e-05, "loss": 0.024, "step": 19230 }, { "epoch": 0.28, "learning_rate": 1.9907600367023603e-05, "loss": 0.0331, "step": 19240 }, { "epoch": 0.28, "learning_rate": 1.9907552327285133e-05, "loss": 0.0277, "step": 19250 }, { "epoch": 0.28, "learning_rate": 1.990750428754666e-05, "loss": 0.0229, "step": 19260 }, { "epoch": 0.28, "learning_rate": 1.9907456247808188e-05, "loss": 0.0264, "step": 19270 }, { "epoch": 0.28, "learning_rate": 1.9907408208069717e-05, "loss": 0.0329, "step": 19280 }, { "epoch": 0.28, "learning_rate": 1.9907360168331243e-05, "loss": 0.0306, "step": 19290 }, { "epoch": 0.28, "learning_rate": 1.9907312128592772e-05, "loss": 0.0284, "step": 19300 }, { "epoch": 0.28, "learning_rate": 1.99072640888543e-05, "loss": 0.0283, "step": 19310 }, { "epoch": 0.28, "learning_rate": 1.990721604911583e-05, "loss": 0.0291, "step": 19320 }, { "epoch": 0.28, "learning_rate": 1.9907168009377357e-05, "loss": 0.0261, "step": 19330 }, { "epoch": 0.28, "learning_rate": 1.9907119969638886e-05, "loss": 0.0268, "step": 19340 }, { "epoch": 0.28, "learning_rate": 1.9907071929900415e-05, "loss": 0.0267, "step": 19350 }, { "epoch": 0.28, "learning_rate": 1.9907023890161944e-05, "loss": 0.0283, "step": 19360 }, { "epoch": 0.28, "learning_rate": 1.990697585042347e-05, "loss": 0.0287, "step": 19370 }, { "epoch": 0.28, "learning_rate": 1.9906927810685e-05, "loss": 0.0297, "step": 19380 }, { "epoch": 0.28, "learning_rate": 1.990687977094653e-05, "loss": 0.0342, "step": 19390 }, { "epoch": 0.28, "learning_rate": 1.9906831731208055e-05, "loss": 0.0316, "step": 19400 }, { "epoch": 0.28, "learning_rate": 1.9906783691469584e-05, "loss": 0.0264, "step": 19410 }, { "epoch": 0.28, "learning_rate": 1.9906735651731113e-05, "loss": 0.0289, "step": 19420 }, { "epoch": 0.28, "learning_rate": 1.9906687611992643e-05, "loss": 0.0271, "step": 19430 }, { "epoch": 0.28, "learning_rate": 1.990663957225417e-05, "loss": 0.0275, "step": 19440 }, { "epoch": 0.28, "learning_rate": 1.9906591532515698e-05, "loss": 0.0279, "step": 19450 }, { "epoch": 0.28, "learning_rate": 1.9906543492777227e-05, "loss": 0.0325, "step": 19460 }, { "epoch": 0.28, "learning_rate": 1.9906495453038753e-05, "loss": 0.0276, "step": 19470 }, { "epoch": 0.28, "learning_rate": 1.9906447413300282e-05, "loss": 0.0308, "step": 19480 }, { "epoch": 0.28, "learning_rate": 1.990639937356181e-05, "loss": 0.0317, "step": 19490 }, { "epoch": 0.28, "learning_rate": 1.990635133382334e-05, "loss": 0.0285, "step": 19500 }, { "epoch": 0.28, "learning_rate": 1.9906303294084867e-05, "loss": 0.0225, "step": 19510 }, { "epoch": 0.28, "learning_rate": 1.9906255254346396e-05, "loss": 0.0205, "step": 19520 }, { "epoch": 0.28, "learning_rate": 1.9906207214607925e-05, "loss": 0.0301, "step": 19530 }, { "epoch": 0.28, "learning_rate": 1.9906159174869454e-05, "loss": 0.0296, "step": 19540 }, { "epoch": 0.28, "learning_rate": 1.990611113513098e-05, "loss": 0.0238, "step": 19550 }, { "epoch": 0.28, "learning_rate": 1.990606309539251e-05, "loss": 0.0267, "step": 19560 }, { "epoch": 0.28, "learning_rate": 1.990601505565404e-05, "loss": 0.0224, "step": 19570 }, { "epoch": 0.28, "learning_rate": 1.9905967015915565e-05, "loss": 0.0292, "step": 19580 }, { "epoch": 0.28, "learning_rate": 1.9905918976177094e-05, "loss": 0.0287, "step": 19590 }, { "epoch": 0.28, "learning_rate": 1.9905870936438623e-05, "loss": 0.0199, "step": 19600 }, { "epoch": 0.28, "learning_rate": 1.9905822896700152e-05, "loss": 0.0289, "step": 19610 }, { "epoch": 0.28, "learning_rate": 1.990577485696168e-05, "loss": 0.027, "step": 19620 }, { "epoch": 0.28, "learning_rate": 1.9905726817223208e-05, "loss": 0.0283, "step": 19630 }, { "epoch": 0.28, "learning_rate": 1.9905678777484737e-05, "loss": 0.0245, "step": 19640 }, { "epoch": 0.28, "learning_rate": 1.9905630737746263e-05, "loss": 0.027, "step": 19650 }, { "epoch": 0.28, "learning_rate": 1.9905582698007792e-05, "loss": 0.0263, "step": 19660 }, { "epoch": 0.28, "learning_rate": 1.990553465826932e-05, "loss": 0.0257, "step": 19670 }, { "epoch": 0.28, "learning_rate": 1.990548661853085e-05, "loss": 0.0275, "step": 19680 }, { "epoch": 0.28, "learning_rate": 1.9905438578792376e-05, "loss": 0.0364, "step": 19690 }, { "epoch": 0.28, "learning_rate": 1.9905390539053906e-05, "loss": 0.0312, "step": 19700 }, { "epoch": 0.28, "learning_rate": 1.9905342499315435e-05, "loss": 0.0271, "step": 19710 }, { "epoch": 0.28, "learning_rate": 1.9905294459576964e-05, "loss": 0.0269, "step": 19720 }, { "epoch": 0.28, "learning_rate": 1.990524641983849e-05, "loss": 0.0235, "step": 19730 }, { "epoch": 0.28, "learning_rate": 1.990519838010002e-05, "loss": 0.0254, "step": 19740 }, { "epoch": 0.28, "learning_rate": 1.990515034036155e-05, "loss": 0.0242, "step": 19750 }, { "epoch": 0.28, "learning_rate": 1.9905102300623078e-05, "loss": 0.0239, "step": 19760 }, { "epoch": 0.28, "learning_rate": 1.9905054260884607e-05, "loss": 0.025, "step": 19770 }, { "epoch": 0.29, "learning_rate": 1.9905006221146133e-05, "loss": 0.0302, "step": 19780 }, { "epoch": 0.29, "learning_rate": 1.9904958181407662e-05, "loss": 0.0199, "step": 19790 }, { "epoch": 0.29, "learning_rate": 1.990491014166919e-05, "loss": 0.0313, "step": 19800 }, { "epoch": 0.29, "learning_rate": 1.990486210193072e-05, "loss": 0.0235, "step": 19810 }, { "epoch": 0.29, "learning_rate": 1.9904814062192247e-05, "loss": 0.0273, "step": 19820 }, { "epoch": 0.29, "learning_rate": 1.9904766022453776e-05, "loss": 0.0214, "step": 19830 }, { "epoch": 0.29, "learning_rate": 1.9904717982715305e-05, "loss": 0.0325, "step": 19840 }, { "epoch": 0.29, "learning_rate": 1.9904669942976835e-05, "loss": 0.0316, "step": 19850 }, { "epoch": 0.29, "learning_rate": 1.990462190323836e-05, "loss": 0.0325, "step": 19860 }, { "epoch": 0.29, "learning_rate": 1.990457386349989e-05, "loss": 0.0322, "step": 19870 }, { "epoch": 0.29, "learning_rate": 1.990452582376142e-05, "loss": 0.0278, "step": 19880 }, { "epoch": 0.29, "learning_rate": 1.9904477784022945e-05, "loss": 0.0299, "step": 19890 }, { "epoch": 0.29, "learning_rate": 1.9904429744284474e-05, "loss": 0.0247, "step": 19900 }, { "epoch": 0.29, "learning_rate": 1.9904381704546003e-05, "loss": 0.0314, "step": 19910 }, { "epoch": 0.29, "learning_rate": 1.9904333664807533e-05, "loss": 0.0275, "step": 19920 }, { "epoch": 0.29, "learning_rate": 1.9904290429042904e-05, "loss": 0.0335, "step": 19930 }, { "epoch": 0.29, "learning_rate": 1.9904242389304433e-05, "loss": 0.0237, "step": 19940 }, { "epoch": 0.29, "learning_rate": 1.9904194349565963e-05, "loss": 0.0276, "step": 19950 }, { "epoch": 0.29, "learning_rate": 1.990414630982749e-05, "loss": 0.0293, "step": 19960 }, { "epoch": 0.29, "learning_rate": 1.9904098270089018e-05, "loss": 0.0253, "step": 19970 }, { "epoch": 0.29, "learning_rate": 1.9904050230350547e-05, "loss": 0.0278, "step": 19980 }, { "epoch": 0.29, "learning_rate": 1.9904002190612076e-05, "loss": 0.0244, "step": 19990 }, { "epoch": 0.29, "learning_rate": 1.9903954150873602e-05, "loss": 0.0245, "step": 20000 }, { "epoch": 0.29, "learning_rate": 1.990390611113513e-05, "loss": 0.0264, "step": 20010 }, { "epoch": 0.29, "learning_rate": 1.990385807139666e-05, "loss": 0.0263, "step": 20020 }, { "epoch": 0.29, "learning_rate": 1.990381003165819e-05, "loss": 0.0272, "step": 20030 }, { "epoch": 0.29, "learning_rate": 1.9903761991919716e-05, "loss": 0.0209, "step": 20040 }, { "epoch": 0.29, "learning_rate": 1.9903713952181245e-05, "loss": 0.0329, "step": 20050 }, { "epoch": 0.29, "learning_rate": 1.9903665912442774e-05, "loss": 0.0294, "step": 20060 }, { "epoch": 0.29, "learning_rate": 1.99036178727043e-05, "loss": 0.0224, "step": 20070 }, { "epoch": 0.29, "learning_rate": 1.990356983296583e-05, "loss": 0.0268, "step": 20080 }, { "epoch": 0.29, "learning_rate": 1.990352179322736e-05, "loss": 0.0297, "step": 20090 }, { "epoch": 0.29, "learning_rate": 1.9903473753488888e-05, "loss": 0.0279, "step": 20100 }, { "epoch": 0.29, "learning_rate": 1.9903425713750414e-05, "loss": 0.0249, "step": 20110 }, { "epoch": 0.29, "learning_rate": 1.9903377674011943e-05, "loss": 0.0361, "step": 20120 }, { "epoch": 0.29, "learning_rate": 1.9903329634273472e-05, "loss": 0.0226, "step": 20130 }, { "epoch": 0.29, "learning_rate": 1.9903281594535e-05, "loss": 0.0301, "step": 20140 }, { "epoch": 0.29, "learning_rate": 1.9903233554796528e-05, "loss": 0.0271, "step": 20150 }, { "epoch": 0.29, "learning_rate": 1.9903185515058057e-05, "loss": 0.028, "step": 20160 }, { "epoch": 0.29, "learning_rate": 1.9903137475319586e-05, "loss": 0.0247, "step": 20170 }, { "epoch": 0.29, "learning_rate": 1.9903089435581112e-05, "loss": 0.0293, "step": 20180 }, { "epoch": 0.29, "learning_rate": 1.990304139584264e-05, "loss": 0.0231, "step": 20190 }, { "epoch": 0.29, "learning_rate": 1.990299335610417e-05, "loss": 0.0294, "step": 20200 }, { "epoch": 0.29, "learning_rate": 1.99029453163657e-05, "loss": 0.0302, "step": 20210 }, { "epoch": 0.29, "learning_rate": 1.9902897276627226e-05, "loss": 0.0296, "step": 20220 }, { "epoch": 0.29, "learning_rate": 1.9902849236888755e-05, "loss": 0.0292, "step": 20230 }, { "epoch": 0.29, "learning_rate": 1.9902801197150284e-05, "loss": 0.0334, "step": 20240 }, { "epoch": 0.29, "learning_rate": 1.990275315741181e-05, "loss": 0.0265, "step": 20250 }, { "epoch": 0.29, "learning_rate": 1.9902705117673343e-05, "loss": 0.0308, "step": 20260 }, { "epoch": 0.29, "learning_rate": 1.9902657077934872e-05, "loss": 0.0235, "step": 20270 }, { "epoch": 0.29, "learning_rate": 1.9902609038196398e-05, "loss": 0.026, "step": 20280 }, { "epoch": 0.29, "learning_rate": 1.9902560998457927e-05, "loss": 0.0287, "step": 20290 }, { "epoch": 0.29, "learning_rate": 1.9902512958719456e-05, "loss": 0.0232, "step": 20300 }, { "epoch": 0.29, "learning_rate": 1.9902464918980982e-05, "loss": 0.0288, "step": 20310 }, { "epoch": 0.29, "learning_rate": 1.990241687924251e-05, "loss": 0.0232, "step": 20320 }, { "epoch": 0.29, "learning_rate": 1.990236883950404e-05, "loss": 0.0257, "step": 20330 }, { "epoch": 0.29, "learning_rate": 1.990232079976557e-05, "loss": 0.0252, "step": 20340 }, { "epoch": 0.29, "learning_rate": 1.9902272760027096e-05, "loss": 0.0195, "step": 20350 }, { "epoch": 0.29, "learning_rate": 1.9902224720288625e-05, "loss": 0.0314, "step": 20360 }, { "epoch": 0.29, "learning_rate": 1.9902176680550155e-05, "loss": 0.0332, "step": 20370 }, { "epoch": 0.29, "learning_rate": 1.990212864081168e-05, "loss": 0.0322, "step": 20380 }, { "epoch": 0.29, "learning_rate": 1.990208060107321e-05, "loss": 0.0262, "step": 20390 }, { "epoch": 0.29, "learning_rate": 1.990203256133474e-05, "loss": 0.0301, "step": 20400 }, { "epoch": 0.29, "learning_rate": 1.9901984521596268e-05, "loss": 0.0234, "step": 20410 }, { "epoch": 0.29, "learning_rate": 1.9901936481857794e-05, "loss": 0.0258, "step": 20420 }, { "epoch": 0.29, "learning_rate": 1.9901888442119323e-05, "loss": 0.0297, "step": 20430 }, { "epoch": 0.29, "learning_rate": 1.9901840402380853e-05, "loss": 0.0316, "step": 20440 }, { "epoch": 0.29, "learning_rate": 1.9901792362642382e-05, "loss": 0.0258, "step": 20450 }, { "epoch": 0.29, "learning_rate": 1.9901744322903908e-05, "loss": 0.0283, "step": 20460 }, { "epoch": 0.3, "learning_rate": 1.9901696283165437e-05, "loss": 0.0283, "step": 20470 }, { "epoch": 0.3, "learning_rate": 1.9901648243426966e-05, "loss": 0.0299, "step": 20480 }, { "epoch": 0.3, "learning_rate": 1.9901600203688492e-05, "loss": 0.0317, "step": 20490 }, { "epoch": 0.3, "learning_rate": 1.990155216395002e-05, "loss": 0.0301, "step": 20500 }, { "epoch": 0.3, "learning_rate": 1.990150412421155e-05, "loss": 0.0353, "step": 20510 }, { "epoch": 0.3, "learning_rate": 1.990145608447308e-05, "loss": 0.0236, "step": 20520 }, { "epoch": 0.3, "learning_rate": 1.9901408044734606e-05, "loss": 0.0259, "step": 20530 }, { "epoch": 0.3, "learning_rate": 1.9901360004996135e-05, "loss": 0.0253, "step": 20540 }, { "epoch": 0.3, "learning_rate": 1.9901311965257664e-05, "loss": 0.036, "step": 20550 }, { "epoch": 0.3, "learning_rate": 1.990126392551919e-05, "loss": 0.024, "step": 20560 }, { "epoch": 0.3, "learning_rate": 1.990121588578072e-05, "loss": 0.0274, "step": 20570 }, { "epoch": 0.3, "learning_rate": 1.990116784604225e-05, "loss": 0.0305, "step": 20580 }, { "epoch": 0.3, "learning_rate": 1.9901119806303778e-05, "loss": 0.0318, "step": 20590 }, { "epoch": 0.3, "learning_rate": 1.9901071766565304e-05, "loss": 0.0252, "step": 20600 }, { "epoch": 0.3, "learning_rate": 1.9901023726826833e-05, "loss": 0.0234, "step": 20610 }, { "epoch": 0.3, "learning_rate": 1.9900975687088363e-05, "loss": 0.0265, "step": 20620 }, { "epoch": 0.3, "learning_rate": 1.9900927647349892e-05, "loss": 0.0257, "step": 20630 }, { "epoch": 0.3, "learning_rate": 1.9900879607611418e-05, "loss": 0.0247, "step": 20640 }, { "epoch": 0.3, "learning_rate": 1.9900831567872947e-05, "loss": 0.0339, "step": 20650 }, { "epoch": 0.3, "learning_rate": 1.9900783528134476e-05, "loss": 0.0212, "step": 20660 }, { "epoch": 0.3, "learning_rate": 1.9900735488396002e-05, "loss": 0.0218, "step": 20670 }, { "epoch": 0.3, "learning_rate": 1.990068744865753e-05, "loss": 0.0352, "step": 20680 }, { "epoch": 0.3, "learning_rate": 1.990063940891906e-05, "loss": 0.0314, "step": 20690 }, { "epoch": 0.3, "learning_rate": 1.990059136918059e-05, "loss": 0.0343, "step": 20700 }, { "epoch": 0.3, "learning_rate": 1.9900543329442116e-05, "loss": 0.0289, "step": 20710 }, { "epoch": 0.3, "learning_rate": 1.9900495289703645e-05, "loss": 0.0232, "step": 20720 }, { "epoch": 0.3, "learning_rate": 1.9900447249965174e-05, "loss": 0.0276, "step": 20730 }, { "epoch": 0.3, "learning_rate": 1.99003992102267e-05, "loss": 0.036, "step": 20740 }, { "epoch": 0.3, "learning_rate": 1.990035117048823e-05, "loss": 0.0327, "step": 20750 }, { "epoch": 0.3, "learning_rate": 1.990030313074976e-05, "loss": 0.026, "step": 20760 }, { "epoch": 0.3, "learning_rate": 1.9900255091011288e-05, "loss": 0.0272, "step": 20770 }, { "epoch": 0.3, "learning_rate": 1.9900207051272814e-05, "loss": 0.0255, "step": 20780 }, { "epoch": 0.3, "learning_rate": 1.9900159011534343e-05, "loss": 0.027, "step": 20790 }, { "epoch": 0.3, "learning_rate": 1.9900110971795873e-05, "loss": 0.0254, "step": 20800 }, { "epoch": 0.3, "learning_rate": 1.9900062932057402e-05, "loss": 0.0281, "step": 20810 }, { "epoch": 0.3, "learning_rate": 1.9900014892318928e-05, "loss": 0.0243, "step": 20820 }, { "epoch": 0.3, "learning_rate": 1.9899966852580457e-05, "loss": 0.0244, "step": 20830 }, { "epoch": 0.3, "learning_rate": 1.9899918812841986e-05, "loss": 0.0305, "step": 20840 }, { "epoch": 0.3, "learning_rate": 1.9899870773103512e-05, "loss": 0.0319, "step": 20850 }, { "epoch": 0.3, "learning_rate": 1.989982273336504e-05, "loss": 0.0276, "step": 20860 }, { "epoch": 0.3, "learning_rate": 1.989977469362657e-05, "loss": 0.0386, "step": 20870 }, { "epoch": 0.3, "learning_rate": 1.98997266538881e-05, "loss": 0.0253, "step": 20880 }, { "epoch": 0.3, "learning_rate": 1.9899678614149626e-05, "loss": 0.0244, "step": 20890 }, { "epoch": 0.3, "learning_rate": 1.9899630574411155e-05, "loss": 0.0257, "step": 20900 }, { "epoch": 0.3, "learning_rate": 1.9899582534672684e-05, "loss": 0.0265, "step": 20910 }, { "epoch": 0.3, "learning_rate": 1.989953449493421e-05, "loss": 0.0277, "step": 20920 }, { "epoch": 0.3, "learning_rate": 1.989948645519574e-05, "loss": 0.0248, "step": 20930 }, { "epoch": 0.3, "learning_rate": 1.989943841545727e-05, "loss": 0.0314, "step": 20940 }, { "epoch": 0.3, "learning_rate": 1.9899390375718798e-05, "loss": 0.0257, "step": 20950 }, { "epoch": 0.3, "learning_rate": 1.9899342335980324e-05, "loss": 0.0318, "step": 20960 }, { "epoch": 0.3, "learning_rate": 1.9899294296241853e-05, "loss": 0.0243, "step": 20970 }, { "epoch": 0.3, "learning_rate": 1.9899246256503382e-05, "loss": 0.0302, "step": 20980 }, { "epoch": 0.3, "learning_rate": 1.9899198216764912e-05, "loss": 0.0271, "step": 20990 }, { "epoch": 0.3, "learning_rate": 1.9899150177026438e-05, "loss": 0.0343, "step": 21000 }, { "epoch": 0.3, "learning_rate": 1.9899102137287967e-05, "loss": 0.028, "step": 21010 }, { "epoch": 0.3, "learning_rate": 1.9899054097549496e-05, "loss": 0.0242, "step": 21020 }, { "epoch": 0.3, "learning_rate": 1.9899006057811022e-05, "loss": 0.0253, "step": 21030 }, { "epoch": 0.3, "learning_rate": 1.989895801807255e-05, "loss": 0.0274, "step": 21040 }, { "epoch": 0.3, "learning_rate": 1.989890997833408e-05, "loss": 0.0281, "step": 21050 }, { "epoch": 0.3, "learning_rate": 1.989886193859561e-05, "loss": 0.0279, "step": 21060 }, { "epoch": 0.3, "learning_rate": 1.9898813898857136e-05, "loss": 0.0296, "step": 21070 }, { "epoch": 0.3, "learning_rate": 1.9898765859118665e-05, "loss": 0.0285, "step": 21080 }, { "epoch": 0.3, "learning_rate": 1.9898717819380194e-05, "loss": 0.0267, "step": 21090 }, { "epoch": 0.3, "learning_rate": 1.989866977964172e-05, "loss": 0.0298, "step": 21100 }, { "epoch": 0.3, "learning_rate": 1.989862173990325e-05, "loss": 0.0256, "step": 21110 }, { "epoch": 0.3, "learning_rate": 1.989857370016478e-05, "loss": 0.02, "step": 21120 }, { "epoch": 0.3, "learning_rate": 1.9898525660426308e-05, "loss": 0.0201, "step": 21130 }, { "epoch": 0.3, "learning_rate": 1.9898477620687834e-05, "loss": 0.0317, "step": 21140 }, { "epoch": 0.3, "learning_rate": 1.9898429580949363e-05, "loss": 0.0392, "step": 21150 }, { "epoch": 0.3, "learning_rate": 1.9898381541210892e-05, "loss": 0.0258, "step": 21160 }, { "epoch": 0.31, "learning_rate": 1.989833350147242e-05, "loss": 0.0267, "step": 21170 }, { "epoch": 0.31, "learning_rate": 1.9898285461733948e-05, "loss": 0.0247, "step": 21180 }, { "epoch": 0.31, "learning_rate": 1.9898237421995477e-05, "loss": 0.0269, "step": 21190 }, { "epoch": 0.31, "learning_rate": 1.9898189382257006e-05, "loss": 0.0292, "step": 21200 }, { "epoch": 0.31, "learning_rate": 1.9898141342518532e-05, "loss": 0.0264, "step": 21210 }, { "epoch": 0.31, "learning_rate": 1.989809330278006e-05, "loss": 0.0237, "step": 21220 }, { "epoch": 0.31, "learning_rate": 1.989804526304159e-05, "loss": 0.0239, "step": 21230 }, { "epoch": 0.31, "learning_rate": 1.989799722330312e-05, "loss": 0.0221, "step": 21240 }, { "epoch": 0.31, "learning_rate": 1.9897949183564646e-05, "loss": 0.0249, "step": 21250 }, { "epoch": 0.31, "learning_rate": 1.9897901143826175e-05, "loss": 0.0264, "step": 21260 }, { "epoch": 0.31, "learning_rate": 1.9897853104087704e-05, "loss": 0.0202, "step": 21270 }, { "epoch": 0.31, "learning_rate": 1.989780506434923e-05, "loss": 0.0291, "step": 21280 }, { "epoch": 0.31, "learning_rate": 1.989775702461076e-05, "loss": 0.029, "step": 21290 }, { "epoch": 0.31, "learning_rate": 1.989770898487229e-05, "loss": 0.026, "step": 21300 }, { "epoch": 0.31, "learning_rate": 1.9897660945133818e-05, "loss": 0.0199, "step": 21310 }, { "epoch": 0.31, "learning_rate": 1.9897612905395344e-05, "loss": 0.0252, "step": 21320 }, { "epoch": 0.31, "learning_rate": 1.9897564865656873e-05, "loss": 0.0268, "step": 21330 }, { "epoch": 0.31, "learning_rate": 1.9897516825918402e-05, "loss": 0.0237, "step": 21340 }, { "epoch": 0.31, "learning_rate": 1.9897468786179928e-05, "loss": 0.0341, "step": 21350 }, { "epoch": 0.31, "learning_rate": 1.9897420746441457e-05, "loss": 0.0239, "step": 21360 }, { "epoch": 0.31, "learning_rate": 1.9897372706702987e-05, "loss": 0.033, "step": 21370 }, { "epoch": 0.31, "learning_rate": 1.9897324666964516e-05, "loss": 0.0312, "step": 21380 }, { "epoch": 0.31, "learning_rate": 1.9897276627226042e-05, "loss": 0.0211, "step": 21390 }, { "epoch": 0.31, "learning_rate": 1.989722858748757e-05, "loss": 0.0244, "step": 21400 }, { "epoch": 0.31, "learning_rate": 1.98971805477491e-05, "loss": 0.0214, "step": 21410 }, { "epoch": 0.31, "learning_rate": 1.989713250801063e-05, "loss": 0.0278, "step": 21420 }, { "epoch": 0.31, "learning_rate": 1.9897084468272156e-05, "loss": 0.0245, "step": 21430 }, { "epoch": 0.31, "learning_rate": 1.9897036428533685e-05, "loss": 0.0326, "step": 21440 }, { "epoch": 0.31, "learning_rate": 1.9896988388795214e-05, "loss": 0.0258, "step": 21450 }, { "epoch": 0.31, "learning_rate": 1.989694034905674e-05, "loss": 0.0246, "step": 21460 }, { "epoch": 0.31, "learning_rate": 1.989689230931827e-05, "loss": 0.0287, "step": 21470 }, { "epoch": 0.31, "learning_rate": 1.98968442695798e-05, "loss": 0.0249, "step": 21480 }, { "epoch": 0.31, "learning_rate": 1.9896796229841328e-05, "loss": 0.0265, "step": 21490 }, { "epoch": 0.31, "learning_rate": 1.9896748190102854e-05, "loss": 0.0207, "step": 21500 }, { "epoch": 0.31, "learning_rate": 1.9896700150364383e-05, "loss": 0.0224, "step": 21510 }, { "epoch": 0.31, "learning_rate": 1.9896652110625912e-05, "loss": 0.0301, "step": 21520 }, { "epoch": 0.31, "learning_rate": 1.9896604070887438e-05, "loss": 0.0248, "step": 21530 }, { "epoch": 0.31, "learning_rate": 1.9896556031148967e-05, "loss": 0.0305, "step": 21540 }, { "epoch": 0.31, "learning_rate": 1.9896507991410497e-05, "loss": 0.0191, "step": 21550 }, { "epoch": 0.31, "learning_rate": 1.9896459951672026e-05, "loss": 0.0251, "step": 21560 }, { "epoch": 0.31, "learning_rate": 1.9896411911933552e-05, "loss": 0.0237, "step": 21570 }, { "epoch": 0.31, "learning_rate": 1.989636387219508e-05, "loss": 0.0255, "step": 21580 }, { "epoch": 0.31, "learning_rate": 1.989631583245661e-05, "loss": 0.032, "step": 21590 }, { "epoch": 0.31, "learning_rate": 1.989626779271814e-05, "loss": 0.0263, "step": 21600 }, { "epoch": 0.31, "learning_rate": 1.9896219752979665e-05, "loss": 0.0311, "step": 21610 }, { "epoch": 0.31, "learning_rate": 1.9896171713241195e-05, "loss": 0.0222, "step": 21620 }, { "epoch": 0.31, "learning_rate": 1.9896123673502724e-05, "loss": 0.0381, "step": 21630 }, { "epoch": 0.31, "learning_rate": 1.989607563376425e-05, "loss": 0.024, "step": 21640 }, { "epoch": 0.31, "learning_rate": 1.989602759402578e-05, "loss": 0.0202, "step": 21650 }, { "epoch": 0.31, "learning_rate": 1.989597955428731e-05, "loss": 0.0276, "step": 21660 }, { "epoch": 0.31, "learning_rate": 1.9895931514548838e-05, "loss": 0.0273, "step": 21670 }, { "epoch": 0.31, "learning_rate": 1.9895883474810364e-05, "loss": 0.0289, "step": 21680 }, { "epoch": 0.31, "learning_rate": 1.9895835435071893e-05, "loss": 0.0248, "step": 21690 }, { "epoch": 0.31, "learning_rate": 1.9895787395333422e-05, "loss": 0.0199, "step": 21700 }, { "epoch": 0.31, "learning_rate": 1.9895739355594948e-05, "loss": 0.0279, "step": 21710 }, { "epoch": 0.31, "learning_rate": 1.9895691315856477e-05, "loss": 0.0253, "step": 21720 }, { "epoch": 0.31, "learning_rate": 1.9895643276118007e-05, "loss": 0.0285, "step": 21730 }, { "epoch": 0.31, "learning_rate": 1.9895595236379536e-05, "loss": 0.0219, "step": 21740 }, { "epoch": 0.31, "learning_rate": 1.989554719664106e-05, "loss": 0.0227, "step": 21750 }, { "epoch": 0.31, "learning_rate": 1.989549915690259e-05, "loss": 0.0244, "step": 21760 }, { "epoch": 0.31, "learning_rate": 1.989545111716412e-05, "loss": 0.0237, "step": 21770 }, { "epoch": 0.31, "learning_rate": 1.989540307742565e-05, "loss": 0.0264, "step": 21780 }, { "epoch": 0.31, "learning_rate": 1.9895355037687175e-05, "loss": 0.0311, "step": 21790 }, { "epoch": 0.31, "learning_rate": 1.9895306997948705e-05, "loss": 0.0209, "step": 21800 }, { "epoch": 0.31, "learning_rate": 1.9895258958210234e-05, "loss": 0.0304, "step": 21810 }, { "epoch": 0.31, "learning_rate": 1.989521091847176e-05, "loss": 0.0216, "step": 21820 }, { "epoch": 0.31, "learning_rate": 1.989516287873329e-05, "loss": 0.0287, "step": 21830 }, { "epoch": 0.31, "learning_rate": 1.989511483899482e-05, "loss": 0.0336, "step": 21840 }, { "epoch": 0.31, "learning_rate": 1.9895066799256348e-05, "loss": 0.0302, "step": 21850 }, { "epoch": 0.32, "learning_rate": 1.9895018759517873e-05, "loss": 0.0421, "step": 21860 }, { "epoch": 0.32, "learning_rate": 1.9894970719779403e-05, "loss": 0.0276, "step": 21870 }, { "epoch": 0.32, "learning_rate": 1.9894922680040932e-05, "loss": 0.0317, "step": 21880 }, { "epoch": 0.32, "learning_rate": 1.9894874640302458e-05, "loss": 0.029, "step": 21890 }, { "epoch": 0.32, "learning_rate": 1.9894826600563987e-05, "loss": 0.0365, "step": 21900 }, { "epoch": 0.32, "learning_rate": 1.9894778560825516e-05, "loss": 0.0315, "step": 21910 }, { "epoch": 0.32, "learning_rate": 1.9894730521087046e-05, "loss": 0.031, "step": 21920 }, { "epoch": 0.32, "learning_rate": 1.989468248134857e-05, "loss": 0.026, "step": 21930 }, { "epoch": 0.32, "learning_rate": 1.98946344416101e-05, "loss": 0.0261, "step": 21940 }, { "epoch": 0.32, "learning_rate": 1.989458640187163e-05, "loss": 0.0308, "step": 21950 }, { "epoch": 0.32, "learning_rate": 1.989453836213316e-05, "loss": 0.0316, "step": 21960 }, { "epoch": 0.32, "learning_rate": 1.9894490322394685e-05, "loss": 0.0276, "step": 21970 }, { "epoch": 0.32, "learning_rate": 1.9894442282656215e-05, "loss": 0.0213, "step": 21980 }, { "epoch": 0.32, "learning_rate": 1.9894394242917744e-05, "loss": 0.0252, "step": 21990 }, { "epoch": 0.32, "learning_rate": 1.989434620317927e-05, "loss": 0.0265, "step": 22000 }, { "epoch": 0.32, "learning_rate": 1.98942981634408e-05, "loss": 0.0286, "step": 22010 }, { "epoch": 0.32, "learning_rate": 1.9894250123702328e-05, "loss": 0.0276, "step": 22020 }, { "epoch": 0.32, "learning_rate": 1.9894202083963858e-05, "loss": 0.0311, "step": 22030 }, { "epoch": 0.32, "learning_rate": 1.9894154044225383e-05, "loss": 0.026, "step": 22040 }, { "epoch": 0.32, "learning_rate": 1.9894106004486913e-05, "loss": 0.036, "step": 22050 }, { "epoch": 0.32, "learning_rate": 1.9894057964748442e-05, "loss": 0.0241, "step": 22060 }, { "epoch": 0.32, "learning_rate": 1.9894009925009968e-05, "loss": 0.0267, "step": 22070 }, { "epoch": 0.32, "learning_rate": 1.9893961885271497e-05, "loss": 0.0237, "step": 22080 }, { "epoch": 0.32, "learning_rate": 1.9893913845533026e-05, "loss": 0.0207, "step": 22090 }, { "epoch": 0.32, "learning_rate": 1.9893865805794556e-05, "loss": 0.0295, "step": 22100 }, { "epoch": 0.32, "learning_rate": 1.989382257002993e-05, "loss": 0.0192, "step": 22110 }, { "epoch": 0.32, "learning_rate": 1.989377453029146e-05, "loss": 0.0276, "step": 22120 }, { "epoch": 0.32, "learning_rate": 1.9893726490552985e-05, "loss": 0.0191, "step": 22130 }, { "epoch": 0.32, "learning_rate": 1.9893678450814515e-05, "loss": 0.0254, "step": 22140 }, { "epoch": 0.32, "learning_rate": 1.9893630411076044e-05, "loss": 0.0241, "step": 22150 }, { "epoch": 0.32, "learning_rate": 1.9893582371337573e-05, "loss": 0.0249, "step": 22160 }, { "epoch": 0.32, "learning_rate": 1.98935343315991e-05, "loss": 0.0303, "step": 22170 }, { "epoch": 0.32, "learning_rate": 1.989348629186063e-05, "loss": 0.0266, "step": 22180 }, { "epoch": 0.32, "learning_rate": 1.9893438252122158e-05, "loss": 0.0252, "step": 22190 }, { "epoch": 0.32, "learning_rate": 1.9893390212383687e-05, "loss": 0.0279, "step": 22200 }, { "epoch": 0.32, "learning_rate": 1.9893342172645213e-05, "loss": 0.0226, "step": 22210 }, { "epoch": 0.32, "learning_rate": 1.9893294132906742e-05, "loss": 0.0265, "step": 22220 }, { "epoch": 0.32, "learning_rate": 1.989324609316827e-05, "loss": 0.0274, "step": 22230 }, { "epoch": 0.32, "learning_rate": 1.9893198053429797e-05, "loss": 0.0234, "step": 22240 }, { "epoch": 0.32, "learning_rate": 1.9893150013691326e-05, "loss": 0.0305, "step": 22250 }, { "epoch": 0.32, "learning_rate": 1.9893101973952856e-05, "loss": 0.0276, "step": 22260 }, { "epoch": 0.32, "learning_rate": 1.9893053934214385e-05, "loss": 0.0191, "step": 22270 }, { "epoch": 0.32, "learning_rate": 1.989300589447591e-05, "loss": 0.0278, "step": 22280 }, { "epoch": 0.32, "learning_rate": 1.989295785473744e-05, "loss": 0.0272, "step": 22290 }, { "epoch": 0.32, "learning_rate": 1.989290981499897e-05, "loss": 0.0292, "step": 22300 }, { "epoch": 0.32, "learning_rate": 1.9892861775260495e-05, "loss": 0.0241, "step": 22310 }, { "epoch": 0.32, "learning_rate": 1.9892813735522025e-05, "loss": 0.0331, "step": 22320 }, { "epoch": 0.32, "learning_rate": 1.9892765695783554e-05, "loss": 0.0254, "step": 22330 }, { "epoch": 0.32, "learning_rate": 1.9892717656045083e-05, "loss": 0.0236, "step": 22340 }, { "epoch": 0.32, "learning_rate": 1.989266961630661e-05, "loss": 0.0245, "step": 22350 }, { "epoch": 0.32, "learning_rate": 1.9892621576568138e-05, "loss": 0.0204, "step": 22360 }, { "epoch": 0.32, "learning_rate": 1.9892573536829668e-05, "loss": 0.0295, "step": 22370 }, { "epoch": 0.32, "learning_rate": 1.9892525497091197e-05, "loss": 0.0259, "step": 22380 }, { "epoch": 0.32, "learning_rate": 1.9892477457352723e-05, "loss": 0.0284, "step": 22390 }, { "epoch": 0.32, "learning_rate": 1.9892429417614252e-05, "loss": 0.0261, "step": 22400 }, { "epoch": 0.32, "learning_rate": 1.989238137787578e-05, "loss": 0.0268, "step": 22410 }, { "epoch": 0.32, "learning_rate": 1.9892333338137307e-05, "loss": 0.0241, "step": 22420 }, { "epoch": 0.32, "learning_rate": 1.9892285298398836e-05, "loss": 0.0264, "step": 22430 }, { "epoch": 0.32, "learning_rate": 1.9892237258660366e-05, "loss": 0.0256, "step": 22440 }, { "epoch": 0.32, "learning_rate": 1.9892189218921895e-05, "loss": 0.0266, "step": 22450 }, { "epoch": 0.32, "learning_rate": 1.989214117918342e-05, "loss": 0.0303, "step": 22460 }, { "epoch": 0.32, "learning_rate": 1.989209313944495e-05, "loss": 0.027, "step": 22470 }, { "epoch": 0.32, "learning_rate": 1.989204509970648e-05, "loss": 0.0214, "step": 22480 }, { "epoch": 0.32, "learning_rate": 1.9891997059968005e-05, "loss": 0.0268, "step": 22490 }, { "epoch": 0.32, "learning_rate": 1.9891949020229535e-05, "loss": 0.0269, "step": 22500 }, { "epoch": 0.32, "learning_rate": 1.9891900980491064e-05, "loss": 0.0243, "step": 22510 }, { "epoch": 0.32, "learning_rate": 1.9891852940752593e-05, "loss": 0.0235, "step": 22520 }, { "epoch": 0.32, "learning_rate": 1.989180490101412e-05, "loss": 0.031, "step": 22530 }, { "epoch": 0.32, "learning_rate": 1.9891756861275648e-05, "loss": 0.0221, "step": 22540 }, { "epoch": 0.32, "learning_rate": 1.9891708821537177e-05, "loss": 0.0283, "step": 22550 }, { "epoch": 0.33, "learning_rate": 1.9891660781798707e-05, "loss": 0.0244, "step": 22560 }, { "epoch": 0.33, "learning_rate": 1.9891612742060233e-05, "loss": 0.0297, "step": 22570 }, { "epoch": 0.33, "learning_rate": 1.9891564702321762e-05, "loss": 0.0256, "step": 22580 }, { "epoch": 0.33, "learning_rate": 1.989151666258329e-05, "loss": 0.0265, "step": 22590 }, { "epoch": 0.33, "learning_rate": 1.9891468622844817e-05, "loss": 0.0253, "step": 22600 }, { "epoch": 0.33, "learning_rate": 1.9891420583106346e-05, "loss": 0.037, "step": 22610 }, { "epoch": 0.33, "learning_rate": 1.9891372543367876e-05, "loss": 0.033, "step": 22620 }, { "epoch": 0.33, "learning_rate": 1.9891324503629405e-05, "loss": 0.0272, "step": 22630 }, { "epoch": 0.33, "learning_rate": 1.989127646389093e-05, "loss": 0.0244, "step": 22640 }, { "epoch": 0.33, "learning_rate": 1.989122842415246e-05, "loss": 0.0274, "step": 22650 }, { "epoch": 0.33, "learning_rate": 1.989118038441399e-05, "loss": 0.0281, "step": 22660 }, { "epoch": 0.33, "learning_rate": 1.9891132344675515e-05, "loss": 0.025, "step": 22670 }, { "epoch": 0.33, "learning_rate": 1.9891084304937044e-05, "loss": 0.0294, "step": 22680 }, { "epoch": 0.33, "learning_rate": 1.9891036265198574e-05, "loss": 0.023, "step": 22690 }, { "epoch": 0.33, "learning_rate": 1.9890988225460103e-05, "loss": 0.0192, "step": 22700 }, { "epoch": 0.33, "learning_rate": 1.989094018572163e-05, "loss": 0.0264, "step": 22710 }, { "epoch": 0.33, "learning_rate": 1.9890892145983158e-05, "loss": 0.03, "step": 22720 }, { "epoch": 0.33, "learning_rate": 1.9890844106244687e-05, "loss": 0.0314, "step": 22730 }, { "epoch": 0.33, "learning_rate": 1.9890796066506217e-05, "loss": 0.0214, "step": 22740 }, { "epoch": 0.33, "learning_rate": 1.9890748026767743e-05, "loss": 0.0222, "step": 22750 }, { "epoch": 0.33, "learning_rate": 1.9890699987029272e-05, "loss": 0.0228, "step": 22760 }, { "epoch": 0.33, "learning_rate": 1.98906519472908e-05, "loss": 0.0222, "step": 22770 }, { "epoch": 0.33, "learning_rate": 1.9890603907552327e-05, "loss": 0.0285, "step": 22780 }, { "epoch": 0.33, "learning_rate": 1.9890555867813856e-05, "loss": 0.0278, "step": 22790 }, { "epoch": 0.33, "learning_rate": 1.9890507828075386e-05, "loss": 0.0283, "step": 22800 }, { "epoch": 0.33, "learning_rate": 1.9890459788336915e-05, "loss": 0.0312, "step": 22810 }, { "epoch": 0.33, "learning_rate": 1.989041174859844e-05, "loss": 0.0237, "step": 22820 }, { "epoch": 0.33, "learning_rate": 1.989036370885997e-05, "loss": 0.0253, "step": 22830 }, { "epoch": 0.33, "learning_rate": 1.98903156691215e-05, "loss": 0.023, "step": 22840 }, { "epoch": 0.33, "learning_rate": 1.9890267629383025e-05, "loss": 0.0291, "step": 22850 }, { "epoch": 0.33, "learning_rate": 1.9890219589644554e-05, "loss": 0.0336, "step": 22860 }, { "epoch": 0.33, "learning_rate": 1.9890171549906084e-05, "loss": 0.0342, "step": 22870 }, { "epoch": 0.33, "learning_rate": 1.9890123510167613e-05, "loss": 0.0307, "step": 22880 }, { "epoch": 0.33, "learning_rate": 1.989007547042914e-05, "loss": 0.0263, "step": 22890 }, { "epoch": 0.33, "learning_rate": 1.9890027430690668e-05, "loss": 0.0296, "step": 22900 }, { "epoch": 0.33, "learning_rate": 1.9889979390952197e-05, "loss": 0.0274, "step": 22910 }, { "epoch": 0.33, "learning_rate": 1.9889931351213723e-05, "loss": 0.0284, "step": 22920 }, { "epoch": 0.33, "learning_rate": 1.9889883311475252e-05, "loss": 0.0259, "step": 22930 }, { "epoch": 0.33, "learning_rate": 1.9889835271736782e-05, "loss": 0.0266, "step": 22940 }, { "epoch": 0.33, "learning_rate": 1.988978723199831e-05, "loss": 0.0255, "step": 22950 }, { "epoch": 0.33, "learning_rate": 1.9889739192259837e-05, "loss": 0.0219, "step": 22960 }, { "epoch": 0.33, "learning_rate": 1.9889691152521366e-05, "loss": 0.0293, "step": 22970 }, { "epoch": 0.33, "learning_rate": 1.9889643112782895e-05, "loss": 0.0237, "step": 22980 }, { "epoch": 0.33, "learning_rate": 1.9889595073044425e-05, "loss": 0.0266, "step": 22990 }, { "epoch": 0.33, "learning_rate": 1.988954703330595e-05, "loss": 0.0282, "step": 23000 }, { "epoch": 0.33, "learning_rate": 1.988949899356748e-05, "loss": 0.0308, "step": 23010 }, { "epoch": 0.33, "learning_rate": 1.988945095382901e-05, "loss": 0.029, "step": 23020 }, { "epoch": 0.33, "learning_rate": 1.9889402914090535e-05, "loss": 0.0251, "step": 23030 }, { "epoch": 0.33, "learning_rate": 1.9889354874352064e-05, "loss": 0.0289, "step": 23040 }, { "epoch": 0.33, "learning_rate": 1.9889306834613594e-05, "loss": 0.0217, "step": 23050 }, { "epoch": 0.33, "learning_rate": 1.9889258794875123e-05, "loss": 0.0234, "step": 23060 }, { "epoch": 0.33, "learning_rate": 1.988921075513665e-05, "loss": 0.0316, "step": 23070 }, { "epoch": 0.33, "learning_rate": 1.9889162715398178e-05, "loss": 0.0233, "step": 23080 }, { "epoch": 0.33, "learning_rate": 1.9889114675659707e-05, "loss": 0.0204, "step": 23090 }, { "epoch": 0.33, "learning_rate": 1.9889066635921233e-05, "loss": 0.0291, "step": 23100 }, { "epoch": 0.33, "learning_rate": 1.9889018596182762e-05, "loss": 0.0341, "step": 23110 }, { "epoch": 0.33, "learning_rate": 1.988897055644429e-05, "loss": 0.0246, "step": 23120 }, { "epoch": 0.33, "learning_rate": 1.988892251670582e-05, "loss": 0.0235, "step": 23130 }, { "epoch": 0.33, "learning_rate": 1.9888874476967347e-05, "loss": 0.0242, "step": 23140 }, { "epoch": 0.33, "learning_rate": 1.9888826437228876e-05, "loss": 0.0233, "step": 23150 }, { "epoch": 0.33, "learning_rate": 1.9888778397490405e-05, "loss": 0.0217, "step": 23160 }, { "epoch": 0.33, "learning_rate": 1.9888730357751935e-05, "loss": 0.0316, "step": 23170 }, { "epoch": 0.33, "learning_rate": 1.988868231801346e-05, "loss": 0.0276, "step": 23180 }, { "epoch": 0.33, "learning_rate": 1.988863427827499e-05, "loss": 0.0224, "step": 23190 }, { "epoch": 0.33, "learning_rate": 1.988858623853652e-05, "loss": 0.0237, "step": 23200 }, { "epoch": 0.33, "learning_rate": 1.9888538198798045e-05, "loss": 0.0303, "step": 23210 }, { "epoch": 0.33, "learning_rate": 1.9888490159059574e-05, "loss": 0.0271, "step": 23220 }, { "epoch": 0.33, "learning_rate": 1.9888442119321103e-05, "loss": 0.0219, "step": 23230 }, { "epoch": 0.33, "learning_rate": 1.9888394079582633e-05, "loss": 0.0234, "step": 23240 }, { "epoch": 0.34, "learning_rate": 1.988834603984416e-05, "loss": 0.0279, "step": 23250 }, { "epoch": 0.34, "learning_rate": 1.9888298000105688e-05, "loss": 0.027, "step": 23260 }, { "epoch": 0.34, "learning_rate": 1.9888249960367217e-05, "loss": 0.0264, "step": 23270 }, { "epoch": 0.34, "learning_rate": 1.9888201920628743e-05, "loss": 0.0233, "step": 23280 }, { "epoch": 0.34, "learning_rate": 1.9888153880890272e-05, "loss": 0.0252, "step": 23290 }, { "epoch": 0.34, "learning_rate": 1.98881058411518e-05, "loss": 0.0254, "step": 23300 }, { "epoch": 0.34, "learning_rate": 1.988805780141333e-05, "loss": 0.0266, "step": 23310 }, { "epoch": 0.34, "learning_rate": 1.9888009761674857e-05, "loss": 0.0323, "step": 23320 }, { "epoch": 0.34, "learning_rate": 1.9887961721936386e-05, "loss": 0.0323, "step": 23330 }, { "epoch": 0.34, "learning_rate": 1.9887913682197915e-05, "loss": 0.0307, "step": 23340 }, { "epoch": 0.34, "learning_rate": 1.9887865642459445e-05, "loss": 0.0262, "step": 23350 }, { "epoch": 0.34, "learning_rate": 1.9887817602720974e-05, "loss": 0.0168, "step": 23360 }, { "epoch": 0.34, "learning_rate": 1.9887769562982503e-05, "loss": 0.0194, "step": 23370 }, { "epoch": 0.34, "learning_rate": 1.988772152324403e-05, "loss": 0.0273, "step": 23380 }, { "epoch": 0.34, "learning_rate": 1.9887673483505558e-05, "loss": 0.0286, "step": 23390 }, { "epoch": 0.34, "learning_rate": 1.9887625443767087e-05, "loss": 0.0275, "step": 23400 }, { "epoch": 0.34, "learning_rate": 1.9887577404028617e-05, "loss": 0.0229, "step": 23410 }, { "epoch": 0.34, "learning_rate": 1.9887529364290143e-05, "loss": 0.0261, "step": 23420 }, { "epoch": 0.34, "learning_rate": 1.9887481324551672e-05, "loss": 0.0243, "step": 23430 }, { "epoch": 0.34, "learning_rate": 1.98874332848132e-05, "loss": 0.0264, "step": 23440 }, { "epoch": 0.34, "learning_rate": 1.9887385245074727e-05, "loss": 0.0203, "step": 23450 }, { "epoch": 0.34, "learning_rate": 1.9887337205336256e-05, "loss": 0.0284, "step": 23460 }, { "epoch": 0.34, "learning_rate": 1.9887289165597786e-05, "loss": 0.0251, "step": 23470 }, { "epoch": 0.34, "learning_rate": 1.9887241125859315e-05, "loss": 0.024, "step": 23480 }, { "epoch": 0.34, "learning_rate": 1.988719308612084e-05, "loss": 0.0254, "step": 23490 }, { "epoch": 0.34, "learning_rate": 1.988714504638237e-05, "loss": 0.0228, "step": 23500 }, { "epoch": 0.34, "learning_rate": 1.98870970066439e-05, "loss": 0.0235, "step": 23510 }, { "epoch": 0.34, "learning_rate": 1.9887048966905425e-05, "loss": 0.0205, "step": 23520 }, { "epoch": 0.34, "learning_rate": 1.9887000927166954e-05, "loss": 0.0216, "step": 23530 }, { "epoch": 0.34, "learning_rate": 1.9886952887428484e-05, "loss": 0.026, "step": 23540 }, { "epoch": 0.34, "learning_rate": 1.9886904847690013e-05, "loss": 0.029, "step": 23550 }, { "epoch": 0.34, "learning_rate": 1.988685680795154e-05, "loss": 0.0222, "step": 23560 }, { "epoch": 0.34, "learning_rate": 1.9886808768213068e-05, "loss": 0.0231, "step": 23570 }, { "epoch": 0.34, "learning_rate": 1.9886760728474597e-05, "loss": 0.0321, "step": 23580 }, { "epoch": 0.34, "learning_rate": 1.9886712688736127e-05, "loss": 0.0268, "step": 23590 }, { "epoch": 0.34, "learning_rate": 1.9886664648997653e-05, "loss": 0.0216, "step": 23600 }, { "epoch": 0.34, "learning_rate": 1.9886616609259182e-05, "loss": 0.0297, "step": 23610 }, { "epoch": 0.34, "learning_rate": 1.988656856952071e-05, "loss": 0.0275, "step": 23620 }, { "epoch": 0.34, "learning_rate": 1.9886520529782237e-05, "loss": 0.0274, "step": 23630 }, { "epoch": 0.34, "learning_rate": 1.9886472490043766e-05, "loss": 0.0259, "step": 23640 }, { "epoch": 0.34, "learning_rate": 1.9886424450305296e-05, "loss": 0.0288, "step": 23650 }, { "epoch": 0.34, "learning_rate": 1.9886376410566825e-05, "loss": 0.0216, "step": 23660 }, { "epoch": 0.34, "learning_rate": 1.988632837082835e-05, "loss": 0.0228, "step": 23670 }, { "epoch": 0.34, "learning_rate": 1.988628033108988e-05, "loss": 0.0217, "step": 23680 }, { "epoch": 0.34, "learning_rate": 1.988623229135141e-05, "loss": 0.0281, "step": 23690 }, { "epoch": 0.34, "learning_rate": 1.9886184251612935e-05, "loss": 0.0293, "step": 23700 }, { "epoch": 0.34, "learning_rate": 1.9886136211874464e-05, "loss": 0.0268, "step": 23710 }, { "epoch": 0.34, "learning_rate": 1.9886088172135994e-05, "loss": 0.0263, "step": 23720 }, { "epoch": 0.34, "learning_rate": 1.9886040132397523e-05, "loss": 0.0289, "step": 23730 }, { "epoch": 0.34, "learning_rate": 1.988599209265905e-05, "loss": 0.0252, "step": 23740 }, { "epoch": 0.34, "learning_rate": 1.9885944052920578e-05, "loss": 0.0294, "step": 23750 }, { "epoch": 0.34, "learning_rate": 1.9885896013182107e-05, "loss": 0.0291, "step": 23760 }, { "epoch": 0.34, "learning_rate": 1.9885847973443637e-05, "loss": 0.0242, "step": 23770 }, { "epoch": 0.34, "learning_rate": 1.9885799933705162e-05, "loss": 0.0216, "step": 23780 }, { "epoch": 0.34, "learning_rate": 1.9885751893966692e-05, "loss": 0.0233, "step": 23790 }, { "epoch": 0.34, "learning_rate": 1.988570385422822e-05, "loss": 0.0176, "step": 23800 }, { "epoch": 0.34, "learning_rate": 1.9885655814489747e-05, "loss": 0.0341, "step": 23810 }, { "epoch": 0.34, "learning_rate": 1.9885607774751276e-05, "loss": 0.0211, "step": 23820 }, { "epoch": 0.34, "learning_rate": 1.9885559735012805e-05, "loss": 0.02, "step": 23830 }, { "epoch": 0.34, "learning_rate": 1.9885511695274335e-05, "loss": 0.0265, "step": 23840 }, { "epoch": 0.34, "learning_rate": 1.988546365553586e-05, "loss": 0.0287, "step": 23850 }, { "epoch": 0.34, "learning_rate": 1.988541561579739e-05, "loss": 0.025, "step": 23860 }, { "epoch": 0.34, "learning_rate": 1.988536757605892e-05, "loss": 0.0242, "step": 23870 }, { "epoch": 0.34, "learning_rate": 1.9885319536320445e-05, "loss": 0.0177, "step": 23880 }, { "epoch": 0.34, "learning_rate": 1.9885271496581974e-05, "loss": 0.028, "step": 23890 }, { "epoch": 0.34, "learning_rate": 1.9885223456843504e-05, "loss": 0.0232, "step": 23900 }, { "epoch": 0.34, "learning_rate": 1.9885175417105033e-05, "loss": 0.0285, "step": 23910 }, { "epoch": 0.34, "learning_rate": 1.988512737736656e-05, "loss": 0.0316, "step": 23920 }, { "epoch": 0.34, "learning_rate": 1.9885079337628088e-05, "loss": 0.0219, "step": 23930 }, { "epoch": 0.35, "learning_rate": 1.9885031297889617e-05, "loss": 0.0298, "step": 23940 }, { "epoch": 0.35, "learning_rate": 1.9884983258151146e-05, "loss": 0.0234, "step": 23950 }, { "epoch": 0.35, "learning_rate": 1.9884935218412672e-05, "loss": 0.0298, "step": 23960 }, { "epoch": 0.35, "learning_rate": 1.98848871786742e-05, "loss": 0.0229, "step": 23970 }, { "epoch": 0.35, "learning_rate": 1.988483913893573e-05, "loss": 0.0204, "step": 23980 }, { "epoch": 0.35, "learning_rate": 1.9884791099197257e-05, "loss": 0.0234, "step": 23990 }, { "epoch": 0.35, "learning_rate": 1.9884743059458786e-05, "loss": 0.0242, "step": 24000 }, { "epoch": 0.35, "learning_rate": 1.9884695019720315e-05, "loss": 0.0266, "step": 24010 }, { "epoch": 0.35, "learning_rate": 1.9884646979981845e-05, "loss": 0.0189, "step": 24020 }, { "epoch": 0.35, "learning_rate": 1.988459894024337e-05, "loss": 0.0275, "step": 24030 }, { "epoch": 0.35, "learning_rate": 1.98845509005049e-05, "loss": 0.0291, "step": 24040 }, { "epoch": 0.35, "learning_rate": 1.988450286076643e-05, "loss": 0.0226, "step": 24050 }, { "epoch": 0.35, "learning_rate": 1.9884454821027955e-05, "loss": 0.0257, "step": 24060 }, { "epoch": 0.35, "learning_rate": 1.9884406781289484e-05, "loss": 0.0225, "step": 24070 }, { "epoch": 0.35, "learning_rate": 1.9884358741551013e-05, "loss": 0.0244, "step": 24080 }, { "epoch": 0.35, "learning_rate": 1.9884310701812543e-05, "loss": 0.0204, "step": 24090 }, { "epoch": 0.35, "learning_rate": 1.988426266207407e-05, "loss": 0.0254, "step": 24100 }, { "epoch": 0.35, "learning_rate": 1.9884214622335598e-05, "loss": 0.0194, "step": 24110 }, { "epoch": 0.35, "learning_rate": 1.9884166582597127e-05, "loss": 0.025, "step": 24120 }, { "epoch": 0.35, "learning_rate": 1.9884118542858656e-05, "loss": 0.0239, "step": 24130 }, { "epoch": 0.35, "learning_rate": 1.9884070503120182e-05, "loss": 0.0267, "step": 24140 }, { "epoch": 0.35, "learning_rate": 1.988402246338171e-05, "loss": 0.0243, "step": 24150 }, { "epoch": 0.35, "learning_rate": 1.988397442364324e-05, "loss": 0.0354, "step": 24160 }, { "epoch": 0.35, "learning_rate": 1.9883926383904767e-05, "loss": 0.0223, "step": 24170 }, { "epoch": 0.35, "learning_rate": 1.9883878344166296e-05, "loss": 0.0259, "step": 24180 }, { "epoch": 0.35, "learning_rate": 1.9883830304427825e-05, "loss": 0.0227, "step": 24190 }, { "epoch": 0.35, "learning_rate": 1.9883782264689355e-05, "loss": 0.0211, "step": 24200 }, { "epoch": 0.35, "learning_rate": 1.988373422495088e-05, "loss": 0.0269, "step": 24210 }, { "epoch": 0.35, "learning_rate": 1.988368618521241e-05, "loss": 0.0217, "step": 24220 }, { "epoch": 0.35, "learning_rate": 1.988363814547394e-05, "loss": 0.0213, "step": 24230 }, { "epoch": 0.35, "learning_rate": 1.9883590105735465e-05, "loss": 0.0258, "step": 24240 }, { "epoch": 0.35, "learning_rate": 1.9883542065996994e-05, "loss": 0.0256, "step": 24250 }, { "epoch": 0.35, "learning_rate": 1.9883494026258523e-05, "loss": 0.0201, "step": 24260 }, { "epoch": 0.35, "learning_rate": 1.9883445986520053e-05, "loss": 0.029, "step": 24270 }, { "epoch": 0.35, "learning_rate": 1.988339794678158e-05, "loss": 0.0273, "step": 24280 }, { "epoch": 0.35, "learning_rate": 1.9883349907043108e-05, "loss": 0.0277, "step": 24290 }, { "epoch": 0.35, "learning_rate": 1.9883301867304637e-05, "loss": 0.0278, "step": 24300 }, { "epoch": 0.35, "learning_rate": 1.9883253827566163e-05, "loss": 0.0268, "step": 24310 }, { "epoch": 0.35, "learning_rate": 1.9883205787827692e-05, "loss": 0.0261, "step": 24320 }, { "epoch": 0.35, "learning_rate": 1.988315774808922e-05, "loss": 0.0237, "step": 24330 }, { "epoch": 0.35, "learning_rate": 1.988310970835075e-05, "loss": 0.0209, "step": 24340 }, { "epoch": 0.35, "learning_rate": 1.9883061668612277e-05, "loss": 0.0249, "step": 24350 }, { "epoch": 0.35, "learning_rate": 1.9883013628873806e-05, "loss": 0.0261, "step": 24360 }, { "epoch": 0.35, "learning_rate": 1.9882965589135335e-05, "loss": 0.0263, "step": 24370 }, { "epoch": 0.35, "learning_rate": 1.9882917549396864e-05, "loss": 0.0326, "step": 24380 }, { "epoch": 0.35, "learning_rate": 1.988286950965839e-05, "loss": 0.0307, "step": 24390 }, { "epoch": 0.35, "learning_rate": 1.988282146991992e-05, "loss": 0.0201, "step": 24400 }, { "epoch": 0.35, "learning_rate": 1.988277343018145e-05, "loss": 0.0188, "step": 24410 }, { "epoch": 0.35, "learning_rate": 1.9882725390442975e-05, "loss": 0.0226, "step": 24420 }, { "epoch": 0.35, "learning_rate": 1.9882677350704504e-05, "loss": 0.0219, "step": 24430 }, { "epoch": 0.35, "learning_rate": 1.9882629310966033e-05, "loss": 0.0229, "step": 24440 }, { "epoch": 0.35, "learning_rate": 1.9882581271227563e-05, "loss": 0.0203, "step": 24450 }, { "epoch": 0.35, "learning_rate": 1.988253323148909e-05, "loss": 0.0313, "step": 24460 }, { "epoch": 0.35, "learning_rate": 1.9882485191750618e-05, "loss": 0.0259, "step": 24470 }, { "epoch": 0.35, "learning_rate": 1.9882437152012147e-05, "loss": 0.0332, "step": 24480 }, { "epoch": 0.35, "learning_rate": 1.9882389112273673e-05, "loss": 0.0322, "step": 24490 }, { "epoch": 0.35, "learning_rate": 1.9882341072535202e-05, "loss": 0.0237, "step": 24500 }, { "epoch": 0.35, "learning_rate": 1.988229303279673e-05, "loss": 0.0264, "step": 24510 }, { "epoch": 0.35, "learning_rate": 1.988224499305826e-05, "loss": 0.025, "step": 24520 }, { "epoch": 0.35, "learning_rate": 1.9882196953319787e-05, "loss": 0.0207, "step": 24530 }, { "epoch": 0.35, "learning_rate": 1.9882148913581316e-05, "loss": 0.0245, "step": 24540 }, { "epoch": 0.35, "learning_rate": 1.9882100873842845e-05, "loss": 0.0219, "step": 24550 }, { "epoch": 0.35, "learning_rate": 1.9882052834104374e-05, "loss": 0.023, "step": 24560 }, { "epoch": 0.35, "learning_rate": 1.98820047943659e-05, "loss": 0.033, "step": 24570 }, { "epoch": 0.35, "learning_rate": 1.988195675462743e-05, "loss": 0.0275, "step": 24580 }, { "epoch": 0.35, "learning_rate": 1.988190871488896e-05, "loss": 0.0285, "step": 24590 }, { "epoch": 0.35, "learning_rate": 1.9881860675150485e-05, "loss": 0.0236, "step": 24600 }, { "epoch": 0.35, "learning_rate": 1.9881812635412014e-05, "loss": 0.0247, "step": 24610 }, { "epoch": 0.35, "learning_rate": 1.9881764595673543e-05, "loss": 0.0248, "step": 24620 }, { "epoch": 0.35, "learning_rate": 1.9881716555935072e-05, "loss": 0.0266, "step": 24630 }, { "epoch": 0.36, "learning_rate": 1.98816685161966e-05, "loss": 0.029, "step": 24640 }, { "epoch": 0.36, "learning_rate": 1.9881620476458128e-05, "loss": 0.0271, "step": 24650 }, { "epoch": 0.36, "learning_rate": 1.9881572436719657e-05, "loss": 0.0273, "step": 24660 }, { "epoch": 0.36, "learning_rate": 1.9881524396981183e-05, "loss": 0.0223, "step": 24670 }, { "epoch": 0.36, "learning_rate": 1.9881476357242712e-05, "loss": 0.0285, "step": 24680 }, { "epoch": 0.36, "learning_rate": 1.988142831750424e-05, "loss": 0.0232, "step": 24690 }, { "epoch": 0.36, "learning_rate": 1.988138027776577e-05, "loss": 0.0258, "step": 24700 }, { "epoch": 0.36, "learning_rate": 1.9881332238027296e-05, "loss": 0.0325, "step": 24710 }, { "epoch": 0.36, "learning_rate": 1.9881284198288826e-05, "loss": 0.0248, "step": 24720 }, { "epoch": 0.36, "learning_rate": 1.9881236158550355e-05, "loss": 0.0261, "step": 24730 }, { "epoch": 0.36, "learning_rate": 1.9881188118811884e-05, "loss": 0.0237, "step": 24740 }, { "epoch": 0.36, "learning_rate": 1.988114007907341e-05, "loss": 0.025, "step": 24750 }, { "epoch": 0.36, "learning_rate": 1.988109203933494e-05, "loss": 0.0267, "step": 24760 }, { "epoch": 0.36, "learning_rate": 1.988104399959647e-05, "loss": 0.0233, "step": 24770 }, { "epoch": 0.36, "learning_rate": 1.9880995959857995e-05, "loss": 0.0304, "step": 24780 }, { "epoch": 0.36, "learning_rate": 1.9880947920119524e-05, "loss": 0.0256, "step": 24790 }, { "epoch": 0.36, "learning_rate": 1.9880899880381053e-05, "loss": 0.0243, "step": 24800 }, { "epoch": 0.36, "learning_rate": 1.9880851840642582e-05, "loss": 0.0245, "step": 24810 }, { "epoch": 0.36, "learning_rate": 1.9880803800904108e-05, "loss": 0.0237, "step": 24820 }, { "epoch": 0.36, "learning_rate": 1.9880755761165638e-05, "loss": 0.0261, "step": 24830 }, { "epoch": 0.36, "learning_rate": 1.9880707721427167e-05, "loss": 0.0208, "step": 24840 }, { "epoch": 0.36, "learning_rate": 1.9880659681688693e-05, "loss": 0.0214, "step": 24850 }, { "epoch": 0.36, "learning_rate": 1.9880611641950222e-05, "loss": 0.0191, "step": 24860 }, { "epoch": 0.36, "learning_rate": 1.988056360221175e-05, "loss": 0.0234, "step": 24870 }, { "epoch": 0.36, "learning_rate": 1.988051556247328e-05, "loss": 0.0291, "step": 24880 }, { "epoch": 0.36, "learning_rate": 1.9880467522734806e-05, "loss": 0.0276, "step": 24890 }, { "epoch": 0.36, "learning_rate": 1.9880419482996336e-05, "loss": 0.0191, "step": 24900 }, { "epoch": 0.36, "learning_rate": 1.9880371443257865e-05, "loss": 0.0242, "step": 24910 }, { "epoch": 0.36, "learning_rate": 1.9880323403519394e-05, "loss": 0.0243, "step": 24920 }, { "epoch": 0.36, "learning_rate": 1.988027536378092e-05, "loss": 0.0268, "step": 24930 }, { "epoch": 0.36, "learning_rate": 1.988022732404245e-05, "loss": 0.0338, "step": 24940 }, { "epoch": 0.36, "learning_rate": 1.988017928430398e-05, "loss": 0.0275, "step": 24950 }, { "epoch": 0.36, "learning_rate": 1.9880131244565504e-05, "loss": 0.024, "step": 24960 }, { "epoch": 0.36, "learning_rate": 1.9880083204827034e-05, "loss": 0.0343, "step": 24970 }, { "epoch": 0.36, "learning_rate": 1.9880035165088563e-05, "loss": 0.0222, "step": 24980 }, { "epoch": 0.36, "learning_rate": 1.9879987125350092e-05, "loss": 0.028, "step": 24990 }, { "epoch": 0.36, "learning_rate": 1.9879939085611618e-05, "loss": 0.0247, "step": 25000 }, { "epoch": 0.36, "learning_rate": 1.9879891045873147e-05, "loss": 0.0289, "step": 25010 }, { "epoch": 0.36, "learning_rate": 1.9879843006134677e-05, "loss": 0.0254, "step": 25020 }, { "epoch": 0.36, "learning_rate": 1.9879794966396203e-05, "loss": 0.0212, "step": 25030 }, { "epoch": 0.36, "learning_rate": 1.9879746926657732e-05, "loss": 0.029, "step": 25040 }, { "epoch": 0.36, "learning_rate": 1.987969888691926e-05, "loss": 0.026, "step": 25050 }, { "epoch": 0.36, "learning_rate": 1.987965084718079e-05, "loss": 0.0273, "step": 25060 }, { "epoch": 0.36, "learning_rate": 1.9879602807442316e-05, "loss": 0.0227, "step": 25070 }, { "epoch": 0.36, "learning_rate": 1.9879554767703846e-05, "loss": 0.0198, "step": 25080 }, { "epoch": 0.36, "learning_rate": 1.9879506727965375e-05, "loss": 0.0227, "step": 25090 }, { "epoch": 0.36, "learning_rate": 1.9879458688226904e-05, "loss": 0.0287, "step": 25100 }, { "epoch": 0.36, "learning_rate": 1.987941064848843e-05, "loss": 0.0225, "step": 25110 }, { "epoch": 0.36, "learning_rate": 1.987936260874996e-05, "loss": 0.0267, "step": 25120 }, { "epoch": 0.36, "learning_rate": 1.987931456901149e-05, "loss": 0.0256, "step": 25130 }, { "epoch": 0.36, "learning_rate": 1.9879266529273014e-05, "loss": 0.0219, "step": 25140 }, { "epoch": 0.36, "learning_rate": 1.9879218489534544e-05, "loss": 0.026, "step": 25150 }, { "epoch": 0.36, "learning_rate": 1.9879170449796073e-05, "loss": 0.0285, "step": 25160 }, { "epoch": 0.36, "learning_rate": 1.9879122410057602e-05, "loss": 0.021, "step": 25170 }, { "epoch": 0.36, "learning_rate": 1.9879074370319128e-05, "loss": 0.0256, "step": 25180 }, { "epoch": 0.36, "learning_rate": 1.9879026330580657e-05, "loss": 0.0254, "step": 25190 }, { "epoch": 0.36, "learning_rate": 1.9878978290842187e-05, "loss": 0.0231, "step": 25200 }, { "epoch": 0.36, "learning_rate": 1.9878930251103713e-05, "loss": 0.0268, "step": 25210 }, { "epoch": 0.36, "learning_rate": 1.9878882211365242e-05, "loss": 0.0244, "step": 25220 }, { "epoch": 0.36, "learning_rate": 1.987883417162677e-05, "loss": 0.027, "step": 25230 }, { "epoch": 0.36, "learning_rate": 1.98787861318883e-05, "loss": 0.0273, "step": 25240 }, { "epoch": 0.36, "learning_rate": 1.9878738092149826e-05, "loss": 0.0242, "step": 25250 }, { "epoch": 0.36, "learning_rate": 1.9878690052411355e-05, "loss": 0.023, "step": 25260 }, { "epoch": 0.36, "learning_rate": 1.9878642012672885e-05, "loss": 0.0242, "step": 25270 }, { "epoch": 0.36, "learning_rate": 1.9878593972934414e-05, "loss": 0.0382, "step": 25280 }, { "epoch": 0.36, "learning_rate": 1.987854593319594e-05, "loss": 0.0255, "step": 25290 }, { "epoch": 0.36, "learning_rate": 1.987849789345747e-05, "loss": 0.0242, "step": 25300 }, { "epoch": 0.36, "learning_rate": 1.9878449853719e-05, "loss": 0.0257, "step": 25310 }, { "epoch": 0.36, "learning_rate": 1.9878401813980524e-05, "loss": 0.0201, "step": 25320 }, { "epoch": 0.37, "learning_rate": 1.9878353774242054e-05, "loss": 0.024, "step": 25330 }, { "epoch": 0.37, "learning_rate": 1.9878305734503583e-05, "loss": 0.0313, "step": 25340 }, { "epoch": 0.37, "learning_rate": 1.9878257694765112e-05, "loss": 0.0286, "step": 25350 }, { "epoch": 0.37, "learning_rate": 1.9878209655026638e-05, "loss": 0.0243, "step": 25360 }, { "epoch": 0.37, "learning_rate": 1.9878161615288167e-05, "loss": 0.0228, "step": 25370 }, { "epoch": 0.37, "learning_rate": 1.9878113575549697e-05, "loss": 0.0329, "step": 25380 }, { "epoch": 0.37, "learning_rate": 1.9878065535811222e-05, "loss": 0.0296, "step": 25390 }, { "epoch": 0.37, "learning_rate": 1.987801749607275e-05, "loss": 0.0269, "step": 25400 }, { "epoch": 0.37, "learning_rate": 1.987796945633428e-05, "loss": 0.0269, "step": 25410 }, { "epoch": 0.37, "learning_rate": 1.987792141659581e-05, "loss": 0.0286, "step": 25420 }, { "epoch": 0.37, "learning_rate": 1.9877873376857336e-05, "loss": 0.0242, "step": 25430 }, { "epoch": 0.37, "learning_rate": 1.9877825337118865e-05, "loss": 0.0273, "step": 25440 }, { "epoch": 0.37, "learning_rate": 1.9877777297380395e-05, "loss": 0.0244, "step": 25450 }, { "epoch": 0.37, "learning_rate": 1.9877729257641924e-05, "loss": 0.025, "step": 25460 }, { "epoch": 0.37, "learning_rate": 1.987768121790345e-05, "loss": 0.0237, "step": 25470 }, { "epoch": 0.37, "learning_rate": 1.987763317816498e-05, "loss": 0.0298, "step": 25480 }, { "epoch": 0.37, "learning_rate": 1.987758513842651e-05, "loss": 0.0261, "step": 25490 }, { "epoch": 0.37, "learning_rate": 1.9877537098688034e-05, "loss": 0.0223, "step": 25500 }, { "epoch": 0.37, "learning_rate": 1.9877489058949563e-05, "loss": 0.0288, "step": 25510 }, { "epoch": 0.37, "learning_rate": 1.9877441019211093e-05, "loss": 0.0247, "step": 25520 }, { "epoch": 0.37, "learning_rate": 1.9877392979472622e-05, "loss": 0.025, "step": 25530 }, { "epoch": 0.37, "learning_rate": 1.9877344939734148e-05, "loss": 0.0279, "step": 25540 }, { "epoch": 0.37, "learning_rate": 1.9877296899995677e-05, "loss": 0.0194, "step": 25550 }, { "epoch": 0.37, "learning_rate": 1.9877248860257206e-05, "loss": 0.0249, "step": 25560 }, { "epoch": 0.37, "learning_rate": 1.9877200820518732e-05, "loss": 0.026, "step": 25570 }, { "epoch": 0.37, "learning_rate": 1.987715278078026e-05, "loss": 0.0284, "step": 25580 }, { "epoch": 0.37, "learning_rate": 1.987710474104179e-05, "loss": 0.0254, "step": 25590 }, { "epoch": 0.37, "learning_rate": 1.987705670130332e-05, "loss": 0.0218, "step": 25600 }, { "epoch": 0.37, "learning_rate": 1.9877008661564846e-05, "loss": 0.0234, "step": 25610 }, { "epoch": 0.37, "learning_rate": 1.9876960621826375e-05, "loss": 0.0264, "step": 25620 }, { "epoch": 0.37, "learning_rate": 1.9876912582087905e-05, "loss": 0.0328, "step": 25630 }, { "epoch": 0.37, "learning_rate": 1.9876864542349434e-05, "loss": 0.0243, "step": 25640 }, { "epoch": 0.37, "learning_rate": 1.987681650261096e-05, "loss": 0.0239, "step": 25650 }, { "epoch": 0.37, "learning_rate": 1.987676846287249e-05, "loss": 0.0254, "step": 25660 }, { "epoch": 0.37, "learning_rate": 1.9876720423134018e-05, "loss": 0.0235, "step": 25670 }, { "epoch": 0.37, "learning_rate": 1.9876672383395544e-05, "loss": 0.0227, "step": 25680 }, { "epoch": 0.37, "learning_rate": 1.9876624343657073e-05, "loss": 0.0222, "step": 25690 }, { "epoch": 0.37, "learning_rate": 1.9876576303918603e-05, "loss": 0.0243, "step": 25700 }, { "epoch": 0.37, "learning_rate": 1.9876528264180132e-05, "loss": 0.0235, "step": 25710 }, { "epoch": 0.37, "learning_rate": 1.9876480224441658e-05, "loss": 0.0325, "step": 25720 }, { "epoch": 0.37, "learning_rate": 1.9876432184703187e-05, "loss": 0.0258, "step": 25730 }, { "epoch": 0.37, "learning_rate": 1.9876384144964716e-05, "loss": 0.0265, "step": 25740 }, { "epoch": 0.37, "learning_rate": 1.9876336105226242e-05, "loss": 0.0203, "step": 25750 }, { "epoch": 0.37, "learning_rate": 1.987628806548777e-05, "loss": 0.0287, "step": 25760 }, { "epoch": 0.37, "learning_rate": 1.98762400257493e-05, "loss": 0.0281, "step": 25770 }, { "epoch": 0.37, "learning_rate": 1.987619198601083e-05, "loss": 0.0271, "step": 25780 }, { "epoch": 0.37, "learning_rate": 1.9876143946272356e-05, "loss": 0.025, "step": 25790 }, { "epoch": 0.37, "learning_rate": 1.9876095906533885e-05, "loss": 0.025, "step": 25800 }, { "epoch": 0.37, "learning_rate": 1.9876047866795414e-05, "loss": 0.0245, "step": 25810 }, { "epoch": 0.37, "learning_rate": 1.9875999827056944e-05, "loss": 0.0239, "step": 25820 }, { "epoch": 0.37, "learning_rate": 1.987595178731847e-05, "loss": 0.0278, "step": 25830 }, { "epoch": 0.37, "learning_rate": 1.987590374758e-05, "loss": 0.0232, "step": 25840 }, { "epoch": 0.37, "learning_rate": 1.9875855707841528e-05, "loss": 0.0322, "step": 25850 }, { "epoch": 0.37, "learning_rate": 1.9875807668103054e-05, "loss": 0.0228, "step": 25860 }, { "epoch": 0.37, "learning_rate": 1.9875759628364583e-05, "loss": 0.0239, "step": 25870 }, { "epoch": 0.37, "learning_rate": 1.9875711588626113e-05, "loss": 0.0223, "step": 25880 }, { "epoch": 0.37, "learning_rate": 1.9875663548887642e-05, "loss": 0.0272, "step": 25890 }, { "epoch": 0.37, "learning_rate": 1.987561550914917e-05, "loss": 0.0263, "step": 25900 }, { "epoch": 0.37, "learning_rate": 1.98755674694107e-05, "loss": 0.0215, "step": 25910 }, { "epoch": 0.37, "learning_rate": 1.9875519429672226e-05, "loss": 0.026, "step": 25920 }, { "epoch": 0.37, "learning_rate": 1.9875471389933756e-05, "loss": 0.0265, "step": 25930 }, { "epoch": 0.37, "learning_rate": 1.9875423350195285e-05, "loss": 0.0214, "step": 25940 }, { "epoch": 0.37, "learning_rate": 1.9875375310456814e-05, "loss": 0.0272, "step": 25950 }, { "epoch": 0.37, "learning_rate": 1.987532727071834e-05, "loss": 0.0224, "step": 25960 }, { "epoch": 0.37, "learning_rate": 1.987527923097987e-05, "loss": 0.0277, "step": 25970 }, { "epoch": 0.37, "learning_rate": 1.98752311912414e-05, "loss": 0.0187, "step": 25980 }, { "epoch": 0.37, "learning_rate": 1.9875183151502924e-05, "loss": 0.0248, "step": 25990 }, { "epoch": 0.37, "learning_rate": 1.9875135111764454e-05, "loss": 0.0227, "step": 26000 }, { "epoch": 0.37, "learning_rate": 1.9875087072025983e-05, "loss": 0.0318, "step": 26010 }, { "epoch": 0.37, "learning_rate": 1.9875039032287512e-05, "loss": 0.0275, "step": 26020 }, { "epoch": 0.38, "learning_rate": 1.9874990992549038e-05, "loss": 0.0172, "step": 26030 }, { "epoch": 0.38, "learning_rate": 1.9874942952810567e-05, "loss": 0.0243, "step": 26040 }, { "epoch": 0.38, "learning_rate": 1.9874894913072097e-05, "loss": 0.0285, "step": 26050 }, { "epoch": 0.38, "learning_rate": 1.9874846873333623e-05, "loss": 0.0239, "step": 26060 }, { "epoch": 0.38, "learning_rate": 1.9874798833595152e-05, "loss": 0.0221, "step": 26070 }, { "epoch": 0.38, "learning_rate": 1.987475079385668e-05, "loss": 0.0272, "step": 26080 }, { "epoch": 0.38, "learning_rate": 1.987470275411821e-05, "loss": 0.0208, "step": 26090 }, { "epoch": 0.38, "learning_rate": 1.9874654714379736e-05, "loss": 0.0301, "step": 26100 }, { "epoch": 0.38, "learning_rate": 1.9874606674641265e-05, "loss": 0.0255, "step": 26110 }, { "epoch": 0.38, "learning_rate": 1.9874558634902795e-05, "loss": 0.0231, "step": 26120 }, { "epoch": 0.38, "learning_rate": 1.9874510595164324e-05, "loss": 0.0228, "step": 26130 }, { "epoch": 0.38, "learning_rate": 1.987446255542585e-05, "loss": 0.0212, "step": 26140 }, { "epoch": 0.38, "learning_rate": 1.987441451568738e-05, "loss": 0.0249, "step": 26150 }, { "epoch": 0.38, "learning_rate": 1.9874371279922754e-05, "loss": 0.0278, "step": 26160 }, { "epoch": 0.38, "learning_rate": 1.987432324018428e-05, "loss": 0.0234, "step": 26170 }, { "epoch": 0.38, "learning_rate": 1.987427520044581e-05, "loss": 0.0187, "step": 26180 }, { "epoch": 0.38, "learning_rate": 1.9874227160707338e-05, "loss": 0.0252, "step": 26190 }, { "epoch": 0.38, "learning_rate": 1.9874179120968868e-05, "loss": 0.021, "step": 26200 }, { "epoch": 0.38, "learning_rate": 1.9874131081230393e-05, "loss": 0.0238, "step": 26210 }, { "epoch": 0.38, "learning_rate": 1.9874083041491923e-05, "loss": 0.0269, "step": 26220 }, { "epoch": 0.38, "learning_rate": 1.9874035001753452e-05, "loss": 0.0308, "step": 26230 }, { "epoch": 0.38, "learning_rate": 1.9873986962014978e-05, "loss": 0.0295, "step": 26240 }, { "epoch": 0.38, "learning_rate": 1.9873938922276507e-05, "loss": 0.0203, "step": 26250 }, { "epoch": 0.38, "learning_rate": 1.9873895686511885e-05, "loss": 0.0255, "step": 26260 }, { "epoch": 0.38, "learning_rate": 1.987384764677341e-05, "loss": 0.0252, "step": 26270 }, { "epoch": 0.38, "learning_rate": 1.987379960703494e-05, "loss": 0.02, "step": 26280 }, { "epoch": 0.38, "learning_rate": 1.987375156729647e-05, "loss": 0.0176, "step": 26290 }, { "epoch": 0.38, "learning_rate": 1.9873703527557995e-05, "loss": 0.0292, "step": 26300 }, { "epoch": 0.38, "learning_rate": 1.9873655487819525e-05, "loss": 0.0219, "step": 26310 }, { "epoch": 0.38, "learning_rate": 1.9873607448081054e-05, "loss": 0.0238, "step": 26320 }, { "epoch": 0.38, "learning_rate": 1.9873559408342583e-05, "loss": 0.0209, "step": 26330 }, { "epoch": 0.38, "learning_rate": 1.987351136860411e-05, "loss": 0.0243, "step": 26340 }, { "epoch": 0.38, "learning_rate": 1.987346332886564e-05, "loss": 0.0231, "step": 26350 }, { "epoch": 0.38, "learning_rate": 1.9873415289127168e-05, "loss": 0.0189, "step": 26360 }, { "epoch": 0.38, "learning_rate": 1.9873367249388697e-05, "loss": 0.0201, "step": 26370 }, { "epoch": 0.38, "learning_rate": 1.9873319209650223e-05, "loss": 0.0239, "step": 26380 }, { "epoch": 0.38, "learning_rate": 1.9873271169911752e-05, "loss": 0.0314, "step": 26390 }, { "epoch": 0.38, "learning_rate": 1.987322313017328e-05, "loss": 0.0261, "step": 26400 }, { "epoch": 0.38, "learning_rate": 1.9873175090434807e-05, "loss": 0.0308, "step": 26410 }, { "epoch": 0.38, "learning_rate": 1.9873127050696336e-05, "loss": 0.0259, "step": 26420 }, { "epoch": 0.38, "learning_rate": 1.9873079010957866e-05, "loss": 0.02, "step": 26430 }, { "epoch": 0.38, "learning_rate": 1.9873030971219395e-05, "loss": 0.0295, "step": 26440 }, { "epoch": 0.38, "learning_rate": 1.987298293148092e-05, "loss": 0.0255, "step": 26450 }, { "epoch": 0.38, "learning_rate": 1.987293489174245e-05, "loss": 0.0265, "step": 26460 }, { "epoch": 0.38, "learning_rate": 1.987288685200398e-05, "loss": 0.0215, "step": 26470 }, { "epoch": 0.38, "learning_rate": 1.9872838812265505e-05, "loss": 0.0174, "step": 26480 }, { "epoch": 0.38, "learning_rate": 1.9872790772527035e-05, "loss": 0.0261, "step": 26490 }, { "epoch": 0.38, "learning_rate": 1.9872742732788564e-05, "loss": 0.0258, "step": 26500 }, { "epoch": 0.38, "learning_rate": 1.9872694693050093e-05, "loss": 0.0281, "step": 26510 }, { "epoch": 0.38, "learning_rate": 1.987264665331162e-05, "loss": 0.0194, "step": 26520 }, { "epoch": 0.38, "learning_rate": 1.9872598613573148e-05, "loss": 0.0244, "step": 26530 }, { "epoch": 0.38, "learning_rate": 1.9872550573834678e-05, "loss": 0.0229, "step": 26540 }, { "epoch": 0.38, "learning_rate": 1.9872502534096207e-05, "loss": 0.0239, "step": 26550 }, { "epoch": 0.38, "learning_rate": 1.9872454494357733e-05, "loss": 0.0297, "step": 26560 }, { "epoch": 0.38, "learning_rate": 1.9872406454619262e-05, "loss": 0.0265, "step": 26570 }, { "epoch": 0.38, "learning_rate": 1.987235841488079e-05, "loss": 0.0238, "step": 26580 }, { "epoch": 0.38, "learning_rate": 1.9872310375142317e-05, "loss": 0.0188, "step": 26590 }, { "epoch": 0.38, "learning_rate": 1.9872262335403846e-05, "loss": 0.0282, "step": 26600 }, { "epoch": 0.38, "learning_rate": 1.9872214295665376e-05, "loss": 0.0304, "step": 26610 }, { "epoch": 0.38, "learning_rate": 1.9872166255926905e-05, "loss": 0.0289, "step": 26620 }, { "epoch": 0.38, "learning_rate": 1.987211821618843e-05, "loss": 0.0223, "step": 26630 }, { "epoch": 0.38, "learning_rate": 1.987207017644996e-05, "loss": 0.0196, "step": 26640 }, { "epoch": 0.38, "learning_rate": 1.987202213671149e-05, "loss": 0.024, "step": 26650 }, { "epoch": 0.38, "learning_rate": 1.9871974096973015e-05, "loss": 0.0221, "step": 26660 }, { "epoch": 0.38, "learning_rate": 1.9871926057234545e-05, "loss": 0.022, "step": 26670 }, { "epoch": 0.38, "learning_rate": 1.9871878017496074e-05, "loss": 0.0222, "step": 26680 }, { "epoch": 0.38, "learning_rate": 1.9871829977757603e-05, "loss": 0.0253, "step": 26690 }, { "epoch": 0.38, "learning_rate": 1.987178193801913e-05, "loss": 0.0186, "step": 26700 }, { "epoch": 0.38, "learning_rate": 1.9871733898280658e-05, "loss": 0.0208, "step": 26710 }, { "epoch": 0.39, "learning_rate": 1.9871685858542187e-05, "loss": 0.0206, "step": 26720 }, { "epoch": 0.39, "learning_rate": 1.9871637818803717e-05, "loss": 0.0296, "step": 26730 }, { "epoch": 0.39, "learning_rate": 1.9871589779065243e-05, "loss": 0.02, "step": 26740 }, { "epoch": 0.39, "learning_rate": 1.9871541739326772e-05, "loss": 0.027, "step": 26750 }, { "epoch": 0.39, "learning_rate": 1.98714936995883e-05, "loss": 0.0251, "step": 26760 }, { "epoch": 0.39, "learning_rate": 1.9871445659849827e-05, "loss": 0.0204, "step": 26770 }, { "epoch": 0.39, "learning_rate": 1.9871397620111356e-05, "loss": 0.0289, "step": 26780 }, { "epoch": 0.39, "learning_rate": 1.9871349580372886e-05, "loss": 0.0239, "step": 26790 }, { "epoch": 0.39, "learning_rate": 1.9871301540634415e-05, "loss": 0.0284, "step": 26800 }, { "epoch": 0.39, "learning_rate": 1.987125350089594e-05, "loss": 0.0272, "step": 26810 }, { "epoch": 0.39, "learning_rate": 1.987120546115747e-05, "loss": 0.0185, "step": 26820 }, { "epoch": 0.39, "learning_rate": 1.9871157421419e-05, "loss": 0.0262, "step": 26830 }, { "epoch": 0.39, "learning_rate": 1.9871109381680525e-05, "loss": 0.0309, "step": 26840 }, { "epoch": 0.39, "learning_rate": 1.9871061341942054e-05, "loss": 0.0227, "step": 26850 }, { "epoch": 0.39, "learning_rate": 1.9871013302203584e-05, "loss": 0.0183, "step": 26860 }, { "epoch": 0.39, "learning_rate": 1.9870965262465113e-05, "loss": 0.0197, "step": 26870 }, { "epoch": 0.39, "learning_rate": 1.987091722272664e-05, "loss": 0.0268, "step": 26880 }, { "epoch": 0.39, "learning_rate": 1.9870869182988168e-05, "loss": 0.0269, "step": 26890 }, { "epoch": 0.39, "learning_rate": 1.9870821143249697e-05, "loss": 0.0237, "step": 26900 }, { "epoch": 0.39, "learning_rate": 1.9870773103511227e-05, "loss": 0.0252, "step": 26910 }, { "epoch": 0.39, "learning_rate": 1.9870725063772753e-05, "loss": 0.0199, "step": 26920 }, { "epoch": 0.39, "learning_rate": 1.9870677024034285e-05, "loss": 0.0222, "step": 26930 }, { "epoch": 0.39, "learning_rate": 1.987062898429581e-05, "loss": 0.032, "step": 26940 }, { "epoch": 0.39, "learning_rate": 1.987058094455734e-05, "loss": 0.0189, "step": 26950 }, { "epoch": 0.39, "learning_rate": 1.987053290481887e-05, "loss": 0.0207, "step": 26960 }, { "epoch": 0.39, "learning_rate": 1.98704848650804e-05, "loss": 0.026, "step": 26970 }, { "epoch": 0.39, "learning_rate": 1.9870436825341925e-05, "loss": 0.0262, "step": 26980 }, { "epoch": 0.39, "learning_rate": 1.9870388785603454e-05, "loss": 0.019, "step": 26990 }, { "epoch": 0.39, "learning_rate": 1.9870340745864983e-05, "loss": 0.0169, "step": 27000 }, { "epoch": 0.39, "learning_rate": 1.987029270612651e-05, "loss": 0.0258, "step": 27010 }, { "epoch": 0.39, "learning_rate": 1.987024466638804e-05, "loss": 0.0202, "step": 27020 }, { "epoch": 0.39, "learning_rate": 1.9870196626649568e-05, "loss": 0.0194, "step": 27030 }, { "epoch": 0.39, "learning_rate": 1.9870148586911097e-05, "loss": 0.0249, "step": 27040 }, { "epoch": 0.39, "learning_rate": 1.9870100547172623e-05, "loss": 0.0274, "step": 27050 }, { "epoch": 0.39, "learning_rate": 1.9870052507434152e-05, "loss": 0.0207, "step": 27060 }, { "epoch": 0.39, "learning_rate": 1.987000446769568e-05, "loss": 0.0248, "step": 27070 }, { "epoch": 0.39, "learning_rate": 1.9869956427957207e-05, "loss": 0.015, "step": 27080 }, { "epoch": 0.39, "learning_rate": 1.9869908388218737e-05, "loss": 0.0187, "step": 27090 }, { "epoch": 0.39, "learning_rate": 1.9869860348480266e-05, "loss": 0.0294, "step": 27100 }, { "epoch": 0.39, "learning_rate": 1.9869812308741795e-05, "loss": 0.0209, "step": 27110 }, { "epoch": 0.39, "learning_rate": 1.986976426900332e-05, "loss": 0.0218, "step": 27120 }, { "epoch": 0.39, "learning_rate": 1.986971622926485e-05, "loss": 0.0219, "step": 27130 }, { "epoch": 0.39, "learning_rate": 1.986966818952638e-05, "loss": 0.0251, "step": 27140 }, { "epoch": 0.39, "learning_rate": 1.9869620149787905e-05, "loss": 0.021, "step": 27150 }, { "epoch": 0.39, "learning_rate": 1.9869572110049435e-05, "loss": 0.0223, "step": 27160 }, { "epoch": 0.39, "learning_rate": 1.9869524070310964e-05, "loss": 0.0239, "step": 27170 }, { "epoch": 0.39, "learning_rate": 1.9869476030572493e-05, "loss": 0.0305, "step": 27180 }, { "epoch": 0.39, "learning_rate": 1.986942799083402e-05, "loss": 0.0199, "step": 27190 }, { "epoch": 0.39, "learning_rate": 1.986937995109555e-05, "loss": 0.0222, "step": 27200 }, { "epoch": 0.39, "learning_rate": 1.9869331911357078e-05, "loss": 0.0253, "step": 27210 }, { "epoch": 0.39, "learning_rate": 1.9869283871618607e-05, "loss": 0.0254, "step": 27220 }, { "epoch": 0.39, "learning_rate": 1.9869235831880133e-05, "loss": 0.0249, "step": 27230 }, { "epoch": 0.39, "learning_rate": 1.9869187792141662e-05, "loss": 0.0257, "step": 27240 }, { "epoch": 0.39, "learning_rate": 1.986913975240319e-05, "loss": 0.0217, "step": 27250 }, { "epoch": 0.39, "learning_rate": 1.9869091712664717e-05, "loss": 0.0228, "step": 27260 }, { "epoch": 0.39, "learning_rate": 1.9869043672926246e-05, "loss": 0.0218, "step": 27270 }, { "epoch": 0.39, "learning_rate": 1.9868995633187776e-05, "loss": 0.0209, "step": 27280 }, { "epoch": 0.39, "learning_rate": 1.9868947593449305e-05, "loss": 0.0303, "step": 27290 }, { "epoch": 0.39, "learning_rate": 1.986889955371083e-05, "loss": 0.0203, "step": 27300 }, { "epoch": 0.39, "learning_rate": 1.986885151397236e-05, "loss": 0.0215, "step": 27310 }, { "epoch": 0.39, "learning_rate": 1.986880347423389e-05, "loss": 0.0291, "step": 27320 }, { "epoch": 0.39, "learning_rate": 1.9868755434495415e-05, "loss": 0.0269, "step": 27330 }, { "epoch": 0.39, "learning_rate": 1.9868707394756945e-05, "loss": 0.0333, "step": 27340 }, { "epoch": 0.39, "learning_rate": 1.9868659355018474e-05, "loss": 0.0215, "step": 27350 }, { "epoch": 0.39, "learning_rate": 1.9868611315280003e-05, "loss": 0.0207, "step": 27360 }, { "epoch": 0.39, "learning_rate": 1.986856327554153e-05, "loss": 0.0172, "step": 27370 }, { "epoch": 0.39, "learning_rate": 1.9868515235803058e-05, "loss": 0.0215, "step": 27380 }, { "epoch": 0.39, "learning_rate": 1.9868467196064588e-05, "loss": 0.0337, "step": 27390 }, { "epoch": 0.39, "learning_rate": 1.9868419156326117e-05, "loss": 0.0227, "step": 27400 }, { "epoch": 0.4, "learning_rate": 1.9868371116587643e-05, "loss": 0.0268, "step": 27410 }, { "epoch": 0.4, "learning_rate": 1.9868323076849172e-05, "loss": 0.0237, "step": 27420 }, { "epoch": 0.4, "learning_rate": 1.98682750371107e-05, "loss": 0.0222, "step": 27430 }, { "epoch": 0.4, "learning_rate": 1.9868226997372227e-05, "loss": 0.0238, "step": 27440 }, { "epoch": 0.4, "learning_rate": 1.9868178957633756e-05, "loss": 0.0254, "step": 27450 }, { "epoch": 0.4, "learning_rate": 1.9868130917895286e-05, "loss": 0.0202, "step": 27460 }, { "epoch": 0.4, "learning_rate": 1.9868082878156815e-05, "loss": 0.026, "step": 27470 }, { "epoch": 0.4, "learning_rate": 1.986803483841834e-05, "loss": 0.0219, "step": 27480 }, { "epoch": 0.4, "learning_rate": 1.986798679867987e-05, "loss": 0.0259, "step": 27490 }, { "epoch": 0.4, "learning_rate": 1.98679387589414e-05, "loss": 0.0247, "step": 27500 }, { "epoch": 0.4, "learning_rate": 1.9867890719202925e-05, "loss": 0.0234, "step": 27510 }, { "epoch": 0.4, "learning_rate": 1.9867842679464455e-05, "loss": 0.0267, "step": 27520 }, { "epoch": 0.4, "learning_rate": 1.9867794639725984e-05, "loss": 0.0255, "step": 27530 }, { "epoch": 0.4, "learning_rate": 1.9867746599987513e-05, "loss": 0.0273, "step": 27540 }, { "epoch": 0.4, "learning_rate": 1.986769856024904e-05, "loss": 0.0184, "step": 27550 }, { "epoch": 0.4, "learning_rate": 1.9867650520510568e-05, "loss": 0.0195, "step": 27560 }, { "epoch": 0.4, "learning_rate": 1.9867602480772097e-05, "loss": 0.0222, "step": 27570 }, { "epoch": 0.4, "learning_rate": 1.9867554441033627e-05, "loss": 0.0227, "step": 27580 }, { "epoch": 0.4, "learning_rate": 1.9867506401295153e-05, "loss": 0.0215, "step": 27590 }, { "epoch": 0.4, "learning_rate": 1.9867458361556682e-05, "loss": 0.0298, "step": 27600 }, { "epoch": 0.4, "learning_rate": 1.986741032181821e-05, "loss": 0.0253, "step": 27610 }, { "epoch": 0.4, "learning_rate": 1.9867362282079737e-05, "loss": 0.0229, "step": 27620 }, { "epoch": 0.4, "learning_rate": 1.9867314242341266e-05, "loss": 0.0294, "step": 27630 }, { "epoch": 0.4, "learning_rate": 1.9867266202602796e-05, "loss": 0.0244, "step": 27640 }, { "epoch": 0.4, "learning_rate": 1.9867218162864325e-05, "loss": 0.0346, "step": 27650 }, { "epoch": 0.4, "learning_rate": 1.986717012312585e-05, "loss": 0.0258, "step": 27660 }, { "epoch": 0.4, "learning_rate": 1.986712208338738e-05, "loss": 0.0242, "step": 27670 }, { "epoch": 0.4, "learning_rate": 1.986707404364891e-05, "loss": 0.0212, "step": 27680 }, { "epoch": 0.4, "learning_rate": 1.9867026003910435e-05, "loss": 0.0229, "step": 27690 }, { "epoch": 0.4, "learning_rate": 1.9866977964171964e-05, "loss": 0.0252, "step": 27700 }, { "epoch": 0.4, "learning_rate": 1.9866929924433494e-05, "loss": 0.0204, "step": 27710 }, { "epoch": 0.4, "learning_rate": 1.9866881884695023e-05, "loss": 0.02, "step": 27720 }, { "epoch": 0.4, "learning_rate": 1.986683384495655e-05, "loss": 0.0243, "step": 27730 }, { "epoch": 0.4, "learning_rate": 1.9866785805218078e-05, "loss": 0.026, "step": 27740 }, { "epoch": 0.4, "learning_rate": 1.9866737765479607e-05, "loss": 0.0273, "step": 27750 }, { "epoch": 0.4, "learning_rate": 1.9866689725741137e-05, "loss": 0.027, "step": 27760 }, { "epoch": 0.4, "learning_rate": 1.9866641686002663e-05, "loss": 0.0227, "step": 27770 }, { "epoch": 0.4, "learning_rate": 1.9866593646264192e-05, "loss": 0.0292, "step": 27780 }, { "epoch": 0.4, "learning_rate": 1.986654560652572e-05, "loss": 0.0176, "step": 27790 }, { "epoch": 0.4, "learning_rate": 1.9866497566787247e-05, "loss": 0.0204, "step": 27800 }, { "epoch": 0.4, "learning_rate": 1.9866449527048776e-05, "loss": 0.0235, "step": 27810 }, { "epoch": 0.4, "learning_rate": 1.9866401487310306e-05, "loss": 0.0258, "step": 27820 }, { "epoch": 0.4, "learning_rate": 1.9866353447571835e-05, "loss": 0.0297, "step": 27830 }, { "epoch": 0.4, "learning_rate": 1.986630540783336e-05, "loss": 0.0269, "step": 27840 }, { "epoch": 0.4, "learning_rate": 1.986625736809489e-05, "loss": 0.0201, "step": 27850 }, { "epoch": 0.4, "learning_rate": 1.986620932835642e-05, "loss": 0.03, "step": 27860 }, { "epoch": 0.4, "learning_rate": 1.9866161288617945e-05, "loss": 0.0215, "step": 27870 }, { "epoch": 0.4, "learning_rate": 1.9866113248879474e-05, "loss": 0.0227, "step": 27880 }, { "epoch": 0.4, "learning_rate": 1.9866065209141004e-05, "loss": 0.0259, "step": 27890 }, { "epoch": 0.4, "learning_rate": 1.9866017169402533e-05, "loss": 0.0219, "step": 27900 }, { "epoch": 0.4, "learning_rate": 1.986596912966406e-05, "loss": 0.0234, "step": 27910 }, { "epoch": 0.4, "learning_rate": 1.9865921089925588e-05, "loss": 0.0242, "step": 27920 }, { "epoch": 0.4, "learning_rate": 1.9865873050187117e-05, "loss": 0.0234, "step": 27930 }, { "epoch": 0.4, "learning_rate": 1.9865825010448647e-05, "loss": 0.0309, "step": 27940 }, { "epoch": 0.4, "learning_rate": 1.9865776970710172e-05, "loss": 0.0259, "step": 27950 }, { "epoch": 0.4, "learning_rate": 1.9865728930971702e-05, "loss": 0.0225, "step": 27960 }, { "epoch": 0.4, "learning_rate": 1.986568089123323e-05, "loss": 0.0211, "step": 27970 }, { "epoch": 0.4, "learning_rate": 1.9865632851494757e-05, "loss": 0.0231, "step": 27980 }, { "epoch": 0.4, "learning_rate": 1.9865584811756286e-05, "loss": 0.0192, "step": 27990 }, { "epoch": 0.4, "learning_rate": 1.9865536772017815e-05, "loss": 0.0263, "step": 28000 }, { "epoch": 0.4, "learning_rate": 1.9865488732279345e-05, "loss": 0.0322, "step": 28010 }, { "epoch": 0.4, "learning_rate": 1.986544069254087e-05, "loss": 0.0226, "step": 28020 }, { "epoch": 0.4, "learning_rate": 1.98653926528024e-05, "loss": 0.0296, "step": 28030 }, { "epoch": 0.4, "learning_rate": 1.986534461306393e-05, "loss": 0.0212, "step": 28040 }, { "epoch": 0.4, "learning_rate": 1.9865296573325455e-05, "loss": 0.0265, "step": 28050 }, { "epoch": 0.4, "learning_rate": 1.9865248533586984e-05, "loss": 0.0243, "step": 28060 }, { "epoch": 0.4, "learning_rate": 1.9865200493848514e-05, "loss": 0.0234, "step": 28070 }, { "epoch": 0.4, "learning_rate": 1.9865152454110043e-05, "loss": 0.022, "step": 28080 }, { "epoch": 0.4, "learning_rate": 1.986510441437157e-05, "loss": 0.0238, "step": 28090 }, { "epoch": 0.4, "learning_rate": 1.9865056374633098e-05, "loss": 0.0213, "step": 28100 }, { "epoch": 0.41, "learning_rate": 1.9865008334894627e-05, "loss": 0.0203, "step": 28110 }, { "epoch": 0.41, "learning_rate": 1.9864960295156156e-05, "loss": 0.0292, "step": 28120 }, { "epoch": 0.41, "learning_rate": 1.9864912255417682e-05, "loss": 0.0325, "step": 28130 }, { "epoch": 0.41, "learning_rate": 1.986486421567921e-05, "loss": 0.0199, "step": 28140 }, { "epoch": 0.41, "learning_rate": 1.986481617594074e-05, "loss": 0.022, "step": 28150 }, { "epoch": 0.41, "learning_rate": 1.9864768136202267e-05, "loss": 0.0266, "step": 28160 }, { "epoch": 0.41, "learning_rate": 1.9864720096463796e-05, "loss": 0.0216, "step": 28170 }, { "epoch": 0.41, "learning_rate": 1.9864672056725325e-05, "loss": 0.0264, "step": 28180 }, { "epoch": 0.41, "learning_rate": 1.9864624016986855e-05, "loss": 0.0233, "step": 28190 }, { "epoch": 0.41, "learning_rate": 1.986457597724838e-05, "loss": 0.0238, "step": 28200 }, { "epoch": 0.41, "learning_rate": 1.986452793750991e-05, "loss": 0.0179, "step": 28210 }, { "epoch": 0.41, "learning_rate": 1.986447989777144e-05, "loss": 0.0204, "step": 28220 }, { "epoch": 0.41, "learning_rate": 1.9864431858032965e-05, "loss": 0.0185, "step": 28230 }, { "epoch": 0.41, "learning_rate": 1.9864383818294494e-05, "loss": 0.0259, "step": 28240 }, { "epoch": 0.41, "learning_rate": 1.9864335778556023e-05, "loss": 0.0272, "step": 28250 }, { "epoch": 0.41, "learning_rate": 1.9864287738817553e-05, "loss": 0.0244, "step": 28260 }, { "epoch": 0.41, "learning_rate": 1.986423969907908e-05, "loss": 0.025, "step": 28270 }, { "epoch": 0.41, "learning_rate": 1.9864191659340608e-05, "loss": 0.0193, "step": 28280 }, { "epoch": 0.41, "learning_rate": 1.9864143619602137e-05, "loss": 0.0257, "step": 28290 }, { "epoch": 0.41, "learning_rate": 1.9864095579863666e-05, "loss": 0.026, "step": 28300 }, { "epoch": 0.41, "learning_rate": 1.9864047540125192e-05, "loss": 0.028, "step": 28310 }, { "epoch": 0.41, "learning_rate": 1.986399950038672e-05, "loss": 0.0196, "step": 28320 }, { "epoch": 0.41, "learning_rate": 1.986395146064825e-05, "loss": 0.0223, "step": 28330 }, { "epoch": 0.41, "learning_rate": 1.9863903420909777e-05, "loss": 0.0284, "step": 28340 }, { "epoch": 0.41, "learning_rate": 1.9863855381171306e-05, "loss": 0.0224, "step": 28350 }, { "epoch": 0.41, "learning_rate": 1.9863807341432835e-05, "loss": 0.024, "step": 28360 }, { "epoch": 0.41, "learning_rate": 1.9863759301694365e-05, "loss": 0.0241, "step": 28370 }, { "epoch": 0.41, "learning_rate": 1.986371126195589e-05, "loss": 0.0248, "step": 28380 }, { "epoch": 0.41, "learning_rate": 1.986366322221742e-05, "loss": 0.0236, "step": 28390 }, { "epoch": 0.41, "learning_rate": 1.986361518247895e-05, "loss": 0.0274, "step": 28400 }, { "epoch": 0.41, "learning_rate": 1.9863567142740475e-05, "loss": 0.0211, "step": 28410 }, { "epoch": 0.41, "learning_rate": 1.9863519103002004e-05, "loss": 0.028, "step": 28420 }, { "epoch": 0.41, "learning_rate": 1.9863471063263533e-05, "loss": 0.0216, "step": 28430 }, { "epoch": 0.41, "learning_rate": 1.9863423023525063e-05, "loss": 0.0301, "step": 28440 }, { "epoch": 0.41, "learning_rate": 1.986337498378659e-05, "loss": 0.0221, "step": 28450 }, { "epoch": 0.41, "learning_rate": 1.9863326944048118e-05, "loss": 0.0186, "step": 28460 }, { "epoch": 0.41, "learning_rate": 1.9863278904309647e-05, "loss": 0.0228, "step": 28470 }, { "epoch": 0.41, "learning_rate": 1.9863230864571176e-05, "loss": 0.0201, "step": 28480 }, { "epoch": 0.41, "learning_rate": 1.9863182824832702e-05, "loss": 0.0267, "step": 28490 }, { "epoch": 0.41, "learning_rate": 1.986313478509423e-05, "loss": 0.0206, "step": 28500 }, { "epoch": 0.41, "learning_rate": 1.986308674535576e-05, "loss": 0.0239, "step": 28510 }, { "epoch": 0.41, "learning_rate": 1.9863038705617287e-05, "loss": 0.0202, "step": 28520 }, { "epoch": 0.41, "learning_rate": 1.9862990665878816e-05, "loss": 0.0251, "step": 28530 }, { "epoch": 0.41, "learning_rate": 1.9862942626140345e-05, "loss": 0.0213, "step": 28540 }, { "epoch": 0.41, "learning_rate": 1.9862894586401874e-05, "loss": 0.0232, "step": 28550 }, { "epoch": 0.41, "learning_rate": 1.98628465466634e-05, "loss": 0.0208, "step": 28560 }, { "epoch": 0.41, "learning_rate": 1.986279850692493e-05, "loss": 0.0237, "step": 28570 }, { "epoch": 0.41, "learning_rate": 1.986275046718646e-05, "loss": 0.0216, "step": 28580 }, { "epoch": 0.41, "learning_rate": 1.9862702427447985e-05, "loss": 0.0256, "step": 28590 }, { "epoch": 0.41, "learning_rate": 1.9862654387709514e-05, "loss": 0.0269, "step": 28600 }, { "epoch": 0.41, "learning_rate": 1.9862606347971043e-05, "loss": 0.0207, "step": 28610 }, { "epoch": 0.41, "learning_rate": 1.9862558308232573e-05, "loss": 0.0219, "step": 28620 }, { "epoch": 0.41, "learning_rate": 1.98625102684941e-05, "loss": 0.0165, "step": 28630 }, { "epoch": 0.41, "learning_rate": 1.9862462228755628e-05, "loss": 0.023, "step": 28640 }, { "epoch": 0.41, "learning_rate": 1.9862414189017157e-05, "loss": 0.0257, "step": 28650 }, { "epoch": 0.41, "learning_rate": 1.9862366149278686e-05, "loss": 0.0201, "step": 28660 }, { "epoch": 0.41, "learning_rate": 1.9862318109540212e-05, "loss": 0.0198, "step": 28670 }, { "epoch": 0.41, "learning_rate": 1.986227006980174e-05, "loss": 0.0258, "step": 28680 }, { "epoch": 0.41, "learning_rate": 1.986222203006327e-05, "loss": 0.0226, "step": 28690 }, { "epoch": 0.41, "learning_rate": 1.9862173990324797e-05, "loss": 0.0179, "step": 28700 }, { "epoch": 0.41, "learning_rate": 1.9862125950586326e-05, "loss": 0.0231, "step": 28710 }, { "epoch": 0.41, "learning_rate": 1.9862077910847855e-05, "loss": 0.0328, "step": 28720 }, { "epoch": 0.41, "learning_rate": 1.9862029871109384e-05, "loss": 0.0226, "step": 28730 }, { "epoch": 0.41, "learning_rate": 1.986198183137091e-05, "loss": 0.0299, "step": 28740 }, { "epoch": 0.41, "learning_rate": 1.986193379163244e-05, "loss": 0.0207, "step": 28750 }, { "epoch": 0.41, "learning_rate": 1.986188575189397e-05, "loss": 0.0234, "step": 28760 }, { "epoch": 0.41, "learning_rate": 1.9861837712155495e-05, "loss": 0.0228, "step": 28770 }, { "epoch": 0.41, "learning_rate": 1.9861789672417024e-05, "loss": 0.0224, "step": 28780 }, { "epoch": 0.41, "learning_rate": 1.9861741632678553e-05, "loss": 0.0229, "step": 28790 }, { "epoch": 0.42, "learning_rate": 1.9861693592940082e-05, "loss": 0.0213, "step": 28800 }, { "epoch": 0.42, "learning_rate": 1.986164555320161e-05, "loss": 0.02, "step": 28810 }, { "epoch": 0.42, "learning_rate": 1.9861597513463138e-05, "loss": 0.018, "step": 28820 }, { "epoch": 0.42, "learning_rate": 1.9861549473724667e-05, "loss": 0.028, "step": 28830 }, { "epoch": 0.42, "learning_rate": 1.9861501433986196e-05, "loss": 0.023, "step": 28840 }, { "epoch": 0.42, "learning_rate": 1.9861453394247722e-05, "loss": 0.0287, "step": 28850 }, { "epoch": 0.42, "learning_rate": 1.986140535450925e-05, "loss": 0.023, "step": 28860 }, { "epoch": 0.42, "learning_rate": 1.986135731477078e-05, "loss": 0.023, "step": 28870 }, { "epoch": 0.42, "learning_rate": 1.9861309275032306e-05, "loss": 0.023, "step": 28880 }, { "epoch": 0.42, "learning_rate": 1.9861261235293836e-05, "loss": 0.026, "step": 28890 }, { "epoch": 0.42, "learning_rate": 1.9861213195555365e-05, "loss": 0.0269, "step": 28900 }, { "epoch": 0.42, "learning_rate": 1.9861165155816894e-05, "loss": 0.0202, "step": 28910 }, { "epoch": 0.42, "learning_rate": 1.986111711607842e-05, "loss": 0.0237, "step": 28920 }, { "epoch": 0.42, "learning_rate": 1.986106907633995e-05, "loss": 0.0212, "step": 28930 }, { "epoch": 0.42, "learning_rate": 1.986102103660148e-05, "loss": 0.0206, "step": 28940 }, { "epoch": 0.42, "learning_rate": 1.9860972996863005e-05, "loss": 0.0223, "step": 28950 }, { "epoch": 0.42, "learning_rate": 1.9860924957124534e-05, "loss": 0.0234, "step": 28960 }, { "epoch": 0.42, "learning_rate": 1.9860876917386063e-05, "loss": 0.0239, "step": 28970 }, { "epoch": 0.42, "learning_rate": 1.9860828877647592e-05, "loss": 0.02, "step": 28980 }, { "epoch": 0.42, "learning_rate": 1.9860780837909118e-05, "loss": 0.0272, "step": 28990 }, { "epoch": 0.42, "learning_rate": 1.9860732798170648e-05, "loss": 0.0218, "step": 29000 }, { "epoch": 0.42, "learning_rate": 1.9860684758432177e-05, "loss": 0.0276, "step": 29010 }, { "epoch": 0.42, "learning_rate": 1.9860636718693703e-05, "loss": 0.0211, "step": 29020 }, { "epoch": 0.42, "learning_rate": 1.9860588678955232e-05, "loss": 0.0234, "step": 29030 }, { "epoch": 0.42, "learning_rate": 1.986054063921676e-05, "loss": 0.0234, "step": 29040 }, { "epoch": 0.42, "learning_rate": 1.986049259947829e-05, "loss": 0.0272, "step": 29050 }, { "epoch": 0.42, "learning_rate": 1.9860444559739816e-05, "loss": 0.0243, "step": 29060 }, { "epoch": 0.42, "learning_rate": 1.9860396520001346e-05, "loss": 0.0272, "step": 29070 }, { "epoch": 0.42, "learning_rate": 1.9860348480262875e-05, "loss": 0.0226, "step": 29080 }, { "epoch": 0.42, "learning_rate": 1.9860300440524404e-05, "loss": 0.0201, "step": 29090 }, { "epoch": 0.42, "learning_rate": 1.986025240078593e-05, "loss": 0.0234, "step": 29100 }, { "epoch": 0.42, "learning_rate": 1.986020436104746e-05, "loss": 0.0178, "step": 29110 }, { "epoch": 0.42, "learning_rate": 1.986015632130899e-05, "loss": 0.0213, "step": 29120 }, { "epoch": 0.42, "learning_rate": 1.9860108281570514e-05, "loss": 0.019, "step": 29130 }, { "epoch": 0.42, "learning_rate": 1.9860060241832044e-05, "loss": 0.0194, "step": 29140 }, { "epoch": 0.42, "learning_rate": 1.9860012202093573e-05, "loss": 0.0227, "step": 29150 }, { "epoch": 0.42, "learning_rate": 1.9859964162355102e-05, "loss": 0.0281, "step": 29160 }, { "epoch": 0.42, "learning_rate": 1.9859916122616628e-05, "loss": 0.0224, "step": 29170 }, { "epoch": 0.42, "learning_rate": 1.9859868082878157e-05, "loss": 0.0225, "step": 29180 }, { "epoch": 0.42, "learning_rate": 1.9859820043139687e-05, "loss": 0.0201, "step": 29190 }, { "epoch": 0.42, "learning_rate": 1.9859772003401213e-05, "loss": 0.0227, "step": 29200 }, { "epoch": 0.42, "learning_rate": 1.9859723963662742e-05, "loss": 0.0235, "step": 29210 }, { "epoch": 0.42, "learning_rate": 1.985967592392427e-05, "loss": 0.0244, "step": 29220 }, { "epoch": 0.42, "learning_rate": 1.98596278841858e-05, "loss": 0.0178, "step": 29230 }, { "epoch": 0.42, "learning_rate": 1.9859579844447326e-05, "loss": 0.0243, "step": 29240 }, { "epoch": 0.42, "learning_rate": 1.9859531804708856e-05, "loss": 0.0309, "step": 29250 }, { "epoch": 0.42, "learning_rate": 1.9859483764970385e-05, "loss": 0.0246, "step": 29260 }, { "epoch": 0.42, "learning_rate": 1.9859435725231914e-05, "loss": 0.0164, "step": 29270 }, { "epoch": 0.42, "learning_rate": 1.985938768549344e-05, "loss": 0.0234, "step": 29280 }, { "epoch": 0.42, "learning_rate": 1.985933964575497e-05, "loss": 0.0228, "step": 29290 }, { "epoch": 0.42, "learning_rate": 1.98592916060165e-05, "loss": 0.0219, "step": 29300 }, { "epoch": 0.42, "learning_rate": 1.9859243566278024e-05, "loss": 0.0207, "step": 29310 }, { "epoch": 0.42, "learning_rate": 1.9859195526539554e-05, "loss": 0.0238, "step": 29320 }, { "epoch": 0.42, "learning_rate": 1.9859147486801083e-05, "loss": 0.0246, "step": 29330 }, { "epoch": 0.42, "learning_rate": 1.9859099447062612e-05, "loss": 0.0217, "step": 29340 }, { "epoch": 0.42, "learning_rate": 1.9859051407324138e-05, "loss": 0.0239, "step": 29350 }, { "epoch": 0.42, "learning_rate": 1.9859003367585667e-05, "loss": 0.0205, "step": 29360 }, { "epoch": 0.42, "learning_rate": 1.9858955327847197e-05, "loss": 0.0225, "step": 29370 }, { "epoch": 0.42, "learning_rate": 1.9858907288108723e-05, "loss": 0.0278, "step": 29380 }, { "epoch": 0.42, "learning_rate": 1.9858859248370252e-05, "loss": 0.0223, "step": 29390 }, { "epoch": 0.42, "learning_rate": 1.985881120863178e-05, "loss": 0.0207, "step": 29400 }, { "epoch": 0.42, "learning_rate": 1.985876316889331e-05, "loss": 0.0232, "step": 29410 }, { "epoch": 0.42, "learning_rate": 1.9858715129154836e-05, "loss": 0.0295, "step": 29420 }, { "epoch": 0.42, "learning_rate": 1.9858667089416365e-05, "loss": 0.0293, "step": 29430 }, { "epoch": 0.42, "learning_rate": 1.9858619049677895e-05, "loss": 0.0243, "step": 29440 }, { "epoch": 0.42, "learning_rate": 1.9858571009939424e-05, "loss": 0.0264, "step": 29450 }, { "epoch": 0.42, "learning_rate": 1.985852297020095e-05, "loss": 0.0204, "step": 29460 }, { "epoch": 0.42, "learning_rate": 1.985847493046248e-05, "loss": 0.0164, "step": 29470 }, { "epoch": 0.42, "learning_rate": 1.985842689072401e-05, "loss": 0.0249, "step": 29480 }, { "epoch": 0.43, "learning_rate": 1.9858378850985534e-05, "loss": 0.0185, "step": 29490 }, { "epoch": 0.43, "learning_rate": 1.9858330811247067e-05, "loss": 0.0158, "step": 29500 }, { "epoch": 0.43, "learning_rate": 1.9858282771508596e-05, "loss": 0.0222, "step": 29510 }, { "epoch": 0.43, "learning_rate": 1.9858234731770122e-05, "loss": 0.0167, "step": 29520 }, { "epoch": 0.43, "learning_rate": 1.985818669203165e-05, "loss": 0.022, "step": 29530 }, { "epoch": 0.43, "learning_rate": 1.985813865229318e-05, "loss": 0.0244, "step": 29540 }, { "epoch": 0.43, "learning_rate": 1.9858090612554707e-05, "loss": 0.0207, "step": 29550 }, { "epoch": 0.43, "learning_rate": 1.9858042572816236e-05, "loss": 0.0216, "step": 29560 }, { "epoch": 0.43, "learning_rate": 1.9857994533077765e-05, "loss": 0.0252, "step": 29570 }, { "epoch": 0.43, "learning_rate": 1.9857946493339294e-05, "loss": 0.0242, "step": 29580 }, { "epoch": 0.43, "learning_rate": 1.985789845360082e-05, "loss": 0.0294, "step": 29590 }, { "epoch": 0.43, "learning_rate": 1.985785041386235e-05, "loss": 0.0228, "step": 29600 }, { "epoch": 0.43, "learning_rate": 1.985780237412388e-05, "loss": 0.0307, "step": 29610 }, { "epoch": 0.43, "learning_rate": 1.9857754334385405e-05, "loss": 0.0214, "step": 29620 }, { "epoch": 0.43, "learning_rate": 1.9857706294646934e-05, "loss": 0.0215, "step": 29630 }, { "epoch": 0.43, "learning_rate": 1.9857658254908463e-05, "loss": 0.0198, "step": 29640 }, { "epoch": 0.43, "learning_rate": 1.9857610215169992e-05, "loss": 0.0329, "step": 29650 }, { "epoch": 0.43, "learning_rate": 1.985756217543152e-05, "loss": 0.0223, "step": 29660 }, { "epoch": 0.43, "learning_rate": 1.9857514135693048e-05, "loss": 0.0231, "step": 29670 }, { "epoch": 0.43, "learning_rate": 1.9857466095954577e-05, "loss": 0.0245, "step": 29680 }, { "epoch": 0.43, "learning_rate": 1.9857418056216106e-05, "loss": 0.02, "step": 29690 }, { "epoch": 0.43, "learning_rate": 1.9857370016477632e-05, "loss": 0.0277, "step": 29700 }, { "epoch": 0.43, "learning_rate": 1.985732197673916e-05, "loss": 0.0273, "step": 29710 }, { "epoch": 0.43, "learning_rate": 1.985727393700069e-05, "loss": 0.0247, "step": 29720 }, { "epoch": 0.43, "learning_rate": 1.9857225897262216e-05, "loss": 0.0328, "step": 29730 }, { "epoch": 0.43, "learning_rate": 1.9857177857523746e-05, "loss": 0.0224, "step": 29740 }, { "epoch": 0.43, "learning_rate": 1.9857129817785275e-05, "loss": 0.0264, "step": 29750 }, { "epoch": 0.43, "learning_rate": 1.9857081778046804e-05, "loss": 0.0218, "step": 29760 }, { "epoch": 0.43, "learning_rate": 1.985703373830833e-05, "loss": 0.0165, "step": 29770 }, { "epoch": 0.43, "learning_rate": 1.985698569856986e-05, "loss": 0.0226, "step": 29780 }, { "epoch": 0.43, "learning_rate": 1.985693765883139e-05, "loss": 0.0234, "step": 29790 }, { "epoch": 0.43, "learning_rate": 1.9856889619092915e-05, "loss": 0.0234, "step": 29800 }, { "epoch": 0.43, "learning_rate": 1.9856841579354444e-05, "loss": 0.0255, "step": 29810 }, { "epoch": 0.43, "learning_rate": 1.9856793539615973e-05, "loss": 0.0247, "step": 29820 }, { "epoch": 0.43, "learning_rate": 1.9856745499877502e-05, "loss": 0.024, "step": 29830 }, { "epoch": 0.43, "learning_rate": 1.9856697460139028e-05, "loss": 0.0195, "step": 29840 }, { "epoch": 0.43, "learning_rate": 1.9856649420400558e-05, "loss": 0.0256, "step": 29850 }, { "epoch": 0.43, "learning_rate": 1.9856601380662087e-05, "loss": 0.0258, "step": 29860 }, { "epoch": 0.43, "learning_rate": 1.9856553340923616e-05, "loss": 0.0218, "step": 29870 }, { "epoch": 0.43, "learning_rate": 1.9856505301185142e-05, "loss": 0.0252, "step": 29880 }, { "epoch": 0.43, "learning_rate": 1.985645726144667e-05, "loss": 0.02, "step": 29890 }, { "epoch": 0.43, "learning_rate": 1.98564092217082e-05, "loss": 0.0268, "step": 29900 }, { "epoch": 0.43, "learning_rate": 1.9856361181969726e-05, "loss": 0.021, "step": 29910 }, { "epoch": 0.43, "learning_rate": 1.9856313142231256e-05, "loss": 0.0207, "step": 29920 }, { "epoch": 0.43, "learning_rate": 1.9856265102492785e-05, "loss": 0.0215, "step": 29930 }, { "epoch": 0.43, "learning_rate": 1.9856217062754314e-05, "loss": 0.0167, "step": 29940 }, { "epoch": 0.43, "learning_rate": 1.985616902301584e-05, "loss": 0.0221, "step": 29950 }, { "epoch": 0.43, "learning_rate": 1.985612098327737e-05, "loss": 0.0207, "step": 29960 }, { "epoch": 0.43, "learning_rate": 1.98560729435389e-05, "loss": 0.0229, "step": 29970 }, { "epoch": 0.43, "learning_rate": 1.9856024903800424e-05, "loss": 0.0269, "step": 29980 }, { "epoch": 0.43, "learning_rate": 1.9855976864061954e-05, "loss": 0.0212, "step": 29990 }, { "epoch": 0.43, "learning_rate": 1.9855928824323483e-05, "loss": 0.0227, "step": 30000 }, { "epoch": 0.43, "learning_rate": 1.9855880784585012e-05, "loss": 0.0252, "step": 30010 }, { "epoch": 0.43, "learning_rate": 1.9855832744846538e-05, "loss": 0.019, "step": 30020 }, { "epoch": 0.43, "learning_rate": 1.9855784705108067e-05, "loss": 0.0211, "step": 30030 }, { "epoch": 0.43, "learning_rate": 1.9855736665369597e-05, "loss": 0.0212, "step": 30040 }, { "epoch": 0.43, "learning_rate": 1.9855688625631126e-05, "loss": 0.0216, "step": 30050 }, { "epoch": 0.43, "learning_rate": 1.9855640585892652e-05, "loss": 0.0242, "step": 30060 }, { "epoch": 0.43, "learning_rate": 1.985559254615418e-05, "loss": 0.022, "step": 30070 }, { "epoch": 0.43, "learning_rate": 1.985554450641571e-05, "loss": 0.0164, "step": 30080 }, { "epoch": 0.43, "learning_rate": 1.9855496466677236e-05, "loss": 0.025, "step": 30090 }, { "epoch": 0.43, "learning_rate": 1.9855448426938766e-05, "loss": 0.0174, "step": 30100 }, { "epoch": 0.43, "learning_rate": 1.9855400387200295e-05, "loss": 0.0206, "step": 30110 }, { "epoch": 0.43, "learning_rate": 1.9855352347461824e-05, "loss": 0.0258, "step": 30120 }, { "epoch": 0.43, "learning_rate": 1.985530430772335e-05, "loss": 0.0185, "step": 30130 }, { "epoch": 0.43, "learning_rate": 1.985525626798488e-05, "loss": 0.024, "step": 30140 }, { "epoch": 0.43, "learning_rate": 1.985520822824641e-05, "loss": 0.023, "step": 30150 }, { "epoch": 0.43, "learning_rate": 1.9855160188507934e-05, "loss": 0.0263, "step": 30160 }, { "epoch": 0.43, "learning_rate": 1.9855112148769464e-05, "loss": 0.0221, "step": 30170 }, { "epoch": 0.43, "learning_rate": 1.9855064109030993e-05, "loss": 0.0223, "step": 30180 }, { "epoch": 0.44, "learning_rate": 1.9855016069292522e-05, "loss": 0.027, "step": 30190 }, { "epoch": 0.44, "learning_rate": 1.9854968029554048e-05, "loss": 0.0197, "step": 30200 }, { "epoch": 0.44, "learning_rate": 1.9854919989815577e-05, "loss": 0.019, "step": 30210 }, { "epoch": 0.44, "learning_rate": 1.9854871950077107e-05, "loss": 0.0212, "step": 30220 }, { "epoch": 0.44, "learning_rate": 1.9854823910338636e-05, "loss": 0.0278, "step": 30230 }, { "epoch": 0.44, "learning_rate": 1.9854775870600162e-05, "loss": 0.0322, "step": 30240 }, { "epoch": 0.44, "learning_rate": 1.985472783086169e-05, "loss": 0.0251, "step": 30250 }, { "epoch": 0.44, "learning_rate": 1.985467979112322e-05, "loss": 0.0346, "step": 30260 }, { "epoch": 0.44, "learning_rate": 1.9854631751384746e-05, "loss": 0.02, "step": 30270 }, { "epoch": 0.44, "learning_rate": 1.9854583711646275e-05, "loss": 0.0234, "step": 30280 }, { "epoch": 0.44, "learning_rate": 1.9854535671907805e-05, "loss": 0.0226, "step": 30290 }, { "epoch": 0.44, "learning_rate": 1.985449243614318e-05, "loss": 0.025, "step": 30300 }, { "epoch": 0.44, "learning_rate": 1.985444439640471e-05, "loss": 0.0251, "step": 30310 }, { "epoch": 0.44, "learning_rate": 1.9854396356666238e-05, "loss": 0.0219, "step": 30320 }, { "epoch": 0.44, "learning_rate": 1.9854348316927764e-05, "loss": 0.025, "step": 30330 }, { "epoch": 0.44, "learning_rate": 1.9854300277189293e-05, "loss": 0.0231, "step": 30340 }, { "epoch": 0.44, "learning_rate": 1.9854252237450822e-05, "loss": 0.0217, "step": 30350 }, { "epoch": 0.44, "learning_rate": 1.985420419771235e-05, "loss": 0.0233, "step": 30360 }, { "epoch": 0.44, "learning_rate": 1.9854156157973877e-05, "loss": 0.0256, "step": 30370 }, { "epoch": 0.44, "learning_rate": 1.9854108118235407e-05, "loss": 0.0158, "step": 30380 }, { "epoch": 0.44, "learning_rate": 1.9854060078496936e-05, "loss": 0.0171, "step": 30390 }, { "epoch": 0.44, "learning_rate": 1.9854012038758462e-05, "loss": 0.0234, "step": 30400 }, { "epoch": 0.44, "learning_rate": 1.985396399901999e-05, "loss": 0.0259, "step": 30410 }, { "epoch": 0.44, "learning_rate": 1.985391595928152e-05, "loss": 0.0256, "step": 30420 }, { "epoch": 0.44, "learning_rate": 1.985386791954305e-05, "loss": 0.022, "step": 30430 }, { "epoch": 0.44, "learning_rate": 1.9853819879804576e-05, "loss": 0.0192, "step": 30440 }, { "epoch": 0.44, "learning_rate": 1.9853771840066105e-05, "loss": 0.0174, "step": 30450 }, { "epoch": 0.44, "learning_rate": 1.9853723800327634e-05, "loss": 0.0181, "step": 30460 }, { "epoch": 0.44, "learning_rate": 1.985367576058916e-05, "loss": 0.0228, "step": 30470 }, { "epoch": 0.44, "learning_rate": 1.985362772085069e-05, "loss": 0.0227, "step": 30480 }, { "epoch": 0.44, "learning_rate": 1.985357968111222e-05, "loss": 0.0308, "step": 30490 }, { "epoch": 0.44, "learning_rate": 1.9853531641373748e-05, "loss": 0.0177, "step": 30500 }, { "epoch": 0.44, "learning_rate": 1.9853483601635274e-05, "loss": 0.019, "step": 30510 }, { "epoch": 0.44, "learning_rate": 1.9853435561896803e-05, "loss": 0.025, "step": 30520 }, { "epoch": 0.44, "learning_rate": 1.9853387522158332e-05, "loss": 0.0241, "step": 30530 }, { "epoch": 0.44, "learning_rate": 1.985333948241986e-05, "loss": 0.0272, "step": 30540 }, { "epoch": 0.44, "learning_rate": 1.9853291442681387e-05, "loss": 0.0166, "step": 30550 }, { "epoch": 0.44, "learning_rate": 1.9853243402942917e-05, "loss": 0.0194, "step": 30560 }, { "epoch": 0.44, "learning_rate": 1.9853195363204446e-05, "loss": 0.0266, "step": 30570 }, { "epoch": 0.44, "learning_rate": 1.9853147323465972e-05, "loss": 0.0181, "step": 30580 }, { "epoch": 0.44, "learning_rate": 1.98530992837275e-05, "loss": 0.0214, "step": 30590 }, { "epoch": 0.44, "learning_rate": 1.985305124398903e-05, "loss": 0.0233, "step": 30600 }, { "epoch": 0.44, "learning_rate": 1.985300320425056e-05, "loss": 0.0227, "step": 30610 }, { "epoch": 0.44, "learning_rate": 1.9852955164512086e-05, "loss": 0.0245, "step": 30620 }, { "epoch": 0.44, "learning_rate": 1.9852907124773615e-05, "loss": 0.0196, "step": 30630 }, { "epoch": 0.44, "learning_rate": 1.9852859085035144e-05, "loss": 0.0165, "step": 30640 }, { "epoch": 0.44, "learning_rate": 1.985281104529667e-05, "loss": 0.0237, "step": 30650 }, { "epoch": 0.44, "learning_rate": 1.98527630055582e-05, "loss": 0.0218, "step": 30660 }, { "epoch": 0.44, "learning_rate": 1.985271496581973e-05, "loss": 0.0257, "step": 30670 }, { "epoch": 0.44, "learning_rate": 1.9852666926081258e-05, "loss": 0.0267, "step": 30680 }, { "epoch": 0.44, "learning_rate": 1.9852618886342784e-05, "loss": 0.0222, "step": 30690 }, { "epoch": 0.44, "learning_rate": 1.9852570846604313e-05, "loss": 0.023, "step": 30700 }, { "epoch": 0.44, "learning_rate": 1.9852522806865842e-05, "loss": 0.0262, "step": 30710 }, { "epoch": 0.44, "learning_rate": 1.985247476712737e-05, "loss": 0.0159, "step": 30720 }, { "epoch": 0.44, "learning_rate": 1.9852426727388897e-05, "loss": 0.0203, "step": 30730 }, { "epoch": 0.44, "learning_rate": 1.9852378687650427e-05, "loss": 0.0176, "step": 30740 }, { "epoch": 0.44, "learning_rate": 1.9852330647911956e-05, "loss": 0.0195, "step": 30750 }, { "epoch": 0.44, "learning_rate": 1.9852282608173482e-05, "loss": 0.0213, "step": 30760 }, { "epoch": 0.44, "learning_rate": 1.985223456843501e-05, "loss": 0.0255, "step": 30770 }, { "epoch": 0.44, "learning_rate": 1.985218652869654e-05, "loss": 0.0207, "step": 30780 }, { "epoch": 0.44, "learning_rate": 1.985213848895807e-05, "loss": 0.0154, "step": 30790 }, { "epoch": 0.44, "learning_rate": 1.9852090449219595e-05, "loss": 0.0206, "step": 30800 }, { "epoch": 0.44, "learning_rate": 1.9852042409481125e-05, "loss": 0.0259, "step": 30810 }, { "epoch": 0.44, "learning_rate": 1.9851994369742654e-05, "loss": 0.0203, "step": 30820 }, { "epoch": 0.44, "learning_rate": 1.985194633000418e-05, "loss": 0.0204, "step": 30830 }, { "epoch": 0.44, "learning_rate": 1.985189829026571e-05, "loss": 0.0153, "step": 30840 }, { "epoch": 0.44, "learning_rate": 1.985185025052724e-05, "loss": 0.0249, "step": 30850 }, { "epoch": 0.44, "learning_rate": 1.9851802210788768e-05, "loss": 0.026, "step": 30860 }, { "epoch": 0.44, "learning_rate": 1.9851754171050294e-05, "loss": 0.0242, "step": 30870 }, { "epoch": 0.45, "learning_rate": 1.9851706131311823e-05, "loss": 0.0236, "step": 30880 }, { "epoch": 0.45, "learning_rate": 1.9851658091573352e-05, "loss": 0.023, "step": 30890 }, { "epoch": 0.45, "learning_rate": 1.985161005183488e-05, "loss": 0.0207, "step": 30900 }, { "epoch": 0.45, "learning_rate": 1.9851562012096407e-05, "loss": 0.0266, "step": 30910 }, { "epoch": 0.45, "learning_rate": 1.9851513972357937e-05, "loss": 0.0203, "step": 30920 }, { "epoch": 0.45, "learning_rate": 1.9851465932619466e-05, "loss": 0.0258, "step": 30930 }, { "epoch": 0.45, "learning_rate": 1.985141789288099e-05, "loss": 0.0205, "step": 30940 }, { "epoch": 0.45, "learning_rate": 1.985136985314252e-05, "loss": 0.0248, "step": 30950 }, { "epoch": 0.45, "learning_rate": 1.985132181340405e-05, "loss": 0.0227, "step": 30960 }, { "epoch": 0.45, "learning_rate": 1.985127377366558e-05, "loss": 0.0226, "step": 30970 }, { "epoch": 0.45, "learning_rate": 1.9851225733927105e-05, "loss": 0.0198, "step": 30980 }, { "epoch": 0.45, "learning_rate": 1.9851177694188635e-05, "loss": 0.0281, "step": 30990 }, { "epoch": 0.45, "learning_rate": 1.9851129654450164e-05, "loss": 0.0301, "step": 31000 }, { "epoch": 0.45, "learning_rate": 1.985108161471169e-05, "loss": 0.029, "step": 31010 }, { "epoch": 0.45, "learning_rate": 1.985103357497322e-05, "loss": 0.0291, "step": 31020 }, { "epoch": 0.45, "learning_rate": 1.985098553523475e-05, "loss": 0.0251, "step": 31030 }, { "epoch": 0.45, "learning_rate": 1.9850937495496278e-05, "loss": 0.0163, "step": 31040 }, { "epoch": 0.45, "learning_rate": 1.9850889455757803e-05, "loss": 0.0262, "step": 31050 }, { "epoch": 0.45, "learning_rate": 1.9850841416019333e-05, "loss": 0.0139, "step": 31060 }, { "epoch": 0.45, "learning_rate": 1.9850793376280862e-05, "loss": 0.0235, "step": 31070 }, { "epoch": 0.45, "learning_rate": 1.985074533654239e-05, "loss": 0.0333, "step": 31080 }, { "epoch": 0.45, "learning_rate": 1.9850697296803917e-05, "loss": 0.0264, "step": 31090 }, { "epoch": 0.45, "learning_rate": 1.9850649257065446e-05, "loss": 0.0224, "step": 31100 }, { "epoch": 0.45, "learning_rate": 1.9850601217326976e-05, "loss": 0.0201, "step": 31110 }, { "epoch": 0.45, "learning_rate": 1.98505531775885e-05, "loss": 0.0227, "step": 31120 }, { "epoch": 0.45, "learning_rate": 1.985050513785003e-05, "loss": 0.0227, "step": 31130 }, { "epoch": 0.45, "learning_rate": 1.985045709811156e-05, "loss": 0.0161, "step": 31140 }, { "epoch": 0.45, "learning_rate": 1.985040905837309e-05, "loss": 0.0219, "step": 31150 }, { "epoch": 0.45, "learning_rate": 1.9850361018634615e-05, "loss": 0.0334, "step": 31160 }, { "epoch": 0.45, "learning_rate": 1.9850312978896145e-05, "loss": 0.0206, "step": 31170 }, { "epoch": 0.45, "learning_rate": 1.9850264939157674e-05, "loss": 0.0214, "step": 31180 }, { "epoch": 0.45, "learning_rate": 1.98502168994192e-05, "loss": 0.0218, "step": 31190 }, { "epoch": 0.45, "learning_rate": 1.985016885968073e-05, "loss": 0.0195, "step": 31200 }, { "epoch": 0.45, "learning_rate": 1.9850120819942258e-05, "loss": 0.0207, "step": 31210 }, { "epoch": 0.45, "learning_rate": 1.9850072780203787e-05, "loss": 0.022, "step": 31220 }, { "epoch": 0.45, "learning_rate": 1.9850024740465313e-05, "loss": 0.0171, "step": 31230 }, { "epoch": 0.45, "learning_rate": 1.9849976700726843e-05, "loss": 0.0194, "step": 31240 }, { "epoch": 0.45, "learning_rate": 1.9849928660988372e-05, "loss": 0.0229, "step": 31250 }, { "epoch": 0.45, "learning_rate": 1.98498806212499e-05, "loss": 0.02, "step": 31260 }, { "epoch": 0.45, "learning_rate": 1.9849832581511427e-05, "loss": 0.0195, "step": 31270 }, { "epoch": 0.45, "learning_rate": 1.9849784541772956e-05, "loss": 0.0223, "step": 31280 }, { "epoch": 0.45, "learning_rate": 1.9849736502034486e-05, "loss": 0.0218, "step": 31290 }, { "epoch": 0.45, "learning_rate": 1.984968846229601e-05, "loss": 0.0226, "step": 31300 }, { "epoch": 0.45, "learning_rate": 1.984964042255754e-05, "loss": 0.0203, "step": 31310 }, { "epoch": 0.45, "learning_rate": 1.984959238281907e-05, "loss": 0.0251, "step": 31320 }, { "epoch": 0.45, "learning_rate": 1.98495443430806e-05, "loss": 0.0216, "step": 31330 }, { "epoch": 0.45, "learning_rate": 1.9849496303342125e-05, "loss": 0.0259, "step": 31340 }, { "epoch": 0.45, "learning_rate": 1.9849448263603654e-05, "loss": 0.0186, "step": 31350 }, { "epoch": 0.45, "learning_rate": 1.9849400223865184e-05, "loss": 0.0191, "step": 31360 }, { "epoch": 0.45, "learning_rate": 1.984935218412671e-05, "loss": 0.0194, "step": 31370 }, { "epoch": 0.45, "learning_rate": 1.984930414438824e-05, "loss": 0.0235, "step": 31380 }, { "epoch": 0.45, "learning_rate": 1.9849256104649768e-05, "loss": 0.0194, "step": 31390 }, { "epoch": 0.45, "learning_rate": 1.9849208064911297e-05, "loss": 0.0238, "step": 31400 }, { "epoch": 0.45, "learning_rate": 1.9849160025172823e-05, "loss": 0.0238, "step": 31410 }, { "epoch": 0.45, "learning_rate": 1.9849111985434353e-05, "loss": 0.0226, "step": 31420 }, { "epoch": 0.45, "learning_rate": 1.9849063945695882e-05, "loss": 0.0226, "step": 31430 }, { "epoch": 0.45, "learning_rate": 1.984901590595741e-05, "loss": 0.0251, "step": 31440 }, { "epoch": 0.45, "learning_rate": 1.9848967866218937e-05, "loss": 0.0299, "step": 31450 }, { "epoch": 0.45, "learning_rate": 1.9848919826480466e-05, "loss": 0.0217, "step": 31460 }, { "epoch": 0.45, "learning_rate": 1.9848871786741996e-05, "loss": 0.0246, "step": 31470 }, { "epoch": 0.45, "learning_rate": 1.984882374700352e-05, "loss": 0.0214, "step": 31480 }, { "epoch": 0.45, "learning_rate": 1.984877570726505e-05, "loss": 0.0207, "step": 31490 }, { "epoch": 0.45, "learning_rate": 1.984872766752658e-05, "loss": 0.022, "step": 31500 }, { "epoch": 0.45, "learning_rate": 1.984867962778811e-05, "loss": 0.0208, "step": 31510 }, { "epoch": 0.45, "learning_rate": 1.9848631588049635e-05, "loss": 0.0223, "step": 31520 }, { "epoch": 0.45, "learning_rate": 1.9848583548311164e-05, "loss": 0.0202, "step": 31530 }, { "epoch": 0.45, "learning_rate": 1.9848535508572694e-05, "loss": 0.0225, "step": 31540 }, { "epoch": 0.45, "learning_rate": 1.984848746883422e-05, "loss": 0.0259, "step": 31550 }, { "epoch": 0.45, "learning_rate": 1.984843942909575e-05, "loss": 0.0213, "step": 31560 }, { "epoch": 0.45, "learning_rate": 1.9848391389357278e-05, "loss": 0.0158, "step": 31570 }, { "epoch": 0.46, "learning_rate": 1.9848343349618807e-05, "loss": 0.0249, "step": 31580 }, { "epoch": 0.46, "learning_rate": 1.9848295309880333e-05, "loss": 0.0218, "step": 31590 }, { "epoch": 0.46, "learning_rate": 1.9848247270141862e-05, "loss": 0.0216, "step": 31600 }, { "epoch": 0.46, "learning_rate": 1.9848199230403392e-05, "loss": 0.0231, "step": 31610 }, { "epoch": 0.46, "learning_rate": 1.984815119066492e-05, "loss": 0.0206, "step": 31620 }, { "epoch": 0.46, "learning_rate": 1.9848103150926447e-05, "loss": 0.0232, "step": 31630 }, { "epoch": 0.46, "learning_rate": 1.9848055111187976e-05, "loss": 0.0148, "step": 31640 }, { "epoch": 0.46, "learning_rate": 1.9848007071449505e-05, "loss": 0.0214, "step": 31650 }, { "epoch": 0.46, "learning_rate": 1.984795903171103e-05, "loss": 0.0177, "step": 31660 }, { "epoch": 0.46, "learning_rate": 1.984791099197256e-05, "loss": 0.0257, "step": 31670 }, { "epoch": 0.46, "learning_rate": 1.984786295223409e-05, "loss": 0.0219, "step": 31680 }, { "epoch": 0.46, "learning_rate": 1.984781491249562e-05, "loss": 0.0178, "step": 31690 }, { "epoch": 0.46, "learning_rate": 1.9847766872757145e-05, "loss": 0.0198, "step": 31700 }, { "epoch": 0.46, "learning_rate": 1.9847718833018674e-05, "loss": 0.0214, "step": 31710 }, { "epoch": 0.46, "learning_rate": 1.9847670793280204e-05, "loss": 0.0208, "step": 31720 }, { "epoch": 0.46, "learning_rate": 1.984762275354173e-05, "loss": 0.0203, "step": 31730 }, { "epoch": 0.46, "learning_rate": 1.984757471380326e-05, "loss": 0.0228, "step": 31740 }, { "epoch": 0.46, "learning_rate": 1.9847526674064788e-05, "loss": 0.0188, "step": 31750 }, { "epoch": 0.46, "learning_rate": 1.9847478634326317e-05, "loss": 0.0179, "step": 31760 }, { "epoch": 0.46, "learning_rate": 1.9847430594587843e-05, "loss": 0.0234, "step": 31770 }, { "epoch": 0.46, "learning_rate": 1.9847382554849372e-05, "loss": 0.0252, "step": 31780 }, { "epoch": 0.46, "learning_rate": 1.98473345151109e-05, "loss": 0.0235, "step": 31790 }, { "epoch": 0.46, "learning_rate": 1.984728647537243e-05, "loss": 0.0237, "step": 31800 }, { "epoch": 0.46, "learning_rate": 1.9847238435633957e-05, "loss": 0.018, "step": 31810 }, { "epoch": 0.46, "learning_rate": 1.9847190395895486e-05, "loss": 0.0222, "step": 31820 }, { "epoch": 0.46, "learning_rate": 1.9847142356157015e-05, "loss": 0.0264, "step": 31830 }, { "epoch": 0.46, "learning_rate": 1.984709431641854e-05, "loss": 0.0233, "step": 31840 }, { "epoch": 0.46, "learning_rate": 1.984704627668007e-05, "loss": 0.0232, "step": 31850 }, { "epoch": 0.46, "learning_rate": 1.98469982369416e-05, "loss": 0.0178, "step": 31860 }, { "epoch": 0.46, "learning_rate": 1.984695019720313e-05, "loss": 0.0235, "step": 31870 }, { "epoch": 0.46, "learning_rate": 1.9846902157464655e-05, "loss": 0.0216, "step": 31880 }, { "epoch": 0.46, "learning_rate": 1.9846854117726184e-05, "loss": 0.0219, "step": 31890 }, { "epoch": 0.46, "learning_rate": 1.9846806077987713e-05, "loss": 0.0251, "step": 31900 }, { "epoch": 0.46, "learning_rate": 1.984675803824924e-05, "loss": 0.0283, "step": 31910 }, { "epoch": 0.46, "learning_rate": 1.984670999851077e-05, "loss": 0.0205, "step": 31920 }, { "epoch": 0.46, "learning_rate": 1.9846661958772298e-05, "loss": 0.019, "step": 31930 }, { "epoch": 0.46, "learning_rate": 1.9846613919033827e-05, "loss": 0.0186, "step": 31940 }, { "epoch": 0.46, "learning_rate": 1.9846565879295353e-05, "loss": 0.0256, "step": 31950 }, { "epoch": 0.46, "learning_rate": 1.9846517839556882e-05, "loss": 0.0202, "step": 31960 }, { "epoch": 0.46, "learning_rate": 1.984646979981841e-05, "loss": 0.0245, "step": 31970 }, { "epoch": 0.46, "learning_rate": 1.9846421760079937e-05, "loss": 0.0204, "step": 31980 }, { "epoch": 0.46, "learning_rate": 1.9846373720341467e-05, "loss": 0.0221, "step": 31990 }, { "epoch": 0.46, "learning_rate": 1.9846325680602996e-05, "loss": 0.0196, "step": 32000 }, { "epoch": 0.46, "learning_rate": 1.9846277640864525e-05, "loss": 0.0193, "step": 32010 }, { "epoch": 0.46, "learning_rate": 1.984622960112605e-05, "loss": 0.0239, "step": 32020 }, { "epoch": 0.46, "learning_rate": 1.984618156138758e-05, "loss": 0.0291, "step": 32030 }, { "epoch": 0.46, "learning_rate": 1.984613352164911e-05, "loss": 0.025, "step": 32040 }, { "epoch": 0.46, "learning_rate": 1.984608548191064e-05, "loss": 0.0243, "step": 32050 }, { "epoch": 0.46, "learning_rate": 1.9846037442172165e-05, "loss": 0.0216, "step": 32060 }, { "epoch": 0.46, "learning_rate": 1.9845989402433694e-05, "loss": 0.0214, "step": 32070 }, { "epoch": 0.46, "learning_rate": 1.9845941362695223e-05, "loss": 0.0218, "step": 32080 }, { "epoch": 0.46, "learning_rate": 1.984589332295675e-05, "loss": 0.0323, "step": 32090 }, { "epoch": 0.46, "learning_rate": 1.984584528321828e-05, "loss": 0.0248, "step": 32100 }, { "epoch": 0.46, "learning_rate": 1.9845797243479808e-05, "loss": 0.0232, "step": 32110 }, { "epoch": 0.46, "learning_rate": 1.9845749203741337e-05, "loss": 0.0276, "step": 32120 }, { "epoch": 0.46, "learning_rate": 1.9845701164002863e-05, "loss": 0.0273, "step": 32130 }, { "epoch": 0.46, "learning_rate": 1.9845653124264392e-05, "loss": 0.0186, "step": 32140 }, { "epoch": 0.46, "learning_rate": 1.984560508452592e-05, "loss": 0.0224, "step": 32150 }, { "epoch": 0.46, "learning_rate": 1.9845557044787447e-05, "loss": 0.027, "step": 32160 }, { "epoch": 0.46, "learning_rate": 1.9845509005048977e-05, "loss": 0.0191, "step": 32170 }, { "epoch": 0.46, "learning_rate": 1.9845460965310506e-05, "loss": 0.0218, "step": 32180 }, { "epoch": 0.46, "learning_rate": 1.9845412925572035e-05, "loss": 0.0231, "step": 32190 }, { "epoch": 0.46, "learning_rate": 1.984536488583356e-05, "loss": 0.0251, "step": 32200 }, { "epoch": 0.46, "learning_rate": 1.984531684609509e-05, "loss": 0.0264, "step": 32210 }, { "epoch": 0.46, "learning_rate": 1.984526880635662e-05, "loss": 0.0245, "step": 32220 }, { "epoch": 0.46, "learning_rate": 1.984522076661815e-05, "loss": 0.0211, "step": 32230 }, { "epoch": 0.46, "learning_rate": 1.9845172726879675e-05, "loss": 0.0216, "step": 32240 }, { "epoch": 0.46, "learning_rate": 1.9845124687141204e-05, "loss": 0.0224, "step": 32250 }, { "epoch": 0.46, "learning_rate": 1.9845076647402733e-05, "loss": 0.0208, "step": 32260 }, { "epoch": 0.47, "learning_rate": 1.984502860766426e-05, "loss": 0.0173, "step": 32270 }, { "epoch": 0.47, "learning_rate": 1.984498056792579e-05, "loss": 0.0251, "step": 32280 }, { "epoch": 0.47, "learning_rate": 1.9844932528187318e-05, "loss": 0.022, "step": 32290 }, { "epoch": 0.47, "learning_rate": 1.9844884488448847e-05, "loss": 0.0293, "step": 32300 }, { "epoch": 0.47, "learning_rate": 1.9844836448710373e-05, "loss": 0.0184, "step": 32310 }, { "epoch": 0.47, "learning_rate": 1.9844788408971902e-05, "loss": 0.0205, "step": 32320 }, { "epoch": 0.47, "learning_rate": 1.984474036923343e-05, "loss": 0.0142, "step": 32330 }, { "epoch": 0.47, "learning_rate": 1.9844692329494957e-05, "loss": 0.0245, "step": 32340 }, { "epoch": 0.47, "learning_rate": 1.9844644289756487e-05, "loss": 0.0274, "step": 32350 }, { "epoch": 0.47, "learning_rate": 1.9844596250018016e-05, "loss": 0.0242, "step": 32360 }, { "epoch": 0.47, "learning_rate": 1.9844548210279545e-05, "loss": 0.0275, "step": 32370 }, { "epoch": 0.47, "learning_rate": 1.984450017054107e-05, "loss": 0.0181, "step": 32380 }, { "epoch": 0.47, "learning_rate": 1.98444521308026e-05, "loss": 0.0206, "step": 32390 }, { "epoch": 0.47, "learning_rate": 1.984440409106413e-05, "loss": 0.0259, "step": 32400 }, { "epoch": 0.47, "learning_rate": 1.984435605132566e-05, "loss": 0.0195, "step": 32410 }, { "epoch": 0.47, "learning_rate": 1.9844308011587185e-05, "loss": 0.0221, "step": 32420 }, { "epoch": 0.47, "learning_rate": 1.9844259971848714e-05, "loss": 0.0219, "step": 32430 }, { "epoch": 0.47, "learning_rate": 1.9844211932110243e-05, "loss": 0.0194, "step": 32440 }, { "epoch": 0.47, "learning_rate": 1.984416389237177e-05, "loss": 0.0228, "step": 32450 }, { "epoch": 0.47, "learning_rate": 1.98441158526333e-05, "loss": 0.0256, "step": 32460 }, { "epoch": 0.47, "learning_rate": 1.9844067812894828e-05, "loss": 0.028, "step": 32470 }, { "epoch": 0.47, "learning_rate": 1.9844019773156357e-05, "loss": 0.0244, "step": 32480 }, { "epoch": 0.47, "learning_rate": 1.9843971733417883e-05, "loss": 0.0158, "step": 32490 }, { "epoch": 0.47, "learning_rate": 1.9843923693679412e-05, "loss": 0.0182, "step": 32500 }, { "epoch": 0.47, "learning_rate": 1.984387565394094e-05, "loss": 0.0248, "step": 32510 }, { "epoch": 0.47, "learning_rate": 1.9843827614202467e-05, "loss": 0.0192, "step": 32520 }, { "epoch": 0.47, "learning_rate": 1.9843779574463996e-05, "loss": 0.0257, "step": 32530 }, { "epoch": 0.47, "learning_rate": 1.9843736338699375e-05, "loss": 0.0232, "step": 32540 }, { "epoch": 0.47, "learning_rate": 1.98436882989609e-05, "loss": 0.0218, "step": 32550 }, { "epoch": 0.47, "learning_rate": 1.984364025922243e-05, "loss": 0.023, "step": 32560 }, { "epoch": 0.47, "learning_rate": 1.984359221948396e-05, "loss": 0.0241, "step": 32570 }, { "epoch": 0.47, "learning_rate": 1.9843544179745485e-05, "loss": 0.0243, "step": 32580 }, { "epoch": 0.47, "learning_rate": 1.9843496140007014e-05, "loss": 0.0182, "step": 32590 }, { "epoch": 0.47, "learning_rate": 1.9843448100268543e-05, "loss": 0.0191, "step": 32600 }, { "epoch": 0.47, "learning_rate": 1.9843400060530073e-05, "loss": 0.0206, "step": 32610 }, { "epoch": 0.47, "learning_rate": 1.98433520207916e-05, "loss": 0.0229, "step": 32620 }, { "epoch": 0.47, "learning_rate": 1.9843303981053128e-05, "loss": 0.0204, "step": 32630 }, { "epoch": 0.47, "learning_rate": 1.9843255941314657e-05, "loss": 0.0218, "step": 32640 }, { "epoch": 0.47, "learning_rate": 1.9843207901576186e-05, "loss": 0.0274, "step": 32650 }, { "epoch": 0.47, "learning_rate": 1.9843159861837712e-05, "loss": 0.023, "step": 32660 }, { "epoch": 0.47, "learning_rate": 1.984311182209924e-05, "loss": 0.024, "step": 32670 }, { "epoch": 0.47, "learning_rate": 1.984306378236077e-05, "loss": 0.037, "step": 32680 }, { "epoch": 0.47, "learning_rate": 1.9843015742622297e-05, "loss": 0.0188, "step": 32690 }, { "epoch": 0.47, "learning_rate": 1.9842967702883826e-05, "loss": 0.0245, "step": 32700 }, { "epoch": 0.47, "learning_rate": 1.9842919663145355e-05, "loss": 0.0239, "step": 32710 }, { "epoch": 0.47, "learning_rate": 1.9842871623406884e-05, "loss": 0.019, "step": 32720 }, { "epoch": 0.47, "learning_rate": 1.984282358366841e-05, "loss": 0.0266, "step": 32730 }, { "epoch": 0.47, "learning_rate": 1.984277554392994e-05, "loss": 0.0239, "step": 32740 }, { "epoch": 0.47, "learning_rate": 1.984272750419147e-05, "loss": 0.0247, "step": 32750 }, { "epoch": 0.47, "learning_rate": 1.9842679464452995e-05, "loss": 0.0207, "step": 32760 }, { "epoch": 0.47, "learning_rate": 1.9842631424714524e-05, "loss": 0.0203, "step": 32770 }, { "epoch": 0.47, "learning_rate": 1.9842583384976053e-05, "loss": 0.0213, "step": 32780 }, { "epoch": 0.47, "learning_rate": 1.9842535345237583e-05, "loss": 0.0187, "step": 32790 }, { "epoch": 0.47, "learning_rate": 1.984248730549911e-05, "loss": 0.0192, "step": 32800 }, { "epoch": 0.47, "learning_rate": 1.9842439265760638e-05, "loss": 0.0194, "step": 32810 }, { "epoch": 0.47, "learning_rate": 1.9842391226022167e-05, "loss": 0.0181, "step": 32820 }, { "epoch": 0.47, "learning_rate": 1.9842343186283696e-05, "loss": 0.0249, "step": 32830 }, { "epoch": 0.47, "learning_rate": 1.9842295146545222e-05, "loss": 0.0252, "step": 32840 }, { "epoch": 0.47, "learning_rate": 1.984224710680675e-05, "loss": 0.0181, "step": 32850 }, { "epoch": 0.47, "learning_rate": 1.984219906706828e-05, "loss": 0.0237, "step": 32860 }, { "epoch": 0.47, "learning_rate": 1.9842151027329807e-05, "loss": 0.0233, "step": 32870 }, { "epoch": 0.47, "learning_rate": 1.9842102987591336e-05, "loss": 0.022, "step": 32880 }, { "epoch": 0.47, "learning_rate": 1.9842054947852865e-05, "loss": 0.0235, "step": 32890 }, { "epoch": 0.47, "learning_rate": 1.9842006908114394e-05, "loss": 0.0204, "step": 32900 }, { "epoch": 0.47, "learning_rate": 1.984195886837592e-05, "loss": 0.0234, "step": 32910 }, { "epoch": 0.47, "learning_rate": 1.984191082863745e-05, "loss": 0.0265, "step": 32920 }, { "epoch": 0.47, "learning_rate": 1.984186278889898e-05, "loss": 0.0179, "step": 32930 }, { "epoch": 0.47, "learning_rate": 1.9841814749160505e-05, "loss": 0.0259, "step": 32940 }, { "epoch": 0.47, "learning_rate": 1.9841766709422034e-05, "loss": 0.0207, "step": 32950 }, { "epoch": 0.48, "learning_rate": 1.9841718669683563e-05, "loss": 0.0216, "step": 32960 }, { "epoch": 0.48, "learning_rate": 1.9841670629945092e-05, "loss": 0.0201, "step": 32970 }, { "epoch": 0.48, "learning_rate": 1.9841627394180467e-05, "loss": 0.0207, "step": 32980 }, { "epoch": 0.48, "learning_rate": 1.9841579354441996e-05, "loss": 0.0177, "step": 32990 }, { "epoch": 0.48, "learning_rate": 1.9841531314703522e-05, "loss": 0.0262, "step": 33000 }, { "epoch": 0.48, "learning_rate": 1.984148327496505e-05, "loss": 0.0189, "step": 33010 }, { "epoch": 0.48, "learning_rate": 1.984143523522658e-05, "loss": 0.02, "step": 33020 }, { "epoch": 0.48, "learning_rate": 1.984138719548811e-05, "loss": 0.0276, "step": 33030 }, { "epoch": 0.48, "learning_rate": 1.9841339155749636e-05, "loss": 0.0192, "step": 33040 }, { "epoch": 0.48, "learning_rate": 1.9841291116011165e-05, "loss": 0.0177, "step": 33050 }, { "epoch": 0.48, "learning_rate": 1.9841243076272694e-05, "loss": 0.0209, "step": 33060 }, { "epoch": 0.48, "learning_rate": 1.9841195036534224e-05, "loss": 0.0217, "step": 33070 }, { "epoch": 0.48, "learning_rate": 1.984114699679575e-05, "loss": 0.0208, "step": 33080 }, { "epoch": 0.48, "learning_rate": 1.984109895705728e-05, "loss": 0.0183, "step": 33090 }, { "epoch": 0.48, "learning_rate": 1.9841050917318808e-05, "loss": 0.0259, "step": 33100 }, { "epoch": 0.48, "learning_rate": 1.9841002877580334e-05, "loss": 0.0216, "step": 33110 }, { "epoch": 0.48, "learning_rate": 1.9840954837841863e-05, "loss": 0.0212, "step": 33120 }, { "epoch": 0.48, "learning_rate": 1.9840906798103393e-05, "loss": 0.0177, "step": 33130 }, { "epoch": 0.48, "learning_rate": 1.9840858758364922e-05, "loss": 0.0221, "step": 33140 }, { "epoch": 0.48, "learning_rate": 1.9840810718626448e-05, "loss": 0.0242, "step": 33150 }, { "epoch": 0.48, "learning_rate": 1.9840762678887977e-05, "loss": 0.0219, "step": 33160 }, { "epoch": 0.48, "learning_rate": 1.9840714639149506e-05, "loss": 0.0226, "step": 33170 }, { "epoch": 0.48, "learning_rate": 1.9840666599411032e-05, "loss": 0.0223, "step": 33180 }, { "epoch": 0.48, "learning_rate": 1.984061855967256e-05, "loss": 0.0219, "step": 33190 }, { "epoch": 0.48, "learning_rate": 1.984057051993409e-05, "loss": 0.0247, "step": 33200 }, { "epoch": 0.48, "learning_rate": 1.984052248019562e-05, "loss": 0.0188, "step": 33210 }, { "epoch": 0.48, "learning_rate": 1.9840474440457146e-05, "loss": 0.0263, "step": 33220 }, { "epoch": 0.48, "learning_rate": 1.9840426400718675e-05, "loss": 0.0231, "step": 33230 }, { "epoch": 0.48, "learning_rate": 1.9840378360980204e-05, "loss": 0.0262, "step": 33240 }, { "epoch": 0.48, "learning_rate": 1.984033032124173e-05, "loss": 0.0158, "step": 33250 }, { "epoch": 0.48, "learning_rate": 1.984028228150326e-05, "loss": 0.0218, "step": 33260 }, { "epoch": 0.48, "learning_rate": 1.984023424176479e-05, "loss": 0.0228, "step": 33270 }, { "epoch": 0.48, "learning_rate": 1.9840186202026318e-05, "loss": 0.0225, "step": 33280 }, { "epoch": 0.48, "learning_rate": 1.9840138162287844e-05, "loss": 0.02, "step": 33290 }, { "epoch": 0.48, "learning_rate": 1.9840090122549373e-05, "loss": 0.0215, "step": 33300 }, { "epoch": 0.48, "learning_rate": 1.9840042082810903e-05, "loss": 0.0212, "step": 33310 }, { "epoch": 0.48, "learning_rate": 1.9839994043072432e-05, "loss": 0.0241, "step": 33320 }, { "epoch": 0.48, "learning_rate": 1.9839946003333958e-05, "loss": 0.0186, "step": 33330 }, { "epoch": 0.48, "learning_rate": 1.9839897963595487e-05, "loss": 0.0235, "step": 33340 }, { "epoch": 0.48, "learning_rate": 1.9839849923857016e-05, "loss": 0.0166, "step": 33350 }, { "epoch": 0.48, "learning_rate": 1.9839801884118542e-05, "loss": 0.0259, "step": 33360 }, { "epoch": 0.48, "learning_rate": 1.983975384438007e-05, "loss": 0.0246, "step": 33370 }, { "epoch": 0.48, "learning_rate": 1.98397058046416e-05, "loss": 0.0232, "step": 33380 }, { "epoch": 0.48, "learning_rate": 1.983965776490313e-05, "loss": 0.0259, "step": 33390 }, { "epoch": 0.48, "learning_rate": 1.9839609725164656e-05, "loss": 0.024, "step": 33400 }, { "epoch": 0.48, "learning_rate": 1.9839561685426185e-05, "loss": 0.0181, "step": 33410 }, { "epoch": 0.48, "learning_rate": 1.9839513645687714e-05, "loss": 0.0267, "step": 33420 }, { "epoch": 0.48, "learning_rate": 1.983946560594924e-05, "loss": 0.0218, "step": 33430 }, { "epoch": 0.48, "learning_rate": 1.983941756621077e-05, "loss": 0.0257, "step": 33440 }, { "epoch": 0.48, "learning_rate": 1.98393695264723e-05, "loss": 0.0251, "step": 33450 }, { "epoch": 0.48, "learning_rate": 1.9839321486733828e-05, "loss": 0.0238, "step": 33460 }, { "epoch": 0.48, "learning_rate": 1.9839273446995354e-05, "loss": 0.0183, "step": 33470 }, { "epoch": 0.48, "learning_rate": 1.9839225407256883e-05, "loss": 0.0245, "step": 33480 }, { "epoch": 0.48, "learning_rate": 1.9839177367518412e-05, "loss": 0.0239, "step": 33490 }, { "epoch": 0.48, "learning_rate": 1.9839129327779942e-05, "loss": 0.0248, "step": 33500 }, { "epoch": 0.48, "learning_rate": 1.9839081288041468e-05, "loss": 0.0174, "step": 33510 }, { "epoch": 0.48, "learning_rate": 1.9839033248302997e-05, "loss": 0.0276, "step": 33520 }, { "epoch": 0.48, "learning_rate": 1.9838985208564526e-05, "loss": 0.0141, "step": 33530 }, { "epoch": 0.48, "learning_rate": 1.9838937168826052e-05, "loss": 0.0146, "step": 33540 }, { "epoch": 0.48, "learning_rate": 1.983888912908758e-05, "loss": 0.0207, "step": 33550 }, { "epoch": 0.48, "learning_rate": 1.983884108934911e-05, "loss": 0.0207, "step": 33560 }, { "epoch": 0.48, "learning_rate": 1.983879304961064e-05, "loss": 0.0187, "step": 33570 }, { "epoch": 0.48, "learning_rate": 1.9838745009872166e-05, "loss": 0.0211, "step": 33580 }, { "epoch": 0.48, "learning_rate": 1.9838696970133695e-05, "loss": 0.0186, "step": 33590 }, { "epoch": 0.48, "learning_rate": 1.9838648930395224e-05, "loss": 0.0247, "step": 33600 }, { "epoch": 0.48, "learning_rate": 1.9838600890656753e-05, "loss": 0.0221, "step": 33610 }, { "epoch": 0.48, "learning_rate": 1.9838552850918283e-05, "loss": 0.0154, "step": 33620 }, { "epoch": 0.48, "learning_rate": 1.9838504811179812e-05, "loss": 0.0254, "step": 33630 }, { "epoch": 0.48, "learning_rate": 1.9838456771441338e-05, "loss": 0.0227, "step": 33640 }, { "epoch": 0.48, "learning_rate": 1.9838408731702867e-05, "loss": 0.0196, "step": 33650 }, { "epoch": 0.49, "learning_rate": 1.9838360691964396e-05, "loss": 0.0272, "step": 33660 }, { "epoch": 0.49, "learning_rate": 1.9838312652225922e-05, "loss": 0.0226, "step": 33670 }, { "epoch": 0.49, "learning_rate": 1.983826461248745e-05, "loss": 0.0205, "step": 33680 }, { "epoch": 0.49, "learning_rate": 1.983821657274898e-05, "loss": 0.0196, "step": 33690 }, { "epoch": 0.49, "learning_rate": 1.983816853301051e-05, "loss": 0.0259, "step": 33700 }, { "epoch": 0.49, "learning_rate": 1.9838120493272036e-05, "loss": 0.0206, "step": 33710 }, { "epoch": 0.49, "learning_rate": 1.9838072453533565e-05, "loss": 0.0199, "step": 33720 }, { "epoch": 0.49, "learning_rate": 1.9838024413795095e-05, "loss": 0.0228, "step": 33730 }, { "epoch": 0.49, "learning_rate": 1.9837976374056624e-05, "loss": 0.0187, "step": 33740 }, { "epoch": 0.49, "learning_rate": 1.983792833431815e-05, "loss": 0.0187, "step": 33750 }, { "epoch": 0.49, "learning_rate": 1.983788029457968e-05, "loss": 0.0183, "step": 33760 }, { "epoch": 0.49, "learning_rate": 1.9837832254841208e-05, "loss": 0.0186, "step": 33770 }, { "epoch": 0.49, "learning_rate": 1.9837784215102734e-05, "loss": 0.0213, "step": 33780 }, { "epoch": 0.49, "learning_rate": 1.9837736175364263e-05, "loss": 0.0162, "step": 33790 }, { "epoch": 0.49, "learning_rate": 1.9837688135625793e-05, "loss": 0.0194, "step": 33800 }, { "epoch": 0.49, "learning_rate": 1.9837640095887322e-05, "loss": 0.0212, "step": 33810 }, { "epoch": 0.49, "learning_rate": 1.9837592056148848e-05, "loss": 0.0252, "step": 33820 }, { "epoch": 0.49, "learning_rate": 1.9837544016410377e-05, "loss": 0.0226, "step": 33830 }, { "epoch": 0.49, "learning_rate": 1.9837495976671906e-05, "loss": 0.0205, "step": 33840 }, { "epoch": 0.49, "learning_rate": 1.9837447936933432e-05, "loss": 0.0172, "step": 33850 }, { "epoch": 0.49, "learning_rate": 1.983739989719496e-05, "loss": 0.0239, "step": 33860 }, { "epoch": 0.49, "learning_rate": 1.983735185745649e-05, "loss": 0.0229, "step": 33870 }, { "epoch": 0.49, "learning_rate": 1.983730381771802e-05, "loss": 0.0154, "step": 33880 }, { "epoch": 0.49, "learning_rate": 1.9837255777979546e-05, "loss": 0.0215, "step": 33890 }, { "epoch": 0.49, "learning_rate": 1.9837207738241075e-05, "loss": 0.0212, "step": 33900 }, { "epoch": 0.49, "learning_rate": 1.9837159698502604e-05, "loss": 0.0229, "step": 33910 }, { "epoch": 0.49, "learning_rate": 1.9837111658764134e-05, "loss": 0.0242, "step": 33920 }, { "epoch": 0.49, "learning_rate": 1.983706361902566e-05, "loss": 0.0237, "step": 33930 }, { "epoch": 0.49, "learning_rate": 1.983701557928719e-05, "loss": 0.0187, "step": 33940 }, { "epoch": 0.49, "learning_rate": 1.9836967539548718e-05, "loss": 0.0174, "step": 33950 }, { "epoch": 0.49, "learning_rate": 1.9836919499810244e-05, "loss": 0.0242, "step": 33960 }, { "epoch": 0.49, "learning_rate": 1.9836871460071773e-05, "loss": 0.0165, "step": 33970 }, { "epoch": 0.49, "learning_rate": 1.9836823420333303e-05, "loss": 0.0201, "step": 33980 }, { "epoch": 0.49, "learning_rate": 1.9836775380594832e-05, "loss": 0.0204, "step": 33990 }, { "epoch": 0.49, "learning_rate": 1.9836727340856358e-05, "loss": 0.0248, "step": 34000 }, { "epoch": 0.49, "learning_rate": 1.9836679301117887e-05, "loss": 0.0208, "step": 34010 }, { "epoch": 0.49, "learning_rate": 1.9836631261379416e-05, "loss": 0.0226, "step": 34020 }, { "epoch": 0.49, "learning_rate": 1.9836583221640942e-05, "loss": 0.0184, "step": 34030 }, { "epoch": 0.49, "learning_rate": 1.983653518190247e-05, "loss": 0.0212, "step": 34040 }, { "epoch": 0.49, "learning_rate": 1.9836487142164e-05, "loss": 0.0228, "step": 34050 }, { "epoch": 0.49, "learning_rate": 1.983643910242553e-05, "loss": 0.0202, "step": 34060 }, { "epoch": 0.49, "learning_rate": 1.9836391062687056e-05, "loss": 0.0231, "step": 34070 }, { "epoch": 0.49, "learning_rate": 1.9836343022948585e-05, "loss": 0.0178, "step": 34080 }, { "epoch": 0.49, "learning_rate": 1.9836294983210114e-05, "loss": 0.0262, "step": 34090 }, { "epoch": 0.49, "learning_rate": 1.9836246943471644e-05, "loss": 0.0218, "step": 34100 }, { "epoch": 0.49, "learning_rate": 1.983619890373317e-05, "loss": 0.0197, "step": 34110 }, { "epoch": 0.49, "learning_rate": 1.98361508639947e-05, "loss": 0.0212, "step": 34120 }, { "epoch": 0.49, "learning_rate": 1.9836102824256228e-05, "loss": 0.0219, "step": 34130 }, { "epoch": 0.49, "learning_rate": 1.9836054784517754e-05, "loss": 0.0211, "step": 34140 }, { "epoch": 0.49, "learning_rate": 1.9836006744779283e-05, "loss": 0.0239, "step": 34150 }, { "epoch": 0.49, "learning_rate": 1.9835958705040813e-05, "loss": 0.0237, "step": 34160 }, { "epoch": 0.49, "learning_rate": 1.9835910665302342e-05, "loss": 0.0231, "step": 34170 }, { "epoch": 0.49, "learning_rate": 1.9835862625563868e-05, "loss": 0.0225, "step": 34180 }, { "epoch": 0.49, "learning_rate": 1.9835814585825397e-05, "loss": 0.0176, "step": 34190 }, { "epoch": 0.49, "learning_rate": 1.9835766546086926e-05, "loss": 0.0157, "step": 34200 }, { "epoch": 0.49, "learning_rate": 1.9835718506348452e-05, "loss": 0.024, "step": 34210 }, { "epoch": 0.49, "learning_rate": 1.983567046660998e-05, "loss": 0.0263, "step": 34220 }, { "epoch": 0.49, "learning_rate": 1.983562242687151e-05, "loss": 0.0251, "step": 34230 }, { "epoch": 0.49, "learning_rate": 1.983557438713304e-05, "loss": 0.0193, "step": 34240 }, { "epoch": 0.49, "learning_rate": 1.9835526347394566e-05, "loss": 0.0208, "step": 34250 }, { "epoch": 0.49, "learning_rate": 1.9835478307656095e-05, "loss": 0.0246, "step": 34260 }, { "epoch": 0.49, "learning_rate": 1.9835430267917624e-05, "loss": 0.0172, "step": 34270 }, { "epoch": 0.49, "learning_rate": 1.9835382228179154e-05, "loss": 0.0216, "step": 34280 }, { "epoch": 0.49, "learning_rate": 1.983533418844068e-05, "loss": 0.0278, "step": 34290 }, { "epoch": 0.49, "learning_rate": 1.983528614870221e-05, "loss": 0.0261, "step": 34300 }, { "epoch": 0.49, "learning_rate": 1.9835238108963738e-05, "loss": 0.018, "step": 34310 }, { "epoch": 0.49, "learning_rate": 1.9835190069225264e-05, "loss": 0.0245, "step": 34320 }, { "epoch": 0.49, "learning_rate": 1.9835142029486793e-05, "loss": 0.0201, "step": 34330 }, { "epoch": 0.49, "learning_rate": 1.9835093989748322e-05, "loss": 0.0201, "step": 34340 }, { "epoch": 0.5, "learning_rate": 1.9835045950009852e-05, "loss": 0.0209, "step": 34350 }, { "epoch": 0.5, "learning_rate": 1.9834997910271378e-05, "loss": 0.0268, "step": 34360 }, { "epoch": 0.5, "learning_rate": 1.9834949870532907e-05, "loss": 0.0176, "step": 34370 }, { "epoch": 0.5, "learning_rate": 1.9834901830794436e-05, "loss": 0.0174, "step": 34380 }, { "epoch": 0.5, "learning_rate": 1.9834853791055962e-05, "loss": 0.0282, "step": 34390 }, { "epoch": 0.5, "learning_rate": 1.983480575131749e-05, "loss": 0.028, "step": 34400 }, { "epoch": 0.5, "learning_rate": 1.983475771157902e-05, "loss": 0.0199, "step": 34410 }, { "epoch": 0.5, "learning_rate": 1.983470967184055e-05, "loss": 0.0188, "step": 34420 }, { "epoch": 0.5, "learning_rate": 1.9834661632102076e-05, "loss": 0.0187, "step": 34430 }, { "epoch": 0.5, "learning_rate": 1.9834613592363605e-05, "loss": 0.0224, "step": 34440 }, { "epoch": 0.5, "learning_rate": 1.9834565552625134e-05, "loss": 0.0206, "step": 34450 }, { "epoch": 0.5, "learning_rate": 1.9834517512886664e-05, "loss": 0.0191, "step": 34460 }, { "epoch": 0.5, "learning_rate": 1.983446947314819e-05, "loss": 0.0217, "step": 34470 }, { "epoch": 0.5, "learning_rate": 1.983442143340972e-05, "loss": 0.021, "step": 34480 }, { "epoch": 0.5, "learning_rate": 1.9834373393671248e-05, "loss": 0.0239, "step": 34490 }, { "epoch": 0.5, "learning_rate": 1.9834325353932774e-05, "loss": 0.021, "step": 34500 }, { "epoch": 0.5, "learning_rate": 1.9834277314194303e-05, "loss": 0.0235, "step": 34510 }, { "epoch": 0.5, "learning_rate": 1.9834229274455832e-05, "loss": 0.0197, "step": 34520 }, { "epoch": 0.5, "learning_rate": 1.983418123471736e-05, "loss": 0.0216, "step": 34530 }, { "epoch": 0.5, "learning_rate": 1.9834133194978887e-05, "loss": 0.0199, "step": 34540 }, { "epoch": 0.5, "learning_rate": 1.9834085155240417e-05, "loss": 0.0191, "step": 34550 }, { "epoch": 0.5, "learning_rate": 1.9834037115501946e-05, "loss": 0.0156, "step": 34560 }, { "epoch": 0.5, "learning_rate": 1.9833989075763472e-05, "loss": 0.0242, "step": 34570 }, { "epoch": 0.5, "learning_rate": 1.9833941036025e-05, "loss": 0.0173, "step": 34580 }, { "epoch": 0.5, "learning_rate": 1.983389299628653e-05, "loss": 0.0191, "step": 34590 }, { "epoch": 0.5, "learning_rate": 1.983384495654806e-05, "loss": 0.0222, "step": 34600 }, { "epoch": 0.5, "learning_rate": 1.9833796916809586e-05, "loss": 0.0217, "step": 34610 }, { "epoch": 0.5, "learning_rate": 1.9833748877071115e-05, "loss": 0.0182, "step": 34620 }, { "epoch": 0.5, "learning_rate": 1.9833700837332644e-05, "loss": 0.019, "step": 34630 }, { "epoch": 0.5, "learning_rate": 1.9833652797594173e-05, "loss": 0.0163, "step": 34640 }, { "epoch": 0.5, "learning_rate": 1.98336047578557e-05, "loss": 0.0174, "step": 34650 }, { "epoch": 0.5, "learning_rate": 1.983355671811723e-05, "loss": 0.0227, "step": 34660 }, { "epoch": 0.5, "learning_rate": 1.9833508678378758e-05, "loss": 0.0249, "step": 34670 }, { "epoch": 0.5, "learning_rate": 1.9833460638640284e-05, "loss": 0.0162, "step": 34680 }, { "epoch": 0.5, "learning_rate": 1.9833412598901813e-05, "loss": 0.0231, "step": 34690 }, { "epoch": 0.5, "learning_rate": 1.9833364559163342e-05, "loss": 0.0191, "step": 34700 }, { "epoch": 0.5, "learning_rate": 1.983331651942487e-05, "loss": 0.0205, "step": 34710 }, { "epoch": 0.5, "learning_rate": 1.9833268479686397e-05, "loss": 0.0197, "step": 34720 }, { "epoch": 0.5, "learning_rate": 1.9833220439947927e-05, "loss": 0.0213, "step": 34730 }, { "epoch": 0.5, "learning_rate": 1.9833172400209456e-05, "loss": 0.0208, "step": 34740 }, { "epoch": 0.5, "learning_rate": 1.9833124360470982e-05, "loss": 0.0223, "step": 34750 }, { "epoch": 0.5, "learning_rate": 1.983307632073251e-05, "loss": 0.0197, "step": 34760 }, { "epoch": 0.5, "learning_rate": 1.983302828099404e-05, "loss": 0.0233, "step": 34770 }, { "epoch": 0.5, "learning_rate": 1.983298024125557e-05, "loss": 0.0233, "step": 34780 }, { "epoch": 0.5, "learning_rate": 1.9832932201517096e-05, "loss": 0.0168, "step": 34790 }, { "epoch": 0.5, "learning_rate": 1.9832884161778625e-05, "loss": 0.0204, "step": 34800 }, { "epoch": 0.5, "learning_rate": 1.9832836122040154e-05, "loss": 0.0125, "step": 34810 }, { "epoch": 0.5, "learning_rate": 1.983278808230168e-05, "loss": 0.0179, "step": 34820 }, { "epoch": 0.5, "learning_rate": 1.983274004256321e-05, "loss": 0.0256, "step": 34830 }, { "epoch": 0.5, "learning_rate": 1.983269200282474e-05, "loss": 0.024, "step": 34840 }, { "epoch": 0.5, "learning_rate": 1.9832643963086268e-05, "loss": 0.0167, "step": 34850 }, { "epoch": 0.5, "learning_rate": 1.9832595923347794e-05, "loss": 0.0259, "step": 34860 }, { "epoch": 0.5, "learning_rate": 1.9832547883609323e-05, "loss": 0.0199, "step": 34870 }, { "epoch": 0.5, "learning_rate": 1.9832499843870852e-05, "loss": 0.0215, "step": 34880 }, { "epoch": 0.5, "learning_rate": 1.983245180413238e-05, "loss": 0.0252, "step": 34890 }, { "epoch": 0.5, "learning_rate": 1.9832403764393907e-05, "loss": 0.0254, "step": 34900 }, { "epoch": 0.5, "learning_rate": 1.9832355724655437e-05, "loss": 0.0229, "step": 34910 }, { "epoch": 0.5, "learning_rate": 1.9832307684916966e-05, "loss": 0.027, "step": 34920 }, { "epoch": 0.5, "learning_rate": 1.9832259645178492e-05, "loss": 0.0204, "step": 34930 }, { "epoch": 0.5, "learning_rate": 1.983221160544002e-05, "loss": 0.0225, "step": 34940 }, { "epoch": 0.5, "learning_rate": 1.983216356570155e-05, "loss": 0.0177, "step": 34950 }, { "epoch": 0.5, "learning_rate": 1.983211552596308e-05, "loss": 0.0206, "step": 34960 }, { "epoch": 0.5, "learning_rate": 1.9832067486224605e-05, "loss": 0.0219, "step": 34970 }, { "epoch": 0.5, "learning_rate": 1.9832019446486135e-05, "loss": 0.0259, "step": 34980 }, { "epoch": 0.5, "learning_rate": 1.9831971406747664e-05, "loss": 0.0231, "step": 34990 }, { "epoch": 0.5, "learning_rate": 1.983192336700919e-05, "loss": 0.0248, "step": 35000 }, { "epoch": 0.5, "learning_rate": 1.983187532727072e-05, "loss": 0.0261, "step": 35010 }, { "epoch": 0.5, "learning_rate": 1.983182728753225e-05, "loss": 0.028, "step": 35020 }, { "epoch": 0.5, "learning_rate": 1.9831779247793778e-05, "loss": 0.021, "step": 35030 }, { "epoch": 0.5, "learning_rate": 1.9831731208055304e-05, "loss": 0.0224, "step": 35040 }, { "epoch": 0.51, "learning_rate": 1.9831683168316833e-05, "loss": 0.0219, "step": 35050 }, { "epoch": 0.51, "learning_rate": 1.9831635128578362e-05, "loss": 0.0217, "step": 35060 }, { "epoch": 0.51, "learning_rate": 1.983158708883989e-05, "loss": 0.0189, "step": 35070 }, { "epoch": 0.51, "learning_rate": 1.9831539049101417e-05, "loss": 0.0259, "step": 35080 }, { "epoch": 0.51, "learning_rate": 1.9831491009362947e-05, "loss": 0.0184, "step": 35090 }, { "epoch": 0.51, "learning_rate": 1.9831442969624476e-05, "loss": 0.0195, "step": 35100 }, { "epoch": 0.51, "learning_rate": 1.9831394929886e-05, "loss": 0.0215, "step": 35110 }, { "epoch": 0.51, "learning_rate": 1.983134689014753e-05, "loss": 0.017, "step": 35120 }, { "epoch": 0.51, "learning_rate": 1.983129885040906e-05, "loss": 0.0187, "step": 35130 }, { "epoch": 0.51, "learning_rate": 1.983125081067059e-05, "loss": 0.0289, "step": 35140 }, { "epoch": 0.51, "learning_rate": 1.9831202770932115e-05, "loss": 0.0199, "step": 35150 }, { "epoch": 0.51, "learning_rate": 1.9831154731193645e-05, "loss": 0.0192, "step": 35160 }, { "epoch": 0.51, "learning_rate": 1.9831106691455174e-05, "loss": 0.0217, "step": 35170 }, { "epoch": 0.51, "learning_rate": 1.98310586517167e-05, "loss": 0.0236, "step": 35180 }, { "epoch": 0.51, "learning_rate": 1.983101061197823e-05, "loss": 0.0235, "step": 35190 }, { "epoch": 0.51, "learning_rate": 1.983096257223976e-05, "loss": 0.0235, "step": 35200 }, { "epoch": 0.51, "learning_rate": 1.9830914532501288e-05, "loss": 0.0201, "step": 35210 }, { "epoch": 0.51, "learning_rate": 1.9830866492762813e-05, "loss": 0.0218, "step": 35220 }, { "epoch": 0.51, "learning_rate": 1.9830818453024343e-05, "loss": 0.0204, "step": 35230 }, { "epoch": 0.51, "learning_rate": 1.9830770413285872e-05, "loss": 0.0194, "step": 35240 }, { "epoch": 0.51, "learning_rate": 1.98307223735474e-05, "loss": 0.02, "step": 35250 }, { "epoch": 0.51, "learning_rate": 1.9830674333808927e-05, "loss": 0.021, "step": 35260 }, { "epoch": 0.51, "learning_rate": 1.9830626294070456e-05, "loss": 0.0203, "step": 35270 }, { "epoch": 0.51, "learning_rate": 1.9830578254331986e-05, "loss": 0.0196, "step": 35280 }, { "epoch": 0.51, "learning_rate": 1.983053021459351e-05, "loss": 0.019, "step": 35290 }, { "epoch": 0.51, "learning_rate": 1.983048217485504e-05, "loss": 0.0225, "step": 35300 }, { "epoch": 0.51, "learning_rate": 1.983043413511657e-05, "loss": 0.0198, "step": 35310 }, { "epoch": 0.51, "learning_rate": 1.98303860953781e-05, "loss": 0.0205, "step": 35320 }, { "epoch": 0.51, "learning_rate": 1.9830338055639625e-05, "loss": 0.0247, "step": 35330 }, { "epoch": 0.51, "learning_rate": 1.9830290015901155e-05, "loss": 0.0208, "step": 35340 }, { "epoch": 0.51, "learning_rate": 1.9830241976162684e-05, "loss": 0.0161, "step": 35350 }, { "epoch": 0.51, "learning_rate": 1.983019393642421e-05, "loss": 0.019, "step": 35360 }, { "epoch": 0.51, "learning_rate": 1.983014589668574e-05, "loss": 0.0212, "step": 35370 }, { "epoch": 0.51, "learning_rate": 1.9830097856947268e-05, "loss": 0.0268, "step": 35380 }, { "epoch": 0.51, "learning_rate": 1.9830049817208797e-05, "loss": 0.0216, "step": 35390 }, { "epoch": 0.51, "learning_rate": 1.9830001777470323e-05, "loss": 0.0214, "step": 35400 }, { "epoch": 0.51, "learning_rate": 1.9829953737731853e-05, "loss": 0.0224, "step": 35410 }, { "epoch": 0.51, "learning_rate": 1.9829905697993382e-05, "loss": 0.0232, "step": 35420 }, { "epoch": 0.51, "learning_rate": 1.982985765825491e-05, "loss": 0.0158, "step": 35430 }, { "epoch": 0.51, "learning_rate": 1.9829809618516437e-05, "loss": 0.0216, "step": 35440 }, { "epoch": 0.51, "learning_rate": 1.9829761578777966e-05, "loss": 0.0174, "step": 35450 }, { "epoch": 0.51, "learning_rate": 1.9829713539039496e-05, "loss": 0.019, "step": 35460 }, { "epoch": 0.51, "learning_rate": 1.982966549930102e-05, "loss": 0.018, "step": 35470 }, { "epoch": 0.51, "learning_rate": 1.982961745956255e-05, "loss": 0.0167, "step": 35480 }, { "epoch": 0.51, "learning_rate": 1.982956941982408e-05, "loss": 0.0255, "step": 35490 }, { "epoch": 0.51, "learning_rate": 1.982952138008561e-05, "loss": 0.0193, "step": 35500 }, { "epoch": 0.51, "learning_rate": 1.9829473340347135e-05, "loss": 0.0188, "step": 35510 }, { "epoch": 0.51, "learning_rate": 1.9829425300608664e-05, "loss": 0.0233, "step": 35520 }, { "epoch": 0.51, "learning_rate": 1.9829377260870194e-05, "loss": 0.0211, "step": 35530 }, { "epoch": 0.51, "learning_rate": 1.982932922113172e-05, "loss": 0.0263, "step": 35540 }, { "epoch": 0.51, "learning_rate": 1.982928118139325e-05, "loss": 0.0159, "step": 35550 }, { "epoch": 0.51, "learning_rate": 1.9829233141654778e-05, "loss": 0.0193, "step": 35560 }, { "epoch": 0.51, "learning_rate": 1.9829185101916307e-05, "loss": 0.0195, "step": 35570 }, { "epoch": 0.51, "learning_rate": 1.9829137062177833e-05, "loss": 0.0156, "step": 35580 }, { "epoch": 0.51, "learning_rate": 1.9829089022439363e-05, "loss": 0.0214, "step": 35590 }, { "epoch": 0.51, "learning_rate": 1.9829040982700892e-05, "loss": 0.0227, "step": 35600 }, { "epoch": 0.51, "learning_rate": 1.982899294296242e-05, "loss": 0.0176, "step": 35610 }, { "epoch": 0.51, "learning_rate": 1.9828944903223947e-05, "loss": 0.0172, "step": 35620 }, { "epoch": 0.51, "learning_rate": 1.9828896863485476e-05, "loss": 0.0185, "step": 35630 }, { "epoch": 0.51, "learning_rate": 1.9828848823747006e-05, "loss": 0.0204, "step": 35640 }, { "epoch": 0.51, "learning_rate": 1.982880078400853e-05, "loss": 0.0223, "step": 35650 }, { "epoch": 0.51, "learning_rate": 1.982875274427006e-05, "loss": 0.0188, "step": 35660 }, { "epoch": 0.51, "learning_rate": 1.982870470453159e-05, "loss": 0.0158, "step": 35670 }, { "epoch": 0.51, "learning_rate": 1.982865666479312e-05, "loss": 0.0172, "step": 35680 }, { "epoch": 0.51, "learning_rate": 1.9828608625054645e-05, "loss": 0.0197, "step": 35690 }, { "epoch": 0.51, "learning_rate": 1.9828560585316174e-05, "loss": 0.024, "step": 35700 }, { "epoch": 0.51, "learning_rate": 1.9828512545577704e-05, "loss": 0.0242, "step": 35710 }, { "epoch": 0.51, "learning_rate": 1.982846450583923e-05, "loss": 0.0228, "step": 35720 }, { "epoch": 0.51, "learning_rate": 1.982841646610076e-05, "loss": 0.0221, "step": 35730 }, { "epoch": 0.52, "learning_rate": 1.9828368426362288e-05, "loss": 0.019, "step": 35740 }, { "epoch": 0.52, "learning_rate": 1.9828320386623817e-05, "loss": 0.0202, "step": 35750 }, { "epoch": 0.52, "learning_rate": 1.9828272346885343e-05, "loss": 0.0252, "step": 35760 }, { "epoch": 0.52, "learning_rate": 1.9828224307146872e-05, "loss": 0.0196, "step": 35770 }, { "epoch": 0.52, "learning_rate": 1.9828176267408402e-05, "loss": 0.0241, "step": 35780 }, { "epoch": 0.52, "learning_rate": 1.982812822766993e-05, "loss": 0.0269, "step": 35790 }, { "epoch": 0.52, "learning_rate": 1.9828080187931457e-05, "loss": 0.025, "step": 35800 }, { "epoch": 0.52, "learning_rate": 1.9828032148192986e-05, "loss": 0.0208, "step": 35810 }, { "epoch": 0.52, "learning_rate": 1.9827984108454515e-05, "loss": 0.0243, "step": 35820 }, { "epoch": 0.52, "learning_rate": 1.982793606871604e-05, "loss": 0.0174, "step": 35830 }, { "epoch": 0.52, "learning_rate": 1.982788802897757e-05, "loss": 0.0194, "step": 35840 }, { "epoch": 0.52, "learning_rate": 1.98278399892391e-05, "loss": 0.0243, "step": 35850 }, { "epoch": 0.52, "learning_rate": 1.982779194950063e-05, "loss": 0.0261, "step": 35860 }, { "epoch": 0.52, "learning_rate": 1.9827743909762155e-05, "loss": 0.0231, "step": 35870 }, { "epoch": 0.52, "learning_rate": 1.9827695870023684e-05, "loss": 0.0228, "step": 35880 }, { "epoch": 0.52, "learning_rate": 1.9827647830285214e-05, "loss": 0.031, "step": 35890 }, { "epoch": 0.52, "learning_rate": 1.982759979054674e-05, "loss": 0.0237, "step": 35900 }, { "epoch": 0.52, "learning_rate": 1.982755175080827e-05, "loss": 0.0159, "step": 35910 }, { "epoch": 0.52, "learning_rate": 1.9827503711069798e-05, "loss": 0.0198, "step": 35920 }, { "epoch": 0.52, "learning_rate": 1.9827455671331327e-05, "loss": 0.0172, "step": 35930 }, { "epoch": 0.52, "learning_rate": 1.9827407631592853e-05, "loss": 0.0175, "step": 35940 }, { "epoch": 0.52, "learning_rate": 1.9827359591854382e-05, "loss": 0.0209, "step": 35950 }, { "epoch": 0.52, "learning_rate": 1.982731155211591e-05, "loss": 0.0223, "step": 35960 }, { "epoch": 0.52, "learning_rate": 1.982726351237744e-05, "loss": 0.021, "step": 35970 }, { "epoch": 0.52, "learning_rate": 1.9827215472638967e-05, "loss": 0.0172, "step": 35980 }, { "epoch": 0.52, "learning_rate": 1.9827167432900496e-05, "loss": 0.0189, "step": 35990 }, { "epoch": 0.52, "learning_rate": 1.9827119393162025e-05, "loss": 0.0179, "step": 36000 }, { "epoch": 0.52, "learning_rate": 1.982707135342355e-05, "loss": 0.0204, "step": 36010 }, { "epoch": 0.52, "learning_rate": 1.982702331368508e-05, "loss": 0.017, "step": 36020 }, { "epoch": 0.52, "learning_rate": 1.982697527394661e-05, "loss": 0.023, "step": 36030 }, { "epoch": 0.52, "learning_rate": 1.982692723420814e-05, "loss": 0.0225, "step": 36040 }, { "epoch": 0.52, "learning_rate": 1.9826879194469665e-05, "loss": 0.0227, "step": 36050 }, { "epoch": 0.52, "learning_rate": 1.9826831154731194e-05, "loss": 0.0252, "step": 36060 }, { "epoch": 0.52, "learning_rate": 1.9826783114992723e-05, "loss": 0.0177, "step": 36070 }, { "epoch": 0.52, "learning_rate": 1.982673507525425e-05, "loss": 0.0253, "step": 36080 }, { "epoch": 0.52, "learning_rate": 1.982668703551578e-05, "loss": 0.0154, "step": 36090 }, { "epoch": 0.52, "learning_rate": 1.9826638995777308e-05, "loss": 0.0187, "step": 36100 }, { "epoch": 0.52, "learning_rate": 1.9826590956038837e-05, "loss": 0.0149, "step": 36110 }, { "epoch": 0.52, "learning_rate": 1.9826542916300363e-05, "loss": 0.0162, "step": 36120 }, { "epoch": 0.52, "learning_rate": 1.9826494876561892e-05, "loss": 0.0228, "step": 36130 }, { "epoch": 0.52, "learning_rate": 1.982644683682342e-05, "loss": 0.0244, "step": 36140 }, { "epoch": 0.52, "learning_rate": 1.982639879708495e-05, "loss": 0.0208, "step": 36150 }, { "epoch": 0.52, "learning_rate": 1.982635075734648e-05, "loss": 0.0264, "step": 36160 }, { "epoch": 0.52, "learning_rate": 1.982630271760801e-05, "loss": 0.0255, "step": 36170 }, { "epoch": 0.52, "learning_rate": 1.9826254677869535e-05, "loss": 0.0198, "step": 36180 }, { "epoch": 0.52, "learning_rate": 1.9826206638131065e-05, "loss": 0.0185, "step": 36190 }, { "epoch": 0.52, "learning_rate": 1.9826158598392594e-05, "loss": 0.0167, "step": 36200 }, { "epoch": 0.52, "learning_rate": 1.982611055865412e-05, "loss": 0.0161, "step": 36210 }, { "epoch": 0.52, "learning_rate": 1.982606251891565e-05, "loss": 0.019, "step": 36220 }, { "epoch": 0.52, "learning_rate": 1.9826014479177178e-05, "loss": 0.0173, "step": 36230 }, { "epoch": 0.52, "learning_rate": 1.9825966439438707e-05, "loss": 0.0174, "step": 36240 }, { "epoch": 0.52, "learning_rate": 1.9825918399700233e-05, "loss": 0.0209, "step": 36250 }, { "epoch": 0.52, "learning_rate": 1.9825870359961763e-05, "loss": 0.0188, "step": 36260 }, { "epoch": 0.52, "learning_rate": 1.9825822320223292e-05, "loss": 0.0184, "step": 36270 }, { "epoch": 0.52, "learning_rate": 1.982577428048482e-05, "loss": 0.0246, "step": 36280 }, { "epoch": 0.52, "learning_rate": 1.9825726240746347e-05, "loss": 0.0302, "step": 36290 }, { "epoch": 0.52, "learning_rate": 1.9825678201007876e-05, "loss": 0.0224, "step": 36300 }, { "epoch": 0.52, "learning_rate": 1.9825630161269406e-05, "loss": 0.0244, "step": 36310 }, { "epoch": 0.52, "learning_rate": 1.982558212153093e-05, "loss": 0.0218, "step": 36320 }, { "epoch": 0.52, "learning_rate": 1.982553408179246e-05, "loss": 0.0207, "step": 36330 }, { "epoch": 0.52, "learning_rate": 1.982548604205399e-05, "loss": 0.0224, "step": 36340 }, { "epoch": 0.52, "learning_rate": 1.982543800231552e-05, "loss": 0.0169, "step": 36350 }, { "epoch": 0.52, "learning_rate": 1.9825389962577045e-05, "loss": 0.019, "step": 36360 }, { "epoch": 0.52, "learning_rate": 1.9825341922838574e-05, "loss": 0.0219, "step": 36370 }, { "epoch": 0.52, "learning_rate": 1.9825293883100104e-05, "loss": 0.0198, "step": 36380 }, { "epoch": 0.52, "learning_rate": 1.982524584336163e-05, "loss": 0.0174, "step": 36390 }, { "epoch": 0.52, "learning_rate": 1.982519780362316e-05, "loss": 0.025, "step": 36400 }, { "epoch": 0.52, "learning_rate": 1.9825149763884688e-05, "loss": 0.0193, "step": 36410 }, { "epoch": 0.52, "learning_rate": 1.9825101724146217e-05, "loss": 0.0222, "step": 36420 }, { "epoch": 0.53, "learning_rate": 1.9825053684407743e-05, "loss": 0.0181, "step": 36430 }, { "epoch": 0.53, "learning_rate": 1.9825005644669273e-05, "loss": 0.0232, "step": 36440 }, { "epoch": 0.53, "learning_rate": 1.9824957604930802e-05, "loss": 0.0251, "step": 36450 }, { "epoch": 0.53, "learning_rate": 1.982490956519233e-05, "loss": 0.022, "step": 36460 }, { "epoch": 0.53, "learning_rate": 1.9824861525453857e-05, "loss": 0.0182, "step": 36470 }, { "epoch": 0.53, "learning_rate": 1.9824813485715386e-05, "loss": 0.024, "step": 36480 }, { "epoch": 0.53, "learning_rate": 1.9824765445976916e-05, "loss": 0.0202, "step": 36490 }, { "epoch": 0.53, "learning_rate": 1.982471740623844e-05, "loss": 0.0236, "step": 36500 }, { "epoch": 0.53, "learning_rate": 1.982466936649997e-05, "loss": 0.0179, "step": 36510 }, { "epoch": 0.53, "learning_rate": 1.98246213267615e-05, "loss": 0.0197, "step": 36520 }, { "epoch": 0.53, "learning_rate": 1.982457328702303e-05, "loss": 0.0246, "step": 36530 }, { "epoch": 0.53, "learning_rate": 1.9824525247284555e-05, "loss": 0.025, "step": 36540 }, { "epoch": 0.53, "learning_rate": 1.9824477207546084e-05, "loss": 0.0251, "step": 36550 }, { "epoch": 0.53, "learning_rate": 1.9824429167807614e-05, "loss": 0.0181, "step": 36560 }, { "epoch": 0.53, "learning_rate": 1.982438112806914e-05, "loss": 0.0176, "step": 36570 }, { "epoch": 0.53, "learning_rate": 1.982433308833067e-05, "loss": 0.0248, "step": 36580 }, { "epoch": 0.53, "learning_rate": 1.9824285048592198e-05, "loss": 0.0234, "step": 36590 }, { "epoch": 0.53, "learning_rate": 1.9824237008853727e-05, "loss": 0.0215, "step": 36600 }, { "epoch": 0.53, "learning_rate": 1.9824188969115253e-05, "loss": 0.0188, "step": 36610 }, { "epoch": 0.53, "learning_rate": 1.9824140929376782e-05, "loss": 0.0188, "step": 36620 }, { "epoch": 0.53, "learning_rate": 1.9824092889638312e-05, "loss": 0.02, "step": 36630 }, { "epoch": 0.53, "learning_rate": 1.982404484989984e-05, "loss": 0.023, "step": 36640 }, { "epoch": 0.53, "learning_rate": 1.9823996810161367e-05, "loss": 0.0201, "step": 36650 }, { "epoch": 0.53, "learning_rate": 1.9823948770422896e-05, "loss": 0.0177, "step": 36660 }, { "epoch": 0.53, "learning_rate": 1.9823900730684425e-05, "loss": 0.0273, "step": 36670 }, { "epoch": 0.53, "learning_rate": 1.982385269094595e-05, "loss": 0.0204, "step": 36680 }, { "epoch": 0.53, "learning_rate": 1.982380465120748e-05, "loss": 0.0177, "step": 36690 }, { "epoch": 0.53, "learning_rate": 1.982375661146901e-05, "loss": 0.0235, "step": 36700 }, { "epoch": 0.53, "learning_rate": 1.982370857173054e-05, "loss": 0.0213, "step": 36710 }, { "epoch": 0.53, "learning_rate": 1.9823660531992065e-05, "loss": 0.0229, "step": 36720 }, { "epoch": 0.53, "learning_rate": 1.9823612492253594e-05, "loss": 0.0251, "step": 36730 }, { "epoch": 0.53, "learning_rate": 1.9823564452515124e-05, "loss": 0.0238, "step": 36740 }, { "epoch": 0.53, "learning_rate": 1.982351641277665e-05, "loss": 0.0207, "step": 36750 }, { "epoch": 0.53, "learning_rate": 1.982346837303818e-05, "loss": 0.0231, "step": 36760 }, { "epoch": 0.53, "learning_rate": 1.9823420333299708e-05, "loss": 0.0219, "step": 36770 }, { "epoch": 0.53, "learning_rate": 1.9823372293561237e-05, "loss": 0.0154, "step": 36780 }, { "epoch": 0.53, "learning_rate": 1.9823324253822763e-05, "loss": 0.0225, "step": 36790 }, { "epoch": 0.53, "learning_rate": 1.9823276214084292e-05, "loss": 0.0194, "step": 36800 }, { "epoch": 0.53, "learning_rate": 1.982322817434582e-05, "loss": 0.0226, "step": 36810 }, { "epoch": 0.53, "learning_rate": 1.982318013460735e-05, "loss": 0.0235, "step": 36820 }, { "epoch": 0.53, "learning_rate": 1.9823132094868877e-05, "loss": 0.0274, "step": 36830 }, { "epoch": 0.53, "learning_rate": 1.9823084055130406e-05, "loss": 0.0195, "step": 36840 }, { "epoch": 0.53, "learning_rate": 1.9823036015391935e-05, "loss": 0.0189, "step": 36850 }, { "epoch": 0.53, "learning_rate": 1.982298797565346e-05, "loss": 0.0212, "step": 36860 }, { "epoch": 0.53, "learning_rate": 1.982293993591499e-05, "loss": 0.0191, "step": 36870 }, { "epoch": 0.53, "learning_rate": 1.982289189617652e-05, "loss": 0.019, "step": 36880 }, { "epoch": 0.53, "learning_rate": 1.982284385643805e-05, "loss": 0.0249, "step": 36890 }, { "epoch": 0.53, "learning_rate": 1.9822795816699575e-05, "loss": 0.0146, "step": 36900 }, { "epoch": 0.53, "learning_rate": 1.9822747776961104e-05, "loss": 0.0184, "step": 36910 }, { "epoch": 0.53, "learning_rate": 1.9822699737222633e-05, "loss": 0.0204, "step": 36920 }, { "epoch": 0.53, "learning_rate": 1.982265169748416e-05, "loss": 0.0213, "step": 36930 }, { "epoch": 0.53, "learning_rate": 1.982260365774569e-05, "loss": 0.0214, "step": 36940 }, { "epoch": 0.53, "learning_rate": 1.9822555618007218e-05, "loss": 0.0212, "step": 36950 }, { "epoch": 0.53, "learning_rate": 1.9822507578268747e-05, "loss": 0.0207, "step": 36960 }, { "epoch": 0.53, "learning_rate": 1.9822459538530273e-05, "loss": 0.0191, "step": 36970 }, { "epoch": 0.53, "learning_rate": 1.9822411498791802e-05, "loss": 0.0199, "step": 36980 }, { "epoch": 0.53, "learning_rate": 1.982236345905333e-05, "loss": 0.0296, "step": 36990 }, { "epoch": 0.53, "learning_rate": 1.982231541931486e-05, "loss": 0.022, "step": 37000 }, { "epoch": 0.53, "learning_rate": 1.9822267379576387e-05, "loss": 0.0216, "step": 37010 }, { "epoch": 0.53, "learning_rate": 1.9822219339837916e-05, "loss": 0.017, "step": 37020 }, { "epoch": 0.53, "learning_rate": 1.9822171300099445e-05, "loss": 0.0239, "step": 37030 }, { "epoch": 0.53, "learning_rate": 1.982212326036097e-05, "loss": 0.0238, "step": 37040 }, { "epoch": 0.53, "learning_rate": 1.98220752206225e-05, "loss": 0.0197, "step": 37050 }, { "epoch": 0.53, "learning_rate": 1.982202718088403e-05, "loss": 0.0207, "step": 37060 }, { "epoch": 0.53, "learning_rate": 1.982197914114556e-05, "loss": 0.0225, "step": 37070 }, { "epoch": 0.53, "learning_rate": 1.9821931101407085e-05, "loss": 0.0177, "step": 37080 }, { "epoch": 0.53, "learning_rate": 1.9821883061668614e-05, "loss": 0.0194, "step": 37090 }, { "epoch": 0.53, "learning_rate": 1.9821835021930143e-05, "loss": 0.0191, "step": 37100 }, { "epoch": 0.53, "learning_rate": 1.982178698219167e-05, "loss": 0.019, "step": 37110 }, { "epoch": 0.53, "learning_rate": 1.98217389424532e-05, "loss": 0.0234, "step": 37120 }, { "epoch": 0.54, "learning_rate": 1.9821690902714728e-05, "loss": 0.0189, "step": 37130 }, { "epoch": 0.54, "learning_rate": 1.9821642862976257e-05, "loss": 0.0221, "step": 37140 }, { "epoch": 0.54, "learning_rate": 1.9821594823237783e-05, "loss": 0.0173, "step": 37150 }, { "epoch": 0.54, "learning_rate": 1.9821546783499312e-05, "loss": 0.0156, "step": 37160 }, { "epoch": 0.54, "learning_rate": 1.982149874376084e-05, "loss": 0.0174, "step": 37170 }, { "epoch": 0.54, "learning_rate": 1.982145070402237e-05, "loss": 0.0186, "step": 37180 }, { "epoch": 0.54, "learning_rate": 1.9821402664283897e-05, "loss": 0.0187, "step": 37190 }, { "epoch": 0.54, "learning_rate": 1.9821354624545426e-05, "loss": 0.0204, "step": 37200 }, { "epoch": 0.54, "learning_rate": 1.9821306584806955e-05, "loss": 0.022, "step": 37210 }, { "epoch": 0.54, "learning_rate": 1.982125854506848e-05, "loss": 0.0179, "step": 37220 }, { "epoch": 0.54, "learning_rate": 1.982121050533001e-05, "loss": 0.0157, "step": 37230 }, { "epoch": 0.54, "learning_rate": 1.982116246559154e-05, "loss": 0.0167, "step": 37240 }, { "epoch": 0.54, "learning_rate": 1.982111442585307e-05, "loss": 0.0186, "step": 37250 }, { "epoch": 0.54, "learning_rate": 1.9821066386114595e-05, "loss": 0.0214, "step": 37260 }, { "epoch": 0.54, "learning_rate": 1.9821018346376124e-05, "loss": 0.0247, "step": 37270 }, { "epoch": 0.54, "learning_rate": 1.9820970306637653e-05, "loss": 0.0173, "step": 37280 }, { "epoch": 0.54, "learning_rate": 1.982092226689918e-05, "loss": 0.0174, "step": 37290 }, { "epoch": 0.54, "learning_rate": 1.982087422716071e-05, "loss": 0.018, "step": 37300 }, { "epoch": 0.54, "learning_rate": 1.9820826187422238e-05, "loss": 0.02, "step": 37310 }, { "epoch": 0.54, "learning_rate": 1.9820778147683767e-05, "loss": 0.0212, "step": 37320 }, { "epoch": 0.54, "learning_rate": 1.9820730107945293e-05, "loss": 0.0255, "step": 37330 }, { "epoch": 0.54, "learning_rate": 1.9820682068206822e-05, "loss": 0.0189, "step": 37340 }, { "epoch": 0.54, "learning_rate": 1.982063402846835e-05, "loss": 0.0183, "step": 37350 }, { "epoch": 0.54, "learning_rate": 1.982058598872988e-05, "loss": 0.0227, "step": 37360 }, { "epoch": 0.54, "learning_rate": 1.9820537948991407e-05, "loss": 0.0188, "step": 37370 }, { "epoch": 0.54, "learning_rate": 1.9820489909252936e-05, "loss": 0.0222, "step": 37380 }, { "epoch": 0.54, "learning_rate": 1.9820441869514465e-05, "loss": 0.0184, "step": 37390 }, { "epoch": 0.54, "learning_rate": 1.982039382977599e-05, "loss": 0.0197, "step": 37400 }, { "epoch": 0.54, "learning_rate": 1.982034579003752e-05, "loss": 0.0243, "step": 37410 }, { "epoch": 0.54, "learning_rate": 1.982029775029905e-05, "loss": 0.022, "step": 37420 }, { "epoch": 0.54, "learning_rate": 1.982024971056058e-05, "loss": 0.0174, "step": 37430 }, { "epoch": 0.54, "learning_rate": 1.9820201670822105e-05, "loss": 0.0252, "step": 37440 }, { "epoch": 0.54, "learning_rate": 1.9820153631083634e-05, "loss": 0.0236, "step": 37450 }, { "epoch": 0.54, "learning_rate": 1.9820105591345163e-05, "loss": 0.0207, "step": 37460 }, { "epoch": 0.54, "learning_rate": 1.982005755160669e-05, "loss": 0.0257, "step": 37470 }, { "epoch": 0.54, "learning_rate": 1.982000951186822e-05, "loss": 0.0204, "step": 37480 }, { "epoch": 0.54, "learning_rate": 1.9819961472129748e-05, "loss": 0.0237, "step": 37490 }, { "epoch": 0.54, "learning_rate": 1.9819913432391277e-05, "loss": 0.0195, "step": 37500 }, { "epoch": 0.54, "learning_rate": 1.9819865392652803e-05, "loss": 0.0207, "step": 37510 }, { "epoch": 0.54, "learning_rate": 1.9819817352914332e-05, "loss": 0.0198, "step": 37520 }, { "epoch": 0.54, "learning_rate": 1.981976931317586e-05, "loss": 0.0157, "step": 37530 }, { "epoch": 0.54, "learning_rate": 1.981972127343739e-05, "loss": 0.0179, "step": 37540 }, { "epoch": 0.54, "learning_rate": 1.9819673233698916e-05, "loss": 0.0191, "step": 37550 }, { "epoch": 0.54, "learning_rate": 1.9819625193960446e-05, "loss": 0.0167, "step": 37560 }, { "epoch": 0.54, "learning_rate": 1.9819577154221975e-05, "loss": 0.0198, "step": 37570 }, { "epoch": 0.54, "learning_rate": 1.98195291144835e-05, "loss": 0.0153, "step": 37580 }, { "epoch": 0.54, "learning_rate": 1.981948107474503e-05, "loss": 0.0189, "step": 37590 }, { "epoch": 0.54, "learning_rate": 1.981943303500656e-05, "loss": 0.0178, "step": 37600 }, { "epoch": 0.54, "learning_rate": 1.981938499526809e-05, "loss": 0.0244, "step": 37610 }, { "epoch": 0.54, "learning_rate": 1.9819336955529615e-05, "loss": 0.0227, "step": 37620 }, { "epoch": 0.54, "learning_rate": 1.9819288915791144e-05, "loss": 0.0192, "step": 37630 }, { "epoch": 0.54, "learning_rate": 1.9819240876052673e-05, "loss": 0.0216, "step": 37640 }, { "epoch": 0.54, "learning_rate": 1.98191928363142e-05, "loss": 0.0214, "step": 37650 }, { "epoch": 0.54, "learning_rate": 1.9819144796575728e-05, "loss": 0.0148, "step": 37660 }, { "epoch": 0.54, "learning_rate": 1.9819096756837258e-05, "loss": 0.026, "step": 37670 }, { "epoch": 0.54, "learning_rate": 1.9819048717098787e-05, "loss": 0.0238, "step": 37680 }, { "epoch": 0.54, "learning_rate": 1.9819000677360313e-05, "loss": 0.0233, "step": 37690 }, { "epoch": 0.54, "learning_rate": 1.9818952637621842e-05, "loss": 0.0292, "step": 37700 }, { "epoch": 0.54, "learning_rate": 1.981890459788337e-05, "loss": 0.024, "step": 37710 }, { "epoch": 0.54, "learning_rate": 1.98188565581449e-05, "loss": 0.0156, "step": 37720 }, { "epoch": 0.54, "learning_rate": 1.9818808518406426e-05, "loss": 0.0188, "step": 37730 }, { "epoch": 0.54, "learning_rate": 1.9818760478667956e-05, "loss": 0.0218, "step": 37740 }, { "epoch": 0.54, "learning_rate": 1.9818712438929485e-05, "loss": 0.0188, "step": 37750 }, { "epoch": 0.54, "learning_rate": 1.981866439919101e-05, "loss": 0.0217, "step": 37760 }, { "epoch": 0.54, "learning_rate": 1.981861635945254e-05, "loss": 0.0186, "step": 37770 }, { "epoch": 0.54, "learning_rate": 1.981856831971407e-05, "loss": 0.0179, "step": 37780 }, { "epoch": 0.54, "learning_rate": 1.98185202799756e-05, "loss": 0.0215, "step": 37790 }, { "epoch": 0.54, "learning_rate": 1.9818472240237125e-05, "loss": 0.0264, "step": 37800 }, { "epoch": 0.54, "learning_rate": 1.9818424200498654e-05, "loss": 0.0259, "step": 37810 }, { "epoch": 0.55, "learning_rate": 1.9818376160760183e-05, "loss": 0.021, "step": 37820 }, { "epoch": 0.55, "learning_rate": 1.981832812102171e-05, "loss": 0.0221, "step": 37830 }, { "epoch": 0.55, "learning_rate": 1.9818280081283238e-05, "loss": 0.0207, "step": 37840 }, { "epoch": 0.55, "learning_rate": 1.9818232041544767e-05, "loss": 0.0187, "step": 37850 }, { "epoch": 0.55, "learning_rate": 1.9818184001806297e-05, "loss": 0.0178, "step": 37860 }, { "epoch": 0.55, "learning_rate": 1.9818135962067823e-05, "loss": 0.0228, "step": 37870 }, { "epoch": 0.55, "learning_rate": 1.9818087922329352e-05, "loss": 0.0137, "step": 37880 }, { "epoch": 0.55, "learning_rate": 1.981803988259088e-05, "loss": 0.0199, "step": 37890 }, { "epoch": 0.55, "learning_rate": 1.981799184285241e-05, "loss": 0.0197, "step": 37900 }, { "epoch": 0.55, "learning_rate": 1.9817943803113936e-05, "loss": 0.0244, "step": 37910 }, { "epoch": 0.55, "learning_rate": 1.9817895763375466e-05, "loss": 0.0222, "step": 37920 }, { "epoch": 0.55, "learning_rate": 1.9817847723636995e-05, "loss": 0.0183, "step": 37930 }, { "epoch": 0.55, "learning_rate": 1.981779968389852e-05, "loss": 0.0212, "step": 37940 }, { "epoch": 0.55, "learning_rate": 1.981775164416005e-05, "loss": 0.0247, "step": 37950 }, { "epoch": 0.55, "learning_rate": 1.981770360442158e-05, "loss": 0.0203, "step": 37960 }, { "epoch": 0.55, "learning_rate": 1.981765556468311e-05, "loss": 0.0224, "step": 37970 }, { "epoch": 0.55, "learning_rate": 1.9817607524944634e-05, "loss": 0.019, "step": 37980 }, { "epoch": 0.55, "learning_rate": 1.9817559485206164e-05, "loss": 0.0188, "step": 37990 }, { "epoch": 0.55, "learning_rate": 1.9817511445467693e-05, "loss": 0.02, "step": 38000 }, { "epoch": 0.55, "learning_rate": 1.981746340572922e-05, "loss": 0.0202, "step": 38010 }, { "epoch": 0.55, "learning_rate": 1.9817415365990748e-05, "loss": 0.0191, "step": 38020 }, { "epoch": 0.55, "learning_rate": 1.9817367326252277e-05, "loss": 0.0238, "step": 38030 }, { "epoch": 0.55, "learning_rate": 1.9817319286513807e-05, "loss": 0.0195, "step": 38040 }, { "epoch": 0.55, "learning_rate": 1.9817271246775333e-05, "loss": 0.0172, "step": 38050 }, { "epoch": 0.55, "learning_rate": 1.9817223207036862e-05, "loss": 0.0241, "step": 38060 }, { "epoch": 0.55, "learning_rate": 1.981717516729839e-05, "loss": 0.0213, "step": 38070 }, { "epoch": 0.55, "learning_rate": 1.9817127127559917e-05, "loss": 0.0187, "step": 38080 }, { "epoch": 0.55, "learning_rate": 1.9817079087821446e-05, "loss": 0.0189, "step": 38090 }, { "epoch": 0.55, "learning_rate": 1.9817031048082975e-05, "loss": 0.017, "step": 38100 }, { "epoch": 0.55, "learning_rate": 1.9816983008344505e-05, "loss": 0.0173, "step": 38110 }, { "epoch": 0.55, "learning_rate": 1.981693496860603e-05, "loss": 0.0233, "step": 38120 }, { "epoch": 0.55, "learning_rate": 1.981688692886756e-05, "loss": 0.0241, "step": 38130 }, { "epoch": 0.55, "learning_rate": 1.981683888912909e-05, "loss": 0.0199, "step": 38140 }, { "epoch": 0.55, "learning_rate": 1.981679084939062e-05, "loss": 0.0192, "step": 38150 }, { "epoch": 0.55, "learning_rate": 1.9816742809652144e-05, "loss": 0.0179, "step": 38160 }, { "epoch": 0.55, "learning_rate": 1.9816694769913674e-05, "loss": 0.0184, "step": 38170 }, { "epoch": 0.55, "learning_rate": 1.9816646730175203e-05, "loss": 0.0198, "step": 38180 }, { "epoch": 0.55, "learning_rate": 1.981659869043673e-05, "loss": 0.0228, "step": 38190 }, { "epoch": 0.55, "learning_rate": 1.9816550650698258e-05, "loss": 0.0223, "step": 38200 }, { "epoch": 0.55, "learning_rate": 1.9816502610959787e-05, "loss": 0.0189, "step": 38210 }, { "epoch": 0.55, "learning_rate": 1.9816454571221317e-05, "loss": 0.0149, "step": 38220 }, { "epoch": 0.55, "learning_rate": 1.9816406531482842e-05, "loss": 0.0193, "step": 38230 }, { "epoch": 0.55, "learning_rate": 1.9816358491744372e-05, "loss": 0.0204, "step": 38240 }, { "epoch": 0.55, "learning_rate": 1.98163104520059e-05, "loss": 0.0177, "step": 38250 }, { "epoch": 0.55, "learning_rate": 1.9816262412267427e-05, "loss": 0.0229, "step": 38260 }, { "epoch": 0.55, "learning_rate": 1.9816214372528956e-05, "loss": 0.0183, "step": 38270 }, { "epoch": 0.55, "learning_rate": 1.9816166332790485e-05, "loss": 0.0155, "step": 38280 }, { "epoch": 0.55, "learning_rate": 1.9816118293052015e-05, "loss": 0.0217, "step": 38290 }, { "epoch": 0.55, "learning_rate": 1.981607025331354e-05, "loss": 0.0256, "step": 38300 }, { "epoch": 0.55, "learning_rate": 1.981602221357507e-05, "loss": 0.0201, "step": 38310 }, { "epoch": 0.55, "learning_rate": 1.98159741738366e-05, "loss": 0.0189, "step": 38320 }, { "epoch": 0.55, "learning_rate": 1.981592613409813e-05, "loss": 0.0215, "step": 38330 }, { "epoch": 0.55, "learning_rate": 1.9815878094359654e-05, "loss": 0.0192, "step": 38340 }, { "epoch": 0.55, "learning_rate": 1.9815830054621184e-05, "loss": 0.0171, "step": 38350 }, { "epoch": 0.55, "learning_rate": 1.9815782014882713e-05, "loss": 0.0227, "step": 38360 }, { "epoch": 0.55, "learning_rate": 1.981573397514424e-05, "loss": 0.0199, "step": 38370 }, { "epoch": 0.55, "learning_rate": 1.9815685935405768e-05, "loss": 0.0201, "step": 38380 }, { "epoch": 0.55, "learning_rate": 1.9815637895667297e-05, "loss": 0.0185, "step": 38390 }, { "epoch": 0.55, "learning_rate": 1.9815589855928826e-05, "loss": 0.0174, "step": 38400 }, { "epoch": 0.55, "learning_rate": 1.9815541816190352e-05, "loss": 0.0194, "step": 38410 }, { "epoch": 0.55, "learning_rate": 1.981549377645188e-05, "loss": 0.0214, "step": 38420 }, { "epoch": 0.55, "learning_rate": 1.981544573671341e-05, "loss": 0.0218, "step": 38430 }, { "epoch": 0.55, "learning_rate": 1.9815397696974937e-05, "loss": 0.0272, "step": 38440 }, { "epoch": 0.55, "learning_rate": 1.9815349657236466e-05, "loss": 0.0235, "step": 38450 }, { "epoch": 0.55, "learning_rate": 1.9815301617497995e-05, "loss": 0.0225, "step": 38460 }, { "epoch": 0.55, "learning_rate": 1.9815253577759525e-05, "loss": 0.0167, "step": 38470 }, { "epoch": 0.55, "learning_rate": 1.981520553802105e-05, "loss": 0.0226, "step": 38480 }, { "epoch": 0.55, "learning_rate": 1.981515749828258e-05, "loss": 0.0216, "step": 38490 }, { "epoch": 0.55, "learning_rate": 1.981510945854411e-05, "loss": 0.0204, "step": 38500 }, { "epoch": 0.56, "learning_rate": 1.9815061418805638e-05, "loss": 0.0152, "step": 38510 }, { "epoch": 0.56, "learning_rate": 1.9815013379067164e-05, "loss": 0.0178, "step": 38520 }, { "epoch": 0.56, "learning_rate": 1.9814965339328693e-05, "loss": 0.0208, "step": 38530 }, { "epoch": 0.56, "learning_rate": 1.9814917299590223e-05, "loss": 0.0214, "step": 38540 }, { "epoch": 0.56, "learning_rate": 1.981486925985175e-05, "loss": 0.0234, "step": 38550 }, { "epoch": 0.56, "learning_rate": 1.9814821220113278e-05, "loss": 0.0188, "step": 38560 }, { "epoch": 0.56, "learning_rate": 1.9814773180374807e-05, "loss": 0.0205, "step": 38570 }, { "epoch": 0.56, "learning_rate": 1.9814725140636336e-05, "loss": 0.0175, "step": 38580 }, { "epoch": 0.56, "learning_rate": 1.9814677100897862e-05, "loss": 0.0232, "step": 38590 }, { "epoch": 0.56, "learning_rate": 1.981462906115939e-05, "loss": 0.02, "step": 38600 }, { "epoch": 0.56, "learning_rate": 1.981458102142092e-05, "loss": 0.0162, "step": 38610 }, { "epoch": 0.56, "learning_rate": 1.9814532981682447e-05, "loss": 0.0179, "step": 38620 }, { "epoch": 0.56, "learning_rate": 1.9814484941943976e-05, "loss": 0.0209, "step": 38630 }, { "epoch": 0.56, "learning_rate": 1.9814436902205505e-05, "loss": 0.0218, "step": 38640 }, { "epoch": 0.56, "learning_rate": 1.9814388862467035e-05, "loss": 0.022, "step": 38650 }, { "epoch": 0.56, "learning_rate": 1.981434082272856e-05, "loss": 0.0211, "step": 38660 }, { "epoch": 0.56, "learning_rate": 1.981429278299009e-05, "loss": 0.0214, "step": 38670 }, { "epoch": 0.56, "learning_rate": 1.981424474325162e-05, "loss": 0.0193, "step": 38680 }, { "epoch": 0.56, "learning_rate": 1.9814196703513148e-05, "loss": 0.0194, "step": 38690 }, { "epoch": 0.56, "learning_rate": 1.9814148663774674e-05, "loss": 0.0232, "step": 38700 }, { "epoch": 0.56, "learning_rate": 1.9814100624036203e-05, "loss": 0.0252, "step": 38710 }, { "epoch": 0.56, "learning_rate": 1.9814052584297733e-05, "loss": 0.0225, "step": 38720 }, { "epoch": 0.56, "learning_rate": 1.9814004544559262e-05, "loss": 0.0215, "step": 38730 }, { "epoch": 0.56, "learning_rate": 1.981395650482079e-05, "loss": 0.0204, "step": 38740 }, { "epoch": 0.56, "learning_rate": 1.981390846508232e-05, "loss": 0.0216, "step": 38750 }, { "epoch": 0.56, "learning_rate": 1.9813860425343846e-05, "loss": 0.0197, "step": 38760 }, { "epoch": 0.56, "learning_rate": 1.9813812385605376e-05, "loss": 0.0227, "step": 38770 }, { "epoch": 0.56, "learning_rate": 1.9813764345866905e-05, "loss": 0.022, "step": 38780 }, { "epoch": 0.56, "learning_rate": 1.981371630612843e-05, "loss": 0.0203, "step": 38790 }, { "epoch": 0.56, "learning_rate": 1.981366826638996e-05, "loss": 0.0199, "step": 38800 }, { "epoch": 0.56, "learning_rate": 1.981362022665149e-05, "loss": 0.0168, "step": 38810 }, { "epoch": 0.56, "learning_rate": 1.981357218691302e-05, "loss": 0.024, "step": 38820 }, { "epoch": 0.56, "learning_rate": 1.9813524147174544e-05, "loss": 0.0196, "step": 38830 }, { "epoch": 0.56, "learning_rate": 1.9813476107436074e-05, "loss": 0.0183, "step": 38840 }, { "epoch": 0.56, "learning_rate": 1.9813428067697603e-05, "loss": 0.023, "step": 38850 }, { "epoch": 0.56, "learning_rate": 1.981338002795913e-05, "loss": 0.0183, "step": 38860 }, { "epoch": 0.56, "learning_rate": 1.9813331988220658e-05, "loss": 0.0179, "step": 38870 }, { "epoch": 0.56, "learning_rate": 1.9813283948482187e-05, "loss": 0.0209, "step": 38880 }, { "epoch": 0.56, "learning_rate": 1.9813235908743717e-05, "loss": 0.0198, "step": 38890 }, { "epoch": 0.56, "learning_rate": 1.9813187869005243e-05, "loss": 0.0194, "step": 38900 }, { "epoch": 0.56, "learning_rate": 1.9813139829266772e-05, "loss": 0.02, "step": 38910 }, { "epoch": 0.56, "learning_rate": 1.98130917895283e-05, "loss": 0.0219, "step": 38920 }, { "epoch": 0.56, "learning_rate": 1.981304374978983e-05, "loss": 0.0182, "step": 38930 }, { "epoch": 0.56, "learning_rate": 1.9812995710051356e-05, "loss": 0.025, "step": 38940 }, { "epoch": 0.56, "learning_rate": 1.9812947670312885e-05, "loss": 0.0225, "step": 38950 }, { "epoch": 0.56, "learning_rate": 1.9812899630574415e-05, "loss": 0.0294, "step": 38960 }, { "epoch": 0.56, "learning_rate": 1.981285159083594e-05, "loss": 0.0241, "step": 38970 }, { "epoch": 0.56, "learning_rate": 1.981280355109747e-05, "loss": 0.0213, "step": 38980 }, { "epoch": 0.56, "learning_rate": 1.9812755511359e-05, "loss": 0.0186, "step": 38990 }, { "epoch": 0.56, "learning_rate": 1.981270747162053e-05, "loss": 0.0308, "step": 39000 }, { "epoch": 0.56, "learning_rate": 1.9812659431882054e-05, "loss": 0.0158, "step": 39010 }, { "epoch": 0.56, "learning_rate": 1.9812611392143584e-05, "loss": 0.0215, "step": 39020 }, { "epoch": 0.56, "learning_rate": 1.9812563352405113e-05, "loss": 0.0193, "step": 39030 }, { "epoch": 0.56, "learning_rate": 1.981251531266664e-05, "loss": 0.0152, "step": 39040 }, { "epoch": 0.56, "learning_rate": 1.9812467272928168e-05, "loss": 0.0188, "step": 39050 }, { "epoch": 0.56, "learning_rate": 1.9812419233189697e-05, "loss": 0.017, "step": 39060 }, { "epoch": 0.56, "learning_rate": 1.9812371193451227e-05, "loss": 0.0225, "step": 39070 }, { "epoch": 0.56, "learning_rate": 1.9812323153712752e-05, "loss": 0.0282, "step": 39080 }, { "epoch": 0.56, "learning_rate": 1.9812275113974282e-05, "loss": 0.0187, "step": 39090 }, { "epoch": 0.56, "learning_rate": 1.981222707423581e-05, "loss": 0.0209, "step": 39100 }, { "epoch": 0.56, "learning_rate": 1.981217903449734e-05, "loss": 0.0202, "step": 39110 }, { "epoch": 0.56, "learning_rate": 1.9812130994758866e-05, "loss": 0.0163, "step": 39120 }, { "epoch": 0.56, "learning_rate": 1.9812082955020395e-05, "loss": 0.0165, "step": 39130 }, { "epoch": 0.56, "learning_rate": 1.9812034915281925e-05, "loss": 0.0196, "step": 39140 }, { "epoch": 0.56, "learning_rate": 1.981198687554345e-05, "loss": 0.0177, "step": 39150 }, { "epoch": 0.56, "learning_rate": 1.981193883580498e-05, "loss": 0.0231, "step": 39160 }, { "epoch": 0.56, "learning_rate": 1.981189079606651e-05, "loss": 0.0163, "step": 39170 }, { "epoch": 0.56, "learning_rate": 1.981184275632804e-05, "loss": 0.0166, "step": 39180 }, { "epoch": 0.56, "learning_rate": 1.9811794716589564e-05, "loss": 0.0214, "step": 39190 }, { "epoch": 0.56, "learning_rate": 1.9811746676851094e-05, "loss": 0.0174, "step": 39200 }, { "epoch": 0.57, "learning_rate": 1.9811698637112623e-05, "loss": 0.0206, "step": 39210 }, { "epoch": 0.57, "learning_rate": 1.981165059737415e-05, "loss": 0.0175, "step": 39220 }, { "epoch": 0.57, "learning_rate": 1.9811602557635678e-05, "loss": 0.0216, "step": 39230 }, { "epoch": 0.57, "learning_rate": 1.9811554517897207e-05, "loss": 0.0192, "step": 39240 }, { "epoch": 0.57, "learning_rate": 1.9811506478158736e-05, "loss": 0.0298, "step": 39250 }, { "epoch": 0.57, "learning_rate": 1.9811458438420262e-05, "loss": 0.017, "step": 39260 }, { "epoch": 0.57, "learning_rate": 1.981141039868179e-05, "loss": 0.0197, "step": 39270 }, { "epoch": 0.57, "learning_rate": 1.981136235894332e-05, "loss": 0.0274, "step": 39280 }, { "epoch": 0.57, "learning_rate": 1.981131431920485e-05, "loss": 0.0242, "step": 39290 }, { "epoch": 0.57, "learning_rate": 1.9811266279466376e-05, "loss": 0.0236, "step": 39300 }, { "epoch": 0.57, "learning_rate": 1.9811218239727905e-05, "loss": 0.0305, "step": 39310 }, { "epoch": 0.57, "learning_rate": 1.9811170199989435e-05, "loss": 0.0296, "step": 39320 }, { "epoch": 0.57, "learning_rate": 1.981112696422481e-05, "loss": 0.0165, "step": 39330 }, { "epoch": 0.57, "learning_rate": 1.981107892448634e-05, "loss": 0.0278, "step": 39340 }, { "epoch": 0.57, "learning_rate": 1.9811030884747864e-05, "loss": 0.0188, "step": 39350 }, { "epoch": 0.57, "learning_rate": 1.9810982845009394e-05, "loss": 0.0155, "step": 39360 }, { "epoch": 0.57, "learning_rate": 1.9810934805270923e-05, "loss": 0.0219, "step": 39370 }, { "epoch": 0.57, "learning_rate": 1.9810886765532452e-05, "loss": 0.0231, "step": 39380 }, { "epoch": 0.57, "learning_rate": 1.9810838725793978e-05, "loss": 0.0199, "step": 39390 }, { "epoch": 0.57, "learning_rate": 1.9810790686055507e-05, "loss": 0.0234, "step": 39400 }, { "epoch": 0.57, "learning_rate": 1.9810742646317037e-05, "loss": 0.0236, "step": 39410 }, { "epoch": 0.57, "learning_rate": 1.9810694606578566e-05, "loss": 0.0167, "step": 39420 }, { "epoch": 0.57, "learning_rate": 1.9810646566840092e-05, "loss": 0.0163, "step": 39430 }, { "epoch": 0.57, "learning_rate": 1.981059852710162e-05, "loss": 0.0221, "step": 39440 }, { "epoch": 0.57, "learning_rate": 1.981055048736315e-05, "loss": 0.0216, "step": 39450 }, { "epoch": 0.57, "learning_rate": 1.9810502447624676e-05, "loss": 0.0143, "step": 39460 }, { "epoch": 0.57, "learning_rate": 1.9810454407886205e-05, "loss": 0.0171, "step": 39470 }, { "epoch": 0.57, "learning_rate": 1.9810406368147735e-05, "loss": 0.0243, "step": 39480 }, { "epoch": 0.57, "learning_rate": 1.9810358328409264e-05, "loss": 0.0201, "step": 39490 }, { "epoch": 0.57, "learning_rate": 1.981031028867079e-05, "loss": 0.0202, "step": 39500 }, { "epoch": 0.57, "learning_rate": 1.981026224893232e-05, "loss": 0.0179, "step": 39510 }, { "epoch": 0.57, "learning_rate": 1.981021420919385e-05, "loss": 0.0158, "step": 39520 }, { "epoch": 0.57, "learning_rate": 1.9810166169455374e-05, "loss": 0.0182, "step": 39530 }, { "epoch": 0.57, "learning_rate": 1.9810118129716904e-05, "loss": 0.015, "step": 39540 }, { "epoch": 0.57, "learning_rate": 1.9810070089978433e-05, "loss": 0.0305, "step": 39550 }, { "epoch": 0.57, "learning_rate": 1.9810022050239962e-05, "loss": 0.0301, "step": 39560 }, { "epoch": 0.57, "learning_rate": 1.9809974010501488e-05, "loss": 0.0253, "step": 39570 }, { "epoch": 0.57, "learning_rate": 1.9809925970763017e-05, "loss": 0.017, "step": 39580 }, { "epoch": 0.57, "learning_rate": 1.9809877931024547e-05, "loss": 0.0217, "step": 39590 }, { "epoch": 0.57, "learning_rate": 1.9809829891286076e-05, "loss": 0.0229, "step": 39600 }, { "epoch": 0.57, "learning_rate": 1.98097818515476e-05, "loss": 0.021, "step": 39610 }, { "epoch": 0.57, "learning_rate": 1.980973381180913e-05, "loss": 0.0178, "step": 39620 }, { "epoch": 0.57, "learning_rate": 1.980968577207066e-05, "loss": 0.022, "step": 39630 }, { "epoch": 0.57, "learning_rate": 1.9809637732332186e-05, "loss": 0.0186, "step": 39640 }, { "epoch": 0.57, "learning_rate": 1.9809589692593715e-05, "loss": 0.0176, "step": 39650 }, { "epoch": 0.57, "learning_rate": 1.9809541652855245e-05, "loss": 0.0203, "step": 39660 }, { "epoch": 0.57, "learning_rate": 1.9809493613116774e-05, "loss": 0.0204, "step": 39670 }, { "epoch": 0.57, "learning_rate": 1.98094455733783e-05, "loss": 0.0207, "step": 39680 }, { "epoch": 0.57, "learning_rate": 1.980939753363983e-05, "loss": 0.0227, "step": 39690 }, { "epoch": 0.57, "learning_rate": 1.980934949390136e-05, "loss": 0.0173, "step": 39700 }, { "epoch": 0.57, "learning_rate": 1.9809301454162884e-05, "loss": 0.0196, "step": 39710 }, { "epoch": 0.57, "learning_rate": 1.9809253414424413e-05, "loss": 0.0218, "step": 39720 }, { "epoch": 0.57, "learning_rate": 1.9809205374685943e-05, "loss": 0.0222, "step": 39730 }, { "epoch": 0.57, "learning_rate": 1.9809157334947472e-05, "loss": 0.0151, "step": 39740 }, { "epoch": 0.57, "learning_rate": 1.9809109295208998e-05, "loss": 0.017, "step": 39750 }, { "epoch": 0.57, "learning_rate": 1.9809061255470527e-05, "loss": 0.0257, "step": 39760 }, { "epoch": 0.57, "learning_rate": 1.9809013215732056e-05, "loss": 0.022, "step": 39770 }, { "epoch": 0.57, "learning_rate": 1.9808965175993586e-05, "loss": 0.0208, "step": 39780 }, { "epoch": 0.57, "learning_rate": 1.980891713625511e-05, "loss": 0.0158, "step": 39790 }, { "epoch": 0.57, "learning_rate": 1.980886909651664e-05, "loss": 0.0183, "step": 39800 }, { "epoch": 0.57, "learning_rate": 1.980882105677817e-05, "loss": 0.0176, "step": 39810 }, { "epoch": 0.57, "learning_rate": 1.9808773017039696e-05, "loss": 0.0219, "step": 39820 }, { "epoch": 0.57, "learning_rate": 1.9808724977301225e-05, "loss": 0.0182, "step": 39830 }, { "epoch": 0.57, "learning_rate": 1.9808676937562755e-05, "loss": 0.0162, "step": 39840 }, { "epoch": 0.57, "learning_rate": 1.9808628897824284e-05, "loss": 0.0147, "step": 39850 }, { "epoch": 0.57, "learning_rate": 1.980858085808581e-05, "loss": 0.0172, "step": 39860 }, { "epoch": 0.57, "learning_rate": 1.980853281834734e-05, "loss": 0.0185, "step": 39870 }, { "epoch": 0.57, "learning_rate": 1.9808484778608868e-05, "loss": 0.0219, "step": 39880 }, { "epoch": 0.57, "learning_rate": 1.9808436738870394e-05, "loss": 0.0207, "step": 39890 }, { "epoch": 0.58, "learning_rate": 1.9808388699131923e-05, "loss": 0.0184, "step": 39900 }, { "epoch": 0.58, "learning_rate": 1.9808340659393453e-05, "loss": 0.0241, "step": 39910 }, { "epoch": 0.58, "learning_rate": 1.9808292619654982e-05, "loss": 0.0224, "step": 39920 }, { "epoch": 0.58, "learning_rate": 1.9808244579916508e-05, "loss": 0.0214, "step": 39930 }, { "epoch": 0.58, "learning_rate": 1.9808196540178037e-05, "loss": 0.0235, "step": 39940 }, { "epoch": 0.58, "learning_rate": 1.9808148500439566e-05, "loss": 0.0179, "step": 39950 }, { "epoch": 0.58, "learning_rate": 1.9808100460701096e-05, "loss": 0.0277, "step": 39960 }, { "epoch": 0.58, "learning_rate": 1.980805242096262e-05, "loss": 0.018, "step": 39970 }, { "epoch": 0.58, "learning_rate": 1.980800438122415e-05, "loss": 0.0183, "step": 39980 }, { "epoch": 0.58, "learning_rate": 1.980795634148568e-05, "loss": 0.0211, "step": 39990 }, { "epoch": 0.58, "learning_rate": 1.9807908301747206e-05, "loss": 0.0232, "step": 40000 }, { "epoch": 0.58, "learning_rate": 1.9807860262008735e-05, "loss": 0.0204, "step": 40010 }, { "epoch": 0.58, "learning_rate": 1.9807812222270264e-05, "loss": 0.0208, "step": 40020 }, { "epoch": 0.58, "learning_rate": 1.9807764182531794e-05, "loss": 0.0164, "step": 40030 }, { "epoch": 0.58, "learning_rate": 1.980771614279332e-05, "loss": 0.0234, "step": 40040 }, { "epoch": 0.58, "learning_rate": 1.980766810305485e-05, "loss": 0.0182, "step": 40050 }, { "epoch": 0.58, "learning_rate": 1.9807620063316378e-05, "loss": 0.0205, "step": 40060 }, { "epoch": 0.58, "learning_rate": 1.9807572023577904e-05, "loss": 0.0187, "step": 40070 }, { "epoch": 0.58, "learning_rate": 1.9807523983839433e-05, "loss": 0.0164, "step": 40080 }, { "epoch": 0.58, "learning_rate": 1.9807475944100963e-05, "loss": 0.0232, "step": 40090 }, { "epoch": 0.58, "learning_rate": 1.9807427904362492e-05, "loss": 0.0259, "step": 40100 }, { "epoch": 0.58, "learning_rate": 1.9807379864624018e-05, "loss": 0.0277, "step": 40110 }, { "epoch": 0.58, "learning_rate": 1.9807331824885547e-05, "loss": 0.0223, "step": 40120 }, { "epoch": 0.58, "learning_rate": 1.9807283785147076e-05, "loss": 0.023, "step": 40130 }, { "epoch": 0.58, "learning_rate": 1.9807235745408606e-05, "loss": 0.0232, "step": 40140 }, { "epoch": 0.58, "learning_rate": 1.980718770567013e-05, "loss": 0.022, "step": 40150 }, { "epoch": 0.58, "learning_rate": 1.980713966593166e-05, "loss": 0.0192, "step": 40160 }, { "epoch": 0.58, "learning_rate": 1.980709162619319e-05, "loss": 0.0199, "step": 40170 }, { "epoch": 0.58, "learning_rate": 1.9807043586454716e-05, "loss": 0.0148, "step": 40180 }, { "epoch": 0.58, "learning_rate": 1.9806995546716245e-05, "loss": 0.0216, "step": 40190 }, { "epoch": 0.58, "learning_rate": 1.9806947506977774e-05, "loss": 0.0195, "step": 40200 }, { "epoch": 0.58, "learning_rate": 1.9806899467239304e-05, "loss": 0.0208, "step": 40210 }, { "epoch": 0.58, "learning_rate": 1.980685142750083e-05, "loss": 0.0191, "step": 40220 }, { "epoch": 0.58, "learning_rate": 1.980680338776236e-05, "loss": 0.0239, "step": 40230 }, { "epoch": 0.58, "learning_rate": 1.9806755348023888e-05, "loss": 0.0188, "step": 40240 }, { "epoch": 0.58, "learning_rate": 1.9806707308285414e-05, "loss": 0.015, "step": 40250 }, { "epoch": 0.58, "learning_rate": 1.9806659268546943e-05, "loss": 0.0227, "step": 40260 }, { "epoch": 0.58, "learning_rate": 1.9806611228808473e-05, "loss": 0.0248, "step": 40270 }, { "epoch": 0.58, "learning_rate": 1.9806563189070002e-05, "loss": 0.0246, "step": 40280 }, { "epoch": 0.58, "learning_rate": 1.9806515149331528e-05, "loss": 0.0244, "step": 40290 }, { "epoch": 0.58, "learning_rate": 1.9806467109593057e-05, "loss": 0.0204, "step": 40300 }, { "epoch": 0.58, "learning_rate": 1.9806419069854586e-05, "loss": 0.0217, "step": 40310 }, { "epoch": 0.58, "learning_rate": 1.9806371030116115e-05, "loss": 0.024, "step": 40320 }, { "epoch": 0.58, "learning_rate": 1.980632299037764e-05, "loss": 0.0146, "step": 40330 }, { "epoch": 0.58, "learning_rate": 1.980627495063917e-05, "loss": 0.0213, "step": 40340 }, { "epoch": 0.58, "learning_rate": 1.98062269109007e-05, "loss": 0.0185, "step": 40350 }, { "epoch": 0.58, "learning_rate": 1.9806178871162226e-05, "loss": 0.0261, "step": 40360 }, { "epoch": 0.58, "learning_rate": 1.9806130831423755e-05, "loss": 0.02, "step": 40370 }, { "epoch": 0.58, "learning_rate": 1.9806082791685284e-05, "loss": 0.0198, "step": 40380 }, { "epoch": 0.58, "learning_rate": 1.9806034751946814e-05, "loss": 0.0175, "step": 40390 }, { "epoch": 0.58, "learning_rate": 1.980598671220834e-05, "loss": 0.0208, "step": 40400 }, { "epoch": 0.58, "learning_rate": 1.980593867246987e-05, "loss": 0.024, "step": 40410 }, { "epoch": 0.58, "learning_rate": 1.9805890632731398e-05, "loss": 0.0137, "step": 40420 }, { "epoch": 0.58, "learning_rate": 1.9805847396966773e-05, "loss": 0.0209, "step": 40430 }, { "epoch": 0.58, "learning_rate": 1.9805799357228302e-05, "loss": 0.0219, "step": 40440 }, { "epoch": 0.58, "learning_rate": 1.980575131748983e-05, "loss": 0.0271, "step": 40450 }, { "epoch": 0.58, "learning_rate": 1.9805703277751357e-05, "loss": 0.0203, "step": 40460 }, { "epoch": 0.58, "learning_rate": 1.9805655238012886e-05, "loss": 0.0211, "step": 40470 }, { "epoch": 0.58, "learning_rate": 1.9805607198274416e-05, "loss": 0.022, "step": 40480 }, { "epoch": 0.58, "learning_rate": 1.980555915853594e-05, "loss": 0.0164, "step": 40490 }, { "epoch": 0.58, "learning_rate": 1.980551111879747e-05, "loss": 0.0243, "step": 40500 }, { "epoch": 0.58, "learning_rate": 1.9805463079059e-05, "loss": 0.0205, "step": 40510 }, { "epoch": 0.58, "learning_rate": 1.980541503932053e-05, "loss": 0.0177, "step": 40520 }, { "epoch": 0.58, "learning_rate": 1.9805366999582055e-05, "loss": 0.0178, "step": 40530 }, { "epoch": 0.58, "learning_rate": 1.9805318959843584e-05, "loss": 0.0136, "step": 40540 }, { "epoch": 0.58, "learning_rate": 1.9805270920105114e-05, "loss": 0.0153, "step": 40550 }, { "epoch": 0.58, "learning_rate": 1.9805222880366643e-05, "loss": 0.0214, "step": 40560 }, { "epoch": 0.58, "learning_rate": 1.980517484062817e-05, "loss": 0.0213, "step": 40570 }, { "epoch": 0.58, "learning_rate": 1.9805126800889698e-05, "loss": 0.0207, "step": 40580 }, { "epoch": 0.58, "learning_rate": 1.9805078761151227e-05, "loss": 0.0198, "step": 40590 }, { "epoch": 0.59, "learning_rate": 1.9805030721412753e-05, "loss": 0.0205, "step": 40600 }, { "epoch": 0.59, "learning_rate": 1.9804982681674283e-05, "loss": 0.0138, "step": 40610 }, { "epoch": 0.59, "learning_rate": 1.9804934641935812e-05, "loss": 0.02, "step": 40620 }, { "epoch": 0.59, "learning_rate": 1.980488660219734e-05, "loss": 0.0217, "step": 40630 }, { "epoch": 0.59, "learning_rate": 1.9804838562458867e-05, "loss": 0.0181, "step": 40640 }, { "epoch": 0.59, "learning_rate": 1.9804790522720396e-05, "loss": 0.022, "step": 40650 }, { "epoch": 0.59, "learning_rate": 1.9804742482981926e-05, "loss": 0.0184, "step": 40660 }, { "epoch": 0.59, "learning_rate": 1.980469444324345e-05, "loss": 0.0184, "step": 40670 }, { "epoch": 0.59, "learning_rate": 1.980464640350498e-05, "loss": 0.0247, "step": 40680 }, { "epoch": 0.59, "learning_rate": 1.980459836376651e-05, "loss": 0.0261, "step": 40690 }, { "epoch": 0.59, "learning_rate": 1.980455032402804e-05, "loss": 0.0189, "step": 40700 }, { "epoch": 0.59, "learning_rate": 1.9804502284289565e-05, "loss": 0.0168, "step": 40710 }, { "epoch": 0.59, "learning_rate": 1.9804454244551094e-05, "loss": 0.0253, "step": 40720 }, { "epoch": 0.59, "learning_rate": 1.9804406204812624e-05, "loss": 0.0208, "step": 40730 }, { "epoch": 0.59, "learning_rate": 1.9804358165074153e-05, "loss": 0.0169, "step": 40740 }, { "epoch": 0.59, "learning_rate": 1.980431012533568e-05, "loss": 0.0165, "step": 40750 }, { "epoch": 0.59, "learning_rate": 1.9804262085597208e-05, "loss": 0.0152, "step": 40760 }, { "epoch": 0.59, "learning_rate": 1.9804214045858737e-05, "loss": 0.0202, "step": 40770 }, { "epoch": 0.59, "learning_rate": 1.9804166006120263e-05, "loss": 0.0169, "step": 40780 }, { "epoch": 0.59, "learning_rate": 1.9804117966381792e-05, "loss": 0.0174, "step": 40790 }, { "epoch": 0.59, "learning_rate": 1.9804069926643322e-05, "loss": 0.019, "step": 40800 }, { "epoch": 0.59, "learning_rate": 1.980402188690485e-05, "loss": 0.0179, "step": 40810 }, { "epoch": 0.59, "learning_rate": 1.9803973847166377e-05, "loss": 0.024, "step": 40820 }, { "epoch": 0.59, "learning_rate": 1.9803925807427906e-05, "loss": 0.0202, "step": 40830 }, { "epoch": 0.59, "learning_rate": 1.9803877767689435e-05, "loss": 0.0224, "step": 40840 }, { "epoch": 0.59, "learning_rate": 1.980382972795096e-05, "loss": 0.0183, "step": 40850 }, { "epoch": 0.59, "learning_rate": 1.980378168821249e-05, "loss": 0.0252, "step": 40860 }, { "epoch": 0.59, "learning_rate": 1.980373364847402e-05, "loss": 0.0189, "step": 40870 }, { "epoch": 0.59, "learning_rate": 1.980368560873555e-05, "loss": 0.0163, "step": 40880 }, { "epoch": 0.59, "learning_rate": 1.9803637568997075e-05, "loss": 0.0158, "step": 40890 }, { "epoch": 0.59, "learning_rate": 1.9803589529258604e-05, "loss": 0.0277, "step": 40900 }, { "epoch": 0.59, "learning_rate": 1.9803541489520134e-05, "loss": 0.0187, "step": 40910 }, { "epoch": 0.59, "learning_rate": 1.980349344978166e-05, "loss": 0.018, "step": 40920 }, { "epoch": 0.59, "learning_rate": 1.980344541004319e-05, "loss": 0.0191, "step": 40930 }, { "epoch": 0.59, "learning_rate": 1.9803397370304718e-05, "loss": 0.0214, "step": 40940 }, { "epoch": 0.59, "learning_rate": 1.9803349330566247e-05, "loss": 0.0164, "step": 40950 }, { "epoch": 0.59, "learning_rate": 1.9803301290827773e-05, "loss": 0.0177, "step": 40960 }, { "epoch": 0.59, "learning_rate": 1.9803253251089302e-05, "loss": 0.0187, "step": 40970 }, { "epoch": 0.59, "learning_rate": 1.980320521135083e-05, "loss": 0.0222, "step": 40980 }, { "epoch": 0.59, "learning_rate": 1.980315717161236e-05, "loss": 0.0162, "step": 40990 }, { "epoch": 0.59, "learning_rate": 1.9803109131873887e-05, "loss": 0.0322, "step": 41000 }, { "epoch": 0.59, "learning_rate": 1.9803061092135416e-05, "loss": 0.0177, "step": 41010 }, { "epoch": 0.59, "learning_rate": 1.9803013052396945e-05, "loss": 0.021, "step": 41020 }, { "epoch": 0.59, "learning_rate": 1.980296501265847e-05, "loss": 0.022, "step": 41030 }, { "epoch": 0.59, "learning_rate": 1.980291697292e-05, "loss": 0.0195, "step": 41040 }, { "epoch": 0.59, "learning_rate": 1.980286893318153e-05, "loss": 0.0222, "step": 41050 }, { "epoch": 0.59, "learning_rate": 1.980282089344306e-05, "loss": 0.0182, "step": 41060 }, { "epoch": 0.59, "learning_rate": 1.9802772853704585e-05, "loss": 0.0221, "step": 41070 }, { "epoch": 0.59, "learning_rate": 1.9802724813966114e-05, "loss": 0.0188, "step": 41080 }, { "epoch": 0.59, "learning_rate": 1.9802676774227643e-05, "loss": 0.0185, "step": 41090 }, { "epoch": 0.59, "learning_rate": 1.980262873448917e-05, "loss": 0.0215, "step": 41100 }, { "epoch": 0.59, "learning_rate": 1.98025806947507e-05, "loss": 0.017, "step": 41110 }, { "epoch": 0.59, "learning_rate": 1.9802532655012228e-05, "loss": 0.0157, "step": 41120 }, { "epoch": 0.59, "learning_rate": 1.9802484615273757e-05, "loss": 0.0177, "step": 41130 }, { "epoch": 0.59, "learning_rate": 1.9802436575535283e-05, "loss": 0.0231, "step": 41140 }, { "epoch": 0.59, "learning_rate": 1.9802388535796812e-05, "loss": 0.0132, "step": 41150 }, { "epoch": 0.59, "learning_rate": 1.980234049605834e-05, "loss": 0.0175, "step": 41160 }, { "epoch": 0.59, "learning_rate": 1.980229245631987e-05, "loss": 0.0135, "step": 41170 }, { "epoch": 0.59, "learning_rate": 1.9802244416581397e-05, "loss": 0.0225, "step": 41180 }, { "epoch": 0.59, "learning_rate": 1.9802196376842926e-05, "loss": 0.0165, "step": 41190 }, { "epoch": 0.59, "learning_rate": 1.9802148337104455e-05, "loss": 0.0137, "step": 41200 }, { "epoch": 0.59, "learning_rate": 1.980210029736598e-05, "loss": 0.0264, "step": 41210 }, { "epoch": 0.59, "learning_rate": 1.980205225762751e-05, "loss": 0.0167, "step": 41220 }, { "epoch": 0.59, "learning_rate": 1.980200421788904e-05, "loss": 0.0228, "step": 41230 }, { "epoch": 0.59, "learning_rate": 1.980195617815057e-05, "loss": 0.0184, "step": 41240 }, { "epoch": 0.59, "learning_rate": 1.9801908138412095e-05, "loss": 0.0214, "step": 41250 }, { "epoch": 0.59, "learning_rate": 1.9801860098673624e-05, "loss": 0.0227, "step": 41260 }, { "epoch": 0.59, "learning_rate": 1.9801812058935153e-05, "loss": 0.0219, "step": 41270 }, { "epoch": 0.59, "learning_rate": 1.980176401919668e-05, "loss": 0.0202, "step": 41280 }, { "epoch": 0.6, "learning_rate": 1.980171597945821e-05, "loss": 0.0222, "step": 41290 }, { "epoch": 0.6, "learning_rate": 1.9801667939719738e-05, "loss": 0.0193, "step": 41300 }, { "epoch": 0.6, "learning_rate": 1.9801619899981267e-05, "loss": 0.0248, "step": 41310 }, { "epoch": 0.6, "learning_rate": 1.9801571860242793e-05, "loss": 0.0192, "step": 41320 }, { "epoch": 0.6, "learning_rate": 1.9801523820504322e-05, "loss": 0.0175, "step": 41330 }, { "epoch": 0.6, "learning_rate": 1.980147578076585e-05, "loss": 0.0198, "step": 41340 }, { "epoch": 0.6, "learning_rate": 1.980142774102738e-05, "loss": 0.0141, "step": 41350 }, { "epoch": 0.6, "learning_rate": 1.9801379701288907e-05, "loss": 0.0176, "step": 41360 }, { "epoch": 0.6, "learning_rate": 1.9801331661550436e-05, "loss": 0.0199, "step": 41370 }, { "epoch": 0.6, "learning_rate": 1.9801283621811965e-05, "loss": 0.0231, "step": 41380 }, { "epoch": 0.6, "learning_rate": 1.980123558207349e-05, "loss": 0.0226, "step": 41390 }, { "epoch": 0.6, "learning_rate": 1.980118754233502e-05, "loss": 0.0198, "step": 41400 }, { "epoch": 0.6, "learning_rate": 1.980113950259655e-05, "loss": 0.0221, "step": 41410 }, { "epoch": 0.6, "learning_rate": 1.980109146285808e-05, "loss": 0.017, "step": 41420 }, { "epoch": 0.6, "learning_rate": 1.9801043423119605e-05, "loss": 0.0206, "step": 41430 }, { "epoch": 0.6, "learning_rate": 1.9800995383381134e-05, "loss": 0.0164, "step": 41440 }, { "epoch": 0.6, "learning_rate": 1.9800947343642663e-05, "loss": 0.0205, "step": 41450 }, { "epoch": 0.6, "learning_rate": 1.980089930390419e-05, "loss": 0.0244, "step": 41460 }, { "epoch": 0.6, "learning_rate": 1.980085126416572e-05, "loss": 0.0221, "step": 41470 }, { "epoch": 0.6, "learning_rate": 1.9800803224427248e-05, "loss": 0.0205, "step": 41480 }, { "epoch": 0.6, "learning_rate": 1.9800755184688777e-05, "loss": 0.0176, "step": 41490 }, { "epoch": 0.6, "learning_rate": 1.9800707144950303e-05, "loss": 0.0195, "step": 41500 }, { "epoch": 0.6, "learning_rate": 1.9800659105211832e-05, "loss": 0.0155, "step": 41510 }, { "epoch": 0.6, "learning_rate": 1.980061106547336e-05, "loss": 0.0192, "step": 41520 }, { "epoch": 0.6, "learning_rate": 1.980056302573489e-05, "loss": 0.0217, "step": 41530 }, { "epoch": 0.6, "learning_rate": 1.9800514985996417e-05, "loss": 0.0196, "step": 41540 }, { "epoch": 0.6, "learning_rate": 1.9800466946257946e-05, "loss": 0.0198, "step": 41550 }, { "epoch": 0.6, "learning_rate": 1.9800418906519475e-05, "loss": 0.019, "step": 41560 }, { "epoch": 0.6, "learning_rate": 1.9800370866781e-05, "loss": 0.014, "step": 41570 }, { "epoch": 0.6, "learning_rate": 1.980032282704253e-05, "loss": 0.0201, "step": 41580 }, { "epoch": 0.6, "learning_rate": 1.980027478730406e-05, "loss": 0.0215, "step": 41590 }, { "epoch": 0.6, "learning_rate": 1.980022674756559e-05, "loss": 0.0199, "step": 41600 }, { "epoch": 0.6, "learning_rate": 1.9800178707827115e-05, "loss": 0.0202, "step": 41610 }, { "epoch": 0.6, "learning_rate": 1.9800130668088644e-05, "loss": 0.0175, "step": 41620 }, { "epoch": 0.6, "learning_rate": 1.9800082628350173e-05, "loss": 0.0218, "step": 41630 }, { "epoch": 0.6, "learning_rate": 1.98000345886117e-05, "loss": 0.0208, "step": 41640 }, { "epoch": 0.6, "learning_rate": 1.979998654887323e-05, "loss": 0.0198, "step": 41650 }, { "epoch": 0.6, "learning_rate": 1.9799938509134758e-05, "loss": 0.022, "step": 41660 }, { "epoch": 0.6, "learning_rate": 1.9799890469396287e-05, "loss": 0.0159, "step": 41670 }, { "epoch": 0.6, "learning_rate": 1.9799842429657813e-05, "loss": 0.018, "step": 41680 }, { "epoch": 0.6, "learning_rate": 1.9799794389919342e-05, "loss": 0.0147, "step": 41690 }, { "epoch": 0.6, "learning_rate": 1.979974635018087e-05, "loss": 0.0164, "step": 41700 }, { "epoch": 0.6, "learning_rate": 1.97996983104424e-05, "loss": 0.0189, "step": 41710 }, { "epoch": 0.6, "learning_rate": 1.9799650270703926e-05, "loss": 0.0252, "step": 41720 }, { "epoch": 0.6, "learning_rate": 1.9799602230965456e-05, "loss": 0.0175, "step": 41730 }, { "epoch": 0.6, "learning_rate": 1.9799554191226985e-05, "loss": 0.0156, "step": 41740 }, { "epoch": 0.6, "learning_rate": 1.979950615148851e-05, "loss": 0.0157, "step": 41750 }, { "epoch": 0.6, "learning_rate": 1.979945811175004e-05, "loss": 0.0183, "step": 41760 }, { "epoch": 0.6, "learning_rate": 1.979941007201157e-05, "loss": 0.0198, "step": 41770 }, { "epoch": 0.6, "learning_rate": 1.97993620322731e-05, "loss": 0.0273, "step": 41780 }, { "epoch": 0.6, "learning_rate": 1.9799313992534625e-05, "loss": 0.0211, "step": 41790 }, { "epoch": 0.6, "learning_rate": 1.9799265952796154e-05, "loss": 0.0182, "step": 41800 }, { "epoch": 0.6, "learning_rate": 1.9799217913057683e-05, "loss": 0.0222, "step": 41810 }, { "epoch": 0.6, "learning_rate": 1.979916987331921e-05, "loss": 0.0193, "step": 41820 }, { "epoch": 0.6, "learning_rate": 1.9799121833580738e-05, "loss": 0.0215, "step": 41830 }, { "epoch": 0.6, "learning_rate": 1.9799073793842268e-05, "loss": 0.0143, "step": 41840 }, { "epoch": 0.6, "learning_rate": 1.9799025754103797e-05, "loss": 0.0221, "step": 41850 }, { "epoch": 0.6, "learning_rate": 1.9798977714365323e-05, "loss": 0.0183, "step": 41860 }, { "epoch": 0.6, "learning_rate": 1.9798929674626852e-05, "loss": 0.0196, "step": 41870 }, { "epoch": 0.6, "learning_rate": 1.979888163488838e-05, "loss": 0.0207, "step": 41880 }, { "epoch": 0.6, "learning_rate": 1.979883359514991e-05, "loss": 0.0142, "step": 41890 }, { "epoch": 0.6, "learning_rate": 1.9798785555411436e-05, "loss": 0.0162, "step": 41900 }, { "epoch": 0.6, "learning_rate": 1.9798737515672966e-05, "loss": 0.022, "step": 41910 }, { "epoch": 0.6, "learning_rate": 1.9798689475934495e-05, "loss": 0.0222, "step": 41920 }, { "epoch": 0.6, "learning_rate": 1.979864143619602e-05, "loss": 0.0169, "step": 41930 }, { "epoch": 0.6, "learning_rate": 1.979859339645755e-05, "loss": 0.0152, "step": 41940 }, { "epoch": 0.6, "learning_rate": 1.979854535671908e-05, "loss": 0.0158, "step": 41950 }, { "epoch": 0.6, "learning_rate": 1.979849731698061e-05, "loss": 0.0169, "step": 41960 }, { "epoch": 0.6, "learning_rate": 1.9798449277242134e-05, "loss": 0.0181, "step": 41970 }, { "epoch": 0.61, "learning_rate": 1.9798401237503664e-05, "loss": 0.0166, "step": 41980 }, { "epoch": 0.61, "learning_rate": 1.9798353197765193e-05, "loss": 0.0232, "step": 41990 }, { "epoch": 0.61, "learning_rate": 1.979830515802672e-05, "loss": 0.0196, "step": 42000 }, { "epoch": 0.61, "learning_rate": 1.9798257118288248e-05, "loss": 0.0211, "step": 42010 }, { "epoch": 0.61, "learning_rate": 1.9798209078549777e-05, "loss": 0.0121, "step": 42020 }, { "epoch": 0.61, "learning_rate": 1.9798161038811307e-05, "loss": 0.0212, "step": 42030 }, { "epoch": 0.61, "learning_rate": 1.9798112999072833e-05, "loss": 0.0188, "step": 42040 }, { "epoch": 0.61, "learning_rate": 1.9798064959334362e-05, "loss": 0.0133, "step": 42050 }, { "epoch": 0.61, "learning_rate": 1.979801691959589e-05, "loss": 0.02, "step": 42060 }, { "epoch": 0.61, "learning_rate": 1.979796887985742e-05, "loss": 0.0199, "step": 42070 }, { "epoch": 0.61, "learning_rate": 1.9797920840118946e-05, "loss": 0.0187, "step": 42080 }, { "epoch": 0.61, "learning_rate": 1.9797872800380476e-05, "loss": 0.0167, "step": 42090 }, { "epoch": 0.61, "learning_rate": 1.9797824760642005e-05, "loss": 0.0204, "step": 42100 }, { "epoch": 0.61, "learning_rate": 1.979777672090353e-05, "loss": 0.0247, "step": 42110 }, { "epoch": 0.61, "learning_rate": 1.979772868116506e-05, "loss": 0.0222, "step": 42120 }, { "epoch": 0.61, "learning_rate": 1.979768064142659e-05, "loss": 0.0203, "step": 42130 }, { "epoch": 0.61, "learning_rate": 1.979763260168812e-05, "loss": 0.0229, "step": 42140 }, { "epoch": 0.61, "learning_rate": 1.9797584561949644e-05, "loss": 0.0165, "step": 42150 }, { "epoch": 0.61, "learning_rate": 1.9797536522211174e-05, "loss": 0.0158, "step": 42160 }, { "epoch": 0.61, "learning_rate": 1.9797488482472703e-05, "loss": 0.0186, "step": 42170 }, { "epoch": 0.61, "learning_rate": 1.979744044273423e-05, "loss": 0.0244, "step": 42180 }, { "epoch": 0.61, "learning_rate": 1.9797392402995758e-05, "loss": 0.0191, "step": 42190 }, { "epoch": 0.61, "learning_rate": 1.9797344363257287e-05, "loss": 0.0153, "step": 42200 }, { "epoch": 0.61, "learning_rate": 1.9797296323518817e-05, "loss": 0.0202, "step": 42210 }, { "epoch": 0.61, "learning_rate": 1.9797248283780343e-05, "loss": 0.0163, "step": 42220 }, { "epoch": 0.61, "learning_rate": 1.9797200244041872e-05, "loss": 0.0184, "step": 42230 }, { "epoch": 0.61, "learning_rate": 1.97971522043034e-05, "loss": 0.0336, "step": 42240 }, { "epoch": 0.61, "learning_rate": 1.979710416456493e-05, "loss": 0.0205, "step": 42250 }, { "epoch": 0.61, "learning_rate": 1.9797056124826456e-05, "loss": 0.0174, "step": 42260 }, { "epoch": 0.61, "learning_rate": 1.9797008085087985e-05, "loss": 0.0171, "step": 42270 }, { "epoch": 0.61, "learning_rate": 1.9796960045349515e-05, "loss": 0.0181, "step": 42280 }, { "epoch": 0.61, "learning_rate": 1.979691200561104e-05, "loss": 0.0238, "step": 42290 }, { "epoch": 0.61, "learning_rate": 1.979686396587257e-05, "loss": 0.0173, "step": 42300 }, { "epoch": 0.61, "learning_rate": 1.97968159261341e-05, "loss": 0.015, "step": 42310 }, { "epoch": 0.61, "learning_rate": 1.979676788639563e-05, "loss": 0.0207, "step": 42320 }, { "epoch": 0.61, "learning_rate": 1.9796719846657158e-05, "loss": 0.0169, "step": 42330 }, { "epoch": 0.61, "learning_rate": 1.9796671806918687e-05, "loss": 0.0186, "step": 42340 }, { "epoch": 0.61, "learning_rate": 1.9796623767180213e-05, "loss": 0.0211, "step": 42350 }, { "epoch": 0.61, "learning_rate": 1.9796575727441742e-05, "loss": 0.0201, "step": 42360 }, { "epoch": 0.61, "learning_rate": 1.979652768770327e-05, "loss": 0.0214, "step": 42370 }, { "epoch": 0.61, "learning_rate": 1.97964796479648e-05, "loss": 0.0192, "step": 42380 }, { "epoch": 0.61, "learning_rate": 1.9796431608226327e-05, "loss": 0.0215, "step": 42390 }, { "epoch": 0.61, "learning_rate": 1.9796383568487856e-05, "loss": 0.0271, "step": 42400 }, { "epoch": 0.61, "learning_rate": 1.9796335528749385e-05, "loss": 0.0208, "step": 42410 }, { "epoch": 0.61, "learning_rate": 1.979628748901091e-05, "loss": 0.0161, "step": 42420 }, { "epoch": 0.61, "learning_rate": 1.979623944927244e-05, "loss": 0.0163, "step": 42430 }, { "epoch": 0.61, "learning_rate": 1.979619140953397e-05, "loss": 0.0197, "step": 42440 }, { "epoch": 0.61, "learning_rate": 1.97961433697955e-05, "loss": 0.0158, "step": 42450 }, { "epoch": 0.61, "learning_rate": 1.9796095330057025e-05, "loss": 0.0181, "step": 42460 }, { "epoch": 0.61, "learning_rate": 1.9796047290318554e-05, "loss": 0.0232, "step": 42470 }, { "epoch": 0.61, "learning_rate": 1.9795999250580083e-05, "loss": 0.0229, "step": 42480 }, { "epoch": 0.61, "learning_rate": 1.979595121084161e-05, "loss": 0.0261, "step": 42490 }, { "epoch": 0.61, "learning_rate": 1.979590317110314e-05, "loss": 0.0197, "step": 42500 }, { "epoch": 0.61, "learning_rate": 1.9795855131364668e-05, "loss": 0.0205, "step": 42510 }, { "epoch": 0.61, "learning_rate": 1.9795807091626197e-05, "loss": 0.0168, "step": 42520 }, { "epoch": 0.61, "learning_rate": 1.9795759051887723e-05, "loss": 0.0147, "step": 42530 }, { "epoch": 0.61, "learning_rate": 1.9795711012149252e-05, "loss": 0.0209, "step": 42540 }, { "epoch": 0.61, "learning_rate": 1.979566297241078e-05, "loss": 0.0183, "step": 42550 }, { "epoch": 0.61, "learning_rate": 1.979561493267231e-05, "loss": 0.0184, "step": 42560 }, { "epoch": 0.61, "learning_rate": 1.9795566892933836e-05, "loss": 0.0151, "step": 42570 }, { "epoch": 0.61, "learning_rate": 1.9795518853195366e-05, "loss": 0.0175, "step": 42580 }, { "epoch": 0.61, "learning_rate": 1.9795470813456895e-05, "loss": 0.0208, "step": 42590 }, { "epoch": 0.61, "learning_rate": 1.979542277371842e-05, "loss": 0.0235, "step": 42600 }, { "epoch": 0.61, "learning_rate": 1.979537473397995e-05, "loss": 0.0213, "step": 42610 }, { "epoch": 0.61, "learning_rate": 1.979532669424148e-05, "loss": 0.024, "step": 42620 }, { "epoch": 0.61, "learning_rate": 1.979527865450301e-05, "loss": 0.016, "step": 42630 }, { "epoch": 0.61, "learning_rate": 1.9795230614764535e-05, "loss": 0.0202, "step": 42640 }, { "epoch": 0.61, "learning_rate": 1.9795182575026064e-05, "loss": 0.018, "step": 42650 }, { "epoch": 0.61, "learning_rate": 1.9795134535287593e-05, "loss": 0.019, "step": 42660 }, { "epoch": 0.61, "learning_rate": 1.979508649554912e-05, "loss": 0.0195, "step": 42670 }, { "epoch": 0.62, "learning_rate": 1.9795038455810648e-05, "loss": 0.0217, "step": 42680 }, { "epoch": 0.62, "learning_rate": 1.9794990416072178e-05, "loss": 0.017, "step": 42690 }, { "epoch": 0.62, "learning_rate": 1.9794942376333707e-05, "loss": 0.0171, "step": 42700 }, { "epoch": 0.62, "learning_rate": 1.9794894336595233e-05, "loss": 0.0194, "step": 42710 }, { "epoch": 0.62, "learning_rate": 1.9794846296856762e-05, "loss": 0.0216, "step": 42720 }, { "epoch": 0.62, "learning_rate": 1.979479825711829e-05, "loss": 0.0169, "step": 42730 }, { "epoch": 0.62, "learning_rate": 1.979475021737982e-05, "loss": 0.0194, "step": 42740 }, { "epoch": 0.62, "learning_rate": 1.9794702177641346e-05, "loss": 0.0239, "step": 42750 }, { "epoch": 0.62, "learning_rate": 1.9794654137902876e-05, "loss": 0.0171, "step": 42760 }, { "epoch": 0.62, "learning_rate": 1.9794606098164405e-05, "loss": 0.0183, "step": 42770 }, { "epoch": 0.62, "learning_rate": 1.979455805842593e-05, "loss": 0.0175, "step": 42780 }, { "epoch": 0.62, "learning_rate": 1.979451001868746e-05, "loss": 0.0246, "step": 42790 }, { "epoch": 0.62, "learning_rate": 1.979446197894899e-05, "loss": 0.0185, "step": 42800 }, { "epoch": 0.62, "learning_rate": 1.979441393921052e-05, "loss": 0.0154, "step": 42810 }, { "epoch": 0.62, "learning_rate": 1.9794365899472044e-05, "loss": 0.0165, "step": 42820 }, { "epoch": 0.62, "learning_rate": 1.9794317859733574e-05, "loss": 0.0201, "step": 42830 }, { "epoch": 0.62, "learning_rate": 1.9794269819995103e-05, "loss": 0.026, "step": 42840 }, { "epoch": 0.62, "learning_rate": 1.979422178025663e-05, "loss": 0.0241, "step": 42850 }, { "epoch": 0.62, "learning_rate": 1.9794173740518158e-05, "loss": 0.0144, "step": 42860 }, { "epoch": 0.62, "learning_rate": 1.9794125700779687e-05, "loss": 0.0198, "step": 42870 }, { "epoch": 0.62, "learning_rate": 1.9794077661041217e-05, "loss": 0.0284, "step": 42880 }, { "epoch": 0.62, "learning_rate": 1.9794029621302743e-05, "loss": 0.0155, "step": 42890 }, { "epoch": 0.62, "learning_rate": 1.9793981581564272e-05, "loss": 0.0166, "step": 42900 }, { "epoch": 0.62, "learning_rate": 1.97939335418258e-05, "loss": 0.0206, "step": 42910 }, { "epoch": 0.62, "learning_rate": 1.979388550208733e-05, "loss": 0.019, "step": 42920 }, { "epoch": 0.62, "learning_rate": 1.9793837462348856e-05, "loss": 0.017, "step": 42930 }, { "epoch": 0.62, "learning_rate": 1.9793789422610386e-05, "loss": 0.0191, "step": 42940 }, { "epoch": 0.62, "learning_rate": 1.9793741382871915e-05, "loss": 0.02, "step": 42950 }, { "epoch": 0.62, "learning_rate": 1.979369334313344e-05, "loss": 0.0225, "step": 42960 }, { "epoch": 0.62, "learning_rate": 1.979364530339497e-05, "loss": 0.0187, "step": 42970 }, { "epoch": 0.62, "learning_rate": 1.97935972636565e-05, "loss": 0.018, "step": 42980 }, { "epoch": 0.62, "learning_rate": 1.979354922391803e-05, "loss": 0.019, "step": 42990 }, { "epoch": 0.62, "learning_rate": 1.9793501184179554e-05, "loss": 0.021, "step": 43000 }, { "epoch": 0.62, "learning_rate": 1.9793457948414932e-05, "loss": 0.0167, "step": 43010 }, { "epoch": 0.62, "learning_rate": 1.979340990867646e-05, "loss": 0.018, "step": 43020 }, { "epoch": 0.62, "learning_rate": 1.9793361868937988e-05, "loss": 0.0239, "step": 43030 }, { "epoch": 0.62, "learning_rate": 1.9793313829199517e-05, "loss": 0.0261, "step": 43040 }, { "epoch": 0.62, "learning_rate": 1.9793265789461046e-05, "loss": 0.022, "step": 43050 }, { "epoch": 0.62, "learning_rate": 1.9793217749722572e-05, "loss": 0.0175, "step": 43060 }, { "epoch": 0.62, "learning_rate": 1.97931697099841e-05, "loss": 0.0189, "step": 43070 }, { "epoch": 0.62, "learning_rate": 1.979312167024563e-05, "loss": 0.0199, "step": 43080 }, { "epoch": 0.62, "learning_rate": 1.9793073630507156e-05, "loss": 0.0192, "step": 43090 }, { "epoch": 0.62, "learning_rate": 1.9793025590768686e-05, "loss": 0.0201, "step": 43100 }, { "epoch": 0.62, "learning_rate": 1.9792977551030215e-05, "loss": 0.0175, "step": 43110 }, { "epoch": 0.62, "learning_rate": 1.9792929511291744e-05, "loss": 0.0246, "step": 43120 }, { "epoch": 0.62, "learning_rate": 1.979288147155327e-05, "loss": 0.0197, "step": 43130 }, { "epoch": 0.62, "learning_rate": 1.97928334318148e-05, "loss": 0.0217, "step": 43140 }, { "epoch": 0.62, "learning_rate": 1.979278539207633e-05, "loss": 0.0207, "step": 43150 }, { "epoch": 0.62, "learning_rate": 1.9792742156311703e-05, "loss": 0.0216, "step": 43160 }, { "epoch": 0.62, "learning_rate": 1.979269411657323e-05, "loss": 0.0206, "step": 43170 }, { "epoch": 0.62, "learning_rate": 1.979264607683476e-05, "loss": 0.0235, "step": 43180 }, { "epoch": 0.62, "learning_rate": 1.9792598037096288e-05, "loss": 0.0207, "step": 43190 }, { "epoch": 0.62, "learning_rate": 1.9792549997357814e-05, "loss": 0.0233, "step": 43200 }, { "epoch": 0.62, "learning_rate": 1.9792501957619343e-05, "loss": 0.0196, "step": 43210 }, { "epoch": 0.62, "learning_rate": 1.9792453917880872e-05, "loss": 0.0176, "step": 43220 }, { "epoch": 0.62, "learning_rate": 1.97924058781424e-05, "loss": 0.0225, "step": 43230 }, { "epoch": 0.62, "learning_rate": 1.9792357838403927e-05, "loss": 0.0221, "step": 43240 }, { "epoch": 0.62, "learning_rate": 1.9792309798665457e-05, "loss": 0.0159, "step": 43250 }, { "epoch": 0.62, "learning_rate": 1.9792261758926986e-05, "loss": 0.0178, "step": 43260 }, { "epoch": 0.62, "learning_rate": 1.9792213719188512e-05, "loss": 0.0213, "step": 43270 }, { "epoch": 0.62, "learning_rate": 1.979216567945004e-05, "loss": 0.0177, "step": 43280 }, { "epoch": 0.62, "learning_rate": 1.979211763971157e-05, "loss": 0.0244, "step": 43290 }, { "epoch": 0.62, "learning_rate": 1.97920695999731e-05, "loss": 0.019, "step": 43300 }, { "epoch": 0.62, "learning_rate": 1.9792021560234625e-05, "loss": 0.0166, "step": 43310 }, { "epoch": 0.62, "learning_rate": 1.9791973520496155e-05, "loss": 0.0207, "step": 43320 }, { "epoch": 0.62, "learning_rate": 1.9791925480757684e-05, "loss": 0.024, "step": 43330 }, { "epoch": 0.62, "learning_rate": 1.9791877441019213e-05, "loss": 0.0222, "step": 43340 }, { "epoch": 0.62, "learning_rate": 1.9791829401280743e-05, "loss": 0.0186, "step": 43350 }, { "epoch": 0.62, "learning_rate": 1.9791781361542272e-05, "loss": 0.0175, "step": 43360 }, { "epoch": 0.63, "learning_rate": 1.9791733321803798e-05, "loss": 0.0149, "step": 43370 }, { "epoch": 0.63, "learning_rate": 1.9791685282065327e-05, "loss": 0.0229, "step": 43380 }, { "epoch": 0.63, "learning_rate": 1.9791637242326856e-05, "loss": 0.0152, "step": 43390 }, { "epoch": 0.63, "learning_rate": 1.9791589202588385e-05, "loss": 0.0274, "step": 43400 }, { "epoch": 0.63, "learning_rate": 1.979154116284991e-05, "loss": 0.0218, "step": 43410 }, { "epoch": 0.63, "learning_rate": 1.979149312311144e-05, "loss": 0.0221, "step": 43420 }, { "epoch": 0.63, "learning_rate": 1.9791449887346815e-05, "loss": 0.0217, "step": 43430 }, { "epoch": 0.63, "learning_rate": 1.979140184760834e-05, "loss": 0.0183, "step": 43440 }, { "epoch": 0.63, "learning_rate": 1.979135380786987e-05, "loss": 0.0188, "step": 43450 }, { "epoch": 0.63, "learning_rate": 1.97913057681314e-05, "loss": 0.0188, "step": 43460 }, { "epoch": 0.63, "learning_rate": 1.979125772839293e-05, "loss": 0.019, "step": 43470 }, { "epoch": 0.63, "learning_rate": 1.9791209688654455e-05, "loss": 0.0175, "step": 43480 }, { "epoch": 0.63, "learning_rate": 1.9791161648915984e-05, "loss": 0.02, "step": 43490 }, { "epoch": 0.63, "learning_rate": 1.9791113609177513e-05, "loss": 0.0175, "step": 43500 }, { "epoch": 0.63, "learning_rate": 1.979106556943904e-05, "loss": 0.0205, "step": 43510 }, { "epoch": 0.63, "learning_rate": 1.979101752970057e-05, "loss": 0.0201, "step": 43520 }, { "epoch": 0.63, "learning_rate": 1.9790969489962098e-05, "loss": 0.0147, "step": 43530 }, { "epoch": 0.63, "learning_rate": 1.9790921450223627e-05, "loss": 0.0244, "step": 43540 }, { "epoch": 0.63, "learning_rate": 1.9790873410485153e-05, "loss": 0.0148, "step": 43550 }, { "epoch": 0.63, "learning_rate": 1.9790825370746682e-05, "loss": 0.0177, "step": 43560 }, { "epoch": 0.63, "learning_rate": 1.979077733100821e-05, "loss": 0.0185, "step": 43570 }, { "epoch": 0.63, "learning_rate": 1.979072929126974e-05, "loss": 0.0209, "step": 43580 }, { "epoch": 0.63, "learning_rate": 1.9790681251531267e-05, "loss": 0.0177, "step": 43590 }, { "epoch": 0.63, "learning_rate": 1.9790633211792796e-05, "loss": 0.0163, "step": 43600 }, { "epoch": 0.63, "learning_rate": 1.9790585172054325e-05, "loss": 0.0144, "step": 43610 }, { "epoch": 0.63, "learning_rate": 1.979053713231585e-05, "loss": 0.019, "step": 43620 }, { "epoch": 0.63, "learning_rate": 1.979048909257738e-05, "loss": 0.0224, "step": 43630 }, { "epoch": 0.63, "learning_rate": 1.979044105283891e-05, "loss": 0.0213, "step": 43640 }, { "epoch": 0.63, "learning_rate": 1.979039301310044e-05, "loss": 0.0193, "step": 43650 }, { "epoch": 0.63, "learning_rate": 1.9790344973361965e-05, "loss": 0.022, "step": 43660 }, { "epoch": 0.63, "learning_rate": 1.9790296933623494e-05, "loss": 0.0194, "step": 43670 }, { "epoch": 0.63, "learning_rate": 1.9790248893885023e-05, "loss": 0.0208, "step": 43680 }, { "epoch": 0.63, "learning_rate": 1.979020085414655e-05, "loss": 0.0238, "step": 43690 }, { "epoch": 0.63, "learning_rate": 1.979015281440808e-05, "loss": 0.0173, "step": 43700 }, { "epoch": 0.63, "learning_rate": 1.9790104774669608e-05, "loss": 0.0168, "step": 43710 }, { "epoch": 0.63, "learning_rate": 1.9790056734931137e-05, "loss": 0.0175, "step": 43720 }, { "epoch": 0.63, "learning_rate": 1.9790008695192663e-05, "loss": 0.0142, "step": 43730 }, { "epoch": 0.63, "learning_rate": 1.9789960655454192e-05, "loss": 0.0228, "step": 43740 }, { "epoch": 0.63, "learning_rate": 1.978991261571572e-05, "loss": 0.0257, "step": 43750 }, { "epoch": 0.63, "learning_rate": 1.9789864575977247e-05, "loss": 0.0247, "step": 43760 }, { "epoch": 0.63, "learning_rate": 1.9789816536238777e-05, "loss": 0.022, "step": 43770 }, { "epoch": 0.63, "learning_rate": 1.9789768496500306e-05, "loss": 0.0203, "step": 43780 }, { "epoch": 0.63, "learning_rate": 1.9789720456761835e-05, "loss": 0.024, "step": 43790 }, { "epoch": 0.63, "learning_rate": 1.978967241702336e-05, "loss": 0.0227, "step": 43800 }, { "epoch": 0.63, "learning_rate": 1.978962437728489e-05, "loss": 0.0177, "step": 43810 }, { "epoch": 0.63, "learning_rate": 1.978957633754642e-05, "loss": 0.0128, "step": 43820 }, { "epoch": 0.63, "learning_rate": 1.978952829780795e-05, "loss": 0.0209, "step": 43830 }, { "epoch": 0.63, "learning_rate": 1.9789480258069475e-05, "loss": 0.0161, "step": 43840 }, { "epoch": 0.63, "learning_rate": 1.9789432218331004e-05, "loss": 0.0194, "step": 43850 }, { "epoch": 0.63, "learning_rate": 1.9789384178592533e-05, "loss": 0.0263, "step": 43860 }, { "epoch": 0.63, "learning_rate": 1.9789336138854062e-05, "loss": 0.0156, "step": 43870 }, { "epoch": 0.63, "learning_rate": 1.9789288099115592e-05, "loss": 0.0158, "step": 43880 }, { "epoch": 0.63, "learning_rate": 1.978924005937712e-05, "loss": 0.0167, "step": 43890 }, { "epoch": 0.63, "learning_rate": 1.9789192019638647e-05, "loss": 0.0229, "step": 43900 }, { "epoch": 0.63, "learning_rate": 1.9789143979900176e-05, "loss": 0.0216, "step": 43910 }, { "epoch": 0.63, "learning_rate": 1.9789095940161705e-05, "loss": 0.0247, "step": 43920 }, { "epoch": 0.63, "learning_rate": 1.978904790042323e-05, "loss": 0.0189, "step": 43930 }, { "epoch": 0.63, "learning_rate": 1.978899986068476e-05, "loss": 0.0207, "step": 43940 }, { "epoch": 0.63, "learning_rate": 1.978895182094629e-05, "loss": 0.0188, "step": 43950 }, { "epoch": 0.63, "learning_rate": 1.978890378120782e-05, "loss": 0.0152, "step": 43960 }, { "epoch": 0.63, "learning_rate": 1.9788855741469345e-05, "loss": 0.0219, "step": 43970 }, { "epoch": 0.63, "learning_rate": 1.9788807701730874e-05, "loss": 0.0322, "step": 43980 }, { "epoch": 0.63, "learning_rate": 1.9788759661992404e-05, "loss": 0.0173, "step": 43990 }, { "epoch": 0.63, "learning_rate": 1.978871162225393e-05, "loss": 0.0183, "step": 44000 }, { "epoch": 0.63, "learning_rate": 1.978866358251546e-05, "loss": 0.0215, "step": 44010 }, { "epoch": 0.63, "learning_rate": 1.9788615542776988e-05, "loss": 0.015, "step": 44020 }, { "epoch": 0.63, "learning_rate": 1.9788567503038517e-05, "loss": 0.0148, "step": 44030 }, { "epoch": 0.63, "learning_rate": 1.9788519463300043e-05, "loss": 0.017, "step": 44040 }, { "epoch": 0.63, "learning_rate": 1.9788471423561572e-05, "loss": 0.0196, "step": 44050 }, { "epoch": 0.63, "learning_rate": 1.97884233838231e-05, "loss": 0.0181, "step": 44060 }, { "epoch": 0.64, "learning_rate": 1.978837534408463e-05, "loss": 0.0158, "step": 44070 }, { "epoch": 0.64, "learning_rate": 1.9788327304346157e-05, "loss": 0.0165, "step": 44080 }, { "epoch": 0.64, "learning_rate": 1.9788279264607686e-05, "loss": 0.0198, "step": 44090 }, { "epoch": 0.64, "learning_rate": 1.9788231224869215e-05, "loss": 0.0131, "step": 44100 }, { "epoch": 0.64, "learning_rate": 1.978818318513074e-05, "loss": 0.022, "step": 44110 }, { "epoch": 0.64, "learning_rate": 1.978813514539227e-05, "loss": 0.022, "step": 44120 }, { "epoch": 0.64, "learning_rate": 1.97880871056538e-05, "loss": 0.0194, "step": 44130 }, { "epoch": 0.64, "learning_rate": 1.978803906591533e-05, "loss": 0.0134, "step": 44140 }, { "epoch": 0.64, "learning_rate": 1.9787991026176855e-05, "loss": 0.0133, "step": 44150 }, { "epoch": 0.64, "learning_rate": 1.9787942986438384e-05, "loss": 0.019, "step": 44160 }, { "epoch": 0.64, "learning_rate": 1.9787894946699913e-05, "loss": 0.0218, "step": 44170 }, { "epoch": 0.64, "learning_rate": 1.978784690696144e-05, "loss": 0.016, "step": 44180 }, { "epoch": 0.64, "learning_rate": 1.978779886722297e-05, "loss": 0.0179, "step": 44190 }, { "epoch": 0.64, "learning_rate": 1.9787750827484498e-05, "loss": 0.0139, "step": 44200 }, { "epoch": 0.64, "learning_rate": 1.9787702787746027e-05, "loss": 0.0164, "step": 44210 }, { "epoch": 0.64, "learning_rate": 1.9787654748007553e-05, "loss": 0.0159, "step": 44220 }, { "epoch": 0.64, "learning_rate": 1.9787606708269082e-05, "loss": 0.0177, "step": 44230 }, { "epoch": 0.64, "learning_rate": 1.978755866853061e-05, "loss": 0.018, "step": 44240 }, { "epoch": 0.64, "learning_rate": 1.978751062879214e-05, "loss": 0.0182, "step": 44250 }, { "epoch": 0.64, "learning_rate": 1.9787462589053667e-05, "loss": 0.0189, "step": 44260 }, { "epoch": 0.64, "learning_rate": 1.9787414549315196e-05, "loss": 0.02, "step": 44270 }, { "epoch": 0.64, "learning_rate": 1.9787366509576725e-05, "loss": 0.0183, "step": 44280 }, { "epoch": 0.64, "learning_rate": 1.978731846983825e-05, "loss": 0.0185, "step": 44290 }, { "epoch": 0.64, "learning_rate": 1.978727043009978e-05, "loss": 0.0171, "step": 44300 }, { "epoch": 0.64, "learning_rate": 1.978722239036131e-05, "loss": 0.0167, "step": 44310 }, { "epoch": 0.64, "learning_rate": 1.978717435062284e-05, "loss": 0.0194, "step": 44320 }, { "epoch": 0.64, "learning_rate": 1.9787126310884365e-05, "loss": 0.0174, "step": 44330 }, { "epoch": 0.64, "learning_rate": 1.9787078271145894e-05, "loss": 0.0169, "step": 44340 }, { "epoch": 0.64, "learning_rate": 1.9787030231407423e-05, "loss": 0.0155, "step": 44350 }, { "epoch": 0.64, "learning_rate": 1.978698219166895e-05, "loss": 0.0163, "step": 44360 }, { "epoch": 0.64, "learning_rate": 1.978693415193048e-05, "loss": 0.0194, "step": 44370 }, { "epoch": 0.64, "learning_rate": 1.9786886112192008e-05, "loss": 0.0159, "step": 44380 }, { "epoch": 0.64, "learning_rate": 1.9786838072453537e-05, "loss": 0.0161, "step": 44390 }, { "epoch": 0.64, "learning_rate": 1.9786790032715063e-05, "loss": 0.0229, "step": 44400 }, { "epoch": 0.64, "learning_rate": 1.9786741992976592e-05, "loss": 0.0275, "step": 44410 }, { "epoch": 0.64, "learning_rate": 1.978669395323812e-05, "loss": 0.019, "step": 44420 }, { "epoch": 0.64, "learning_rate": 1.978664591349965e-05, "loss": 0.0267, "step": 44430 }, { "epoch": 0.64, "learning_rate": 1.9786597873761177e-05, "loss": 0.0236, "step": 44440 }, { "epoch": 0.64, "learning_rate": 1.9786549834022706e-05, "loss": 0.02, "step": 44450 }, { "epoch": 0.64, "learning_rate": 1.9786501794284235e-05, "loss": 0.0153, "step": 44460 }, { "epoch": 0.64, "learning_rate": 1.978645375454576e-05, "loss": 0.0184, "step": 44470 }, { "epoch": 0.64, "learning_rate": 1.978640571480729e-05, "loss": 0.0211, "step": 44480 }, { "epoch": 0.64, "learning_rate": 1.978635767506882e-05, "loss": 0.0197, "step": 44490 }, { "epoch": 0.64, "learning_rate": 1.978630963533035e-05, "loss": 0.0191, "step": 44500 }, { "epoch": 0.64, "learning_rate": 1.9786261595591875e-05, "loss": 0.0165, "step": 44510 }, { "epoch": 0.64, "learning_rate": 1.9786213555853404e-05, "loss": 0.0195, "step": 44520 }, { "epoch": 0.64, "learning_rate": 1.9786165516114933e-05, "loss": 0.0202, "step": 44530 }, { "epoch": 0.64, "learning_rate": 1.978611747637646e-05, "loss": 0.0182, "step": 44540 }, { "epoch": 0.64, "learning_rate": 1.978606943663799e-05, "loss": 0.0126, "step": 44550 }, { "epoch": 0.64, "learning_rate": 1.9786021396899518e-05, "loss": 0.0186, "step": 44560 }, { "epoch": 0.64, "learning_rate": 1.9785973357161047e-05, "loss": 0.021, "step": 44570 }, { "epoch": 0.64, "learning_rate": 1.9785925317422573e-05, "loss": 0.0137, "step": 44580 }, { "epoch": 0.64, "learning_rate": 1.9785877277684102e-05, "loss": 0.0223, "step": 44590 }, { "epoch": 0.64, "learning_rate": 1.978582923794563e-05, "loss": 0.016, "step": 44600 }, { "epoch": 0.64, "learning_rate": 1.978578119820716e-05, "loss": 0.02, "step": 44610 }, { "epoch": 0.64, "learning_rate": 1.9785733158468687e-05, "loss": 0.018, "step": 44620 }, { "epoch": 0.64, "learning_rate": 1.9785685118730216e-05, "loss": 0.0159, "step": 44630 }, { "epoch": 0.64, "learning_rate": 1.9785637078991745e-05, "loss": 0.0226, "step": 44640 }, { "epoch": 0.64, "learning_rate": 1.978558903925327e-05, "loss": 0.0237, "step": 44650 }, { "epoch": 0.64, "learning_rate": 1.97855409995148e-05, "loss": 0.0184, "step": 44660 }, { "epoch": 0.64, "learning_rate": 1.978549295977633e-05, "loss": 0.0148, "step": 44670 }, { "epoch": 0.64, "learning_rate": 1.978544492003786e-05, "loss": 0.0162, "step": 44680 }, { "epoch": 0.64, "learning_rate": 1.9785396880299385e-05, "loss": 0.0184, "step": 44690 }, { "epoch": 0.64, "learning_rate": 1.9785348840560914e-05, "loss": 0.0161, "step": 44700 }, { "epoch": 0.64, "learning_rate": 1.9785300800822443e-05, "loss": 0.0196, "step": 44710 }, { "epoch": 0.64, "learning_rate": 1.978525276108397e-05, "loss": 0.0226, "step": 44720 }, { "epoch": 0.64, "learning_rate": 1.97852047213455e-05, "loss": 0.0245, "step": 44730 }, { "epoch": 0.64, "learning_rate": 1.9785156681607028e-05, "loss": 0.0235, "step": 44740 }, { "epoch": 0.64, "learning_rate": 1.9785108641868557e-05, "loss": 0.0223, "step": 44750 }, { "epoch": 0.65, "learning_rate": 1.9785060602130083e-05, "loss": 0.0157, "step": 44760 }, { "epoch": 0.65, "learning_rate": 1.9785012562391612e-05, "loss": 0.0142, "step": 44770 }, { "epoch": 0.65, "learning_rate": 1.978496452265314e-05, "loss": 0.0127, "step": 44780 }, { "epoch": 0.65, "learning_rate": 1.978491648291467e-05, "loss": 0.0177, "step": 44790 }, { "epoch": 0.65, "learning_rate": 1.9784868443176196e-05, "loss": 0.0156, "step": 44800 }, { "epoch": 0.65, "learning_rate": 1.9784820403437726e-05, "loss": 0.0148, "step": 44810 }, { "epoch": 0.65, "learning_rate": 1.9784772363699255e-05, "loss": 0.0207, "step": 44820 }, { "epoch": 0.65, "learning_rate": 1.978472432396078e-05, "loss": 0.0145, "step": 44830 }, { "epoch": 0.65, "learning_rate": 1.978467628422231e-05, "loss": 0.0173, "step": 44840 }, { "epoch": 0.65, "learning_rate": 1.978462824448384e-05, "loss": 0.0163, "step": 44850 }, { "epoch": 0.65, "learning_rate": 1.978458020474537e-05, "loss": 0.0205, "step": 44860 }, { "epoch": 0.65, "learning_rate": 1.9784532165006895e-05, "loss": 0.0227, "step": 44870 }, { "epoch": 0.65, "learning_rate": 1.9784484125268424e-05, "loss": 0.0218, "step": 44880 }, { "epoch": 0.65, "learning_rate": 1.9784436085529953e-05, "loss": 0.0198, "step": 44890 }, { "epoch": 0.65, "learning_rate": 1.978438804579148e-05, "loss": 0.0222, "step": 44900 }, { "epoch": 0.65, "learning_rate": 1.9784340006053008e-05, "loss": 0.0209, "step": 44910 }, { "epoch": 0.65, "learning_rate": 1.9784291966314538e-05, "loss": 0.0161, "step": 44920 }, { "epoch": 0.65, "learning_rate": 1.9784243926576067e-05, "loss": 0.0215, "step": 44930 }, { "epoch": 0.65, "learning_rate": 1.9784195886837593e-05, "loss": 0.0168, "step": 44940 }, { "epoch": 0.65, "learning_rate": 1.9784147847099122e-05, "loss": 0.0234, "step": 44950 }, { "epoch": 0.65, "learning_rate": 1.978409980736065e-05, "loss": 0.016, "step": 44960 }, { "epoch": 0.65, "learning_rate": 1.978405176762218e-05, "loss": 0.018, "step": 44970 }, { "epoch": 0.65, "learning_rate": 1.9784003727883706e-05, "loss": 0.0171, "step": 44980 }, { "epoch": 0.65, "learning_rate": 1.9783955688145236e-05, "loss": 0.0269, "step": 44990 }, { "epoch": 0.65, "learning_rate": 1.9783907648406765e-05, "loss": 0.0192, "step": 45000 }, { "epoch": 0.65, "learning_rate": 1.978385960866829e-05, "loss": 0.0265, "step": 45010 }, { "epoch": 0.65, "learning_rate": 1.978381156892982e-05, "loss": 0.0142, "step": 45020 }, { "epoch": 0.65, "learning_rate": 1.978376352919135e-05, "loss": 0.0288, "step": 45030 }, { "epoch": 0.65, "learning_rate": 1.978371548945288e-05, "loss": 0.0211, "step": 45040 }, { "epoch": 0.65, "learning_rate": 1.9783667449714405e-05, "loss": 0.0202, "step": 45050 }, { "epoch": 0.65, "learning_rate": 1.9783619409975934e-05, "loss": 0.0118, "step": 45060 }, { "epoch": 0.65, "learning_rate": 1.9783571370237463e-05, "loss": 0.0183, "step": 45070 }, { "epoch": 0.65, "learning_rate": 1.978352333049899e-05, "loss": 0.0197, "step": 45080 }, { "epoch": 0.65, "learning_rate": 1.9783475290760518e-05, "loss": 0.0236, "step": 45090 }, { "epoch": 0.65, "learning_rate": 1.9783427251022047e-05, "loss": 0.0185, "step": 45100 }, { "epoch": 0.65, "learning_rate": 1.9783379211283577e-05, "loss": 0.0188, "step": 45110 }, { "epoch": 0.65, "learning_rate": 1.9783331171545103e-05, "loss": 0.0163, "step": 45120 }, { "epoch": 0.65, "learning_rate": 1.9783283131806632e-05, "loss": 0.0232, "step": 45130 }, { "epoch": 0.65, "learning_rate": 1.978323509206816e-05, "loss": 0.0183, "step": 45140 }, { "epoch": 0.65, "learning_rate": 1.9783187052329687e-05, "loss": 0.017, "step": 45150 }, { "epoch": 0.65, "learning_rate": 1.9783139012591216e-05, "loss": 0.0215, "step": 45160 }, { "epoch": 0.65, "learning_rate": 1.9783090972852746e-05, "loss": 0.025, "step": 45170 }, { "epoch": 0.65, "learning_rate": 1.9783042933114275e-05, "loss": 0.0182, "step": 45180 }, { "epoch": 0.65, "learning_rate": 1.97829948933758e-05, "loss": 0.0175, "step": 45190 }, { "epoch": 0.65, "learning_rate": 1.978294685363733e-05, "loss": 0.0188, "step": 45200 }, { "epoch": 0.65, "learning_rate": 1.978289881389886e-05, "loss": 0.0231, "step": 45210 }, { "epoch": 0.65, "learning_rate": 1.978285077416039e-05, "loss": 0.0184, "step": 45220 }, { "epoch": 0.65, "learning_rate": 1.9782802734421914e-05, "loss": 0.0126, "step": 45230 }, { "epoch": 0.65, "learning_rate": 1.9782754694683444e-05, "loss": 0.0233, "step": 45240 }, { "epoch": 0.65, "learning_rate": 1.9782706654944973e-05, "loss": 0.0183, "step": 45250 }, { "epoch": 0.65, "learning_rate": 1.97826586152065e-05, "loss": 0.0163, "step": 45260 }, { "epoch": 0.65, "learning_rate": 1.9782610575468028e-05, "loss": 0.0173, "step": 45270 }, { "epoch": 0.65, "learning_rate": 1.9782562535729557e-05, "loss": 0.0201, "step": 45280 }, { "epoch": 0.65, "learning_rate": 1.9782514495991087e-05, "loss": 0.0162, "step": 45290 }, { "epoch": 0.65, "learning_rate": 1.9782466456252613e-05, "loss": 0.0193, "step": 45300 }, { "epoch": 0.65, "learning_rate": 1.9782418416514142e-05, "loss": 0.0187, "step": 45310 }, { "epoch": 0.65, "learning_rate": 1.978237037677567e-05, "loss": 0.0215, "step": 45320 }, { "epoch": 0.65, "learning_rate": 1.9782322337037197e-05, "loss": 0.0219, "step": 45330 }, { "epoch": 0.65, "learning_rate": 1.9782274297298726e-05, "loss": 0.0186, "step": 45340 }, { "epoch": 0.65, "learning_rate": 1.9782226257560255e-05, "loss": 0.018, "step": 45350 }, { "epoch": 0.65, "learning_rate": 1.9782178217821785e-05, "loss": 0.021, "step": 45360 }, { "epoch": 0.65, "learning_rate": 1.978213017808331e-05, "loss": 0.0187, "step": 45370 }, { "epoch": 0.65, "learning_rate": 1.978208213834484e-05, "loss": 0.0145, "step": 45380 }, { "epoch": 0.65, "learning_rate": 1.978203409860637e-05, "loss": 0.0184, "step": 45390 }, { "epoch": 0.65, "learning_rate": 1.97819860588679e-05, "loss": 0.024, "step": 45400 }, { "epoch": 0.65, "learning_rate": 1.9781938019129424e-05, "loss": 0.0246, "step": 45410 }, { "epoch": 0.65, "learning_rate": 1.9781889979390954e-05, "loss": 0.0245, "step": 45420 }, { "epoch": 0.65, "learning_rate": 1.9781841939652483e-05, "loss": 0.0183, "step": 45430 }, { "epoch": 0.65, "learning_rate": 1.978179389991401e-05, "loss": 0.0156, "step": 45440 }, { "epoch": 0.66, "learning_rate": 1.9781745860175538e-05, "loss": 0.0183, "step": 45450 }, { "epoch": 0.66, "learning_rate": 1.9781697820437067e-05, "loss": 0.0202, "step": 45460 }, { "epoch": 0.66, "learning_rate": 1.9781649780698597e-05, "loss": 0.0171, "step": 45470 }, { "epoch": 0.66, "learning_rate": 1.9781601740960122e-05, "loss": 0.0119, "step": 45480 }, { "epoch": 0.66, "learning_rate": 1.9781553701221652e-05, "loss": 0.0181, "step": 45490 }, { "epoch": 0.66, "learning_rate": 1.978150566148318e-05, "loss": 0.0152, "step": 45500 }, { "epoch": 0.66, "learning_rate": 1.9781457621744707e-05, "loss": 0.0211, "step": 45510 }, { "epoch": 0.66, "learning_rate": 1.9781409582006236e-05, "loss": 0.0228, "step": 45520 }, { "epoch": 0.66, "learning_rate": 1.9781361542267765e-05, "loss": 0.0199, "step": 45530 }, { "epoch": 0.66, "learning_rate": 1.9781313502529295e-05, "loss": 0.0194, "step": 45540 }, { "epoch": 0.66, "learning_rate": 1.978126546279082e-05, "loss": 0.024, "step": 45550 }, { "epoch": 0.66, "learning_rate": 1.978121742305235e-05, "loss": 0.0166, "step": 45560 }, { "epoch": 0.66, "learning_rate": 1.978116938331388e-05, "loss": 0.0158, "step": 45570 }, { "epoch": 0.66, "learning_rate": 1.978112134357541e-05, "loss": 0.0183, "step": 45580 }, { "epoch": 0.66, "learning_rate": 1.9781073303836934e-05, "loss": 0.0174, "step": 45590 }, { "epoch": 0.66, "learning_rate": 1.9781025264098464e-05, "loss": 0.0237, "step": 45600 }, { "epoch": 0.66, "learning_rate": 1.9780977224359993e-05, "loss": 0.0172, "step": 45610 }, { "epoch": 0.66, "learning_rate": 1.978092918462152e-05, "loss": 0.0193, "step": 45620 }, { "epoch": 0.66, "learning_rate": 1.9780881144883048e-05, "loss": 0.014, "step": 45630 }, { "epoch": 0.66, "learning_rate": 1.9780833105144577e-05, "loss": 0.0205, "step": 45640 }, { "epoch": 0.66, "learning_rate": 1.9780785065406106e-05, "loss": 0.0196, "step": 45650 }, { "epoch": 0.66, "learning_rate": 1.9780737025667632e-05, "loss": 0.0168, "step": 45660 }, { "epoch": 0.66, "learning_rate": 1.978068898592916e-05, "loss": 0.0175, "step": 45670 }, { "epoch": 0.66, "learning_rate": 1.978064094619069e-05, "loss": 0.016, "step": 45680 }, { "epoch": 0.66, "learning_rate": 1.9780592906452217e-05, "loss": 0.0207, "step": 45690 }, { "epoch": 0.66, "learning_rate": 1.9780544866713746e-05, "loss": 0.0184, "step": 45700 }, { "epoch": 0.66, "learning_rate": 1.9780496826975275e-05, "loss": 0.0169, "step": 45710 }, { "epoch": 0.66, "learning_rate": 1.9780448787236805e-05, "loss": 0.019, "step": 45720 }, { "epoch": 0.66, "learning_rate": 1.978040074749833e-05, "loss": 0.0179, "step": 45730 }, { "epoch": 0.66, "learning_rate": 1.978035270775986e-05, "loss": 0.0181, "step": 45740 }, { "epoch": 0.66, "learning_rate": 1.978030466802139e-05, "loss": 0.0174, "step": 45750 }, { "epoch": 0.66, "learning_rate": 1.9780256628282918e-05, "loss": 0.0176, "step": 45760 }, { "epoch": 0.66, "learning_rate": 1.9780208588544444e-05, "loss": 0.0174, "step": 45770 }, { "epoch": 0.66, "learning_rate": 1.9780160548805973e-05, "loss": 0.0164, "step": 45780 }, { "epoch": 0.66, "learning_rate": 1.9780112509067503e-05, "loss": 0.0214, "step": 45790 }, { "epoch": 0.66, "learning_rate": 1.978006446932903e-05, "loss": 0.025, "step": 45800 }, { "epoch": 0.66, "learning_rate": 1.9780016429590558e-05, "loss": 0.0225, "step": 45810 }, { "epoch": 0.66, "learning_rate": 1.9779968389852087e-05, "loss": 0.0211, "step": 45820 }, { "epoch": 0.66, "learning_rate": 1.9779920350113616e-05, "loss": 0.0233, "step": 45830 }, { "epoch": 0.66, "learning_rate": 1.9779872310375142e-05, "loss": 0.0149, "step": 45840 }, { "epoch": 0.66, "learning_rate": 1.977982427063667e-05, "loss": 0.0186, "step": 45850 }, { "epoch": 0.66, "learning_rate": 1.97797762308982e-05, "loss": 0.0198, "step": 45860 }, { "epoch": 0.66, "learning_rate": 1.9779728191159727e-05, "loss": 0.0157, "step": 45870 }, { "epoch": 0.66, "learning_rate": 1.9779680151421256e-05, "loss": 0.0163, "step": 45880 }, { "epoch": 0.66, "learning_rate": 1.9779632111682785e-05, "loss": 0.0235, "step": 45890 }, { "epoch": 0.66, "learning_rate": 1.9779584071944315e-05, "loss": 0.0188, "step": 45900 }, { "epoch": 0.66, "learning_rate": 1.977953603220584e-05, "loss": 0.0156, "step": 45910 }, { "epoch": 0.66, "learning_rate": 1.977948799246737e-05, "loss": 0.0186, "step": 45920 }, { "epoch": 0.66, "learning_rate": 1.97794399527289e-05, "loss": 0.0229, "step": 45930 }, { "epoch": 0.66, "learning_rate": 1.9779391912990428e-05, "loss": 0.0158, "step": 45940 }, { "epoch": 0.66, "learning_rate": 1.9779343873251954e-05, "loss": 0.0208, "step": 45950 }, { "epoch": 0.66, "learning_rate": 1.9779295833513483e-05, "loss": 0.0176, "step": 45960 }, { "epoch": 0.66, "learning_rate": 1.9779247793775013e-05, "loss": 0.0193, "step": 45970 }, { "epoch": 0.66, "learning_rate": 1.977919975403654e-05, "loss": 0.024, "step": 45980 }, { "epoch": 0.66, "learning_rate": 1.9779151714298068e-05, "loss": 0.0182, "step": 45990 }, { "epoch": 0.66, "learning_rate": 1.9779103674559597e-05, "loss": 0.0203, "step": 46000 }, { "epoch": 0.66, "learning_rate": 1.9779055634821126e-05, "loss": 0.0231, "step": 46010 }, { "epoch": 0.66, "learning_rate": 1.9779007595082652e-05, "loss": 0.0195, "step": 46020 }, { "epoch": 0.66, "learning_rate": 1.977895955534418e-05, "loss": 0.0178, "step": 46030 }, { "epoch": 0.66, "learning_rate": 1.977891151560571e-05, "loss": 0.0184, "step": 46040 }, { "epoch": 0.66, "learning_rate": 1.9778863475867237e-05, "loss": 0.0196, "step": 46050 }, { "epoch": 0.66, "learning_rate": 1.9778815436128766e-05, "loss": 0.0129, "step": 46060 }, { "epoch": 0.66, "learning_rate": 1.9778767396390295e-05, "loss": 0.0189, "step": 46070 }, { "epoch": 0.66, "learning_rate": 1.9778719356651824e-05, "loss": 0.0183, "step": 46080 }, { "epoch": 0.66, "learning_rate": 1.977867131691335e-05, "loss": 0.0174, "step": 46090 }, { "epoch": 0.66, "learning_rate": 1.977862327717488e-05, "loss": 0.0229, "step": 46100 }, { "epoch": 0.66, "learning_rate": 1.977857523743641e-05, "loss": 0.0157, "step": 46110 }, { "epoch": 0.66, "learning_rate": 1.9778527197697938e-05, "loss": 0.0196, "step": 46120 }, { "epoch": 0.66, "learning_rate": 1.9778479157959464e-05, "loss": 0.0231, "step": 46130 }, { "epoch": 0.66, "learning_rate": 1.9778431118220993e-05, "loss": 0.0213, "step": 46140 }, { "epoch": 0.67, "learning_rate": 1.9778383078482523e-05, "loss": 0.0163, "step": 46150 }, { "epoch": 0.67, "learning_rate": 1.977833503874405e-05, "loss": 0.0259, "step": 46160 }, { "epoch": 0.67, "learning_rate": 1.9778286999005578e-05, "loss": 0.0171, "step": 46170 }, { "epoch": 0.67, "learning_rate": 1.9778238959267107e-05, "loss": 0.0145, "step": 46180 }, { "epoch": 0.67, "learning_rate": 1.9778190919528636e-05, "loss": 0.0224, "step": 46190 }, { "epoch": 0.67, "learning_rate": 1.9778142879790162e-05, "loss": 0.0152, "step": 46200 }, { "epoch": 0.67, "learning_rate": 1.977809484005169e-05, "loss": 0.0206, "step": 46210 }, { "epoch": 0.67, "learning_rate": 1.977804680031322e-05, "loss": 0.0183, "step": 46220 }, { "epoch": 0.67, "learning_rate": 1.9777998760574747e-05, "loss": 0.014, "step": 46230 }, { "epoch": 0.67, "learning_rate": 1.9777950720836276e-05, "loss": 0.0212, "step": 46240 }, { "epoch": 0.67, "learning_rate": 1.9777902681097805e-05, "loss": 0.0185, "step": 46250 }, { "epoch": 0.67, "learning_rate": 1.9777854641359334e-05, "loss": 0.0198, "step": 46260 }, { "epoch": 0.67, "learning_rate": 1.977780660162086e-05, "loss": 0.0227, "step": 46270 }, { "epoch": 0.67, "learning_rate": 1.977775856188239e-05, "loss": 0.0204, "step": 46280 }, { "epoch": 0.67, "learning_rate": 1.977771052214392e-05, "loss": 0.0181, "step": 46290 }, { "epoch": 0.67, "learning_rate": 1.9777662482405448e-05, "loss": 0.0176, "step": 46300 }, { "epoch": 0.67, "learning_rate": 1.9777614442666974e-05, "loss": 0.0259, "step": 46310 }, { "epoch": 0.67, "learning_rate": 1.9777566402928503e-05, "loss": 0.0152, "step": 46320 }, { "epoch": 0.67, "learning_rate": 1.9777518363190032e-05, "loss": 0.0155, "step": 46330 }, { "epoch": 0.67, "learning_rate": 1.977747032345156e-05, "loss": 0.0162, "step": 46340 }, { "epoch": 0.67, "learning_rate": 1.9777422283713088e-05, "loss": 0.0177, "step": 46350 }, { "epoch": 0.67, "learning_rate": 1.9777374243974617e-05, "loss": 0.0219, "step": 46360 }, { "epoch": 0.67, "learning_rate": 1.9777326204236146e-05, "loss": 0.0189, "step": 46370 }, { "epoch": 0.67, "learning_rate": 1.9777278164497672e-05, "loss": 0.016, "step": 46380 }, { "epoch": 0.67, "learning_rate": 1.97772301247592e-05, "loss": 0.019, "step": 46390 }, { "epoch": 0.67, "learning_rate": 1.977718208502073e-05, "loss": 0.0242, "step": 46400 }, { "epoch": 0.67, "learning_rate": 1.9777134045282256e-05, "loss": 0.0226, "step": 46410 }, { "epoch": 0.67, "learning_rate": 1.977708600554379e-05, "loss": 0.022, "step": 46420 }, { "epoch": 0.67, "learning_rate": 1.977703796580532e-05, "loss": 0.018, "step": 46430 }, { "epoch": 0.67, "learning_rate": 1.9776989926066844e-05, "loss": 0.0233, "step": 46440 }, { "epoch": 0.67, "learning_rate": 1.9776941886328374e-05, "loss": 0.0188, "step": 46450 }, { "epoch": 0.67, "learning_rate": 1.9776893846589903e-05, "loss": 0.0235, "step": 46460 }, { "epoch": 0.67, "learning_rate": 1.977684580685143e-05, "loss": 0.0195, "step": 46470 }, { "epoch": 0.67, "learning_rate": 1.9776797767112958e-05, "loss": 0.0152, "step": 46480 }, { "epoch": 0.67, "learning_rate": 1.9776749727374487e-05, "loss": 0.0171, "step": 46490 }, { "epoch": 0.67, "learning_rate": 1.9776701687636016e-05, "loss": 0.0158, "step": 46500 }, { "epoch": 0.67, "learning_rate": 1.9776653647897542e-05, "loss": 0.0253, "step": 46510 }, { "epoch": 0.67, "learning_rate": 1.977660560815907e-05, "loss": 0.0178, "step": 46520 }, { "epoch": 0.67, "learning_rate": 1.97765575684206e-05, "loss": 0.0168, "step": 46530 }, { "epoch": 0.67, "learning_rate": 1.977650952868213e-05, "loss": 0.0199, "step": 46540 }, { "epoch": 0.67, "learning_rate": 1.9776461488943656e-05, "loss": 0.018, "step": 46550 }, { "epoch": 0.67, "learning_rate": 1.9776413449205185e-05, "loss": 0.02, "step": 46560 }, { "epoch": 0.67, "learning_rate": 1.9776365409466715e-05, "loss": 0.0186, "step": 46570 }, { "epoch": 0.67, "learning_rate": 1.977631736972824e-05, "loss": 0.016, "step": 46580 }, { "epoch": 0.67, "learning_rate": 1.977626932998977e-05, "loss": 0.0221, "step": 46590 }, { "epoch": 0.67, "learning_rate": 1.97762212902513e-05, "loss": 0.0139, "step": 46600 }, { "epoch": 0.67, "learning_rate": 1.9776173250512828e-05, "loss": 0.0186, "step": 46610 }, { "epoch": 0.67, "learning_rate": 1.9776125210774354e-05, "loss": 0.0154, "step": 46620 }, { "epoch": 0.67, "learning_rate": 1.9776077171035883e-05, "loss": 0.0181, "step": 46630 }, { "epoch": 0.67, "learning_rate": 1.9776029131297413e-05, "loss": 0.0187, "step": 46640 }, { "epoch": 0.67, "learning_rate": 1.977598109155894e-05, "loss": 0.0171, "step": 46650 }, { "epoch": 0.67, "learning_rate": 1.9775933051820468e-05, "loss": 0.0237, "step": 46660 }, { "epoch": 0.67, "learning_rate": 1.9775885012081997e-05, "loss": 0.0176, "step": 46670 }, { "epoch": 0.67, "learning_rate": 1.9775836972343526e-05, "loss": 0.0173, "step": 46680 }, { "epoch": 0.67, "learning_rate": 1.9775788932605052e-05, "loss": 0.0193, "step": 46690 }, { "epoch": 0.67, "learning_rate": 1.977574089286658e-05, "loss": 0.0131, "step": 46700 }, { "epoch": 0.67, "learning_rate": 1.977569285312811e-05, "loss": 0.0154, "step": 46710 }, { "epoch": 0.67, "learning_rate": 1.9775644813389637e-05, "loss": 0.0201, "step": 46720 }, { "epoch": 0.67, "learning_rate": 1.9775596773651166e-05, "loss": 0.0227, "step": 46730 }, { "epoch": 0.67, "learning_rate": 1.9775548733912695e-05, "loss": 0.0142, "step": 46740 }, { "epoch": 0.67, "learning_rate": 1.9775500694174225e-05, "loss": 0.0177, "step": 46750 }, { "epoch": 0.67, "learning_rate": 1.977545265443575e-05, "loss": 0.0263, "step": 46760 }, { "epoch": 0.67, "learning_rate": 1.977540461469728e-05, "loss": 0.0148, "step": 46770 }, { "epoch": 0.67, "learning_rate": 1.977535657495881e-05, "loss": 0.0206, "step": 46780 }, { "epoch": 0.67, "learning_rate": 1.9775308535220338e-05, "loss": 0.0161, "step": 46790 }, { "epoch": 0.67, "learning_rate": 1.9775260495481864e-05, "loss": 0.0179, "step": 46800 }, { "epoch": 0.67, "learning_rate": 1.9775212455743393e-05, "loss": 0.0232, "step": 46810 }, { "epoch": 0.67, "learning_rate": 1.9775164416004923e-05, "loss": 0.0155, "step": 46820 }, { "epoch": 0.67, "learning_rate": 1.977511637626645e-05, "loss": 0.0183, "step": 46830 }, { "epoch": 0.68, "learning_rate": 1.9775068336527978e-05, "loss": 0.0194, "step": 46840 }, { "epoch": 0.68, "learning_rate": 1.9775020296789507e-05, "loss": 0.0241, "step": 46850 }, { "epoch": 0.68, "learning_rate": 1.9774972257051036e-05, "loss": 0.0172, "step": 46860 }, { "epoch": 0.68, "learning_rate": 1.9774924217312562e-05, "loss": 0.0151, "step": 46870 }, { "epoch": 0.68, "learning_rate": 1.977487617757409e-05, "loss": 0.0228, "step": 46880 }, { "epoch": 0.68, "learning_rate": 1.977482813783562e-05, "loss": 0.0161, "step": 46890 }, { "epoch": 0.68, "learning_rate": 1.9774780098097147e-05, "loss": 0.0163, "step": 46900 }, { "epoch": 0.68, "learning_rate": 1.9774732058358676e-05, "loss": 0.0194, "step": 46910 }, { "epoch": 0.68, "learning_rate": 1.9774684018620205e-05, "loss": 0.0157, "step": 46920 }, { "epoch": 0.68, "learning_rate": 1.9774635978881734e-05, "loss": 0.0188, "step": 46930 }, { "epoch": 0.68, "learning_rate": 1.977458793914326e-05, "loss": 0.0147, "step": 46940 }, { "epoch": 0.68, "learning_rate": 1.977453989940479e-05, "loss": 0.0182, "step": 46950 }, { "epoch": 0.68, "learning_rate": 1.977449185966632e-05, "loss": 0.0189, "step": 46960 }, { "epoch": 0.68, "learning_rate": 1.9774443819927848e-05, "loss": 0.0167, "step": 46970 }, { "epoch": 0.68, "learning_rate": 1.9774395780189374e-05, "loss": 0.0185, "step": 46980 }, { "epoch": 0.68, "learning_rate": 1.9774347740450903e-05, "loss": 0.0199, "step": 46990 }, { "epoch": 0.68, "learning_rate": 1.9774299700712433e-05, "loss": 0.0258, "step": 47000 }, { "epoch": 0.68, "learning_rate": 1.977425166097396e-05, "loss": 0.0234, "step": 47010 }, { "epoch": 0.68, "learning_rate": 1.9774203621235488e-05, "loss": 0.0196, "step": 47020 }, { "epoch": 0.68, "learning_rate": 1.9774155581497017e-05, "loss": 0.0175, "step": 47030 }, { "epoch": 0.68, "learning_rate": 1.9774107541758546e-05, "loss": 0.0198, "step": 47040 }, { "epoch": 0.68, "learning_rate": 1.9774059502020072e-05, "loss": 0.0286, "step": 47050 }, { "epoch": 0.68, "learning_rate": 1.97740114622816e-05, "loss": 0.0151, "step": 47060 }, { "epoch": 0.68, "learning_rate": 1.977396342254313e-05, "loss": 0.0226, "step": 47070 }, { "epoch": 0.68, "learning_rate": 1.9773915382804657e-05, "loss": 0.0183, "step": 47080 }, { "epoch": 0.68, "learning_rate": 1.9773867343066186e-05, "loss": 0.0193, "step": 47090 }, { "epoch": 0.68, "learning_rate": 1.9773819303327715e-05, "loss": 0.0171, "step": 47100 }, { "epoch": 0.68, "learning_rate": 1.9773771263589244e-05, "loss": 0.0244, "step": 47110 }, { "epoch": 0.68, "learning_rate": 1.977372322385077e-05, "loss": 0.0191, "step": 47120 }, { "epoch": 0.68, "learning_rate": 1.97736751841123e-05, "loss": 0.0214, "step": 47130 }, { "epoch": 0.68, "learning_rate": 1.977362714437383e-05, "loss": 0.0224, "step": 47140 }, { "epoch": 0.68, "learning_rate": 1.9773579104635358e-05, "loss": 0.024, "step": 47150 }, { "epoch": 0.68, "learning_rate": 1.9773531064896884e-05, "loss": 0.0146, "step": 47160 }, { "epoch": 0.68, "learning_rate": 1.9773483025158413e-05, "loss": 0.0198, "step": 47170 }, { "epoch": 0.68, "learning_rate": 1.9773434985419942e-05, "loss": 0.0221, "step": 47180 }, { "epoch": 0.68, "learning_rate": 1.977338694568147e-05, "loss": 0.0148, "step": 47190 }, { "epoch": 0.68, "learning_rate": 1.9773338905942998e-05, "loss": 0.0169, "step": 47200 }, { "epoch": 0.68, "learning_rate": 1.9773290866204527e-05, "loss": 0.0231, "step": 47210 }, { "epoch": 0.68, "learning_rate": 1.9773242826466056e-05, "loss": 0.0211, "step": 47220 }, { "epoch": 0.68, "learning_rate": 1.9773194786727582e-05, "loss": 0.0155, "step": 47230 }, { "epoch": 0.68, "learning_rate": 1.977314674698911e-05, "loss": 0.0203, "step": 47240 }, { "epoch": 0.68, "learning_rate": 1.977309870725064e-05, "loss": 0.0179, "step": 47250 }, { "epoch": 0.68, "learning_rate": 1.9773050667512166e-05, "loss": 0.0244, "step": 47260 }, { "epoch": 0.68, "learning_rate": 1.9773002627773696e-05, "loss": 0.0235, "step": 47270 }, { "epoch": 0.68, "learning_rate": 1.9772954588035225e-05, "loss": 0.0171, "step": 47280 }, { "epoch": 0.68, "learning_rate": 1.9772906548296754e-05, "loss": 0.0215, "step": 47290 }, { "epoch": 0.68, "learning_rate": 1.977285850855828e-05, "loss": 0.0195, "step": 47300 }, { "epoch": 0.68, "learning_rate": 1.977281046881981e-05, "loss": 0.0172, "step": 47310 }, { "epoch": 0.68, "learning_rate": 1.977276242908134e-05, "loss": 0.0129, "step": 47320 }, { "epoch": 0.68, "learning_rate": 1.9772714389342868e-05, "loss": 0.021, "step": 47330 }, { "epoch": 0.68, "learning_rate": 1.9772666349604394e-05, "loss": 0.021, "step": 47340 }, { "epoch": 0.68, "learning_rate": 1.9772618309865923e-05, "loss": 0.019, "step": 47350 }, { "epoch": 0.68, "learning_rate": 1.9772570270127452e-05, "loss": 0.021, "step": 47360 }, { "epoch": 0.68, "learning_rate": 1.9772522230388978e-05, "loss": 0.0153, "step": 47370 }, { "epoch": 0.68, "learning_rate": 1.9772474190650508e-05, "loss": 0.0225, "step": 47380 }, { "epoch": 0.68, "learning_rate": 1.9772426150912037e-05, "loss": 0.0192, "step": 47390 }, { "epoch": 0.68, "learning_rate": 1.9772378111173566e-05, "loss": 0.0152, "step": 47400 }, { "epoch": 0.68, "learning_rate": 1.9772330071435092e-05, "loss": 0.0165, "step": 47410 }, { "epoch": 0.68, "learning_rate": 1.977228203169662e-05, "loss": 0.0394, "step": 47420 }, { "epoch": 0.68, "learning_rate": 1.977223399195815e-05, "loss": 0.0194, "step": 47430 }, { "epoch": 0.68, "learning_rate": 1.9772185952219676e-05, "loss": 0.0145, "step": 47440 }, { "epoch": 0.68, "learning_rate": 1.9772137912481206e-05, "loss": 0.0191, "step": 47450 }, { "epoch": 0.68, "learning_rate": 1.9772089872742735e-05, "loss": 0.0153, "step": 47460 }, { "epoch": 0.68, "learning_rate": 1.9772041833004264e-05, "loss": 0.0236, "step": 47470 }, { "epoch": 0.68, "learning_rate": 1.977199379326579e-05, "loss": 0.0189, "step": 47480 }, { "epoch": 0.68, "learning_rate": 1.977194575352732e-05, "loss": 0.0191, "step": 47490 }, { "epoch": 0.68, "learning_rate": 1.977189771378885e-05, "loss": 0.0193, "step": 47500 }, { "epoch": 0.68, "learning_rate": 1.9771849674050378e-05, "loss": 0.0225, "step": 47510 }, { "epoch": 0.68, "learning_rate": 1.9771801634311904e-05, "loss": 0.0183, "step": 47520 }, { "epoch": 0.68, "learning_rate": 1.9771753594573433e-05, "loss": 0.0194, "step": 47530 }, { "epoch": 0.69, "learning_rate": 1.9771705554834962e-05, "loss": 0.0179, "step": 47540 }, { "epoch": 0.69, "learning_rate": 1.9771657515096488e-05, "loss": 0.0202, "step": 47550 }, { "epoch": 0.69, "learning_rate": 1.9771609475358017e-05, "loss": 0.017, "step": 47560 }, { "epoch": 0.69, "learning_rate": 1.9771561435619547e-05, "loss": 0.0162, "step": 47570 }, { "epoch": 0.69, "learning_rate": 1.9771513395881076e-05, "loss": 0.0204, "step": 47580 }, { "epoch": 0.69, "learning_rate": 1.9771465356142602e-05, "loss": 0.0176, "step": 47590 }, { "epoch": 0.69, "learning_rate": 1.977141731640413e-05, "loss": 0.0128, "step": 47600 }, { "epoch": 0.69, "learning_rate": 1.977136927666566e-05, "loss": 0.019, "step": 47610 }, { "epoch": 0.69, "learning_rate": 1.9771321236927186e-05, "loss": 0.0208, "step": 47620 }, { "epoch": 0.69, "learning_rate": 1.9771273197188716e-05, "loss": 0.0198, "step": 47630 }, { "epoch": 0.69, "learning_rate": 1.9771225157450245e-05, "loss": 0.0163, "step": 47640 }, { "epoch": 0.69, "learning_rate": 1.9771177117711774e-05, "loss": 0.018, "step": 47650 }, { "epoch": 0.69, "learning_rate": 1.97711290779733e-05, "loss": 0.0208, "step": 47660 }, { "epoch": 0.69, "learning_rate": 1.977108103823483e-05, "loss": 0.0157, "step": 47670 }, { "epoch": 0.69, "learning_rate": 1.977103299849636e-05, "loss": 0.017, "step": 47680 }, { "epoch": 0.69, "learning_rate": 1.9770984958757888e-05, "loss": 0.019, "step": 47690 }, { "epoch": 0.69, "learning_rate": 1.9770936919019414e-05, "loss": 0.0204, "step": 47700 }, { "epoch": 0.69, "learning_rate": 1.9770888879280943e-05, "loss": 0.0168, "step": 47710 }, { "epoch": 0.69, "learning_rate": 1.9770840839542472e-05, "loss": 0.015, "step": 47720 }, { "epoch": 0.69, "learning_rate": 1.9770792799803998e-05, "loss": 0.0121, "step": 47730 }, { "epoch": 0.69, "learning_rate": 1.9770744760065527e-05, "loss": 0.0201, "step": 47740 }, { "epoch": 0.69, "learning_rate": 1.9770696720327057e-05, "loss": 0.0166, "step": 47750 }, { "epoch": 0.69, "learning_rate": 1.9770648680588586e-05, "loss": 0.0176, "step": 47760 }, { "epoch": 0.69, "learning_rate": 1.9770600640850112e-05, "loss": 0.0205, "step": 47770 }, { "epoch": 0.69, "learning_rate": 1.977055260111164e-05, "loss": 0.0151, "step": 47780 }, { "epoch": 0.69, "learning_rate": 1.977050456137317e-05, "loss": 0.0154, "step": 47790 }, { "epoch": 0.69, "learning_rate": 1.9770456521634696e-05, "loss": 0.0174, "step": 47800 }, { "epoch": 0.69, "learning_rate": 1.9770408481896225e-05, "loss": 0.0151, "step": 47810 }, { "epoch": 0.69, "learning_rate": 1.9770360442157755e-05, "loss": 0.0188, "step": 47820 }, { "epoch": 0.69, "learning_rate": 1.9770312402419284e-05, "loss": 0.012, "step": 47830 }, { "epoch": 0.69, "learning_rate": 1.977026436268081e-05, "loss": 0.0284, "step": 47840 }, { "epoch": 0.69, "learning_rate": 1.977021632294234e-05, "loss": 0.0227, "step": 47850 }, { "epoch": 0.69, "learning_rate": 1.977016828320387e-05, "loss": 0.02, "step": 47860 }, { "epoch": 0.69, "learning_rate": 1.9770120243465398e-05, "loss": 0.0203, "step": 47870 }, { "epoch": 0.69, "learning_rate": 1.9770072203726924e-05, "loss": 0.0181, "step": 47880 }, { "epoch": 0.69, "learning_rate": 1.9770024163988453e-05, "loss": 0.0239, "step": 47890 }, { "epoch": 0.69, "learning_rate": 1.9769976124249982e-05, "loss": 0.0207, "step": 47900 }, { "epoch": 0.69, "learning_rate": 1.9769928084511508e-05, "loss": 0.0173, "step": 47910 }, { "epoch": 0.69, "learning_rate": 1.9769880044773037e-05, "loss": 0.0179, "step": 47920 }, { "epoch": 0.69, "learning_rate": 1.9769832005034567e-05, "loss": 0.0181, "step": 47930 }, { "epoch": 0.69, "learning_rate": 1.9769783965296096e-05, "loss": 0.0217, "step": 47940 }, { "epoch": 0.69, "learning_rate": 1.976973592555762e-05, "loss": 0.0238, "step": 47950 }, { "epoch": 0.69, "learning_rate": 1.976968788581915e-05, "loss": 0.0196, "step": 47960 }, { "epoch": 0.69, "learning_rate": 1.976963984608068e-05, "loss": 0.0161, "step": 47970 }, { "epoch": 0.69, "learning_rate": 1.9769591806342206e-05, "loss": 0.0138, "step": 47980 }, { "epoch": 0.69, "learning_rate": 1.9769543766603735e-05, "loss": 0.0233, "step": 47990 }, { "epoch": 0.69, "learning_rate": 1.9769495726865265e-05, "loss": 0.0204, "step": 48000 }, { "epoch": 0.69, "learning_rate": 1.9769447687126794e-05, "loss": 0.0212, "step": 48010 }, { "epoch": 0.69, "learning_rate": 1.976939964738832e-05, "loss": 0.0218, "step": 48020 }, { "epoch": 0.69, "learning_rate": 1.976935160764985e-05, "loss": 0.0189, "step": 48030 }, { "epoch": 0.69, "learning_rate": 1.976930356791138e-05, "loss": 0.0178, "step": 48040 }, { "epoch": 0.69, "learning_rate": 1.9769255528172908e-05, "loss": 0.0142, "step": 48050 }, { "epoch": 0.69, "learning_rate": 1.9769207488434433e-05, "loss": 0.0163, "step": 48060 }, { "epoch": 0.69, "learning_rate": 1.9769159448695963e-05, "loss": 0.0229, "step": 48070 }, { "epoch": 0.69, "learning_rate": 1.9769111408957492e-05, "loss": 0.0177, "step": 48080 }, { "epoch": 0.69, "learning_rate": 1.9769063369219018e-05, "loss": 0.0155, "step": 48090 }, { "epoch": 0.69, "learning_rate": 1.9769015329480547e-05, "loss": 0.0177, "step": 48100 }, { "epoch": 0.69, "learning_rate": 1.9768967289742076e-05, "loss": 0.0196, "step": 48110 }, { "epoch": 0.69, "learning_rate": 1.9768919250003606e-05, "loss": 0.0273, "step": 48120 }, { "epoch": 0.69, "learning_rate": 1.976887121026513e-05, "loss": 0.0178, "step": 48130 }, { "epoch": 0.69, "learning_rate": 1.976882317052666e-05, "loss": 0.0127, "step": 48140 }, { "epoch": 0.69, "learning_rate": 1.976877513078819e-05, "loss": 0.0239, "step": 48150 }, { "epoch": 0.69, "learning_rate": 1.9768727091049716e-05, "loss": 0.0149, "step": 48160 }, { "epoch": 0.69, "learning_rate": 1.9768679051311245e-05, "loss": 0.0181, "step": 48170 }, { "epoch": 0.69, "learning_rate": 1.9768631011572775e-05, "loss": 0.0171, "step": 48180 }, { "epoch": 0.69, "learning_rate": 1.9768582971834304e-05, "loss": 0.0198, "step": 48190 }, { "epoch": 0.69, "learning_rate": 1.976853493209583e-05, "loss": 0.015, "step": 48200 }, { "epoch": 0.69, "learning_rate": 1.976848689235736e-05, "loss": 0.0205, "step": 48210 }, { "epoch": 0.69, "learning_rate": 1.9768438852618888e-05, "loss": 0.021, "step": 48220 }, { "epoch": 0.7, "learning_rate": 1.9768390812880418e-05, "loss": 0.0196, "step": 48230 }, { "epoch": 0.7, "learning_rate": 1.9768342773141943e-05, "loss": 0.0203, "step": 48240 }, { "epoch": 0.7, "learning_rate": 1.9768294733403473e-05, "loss": 0.013, "step": 48250 }, { "epoch": 0.7, "learning_rate": 1.9768246693665002e-05, "loss": 0.0262, "step": 48260 }, { "epoch": 0.7, "learning_rate": 1.9768198653926528e-05, "loss": 0.0195, "step": 48270 }, { "epoch": 0.7, "learning_rate": 1.9768150614188057e-05, "loss": 0.0168, "step": 48280 }, { "epoch": 0.7, "learning_rate": 1.9768102574449586e-05, "loss": 0.0183, "step": 48290 }, { "epoch": 0.7, "learning_rate": 1.9768054534711116e-05, "loss": 0.0202, "step": 48300 }, { "epoch": 0.7, "learning_rate": 1.976800649497264e-05, "loss": 0.0188, "step": 48310 }, { "epoch": 0.7, "learning_rate": 1.976795845523417e-05, "loss": 0.0192, "step": 48320 }, { "epoch": 0.7, "learning_rate": 1.97679104154957e-05, "loss": 0.02, "step": 48330 }, { "epoch": 0.7, "learning_rate": 1.9767862375757226e-05, "loss": 0.0172, "step": 48340 }, { "epoch": 0.7, "learning_rate": 1.9767814336018755e-05, "loss": 0.0192, "step": 48350 }, { "epoch": 0.7, "learning_rate": 1.9767766296280284e-05, "loss": 0.0158, "step": 48360 }, { "epoch": 0.7, "learning_rate": 1.9767718256541814e-05, "loss": 0.0172, "step": 48370 }, { "epoch": 0.7, "learning_rate": 1.976767021680334e-05, "loss": 0.0138, "step": 48380 }, { "epoch": 0.7, "learning_rate": 1.976762217706487e-05, "loss": 0.0151, "step": 48390 }, { "epoch": 0.7, "learning_rate": 1.9767574137326398e-05, "loss": 0.0162, "step": 48400 }, { "epoch": 0.7, "learning_rate": 1.9767526097587924e-05, "loss": 0.02, "step": 48410 }, { "epoch": 0.7, "learning_rate": 1.9767478057849453e-05, "loss": 0.0188, "step": 48420 }, { "epoch": 0.7, "learning_rate": 1.9767430018110983e-05, "loss": 0.0155, "step": 48430 }, { "epoch": 0.7, "learning_rate": 1.9767381978372512e-05, "loss": 0.0178, "step": 48440 }, { "epoch": 0.7, "learning_rate": 1.9767333938634038e-05, "loss": 0.0229, "step": 48450 }, { "epoch": 0.7, "learning_rate": 1.9767285898895567e-05, "loss": 0.016, "step": 48460 }, { "epoch": 0.7, "learning_rate": 1.9767237859157096e-05, "loss": 0.0164, "step": 48470 }, { "epoch": 0.7, "learning_rate": 1.9767189819418626e-05, "loss": 0.0197, "step": 48480 }, { "epoch": 0.7, "learning_rate": 1.976714177968015e-05, "loss": 0.0183, "step": 48490 }, { "epoch": 0.7, "learning_rate": 1.976709373994168e-05, "loss": 0.0155, "step": 48500 }, { "epoch": 0.7, "learning_rate": 1.976704570020321e-05, "loss": 0.0181, "step": 48510 }, { "epoch": 0.7, "learning_rate": 1.9766997660464736e-05, "loss": 0.0196, "step": 48520 }, { "epoch": 0.7, "learning_rate": 1.9766949620726265e-05, "loss": 0.0138, "step": 48530 }, { "epoch": 0.7, "learning_rate": 1.9766901580987794e-05, "loss": 0.0157, "step": 48540 }, { "epoch": 0.7, "learning_rate": 1.9766853541249324e-05, "loss": 0.021, "step": 48550 }, { "epoch": 0.7, "learning_rate": 1.976680550151085e-05, "loss": 0.0148, "step": 48560 }, { "epoch": 0.7, "learning_rate": 1.976675746177238e-05, "loss": 0.0198, "step": 48570 }, { "epoch": 0.7, "learning_rate": 1.9766709422033908e-05, "loss": 0.0179, "step": 48580 }, { "epoch": 0.7, "learning_rate": 1.9766661382295434e-05, "loss": 0.0186, "step": 48590 }, { "epoch": 0.7, "learning_rate": 1.9766613342556963e-05, "loss": 0.0243, "step": 48600 }, { "epoch": 0.7, "learning_rate": 1.9766565302818492e-05, "loss": 0.0198, "step": 48610 }, { "epoch": 0.7, "learning_rate": 1.9766517263080022e-05, "loss": 0.0183, "step": 48620 }, { "epoch": 0.7, "learning_rate": 1.9766469223341548e-05, "loss": 0.021, "step": 48630 }, { "epoch": 0.7, "learning_rate": 1.9766421183603077e-05, "loss": 0.0182, "step": 48640 }, { "epoch": 0.7, "learning_rate": 1.9766373143864606e-05, "loss": 0.0202, "step": 48650 }, { "epoch": 0.7, "learning_rate": 1.9766325104126135e-05, "loss": 0.0156, "step": 48660 }, { "epoch": 0.7, "learning_rate": 1.976627706438766e-05, "loss": 0.0197, "step": 48670 }, { "epoch": 0.7, "learning_rate": 1.976622902464919e-05, "loss": 0.0208, "step": 48680 }, { "epoch": 0.7, "learning_rate": 1.976618098491072e-05, "loss": 0.0132, "step": 48690 }, { "epoch": 0.7, "learning_rate": 1.9766132945172246e-05, "loss": 0.0205, "step": 48700 }, { "epoch": 0.7, "learning_rate": 1.9766084905433775e-05, "loss": 0.0141, "step": 48710 }, { "epoch": 0.7, "learning_rate": 1.9766036865695304e-05, "loss": 0.0178, "step": 48720 }, { "epoch": 0.7, "learning_rate": 1.9765988825956834e-05, "loss": 0.0196, "step": 48730 }, { "epoch": 0.7, "learning_rate": 1.976594078621836e-05, "loss": 0.0191, "step": 48740 }, { "epoch": 0.7, "learning_rate": 1.976589274647989e-05, "loss": 0.0196, "step": 48750 }, { "epoch": 0.7, "learning_rate": 1.9765844706741418e-05, "loss": 0.0125, "step": 48760 }, { "epoch": 0.7, "learning_rate": 1.9765796667002944e-05, "loss": 0.0125, "step": 48770 }, { "epoch": 0.7, "learning_rate": 1.9765748627264473e-05, "loss": 0.0181, "step": 48780 }, { "epoch": 0.7, "learning_rate": 1.9765700587526002e-05, "loss": 0.0199, "step": 48790 }, { "epoch": 0.7, "learning_rate": 1.976565254778753e-05, "loss": 0.023, "step": 48800 }, { "epoch": 0.7, "learning_rate": 1.9765604508049058e-05, "loss": 0.0174, "step": 48810 }, { "epoch": 0.7, "learning_rate": 1.9765556468310587e-05, "loss": 0.0145, "step": 48820 }, { "epoch": 0.7, "learning_rate": 1.9765508428572116e-05, "loss": 0.0157, "step": 48830 }, { "epoch": 0.7, "learning_rate": 1.9765460388833645e-05, "loss": 0.0186, "step": 48840 }, { "epoch": 0.7, "learning_rate": 1.976541234909517e-05, "loss": 0.0183, "step": 48850 }, { "epoch": 0.7, "learning_rate": 1.97653643093567e-05, "loss": 0.0184, "step": 48860 }, { "epoch": 0.7, "learning_rate": 1.976531626961823e-05, "loss": 0.0201, "step": 48870 }, { "epoch": 0.7, "learning_rate": 1.9765268229879756e-05, "loss": 0.0206, "step": 48880 }, { "epoch": 0.7, "learning_rate": 1.9765220190141285e-05, "loss": 0.0158, "step": 48890 }, { "epoch": 0.7, "learning_rate": 1.9765172150402814e-05, "loss": 0.018, "step": 48900 }, { "epoch": 0.7, "learning_rate": 1.9765124110664343e-05, "loss": 0.0146, "step": 48910 }, { "epoch": 0.71, "learning_rate": 1.976507607092587e-05, "loss": 0.0191, "step": 48920 }, { "epoch": 0.71, "learning_rate": 1.97650280311874e-05, "loss": 0.0193, "step": 48930 }, { "epoch": 0.71, "learning_rate": 1.9764979991448928e-05, "loss": 0.0186, "step": 48940 }, { "epoch": 0.71, "learning_rate": 1.9764931951710454e-05, "loss": 0.0168, "step": 48950 }, { "epoch": 0.71, "learning_rate": 1.9764883911971983e-05, "loss": 0.0157, "step": 48960 }, { "epoch": 0.71, "learning_rate": 1.9764835872233512e-05, "loss": 0.018, "step": 48970 }, { "epoch": 0.71, "learning_rate": 1.976478783249504e-05, "loss": 0.0325, "step": 48980 }, { "epoch": 0.71, "learning_rate": 1.976473979275657e-05, "loss": 0.0209, "step": 48990 }, { "epoch": 0.71, "learning_rate": 1.97646917530181e-05, "loss": 0.0174, "step": 49000 }, { "epoch": 0.71, "learning_rate": 1.9764643713279626e-05, "loss": 0.0184, "step": 49010 }, { "epoch": 0.71, "learning_rate": 1.9764595673541155e-05, "loss": 0.018, "step": 49020 }, { "epoch": 0.71, "learning_rate": 1.9764547633802685e-05, "loss": 0.0207, "step": 49030 }, { "epoch": 0.71, "learning_rate": 1.9764499594064214e-05, "loss": 0.02, "step": 49040 }, { "epoch": 0.71, "learning_rate": 1.976445155432574e-05, "loss": 0.0233, "step": 49050 }, { "epoch": 0.71, "learning_rate": 1.976440351458727e-05, "loss": 0.0198, "step": 49060 }, { "epoch": 0.71, "learning_rate": 1.9764355474848798e-05, "loss": 0.0239, "step": 49070 }, { "epoch": 0.71, "learning_rate": 1.9764307435110328e-05, "loss": 0.0168, "step": 49080 }, { "epoch": 0.71, "learning_rate": 1.9764259395371853e-05, "loss": 0.0245, "step": 49090 }, { "epoch": 0.71, "learning_rate": 1.9764211355633383e-05, "loss": 0.0203, "step": 49100 }, { "epoch": 0.71, "learning_rate": 1.9764163315894912e-05, "loss": 0.0173, "step": 49110 }, { "epoch": 0.71, "learning_rate": 1.9764115276156438e-05, "loss": 0.0189, "step": 49120 }, { "epoch": 0.71, "learning_rate": 1.9764067236417967e-05, "loss": 0.0166, "step": 49130 }, { "epoch": 0.71, "learning_rate": 1.9764019196679496e-05, "loss": 0.0144, "step": 49140 }, { "epoch": 0.71, "learning_rate": 1.9763971156941026e-05, "loss": 0.0184, "step": 49150 }, { "epoch": 0.71, "learning_rate": 1.976392311720255e-05, "loss": 0.0222, "step": 49160 }, { "epoch": 0.71, "learning_rate": 1.976387507746408e-05, "loss": 0.0173, "step": 49170 }, { "epoch": 0.71, "learning_rate": 1.976382703772561e-05, "loss": 0.0239, "step": 49180 }, { "epoch": 0.71, "learning_rate": 1.9763778997987136e-05, "loss": 0.0183, "step": 49190 }, { "epoch": 0.71, "learning_rate": 1.9763730958248665e-05, "loss": 0.0185, "step": 49200 }, { "epoch": 0.71, "learning_rate": 1.9763682918510194e-05, "loss": 0.0177, "step": 49210 }, { "epoch": 0.71, "learning_rate": 1.9763634878771724e-05, "loss": 0.0163, "step": 49220 }, { "epoch": 0.71, "learning_rate": 1.976358683903325e-05, "loss": 0.0166, "step": 49230 }, { "epoch": 0.71, "learning_rate": 1.976353879929478e-05, "loss": 0.0154, "step": 49240 }, { "epoch": 0.71, "learning_rate": 1.9763490759556308e-05, "loss": 0.0236, "step": 49250 }, { "epoch": 0.71, "learning_rate": 1.9763442719817837e-05, "loss": 0.0159, "step": 49260 }, { "epoch": 0.71, "learning_rate": 1.9763394680079363e-05, "loss": 0.0178, "step": 49270 }, { "epoch": 0.71, "learning_rate": 1.9763346640340893e-05, "loss": 0.0217, "step": 49280 }, { "epoch": 0.71, "learning_rate": 1.9763298600602422e-05, "loss": 0.0188, "step": 49290 }, { "epoch": 0.71, "learning_rate": 1.9763250560863948e-05, "loss": 0.0204, "step": 49300 }, { "epoch": 0.71, "learning_rate": 1.9763202521125477e-05, "loss": 0.0191, "step": 49310 }, { "epoch": 0.71, "learning_rate": 1.9763154481387006e-05, "loss": 0.0156, "step": 49320 }, { "epoch": 0.71, "learning_rate": 1.9763106441648536e-05, "loss": 0.0188, "step": 49330 }, { "epoch": 0.71, "learning_rate": 1.976305840191006e-05, "loss": 0.0138, "step": 49340 }, { "epoch": 0.71, "learning_rate": 1.976301036217159e-05, "loss": 0.0178, "step": 49350 }, { "epoch": 0.71, "learning_rate": 1.976296232243312e-05, "loss": 0.0175, "step": 49360 }, { "epoch": 0.71, "learning_rate": 1.9762914282694646e-05, "loss": 0.0128, "step": 49370 }, { "epoch": 0.71, "learning_rate": 1.9762866242956175e-05, "loss": 0.0188, "step": 49380 }, { "epoch": 0.71, "learning_rate": 1.9762818203217704e-05, "loss": 0.0217, "step": 49390 }, { "epoch": 0.71, "learning_rate": 1.9762770163479234e-05, "loss": 0.0175, "step": 49400 }, { "epoch": 0.71, "learning_rate": 1.976272212374076e-05, "loss": 0.0214, "step": 49410 }, { "epoch": 0.71, "learning_rate": 1.976267408400229e-05, "loss": 0.0187, "step": 49420 }, { "epoch": 0.71, "learning_rate": 1.9762626044263818e-05, "loss": 0.0153, "step": 49430 }, { "epoch": 0.71, "learning_rate": 1.9762578004525347e-05, "loss": 0.0192, "step": 49440 }, { "epoch": 0.71, "learning_rate": 1.9762529964786873e-05, "loss": 0.0189, "step": 49450 }, { "epoch": 0.71, "learning_rate": 1.9762481925048402e-05, "loss": 0.0157, "step": 49460 }, { "epoch": 0.71, "learning_rate": 1.9762433885309932e-05, "loss": 0.0176, "step": 49470 }, { "epoch": 0.71, "learning_rate": 1.9762385845571458e-05, "loss": 0.0191, "step": 49480 }, { "epoch": 0.71, "learning_rate": 1.9762337805832987e-05, "loss": 0.0156, "step": 49490 }, { "epoch": 0.71, "learning_rate": 1.9762289766094516e-05, "loss": 0.0167, "step": 49500 }, { "epoch": 0.71, "learning_rate": 1.9762241726356045e-05, "loss": 0.0171, "step": 49510 }, { "epoch": 0.71, "learning_rate": 1.976219368661757e-05, "loss": 0.0169, "step": 49520 }, { "epoch": 0.71, "learning_rate": 1.97621456468791e-05, "loss": 0.0131, "step": 49530 }, { "epoch": 0.71, "learning_rate": 1.976209760714063e-05, "loss": 0.0215, "step": 49540 }, { "epoch": 0.71, "learning_rate": 1.9762054371376005e-05, "loss": 0.0205, "step": 49550 }, { "epoch": 0.71, "learning_rate": 1.9762006331637534e-05, "loss": 0.019, "step": 49560 }, { "epoch": 0.71, "learning_rate": 1.9761958291899063e-05, "loss": 0.0164, "step": 49570 }, { "epoch": 0.71, "learning_rate": 1.976191025216059e-05, "loss": 0.0175, "step": 49580 }, { "epoch": 0.71, "learning_rate": 1.9761862212422118e-05, "loss": 0.0162, "step": 49590 }, { "epoch": 0.71, "learning_rate": 1.9761814172683647e-05, "loss": 0.0169, "step": 49600 }, { "epoch": 0.71, "learning_rate": 1.9761766132945173e-05, "loss": 0.0154, "step": 49610 }, { "epoch": 0.72, "learning_rate": 1.9761718093206703e-05, "loss": 0.0178, "step": 49620 }, { "epoch": 0.72, "learning_rate": 1.9761670053468232e-05, "loss": 0.0151, "step": 49630 }, { "epoch": 0.72, "learning_rate": 1.976162201372976e-05, "loss": 0.0181, "step": 49640 }, { "epoch": 0.72, "learning_rate": 1.9761573973991287e-05, "loss": 0.0137, "step": 49650 }, { "epoch": 0.72, "learning_rate": 1.9761525934252816e-05, "loss": 0.0179, "step": 49660 }, { "epoch": 0.72, "learning_rate": 1.9761477894514346e-05, "loss": 0.0172, "step": 49670 }, { "epoch": 0.72, "learning_rate": 1.976142985477587e-05, "loss": 0.0119, "step": 49680 }, { "epoch": 0.72, "learning_rate": 1.97613818150374e-05, "loss": 0.0168, "step": 49690 }, { "epoch": 0.72, "learning_rate": 1.976133377529893e-05, "loss": 0.0179, "step": 49700 }, { "epoch": 0.72, "learning_rate": 1.976128573556046e-05, "loss": 0.014, "step": 49710 }, { "epoch": 0.72, "learning_rate": 1.9761237695821985e-05, "loss": 0.0182, "step": 49720 }, { "epoch": 0.72, "learning_rate": 1.9761189656083514e-05, "loss": 0.0206, "step": 49730 }, { "epoch": 0.72, "learning_rate": 1.9761141616345044e-05, "loss": 0.0178, "step": 49740 }, { "epoch": 0.72, "learning_rate": 1.9761093576606573e-05, "loss": 0.0121, "step": 49750 }, { "epoch": 0.72, "learning_rate": 1.97610455368681e-05, "loss": 0.0201, "step": 49760 }, { "epoch": 0.72, "learning_rate": 1.9760997497129628e-05, "loss": 0.0236, "step": 49770 }, { "epoch": 0.72, "learning_rate": 1.9760949457391157e-05, "loss": 0.0174, "step": 49780 }, { "epoch": 0.72, "learning_rate": 1.9760901417652683e-05, "loss": 0.0218, "step": 49790 }, { "epoch": 0.72, "learning_rate": 1.9760853377914213e-05, "loss": 0.0199, "step": 49800 }, { "epoch": 0.72, "learning_rate": 1.9760805338175742e-05, "loss": 0.0127, "step": 49810 }, { "epoch": 0.72, "learning_rate": 1.976075729843727e-05, "loss": 0.0217, "step": 49820 }, { "epoch": 0.72, "learning_rate": 1.9760709258698797e-05, "loss": 0.0159, "step": 49830 }, { "epoch": 0.72, "learning_rate": 1.9760661218960326e-05, "loss": 0.014, "step": 49840 }, { "epoch": 0.72, "learning_rate": 1.9760613179221856e-05, "loss": 0.0148, "step": 49850 }, { "epoch": 0.72, "learning_rate": 1.976056513948338e-05, "loss": 0.022, "step": 49860 }, { "epoch": 0.72, "learning_rate": 1.976051709974491e-05, "loss": 0.0201, "step": 49870 }, { "epoch": 0.72, "learning_rate": 1.976046906000644e-05, "loss": 0.0194, "step": 49880 }, { "epoch": 0.72, "learning_rate": 1.976042102026797e-05, "loss": 0.0238, "step": 49890 }, { "epoch": 0.72, "learning_rate": 1.9760372980529495e-05, "loss": 0.0129, "step": 49900 }, { "epoch": 0.72, "learning_rate": 1.9760324940791024e-05, "loss": 0.0133, "step": 49910 }, { "epoch": 0.72, "learning_rate": 1.9760276901052554e-05, "loss": 0.0184, "step": 49920 }, { "epoch": 0.72, "learning_rate": 1.9760228861314083e-05, "loss": 0.0163, "step": 49930 }, { "epoch": 0.72, "learning_rate": 1.976018082157561e-05, "loss": 0.0114, "step": 49940 }, { "epoch": 0.72, "learning_rate": 1.9760132781837138e-05, "loss": 0.0166, "step": 49950 }, { "epoch": 0.72, "learning_rate": 1.9760084742098667e-05, "loss": 0.0201, "step": 49960 }, { "epoch": 0.72, "learning_rate": 1.9760036702360193e-05, "loss": 0.021, "step": 49970 }, { "epoch": 0.72, "learning_rate": 1.9759988662621722e-05, "loss": 0.0218, "step": 49980 }, { "epoch": 0.72, "learning_rate": 1.9759940622883252e-05, "loss": 0.0165, "step": 49990 }, { "epoch": 0.72, "learning_rate": 1.975989258314478e-05, "loss": 0.0235, "step": 50000 }, { "epoch": 0.72, "learning_rate": 1.9759844543406307e-05, "loss": 0.0189, "step": 50010 }, { "epoch": 0.72, "learning_rate": 1.9759796503667836e-05, "loss": 0.0217, "step": 50020 }, { "epoch": 0.72, "learning_rate": 1.9759748463929365e-05, "loss": 0.0179, "step": 50030 }, { "epoch": 0.72, "learning_rate": 1.975970042419089e-05, "loss": 0.0191, "step": 50040 }, { "epoch": 0.72, "learning_rate": 1.975965238445242e-05, "loss": 0.0177, "step": 50050 }, { "epoch": 0.72, "learning_rate": 1.975960434471395e-05, "loss": 0.0151, "step": 50060 }, { "epoch": 0.72, "learning_rate": 1.975955630497548e-05, "loss": 0.022, "step": 50070 }, { "epoch": 0.72, "learning_rate": 1.9759508265237005e-05, "loss": 0.0181, "step": 50080 }, { "epoch": 0.72, "learning_rate": 1.9759460225498534e-05, "loss": 0.0203, "step": 50090 }, { "epoch": 0.72, "learning_rate": 1.9759412185760064e-05, "loss": 0.0171, "step": 50100 }, { "epoch": 0.72, "learning_rate": 1.9759364146021593e-05, "loss": 0.0187, "step": 50110 }, { "epoch": 0.72, "learning_rate": 1.975931610628312e-05, "loss": 0.0194, "step": 50120 }, { "epoch": 0.72, "learning_rate": 1.9759268066544648e-05, "loss": 0.0165, "step": 50130 }, { "epoch": 0.72, "learning_rate": 1.9759220026806177e-05, "loss": 0.0152, "step": 50140 }, { "epoch": 0.72, "learning_rate": 1.9759171987067703e-05, "loss": 0.0132, "step": 50150 }, { "epoch": 0.72, "learning_rate": 1.9759123947329232e-05, "loss": 0.0223, "step": 50160 }, { "epoch": 0.72, "learning_rate": 1.975907590759076e-05, "loss": 0.0162, "step": 50170 }, { "epoch": 0.72, "learning_rate": 1.975902786785229e-05, "loss": 0.019, "step": 50180 }, { "epoch": 0.72, "learning_rate": 1.9758979828113817e-05, "loss": 0.0206, "step": 50190 }, { "epoch": 0.72, "learning_rate": 1.9758931788375346e-05, "loss": 0.0168, "step": 50200 }, { "epoch": 0.72, "learning_rate": 1.9758883748636875e-05, "loss": 0.0199, "step": 50210 }, { "epoch": 0.72, "learning_rate": 1.97588357088984e-05, "loss": 0.0212, "step": 50220 }, { "epoch": 0.72, "learning_rate": 1.975878766915993e-05, "loss": 0.0224, "step": 50230 }, { "epoch": 0.72, "learning_rate": 1.975873962942146e-05, "loss": 0.0208, "step": 50240 }, { "epoch": 0.72, "learning_rate": 1.975869158968299e-05, "loss": 0.0192, "step": 50250 }, { "epoch": 0.72, "learning_rate": 1.9758643549944515e-05, "loss": 0.0157, "step": 50260 }, { "epoch": 0.72, "learning_rate": 1.9758595510206044e-05, "loss": 0.0195, "step": 50270 }, { "epoch": 0.72, "learning_rate": 1.9758547470467573e-05, "loss": 0.0154, "step": 50280 }, { "epoch": 0.72, "learning_rate": 1.9758499430729103e-05, "loss": 0.0181, "step": 50290 }, { "epoch": 0.72, "learning_rate": 1.975845139099063e-05, "loss": 0.0139, "step": 50300 }, { "epoch": 0.73, "learning_rate": 1.9758403351252158e-05, "loss": 0.0166, "step": 50310 }, { "epoch": 0.73, "learning_rate": 1.9758355311513687e-05, "loss": 0.0188, "step": 50320 }, { "epoch": 0.73, "learning_rate": 1.9758307271775213e-05, "loss": 0.0123, "step": 50330 }, { "epoch": 0.73, "learning_rate": 1.9758259232036742e-05, "loss": 0.016, "step": 50340 }, { "epoch": 0.73, "learning_rate": 1.975821119229827e-05, "loss": 0.0171, "step": 50350 }, { "epoch": 0.73, "learning_rate": 1.97581631525598e-05, "loss": 0.0242, "step": 50360 }, { "epoch": 0.73, "learning_rate": 1.9758115112821327e-05, "loss": 0.0161, "step": 50370 }, { "epoch": 0.73, "learning_rate": 1.9758067073082856e-05, "loss": 0.016, "step": 50380 }, { "epoch": 0.73, "learning_rate": 1.9758019033344385e-05, "loss": 0.0131, "step": 50390 }, { "epoch": 0.73, "learning_rate": 1.975797099360591e-05, "loss": 0.0169, "step": 50400 }, { "epoch": 0.73, "learning_rate": 1.975792295386744e-05, "loss": 0.0159, "step": 50410 }, { "epoch": 0.73, "learning_rate": 1.975787491412897e-05, "loss": 0.0156, "step": 50420 }, { "epoch": 0.73, "learning_rate": 1.97578268743905e-05, "loss": 0.0187, "step": 50430 }, { "epoch": 0.73, "learning_rate": 1.9757778834652025e-05, "loss": 0.0183, "step": 50440 }, { "epoch": 0.73, "learning_rate": 1.9757730794913554e-05, "loss": 0.0153, "step": 50450 }, { "epoch": 0.73, "learning_rate": 1.9757682755175083e-05, "loss": 0.0175, "step": 50460 }, { "epoch": 0.73, "learning_rate": 1.9757634715436613e-05, "loss": 0.0187, "step": 50470 }, { "epoch": 0.73, "learning_rate": 1.975758667569814e-05, "loss": 0.0156, "step": 50480 }, { "epoch": 0.73, "learning_rate": 1.9757538635959668e-05, "loss": 0.0168, "step": 50490 }, { "epoch": 0.73, "learning_rate": 1.9757490596221197e-05, "loss": 0.015, "step": 50500 }, { "epoch": 0.73, "learning_rate": 1.9757442556482723e-05, "loss": 0.017, "step": 50510 }, { "epoch": 0.73, "learning_rate": 1.9757394516744252e-05, "loss": 0.0144, "step": 50520 }, { "epoch": 0.73, "learning_rate": 1.975734647700578e-05, "loss": 0.0195, "step": 50530 }, { "epoch": 0.73, "learning_rate": 1.975729843726731e-05, "loss": 0.0134, "step": 50540 }, { "epoch": 0.73, "learning_rate": 1.9757250397528837e-05, "loss": 0.019, "step": 50550 }, { "epoch": 0.73, "learning_rate": 1.9757202357790366e-05, "loss": 0.0189, "step": 50560 }, { "epoch": 0.73, "learning_rate": 1.9757154318051895e-05, "loss": 0.0186, "step": 50570 }, { "epoch": 0.73, "learning_rate": 1.975710627831342e-05, "loss": 0.0182, "step": 50580 }, { "epoch": 0.73, "learning_rate": 1.975705823857495e-05, "loss": 0.016, "step": 50590 }, { "epoch": 0.73, "learning_rate": 1.975701019883648e-05, "loss": 0.019, "step": 50600 }, { "epoch": 0.73, "learning_rate": 1.975696215909801e-05, "loss": 0.0186, "step": 50610 }, { "epoch": 0.73, "learning_rate": 1.9756914119359535e-05, "loss": 0.0166, "step": 50620 }, { "epoch": 0.73, "learning_rate": 1.9756866079621064e-05, "loss": 0.019, "step": 50630 }, { "epoch": 0.73, "learning_rate": 1.9756818039882593e-05, "loss": 0.0125, "step": 50640 }, { "epoch": 0.73, "learning_rate": 1.9756770000144123e-05, "loss": 0.0133, "step": 50650 }, { "epoch": 0.73, "learning_rate": 1.975672196040565e-05, "loss": 0.0234, "step": 50660 }, { "epoch": 0.73, "learning_rate": 1.9756673920667178e-05, "loss": 0.0203, "step": 50670 }, { "epoch": 0.73, "learning_rate": 1.9756625880928707e-05, "loss": 0.0173, "step": 50680 }, { "epoch": 0.73, "learning_rate": 1.9756577841190233e-05, "loss": 0.0173, "step": 50690 }, { "epoch": 0.73, "learning_rate": 1.9756529801451762e-05, "loss": 0.024, "step": 50700 }, { "epoch": 0.73, "learning_rate": 1.975648176171329e-05, "loss": 0.0179, "step": 50710 }, { "epoch": 0.73, "learning_rate": 1.975643372197482e-05, "loss": 0.016, "step": 50720 }, { "epoch": 0.73, "learning_rate": 1.9756385682236347e-05, "loss": 0.0212, "step": 50730 }, { "epoch": 0.73, "learning_rate": 1.9756337642497876e-05, "loss": 0.0155, "step": 50740 }, { "epoch": 0.73, "learning_rate": 1.9756289602759405e-05, "loss": 0.0199, "step": 50750 }, { "epoch": 0.73, "learning_rate": 1.975624156302093e-05, "loss": 0.0192, "step": 50760 }, { "epoch": 0.73, "learning_rate": 1.975619352328246e-05, "loss": 0.0229, "step": 50770 }, { "epoch": 0.73, "learning_rate": 1.975614548354399e-05, "loss": 0.0177, "step": 50780 }, { "epoch": 0.73, "learning_rate": 1.975609744380552e-05, "loss": 0.0197, "step": 50790 }, { "epoch": 0.73, "learning_rate": 1.9756049404067045e-05, "loss": 0.0159, "step": 50800 }, { "epoch": 0.73, "learning_rate": 1.9756001364328574e-05, "loss": 0.0166, "step": 50810 }, { "epoch": 0.73, "learning_rate": 1.9755953324590103e-05, "loss": 0.0183, "step": 50820 }, { "epoch": 0.73, "learning_rate": 1.9755905284851632e-05, "loss": 0.0166, "step": 50830 }, { "epoch": 0.73, "learning_rate": 1.975585724511316e-05, "loss": 0.0134, "step": 50840 }, { "epoch": 0.73, "learning_rate": 1.9755809205374688e-05, "loss": 0.0251, "step": 50850 }, { "epoch": 0.73, "learning_rate": 1.9755761165636217e-05, "loss": 0.0142, "step": 50860 }, { "epoch": 0.73, "learning_rate": 1.9755713125897743e-05, "loss": 0.0173, "step": 50870 }, { "epoch": 0.73, "learning_rate": 1.9755665086159272e-05, "loss": 0.0215, "step": 50880 }, { "epoch": 0.73, "learning_rate": 1.97556170464208e-05, "loss": 0.0167, "step": 50890 }, { "epoch": 0.73, "learning_rate": 1.975556900668233e-05, "loss": 0.0204, "step": 50900 }, { "epoch": 0.73, "learning_rate": 1.9755520966943856e-05, "loss": 0.0172, "step": 50910 }, { "epoch": 0.73, "learning_rate": 1.9755472927205386e-05, "loss": 0.0195, "step": 50920 }, { "epoch": 0.73, "learning_rate": 1.9755424887466915e-05, "loss": 0.0162, "step": 50930 }, { "epoch": 0.73, "learning_rate": 1.975537684772844e-05, "loss": 0.0171, "step": 50940 }, { "epoch": 0.73, "learning_rate": 1.975532880798997e-05, "loss": 0.0207, "step": 50950 }, { "epoch": 0.73, "learning_rate": 1.97552807682515e-05, "loss": 0.0147, "step": 50960 }, { "epoch": 0.73, "learning_rate": 1.975523272851303e-05, "loss": 0.0159, "step": 50970 }, { "epoch": 0.73, "learning_rate": 1.9755184688774555e-05, "loss": 0.0154, "step": 50980 }, { "epoch": 0.73, "learning_rate": 1.9755136649036084e-05, "loss": 0.0192, "step": 50990 }, { "epoch": 0.74, "learning_rate": 1.9755088609297613e-05, "loss": 0.0145, "step": 51000 }, { "epoch": 0.74, "learning_rate": 1.9755040569559142e-05, "loss": 0.0187, "step": 51010 }, { "epoch": 0.74, "learning_rate": 1.9754992529820668e-05, "loss": 0.0151, "step": 51020 }, { "epoch": 0.74, "learning_rate": 1.9754944490082198e-05, "loss": 0.0276, "step": 51030 }, { "epoch": 0.74, "learning_rate": 1.9754896450343727e-05, "loss": 0.0169, "step": 51040 }, { "epoch": 0.74, "learning_rate": 1.9754848410605253e-05, "loss": 0.0188, "step": 51050 }, { "epoch": 0.74, "learning_rate": 1.9754800370866782e-05, "loss": 0.0143, "step": 51060 }, { "epoch": 0.74, "learning_rate": 1.975475233112831e-05, "loss": 0.0121, "step": 51070 }, { "epoch": 0.74, "learning_rate": 1.975470429138984e-05, "loss": 0.0193, "step": 51080 }, { "epoch": 0.74, "learning_rate": 1.9754656251651366e-05, "loss": 0.0138, "step": 51090 }, { "epoch": 0.74, "learning_rate": 1.9754608211912896e-05, "loss": 0.0174, "step": 51100 }, { "epoch": 0.74, "learning_rate": 1.9754560172174425e-05, "loss": 0.0141, "step": 51110 }, { "epoch": 0.74, "learning_rate": 1.975451213243595e-05, "loss": 0.017, "step": 51120 }, { "epoch": 0.74, "learning_rate": 1.975446409269748e-05, "loss": 0.0163, "step": 51130 }, { "epoch": 0.74, "learning_rate": 1.975441605295901e-05, "loss": 0.0183, "step": 51140 }, { "epoch": 0.74, "learning_rate": 1.975436801322054e-05, "loss": 0.0182, "step": 51150 }, { "epoch": 0.74, "learning_rate": 1.9754319973482064e-05, "loss": 0.0168, "step": 51160 }, { "epoch": 0.74, "learning_rate": 1.9754271933743594e-05, "loss": 0.0188, "step": 51170 }, { "epoch": 0.74, "learning_rate": 1.9754223894005123e-05, "loss": 0.0124, "step": 51180 }, { "epoch": 0.74, "learning_rate": 1.9754175854266652e-05, "loss": 0.0188, "step": 51190 }, { "epoch": 0.74, "learning_rate": 1.9754127814528178e-05, "loss": 0.0234, "step": 51200 }, { "epoch": 0.74, "learning_rate": 1.9754079774789707e-05, "loss": 0.0178, "step": 51210 }, { "epoch": 0.74, "learning_rate": 1.9754031735051237e-05, "loss": 0.0165, "step": 51220 }, { "epoch": 0.74, "learning_rate": 1.9753983695312763e-05, "loss": 0.0187, "step": 51230 }, { "epoch": 0.74, "learning_rate": 1.9753935655574292e-05, "loss": 0.0134, "step": 51240 }, { "epoch": 0.74, "learning_rate": 1.975388761583582e-05, "loss": 0.0218, "step": 51250 }, { "epoch": 0.74, "learning_rate": 1.975383957609735e-05, "loss": 0.0178, "step": 51260 }, { "epoch": 0.74, "learning_rate": 1.9753791536358876e-05, "loss": 0.0159, "step": 51270 }, { "epoch": 0.74, "learning_rate": 1.9753743496620406e-05, "loss": 0.0217, "step": 51280 }, { "epoch": 0.74, "learning_rate": 1.9753695456881935e-05, "loss": 0.0235, "step": 51290 }, { "epoch": 0.74, "learning_rate": 1.975364741714346e-05, "loss": 0.0201, "step": 51300 }, { "epoch": 0.74, "learning_rate": 1.975359937740499e-05, "loss": 0.0151, "step": 51310 }, { "epoch": 0.74, "learning_rate": 1.975355133766652e-05, "loss": 0.0222, "step": 51320 }, { "epoch": 0.74, "learning_rate": 1.975350329792805e-05, "loss": 0.0195, "step": 51330 }, { "epoch": 0.74, "learning_rate": 1.9753455258189574e-05, "loss": 0.0193, "step": 51340 }, { "epoch": 0.74, "learning_rate": 1.9753407218451104e-05, "loss": 0.0252, "step": 51350 }, { "epoch": 0.74, "learning_rate": 1.9753359178712633e-05, "loss": 0.0147, "step": 51360 }, { "epoch": 0.74, "learning_rate": 1.9753311138974162e-05, "loss": 0.0202, "step": 51370 }, { "epoch": 0.74, "learning_rate": 1.9753263099235688e-05, "loss": 0.0159, "step": 51380 }, { "epoch": 0.74, "learning_rate": 1.9753215059497217e-05, "loss": 0.0164, "step": 51390 }, { "epoch": 0.74, "learning_rate": 1.9753167019758747e-05, "loss": 0.0193, "step": 51400 }, { "epoch": 0.74, "learning_rate": 1.9753118980020273e-05, "loss": 0.0183, "step": 51410 }, { "epoch": 0.74, "learning_rate": 1.9753070940281802e-05, "loss": 0.0183, "step": 51420 }, { "epoch": 0.74, "learning_rate": 1.975302290054333e-05, "loss": 0.0174, "step": 51430 }, { "epoch": 0.74, "learning_rate": 1.975297486080486e-05, "loss": 0.0162, "step": 51440 }, { "epoch": 0.74, "learning_rate": 1.9752926821066386e-05, "loss": 0.0153, "step": 51450 }, { "epoch": 0.74, "learning_rate": 1.9752878781327915e-05, "loss": 0.0175, "step": 51460 }, { "epoch": 0.74, "learning_rate": 1.9752830741589445e-05, "loss": 0.0191, "step": 51470 }, { "epoch": 0.74, "learning_rate": 1.975278270185097e-05, "loss": 0.0204, "step": 51480 }, { "epoch": 0.74, "learning_rate": 1.97527346621125e-05, "loss": 0.021, "step": 51490 }, { "epoch": 0.74, "learning_rate": 1.975268662237403e-05, "loss": 0.0148, "step": 51500 }, { "epoch": 0.74, "learning_rate": 1.975263858263556e-05, "loss": 0.0161, "step": 51510 }, { "epoch": 0.74, "learning_rate": 1.9752590542897084e-05, "loss": 0.0191, "step": 51520 }, { "epoch": 0.74, "learning_rate": 1.9752542503158614e-05, "loss": 0.0188, "step": 51530 }, { "epoch": 0.74, "learning_rate": 1.9752494463420143e-05, "loss": 0.0189, "step": 51540 }, { "epoch": 0.74, "learning_rate": 1.975244642368167e-05, "loss": 0.0199, "step": 51550 }, { "epoch": 0.74, "learning_rate": 1.9752398383943198e-05, "loss": 0.0189, "step": 51560 }, { "epoch": 0.74, "learning_rate": 1.9752350344204727e-05, "loss": 0.0192, "step": 51570 }, { "epoch": 0.74, "learning_rate": 1.9752302304466257e-05, "loss": 0.0158, "step": 51580 }, { "epoch": 0.74, "learning_rate": 1.9752254264727782e-05, "loss": 0.0177, "step": 51590 }, { "epoch": 0.74, "learning_rate": 1.9752206224989312e-05, "loss": 0.0181, "step": 51600 }, { "epoch": 0.74, "learning_rate": 1.975215818525084e-05, "loss": 0.0142, "step": 51610 }, { "epoch": 0.74, "learning_rate": 1.975211014551237e-05, "loss": 0.0125, "step": 51620 }, { "epoch": 0.74, "learning_rate": 1.9752062105773896e-05, "loss": 0.0208, "step": 51630 }, { "epoch": 0.74, "learning_rate": 1.9752014066035425e-05, "loss": 0.014, "step": 51640 }, { "epoch": 0.74, "learning_rate": 1.9751966026296955e-05, "loss": 0.0185, "step": 51650 }, { "epoch": 0.74, "learning_rate": 1.975191798655848e-05, "loss": 0.0202, "step": 51660 }, { "epoch": 0.74, "learning_rate": 1.975186994682001e-05, "loss": 0.0167, "step": 51670 }, { "epoch": 0.74, "learning_rate": 1.975182190708154e-05, "loss": 0.0192, "step": 51680 }, { "epoch": 0.74, "learning_rate": 1.975177386734307e-05, "loss": 0.0163, "step": 51690 }, { "epoch": 0.75, "learning_rate": 1.9751725827604594e-05, "loss": 0.0143, "step": 51700 }, { "epoch": 0.75, "learning_rate": 1.9751677787866124e-05, "loss": 0.0293, "step": 51710 }, { "epoch": 0.75, "learning_rate": 1.9751629748127653e-05, "loss": 0.0179, "step": 51720 }, { "epoch": 0.75, "learning_rate": 1.975158170838918e-05, "loss": 0.0193, "step": 51730 }, { "epoch": 0.75, "learning_rate": 1.9751533668650708e-05, "loss": 0.0213, "step": 51740 }, { "epoch": 0.75, "learning_rate": 1.9751485628912237e-05, "loss": 0.0158, "step": 51750 }, { "epoch": 0.75, "learning_rate": 1.9751437589173766e-05, "loss": 0.0166, "step": 51760 }, { "epoch": 0.75, "learning_rate": 1.9751389549435292e-05, "loss": 0.0181, "step": 51770 }, { "epoch": 0.75, "learning_rate": 1.975134150969682e-05, "loss": 0.0212, "step": 51780 }, { "epoch": 0.75, "learning_rate": 1.975129346995835e-05, "loss": 0.0128, "step": 51790 }, { "epoch": 0.75, "learning_rate": 1.975124543021988e-05, "loss": 0.0152, "step": 51800 }, { "epoch": 0.75, "learning_rate": 1.9751197390481406e-05, "loss": 0.0156, "step": 51810 }, { "epoch": 0.75, "learning_rate": 1.9751149350742935e-05, "loss": 0.0223, "step": 51820 }, { "epoch": 0.75, "learning_rate": 1.9751101311004465e-05, "loss": 0.0134, "step": 51830 }, { "epoch": 0.75, "learning_rate": 1.975105327126599e-05, "loss": 0.0206, "step": 51840 }, { "epoch": 0.75, "learning_rate": 1.975100523152752e-05, "loss": 0.0126, "step": 51850 }, { "epoch": 0.75, "learning_rate": 1.975095719178905e-05, "loss": 0.017, "step": 51860 }, { "epoch": 0.75, "learning_rate": 1.9750913956024424e-05, "loss": 0.0358, "step": 51870 }, { "epoch": 0.75, "learning_rate": 1.9750865916285953e-05, "loss": 0.0227, "step": 51880 }, { "epoch": 0.75, "learning_rate": 1.9750817876547482e-05, "loss": 0.0158, "step": 51890 }, { "epoch": 0.75, "learning_rate": 1.9750769836809008e-05, "loss": 0.0179, "step": 51900 }, { "epoch": 0.75, "learning_rate": 1.9750721797070537e-05, "loss": 0.015, "step": 51910 }, { "epoch": 0.75, "learning_rate": 1.9750673757332067e-05, "loss": 0.0179, "step": 51920 }, { "epoch": 0.75, "learning_rate": 1.9750625717593596e-05, "loss": 0.0151, "step": 51930 }, { "epoch": 0.75, "learning_rate": 1.9750577677855122e-05, "loss": 0.0199, "step": 51940 }, { "epoch": 0.75, "learning_rate": 1.975052963811665e-05, "loss": 0.0142, "step": 51950 }, { "epoch": 0.75, "learning_rate": 1.975048159837818e-05, "loss": 0.0188, "step": 51960 }, { "epoch": 0.75, "learning_rate": 1.9750433558639706e-05, "loss": 0.0159, "step": 51970 }, { "epoch": 0.75, "learning_rate": 1.9750385518901235e-05, "loss": 0.0172, "step": 51980 }, { "epoch": 0.75, "learning_rate": 1.9750337479162765e-05, "loss": 0.0158, "step": 51990 }, { "epoch": 0.75, "learning_rate": 1.9750289439424294e-05, "loss": 0.0218, "step": 52000 }, { "epoch": 0.75, "learning_rate": 1.975024139968582e-05, "loss": 0.0151, "step": 52010 }, { "epoch": 0.75, "learning_rate": 1.975019335994735e-05, "loss": 0.0184, "step": 52020 }, { "epoch": 0.75, "learning_rate": 1.975014532020888e-05, "loss": 0.014, "step": 52030 }, { "epoch": 0.75, "learning_rate": 1.9750097280470408e-05, "loss": 0.0204, "step": 52040 }, { "epoch": 0.75, "learning_rate": 1.9750049240731934e-05, "loss": 0.0145, "step": 52050 }, { "epoch": 0.75, "learning_rate": 1.9750001200993463e-05, "loss": 0.0236, "step": 52060 }, { "epoch": 0.75, "learning_rate": 1.9749953161254992e-05, "loss": 0.0162, "step": 52070 }, { "epoch": 0.75, "learning_rate": 1.9749905121516518e-05, "loss": 0.0173, "step": 52080 }, { "epoch": 0.75, "learning_rate": 1.9749857081778047e-05, "loss": 0.0197, "step": 52090 }, { "epoch": 0.75, "learning_rate": 1.9749809042039577e-05, "loss": 0.0206, "step": 52100 }, { "epoch": 0.75, "learning_rate": 1.9749761002301106e-05, "loss": 0.0206, "step": 52110 }, { "epoch": 0.75, "learning_rate": 1.974971296256263e-05, "loss": 0.0141, "step": 52120 }, { "epoch": 0.75, "learning_rate": 1.974966492282416e-05, "loss": 0.0147, "step": 52130 }, { "epoch": 0.75, "learning_rate": 1.974961688308569e-05, "loss": 0.0172, "step": 52140 }, { "epoch": 0.75, "learning_rate": 1.9749568843347216e-05, "loss": 0.0173, "step": 52150 }, { "epoch": 0.75, "learning_rate": 1.9749520803608745e-05, "loss": 0.0188, "step": 52160 }, { "epoch": 0.75, "learning_rate": 1.9749472763870275e-05, "loss": 0.0165, "step": 52170 }, { "epoch": 0.75, "learning_rate": 1.9749424724131804e-05, "loss": 0.0138, "step": 52180 }, { "epoch": 0.75, "learning_rate": 1.974937668439333e-05, "loss": 0.0258, "step": 52190 }, { "epoch": 0.75, "learning_rate": 1.974932864465486e-05, "loss": 0.0145, "step": 52200 }, { "epoch": 0.75, "learning_rate": 1.974928060491639e-05, "loss": 0.0213, "step": 52210 }, { "epoch": 0.75, "learning_rate": 1.9749232565177918e-05, "loss": 0.0173, "step": 52220 }, { "epoch": 0.75, "learning_rate": 1.9749184525439443e-05, "loss": 0.0157, "step": 52230 }, { "epoch": 0.75, "learning_rate": 1.9749136485700973e-05, "loss": 0.0223, "step": 52240 }, { "epoch": 0.75, "learning_rate": 1.9749088445962502e-05, "loss": 0.0162, "step": 52250 }, { "epoch": 0.75, "learning_rate": 1.9749040406224028e-05, "loss": 0.0193, "step": 52260 }, { "epoch": 0.75, "learning_rate": 1.9748992366485557e-05, "loss": 0.013, "step": 52270 }, { "epoch": 0.75, "learning_rate": 1.9748944326747086e-05, "loss": 0.0141, "step": 52280 }, { "epoch": 0.75, "learning_rate": 1.9748896287008616e-05, "loss": 0.0178, "step": 52290 }, { "epoch": 0.75, "learning_rate": 1.974884824727014e-05, "loss": 0.0169, "step": 52300 }, { "epoch": 0.75, "learning_rate": 1.974880020753167e-05, "loss": 0.022, "step": 52310 }, { "epoch": 0.75, "learning_rate": 1.97487521677932e-05, "loss": 0.015, "step": 52320 }, { "epoch": 0.75, "learning_rate": 1.9748704128054726e-05, "loss": 0.0152, "step": 52330 }, { "epoch": 0.75, "learning_rate": 1.9748656088316255e-05, "loss": 0.0224, "step": 52340 }, { "epoch": 0.75, "learning_rate": 1.9748608048577785e-05, "loss": 0.0219, "step": 52350 }, { "epoch": 0.75, "learning_rate": 1.9748560008839314e-05, "loss": 0.0201, "step": 52360 }, { "epoch": 0.75, "learning_rate": 1.974851196910084e-05, "loss": 0.0143, "step": 52370 }, { "epoch": 0.75, "learning_rate": 1.974846392936237e-05, "loss": 0.014, "step": 52380 }, { "epoch": 0.76, "learning_rate": 1.9748415889623898e-05, "loss": 0.0172, "step": 52390 }, { "epoch": 0.76, "learning_rate": 1.9748367849885428e-05, "loss": 0.0146, "step": 52400 }, { "epoch": 0.76, "learning_rate": 1.9748319810146953e-05, "loss": 0.018, "step": 52410 }, { "epoch": 0.76, "learning_rate": 1.9748271770408483e-05, "loss": 0.0218, "step": 52420 }, { "epoch": 0.76, "learning_rate": 1.9748223730670012e-05, "loss": 0.0265, "step": 52430 }, { "epoch": 0.76, "learning_rate": 1.9748175690931538e-05, "loss": 0.0148, "step": 52440 }, { "epoch": 0.76, "learning_rate": 1.9748127651193067e-05, "loss": 0.0177, "step": 52450 }, { "epoch": 0.76, "learning_rate": 1.9748079611454596e-05, "loss": 0.0199, "step": 52460 }, { "epoch": 0.76, "learning_rate": 1.9748031571716126e-05, "loss": 0.0172, "step": 52470 }, { "epoch": 0.76, "learning_rate": 1.974798353197765e-05, "loss": 0.0193, "step": 52480 }, { "epoch": 0.76, "learning_rate": 1.974793549223918e-05, "loss": 0.0128, "step": 52490 }, { "epoch": 0.76, "learning_rate": 1.974788745250071e-05, "loss": 0.0149, "step": 52500 }, { "epoch": 0.76, "learning_rate": 1.9747839412762236e-05, "loss": 0.0151, "step": 52510 }, { "epoch": 0.76, "learning_rate": 1.9747791373023765e-05, "loss": 0.0183, "step": 52520 }, { "epoch": 0.76, "learning_rate": 1.9747743333285294e-05, "loss": 0.0202, "step": 52530 }, { "epoch": 0.76, "learning_rate": 1.9747695293546824e-05, "loss": 0.013, "step": 52540 }, { "epoch": 0.76, "learning_rate": 1.974764725380835e-05, "loss": 0.0198, "step": 52550 }, { "epoch": 0.76, "learning_rate": 1.974759921406988e-05, "loss": 0.0212, "step": 52560 }, { "epoch": 0.76, "learning_rate": 1.9747551174331408e-05, "loss": 0.0201, "step": 52570 }, { "epoch": 0.76, "learning_rate": 1.9747503134592937e-05, "loss": 0.0185, "step": 52580 }, { "epoch": 0.76, "learning_rate": 1.9747455094854467e-05, "loss": 0.0208, "step": 52590 }, { "epoch": 0.76, "learning_rate": 1.9747407055115996e-05, "loss": 0.0091, "step": 52600 }, { "epoch": 0.76, "learning_rate": 1.9747359015377522e-05, "loss": 0.0237, "step": 52610 }, { "epoch": 0.76, "learning_rate": 1.974731097563905e-05, "loss": 0.016, "step": 52620 }, { "epoch": 0.76, "learning_rate": 1.974726293590058e-05, "loss": 0.0169, "step": 52630 }, { "epoch": 0.76, "learning_rate": 1.9747214896162106e-05, "loss": 0.0187, "step": 52640 }, { "epoch": 0.76, "learning_rate": 1.9747166856423636e-05, "loss": 0.0153, "step": 52650 }, { "epoch": 0.76, "learning_rate": 1.9747118816685165e-05, "loss": 0.0196, "step": 52660 }, { "epoch": 0.76, "learning_rate": 1.9747070776946694e-05, "loss": 0.0167, "step": 52670 }, { "epoch": 0.76, "learning_rate": 1.974702273720822e-05, "loss": 0.0208, "step": 52680 }, { "epoch": 0.76, "learning_rate": 1.974697469746975e-05, "loss": 0.0205, "step": 52690 }, { "epoch": 0.76, "learning_rate": 1.974692665773128e-05, "loss": 0.0168, "step": 52700 }, { "epoch": 0.76, "learning_rate": 1.9746878617992808e-05, "loss": 0.0196, "step": 52710 }, { "epoch": 0.76, "learning_rate": 1.9746830578254334e-05, "loss": 0.02, "step": 52720 }, { "epoch": 0.76, "learning_rate": 1.9746782538515863e-05, "loss": 0.0165, "step": 52730 }, { "epoch": 0.76, "learning_rate": 1.9746734498777392e-05, "loss": 0.0149, "step": 52740 }, { "epoch": 0.76, "learning_rate": 1.9746686459038918e-05, "loss": 0.0145, "step": 52750 }, { "epoch": 0.76, "learning_rate": 1.9746638419300447e-05, "loss": 0.0199, "step": 52760 }, { "epoch": 0.76, "learning_rate": 1.9746590379561977e-05, "loss": 0.0101, "step": 52770 }, { "epoch": 0.76, "learning_rate": 1.9746542339823506e-05, "loss": 0.0185, "step": 52780 }, { "epoch": 0.76, "learning_rate": 1.9746494300085032e-05, "loss": 0.0145, "step": 52790 }, { "epoch": 0.76, "learning_rate": 1.974644626034656e-05, "loss": 0.0179, "step": 52800 }, { "epoch": 0.76, "learning_rate": 1.974639822060809e-05, "loss": 0.0166, "step": 52810 }, { "epoch": 0.76, "learning_rate": 1.9746350180869616e-05, "loss": 0.024, "step": 52820 }, { "epoch": 0.76, "learning_rate": 1.9746302141131145e-05, "loss": 0.0152, "step": 52830 }, { "epoch": 0.76, "learning_rate": 1.9746254101392675e-05, "loss": 0.0162, "step": 52840 }, { "epoch": 0.76, "learning_rate": 1.9746206061654204e-05, "loss": 0.0144, "step": 52850 }, { "epoch": 0.76, "learning_rate": 1.974615802191573e-05, "loss": 0.0172, "step": 52860 }, { "epoch": 0.76, "learning_rate": 1.974610998217726e-05, "loss": 0.0167, "step": 52870 }, { "epoch": 0.76, "learning_rate": 1.974606194243879e-05, "loss": 0.0259, "step": 52880 }, { "epoch": 0.76, "learning_rate": 1.9746013902700318e-05, "loss": 0.018, "step": 52890 }, { "epoch": 0.76, "learning_rate": 1.9745965862961844e-05, "loss": 0.0155, "step": 52900 }, { "epoch": 0.76, "learning_rate": 1.9745917823223373e-05, "loss": 0.0152, "step": 52910 }, { "epoch": 0.76, "learning_rate": 1.9745869783484902e-05, "loss": 0.0143, "step": 52920 }, { "epoch": 0.76, "learning_rate": 1.9745821743746428e-05, "loss": 0.0201, "step": 52930 }, { "epoch": 0.76, "learning_rate": 1.9745773704007957e-05, "loss": 0.0161, "step": 52940 }, { "epoch": 0.76, "learning_rate": 1.9745725664269487e-05, "loss": 0.02, "step": 52950 }, { "epoch": 0.76, "learning_rate": 1.9745677624531016e-05, "loss": 0.0176, "step": 52960 }, { "epoch": 0.76, "learning_rate": 1.974562958479254e-05, "loss": 0.0166, "step": 52970 }, { "epoch": 0.76, "learning_rate": 1.974558154505407e-05, "loss": 0.0144, "step": 52980 }, { "epoch": 0.76, "learning_rate": 1.97455335053156e-05, "loss": 0.0116, "step": 52990 }, { "epoch": 0.76, "learning_rate": 1.9745485465577126e-05, "loss": 0.0217, "step": 53000 }, { "epoch": 0.76, "learning_rate": 1.9745437425838655e-05, "loss": 0.0139, "step": 53010 }, { "epoch": 0.76, "learning_rate": 1.9745389386100185e-05, "loss": 0.0175, "step": 53020 }, { "epoch": 0.76, "learning_rate": 1.9745341346361714e-05, "loss": 0.0171, "step": 53030 }, { "epoch": 0.76, "learning_rate": 1.974529330662324e-05, "loss": 0.0199, "step": 53040 }, { "epoch": 0.76, "learning_rate": 1.974524526688477e-05, "loss": 0.0124, "step": 53050 }, { "epoch": 0.76, "learning_rate": 1.97451972271463e-05, "loss": 0.0183, "step": 53060 }, { "epoch": 0.76, "learning_rate": 1.9745149187407828e-05, "loss": 0.0224, "step": 53070 }, { "epoch": 0.76, "learning_rate": 1.9745101147669353e-05, "loss": 0.0188, "step": 53080 }, { "epoch": 0.77, "learning_rate": 1.9745053107930883e-05, "loss": 0.0188, "step": 53090 }, { "epoch": 0.77, "learning_rate": 1.9745005068192412e-05, "loss": 0.0229, "step": 53100 }, { "epoch": 0.77, "learning_rate": 1.9744957028453938e-05, "loss": 0.0196, "step": 53110 }, { "epoch": 0.77, "learning_rate": 1.9744908988715467e-05, "loss": 0.0151, "step": 53120 }, { "epoch": 0.77, "learning_rate": 1.9744860948976996e-05, "loss": 0.0171, "step": 53130 }, { "epoch": 0.77, "learning_rate": 1.9744812909238526e-05, "loss": 0.0204, "step": 53140 }, { "epoch": 0.77, "learning_rate": 1.974476486950005e-05, "loss": 0.0223, "step": 53150 }, { "epoch": 0.77, "learning_rate": 1.974471682976158e-05, "loss": 0.0171, "step": 53160 }, { "epoch": 0.77, "learning_rate": 1.974466879002311e-05, "loss": 0.0158, "step": 53170 }, { "epoch": 0.77, "learning_rate": 1.9744620750284636e-05, "loss": 0.0148, "step": 53180 }, { "epoch": 0.77, "learning_rate": 1.9744572710546165e-05, "loss": 0.0187, "step": 53190 }, { "epoch": 0.77, "learning_rate": 1.9744524670807695e-05, "loss": 0.018, "step": 53200 }, { "epoch": 0.77, "learning_rate": 1.9744476631069224e-05, "loss": 0.0178, "step": 53210 }, { "epoch": 0.77, "learning_rate": 1.974442859133075e-05, "loss": 0.0173, "step": 53220 }, { "epoch": 0.77, "learning_rate": 1.974438055159228e-05, "loss": 0.02, "step": 53230 }, { "epoch": 0.77, "learning_rate": 1.9744332511853808e-05, "loss": 0.0199, "step": 53240 }, { "epoch": 0.77, "learning_rate": 1.9744284472115338e-05, "loss": 0.0211, "step": 53250 }, { "epoch": 0.77, "learning_rate": 1.9744236432376863e-05, "loss": 0.0279, "step": 53260 }, { "epoch": 0.77, "learning_rate": 1.9744188392638393e-05, "loss": 0.0167, "step": 53270 }, { "epoch": 0.77, "learning_rate": 1.9744140352899922e-05, "loss": 0.0156, "step": 53280 }, { "epoch": 0.77, "learning_rate": 1.9744092313161448e-05, "loss": 0.0172, "step": 53290 }, { "epoch": 0.77, "learning_rate": 1.9744044273422977e-05, "loss": 0.0171, "step": 53300 }, { "epoch": 0.77, "learning_rate": 1.9743996233684506e-05, "loss": 0.0125, "step": 53310 }, { "epoch": 0.77, "learning_rate": 1.9743948193946036e-05, "loss": 0.0167, "step": 53320 }, { "epoch": 0.77, "learning_rate": 1.974390015420756e-05, "loss": 0.0261, "step": 53330 }, { "epoch": 0.77, "learning_rate": 1.974385211446909e-05, "loss": 0.0135, "step": 53340 }, { "epoch": 0.77, "learning_rate": 1.974380407473062e-05, "loss": 0.0175, "step": 53350 }, { "epoch": 0.77, "learning_rate": 1.9743756034992146e-05, "loss": 0.0209, "step": 53360 }, { "epoch": 0.77, "learning_rate": 1.9743707995253675e-05, "loss": 0.019, "step": 53370 }, { "epoch": 0.77, "learning_rate": 1.9743659955515204e-05, "loss": 0.0145, "step": 53380 }, { "epoch": 0.77, "learning_rate": 1.9743611915776734e-05, "loss": 0.0156, "step": 53390 }, { "epoch": 0.77, "learning_rate": 1.974356387603826e-05, "loss": 0.0189, "step": 53400 }, { "epoch": 0.77, "learning_rate": 1.974351583629979e-05, "loss": 0.0192, "step": 53410 }, { "epoch": 0.77, "learning_rate": 1.9743467796561318e-05, "loss": 0.0167, "step": 53420 }, { "epoch": 0.77, "learning_rate": 1.9743419756822847e-05, "loss": 0.0193, "step": 53430 }, { "epoch": 0.77, "learning_rate": 1.9743371717084373e-05, "loss": 0.0134, "step": 53440 }, { "epoch": 0.77, "learning_rate": 1.9743323677345903e-05, "loss": 0.0135, "step": 53450 }, { "epoch": 0.77, "learning_rate": 1.9743275637607432e-05, "loss": 0.0202, "step": 53460 }, { "epoch": 0.77, "learning_rate": 1.9743227597868958e-05, "loss": 0.0177, "step": 53470 }, { "epoch": 0.77, "learning_rate": 1.9743179558130487e-05, "loss": 0.0198, "step": 53480 }, { "epoch": 0.77, "learning_rate": 1.9743131518392016e-05, "loss": 0.0123, "step": 53490 }, { "epoch": 0.77, "learning_rate": 1.9743083478653546e-05, "loss": 0.0133, "step": 53500 }, { "epoch": 0.77, "learning_rate": 1.974303543891507e-05, "loss": 0.0205, "step": 53510 }, { "epoch": 0.77, "learning_rate": 1.97429873991766e-05, "loss": 0.0177, "step": 53520 }, { "epoch": 0.77, "learning_rate": 1.974293935943813e-05, "loss": 0.017, "step": 53530 }, { "epoch": 0.77, "learning_rate": 1.9742891319699656e-05, "loss": 0.0148, "step": 53540 }, { "epoch": 0.77, "learning_rate": 1.9742843279961185e-05, "loss": 0.0171, "step": 53550 }, { "epoch": 0.77, "learning_rate": 1.9742795240222714e-05, "loss": 0.0237, "step": 53560 }, { "epoch": 0.77, "learning_rate": 1.9742747200484244e-05, "loss": 0.0204, "step": 53570 }, { "epoch": 0.77, "learning_rate": 1.974269916074577e-05, "loss": 0.0183, "step": 53580 }, { "epoch": 0.77, "learning_rate": 1.97426511210073e-05, "loss": 0.0263, "step": 53590 }, { "epoch": 0.77, "learning_rate": 1.9742603081268828e-05, "loss": 0.0196, "step": 53600 }, { "epoch": 0.77, "learning_rate": 1.9742555041530357e-05, "loss": 0.0212, "step": 53610 }, { "epoch": 0.77, "learning_rate": 1.9742507001791883e-05, "loss": 0.0177, "step": 53620 }, { "epoch": 0.77, "learning_rate": 1.9742458962053412e-05, "loss": 0.0195, "step": 53630 }, { "epoch": 0.77, "learning_rate": 1.9742410922314942e-05, "loss": 0.0153, "step": 53640 }, { "epoch": 0.77, "learning_rate": 1.9742362882576468e-05, "loss": 0.0188, "step": 53650 }, { "epoch": 0.77, "learning_rate": 1.9742314842837997e-05, "loss": 0.0183, "step": 53660 }, { "epoch": 0.77, "learning_rate": 1.9742266803099526e-05, "loss": 0.0209, "step": 53670 }, { "epoch": 0.77, "learning_rate": 1.9742218763361055e-05, "loss": 0.0175, "step": 53680 }, { "epoch": 0.77, "learning_rate": 1.974217072362258e-05, "loss": 0.0185, "step": 53690 }, { "epoch": 0.77, "learning_rate": 1.974212268388411e-05, "loss": 0.0096, "step": 53700 }, { "epoch": 0.77, "learning_rate": 1.974207464414564e-05, "loss": 0.0172, "step": 53710 }, { "epoch": 0.77, "learning_rate": 1.9742026604407166e-05, "loss": 0.0175, "step": 53720 }, { "epoch": 0.77, "learning_rate": 1.9741978564668695e-05, "loss": 0.0216, "step": 53730 }, { "epoch": 0.77, "learning_rate": 1.9741930524930224e-05, "loss": 0.0179, "step": 53740 }, { "epoch": 0.77, "learning_rate": 1.9741882485191754e-05, "loss": 0.0199, "step": 53750 }, { "epoch": 0.77, "learning_rate": 1.974183444545328e-05, "loss": 0.0232, "step": 53760 }, { "epoch": 0.77, "learning_rate": 1.974178640571481e-05, "loss": 0.0122, "step": 53770 }, { "epoch": 0.78, "learning_rate": 1.9741738365976338e-05, "loss": 0.0151, "step": 53780 }, { "epoch": 0.78, "learning_rate": 1.9741690326237867e-05, "loss": 0.0145, "step": 53790 }, { "epoch": 0.78, "learning_rate": 1.9741642286499393e-05, "loss": 0.0198, "step": 53800 }, { "epoch": 0.78, "learning_rate": 1.9741594246760922e-05, "loss": 0.0119, "step": 53810 }, { "epoch": 0.78, "learning_rate": 1.974154620702245e-05, "loss": 0.0165, "step": 53820 }, { "epoch": 0.78, "learning_rate": 1.9741498167283978e-05, "loss": 0.0195, "step": 53830 }, { "epoch": 0.78, "learning_rate": 1.9741450127545507e-05, "loss": 0.0144, "step": 53840 }, { "epoch": 0.78, "learning_rate": 1.9741402087807036e-05, "loss": 0.0154, "step": 53850 }, { "epoch": 0.78, "learning_rate": 1.9741354048068565e-05, "loss": 0.0188, "step": 53860 }, { "epoch": 0.78, "learning_rate": 1.974130600833009e-05, "loss": 0.0219, "step": 53870 }, { "epoch": 0.78, "learning_rate": 1.974125796859162e-05, "loss": 0.0144, "step": 53880 }, { "epoch": 0.78, "learning_rate": 1.974120992885315e-05, "loss": 0.0188, "step": 53890 }, { "epoch": 0.78, "learning_rate": 1.9741161889114676e-05, "loss": 0.0182, "step": 53900 }, { "epoch": 0.78, "learning_rate": 1.9741113849376205e-05, "loss": 0.0191, "step": 53910 }, { "epoch": 0.78, "learning_rate": 1.9741065809637734e-05, "loss": 0.0126, "step": 53920 }, { "epoch": 0.78, "learning_rate": 1.9741017769899263e-05, "loss": 0.0217, "step": 53930 }, { "epoch": 0.78, "learning_rate": 1.974096973016079e-05, "loss": 0.0188, "step": 53940 }, { "epoch": 0.78, "learning_rate": 1.974092169042232e-05, "loss": 0.0132, "step": 53950 }, { "epoch": 0.78, "learning_rate": 1.9740873650683848e-05, "loss": 0.0231, "step": 53960 }, { "epoch": 0.78, "learning_rate": 1.9740825610945377e-05, "loss": 0.0251, "step": 53970 }, { "epoch": 0.78, "learning_rate": 1.9740777571206903e-05, "loss": 0.0171, "step": 53980 }, { "epoch": 0.78, "learning_rate": 1.9740729531468432e-05, "loss": 0.0186, "step": 53990 }, { "epoch": 0.78, "learning_rate": 1.974068149172996e-05, "loss": 0.0199, "step": 54000 }, { "epoch": 0.78, "learning_rate": 1.9740633451991487e-05, "loss": 0.0304, "step": 54010 }, { "epoch": 0.78, "learning_rate": 1.9740585412253017e-05, "loss": 0.0172, "step": 54020 }, { "epoch": 0.78, "learning_rate": 1.9740537372514546e-05, "loss": 0.0188, "step": 54030 }, { "epoch": 0.78, "learning_rate": 1.9740489332776075e-05, "loss": 0.0197, "step": 54040 }, { "epoch": 0.78, "learning_rate": 1.97404412930376e-05, "loss": 0.0153, "step": 54050 }, { "epoch": 0.78, "learning_rate": 1.974039325329913e-05, "loss": 0.0138, "step": 54060 }, { "epoch": 0.78, "learning_rate": 1.974034521356066e-05, "loss": 0.0206, "step": 54070 }, { "epoch": 0.78, "learning_rate": 1.9740297173822186e-05, "loss": 0.021, "step": 54080 }, { "epoch": 0.78, "learning_rate": 1.9740249134083715e-05, "loss": 0.0205, "step": 54090 }, { "epoch": 0.78, "learning_rate": 1.9740201094345244e-05, "loss": 0.0169, "step": 54100 }, { "epoch": 0.78, "learning_rate": 1.9740153054606773e-05, "loss": 0.0138, "step": 54110 }, { "epoch": 0.78, "learning_rate": 1.97401050148683e-05, "loss": 0.0216, "step": 54120 }, { "epoch": 0.78, "learning_rate": 1.974005697512983e-05, "loss": 0.0189, "step": 54130 }, { "epoch": 0.78, "learning_rate": 1.9740008935391358e-05, "loss": 0.0162, "step": 54140 }, { "epoch": 0.78, "learning_rate": 1.9739960895652887e-05, "loss": 0.0124, "step": 54150 }, { "epoch": 0.78, "learning_rate": 1.9739912855914413e-05, "loss": 0.0177, "step": 54160 }, { "epoch": 0.78, "learning_rate": 1.9739864816175942e-05, "loss": 0.0154, "step": 54170 }, { "epoch": 0.78, "learning_rate": 1.973981677643747e-05, "loss": 0.0226, "step": 54180 }, { "epoch": 0.78, "learning_rate": 1.9739768736698997e-05, "loss": 0.0168, "step": 54190 }, { "epoch": 0.78, "learning_rate": 1.9739720696960527e-05, "loss": 0.0177, "step": 54200 }, { "epoch": 0.78, "learning_rate": 1.9739672657222056e-05, "loss": 0.0182, "step": 54210 }, { "epoch": 0.78, "learning_rate": 1.9739624617483585e-05, "loss": 0.0178, "step": 54220 }, { "epoch": 0.78, "learning_rate": 1.973957657774511e-05, "loss": 0.0174, "step": 54230 }, { "epoch": 0.78, "learning_rate": 1.973952853800664e-05, "loss": 0.0147, "step": 54240 }, { "epoch": 0.78, "learning_rate": 1.973948049826817e-05, "loss": 0.0147, "step": 54250 }, { "epoch": 0.78, "learning_rate": 1.9739432458529696e-05, "loss": 0.0133, "step": 54260 }, { "epoch": 0.78, "learning_rate": 1.9739384418791225e-05, "loss": 0.0176, "step": 54270 }, { "epoch": 0.78, "learning_rate": 1.9739336379052754e-05, "loss": 0.0135, "step": 54280 }, { "epoch": 0.78, "learning_rate": 1.9739288339314283e-05, "loss": 0.0171, "step": 54290 }, { "epoch": 0.78, "learning_rate": 1.973924029957581e-05, "loss": 0.0158, "step": 54300 }, { "epoch": 0.78, "learning_rate": 1.973919225983734e-05, "loss": 0.0179, "step": 54310 }, { "epoch": 0.78, "learning_rate": 1.9739144220098868e-05, "loss": 0.0158, "step": 54320 }, { "epoch": 0.78, "learning_rate": 1.9739096180360397e-05, "loss": 0.0134, "step": 54330 }, { "epoch": 0.78, "learning_rate": 1.9739048140621923e-05, "loss": 0.015, "step": 54340 }, { "epoch": 0.78, "learning_rate": 1.9739000100883452e-05, "loss": 0.0134, "step": 54350 }, { "epoch": 0.78, "learning_rate": 1.973895206114498e-05, "loss": 0.0132, "step": 54360 }, { "epoch": 0.78, "learning_rate": 1.9738904021406507e-05, "loss": 0.0193, "step": 54370 }, { "epoch": 0.78, "learning_rate": 1.9738855981668037e-05, "loss": 0.0142, "step": 54380 }, { "epoch": 0.78, "learning_rate": 1.9738807941929566e-05, "loss": 0.0159, "step": 54390 }, { "epoch": 0.78, "learning_rate": 1.9738759902191095e-05, "loss": 0.0159, "step": 54400 }, { "epoch": 0.78, "learning_rate": 1.973871186245262e-05, "loss": 0.0134, "step": 54410 }, { "epoch": 0.78, "learning_rate": 1.973866382271415e-05, "loss": 0.0135, "step": 54420 }, { "epoch": 0.78, "learning_rate": 1.973861578297568e-05, "loss": 0.0122, "step": 54430 }, { "epoch": 0.78, "learning_rate": 1.9738567743237205e-05, "loss": 0.0221, "step": 54440 }, { "epoch": 0.78, "learning_rate": 1.9738519703498735e-05, "loss": 0.014, "step": 54450 }, { "epoch": 0.78, "learning_rate": 1.9738471663760264e-05, "loss": 0.0187, "step": 54460 }, { "epoch": 0.79, "learning_rate": 1.9738423624021793e-05, "loss": 0.0164, "step": 54470 }, { "epoch": 0.79, "learning_rate": 1.973837558428332e-05, "loss": 0.0177, "step": 54480 }, { "epoch": 0.79, "learning_rate": 1.973832754454485e-05, "loss": 0.0231, "step": 54490 }, { "epoch": 0.79, "learning_rate": 1.9738279504806378e-05, "loss": 0.0164, "step": 54500 }, { "epoch": 0.79, "learning_rate": 1.9738231465067904e-05, "loss": 0.0174, "step": 54510 }, { "epoch": 0.79, "learning_rate": 1.9738183425329433e-05, "loss": 0.0161, "step": 54520 }, { "epoch": 0.79, "learning_rate": 1.9738135385590962e-05, "loss": 0.0191, "step": 54530 }, { "epoch": 0.79, "learning_rate": 1.973808734585249e-05, "loss": 0.0211, "step": 54540 }, { "epoch": 0.79, "learning_rate": 1.9738039306114017e-05, "loss": 0.0189, "step": 54550 }, { "epoch": 0.79, "learning_rate": 1.9737991266375546e-05, "loss": 0.0174, "step": 54560 }, { "epoch": 0.79, "learning_rate": 1.9737943226637076e-05, "loss": 0.0139, "step": 54570 }, { "epoch": 0.79, "learning_rate": 1.9737895186898605e-05, "loss": 0.022, "step": 54580 }, { "epoch": 0.79, "learning_rate": 1.973784714716013e-05, "loss": 0.0151, "step": 54590 }, { "epoch": 0.79, "learning_rate": 1.973779910742166e-05, "loss": 0.0132, "step": 54600 }, { "epoch": 0.79, "learning_rate": 1.973775106768319e-05, "loss": 0.0212, "step": 54610 }, { "epoch": 0.79, "learning_rate": 1.9737703027944715e-05, "loss": 0.012, "step": 54620 }, { "epoch": 0.79, "learning_rate": 1.9737654988206245e-05, "loss": 0.0169, "step": 54630 }, { "epoch": 0.79, "learning_rate": 1.9737606948467774e-05, "loss": 0.0154, "step": 54640 }, { "epoch": 0.79, "learning_rate": 1.9737558908729303e-05, "loss": 0.0134, "step": 54650 }, { "epoch": 0.79, "learning_rate": 1.973751086899083e-05, "loss": 0.0159, "step": 54660 }, { "epoch": 0.79, "learning_rate": 1.9737462829252358e-05, "loss": 0.0172, "step": 54670 }, { "epoch": 0.79, "learning_rate": 1.9737414789513888e-05, "loss": 0.0181, "step": 54680 }, { "epoch": 0.79, "learning_rate": 1.9737366749775413e-05, "loss": 0.0218, "step": 54690 }, { "epoch": 0.79, "learning_rate": 1.9737318710036943e-05, "loss": 0.0166, "step": 54700 }, { "epoch": 0.79, "learning_rate": 1.9737270670298472e-05, "loss": 0.0173, "step": 54710 }, { "epoch": 0.79, "learning_rate": 1.973722263056e-05, "loss": 0.0148, "step": 54720 }, { "epoch": 0.79, "learning_rate": 1.9737174590821527e-05, "loss": 0.0204, "step": 54730 }, { "epoch": 0.79, "learning_rate": 1.9737126551083056e-05, "loss": 0.0153, "step": 54740 }, { "epoch": 0.79, "learning_rate": 1.9737078511344586e-05, "loss": 0.0162, "step": 54750 }, { "epoch": 0.79, "learning_rate": 1.9737030471606115e-05, "loss": 0.0151, "step": 54760 }, { "epoch": 0.79, "learning_rate": 1.973698243186764e-05, "loss": 0.018, "step": 54770 }, { "epoch": 0.79, "learning_rate": 1.973693439212917e-05, "loss": 0.0185, "step": 54780 }, { "epoch": 0.79, "learning_rate": 1.97368863523907e-05, "loss": 0.0168, "step": 54790 }, { "epoch": 0.79, "learning_rate": 1.9736838312652225e-05, "loss": 0.0152, "step": 54800 }, { "epoch": 0.79, "learning_rate": 1.9736790272913755e-05, "loss": 0.014, "step": 54810 }, { "epoch": 0.79, "learning_rate": 1.9736742233175284e-05, "loss": 0.0159, "step": 54820 }, { "epoch": 0.79, "learning_rate": 1.9736694193436813e-05, "loss": 0.0165, "step": 54830 }, { "epoch": 0.79, "learning_rate": 1.973664615369834e-05, "loss": 0.0184, "step": 54840 }, { "epoch": 0.79, "learning_rate": 1.9736598113959868e-05, "loss": 0.0151, "step": 54850 }, { "epoch": 0.79, "learning_rate": 1.9736550074221397e-05, "loss": 0.0164, "step": 54860 }, { "epoch": 0.79, "learning_rate": 1.9736502034482923e-05, "loss": 0.018, "step": 54870 }, { "epoch": 0.79, "learning_rate": 1.9736453994744453e-05, "loss": 0.0218, "step": 54880 }, { "epoch": 0.79, "learning_rate": 1.9736405955005982e-05, "loss": 0.0135, "step": 54890 }, { "epoch": 0.79, "learning_rate": 1.973635791526751e-05, "loss": 0.0185, "step": 54900 }, { "epoch": 0.79, "learning_rate": 1.9736309875529037e-05, "loss": 0.0214, "step": 54910 }, { "epoch": 0.79, "learning_rate": 1.9736261835790566e-05, "loss": 0.0122, "step": 54920 }, { "epoch": 0.79, "learning_rate": 1.973621860002594e-05, "loss": 0.0168, "step": 54930 }, { "epoch": 0.79, "learning_rate": 1.973617056028747e-05, "loss": 0.0155, "step": 54940 }, { "epoch": 0.79, "learning_rate": 1.9736122520549e-05, "loss": 0.0163, "step": 54950 }, { "epoch": 0.79, "learning_rate": 1.973607448081053e-05, "loss": 0.0199, "step": 54960 }, { "epoch": 0.79, "learning_rate": 1.9736026441072055e-05, "loss": 0.0189, "step": 54970 }, { "epoch": 0.79, "learning_rate": 1.9735978401333584e-05, "loss": 0.0161, "step": 54980 }, { "epoch": 0.79, "learning_rate": 1.9735930361595113e-05, "loss": 0.0099, "step": 54990 }, { "epoch": 0.79, "learning_rate": 1.9735882321856642e-05, "loss": 0.0153, "step": 55000 }, { "epoch": 0.79, "learning_rate": 1.973583428211817e-05, "loss": 0.019, "step": 55010 }, { "epoch": 0.79, "learning_rate": 1.9735786242379698e-05, "loss": 0.0229, "step": 55020 }, { "epoch": 0.79, "learning_rate": 1.9735738202641227e-05, "loss": 0.0131, "step": 55030 }, { "epoch": 0.79, "learning_rate": 1.9735690162902753e-05, "loss": 0.0203, "step": 55040 }, { "epoch": 0.79, "learning_rate": 1.9735642123164282e-05, "loss": 0.0162, "step": 55050 }, { "epoch": 0.79, "learning_rate": 1.973559408342581e-05, "loss": 0.0187, "step": 55060 }, { "epoch": 0.79, "learning_rate": 1.973554604368734e-05, "loss": 0.0147, "step": 55070 }, { "epoch": 0.79, "learning_rate": 1.9735498003948866e-05, "loss": 0.0204, "step": 55080 }, { "epoch": 0.79, "learning_rate": 1.9735449964210396e-05, "loss": 0.0191, "step": 55090 }, { "epoch": 0.79, "learning_rate": 1.9735401924471925e-05, "loss": 0.0169, "step": 55100 }, { "epoch": 0.79, "learning_rate": 1.973535388473345e-05, "loss": 0.0191, "step": 55110 }, { "epoch": 0.79, "learning_rate": 1.973530584499498e-05, "loss": 0.0211, "step": 55120 }, { "epoch": 0.79, "learning_rate": 1.973525780525651e-05, "loss": 0.0178, "step": 55130 }, { "epoch": 0.79, "learning_rate": 1.973520976551804e-05, "loss": 0.0186, "step": 55140 }, { "epoch": 0.79, "learning_rate": 1.9735161725779565e-05, "loss": 0.013, "step": 55150 }, { "epoch": 0.79, "learning_rate": 1.9735113686041094e-05, "loss": 0.0192, "step": 55160 }, { "epoch": 0.8, "learning_rate": 1.9735065646302623e-05, "loss": 0.0179, "step": 55170 }, { "epoch": 0.8, "learning_rate": 1.9735017606564152e-05, "loss": 0.0123, "step": 55180 }, { "epoch": 0.8, "learning_rate": 1.9734969566825678e-05, "loss": 0.0232, "step": 55190 }, { "epoch": 0.8, "learning_rate": 1.9734921527087208e-05, "loss": 0.017, "step": 55200 }, { "epoch": 0.8, "learning_rate": 1.9734873487348737e-05, "loss": 0.0177, "step": 55210 }, { "epoch": 0.8, "learning_rate": 1.9734825447610263e-05, "loss": 0.0152, "step": 55220 }, { "epoch": 0.8, "learning_rate": 1.9734777407871792e-05, "loss": 0.0141, "step": 55230 }, { "epoch": 0.8, "learning_rate": 1.973472936813332e-05, "loss": 0.0184, "step": 55240 }, { "epoch": 0.8, "learning_rate": 1.973468132839485e-05, "loss": 0.0206, "step": 55250 }, { "epoch": 0.8, "learning_rate": 1.9734633288656376e-05, "loss": 0.0154, "step": 55260 }, { "epoch": 0.8, "learning_rate": 1.9734585248917906e-05, "loss": 0.0236, "step": 55270 }, { "epoch": 0.8, "learning_rate": 1.9734537209179435e-05, "loss": 0.0185, "step": 55280 }, { "epoch": 0.8, "learning_rate": 1.973448916944096e-05, "loss": 0.0173, "step": 55290 }, { "epoch": 0.8, "learning_rate": 1.973444112970249e-05, "loss": 0.0168, "step": 55300 }, { "epoch": 0.8, "learning_rate": 1.973439308996402e-05, "loss": 0.0182, "step": 55310 }, { "epoch": 0.8, "learning_rate": 1.973434505022555e-05, "loss": 0.022, "step": 55320 }, { "epoch": 0.8, "learning_rate": 1.9734297010487074e-05, "loss": 0.0194, "step": 55330 }, { "epoch": 0.8, "learning_rate": 1.9734248970748604e-05, "loss": 0.018, "step": 55340 }, { "epoch": 0.8, "learning_rate": 1.9734200931010133e-05, "loss": 0.0155, "step": 55350 }, { "epoch": 0.8, "learning_rate": 1.9734152891271662e-05, "loss": 0.0195, "step": 55360 }, { "epoch": 0.8, "learning_rate": 1.9734104851533188e-05, "loss": 0.0146, "step": 55370 }, { "epoch": 0.8, "learning_rate": 1.9734056811794717e-05, "loss": 0.0157, "step": 55380 }, { "epoch": 0.8, "learning_rate": 1.9734008772056247e-05, "loss": 0.0187, "step": 55390 }, { "epoch": 0.8, "learning_rate": 1.9733960732317773e-05, "loss": 0.0154, "step": 55400 }, { "epoch": 0.8, "learning_rate": 1.9733912692579302e-05, "loss": 0.0136, "step": 55410 }, { "epoch": 0.8, "learning_rate": 1.973386465284083e-05, "loss": 0.017, "step": 55420 }, { "epoch": 0.8, "learning_rate": 1.973381661310236e-05, "loss": 0.0181, "step": 55430 }, { "epoch": 0.8, "learning_rate": 1.9733768573363886e-05, "loss": 0.0168, "step": 55440 }, { "epoch": 0.8, "learning_rate": 1.9733720533625416e-05, "loss": 0.0172, "step": 55450 }, { "epoch": 0.8, "learning_rate": 1.9733672493886945e-05, "loss": 0.0179, "step": 55460 }, { "epoch": 0.8, "learning_rate": 1.973362445414847e-05, "loss": 0.0176, "step": 55470 }, { "epoch": 0.8, "learning_rate": 1.973357641441e-05, "loss": 0.0203, "step": 55480 }, { "epoch": 0.8, "learning_rate": 1.973352837467153e-05, "loss": 0.0152, "step": 55490 }, { "epoch": 0.8, "learning_rate": 1.973348033493306e-05, "loss": 0.016, "step": 55500 }, { "epoch": 0.8, "learning_rate": 1.9733432295194584e-05, "loss": 0.0153, "step": 55510 }, { "epoch": 0.8, "learning_rate": 1.9733384255456114e-05, "loss": 0.0119, "step": 55520 }, { "epoch": 0.8, "learning_rate": 1.9733336215717643e-05, "loss": 0.0145, "step": 55530 }, { "epoch": 0.8, "learning_rate": 1.9733288175979172e-05, "loss": 0.0165, "step": 55540 }, { "epoch": 0.8, "learning_rate": 1.9733240136240698e-05, "loss": 0.0135, "step": 55550 }, { "epoch": 0.8, "learning_rate": 1.9733192096502227e-05, "loss": 0.0186, "step": 55560 }, { "epoch": 0.8, "learning_rate": 1.9733144056763757e-05, "loss": 0.019, "step": 55570 }, { "epoch": 0.8, "learning_rate": 1.9733096017025283e-05, "loss": 0.0153, "step": 55580 }, { "epoch": 0.8, "learning_rate": 1.9733047977286812e-05, "loss": 0.0157, "step": 55590 }, { "epoch": 0.8, "learning_rate": 1.973299993754834e-05, "loss": 0.0137, "step": 55600 }, { "epoch": 0.8, "learning_rate": 1.973295189780987e-05, "loss": 0.0177, "step": 55610 }, { "epoch": 0.8, "learning_rate": 1.9732903858071396e-05, "loss": 0.0129, "step": 55620 }, { "epoch": 0.8, "learning_rate": 1.9732855818332925e-05, "loss": 0.0175, "step": 55630 }, { "epoch": 0.8, "learning_rate": 1.9732807778594455e-05, "loss": 0.0221, "step": 55640 }, { "epoch": 0.8, "learning_rate": 1.973275973885598e-05, "loss": 0.0204, "step": 55650 }, { "epoch": 0.8, "learning_rate": 1.9732711699117513e-05, "loss": 0.0201, "step": 55660 }, { "epoch": 0.8, "learning_rate": 1.9732663659379043e-05, "loss": 0.0165, "step": 55670 }, { "epoch": 0.8, "learning_rate": 1.973261561964057e-05, "loss": 0.0135, "step": 55680 }, { "epoch": 0.8, "learning_rate": 1.9732567579902098e-05, "loss": 0.0158, "step": 55690 }, { "epoch": 0.8, "learning_rate": 1.9732519540163627e-05, "loss": 0.0179, "step": 55700 }, { "epoch": 0.8, "learning_rate": 1.9732471500425153e-05, "loss": 0.0194, "step": 55710 }, { "epoch": 0.8, "learning_rate": 1.9732423460686682e-05, "loss": 0.0196, "step": 55720 }, { "epoch": 0.8, "learning_rate": 1.973237542094821e-05, "loss": 0.0179, "step": 55730 }, { "epoch": 0.8, "learning_rate": 1.973232738120974e-05, "loss": 0.0163, "step": 55740 }, { "epoch": 0.8, "learning_rate": 1.9732279341471267e-05, "loss": 0.0151, "step": 55750 }, { "epoch": 0.8, "learning_rate": 1.9732231301732796e-05, "loss": 0.0164, "step": 55760 }, { "epoch": 0.8, "learning_rate": 1.9732183261994325e-05, "loss": 0.0197, "step": 55770 }, { "epoch": 0.8, "learning_rate": 1.973213522225585e-05, "loss": 0.0153, "step": 55780 }, { "epoch": 0.8, "learning_rate": 1.973208718251738e-05, "loss": 0.0134, "step": 55790 }, { "epoch": 0.8, "learning_rate": 1.973203914277891e-05, "loss": 0.0147, "step": 55800 }, { "epoch": 0.8, "learning_rate": 1.973199110304044e-05, "loss": 0.0165, "step": 55810 }, { "epoch": 0.8, "learning_rate": 1.9731943063301965e-05, "loss": 0.0191, "step": 55820 }, { "epoch": 0.8, "learning_rate": 1.9731895023563494e-05, "loss": 0.0149, "step": 55830 }, { "epoch": 0.8, "learning_rate": 1.9731846983825023e-05, "loss": 0.0168, "step": 55840 }, { "epoch": 0.8, "learning_rate": 1.9731798944086552e-05, "loss": 0.018, "step": 55850 }, { "epoch": 0.81, "learning_rate": 1.973175090434808e-05, "loss": 0.0141, "step": 55860 }, { "epoch": 0.81, "learning_rate": 1.9731702864609608e-05, "loss": 0.0188, "step": 55870 }, { "epoch": 0.81, "learning_rate": 1.9731654824871137e-05, "loss": 0.0171, "step": 55880 }, { "epoch": 0.81, "learning_rate": 1.9731606785132663e-05, "loss": 0.016, "step": 55890 }, { "epoch": 0.81, "learning_rate": 1.9731558745394192e-05, "loss": 0.0159, "step": 55900 }, { "epoch": 0.81, "learning_rate": 1.973151070565572e-05, "loss": 0.0175, "step": 55910 }, { "epoch": 0.81, "learning_rate": 1.973146266591725e-05, "loss": 0.0165, "step": 55920 }, { "epoch": 0.81, "learning_rate": 1.9731414626178776e-05, "loss": 0.0159, "step": 55930 }, { "epoch": 0.81, "learning_rate": 1.9731366586440306e-05, "loss": 0.0143, "step": 55940 }, { "epoch": 0.81, "learning_rate": 1.9731318546701835e-05, "loss": 0.0168, "step": 55950 }, { "epoch": 0.81, "learning_rate": 1.973127050696336e-05, "loss": 0.0174, "step": 55960 }, { "epoch": 0.81, "learning_rate": 1.973122246722489e-05, "loss": 0.018, "step": 55970 }, { "epoch": 0.81, "learning_rate": 1.973117442748642e-05, "loss": 0.0168, "step": 55980 }, { "epoch": 0.81, "learning_rate": 1.973112638774795e-05, "loss": 0.0135, "step": 55990 }, { "epoch": 0.81, "learning_rate": 1.9731078348009475e-05, "loss": 0.0221, "step": 56000 }, { "epoch": 0.81, "learning_rate": 1.9731030308271004e-05, "loss": 0.0183, "step": 56010 }, { "epoch": 0.81, "learning_rate": 1.9730982268532533e-05, "loss": 0.0151, "step": 56020 }, { "epoch": 0.81, "learning_rate": 1.9730934228794062e-05, "loss": 0.0151, "step": 56030 }, { "epoch": 0.81, "learning_rate": 1.9730886189055588e-05, "loss": 0.0154, "step": 56040 }, { "epoch": 0.81, "learning_rate": 1.9730838149317118e-05, "loss": 0.0153, "step": 56050 }, { "epoch": 0.81, "learning_rate": 1.9730790109578647e-05, "loss": 0.0174, "step": 56060 }, { "epoch": 0.81, "learning_rate": 1.9730742069840173e-05, "loss": 0.0215, "step": 56070 }, { "epoch": 0.81, "learning_rate": 1.9730694030101702e-05, "loss": 0.0198, "step": 56080 }, { "epoch": 0.81, "learning_rate": 1.973064599036323e-05, "loss": 0.0135, "step": 56090 }, { "epoch": 0.81, "learning_rate": 1.973059795062476e-05, "loss": 0.018, "step": 56100 }, { "epoch": 0.81, "learning_rate": 1.9730549910886286e-05, "loss": 0.013, "step": 56110 }, { "epoch": 0.81, "learning_rate": 1.9730501871147816e-05, "loss": 0.0249, "step": 56120 }, { "epoch": 0.81, "learning_rate": 1.9730453831409345e-05, "loss": 0.0186, "step": 56130 }, { "epoch": 0.81, "learning_rate": 1.973040579167087e-05, "loss": 0.0159, "step": 56140 }, { "epoch": 0.81, "learning_rate": 1.97303577519324e-05, "loss": 0.0147, "step": 56150 }, { "epoch": 0.81, "learning_rate": 1.973030971219393e-05, "loss": 0.015, "step": 56160 }, { "epoch": 0.81, "learning_rate": 1.973026167245546e-05, "loss": 0.0188, "step": 56170 }, { "epoch": 0.81, "learning_rate": 1.9730213632716984e-05, "loss": 0.0182, "step": 56180 }, { "epoch": 0.81, "learning_rate": 1.9730165592978514e-05, "loss": 0.0182, "step": 56190 }, { "epoch": 0.81, "learning_rate": 1.9730117553240043e-05, "loss": 0.0186, "step": 56200 }, { "epoch": 0.81, "learning_rate": 1.9730069513501572e-05, "loss": 0.0246, "step": 56210 }, { "epoch": 0.81, "learning_rate": 1.9730021473763098e-05, "loss": 0.0177, "step": 56220 }, { "epoch": 0.81, "learning_rate": 1.9729973434024627e-05, "loss": 0.014, "step": 56230 }, { "epoch": 0.81, "learning_rate": 1.9729925394286157e-05, "loss": 0.0173, "step": 56240 }, { "epoch": 0.81, "learning_rate": 1.9729877354547683e-05, "loss": 0.0172, "step": 56250 }, { "epoch": 0.81, "learning_rate": 1.9729829314809212e-05, "loss": 0.02, "step": 56260 }, { "epoch": 0.81, "learning_rate": 1.972978127507074e-05, "loss": 0.0134, "step": 56270 }, { "epoch": 0.81, "learning_rate": 1.972973323533227e-05, "loss": 0.0156, "step": 56280 }, { "epoch": 0.81, "learning_rate": 1.9729685195593796e-05, "loss": 0.0184, "step": 56290 }, { "epoch": 0.81, "learning_rate": 1.9729637155855326e-05, "loss": 0.0171, "step": 56300 }, { "epoch": 0.81, "learning_rate": 1.9729589116116855e-05, "loss": 0.0124, "step": 56310 }, { "epoch": 0.81, "learning_rate": 1.972954107637838e-05, "loss": 0.0163, "step": 56320 }, { "epoch": 0.81, "learning_rate": 1.972949303663991e-05, "loss": 0.0153, "step": 56330 }, { "epoch": 0.81, "learning_rate": 1.972944499690144e-05, "loss": 0.0146, "step": 56340 }, { "epoch": 0.81, "learning_rate": 1.972939695716297e-05, "loss": 0.0174, "step": 56350 }, { "epoch": 0.81, "learning_rate": 1.9729348917424494e-05, "loss": 0.0226, "step": 56360 }, { "epoch": 0.81, "learning_rate": 1.9729300877686024e-05, "loss": 0.0151, "step": 56370 }, { "epoch": 0.81, "learning_rate": 1.9729252837947553e-05, "loss": 0.0169, "step": 56380 }, { "epoch": 0.81, "learning_rate": 1.9729204798209082e-05, "loss": 0.018, "step": 56390 }, { "epoch": 0.81, "learning_rate": 1.9729156758470608e-05, "loss": 0.0168, "step": 56400 }, { "epoch": 0.81, "learning_rate": 1.9729108718732137e-05, "loss": 0.0129, "step": 56410 }, { "epoch": 0.81, "learning_rate": 1.9729060678993667e-05, "loss": 0.0161, "step": 56420 }, { "epoch": 0.81, "learning_rate": 1.9729012639255193e-05, "loss": 0.0155, "step": 56430 }, { "epoch": 0.81, "learning_rate": 1.9728964599516722e-05, "loss": 0.0188, "step": 56440 }, { "epoch": 0.81, "learning_rate": 1.972891655977825e-05, "loss": 0.0217, "step": 56450 }, { "epoch": 0.81, "learning_rate": 1.972886852003978e-05, "loss": 0.0135, "step": 56460 }, { "epoch": 0.81, "learning_rate": 1.9728820480301306e-05, "loss": 0.0159, "step": 56470 }, { "epoch": 0.81, "learning_rate": 1.9728772440562835e-05, "loss": 0.0229, "step": 56480 }, { "epoch": 0.81, "learning_rate": 1.9728724400824365e-05, "loss": 0.0206, "step": 56490 }, { "epoch": 0.81, "learning_rate": 1.972867636108589e-05, "loss": 0.016, "step": 56500 }, { "epoch": 0.81, "learning_rate": 1.972862832134742e-05, "loss": 0.0164, "step": 56510 }, { "epoch": 0.81, "learning_rate": 1.972858028160895e-05, "loss": 0.0162, "step": 56520 }, { "epoch": 0.81, "learning_rate": 1.972853224187048e-05, "loss": 0.0164, "step": 56530 }, { "epoch": 0.81, "learning_rate": 1.9728484202132004e-05, "loss": 0.016, "step": 56540 }, { "epoch": 0.81, "learning_rate": 1.9728436162393534e-05, "loss": 0.0135, "step": 56550 }, { "epoch": 0.82, "learning_rate": 1.9728388122655063e-05, "loss": 0.0175, "step": 56560 }, { "epoch": 0.82, "learning_rate": 1.9728340082916592e-05, "loss": 0.0192, "step": 56570 }, { "epoch": 0.82, "learning_rate": 1.9728292043178118e-05, "loss": 0.0204, "step": 56580 }, { "epoch": 0.82, "learning_rate": 1.9728244003439647e-05, "loss": 0.0206, "step": 56590 }, { "epoch": 0.82, "learning_rate": 1.9728195963701177e-05, "loss": 0.027, "step": 56600 }, { "epoch": 0.82, "learning_rate": 1.9728147923962702e-05, "loss": 0.0153, "step": 56610 }, { "epoch": 0.82, "learning_rate": 1.9728099884224232e-05, "loss": 0.0184, "step": 56620 }, { "epoch": 0.82, "learning_rate": 1.972805184448576e-05, "loss": 0.0195, "step": 56630 }, { "epoch": 0.82, "learning_rate": 1.972800380474729e-05, "loss": 0.0194, "step": 56640 }, { "epoch": 0.82, "learning_rate": 1.9727955765008816e-05, "loss": 0.019, "step": 56650 }, { "epoch": 0.82, "learning_rate": 1.9727907725270345e-05, "loss": 0.0171, "step": 56660 }, { "epoch": 0.82, "learning_rate": 1.9727859685531875e-05, "loss": 0.0256, "step": 56670 }, { "epoch": 0.82, "learning_rate": 1.97278116457934e-05, "loss": 0.0171, "step": 56680 }, { "epoch": 0.82, "learning_rate": 1.972776360605493e-05, "loss": 0.0173, "step": 56690 }, { "epoch": 0.82, "learning_rate": 1.972771556631646e-05, "loss": 0.0188, "step": 56700 }, { "epoch": 0.82, "learning_rate": 1.972766752657799e-05, "loss": 0.0163, "step": 56710 }, { "epoch": 0.82, "learning_rate": 1.9727619486839514e-05, "loss": 0.0139, "step": 56720 }, { "epoch": 0.82, "learning_rate": 1.9727571447101044e-05, "loss": 0.0124, "step": 56730 }, { "epoch": 0.82, "learning_rate": 1.9727523407362573e-05, "loss": 0.0172, "step": 56740 }, { "epoch": 0.82, "learning_rate": 1.9727475367624102e-05, "loss": 0.0143, "step": 56750 }, { "epoch": 0.82, "learning_rate": 1.9727427327885628e-05, "loss": 0.0162, "step": 56760 }, { "epoch": 0.82, "learning_rate": 1.9727379288147157e-05, "loss": 0.0168, "step": 56770 }, { "epoch": 0.82, "learning_rate": 1.9727331248408686e-05, "loss": 0.0248, "step": 56780 }, { "epoch": 0.82, "learning_rate": 1.9727283208670212e-05, "loss": 0.0172, "step": 56790 }, { "epoch": 0.82, "learning_rate": 1.972723516893174e-05, "loss": 0.0124, "step": 56800 }, { "epoch": 0.82, "learning_rate": 1.972718712919327e-05, "loss": 0.0191, "step": 56810 }, { "epoch": 0.82, "learning_rate": 1.97271390894548e-05, "loss": 0.0182, "step": 56820 }, { "epoch": 0.82, "learning_rate": 1.9727091049716326e-05, "loss": 0.0139, "step": 56830 }, { "epoch": 0.82, "learning_rate": 1.9727043009977855e-05, "loss": 0.0135, "step": 56840 }, { "epoch": 0.82, "learning_rate": 1.9726994970239385e-05, "loss": 0.0189, "step": 56850 }, { "epoch": 0.82, "learning_rate": 1.972694693050091e-05, "loss": 0.018, "step": 56860 }, { "epoch": 0.82, "learning_rate": 1.972689889076244e-05, "loss": 0.0132, "step": 56870 }, { "epoch": 0.82, "learning_rate": 1.972685085102397e-05, "loss": 0.0161, "step": 56880 }, { "epoch": 0.82, "learning_rate": 1.9726802811285498e-05, "loss": 0.016, "step": 56890 }, { "epoch": 0.82, "learning_rate": 1.9726754771547024e-05, "loss": 0.0166, "step": 56900 }, { "epoch": 0.82, "learning_rate": 1.9726706731808553e-05, "loss": 0.0183, "step": 56910 }, { "epoch": 0.82, "learning_rate": 1.9726658692070083e-05, "loss": 0.016, "step": 56920 }, { "epoch": 0.82, "learning_rate": 1.9726610652331612e-05, "loss": 0.0189, "step": 56930 }, { "epoch": 0.82, "learning_rate": 1.9726562612593138e-05, "loss": 0.0152, "step": 56940 }, { "epoch": 0.82, "learning_rate": 1.9726514572854667e-05, "loss": 0.0167, "step": 56950 }, { "epoch": 0.82, "learning_rate": 1.9726466533116196e-05, "loss": 0.0152, "step": 56960 }, { "epoch": 0.82, "learning_rate": 1.9726418493377722e-05, "loss": 0.0227, "step": 56970 }, { "epoch": 0.82, "learning_rate": 1.972637045363925e-05, "loss": 0.0143, "step": 56980 }, { "epoch": 0.82, "learning_rate": 1.972632241390078e-05, "loss": 0.0159, "step": 56990 }, { "epoch": 0.82, "learning_rate": 1.972627437416231e-05, "loss": 0.0197, "step": 57000 }, { "epoch": 0.82, "learning_rate": 1.9726226334423836e-05, "loss": 0.0156, "step": 57010 }, { "epoch": 0.82, "learning_rate": 1.9726178294685365e-05, "loss": 0.0161, "step": 57020 }, { "epoch": 0.82, "learning_rate": 1.9726130254946894e-05, "loss": 0.0169, "step": 57030 }, { "epoch": 0.82, "learning_rate": 1.972608221520842e-05, "loss": 0.0175, "step": 57040 }, { "epoch": 0.82, "learning_rate": 1.972603417546995e-05, "loss": 0.0159, "step": 57050 }, { "epoch": 0.82, "learning_rate": 1.972598613573148e-05, "loss": 0.0194, "step": 57060 }, { "epoch": 0.82, "learning_rate": 1.9725938095993008e-05, "loss": 0.0165, "step": 57070 }, { "epoch": 0.82, "learning_rate": 1.9725890056254534e-05, "loss": 0.023, "step": 57080 }, { "epoch": 0.82, "learning_rate": 1.9725842016516063e-05, "loss": 0.0138, "step": 57090 }, { "epoch": 0.82, "learning_rate": 1.9725798780751438e-05, "loss": 0.0176, "step": 57100 }, { "epoch": 0.82, "learning_rate": 1.9725750741012967e-05, "loss": 0.0136, "step": 57110 }, { "epoch": 0.82, "learning_rate": 1.9725702701274497e-05, "loss": 0.02, "step": 57120 }, { "epoch": 0.82, "learning_rate": 1.9725654661536026e-05, "loss": 0.0201, "step": 57130 }, { "epoch": 0.82, "learning_rate": 1.972560662179755e-05, "loss": 0.0156, "step": 57140 }, { "epoch": 0.82, "learning_rate": 1.972555858205908e-05, "loss": 0.0172, "step": 57150 }, { "epoch": 0.82, "learning_rate": 1.972551054232061e-05, "loss": 0.0199, "step": 57160 }, { "epoch": 0.82, "learning_rate": 1.972546250258214e-05, "loss": 0.0148, "step": 57170 }, { "epoch": 0.82, "learning_rate": 1.9725414462843665e-05, "loss": 0.0132, "step": 57180 }, { "epoch": 0.82, "learning_rate": 1.9725366423105195e-05, "loss": 0.0143, "step": 57190 }, { "epoch": 0.82, "learning_rate": 1.9725318383366724e-05, "loss": 0.0153, "step": 57200 }, { "epoch": 0.82, "learning_rate": 1.972527034362825e-05, "loss": 0.0147, "step": 57210 }, { "epoch": 0.82, "learning_rate": 1.972522230388978e-05, "loss": 0.0195, "step": 57220 }, { "epoch": 0.82, "learning_rate": 1.972517426415131e-05, "loss": 0.0154, "step": 57230 }, { "epoch": 0.82, "learning_rate": 1.9725126224412838e-05, "loss": 0.0186, "step": 57240 }, { "epoch": 0.83, "learning_rate": 1.9725078184674363e-05, "loss": 0.0148, "step": 57250 }, { "epoch": 0.83, "learning_rate": 1.9725030144935893e-05, "loss": 0.0166, "step": 57260 }, { "epoch": 0.83, "learning_rate": 1.9724982105197422e-05, "loss": 0.0155, "step": 57270 }, { "epoch": 0.83, "learning_rate": 1.9724934065458948e-05, "loss": 0.022, "step": 57280 }, { "epoch": 0.83, "learning_rate": 1.9724886025720477e-05, "loss": 0.0157, "step": 57290 }, { "epoch": 0.83, "learning_rate": 1.9724837985982006e-05, "loss": 0.0175, "step": 57300 }, { "epoch": 0.83, "learning_rate": 1.9724789946243536e-05, "loss": 0.0169, "step": 57310 }, { "epoch": 0.83, "learning_rate": 1.972474190650506e-05, "loss": 0.0169, "step": 57320 }, { "epoch": 0.83, "learning_rate": 1.972469386676659e-05, "loss": 0.0114, "step": 57330 }, { "epoch": 0.83, "learning_rate": 1.972464582702812e-05, "loss": 0.0122, "step": 57340 }, { "epoch": 0.83, "learning_rate": 1.9724597787289646e-05, "loss": 0.0163, "step": 57350 }, { "epoch": 0.83, "learning_rate": 1.9724549747551175e-05, "loss": 0.0164, "step": 57360 }, { "epoch": 0.83, "learning_rate": 1.9724501707812705e-05, "loss": 0.0172, "step": 57370 }, { "epoch": 0.83, "learning_rate": 1.9724453668074234e-05, "loss": 0.0124, "step": 57380 }, { "epoch": 0.83, "learning_rate": 1.972440562833576e-05, "loss": 0.0155, "step": 57390 }, { "epoch": 0.83, "learning_rate": 1.972435758859729e-05, "loss": 0.0176, "step": 57400 }, { "epoch": 0.83, "learning_rate": 1.9724309548858818e-05, "loss": 0.0152, "step": 57410 }, { "epoch": 0.83, "learning_rate": 1.9724261509120348e-05, "loss": 0.0112, "step": 57420 }, { "epoch": 0.83, "learning_rate": 1.9724213469381873e-05, "loss": 0.0191, "step": 57430 }, { "epoch": 0.83, "learning_rate": 1.9724165429643403e-05, "loss": 0.0116, "step": 57440 }, { "epoch": 0.83, "learning_rate": 1.9724117389904932e-05, "loss": 0.018, "step": 57450 }, { "epoch": 0.83, "learning_rate": 1.9724069350166458e-05, "loss": 0.0159, "step": 57460 }, { "epoch": 0.83, "learning_rate": 1.9724021310427987e-05, "loss": 0.0191, "step": 57470 }, { "epoch": 0.83, "learning_rate": 1.9723973270689516e-05, "loss": 0.0139, "step": 57480 }, { "epoch": 0.83, "learning_rate": 1.9723925230951046e-05, "loss": 0.0202, "step": 57490 }, { "epoch": 0.83, "learning_rate": 1.972387719121257e-05, "loss": 0.0119, "step": 57500 }, { "epoch": 0.83, "learning_rate": 1.97238291514741e-05, "loss": 0.0173, "step": 57510 }, { "epoch": 0.83, "learning_rate": 1.972378111173563e-05, "loss": 0.0197, "step": 57520 }, { "epoch": 0.83, "learning_rate": 1.9723733071997156e-05, "loss": 0.0171, "step": 57530 }, { "epoch": 0.83, "learning_rate": 1.9723685032258685e-05, "loss": 0.0178, "step": 57540 }, { "epoch": 0.83, "learning_rate": 1.9723636992520214e-05, "loss": 0.0194, "step": 57550 }, { "epoch": 0.83, "learning_rate": 1.9723588952781744e-05, "loss": 0.0154, "step": 57560 }, { "epoch": 0.83, "learning_rate": 1.972354091304327e-05, "loss": 0.0129, "step": 57570 }, { "epoch": 0.83, "learning_rate": 1.97234928733048e-05, "loss": 0.0103, "step": 57580 }, { "epoch": 0.83, "learning_rate": 1.9723444833566328e-05, "loss": 0.015, "step": 57590 }, { "epoch": 0.83, "learning_rate": 1.9723396793827857e-05, "loss": 0.0119, "step": 57600 }, { "epoch": 0.83, "learning_rate": 1.9723348754089383e-05, "loss": 0.0141, "step": 57610 }, { "epoch": 0.83, "learning_rate": 1.9723300714350913e-05, "loss": 0.0183, "step": 57620 }, { "epoch": 0.83, "learning_rate": 1.9723252674612442e-05, "loss": 0.0143, "step": 57630 }, { "epoch": 0.83, "learning_rate": 1.9723204634873968e-05, "loss": 0.0149, "step": 57640 }, { "epoch": 0.83, "learning_rate": 1.9723156595135497e-05, "loss": 0.0157, "step": 57650 }, { "epoch": 0.83, "learning_rate": 1.9723108555397026e-05, "loss": 0.0138, "step": 57660 }, { "epoch": 0.83, "learning_rate": 1.9723060515658556e-05, "loss": 0.0196, "step": 57670 }, { "epoch": 0.83, "learning_rate": 1.972301247592008e-05, "loss": 0.0204, "step": 57680 }, { "epoch": 0.83, "learning_rate": 1.972296443618161e-05, "loss": 0.019, "step": 57690 }, { "epoch": 0.83, "learning_rate": 1.972291639644314e-05, "loss": 0.0165, "step": 57700 }, { "epoch": 0.83, "learning_rate": 1.9722868356704666e-05, "loss": 0.0142, "step": 57710 }, { "epoch": 0.83, "learning_rate": 1.9722820316966195e-05, "loss": 0.016, "step": 57720 }, { "epoch": 0.83, "learning_rate": 1.9722772277227724e-05, "loss": 0.013, "step": 57730 }, { "epoch": 0.83, "learning_rate": 1.9722724237489254e-05, "loss": 0.0195, "step": 57740 }, { "epoch": 0.83, "learning_rate": 1.972267619775078e-05, "loss": 0.0125, "step": 57750 }, { "epoch": 0.83, "learning_rate": 1.972262815801231e-05, "loss": 0.0217, "step": 57760 }, { "epoch": 0.83, "learning_rate": 1.9722580118273838e-05, "loss": 0.0155, "step": 57770 }, { "epoch": 0.83, "learning_rate": 1.9722532078535367e-05, "loss": 0.0165, "step": 57780 }, { "epoch": 0.83, "learning_rate": 1.9722484038796893e-05, "loss": 0.0203, "step": 57790 }, { "epoch": 0.83, "learning_rate": 1.9722435999058422e-05, "loss": 0.0156, "step": 57800 }, { "epoch": 0.83, "learning_rate": 1.9722387959319952e-05, "loss": 0.0176, "step": 57810 }, { "epoch": 0.83, "learning_rate": 1.9722339919581478e-05, "loss": 0.0137, "step": 57820 }, { "epoch": 0.83, "learning_rate": 1.9722291879843007e-05, "loss": 0.0147, "step": 57830 }, { "epoch": 0.83, "learning_rate": 1.9722243840104536e-05, "loss": 0.0194, "step": 57840 }, { "epoch": 0.83, "learning_rate": 1.9722195800366065e-05, "loss": 0.0137, "step": 57850 }, { "epoch": 0.83, "learning_rate": 1.972214776062759e-05, "loss": 0.0155, "step": 57860 }, { "epoch": 0.83, "learning_rate": 1.972209972088912e-05, "loss": 0.0152, "step": 57870 }, { "epoch": 0.83, "learning_rate": 1.972205168115065e-05, "loss": 0.0268, "step": 57880 }, { "epoch": 0.83, "learning_rate": 1.9722003641412176e-05, "loss": 0.023, "step": 57890 }, { "epoch": 0.83, "learning_rate": 1.9721955601673705e-05, "loss": 0.0142, "step": 57900 }, { "epoch": 0.83, "learning_rate": 1.9721907561935234e-05, "loss": 0.0125, "step": 57910 }, { "epoch": 0.83, "learning_rate": 1.9721859522196764e-05, "loss": 0.0165, "step": 57920 }, { "epoch": 0.83, "learning_rate": 1.972181148245829e-05, "loss": 0.0168, "step": 57930 }, { "epoch": 0.84, "learning_rate": 1.972176344271982e-05, "loss": 0.0188, "step": 57940 }, { "epoch": 0.84, "learning_rate": 1.9721715402981348e-05, "loss": 0.0167, "step": 57950 }, { "epoch": 0.84, "learning_rate": 1.9721667363242877e-05, "loss": 0.0208, "step": 57960 }, { "epoch": 0.84, "learning_rate": 1.9721619323504403e-05, "loss": 0.0168, "step": 57970 }, { "epoch": 0.84, "learning_rate": 1.9721571283765932e-05, "loss": 0.0137, "step": 57980 }, { "epoch": 0.84, "learning_rate": 1.972152324402746e-05, "loss": 0.0193, "step": 57990 }, { "epoch": 0.84, "learning_rate": 1.9721475204288988e-05, "loss": 0.0146, "step": 58000 }, { "epoch": 0.84, "learning_rate": 1.9721427164550517e-05, "loss": 0.0208, "step": 58010 }, { "epoch": 0.84, "learning_rate": 1.9721379124812046e-05, "loss": 0.0153, "step": 58020 }, { "epoch": 0.84, "learning_rate": 1.9721331085073575e-05, "loss": 0.0128, "step": 58030 }, { "epoch": 0.84, "learning_rate": 1.97212830453351e-05, "loss": 0.0179, "step": 58040 }, { "epoch": 0.84, "learning_rate": 1.972123500559663e-05, "loss": 0.0184, "step": 58050 }, { "epoch": 0.84, "learning_rate": 1.972118696585816e-05, "loss": 0.0153, "step": 58060 }, { "epoch": 0.84, "learning_rate": 1.9721138926119686e-05, "loss": 0.0154, "step": 58070 }, { "epoch": 0.84, "learning_rate": 1.9721090886381215e-05, "loss": 0.0202, "step": 58080 }, { "epoch": 0.84, "learning_rate": 1.9721042846642744e-05, "loss": 0.0236, "step": 58090 }, { "epoch": 0.84, "learning_rate": 1.9720994806904273e-05, "loss": 0.0163, "step": 58100 }, { "epoch": 0.84, "learning_rate": 1.97209467671658e-05, "loss": 0.0229, "step": 58110 }, { "epoch": 0.84, "learning_rate": 1.972089872742733e-05, "loss": 0.0191, "step": 58120 }, { "epoch": 0.84, "learning_rate": 1.9720850687688858e-05, "loss": 0.0171, "step": 58130 }, { "epoch": 0.84, "learning_rate": 1.9720802647950387e-05, "loss": 0.0207, "step": 58140 }, { "epoch": 0.84, "learning_rate": 1.9720754608211913e-05, "loss": 0.0171, "step": 58150 }, { "epoch": 0.84, "learning_rate": 1.9720706568473442e-05, "loss": 0.0152, "step": 58160 }, { "epoch": 0.84, "learning_rate": 1.972065852873497e-05, "loss": 0.0194, "step": 58170 }, { "epoch": 0.84, "learning_rate": 1.9720610488996497e-05, "loss": 0.0159, "step": 58180 }, { "epoch": 0.84, "learning_rate": 1.9720562449258027e-05, "loss": 0.0139, "step": 58190 }, { "epoch": 0.84, "learning_rate": 1.9720514409519556e-05, "loss": 0.0136, "step": 58200 }, { "epoch": 0.84, "learning_rate": 1.9720466369781085e-05, "loss": 0.0127, "step": 58210 }, { "epoch": 0.84, "learning_rate": 1.972041833004261e-05, "loss": 0.0141, "step": 58220 }, { "epoch": 0.84, "learning_rate": 1.972037029030414e-05, "loss": 0.0183, "step": 58230 }, { "epoch": 0.84, "learning_rate": 1.972032225056567e-05, "loss": 0.0195, "step": 58240 }, { "epoch": 0.84, "learning_rate": 1.9720274210827196e-05, "loss": 0.0171, "step": 58250 }, { "epoch": 0.84, "learning_rate": 1.9720226171088725e-05, "loss": 0.0159, "step": 58260 }, { "epoch": 0.84, "learning_rate": 1.9720178131350254e-05, "loss": 0.0164, "step": 58270 }, { "epoch": 0.84, "learning_rate": 1.9720130091611783e-05, "loss": 0.0177, "step": 58280 }, { "epoch": 0.84, "learning_rate": 1.972008205187331e-05, "loss": 0.0146, "step": 58290 }, { "epoch": 0.84, "learning_rate": 1.972003401213484e-05, "loss": 0.0151, "step": 58300 }, { "epoch": 0.84, "learning_rate": 1.9719985972396368e-05, "loss": 0.0139, "step": 58310 }, { "epoch": 0.84, "learning_rate": 1.9719937932657897e-05, "loss": 0.0239, "step": 58320 }, { "epoch": 0.84, "learning_rate": 1.9719889892919423e-05, "loss": 0.0157, "step": 58330 }, { "epoch": 0.84, "learning_rate": 1.9719841853180952e-05, "loss": 0.023, "step": 58340 }, { "epoch": 0.84, "learning_rate": 1.971979381344248e-05, "loss": 0.0171, "step": 58350 }, { "epoch": 0.84, "learning_rate": 1.9719745773704007e-05, "loss": 0.0146, "step": 58360 }, { "epoch": 0.84, "learning_rate": 1.9719697733965537e-05, "loss": 0.0216, "step": 58370 }, { "epoch": 0.84, "learning_rate": 1.9719649694227066e-05, "loss": 0.0157, "step": 58380 }, { "epoch": 0.84, "learning_rate": 1.9719601654488595e-05, "loss": 0.0154, "step": 58390 }, { "epoch": 0.84, "learning_rate": 1.971955361475012e-05, "loss": 0.0195, "step": 58400 }, { "epoch": 0.84, "learning_rate": 1.971950557501165e-05, "loss": 0.0141, "step": 58410 }, { "epoch": 0.84, "learning_rate": 1.971945753527318e-05, "loss": 0.0192, "step": 58420 }, { "epoch": 0.84, "learning_rate": 1.9719409495534705e-05, "loss": 0.0149, "step": 58430 }, { "epoch": 0.84, "learning_rate": 1.9719361455796235e-05, "loss": 0.0117, "step": 58440 }, { "epoch": 0.84, "learning_rate": 1.9719313416057764e-05, "loss": 0.0126, "step": 58450 }, { "epoch": 0.84, "learning_rate": 1.9719265376319293e-05, "loss": 0.0193, "step": 58460 }, { "epoch": 0.84, "learning_rate": 1.971921733658082e-05, "loss": 0.0138, "step": 58470 }, { "epoch": 0.84, "learning_rate": 1.971916929684235e-05, "loss": 0.0176, "step": 58480 }, { "epoch": 0.84, "learning_rate": 1.9719121257103878e-05, "loss": 0.0161, "step": 58490 }, { "epoch": 0.84, "learning_rate": 1.9719073217365407e-05, "loss": 0.0161, "step": 58500 }, { "epoch": 0.84, "learning_rate": 1.9719025177626933e-05, "loss": 0.0181, "step": 58510 }, { "epoch": 0.84, "learning_rate": 1.9718977137888462e-05, "loss": 0.0151, "step": 58520 }, { "epoch": 0.84, "learning_rate": 1.971892909814999e-05, "loss": 0.0124, "step": 58530 }, { "epoch": 0.84, "learning_rate": 1.9718881058411517e-05, "loss": 0.0159, "step": 58540 }, { "epoch": 0.84, "learning_rate": 1.9718833018673047e-05, "loss": 0.0214, "step": 58550 }, { "epoch": 0.84, "learning_rate": 1.9718784978934576e-05, "loss": 0.0164, "step": 58560 }, { "epoch": 0.84, "learning_rate": 1.9718736939196105e-05, "loss": 0.0143, "step": 58570 }, { "epoch": 0.84, "learning_rate": 1.971868889945763e-05, "loss": 0.0117, "step": 58580 }, { "epoch": 0.84, "learning_rate": 1.971864085971916e-05, "loss": 0.0144, "step": 58590 }, { "epoch": 0.84, "learning_rate": 1.971859281998069e-05, "loss": 0.017, "step": 58600 }, { "epoch": 0.84, "learning_rate": 1.9718544780242215e-05, "loss": 0.0138, "step": 58610 }, { "epoch": 0.84, "learning_rate": 1.9718496740503745e-05, "loss": 0.0178, "step": 58620 }, { "epoch": 0.84, "learning_rate": 1.9718448700765274e-05, "loss": 0.0156, "step": 58630 }, { "epoch": 0.85, "learning_rate": 1.9718400661026803e-05, "loss": 0.0143, "step": 58640 }, { "epoch": 0.85, "learning_rate": 1.971835262128833e-05, "loss": 0.0192, "step": 58650 }, { "epoch": 0.85, "learning_rate": 1.971830458154986e-05, "loss": 0.0148, "step": 58660 }, { "epoch": 0.85, "learning_rate": 1.9718256541811388e-05, "loss": 0.0177, "step": 58670 }, { "epoch": 0.85, "learning_rate": 1.9718208502072917e-05, "loss": 0.0176, "step": 58680 }, { "epoch": 0.85, "learning_rate": 1.9718160462334443e-05, "loss": 0.014, "step": 58690 }, { "epoch": 0.85, "learning_rate": 1.9718112422595972e-05, "loss": 0.0157, "step": 58700 }, { "epoch": 0.85, "learning_rate": 1.97180643828575e-05, "loss": 0.0187, "step": 58710 }, { "epoch": 0.85, "learning_rate": 1.9718016343119027e-05, "loss": 0.0171, "step": 58720 }, { "epoch": 0.85, "learning_rate": 1.971796830338056e-05, "loss": 0.0174, "step": 58730 }, { "epoch": 0.85, "learning_rate": 1.9717920263642086e-05, "loss": 0.0176, "step": 58740 }, { "epoch": 0.85, "learning_rate": 1.9717872223903615e-05, "loss": 0.0159, "step": 58750 }, { "epoch": 0.85, "learning_rate": 1.9717824184165144e-05, "loss": 0.0137, "step": 58760 }, { "epoch": 0.85, "learning_rate": 1.9717776144426674e-05, "loss": 0.0181, "step": 58770 }, { "epoch": 0.85, "learning_rate": 1.97177281046882e-05, "loss": 0.0226, "step": 58780 }, { "epoch": 0.85, "learning_rate": 1.971768006494973e-05, "loss": 0.0138, "step": 58790 }, { "epoch": 0.85, "learning_rate": 1.9717632025211258e-05, "loss": 0.0137, "step": 58800 }, { "epoch": 0.85, "learning_rate": 1.9717583985472787e-05, "loss": 0.0146, "step": 58810 }, { "epoch": 0.85, "learning_rate": 1.9717535945734313e-05, "loss": 0.0156, "step": 58820 }, { "epoch": 0.85, "learning_rate": 1.9717487905995842e-05, "loss": 0.0171, "step": 58830 }, { "epoch": 0.85, "learning_rate": 1.971743986625737e-05, "loss": 0.0137, "step": 58840 }, { "epoch": 0.85, "learning_rate": 1.9717391826518898e-05, "loss": 0.0117, "step": 58850 }, { "epoch": 0.85, "learning_rate": 1.9717343786780427e-05, "loss": 0.0148, "step": 58860 }, { "epoch": 0.85, "learning_rate": 1.9717295747041956e-05, "loss": 0.0176, "step": 58870 }, { "epoch": 0.85, "learning_rate": 1.9717247707303485e-05, "loss": 0.0119, "step": 58880 }, { "epoch": 0.85, "learning_rate": 1.971719966756501e-05, "loss": 0.0106, "step": 58890 }, { "epoch": 0.85, "learning_rate": 1.971715162782654e-05, "loss": 0.0152, "step": 58900 }, { "epoch": 0.85, "learning_rate": 1.971710358808807e-05, "loss": 0.0154, "step": 58910 }, { "epoch": 0.85, "learning_rate": 1.9717055548349596e-05, "loss": 0.0142, "step": 58920 }, { "epoch": 0.85, "learning_rate": 1.9717007508611125e-05, "loss": 0.0228, "step": 58930 }, { "epoch": 0.85, "learning_rate": 1.9716959468872654e-05, "loss": 0.0176, "step": 58940 }, { "epoch": 0.85, "learning_rate": 1.9716911429134183e-05, "loss": 0.0165, "step": 58950 }, { "epoch": 0.85, "learning_rate": 1.971686338939571e-05, "loss": 0.0132, "step": 58960 }, { "epoch": 0.85, "learning_rate": 1.971681534965724e-05, "loss": 0.0175, "step": 58970 }, { "epoch": 0.85, "learning_rate": 1.9716767309918768e-05, "loss": 0.0145, "step": 58980 }, { "epoch": 0.85, "learning_rate": 1.9716719270180297e-05, "loss": 0.013, "step": 58990 }, { "epoch": 0.85, "learning_rate": 1.9716671230441823e-05, "loss": 0.017, "step": 59000 }, { "epoch": 0.85, "learning_rate": 1.9716623190703352e-05, "loss": 0.0107, "step": 59010 }, { "epoch": 0.85, "learning_rate": 1.971657515096488e-05, "loss": 0.0165, "step": 59020 }, { "epoch": 0.85, "learning_rate": 1.9716527111226407e-05, "loss": 0.016, "step": 59030 }, { "epoch": 0.85, "learning_rate": 1.9716479071487937e-05, "loss": 0.0157, "step": 59040 }, { "epoch": 0.85, "learning_rate": 1.9716431031749466e-05, "loss": 0.0179, "step": 59050 }, { "epoch": 0.85, "learning_rate": 1.9716382992010995e-05, "loss": 0.0212, "step": 59060 }, { "epoch": 0.85, "learning_rate": 1.971633495227252e-05, "loss": 0.0141, "step": 59070 }, { "epoch": 0.85, "learning_rate": 1.971628691253405e-05, "loss": 0.017, "step": 59080 }, { "epoch": 0.85, "learning_rate": 1.971623887279558e-05, "loss": 0.0151, "step": 59090 }, { "epoch": 0.85, "learning_rate": 1.9716190833057106e-05, "loss": 0.017, "step": 59100 }, { "epoch": 0.85, "learning_rate": 1.9716142793318635e-05, "loss": 0.02, "step": 59110 }, { "epoch": 0.85, "learning_rate": 1.9716094753580164e-05, "loss": 0.0211, "step": 59120 }, { "epoch": 0.85, "learning_rate": 1.9716046713841693e-05, "loss": 0.0177, "step": 59130 }, { "epoch": 0.85, "learning_rate": 1.971599867410322e-05, "loss": 0.0179, "step": 59140 }, { "epoch": 0.85, "learning_rate": 1.971595063436475e-05, "loss": 0.0115, "step": 59150 }, { "epoch": 0.85, "learning_rate": 1.9715902594626278e-05, "loss": 0.0121, "step": 59160 }, { "epoch": 0.85, "learning_rate": 1.9715854554887807e-05, "loss": 0.0216, "step": 59170 }, { "epoch": 0.85, "learning_rate": 1.9715806515149333e-05, "loss": 0.0189, "step": 59180 }, { "epoch": 0.85, "learning_rate": 1.9715758475410862e-05, "loss": 0.0189, "step": 59190 }, { "epoch": 0.85, "learning_rate": 1.971571043567239e-05, "loss": 0.0169, "step": 59200 }, { "epoch": 0.85, "learning_rate": 1.9715662395933917e-05, "loss": 0.0145, "step": 59210 }, { "epoch": 0.85, "learning_rate": 1.9715614356195447e-05, "loss": 0.0149, "step": 59220 }, { "epoch": 0.85, "learning_rate": 1.9715566316456976e-05, "loss": 0.0141, "step": 59230 }, { "epoch": 0.85, "learning_rate": 1.9715518276718505e-05, "loss": 0.0165, "step": 59240 }, { "epoch": 0.85, "learning_rate": 1.971547023698003e-05, "loss": 0.0216, "step": 59250 }, { "epoch": 0.85, "learning_rate": 1.971542219724156e-05, "loss": 0.0144, "step": 59260 }, { "epoch": 0.85, "learning_rate": 1.971537415750309e-05, "loss": 0.0152, "step": 59270 }, { "epoch": 0.85, "learning_rate": 1.9715326117764616e-05, "loss": 0.0131, "step": 59280 }, { "epoch": 0.85, "learning_rate": 1.9715278078026145e-05, "loss": 0.0193, "step": 59290 }, { "epoch": 0.85, "learning_rate": 1.9715230038287674e-05, "loss": 0.0209, "step": 59300 }, { "epoch": 0.85, "learning_rate": 1.9715181998549203e-05, "loss": 0.0169, "step": 59310 }, { "epoch": 0.85, "learning_rate": 1.971513395881073e-05, "loss": 0.0149, "step": 59320 }, { "epoch": 0.86, "learning_rate": 1.971508591907226e-05, "loss": 0.0157, "step": 59330 }, { "epoch": 0.86, "learning_rate": 1.9715037879333788e-05, "loss": 0.0194, "step": 59340 }, { "epoch": 0.86, "learning_rate": 1.9714989839595317e-05, "loss": 0.012, "step": 59350 }, { "epoch": 0.86, "learning_rate": 1.9714941799856843e-05, "loss": 0.0261, "step": 59360 }, { "epoch": 0.86, "learning_rate": 1.9714893760118372e-05, "loss": 0.0122, "step": 59370 }, { "epoch": 0.86, "learning_rate": 1.97148457203799e-05, "loss": 0.0136, "step": 59380 }, { "epoch": 0.86, "learning_rate": 1.9714797680641427e-05, "loss": 0.0134, "step": 59390 }, { "epoch": 0.86, "learning_rate": 1.9714749640902957e-05, "loss": 0.0142, "step": 59400 }, { "epoch": 0.86, "learning_rate": 1.9714701601164486e-05, "loss": 0.0258, "step": 59410 }, { "epoch": 0.86, "learning_rate": 1.9714653561426015e-05, "loss": 0.0171, "step": 59420 }, { "epoch": 0.86, "learning_rate": 1.971460552168754e-05, "loss": 0.015, "step": 59430 }, { "epoch": 0.86, "learning_rate": 1.971455748194907e-05, "loss": 0.0176, "step": 59440 }, { "epoch": 0.86, "learning_rate": 1.97145094422106e-05, "loss": 0.0109, "step": 59450 }, { "epoch": 0.86, "learning_rate": 1.9714461402472125e-05, "loss": 0.0158, "step": 59460 }, { "epoch": 0.86, "learning_rate": 1.9714413362733655e-05, "loss": 0.0222, "step": 59470 }, { "epoch": 0.86, "learning_rate": 1.9714365322995184e-05, "loss": 0.0135, "step": 59480 }, { "epoch": 0.86, "learning_rate": 1.9714317283256713e-05, "loss": 0.0175, "step": 59490 }, { "epoch": 0.86, "learning_rate": 1.971426924351824e-05, "loss": 0.0207, "step": 59500 }, { "epoch": 0.86, "learning_rate": 1.971422120377977e-05, "loss": 0.0131, "step": 59510 }, { "epoch": 0.86, "learning_rate": 1.9714173164041298e-05, "loss": 0.0166, "step": 59520 }, { "epoch": 0.86, "learning_rate": 1.9714125124302827e-05, "loss": 0.0138, "step": 59530 }, { "epoch": 0.86, "learning_rate": 1.9714077084564353e-05, "loss": 0.0167, "step": 59540 }, { "epoch": 0.86, "learning_rate": 1.9714029044825882e-05, "loss": 0.0166, "step": 59550 }, { "epoch": 0.86, "learning_rate": 1.971398100508741e-05, "loss": 0.0167, "step": 59560 }, { "epoch": 0.86, "learning_rate": 1.9713937769322786e-05, "loss": 0.0166, "step": 59570 }, { "epoch": 0.86, "learning_rate": 1.9713889729584315e-05, "loss": 0.0199, "step": 59580 }, { "epoch": 0.86, "learning_rate": 1.9713841689845845e-05, "loss": 0.0148, "step": 59590 }, { "epoch": 0.86, "learning_rate": 1.971379365010737e-05, "loss": 0.0218, "step": 59600 }, { "epoch": 0.86, "learning_rate": 1.97137456103689e-05, "loss": 0.0146, "step": 59610 }, { "epoch": 0.86, "learning_rate": 1.971369757063043e-05, "loss": 0.0162, "step": 59620 }, { "epoch": 0.86, "learning_rate": 1.9713649530891955e-05, "loss": 0.0193, "step": 59630 }, { "epoch": 0.86, "learning_rate": 1.9713601491153484e-05, "loss": 0.022, "step": 59640 }, { "epoch": 0.86, "learning_rate": 1.9713553451415013e-05, "loss": 0.0216, "step": 59650 }, { "epoch": 0.86, "learning_rate": 1.9713505411676543e-05, "loss": 0.0157, "step": 59660 }, { "epoch": 0.86, "learning_rate": 1.971345737193807e-05, "loss": 0.013, "step": 59670 }, { "epoch": 0.86, "learning_rate": 1.9713409332199598e-05, "loss": 0.0166, "step": 59680 }, { "epoch": 0.86, "learning_rate": 1.9713361292461127e-05, "loss": 0.0172, "step": 59690 }, { "epoch": 0.86, "learning_rate": 1.9713313252722653e-05, "loss": 0.0163, "step": 59700 }, { "epoch": 0.86, "learning_rate": 1.9713265212984182e-05, "loss": 0.0126, "step": 59710 }, { "epoch": 0.86, "learning_rate": 1.971321717324571e-05, "loss": 0.0168, "step": 59720 }, { "epoch": 0.86, "learning_rate": 1.971316913350724e-05, "loss": 0.0166, "step": 59730 }, { "epoch": 0.86, "learning_rate": 1.9713121093768767e-05, "loss": 0.0234, "step": 59740 }, { "epoch": 0.86, "learning_rate": 1.9713073054030296e-05, "loss": 0.0135, "step": 59750 }, { "epoch": 0.86, "learning_rate": 1.9713025014291825e-05, "loss": 0.013, "step": 59760 }, { "epoch": 0.86, "learning_rate": 1.9712976974553354e-05, "loss": 0.0166, "step": 59770 }, { "epoch": 0.86, "learning_rate": 1.971292893481488e-05, "loss": 0.0111, "step": 59780 }, { "epoch": 0.86, "learning_rate": 1.971288089507641e-05, "loss": 0.0196, "step": 59790 }, { "epoch": 0.86, "learning_rate": 1.971283285533794e-05, "loss": 0.0123, "step": 59800 }, { "epoch": 0.86, "learning_rate": 1.9712784815599465e-05, "loss": 0.014, "step": 59810 }, { "epoch": 0.86, "learning_rate": 1.9712736775860994e-05, "loss": 0.0237, "step": 59820 }, { "epoch": 0.86, "learning_rate": 1.9712688736122523e-05, "loss": 0.0157, "step": 59830 }, { "epoch": 0.86, "learning_rate": 1.9712640696384053e-05, "loss": 0.0186, "step": 59840 }, { "epoch": 0.86, "learning_rate": 1.971259265664558e-05, "loss": 0.0173, "step": 59850 }, { "epoch": 0.86, "learning_rate": 1.9712544616907108e-05, "loss": 0.0172, "step": 59860 }, { "epoch": 0.86, "learning_rate": 1.9712496577168637e-05, "loss": 0.0241, "step": 59870 }, { "epoch": 0.86, "learning_rate": 1.9712448537430163e-05, "loss": 0.0122, "step": 59880 }, { "epoch": 0.86, "learning_rate": 1.9712400497691692e-05, "loss": 0.0151, "step": 59890 }, { "epoch": 0.86, "learning_rate": 1.971235245795322e-05, "loss": 0.0161, "step": 59900 }, { "epoch": 0.86, "learning_rate": 1.971230441821475e-05, "loss": 0.0159, "step": 59910 }, { "epoch": 0.86, "learning_rate": 1.9712256378476277e-05, "loss": 0.0133, "step": 59920 }, { "epoch": 0.86, "learning_rate": 1.9712208338737806e-05, "loss": 0.0184, "step": 59930 }, { "epoch": 0.86, "learning_rate": 1.9712160298999335e-05, "loss": 0.0127, "step": 59940 }, { "epoch": 0.86, "learning_rate": 1.9712112259260864e-05, "loss": 0.0185, "step": 59950 }, { "epoch": 0.86, "learning_rate": 1.971206421952239e-05, "loss": 0.0201, "step": 59960 }, { "epoch": 0.86, "learning_rate": 1.971201617978392e-05, "loss": 0.0124, "step": 59970 }, { "epoch": 0.86, "learning_rate": 1.971196814004545e-05, "loss": 0.0144, "step": 59980 }, { "epoch": 0.86, "learning_rate": 1.9711920100306975e-05, "loss": 0.0147, "step": 59990 }, { "epoch": 0.86, "learning_rate": 1.9711872060568504e-05, "loss": 0.0164, "step": 60000 }, { "epoch": 0.86, "learning_rate": 1.9711824020830033e-05, "loss": 0.0174, "step": 60010 }, { "epoch": 0.87, "learning_rate": 1.9711775981091562e-05, "loss": 0.0137, "step": 60020 }, { "epoch": 0.87, "learning_rate": 1.971172794135309e-05, "loss": 0.0159, "step": 60030 }, { "epoch": 0.87, "learning_rate": 1.9711679901614618e-05, "loss": 0.014, "step": 60040 }, { "epoch": 0.87, "learning_rate": 1.9711631861876147e-05, "loss": 0.0147, "step": 60050 }, { "epoch": 0.87, "learning_rate": 1.9711583822137673e-05, "loss": 0.0209, "step": 60060 }, { "epoch": 0.87, "learning_rate": 1.9711535782399202e-05, "loss": 0.0149, "step": 60070 }, { "epoch": 0.87, "learning_rate": 1.971148774266073e-05, "loss": 0.0105, "step": 60080 }, { "epoch": 0.87, "learning_rate": 1.971143970292226e-05, "loss": 0.0123, "step": 60090 }, { "epoch": 0.87, "learning_rate": 1.9711391663183786e-05, "loss": 0.016, "step": 60100 }, { "epoch": 0.87, "learning_rate": 1.9711343623445316e-05, "loss": 0.0124, "step": 60110 }, { "epoch": 0.87, "learning_rate": 1.9711295583706845e-05, "loss": 0.0203, "step": 60120 }, { "epoch": 0.87, "learning_rate": 1.9711247543968374e-05, "loss": 0.0175, "step": 60130 }, { "epoch": 0.87, "learning_rate": 1.97111995042299e-05, "loss": 0.0194, "step": 60140 }, { "epoch": 0.87, "learning_rate": 1.971115146449143e-05, "loss": 0.0142, "step": 60150 }, { "epoch": 0.87, "learning_rate": 1.971110342475296e-05, "loss": 0.0156, "step": 60160 }, { "epoch": 0.87, "learning_rate": 1.9711055385014485e-05, "loss": 0.0135, "step": 60170 }, { "epoch": 0.87, "learning_rate": 1.9711007345276014e-05, "loss": 0.0147, "step": 60180 }, { "epoch": 0.87, "learning_rate": 1.9710959305537543e-05, "loss": 0.016, "step": 60190 }, { "epoch": 0.87, "learning_rate": 1.9710911265799072e-05, "loss": 0.0164, "step": 60200 }, { "epoch": 0.87, "learning_rate": 1.9710863226060598e-05, "loss": 0.0221, "step": 60210 }, { "epoch": 0.87, "learning_rate": 1.9710815186322128e-05, "loss": 0.0148, "step": 60220 }, { "epoch": 0.87, "learning_rate": 1.9710767146583657e-05, "loss": 0.0146, "step": 60230 }, { "epoch": 0.87, "learning_rate": 1.9710719106845183e-05, "loss": 0.0141, "step": 60240 }, { "epoch": 0.87, "learning_rate": 1.9710671067106712e-05, "loss": 0.0159, "step": 60250 }, { "epoch": 0.87, "learning_rate": 1.971062302736824e-05, "loss": 0.0166, "step": 60260 }, { "epoch": 0.87, "learning_rate": 1.971057498762977e-05, "loss": 0.0208, "step": 60270 }, { "epoch": 0.87, "learning_rate": 1.9710526947891296e-05, "loss": 0.0157, "step": 60280 }, { "epoch": 0.87, "learning_rate": 1.9710478908152826e-05, "loss": 0.0178, "step": 60290 }, { "epoch": 0.87, "learning_rate": 1.9710430868414355e-05, "loss": 0.0172, "step": 60300 }, { "epoch": 0.87, "learning_rate": 1.971038282867588e-05, "loss": 0.0154, "step": 60310 }, { "epoch": 0.87, "learning_rate": 1.971033478893741e-05, "loss": 0.0185, "step": 60320 }, { "epoch": 0.87, "learning_rate": 1.971028674919894e-05, "loss": 0.0224, "step": 60330 }, { "epoch": 0.87, "learning_rate": 1.971023870946047e-05, "loss": 0.0179, "step": 60340 }, { "epoch": 0.87, "learning_rate": 1.9710190669721994e-05, "loss": 0.0144, "step": 60350 }, { "epoch": 0.87, "learning_rate": 1.9710142629983524e-05, "loss": 0.0165, "step": 60360 }, { "epoch": 0.87, "learning_rate": 1.9710094590245053e-05, "loss": 0.0201, "step": 60370 }, { "epoch": 0.87, "learning_rate": 1.9710046550506582e-05, "loss": 0.0185, "step": 60380 }, { "epoch": 0.87, "learning_rate": 1.9709998510768108e-05, "loss": 0.0143, "step": 60390 }, { "epoch": 0.87, "learning_rate": 1.9709950471029637e-05, "loss": 0.0156, "step": 60400 }, { "epoch": 0.87, "learning_rate": 1.9709902431291167e-05, "loss": 0.0206, "step": 60410 }, { "epoch": 0.87, "learning_rate": 1.9709854391552693e-05, "loss": 0.0153, "step": 60420 }, { "epoch": 0.87, "learning_rate": 1.9709806351814222e-05, "loss": 0.0146, "step": 60430 }, { "epoch": 0.87, "learning_rate": 1.970975831207575e-05, "loss": 0.0199, "step": 60440 }, { "epoch": 0.87, "learning_rate": 1.970971027233728e-05, "loss": 0.0139, "step": 60450 }, { "epoch": 0.87, "learning_rate": 1.9709662232598806e-05, "loss": 0.0163, "step": 60460 }, { "epoch": 0.87, "learning_rate": 1.9709614192860336e-05, "loss": 0.0163, "step": 60470 }, { "epoch": 0.87, "learning_rate": 1.9709566153121865e-05, "loss": 0.0175, "step": 60480 }, { "epoch": 0.87, "learning_rate": 1.970951811338339e-05, "loss": 0.0141, "step": 60490 }, { "epoch": 0.87, "learning_rate": 1.970947007364492e-05, "loss": 0.0169, "step": 60500 }, { "epoch": 0.87, "learning_rate": 1.970942203390645e-05, "loss": 0.0194, "step": 60510 }, { "epoch": 0.87, "learning_rate": 1.970937399416798e-05, "loss": 0.0152, "step": 60520 }, { "epoch": 0.87, "learning_rate": 1.9709325954429504e-05, "loss": 0.0158, "step": 60530 }, { "epoch": 0.87, "learning_rate": 1.9709277914691034e-05, "loss": 0.0162, "step": 60540 }, { "epoch": 0.87, "learning_rate": 1.9709229874952563e-05, "loss": 0.0145, "step": 60550 }, { "epoch": 0.87, "learning_rate": 1.9709181835214092e-05, "loss": 0.0127, "step": 60560 }, { "epoch": 0.87, "learning_rate": 1.9709133795475618e-05, "loss": 0.0172, "step": 60570 }, { "epoch": 0.87, "learning_rate": 1.9709085755737147e-05, "loss": 0.0142, "step": 60580 }, { "epoch": 0.87, "learning_rate": 1.9709037715998677e-05, "loss": 0.0129, "step": 60590 }, { "epoch": 0.87, "learning_rate": 1.9708989676260203e-05, "loss": 0.0175, "step": 60600 }, { "epoch": 0.87, "learning_rate": 1.9708941636521732e-05, "loss": 0.0191, "step": 60610 }, { "epoch": 0.87, "learning_rate": 1.970889359678326e-05, "loss": 0.0159, "step": 60620 }, { "epoch": 0.87, "learning_rate": 1.970884555704479e-05, "loss": 0.0198, "step": 60630 }, { "epoch": 0.87, "learning_rate": 1.9708797517306316e-05, "loss": 0.0172, "step": 60640 }, { "epoch": 0.87, "learning_rate": 1.9708749477567845e-05, "loss": 0.0172, "step": 60650 }, { "epoch": 0.87, "learning_rate": 1.9708701437829375e-05, "loss": 0.0193, "step": 60660 }, { "epoch": 0.87, "learning_rate": 1.97086533980909e-05, "loss": 0.0157, "step": 60670 }, { "epoch": 0.87, "learning_rate": 1.970860535835243e-05, "loss": 0.0162, "step": 60680 }, { "epoch": 0.87, "learning_rate": 1.970855731861396e-05, "loss": 0.0171, "step": 60690 }, { "epoch": 0.87, "learning_rate": 1.970850927887549e-05, "loss": 0.0128, "step": 60700 }, { "epoch": 0.87, "learning_rate": 1.9708461239137014e-05, "loss": 0.0194, "step": 60710 }, { "epoch": 0.88, "learning_rate": 1.9708413199398544e-05, "loss": 0.0202, "step": 60720 }, { "epoch": 0.88, "learning_rate": 1.9708365159660073e-05, "loss": 0.0121, "step": 60730 }, { "epoch": 0.88, "learning_rate": 1.9708317119921602e-05, "loss": 0.0145, "step": 60740 }, { "epoch": 0.88, "learning_rate": 1.9708269080183128e-05, "loss": 0.0174, "step": 60750 }, { "epoch": 0.88, "learning_rate": 1.9708221040444657e-05, "loss": 0.0137, "step": 60760 }, { "epoch": 0.88, "learning_rate": 1.9708173000706187e-05, "loss": 0.0153, "step": 60770 }, { "epoch": 0.88, "learning_rate": 1.9708124960967712e-05, "loss": 0.0224, "step": 60780 }, { "epoch": 0.88, "learning_rate": 1.9708076921229242e-05, "loss": 0.0135, "step": 60790 }, { "epoch": 0.88, "learning_rate": 1.970802888149077e-05, "loss": 0.015, "step": 60800 }, { "epoch": 0.88, "learning_rate": 1.97079808417523e-05, "loss": 0.0146, "step": 60810 }, { "epoch": 0.88, "learning_rate": 1.9707932802013826e-05, "loss": 0.0205, "step": 60820 }, { "epoch": 0.88, "learning_rate": 1.9707884762275355e-05, "loss": 0.0135, "step": 60830 }, { "epoch": 0.88, "learning_rate": 1.9707836722536885e-05, "loss": 0.0172, "step": 60840 }, { "epoch": 0.88, "learning_rate": 1.970778868279841e-05, "loss": 0.0156, "step": 60850 }, { "epoch": 0.88, "learning_rate": 1.970774064305994e-05, "loss": 0.0132, "step": 60860 }, { "epoch": 0.88, "learning_rate": 1.970769260332147e-05, "loss": 0.0143, "step": 60870 }, { "epoch": 0.88, "learning_rate": 1.9707644563583e-05, "loss": 0.0121, "step": 60880 }, { "epoch": 0.88, "learning_rate": 1.9707596523844524e-05, "loss": 0.0166, "step": 60890 }, { "epoch": 0.88, "learning_rate": 1.9707548484106054e-05, "loss": 0.019, "step": 60900 }, { "epoch": 0.88, "learning_rate": 1.9707500444367583e-05, "loss": 0.0168, "step": 60910 }, { "epoch": 0.88, "learning_rate": 1.9707452404629112e-05, "loss": 0.0146, "step": 60920 }, { "epoch": 0.88, "learning_rate": 1.9707404364890638e-05, "loss": 0.0151, "step": 60930 }, { "epoch": 0.88, "learning_rate": 1.9707356325152167e-05, "loss": 0.0162, "step": 60940 }, { "epoch": 0.88, "learning_rate": 1.9707308285413696e-05, "loss": 0.0172, "step": 60950 }, { "epoch": 0.88, "learning_rate": 1.9707260245675222e-05, "loss": 0.0261, "step": 60960 }, { "epoch": 0.88, "learning_rate": 1.970721220593675e-05, "loss": 0.0157, "step": 60970 }, { "epoch": 0.88, "learning_rate": 1.970716416619828e-05, "loss": 0.0182, "step": 60980 }, { "epoch": 0.88, "learning_rate": 1.970711612645981e-05, "loss": 0.014, "step": 60990 }, { "epoch": 0.88, "learning_rate": 1.9707068086721336e-05, "loss": 0.0171, "step": 61000 }, { "epoch": 0.88, "learning_rate": 1.9707020046982865e-05, "loss": 0.0181, "step": 61010 }, { "epoch": 0.88, "learning_rate": 1.9706972007244395e-05, "loss": 0.0141, "step": 61020 }, { "epoch": 0.88, "learning_rate": 1.970692396750592e-05, "loss": 0.0142, "step": 61030 }, { "epoch": 0.88, "learning_rate": 1.970687592776745e-05, "loss": 0.0116, "step": 61040 }, { "epoch": 0.88, "learning_rate": 1.970682788802898e-05, "loss": 0.0189, "step": 61050 }, { "epoch": 0.88, "learning_rate": 1.9706779848290508e-05, "loss": 0.0189, "step": 61060 }, { "epoch": 0.88, "learning_rate": 1.9706731808552034e-05, "loss": 0.0158, "step": 61070 }, { "epoch": 0.88, "learning_rate": 1.9706683768813563e-05, "loss": 0.0137, "step": 61080 }, { "epoch": 0.88, "learning_rate": 1.9706635729075093e-05, "loss": 0.0222, "step": 61090 }, { "epoch": 0.88, "learning_rate": 1.9706587689336622e-05, "loss": 0.0203, "step": 61100 }, { "epoch": 0.88, "learning_rate": 1.9706539649598148e-05, "loss": 0.021, "step": 61110 }, { "epoch": 0.88, "learning_rate": 1.9706491609859677e-05, "loss": 0.0149, "step": 61120 }, { "epoch": 0.88, "learning_rate": 1.9706443570121206e-05, "loss": 0.0197, "step": 61130 }, { "epoch": 0.88, "learning_rate": 1.9706395530382732e-05, "loss": 0.0177, "step": 61140 }, { "epoch": 0.88, "learning_rate": 1.970634749064426e-05, "loss": 0.0116, "step": 61150 }, { "epoch": 0.88, "learning_rate": 1.970629945090579e-05, "loss": 0.0162, "step": 61160 }, { "epoch": 0.88, "learning_rate": 1.970625141116732e-05, "loss": 0.0133, "step": 61170 }, { "epoch": 0.88, "learning_rate": 1.9706203371428846e-05, "loss": 0.0129, "step": 61180 }, { "epoch": 0.88, "learning_rate": 1.9706155331690375e-05, "loss": 0.0187, "step": 61190 }, { "epoch": 0.88, "learning_rate": 1.9706107291951904e-05, "loss": 0.0135, "step": 61200 }, { "epoch": 0.88, "learning_rate": 1.970605925221343e-05, "loss": 0.0143, "step": 61210 }, { "epoch": 0.88, "learning_rate": 1.970601121247496e-05, "loss": 0.0115, "step": 61220 }, { "epoch": 0.88, "learning_rate": 1.970596317273649e-05, "loss": 0.017, "step": 61230 }, { "epoch": 0.88, "learning_rate": 1.9705915132998018e-05, "loss": 0.0181, "step": 61240 }, { "epoch": 0.88, "learning_rate": 1.9705867093259544e-05, "loss": 0.0171, "step": 61250 }, { "epoch": 0.88, "learning_rate": 1.9705819053521073e-05, "loss": 0.0155, "step": 61260 }, { "epoch": 0.88, "learning_rate": 1.9705771013782603e-05, "loss": 0.0142, "step": 61270 }, { "epoch": 0.88, "learning_rate": 1.9705722974044132e-05, "loss": 0.0165, "step": 61280 }, { "epoch": 0.88, "learning_rate": 1.9705674934305658e-05, "loss": 0.0154, "step": 61290 }, { "epoch": 0.88, "learning_rate": 1.9705626894567187e-05, "loss": 0.0187, "step": 61300 }, { "epoch": 0.88, "learning_rate": 1.9705578854828716e-05, "loss": 0.0184, "step": 61310 }, { "epoch": 0.88, "learning_rate": 1.9705530815090242e-05, "loss": 0.0167, "step": 61320 }, { "epoch": 0.88, "learning_rate": 1.970548277535177e-05, "loss": 0.0166, "step": 61330 }, { "epoch": 0.88, "learning_rate": 1.97054347356133e-05, "loss": 0.0138, "step": 61340 }, { "epoch": 0.88, "learning_rate": 1.970538669587483e-05, "loss": 0.0108, "step": 61350 }, { "epoch": 0.88, "learning_rate": 1.9705338656136356e-05, "loss": 0.0189, "step": 61360 }, { "epoch": 0.88, "learning_rate": 1.9705290616397885e-05, "loss": 0.0175, "step": 61370 }, { "epoch": 0.88, "learning_rate": 1.9705242576659414e-05, "loss": 0.0197, "step": 61380 }, { "epoch": 0.88, "learning_rate": 1.970519453692094e-05, "loss": 0.0128, "step": 61390 }, { "epoch": 0.88, "learning_rate": 1.970514649718247e-05, "loss": 0.0163, "step": 61400 }, { "epoch": 0.89, "learning_rate": 1.9705098457444e-05, "loss": 0.0142, "step": 61410 }, { "epoch": 0.89, "learning_rate": 1.9705050417705528e-05, "loss": 0.0212, "step": 61420 }, { "epoch": 0.89, "learning_rate": 1.9705002377967054e-05, "loss": 0.0144, "step": 61430 }, { "epoch": 0.89, "learning_rate": 1.9704954338228583e-05, "loss": 0.0132, "step": 61440 }, { "epoch": 0.89, "learning_rate": 1.9704906298490113e-05, "loss": 0.017, "step": 61450 }, { "epoch": 0.89, "learning_rate": 1.9704858258751642e-05, "loss": 0.0162, "step": 61460 }, { "epoch": 0.89, "learning_rate": 1.9704810219013168e-05, "loss": 0.0126, "step": 61470 }, { "epoch": 0.89, "learning_rate": 1.9704762179274697e-05, "loss": 0.0153, "step": 61480 }, { "epoch": 0.89, "learning_rate": 1.9704714139536226e-05, "loss": 0.0146, "step": 61490 }, { "epoch": 0.89, "learning_rate": 1.9704666099797752e-05, "loss": 0.0189, "step": 61500 }, { "epoch": 0.89, "learning_rate": 1.970461806005928e-05, "loss": 0.0165, "step": 61510 }, { "epoch": 0.89, "learning_rate": 1.970457002032081e-05, "loss": 0.0212, "step": 61520 }, { "epoch": 0.89, "learning_rate": 1.970452198058234e-05, "loss": 0.0157, "step": 61530 }, { "epoch": 0.89, "learning_rate": 1.9704473940843866e-05, "loss": 0.0126, "step": 61540 }, { "epoch": 0.89, "learning_rate": 1.9704425901105395e-05, "loss": 0.017, "step": 61550 }, { "epoch": 0.89, "learning_rate": 1.9704377861366924e-05, "loss": 0.0173, "step": 61560 }, { "epoch": 0.89, "learning_rate": 1.970432982162845e-05, "loss": 0.0225, "step": 61570 }, { "epoch": 0.89, "learning_rate": 1.970428178188998e-05, "loss": 0.0162, "step": 61580 }, { "epoch": 0.89, "learning_rate": 1.970423374215151e-05, "loss": 0.0137, "step": 61590 }, { "epoch": 0.89, "learning_rate": 1.9704185702413038e-05, "loss": 0.0139, "step": 61600 }, { "epoch": 0.89, "learning_rate": 1.9704137662674564e-05, "loss": 0.0155, "step": 61610 }, { "epoch": 0.89, "learning_rate": 1.9704089622936093e-05, "loss": 0.0179, "step": 61620 }, { "epoch": 0.89, "learning_rate": 1.9704041583197622e-05, "loss": 0.0166, "step": 61630 }, { "epoch": 0.89, "learning_rate": 1.9703993543459152e-05, "loss": 0.0173, "step": 61640 }, { "epoch": 0.89, "learning_rate": 1.9703945503720678e-05, "loss": 0.0147, "step": 61650 }, { "epoch": 0.89, "learning_rate": 1.9703897463982207e-05, "loss": 0.0152, "step": 61660 }, { "epoch": 0.89, "learning_rate": 1.9703849424243736e-05, "loss": 0.019, "step": 61670 }, { "epoch": 0.89, "learning_rate": 1.9703801384505262e-05, "loss": 0.0119, "step": 61680 }, { "epoch": 0.89, "learning_rate": 1.970375334476679e-05, "loss": 0.0129, "step": 61690 }, { "epoch": 0.89, "learning_rate": 1.970370530502832e-05, "loss": 0.0184, "step": 61700 }, { "epoch": 0.89, "learning_rate": 1.970365726528985e-05, "loss": 0.016, "step": 61710 }, { "epoch": 0.89, "learning_rate": 1.9703609225551376e-05, "loss": 0.0152, "step": 61720 }, { "epoch": 0.89, "learning_rate": 1.9703561185812905e-05, "loss": 0.0157, "step": 61730 }, { "epoch": 0.89, "learning_rate": 1.9703513146074434e-05, "loss": 0.0174, "step": 61740 }, { "epoch": 0.89, "learning_rate": 1.970346510633596e-05, "loss": 0.0133, "step": 61750 }, { "epoch": 0.89, "learning_rate": 1.970341706659749e-05, "loss": 0.0143, "step": 61760 }, { "epoch": 0.89, "learning_rate": 1.970336902685902e-05, "loss": 0.0181, "step": 61770 }, { "epoch": 0.89, "learning_rate": 1.9703320987120548e-05, "loss": 0.0174, "step": 61780 }, { "epoch": 0.89, "learning_rate": 1.9703272947382074e-05, "loss": 0.0166, "step": 61790 }, { "epoch": 0.89, "learning_rate": 1.9703224907643603e-05, "loss": 0.0148, "step": 61800 }, { "epoch": 0.89, "learning_rate": 1.9703176867905132e-05, "loss": 0.0172, "step": 61810 }, { "epoch": 0.89, "learning_rate": 1.970312882816666e-05, "loss": 0.0136, "step": 61820 }, { "epoch": 0.89, "learning_rate": 1.970308078842819e-05, "loss": 0.0186, "step": 61830 }, { "epoch": 0.89, "learning_rate": 1.970303274868972e-05, "loss": 0.0174, "step": 61840 }, { "epoch": 0.89, "learning_rate": 1.9702984708951246e-05, "loss": 0.0208, "step": 61850 }, { "epoch": 0.89, "learning_rate": 1.9702936669212775e-05, "loss": 0.0155, "step": 61860 }, { "epoch": 0.89, "learning_rate": 1.9702888629474305e-05, "loss": 0.0132, "step": 61870 }, { "epoch": 0.89, "learning_rate": 1.970284058973583e-05, "loss": 0.0137, "step": 61880 }, { "epoch": 0.89, "learning_rate": 1.970279254999736e-05, "loss": 0.0158, "step": 61890 }, { "epoch": 0.89, "learning_rate": 1.970274451025889e-05, "loss": 0.0177, "step": 61900 }, { "epoch": 0.89, "learning_rate": 1.9702696470520418e-05, "loss": 0.017, "step": 61910 }, { "epoch": 0.89, "learning_rate": 1.9702648430781944e-05, "loss": 0.0167, "step": 61920 }, { "epoch": 0.89, "learning_rate": 1.9702600391043473e-05, "loss": 0.0206, "step": 61930 }, { "epoch": 0.89, "learning_rate": 1.9702552351305003e-05, "loss": 0.0187, "step": 61940 }, { "epoch": 0.89, "learning_rate": 1.9702504311566532e-05, "loss": 0.017, "step": 61950 }, { "epoch": 0.89, "learning_rate": 1.9702456271828058e-05, "loss": 0.0154, "step": 61960 }, { "epoch": 0.89, "learning_rate": 1.9702408232089587e-05, "loss": 0.013, "step": 61970 }, { "epoch": 0.89, "learning_rate": 1.9702360192351116e-05, "loss": 0.0148, "step": 61980 }, { "epoch": 0.89, "learning_rate": 1.9702312152612642e-05, "loss": 0.015, "step": 61990 }, { "epoch": 0.89, "learning_rate": 1.970226411287417e-05, "loss": 0.0183, "step": 62000 }, { "epoch": 0.89, "learning_rate": 1.97022160731357e-05, "loss": 0.0145, "step": 62010 }, { "epoch": 0.89, "learning_rate": 1.970216803339723e-05, "loss": 0.0169, "step": 62020 }, { "epoch": 0.89, "learning_rate": 1.9702119993658756e-05, "loss": 0.0188, "step": 62030 }, { "epoch": 0.89, "learning_rate": 1.9702071953920285e-05, "loss": 0.0168, "step": 62040 }, { "epoch": 0.89, "learning_rate": 1.9702023914181814e-05, "loss": 0.0181, "step": 62050 }, { "epoch": 0.89, "learning_rate": 1.970197587444334e-05, "loss": 0.017, "step": 62060 }, { "epoch": 0.89, "learning_rate": 1.970192783470487e-05, "loss": 0.0127, "step": 62070 }, { "epoch": 0.89, "learning_rate": 1.97018797949664e-05, "loss": 0.0164, "step": 62080 }, { "epoch": 0.89, "learning_rate": 1.9701831755227928e-05, "loss": 0.0183, "step": 62090 }, { "epoch": 0.89, "learning_rate": 1.9701783715489454e-05, "loss": 0.0119, "step": 62100 }, { "epoch": 0.9, "learning_rate": 1.9701735675750983e-05, "loss": 0.0152, "step": 62110 }, { "epoch": 0.9, "learning_rate": 1.9701687636012513e-05, "loss": 0.0147, "step": 62120 }, { "epoch": 0.9, "learning_rate": 1.9701639596274042e-05, "loss": 0.0176, "step": 62130 }, { "epoch": 0.9, "learning_rate": 1.9701591556535568e-05, "loss": 0.0172, "step": 62140 }, { "epoch": 0.9, "learning_rate": 1.9701543516797097e-05, "loss": 0.0112, "step": 62150 }, { "epoch": 0.9, "learning_rate": 1.9701495477058626e-05, "loss": 0.0124, "step": 62160 }, { "epoch": 0.9, "learning_rate": 1.9701447437320152e-05, "loss": 0.0171, "step": 62170 }, { "epoch": 0.9, "learning_rate": 1.970139939758168e-05, "loss": 0.0172, "step": 62180 }, { "epoch": 0.9, "learning_rate": 1.970135135784321e-05, "loss": 0.0146, "step": 62190 }, { "epoch": 0.9, "learning_rate": 1.970130331810474e-05, "loss": 0.0162, "step": 62200 }, { "epoch": 0.9, "learning_rate": 1.9701255278366266e-05, "loss": 0.017, "step": 62210 }, { "epoch": 0.9, "learning_rate": 1.9701207238627795e-05, "loss": 0.016, "step": 62220 }, { "epoch": 0.9, "learning_rate": 1.9701159198889324e-05, "loss": 0.0177, "step": 62230 }, { "epoch": 0.9, "learning_rate": 1.970111115915085e-05, "loss": 0.0175, "step": 62240 }, { "epoch": 0.9, "learning_rate": 1.970106311941238e-05, "loss": 0.0146, "step": 62250 }, { "epoch": 0.9, "learning_rate": 1.970101507967391e-05, "loss": 0.0167, "step": 62260 }, { "epoch": 0.9, "learning_rate": 1.9700967039935438e-05, "loss": 0.0134, "step": 62270 }, { "epoch": 0.9, "learning_rate": 1.9700919000196964e-05, "loss": 0.0182, "step": 62280 }, { "epoch": 0.9, "learning_rate": 1.9700870960458493e-05, "loss": 0.0245, "step": 62290 }, { "epoch": 0.9, "learning_rate": 1.9700822920720023e-05, "loss": 0.0204, "step": 62300 }, { "epoch": 0.9, "learning_rate": 1.9700774880981552e-05, "loss": 0.0181, "step": 62310 }, { "epoch": 0.9, "learning_rate": 1.9700726841243078e-05, "loss": 0.0157, "step": 62320 }, { "epoch": 0.9, "learning_rate": 1.9700678801504607e-05, "loss": 0.018, "step": 62330 }, { "epoch": 0.9, "learning_rate": 1.9700630761766136e-05, "loss": 0.0163, "step": 62340 }, { "epoch": 0.9, "learning_rate": 1.9700582722027662e-05, "loss": 0.0196, "step": 62350 }, { "epoch": 0.9, "learning_rate": 1.970053468228919e-05, "loss": 0.0158, "step": 62360 }, { "epoch": 0.9, "learning_rate": 1.970048664255072e-05, "loss": 0.0116, "step": 62370 }, { "epoch": 0.9, "learning_rate": 1.970043860281225e-05, "loss": 0.0183, "step": 62380 }, { "epoch": 0.9, "learning_rate": 1.9700390563073776e-05, "loss": 0.0128, "step": 62390 }, { "epoch": 0.9, "learning_rate": 1.9700342523335305e-05, "loss": 0.0155, "step": 62400 }, { "epoch": 0.9, "learning_rate": 1.9700294483596834e-05, "loss": 0.0125, "step": 62410 }, { "epoch": 0.9, "learning_rate": 1.970024644385836e-05, "loss": 0.0111, "step": 62420 }, { "epoch": 0.9, "learning_rate": 1.970019840411989e-05, "loss": 0.0162, "step": 62430 }, { "epoch": 0.9, "learning_rate": 1.970015036438142e-05, "loss": 0.0168, "step": 62440 }, { "epoch": 0.9, "learning_rate": 1.9700102324642948e-05, "loss": 0.0181, "step": 62450 }, { "epoch": 0.9, "learning_rate": 1.9700054284904474e-05, "loss": 0.0186, "step": 62460 }, { "epoch": 0.9, "learning_rate": 1.9700006245166003e-05, "loss": 0.0167, "step": 62470 }, { "epoch": 0.9, "learning_rate": 1.9699958205427532e-05, "loss": 0.0162, "step": 62480 }, { "epoch": 0.9, "learning_rate": 1.9699910165689062e-05, "loss": 0.0128, "step": 62490 }, { "epoch": 0.9, "learning_rate": 1.9699862125950588e-05, "loss": 0.0133, "step": 62500 }, { "epoch": 0.9, "learning_rate": 1.9699814086212117e-05, "loss": 0.0129, "step": 62510 }, { "epoch": 0.9, "learning_rate": 1.9699766046473646e-05, "loss": 0.0179, "step": 62520 }, { "epoch": 0.9, "learning_rate": 1.9699718006735172e-05, "loss": 0.0188, "step": 62530 }, { "epoch": 0.9, "learning_rate": 1.96996699669967e-05, "loss": 0.018, "step": 62540 }, { "epoch": 0.9, "learning_rate": 1.969962192725823e-05, "loss": 0.014, "step": 62550 }, { "epoch": 0.9, "learning_rate": 1.969957388751976e-05, "loss": 0.0198, "step": 62560 }, { "epoch": 0.9, "learning_rate": 1.9699525847781286e-05, "loss": 0.0144, "step": 62570 }, { "epoch": 0.9, "learning_rate": 1.9699477808042815e-05, "loss": 0.0184, "step": 62580 }, { "epoch": 0.9, "learning_rate": 1.9699429768304344e-05, "loss": 0.0151, "step": 62590 }, { "epoch": 0.9, "learning_rate": 1.969938172856587e-05, "loss": 0.0174, "step": 62600 }, { "epoch": 0.9, "learning_rate": 1.96993336888274e-05, "loss": 0.017, "step": 62610 }, { "epoch": 0.9, "learning_rate": 1.969928564908893e-05, "loss": 0.0114, "step": 62620 }, { "epoch": 0.9, "learning_rate": 1.9699237609350458e-05, "loss": 0.0153, "step": 62630 }, { "epoch": 0.9, "learning_rate": 1.9699189569611984e-05, "loss": 0.0149, "step": 62640 }, { "epoch": 0.9, "learning_rate": 1.9699141529873513e-05, "loss": 0.0156, "step": 62650 }, { "epoch": 0.9, "learning_rate": 1.9699093490135042e-05, "loss": 0.0133, "step": 62660 }, { "epoch": 0.9, "learning_rate": 1.969904545039657e-05, "loss": 0.016, "step": 62670 }, { "epoch": 0.9, "learning_rate": 1.9698997410658097e-05, "loss": 0.0125, "step": 62680 }, { "epoch": 0.9, "learning_rate": 1.9698949370919627e-05, "loss": 0.0147, "step": 62690 }, { "epoch": 0.9, "learning_rate": 1.9698901331181156e-05, "loss": 0.0143, "step": 62700 }, { "epoch": 0.9, "learning_rate": 1.9698853291442682e-05, "loss": 0.0163, "step": 62710 }, { "epoch": 0.9, "learning_rate": 1.969880525170421e-05, "loss": 0.0158, "step": 62720 }, { "epoch": 0.9, "learning_rate": 1.969875721196574e-05, "loss": 0.0179, "step": 62730 }, { "epoch": 0.9, "learning_rate": 1.969870917222727e-05, "loss": 0.0132, "step": 62740 }, { "epoch": 0.9, "learning_rate": 1.9698661132488796e-05, "loss": 0.0127, "step": 62750 }, { "epoch": 0.9, "learning_rate": 1.9698613092750325e-05, "loss": 0.0185, "step": 62760 }, { "epoch": 0.9, "learning_rate": 1.9698565053011854e-05, "loss": 0.0127, "step": 62770 }, { "epoch": 0.9, "learning_rate": 1.969851701327338e-05, "loss": 0.0175, "step": 62780 }, { "epoch": 0.9, "learning_rate": 1.969846897353491e-05, "loss": 0.0187, "step": 62790 }, { "epoch": 0.91, "learning_rate": 1.969842093379644e-05, "loss": 0.0113, "step": 62800 }, { "epoch": 0.91, "learning_rate": 1.9698372894057968e-05, "loss": 0.0179, "step": 62810 }, { "epoch": 0.91, "learning_rate": 1.9698324854319494e-05, "loss": 0.0136, "step": 62820 }, { "epoch": 0.91, "learning_rate": 1.9698276814581023e-05, "loss": 0.0183, "step": 62830 }, { "epoch": 0.91, "learning_rate": 1.9698228774842552e-05, "loss": 0.0155, "step": 62840 }, { "epoch": 0.91, "learning_rate": 1.969818073510408e-05, "loss": 0.0168, "step": 62850 }, { "epoch": 0.91, "learning_rate": 1.9698132695365607e-05, "loss": 0.0186, "step": 62860 }, { "epoch": 0.91, "learning_rate": 1.9698084655627137e-05, "loss": 0.0178, "step": 62870 }, { "epoch": 0.91, "learning_rate": 1.9698036615888666e-05, "loss": 0.0224, "step": 62880 }, { "epoch": 0.91, "learning_rate": 1.9697988576150192e-05, "loss": 0.0159, "step": 62890 }, { "epoch": 0.91, "learning_rate": 1.969794053641172e-05, "loss": 0.0144, "step": 62900 }, { "epoch": 0.91, "learning_rate": 1.969789249667325e-05, "loss": 0.0167, "step": 62910 }, { "epoch": 0.91, "learning_rate": 1.969784445693478e-05, "loss": 0.0161, "step": 62920 }, { "epoch": 0.91, "learning_rate": 1.9697796417196306e-05, "loss": 0.021, "step": 62930 }, { "epoch": 0.91, "learning_rate": 1.9697748377457835e-05, "loss": 0.0216, "step": 62940 }, { "epoch": 0.91, "learning_rate": 1.9697700337719364e-05, "loss": 0.0171, "step": 62950 }, { "epoch": 0.91, "learning_rate": 1.969765229798089e-05, "loss": 0.0133, "step": 62960 }, { "epoch": 0.91, "learning_rate": 1.969760425824242e-05, "loss": 0.0181, "step": 62970 }, { "epoch": 0.91, "learning_rate": 1.969755621850395e-05, "loss": 0.0135, "step": 62980 }, { "epoch": 0.91, "learning_rate": 1.9697508178765478e-05, "loss": 0.017, "step": 62990 }, { "epoch": 0.91, "learning_rate": 1.9697460139027004e-05, "loss": 0.0133, "step": 63000 }, { "epoch": 0.91, "learning_rate": 1.9697412099288533e-05, "loss": 0.0122, "step": 63010 }, { "epoch": 0.91, "learning_rate": 1.9697364059550062e-05, "loss": 0.017, "step": 63020 }, { "epoch": 0.91, "learning_rate": 1.969731601981159e-05, "loss": 0.014, "step": 63030 }, { "epoch": 0.91, "learning_rate": 1.9697267980073117e-05, "loss": 0.0218, "step": 63040 }, { "epoch": 0.91, "learning_rate": 1.9697219940334647e-05, "loss": 0.02, "step": 63050 }, { "epoch": 0.91, "learning_rate": 1.9697171900596176e-05, "loss": 0.0131, "step": 63060 }, { "epoch": 0.91, "learning_rate": 1.9697123860857702e-05, "loss": 0.0111, "step": 63070 }, { "epoch": 0.91, "learning_rate": 1.969707582111923e-05, "loss": 0.0185, "step": 63080 }, { "epoch": 0.91, "learning_rate": 1.969702778138076e-05, "loss": 0.0137, "step": 63090 }, { "epoch": 0.91, "learning_rate": 1.969697974164229e-05, "loss": 0.0174, "step": 63100 }, { "epoch": 0.91, "learning_rate": 1.9696931701903815e-05, "loss": 0.0206, "step": 63110 }, { "epoch": 0.91, "learning_rate": 1.9696883662165345e-05, "loss": 0.0139, "step": 63120 }, { "epoch": 0.91, "learning_rate": 1.9696835622426874e-05, "loss": 0.0136, "step": 63130 }, { "epoch": 0.91, "learning_rate": 1.96967875826884e-05, "loss": 0.0113, "step": 63140 }, { "epoch": 0.91, "learning_rate": 1.969673954294993e-05, "loss": 0.0152, "step": 63150 }, { "epoch": 0.91, "learning_rate": 1.969669150321146e-05, "loss": 0.0141, "step": 63160 }, { "epoch": 0.91, "learning_rate": 1.9696643463472988e-05, "loss": 0.0196, "step": 63170 }, { "epoch": 0.91, "learning_rate": 1.9696595423734514e-05, "loss": 0.0119, "step": 63180 }, { "epoch": 0.91, "learning_rate": 1.9696547383996043e-05, "loss": 0.0231, "step": 63190 }, { "epoch": 0.91, "learning_rate": 1.9696499344257572e-05, "loss": 0.019, "step": 63200 }, { "epoch": 0.91, "learning_rate": 1.96964513045191e-05, "loss": 0.012, "step": 63210 }, { "epoch": 0.91, "learning_rate": 1.9696403264780627e-05, "loss": 0.02, "step": 63220 }, { "epoch": 0.91, "learning_rate": 1.9696355225042157e-05, "loss": 0.0149, "step": 63230 }, { "epoch": 0.91, "learning_rate": 1.9696307185303686e-05, "loss": 0.0129, "step": 63240 }, { "epoch": 0.91, "learning_rate": 1.969625914556521e-05, "loss": 0.0126, "step": 63250 }, { "epoch": 0.91, "learning_rate": 1.969621110582674e-05, "loss": 0.0127, "step": 63260 }, { "epoch": 0.91, "learning_rate": 1.969616306608827e-05, "loss": 0.0213, "step": 63270 }, { "epoch": 0.91, "learning_rate": 1.96961150263498e-05, "loss": 0.0128, "step": 63280 }, { "epoch": 0.91, "learning_rate": 1.9696066986611325e-05, "loss": 0.0147, "step": 63290 }, { "epoch": 0.91, "learning_rate": 1.9696018946872855e-05, "loss": 0.0148, "step": 63300 }, { "epoch": 0.91, "learning_rate": 1.9695970907134384e-05, "loss": 0.0162, "step": 63310 }, { "epoch": 0.91, "learning_rate": 1.969592286739591e-05, "loss": 0.0138, "step": 63320 }, { "epoch": 0.91, "learning_rate": 1.969587482765744e-05, "loss": 0.0117, "step": 63330 }, { "epoch": 0.91, "learning_rate": 1.969582678791897e-05, "loss": 0.0161, "step": 63340 }, { "epoch": 0.91, "learning_rate": 1.9695778748180498e-05, "loss": 0.0168, "step": 63350 }, { "epoch": 0.91, "learning_rate": 1.9695730708442023e-05, "loss": 0.0154, "step": 63360 }, { "epoch": 0.91, "learning_rate": 1.9695682668703553e-05, "loss": 0.0127, "step": 63370 }, { "epoch": 0.91, "learning_rate": 1.9695634628965082e-05, "loss": 0.0185, "step": 63380 }, { "epoch": 0.91, "learning_rate": 1.969558658922661e-05, "loss": 0.0147, "step": 63390 }, { "epoch": 0.91, "learning_rate": 1.9695538549488137e-05, "loss": 0.0141, "step": 63400 }, { "epoch": 0.91, "learning_rate": 1.9695490509749666e-05, "loss": 0.0164, "step": 63410 }, { "epoch": 0.91, "learning_rate": 1.969544727398504e-05, "loss": 0.0134, "step": 63420 }, { "epoch": 0.91, "learning_rate": 1.969539923424657e-05, "loss": 0.0181, "step": 63430 }, { "epoch": 0.91, "learning_rate": 1.96953511945081e-05, "loss": 0.0111, "step": 63440 }, { "epoch": 0.91, "learning_rate": 1.9695303154769625e-05, "loss": 0.0151, "step": 63450 }, { "epoch": 0.91, "learning_rate": 1.9695255115031155e-05, "loss": 0.0142, "step": 63460 }, { "epoch": 0.91, "learning_rate": 1.9695207075292684e-05, "loss": 0.0183, "step": 63470 }, { "epoch": 0.91, "learning_rate": 1.9695159035554213e-05, "loss": 0.0183, "step": 63480 }, { "epoch": 0.92, "learning_rate": 1.969511099581574e-05, "loss": 0.0188, "step": 63490 }, { "epoch": 0.92, "learning_rate": 1.969506295607727e-05, "loss": 0.0161, "step": 63500 }, { "epoch": 0.92, "learning_rate": 1.9695014916338798e-05, "loss": 0.0146, "step": 63510 }, { "epoch": 0.92, "learning_rate": 1.9694966876600327e-05, "loss": 0.0164, "step": 63520 }, { "epoch": 0.92, "learning_rate": 1.9694918836861853e-05, "loss": 0.0163, "step": 63530 }, { "epoch": 0.92, "learning_rate": 1.9694870797123382e-05, "loss": 0.0156, "step": 63540 }, { "epoch": 0.92, "learning_rate": 1.969482275738491e-05, "loss": 0.0163, "step": 63550 }, { "epoch": 0.92, "learning_rate": 1.9694774717646437e-05, "loss": 0.017, "step": 63560 }, { "epoch": 0.92, "learning_rate": 1.9694726677907967e-05, "loss": 0.012, "step": 63570 }, { "epoch": 0.92, "learning_rate": 1.9694678638169496e-05, "loss": 0.0179, "step": 63580 }, { "epoch": 0.92, "learning_rate": 1.9694630598431025e-05, "loss": 0.0125, "step": 63590 }, { "epoch": 0.92, "learning_rate": 1.969458255869255e-05, "loss": 0.0181, "step": 63600 }, { "epoch": 0.92, "learning_rate": 1.969453451895408e-05, "loss": 0.0153, "step": 63610 }, { "epoch": 0.92, "learning_rate": 1.969448647921561e-05, "loss": 0.0154, "step": 63620 }, { "epoch": 0.92, "learning_rate": 1.9694438439477135e-05, "loss": 0.0145, "step": 63630 }, { "epoch": 0.92, "learning_rate": 1.9694390399738665e-05, "loss": 0.0171, "step": 63640 }, { "epoch": 0.92, "learning_rate": 1.9694342360000194e-05, "loss": 0.0193, "step": 63650 }, { "epoch": 0.92, "learning_rate": 1.9694294320261723e-05, "loss": 0.0153, "step": 63660 }, { "epoch": 0.92, "learning_rate": 1.969424628052325e-05, "loss": 0.0134, "step": 63670 }, { "epoch": 0.92, "learning_rate": 1.969419824078478e-05, "loss": 0.0183, "step": 63680 }, { "epoch": 0.92, "learning_rate": 1.9694150201046308e-05, "loss": 0.0184, "step": 63690 }, { "epoch": 0.92, "learning_rate": 1.9694102161307837e-05, "loss": 0.0148, "step": 63700 }, { "epoch": 0.92, "learning_rate": 1.9694054121569363e-05, "loss": 0.0164, "step": 63710 }, { "epoch": 0.92, "learning_rate": 1.9694006081830892e-05, "loss": 0.0159, "step": 63720 }, { "epoch": 0.92, "learning_rate": 1.969395804209242e-05, "loss": 0.0186, "step": 63730 }, { "epoch": 0.92, "learning_rate": 1.9693910002353947e-05, "loss": 0.0173, "step": 63740 }, { "epoch": 0.92, "learning_rate": 1.9693861962615476e-05, "loss": 0.0152, "step": 63750 }, { "epoch": 0.92, "learning_rate": 1.9693813922877006e-05, "loss": 0.014, "step": 63760 }, { "epoch": 0.92, "learning_rate": 1.9693765883138535e-05, "loss": 0.0159, "step": 63770 }, { "epoch": 0.92, "learning_rate": 1.969371784340006e-05, "loss": 0.0137, "step": 63780 }, { "epoch": 0.92, "learning_rate": 1.969366980366159e-05, "loss": 0.015, "step": 63790 }, { "epoch": 0.92, "learning_rate": 1.969362176392312e-05, "loss": 0.0196, "step": 63800 }, { "epoch": 0.92, "learning_rate": 1.9693573724184645e-05, "loss": 0.0173, "step": 63810 }, { "epoch": 0.92, "learning_rate": 1.9693525684446175e-05, "loss": 0.0132, "step": 63820 }, { "epoch": 0.92, "learning_rate": 1.9693477644707704e-05, "loss": 0.0153, "step": 63830 }, { "epoch": 0.92, "learning_rate": 1.9693429604969233e-05, "loss": 0.018, "step": 63840 }, { "epoch": 0.92, "learning_rate": 1.969338156523076e-05, "loss": 0.0136, "step": 63850 }, { "epoch": 0.92, "learning_rate": 1.9693333525492288e-05, "loss": 0.0197, "step": 63860 }, { "epoch": 0.92, "learning_rate": 1.9693285485753818e-05, "loss": 0.0123, "step": 63870 }, { "epoch": 0.92, "learning_rate": 1.9693237446015347e-05, "loss": 0.0171, "step": 63880 }, { "epoch": 0.92, "learning_rate": 1.9693189406276873e-05, "loss": 0.014, "step": 63890 }, { "epoch": 0.92, "learning_rate": 1.9693141366538402e-05, "loss": 0.0178, "step": 63900 }, { "epoch": 0.92, "learning_rate": 1.969309332679993e-05, "loss": 0.0139, "step": 63910 }, { "epoch": 0.92, "learning_rate": 1.9693045287061457e-05, "loss": 0.0137, "step": 63920 }, { "epoch": 0.92, "learning_rate": 1.9692997247322986e-05, "loss": 0.0101, "step": 63930 }, { "epoch": 0.92, "learning_rate": 1.9692949207584516e-05, "loss": 0.0171, "step": 63940 }, { "epoch": 0.92, "learning_rate": 1.9692901167846045e-05, "loss": 0.0141, "step": 63950 }, { "epoch": 0.92, "learning_rate": 1.969285312810757e-05, "loss": 0.0148, "step": 63960 }, { "epoch": 0.92, "learning_rate": 1.96928050883691e-05, "loss": 0.0143, "step": 63970 }, { "epoch": 0.92, "learning_rate": 1.969275704863063e-05, "loss": 0.0117, "step": 63980 }, { "epoch": 0.92, "learning_rate": 1.9692709008892155e-05, "loss": 0.0163, "step": 63990 }, { "epoch": 0.92, "learning_rate": 1.9692660969153685e-05, "loss": 0.0107, "step": 64000 }, { "epoch": 0.92, "learning_rate": 1.9692612929415214e-05, "loss": 0.0171, "step": 64010 }, { "epoch": 0.92, "learning_rate": 1.9692564889676743e-05, "loss": 0.0219, "step": 64020 }, { "epoch": 0.92, "learning_rate": 1.969251684993827e-05, "loss": 0.0154, "step": 64030 }, { "epoch": 0.92, "learning_rate": 1.9692468810199798e-05, "loss": 0.0128, "step": 64040 }, { "epoch": 0.92, "learning_rate": 1.9692420770461327e-05, "loss": 0.0141, "step": 64050 }, { "epoch": 0.92, "learning_rate": 1.9692372730722857e-05, "loss": 0.0153, "step": 64060 }, { "epoch": 0.92, "learning_rate": 1.9692324690984383e-05, "loss": 0.0157, "step": 64070 }, { "epoch": 0.92, "learning_rate": 1.9692276651245912e-05, "loss": 0.0153, "step": 64080 }, { "epoch": 0.92, "learning_rate": 1.969222861150744e-05, "loss": 0.013, "step": 64090 }, { "epoch": 0.92, "learning_rate": 1.9692180571768967e-05, "loss": 0.0156, "step": 64100 }, { "epoch": 0.92, "learning_rate": 1.9692132532030496e-05, "loss": 0.0165, "step": 64110 }, { "epoch": 0.92, "learning_rate": 1.9692084492292026e-05, "loss": 0.0138, "step": 64120 }, { "epoch": 0.92, "learning_rate": 1.9692036452553555e-05, "loss": 0.0163, "step": 64130 }, { "epoch": 0.92, "learning_rate": 1.969198841281508e-05, "loss": 0.0169, "step": 64140 }, { "epoch": 0.92, "learning_rate": 1.969194037307661e-05, "loss": 0.0172, "step": 64150 }, { "epoch": 0.92, "learning_rate": 1.969189233333814e-05, "loss": 0.0174, "step": 64160 }, { "epoch": 0.92, "learning_rate": 1.9691844293599665e-05, "loss": 0.0142, "step": 64170 }, { "epoch": 0.92, "learning_rate": 1.9691796253861194e-05, "loss": 0.0159, "step": 64180 }, { "epoch": 0.93, "learning_rate": 1.9691748214122724e-05, "loss": 0.0225, "step": 64190 }, { "epoch": 0.93, "learning_rate": 1.9691700174384253e-05, "loss": 0.014, "step": 64200 }, { "epoch": 0.93, "learning_rate": 1.969165213464578e-05, "loss": 0.0101, "step": 64210 }, { "epoch": 0.93, "learning_rate": 1.9691604094907308e-05, "loss": 0.0161, "step": 64220 }, { "epoch": 0.93, "learning_rate": 1.9691556055168837e-05, "loss": 0.0141, "step": 64230 }, { "epoch": 0.93, "learning_rate": 1.9691508015430367e-05, "loss": 0.0123, "step": 64240 }, { "epoch": 0.93, "learning_rate": 1.9691459975691893e-05, "loss": 0.0154, "step": 64250 }, { "epoch": 0.93, "learning_rate": 1.9691411935953422e-05, "loss": 0.0144, "step": 64260 }, { "epoch": 0.93, "learning_rate": 1.969136389621495e-05, "loss": 0.02, "step": 64270 }, { "epoch": 0.93, "learning_rate": 1.9691315856476477e-05, "loss": 0.0185, "step": 64280 }, { "epoch": 0.93, "learning_rate": 1.9691267816738006e-05, "loss": 0.018, "step": 64290 }, { "epoch": 0.93, "learning_rate": 1.9691219776999535e-05, "loss": 0.0179, "step": 64300 }, { "epoch": 0.93, "learning_rate": 1.9691171737261065e-05, "loss": 0.0157, "step": 64310 }, { "epoch": 0.93, "learning_rate": 1.969112369752259e-05, "loss": 0.0136, "step": 64320 }, { "epoch": 0.93, "learning_rate": 1.969107565778412e-05, "loss": 0.0147, "step": 64330 }, { "epoch": 0.93, "learning_rate": 1.969102761804565e-05, "loss": 0.0152, "step": 64340 }, { "epoch": 0.93, "learning_rate": 1.9690979578307175e-05, "loss": 0.0171, "step": 64350 }, { "epoch": 0.93, "learning_rate": 1.9690931538568704e-05, "loss": 0.0206, "step": 64360 }, { "epoch": 0.93, "learning_rate": 1.9690883498830234e-05, "loss": 0.0186, "step": 64370 }, { "epoch": 0.93, "learning_rate": 1.9690835459091763e-05, "loss": 0.0129, "step": 64380 }, { "epoch": 0.93, "learning_rate": 1.969078741935329e-05, "loss": 0.0198, "step": 64390 }, { "epoch": 0.93, "learning_rate": 1.9690739379614818e-05, "loss": 0.0115, "step": 64400 }, { "epoch": 0.93, "learning_rate": 1.9690691339876347e-05, "loss": 0.0175, "step": 64410 }, { "epoch": 0.93, "learning_rate": 1.9690643300137877e-05, "loss": 0.0143, "step": 64420 }, { "epoch": 0.93, "learning_rate": 1.9690595260399402e-05, "loss": 0.0169, "step": 64430 }, { "epoch": 0.93, "learning_rate": 1.9690547220660932e-05, "loss": 0.0189, "step": 64440 }, { "epoch": 0.93, "learning_rate": 1.969049918092246e-05, "loss": 0.0168, "step": 64450 }, { "epoch": 0.93, "learning_rate": 1.9690451141183987e-05, "loss": 0.0142, "step": 64460 }, { "epoch": 0.93, "learning_rate": 1.9690403101445516e-05, "loss": 0.0168, "step": 64470 }, { "epoch": 0.93, "learning_rate": 1.9690355061707045e-05, "loss": 0.017, "step": 64480 }, { "epoch": 0.93, "learning_rate": 1.9690307021968575e-05, "loss": 0.0147, "step": 64490 }, { "epoch": 0.93, "learning_rate": 1.96902589822301e-05, "loss": 0.0187, "step": 64500 }, { "epoch": 0.93, "learning_rate": 1.969021094249163e-05, "loss": 0.0185, "step": 64510 }, { "epoch": 0.93, "learning_rate": 1.969016290275316e-05, "loss": 0.0225, "step": 64520 }, { "epoch": 0.93, "learning_rate": 1.9690114863014685e-05, "loss": 0.0133, "step": 64530 }, { "epoch": 0.93, "learning_rate": 1.9690066823276214e-05, "loss": 0.0186, "step": 64540 }, { "epoch": 0.93, "learning_rate": 1.9690018783537744e-05, "loss": 0.0208, "step": 64550 }, { "epoch": 0.93, "learning_rate": 1.9689970743799273e-05, "loss": 0.016, "step": 64560 }, { "epoch": 0.93, "learning_rate": 1.96899227040608e-05, "loss": 0.0168, "step": 64570 }, { "epoch": 0.93, "learning_rate": 1.9689874664322328e-05, "loss": 0.0118, "step": 64580 }, { "epoch": 0.93, "learning_rate": 1.9689826624583857e-05, "loss": 0.0107, "step": 64590 }, { "epoch": 0.93, "learning_rate": 1.9689778584845386e-05, "loss": 0.0108, "step": 64600 }, { "epoch": 0.93, "learning_rate": 1.9689730545106912e-05, "loss": 0.0129, "step": 64610 }, { "epoch": 0.93, "learning_rate": 1.968968250536844e-05, "loss": 0.0185, "step": 64620 }, { "epoch": 0.93, "learning_rate": 1.968963446562997e-05, "loss": 0.0156, "step": 64630 }, { "epoch": 0.93, "learning_rate": 1.9689586425891497e-05, "loss": 0.0172, "step": 64640 }, { "epoch": 0.93, "learning_rate": 1.9689538386153026e-05, "loss": 0.0169, "step": 64650 }, { "epoch": 0.93, "learning_rate": 1.9689490346414555e-05, "loss": 0.0156, "step": 64660 }, { "epoch": 0.93, "learning_rate": 1.9689442306676085e-05, "loss": 0.0167, "step": 64670 }, { "epoch": 0.93, "learning_rate": 1.968939426693761e-05, "loss": 0.0147, "step": 64680 }, { "epoch": 0.93, "learning_rate": 1.968934622719914e-05, "loss": 0.0171, "step": 64690 }, { "epoch": 0.93, "learning_rate": 1.968929818746067e-05, "loss": 0.0139, "step": 64700 }, { "epoch": 0.93, "learning_rate": 1.9689250147722195e-05, "loss": 0.0128, "step": 64710 }, { "epoch": 0.93, "learning_rate": 1.9689202107983724e-05, "loss": 0.0148, "step": 64720 }, { "epoch": 0.93, "learning_rate": 1.9689154068245253e-05, "loss": 0.0148, "step": 64730 }, { "epoch": 0.93, "learning_rate": 1.9689106028506783e-05, "loss": 0.0187, "step": 64740 }, { "epoch": 0.93, "learning_rate": 1.968905798876831e-05, "loss": 0.0143, "step": 64750 }, { "epoch": 0.93, "learning_rate": 1.9689009949029838e-05, "loss": 0.0128, "step": 64760 }, { "epoch": 0.93, "learning_rate": 1.9688961909291367e-05, "loss": 0.0176, "step": 64770 }, { "epoch": 0.93, "learning_rate": 1.9688913869552896e-05, "loss": 0.0167, "step": 64780 }, { "epoch": 0.93, "learning_rate": 1.9688865829814422e-05, "loss": 0.0134, "step": 64790 }, { "epoch": 0.93, "learning_rate": 1.968881779007595e-05, "loss": 0.0153, "step": 64800 }, { "epoch": 0.93, "learning_rate": 1.968876975033748e-05, "loss": 0.0146, "step": 64810 }, { "epoch": 0.93, "learning_rate": 1.9688721710599007e-05, "loss": 0.0149, "step": 64820 }, { "epoch": 0.93, "learning_rate": 1.9688673670860536e-05, "loss": 0.0134, "step": 64830 }, { "epoch": 0.93, "learning_rate": 1.9688625631122065e-05, "loss": 0.0171, "step": 64840 }, { "epoch": 0.93, "learning_rate": 1.9688577591383595e-05, "loss": 0.0121, "step": 64850 }, { "epoch": 0.93, "learning_rate": 1.968852955164512e-05, "loss": 0.0149, "step": 64860 }, { "epoch": 0.93, "learning_rate": 1.968848151190665e-05, "loss": 0.0123, "step": 64870 }, { "epoch": 0.94, "learning_rate": 1.968843347216818e-05, "loss": 0.0185, "step": 64880 }, { "epoch": 0.94, "learning_rate": 1.9688385432429708e-05, "loss": 0.02, "step": 64890 }, { "epoch": 0.94, "learning_rate": 1.9688337392691237e-05, "loss": 0.0138, "step": 64900 }, { "epoch": 0.94, "learning_rate": 1.9688289352952767e-05, "loss": 0.0204, "step": 64910 }, { "epoch": 0.94, "learning_rate": 1.9688241313214293e-05, "loss": 0.0155, "step": 64920 }, { "epoch": 0.94, "learning_rate": 1.9688193273475822e-05, "loss": 0.0198, "step": 64930 }, { "epoch": 0.94, "learning_rate": 1.968814523373735e-05, "loss": 0.0236, "step": 64940 }, { "epoch": 0.94, "learning_rate": 1.9688097193998877e-05, "loss": 0.0114, "step": 64950 }, { "epoch": 0.94, "learning_rate": 1.9688049154260406e-05, "loss": 0.0164, "step": 64960 }, { "epoch": 0.94, "learning_rate": 1.9688001114521936e-05, "loss": 0.0149, "step": 64970 }, { "epoch": 0.94, "learning_rate": 1.9687953074783465e-05, "loss": 0.017, "step": 64980 }, { "epoch": 0.94, "learning_rate": 1.968790503504499e-05, "loss": 0.0115, "step": 64990 }, { "epoch": 0.94, "learning_rate": 1.968785699530652e-05, "loss": 0.0201, "step": 65000 }, { "epoch": 0.94, "learning_rate": 1.968780895556805e-05, "loss": 0.0169, "step": 65010 }, { "epoch": 0.94, "learning_rate": 1.9687760915829575e-05, "loss": 0.015, "step": 65020 }, { "epoch": 0.94, "learning_rate": 1.9687712876091104e-05, "loss": 0.0149, "step": 65030 }, { "epoch": 0.94, "learning_rate": 1.9687664836352634e-05, "loss": 0.012, "step": 65040 }, { "epoch": 0.94, "learning_rate": 1.9687616796614163e-05, "loss": 0.0149, "step": 65050 }, { "epoch": 0.94, "learning_rate": 1.968756875687569e-05, "loss": 0.017, "step": 65060 }, { "epoch": 0.94, "learning_rate": 1.9687520717137218e-05, "loss": 0.0186, "step": 65070 }, { "epoch": 0.94, "learning_rate": 1.9687472677398747e-05, "loss": 0.0129, "step": 65080 }, { "epoch": 0.94, "learning_rate": 1.9687424637660277e-05, "loss": 0.0165, "step": 65090 }, { "epoch": 0.94, "learning_rate": 1.9687376597921803e-05, "loss": 0.0118, "step": 65100 }, { "epoch": 0.94, "learning_rate": 1.9687328558183332e-05, "loss": 0.0191, "step": 65110 }, { "epoch": 0.94, "learning_rate": 1.968728051844486e-05, "loss": 0.0122, "step": 65120 }, { "epoch": 0.94, "learning_rate": 1.9687232478706387e-05, "loss": 0.0184, "step": 65130 }, { "epoch": 0.94, "learning_rate": 1.9687184438967916e-05, "loss": 0.0173, "step": 65140 }, { "epoch": 0.94, "learning_rate": 1.9687136399229446e-05, "loss": 0.0183, "step": 65150 }, { "epoch": 0.94, "learning_rate": 1.9687088359490975e-05, "loss": 0.0129, "step": 65160 }, { "epoch": 0.94, "learning_rate": 1.96870403197525e-05, "loss": 0.0218, "step": 65170 }, { "epoch": 0.94, "learning_rate": 1.968699228001403e-05, "loss": 0.0185, "step": 65180 }, { "epoch": 0.94, "learning_rate": 1.968694424027556e-05, "loss": 0.0151, "step": 65190 }, { "epoch": 0.94, "learning_rate": 1.9686896200537085e-05, "loss": 0.016, "step": 65200 }, { "epoch": 0.94, "learning_rate": 1.9686848160798614e-05, "loss": 0.0153, "step": 65210 }, { "epoch": 0.94, "learning_rate": 1.9686800121060144e-05, "loss": 0.0145, "step": 65220 }, { "epoch": 0.94, "learning_rate": 1.9686752081321673e-05, "loss": 0.0137, "step": 65230 }, { "epoch": 0.94, "learning_rate": 1.96867040415832e-05, "loss": 0.0134, "step": 65240 }, { "epoch": 0.94, "learning_rate": 1.9686656001844728e-05, "loss": 0.0173, "step": 65250 }, { "epoch": 0.94, "learning_rate": 1.9686607962106257e-05, "loss": 0.0137, "step": 65260 }, { "epoch": 0.94, "learning_rate": 1.9686559922367787e-05, "loss": 0.0152, "step": 65270 }, { "epoch": 0.94, "learning_rate": 1.9686511882629312e-05, "loss": 0.0144, "step": 65280 }, { "epoch": 0.94, "learning_rate": 1.9686463842890842e-05, "loss": 0.0188, "step": 65290 }, { "epoch": 0.94, "learning_rate": 1.968641580315237e-05, "loss": 0.0196, "step": 65300 }, { "epoch": 0.94, "learning_rate": 1.9686367763413897e-05, "loss": 0.0175, "step": 65310 }, { "epoch": 0.94, "learning_rate": 1.9686319723675426e-05, "loss": 0.0148, "step": 65320 }, { "epoch": 0.94, "learning_rate": 1.9686271683936955e-05, "loss": 0.0122, "step": 65330 }, { "epoch": 0.94, "learning_rate": 1.9686223644198485e-05, "loss": 0.0094, "step": 65340 }, { "epoch": 0.94, "learning_rate": 1.968617560446001e-05, "loss": 0.0135, "step": 65350 }, { "epoch": 0.94, "learning_rate": 1.968612756472154e-05, "loss": 0.0156, "step": 65360 }, { "epoch": 0.94, "learning_rate": 1.968607952498307e-05, "loss": 0.0132, "step": 65370 }, { "epoch": 0.94, "learning_rate": 1.9686031485244595e-05, "loss": 0.0134, "step": 65380 }, { "epoch": 0.94, "learning_rate": 1.9685983445506124e-05, "loss": 0.0148, "step": 65390 }, { "epoch": 0.94, "learning_rate": 1.9685935405767654e-05, "loss": 0.0144, "step": 65400 }, { "epoch": 0.94, "learning_rate": 1.9685887366029183e-05, "loss": 0.014, "step": 65410 }, { "epoch": 0.94, "learning_rate": 1.968583932629071e-05, "loss": 0.0212, "step": 65420 }, { "epoch": 0.94, "learning_rate": 1.9685791286552238e-05, "loss": 0.0124, "step": 65430 }, { "epoch": 0.94, "learning_rate": 1.9685743246813767e-05, "loss": 0.0167, "step": 65440 }, { "epoch": 0.94, "learning_rate": 1.9685695207075296e-05, "loss": 0.0155, "step": 65450 }, { "epoch": 0.94, "learning_rate": 1.9685647167336822e-05, "loss": 0.0146, "step": 65460 }, { "epoch": 0.94, "learning_rate": 1.968559912759835e-05, "loss": 0.0146, "step": 65470 }, { "epoch": 0.94, "learning_rate": 1.968555108785988e-05, "loss": 0.0143, "step": 65480 }, { "epoch": 0.94, "learning_rate": 1.9685503048121407e-05, "loss": 0.0162, "step": 65490 }, { "epoch": 0.94, "learning_rate": 1.9685455008382936e-05, "loss": 0.0143, "step": 65500 }, { "epoch": 0.94, "learning_rate": 1.9685406968644465e-05, "loss": 0.0139, "step": 65510 }, { "epoch": 0.94, "learning_rate": 1.9685358928905995e-05, "loss": 0.0141, "step": 65520 }, { "epoch": 0.94, "learning_rate": 1.968531088916752e-05, "loss": 0.0203, "step": 65530 }, { "epoch": 0.94, "learning_rate": 1.968526284942905e-05, "loss": 0.015, "step": 65540 }, { "epoch": 0.94, "learning_rate": 1.968521480969058e-05, "loss": 0.0121, "step": 65550 }, { "epoch": 0.94, "learning_rate": 1.9685166769952105e-05, "loss": 0.019, "step": 65560 }, { "epoch": 0.94, "learning_rate": 1.9685118730213634e-05, "loss": 0.0115, "step": 65570 }, { "epoch": 0.95, "learning_rate": 1.9685070690475163e-05, "loss": 0.0154, "step": 65580 }, { "epoch": 0.95, "learning_rate": 1.9685022650736693e-05, "loss": 0.0193, "step": 65590 }, { "epoch": 0.95, "learning_rate": 1.968497461099822e-05, "loss": 0.0135, "step": 65600 }, { "epoch": 0.95, "learning_rate": 1.9684926571259748e-05, "loss": 0.015, "step": 65610 }, { "epoch": 0.95, "learning_rate": 1.9684878531521277e-05, "loss": 0.0191, "step": 65620 }, { "epoch": 0.95, "learning_rate": 1.9684830491782806e-05, "loss": 0.0206, "step": 65630 }, { "epoch": 0.95, "learning_rate": 1.9684782452044332e-05, "loss": 0.014, "step": 65640 }, { "epoch": 0.95, "learning_rate": 1.968473441230586e-05, "loss": 0.0152, "step": 65650 }, { "epoch": 0.95, "learning_rate": 1.968468637256739e-05, "loss": 0.0137, "step": 65660 }, { "epoch": 0.95, "learning_rate": 1.9684638332828917e-05, "loss": 0.0125, "step": 65670 }, { "epoch": 0.95, "learning_rate": 1.9684590293090446e-05, "loss": 0.0133, "step": 65680 }, { "epoch": 0.95, "learning_rate": 1.9684542253351975e-05, "loss": 0.0154, "step": 65690 }, { "epoch": 0.95, "learning_rate": 1.9684494213613505e-05, "loss": 0.0137, "step": 65700 }, { "epoch": 0.95, "learning_rate": 1.968444617387503e-05, "loss": 0.0119, "step": 65710 }, { "epoch": 0.95, "learning_rate": 1.968439813413656e-05, "loss": 0.0163, "step": 65720 }, { "epoch": 0.95, "learning_rate": 1.968435009439809e-05, "loss": 0.0121, "step": 65730 }, { "epoch": 0.95, "learning_rate": 1.9684302054659615e-05, "loss": 0.016, "step": 65740 }, { "epoch": 0.95, "learning_rate": 1.9684254014921144e-05, "loss": 0.012, "step": 65750 }, { "epoch": 0.95, "learning_rate": 1.9684205975182673e-05, "loss": 0.0168, "step": 65760 }, { "epoch": 0.95, "learning_rate": 1.9684157935444203e-05, "loss": 0.015, "step": 65770 }, { "epoch": 0.95, "learning_rate": 1.968410989570573e-05, "loss": 0.015, "step": 65780 }, { "epoch": 0.95, "learning_rate": 1.9684061855967258e-05, "loss": 0.0166, "step": 65790 }, { "epoch": 0.95, "learning_rate": 1.9684013816228787e-05, "loss": 0.0119, "step": 65800 }, { "epoch": 0.95, "learning_rate": 1.9683965776490316e-05, "loss": 0.0166, "step": 65810 }, { "epoch": 0.95, "learning_rate": 1.9683917736751842e-05, "loss": 0.0145, "step": 65820 }, { "epoch": 0.95, "learning_rate": 1.968386969701337e-05, "loss": 0.0135, "step": 65830 }, { "epoch": 0.95, "learning_rate": 1.96838216572749e-05, "loss": 0.0197, "step": 65840 }, { "epoch": 0.95, "learning_rate": 1.9683773617536427e-05, "loss": 0.0172, "step": 65850 }, { "epoch": 0.95, "learning_rate": 1.9683725577797956e-05, "loss": 0.0151, "step": 65860 }, { "epoch": 0.95, "learning_rate": 1.9683677538059485e-05, "loss": 0.0128, "step": 65870 }, { "epoch": 0.95, "learning_rate": 1.9683629498321014e-05, "loss": 0.0172, "step": 65880 }, { "epoch": 0.95, "learning_rate": 1.968358145858254e-05, "loss": 0.0141, "step": 65890 }, { "epoch": 0.95, "learning_rate": 1.968353341884407e-05, "loss": 0.0116, "step": 65900 }, { "epoch": 0.95, "learning_rate": 1.96834853791056e-05, "loss": 0.0199, "step": 65910 }, { "epoch": 0.95, "learning_rate": 1.9683437339367125e-05, "loss": 0.0179, "step": 65920 }, { "epoch": 0.95, "learning_rate": 1.9683389299628654e-05, "loss": 0.0122, "step": 65930 }, { "epoch": 0.95, "learning_rate": 1.9683341259890183e-05, "loss": 0.0139, "step": 65940 }, { "epoch": 0.95, "learning_rate": 1.9683293220151713e-05, "loss": 0.0164, "step": 65950 }, { "epoch": 0.95, "learning_rate": 1.968324518041324e-05, "loss": 0.0189, "step": 65960 }, { "epoch": 0.95, "learning_rate": 1.9683197140674768e-05, "loss": 0.0173, "step": 65970 }, { "epoch": 0.95, "learning_rate": 1.9683149100936297e-05, "loss": 0.0176, "step": 65980 }, { "epoch": 0.95, "learning_rate": 1.9683101061197826e-05, "loss": 0.0228, "step": 65990 }, { "epoch": 0.95, "learning_rate": 1.9683053021459352e-05, "loss": 0.0215, "step": 66000 }, { "epoch": 0.95, "learning_rate": 1.968300498172088e-05, "loss": 0.013, "step": 66010 }, { "epoch": 0.95, "learning_rate": 1.968295694198241e-05, "loss": 0.0181, "step": 66020 }, { "epoch": 0.95, "learning_rate": 1.9682908902243937e-05, "loss": 0.0146, "step": 66030 }, { "epoch": 0.95, "learning_rate": 1.9682860862505466e-05, "loss": 0.0173, "step": 66040 }, { "epoch": 0.95, "learning_rate": 1.9682812822766995e-05, "loss": 0.0137, "step": 66050 }, { "epoch": 0.95, "learning_rate": 1.9682764783028524e-05, "loss": 0.0149, "step": 66060 }, { "epoch": 0.95, "learning_rate": 1.968271674329005e-05, "loss": 0.017, "step": 66070 }, { "epoch": 0.95, "learning_rate": 1.968266870355158e-05, "loss": 0.0174, "step": 66080 }, { "epoch": 0.95, "learning_rate": 1.968262066381311e-05, "loss": 0.0174, "step": 66090 }, { "epoch": 0.95, "learning_rate": 1.9682572624074635e-05, "loss": 0.0202, "step": 66100 }, { "epoch": 0.95, "learning_rate": 1.9682524584336164e-05, "loss": 0.0132, "step": 66110 }, { "epoch": 0.95, "learning_rate": 1.9682481348571542e-05, "loss": 0.0144, "step": 66120 }, { "epoch": 0.95, "learning_rate": 1.9682433308833068e-05, "loss": 0.0131, "step": 66130 }, { "epoch": 0.95, "learning_rate": 1.9682385269094597e-05, "loss": 0.0155, "step": 66140 }, { "epoch": 0.95, "learning_rate": 1.9682337229356126e-05, "loss": 0.0151, "step": 66150 }, { "epoch": 0.95, "learning_rate": 1.9682289189617652e-05, "loss": 0.0176, "step": 66160 }, { "epoch": 0.95, "learning_rate": 1.968224114987918e-05, "loss": 0.0196, "step": 66170 }, { "epoch": 0.95, "learning_rate": 1.968219311014071e-05, "loss": 0.0159, "step": 66180 }, { "epoch": 0.95, "learning_rate": 1.968214507040224e-05, "loss": 0.0162, "step": 66190 }, { "epoch": 0.95, "learning_rate": 1.9682097030663766e-05, "loss": 0.0192, "step": 66200 }, { "epoch": 0.95, "learning_rate": 1.9682048990925295e-05, "loss": 0.012, "step": 66210 }, { "epoch": 0.95, "learning_rate": 1.9682000951186824e-05, "loss": 0.0134, "step": 66220 }, { "epoch": 0.95, "learning_rate": 1.9681952911448354e-05, "loss": 0.0163, "step": 66230 }, { "epoch": 0.95, "learning_rate": 1.968190487170988e-05, "loss": 0.0137, "step": 66240 }, { "epoch": 0.95, "learning_rate": 1.968185683197141e-05, "loss": 0.0137, "step": 66250 }, { "epoch": 0.95, "learning_rate": 1.9681808792232938e-05, "loss": 0.0116, "step": 66260 }, { "epoch": 0.96, "learning_rate": 1.9681760752494464e-05, "loss": 0.0158, "step": 66270 }, { "epoch": 0.96, "learning_rate": 1.9681712712755993e-05, "loss": 0.0199, "step": 66280 }, { "epoch": 0.96, "learning_rate": 1.9681664673017523e-05, "loss": 0.0149, "step": 66290 }, { "epoch": 0.96, "learning_rate": 1.9681616633279052e-05, "loss": 0.017, "step": 66300 }, { "epoch": 0.96, "learning_rate": 1.9681568593540578e-05, "loss": 0.0159, "step": 66310 }, { "epoch": 0.96, "learning_rate": 1.9681520553802107e-05, "loss": 0.0145, "step": 66320 }, { "epoch": 0.96, "learning_rate": 1.9681472514063636e-05, "loss": 0.0136, "step": 66330 }, { "epoch": 0.96, "learning_rate": 1.9681424474325162e-05, "loss": 0.0142, "step": 66340 }, { "epoch": 0.96, "learning_rate": 1.968137643458669e-05, "loss": 0.0173, "step": 66350 }, { "epoch": 0.96, "learning_rate": 1.968132839484822e-05, "loss": 0.0271, "step": 66360 }, { "epoch": 0.96, "learning_rate": 1.968128035510975e-05, "loss": 0.018, "step": 66370 }, { "epoch": 0.96, "learning_rate": 1.9681232315371276e-05, "loss": 0.0166, "step": 66380 }, { "epoch": 0.96, "learning_rate": 1.9681184275632805e-05, "loss": 0.0166, "step": 66390 }, { "epoch": 0.96, "learning_rate": 1.9681136235894334e-05, "loss": 0.0149, "step": 66400 }, { "epoch": 0.96, "learning_rate": 1.968108819615586e-05, "loss": 0.0161, "step": 66410 }, { "epoch": 0.96, "learning_rate": 1.968104015641739e-05, "loss": 0.0193, "step": 66420 }, { "epoch": 0.96, "learning_rate": 1.968099211667892e-05, "loss": 0.012, "step": 66430 }, { "epoch": 0.96, "learning_rate": 1.9680944076940448e-05, "loss": 0.0181, "step": 66440 }, { "epoch": 0.96, "learning_rate": 1.9680896037201974e-05, "loss": 0.0236, "step": 66450 }, { "epoch": 0.96, "learning_rate": 1.9680847997463503e-05, "loss": 0.0132, "step": 66460 }, { "epoch": 0.96, "learning_rate": 1.9680799957725033e-05, "loss": 0.0176, "step": 66470 }, { "epoch": 0.96, "learning_rate": 1.9680751917986562e-05, "loss": 0.0144, "step": 66480 }, { "epoch": 0.96, "learning_rate": 1.9680703878248088e-05, "loss": 0.0174, "step": 66490 }, { "epoch": 0.96, "learning_rate": 1.9680655838509617e-05, "loss": 0.0163, "step": 66500 }, { "epoch": 0.96, "learning_rate": 1.9680607798771146e-05, "loss": 0.0107, "step": 66510 }, { "epoch": 0.96, "learning_rate": 1.9680559759032672e-05, "loss": 0.0196, "step": 66520 }, { "epoch": 0.96, "learning_rate": 1.96805117192942e-05, "loss": 0.0148, "step": 66530 }, { "epoch": 0.96, "learning_rate": 1.968046367955573e-05, "loss": 0.015, "step": 66540 }, { "epoch": 0.96, "learning_rate": 1.968041563981726e-05, "loss": 0.0143, "step": 66550 }, { "epoch": 0.96, "learning_rate": 1.9680367600078786e-05, "loss": 0.014, "step": 66560 }, { "epoch": 0.96, "learning_rate": 1.9680319560340315e-05, "loss": 0.0145, "step": 66570 }, { "epoch": 0.96, "learning_rate": 1.9680271520601844e-05, "loss": 0.0181, "step": 66580 }, { "epoch": 0.96, "learning_rate": 1.968022348086337e-05, "loss": 0.0133, "step": 66590 }, { "epoch": 0.96, "learning_rate": 1.96801754411249e-05, "loss": 0.0178, "step": 66600 }, { "epoch": 0.96, "learning_rate": 1.968012740138643e-05, "loss": 0.0122, "step": 66610 }, { "epoch": 0.96, "learning_rate": 1.9680079361647958e-05, "loss": 0.0149, "step": 66620 }, { "epoch": 0.96, "learning_rate": 1.9680031321909484e-05, "loss": 0.0222, "step": 66630 }, { "epoch": 0.96, "learning_rate": 1.9679983282171013e-05, "loss": 0.0134, "step": 66640 }, { "epoch": 0.96, "learning_rate": 1.9679935242432542e-05, "loss": 0.0194, "step": 66650 }, { "epoch": 0.96, "learning_rate": 1.9679887202694072e-05, "loss": 0.0146, "step": 66660 }, { "epoch": 0.96, "learning_rate": 1.9679839162955598e-05, "loss": 0.0139, "step": 66670 }, { "epoch": 0.96, "learning_rate": 1.9679791123217127e-05, "loss": 0.0161, "step": 66680 }, { "epoch": 0.96, "learning_rate": 1.9679743083478656e-05, "loss": 0.0178, "step": 66690 }, { "epoch": 0.96, "learning_rate": 1.9679695043740182e-05, "loss": 0.0161, "step": 66700 }, { "epoch": 0.96, "learning_rate": 1.967964700400171e-05, "loss": 0.0138, "step": 66710 }, { "epoch": 0.96, "learning_rate": 1.967959896426324e-05, "loss": 0.0118, "step": 66720 }, { "epoch": 0.96, "learning_rate": 1.967955092452477e-05, "loss": 0.0134, "step": 66730 }, { "epoch": 0.96, "learning_rate": 1.9679502884786296e-05, "loss": 0.014, "step": 66740 }, { "epoch": 0.96, "learning_rate": 1.9679454845047825e-05, "loss": 0.015, "step": 66750 }, { "epoch": 0.96, "learning_rate": 1.9679406805309354e-05, "loss": 0.0167, "step": 66760 }, { "epoch": 0.96, "learning_rate": 1.967935876557088e-05, "loss": 0.0124, "step": 66770 }, { "epoch": 0.96, "learning_rate": 1.967931072583241e-05, "loss": 0.0195, "step": 66780 }, { "epoch": 0.96, "learning_rate": 1.967926268609394e-05, "loss": 0.016, "step": 66790 }, { "epoch": 0.96, "learning_rate": 1.9679214646355468e-05, "loss": 0.0118, "step": 66800 }, { "epoch": 0.96, "learning_rate": 1.9679166606616994e-05, "loss": 0.0132, "step": 66810 }, { "epoch": 0.96, "learning_rate": 1.9679118566878523e-05, "loss": 0.0155, "step": 66820 }, { "epoch": 0.96, "learning_rate": 1.9679070527140052e-05, "loss": 0.0137, "step": 66830 }, { "epoch": 0.96, "learning_rate": 1.967902248740158e-05, "loss": 0.0143, "step": 66840 }, { "epoch": 0.96, "learning_rate": 1.9678974447663107e-05, "loss": 0.0129, "step": 66850 }, { "epoch": 0.96, "learning_rate": 1.9678926407924637e-05, "loss": 0.0156, "step": 66860 }, { "epoch": 0.96, "learning_rate": 1.9678878368186166e-05, "loss": 0.016, "step": 66870 }, { "epoch": 0.96, "learning_rate": 1.9678830328447692e-05, "loss": 0.0121, "step": 66880 }, { "epoch": 0.96, "learning_rate": 1.967878228870922e-05, "loss": 0.0147, "step": 66890 }, { "epoch": 0.96, "learning_rate": 1.967873424897075e-05, "loss": 0.0149, "step": 66900 }, { "epoch": 0.96, "learning_rate": 1.967868620923228e-05, "loss": 0.013, "step": 66910 }, { "epoch": 0.96, "learning_rate": 1.9678638169493806e-05, "loss": 0.0121, "step": 66920 }, { "epoch": 0.96, "learning_rate": 1.9678590129755335e-05, "loss": 0.012, "step": 66930 }, { "epoch": 0.96, "learning_rate": 1.9678542090016864e-05, "loss": 0.0132, "step": 66940 }, { "epoch": 0.96, "learning_rate": 1.967849405027839e-05, "loss": 0.0148, "step": 66950 }, { "epoch": 0.97, "learning_rate": 1.967844601053992e-05, "loss": 0.0186, "step": 66960 }, { "epoch": 0.97, "learning_rate": 1.967839797080145e-05, "loss": 0.017, "step": 66970 }, { "epoch": 0.97, "learning_rate": 1.9678349931062978e-05, "loss": 0.0132, "step": 66980 }, { "epoch": 0.97, "learning_rate": 1.9678301891324504e-05, "loss": 0.0138, "step": 66990 }, { "epoch": 0.97, "learning_rate": 1.9678253851586033e-05, "loss": 0.0186, "step": 67000 }, { "epoch": 0.97, "learning_rate": 1.9678205811847562e-05, "loss": 0.0123, "step": 67010 }, { "epoch": 0.97, "learning_rate": 1.967815777210909e-05, "loss": 0.0144, "step": 67020 }, { "epoch": 0.97, "learning_rate": 1.9678109732370617e-05, "loss": 0.0159, "step": 67030 }, { "epoch": 0.97, "learning_rate": 1.9678061692632147e-05, "loss": 0.0199, "step": 67040 }, { "epoch": 0.97, "learning_rate": 1.9678013652893676e-05, "loss": 0.0125, "step": 67050 }, { "epoch": 0.97, "learning_rate": 1.9677965613155202e-05, "loss": 0.0151, "step": 67060 }, { "epoch": 0.97, "learning_rate": 1.967791757341673e-05, "loss": 0.0138, "step": 67070 }, { "epoch": 0.97, "learning_rate": 1.967786953367826e-05, "loss": 0.0132, "step": 67080 }, { "epoch": 0.97, "learning_rate": 1.967782149393979e-05, "loss": 0.0165, "step": 67090 }, { "epoch": 0.97, "learning_rate": 1.9677773454201316e-05, "loss": 0.0141, "step": 67100 }, { "epoch": 0.97, "learning_rate": 1.9677725414462845e-05, "loss": 0.0142, "step": 67110 }, { "epoch": 0.97, "learning_rate": 1.9677677374724374e-05, "loss": 0.0142, "step": 67120 }, { "epoch": 0.97, "learning_rate": 1.96776293349859e-05, "loss": 0.0171, "step": 67130 }, { "epoch": 0.97, "learning_rate": 1.967758129524743e-05, "loss": 0.0167, "step": 67140 }, { "epoch": 0.97, "learning_rate": 1.967753325550896e-05, "loss": 0.0171, "step": 67150 }, { "epoch": 0.97, "learning_rate": 1.9677485215770488e-05, "loss": 0.016, "step": 67160 }, { "epoch": 0.97, "learning_rate": 1.9677437176032014e-05, "loss": 0.0145, "step": 67170 }, { "epoch": 0.97, "learning_rate": 1.9677389136293543e-05, "loss": 0.0116, "step": 67180 }, { "epoch": 0.97, "learning_rate": 1.9677341096555072e-05, "loss": 0.0183, "step": 67190 }, { "epoch": 0.97, "learning_rate": 1.96772930568166e-05, "loss": 0.0121, "step": 67200 }, { "epoch": 0.97, "learning_rate": 1.9677245017078127e-05, "loss": 0.0173, "step": 67210 }, { "epoch": 0.97, "learning_rate": 1.9677196977339657e-05, "loss": 0.0161, "step": 67220 }, { "epoch": 0.97, "learning_rate": 1.9677148937601186e-05, "loss": 0.0104, "step": 67230 }, { "epoch": 0.97, "learning_rate": 1.9677100897862712e-05, "loss": 0.0136, "step": 67240 }, { "epoch": 0.97, "learning_rate": 1.967705285812424e-05, "loss": 0.0117, "step": 67250 }, { "epoch": 0.97, "learning_rate": 1.967700481838577e-05, "loss": 0.0121, "step": 67260 }, { "epoch": 0.97, "learning_rate": 1.96769567786473e-05, "loss": 0.0155, "step": 67270 }, { "epoch": 0.97, "learning_rate": 1.9676908738908825e-05, "loss": 0.0191, "step": 67280 }, { "epoch": 0.97, "learning_rate": 1.9676860699170355e-05, "loss": 0.0154, "step": 67290 }, { "epoch": 0.97, "learning_rate": 1.9676812659431884e-05, "loss": 0.0153, "step": 67300 }, { "epoch": 0.97, "learning_rate": 1.967676461969341e-05, "loss": 0.0127, "step": 67310 }, { "epoch": 0.97, "learning_rate": 1.967671657995494e-05, "loss": 0.0142, "step": 67320 }, { "epoch": 0.97, "learning_rate": 1.967666854021647e-05, "loss": 0.0151, "step": 67330 }, { "epoch": 0.97, "learning_rate": 1.9676620500477998e-05, "loss": 0.0139, "step": 67340 }, { "epoch": 0.97, "learning_rate": 1.9676572460739524e-05, "loss": 0.0129, "step": 67350 }, { "epoch": 0.97, "learning_rate": 1.9676524421001053e-05, "loss": 0.0158, "step": 67360 }, { "epoch": 0.97, "learning_rate": 1.9676476381262582e-05, "loss": 0.0189, "step": 67370 }, { "epoch": 0.97, "learning_rate": 1.967642834152411e-05, "loss": 0.0154, "step": 67380 }, { "epoch": 0.97, "learning_rate": 1.9676380301785637e-05, "loss": 0.0143, "step": 67390 }, { "epoch": 0.97, "learning_rate": 1.9676332262047167e-05, "loss": 0.0197, "step": 67400 }, { "epoch": 0.97, "learning_rate": 1.9676284222308696e-05, "loss": 0.0124, "step": 67410 }, { "epoch": 0.97, "learning_rate": 1.967623618257022e-05, "loss": 0.0175, "step": 67420 }, { "epoch": 0.97, "learning_rate": 1.967618814283175e-05, "loss": 0.0148, "step": 67430 }, { "epoch": 0.97, "learning_rate": 1.967614010309328e-05, "loss": 0.0147, "step": 67440 }, { "epoch": 0.97, "learning_rate": 1.967609206335481e-05, "loss": 0.0152, "step": 67450 }, { "epoch": 0.97, "learning_rate": 1.9676044023616335e-05, "loss": 0.0139, "step": 67460 }, { "epoch": 0.97, "learning_rate": 1.9675995983877865e-05, "loss": 0.0155, "step": 67470 }, { "epoch": 0.97, "learning_rate": 1.9675947944139394e-05, "loss": 0.0191, "step": 67480 }, { "epoch": 0.97, "learning_rate": 1.967589990440092e-05, "loss": 0.0165, "step": 67490 }, { "epoch": 0.97, "learning_rate": 1.967585186466245e-05, "loss": 0.016, "step": 67500 }, { "epoch": 0.97, "learning_rate": 1.967580382492398e-05, "loss": 0.0127, "step": 67510 }, { "epoch": 0.97, "learning_rate": 1.9675755785185508e-05, "loss": 0.0238, "step": 67520 }, { "epoch": 0.97, "learning_rate": 1.9675707745447033e-05, "loss": 0.0126, "step": 67530 }, { "epoch": 0.97, "learning_rate": 1.9675659705708563e-05, "loss": 0.0141, "step": 67540 }, { "epoch": 0.97, "learning_rate": 1.9675611665970092e-05, "loss": 0.0173, "step": 67550 }, { "epoch": 0.97, "learning_rate": 1.967556362623162e-05, "loss": 0.0179, "step": 67560 }, { "epoch": 0.97, "learning_rate": 1.9675515586493147e-05, "loss": 0.0148, "step": 67570 }, { "epoch": 0.97, "learning_rate": 1.9675467546754676e-05, "loss": 0.0191, "step": 67580 }, { "epoch": 0.97, "learning_rate": 1.9675419507016206e-05, "loss": 0.0131, "step": 67590 }, { "epoch": 0.97, "learning_rate": 1.967537146727773e-05, "loss": 0.0133, "step": 67600 }, { "epoch": 0.97, "learning_rate": 1.967532342753926e-05, "loss": 0.0151, "step": 67610 }, { "epoch": 0.97, "learning_rate": 1.967527538780079e-05, "loss": 0.0184, "step": 67620 }, { "epoch": 0.97, "learning_rate": 1.967522734806232e-05, "loss": 0.0155, "step": 67630 }, { "epoch": 0.97, "learning_rate": 1.9675179308323845e-05, "loss": 0.0125, "step": 67640 }, { "epoch": 0.97, "learning_rate": 1.9675131268585375e-05, "loss": 0.0162, "step": 67650 }, { "epoch": 0.98, "learning_rate": 1.9675083228846904e-05, "loss": 0.0147, "step": 67660 }, { "epoch": 0.98, "learning_rate": 1.967503518910843e-05, "loss": 0.0224, "step": 67670 }, { "epoch": 0.98, "learning_rate": 1.967498714936996e-05, "loss": 0.0195, "step": 67680 }, { "epoch": 0.98, "learning_rate": 1.9674939109631488e-05, "loss": 0.0142, "step": 67690 }, { "epoch": 0.98, "learning_rate": 1.9674891069893017e-05, "loss": 0.0122, "step": 67700 }, { "epoch": 0.98, "learning_rate": 1.9674843030154543e-05, "loss": 0.014, "step": 67710 }, { "epoch": 0.98, "learning_rate": 1.9674794990416073e-05, "loss": 0.0178, "step": 67720 }, { "epoch": 0.98, "learning_rate": 1.9674746950677602e-05, "loss": 0.0127, "step": 67730 }, { "epoch": 0.98, "learning_rate": 1.967469891093913e-05, "loss": 0.0167, "step": 67740 }, { "epoch": 0.98, "learning_rate": 1.9674650871200657e-05, "loss": 0.0142, "step": 67750 }, { "epoch": 0.98, "learning_rate": 1.9674602831462186e-05, "loss": 0.0144, "step": 67760 }, { "epoch": 0.98, "learning_rate": 1.9674554791723716e-05, "loss": 0.0125, "step": 67770 }, { "epoch": 0.98, "learning_rate": 1.967450675198524e-05, "loss": 0.0116, "step": 67780 }, { "epoch": 0.98, "learning_rate": 1.967445871224677e-05, "loss": 0.0152, "step": 67790 }, { "epoch": 0.98, "learning_rate": 1.96744106725083e-05, "loss": 0.017, "step": 67800 }, { "epoch": 0.98, "learning_rate": 1.967436263276983e-05, "loss": 0.0164, "step": 67810 }, { "epoch": 0.98, "learning_rate": 1.9674314593031355e-05, "loss": 0.0103, "step": 67820 }, { "epoch": 0.98, "learning_rate": 1.9674266553292884e-05, "loss": 0.0112, "step": 67830 }, { "epoch": 0.98, "learning_rate": 1.9674218513554414e-05, "loss": 0.0159, "step": 67840 }, { "epoch": 0.98, "learning_rate": 1.967417047381594e-05, "loss": 0.0168, "step": 67850 }, { "epoch": 0.98, "learning_rate": 1.967412243407747e-05, "loss": 0.0185, "step": 67860 }, { "epoch": 0.98, "learning_rate": 1.9674074394338998e-05, "loss": 0.0143, "step": 67870 }, { "epoch": 0.98, "learning_rate": 1.9674026354600527e-05, "loss": 0.0131, "step": 67880 }, { "epoch": 0.98, "learning_rate": 1.9673978314862053e-05, "loss": 0.0118, "step": 67890 }, { "epoch": 0.98, "learning_rate": 1.9673930275123583e-05, "loss": 0.0165, "step": 67900 }, { "epoch": 0.98, "learning_rate": 1.9673882235385112e-05, "loss": 0.0167, "step": 67910 }, { "epoch": 0.98, "learning_rate": 1.967383419564664e-05, "loss": 0.0141, "step": 67920 }, { "epoch": 0.98, "learning_rate": 1.9673786155908167e-05, "loss": 0.013, "step": 67930 }, { "epoch": 0.98, "learning_rate": 1.9673738116169696e-05, "loss": 0.0167, "step": 67940 }, { "epoch": 0.98, "learning_rate": 1.9673690076431226e-05, "loss": 0.014, "step": 67950 }, { "epoch": 0.98, "learning_rate": 1.9673642036692755e-05, "loss": 0.0123, "step": 67960 }, { "epoch": 0.98, "learning_rate": 1.9673593996954284e-05, "loss": 0.0158, "step": 67970 }, { "epoch": 0.98, "learning_rate": 1.967354595721581e-05, "loss": 0.0098, "step": 67980 }, { "epoch": 0.98, "learning_rate": 1.967349791747734e-05, "loss": 0.0164, "step": 67990 }, { "epoch": 0.98, "learning_rate": 1.967344987773887e-05, "loss": 0.0124, "step": 68000 }, { "epoch": 0.98, "learning_rate": 1.9673401838000398e-05, "loss": 0.0126, "step": 68010 }, { "epoch": 0.98, "learning_rate": 1.9673353798261924e-05, "loss": 0.0162, "step": 68020 }, { "epoch": 0.98, "learning_rate": 1.9673305758523453e-05, "loss": 0.0159, "step": 68030 }, { "epoch": 0.98, "learning_rate": 1.9673257718784982e-05, "loss": 0.0164, "step": 68040 }, { "epoch": 0.98, "learning_rate": 1.967320967904651e-05, "loss": 0.0169, "step": 68050 }, { "epoch": 0.98, "learning_rate": 1.9673161639308037e-05, "loss": 0.0148, "step": 68060 }, { "epoch": 0.98, "learning_rate": 1.9673113599569567e-05, "loss": 0.0133, "step": 68070 }, { "epoch": 0.98, "learning_rate": 1.9673065559831096e-05, "loss": 0.017, "step": 68080 }, { "epoch": 0.98, "learning_rate": 1.9673017520092622e-05, "loss": 0.0159, "step": 68090 }, { "epoch": 0.98, "learning_rate": 1.967296948035415e-05, "loss": 0.0214, "step": 68100 }, { "epoch": 0.98, "learning_rate": 1.967292144061568e-05, "loss": 0.0193, "step": 68110 }, { "epoch": 0.98, "learning_rate": 1.967287340087721e-05, "loss": 0.0159, "step": 68120 }, { "epoch": 0.98, "learning_rate": 1.9672825361138735e-05, "loss": 0.0112, "step": 68130 }, { "epoch": 0.98, "learning_rate": 1.9672777321400265e-05, "loss": 0.0169, "step": 68140 }, { "epoch": 0.98, "learning_rate": 1.9672729281661794e-05, "loss": 0.0154, "step": 68150 }, { "epoch": 0.98, "learning_rate": 1.967268124192332e-05, "loss": 0.0156, "step": 68160 }, { "epoch": 0.98, "learning_rate": 1.967263320218485e-05, "loss": 0.019, "step": 68170 }, { "epoch": 0.98, "learning_rate": 1.967258516244638e-05, "loss": 0.0149, "step": 68180 }, { "epoch": 0.98, "learning_rate": 1.9672537122707908e-05, "loss": 0.0113, "step": 68190 }, { "epoch": 0.98, "learning_rate": 1.9672489082969434e-05, "loss": 0.0161, "step": 68200 }, { "epoch": 0.98, "learning_rate": 1.9672441043230963e-05, "loss": 0.0165, "step": 68210 }, { "epoch": 0.98, "learning_rate": 1.9672393003492492e-05, "loss": 0.0203, "step": 68220 }, { "epoch": 0.98, "learning_rate": 1.967234496375402e-05, "loss": 0.0145, "step": 68230 }, { "epoch": 0.98, "learning_rate": 1.9672296924015547e-05, "loss": 0.0143, "step": 68240 }, { "epoch": 0.98, "learning_rate": 1.9672248884277077e-05, "loss": 0.0151, "step": 68250 }, { "epoch": 0.98, "learning_rate": 1.9672200844538606e-05, "loss": 0.0134, "step": 68260 }, { "epoch": 0.98, "learning_rate": 1.967215280480013e-05, "loss": 0.0134, "step": 68270 }, { "epoch": 0.98, "learning_rate": 1.967210476506166e-05, "loss": 0.0169, "step": 68280 }, { "epoch": 0.98, "learning_rate": 1.967205672532319e-05, "loss": 0.0204, "step": 68290 }, { "epoch": 0.98, "learning_rate": 1.967200868558472e-05, "loss": 0.0123, "step": 68300 }, { "epoch": 0.98, "learning_rate": 1.9671960645846245e-05, "loss": 0.0147, "step": 68310 }, { "epoch": 0.98, "learning_rate": 1.9671912606107775e-05, "loss": 0.0168, "step": 68320 }, { "epoch": 0.98, "learning_rate": 1.9671864566369304e-05, "loss": 0.0173, "step": 68330 }, { "epoch": 0.98, "learning_rate": 1.967181652663083e-05, "loss": 0.0169, "step": 68340 }, { "epoch": 0.99, "learning_rate": 1.967176848689236e-05, "loss": 0.0121, "step": 68350 }, { "epoch": 0.99, "learning_rate": 1.967172044715389e-05, "loss": 0.0246, "step": 68360 }, { "epoch": 0.99, "learning_rate": 1.9671672407415418e-05, "loss": 0.0135, "step": 68370 }, { "epoch": 0.99, "learning_rate": 1.9671624367676943e-05, "loss": 0.0128, "step": 68380 }, { "epoch": 0.99, "learning_rate": 1.9671576327938473e-05, "loss": 0.0175, "step": 68390 }, { "epoch": 0.99, "learning_rate": 1.9671528288200002e-05, "loss": 0.0136, "step": 68400 }, { "epoch": 0.99, "learning_rate": 1.967148024846153e-05, "loss": 0.016, "step": 68410 }, { "epoch": 0.99, "learning_rate": 1.9671432208723057e-05, "loss": 0.0132, "step": 68420 }, { "epoch": 0.99, "learning_rate": 1.9671384168984586e-05, "loss": 0.0215, "step": 68430 }, { "epoch": 0.99, "learning_rate": 1.9671336129246116e-05, "loss": 0.0208, "step": 68440 }, { "epoch": 0.99, "learning_rate": 1.967128808950764e-05, "loss": 0.0163, "step": 68450 }, { "epoch": 0.99, "learning_rate": 1.967124004976917e-05, "loss": 0.0198, "step": 68460 }, { "epoch": 0.99, "learning_rate": 1.96711920100307e-05, "loss": 0.0146, "step": 68470 }, { "epoch": 0.99, "learning_rate": 1.967114397029223e-05, "loss": 0.0136, "step": 68480 }, { "epoch": 0.99, "learning_rate": 1.9671095930553755e-05, "loss": 0.0119, "step": 68490 }, { "epoch": 0.99, "learning_rate": 1.9671047890815285e-05, "loss": 0.0163, "step": 68500 }, { "epoch": 0.99, "learning_rate": 1.9670999851076814e-05, "loss": 0.0119, "step": 68510 }, { "epoch": 0.99, "learning_rate": 1.967095181133834e-05, "loss": 0.0114, "step": 68520 }, { "epoch": 0.99, "learning_rate": 1.967090377159987e-05, "loss": 0.0144, "step": 68530 }, { "epoch": 0.99, "learning_rate": 1.9670855731861398e-05, "loss": 0.0135, "step": 68540 }, { "epoch": 0.99, "learning_rate": 1.9670807692122927e-05, "loss": 0.0215, "step": 68550 }, { "epoch": 0.99, "learning_rate": 1.9670759652384453e-05, "loss": 0.0207, "step": 68560 }, { "epoch": 0.99, "learning_rate": 1.9670711612645983e-05, "loss": 0.0203, "step": 68570 }, { "epoch": 0.99, "learning_rate": 1.9670663572907512e-05, "loss": 0.0127, "step": 68580 }, { "epoch": 0.99, "learning_rate": 1.967061553316904e-05, "loss": 0.0135, "step": 68590 }, { "epoch": 0.99, "learning_rate": 1.9670567493430567e-05, "loss": 0.0169, "step": 68600 }, { "epoch": 0.99, "learning_rate": 1.9670519453692096e-05, "loss": 0.0161, "step": 68610 }, { "epoch": 0.99, "learning_rate": 1.9670471413953626e-05, "loss": 0.0243, "step": 68620 }, { "epoch": 0.99, "learning_rate": 1.967042337421515e-05, "loss": 0.0175, "step": 68630 }, { "epoch": 0.99, "learning_rate": 1.967037533447668e-05, "loss": 0.0115, "step": 68640 }, { "epoch": 0.99, "learning_rate": 1.967032729473821e-05, "loss": 0.0148, "step": 68650 }, { "epoch": 0.99, "learning_rate": 1.967027925499974e-05, "loss": 0.0174, "step": 68660 }, { "epoch": 0.99, "learning_rate": 1.9670231215261265e-05, "loss": 0.0135, "step": 68670 }, { "epoch": 0.99, "learning_rate": 1.9670183175522794e-05, "loss": 0.0115, "step": 68680 }, { "epoch": 0.99, "learning_rate": 1.9670135135784324e-05, "loss": 0.0136, "step": 68690 }, { "epoch": 0.99, "learning_rate": 1.96700919000197e-05, "loss": 0.0131, "step": 68700 }, { "epoch": 0.99, "learning_rate": 1.9670043860281228e-05, "loss": 0.0128, "step": 68710 }, { "epoch": 0.99, "learning_rate": 1.9669995820542757e-05, "loss": 0.0166, "step": 68720 }, { "epoch": 0.99, "learning_rate": 1.9669947780804283e-05, "loss": 0.0207, "step": 68730 }, { "epoch": 0.99, "learning_rate": 1.9669899741065812e-05, "loss": 0.0122, "step": 68740 }, { "epoch": 0.99, "learning_rate": 1.966985170132734e-05, "loss": 0.0172, "step": 68750 }, { "epoch": 0.99, "learning_rate": 1.9669803661588867e-05, "loss": 0.0138, "step": 68760 }, { "epoch": 0.99, "learning_rate": 1.9669755621850396e-05, "loss": 0.0107, "step": 68770 }, { "epoch": 0.99, "learning_rate": 1.9669707582111926e-05, "loss": 0.0184, "step": 68780 }, { "epoch": 0.99, "learning_rate": 1.9669659542373455e-05, "loss": 0.0123, "step": 68790 }, { "epoch": 0.99, "learning_rate": 1.966961150263498e-05, "loss": 0.0159, "step": 68800 }, { "epoch": 0.99, "learning_rate": 1.966956346289651e-05, "loss": 0.0129, "step": 68810 }, { "epoch": 0.99, "learning_rate": 1.966951542315804e-05, "loss": 0.0133, "step": 68820 }, { "epoch": 0.99, "learning_rate": 1.966946738341957e-05, "loss": 0.014, "step": 68830 }, { "epoch": 0.99, "learning_rate": 1.9669419343681095e-05, "loss": 0.019, "step": 68840 }, { "epoch": 0.99, "learning_rate": 1.9669371303942624e-05, "loss": 0.0176, "step": 68850 }, { "epoch": 0.99, "learning_rate": 1.9669323264204153e-05, "loss": 0.0131, "step": 68860 }, { "epoch": 0.99, "learning_rate": 1.966927522446568e-05, "loss": 0.0135, "step": 68870 }, { "epoch": 0.99, "learning_rate": 1.9669227184727208e-05, "loss": 0.0154, "step": 68880 }, { "epoch": 0.99, "learning_rate": 1.9669179144988738e-05, "loss": 0.0118, "step": 68890 }, { "epoch": 0.99, "learning_rate": 1.9669131105250267e-05, "loss": 0.0103, "step": 68900 }, { "epoch": 0.99, "learning_rate": 1.9669083065511793e-05, "loss": 0.0151, "step": 68910 }, { "epoch": 0.99, "learning_rate": 1.9669035025773322e-05, "loss": 0.0137, "step": 68920 }, { "epoch": 0.99, "learning_rate": 1.966898698603485e-05, "loss": 0.0147, "step": 68930 }, { "epoch": 0.99, "learning_rate": 1.9668938946296377e-05, "loss": 0.015, "step": 68940 }, { "epoch": 0.99, "learning_rate": 1.9668890906557906e-05, "loss": 0.0182, "step": 68950 }, { "epoch": 0.99, "learning_rate": 1.9668842866819436e-05, "loss": 0.0149, "step": 68960 }, { "epoch": 0.99, "learning_rate": 1.9668794827080965e-05, "loss": 0.0131, "step": 68970 }, { "epoch": 0.99, "learning_rate": 1.966874678734249e-05, "loss": 0.0137, "step": 68980 }, { "epoch": 0.99, "learning_rate": 1.966869874760402e-05, "loss": 0.0137, "step": 68990 }, { "epoch": 0.99, "learning_rate": 1.966865070786555e-05, "loss": 0.0101, "step": 69000 }, { "epoch": 0.99, "learning_rate": 1.966860266812708e-05, "loss": 0.016, "step": 69010 }, { "epoch": 0.99, "learning_rate": 1.9668554628388605e-05, "loss": 0.0133, "step": 69020 }, { "epoch": 0.99, "learning_rate": 1.9668506588650134e-05, "loss": 0.0178, "step": 69030 }, { "epoch": 0.99, "learning_rate": 1.9668458548911663e-05, "loss": 0.0131, "step": 69040 }, { "epoch": 1.0, "learning_rate": 1.966841050917319e-05, "loss": 0.0142, "step": 69050 }, { "epoch": 1.0, "learning_rate": 1.9668362469434718e-05, "loss": 0.0147, "step": 69060 }, { "epoch": 1.0, "learning_rate": 1.9668314429696247e-05, "loss": 0.0164, "step": 69070 }, { "epoch": 1.0, "learning_rate": 1.9668266389957777e-05, "loss": 0.0123, "step": 69080 }, { "epoch": 1.0, "learning_rate": 1.9668218350219303e-05, "loss": 0.0152, "step": 69090 }, { "epoch": 1.0, "learning_rate": 1.9668170310480832e-05, "loss": 0.0183, "step": 69100 }, { "epoch": 1.0, "learning_rate": 1.966812227074236e-05, "loss": 0.0405, "step": 69110 }, { "epoch": 1.0, "learning_rate": 1.9668074231003887e-05, "loss": 0.0136, "step": 69120 }, { "epoch": 1.0, "learning_rate": 1.9668026191265416e-05, "loss": 0.0182, "step": 69130 }, { "epoch": 1.0, "learning_rate": 1.9667978151526946e-05, "loss": 0.0161, "step": 69140 }, { "epoch": 1.0, "learning_rate": 1.9667930111788475e-05, "loss": 0.0142, "step": 69150 }, { "epoch": 1.0, "learning_rate": 1.966788207205e-05, "loss": 0.0145, "step": 69160 }, { "epoch": 1.0, "learning_rate": 1.966783403231153e-05, "loss": 0.012, "step": 69170 }, { "epoch": 1.0, "learning_rate": 1.966778599257306e-05, "loss": 0.0207, "step": 69180 }, { "epoch": 1.0, "learning_rate": 1.966773795283459e-05, "loss": 0.0206, "step": 69190 }, { "epoch": 1.0, "learning_rate": 1.9667689913096114e-05, "loss": 0.016, "step": 69200 }, { "epoch": 1.0, "learning_rate": 1.9667641873357644e-05, "loss": 0.0153, "step": 69210 }, { "epoch": 1.0, "learning_rate": 1.9667593833619173e-05, "loss": 0.0157, "step": 69220 }, { "epoch": 1.0, "learning_rate": 1.96675457938807e-05, "loss": 0.0207, "step": 69230 }, { "epoch": 1.0, "learning_rate": 1.9667497754142228e-05, "loss": 0.0171, "step": 69240 }, { "epoch": 1.0, "learning_rate": 1.9667449714403757e-05, "loss": 0.011, "step": 69250 }, { "epoch": 1.0, "learning_rate": 1.9667401674665287e-05, "loss": 0.0116, "step": 69260 }, { "epoch": 1.0, "learning_rate": 1.9667353634926813e-05, "loss": 0.0186, "step": 69270 }, { "epoch": 1.0, "learning_rate": 1.9667305595188342e-05, "loss": 0.0174, "step": 69280 }, { "epoch": 1.0, "learning_rate": 1.966725755544987e-05, "loss": 0.0138, "step": 69290 }, { "epoch": 1.0, "learning_rate": 1.9667209515711397e-05, "loss": 0.0106, "step": 69300 }, { "epoch": 1.0, "learning_rate": 1.9667161475972926e-05, "loss": 0.0142, "step": 69310 }, { "epoch": 1.0, "learning_rate": 1.9667113436234455e-05, "loss": 0.0143, "step": 69320 }, { "epoch": 1.0, "learning_rate": 1.9667065396495985e-05, "loss": 0.0184, "step": 69330 }, { "epoch": 1.0, "learning_rate": 1.966701735675751e-05, "loss": 0.0146, "step": 69340 }, { "epoch": 1.0, "learning_rate": 1.966696931701904e-05, "loss": 0.0187, "step": 69350 }, { "epoch": 1.0, "learning_rate": 1.966692127728057e-05, "loss": 0.0133, "step": 69360 }, { "epoch": 1.0, "learning_rate": 1.9666873237542095e-05, "loss": 0.0186, "step": 69370 }, { "epoch": 1.0, "learning_rate": 1.9666825197803624e-05, "loss": 0.0138, "step": 69380 }, { "epoch": 1.0, "learning_rate": 1.9666777158065154e-05, "loss": 0.0134, "step": 69390 }, { "epoch": 1.0, "learning_rate": 1.9666729118326683e-05, "loss": 0.009, "step": 69400 }, { "epoch": 1.0, "learning_rate": 1.966668107858821e-05, "loss": 0.0172, "step": 69410 }, { "epoch": 1.0, "learning_rate": 1.9666633038849738e-05, "loss": 0.0123, "step": 69420 }, { "epoch": 1.0, "learning_rate": 1.9666584999111267e-05, "loss": 0.0111, "step": 69430 }, { "epoch": 1.0, "learning_rate": 1.9666536959372797e-05, "loss": 0.009, "step": 69440 }, { "epoch": 1.0, "learning_rate": 1.9666488919634322e-05, "loss": 0.0124, "step": 69450 }, { "epoch": 1.0, "learning_rate": 1.9666440879895852e-05, "loss": 0.0171, "step": 69460 }, { "epoch": 1.0, "learning_rate": 1.966639284015738e-05, "loss": 0.0131, "step": 69470 }, { "epoch": 1.0, "learning_rate": 1.9666344800418907e-05, "loss": 0.0123, "step": 69480 }, { "epoch": 1.0, "learning_rate": 1.9666296760680436e-05, "loss": 0.0189, "step": 69490 }, { "epoch": 1.0, "learning_rate": 1.9666248720941965e-05, "loss": 0.0158, "step": 69500 }, { "epoch": 1.0, "learning_rate": 1.9666200681203495e-05, "loss": 0.0109, "step": 69510 }, { "epoch": 1.0, "learning_rate": 1.966615264146502e-05, "loss": 0.0082, "step": 69520 }, { "epoch": 1.0, "learning_rate": 1.966610460172655e-05, "loss": 0.0164, "step": 69530 }, { "epoch": 1.0, "learning_rate": 1.966605656198808e-05, "loss": 0.0139, "step": 69540 }, { "epoch": 1.0, "learning_rate": 1.9666008522249605e-05, "loss": 0.0157, "step": 69550 }, { "epoch": 1.0, "learning_rate": 1.9665960482511134e-05, "loss": 0.0146, "step": 69560 }, { "epoch": 1.0, "learning_rate": 1.9665912442772664e-05, "loss": 0.0176, "step": 69570 }, { "epoch": 1.0, "learning_rate": 1.9665864403034193e-05, "loss": 0.0128, "step": 69580 }, { "epoch": 1.0, "learning_rate": 1.966581636329572e-05, "loss": 0.0111, "step": 69590 }, { "epoch": 1.0, "learning_rate": 1.9665768323557248e-05, "loss": 0.0172, "step": 69600 }, { "epoch": 1.0, "learning_rate": 1.9665720283818777e-05, "loss": 0.0111, "step": 69610 }, { "epoch": 1.0, "learning_rate": 1.9665672244080306e-05, "loss": 0.0107, "step": 69620 }, { "epoch": 1.0, "learning_rate": 1.9665624204341832e-05, "loss": 0.0121, "step": 69630 }, { "epoch": 1.0, "learning_rate": 1.966557616460336e-05, "loss": 0.0152, "step": 69640 }, { "epoch": 1.0, "learning_rate": 1.966552812486489e-05, "loss": 0.0103, "step": 69650 }, { "epoch": 1.0, "learning_rate": 1.9665480085126417e-05, "loss": 0.0128, "step": 69660 }, { "epoch": 1.0, "learning_rate": 1.9665432045387946e-05, "loss": 0.0117, "step": 69670 }, { "epoch": 1.0, "learning_rate": 1.9665384005649475e-05, "loss": 0.0131, "step": 69680 }, { "epoch": 1.0, "learning_rate": 1.9665335965911005e-05, "loss": 0.0139, "step": 69690 }, { "epoch": 1.0, "learning_rate": 1.966528792617253e-05, "loss": 0.009, "step": 69700 }, { "epoch": 1.0, "learning_rate": 1.966523988643406e-05, "loss": 0.0154, "step": 69710 }, { "epoch": 1.0, "learning_rate": 1.966519184669559e-05, "loss": 0.0135, "step": 69720 }, { "epoch": 1.0, "learning_rate": 1.9665143806957115e-05, "loss": 0.0119, "step": 69730 }, { "epoch": 1.01, "learning_rate": 1.9665095767218644e-05, "loss": 0.0107, "step": 69740 }, { "epoch": 1.01, "learning_rate": 1.9665047727480173e-05, "loss": 0.0113, "step": 69750 }, { "epoch": 1.01, "learning_rate": 1.9664999687741703e-05, "loss": 0.0118, "step": 69760 }, { "epoch": 1.01, "learning_rate": 1.966495164800323e-05, "loss": 0.012, "step": 69770 }, { "epoch": 1.01, "learning_rate": 1.9664903608264758e-05, "loss": 0.0155, "step": 69780 }, { "epoch": 1.01, "learning_rate": 1.9664855568526287e-05, "loss": 0.0131, "step": 69790 }, { "epoch": 1.01, "learning_rate": 1.9664807528787816e-05, "loss": 0.0117, "step": 69800 }, { "epoch": 1.01, "learning_rate": 1.9664759489049342e-05, "loss": 0.0102, "step": 69810 }, { "epoch": 1.01, "learning_rate": 1.966471144931087e-05, "loss": 0.0117, "step": 69820 }, { "epoch": 1.01, "learning_rate": 1.96646634095724e-05, "loss": 0.0126, "step": 69830 }, { "epoch": 1.01, "learning_rate": 1.9664615369833927e-05, "loss": 0.0158, "step": 69840 }, { "epoch": 1.01, "learning_rate": 1.9664567330095456e-05, "loss": 0.0104, "step": 69850 }, { "epoch": 1.01, "learning_rate": 1.9664519290356985e-05, "loss": 0.0179, "step": 69860 }, { "epoch": 1.01, "learning_rate": 1.9664471250618515e-05, "loss": 0.0153, "step": 69870 }, { "epoch": 1.01, "learning_rate": 1.966442321088004e-05, "loss": 0.0215, "step": 69880 }, { "epoch": 1.01, "learning_rate": 1.966437517114157e-05, "loss": 0.0121, "step": 69890 }, { "epoch": 1.01, "learning_rate": 1.96643271314031e-05, "loss": 0.0123, "step": 69900 }, { "epoch": 1.01, "learning_rate": 1.9664279091664625e-05, "loss": 0.0141, "step": 69910 }, { "epoch": 1.01, "learning_rate": 1.9664231051926154e-05, "loss": 0.0129, "step": 69920 }, { "epoch": 1.01, "learning_rate": 1.9664183012187683e-05, "loss": 0.0139, "step": 69930 }, { "epoch": 1.01, "learning_rate": 1.9664134972449213e-05, "loss": 0.013, "step": 69940 }, { "epoch": 1.01, "learning_rate": 1.966408693271074e-05, "loss": 0.0123, "step": 69950 }, { "epoch": 1.01, "learning_rate": 1.9664038892972268e-05, "loss": 0.0191, "step": 69960 }, { "epoch": 1.01, "learning_rate": 1.9663990853233797e-05, "loss": 0.0119, "step": 69970 }, { "epoch": 1.01, "learning_rate": 1.9663942813495326e-05, "loss": 0.0115, "step": 69980 }, { "epoch": 1.01, "learning_rate": 1.9663894773756852e-05, "loss": 0.0092, "step": 69990 }, { "epoch": 1.01, "learning_rate": 1.966384673401838e-05, "loss": 0.0204, "step": 70000 }, { "epoch": 1.01, "learning_rate": 1.966379869427991e-05, "loss": 0.0124, "step": 70010 }, { "epoch": 1.01, "learning_rate": 1.9663750654541437e-05, "loss": 0.0161, "step": 70020 }, { "epoch": 1.01, "learning_rate": 1.9663702614802966e-05, "loss": 0.0087, "step": 70030 }, { "epoch": 1.01, "learning_rate": 1.9663654575064495e-05, "loss": 0.0148, "step": 70040 }, { "epoch": 1.01, "learning_rate": 1.9663606535326024e-05, "loss": 0.0199, "step": 70050 }, { "epoch": 1.01, "learning_rate": 1.966355849558755e-05, "loss": 0.0108, "step": 70060 }, { "epoch": 1.01, "learning_rate": 1.966351045584908e-05, "loss": 0.0174, "step": 70070 }, { "epoch": 1.01, "learning_rate": 1.966346241611061e-05, "loss": 0.0137, "step": 70080 }, { "epoch": 1.01, "learning_rate": 1.9663414376372135e-05, "loss": 0.0118, "step": 70090 }, { "epoch": 1.01, "learning_rate": 1.9663366336633664e-05, "loss": 0.0096, "step": 70100 }, { "epoch": 1.01, "learning_rate": 1.9663318296895193e-05, "loss": 0.0103, "step": 70110 }, { "epoch": 1.01, "learning_rate": 1.9663270257156723e-05, "loss": 0.014, "step": 70120 }, { "epoch": 1.01, "learning_rate": 1.966322221741825e-05, "loss": 0.0155, "step": 70130 }, { "epoch": 1.01, "learning_rate": 1.9663174177679778e-05, "loss": 0.0124, "step": 70140 }, { "epoch": 1.01, "learning_rate": 1.9663126137941307e-05, "loss": 0.011, "step": 70150 }, { "epoch": 1.01, "learning_rate": 1.9663078098202836e-05, "loss": 0.0116, "step": 70160 }, { "epoch": 1.01, "learning_rate": 1.9663030058464362e-05, "loss": 0.0155, "step": 70170 }, { "epoch": 1.01, "learning_rate": 1.966298201872589e-05, "loss": 0.0143, "step": 70180 }, { "epoch": 1.01, "learning_rate": 1.966293397898742e-05, "loss": 0.0093, "step": 70190 }, { "epoch": 1.01, "learning_rate": 1.9662885939248947e-05, "loss": 0.0114, "step": 70200 }, { "epoch": 1.01, "learning_rate": 1.9662837899510476e-05, "loss": 0.0132, "step": 70210 }, { "epoch": 1.01, "learning_rate": 1.9662789859772005e-05, "loss": 0.0174, "step": 70220 }, { "epoch": 1.01, "learning_rate": 1.9662741820033534e-05, "loss": 0.0112, "step": 70230 }, { "epoch": 1.01, "learning_rate": 1.966269378029506e-05, "loss": 0.0128, "step": 70240 }, { "epoch": 1.01, "learning_rate": 1.966264574055659e-05, "loss": 0.0155, "step": 70250 }, { "epoch": 1.01, "learning_rate": 1.966259770081812e-05, "loss": 0.0117, "step": 70260 }, { "epoch": 1.01, "learning_rate": 1.9662549661079645e-05, "loss": 0.0198, "step": 70270 }, { "epoch": 1.01, "learning_rate": 1.9662501621341174e-05, "loss": 0.0178, "step": 70280 }, { "epoch": 1.01, "learning_rate": 1.9662453581602703e-05, "loss": 0.0108, "step": 70290 }, { "epoch": 1.01, "learning_rate": 1.9662405541864232e-05, "loss": 0.0144, "step": 70300 }, { "epoch": 1.01, "learning_rate": 1.966235750212576e-05, "loss": 0.0088, "step": 70310 }, { "epoch": 1.01, "learning_rate": 1.9662309462387288e-05, "loss": 0.0125, "step": 70320 }, { "epoch": 1.01, "learning_rate": 1.9662261422648817e-05, "loss": 0.016, "step": 70330 }, { "epoch": 1.01, "learning_rate": 1.9662213382910346e-05, "loss": 0.0137, "step": 70340 }, { "epoch": 1.01, "learning_rate": 1.9662165343171872e-05, "loss": 0.0125, "step": 70350 }, { "epoch": 1.01, "learning_rate": 1.96621173034334e-05, "loss": 0.0152, "step": 70360 }, { "epoch": 1.01, "learning_rate": 1.966206926369493e-05, "loss": 0.0124, "step": 70370 }, { "epoch": 1.01, "learning_rate": 1.9662021223956456e-05, "loss": 0.0127, "step": 70380 }, { "epoch": 1.01, "learning_rate": 1.9661973184217986e-05, "loss": 0.0132, "step": 70390 }, { "epoch": 1.01, "learning_rate": 1.9661925144479515e-05, "loss": 0.0176, "step": 70400 }, { "epoch": 1.01, "learning_rate": 1.9661877104741044e-05, "loss": 0.0162, "step": 70410 }, { "epoch": 1.01, "learning_rate": 1.966182906500257e-05, "loss": 0.0139, "step": 70420 }, { "epoch": 1.02, "learning_rate": 1.96617810252641e-05, "loss": 0.0173, "step": 70430 }, { "epoch": 1.02, "learning_rate": 1.966173298552563e-05, "loss": 0.0139, "step": 70440 }, { "epoch": 1.02, "learning_rate": 1.9661684945787155e-05, "loss": 0.0123, "step": 70450 }, { "epoch": 1.02, "learning_rate": 1.9661636906048684e-05, "loss": 0.0188, "step": 70460 }, { "epoch": 1.02, "learning_rate": 1.9661588866310213e-05, "loss": 0.0197, "step": 70470 }, { "epoch": 1.02, "learning_rate": 1.9661540826571742e-05, "loss": 0.0177, "step": 70480 }, { "epoch": 1.02, "learning_rate": 1.9661492786833268e-05, "loss": 0.0115, "step": 70490 }, { "epoch": 1.02, "learning_rate": 1.9661444747094798e-05, "loss": 0.0201, "step": 70500 }, { "epoch": 1.02, "learning_rate": 1.9661396707356327e-05, "loss": 0.0138, "step": 70510 }, { "epoch": 1.02, "learning_rate": 1.9661348667617856e-05, "loss": 0.0134, "step": 70520 }, { "epoch": 1.02, "learning_rate": 1.9661300627879382e-05, "loss": 0.0142, "step": 70530 }, { "epoch": 1.02, "learning_rate": 1.966125258814091e-05, "loss": 0.0139, "step": 70540 }, { "epoch": 1.02, "learning_rate": 1.966120454840244e-05, "loss": 0.0125, "step": 70550 }, { "epoch": 1.02, "learning_rate": 1.9661156508663966e-05, "loss": 0.0165, "step": 70560 }, { "epoch": 1.02, "learning_rate": 1.9661108468925496e-05, "loss": 0.0152, "step": 70570 }, { "epoch": 1.02, "learning_rate": 1.9661060429187025e-05, "loss": 0.0152, "step": 70580 }, { "epoch": 1.02, "learning_rate": 1.9661012389448554e-05, "loss": 0.0122, "step": 70590 }, { "epoch": 1.02, "learning_rate": 1.966096434971008e-05, "loss": 0.0083, "step": 70600 }, { "epoch": 1.02, "learning_rate": 1.966091630997161e-05, "loss": 0.0107, "step": 70610 }, { "epoch": 1.02, "learning_rate": 1.966086827023314e-05, "loss": 0.0127, "step": 70620 }, { "epoch": 1.02, "learning_rate": 1.9660820230494664e-05, "loss": 0.0137, "step": 70630 }, { "epoch": 1.02, "learning_rate": 1.9660772190756194e-05, "loss": 0.0102, "step": 70640 }, { "epoch": 1.02, "learning_rate": 1.9660724151017723e-05, "loss": 0.0119, "step": 70650 }, { "epoch": 1.02, "learning_rate": 1.9660676111279252e-05, "loss": 0.0135, "step": 70660 }, { "epoch": 1.02, "learning_rate": 1.9660628071540778e-05, "loss": 0.0114, "step": 70670 }, { "epoch": 1.02, "learning_rate": 1.9660580031802307e-05, "loss": 0.0136, "step": 70680 }, { "epoch": 1.02, "learning_rate": 1.9660531992063837e-05, "loss": 0.0115, "step": 70690 }, { "epoch": 1.02, "learning_rate": 1.9660483952325366e-05, "loss": 0.0145, "step": 70700 }, { "epoch": 1.02, "learning_rate": 1.9660435912586892e-05, "loss": 0.0124, "step": 70710 }, { "epoch": 1.02, "learning_rate": 1.966038787284842e-05, "loss": 0.0126, "step": 70720 }, { "epoch": 1.02, "learning_rate": 1.966033983310995e-05, "loss": 0.0159, "step": 70730 }, { "epoch": 1.02, "learning_rate": 1.9660291793371476e-05, "loss": 0.0142, "step": 70740 }, { "epoch": 1.02, "learning_rate": 1.9660243753633006e-05, "loss": 0.0123, "step": 70750 }, { "epoch": 1.02, "learning_rate": 1.9660195713894535e-05, "loss": 0.016, "step": 70760 }, { "epoch": 1.02, "learning_rate": 1.9660147674156064e-05, "loss": 0.0159, "step": 70770 }, { "epoch": 1.02, "learning_rate": 1.966009963441759e-05, "loss": 0.0129, "step": 70780 }, { "epoch": 1.02, "learning_rate": 1.966005159467912e-05, "loss": 0.0121, "step": 70790 }, { "epoch": 1.02, "learning_rate": 1.966000355494065e-05, "loss": 0.014, "step": 70800 }, { "epoch": 1.02, "learning_rate": 1.9659955515202174e-05, "loss": 0.0104, "step": 70810 }, { "epoch": 1.02, "learning_rate": 1.9659907475463704e-05, "loss": 0.0087, "step": 70820 }, { "epoch": 1.02, "learning_rate": 1.9659859435725233e-05, "loss": 0.0143, "step": 70830 }, { "epoch": 1.02, "learning_rate": 1.9659811395986762e-05, "loss": 0.0098, "step": 70840 }, { "epoch": 1.02, "learning_rate": 1.9659763356248288e-05, "loss": 0.0156, "step": 70850 }, { "epoch": 1.02, "learning_rate": 1.9659715316509817e-05, "loss": 0.015, "step": 70860 }, { "epoch": 1.02, "learning_rate": 1.9659667276771347e-05, "loss": 0.0088, "step": 70870 }, { "epoch": 1.02, "learning_rate": 1.9659619237032876e-05, "loss": 0.0104, "step": 70880 }, { "epoch": 1.02, "learning_rate": 1.9659571197294402e-05, "loss": 0.0106, "step": 70890 }, { "epoch": 1.02, "learning_rate": 1.965952315755593e-05, "loss": 0.0122, "step": 70900 }, { "epoch": 1.02, "learning_rate": 1.965947511781746e-05, "loss": 0.0101, "step": 70910 }, { "epoch": 1.02, "learning_rate": 1.9659427078078986e-05, "loss": 0.0104, "step": 70920 }, { "epoch": 1.02, "learning_rate": 1.9659379038340515e-05, "loss": 0.0132, "step": 70930 }, { "epoch": 1.02, "learning_rate": 1.9659330998602045e-05, "loss": 0.0117, "step": 70940 }, { "epoch": 1.02, "learning_rate": 1.9659282958863574e-05, "loss": 0.0118, "step": 70950 }, { "epoch": 1.02, "learning_rate": 1.96592349191251e-05, "loss": 0.0179, "step": 70960 }, { "epoch": 1.02, "learning_rate": 1.965918687938663e-05, "loss": 0.0081, "step": 70970 }, { "epoch": 1.02, "learning_rate": 1.965913883964816e-05, "loss": 0.0163, "step": 70980 }, { "epoch": 1.02, "learning_rate": 1.9659090799909684e-05, "loss": 0.0134, "step": 70990 }, { "epoch": 1.02, "learning_rate": 1.9659042760171214e-05, "loss": 0.0131, "step": 71000 }, { "epoch": 1.02, "learning_rate": 1.9658994720432743e-05, "loss": 0.0097, "step": 71010 }, { "epoch": 1.02, "learning_rate": 1.9658946680694272e-05, "loss": 0.0192, "step": 71020 }, { "epoch": 1.02, "learning_rate": 1.9658898640955798e-05, "loss": 0.0157, "step": 71030 }, { "epoch": 1.02, "learning_rate": 1.965885060121733e-05, "loss": 0.0125, "step": 71040 }, { "epoch": 1.02, "learning_rate": 1.9658802561478857e-05, "loss": 0.0135, "step": 71050 }, { "epoch": 1.02, "learning_rate": 1.9658754521740386e-05, "loss": 0.0127, "step": 71060 }, { "epoch": 1.02, "learning_rate": 1.9658706482001915e-05, "loss": 0.0134, "step": 71070 }, { "epoch": 1.02, "learning_rate": 1.9658658442263444e-05, "loss": 0.016, "step": 71080 }, { "epoch": 1.02, "learning_rate": 1.965861040252497e-05, "loss": 0.0117, "step": 71090 }, { "epoch": 1.02, "learning_rate": 1.96585623627865e-05, "loss": 0.0156, "step": 71100 }, { "epoch": 1.02, "learning_rate": 1.965851432304803e-05, "loss": 0.0096, "step": 71110 }, { "epoch": 1.02, "learning_rate": 1.9658466283309555e-05, "loss": 0.0135, "step": 71120 }, { "epoch": 1.03, "learning_rate": 1.9658418243571084e-05, "loss": 0.0118, "step": 71130 }, { "epoch": 1.03, "learning_rate": 1.9658370203832613e-05, "loss": 0.0119, "step": 71140 }, { "epoch": 1.03, "learning_rate": 1.9658322164094142e-05, "loss": 0.0148, "step": 71150 }, { "epoch": 1.03, "learning_rate": 1.965827412435567e-05, "loss": 0.0151, "step": 71160 }, { "epoch": 1.03, "learning_rate": 1.9658226084617198e-05, "loss": 0.0121, "step": 71170 }, { "epoch": 1.03, "learning_rate": 1.9658178044878727e-05, "loss": 0.0097, "step": 71180 }, { "epoch": 1.03, "learning_rate": 1.9658130005140256e-05, "loss": 0.0138, "step": 71190 }, { "epoch": 1.03, "learning_rate": 1.9658081965401782e-05, "loss": 0.0128, "step": 71200 }, { "epoch": 1.03, "learning_rate": 1.965803392566331e-05, "loss": 0.0115, "step": 71210 }, { "epoch": 1.03, "learning_rate": 1.965798588592484e-05, "loss": 0.0108, "step": 71220 }, { "epoch": 1.03, "learning_rate": 1.9657937846186366e-05, "loss": 0.0088, "step": 71230 }, { "epoch": 1.03, "learning_rate": 1.9657889806447896e-05, "loss": 0.0141, "step": 71240 }, { "epoch": 1.03, "learning_rate": 1.9657841766709425e-05, "loss": 0.0105, "step": 71250 }, { "epoch": 1.03, "learning_rate": 1.9657793726970954e-05, "loss": 0.0099, "step": 71260 }, { "epoch": 1.03, "learning_rate": 1.965774568723248e-05, "loss": 0.0137, "step": 71270 }, { "epoch": 1.03, "learning_rate": 1.9657702451467855e-05, "loss": 0.0085, "step": 71280 }, { "epoch": 1.03, "learning_rate": 1.9657654411729384e-05, "loss": 0.0105, "step": 71290 }, { "epoch": 1.03, "learning_rate": 1.965760637199091e-05, "loss": 0.0145, "step": 71300 }, { "epoch": 1.03, "learning_rate": 1.965755833225244e-05, "loss": 0.0131, "step": 71310 }, { "epoch": 1.03, "learning_rate": 1.965751029251397e-05, "loss": 0.0124, "step": 71320 }, { "epoch": 1.03, "learning_rate": 1.9657462252775498e-05, "loss": 0.0114, "step": 71330 }, { "epoch": 1.03, "learning_rate": 1.9657414213037024e-05, "loss": 0.0144, "step": 71340 }, { "epoch": 1.03, "learning_rate": 1.9657366173298553e-05, "loss": 0.0097, "step": 71350 }, { "epoch": 1.03, "learning_rate": 1.9657318133560082e-05, "loss": 0.0178, "step": 71360 }, { "epoch": 1.03, "learning_rate": 1.965727009382161e-05, "loss": 0.0165, "step": 71370 }, { "epoch": 1.03, "learning_rate": 1.9657222054083137e-05, "loss": 0.0168, "step": 71380 }, { "epoch": 1.03, "learning_rate": 1.9657174014344667e-05, "loss": 0.0124, "step": 71390 }, { "epoch": 1.03, "learning_rate": 1.9657125974606196e-05, "loss": 0.0133, "step": 71400 }, { "epoch": 1.03, "learning_rate": 1.9657077934867722e-05, "loss": 0.017, "step": 71410 }, { "epoch": 1.03, "learning_rate": 1.965702989512925e-05, "loss": 0.016, "step": 71420 }, { "epoch": 1.03, "learning_rate": 1.965698185539078e-05, "loss": 0.0126, "step": 71430 }, { "epoch": 1.03, "learning_rate": 1.965693381565231e-05, "loss": 0.0137, "step": 71440 }, { "epoch": 1.03, "learning_rate": 1.9656885775913835e-05, "loss": 0.013, "step": 71450 }, { "epoch": 1.03, "learning_rate": 1.9656837736175365e-05, "loss": 0.0163, "step": 71460 }, { "epoch": 1.03, "learning_rate": 1.9656789696436894e-05, "loss": 0.0118, "step": 71470 }, { "epoch": 1.03, "learning_rate": 1.965674165669842e-05, "loss": 0.0131, "step": 71480 }, { "epoch": 1.03, "learning_rate": 1.965669361695995e-05, "loss": 0.014, "step": 71490 }, { "epoch": 1.03, "learning_rate": 1.965664557722148e-05, "loss": 0.0116, "step": 71500 }, { "epoch": 1.03, "learning_rate": 1.9656597537483008e-05, "loss": 0.0117, "step": 71510 }, { "epoch": 1.03, "learning_rate": 1.9656549497744534e-05, "loss": 0.0118, "step": 71520 }, { "epoch": 1.03, "learning_rate": 1.9656501458006063e-05, "loss": 0.0201, "step": 71530 }, { "epoch": 1.03, "learning_rate": 1.9656453418267592e-05, "loss": 0.016, "step": 71540 }, { "epoch": 1.03, "learning_rate": 1.965640537852912e-05, "loss": 0.0114, "step": 71550 }, { "epoch": 1.03, "learning_rate": 1.965635733879065e-05, "loss": 0.0135, "step": 71560 }, { "epoch": 1.03, "learning_rate": 1.965630929905218e-05, "loss": 0.0097, "step": 71570 }, { "epoch": 1.03, "learning_rate": 1.9656261259313706e-05, "loss": 0.0117, "step": 71580 }, { "epoch": 1.03, "learning_rate": 1.9656213219575235e-05, "loss": 0.0119, "step": 71590 }, { "epoch": 1.03, "learning_rate": 1.9656165179836764e-05, "loss": 0.0134, "step": 71600 }, { "epoch": 1.03, "learning_rate": 1.9656117140098294e-05, "loss": 0.0132, "step": 71610 }, { "epoch": 1.03, "learning_rate": 1.965606910035982e-05, "loss": 0.0117, "step": 71620 }, { "epoch": 1.03, "learning_rate": 1.965602106062135e-05, "loss": 0.0146, "step": 71630 }, { "epoch": 1.03, "learning_rate": 1.9655973020882878e-05, "loss": 0.0134, "step": 71640 }, { "epoch": 1.03, "learning_rate": 1.9655924981144404e-05, "loss": 0.0124, "step": 71650 }, { "epoch": 1.03, "learning_rate": 1.9655876941405933e-05, "loss": 0.0135, "step": 71660 }, { "epoch": 1.03, "learning_rate": 1.9655828901667462e-05, "loss": 0.0148, "step": 71670 }, { "epoch": 1.03, "learning_rate": 1.9655780861928992e-05, "loss": 0.0219, "step": 71680 }, { "epoch": 1.03, "learning_rate": 1.9655732822190518e-05, "loss": 0.0119, "step": 71690 }, { "epoch": 1.03, "learning_rate": 1.9655684782452047e-05, "loss": 0.0146, "step": 71700 }, { "epoch": 1.03, "learning_rate": 1.9655636742713576e-05, "loss": 0.0147, "step": 71710 }, { "epoch": 1.03, "learning_rate": 1.9655588702975102e-05, "loss": 0.0164, "step": 71720 }, { "epoch": 1.03, "learning_rate": 1.965554066323663e-05, "loss": 0.0127, "step": 71730 }, { "epoch": 1.03, "learning_rate": 1.965549262349816e-05, "loss": 0.0124, "step": 71740 }, { "epoch": 1.03, "learning_rate": 1.965544458375969e-05, "loss": 0.0193, "step": 71750 }, { "epoch": 1.03, "learning_rate": 1.9655396544021216e-05, "loss": 0.0127, "step": 71760 }, { "epoch": 1.03, "learning_rate": 1.9655348504282745e-05, "loss": 0.0137, "step": 71770 }, { "epoch": 1.03, "learning_rate": 1.9655300464544274e-05, "loss": 0.013, "step": 71780 }, { "epoch": 1.03, "learning_rate": 1.9655252424805803e-05, "loss": 0.0126, "step": 71790 }, { "epoch": 1.03, "learning_rate": 1.965520438506733e-05, "loss": 0.0125, "step": 71800 }, { "epoch": 1.03, "learning_rate": 1.965515634532886e-05, "loss": 0.0118, "step": 71810 }, { "epoch": 1.04, "learning_rate": 1.9655108305590388e-05, "loss": 0.0143, "step": 71820 }, { "epoch": 1.04, "learning_rate": 1.9655060265851914e-05, "loss": 0.012, "step": 71830 }, { "epoch": 1.04, "learning_rate": 1.9655012226113443e-05, "loss": 0.0154, "step": 71840 }, { "epoch": 1.04, "learning_rate": 1.9654964186374972e-05, "loss": 0.0122, "step": 71850 }, { "epoch": 1.04, "learning_rate": 1.96549161466365e-05, "loss": 0.0127, "step": 71860 }, { "epoch": 1.04, "learning_rate": 1.9654868106898027e-05, "loss": 0.013, "step": 71870 }, { "epoch": 1.04, "learning_rate": 1.9654820067159557e-05, "loss": 0.0139, "step": 71880 }, { "epoch": 1.04, "learning_rate": 1.9654772027421086e-05, "loss": 0.0134, "step": 71890 }, { "epoch": 1.04, "learning_rate": 1.9654723987682612e-05, "loss": 0.0157, "step": 71900 }, { "epoch": 1.04, "learning_rate": 1.965467594794414e-05, "loss": 0.0114, "step": 71910 }, { "epoch": 1.04, "learning_rate": 1.965462790820567e-05, "loss": 0.0117, "step": 71920 }, { "epoch": 1.04, "learning_rate": 1.96545798684672e-05, "loss": 0.0122, "step": 71930 }, { "epoch": 1.04, "learning_rate": 1.9654531828728726e-05, "loss": 0.0192, "step": 71940 }, { "epoch": 1.04, "learning_rate": 1.9654483788990255e-05, "loss": 0.0132, "step": 71950 }, { "epoch": 1.04, "learning_rate": 1.9654435749251784e-05, "loss": 0.0111, "step": 71960 }, { "epoch": 1.04, "learning_rate": 1.9654387709513313e-05, "loss": 0.0143, "step": 71970 }, { "epoch": 1.04, "learning_rate": 1.965433966977484e-05, "loss": 0.014, "step": 71980 }, { "epoch": 1.04, "learning_rate": 1.965429163003637e-05, "loss": 0.0123, "step": 71990 }, { "epoch": 1.04, "learning_rate": 1.9654243590297898e-05, "loss": 0.0104, "step": 72000 }, { "epoch": 1.04, "learning_rate": 1.9654195550559424e-05, "loss": 0.0107, "step": 72010 }, { "epoch": 1.04, "learning_rate": 1.9654147510820953e-05, "loss": 0.0178, "step": 72020 }, { "epoch": 1.04, "learning_rate": 1.9654099471082482e-05, "loss": 0.0142, "step": 72030 }, { "epoch": 1.04, "learning_rate": 1.965405143134401e-05, "loss": 0.0154, "step": 72040 }, { "epoch": 1.04, "learning_rate": 1.9654003391605537e-05, "loss": 0.0092, "step": 72050 }, { "epoch": 1.04, "learning_rate": 1.9653955351867067e-05, "loss": 0.0125, "step": 72060 }, { "epoch": 1.04, "learning_rate": 1.9653907312128596e-05, "loss": 0.0161, "step": 72070 }, { "epoch": 1.04, "learning_rate": 1.9653859272390122e-05, "loss": 0.013, "step": 72080 }, { "epoch": 1.04, "learning_rate": 1.965381123265165e-05, "loss": 0.011, "step": 72090 }, { "epoch": 1.04, "learning_rate": 1.965376319291318e-05, "loss": 0.014, "step": 72100 }, { "epoch": 1.04, "learning_rate": 1.965371515317471e-05, "loss": 0.0181, "step": 72110 }, { "epoch": 1.04, "learning_rate": 1.9653667113436236e-05, "loss": 0.0136, "step": 72120 }, { "epoch": 1.04, "learning_rate": 1.9653619073697765e-05, "loss": 0.0169, "step": 72130 }, { "epoch": 1.04, "learning_rate": 1.9653571033959294e-05, "loss": 0.0144, "step": 72140 }, { "epoch": 1.04, "learning_rate": 1.9653522994220823e-05, "loss": 0.0116, "step": 72150 }, { "epoch": 1.04, "learning_rate": 1.965347495448235e-05, "loss": 0.0164, "step": 72160 }, { "epoch": 1.04, "learning_rate": 1.965342691474388e-05, "loss": 0.0112, "step": 72170 }, { "epoch": 1.04, "learning_rate": 1.9653378875005408e-05, "loss": 0.0115, "step": 72180 }, { "epoch": 1.04, "learning_rate": 1.9653330835266934e-05, "loss": 0.0153, "step": 72190 }, { "epoch": 1.04, "learning_rate": 1.9653282795528463e-05, "loss": 0.0188, "step": 72200 }, { "epoch": 1.04, "learning_rate": 1.9653234755789992e-05, "loss": 0.0173, "step": 72210 }, { "epoch": 1.04, "learning_rate": 1.965318671605152e-05, "loss": 0.0122, "step": 72220 }, { "epoch": 1.04, "learning_rate": 1.9653138676313047e-05, "loss": 0.0122, "step": 72230 }, { "epoch": 1.04, "learning_rate": 1.9653090636574577e-05, "loss": 0.0119, "step": 72240 }, { "epoch": 1.04, "learning_rate": 1.9653042596836106e-05, "loss": 0.0185, "step": 72250 }, { "epoch": 1.04, "learning_rate": 1.9652994557097632e-05, "loss": 0.016, "step": 72260 }, { "epoch": 1.04, "learning_rate": 1.965294651735916e-05, "loss": 0.0111, "step": 72270 }, { "epoch": 1.04, "learning_rate": 1.965289847762069e-05, "loss": 0.0155, "step": 72280 }, { "epoch": 1.04, "learning_rate": 1.965285043788222e-05, "loss": 0.0138, "step": 72290 }, { "epoch": 1.04, "learning_rate": 1.9652802398143745e-05, "loss": 0.0121, "step": 72300 }, { "epoch": 1.04, "learning_rate": 1.9652754358405275e-05, "loss": 0.0139, "step": 72310 }, { "epoch": 1.04, "learning_rate": 1.9652706318666804e-05, "loss": 0.0187, "step": 72320 }, { "epoch": 1.04, "learning_rate": 1.9652658278928333e-05, "loss": 0.0161, "step": 72330 }, { "epoch": 1.04, "learning_rate": 1.965261023918986e-05, "loss": 0.017, "step": 72340 }, { "epoch": 1.04, "learning_rate": 1.965256219945139e-05, "loss": 0.0165, "step": 72350 }, { "epoch": 1.04, "learning_rate": 1.9652514159712918e-05, "loss": 0.011, "step": 72360 }, { "epoch": 1.04, "learning_rate": 1.9652466119974444e-05, "loss": 0.0159, "step": 72370 }, { "epoch": 1.04, "learning_rate": 1.9652418080235973e-05, "loss": 0.0157, "step": 72380 }, { "epoch": 1.04, "learning_rate": 1.9652370040497502e-05, "loss": 0.0155, "step": 72390 }, { "epoch": 1.04, "learning_rate": 1.965232200075903e-05, "loss": 0.011, "step": 72400 }, { "epoch": 1.04, "learning_rate": 1.9652273961020557e-05, "loss": 0.0129, "step": 72410 }, { "epoch": 1.04, "learning_rate": 1.9652225921282087e-05, "loss": 0.0121, "step": 72420 }, { "epoch": 1.04, "learning_rate": 1.9652177881543616e-05, "loss": 0.0158, "step": 72430 }, { "epoch": 1.04, "learning_rate": 1.965212984180514e-05, "loss": 0.0111, "step": 72440 }, { "epoch": 1.04, "learning_rate": 1.965208180206667e-05, "loss": 0.0163, "step": 72450 }, { "epoch": 1.04, "learning_rate": 1.96520337623282e-05, "loss": 0.0151, "step": 72460 }, { "epoch": 1.04, "learning_rate": 1.965198572258973e-05, "loss": 0.0188, "step": 72470 }, { "epoch": 1.04, "learning_rate": 1.9651937682851255e-05, "loss": 0.0132, "step": 72480 }, { "epoch": 1.04, "learning_rate": 1.9651889643112785e-05, "loss": 0.0136, "step": 72490 }, { "epoch": 1.04, "learning_rate": 1.9651841603374314e-05, "loss": 0.0092, "step": 72500 }, { "epoch": 1.05, "learning_rate": 1.965179356363584e-05, "loss": 0.0137, "step": 72510 }, { "epoch": 1.05, "learning_rate": 1.965174552389737e-05, "loss": 0.0187, "step": 72520 }, { "epoch": 1.05, "learning_rate": 1.96516974841589e-05, "loss": 0.0147, "step": 72530 }, { "epoch": 1.05, "learning_rate": 1.9651649444420428e-05, "loss": 0.0092, "step": 72540 }, { "epoch": 1.05, "learning_rate": 1.9651601404681953e-05, "loss": 0.0096, "step": 72550 }, { "epoch": 1.05, "learning_rate": 1.9651553364943483e-05, "loss": 0.0146, "step": 72560 }, { "epoch": 1.05, "learning_rate": 1.9651505325205012e-05, "loss": 0.018, "step": 72570 }, { "epoch": 1.05, "learning_rate": 1.965145728546654e-05, "loss": 0.0115, "step": 72580 }, { "epoch": 1.05, "learning_rate": 1.9651409245728067e-05, "loss": 0.0158, "step": 72590 }, { "epoch": 1.05, "learning_rate": 1.9651361205989596e-05, "loss": 0.0091, "step": 72600 }, { "epoch": 1.05, "learning_rate": 1.9651313166251126e-05, "loss": 0.0153, "step": 72610 }, { "epoch": 1.05, "learning_rate": 1.965126512651265e-05, "loss": 0.0143, "step": 72620 }, { "epoch": 1.05, "learning_rate": 1.965121708677418e-05, "loss": 0.011, "step": 72630 }, { "epoch": 1.05, "learning_rate": 1.965116904703571e-05, "loss": 0.0103, "step": 72640 }, { "epoch": 1.05, "learning_rate": 1.965112100729724e-05, "loss": 0.0108, "step": 72650 }, { "epoch": 1.05, "learning_rate": 1.9651072967558765e-05, "loss": 0.0153, "step": 72660 }, { "epoch": 1.05, "learning_rate": 1.9651024927820295e-05, "loss": 0.0126, "step": 72670 }, { "epoch": 1.05, "learning_rate": 1.9650976888081824e-05, "loss": 0.0094, "step": 72680 }, { "epoch": 1.05, "learning_rate": 1.965092884834335e-05, "loss": 0.0113, "step": 72690 }, { "epoch": 1.05, "learning_rate": 1.965088080860488e-05, "loss": 0.0132, "step": 72700 }, { "epoch": 1.05, "learning_rate": 1.9650832768866408e-05, "loss": 0.0133, "step": 72710 }, { "epoch": 1.05, "learning_rate": 1.9650784729127937e-05, "loss": 0.0198, "step": 72720 }, { "epoch": 1.05, "learning_rate": 1.9650736689389463e-05, "loss": 0.0114, "step": 72730 }, { "epoch": 1.05, "learning_rate": 1.9650688649650993e-05, "loss": 0.0138, "step": 72740 }, { "epoch": 1.05, "learning_rate": 1.9650640609912522e-05, "loss": 0.0116, "step": 72750 }, { "epoch": 1.05, "learning_rate": 1.965059257017405e-05, "loss": 0.0121, "step": 72760 }, { "epoch": 1.05, "learning_rate": 1.9650544530435577e-05, "loss": 0.0134, "step": 72770 }, { "epoch": 1.05, "learning_rate": 1.9650496490697106e-05, "loss": 0.0117, "step": 72780 }, { "epoch": 1.05, "learning_rate": 1.9650448450958636e-05, "loss": 0.0121, "step": 72790 }, { "epoch": 1.05, "learning_rate": 1.965040041122016e-05, "loss": 0.0131, "step": 72800 }, { "epoch": 1.05, "learning_rate": 1.965035237148169e-05, "loss": 0.0113, "step": 72810 }, { "epoch": 1.05, "learning_rate": 1.965030433174322e-05, "loss": 0.0126, "step": 72820 }, { "epoch": 1.05, "learning_rate": 1.965025629200475e-05, "loss": 0.0128, "step": 72830 }, { "epoch": 1.05, "learning_rate": 1.9650208252266275e-05, "loss": 0.0162, "step": 72840 }, { "epoch": 1.05, "learning_rate": 1.9650160212527804e-05, "loss": 0.0138, "step": 72850 }, { "epoch": 1.05, "learning_rate": 1.9650112172789334e-05, "loss": 0.0178, "step": 72860 }, { "epoch": 1.05, "learning_rate": 1.965006413305086e-05, "loss": 0.0108, "step": 72870 }, { "epoch": 1.05, "learning_rate": 1.965001609331239e-05, "loss": 0.0135, "step": 72880 }, { "epoch": 1.05, "learning_rate": 1.9649968053573918e-05, "loss": 0.0151, "step": 72890 }, { "epoch": 1.05, "learning_rate": 1.9649920013835447e-05, "loss": 0.0156, "step": 72900 }, { "epoch": 1.05, "learning_rate": 1.9649871974096973e-05, "loss": 0.0129, "step": 72910 }, { "epoch": 1.05, "learning_rate": 1.9649823934358503e-05, "loss": 0.0213, "step": 72920 }, { "epoch": 1.05, "learning_rate": 1.9649775894620032e-05, "loss": 0.0117, "step": 72930 }, { "epoch": 1.05, "learning_rate": 1.964972785488156e-05, "loss": 0.0119, "step": 72940 }, { "epoch": 1.05, "learning_rate": 1.9649679815143087e-05, "loss": 0.0108, "step": 72950 }, { "epoch": 1.05, "learning_rate": 1.9649631775404616e-05, "loss": 0.0134, "step": 72960 }, { "epoch": 1.05, "learning_rate": 1.9649583735666146e-05, "loss": 0.0135, "step": 72970 }, { "epoch": 1.05, "learning_rate": 1.964953569592767e-05, "loss": 0.0128, "step": 72980 }, { "epoch": 1.05, "learning_rate": 1.96494876561892e-05, "loss": 0.0115, "step": 72990 }, { "epoch": 1.05, "learning_rate": 1.964943961645073e-05, "loss": 0.0118, "step": 73000 }, { "epoch": 1.05, "learning_rate": 1.964939157671226e-05, "loss": 0.0126, "step": 73010 }, { "epoch": 1.05, "learning_rate": 1.9649343536973785e-05, "loss": 0.0128, "step": 73020 }, { "epoch": 1.05, "learning_rate": 1.9649295497235314e-05, "loss": 0.0138, "step": 73030 }, { "epoch": 1.05, "learning_rate": 1.9649247457496844e-05, "loss": 0.0111, "step": 73040 }, { "epoch": 1.05, "learning_rate": 1.964919941775837e-05, "loss": 0.0108, "step": 73050 }, { "epoch": 1.05, "learning_rate": 1.96491513780199e-05, "loss": 0.0081, "step": 73060 }, { "epoch": 1.05, "learning_rate": 1.9649103338281428e-05, "loss": 0.0119, "step": 73070 }, { "epoch": 1.05, "learning_rate": 1.9649055298542957e-05, "loss": 0.0122, "step": 73080 }, { "epoch": 1.05, "learning_rate": 1.9649007258804483e-05, "loss": 0.0158, "step": 73090 }, { "epoch": 1.05, "learning_rate": 1.9648959219066012e-05, "loss": 0.0102, "step": 73100 }, { "epoch": 1.05, "learning_rate": 1.9648911179327542e-05, "loss": 0.011, "step": 73110 }, { "epoch": 1.05, "learning_rate": 1.964886313958907e-05, "loss": 0.0161, "step": 73120 }, { "epoch": 1.05, "learning_rate": 1.9648815099850597e-05, "loss": 0.0143, "step": 73130 }, { "epoch": 1.05, "learning_rate": 1.9648767060112126e-05, "loss": 0.0131, "step": 73140 }, { "epoch": 1.05, "learning_rate": 1.9648719020373655e-05, "loss": 0.0103, "step": 73150 }, { "epoch": 1.05, "learning_rate": 1.964867098063518e-05, "loss": 0.0142, "step": 73160 }, { "epoch": 1.05, "learning_rate": 1.964862294089671e-05, "loss": 0.0122, "step": 73170 }, { "epoch": 1.05, "learning_rate": 1.964857490115824e-05, "loss": 0.0127, "step": 73180 }, { "epoch": 1.05, "learning_rate": 1.964852686141977e-05, "loss": 0.0143, "step": 73190 }, { "epoch": 1.05, "learning_rate": 1.9648478821681295e-05, "loss": 0.0169, "step": 73200 }, { "epoch": 1.06, "learning_rate": 1.9648430781942824e-05, "loss": 0.0121, "step": 73210 }, { "epoch": 1.06, "learning_rate": 1.9648382742204354e-05, "loss": 0.0128, "step": 73220 }, { "epoch": 1.06, "learning_rate": 1.964833470246588e-05, "loss": 0.0155, "step": 73230 }, { "epoch": 1.06, "learning_rate": 1.964828666272741e-05, "loss": 0.016, "step": 73240 }, { "epoch": 1.06, "learning_rate": 1.9648238622988938e-05, "loss": 0.0105, "step": 73250 }, { "epoch": 1.06, "learning_rate": 1.9648190583250467e-05, "loss": 0.0136, "step": 73260 }, { "epoch": 1.06, "learning_rate": 1.9648142543511993e-05, "loss": 0.0117, "step": 73270 }, { "epoch": 1.06, "learning_rate": 1.9648094503773522e-05, "loss": 0.0116, "step": 73280 }, { "epoch": 1.06, "learning_rate": 1.964804646403505e-05, "loss": 0.0135, "step": 73290 }, { "epoch": 1.06, "learning_rate": 1.964799842429658e-05, "loss": 0.0156, "step": 73300 }, { "epoch": 1.06, "learning_rate": 1.9647950384558107e-05, "loss": 0.0145, "step": 73310 }, { "epoch": 1.06, "learning_rate": 1.9647902344819636e-05, "loss": 0.016, "step": 73320 }, { "epoch": 1.06, "learning_rate": 1.9647854305081165e-05, "loss": 0.0106, "step": 73330 }, { "epoch": 1.06, "learning_rate": 1.964780626534269e-05, "loss": 0.0131, "step": 73340 }, { "epoch": 1.06, "learning_rate": 1.964775822560422e-05, "loss": 0.0153, "step": 73350 }, { "epoch": 1.06, "learning_rate": 1.964771018586575e-05, "loss": 0.0159, "step": 73360 }, { "epoch": 1.06, "learning_rate": 1.964766214612728e-05, "loss": 0.0157, "step": 73370 }, { "epoch": 1.06, "learning_rate": 1.9647614106388805e-05, "loss": 0.0113, "step": 73380 }, { "epoch": 1.06, "learning_rate": 1.9647566066650334e-05, "loss": 0.0106, "step": 73390 }, { "epoch": 1.06, "learning_rate": 1.9647518026911863e-05, "loss": 0.0163, "step": 73400 }, { "epoch": 1.06, "learning_rate": 1.964746998717339e-05, "loss": 0.0115, "step": 73410 }, { "epoch": 1.06, "learning_rate": 1.964742194743492e-05, "loss": 0.0119, "step": 73420 }, { "epoch": 1.06, "learning_rate": 1.9647373907696448e-05, "loss": 0.0149, "step": 73430 }, { "epoch": 1.06, "learning_rate": 1.9647325867957977e-05, "loss": 0.01, "step": 73440 }, { "epoch": 1.06, "learning_rate": 1.9647277828219503e-05, "loss": 0.0097, "step": 73450 }, { "epoch": 1.06, "learning_rate": 1.9647229788481032e-05, "loss": 0.0156, "step": 73460 }, { "epoch": 1.06, "learning_rate": 1.964718174874256e-05, "loss": 0.0099, "step": 73470 }, { "epoch": 1.06, "learning_rate": 1.964713370900409e-05, "loss": 0.0159, "step": 73480 }, { "epoch": 1.06, "learning_rate": 1.9647085669265617e-05, "loss": 0.0128, "step": 73490 }, { "epoch": 1.06, "learning_rate": 1.9647037629527146e-05, "loss": 0.0157, "step": 73500 }, { "epoch": 1.06, "learning_rate": 1.9646989589788675e-05, "loss": 0.0118, "step": 73510 }, { "epoch": 1.06, "learning_rate": 1.96469415500502e-05, "loss": 0.0119, "step": 73520 }, { "epoch": 1.06, "learning_rate": 1.964689351031173e-05, "loss": 0.0107, "step": 73530 }, { "epoch": 1.06, "learning_rate": 1.964684547057326e-05, "loss": 0.0136, "step": 73540 }, { "epoch": 1.06, "learning_rate": 1.964679743083479e-05, "loss": 0.0152, "step": 73550 }, { "epoch": 1.06, "learning_rate": 1.9646749391096315e-05, "loss": 0.0135, "step": 73560 }, { "epoch": 1.06, "learning_rate": 1.9646701351357844e-05, "loss": 0.0156, "step": 73570 }, { "epoch": 1.06, "learning_rate": 1.9646653311619373e-05, "loss": 0.0149, "step": 73580 }, { "epoch": 1.06, "learning_rate": 1.96466052718809e-05, "loss": 0.015, "step": 73590 }, { "epoch": 1.06, "learning_rate": 1.964655723214243e-05, "loss": 0.0134, "step": 73600 }, { "epoch": 1.06, "learning_rate": 1.9646509192403958e-05, "loss": 0.0121, "step": 73610 }, { "epoch": 1.06, "learning_rate": 1.9646461152665487e-05, "loss": 0.0154, "step": 73620 }, { "epoch": 1.06, "learning_rate": 1.9646413112927013e-05, "loss": 0.0136, "step": 73630 }, { "epoch": 1.06, "learning_rate": 1.9646365073188542e-05, "loss": 0.0128, "step": 73640 }, { "epoch": 1.06, "learning_rate": 1.964631703345007e-05, "loss": 0.0144, "step": 73650 }, { "epoch": 1.06, "learning_rate": 1.96462689937116e-05, "loss": 0.0091, "step": 73660 }, { "epoch": 1.06, "learning_rate": 1.9646220953973127e-05, "loss": 0.0123, "step": 73670 }, { "epoch": 1.06, "learning_rate": 1.9646172914234656e-05, "loss": 0.0112, "step": 73680 }, { "epoch": 1.06, "learning_rate": 1.9646124874496185e-05, "loss": 0.0168, "step": 73690 }, { "epoch": 1.06, "learning_rate": 1.964607683475771e-05, "loss": 0.0143, "step": 73700 }, { "epoch": 1.06, "learning_rate": 1.964602879501924e-05, "loss": 0.0112, "step": 73710 }, { "epoch": 1.06, "learning_rate": 1.964598075528077e-05, "loss": 0.0194, "step": 73720 }, { "epoch": 1.06, "learning_rate": 1.96459327155423e-05, "loss": 0.0092, "step": 73730 }, { "epoch": 1.06, "learning_rate": 1.9645884675803825e-05, "loss": 0.0111, "step": 73740 }, { "epoch": 1.06, "learning_rate": 1.9645836636065354e-05, "loss": 0.0157, "step": 73750 }, { "epoch": 1.06, "learning_rate": 1.9645788596326883e-05, "loss": 0.0122, "step": 73760 }, { "epoch": 1.06, "learning_rate": 1.964574055658841e-05, "loss": 0.0147, "step": 73770 }, { "epoch": 1.06, "learning_rate": 1.964569251684994e-05, "loss": 0.012, "step": 73780 }, { "epoch": 1.06, "learning_rate": 1.9645644477111468e-05, "loss": 0.0174, "step": 73790 }, { "epoch": 1.06, "learning_rate": 1.9645596437372997e-05, "loss": 0.0153, "step": 73800 }, { "epoch": 1.06, "learning_rate": 1.9645548397634523e-05, "loss": 0.0152, "step": 73810 }, { "epoch": 1.06, "learning_rate": 1.9645500357896052e-05, "loss": 0.0104, "step": 73820 }, { "epoch": 1.06, "learning_rate": 1.964545231815758e-05, "loss": 0.0111, "step": 73830 }, { "epoch": 1.06, "learning_rate": 1.964540427841911e-05, "loss": 0.0182, "step": 73840 }, { "epoch": 1.06, "learning_rate": 1.9645356238680637e-05, "loss": 0.0083, "step": 73850 }, { "epoch": 1.06, "learning_rate": 1.9645308198942166e-05, "loss": 0.0152, "step": 73860 }, { "epoch": 1.06, "learning_rate": 1.9645260159203695e-05, "loss": 0.0137, "step": 73870 }, { "epoch": 1.06, "learning_rate": 1.964521211946522e-05, "loss": 0.0172, "step": 73880 }, { "epoch": 1.06, "learning_rate": 1.964516407972675e-05, "loss": 0.0105, "step": 73890 }, { "epoch": 1.07, "learning_rate": 1.964511603998828e-05, "loss": 0.0121, "step": 73900 }, { "epoch": 1.07, "learning_rate": 1.964506800024981e-05, "loss": 0.0114, "step": 73910 }, { "epoch": 1.07, "learning_rate": 1.9645019960511335e-05, "loss": 0.0134, "step": 73920 }, { "epoch": 1.07, "learning_rate": 1.9644971920772864e-05, "loss": 0.0152, "step": 73930 }, { "epoch": 1.07, "learning_rate": 1.9644923881034393e-05, "loss": 0.0116, "step": 73940 }, { "epoch": 1.07, "learning_rate": 1.964487584129592e-05, "loss": 0.0151, "step": 73950 }, { "epoch": 1.07, "learning_rate": 1.964482780155745e-05, "loss": 0.0131, "step": 73960 }, { "epoch": 1.07, "learning_rate": 1.9644779761818978e-05, "loss": 0.0088, "step": 73970 }, { "epoch": 1.07, "learning_rate": 1.9644731722080507e-05, "loss": 0.0125, "step": 73980 }, { "epoch": 1.07, "learning_rate": 1.9644683682342033e-05, "loss": 0.0152, "step": 73990 }, { "epoch": 1.07, "learning_rate": 1.9644635642603562e-05, "loss": 0.0134, "step": 74000 }, { "epoch": 1.07, "learning_rate": 1.964458760286509e-05, "loss": 0.0175, "step": 74010 }, { "epoch": 1.07, "learning_rate": 1.964453956312662e-05, "loss": 0.0132, "step": 74020 }, { "epoch": 1.07, "learning_rate": 1.9644491523388146e-05, "loss": 0.0089, "step": 74030 }, { "epoch": 1.07, "learning_rate": 1.9644443483649676e-05, "loss": 0.0123, "step": 74040 }, { "epoch": 1.07, "learning_rate": 1.9644395443911205e-05, "loss": 0.0132, "step": 74050 }, { "epoch": 1.07, "learning_rate": 1.964434740417273e-05, "loss": 0.0127, "step": 74060 }, { "epoch": 1.07, "learning_rate": 1.964429936443426e-05, "loss": 0.0086, "step": 74070 }, { "epoch": 1.07, "learning_rate": 1.964425132469579e-05, "loss": 0.0097, "step": 74080 }, { "epoch": 1.07, "learning_rate": 1.964420328495732e-05, "loss": 0.009, "step": 74090 }, { "epoch": 1.07, "learning_rate": 1.9644155245218845e-05, "loss": 0.0177, "step": 74100 }, { "epoch": 1.07, "learning_rate": 1.9644107205480374e-05, "loss": 0.0122, "step": 74110 }, { "epoch": 1.07, "learning_rate": 1.9644059165741903e-05, "loss": 0.0183, "step": 74120 }, { "epoch": 1.07, "learning_rate": 1.9644011126003432e-05, "loss": 0.013, "step": 74130 }, { "epoch": 1.07, "learning_rate": 1.964396308626496e-05, "loss": 0.0124, "step": 74140 }, { "epoch": 1.07, "learning_rate": 1.964391504652649e-05, "loss": 0.0118, "step": 74150 }, { "epoch": 1.07, "learning_rate": 1.9643867006788017e-05, "loss": 0.0182, "step": 74160 }, { "epoch": 1.07, "learning_rate": 1.9643818967049546e-05, "loss": 0.0132, "step": 74170 }, { "epoch": 1.07, "learning_rate": 1.9643770927311075e-05, "loss": 0.01, "step": 74180 }, { "epoch": 1.07, "learning_rate": 1.96437228875726e-05, "loss": 0.0143, "step": 74190 }, { "epoch": 1.07, "learning_rate": 1.964367484783413e-05, "loss": 0.0125, "step": 74200 }, { "epoch": 1.07, "learning_rate": 1.964362680809566e-05, "loss": 0.0122, "step": 74210 }, { "epoch": 1.07, "learning_rate": 1.964357876835719e-05, "loss": 0.0128, "step": 74220 }, { "epoch": 1.07, "learning_rate": 1.9643530728618715e-05, "loss": 0.0119, "step": 74230 }, { "epoch": 1.07, "learning_rate": 1.9643482688880244e-05, "loss": 0.0162, "step": 74240 }, { "epoch": 1.07, "learning_rate": 1.9643434649141773e-05, "loss": 0.0144, "step": 74250 }, { "epoch": 1.07, "learning_rate": 1.96433866094033e-05, "loss": 0.0135, "step": 74260 }, { "epoch": 1.07, "learning_rate": 1.964333856966483e-05, "loss": 0.0128, "step": 74270 }, { "epoch": 1.07, "learning_rate": 1.9643290529926358e-05, "loss": 0.013, "step": 74280 }, { "epoch": 1.07, "learning_rate": 1.9643242490187887e-05, "loss": 0.0138, "step": 74290 }, { "epoch": 1.07, "learning_rate": 1.9643194450449413e-05, "loss": 0.0096, "step": 74300 }, { "epoch": 1.07, "learning_rate": 1.9643146410710942e-05, "loss": 0.0148, "step": 74310 }, { "epoch": 1.07, "learning_rate": 1.964309837097247e-05, "loss": 0.0077, "step": 74320 }, { "epoch": 1.07, "learning_rate": 1.9643050331234e-05, "loss": 0.0129, "step": 74330 }, { "epoch": 1.07, "learning_rate": 1.9643002291495527e-05, "loss": 0.0159, "step": 74340 }, { "epoch": 1.07, "learning_rate": 1.9642954251757056e-05, "loss": 0.0163, "step": 74350 }, { "epoch": 1.07, "learning_rate": 1.9642906212018585e-05, "loss": 0.01, "step": 74360 }, { "epoch": 1.07, "learning_rate": 1.964285817228011e-05, "loss": 0.0184, "step": 74370 }, { "epoch": 1.07, "learning_rate": 1.964281013254164e-05, "loss": 0.0127, "step": 74380 }, { "epoch": 1.07, "learning_rate": 1.964276209280317e-05, "loss": 0.0098, "step": 74390 }, { "epoch": 1.07, "learning_rate": 1.96427140530647e-05, "loss": 0.0144, "step": 74400 }, { "epoch": 1.07, "learning_rate": 1.9642666013326225e-05, "loss": 0.0123, "step": 74410 }, { "epoch": 1.07, "learning_rate": 1.9642617973587754e-05, "loss": 0.0118, "step": 74420 }, { "epoch": 1.07, "learning_rate": 1.9642569933849283e-05, "loss": 0.0128, "step": 74430 }, { "epoch": 1.07, "learning_rate": 1.964252189411081e-05, "loss": 0.0098, "step": 74440 }, { "epoch": 1.07, "learning_rate": 1.964247385437234e-05, "loss": 0.0216, "step": 74450 }, { "epoch": 1.07, "learning_rate": 1.9642425814633868e-05, "loss": 0.0121, "step": 74460 }, { "epoch": 1.07, "learning_rate": 1.9642377774895397e-05, "loss": 0.0128, "step": 74470 }, { "epoch": 1.07, "learning_rate": 1.9642329735156923e-05, "loss": 0.0099, "step": 74480 }, { "epoch": 1.07, "learning_rate": 1.9642281695418452e-05, "loss": 0.0124, "step": 74490 }, { "epoch": 1.07, "learning_rate": 1.964223365567998e-05, "loss": 0.0103, "step": 74500 }, { "epoch": 1.07, "learning_rate": 1.964218561594151e-05, "loss": 0.011, "step": 74510 }, { "epoch": 1.07, "learning_rate": 1.9642137576203037e-05, "loss": 0.0142, "step": 74520 }, { "epoch": 1.07, "learning_rate": 1.9642089536464566e-05, "loss": 0.0093, "step": 74530 }, { "epoch": 1.07, "learning_rate": 1.9642041496726095e-05, "loss": 0.0124, "step": 74540 }, { "epoch": 1.07, "learning_rate": 1.964199345698762e-05, "loss": 0.0148, "step": 74550 }, { "epoch": 1.07, "learning_rate": 1.964194541724915e-05, "loss": 0.0104, "step": 74560 }, { "epoch": 1.07, "learning_rate": 1.964189737751068e-05, "loss": 0.0134, "step": 74570 }, { "epoch": 1.07, "learning_rate": 1.964184933777221e-05, "loss": 0.0193, "step": 74580 }, { "epoch": 1.07, "learning_rate": 1.9641801298033735e-05, "loss": 0.0144, "step": 74590 }, { "epoch": 1.08, "learning_rate": 1.9641753258295264e-05, "loss": 0.0111, "step": 74600 }, { "epoch": 1.08, "learning_rate": 1.9641705218556793e-05, "loss": 0.0119, "step": 74610 }, { "epoch": 1.08, "learning_rate": 1.964165717881832e-05, "loss": 0.0099, "step": 74620 }, { "epoch": 1.08, "learning_rate": 1.964160913907985e-05, "loss": 0.0137, "step": 74630 }, { "epoch": 1.08, "learning_rate": 1.9641561099341378e-05, "loss": 0.0103, "step": 74640 }, { "epoch": 1.08, "learning_rate": 1.9641513059602907e-05, "loss": 0.0136, "step": 74650 }, { "epoch": 1.08, "learning_rate": 1.9641465019864433e-05, "loss": 0.014, "step": 74660 }, { "epoch": 1.08, "learning_rate": 1.9641416980125962e-05, "loss": 0.0166, "step": 74670 }, { "epoch": 1.08, "learning_rate": 1.964136894038749e-05, "loss": 0.0154, "step": 74680 }, { "epoch": 1.08, "learning_rate": 1.964132090064902e-05, "loss": 0.0153, "step": 74690 }, { "epoch": 1.08, "learning_rate": 1.9641272860910547e-05, "loss": 0.0166, "step": 74700 }, { "epoch": 1.08, "learning_rate": 1.9641224821172076e-05, "loss": 0.0141, "step": 74710 }, { "epoch": 1.08, "learning_rate": 1.9641176781433605e-05, "loss": 0.0099, "step": 74720 }, { "epoch": 1.08, "learning_rate": 1.964112874169513e-05, "loss": 0.0118, "step": 74730 }, { "epoch": 1.08, "learning_rate": 1.964108070195666e-05, "loss": 0.0135, "step": 74740 }, { "epoch": 1.08, "learning_rate": 1.964103266221819e-05, "loss": 0.0118, "step": 74750 }, { "epoch": 1.08, "learning_rate": 1.964098462247972e-05, "loss": 0.0112, "step": 74760 }, { "epoch": 1.08, "learning_rate": 1.9640936582741245e-05, "loss": 0.0161, "step": 74770 }, { "epoch": 1.08, "learning_rate": 1.9640888543002774e-05, "loss": 0.0134, "step": 74780 }, { "epoch": 1.08, "learning_rate": 1.9640840503264303e-05, "loss": 0.0146, "step": 74790 }, { "epoch": 1.08, "learning_rate": 1.964079246352583e-05, "loss": 0.0136, "step": 74800 }, { "epoch": 1.08, "learning_rate": 1.964074442378736e-05, "loss": 0.0073, "step": 74810 }, { "epoch": 1.08, "learning_rate": 1.9640696384048888e-05, "loss": 0.0112, "step": 74820 }, { "epoch": 1.08, "learning_rate": 1.9640648344310417e-05, "loss": 0.0133, "step": 74830 }, { "epoch": 1.08, "learning_rate": 1.9640600304571943e-05, "loss": 0.01, "step": 74840 }, { "epoch": 1.08, "learning_rate": 1.9640552264833472e-05, "loss": 0.0174, "step": 74850 }, { "epoch": 1.08, "learning_rate": 1.9640504225095e-05, "loss": 0.0161, "step": 74860 }, { "epoch": 1.08, "learning_rate": 1.964045618535653e-05, "loss": 0.0112, "step": 74870 }, { "epoch": 1.08, "learning_rate": 1.9640408145618056e-05, "loss": 0.0126, "step": 74880 }, { "epoch": 1.08, "learning_rate": 1.9640360105879586e-05, "loss": 0.0129, "step": 74890 }, { "epoch": 1.08, "learning_rate": 1.9640312066141115e-05, "loss": 0.0117, "step": 74900 }, { "epoch": 1.08, "learning_rate": 1.964026402640264e-05, "loss": 0.0168, "step": 74910 }, { "epoch": 1.08, "learning_rate": 1.964021598666417e-05, "loss": 0.0141, "step": 74920 }, { "epoch": 1.08, "learning_rate": 1.96401679469257e-05, "loss": 0.0106, "step": 74930 }, { "epoch": 1.08, "learning_rate": 1.964011990718723e-05, "loss": 0.0097, "step": 74940 }, { "epoch": 1.08, "learning_rate": 1.9640071867448755e-05, "loss": 0.0135, "step": 74950 }, { "epoch": 1.08, "learning_rate": 1.9640023827710284e-05, "loss": 0.0144, "step": 74960 }, { "epoch": 1.08, "learning_rate": 1.9639975787971813e-05, "loss": 0.0131, "step": 74970 }, { "epoch": 1.08, "learning_rate": 1.963992774823334e-05, "loss": 0.0112, "step": 74980 }, { "epoch": 1.08, "learning_rate": 1.9639879708494868e-05, "loss": 0.011, "step": 74990 }, { "epoch": 1.08, "learning_rate": 1.9639831668756398e-05, "loss": 0.0116, "step": 75000 }, { "epoch": 1.08, "learning_rate": 1.9639783629017927e-05, "loss": 0.0115, "step": 75010 }, { "epoch": 1.08, "learning_rate": 1.9639735589279453e-05, "loss": 0.0144, "step": 75020 }, { "epoch": 1.08, "learning_rate": 1.9639687549540982e-05, "loss": 0.0132, "step": 75030 }, { "epoch": 1.08, "learning_rate": 1.963963950980251e-05, "loss": 0.0144, "step": 75040 }, { "epoch": 1.08, "learning_rate": 1.963959147006404e-05, "loss": 0.0135, "step": 75050 }, { "epoch": 1.08, "learning_rate": 1.9639543430325566e-05, "loss": 0.0122, "step": 75060 }, { "epoch": 1.08, "learning_rate": 1.9639495390587096e-05, "loss": 0.0115, "step": 75070 }, { "epoch": 1.08, "learning_rate": 1.9639447350848625e-05, "loss": 0.0097, "step": 75080 }, { "epoch": 1.08, "learning_rate": 1.963939931111015e-05, "loss": 0.0092, "step": 75090 }, { "epoch": 1.08, "learning_rate": 1.963935127137168e-05, "loss": 0.0095, "step": 75100 }, { "epoch": 1.08, "learning_rate": 1.963930323163321e-05, "loss": 0.0111, "step": 75110 }, { "epoch": 1.08, "learning_rate": 1.963925519189474e-05, "loss": 0.0135, "step": 75120 }, { "epoch": 1.08, "learning_rate": 1.9639207152156264e-05, "loss": 0.0131, "step": 75130 }, { "epoch": 1.08, "learning_rate": 1.9639159112417794e-05, "loss": 0.0153, "step": 75140 }, { "epoch": 1.08, "learning_rate": 1.9639111072679323e-05, "loss": 0.0141, "step": 75150 }, { "epoch": 1.08, "learning_rate": 1.963906303294085e-05, "loss": 0.0142, "step": 75160 }, { "epoch": 1.08, "learning_rate": 1.9639014993202378e-05, "loss": 0.0116, "step": 75170 }, { "epoch": 1.08, "learning_rate": 1.9638966953463907e-05, "loss": 0.0156, "step": 75180 }, { "epoch": 1.08, "learning_rate": 1.9638918913725437e-05, "loss": 0.0158, "step": 75190 }, { "epoch": 1.08, "learning_rate": 1.9638870873986963e-05, "loss": 0.0115, "step": 75200 }, { "epoch": 1.08, "learning_rate": 1.9638822834248492e-05, "loss": 0.0264, "step": 75210 }, { "epoch": 1.08, "learning_rate": 1.963877479451002e-05, "loss": 0.0134, "step": 75220 }, { "epoch": 1.08, "learning_rate": 1.963872675477155e-05, "loss": 0.0123, "step": 75230 }, { "epoch": 1.08, "learning_rate": 1.9638678715033076e-05, "loss": 0.0166, "step": 75240 }, { "epoch": 1.08, "learning_rate": 1.9638630675294606e-05, "loss": 0.0124, "step": 75250 }, { "epoch": 1.08, "learning_rate": 1.9638582635556135e-05, "loss": 0.0129, "step": 75260 }, { "epoch": 1.08, "learning_rate": 1.963853459581766e-05, "loss": 0.0169, "step": 75270 }, { "epoch": 1.08, "learning_rate": 1.963848655607919e-05, "loss": 0.0132, "step": 75280 }, { "epoch": 1.09, "learning_rate": 1.963843851634072e-05, "loss": 0.012, "step": 75290 }, { "epoch": 1.09, "learning_rate": 1.963839047660225e-05, "loss": 0.0121, "step": 75300 }, { "epoch": 1.09, "learning_rate": 1.9638342436863774e-05, "loss": 0.0132, "step": 75310 }, { "epoch": 1.09, "learning_rate": 1.9638294397125304e-05, "loss": 0.0145, "step": 75320 }, { "epoch": 1.09, "learning_rate": 1.9638246357386833e-05, "loss": 0.0128, "step": 75330 }, { "epoch": 1.09, "learning_rate": 1.963819831764836e-05, "loss": 0.0109, "step": 75340 }, { "epoch": 1.09, "learning_rate": 1.9638150277909888e-05, "loss": 0.0084, "step": 75350 }, { "epoch": 1.09, "learning_rate": 1.9638102238171417e-05, "loss": 0.0101, "step": 75360 }, { "epoch": 1.09, "learning_rate": 1.9638054198432947e-05, "loss": 0.0134, "step": 75370 }, { "epoch": 1.09, "learning_rate": 1.9638006158694473e-05, "loss": 0.0126, "step": 75380 }, { "epoch": 1.09, "learning_rate": 1.9637958118956002e-05, "loss": 0.0162, "step": 75390 }, { "epoch": 1.09, "learning_rate": 1.963791007921753e-05, "loss": 0.0114, "step": 75400 }, { "epoch": 1.09, "learning_rate": 1.963786203947906e-05, "loss": 0.013, "step": 75410 }, { "epoch": 1.09, "learning_rate": 1.9637813999740586e-05, "loss": 0.0132, "step": 75420 }, { "epoch": 1.09, "learning_rate": 1.9637770763975964e-05, "loss": 0.0152, "step": 75430 }, { "epoch": 1.09, "learning_rate": 1.963772272423749e-05, "loss": 0.0137, "step": 75440 }, { "epoch": 1.09, "learning_rate": 1.963767468449902e-05, "loss": 0.0105, "step": 75450 }, { "epoch": 1.09, "learning_rate": 1.963762664476055e-05, "loss": 0.012, "step": 75460 }, { "epoch": 1.09, "learning_rate": 1.9637578605022075e-05, "loss": 0.0125, "step": 75470 }, { "epoch": 1.09, "learning_rate": 1.9637530565283604e-05, "loss": 0.0118, "step": 75480 }, { "epoch": 1.09, "learning_rate": 1.9637482525545133e-05, "loss": 0.0113, "step": 75490 }, { "epoch": 1.09, "learning_rate": 1.9637434485806662e-05, "loss": 0.0126, "step": 75500 }, { "epoch": 1.09, "learning_rate": 1.9637386446068188e-05, "loss": 0.012, "step": 75510 }, { "epoch": 1.09, "learning_rate": 1.9637338406329718e-05, "loss": 0.012, "step": 75520 }, { "epoch": 1.09, "learning_rate": 1.9637290366591247e-05, "loss": 0.0105, "step": 75530 }, { "epoch": 1.09, "learning_rate": 1.9637242326852776e-05, "loss": 0.0199, "step": 75540 }, { "epoch": 1.09, "learning_rate": 1.9637194287114302e-05, "loss": 0.0115, "step": 75550 }, { "epoch": 1.09, "learning_rate": 1.963714624737583e-05, "loss": 0.0138, "step": 75560 }, { "epoch": 1.09, "learning_rate": 1.963709820763736e-05, "loss": 0.0116, "step": 75570 }, { "epoch": 1.09, "learning_rate": 1.9637050167898886e-05, "loss": 0.0155, "step": 75580 }, { "epoch": 1.09, "learning_rate": 1.9637002128160416e-05, "loss": 0.014, "step": 75590 }, { "epoch": 1.09, "learning_rate": 1.9636954088421945e-05, "loss": 0.0121, "step": 75600 }, { "epoch": 1.09, "learning_rate": 1.9636906048683474e-05, "loss": 0.0099, "step": 75610 }, { "epoch": 1.09, "learning_rate": 1.9636858008945e-05, "loss": 0.0144, "step": 75620 }, { "epoch": 1.09, "learning_rate": 1.963680996920653e-05, "loss": 0.0142, "step": 75630 }, { "epoch": 1.09, "learning_rate": 1.963676192946806e-05, "loss": 0.0199, "step": 75640 }, { "epoch": 1.09, "learning_rate": 1.9636713889729584e-05, "loss": 0.0125, "step": 75650 }, { "epoch": 1.09, "learning_rate": 1.9636665849991114e-05, "loss": 0.0119, "step": 75660 }, { "epoch": 1.09, "learning_rate": 1.9636617810252643e-05, "loss": 0.0125, "step": 75670 }, { "epoch": 1.09, "learning_rate": 1.9636569770514172e-05, "loss": 0.0072, "step": 75680 }, { "epoch": 1.09, "learning_rate": 1.9636521730775698e-05, "loss": 0.011, "step": 75690 }, { "epoch": 1.09, "learning_rate": 1.9636473691037227e-05, "loss": 0.0121, "step": 75700 }, { "epoch": 1.09, "learning_rate": 1.9636425651298757e-05, "loss": 0.0112, "step": 75710 }, { "epoch": 1.09, "learning_rate": 1.9636377611560286e-05, "loss": 0.0118, "step": 75720 }, { "epoch": 1.09, "learning_rate": 1.9636329571821812e-05, "loss": 0.015, "step": 75730 }, { "epoch": 1.09, "learning_rate": 1.963628153208334e-05, "loss": 0.0113, "step": 75740 }, { "epoch": 1.09, "learning_rate": 1.963623349234487e-05, "loss": 0.0174, "step": 75750 }, { "epoch": 1.09, "learning_rate": 1.9636185452606396e-05, "loss": 0.0124, "step": 75760 }, { "epoch": 1.09, "learning_rate": 1.9636137412867926e-05, "loss": 0.0208, "step": 75770 }, { "epoch": 1.09, "learning_rate": 1.9636089373129455e-05, "loss": 0.0123, "step": 75780 }, { "epoch": 1.09, "learning_rate": 1.9636041333390984e-05, "loss": 0.0181, "step": 75790 }, { "epoch": 1.09, "learning_rate": 1.963599329365251e-05, "loss": 0.0133, "step": 75800 }, { "epoch": 1.09, "learning_rate": 1.963594525391404e-05, "loss": 0.0091, "step": 75810 }, { "epoch": 1.09, "learning_rate": 1.963589721417557e-05, "loss": 0.012, "step": 75820 }, { "epoch": 1.09, "learning_rate": 1.9635849174437094e-05, "loss": 0.0128, "step": 75830 }, { "epoch": 1.09, "learning_rate": 1.9635801134698624e-05, "loss": 0.0121, "step": 75840 }, { "epoch": 1.09, "learning_rate": 1.9635753094960153e-05, "loss": 0.0128, "step": 75850 }, { "epoch": 1.09, "learning_rate": 1.9635705055221682e-05, "loss": 0.0131, "step": 75860 }, { "epoch": 1.09, "learning_rate": 1.9635657015483208e-05, "loss": 0.0114, "step": 75870 }, { "epoch": 1.09, "learning_rate": 1.9635608975744737e-05, "loss": 0.012, "step": 75880 }, { "epoch": 1.09, "learning_rate": 1.9635560936006267e-05, "loss": 0.0159, "step": 75890 }, { "epoch": 1.09, "learning_rate": 1.9635512896267796e-05, "loss": 0.0098, "step": 75900 }, { "epoch": 1.09, "learning_rate": 1.9635464856529322e-05, "loss": 0.0137, "step": 75910 }, { "epoch": 1.09, "learning_rate": 1.963541681679085e-05, "loss": 0.0111, "step": 75920 }, { "epoch": 1.09, "learning_rate": 1.963536877705238e-05, "loss": 0.0136, "step": 75930 }, { "epoch": 1.09, "learning_rate": 1.9635320737313906e-05, "loss": 0.0127, "step": 75940 }, { "epoch": 1.09, "learning_rate": 1.9635272697575435e-05, "loss": 0.0116, "step": 75950 }, { "epoch": 1.09, "learning_rate": 1.9635224657836965e-05, "loss": 0.0099, "step": 75960 }, { "epoch": 1.09, "learning_rate": 1.9635176618098494e-05, "loss": 0.0133, "step": 75970 }, { "epoch": 1.1, "learning_rate": 1.963512857836002e-05, "loss": 0.0168, "step": 75980 }, { "epoch": 1.1, "learning_rate": 1.963508053862155e-05, "loss": 0.0119, "step": 75990 }, { "epoch": 1.1, "learning_rate": 1.963503249888308e-05, "loss": 0.0106, "step": 76000 }, { "epoch": 1.1, "learning_rate": 1.9634984459144604e-05, "loss": 0.0132, "step": 76010 }, { "epoch": 1.1, "learning_rate": 1.9634936419406134e-05, "loss": 0.0084, "step": 76020 }, { "epoch": 1.1, "learning_rate": 1.9634888379667663e-05, "loss": 0.012, "step": 76030 }, { "epoch": 1.1, "learning_rate": 1.9634840339929192e-05, "loss": 0.0117, "step": 76040 }, { "epoch": 1.1, "learning_rate": 1.9634792300190718e-05, "loss": 0.0107, "step": 76050 }, { "epoch": 1.1, "learning_rate": 1.9634744260452247e-05, "loss": 0.0122, "step": 76060 }, { "epoch": 1.1, "learning_rate": 1.9634696220713777e-05, "loss": 0.014, "step": 76070 }, { "epoch": 1.1, "learning_rate": 1.9634648180975306e-05, "loss": 0.0141, "step": 76080 }, { "epoch": 1.1, "learning_rate": 1.963460014123683e-05, "loss": 0.0129, "step": 76090 }, { "epoch": 1.1, "learning_rate": 1.963455210149836e-05, "loss": 0.012, "step": 76100 }, { "epoch": 1.1, "learning_rate": 1.963450406175989e-05, "loss": 0.0124, "step": 76110 }, { "epoch": 1.1, "learning_rate": 1.9634456022021416e-05, "loss": 0.0147, "step": 76120 }, { "epoch": 1.1, "learning_rate": 1.9634407982282945e-05, "loss": 0.0127, "step": 76130 }, { "epoch": 1.1, "learning_rate": 1.9634359942544475e-05, "loss": 0.0123, "step": 76140 }, { "epoch": 1.1, "learning_rate": 1.9634311902806004e-05, "loss": 0.0121, "step": 76150 }, { "epoch": 1.1, "learning_rate": 1.963426386306753e-05, "loss": 0.0166, "step": 76160 }, { "epoch": 1.1, "learning_rate": 1.963421582332906e-05, "loss": 0.0165, "step": 76170 }, { "epoch": 1.1, "learning_rate": 1.963416778359059e-05, "loss": 0.0151, "step": 76180 }, { "epoch": 1.1, "learning_rate": 1.9634119743852114e-05, "loss": 0.0141, "step": 76190 }, { "epoch": 1.1, "learning_rate": 1.9634071704113643e-05, "loss": 0.0143, "step": 76200 }, { "epoch": 1.1, "learning_rate": 1.9634023664375173e-05, "loss": 0.0094, "step": 76210 }, { "epoch": 1.1, "learning_rate": 1.9633975624636702e-05, "loss": 0.0115, "step": 76220 }, { "epoch": 1.1, "learning_rate": 1.9633927584898228e-05, "loss": 0.0181, "step": 76230 }, { "epoch": 1.1, "learning_rate": 1.9633879545159757e-05, "loss": 0.0144, "step": 76240 }, { "epoch": 1.1, "learning_rate": 1.9633831505421286e-05, "loss": 0.0157, "step": 76250 }, { "epoch": 1.1, "learning_rate": 1.9633783465682816e-05, "loss": 0.0109, "step": 76260 }, { "epoch": 1.1, "learning_rate": 1.963373542594434e-05, "loss": 0.0104, "step": 76270 }, { "epoch": 1.1, "learning_rate": 1.963368738620587e-05, "loss": 0.014, "step": 76280 }, { "epoch": 1.1, "learning_rate": 1.96336393464674e-05, "loss": 0.0162, "step": 76290 }, { "epoch": 1.1, "learning_rate": 1.9633591306728926e-05, "loss": 0.0093, "step": 76300 }, { "epoch": 1.1, "learning_rate": 1.9633543266990455e-05, "loss": 0.0132, "step": 76310 }, { "epoch": 1.1, "learning_rate": 1.9633495227251985e-05, "loss": 0.0137, "step": 76320 }, { "epoch": 1.1, "learning_rate": 1.9633447187513514e-05, "loss": 0.0129, "step": 76330 }, { "epoch": 1.1, "learning_rate": 1.963339914777504e-05, "loss": 0.0127, "step": 76340 }, { "epoch": 1.1, "learning_rate": 1.963335110803657e-05, "loss": 0.0092, "step": 76350 }, { "epoch": 1.1, "learning_rate": 1.9633303068298098e-05, "loss": 0.0117, "step": 76360 }, { "epoch": 1.1, "learning_rate": 1.9633255028559624e-05, "loss": 0.0117, "step": 76370 }, { "epoch": 1.1, "learning_rate": 1.9633206988821153e-05, "loss": 0.0143, "step": 76380 }, { "epoch": 1.1, "learning_rate": 1.9633158949082683e-05, "loss": 0.0095, "step": 76390 }, { "epoch": 1.1, "learning_rate": 1.9633110909344212e-05, "loss": 0.0129, "step": 76400 }, { "epoch": 1.1, "learning_rate": 1.9633062869605738e-05, "loss": 0.0115, "step": 76410 }, { "epoch": 1.1, "learning_rate": 1.9633014829867267e-05, "loss": 0.0131, "step": 76420 }, { "epoch": 1.1, "learning_rate": 1.9632966790128796e-05, "loss": 0.0089, "step": 76430 }, { "epoch": 1.1, "learning_rate": 1.9632918750390326e-05, "loss": 0.0139, "step": 76440 }, { "epoch": 1.1, "learning_rate": 1.963287071065185e-05, "loss": 0.0146, "step": 76450 }, { "epoch": 1.1, "learning_rate": 1.963282267091338e-05, "loss": 0.0105, "step": 76460 }, { "epoch": 1.1, "learning_rate": 1.963277463117491e-05, "loss": 0.0083, "step": 76470 }, { "epoch": 1.1, "learning_rate": 1.9632726591436436e-05, "loss": 0.0105, "step": 76480 }, { "epoch": 1.1, "learning_rate": 1.9632678551697965e-05, "loss": 0.0181, "step": 76490 }, { "epoch": 1.1, "learning_rate": 1.9632630511959494e-05, "loss": 0.0149, "step": 76500 }, { "epoch": 1.1, "learning_rate": 1.9632582472221024e-05, "loss": 0.0105, "step": 76510 }, { "epoch": 1.1, "learning_rate": 1.963253443248255e-05, "loss": 0.0111, "step": 76520 }, { "epoch": 1.1, "learning_rate": 1.963248639274408e-05, "loss": 0.0108, "step": 76530 }, { "epoch": 1.1, "learning_rate": 1.9632438353005608e-05, "loss": 0.0175, "step": 76540 }, { "epoch": 1.1, "learning_rate": 1.9632390313267134e-05, "loss": 0.015, "step": 76550 }, { "epoch": 1.1, "learning_rate": 1.9632342273528663e-05, "loss": 0.014, "step": 76560 }, { "epoch": 1.1, "learning_rate": 1.9632294233790193e-05, "loss": 0.0111, "step": 76570 }, { "epoch": 1.1, "learning_rate": 1.9632246194051722e-05, "loss": 0.013, "step": 76580 }, { "epoch": 1.1, "learning_rate": 1.9632198154313248e-05, "loss": 0.013, "step": 76590 }, { "epoch": 1.1, "learning_rate": 1.9632150114574777e-05, "loss": 0.0134, "step": 76600 }, { "epoch": 1.1, "learning_rate": 1.9632102074836306e-05, "loss": 0.0177, "step": 76610 }, { "epoch": 1.1, "learning_rate": 1.9632054035097836e-05, "loss": 0.0132, "step": 76620 }, { "epoch": 1.1, "learning_rate": 1.963200599535936e-05, "loss": 0.0103, "step": 76630 }, { "epoch": 1.1, "learning_rate": 1.963195795562089e-05, "loss": 0.0132, "step": 76640 }, { "epoch": 1.1, "learning_rate": 1.963190991588242e-05, "loss": 0.0137, "step": 76650 }, { "epoch": 1.1, "learning_rate": 1.9631861876143946e-05, "loss": 0.0152, "step": 76660 }, { "epoch": 1.1, "learning_rate": 1.9631813836405475e-05, "loss": 0.0115, "step": 76670 }, { "epoch": 1.11, "learning_rate": 1.9631765796667004e-05, "loss": 0.0137, "step": 76680 }, { "epoch": 1.11, "learning_rate": 1.9631717756928534e-05, "loss": 0.0152, "step": 76690 }, { "epoch": 1.11, "learning_rate": 1.963166971719006e-05, "loss": 0.0151, "step": 76700 }, { "epoch": 1.11, "learning_rate": 1.963162167745159e-05, "loss": 0.0122, "step": 76710 }, { "epoch": 1.11, "learning_rate": 1.9631573637713118e-05, "loss": 0.0115, "step": 76720 }, { "epoch": 1.11, "learning_rate": 1.9631525597974644e-05, "loss": 0.0122, "step": 76730 }, { "epoch": 1.11, "learning_rate": 1.9631477558236173e-05, "loss": 0.0145, "step": 76740 }, { "epoch": 1.11, "learning_rate": 1.9631429518497703e-05, "loss": 0.0133, "step": 76750 }, { "epoch": 1.11, "learning_rate": 1.9631381478759232e-05, "loss": 0.0114, "step": 76760 }, { "epoch": 1.11, "learning_rate": 1.9631333439020758e-05, "loss": 0.0108, "step": 76770 }, { "epoch": 1.11, "learning_rate": 1.9631285399282287e-05, "loss": 0.0175, "step": 76780 }, { "epoch": 1.11, "learning_rate": 1.9631237359543816e-05, "loss": 0.0153, "step": 76790 }, { "epoch": 1.11, "learning_rate": 1.9631189319805345e-05, "loss": 0.0125, "step": 76800 }, { "epoch": 1.11, "learning_rate": 1.963114128006687e-05, "loss": 0.0093, "step": 76810 }, { "epoch": 1.11, "learning_rate": 1.96310932403284e-05, "loss": 0.0159, "step": 76820 }, { "epoch": 1.11, "learning_rate": 1.963104520058993e-05, "loss": 0.0172, "step": 76830 }, { "epoch": 1.11, "learning_rate": 1.9630997160851456e-05, "loss": 0.0139, "step": 76840 }, { "epoch": 1.11, "learning_rate": 1.9630949121112985e-05, "loss": 0.0098, "step": 76850 }, { "epoch": 1.11, "learning_rate": 1.9630901081374514e-05, "loss": 0.0151, "step": 76860 }, { "epoch": 1.11, "learning_rate": 1.9630853041636044e-05, "loss": 0.0115, "step": 76870 }, { "epoch": 1.11, "learning_rate": 1.963080500189757e-05, "loss": 0.0136, "step": 76880 }, { "epoch": 1.11, "learning_rate": 1.96307569621591e-05, "loss": 0.0124, "step": 76890 }, { "epoch": 1.11, "learning_rate": 1.9630708922420628e-05, "loss": 0.0136, "step": 76900 }, { "epoch": 1.11, "learning_rate": 1.9630660882682154e-05, "loss": 0.0115, "step": 76910 }, { "epoch": 1.11, "learning_rate": 1.9630612842943683e-05, "loss": 0.0108, "step": 76920 }, { "epoch": 1.11, "learning_rate": 1.9630564803205212e-05, "loss": 0.0136, "step": 76930 }, { "epoch": 1.11, "learning_rate": 1.963051676346674e-05, "loss": 0.0129, "step": 76940 }, { "epoch": 1.11, "learning_rate": 1.9630468723728268e-05, "loss": 0.0111, "step": 76950 }, { "epoch": 1.11, "learning_rate": 1.9630420683989797e-05, "loss": 0.0109, "step": 76960 }, { "epoch": 1.11, "learning_rate": 1.9630372644251326e-05, "loss": 0.0111, "step": 76970 }, { "epoch": 1.11, "learning_rate": 1.9630324604512855e-05, "loss": 0.0136, "step": 76980 }, { "epoch": 1.11, "learning_rate": 1.963027656477438e-05, "loss": 0.0112, "step": 76990 }, { "epoch": 1.11, "learning_rate": 1.963022852503591e-05, "loss": 0.0096, "step": 77000 }, { "epoch": 1.11, "learning_rate": 1.963018048529744e-05, "loss": 0.0157, "step": 77010 }, { "epoch": 1.11, "learning_rate": 1.9630132445558966e-05, "loss": 0.0127, "step": 77020 }, { "epoch": 1.11, "learning_rate": 1.9630084405820495e-05, "loss": 0.0159, "step": 77030 }, { "epoch": 1.11, "learning_rate": 1.9630036366082024e-05, "loss": 0.0138, "step": 77040 }, { "epoch": 1.11, "learning_rate": 1.9629988326343553e-05, "loss": 0.013, "step": 77050 }, { "epoch": 1.11, "learning_rate": 1.962994028660508e-05, "loss": 0.0139, "step": 77060 }, { "epoch": 1.11, "learning_rate": 1.962989224686661e-05, "loss": 0.0131, "step": 77070 }, { "epoch": 1.11, "learning_rate": 1.9629844207128138e-05, "loss": 0.0147, "step": 77080 }, { "epoch": 1.11, "learning_rate": 1.9629796167389664e-05, "loss": 0.0146, "step": 77090 }, { "epoch": 1.11, "learning_rate": 1.9629748127651193e-05, "loss": 0.0109, "step": 77100 }, { "epoch": 1.11, "learning_rate": 1.9629700087912722e-05, "loss": 0.0143, "step": 77110 }, { "epoch": 1.11, "learning_rate": 1.962965204817425e-05, "loss": 0.0116, "step": 77120 }, { "epoch": 1.11, "learning_rate": 1.9629604008435777e-05, "loss": 0.0121, "step": 77130 }, { "epoch": 1.11, "learning_rate": 1.9629555968697307e-05, "loss": 0.0143, "step": 77140 }, { "epoch": 1.11, "learning_rate": 1.9629507928958836e-05, "loss": 0.0169, "step": 77150 }, { "epoch": 1.11, "learning_rate": 1.9629459889220365e-05, "loss": 0.0119, "step": 77160 }, { "epoch": 1.11, "learning_rate": 1.962941184948189e-05, "loss": 0.0105, "step": 77170 }, { "epoch": 1.11, "learning_rate": 1.962936380974342e-05, "loss": 0.0093, "step": 77180 }, { "epoch": 1.11, "learning_rate": 1.962931577000495e-05, "loss": 0.0114, "step": 77190 }, { "epoch": 1.11, "learning_rate": 1.962926773026648e-05, "loss": 0.0114, "step": 77200 }, { "epoch": 1.11, "learning_rate": 1.9629219690528008e-05, "loss": 0.0104, "step": 77210 }, { "epoch": 1.11, "learning_rate": 1.9629171650789534e-05, "loss": 0.0112, "step": 77220 }, { "epoch": 1.11, "learning_rate": 1.9629123611051063e-05, "loss": 0.0121, "step": 77230 }, { "epoch": 1.11, "learning_rate": 1.9629075571312593e-05, "loss": 0.0196, "step": 77240 }, { "epoch": 1.11, "learning_rate": 1.9629027531574122e-05, "loss": 0.0127, "step": 77250 }, { "epoch": 1.11, "learning_rate": 1.9628979491835648e-05, "loss": 0.0135, "step": 77260 }, { "epoch": 1.11, "learning_rate": 1.9628931452097177e-05, "loss": 0.0125, "step": 77270 }, { "epoch": 1.11, "learning_rate": 1.9628883412358706e-05, "loss": 0.0144, "step": 77280 }, { "epoch": 1.11, "learning_rate": 1.9628835372620236e-05, "loss": 0.0111, "step": 77290 }, { "epoch": 1.11, "learning_rate": 1.962878733288176e-05, "loss": 0.0102, "step": 77300 }, { "epoch": 1.11, "learning_rate": 1.962873929314329e-05, "loss": 0.0151, "step": 77310 }, { "epoch": 1.11, "learning_rate": 1.962869125340482e-05, "loss": 0.0106, "step": 77320 }, { "epoch": 1.11, "learning_rate": 1.9628643213666346e-05, "loss": 0.0117, "step": 77330 }, { "epoch": 1.11, "learning_rate": 1.9628595173927875e-05, "loss": 0.0109, "step": 77340 }, { "epoch": 1.11, "learning_rate": 1.9628547134189404e-05, "loss": 0.0157, "step": 77350 }, { "epoch": 1.11, "learning_rate": 1.9628499094450934e-05, "loss": 0.0134, "step": 77360 }, { "epoch": 1.12, "learning_rate": 1.962845105471246e-05, "loss": 0.0139, "step": 77370 }, { "epoch": 1.12, "learning_rate": 1.962840301497399e-05, "loss": 0.0144, "step": 77380 }, { "epoch": 1.12, "learning_rate": 1.9628354975235518e-05, "loss": 0.0117, "step": 77390 }, { "epoch": 1.12, "learning_rate": 1.9628306935497044e-05, "loss": 0.0103, "step": 77400 }, { "epoch": 1.12, "learning_rate": 1.9628258895758573e-05, "loss": 0.0131, "step": 77410 }, { "epoch": 1.12, "learning_rate": 1.9628210856020103e-05, "loss": 0.0129, "step": 77420 }, { "epoch": 1.12, "learning_rate": 1.9628162816281632e-05, "loss": 0.0135, "step": 77430 }, { "epoch": 1.12, "learning_rate": 1.9628114776543158e-05, "loss": 0.0139, "step": 77440 }, { "epoch": 1.12, "learning_rate": 1.9628066736804687e-05, "loss": 0.0097, "step": 77450 }, { "epoch": 1.12, "learning_rate": 1.9628018697066216e-05, "loss": 0.0129, "step": 77460 }, { "epoch": 1.12, "learning_rate": 1.9627970657327746e-05, "loss": 0.0101, "step": 77470 }, { "epoch": 1.12, "learning_rate": 1.962792261758927e-05, "loss": 0.0184, "step": 77480 }, { "epoch": 1.12, "learning_rate": 1.96278745778508e-05, "loss": 0.012, "step": 77490 }, { "epoch": 1.12, "learning_rate": 1.962782653811233e-05, "loss": 0.0127, "step": 77500 }, { "epoch": 1.12, "learning_rate": 1.9627778498373856e-05, "loss": 0.0134, "step": 77510 }, { "epoch": 1.12, "learning_rate": 1.9627730458635385e-05, "loss": 0.0146, "step": 77520 }, { "epoch": 1.12, "learning_rate": 1.9627682418896914e-05, "loss": 0.0135, "step": 77530 }, { "epoch": 1.12, "learning_rate": 1.9627634379158444e-05, "loss": 0.0174, "step": 77540 }, { "epoch": 1.12, "learning_rate": 1.962758633941997e-05, "loss": 0.0114, "step": 77550 }, { "epoch": 1.12, "learning_rate": 1.96275382996815e-05, "loss": 0.0124, "step": 77560 }, { "epoch": 1.12, "learning_rate": 1.9627490259943028e-05, "loss": 0.0145, "step": 77570 }, { "epoch": 1.12, "learning_rate": 1.9627442220204554e-05, "loss": 0.0117, "step": 77580 }, { "epoch": 1.12, "learning_rate": 1.9627394180466083e-05, "loss": 0.0155, "step": 77590 }, { "epoch": 1.12, "learning_rate": 1.9627346140727613e-05, "loss": 0.0127, "step": 77600 }, { "epoch": 1.12, "learning_rate": 1.9627298100989142e-05, "loss": 0.0092, "step": 77610 }, { "epoch": 1.12, "learning_rate": 1.9627250061250668e-05, "loss": 0.0117, "step": 77620 }, { "epoch": 1.12, "learning_rate": 1.9627202021512197e-05, "loss": 0.0082, "step": 77630 }, { "epoch": 1.12, "learning_rate": 1.9627153981773726e-05, "loss": 0.0175, "step": 77640 }, { "epoch": 1.12, "learning_rate": 1.9627105942035255e-05, "loss": 0.0125, "step": 77650 }, { "epoch": 1.12, "learning_rate": 1.962705790229678e-05, "loss": 0.0147, "step": 77660 }, { "epoch": 1.12, "learning_rate": 1.962700986255831e-05, "loss": 0.0101, "step": 77670 }, { "epoch": 1.12, "learning_rate": 1.962696182281984e-05, "loss": 0.011, "step": 77680 }, { "epoch": 1.12, "learning_rate": 1.9626913783081366e-05, "loss": 0.0103, "step": 77690 }, { "epoch": 1.12, "learning_rate": 1.9626865743342895e-05, "loss": 0.0164, "step": 77700 }, { "epoch": 1.12, "learning_rate": 1.9626817703604424e-05, "loss": 0.0171, "step": 77710 }, { "epoch": 1.12, "learning_rate": 1.9626769663865954e-05, "loss": 0.0083, "step": 77720 }, { "epoch": 1.12, "learning_rate": 1.962672162412748e-05, "loss": 0.0185, "step": 77730 }, { "epoch": 1.12, "learning_rate": 1.962667358438901e-05, "loss": 0.0125, "step": 77740 }, { "epoch": 1.12, "learning_rate": 1.9626625544650538e-05, "loss": 0.0122, "step": 77750 }, { "epoch": 1.12, "learning_rate": 1.9626577504912064e-05, "loss": 0.0128, "step": 77760 }, { "epoch": 1.12, "learning_rate": 1.9626529465173593e-05, "loss": 0.0131, "step": 77770 }, { "epoch": 1.12, "learning_rate": 1.9626481425435122e-05, "loss": 0.0127, "step": 77780 }, { "epoch": 1.12, "learning_rate": 1.962643338569665e-05, "loss": 0.0104, "step": 77790 }, { "epoch": 1.12, "learning_rate": 1.9626385345958178e-05, "loss": 0.0161, "step": 77800 }, { "epoch": 1.12, "learning_rate": 1.9626337306219707e-05, "loss": 0.0146, "step": 77810 }, { "epoch": 1.12, "learning_rate": 1.9626289266481236e-05, "loss": 0.0154, "step": 77820 }, { "epoch": 1.12, "learning_rate": 1.9626241226742765e-05, "loss": 0.0088, "step": 77830 }, { "epoch": 1.12, "learning_rate": 1.962619318700429e-05, "loss": 0.0108, "step": 77840 }, { "epoch": 1.12, "learning_rate": 1.962614514726582e-05, "loss": 0.0132, "step": 77850 }, { "epoch": 1.12, "learning_rate": 1.962609710752735e-05, "loss": 0.0111, "step": 77860 }, { "epoch": 1.12, "learning_rate": 1.9626049067788876e-05, "loss": 0.01, "step": 77870 }, { "epoch": 1.12, "learning_rate": 1.9626001028050405e-05, "loss": 0.0127, "step": 77880 }, { "epoch": 1.12, "learning_rate": 1.9625952988311934e-05, "loss": 0.0127, "step": 77890 }, { "epoch": 1.12, "learning_rate": 1.9625904948573463e-05, "loss": 0.0102, "step": 77900 }, { "epoch": 1.12, "learning_rate": 1.962585690883499e-05, "loss": 0.0109, "step": 77910 }, { "epoch": 1.12, "learning_rate": 1.962580886909652e-05, "loss": 0.0149, "step": 77920 }, { "epoch": 1.12, "learning_rate": 1.9625760829358048e-05, "loss": 0.0124, "step": 77930 }, { "epoch": 1.12, "learning_rate": 1.9625712789619574e-05, "loss": 0.0118, "step": 77940 }, { "epoch": 1.12, "learning_rate": 1.9625664749881103e-05, "loss": 0.0126, "step": 77950 }, { "epoch": 1.12, "learning_rate": 1.9625616710142632e-05, "loss": 0.0106, "step": 77960 }, { "epoch": 1.12, "learning_rate": 1.962556867040416e-05, "loss": 0.0119, "step": 77970 }, { "epoch": 1.12, "learning_rate": 1.9625520630665687e-05, "loss": 0.0153, "step": 77980 }, { "epoch": 1.12, "learning_rate": 1.9625472590927217e-05, "loss": 0.0126, "step": 77990 }, { "epoch": 1.12, "learning_rate": 1.9625424551188746e-05, "loss": 0.0112, "step": 78000 }, { "epoch": 1.12, "learning_rate": 1.9625376511450275e-05, "loss": 0.0116, "step": 78010 }, { "epoch": 1.12, "learning_rate": 1.96253284717118e-05, "loss": 0.0094, "step": 78020 }, { "epoch": 1.12, "learning_rate": 1.962528043197333e-05, "loss": 0.0106, "step": 78030 }, { "epoch": 1.12, "learning_rate": 1.962523239223486e-05, "loss": 0.0163, "step": 78040 }, { "epoch": 1.12, "learning_rate": 1.9625184352496386e-05, "loss": 0.0139, "step": 78050 }, { "epoch": 1.12, "learning_rate": 1.9625136312757915e-05, "loss": 0.0112, "step": 78060 }, { "epoch": 1.13, "learning_rate": 1.9625093076993293e-05, "loss": 0.0103, "step": 78070 }, { "epoch": 1.13, "learning_rate": 1.962504503725482e-05, "loss": 0.0117, "step": 78080 }, { "epoch": 1.13, "learning_rate": 1.9624996997516348e-05, "loss": 0.0173, "step": 78090 }, { "epoch": 1.13, "learning_rate": 1.9624948957777877e-05, "loss": 0.0092, "step": 78100 }, { "epoch": 1.13, "learning_rate": 1.9624900918039403e-05, "loss": 0.0133, "step": 78110 }, { "epoch": 1.13, "learning_rate": 1.9624852878300932e-05, "loss": 0.0121, "step": 78120 }, { "epoch": 1.13, "learning_rate": 1.9624804838562462e-05, "loss": 0.0115, "step": 78130 }, { "epoch": 1.13, "learning_rate": 1.962475679882399e-05, "loss": 0.0138, "step": 78140 }, { "epoch": 1.13, "learning_rate": 1.9624708759085517e-05, "loss": 0.0091, "step": 78150 }, { "epoch": 1.13, "learning_rate": 1.9624660719347046e-05, "loss": 0.0109, "step": 78160 }, { "epoch": 1.13, "learning_rate": 1.9624612679608575e-05, "loss": 0.0128, "step": 78170 }, { "epoch": 1.13, "learning_rate": 1.96245646398701e-05, "loss": 0.0136, "step": 78180 }, { "epoch": 1.13, "learning_rate": 1.962451660013163e-05, "loss": 0.0105, "step": 78190 }, { "epoch": 1.13, "learning_rate": 1.962446856039316e-05, "loss": 0.0138, "step": 78200 }, { "epoch": 1.13, "learning_rate": 1.962442052065469e-05, "loss": 0.0195, "step": 78210 }, { "epoch": 1.13, "learning_rate": 1.9624372480916215e-05, "loss": 0.0127, "step": 78220 }, { "epoch": 1.13, "learning_rate": 1.9624324441177744e-05, "loss": 0.0098, "step": 78230 }, { "epoch": 1.13, "learning_rate": 1.9624276401439274e-05, "loss": 0.0174, "step": 78240 }, { "epoch": 1.13, "learning_rate": 1.9624228361700803e-05, "loss": 0.0162, "step": 78250 }, { "epoch": 1.13, "learning_rate": 1.962418032196233e-05, "loss": 0.0117, "step": 78260 }, { "epoch": 1.13, "learning_rate": 1.9624132282223858e-05, "loss": 0.0156, "step": 78270 }, { "epoch": 1.13, "learning_rate": 1.9624084242485387e-05, "loss": 0.021, "step": 78280 }, { "epoch": 1.13, "learning_rate": 1.9624036202746913e-05, "loss": 0.0114, "step": 78290 }, { "epoch": 1.13, "learning_rate": 1.9623988163008442e-05, "loss": 0.0083, "step": 78300 }, { "epoch": 1.13, "learning_rate": 1.962394012326997e-05, "loss": 0.0147, "step": 78310 }, { "epoch": 1.13, "learning_rate": 1.96238920835315e-05, "loss": 0.0126, "step": 78320 }, { "epoch": 1.13, "learning_rate": 1.9623844043793027e-05, "loss": 0.0085, "step": 78330 }, { "epoch": 1.13, "learning_rate": 1.9623796004054556e-05, "loss": 0.0073, "step": 78340 }, { "epoch": 1.13, "learning_rate": 1.9623747964316085e-05, "loss": 0.0124, "step": 78350 }, { "epoch": 1.13, "learning_rate": 1.962369992457761e-05, "loss": 0.0108, "step": 78360 }, { "epoch": 1.13, "learning_rate": 1.962365188483914e-05, "loss": 0.0126, "step": 78370 }, { "epoch": 1.13, "learning_rate": 1.962360384510067e-05, "loss": 0.0157, "step": 78380 }, { "epoch": 1.13, "learning_rate": 1.96235558053622e-05, "loss": 0.0142, "step": 78390 }, { "epoch": 1.13, "learning_rate": 1.9623507765623725e-05, "loss": 0.0101, "step": 78400 }, { "epoch": 1.13, "learning_rate": 1.9623459725885254e-05, "loss": 0.0077, "step": 78410 }, { "epoch": 1.13, "learning_rate": 1.9623411686146783e-05, "loss": 0.0135, "step": 78420 }, { "epoch": 1.13, "learning_rate": 1.9623363646408313e-05, "loss": 0.0155, "step": 78430 }, { "epoch": 1.13, "learning_rate": 1.962331560666984e-05, "loss": 0.0114, "step": 78440 }, { "epoch": 1.13, "learning_rate": 1.9623267566931368e-05, "loss": 0.0149, "step": 78450 }, { "epoch": 1.13, "learning_rate": 1.9623219527192897e-05, "loss": 0.0119, "step": 78460 }, { "epoch": 1.13, "learning_rate": 1.9623171487454423e-05, "loss": 0.0172, "step": 78470 }, { "epoch": 1.13, "learning_rate": 1.9623123447715952e-05, "loss": 0.0098, "step": 78480 }, { "epoch": 1.13, "learning_rate": 1.962307540797748e-05, "loss": 0.0154, "step": 78490 }, { "epoch": 1.13, "learning_rate": 1.962302736823901e-05, "loss": 0.0113, "step": 78500 }, { "epoch": 1.13, "learning_rate": 1.9622979328500537e-05, "loss": 0.0146, "step": 78510 }, { "epoch": 1.13, "learning_rate": 1.9622931288762066e-05, "loss": 0.0139, "step": 78520 }, { "epoch": 1.13, "learning_rate": 1.9622883249023595e-05, "loss": 0.0102, "step": 78530 }, { "epoch": 1.13, "learning_rate": 1.962283520928512e-05, "loss": 0.0143, "step": 78540 }, { "epoch": 1.13, "learning_rate": 1.96227919735205e-05, "loss": 0.0141, "step": 78550 }, { "epoch": 1.13, "learning_rate": 1.962274393378203e-05, "loss": 0.0177, "step": 78560 }, { "epoch": 1.13, "learning_rate": 1.9622695894043554e-05, "loss": 0.0128, "step": 78570 }, { "epoch": 1.13, "learning_rate": 1.9622647854305084e-05, "loss": 0.017, "step": 78580 }, { "epoch": 1.13, "learning_rate": 1.9622599814566613e-05, "loss": 0.0133, "step": 78590 }, { "epoch": 1.13, "learning_rate": 1.962255177482814e-05, "loss": 0.0155, "step": 78600 }, { "epoch": 1.13, "learning_rate": 1.9622503735089668e-05, "loss": 0.012, "step": 78610 }, { "epoch": 1.13, "learning_rate": 1.9622455695351197e-05, "loss": 0.0117, "step": 78620 }, { "epoch": 1.13, "learning_rate": 1.9622407655612727e-05, "loss": 0.0138, "step": 78630 }, { "epoch": 1.13, "learning_rate": 1.9622359615874252e-05, "loss": 0.0134, "step": 78640 }, { "epoch": 1.13, "learning_rate": 1.9622311576135782e-05, "loss": 0.0122, "step": 78650 }, { "epoch": 1.13, "learning_rate": 1.962226353639731e-05, "loss": 0.0128, "step": 78660 }, { "epoch": 1.13, "learning_rate": 1.9622215496658837e-05, "loss": 0.0136, "step": 78670 }, { "epoch": 1.13, "learning_rate": 1.9622167456920366e-05, "loss": 0.0192, "step": 78680 }, { "epoch": 1.13, "learning_rate": 1.9622119417181895e-05, "loss": 0.015, "step": 78690 }, { "epoch": 1.13, "learning_rate": 1.9622071377443425e-05, "loss": 0.0121, "step": 78700 }, { "epoch": 1.13, "learning_rate": 1.962202333770495e-05, "loss": 0.012, "step": 78710 }, { "epoch": 1.13, "learning_rate": 1.962197529796648e-05, "loss": 0.0158, "step": 78720 }, { "epoch": 1.13, "learning_rate": 1.962192725822801e-05, "loss": 0.0115, "step": 78730 }, { "epoch": 1.13, "learning_rate": 1.962187921848954e-05, "loss": 0.0139, "step": 78740 }, { "epoch": 1.13, "learning_rate": 1.9621831178751064e-05, "loss": 0.0174, "step": 78750 }, { "epoch": 1.14, "learning_rate": 1.9621783139012594e-05, "loss": 0.0121, "step": 78760 }, { "epoch": 1.14, "learning_rate": 1.9621735099274123e-05, "loss": 0.0124, "step": 78770 }, { "epoch": 1.14, "learning_rate": 1.962168705953565e-05, "loss": 0.0112, "step": 78780 }, { "epoch": 1.14, "learning_rate": 1.9621639019797178e-05, "loss": 0.0138, "step": 78790 }, { "epoch": 1.14, "learning_rate": 1.9621590980058707e-05, "loss": 0.0098, "step": 78800 }, { "epoch": 1.14, "learning_rate": 1.9621542940320236e-05, "loss": 0.0108, "step": 78810 }, { "epoch": 1.14, "learning_rate": 1.9621494900581762e-05, "loss": 0.0113, "step": 78820 }, { "epoch": 1.14, "learning_rate": 1.962144686084329e-05, "loss": 0.014, "step": 78830 }, { "epoch": 1.14, "learning_rate": 1.962139882110482e-05, "loss": 0.0123, "step": 78840 }, { "epoch": 1.14, "learning_rate": 1.9621350781366347e-05, "loss": 0.0139, "step": 78850 }, { "epoch": 1.14, "learning_rate": 1.9621302741627876e-05, "loss": 0.017, "step": 78860 }, { "epoch": 1.14, "learning_rate": 1.9621254701889405e-05, "loss": 0.0132, "step": 78870 }, { "epoch": 1.14, "learning_rate": 1.9621206662150935e-05, "loss": 0.0112, "step": 78880 }, { "epoch": 1.14, "learning_rate": 1.962115862241246e-05, "loss": 0.0112, "step": 78890 }, { "epoch": 1.14, "learning_rate": 1.962111058267399e-05, "loss": 0.0153, "step": 78900 }, { "epoch": 1.14, "learning_rate": 1.962106254293552e-05, "loss": 0.0124, "step": 78910 }, { "epoch": 1.14, "learning_rate": 1.9621014503197048e-05, "loss": 0.0141, "step": 78920 }, { "epoch": 1.14, "learning_rate": 1.9620966463458574e-05, "loss": 0.0145, "step": 78930 }, { "epoch": 1.14, "learning_rate": 1.9620918423720103e-05, "loss": 0.0178, "step": 78940 }, { "epoch": 1.14, "learning_rate": 1.9620870383981633e-05, "loss": 0.0151, "step": 78950 }, { "epoch": 1.14, "learning_rate": 1.962082234424316e-05, "loss": 0.0106, "step": 78960 }, { "epoch": 1.14, "learning_rate": 1.9620774304504688e-05, "loss": 0.0126, "step": 78970 }, { "epoch": 1.14, "learning_rate": 1.9620726264766217e-05, "loss": 0.0068, "step": 78980 }, { "epoch": 1.14, "learning_rate": 1.9620678225027746e-05, "loss": 0.0153, "step": 78990 }, { "epoch": 1.14, "learning_rate": 1.9620630185289272e-05, "loss": 0.0138, "step": 79000 }, { "epoch": 1.14, "learning_rate": 1.96205821455508e-05, "loss": 0.0158, "step": 79010 }, { "epoch": 1.14, "learning_rate": 1.962053410581233e-05, "loss": 0.0099, "step": 79020 }, { "epoch": 1.14, "learning_rate": 1.9620486066073857e-05, "loss": 0.0104, "step": 79030 }, { "epoch": 1.14, "learning_rate": 1.9620438026335386e-05, "loss": 0.0154, "step": 79040 }, { "epoch": 1.14, "learning_rate": 1.9620389986596915e-05, "loss": 0.0134, "step": 79050 }, { "epoch": 1.14, "learning_rate": 1.9620341946858445e-05, "loss": 0.0139, "step": 79060 }, { "epoch": 1.14, "learning_rate": 1.962029390711997e-05, "loss": 0.0123, "step": 79070 }, { "epoch": 1.14, "learning_rate": 1.96202458673815e-05, "loss": 0.0146, "step": 79080 }, { "epoch": 1.14, "learning_rate": 1.962019782764303e-05, "loss": 0.0107, "step": 79090 }, { "epoch": 1.14, "learning_rate": 1.9620149787904558e-05, "loss": 0.0139, "step": 79100 }, { "epoch": 1.14, "learning_rate": 1.9620101748166084e-05, "loss": 0.0127, "step": 79110 }, { "epoch": 1.14, "learning_rate": 1.9620053708427613e-05, "loss": 0.0183, "step": 79120 }, { "epoch": 1.14, "learning_rate": 1.9620005668689143e-05, "loss": 0.0128, "step": 79130 }, { "epoch": 1.14, "learning_rate": 1.961995762895067e-05, "loss": 0.0105, "step": 79140 }, { "epoch": 1.14, "learning_rate": 1.9619909589212198e-05, "loss": 0.0179, "step": 79150 }, { "epoch": 1.14, "learning_rate": 1.9619861549473727e-05, "loss": 0.0187, "step": 79160 }, { "epoch": 1.14, "learning_rate": 1.9619813509735256e-05, "loss": 0.0135, "step": 79170 }, { "epoch": 1.14, "learning_rate": 1.9619765469996782e-05, "loss": 0.0094, "step": 79180 }, { "epoch": 1.14, "learning_rate": 1.961971743025831e-05, "loss": 0.016, "step": 79190 }, { "epoch": 1.14, "learning_rate": 1.961966939051984e-05, "loss": 0.015, "step": 79200 }, { "epoch": 1.14, "learning_rate": 1.9619621350781367e-05, "loss": 0.0166, "step": 79210 }, { "epoch": 1.14, "learning_rate": 1.9619573311042896e-05, "loss": 0.0123, "step": 79220 }, { "epoch": 1.14, "learning_rate": 1.9619525271304425e-05, "loss": 0.0098, "step": 79230 }, { "epoch": 1.14, "learning_rate": 1.9619477231565954e-05, "loss": 0.0151, "step": 79240 }, { "epoch": 1.14, "learning_rate": 1.961942919182748e-05, "loss": 0.0128, "step": 79250 }, { "epoch": 1.14, "learning_rate": 1.961938115208901e-05, "loss": 0.0104, "step": 79260 }, { "epoch": 1.14, "learning_rate": 1.961933311235054e-05, "loss": 0.0099, "step": 79270 }, { "epoch": 1.14, "learning_rate": 1.9619285072612068e-05, "loss": 0.0136, "step": 79280 }, { "epoch": 1.14, "learning_rate": 1.9619237032873594e-05, "loss": 0.0072, "step": 79290 }, { "epoch": 1.14, "learning_rate": 1.9619188993135123e-05, "loss": 0.0111, "step": 79300 }, { "epoch": 1.14, "learning_rate": 1.9619140953396653e-05, "loss": 0.0106, "step": 79310 }, { "epoch": 1.14, "learning_rate": 1.961909291365818e-05, "loss": 0.0139, "step": 79320 }, { "epoch": 1.14, "learning_rate": 1.9619044873919708e-05, "loss": 0.0094, "step": 79330 }, { "epoch": 1.14, "learning_rate": 1.9618996834181237e-05, "loss": 0.0077, "step": 79340 }, { "epoch": 1.14, "learning_rate": 1.9618948794442766e-05, "loss": 0.0127, "step": 79350 }, { "epoch": 1.14, "learning_rate": 1.9618900754704292e-05, "loss": 0.0099, "step": 79360 }, { "epoch": 1.14, "learning_rate": 1.961885271496582e-05, "loss": 0.0095, "step": 79370 }, { "epoch": 1.14, "learning_rate": 1.961880467522735e-05, "loss": 0.0174, "step": 79380 }, { "epoch": 1.14, "learning_rate": 1.9618756635488877e-05, "loss": 0.01, "step": 79390 }, { "epoch": 1.14, "learning_rate": 1.9618708595750406e-05, "loss": 0.0115, "step": 79400 }, { "epoch": 1.14, "learning_rate": 1.9618660556011935e-05, "loss": 0.0147, "step": 79410 }, { "epoch": 1.14, "learning_rate": 1.9618612516273464e-05, "loss": 0.0129, "step": 79420 }, { "epoch": 1.14, "learning_rate": 1.961856447653499e-05, "loss": 0.0151, "step": 79430 }, { "epoch": 1.14, "learning_rate": 1.961851643679652e-05, "loss": 0.0135, "step": 79440 }, { "epoch": 1.15, "learning_rate": 1.961846839705805e-05, "loss": 0.0149, "step": 79450 }, { "epoch": 1.15, "learning_rate": 1.9618420357319578e-05, "loss": 0.0118, "step": 79460 }, { "epoch": 1.15, "learning_rate": 1.9618372317581104e-05, "loss": 0.0159, "step": 79470 }, { "epoch": 1.15, "learning_rate": 1.9618324277842633e-05, "loss": 0.0115, "step": 79480 }, { "epoch": 1.15, "learning_rate": 1.9618276238104162e-05, "loss": 0.0104, "step": 79490 }, { "epoch": 1.15, "learning_rate": 1.961822819836569e-05, "loss": 0.0088, "step": 79500 }, { "epoch": 1.15, "learning_rate": 1.9618180158627218e-05, "loss": 0.0143, "step": 79510 }, { "epoch": 1.15, "learning_rate": 1.9618132118888747e-05, "loss": 0.0133, "step": 79520 }, { "epoch": 1.15, "learning_rate": 1.9618084079150276e-05, "loss": 0.0116, "step": 79530 }, { "epoch": 1.15, "learning_rate": 1.9618036039411802e-05, "loss": 0.01, "step": 79540 }, { "epoch": 1.15, "learning_rate": 1.961798799967333e-05, "loss": 0.0122, "step": 79550 }, { "epoch": 1.15, "learning_rate": 1.961793995993486e-05, "loss": 0.0122, "step": 79560 }, { "epoch": 1.15, "learning_rate": 1.9617891920196386e-05, "loss": 0.0134, "step": 79570 }, { "epoch": 1.15, "learning_rate": 1.9617843880457916e-05, "loss": 0.0279, "step": 79580 }, { "epoch": 1.15, "learning_rate": 1.9617795840719445e-05, "loss": 0.0138, "step": 79590 }, { "epoch": 1.15, "learning_rate": 1.9617747800980974e-05, "loss": 0.0116, "step": 79600 }, { "epoch": 1.15, "learning_rate": 1.96176997612425e-05, "loss": 0.0122, "step": 79610 }, { "epoch": 1.15, "learning_rate": 1.961765172150403e-05, "loss": 0.0123, "step": 79620 }, { "epoch": 1.15, "learning_rate": 1.961760368176556e-05, "loss": 0.014, "step": 79630 }, { "epoch": 1.15, "learning_rate": 1.9617555642027088e-05, "loss": 0.0113, "step": 79640 }, { "epoch": 1.15, "learning_rate": 1.9617507602288614e-05, "loss": 0.0162, "step": 79650 }, { "epoch": 1.15, "learning_rate": 1.9617459562550143e-05, "loss": 0.0117, "step": 79660 }, { "epoch": 1.15, "learning_rate": 1.9617411522811672e-05, "loss": 0.0108, "step": 79670 }, { "epoch": 1.15, "learning_rate": 1.9617363483073198e-05, "loss": 0.0129, "step": 79680 }, { "epoch": 1.15, "learning_rate": 1.9617315443334728e-05, "loss": 0.012, "step": 79690 }, { "epoch": 1.15, "learning_rate": 1.9617267403596257e-05, "loss": 0.0118, "step": 79700 }, { "epoch": 1.15, "learning_rate": 1.9617219363857786e-05, "loss": 0.0101, "step": 79710 }, { "epoch": 1.15, "learning_rate": 1.9617171324119312e-05, "loss": 0.0134, "step": 79720 }, { "epoch": 1.15, "learning_rate": 1.961712328438084e-05, "loss": 0.0182, "step": 79730 }, { "epoch": 1.15, "learning_rate": 1.961707524464237e-05, "loss": 0.0131, "step": 79740 }, { "epoch": 1.15, "learning_rate": 1.9617027204903896e-05, "loss": 0.0117, "step": 79750 }, { "epoch": 1.15, "learning_rate": 1.9616979165165426e-05, "loss": 0.0207, "step": 79760 }, { "epoch": 1.15, "learning_rate": 1.9616931125426955e-05, "loss": 0.0153, "step": 79770 }, { "epoch": 1.15, "learning_rate": 1.9616883085688484e-05, "loss": 0.0136, "step": 79780 }, { "epoch": 1.15, "learning_rate": 1.961683504595001e-05, "loss": 0.0123, "step": 79790 }, { "epoch": 1.15, "learning_rate": 1.961678700621154e-05, "loss": 0.0127, "step": 79800 }, { "epoch": 1.15, "learning_rate": 1.961673896647307e-05, "loss": 0.0102, "step": 79810 }, { "epoch": 1.15, "learning_rate": 1.9616690926734598e-05, "loss": 0.0111, "step": 79820 }, { "epoch": 1.15, "learning_rate": 1.9616642886996124e-05, "loss": 0.0138, "step": 79830 }, { "epoch": 1.15, "learning_rate": 1.9616594847257653e-05, "loss": 0.015, "step": 79840 }, { "epoch": 1.15, "learning_rate": 1.9616546807519182e-05, "loss": 0.015, "step": 79850 }, { "epoch": 1.15, "learning_rate": 1.9616498767780708e-05, "loss": 0.0155, "step": 79860 }, { "epoch": 1.15, "learning_rate": 1.9616450728042237e-05, "loss": 0.0118, "step": 79870 }, { "epoch": 1.15, "learning_rate": 1.9616402688303767e-05, "loss": 0.0098, "step": 79880 }, { "epoch": 1.15, "learning_rate": 1.9616354648565296e-05, "loss": 0.0117, "step": 79890 }, { "epoch": 1.15, "learning_rate": 1.9616306608826822e-05, "loss": 0.011, "step": 79900 }, { "epoch": 1.15, "learning_rate": 1.961625856908835e-05, "loss": 0.009, "step": 79910 }, { "epoch": 1.15, "learning_rate": 1.961621052934988e-05, "loss": 0.0134, "step": 79920 }, { "epoch": 1.15, "learning_rate": 1.9616162489611406e-05, "loss": 0.0099, "step": 79930 }, { "epoch": 1.15, "learning_rate": 1.9616114449872936e-05, "loss": 0.0107, "step": 79940 }, { "epoch": 1.15, "learning_rate": 1.9616066410134465e-05, "loss": 0.0139, "step": 79950 }, { "epoch": 1.15, "learning_rate": 1.9616018370395994e-05, "loss": 0.0135, "step": 79960 }, { "epoch": 1.15, "learning_rate": 1.961597033065752e-05, "loss": 0.01, "step": 79970 }, { "epoch": 1.15, "learning_rate": 1.961592229091905e-05, "loss": 0.0128, "step": 79980 }, { "epoch": 1.15, "learning_rate": 1.961587425118058e-05, "loss": 0.0102, "step": 79990 }, { "epoch": 1.15, "learning_rate": 1.9615826211442108e-05, "loss": 0.0104, "step": 80000 }, { "epoch": 1.15, "learning_rate": 1.9615778171703634e-05, "loss": 0.0104, "step": 80010 }, { "epoch": 1.15, "learning_rate": 1.9615730131965163e-05, "loss": 0.0115, "step": 80020 }, { "epoch": 1.15, "learning_rate": 1.9615682092226692e-05, "loss": 0.0121, "step": 80030 }, { "epoch": 1.15, "learning_rate": 1.9615634052488218e-05, "loss": 0.0116, "step": 80040 }, { "epoch": 1.15, "learning_rate": 1.9615586012749747e-05, "loss": 0.0111, "step": 80050 }, { "epoch": 1.15, "learning_rate": 1.9615537973011277e-05, "loss": 0.0108, "step": 80060 }, { "epoch": 1.15, "learning_rate": 1.9615489933272806e-05, "loss": 0.014, "step": 80070 }, { "epoch": 1.15, "learning_rate": 1.9615441893534332e-05, "loss": 0.0142, "step": 80080 }, { "epoch": 1.15, "learning_rate": 1.961539385379586e-05, "loss": 0.0127, "step": 80090 }, { "epoch": 1.15, "learning_rate": 1.961534581405739e-05, "loss": 0.017, "step": 80100 }, { "epoch": 1.15, "learning_rate": 1.9615297774318916e-05, "loss": 0.0122, "step": 80110 }, { "epoch": 1.15, "learning_rate": 1.9615249734580445e-05, "loss": 0.0129, "step": 80120 }, { "epoch": 1.15, "learning_rate": 1.9615201694841975e-05, "loss": 0.0133, "step": 80130 }, { "epoch": 1.15, "learning_rate": 1.9615153655103504e-05, "loss": 0.015, "step": 80140 }, { "epoch": 1.16, "learning_rate": 1.961510561536503e-05, "loss": 0.0113, "step": 80150 }, { "epoch": 1.16, "learning_rate": 1.961505757562656e-05, "loss": 0.0196, "step": 80160 }, { "epoch": 1.16, "learning_rate": 1.961500953588809e-05, "loss": 0.0132, "step": 80170 }, { "epoch": 1.16, "learning_rate": 1.9614961496149614e-05, "loss": 0.0142, "step": 80180 }, { "epoch": 1.16, "learning_rate": 1.9614913456411144e-05, "loss": 0.0116, "step": 80190 }, { "epoch": 1.16, "learning_rate": 1.9614865416672673e-05, "loss": 0.0107, "step": 80200 }, { "epoch": 1.16, "learning_rate": 1.9614817376934202e-05, "loss": 0.0147, "step": 80210 }, { "epoch": 1.16, "learning_rate": 1.9614769337195728e-05, "loss": 0.0142, "step": 80220 }, { "epoch": 1.16, "learning_rate": 1.9614721297457257e-05, "loss": 0.0114, "step": 80230 }, { "epoch": 1.16, "learning_rate": 1.9614673257718787e-05, "loss": 0.0123, "step": 80240 }, { "epoch": 1.16, "learning_rate": 1.9614625217980316e-05, "loss": 0.0104, "step": 80250 }, { "epoch": 1.16, "learning_rate": 1.961457717824184e-05, "loss": 0.0108, "step": 80260 }, { "epoch": 1.16, "learning_rate": 1.961452913850337e-05, "loss": 0.015, "step": 80270 }, { "epoch": 1.16, "learning_rate": 1.96144810987649e-05, "loss": 0.0119, "step": 80280 }, { "epoch": 1.16, "learning_rate": 1.9614433059026426e-05, "loss": 0.0141, "step": 80290 }, { "epoch": 1.16, "learning_rate": 1.9614385019287955e-05, "loss": 0.0108, "step": 80300 }, { "epoch": 1.16, "learning_rate": 1.9614336979549485e-05, "loss": 0.0118, "step": 80310 }, { "epoch": 1.16, "learning_rate": 1.9614288939811014e-05, "loss": 0.0109, "step": 80320 }, { "epoch": 1.16, "learning_rate": 1.961424090007254e-05, "loss": 0.0125, "step": 80330 }, { "epoch": 1.16, "learning_rate": 1.961419286033407e-05, "loss": 0.0145, "step": 80340 }, { "epoch": 1.16, "learning_rate": 1.96141448205956e-05, "loss": 0.0126, "step": 80350 }, { "epoch": 1.16, "learning_rate": 1.9614096780857124e-05, "loss": 0.0111, "step": 80360 }, { "epoch": 1.16, "learning_rate": 1.9614048741118653e-05, "loss": 0.012, "step": 80370 }, { "epoch": 1.16, "learning_rate": 1.9614000701380183e-05, "loss": 0.0107, "step": 80380 }, { "epoch": 1.16, "learning_rate": 1.9613952661641712e-05, "loss": 0.0105, "step": 80390 }, { "epoch": 1.16, "learning_rate": 1.9613904621903238e-05, "loss": 0.0139, "step": 80400 }, { "epoch": 1.16, "learning_rate": 1.9613856582164767e-05, "loss": 0.0131, "step": 80410 }, { "epoch": 1.16, "learning_rate": 1.9613808542426296e-05, "loss": 0.0144, "step": 80420 }, { "epoch": 1.16, "learning_rate": 1.9613760502687826e-05, "loss": 0.0129, "step": 80430 }, { "epoch": 1.16, "learning_rate": 1.961371246294935e-05, "loss": 0.0111, "step": 80440 }, { "epoch": 1.16, "learning_rate": 1.961366442321088e-05, "loss": 0.0174, "step": 80450 }, { "epoch": 1.16, "learning_rate": 1.961361638347241e-05, "loss": 0.0131, "step": 80460 }, { "epoch": 1.16, "learning_rate": 1.9613568343733936e-05, "loss": 0.0131, "step": 80470 }, { "epoch": 1.16, "learning_rate": 1.9613520303995465e-05, "loss": 0.0147, "step": 80480 }, { "epoch": 1.16, "learning_rate": 1.9613472264256995e-05, "loss": 0.0112, "step": 80490 }, { "epoch": 1.16, "learning_rate": 1.9613424224518524e-05, "loss": 0.0134, "step": 80500 }, { "epoch": 1.16, "learning_rate": 1.961337618478005e-05, "loss": 0.0128, "step": 80510 }, { "epoch": 1.16, "learning_rate": 1.961332814504158e-05, "loss": 0.0164, "step": 80520 }, { "epoch": 1.16, "learning_rate": 1.9613280105303108e-05, "loss": 0.011, "step": 80530 }, { "epoch": 1.16, "learning_rate": 1.9613232065564634e-05, "loss": 0.0089, "step": 80540 }, { "epoch": 1.16, "learning_rate": 1.9613184025826163e-05, "loss": 0.0119, "step": 80550 }, { "epoch": 1.16, "learning_rate": 1.9613135986087693e-05, "loss": 0.0115, "step": 80560 }, { "epoch": 1.16, "learning_rate": 1.9613087946349222e-05, "loss": 0.0126, "step": 80570 }, { "epoch": 1.16, "learning_rate": 1.9613039906610748e-05, "loss": 0.0114, "step": 80580 }, { "epoch": 1.16, "learning_rate": 1.9612991866872277e-05, "loss": 0.0099, "step": 80590 }, { "epoch": 1.16, "learning_rate": 1.9612943827133806e-05, "loss": 0.0116, "step": 80600 }, { "epoch": 1.16, "learning_rate": 1.9612895787395336e-05, "loss": 0.0169, "step": 80610 }, { "epoch": 1.16, "learning_rate": 1.961284774765686e-05, "loss": 0.0111, "step": 80620 }, { "epoch": 1.16, "learning_rate": 1.961279970791839e-05, "loss": 0.0102, "step": 80630 }, { "epoch": 1.16, "learning_rate": 1.961275166817992e-05, "loss": 0.0145, "step": 80640 }, { "epoch": 1.16, "learning_rate": 1.9612703628441446e-05, "loss": 0.0113, "step": 80650 }, { "epoch": 1.16, "learning_rate": 1.9612655588702975e-05, "loss": 0.0147, "step": 80660 }, { "epoch": 1.16, "learning_rate": 1.9612607548964504e-05, "loss": 0.0156, "step": 80670 }, { "epoch": 1.16, "learning_rate": 1.9612559509226034e-05, "loss": 0.0136, "step": 80680 }, { "epoch": 1.16, "learning_rate": 1.961251146948756e-05, "loss": 0.0145, "step": 80690 }, { "epoch": 1.16, "learning_rate": 1.961246342974909e-05, "loss": 0.0102, "step": 80700 }, { "epoch": 1.16, "learning_rate": 1.9612415390010618e-05, "loss": 0.0131, "step": 80710 }, { "epoch": 1.16, "learning_rate": 1.9612367350272144e-05, "loss": 0.0115, "step": 80720 }, { "epoch": 1.16, "learning_rate": 1.9612319310533673e-05, "loss": 0.0125, "step": 80730 }, { "epoch": 1.16, "learning_rate": 1.9612271270795203e-05, "loss": 0.0188, "step": 80740 }, { "epoch": 1.16, "learning_rate": 1.9612223231056732e-05, "loss": 0.0142, "step": 80750 }, { "epoch": 1.16, "learning_rate": 1.9612175191318258e-05, "loss": 0.0147, "step": 80760 }, { "epoch": 1.16, "learning_rate": 1.9612127151579787e-05, "loss": 0.0141, "step": 80770 }, { "epoch": 1.16, "learning_rate": 1.9612079111841316e-05, "loss": 0.016, "step": 80780 }, { "epoch": 1.16, "learning_rate": 1.9612031072102846e-05, "loss": 0.008, "step": 80790 }, { "epoch": 1.16, "learning_rate": 1.9611983032364375e-05, "loss": 0.0118, "step": 80800 }, { "epoch": 1.16, "learning_rate": 1.9611934992625904e-05, "loss": 0.0135, "step": 80810 }, { "epoch": 1.16, "learning_rate": 1.961188695288743e-05, "loss": 0.0135, "step": 80820 }, { "epoch": 1.16, "learning_rate": 1.961183891314896e-05, "loss": 0.0128, "step": 80830 }, { "epoch": 1.17, "learning_rate": 1.961179087341049e-05, "loss": 0.009, "step": 80840 }, { "epoch": 1.17, "learning_rate": 1.9611742833672018e-05, "loss": 0.0096, "step": 80850 }, { "epoch": 1.17, "learning_rate": 1.9611694793933544e-05, "loss": 0.0146, "step": 80860 }, { "epoch": 1.17, "learning_rate": 1.9611646754195073e-05, "loss": 0.0119, "step": 80870 }, { "epoch": 1.17, "learning_rate": 1.9611598714456602e-05, "loss": 0.0115, "step": 80880 }, { "epoch": 1.17, "learning_rate": 1.9611550674718128e-05, "loss": 0.0101, "step": 80890 }, { "epoch": 1.17, "learning_rate": 1.9611502634979657e-05, "loss": 0.0156, "step": 80900 }, { "epoch": 1.17, "learning_rate": 1.9611454595241187e-05, "loss": 0.0142, "step": 80910 }, { "epoch": 1.17, "learning_rate": 1.9611406555502716e-05, "loss": 0.0108, "step": 80920 }, { "epoch": 1.17, "learning_rate": 1.9611358515764242e-05, "loss": 0.0133, "step": 80930 }, { "epoch": 1.17, "learning_rate": 1.961131047602577e-05, "loss": 0.0149, "step": 80940 }, { "epoch": 1.17, "learning_rate": 1.96112624362873e-05, "loss": 0.0169, "step": 80950 }, { "epoch": 1.17, "learning_rate": 1.9611214396548826e-05, "loss": 0.0106, "step": 80960 }, { "epoch": 1.17, "learning_rate": 1.9611166356810355e-05, "loss": 0.0154, "step": 80970 }, { "epoch": 1.17, "learning_rate": 1.9611118317071885e-05, "loss": 0.0095, "step": 80980 }, { "epoch": 1.17, "learning_rate": 1.9611070277333414e-05, "loss": 0.0106, "step": 80990 }, { "epoch": 1.17, "learning_rate": 1.961102223759494e-05, "loss": 0.0108, "step": 81000 }, { "epoch": 1.17, "learning_rate": 1.961097419785647e-05, "loss": 0.0098, "step": 81010 }, { "epoch": 1.17, "learning_rate": 1.9610926158118e-05, "loss": 0.0157, "step": 81020 }, { "epoch": 1.17, "learning_rate": 1.9610878118379528e-05, "loss": 0.0106, "step": 81030 }, { "epoch": 1.17, "learning_rate": 1.9610830078641054e-05, "loss": 0.0168, "step": 81040 }, { "epoch": 1.17, "learning_rate": 1.9610782038902583e-05, "loss": 0.0109, "step": 81050 }, { "epoch": 1.17, "learning_rate": 1.9610733999164112e-05, "loss": 0.02, "step": 81060 }, { "epoch": 1.17, "learning_rate": 1.9610685959425638e-05, "loss": 0.0187, "step": 81070 }, { "epoch": 1.17, "learning_rate": 1.9610637919687167e-05, "loss": 0.0121, "step": 81080 }, { "epoch": 1.17, "learning_rate": 1.9610589879948697e-05, "loss": 0.0125, "step": 81090 }, { "epoch": 1.17, "learning_rate": 1.9610541840210226e-05, "loss": 0.0153, "step": 81100 }, { "epoch": 1.17, "learning_rate": 1.961049380047175e-05, "loss": 0.0106, "step": 81110 }, { "epoch": 1.17, "learning_rate": 1.961044576073328e-05, "loss": 0.0109, "step": 81120 }, { "epoch": 1.17, "learning_rate": 1.961039772099481e-05, "loss": 0.0138, "step": 81130 }, { "epoch": 1.17, "learning_rate": 1.9610349681256336e-05, "loss": 0.0163, "step": 81140 }, { "epoch": 1.17, "learning_rate": 1.9610301641517865e-05, "loss": 0.0123, "step": 81150 }, { "epoch": 1.17, "learning_rate": 1.9610253601779395e-05, "loss": 0.0153, "step": 81160 }, { "epoch": 1.17, "learning_rate": 1.9610205562040924e-05, "loss": 0.0221, "step": 81170 }, { "epoch": 1.17, "learning_rate": 1.961015752230245e-05, "loss": 0.0123, "step": 81180 }, { "epoch": 1.17, "learning_rate": 1.961010948256398e-05, "loss": 0.0118, "step": 81190 }, { "epoch": 1.17, "learning_rate": 1.961006144282551e-05, "loss": 0.0131, "step": 81200 }, { "epoch": 1.17, "learning_rate": 1.9610013403087038e-05, "loss": 0.012, "step": 81210 }, { "epoch": 1.17, "learning_rate": 1.9609965363348563e-05, "loss": 0.0151, "step": 81220 }, { "epoch": 1.17, "learning_rate": 1.9609917323610093e-05, "loss": 0.0156, "step": 81230 }, { "epoch": 1.17, "learning_rate": 1.9609869283871622e-05, "loss": 0.0139, "step": 81240 }, { "epoch": 1.17, "learning_rate": 1.9609821244133148e-05, "loss": 0.0103, "step": 81250 }, { "epoch": 1.17, "learning_rate": 1.9609773204394677e-05, "loss": 0.0097, "step": 81260 }, { "epoch": 1.17, "learning_rate": 1.9609725164656206e-05, "loss": 0.0133, "step": 81270 }, { "epoch": 1.17, "learning_rate": 1.9609677124917736e-05, "loss": 0.0134, "step": 81280 }, { "epoch": 1.17, "learning_rate": 1.960962908517926e-05, "loss": 0.0129, "step": 81290 }, { "epoch": 1.17, "learning_rate": 1.960958104544079e-05, "loss": 0.0119, "step": 81300 }, { "epoch": 1.17, "learning_rate": 1.960953300570232e-05, "loss": 0.0151, "step": 81310 }, { "epoch": 1.17, "learning_rate": 1.9609484965963846e-05, "loss": 0.0121, "step": 81320 }, { "epoch": 1.17, "learning_rate": 1.9609436926225375e-05, "loss": 0.0168, "step": 81330 }, { "epoch": 1.17, "learning_rate": 1.9609388886486905e-05, "loss": 0.0102, "step": 81340 }, { "epoch": 1.17, "learning_rate": 1.9609340846748434e-05, "loss": 0.0115, "step": 81350 }, { "epoch": 1.17, "learning_rate": 1.960929280700996e-05, "loss": 0.0107, "step": 81360 }, { "epoch": 1.17, "learning_rate": 1.960924476727149e-05, "loss": 0.02, "step": 81370 }, { "epoch": 1.17, "learning_rate": 1.9609196727533018e-05, "loss": 0.0111, "step": 81380 }, { "epoch": 1.17, "learning_rate": 1.9609148687794548e-05, "loss": 0.0193, "step": 81390 }, { "epoch": 1.17, "learning_rate": 1.9609100648056073e-05, "loss": 0.0112, "step": 81400 }, { "epoch": 1.17, "learning_rate": 1.9609052608317603e-05, "loss": 0.0153, "step": 81410 }, { "epoch": 1.17, "learning_rate": 1.9609004568579132e-05, "loss": 0.0094, "step": 81420 }, { "epoch": 1.17, "learning_rate": 1.9608956528840658e-05, "loss": 0.016, "step": 81430 }, { "epoch": 1.17, "learning_rate": 1.9608908489102187e-05, "loss": 0.0113, "step": 81440 }, { "epoch": 1.17, "learning_rate": 1.9608860449363716e-05, "loss": 0.0145, "step": 81450 }, { "epoch": 1.17, "learning_rate": 1.9608812409625246e-05, "loss": 0.0158, "step": 81460 }, { "epoch": 1.17, "learning_rate": 1.960876436988677e-05, "loss": 0.0139, "step": 81470 }, { "epoch": 1.17, "learning_rate": 1.96087163301483e-05, "loss": 0.016, "step": 81480 }, { "epoch": 1.17, "learning_rate": 1.960866829040983e-05, "loss": 0.0137, "step": 81490 }, { "epoch": 1.17, "learning_rate": 1.9608620250671356e-05, "loss": 0.0139, "step": 81500 }, { "epoch": 1.17, "learning_rate": 1.9608572210932885e-05, "loss": 0.0136, "step": 81510 }, { "epoch": 1.17, "learning_rate": 1.9608524171194414e-05, "loss": 0.0143, "step": 81520 }, { "epoch": 1.18, "learning_rate": 1.9608476131455944e-05, "loss": 0.0152, "step": 81530 }, { "epoch": 1.18, "learning_rate": 1.960842809171747e-05, "loss": 0.0128, "step": 81540 }, { "epoch": 1.18, "learning_rate": 1.9608380051979e-05, "loss": 0.0132, "step": 81550 }, { "epoch": 1.18, "learning_rate": 1.9608332012240528e-05, "loss": 0.013, "step": 81560 }, { "epoch": 1.18, "learning_rate": 1.9608283972502054e-05, "loss": 0.0148, "step": 81570 }, { "epoch": 1.18, "learning_rate": 1.9608235932763583e-05, "loss": 0.015, "step": 81580 }, { "epoch": 1.18, "learning_rate": 1.9608187893025113e-05, "loss": 0.0113, "step": 81590 }, { "epoch": 1.18, "learning_rate": 1.9608139853286642e-05, "loss": 0.0106, "step": 81600 }, { "epoch": 1.18, "learning_rate": 1.9608091813548168e-05, "loss": 0.0153, "step": 81610 }, { "epoch": 1.18, "learning_rate": 1.9608043773809697e-05, "loss": 0.0099, "step": 81620 }, { "epoch": 1.18, "learning_rate": 1.9607995734071226e-05, "loss": 0.0123, "step": 81630 }, { "epoch": 1.18, "learning_rate": 1.9607947694332756e-05, "loss": 0.0112, "step": 81640 }, { "epoch": 1.18, "learning_rate": 1.960789965459428e-05, "loss": 0.0111, "step": 81650 }, { "epoch": 1.18, "learning_rate": 1.960785161485581e-05, "loss": 0.0079, "step": 81660 }, { "epoch": 1.18, "learning_rate": 1.960780357511734e-05, "loss": 0.0098, "step": 81670 }, { "epoch": 1.18, "learning_rate": 1.9607755535378866e-05, "loss": 0.0143, "step": 81680 }, { "epoch": 1.18, "learning_rate": 1.9607707495640395e-05, "loss": 0.0142, "step": 81690 }, { "epoch": 1.18, "learning_rate": 1.9607659455901924e-05, "loss": 0.0141, "step": 81700 }, { "epoch": 1.18, "learning_rate": 1.9607611416163454e-05, "loss": 0.0122, "step": 81710 }, { "epoch": 1.18, "learning_rate": 1.960756337642498e-05, "loss": 0.0114, "step": 81720 }, { "epoch": 1.18, "learning_rate": 1.960751533668651e-05, "loss": 0.0123, "step": 81730 }, { "epoch": 1.18, "learning_rate": 1.9607467296948038e-05, "loss": 0.0123, "step": 81740 }, { "epoch": 1.18, "learning_rate": 1.9607419257209564e-05, "loss": 0.016, "step": 81750 }, { "epoch": 1.18, "learning_rate": 1.9607371217471093e-05, "loss": 0.0129, "step": 81760 }, { "epoch": 1.18, "learning_rate": 1.9607323177732622e-05, "loss": 0.0146, "step": 81770 }, { "epoch": 1.18, "learning_rate": 1.9607275137994152e-05, "loss": 0.0139, "step": 81780 }, { "epoch": 1.18, "learning_rate": 1.9607227098255678e-05, "loss": 0.0166, "step": 81790 }, { "epoch": 1.18, "learning_rate": 1.9607179058517207e-05, "loss": 0.0098, "step": 81800 }, { "epoch": 1.18, "learning_rate": 1.9607131018778736e-05, "loss": 0.0102, "step": 81810 }, { "epoch": 1.18, "learning_rate": 1.9607082979040265e-05, "loss": 0.0148, "step": 81820 }, { "epoch": 1.18, "learning_rate": 1.960703493930179e-05, "loss": 0.0152, "step": 81830 }, { "epoch": 1.18, "learning_rate": 1.960698689956332e-05, "loss": 0.0132, "step": 81840 }, { "epoch": 1.18, "learning_rate": 1.960693885982485e-05, "loss": 0.0136, "step": 81850 }, { "epoch": 1.18, "learning_rate": 1.9606890820086376e-05, "loss": 0.0148, "step": 81860 }, { "epoch": 1.18, "learning_rate": 1.9606842780347905e-05, "loss": 0.0157, "step": 81870 }, { "epoch": 1.18, "learning_rate": 1.9606794740609434e-05, "loss": 0.0126, "step": 81880 }, { "epoch": 1.18, "learning_rate": 1.9606746700870964e-05, "loss": 0.01, "step": 81890 }, { "epoch": 1.18, "learning_rate": 1.960669866113249e-05, "loss": 0.012, "step": 81900 }, { "epoch": 1.18, "learning_rate": 1.960665062139402e-05, "loss": 0.0157, "step": 81910 }, { "epoch": 1.18, "learning_rate": 1.9606602581655548e-05, "loss": 0.0107, "step": 81920 }, { "epoch": 1.18, "learning_rate": 1.9606554541917074e-05, "loss": 0.0132, "step": 81930 }, { "epoch": 1.18, "learning_rate": 1.9606506502178603e-05, "loss": 0.0171, "step": 81940 }, { "epoch": 1.18, "learning_rate": 1.9606458462440132e-05, "loss": 0.0126, "step": 81950 }, { "epoch": 1.18, "learning_rate": 1.960641042270166e-05, "loss": 0.0119, "step": 81960 }, { "epoch": 1.18, "learning_rate": 1.9606362382963188e-05, "loss": 0.0159, "step": 81970 }, { "epoch": 1.18, "learning_rate": 1.9606314343224717e-05, "loss": 0.0107, "step": 81980 }, { "epoch": 1.18, "learning_rate": 1.9606266303486246e-05, "loss": 0.0158, "step": 81990 }, { "epoch": 1.18, "learning_rate": 1.9606218263747775e-05, "loss": 0.016, "step": 82000 }, { "epoch": 1.18, "learning_rate": 1.96061702240093e-05, "loss": 0.0086, "step": 82010 }, { "epoch": 1.18, "learning_rate": 1.960612218427083e-05, "loss": 0.0116, "step": 82020 }, { "epoch": 1.18, "learning_rate": 1.960607414453236e-05, "loss": 0.0103, "step": 82030 }, { "epoch": 1.18, "learning_rate": 1.9606026104793886e-05, "loss": 0.0166, "step": 82040 }, { "epoch": 1.18, "learning_rate": 1.9605978065055415e-05, "loss": 0.0172, "step": 82050 }, { "epoch": 1.18, "learning_rate": 1.9605930025316944e-05, "loss": 0.0139, "step": 82060 }, { "epoch": 1.18, "learning_rate": 1.9605881985578473e-05, "loss": 0.0141, "step": 82070 }, { "epoch": 1.18, "learning_rate": 1.960583394584e-05, "loss": 0.0096, "step": 82080 }, { "epoch": 1.18, "learning_rate": 1.960578590610153e-05, "loss": 0.0152, "step": 82090 }, { "epoch": 1.18, "learning_rate": 1.9605737866363058e-05, "loss": 0.0128, "step": 82100 }, { "epoch": 1.18, "learning_rate": 1.9605689826624584e-05, "loss": 0.0186, "step": 82110 }, { "epoch": 1.18, "learning_rate": 1.9605641786886113e-05, "loss": 0.0138, "step": 82120 }, { "epoch": 1.18, "learning_rate": 1.9605593747147642e-05, "loss": 0.0101, "step": 82130 }, { "epoch": 1.18, "learning_rate": 1.960554570740917e-05, "loss": 0.0114, "step": 82140 }, { "epoch": 1.18, "learning_rate": 1.9605497667670697e-05, "loss": 0.0124, "step": 82150 }, { "epoch": 1.18, "learning_rate": 1.9605449627932227e-05, "loss": 0.0158, "step": 82160 }, { "epoch": 1.18, "learning_rate": 1.9605401588193756e-05, "loss": 0.0122, "step": 82170 }, { "epoch": 1.18, "learning_rate": 1.9605353548455285e-05, "loss": 0.0114, "step": 82180 }, { "epoch": 1.18, "learning_rate": 1.960530550871681e-05, "loss": 0.0095, "step": 82190 }, { "epoch": 1.18, "learning_rate": 1.960525746897834e-05, "loss": 0.0114, "step": 82200 }, { "epoch": 1.18, "learning_rate": 1.960520942923987e-05, "loss": 0.0106, "step": 82210 }, { "epoch": 1.18, "learning_rate": 1.9605161389501396e-05, "loss": 0.0112, "step": 82220 }, { "epoch": 1.19, "learning_rate": 1.9605113349762925e-05, "loss": 0.0141, "step": 82230 }, { "epoch": 1.19, "learning_rate": 1.9605065310024454e-05, "loss": 0.0118, "step": 82240 }, { "epoch": 1.19, "learning_rate": 1.9605017270285983e-05, "loss": 0.011, "step": 82250 }, { "epoch": 1.19, "learning_rate": 1.960496923054751e-05, "loss": 0.0119, "step": 82260 }, { "epoch": 1.19, "learning_rate": 1.960492119080904e-05, "loss": 0.0119, "step": 82270 }, { "epoch": 1.19, "learning_rate": 1.9604873151070568e-05, "loss": 0.0131, "step": 82280 }, { "epoch": 1.19, "learning_rate": 1.9604825111332094e-05, "loss": 0.0102, "step": 82290 }, { "epoch": 1.19, "learning_rate": 1.9604777071593623e-05, "loss": 0.0098, "step": 82300 }, { "epoch": 1.19, "learning_rate": 1.9604729031855152e-05, "loss": 0.0115, "step": 82310 }, { "epoch": 1.19, "learning_rate": 1.960468099211668e-05, "loss": 0.0128, "step": 82320 }, { "epoch": 1.19, "learning_rate": 1.9604632952378207e-05, "loss": 0.012, "step": 82330 }, { "epoch": 1.19, "learning_rate": 1.9604584912639737e-05, "loss": 0.0131, "step": 82340 }, { "epoch": 1.19, "learning_rate": 1.9604536872901266e-05, "loss": 0.0133, "step": 82350 }, { "epoch": 1.19, "learning_rate": 1.9604488833162795e-05, "loss": 0.0138, "step": 82360 }, { "epoch": 1.19, "learning_rate": 1.960444079342432e-05, "loss": 0.0121, "step": 82370 }, { "epoch": 1.19, "learning_rate": 1.960439275368585e-05, "loss": 0.0126, "step": 82380 }, { "epoch": 1.19, "learning_rate": 1.960434471394738e-05, "loss": 0.0134, "step": 82390 }, { "epoch": 1.19, "learning_rate": 1.9604296674208906e-05, "loss": 0.0122, "step": 82400 }, { "epoch": 1.19, "learning_rate": 1.9604248634470435e-05, "loss": 0.0101, "step": 82410 }, { "epoch": 1.19, "learning_rate": 1.9604200594731964e-05, "loss": 0.0155, "step": 82420 }, { "epoch": 1.19, "learning_rate": 1.9604152554993493e-05, "loss": 0.0168, "step": 82430 }, { "epoch": 1.19, "learning_rate": 1.960410451525502e-05, "loss": 0.0104, "step": 82440 }, { "epoch": 1.19, "learning_rate": 1.960405647551655e-05, "loss": 0.0177, "step": 82450 }, { "epoch": 1.19, "learning_rate": 1.9604008435778078e-05, "loss": 0.0098, "step": 82460 }, { "epoch": 1.19, "learning_rate": 1.9603960396039604e-05, "loss": 0.0148, "step": 82470 }, { "epoch": 1.19, "learning_rate": 1.9603912356301133e-05, "loss": 0.0186, "step": 82480 }, { "epoch": 1.19, "learning_rate": 1.9603864316562662e-05, "loss": 0.014, "step": 82490 }, { "epoch": 1.19, "learning_rate": 1.960381627682419e-05, "loss": 0.0126, "step": 82500 }, { "epoch": 1.19, "learning_rate": 1.9603768237085717e-05, "loss": 0.0188, "step": 82510 }, { "epoch": 1.19, "learning_rate": 1.9603720197347247e-05, "loss": 0.0119, "step": 82520 }, { "epoch": 1.19, "learning_rate": 1.9603672157608776e-05, "loss": 0.0126, "step": 82530 }, { "epoch": 1.19, "learning_rate": 1.9603624117870305e-05, "loss": 0.0128, "step": 82540 }, { "epoch": 1.19, "learning_rate": 1.960357607813183e-05, "loss": 0.0143, "step": 82550 }, { "epoch": 1.19, "learning_rate": 1.960352803839336e-05, "loss": 0.0211, "step": 82560 }, { "epoch": 1.19, "learning_rate": 1.960347999865489e-05, "loss": 0.0093, "step": 82570 }, { "epoch": 1.19, "learning_rate": 1.9603431958916415e-05, "loss": 0.0197, "step": 82580 }, { "epoch": 1.19, "learning_rate": 1.9603383919177945e-05, "loss": 0.0115, "step": 82590 }, { "epoch": 1.19, "learning_rate": 1.9603335879439474e-05, "loss": 0.0177, "step": 82600 }, { "epoch": 1.19, "learning_rate": 1.9603287839701003e-05, "loss": 0.0088, "step": 82610 }, { "epoch": 1.19, "learning_rate": 1.960323979996253e-05, "loss": 0.0147, "step": 82620 }, { "epoch": 1.19, "learning_rate": 1.960319176022406e-05, "loss": 0.0142, "step": 82630 }, { "epoch": 1.19, "learning_rate": 1.9603143720485588e-05, "loss": 0.0092, "step": 82640 }, { "epoch": 1.19, "learning_rate": 1.9603095680747114e-05, "loss": 0.0125, "step": 82650 }, { "epoch": 1.19, "learning_rate": 1.9603047641008643e-05, "loss": 0.0115, "step": 82660 }, { "epoch": 1.19, "learning_rate": 1.9602999601270172e-05, "loss": 0.0103, "step": 82670 }, { "epoch": 1.19, "learning_rate": 1.96029515615317e-05, "loss": 0.0123, "step": 82680 }, { "epoch": 1.19, "learning_rate": 1.9602903521793227e-05, "loss": 0.0136, "step": 82690 }, { "epoch": 1.19, "learning_rate": 1.9602855482054756e-05, "loss": 0.0116, "step": 82700 }, { "epoch": 1.19, "learning_rate": 1.9602807442316286e-05, "loss": 0.0116, "step": 82710 }, { "epoch": 1.19, "learning_rate": 1.9602759402577815e-05, "loss": 0.0162, "step": 82720 }, { "epoch": 1.19, "learning_rate": 1.960271136283934e-05, "loss": 0.021, "step": 82730 }, { "epoch": 1.19, "learning_rate": 1.960266332310087e-05, "loss": 0.0157, "step": 82740 }, { "epoch": 1.19, "learning_rate": 1.96026152833624e-05, "loss": 0.0134, "step": 82750 }, { "epoch": 1.19, "learning_rate": 1.9602567243623925e-05, "loss": 0.017, "step": 82760 }, { "epoch": 1.19, "learning_rate": 1.9602519203885455e-05, "loss": 0.0186, "step": 82770 }, { "epoch": 1.19, "learning_rate": 1.9602471164146984e-05, "loss": 0.0146, "step": 82780 }, { "epoch": 1.19, "learning_rate": 1.9602423124408513e-05, "loss": 0.0101, "step": 82790 }, { "epoch": 1.19, "learning_rate": 1.960237508467004e-05, "loss": 0.014, "step": 82800 }, { "epoch": 1.19, "learning_rate": 1.9602327044931568e-05, "loss": 0.0124, "step": 82810 }, { "epoch": 1.19, "learning_rate": 1.9602279005193098e-05, "loss": 0.0127, "step": 82820 }, { "epoch": 1.19, "learning_rate": 1.9602230965454623e-05, "loss": 0.0067, "step": 82830 }, { "epoch": 1.19, "learning_rate": 1.9602182925716153e-05, "loss": 0.0158, "step": 82840 }, { "epoch": 1.19, "learning_rate": 1.9602134885977682e-05, "loss": 0.0125, "step": 82850 }, { "epoch": 1.19, "learning_rate": 1.960208684623921e-05, "loss": 0.0101, "step": 82860 }, { "epoch": 1.19, "learning_rate": 1.9602038806500737e-05, "loss": 0.0174, "step": 82870 }, { "epoch": 1.19, "learning_rate": 1.9601990766762266e-05, "loss": 0.0122, "step": 82880 }, { "epoch": 1.19, "learning_rate": 1.9601942727023796e-05, "loss": 0.015, "step": 82890 }, { "epoch": 1.19, "learning_rate": 1.9601894687285325e-05, "loss": 0.0122, "step": 82900 }, { "epoch": 1.19, "learning_rate": 1.960184664754685e-05, "loss": 0.0157, "step": 82910 }, { "epoch": 1.2, "learning_rate": 1.960179860780838e-05, "loss": 0.0107, "step": 82920 }, { "epoch": 1.2, "learning_rate": 1.960175056806991e-05, "loss": 0.0138, "step": 82930 }, { "epoch": 1.2, "learning_rate": 1.9601702528331435e-05, "loss": 0.0135, "step": 82940 }, { "epoch": 1.2, "learning_rate": 1.9601654488592965e-05, "loss": 0.0116, "step": 82950 }, { "epoch": 1.2, "learning_rate": 1.9601606448854494e-05, "loss": 0.0147, "step": 82960 }, { "epoch": 1.2, "learning_rate": 1.9601558409116023e-05, "loss": 0.0128, "step": 82970 }, { "epoch": 1.2, "learning_rate": 1.960151036937755e-05, "loss": 0.022, "step": 82980 }, { "epoch": 1.2, "learning_rate": 1.9601462329639078e-05, "loss": 0.0123, "step": 82990 }, { "epoch": 1.2, "learning_rate": 1.9601414289900607e-05, "loss": 0.0164, "step": 83000 }, { "epoch": 1.2, "learning_rate": 1.9601366250162133e-05, "loss": 0.0159, "step": 83010 }, { "epoch": 1.2, "learning_rate": 1.9601318210423663e-05, "loss": 0.0157, "step": 83020 }, { "epoch": 1.2, "learning_rate": 1.9601270170685192e-05, "loss": 0.0108, "step": 83030 }, { "epoch": 1.2, "learning_rate": 1.960122213094672e-05, "loss": 0.0125, "step": 83040 }, { "epoch": 1.2, "learning_rate": 1.9601174091208247e-05, "loss": 0.0142, "step": 83050 }, { "epoch": 1.2, "learning_rate": 1.9601126051469776e-05, "loss": 0.0141, "step": 83060 }, { "epoch": 1.2, "learning_rate": 1.9601078011731306e-05, "loss": 0.0121, "step": 83070 }, { "epoch": 1.2, "learning_rate": 1.9601029971992835e-05, "loss": 0.0097, "step": 83080 }, { "epoch": 1.2, "learning_rate": 1.960098193225436e-05, "loss": 0.015, "step": 83090 }, { "epoch": 1.2, "learning_rate": 1.960093389251589e-05, "loss": 0.0119, "step": 83100 }, { "epoch": 1.2, "learning_rate": 1.960088585277742e-05, "loss": 0.0124, "step": 83110 }, { "epoch": 1.2, "learning_rate": 1.9600837813038945e-05, "loss": 0.0146, "step": 83120 }, { "epoch": 1.2, "learning_rate": 1.9600789773300474e-05, "loss": 0.012, "step": 83130 }, { "epoch": 1.2, "learning_rate": 1.9600741733562004e-05, "loss": 0.0158, "step": 83140 }, { "epoch": 1.2, "learning_rate": 1.9600693693823533e-05, "loss": 0.0121, "step": 83150 }, { "epoch": 1.2, "learning_rate": 1.960064565408506e-05, "loss": 0.0128, "step": 83160 }, { "epoch": 1.2, "learning_rate": 1.9600597614346588e-05, "loss": 0.0122, "step": 83170 }, { "epoch": 1.2, "learning_rate": 1.9600549574608117e-05, "loss": 0.0129, "step": 83180 }, { "epoch": 1.2, "learning_rate": 1.9600501534869643e-05, "loss": 0.0135, "step": 83190 }, { "epoch": 1.2, "learning_rate": 1.9600453495131173e-05, "loss": 0.0153, "step": 83200 }, { "epoch": 1.2, "learning_rate": 1.9600405455392702e-05, "loss": 0.0122, "step": 83210 }, { "epoch": 1.2, "learning_rate": 1.960035741565423e-05, "loss": 0.0191, "step": 83220 }, { "epoch": 1.2, "learning_rate": 1.9600309375915757e-05, "loss": 0.0077, "step": 83230 }, { "epoch": 1.2, "learning_rate": 1.9600261336177286e-05, "loss": 0.0115, "step": 83240 }, { "epoch": 1.2, "learning_rate": 1.9600213296438816e-05, "loss": 0.014, "step": 83250 }, { "epoch": 1.2, "learning_rate": 1.9600165256700345e-05, "loss": 0.0121, "step": 83260 }, { "epoch": 1.2, "learning_rate": 1.960011721696187e-05, "loss": 0.0136, "step": 83270 }, { "epoch": 1.2, "learning_rate": 1.96000691772234e-05, "loss": 0.0113, "step": 83280 }, { "epoch": 1.2, "learning_rate": 1.960002113748493e-05, "loss": 0.01, "step": 83290 }, { "epoch": 1.2, "learning_rate": 1.9599973097746455e-05, "loss": 0.0107, "step": 83300 }, { "epoch": 1.2, "learning_rate": 1.9599925058007984e-05, "loss": 0.0134, "step": 83310 }, { "epoch": 1.2, "learning_rate": 1.9599877018269514e-05, "loss": 0.0108, "step": 83320 }, { "epoch": 1.2, "learning_rate": 1.9599828978531043e-05, "loss": 0.0135, "step": 83330 }, { "epoch": 1.2, "learning_rate": 1.959978093879257e-05, "loss": 0.0134, "step": 83340 }, { "epoch": 1.2, "learning_rate": 1.95997328990541e-05, "loss": 0.018, "step": 83350 }, { "epoch": 1.2, "learning_rate": 1.9599684859315627e-05, "loss": 0.0114, "step": 83360 }, { "epoch": 1.2, "learning_rate": 1.9599636819577157e-05, "loss": 0.011, "step": 83370 }, { "epoch": 1.2, "learning_rate": 1.9599588779838686e-05, "loss": 0.0127, "step": 83380 }, { "epoch": 1.2, "learning_rate": 1.9599540740100215e-05, "loss": 0.014, "step": 83390 }, { "epoch": 1.2, "learning_rate": 1.959949270036174e-05, "loss": 0.0112, "step": 83400 }, { "epoch": 1.2, "learning_rate": 1.959944466062327e-05, "loss": 0.0127, "step": 83410 }, { "epoch": 1.2, "learning_rate": 1.95993966208848e-05, "loss": 0.0103, "step": 83420 }, { "epoch": 1.2, "learning_rate": 1.9599348581146325e-05, "loss": 0.0117, "step": 83430 }, { "epoch": 1.2, "learning_rate": 1.9599300541407855e-05, "loss": 0.0089, "step": 83440 }, { "epoch": 1.2, "learning_rate": 1.9599252501669384e-05, "loss": 0.0116, "step": 83450 }, { "epoch": 1.2, "learning_rate": 1.9599204461930913e-05, "loss": 0.0136, "step": 83460 }, { "epoch": 1.2, "learning_rate": 1.959915642219244e-05, "loss": 0.0136, "step": 83470 }, { "epoch": 1.2, "learning_rate": 1.959910838245397e-05, "loss": 0.0142, "step": 83480 }, { "epoch": 1.2, "learning_rate": 1.9599060342715498e-05, "loss": 0.0103, "step": 83490 }, { "epoch": 1.2, "learning_rate": 1.9599012302977024e-05, "loss": 0.0129, "step": 83500 }, { "epoch": 1.2, "learning_rate": 1.9598964263238553e-05, "loss": 0.0139, "step": 83510 }, { "epoch": 1.2, "learning_rate": 1.9598916223500082e-05, "loss": 0.0118, "step": 83520 }, { "epoch": 1.2, "learning_rate": 1.959886818376161e-05, "loss": 0.0095, "step": 83530 }, { "epoch": 1.2, "learning_rate": 1.9598820144023137e-05, "loss": 0.0135, "step": 83540 }, { "epoch": 1.2, "learning_rate": 1.9598772104284666e-05, "loss": 0.0125, "step": 83550 }, { "epoch": 1.2, "learning_rate": 1.9598724064546196e-05, "loss": 0.0109, "step": 83560 }, { "epoch": 1.2, "learning_rate": 1.9598676024807725e-05, "loss": 0.0157, "step": 83570 }, { "epoch": 1.2, "learning_rate": 1.959862798506925e-05, "loss": 0.0125, "step": 83580 }, { "epoch": 1.2, "learning_rate": 1.959857994533078e-05, "loss": 0.0109, "step": 83590 }, { "epoch": 1.2, "learning_rate": 1.959853190559231e-05, "loss": 0.0108, "step": 83600 }, { "epoch": 1.2, "learning_rate": 1.9598483865853835e-05, "loss": 0.0118, "step": 83610 }, { "epoch": 1.21, "learning_rate": 1.9598435826115365e-05, "loss": 0.0127, "step": 83620 }, { "epoch": 1.21, "learning_rate": 1.959839259035074e-05, "loss": 0.0136, "step": 83630 }, { "epoch": 1.21, "learning_rate": 1.959834455061227e-05, "loss": 0.0131, "step": 83640 }, { "epoch": 1.21, "learning_rate": 1.9598296510873794e-05, "loss": 0.011, "step": 83650 }, { "epoch": 1.21, "learning_rate": 1.9598248471135324e-05, "loss": 0.0136, "step": 83660 }, { "epoch": 1.21, "learning_rate": 1.9598200431396853e-05, "loss": 0.015, "step": 83670 }, { "epoch": 1.21, "learning_rate": 1.959815239165838e-05, "loss": 0.0162, "step": 83680 }, { "epoch": 1.21, "learning_rate": 1.9598104351919908e-05, "loss": 0.0112, "step": 83690 }, { "epoch": 1.21, "learning_rate": 1.9598056312181437e-05, "loss": 0.0139, "step": 83700 }, { "epoch": 1.21, "learning_rate": 1.9598008272442967e-05, "loss": 0.0122, "step": 83710 }, { "epoch": 1.21, "learning_rate": 1.9597960232704493e-05, "loss": 0.0115, "step": 83720 }, { "epoch": 1.21, "learning_rate": 1.9597912192966022e-05, "loss": 0.0122, "step": 83730 }, { "epoch": 1.21, "learning_rate": 1.959786415322755e-05, "loss": 0.0107, "step": 83740 }, { "epoch": 1.21, "learning_rate": 1.959781611348908e-05, "loss": 0.0103, "step": 83750 }, { "epoch": 1.21, "learning_rate": 1.9597768073750606e-05, "loss": 0.0108, "step": 83760 }, { "epoch": 1.21, "learning_rate": 1.9597720034012135e-05, "loss": 0.008, "step": 83770 }, { "epoch": 1.21, "learning_rate": 1.9597671994273665e-05, "loss": 0.0143, "step": 83780 }, { "epoch": 1.21, "learning_rate": 1.959762395453519e-05, "loss": 0.0097, "step": 83790 }, { "epoch": 1.21, "learning_rate": 1.959757591479672e-05, "loss": 0.0151, "step": 83800 }, { "epoch": 1.21, "learning_rate": 1.959752787505825e-05, "loss": 0.0151, "step": 83810 }, { "epoch": 1.21, "learning_rate": 1.959747983531978e-05, "loss": 0.0161, "step": 83820 }, { "epoch": 1.21, "learning_rate": 1.9597431795581304e-05, "loss": 0.012, "step": 83830 }, { "epoch": 1.21, "learning_rate": 1.9597383755842834e-05, "loss": 0.0127, "step": 83840 }, { "epoch": 1.21, "learning_rate": 1.9597335716104363e-05, "loss": 0.0171, "step": 83850 }, { "epoch": 1.21, "learning_rate": 1.9597287676365892e-05, "loss": 0.0121, "step": 83860 }, { "epoch": 1.21, "learning_rate": 1.959723963662742e-05, "loss": 0.0116, "step": 83870 }, { "epoch": 1.21, "learning_rate": 1.959719159688895e-05, "loss": 0.0103, "step": 83880 }, { "epoch": 1.21, "learning_rate": 1.9597143557150477e-05, "loss": 0.0129, "step": 83890 }, { "epoch": 1.21, "learning_rate": 1.9597095517412006e-05, "loss": 0.0112, "step": 83900 }, { "epoch": 1.21, "learning_rate": 1.9597047477673535e-05, "loss": 0.0115, "step": 83910 }, { "epoch": 1.21, "learning_rate": 1.959699943793506e-05, "loss": 0.0139, "step": 83920 }, { "epoch": 1.21, "learning_rate": 1.959695139819659e-05, "loss": 0.0129, "step": 83930 }, { "epoch": 1.21, "learning_rate": 1.959690335845812e-05, "loss": 0.0144, "step": 83940 }, { "epoch": 1.21, "learning_rate": 1.959685531871965e-05, "loss": 0.007, "step": 83950 }, { "epoch": 1.21, "learning_rate": 1.9596807278981175e-05, "loss": 0.0155, "step": 83960 }, { "epoch": 1.21, "learning_rate": 1.9596759239242704e-05, "loss": 0.0088, "step": 83970 }, { "epoch": 1.21, "learning_rate": 1.9596711199504233e-05, "loss": 0.0124, "step": 83980 }, { "epoch": 1.21, "learning_rate": 1.9596663159765762e-05, "loss": 0.0115, "step": 83990 }, { "epoch": 1.21, "learning_rate": 1.959661512002729e-05, "loss": 0.0136, "step": 84000 }, { "epoch": 1.21, "learning_rate": 1.9596567080288818e-05, "loss": 0.0129, "step": 84010 }, { "epoch": 1.21, "learning_rate": 1.9596519040550347e-05, "loss": 0.0117, "step": 84020 }, { "epoch": 1.21, "learning_rate": 1.9596471000811873e-05, "loss": 0.0102, "step": 84030 }, { "epoch": 1.21, "learning_rate": 1.9596422961073402e-05, "loss": 0.0159, "step": 84040 }, { "epoch": 1.21, "learning_rate": 1.959637492133493e-05, "loss": 0.0096, "step": 84050 }, { "epoch": 1.21, "learning_rate": 1.959632688159646e-05, "loss": 0.0115, "step": 84060 }, { "epoch": 1.21, "learning_rate": 1.9596278841857986e-05, "loss": 0.012, "step": 84070 }, { "epoch": 1.21, "learning_rate": 1.9596230802119516e-05, "loss": 0.0082, "step": 84080 }, { "epoch": 1.21, "learning_rate": 1.9596182762381045e-05, "loss": 0.0095, "step": 84090 }, { "epoch": 1.21, "learning_rate": 1.959613472264257e-05, "loss": 0.015, "step": 84100 }, { "epoch": 1.21, "learning_rate": 1.95960866829041e-05, "loss": 0.0146, "step": 84110 }, { "epoch": 1.21, "learning_rate": 1.959603864316563e-05, "loss": 0.0133, "step": 84120 }, { "epoch": 1.21, "learning_rate": 1.959599060342716e-05, "loss": 0.0136, "step": 84130 }, { "epoch": 1.21, "learning_rate": 1.9595942563688685e-05, "loss": 0.0141, "step": 84140 }, { "epoch": 1.21, "learning_rate": 1.9595894523950214e-05, "loss": 0.0122, "step": 84150 }, { "epoch": 1.21, "learning_rate": 1.9595846484211743e-05, "loss": 0.0145, "step": 84160 }, { "epoch": 1.21, "learning_rate": 1.9595798444473272e-05, "loss": 0.0131, "step": 84170 }, { "epoch": 1.21, "learning_rate": 1.9595750404734798e-05, "loss": 0.009, "step": 84180 }, { "epoch": 1.21, "learning_rate": 1.9595702364996328e-05, "loss": 0.0148, "step": 84190 }, { "epoch": 1.21, "learning_rate": 1.9595654325257857e-05, "loss": 0.0122, "step": 84200 }, { "epoch": 1.21, "learning_rate": 1.9595606285519383e-05, "loss": 0.0134, "step": 84210 }, { "epoch": 1.21, "learning_rate": 1.9595558245780912e-05, "loss": 0.0114, "step": 84220 }, { "epoch": 1.21, "learning_rate": 1.959551020604244e-05, "loss": 0.0124, "step": 84230 }, { "epoch": 1.21, "learning_rate": 1.959546216630397e-05, "loss": 0.011, "step": 84240 }, { "epoch": 1.21, "learning_rate": 1.9595414126565496e-05, "loss": 0.0095, "step": 84250 }, { "epoch": 1.21, "learning_rate": 1.9595366086827026e-05, "loss": 0.0101, "step": 84260 }, { "epoch": 1.21, "learning_rate": 1.9595318047088555e-05, "loss": 0.0099, "step": 84270 }, { "epoch": 1.21, "learning_rate": 1.959527000735008e-05, "loss": 0.0104, "step": 84280 }, { "epoch": 1.21, "learning_rate": 1.959522196761161e-05, "loss": 0.0159, "step": 84290 }, { "epoch": 1.21, "learning_rate": 1.959517392787314e-05, "loss": 0.0176, "step": 84300 }, { "epoch": 1.22, "learning_rate": 1.959512588813467e-05, "loss": 0.0143, "step": 84310 }, { "epoch": 1.22, "learning_rate": 1.9595077848396194e-05, "loss": 0.0114, "step": 84320 }, { "epoch": 1.22, "learning_rate": 1.9595029808657724e-05, "loss": 0.0125, "step": 84330 }, { "epoch": 1.22, "learning_rate": 1.9594981768919253e-05, "loss": 0.0114, "step": 84340 }, { "epoch": 1.22, "learning_rate": 1.9594933729180782e-05, "loss": 0.0116, "step": 84350 }, { "epoch": 1.22, "learning_rate": 1.9594885689442308e-05, "loss": 0.0149, "step": 84360 }, { "epoch": 1.22, "learning_rate": 1.9594837649703837e-05, "loss": 0.0105, "step": 84370 }, { "epoch": 1.22, "learning_rate": 1.9594789609965367e-05, "loss": 0.0105, "step": 84380 }, { "epoch": 1.22, "learning_rate": 1.9594741570226893e-05, "loss": 0.0109, "step": 84390 }, { "epoch": 1.22, "learning_rate": 1.9594693530488422e-05, "loss": 0.0146, "step": 84400 }, { "epoch": 1.22, "learning_rate": 1.959464549074995e-05, "loss": 0.0149, "step": 84410 }, { "epoch": 1.22, "learning_rate": 1.959459745101148e-05, "loss": 0.0149, "step": 84420 }, { "epoch": 1.22, "learning_rate": 1.9594549411273006e-05, "loss": 0.0113, "step": 84430 }, { "epoch": 1.22, "learning_rate": 1.9594501371534536e-05, "loss": 0.0149, "step": 84440 }, { "epoch": 1.22, "learning_rate": 1.9594453331796065e-05, "loss": 0.0122, "step": 84450 }, { "epoch": 1.22, "learning_rate": 1.959440529205759e-05, "loss": 0.0142, "step": 84460 }, { "epoch": 1.22, "learning_rate": 1.959435725231912e-05, "loss": 0.0111, "step": 84470 }, { "epoch": 1.22, "learning_rate": 1.959430921258065e-05, "loss": 0.0137, "step": 84480 }, { "epoch": 1.22, "learning_rate": 1.959426117284218e-05, "loss": 0.0105, "step": 84490 }, { "epoch": 1.22, "learning_rate": 1.9594213133103704e-05, "loss": 0.0151, "step": 84500 }, { "epoch": 1.22, "learning_rate": 1.9594165093365234e-05, "loss": 0.0075, "step": 84510 }, { "epoch": 1.22, "learning_rate": 1.9594117053626763e-05, "loss": 0.0149, "step": 84520 }, { "epoch": 1.22, "learning_rate": 1.959406901388829e-05, "loss": 0.0127, "step": 84530 }, { "epoch": 1.22, "learning_rate": 1.9594020974149818e-05, "loss": 0.0109, "step": 84540 }, { "epoch": 1.22, "learning_rate": 1.9593972934411347e-05, "loss": 0.0101, "step": 84550 }, { "epoch": 1.22, "learning_rate": 1.9593924894672877e-05, "loss": 0.0176, "step": 84560 }, { "epoch": 1.22, "learning_rate": 1.9593876854934403e-05, "loss": 0.0125, "step": 84570 }, { "epoch": 1.22, "learning_rate": 1.9593828815195932e-05, "loss": 0.0156, "step": 84580 }, { "epoch": 1.22, "learning_rate": 1.959378077545746e-05, "loss": 0.0088, "step": 84590 }, { "epoch": 1.22, "learning_rate": 1.959373273571899e-05, "loss": 0.0153, "step": 84600 }, { "epoch": 1.22, "learning_rate": 1.9593684695980516e-05, "loss": 0.0127, "step": 84610 }, { "epoch": 1.22, "learning_rate": 1.9593636656242045e-05, "loss": 0.0119, "step": 84620 }, { "epoch": 1.22, "learning_rate": 1.9593588616503575e-05, "loss": 0.016, "step": 84630 }, { "epoch": 1.22, "learning_rate": 1.95935405767651e-05, "loss": 0.0107, "step": 84640 }, { "epoch": 1.22, "learning_rate": 1.959349253702663e-05, "loss": 0.0166, "step": 84650 }, { "epoch": 1.22, "learning_rate": 1.959344449728816e-05, "loss": 0.0158, "step": 84660 }, { "epoch": 1.22, "learning_rate": 1.959339645754969e-05, "loss": 0.014, "step": 84670 }, { "epoch": 1.22, "learning_rate": 1.9593348417811214e-05, "loss": 0.0139, "step": 84680 }, { "epoch": 1.22, "learning_rate": 1.9593300378072744e-05, "loss": 0.0114, "step": 84690 }, { "epoch": 1.22, "learning_rate": 1.9593252338334273e-05, "loss": 0.0177, "step": 84700 }, { "epoch": 1.22, "learning_rate": 1.95932042985958e-05, "loss": 0.0167, "step": 84710 }, { "epoch": 1.22, "learning_rate": 1.9593156258857328e-05, "loss": 0.0167, "step": 84720 }, { "epoch": 1.22, "learning_rate": 1.9593108219118857e-05, "loss": 0.0141, "step": 84730 }, { "epoch": 1.22, "learning_rate": 1.9593060179380387e-05, "loss": 0.0111, "step": 84740 }, { "epoch": 1.22, "learning_rate": 1.9593012139641912e-05, "loss": 0.0134, "step": 84750 }, { "epoch": 1.22, "learning_rate": 1.9592964099903442e-05, "loss": 0.0092, "step": 84760 }, { "epoch": 1.22, "learning_rate": 1.959291606016497e-05, "loss": 0.0118, "step": 84770 }, { "epoch": 1.22, "learning_rate": 1.95928680204265e-05, "loss": 0.0145, "step": 84780 }, { "epoch": 1.22, "learning_rate": 1.9592819980688026e-05, "loss": 0.0107, "step": 84790 }, { "epoch": 1.22, "learning_rate": 1.9592771940949555e-05, "loss": 0.0122, "step": 84800 }, { "epoch": 1.22, "learning_rate": 1.9592723901211085e-05, "loss": 0.0108, "step": 84810 }, { "epoch": 1.22, "learning_rate": 1.959267586147261e-05, "loss": 0.0115, "step": 84820 }, { "epoch": 1.22, "learning_rate": 1.959262782173414e-05, "loss": 0.0144, "step": 84830 }, { "epoch": 1.22, "learning_rate": 1.959257978199567e-05, "loss": 0.0102, "step": 84840 }, { "epoch": 1.22, "learning_rate": 1.95925317422572e-05, "loss": 0.0118, "step": 84850 }, { "epoch": 1.22, "learning_rate": 1.9592483702518724e-05, "loss": 0.011, "step": 84860 }, { "epoch": 1.22, "learning_rate": 1.9592435662780254e-05, "loss": 0.0101, "step": 84870 }, { "epoch": 1.22, "learning_rate": 1.9592387623041783e-05, "loss": 0.0128, "step": 84880 }, { "epoch": 1.22, "learning_rate": 1.959233958330331e-05, "loss": 0.0108, "step": 84890 }, { "epoch": 1.22, "learning_rate": 1.9592291543564838e-05, "loss": 0.0146, "step": 84900 }, { "epoch": 1.22, "learning_rate": 1.9592243503826367e-05, "loss": 0.0093, "step": 84910 }, { "epoch": 1.22, "learning_rate": 1.9592195464087896e-05, "loss": 0.0099, "step": 84920 }, { "epoch": 1.22, "learning_rate": 1.9592147424349422e-05, "loss": 0.0145, "step": 84930 }, { "epoch": 1.22, "learning_rate": 1.959209938461095e-05, "loss": 0.012, "step": 84940 }, { "epoch": 1.22, "learning_rate": 1.959205134487248e-05, "loss": 0.0144, "step": 84950 }, { "epoch": 1.22, "learning_rate": 1.959200330513401e-05, "loss": 0.0126, "step": 84960 }, { "epoch": 1.22, "learning_rate": 1.9591955265395536e-05, "loss": 0.0118, "step": 84970 }, { "epoch": 1.22, "learning_rate": 1.9591907225657065e-05, "loss": 0.0165, "step": 84980 }, { "epoch": 1.22, "learning_rate": 1.9591859185918595e-05, "loss": 0.0123, "step": 84990 }, { "epoch": 1.23, "learning_rate": 1.959181114618012e-05, "loss": 0.0109, "step": 85000 }, { "epoch": 1.23, "learning_rate": 1.959176310644165e-05, "loss": 0.009, "step": 85010 }, { "epoch": 1.23, "learning_rate": 1.959171506670318e-05, "loss": 0.0195, "step": 85020 }, { "epoch": 1.23, "learning_rate": 1.9591667026964708e-05, "loss": 0.0131, "step": 85030 }, { "epoch": 1.23, "learning_rate": 1.9591618987226234e-05, "loss": 0.0117, "step": 85040 }, { "epoch": 1.23, "learning_rate": 1.9591570947487763e-05, "loss": 0.0153, "step": 85050 }, { "epoch": 1.23, "learning_rate": 1.9591522907749293e-05, "loss": 0.0096, "step": 85060 }, { "epoch": 1.23, "learning_rate": 1.959147486801082e-05, "loss": 0.0128, "step": 85070 }, { "epoch": 1.23, "learning_rate": 1.9591426828272348e-05, "loss": 0.0143, "step": 85080 }, { "epoch": 1.23, "learning_rate": 1.9591378788533877e-05, "loss": 0.0106, "step": 85090 }, { "epoch": 1.23, "learning_rate": 1.9591330748795406e-05, "loss": 0.0189, "step": 85100 }, { "epoch": 1.23, "learning_rate": 1.9591282709056932e-05, "loss": 0.0134, "step": 85110 }, { "epoch": 1.23, "learning_rate": 1.959123466931846e-05, "loss": 0.0144, "step": 85120 }, { "epoch": 1.23, "learning_rate": 1.959118662957999e-05, "loss": 0.0126, "step": 85130 }, { "epoch": 1.23, "learning_rate": 1.959113858984152e-05, "loss": 0.0131, "step": 85140 }, { "epoch": 1.23, "learning_rate": 1.9591090550103046e-05, "loss": 0.0151, "step": 85150 }, { "epoch": 1.23, "learning_rate": 1.9591042510364575e-05, "loss": 0.0104, "step": 85160 }, { "epoch": 1.23, "learning_rate": 1.9590994470626104e-05, "loss": 0.0133, "step": 85170 }, { "epoch": 1.23, "learning_rate": 1.959094643088763e-05, "loss": 0.0121, "step": 85180 }, { "epoch": 1.23, "learning_rate": 1.959089839114916e-05, "loss": 0.0088, "step": 85190 }, { "epoch": 1.23, "learning_rate": 1.959085035141069e-05, "loss": 0.0152, "step": 85200 }, { "epoch": 1.23, "learning_rate": 1.9590802311672218e-05, "loss": 0.016, "step": 85210 }, { "epoch": 1.23, "learning_rate": 1.9590754271933744e-05, "loss": 0.0169, "step": 85220 }, { "epoch": 1.23, "learning_rate": 1.9590706232195273e-05, "loss": 0.0098, "step": 85230 }, { "epoch": 1.23, "learning_rate": 1.9590658192456803e-05, "loss": 0.0165, "step": 85240 }, { "epoch": 1.23, "learning_rate": 1.959061015271833e-05, "loss": 0.0158, "step": 85250 }, { "epoch": 1.23, "learning_rate": 1.9590562112979858e-05, "loss": 0.0099, "step": 85260 }, { "epoch": 1.23, "learning_rate": 1.9590514073241387e-05, "loss": 0.0151, "step": 85270 }, { "epoch": 1.23, "learning_rate": 1.9590466033502916e-05, "loss": 0.0101, "step": 85280 }, { "epoch": 1.23, "learning_rate": 1.9590417993764442e-05, "loss": 0.0136, "step": 85290 }, { "epoch": 1.23, "learning_rate": 1.959036995402597e-05, "loss": 0.0143, "step": 85300 }, { "epoch": 1.23, "learning_rate": 1.95903219142875e-05, "loss": 0.0114, "step": 85310 }, { "epoch": 1.23, "learning_rate": 1.959027387454903e-05, "loss": 0.0156, "step": 85320 }, { "epoch": 1.23, "learning_rate": 1.9590225834810556e-05, "loss": 0.0107, "step": 85330 }, { "epoch": 1.23, "learning_rate": 1.9590177795072085e-05, "loss": 0.0115, "step": 85340 }, { "epoch": 1.23, "learning_rate": 1.9590129755333614e-05, "loss": 0.0177, "step": 85350 }, { "epoch": 1.23, "learning_rate": 1.959008171559514e-05, "loss": 0.0127, "step": 85360 }, { "epoch": 1.23, "learning_rate": 1.959003367585667e-05, "loss": 0.0127, "step": 85370 }, { "epoch": 1.23, "learning_rate": 1.95899856361182e-05, "loss": 0.0121, "step": 85380 }, { "epoch": 1.23, "learning_rate": 1.9589937596379728e-05, "loss": 0.0097, "step": 85390 }, { "epoch": 1.23, "learning_rate": 1.9589889556641254e-05, "loss": 0.0136, "step": 85400 }, { "epoch": 1.23, "learning_rate": 1.9589841516902783e-05, "loss": 0.0109, "step": 85410 }, { "epoch": 1.23, "learning_rate": 1.9589793477164313e-05, "loss": 0.0109, "step": 85420 }, { "epoch": 1.23, "learning_rate": 1.958974543742584e-05, "loss": 0.0106, "step": 85430 }, { "epoch": 1.23, "learning_rate": 1.9589697397687368e-05, "loss": 0.0098, "step": 85440 }, { "epoch": 1.23, "learning_rate": 1.9589649357948897e-05, "loss": 0.0131, "step": 85450 }, { "epoch": 1.23, "learning_rate": 1.9589601318210426e-05, "loss": 0.0148, "step": 85460 }, { "epoch": 1.23, "learning_rate": 1.9589553278471952e-05, "loss": 0.0133, "step": 85470 }, { "epoch": 1.23, "learning_rate": 1.958950523873348e-05, "loss": 0.0112, "step": 85480 }, { "epoch": 1.23, "learning_rate": 1.958945719899501e-05, "loss": 0.0126, "step": 85490 }, { "epoch": 1.23, "learning_rate": 1.958940915925654e-05, "loss": 0.0114, "step": 85500 }, { "epoch": 1.23, "learning_rate": 1.9589361119518066e-05, "loss": 0.0133, "step": 85510 }, { "epoch": 1.23, "learning_rate": 1.9589313079779595e-05, "loss": 0.0107, "step": 85520 }, { "epoch": 1.23, "learning_rate": 1.9589265040041124e-05, "loss": 0.009, "step": 85530 }, { "epoch": 1.23, "learning_rate": 1.958921700030265e-05, "loss": 0.0115, "step": 85540 }, { "epoch": 1.23, "learning_rate": 1.958916896056418e-05, "loss": 0.0118, "step": 85550 }, { "epoch": 1.23, "learning_rate": 1.958912092082571e-05, "loss": 0.0148, "step": 85560 }, { "epoch": 1.23, "learning_rate": 1.9589072881087238e-05, "loss": 0.0103, "step": 85570 }, { "epoch": 1.23, "learning_rate": 1.9589024841348764e-05, "loss": 0.0139, "step": 85580 }, { "epoch": 1.23, "learning_rate": 1.9588976801610293e-05, "loss": 0.0123, "step": 85590 }, { "epoch": 1.23, "learning_rate": 1.9588928761871822e-05, "loss": 0.0163, "step": 85600 }, { "epoch": 1.23, "learning_rate": 1.958888072213335e-05, "loss": 0.0144, "step": 85610 }, { "epoch": 1.23, "learning_rate": 1.9588832682394878e-05, "loss": 0.0121, "step": 85620 }, { "epoch": 1.23, "learning_rate": 1.9588784642656407e-05, "loss": 0.0088, "step": 85630 }, { "epoch": 1.23, "learning_rate": 1.9588736602917936e-05, "loss": 0.0096, "step": 85640 }, { "epoch": 1.23, "learning_rate": 1.958869336715331e-05, "loss": 0.0148, "step": 85650 }, { "epoch": 1.23, "learning_rate": 1.958864532741484e-05, "loss": 0.01, "step": 85660 }, { "epoch": 1.23, "learning_rate": 1.9588597287676366e-05, "loss": 0.0093, "step": 85670 }, { "epoch": 1.23, "learning_rate": 1.9588549247937895e-05, "loss": 0.0109, "step": 85680 }, { "epoch": 1.23, "learning_rate": 1.9588501208199424e-05, "loss": 0.0125, "step": 85690 }, { "epoch": 1.24, "learning_rate": 1.9588453168460954e-05, "loss": 0.0138, "step": 85700 }, { "epoch": 1.24, "learning_rate": 1.958840512872248e-05, "loss": 0.0121, "step": 85710 }, { "epoch": 1.24, "learning_rate": 1.958835708898401e-05, "loss": 0.0105, "step": 85720 }, { "epoch": 1.24, "learning_rate": 1.9588309049245538e-05, "loss": 0.0173, "step": 85730 }, { "epoch": 1.24, "learning_rate": 1.9588261009507067e-05, "loss": 0.0119, "step": 85740 }, { "epoch": 1.24, "learning_rate": 1.9588212969768593e-05, "loss": 0.0119, "step": 85750 }, { "epoch": 1.24, "learning_rate": 1.9588164930030123e-05, "loss": 0.0106, "step": 85760 }, { "epoch": 1.24, "learning_rate": 1.9588116890291652e-05, "loss": 0.0148, "step": 85770 }, { "epoch": 1.24, "learning_rate": 1.9588068850553178e-05, "loss": 0.0133, "step": 85780 }, { "epoch": 1.24, "learning_rate": 1.9588020810814707e-05, "loss": 0.0146, "step": 85790 }, { "epoch": 1.24, "learning_rate": 1.9587972771076236e-05, "loss": 0.0111, "step": 85800 }, { "epoch": 1.24, "learning_rate": 1.9587924731337766e-05, "loss": 0.0257, "step": 85810 }, { "epoch": 1.24, "learning_rate": 1.958787669159929e-05, "loss": 0.0137, "step": 85820 }, { "epoch": 1.24, "learning_rate": 1.958782865186082e-05, "loss": 0.0119, "step": 85830 }, { "epoch": 1.24, "learning_rate": 1.958778061212235e-05, "loss": 0.0103, "step": 85840 }, { "epoch": 1.24, "learning_rate": 1.9587732572383876e-05, "loss": 0.0114, "step": 85850 }, { "epoch": 1.24, "learning_rate": 1.9587684532645405e-05, "loss": 0.0165, "step": 85860 }, { "epoch": 1.24, "learning_rate": 1.9587636492906934e-05, "loss": 0.0125, "step": 85870 }, { "epoch": 1.24, "learning_rate": 1.9587588453168464e-05, "loss": 0.0125, "step": 85880 }, { "epoch": 1.24, "learning_rate": 1.958754041342999e-05, "loss": 0.0137, "step": 85890 }, { "epoch": 1.24, "learning_rate": 1.958749237369152e-05, "loss": 0.0135, "step": 85900 }, { "epoch": 1.24, "learning_rate": 1.9587444333953048e-05, "loss": 0.0144, "step": 85910 }, { "epoch": 1.24, "learning_rate": 1.9587396294214577e-05, "loss": 0.0087, "step": 85920 }, { "epoch": 1.24, "learning_rate": 1.9587348254476103e-05, "loss": 0.013, "step": 85930 }, { "epoch": 1.24, "learning_rate": 1.9587300214737632e-05, "loss": 0.0104, "step": 85940 }, { "epoch": 1.24, "learning_rate": 1.9587252174999162e-05, "loss": 0.0102, "step": 85950 }, { "epoch": 1.24, "learning_rate": 1.9587204135260688e-05, "loss": 0.0159, "step": 85960 }, { "epoch": 1.24, "learning_rate": 1.9587156095522217e-05, "loss": 0.0128, "step": 85970 }, { "epoch": 1.24, "learning_rate": 1.9587108055783746e-05, "loss": 0.0098, "step": 85980 }, { "epoch": 1.24, "learning_rate": 1.9587060016045275e-05, "loss": 0.014, "step": 85990 }, { "epoch": 1.24, "learning_rate": 1.95870119763068e-05, "loss": 0.012, "step": 86000 }, { "epoch": 1.24, "learning_rate": 1.958696393656833e-05, "loss": 0.0145, "step": 86010 }, { "epoch": 1.24, "learning_rate": 1.958691589682986e-05, "loss": 0.0089, "step": 86020 }, { "epoch": 1.24, "learning_rate": 1.9586867857091386e-05, "loss": 0.0101, "step": 86030 }, { "epoch": 1.24, "learning_rate": 1.9586819817352915e-05, "loss": 0.0132, "step": 86040 }, { "epoch": 1.24, "learning_rate": 1.9586771777614444e-05, "loss": 0.0181, "step": 86050 }, { "epoch": 1.24, "learning_rate": 1.9586723737875974e-05, "loss": 0.0128, "step": 86060 }, { "epoch": 1.24, "learning_rate": 1.95866756981375e-05, "loss": 0.0141, "step": 86070 }, { "epoch": 1.24, "learning_rate": 1.958662765839903e-05, "loss": 0.0136, "step": 86080 }, { "epoch": 1.24, "learning_rate": 1.9586579618660558e-05, "loss": 0.0118, "step": 86090 }, { "epoch": 1.24, "learning_rate": 1.9586531578922087e-05, "loss": 0.0113, "step": 86100 }, { "epoch": 1.24, "learning_rate": 1.9586483539183613e-05, "loss": 0.0136, "step": 86110 }, { "epoch": 1.24, "learning_rate": 1.9586435499445142e-05, "loss": 0.0108, "step": 86120 }, { "epoch": 1.24, "learning_rate": 1.958638745970667e-05, "loss": 0.0131, "step": 86130 }, { "epoch": 1.24, "learning_rate": 1.9586339419968198e-05, "loss": 0.01, "step": 86140 }, { "epoch": 1.24, "learning_rate": 1.9586291380229727e-05, "loss": 0.0122, "step": 86150 }, { "epoch": 1.24, "learning_rate": 1.9586243340491256e-05, "loss": 0.0113, "step": 86160 }, { "epoch": 1.24, "learning_rate": 1.9586195300752785e-05, "loss": 0.0131, "step": 86170 }, { "epoch": 1.24, "learning_rate": 1.958614726101431e-05, "loss": 0.0146, "step": 86180 }, { "epoch": 1.24, "learning_rate": 1.958609922127584e-05, "loss": 0.0145, "step": 86190 }, { "epoch": 1.24, "learning_rate": 1.958605118153737e-05, "loss": 0.0142, "step": 86200 }, { "epoch": 1.24, "learning_rate": 1.9586003141798896e-05, "loss": 0.0146, "step": 86210 }, { "epoch": 1.24, "learning_rate": 1.9585955102060425e-05, "loss": 0.0111, "step": 86220 }, { "epoch": 1.24, "learning_rate": 1.9585907062321954e-05, "loss": 0.0151, "step": 86230 }, { "epoch": 1.24, "learning_rate": 1.9585859022583483e-05, "loss": 0.0104, "step": 86240 }, { "epoch": 1.24, "learning_rate": 1.958581098284501e-05, "loss": 0.0131, "step": 86250 }, { "epoch": 1.24, "learning_rate": 1.958576294310654e-05, "loss": 0.0129, "step": 86260 }, { "epoch": 1.24, "learning_rate": 1.9585714903368068e-05, "loss": 0.0081, "step": 86270 }, { "epoch": 1.24, "learning_rate": 1.9585666863629594e-05, "loss": 0.0131, "step": 86280 }, { "epoch": 1.24, "learning_rate": 1.9585618823891123e-05, "loss": 0.0155, "step": 86290 }, { "epoch": 1.24, "learning_rate": 1.9585570784152652e-05, "loss": 0.0115, "step": 86300 }, { "epoch": 1.24, "learning_rate": 1.958552274441418e-05, "loss": 0.0127, "step": 86310 }, { "epoch": 1.24, "learning_rate": 1.9585474704675707e-05, "loss": 0.0088, "step": 86320 }, { "epoch": 1.24, "learning_rate": 1.9585426664937237e-05, "loss": 0.0214, "step": 86330 }, { "epoch": 1.24, "learning_rate": 1.9585378625198766e-05, "loss": 0.0121, "step": 86340 }, { "epoch": 1.24, "learning_rate": 1.9585330585460295e-05, "loss": 0.0125, "step": 86350 }, { "epoch": 1.24, "learning_rate": 1.958528254572182e-05, "loss": 0.0093, "step": 86360 }, { "epoch": 1.24, "learning_rate": 1.958523450598335e-05, "loss": 0.0144, "step": 86370 }, { "epoch": 1.24, "learning_rate": 1.958518646624488e-05, "loss": 0.014, "step": 86380 }, { "epoch": 1.25, "learning_rate": 1.9585138426506406e-05, "loss": 0.0131, "step": 86390 }, { "epoch": 1.25, "learning_rate": 1.9585090386767935e-05, "loss": 0.0084, "step": 86400 }, { "epoch": 1.25, "learning_rate": 1.9585042347029464e-05, "loss": 0.0105, "step": 86410 }, { "epoch": 1.25, "learning_rate": 1.9584994307290993e-05, "loss": 0.0134, "step": 86420 }, { "epoch": 1.25, "learning_rate": 1.958494626755252e-05, "loss": 0.0132, "step": 86430 }, { "epoch": 1.25, "learning_rate": 1.958489822781405e-05, "loss": 0.0106, "step": 86440 }, { "epoch": 1.25, "learning_rate": 1.9584850188075578e-05, "loss": 0.0139, "step": 86450 }, { "epoch": 1.25, "learning_rate": 1.9584802148337104e-05, "loss": 0.0128, "step": 86460 }, { "epoch": 1.25, "learning_rate": 1.9584754108598633e-05, "loss": 0.0116, "step": 86470 }, { "epoch": 1.25, "learning_rate": 1.9584706068860162e-05, "loss": 0.0115, "step": 86480 }, { "epoch": 1.25, "learning_rate": 1.958465802912169e-05, "loss": 0.0098, "step": 86490 }, { "epoch": 1.25, "learning_rate": 1.9584609989383217e-05, "loss": 0.0107, "step": 86500 }, { "epoch": 1.25, "learning_rate": 1.9584561949644747e-05, "loss": 0.0118, "step": 86510 }, { "epoch": 1.25, "learning_rate": 1.9584513909906276e-05, "loss": 0.0111, "step": 86520 }, { "epoch": 1.25, "learning_rate": 1.9584465870167805e-05, "loss": 0.0123, "step": 86530 }, { "epoch": 1.25, "learning_rate": 1.958441783042933e-05, "loss": 0.0105, "step": 86540 }, { "epoch": 1.25, "learning_rate": 1.958436979069086e-05, "loss": 0.0104, "step": 86550 }, { "epoch": 1.25, "learning_rate": 1.958432175095239e-05, "loss": 0.0144, "step": 86560 }, { "epoch": 1.25, "learning_rate": 1.9584273711213916e-05, "loss": 0.0133, "step": 86570 }, { "epoch": 1.25, "learning_rate": 1.9584225671475445e-05, "loss": 0.0135, "step": 86580 }, { "epoch": 1.25, "learning_rate": 1.9584177631736974e-05, "loss": 0.0102, "step": 86590 }, { "epoch": 1.25, "learning_rate": 1.9584129591998503e-05, "loss": 0.0136, "step": 86600 }, { "epoch": 1.25, "learning_rate": 1.958408155226003e-05, "loss": 0.0101, "step": 86610 }, { "epoch": 1.25, "learning_rate": 1.958403351252156e-05, "loss": 0.0082, "step": 86620 }, { "epoch": 1.25, "learning_rate": 1.9583985472783088e-05, "loss": 0.0109, "step": 86630 }, { "epoch": 1.25, "learning_rate": 1.9583937433044614e-05, "loss": 0.0187, "step": 86640 }, { "epoch": 1.25, "learning_rate": 1.9583889393306143e-05, "loss": 0.0112, "step": 86650 }, { "epoch": 1.25, "learning_rate": 1.9583841353567672e-05, "loss": 0.0135, "step": 86660 }, { "epoch": 1.25, "learning_rate": 1.95837933138292e-05, "loss": 0.0109, "step": 86670 }, { "epoch": 1.25, "learning_rate": 1.9583745274090727e-05, "loss": 0.0084, "step": 86680 }, { "epoch": 1.25, "learning_rate": 1.9583697234352257e-05, "loss": 0.0132, "step": 86690 }, { "epoch": 1.25, "learning_rate": 1.9583649194613786e-05, "loss": 0.0149, "step": 86700 }, { "epoch": 1.25, "learning_rate": 1.9583601154875315e-05, "loss": 0.0141, "step": 86710 }, { "epoch": 1.25, "learning_rate": 1.958355311513684e-05, "loss": 0.0085, "step": 86720 }, { "epoch": 1.25, "learning_rate": 1.958350507539837e-05, "loss": 0.0134, "step": 86730 }, { "epoch": 1.25, "learning_rate": 1.95834570356599e-05, "loss": 0.0109, "step": 86740 }, { "epoch": 1.25, "learning_rate": 1.9583408995921425e-05, "loss": 0.012, "step": 86750 }, { "epoch": 1.25, "learning_rate": 1.9583360956182955e-05, "loss": 0.0154, "step": 86760 }, { "epoch": 1.25, "learning_rate": 1.9583312916444484e-05, "loss": 0.0096, "step": 86770 }, { "epoch": 1.25, "learning_rate": 1.9583264876706013e-05, "loss": 0.0134, "step": 86780 }, { "epoch": 1.25, "learning_rate": 1.958321683696754e-05, "loss": 0.0113, "step": 86790 }, { "epoch": 1.25, "learning_rate": 1.958316879722907e-05, "loss": 0.0098, "step": 86800 }, { "epoch": 1.25, "learning_rate": 1.9583120757490598e-05, "loss": 0.0109, "step": 86810 }, { "epoch": 1.25, "learning_rate": 1.9583072717752124e-05, "loss": 0.0185, "step": 86820 }, { "epoch": 1.25, "learning_rate": 1.9583024678013653e-05, "loss": 0.0107, "step": 86830 }, { "epoch": 1.25, "learning_rate": 1.9582976638275182e-05, "loss": 0.0127, "step": 86840 }, { "epoch": 1.25, "learning_rate": 1.958292859853671e-05, "loss": 0.0137, "step": 86850 }, { "epoch": 1.25, "learning_rate": 1.9582880558798237e-05, "loss": 0.0139, "step": 86860 }, { "epoch": 1.25, "learning_rate": 1.9582832519059766e-05, "loss": 0.0088, "step": 86870 }, { "epoch": 1.25, "learning_rate": 1.9582784479321296e-05, "loss": 0.0127, "step": 86880 }, { "epoch": 1.25, "learning_rate": 1.9582736439582825e-05, "loss": 0.0152, "step": 86890 }, { "epoch": 1.25, "learning_rate": 1.958268839984435e-05, "loss": 0.011, "step": 86900 }, { "epoch": 1.25, "learning_rate": 1.958264036010588e-05, "loss": 0.012, "step": 86910 }, { "epoch": 1.25, "learning_rate": 1.958259232036741e-05, "loss": 0.0128, "step": 86920 }, { "epoch": 1.25, "learning_rate": 1.9582544280628935e-05, "loss": 0.0122, "step": 86930 }, { "epoch": 1.25, "learning_rate": 1.9582496240890468e-05, "loss": 0.0123, "step": 86940 }, { "epoch": 1.25, "learning_rate": 1.9582448201151997e-05, "loss": 0.0109, "step": 86950 }, { "epoch": 1.25, "learning_rate": 1.9582400161413523e-05, "loss": 0.0141, "step": 86960 }, { "epoch": 1.25, "learning_rate": 1.9582352121675052e-05, "loss": 0.0151, "step": 86970 }, { "epoch": 1.25, "learning_rate": 1.958230408193658e-05, "loss": 0.0115, "step": 86980 }, { "epoch": 1.25, "learning_rate": 1.9582256042198108e-05, "loss": 0.0122, "step": 86990 }, { "epoch": 1.25, "learning_rate": 1.9582208002459637e-05, "loss": 0.0099, "step": 87000 }, { "epoch": 1.25, "learning_rate": 1.9582159962721166e-05, "loss": 0.01, "step": 87010 }, { "epoch": 1.25, "learning_rate": 1.9582111922982695e-05, "loss": 0.0149, "step": 87020 }, { "epoch": 1.25, "learning_rate": 1.958206388324422e-05, "loss": 0.0102, "step": 87030 }, { "epoch": 1.25, "learning_rate": 1.958201584350575e-05, "loss": 0.013, "step": 87040 }, { "epoch": 1.25, "learning_rate": 1.958196780376728e-05, "loss": 0.0111, "step": 87050 }, { "epoch": 1.25, "learning_rate": 1.9581919764028806e-05, "loss": 0.0101, "step": 87060 }, { "epoch": 1.25, "learning_rate": 1.9581871724290335e-05, "loss": 0.009, "step": 87070 }, { "epoch": 1.25, "learning_rate": 1.9581823684551864e-05, "loss": 0.0162, "step": 87080 }, { "epoch": 1.26, "learning_rate": 1.9581775644813393e-05, "loss": 0.0141, "step": 87090 }, { "epoch": 1.26, "learning_rate": 1.958172760507492e-05, "loss": 0.0108, "step": 87100 }, { "epoch": 1.26, "learning_rate": 1.958167956533645e-05, "loss": 0.0131, "step": 87110 }, { "epoch": 1.26, "learning_rate": 1.9581631525597978e-05, "loss": 0.0124, "step": 87120 }, { "epoch": 1.26, "learning_rate": 1.9581583485859507e-05, "loss": 0.0121, "step": 87130 }, { "epoch": 1.26, "learning_rate": 1.9581535446121033e-05, "loss": 0.0121, "step": 87140 }, { "epoch": 1.26, "learning_rate": 1.9581487406382562e-05, "loss": 0.0157, "step": 87150 }, { "epoch": 1.26, "learning_rate": 1.958143936664409e-05, "loss": 0.0087, "step": 87160 }, { "epoch": 1.26, "learning_rate": 1.9581391326905617e-05, "loss": 0.0113, "step": 87170 }, { "epoch": 1.26, "learning_rate": 1.9581343287167147e-05, "loss": 0.0153, "step": 87180 }, { "epoch": 1.26, "learning_rate": 1.9581295247428676e-05, "loss": 0.0156, "step": 87190 }, { "epoch": 1.26, "learning_rate": 1.9581247207690205e-05, "loss": 0.0114, "step": 87200 }, { "epoch": 1.26, "learning_rate": 1.958119916795173e-05, "loss": 0.0124, "step": 87210 }, { "epoch": 1.26, "learning_rate": 1.958115112821326e-05, "loss": 0.0129, "step": 87220 }, { "epoch": 1.26, "learning_rate": 1.9581107892448635e-05, "loss": 0.0151, "step": 87230 }, { "epoch": 1.26, "learning_rate": 1.958105985271016e-05, "loss": 0.0112, "step": 87240 }, { "epoch": 1.26, "learning_rate": 1.958101181297169e-05, "loss": 0.0106, "step": 87250 }, { "epoch": 1.26, "learning_rate": 1.958096377323322e-05, "loss": 0.0113, "step": 87260 }, { "epoch": 1.26, "learning_rate": 1.958091573349475e-05, "loss": 0.0082, "step": 87270 }, { "epoch": 1.26, "learning_rate": 1.9580867693756275e-05, "loss": 0.0159, "step": 87280 }, { "epoch": 1.26, "learning_rate": 1.9580819654017804e-05, "loss": 0.0147, "step": 87290 }, { "epoch": 1.26, "learning_rate": 1.9580771614279333e-05, "loss": 0.0094, "step": 87300 }, { "epoch": 1.26, "learning_rate": 1.9580723574540862e-05, "loss": 0.0112, "step": 87310 }, { "epoch": 1.26, "learning_rate": 1.958067553480239e-05, "loss": 0.016, "step": 87320 }, { "epoch": 1.26, "learning_rate": 1.9580627495063918e-05, "loss": 0.0092, "step": 87330 }, { "epoch": 1.26, "learning_rate": 1.9580579455325447e-05, "loss": 0.015, "step": 87340 }, { "epoch": 1.26, "learning_rate": 1.9580531415586973e-05, "loss": 0.0175, "step": 87350 }, { "epoch": 1.26, "learning_rate": 1.9580483375848502e-05, "loss": 0.0126, "step": 87360 }, { "epoch": 1.26, "learning_rate": 1.958043533611003e-05, "loss": 0.0152, "step": 87370 }, { "epoch": 1.26, "learning_rate": 1.958038729637156e-05, "loss": 0.0158, "step": 87380 }, { "epoch": 1.26, "learning_rate": 1.9580339256633086e-05, "loss": 0.0128, "step": 87390 }, { "epoch": 1.26, "learning_rate": 1.9580291216894616e-05, "loss": 0.0099, "step": 87400 }, { "epoch": 1.26, "learning_rate": 1.9580243177156145e-05, "loss": 0.0086, "step": 87410 }, { "epoch": 1.26, "learning_rate": 1.958019513741767e-05, "loss": 0.0139, "step": 87420 }, { "epoch": 1.26, "learning_rate": 1.95801470976792e-05, "loss": 0.0091, "step": 87430 }, { "epoch": 1.26, "learning_rate": 1.958009905794073e-05, "loss": 0.0135, "step": 87440 }, { "epoch": 1.26, "learning_rate": 1.958005101820226e-05, "loss": 0.0155, "step": 87450 }, { "epoch": 1.26, "learning_rate": 1.9580002978463788e-05, "loss": 0.0141, "step": 87460 }, { "epoch": 1.26, "learning_rate": 1.9579954938725317e-05, "loss": 0.0096, "step": 87470 }, { "epoch": 1.26, "learning_rate": 1.9579906898986843e-05, "loss": 0.0108, "step": 87480 }, { "epoch": 1.26, "learning_rate": 1.9579858859248372e-05, "loss": 0.0129, "step": 87490 }, { "epoch": 1.26, "learning_rate": 1.95798108195099e-05, "loss": 0.0088, "step": 87500 }, { "epoch": 1.26, "learning_rate": 1.957976277977143e-05, "loss": 0.0096, "step": 87510 }, { "epoch": 1.26, "learning_rate": 1.9579714740032957e-05, "loss": 0.0135, "step": 87520 }, { "epoch": 1.26, "learning_rate": 1.9579666700294486e-05, "loss": 0.019, "step": 87530 }, { "epoch": 1.26, "learning_rate": 1.9579618660556015e-05, "loss": 0.0094, "step": 87540 }, { "epoch": 1.26, "learning_rate": 1.957957062081754e-05, "loss": 0.0131, "step": 87550 }, { "epoch": 1.26, "learning_rate": 1.957952258107907e-05, "loss": 0.0108, "step": 87560 }, { "epoch": 1.26, "learning_rate": 1.95794745413406e-05, "loss": 0.0115, "step": 87570 }, { "epoch": 1.26, "learning_rate": 1.957942650160213e-05, "loss": 0.0127, "step": 87580 }, { "epoch": 1.26, "learning_rate": 1.9579378461863655e-05, "loss": 0.0148, "step": 87590 }, { "epoch": 1.26, "learning_rate": 1.9579330422125184e-05, "loss": 0.0088, "step": 87600 }, { "epoch": 1.26, "learning_rate": 1.9579282382386713e-05, "loss": 0.0142, "step": 87610 }, { "epoch": 1.26, "learning_rate": 1.9579234342648243e-05, "loss": 0.0144, "step": 87620 }, { "epoch": 1.26, "learning_rate": 1.957918630290977e-05, "loss": 0.0125, "step": 87630 }, { "epoch": 1.26, "learning_rate": 1.9579138263171298e-05, "loss": 0.0152, "step": 87640 }, { "epoch": 1.26, "learning_rate": 1.9579090223432827e-05, "loss": 0.0111, "step": 87650 }, { "epoch": 1.26, "learning_rate": 1.9579042183694353e-05, "loss": 0.0111, "step": 87660 }, { "epoch": 1.26, "learning_rate": 1.9578994143955882e-05, "loss": 0.0118, "step": 87670 }, { "epoch": 1.26, "learning_rate": 1.957894610421741e-05, "loss": 0.0113, "step": 87680 }, { "epoch": 1.26, "learning_rate": 1.957889806447894e-05, "loss": 0.0118, "step": 87690 }, { "epoch": 1.26, "learning_rate": 1.9578850024740467e-05, "loss": 0.0159, "step": 87700 }, { "epoch": 1.26, "learning_rate": 1.9578801985001996e-05, "loss": 0.012, "step": 87710 }, { "epoch": 1.26, "learning_rate": 1.9578753945263525e-05, "loss": 0.0124, "step": 87720 }, { "epoch": 1.26, "learning_rate": 1.957870590552505e-05, "loss": 0.007, "step": 87730 }, { "epoch": 1.26, "learning_rate": 1.957865786578658e-05, "loss": 0.031, "step": 87740 }, { "epoch": 1.26, "learning_rate": 1.957860982604811e-05, "loss": 0.0115, "step": 87750 }, { "epoch": 1.26, "learning_rate": 1.957856178630964e-05, "loss": 0.0121, "step": 87760 }, { "epoch": 1.26, "learning_rate": 1.9578513746571165e-05, "loss": 0.01, "step": 87770 }, { "epoch": 1.27, "learning_rate": 1.9578465706832694e-05, "loss": 0.0082, "step": 87780 }, { "epoch": 1.27, "learning_rate": 1.9578417667094223e-05, "loss": 0.0143, "step": 87790 }, { "epoch": 1.27, "learning_rate": 1.9578369627355753e-05, "loss": 0.0148, "step": 87800 }, { "epoch": 1.27, "learning_rate": 1.957832158761728e-05, "loss": 0.0085, "step": 87810 }, { "epoch": 1.27, "learning_rate": 1.9578273547878808e-05, "loss": 0.0103, "step": 87820 }, { "epoch": 1.27, "learning_rate": 1.9578225508140337e-05, "loss": 0.014, "step": 87830 }, { "epoch": 1.27, "learning_rate": 1.9578177468401863e-05, "loss": 0.0124, "step": 87840 }, { "epoch": 1.27, "learning_rate": 1.9578129428663392e-05, "loss": 0.0113, "step": 87850 }, { "epoch": 1.27, "learning_rate": 1.957808138892492e-05, "loss": 0.0107, "step": 87860 }, { "epoch": 1.27, "learning_rate": 1.957803334918645e-05, "loss": 0.0111, "step": 87870 }, { "epoch": 1.27, "learning_rate": 1.9577985309447977e-05, "loss": 0.0123, "step": 87880 }, { "epoch": 1.27, "learning_rate": 1.9577937269709506e-05, "loss": 0.0099, "step": 87890 }, { "epoch": 1.27, "learning_rate": 1.9577889229971035e-05, "loss": 0.0148, "step": 87900 }, { "epoch": 1.27, "learning_rate": 1.957784119023256e-05, "loss": 0.0101, "step": 87910 }, { "epoch": 1.27, "learning_rate": 1.957779315049409e-05, "loss": 0.0127, "step": 87920 }, { "epoch": 1.27, "learning_rate": 1.957774511075562e-05, "loss": 0.0121, "step": 87930 }, { "epoch": 1.27, "learning_rate": 1.957769707101715e-05, "loss": 0.0126, "step": 87940 }, { "epoch": 1.27, "learning_rate": 1.9577649031278675e-05, "loss": 0.0118, "step": 87950 }, { "epoch": 1.27, "learning_rate": 1.9577600991540204e-05, "loss": 0.0208, "step": 87960 }, { "epoch": 1.27, "learning_rate": 1.9577552951801733e-05, "loss": 0.0093, "step": 87970 }, { "epoch": 1.27, "learning_rate": 1.9577504912063263e-05, "loss": 0.0141, "step": 87980 }, { "epoch": 1.27, "learning_rate": 1.957745687232479e-05, "loss": 0.0129, "step": 87990 }, { "epoch": 1.27, "learning_rate": 1.9577408832586318e-05, "loss": 0.014, "step": 88000 }, { "epoch": 1.27, "learning_rate": 1.9577360792847847e-05, "loss": 0.0127, "step": 88010 }, { "epoch": 1.27, "learning_rate": 1.9577312753109373e-05, "loss": 0.0097, "step": 88020 }, { "epoch": 1.27, "learning_rate": 1.9577264713370902e-05, "loss": 0.0153, "step": 88030 }, { "epoch": 1.27, "learning_rate": 1.957721667363243e-05, "loss": 0.0123, "step": 88040 }, { "epoch": 1.27, "learning_rate": 1.957716863389396e-05, "loss": 0.0218, "step": 88050 }, { "epoch": 1.27, "learning_rate": 1.9577120594155487e-05, "loss": 0.0151, "step": 88060 }, { "epoch": 1.27, "learning_rate": 1.9577072554417016e-05, "loss": 0.0161, "step": 88070 }, { "epoch": 1.27, "learning_rate": 1.9577024514678545e-05, "loss": 0.0094, "step": 88080 }, { "epoch": 1.27, "learning_rate": 1.957697647494007e-05, "loss": 0.0127, "step": 88090 }, { "epoch": 1.27, "learning_rate": 1.95769284352016e-05, "loss": 0.0152, "step": 88100 }, { "epoch": 1.27, "learning_rate": 1.957688039546313e-05, "loss": 0.0079, "step": 88110 }, { "epoch": 1.27, "learning_rate": 1.957683235572466e-05, "loss": 0.0136, "step": 88120 }, { "epoch": 1.27, "learning_rate": 1.9576784315986185e-05, "loss": 0.0082, "step": 88130 }, { "epoch": 1.27, "learning_rate": 1.9576736276247714e-05, "loss": 0.0126, "step": 88140 }, { "epoch": 1.27, "learning_rate": 1.9576688236509243e-05, "loss": 0.0148, "step": 88150 }, { "epoch": 1.27, "learning_rate": 1.9576640196770772e-05, "loss": 0.0115, "step": 88160 }, { "epoch": 1.27, "learning_rate": 1.95765921570323e-05, "loss": 0.0122, "step": 88170 }, { "epoch": 1.27, "learning_rate": 1.9576544117293828e-05, "loss": 0.0118, "step": 88180 }, { "epoch": 1.27, "learning_rate": 1.9576496077555357e-05, "loss": 0.0152, "step": 88190 }, { "epoch": 1.27, "learning_rate": 1.9576448037816883e-05, "loss": 0.0129, "step": 88200 }, { "epoch": 1.27, "learning_rate": 1.9576399998078412e-05, "loss": 0.0119, "step": 88210 }, { "epoch": 1.27, "learning_rate": 1.957635195833994e-05, "loss": 0.0178, "step": 88220 }, { "epoch": 1.27, "learning_rate": 1.957630391860147e-05, "loss": 0.0119, "step": 88230 }, { "epoch": 1.27, "learning_rate": 1.9576255878862996e-05, "loss": 0.0131, "step": 88240 }, { "epoch": 1.27, "learning_rate": 1.9576207839124526e-05, "loss": 0.0112, "step": 88250 }, { "epoch": 1.27, "learning_rate": 1.95761646033599e-05, "loss": 0.0223, "step": 88260 }, { "epoch": 1.27, "learning_rate": 1.957611656362143e-05, "loss": 0.0115, "step": 88270 }, { "epoch": 1.27, "learning_rate": 1.957606852388296e-05, "loss": 0.0145, "step": 88280 }, { "epoch": 1.27, "learning_rate": 1.9576020484144488e-05, "loss": 0.0103, "step": 88290 }, { "epoch": 1.27, "learning_rate": 1.9575972444406014e-05, "loss": 0.013, "step": 88300 }, { "epoch": 1.27, "learning_rate": 1.9575924404667543e-05, "loss": 0.0101, "step": 88310 }, { "epoch": 1.27, "learning_rate": 1.9575876364929073e-05, "loss": 0.0126, "step": 88320 }, { "epoch": 1.27, "learning_rate": 1.95758283251906e-05, "loss": 0.0119, "step": 88330 }, { "epoch": 1.27, "learning_rate": 1.9575780285452128e-05, "loss": 0.0123, "step": 88340 }, { "epoch": 1.27, "learning_rate": 1.9575732245713657e-05, "loss": 0.0074, "step": 88350 }, { "epoch": 1.27, "learning_rate": 1.9575684205975186e-05, "loss": 0.0146, "step": 88360 }, { "epoch": 1.27, "learning_rate": 1.9575636166236712e-05, "loss": 0.0084, "step": 88370 }, { "epoch": 1.27, "learning_rate": 1.957558812649824e-05, "loss": 0.0095, "step": 88380 }, { "epoch": 1.27, "learning_rate": 1.957554008675977e-05, "loss": 0.0158, "step": 88390 }, { "epoch": 1.27, "learning_rate": 1.95754920470213e-05, "loss": 0.0141, "step": 88400 }, { "epoch": 1.27, "learning_rate": 1.9575444007282826e-05, "loss": 0.0107, "step": 88410 }, { "epoch": 1.27, "learning_rate": 1.9575395967544355e-05, "loss": 0.0086, "step": 88420 }, { "epoch": 1.27, "learning_rate": 1.9575347927805884e-05, "loss": 0.0121, "step": 88430 }, { "epoch": 1.27, "learning_rate": 1.957529988806741e-05, "loss": 0.0123, "step": 88440 }, { "epoch": 1.27, "learning_rate": 1.957525184832894e-05, "loss": 0.011, "step": 88450 }, { "epoch": 1.27, "learning_rate": 1.957520380859047e-05, "loss": 0.0148, "step": 88460 }, { "epoch": 1.28, "learning_rate": 1.9575155768851998e-05, "loss": 0.0103, "step": 88470 }, { "epoch": 1.28, "learning_rate": 1.9575107729113524e-05, "loss": 0.016, "step": 88480 }, { "epoch": 1.28, "learning_rate": 1.9575059689375053e-05, "loss": 0.0131, "step": 88490 }, { "epoch": 1.28, "learning_rate": 1.9575011649636583e-05, "loss": 0.0107, "step": 88500 }, { "epoch": 1.28, "learning_rate": 1.957496360989811e-05, "loss": 0.0116, "step": 88510 }, { "epoch": 1.28, "learning_rate": 1.9574915570159638e-05, "loss": 0.013, "step": 88520 }, { "epoch": 1.28, "learning_rate": 1.9574867530421167e-05, "loss": 0.011, "step": 88530 }, { "epoch": 1.28, "learning_rate": 1.9574819490682696e-05, "loss": 0.0123, "step": 88540 }, { "epoch": 1.28, "learning_rate": 1.9574771450944222e-05, "loss": 0.0132, "step": 88550 }, { "epoch": 1.28, "learning_rate": 1.957472341120575e-05, "loss": 0.0108, "step": 88560 }, { "epoch": 1.28, "learning_rate": 1.957467537146728e-05, "loss": 0.0113, "step": 88570 }, { "epoch": 1.28, "learning_rate": 1.957462733172881e-05, "loss": 0.0118, "step": 88580 }, { "epoch": 1.28, "learning_rate": 1.9574579291990336e-05, "loss": 0.0111, "step": 88590 }, { "epoch": 1.28, "learning_rate": 1.9574531252251865e-05, "loss": 0.0131, "step": 88600 }, { "epoch": 1.28, "learning_rate": 1.9574483212513394e-05, "loss": 0.0115, "step": 88610 }, { "epoch": 1.28, "learning_rate": 1.957443517277492e-05, "loss": 0.0119, "step": 88620 }, { "epoch": 1.28, "learning_rate": 1.957438713303645e-05, "loss": 0.0158, "step": 88630 }, { "epoch": 1.28, "learning_rate": 1.957433909329798e-05, "loss": 0.0114, "step": 88640 }, { "epoch": 1.28, "learning_rate": 1.9574291053559508e-05, "loss": 0.0158, "step": 88650 }, { "epoch": 1.28, "learning_rate": 1.9574243013821034e-05, "loss": 0.0118, "step": 88660 }, { "epoch": 1.28, "learning_rate": 1.9574194974082563e-05, "loss": 0.0113, "step": 88670 }, { "epoch": 1.28, "learning_rate": 1.9574146934344092e-05, "loss": 0.0103, "step": 88680 }, { "epoch": 1.28, "learning_rate": 1.957409889460562e-05, "loss": 0.0142, "step": 88690 }, { "epoch": 1.28, "learning_rate": 1.9574050854867148e-05, "loss": 0.0077, "step": 88700 }, { "epoch": 1.28, "learning_rate": 1.9574002815128677e-05, "loss": 0.0096, "step": 88710 }, { "epoch": 1.28, "learning_rate": 1.9573954775390206e-05, "loss": 0.0156, "step": 88720 }, { "epoch": 1.28, "learning_rate": 1.9573906735651732e-05, "loss": 0.0139, "step": 88730 }, { "epoch": 1.28, "learning_rate": 1.957385869591326e-05, "loss": 0.0138, "step": 88740 }, { "epoch": 1.28, "learning_rate": 1.957381065617479e-05, "loss": 0.0094, "step": 88750 }, { "epoch": 1.28, "learning_rate": 1.957376261643632e-05, "loss": 0.0075, "step": 88760 }, { "epoch": 1.28, "learning_rate": 1.9573714576697846e-05, "loss": 0.0135, "step": 88770 }, { "epoch": 1.28, "learning_rate": 1.9573666536959375e-05, "loss": 0.0122, "step": 88780 }, { "epoch": 1.28, "learning_rate": 1.9573618497220904e-05, "loss": 0.0123, "step": 88790 }, { "epoch": 1.28, "learning_rate": 1.957357045748243e-05, "loss": 0.0107, "step": 88800 }, { "epoch": 1.28, "learning_rate": 1.957352241774396e-05, "loss": 0.0109, "step": 88810 }, { "epoch": 1.28, "learning_rate": 1.957347437800549e-05, "loss": 0.0147, "step": 88820 }, { "epoch": 1.28, "learning_rate": 1.9573426338267018e-05, "loss": 0.0135, "step": 88830 }, { "epoch": 1.28, "learning_rate": 1.9573378298528544e-05, "loss": 0.0101, "step": 88840 }, { "epoch": 1.28, "learning_rate": 1.9573330258790073e-05, "loss": 0.016, "step": 88850 }, { "epoch": 1.28, "learning_rate": 1.9573282219051602e-05, "loss": 0.0115, "step": 88860 }, { "epoch": 1.28, "learning_rate": 1.9573234179313128e-05, "loss": 0.0131, "step": 88870 }, { "epoch": 1.28, "learning_rate": 1.9573186139574658e-05, "loss": 0.0121, "step": 88880 }, { "epoch": 1.28, "learning_rate": 1.9573138099836187e-05, "loss": 0.0105, "step": 88890 }, { "epoch": 1.28, "learning_rate": 1.9573090060097716e-05, "loss": 0.0126, "step": 88900 }, { "epoch": 1.28, "learning_rate": 1.9573042020359242e-05, "loss": 0.0118, "step": 88910 }, { "epoch": 1.28, "learning_rate": 1.957299398062077e-05, "loss": 0.009, "step": 88920 }, { "epoch": 1.28, "learning_rate": 1.95729459408823e-05, "loss": 0.0107, "step": 88930 }, { "epoch": 1.28, "learning_rate": 1.9572897901143826e-05, "loss": 0.0128, "step": 88940 }, { "epoch": 1.28, "learning_rate": 1.9572849861405356e-05, "loss": 0.0133, "step": 88950 }, { "epoch": 1.28, "learning_rate": 1.9572801821666885e-05, "loss": 0.0105, "step": 88960 }, { "epoch": 1.28, "learning_rate": 1.9572753781928414e-05, "loss": 0.0123, "step": 88970 }, { "epoch": 1.28, "learning_rate": 1.957270574218994e-05, "loss": 0.0124, "step": 88980 }, { "epoch": 1.28, "learning_rate": 1.957265770245147e-05, "loss": 0.0097, "step": 88990 }, { "epoch": 1.28, "learning_rate": 1.9572609662713e-05, "loss": 0.0101, "step": 89000 }, { "epoch": 1.28, "learning_rate": 1.9572561622974528e-05, "loss": 0.011, "step": 89010 }, { "epoch": 1.28, "learning_rate": 1.9572513583236054e-05, "loss": 0.0122, "step": 89020 }, { "epoch": 1.28, "learning_rate": 1.9572465543497583e-05, "loss": 0.0126, "step": 89030 }, { "epoch": 1.28, "learning_rate": 1.9572417503759112e-05, "loss": 0.0135, "step": 89040 }, { "epoch": 1.28, "learning_rate": 1.9572369464020638e-05, "loss": 0.0128, "step": 89050 }, { "epoch": 1.28, "learning_rate": 1.9572321424282167e-05, "loss": 0.0128, "step": 89060 }, { "epoch": 1.28, "learning_rate": 1.9572273384543697e-05, "loss": 0.013, "step": 89070 }, { "epoch": 1.28, "learning_rate": 1.9572225344805226e-05, "loss": 0.0142, "step": 89080 }, { "epoch": 1.28, "learning_rate": 1.9572177305066752e-05, "loss": 0.0117, "step": 89090 }, { "epoch": 1.28, "learning_rate": 1.957212926532828e-05, "loss": 0.0128, "step": 89100 }, { "epoch": 1.28, "learning_rate": 1.957208122558981e-05, "loss": 0.0143, "step": 89110 }, { "epoch": 1.28, "learning_rate": 1.9572033185851336e-05, "loss": 0.0123, "step": 89120 }, { "epoch": 1.28, "learning_rate": 1.9571985146112866e-05, "loss": 0.0122, "step": 89130 }, { "epoch": 1.28, "learning_rate": 1.9571937106374395e-05, "loss": 0.0098, "step": 89140 }, { "epoch": 1.28, "learning_rate": 1.9571889066635924e-05, "loss": 0.0146, "step": 89150 }, { "epoch": 1.28, "learning_rate": 1.957184102689745e-05, "loss": 0.0126, "step": 89160 }, { "epoch": 1.29, "learning_rate": 1.957179298715898e-05, "loss": 0.0146, "step": 89170 }, { "epoch": 1.29, "learning_rate": 1.957174494742051e-05, "loss": 0.0116, "step": 89180 }, { "epoch": 1.29, "learning_rate": 1.9571696907682038e-05, "loss": 0.0106, "step": 89190 }, { "epoch": 1.29, "learning_rate": 1.9571648867943564e-05, "loss": 0.0105, "step": 89200 }, { "epoch": 1.29, "learning_rate": 1.9571600828205093e-05, "loss": 0.0129, "step": 89210 }, { "epoch": 1.29, "learning_rate": 1.9571552788466622e-05, "loss": 0.0184, "step": 89220 }, { "epoch": 1.29, "learning_rate": 1.9571504748728148e-05, "loss": 0.0114, "step": 89230 }, { "epoch": 1.29, "learning_rate": 1.9571456708989677e-05, "loss": 0.0092, "step": 89240 }, { "epoch": 1.29, "learning_rate": 1.9571408669251207e-05, "loss": 0.0215, "step": 89250 }, { "epoch": 1.29, "learning_rate": 1.9571360629512736e-05, "loss": 0.0104, "step": 89260 }, { "epoch": 1.29, "learning_rate": 1.9571312589774262e-05, "loss": 0.013, "step": 89270 }, { "epoch": 1.29, "learning_rate": 1.957126455003579e-05, "loss": 0.0171, "step": 89280 }, { "epoch": 1.29, "learning_rate": 1.957121651029732e-05, "loss": 0.0115, "step": 89290 }, { "epoch": 1.29, "learning_rate": 1.9571168470558846e-05, "loss": 0.0105, "step": 89300 }, { "epoch": 1.29, "learning_rate": 1.9571120430820375e-05, "loss": 0.0109, "step": 89310 }, { "epoch": 1.29, "learning_rate": 1.9571072391081905e-05, "loss": 0.012, "step": 89320 }, { "epoch": 1.29, "learning_rate": 1.9571024351343434e-05, "loss": 0.0108, "step": 89330 }, { "epoch": 1.29, "learning_rate": 1.957097631160496e-05, "loss": 0.0152, "step": 89340 }, { "epoch": 1.29, "learning_rate": 1.957092827186649e-05, "loss": 0.0134, "step": 89350 }, { "epoch": 1.29, "learning_rate": 1.957088023212802e-05, "loss": 0.0096, "step": 89360 }, { "epoch": 1.29, "learning_rate": 1.9570832192389548e-05, "loss": 0.0116, "step": 89370 }, { "epoch": 1.29, "learning_rate": 1.9570784152651074e-05, "loss": 0.0147, "step": 89380 }, { "epoch": 1.29, "learning_rate": 1.9570736112912603e-05, "loss": 0.0108, "step": 89390 }, { "epoch": 1.29, "learning_rate": 1.9570688073174132e-05, "loss": 0.0108, "step": 89400 }, { "epoch": 1.29, "learning_rate": 1.9570640033435658e-05, "loss": 0.0115, "step": 89410 }, { "epoch": 1.29, "learning_rate": 1.9570591993697187e-05, "loss": 0.0104, "step": 89420 }, { "epoch": 1.29, "learning_rate": 1.9570543953958717e-05, "loss": 0.0105, "step": 89430 }, { "epoch": 1.29, "learning_rate": 1.9570495914220246e-05, "loss": 0.0147, "step": 89440 }, { "epoch": 1.29, "learning_rate": 1.957044787448177e-05, "loss": 0.0123, "step": 89450 }, { "epoch": 1.29, "learning_rate": 1.95703998347433e-05, "loss": 0.011, "step": 89460 }, { "epoch": 1.29, "learning_rate": 1.957035179500483e-05, "loss": 0.0174, "step": 89470 }, { "epoch": 1.29, "learning_rate": 1.9570303755266356e-05, "loss": 0.011, "step": 89480 }, { "epoch": 1.29, "learning_rate": 1.9570255715527885e-05, "loss": 0.0107, "step": 89490 }, { "epoch": 1.29, "learning_rate": 1.9570207675789415e-05, "loss": 0.0095, "step": 89500 }, { "epoch": 1.29, "learning_rate": 1.9570159636050944e-05, "loss": 0.0104, "step": 89510 }, { "epoch": 1.29, "learning_rate": 1.957011159631247e-05, "loss": 0.0096, "step": 89520 }, { "epoch": 1.29, "learning_rate": 1.9570063556574e-05, "loss": 0.0122, "step": 89530 }, { "epoch": 1.29, "learning_rate": 1.957001551683553e-05, "loss": 0.0104, "step": 89540 }, { "epoch": 1.29, "learning_rate": 1.9569967477097058e-05, "loss": 0.0115, "step": 89550 }, { "epoch": 1.29, "learning_rate": 1.9569919437358583e-05, "loss": 0.0134, "step": 89560 }, { "epoch": 1.29, "learning_rate": 1.9569871397620113e-05, "loss": 0.0117, "step": 89570 }, { "epoch": 1.29, "learning_rate": 1.9569823357881642e-05, "loss": 0.0148, "step": 89580 }, { "epoch": 1.29, "learning_rate": 1.9569775318143168e-05, "loss": 0.0114, "step": 89590 }, { "epoch": 1.29, "learning_rate": 1.9569727278404697e-05, "loss": 0.0089, "step": 89600 }, { "epoch": 1.29, "learning_rate": 1.9569679238666226e-05, "loss": 0.0101, "step": 89610 }, { "epoch": 1.29, "learning_rate": 1.9569631198927756e-05, "loss": 0.0117, "step": 89620 }, { "epoch": 1.29, "learning_rate": 1.956958315918928e-05, "loss": 0.0138, "step": 89630 }, { "epoch": 1.29, "learning_rate": 1.956953511945081e-05, "loss": 0.0133, "step": 89640 }, { "epoch": 1.29, "learning_rate": 1.956948707971234e-05, "loss": 0.0161, "step": 89650 }, { "epoch": 1.29, "learning_rate": 1.9569439039973866e-05, "loss": 0.011, "step": 89660 }, { "epoch": 1.29, "learning_rate": 1.9569391000235395e-05, "loss": 0.012, "step": 89670 }, { "epoch": 1.29, "learning_rate": 1.9569342960496925e-05, "loss": 0.0132, "step": 89680 }, { "epoch": 1.29, "learning_rate": 1.9569294920758454e-05, "loss": 0.0121, "step": 89690 }, { "epoch": 1.29, "learning_rate": 1.956924688101998e-05, "loss": 0.0124, "step": 89700 }, { "epoch": 1.29, "learning_rate": 1.956919884128151e-05, "loss": 0.01, "step": 89710 }, { "epoch": 1.29, "learning_rate": 1.9569150801543038e-05, "loss": 0.0138, "step": 89720 }, { "epoch": 1.29, "learning_rate": 1.9569102761804568e-05, "loss": 0.0161, "step": 89730 }, { "epoch": 1.29, "learning_rate": 1.9569054722066093e-05, "loss": 0.0112, "step": 89740 }, { "epoch": 1.29, "learning_rate": 1.9569006682327623e-05, "loss": 0.0111, "step": 89750 }, { "epoch": 1.29, "learning_rate": 1.9568958642589152e-05, "loss": 0.0142, "step": 89760 }, { "epoch": 1.29, "learning_rate": 1.9568910602850678e-05, "loss": 0.0139, "step": 89770 }, { "epoch": 1.29, "learning_rate": 1.9568862563112207e-05, "loss": 0.0124, "step": 89780 }, { "epoch": 1.29, "learning_rate": 1.9568814523373736e-05, "loss": 0.0133, "step": 89790 }, { "epoch": 1.29, "learning_rate": 1.9568766483635266e-05, "loss": 0.0104, "step": 89800 }, { "epoch": 1.29, "learning_rate": 1.956871844389679e-05, "loss": 0.011, "step": 89810 }, { "epoch": 1.29, "learning_rate": 1.956867040415832e-05, "loss": 0.01, "step": 89820 }, { "epoch": 1.29, "learning_rate": 1.956862236441985e-05, "loss": 0.013, "step": 89830 }, { "epoch": 1.29, "learning_rate": 1.9568574324681376e-05, "loss": 0.0121, "step": 89840 }, { "epoch": 1.29, "learning_rate": 1.9568526284942905e-05, "loss": 0.0114, "step": 89850 }, { "epoch": 1.3, "learning_rate": 1.9568478245204434e-05, "loss": 0.013, "step": 89860 }, { "epoch": 1.3, "learning_rate": 1.9568430205465964e-05, "loss": 0.011, "step": 89870 }, { "epoch": 1.3, "learning_rate": 1.956838216572749e-05, "loss": 0.0166, "step": 89880 }, { "epoch": 1.3, "learning_rate": 1.956833412598902e-05, "loss": 0.0124, "step": 89890 }, { "epoch": 1.3, "learning_rate": 1.9568286086250548e-05, "loss": 0.0125, "step": 89900 }, { "epoch": 1.3, "learning_rate": 1.9568238046512077e-05, "loss": 0.0102, "step": 89910 }, { "epoch": 1.3, "learning_rate": 1.9568190006773603e-05, "loss": 0.0129, "step": 89920 }, { "epoch": 1.3, "learning_rate": 1.9568141967035133e-05, "loss": 0.0147, "step": 89930 }, { "epoch": 1.3, "learning_rate": 1.9568093927296662e-05, "loss": 0.0117, "step": 89940 }, { "epoch": 1.3, "learning_rate": 1.9568045887558188e-05, "loss": 0.0114, "step": 89950 }, { "epoch": 1.3, "learning_rate": 1.9567997847819717e-05, "loss": 0.0195, "step": 89960 }, { "epoch": 1.3, "learning_rate": 1.9567949808081246e-05, "loss": 0.0115, "step": 89970 }, { "epoch": 1.3, "learning_rate": 1.9567901768342776e-05, "loss": 0.0149, "step": 89980 }, { "epoch": 1.3, "learning_rate": 1.95678537286043e-05, "loss": 0.0111, "step": 89990 }, { "epoch": 1.3, "learning_rate": 1.956780568886583e-05, "loss": 0.0105, "step": 90000 }, { "epoch": 1.3, "learning_rate": 1.956775764912736e-05, "loss": 0.0077, "step": 90010 }, { "epoch": 1.3, "learning_rate": 1.9567709609388886e-05, "loss": 0.0176, "step": 90020 }, { "epoch": 1.3, "learning_rate": 1.9567661569650415e-05, "loss": 0.0134, "step": 90030 }, { "epoch": 1.3, "learning_rate": 1.9567613529911944e-05, "loss": 0.0108, "step": 90040 }, { "epoch": 1.3, "learning_rate": 1.9567565490173474e-05, "loss": 0.017, "step": 90050 }, { "epoch": 1.3, "learning_rate": 1.9567517450435e-05, "loss": 0.0182, "step": 90060 }, { "epoch": 1.3, "learning_rate": 1.956746941069653e-05, "loss": 0.0115, "step": 90070 }, { "epoch": 1.3, "learning_rate": 1.9567421370958058e-05, "loss": 0.0122, "step": 90080 }, { "epoch": 1.3, "learning_rate": 1.9567373331219587e-05, "loss": 0.0136, "step": 90090 }, { "epoch": 1.3, "learning_rate": 1.9567325291481113e-05, "loss": 0.0108, "step": 90100 }, { "epoch": 1.3, "learning_rate": 1.9567277251742642e-05, "loss": 0.0118, "step": 90110 }, { "epoch": 1.3, "learning_rate": 1.9567229212004172e-05, "loss": 0.0107, "step": 90120 }, { "epoch": 1.3, "learning_rate": 1.9567181172265698e-05, "loss": 0.01, "step": 90130 }, { "epoch": 1.3, "learning_rate": 1.9567133132527227e-05, "loss": 0.0092, "step": 90140 }, { "epoch": 1.3, "learning_rate": 1.9567085092788756e-05, "loss": 0.0126, "step": 90150 }, { "epoch": 1.3, "learning_rate": 1.9567037053050285e-05, "loss": 0.011, "step": 90160 }, { "epoch": 1.3, "learning_rate": 1.956698901331181e-05, "loss": 0.0157, "step": 90170 }, { "epoch": 1.3, "learning_rate": 1.956694097357334e-05, "loss": 0.0143, "step": 90180 }, { "epoch": 1.3, "learning_rate": 1.956689293383487e-05, "loss": 0.0132, "step": 90190 }, { "epoch": 1.3, "learning_rate": 1.9566844894096396e-05, "loss": 0.0104, "step": 90200 }, { "epoch": 1.3, "learning_rate": 1.9566796854357925e-05, "loss": 0.0131, "step": 90210 }, { "epoch": 1.3, "learning_rate": 1.9566748814619454e-05, "loss": 0.013, "step": 90220 }, { "epoch": 1.3, "learning_rate": 1.9566700774880984e-05, "loss": 0.0125, "step": 90230 }, { "epoch": 1.3, "learning_rate": 1.956665273514251e-05, "loss": 0.0158, "step": 90240 }, { "epoch": 1.3, "learning_rate": 1.956660469540404e-05, "loss": 0.0109, "step": 90250 }, { "epoch": 1.3, "learning_rate": 1.9566556655665568e-05, "loss": 0.0224, "step": 90260 }, { "epoch": 1.3, "learning_rate": 1.9566508615927097e-05, "loss": 0.0155, "step": 90270 }, { "epoch": 1.3, "learning_rate": 1.9566460576188623e-05, "loss": 0.0141, "step": 90280 }, { "epoch": 1.3, "learning_rate": 1.9566412536450152e-05, "loss": 0.0106, "step": 90290 }, { "epoch": 1.3, "learning_rate": 1.956636449671168e-05, "loss": 0.0126, "step": 90300 }, { "epoch": 1.3, "learning_rate": 1.9566316456973208e-05, "loss": 0.0082, "step": 90310 }, { "epoch": 1.3, "learning_rate": 1.9566268417234737e-05, "loss": 0.0154, "step": 90320 }, { "epoch": 1.3, "learning_rate": 1.9566220377496266e-05, "loss": 0.0108, "step": 90330 }, { "epoch": 1.3, "learning_rate": 1.9566172337757795e-05, "loss": 0.0126, "step": 90340 }, { "epoch": 1.3, "learning_rate": 1.956612429801932e-05, "loss": 0.0103, "step": 90350 }, { "epoch": 1.3, "learning_rate": 1.956607625828085e-05, "loss": 0.013, "step": 90360 }, { "epoch": 1.3, "learning_rate": 1.956602821854238e-05, "loss": 0.0106, "step": 90370 }, { "epoch": 1.3, "learning_rate": 1.9565980178803906e-05, "loss": 0.0172, "step": 90380 }, { "epoch": 1.3, "learning_rate": 1.9565932139065435e-05, "loss": 0.0141, "step": 90390 }, { "epoch": 1.3, "learning_rate": 1.9565884099326964e-05, "loss": 0.0106, "step": 90400 }, { "epoch": 1.3, "learning_rate": 1.9565836059588493e-05, "loss": 0.0086, "step": 90410 }, { "epoch": 1.3, "learning_rate": 1.956578801985002e-05, "loss": 0.0136, "step": 90420 }, { "epoch": 1.3, "learning_rate": 1.956573998011155e-05, "loss": 0.0117, "step": 90430 }, { "epoch": 1.3, "learning_rate": 1.9565691940373078e-05, "loss": 0.0086, "step": 90440 }, { "epoch": 1.3, "learning_rate": 1.9565643900634607e-05, "loss": 0.0129, "step": 90450 }, { "epoch": 1.3, "learning_rate": 1.9565595860896133e-05, "loss": 0.0156, "step": 90460 }, { "epoch": 1.3, "learning_rate": 1.9565547821157662e-05, "loss": 0.0145, "step": 90470 }, { "epoch": 1.3, "learning_rate": 1.956549978141919e-05, "loss": 0.0092, "step": 90480 }, { "epoch": 1.3, "learning_rate": 1.9565451741680717e-05, "loss": 0.0127, "step": 90490 }, { "epoch": 1.3, "learning_rate": 1.9565403701942247e-05, "loss": 0.0133, "step": 90500 }, { "epoch": 1.3, "learning_rate": 1.9565355662203776e-05, "loss": 0.0096, "step": 90510 }, { "epoch": 1.3, "learning_rate": 1.9565307622465305e-05, "loss": 0.0153, "step": 90520 }, { "epoch": 1.3, "learning_rate": 1.9565259582726835e-05, "loss": 0.0132, "step": 90530 }, { "epoch": 1.3, "learning_rate": 1.9565211542988364e-05, "loss": 0.0152, "step": 90540 }, { "epoch": 1.3, "learning_rate": 1.956516350324989e-05, "loss": 0.0111, "step": 90550 }, { "epoch": 1.31, "learning_rate": 1.956511546351142e-05, "loss": 0.0143, "step": 90560 }, { "epoch": 1.31, "learning_rate": 1.9565067423772948e-05, "loss": 0.0106, "step": 90570 }, { "epoch": 1.31, "learning_rate": 1.9565019384034478e-05, "loss": 0.014, "step": 90580 }, { "epoch": 1.31, "learning_rate": 1.9564971344296003e-05, "loss": 0.0109, "step": 90590 }, { "epoch": 1.31, "learning_rate": 1.9564923304557533e-05, "loss": 0.0127, "step": 90600 }, { "epoch": 1.31, "learning_rate": 1.9564875264819062e-05, "loss": 0.0147, "step": 90610 }, { "epoch": 1.31, "learning_rate": 1.9564827225080588e-05, "loss": 0.0088, "step": 90620 }, { "epoch": 1.31, "learning_rate": 1.9564779185342117e-05, "loss": 0.0122, "step": 90630 }, { "epoch": 1.31, "learning_rate": 1.9564731145603646e-05, "loss": 0.0097, "step": 90640 }, { "epoch": 1.31, "learning_rate": 1.9564683105865176e-05, "loss": 0.0129, "step": 90650 }, { "epoch": 1.31, "learning_rate": 1.95646350661267e-05, "loss": 0.0108, "step": 90660 }, { "epoch": 1.31, "learning_rate": 1.956458702638823e-05, "loss": 0.011, "step": 90670 }, { "epoch": 1.31, "learning_rate": 1.956453898664976e-05, "loss": 0.0106, "step": 90680 }, { "epoch": 1.31, "learning_rate": 1.9564490946911286e-05, "loss": 0.009, "step": 90690 }, { "epoch": 1.31, "learning_rate": 1.9564442907172815e-05, "loss": 0.017, "step": 90700 }, { "epoch": 1.31, "learning_rate": 1.9564394867434344e-05, "loss": 0.0091, "step": 90710 }, { "epoch": 1.31, "learning_rate": 1.9564346827695874e-05, "loss": 0.0141, "step": 90720 }, { "epoch": 1.31, "learning_rate": 1.95642987879574e-05, "loss": 0.0163, "step": 90730 }, { "epoch": 1.31, "learning_rate": 1.956425074821893e-05, "loss": 0.0115, "step": 90740 }, { "epoch": 1.31, "learning_rate": 1.9564202708480458e-05, "loss": 0.0145, "step": 90750 }, { "epoch": 1.31, "learning_rate": 1.9564154668741987e-05, "loss": 0.009, "step": 90760 }, { "epoch": 1.31, "learning_rate": 1.9564106629003513e-05, "loss": 0.0149, "step": 90770 }, { "epoch": 1.31, "learning_rate": 1.9564058589265043e-05, "loss": 0.012, "step": 90780 }, { "epoch": 1.31, "learning_rate": 1.9564010549526572e-05, "loss": 0.012, "step": 90790 }, { "epoch": 1.31, "learning_rate": 1.9563962509788098e-05, "loss": 0.0113, "step": 90800 }, { "epoch": 1.31, "learning_rate": 1.9563914470049627e-05, "loss": 0.0151, "step": 90810 }, { "epoch": 1.31, "learning_rate": 1.9563866430311156e-05, "loss": 0.0184, "step": 90820 }, { "epoch": 1.31, "learning_rate": 1.9563818390572686e-05, "loss": 0.011, "step": 90830 }, { "epoch": 1.31, "learning_rate": 1.956377035083421e-05, "loss": 0.0104, "step": 90840 }, { "epoch": 1.31, "learning_rate": 1.956372231109574e-05, "loss": 0.0095, "step": 90850 }, { "epoch": 1.31, "learning_rate": 1.956367427135727e-05, "loss": 0.0098, "step": 90860 }, { "epoch": 1.31, "learning_rate": 1.9563626231618796e-05, "loss": 0.0113, "step": 90870 }, { "epoch": 1.31, "learning_rate": 1.9563578191880325e-05, "loss": 0.0142, "step": 90880 }, { "epoch": 1.31, "learning_rate": 1.9563530152141854e-05, "loss": 0.0181, "step": 90890 }, { "epoch": 1.31, "learning_rate": 1.9563482112403384e-05, "loss": 0.0118, "step": 90900 }, { "epoch": 1.31, "learning_rate": 1.956343407266491e-05, "loss": 0.0137, "step": 90910 }, { "epoch": 1.31, "learning_rate": 1.956338603292644e-05, "loss": 0.0085, "step": 90920 }, { "epoch": 1.31, "learning_rate": 1.9563337993187968e-05, "loss": 0.0106, "step": 90930 }, { "epoch": 1.31, "learning_rate": 1.9563289953449497e-05, "loss": 0.0126, "step": 90940 }, { "epoch": 1.31, "learning_rate": 1.9563241913711023e-05, "loss": 0.0165, "step": 90950 }, { "epoch": 1.31, "learning_rate": 1.9563193873972552e-05, "loss": 0.0152, "step": 90960 }, { "epoch": 1.31, "learning_rate": 1.9563145834234082e-05, "loss": 0.012, "step": 90970 }, { "epoch": 1.31, "learning_rate": 1.9563097794495608e-05, "loss": 0.0129, "step": 90980 }, { "epoch": 1.31, "learning_rate": 1.9563049754757137e-05, "loss": 0.0163, "step": 90990 }, { "epoch": 1.31, "learning_rate": 1.9563001715018666e-05, "loss": 0.0146, "step": 91000 }, { "epoch": 1.31, "learning_rate": 1.9562953675280195e-05, "loss": 0.0163, "step": 91010 }, { "epoch": 1.31, "learning_rate": 1.956290563554172e-05, "loss": 0.0128, "step": 91020 }, { "epoch": 1.31, "learning_rate": 1.956285759580325e-05, "loss": 0.0157, "step": 91030 }, { "epoch": 1.31, "learning_rate": 1.956280955606478e-05, "loss": 0.0129, "step": 91040 }, { "epoch": 1.31, "learning_rate": 1.9562761516326306e-05, "loss": 0.0117, "step": 91050 }, { "epoch": 1.31, "learning_rate": 1.9562713476587835e-05, "loss": 0.0108, "step": 91060 }, { "epoch": 1.31, "learning_rate": 1.9562665436849364e-05, "loss": 0.012, "step": 91070 }, { "epoch": 1.31, "learning_rate": 1.9562617397110894e-05, "loss": 0.0104, "step": 91080 }, { "epoch": 1.31, "learning_rate": 1.956256935737242e-05, "loss": 0.0118, "step": 91090 }, { "epoch": 1.31, "learning_rate": 1.956252131763395e-05, "loss": 0.0116, "step": 91100 }, { "epoch": 1.31, "learning_rate": 1.9562473277895478e-05, "loss": 0.0079, "step": 91110 }, { "epoch": 1.31, "learning_rate": 1.9562425238157007e-05, "loss": 0.0109, "step": 91120 }, { "epoch": 1.31, "learning_rate": 1.9562377198418533e-05, "loss": 0.0122, "step": 91130 }, { "epoch": 1.31, "learning_rate": 1.9562329158680062e-05, "loss": 0.0159, "step": 91140 }, { "epoch": 1.31, "learning_rate": 1.956228111894159e-05, "loss": 0.0167, "step": 91150 }, { "epoch": 1.31, "learning_rate": 1.9562233079203118e-05, "loss": 0.0141, "step": 91160 }, { "epoch": 1.31, "learning_rate": 1.9562185039464647e-05, "loss": 0.0118, "step": 91170 }, { "epoch": 1.31, "learning_rate": 1.9562136999726176e-05, "loss": 0.0168, "step": 91180 }, { "epoch": 1.31, "learning_rate": 1.9562088959987705e-05, "loss": 0.0133, "step": 91190 }, { "epoch": 1.31, "learning_rate": 1.956204092024923e-05, "loss": 0.012, "step": 91200 }, { "epoch": 1.31, "learning_rate": 1.956199288051076e-05, "loss": 0.0084, "step": 91210 }, { "epoch": 1.31, "learning_rate": 1.956194484077229e-05, "loss": 0.0095, "step": 91220 }, { "epoch": 1.31, "learning_rate": 1.9561896801033816e-05, "loss": 0.0105, "step": 91230 }, { "epoch": 1.31, "learning_rate": 1.9561848761295345e-05, "loss": 0.0116, "step": 91240 }, { "epoch": 1.32, "learning_rate": 1.9561800721556874e-05, "loss": 0.0117, "step": 91250 }, { "epoch": 1.32, "learning_rate": 1.9561752681818403e-05, "loss": 0.0116, "step": 91260 }, { "epoch": 1.32, "learning_rate": 1.956170464207993e-05, "loss": 0.0131, "step": 91270 }, { "epoch": 1.32, "learning_rate": 1.956165660234146e-05, "loss": 0.0136, "step": 91280 }, { "epoch": 1.32, "learning_rate": 1.9561608562602988e-05, "loss": 0.0086, "step": 91290 }, { "epoch": 1.32, "learning_rate": 1.9561560522864517e-05, "loss": 0.0146, "step": 91300 }, { "epoch": 1.32, "learning_rate": 1.9561512483126043e-05, "loss": 0.0162, "step": 91310 }, { "epoch": 1.32, "learning_rate": 1.9561464443387572e-05, "loss": 0.0104, "step": 91320 }, { "epoch": 1.32, "learning_rate": 1.95614164036491e-05, "loss": 0.0146, "step": 91330 }, { "epoch": 1.32, "learning_rate": 1.9561368363910627e-05, "loss": 0.0097, "step": 91340 }, { "epoch": 1.32, "learning_rate": 1.9561320324172157e-05, "loss": 0.0121, "step": 91350 }, { "epoch": 1.32, "learning_rate": 1.9561272284433686e-05, "loss": 0.0075, "step": 91360 }, { "epoch": 1.32, "learning_rate": 1.9561224244695215e-05, "loss": 0.0188, "step": 91370 }, { "epoch": 1.32, "learning_rate": 1.956117620495674e-05, "loss": 0.0112, "step": 91380 }, { "epoch": 1.32, "learning_rate": 1.956112816521827e-05, "loss": 0.012, "step": 91390 }, { "epoch": 1.32, "learning_rate": 1.95610801254798e-05, "loss": 0.0103, "step": 91400 }, { "epoch": 1.32, "learning_rate": 1.9561032085741326e-05, "loss": 0.013, "step": 91410 }, { "epoch": 1.32, "learning_rate": 1.9560984046002855e-05, "loss": 0.0137, "step": 91420 }, { "epoch": 1.32, "learning_rate": 1.9560936006264384e-05, "loss": 0.0086, "step": 91430 }, { "epoch": 1.32, "learning_rate": 1.9560887966525913e-05, "loss": 0.01, "step": 91440 }, { "epoch": 1.32, "learning_rate": 1.956083992678744e-05, "loss": 0.0081, "step": 91450 }, { "epoch": 1.32, "learning_rate": 1.956079188704897e-05, "loss": 0.0113, "step": 91460 }, { "epoch": 1.32, "learning_rate": 1.9560743847310498e-05, "loss": 0.0098, "step": 91470 }, { "epoch": 1.32, "learning_rate": 1.9560695807572027e-05, "loss": 0.0149, "step": 91480 }, { "epoch": 1.32, "learning_rate": 1.9560647767833553e-05, "loss": 0.0107, "step": 91490 }, { "epoch": 1.32, "learning_rate": 1.9560599728095082e-05, "loss": 0.0116, "step": 91500 }, { "epoch": 1.32, "learning_rate": 1.956055168835661e-05, "loss": 0.0144, "step": 91510 }, { "epoch": 1.32, "learning_rate": 1.9560503648618137e-05, "loss": 0.0125, "step": 91520 }, { "epoch": 1.32, "learning_rate": 1.9560455608879667e-05, "loss": 0.0123, "step": 91530 }, { "epoch": 1.32, "learning_rate": 1.9560407569141196e-05, "loss": 0.0116, "step": 91540 }, { "epoch": 1.32, "learning_rate": 1.9560359529402725e-05, "loss": 0.0101, "step": 91550 }, { "epoch": 1.32, "learning_rate": 1.956031148966425e-05, "loss": 0.0132, "step": 91560 }, { "epoch": 1.32, "learning_rate": 1.956026344992578e-05, "loss": 0.0122, "step": 91570 }, { "epoch": 1.32, "learning_rate": 1.956021541018731e-05, "loss": 0.0102, "step": 91580 }, { "epoch": 1.32, "learning_rate": 1.9560167370448836e-05, "loss": 0.0124, "step": 91590 }, { "epoch": 1.32, "learning_rate": 1.9560119330710365e-05, "loss": 0.0155, "step": 91600 }, { "epoch": 1.32, "learning_rate": 1.9560071290971894e-05, "loss": 0.0152, "step": 91610 }, { "epoch": 1.32, "learning_rate": 1.9560023251233423e-05, "loss": 0.013, "step": 91620 }, { "epoch": 1.32, "learning_rate": 1.955997521149495e-05, "loss": 0.0132, "step": 91630 }, { "epoch": 1.32, "learning_rate": 1.955992717175648e-05, "loss": 0.0103, "step": 91640 }, { "epoch": 1.32, "learning_rate": 1.9559879132018008e-05, "loss": 0.0128, "step": 91650 }, { "epoch": 1.32, "learning_rate": 1.9559831092279537e-05, "loss": 0.0098, "step": 91660 }, { "epoch": 1.32, "learning_rate": 1.9559783052541063e-05, "loss": 0.0086, "step": 91670 }, { "epoch": 1.32, "learning_rate": 1.9559735012802592e-05, "loss": 0.0153, "step": 91680 }, { "epoch": 1.32, "learning_rate": 1.955968697306412e-05, "loss": 0.0113, "step": 91690 }, { "epoch": 1.32, "learning_rate": 1.9559638933325647e-05, "loss": 0.0107, "step": 91700 }, { "epoch": 1.32, "learning_rate": 1.9559590893587177e-05, "loss": 0.0112, "step": 91710 }, { "epoch": 1.32, "learning_rate": 1.9559542853848706e-05, "loss": 0.0129, "step": 91720 }, { "epoch": 1.32, "learning_rate": 1.9559494814110235e-05, "loss": 0.0083, "step": 91730 }, { "epoch": 1.32, "learning_rate": 1.955944677437176e-05, "loss": 0.0119, "step": 91740 }, { "epoch": 1.32, "learning_rate": 1.955939873463329e-05, "loss": 0.0133, "step": 91750 }, { "epoch": 1.32, "learning_rate": 1.955935069489482e-05, "loss": 0.01, "step": 91760 }, { "epoch": 1.32, "learning_rate": 1.9559302655156345e-05, "loss": 0.0137, "step": 91770 }, { "epoch": 1.32, "learning_rate": 1.9559254615417875e-05, "loss": 0.0143, "step": 91780 }, { "epoch": 1.32, "learning_rate": 1.9559206575679404e-05, "loss": 0.0154, "step": 91790 }, { "epoch": 1.32, "learning_rate": 1.9559158535940933e-05, "loss": 0.0088, "step": 91800 }, { "epoch": 1.32, "learning_rate": 1.955911049620246e-05, "loss": 0.0141, "step": 91810 }, { "epoch": 1.32, "learning_rate": 1.955906245646399e-05, "loss": 0.0101, "step": 91820 }, { "epoch": 1.32, "learning_rate": 1.9559014416725518e-05, "loss": 0.0117, "step": 91830 }, { "epoch": 1.32, "learning_rate": 1.9558966376987047e-05, "loss": 0.0121, "step": 91840 }, { "epoch": 1.32, "learning_rate": 1.9558918337248573e-05, "loss": 0.0115, "step": 91850 }, { "epoch": 1.32, "learning_rate": 1.9558870297510102e-05, "loss": 0.0131, "step": 91860 }, { "epoch": 1.32, "learning_rate": 1.955882225777163e-05, "loss": 0.0096, "step": 91870 }, { "epoch": 1.32, "learning_rate": 1.9558774218033157e-05, "loss": 0.0124, "step": 91880 }, { "epoch": 1.32, "learning_rate": 1.9558726178294686e-05, "loss": 0.012, "step": 91890 }, { "epoch": 1.32, "learning_rate": 1.9558678138556216e-05, "loss": 0.0118, "step": 91900 }, { "epoch": 1.32, "learning_rate": 1.9558630098817745e-05, "loss": 0.016, "step": 91910 }, { "epoch": 1.32, "learning_rate": 1.955858205907927e-05, "loss": 0.0128, "step": 91920 }, { "epoch": 1.32, "learning_rate": 1.95585340193408e-05, "loss": 0.0098, "step": 91930 }, { "epoch": 1.33, "learning_rate": 1.955848597960233e-05, "loss": 0.013, "step": 91940 }, { "epoch": 1.33, "learning_rate": 1.9558437939863855e-05, "loss": 0.0152, "step": 91950 }, { "epoch": 1.33, "learning_rate": 1.9558389900125385e-05, "loss": 0.011, "step": 91960 }, { "epoch": 1.33, "learning_rate": 1.9558341860386914e-05, "loss": 0.0112, "step": 91970 }, { "epoch": 1.33, "learning_rate": 1.9558293820648443e-05, "loss": 0.0149, "step": 91980 }, { "epoch": 1.33, "learning_rate": 1.955824578090997e-05, "loss": 0.0109, "step": 91990 }, { "epoch": 1.33, "learning_rate": 1.9558197741171498e-05, "loss": 0.0115, "step": 92000 }, { "epoch": 1.33, "learning_rate": 1.9558149701433028e-05, "loss": 0.0134, "step": 92010 }, { "epoch": 1.33, "learning_rate": 1.9558101661694557e-05, "loss": 0.011, "step": 92020 }, { "epoch": 1.33, "learning_rate": 1.9558053621956083e-05, "loss": 0.0124, "step": 92030 }, { "epoch": 1.33, "learning_rate": 1.9558005582217612e-05, "loss": 0.0146, "step": 92040 }, { "epoch": 1.33, "learning_rate": 1.955795754247914e-05, "loss": 0.0098, "step": 92050 }, { "epoch": 1.33, "learning_rate": 1.9557909502740667e-05, "loss": 0.0141, "step": 92060 }, { "epoch": 1.33, "learning_rate": 1.9557861463002196e-05, "loss": 0.0118, "step": 92070 }, { "epoch": 1.33, "learning_rate": 1.9557813423263726e-05, "loss": 0.01, "step": 92080 }, { "epoch": 1.33, "learning_rate": 1.9557765383525255e-05, "loss": 0.0186, "step": 92090 }, { "epoch": 1.33, "learning_rate": 1.955771734378678e-05, "loss": 0.0117, "step": 92100 }, { "epoch": 1.33, "learning_rate": 1.955766930404831e-05, "loss": 0.0098, "step": 92110 }, { "epoch": 1.33, "learning_rate": 1.955762126430984e-05, "loss": 0.0098, "step": 92120 }, { "epoch": 1.33, "learning_rate": 1.9557573224571365e-05, "loss": 0.0123, "step": 92130 }, { "epoch": 1.33, "learning_rate": 1.9557525184832895e-05, "loss": 0.0096, "step": 92140 }, { "epoch": 1.33, "learning_rate": 1.9557477145094424e-05, "loss": 0.0135, "step": 92150 }, { "epoch": 1.33, "learning_rate": 1.9557429105355953e-05, "loss": 0.0123, "step": 92160 }, { "epoch": 1.33, "learning_rate": 1.955738106561748e-05, "loss": 0.0096, "step": 92170 }, { "epoch": 1.33, "learning_rate": 1.9557333025879008e-05, "loss": 0.0104, "step": 92180 }, { "epoch": 1.33, "learning_rate": 1.9557284986140537e-05, "loss": 0.0119, "step": 92190 }, { "epoch": 1.33, "learning_rate": 1.9557236946402063e-05, "loss": 0.0137, "step": 92200 }, { "epoch": 1.33, "learning_rate": 1.9557188906663593e-05, "loss": 0.0117, "step": 92210 }, { "epoch": 1.33, "learning_rate": 1.9557140866925122e-05, "loss": 0.0141, "step": 92220 }, { "epoch": 1.33, "learning_rate": 1.955709282718665e-05, "loss": 0.0097, "step": 92230 }, { "epoch": 1.33, "learning_rate": 1.9557044787448177e-05, "loss": 0.0131, "step": 92240 }, { "epoch": 1.33, "learning_rate": 1.9556996747709706e-05, "loss": 0.0084, "step": 92250 }, { "epoch": 1.33, "learning_rate": 1.9556948707971236e-05, "loss": 0.0096, "step": 92260 }, { "epoch": 1.33, "learning_rate": 1.9556900668232765e-05, "loss": 0.01, "step": 92270 }, { "epoch": 1.33, "learning_rate": 1.955685262849429e-05, "loss": 0.0136, "step": 92280 }, { "epoch": 1.33, "learning_rate": 1.955680458875582e-05, "loss": 0.0116, "step": 92290 }, { "epoch": 1.33, "learning_rate": 1.955675654901735e-05, "loss": 0.0161, "step": 92300 }, { "epoch": 1.33, "learning_rate": 1.9556708509278875e-05, "loss": 0.0197, "step": 92310 }, { "epoch": 1.33, "learning_rate": 1.9556660469540404e-05, "loss": 0.0114, "step": 92320 }, { "epoch": 1.33, "learning_rate": 1.9556612429801934e-05, "loss": 0.013, "step": 92330 }, { "epoch": 1.33, "learning_rate": 1.9556564390063463e-05, "loss": 0.0108, "step": 92340 }, { "epoch": 1.33, "learning_rate": 1.955651635032499e-05, "loss": 0.011, "step": 92350 }, { "epoch": 1.33, "learning_rate": 1.9556468310586518e-05, "loss": 0.0106, "step": 92360 }, { "epoch": 1.33, "learning_rate": 1.9556420270848047e-05, "loss": 0.0095, "step": 92370 }, { "epoch": 1.33, "learning_rate": 1.9556372231109573e-05, "loss": 0.0149, "step": 92380 }, { "epoch": 1.33, "learning_rate": 1.9556324191371103e-05, "loss": 0.0107, "step": 92390 }, { "epoch": 1.33, "learning_rate": 1.9556276151632632e-05, "loss": 0.0132, "step": 92400 }, { "epoch": 1.33, "learning_rate": 1.955622811189416e-05, "loss": 0.0123, "step": 92410 }, { "epoch": 1.33, "learning_rate": 1.9556180072155687e-05, "loss": 0.0079, "step": 92420 }, { "epoch": 1.33, "learning_rate": 1.9556132032417216e-05, "loss": 0.0068, "step": 92430 }, { "epoch": 1.33, "learning_rate": 1.9556083992678746e-05, "loss": 0.0109, "step": 92440 }, { "epoch": 1.33, "learning_rate": 1.9556035952940275e-05, "loss": 0.0161, "step": 92450 }, { "epoch": 1.33, "learning_rate": 1.95559879132018e-05, "loss": 0.0124, "step": 92460 }, { "epoch": 1.33, "learning_rate": 1.955593987346333e-05, "loss": 0.0103, "step": 92470 }, { "epoch": 1.33, "learning_rate": 1.955589183372486e-05, "loss": 0.0098, "step": 92480 }, { "epoch": 1.33, "learning_rate": 1.9555843793986385e-05, "loss": 0.0127, "step": 92490 }, { "epoch": 1.33, "learning_rate": 1.9555795754247914e-05, "loss": 0.0135, "step": 92500 }, { "epoch": 1.33, "learning_rate": 1.9555747714509444e-05, "loss": 0.0137, "step": 92510 }, { "epoch": 1.33, "learning_rate": 1.9555699674770973e-05, "loss": 0.0103, "step": 92520 }, { "epoch": 1.33, "learning_rate": 1.95556516350325e-05, "loss": 0.0116, "step": 92530 }, { "epoch": 1.33, "learning_rate": 1.9555603595294028e-05, "loss": 0.0124, "step": 92540 }, { "epoch": 1.33, "learning_rate": 1.9555555555555557e-05, "loss": 0.011, "step": 92550 }, { "epoch": 1.33, "learning_rate": 1.9555507515817083e-05, "loss": 0.0139, "step": 92560 }, { "epoch": 1.33, "learning_rate": 1.9555459476078612e-05, "loss": 0.0098, "step": 92570 }, { "epoch": 1.33, "learning_rate": 1.9555411436340142e-05, "loss": 0.0141, "step": 92580 }, { "epoch": 1.33, "learning_rate": 1.955536339660167e-05, "loss": 0.0115, "step": 92590 }, { "epoch": 1.33, "learning_rate": 1.9555320160837046e-05, "loss": 0.0118, "step": 92600 }, { "epoch": 1.33, "learning_rate": 1.9555272121098575e-05, "loss": 0.01, "step": 92610 }, { "epoch": 1.33, "learning_rate": 1.95552240813601e-05, "loss": 0.013, "step": 92620 }, { "epoch": 1.33, "learning_rate": 1.955517604162163e-05, "loss": 0.0115, "step": 92630 }, { "epoch": 1.34, "learning_rate": 1.955512800188316e-05, "loss": 0.0119, "step": 92640 }, { "epoch": 1.34, "learning_rate": 1.955507996214469e-05, "loss": 0.0126, "step": 92650 }, { "epoch": 1.34, "learning_rate": 1.9555031922406214e-05, "loss": 0.009, "step": 92660 }, { "epoch": 1.34, "learning_rate": 1.9554983882667744e-05, "loss": 0.0126, "step": 92670 }, { "epoch": 1.34, "learning_rate": 1.9554935842929273e-05, "loss": 0.0119, "step": 92680 }, { "epoch": 1.34, "learning_rate": 1.9554887803190802e-05, "loss": 0.0142, "step": 92690 }, { "epoch": 1.34, "learning_rate": 1.9554839763452328e-05, "loss": 0.0119, "step": 92700 }, { "epoch": 1.34, "learning_rate": 1.9554791723713857e-05, "loss": 0.0149, "step": 92710 }, { "epoch": 1.34, "learning_rate": 1.9554743683975387e-05, "loss": 0.0115, "step": 92720 }, { "epoch": 1.34, "learning_rate": 1.9554695644236913e-05, "loss": 0.0112, "step": 92730 }, { "epoch": 1.34, "learning_rate": 1.9554647604498442e-05, "loss": 0.014, "step": 92740 }, { "epoch": 1.34, "learning_rate": 1.955459956475997e-05, "loss": 0.014, "step": 92750 }, { "epoch": 1.34, "learning_rate": 1.95545515250215e-05, "loss": 0.0115, "step": 92760 }, { "epoch": 1.34, "learning_rate": 1.9554503485283026e-05, "loss": 0.0129, "step": 92770 }, { "epoch": 1.34, "learning_rate": 1.9554455445544556e-05, "loss": 0.0135, "step": 92780 }, { "epoch": 1.34, "learning_rate": 1.9554407405806085e-05, "loss": 0.0116, "step": 92790 }, { "epoch": 1.34, "learning_rate": 1.955435936606761e-05, "loss": 0.0168, "step": 92800 }, { "epoch": 1.34, "learning_rate": 1.955431132632914e-05, "loss": 0.0131, "step": 92810 }, { "epoch": 1.34, "learning_rate": 1.955426328659067e-05, "loss": 0.0095, "step": 92820 }, { "epoch": 1.34, "learning_rate": 1.95542152468522e-05, "loss": 0.0127, "step": 92830 }, { "epoch": 1.34, "learning_rate": 1.9554167207113724e-05, "loss": 0.012, "step": 92840 }, { "epoch": 1.34, "learning_rate": 1.9554119167375254e-05, "loss": 0.0192, "step": 92850 }, { "epoch": 1.34, "learning_rate": 1.9554071127636783e-05, "loss": 0.0123, "step": 92860 }, { "epoch": 1.34, "learning_rate": 1.9554023087898312e-05, "loss": 0.0114, "step": 92870 }, { "epoch": 1.34, "learning_rate": 1.9553975048159838e-05, "loss": 0.0093, "step": 92880 }, { "epoch": 1.34, "learning_rate": 1.9553927008421367e-05, "loss": 0.0109, "step": 92890 }, { "epoch": 1.34, "learning_rate": 1.9553878968682897e-05, "loss": 0.0106, "step": 92900 }, { "epoch": 1.34, "learning_rate": 1.9553830928944423e-05, "loss": 0.0126, "step": 92910 }, { "epoch": 1.34, "learning_rate": 1.9553782889205952e-05, "loss": 0.0129, "step": 92920 }, { "epoch": 1.34, "learning_rate": 1.955373484946748e-05, "loss": 0.0108, "step": 92930 }, { "epoch": 1.34, "learning_rate": 1.955368680972901e-05, "loss": 0.0144, "step": 92940 }, { "epoch": 1.34, "learning_rate": 1.9553638769990536e-05, "loss": 0.0111, "step": 92950 }, { "epoch": 1.34, "learning_rate": 1.9553590730252065e-05, "loss": 0.0121, "step": 92960 }, { "epoch": 1.34, "learning_rate": 1.9553542690513595e-05, "loss": 0.0098, "step": 92970 }, { "epoch": 1.34, "learning_rate": 1.955349465077512e-05, "loss": 0.0119, "step": 92980 }, { "epoch": 1.34, "learning_rate": 1.955344661103665e-05, "loss": 0.0124, "step": 92990 }, { "epoch": 1.34, "learning_rate": 1.955339857129818e-05, "loss": 0.0173, "step": 93000 }, { "epoch": 1.34, "learning_rate": 1.955335053155971e-05, "loss": 0.0149, "step": 93010 }, { "epoch": 1.34, "learning_rate": 1.9553302491821234e-05, "loss": 0.0094, "step": 93020 }, { "epoch": 1.34, "learning_rate": 1.9553254452082764e-05, "loss": 0.0076, "step": 93030 }, { "epoch": 1.34, "learning_rate": 1.9553206412344293e-05, "loss": 0.0099, "step": 93040 }, { "epoch": 1.34, "learning_rate": 1.9553158372605822e-05, "loss": 0.0123, "step": 93050 }, { "epoch": 1.34, "learning_rate": 1.9553110332867348e-05, "loss": 0.0085, "step": 93060 }, { "epoch": 1.34, "learning_rate": 1.9553062293128877e-05, "loss": 0.0082, "step": 93070 }, { "epoch": 1.34, "learning_rate": 1.9553014253390407e-05, "loss": 0.0109, "step": 93080 }, { "epoch": 1.34, "learning_rate": 1.9552966213651932e-05, "loss": 0.0091, "step": 93090 }, { "epoch": 1.34, "learning_rate": 1.9552918173913462e-05, "loss": 0.0133, "step": 93100 }, { "epoch": 1.34, "learning_rate": 1.955287013417499e-05, "loss": 0.0093, "step": 93110 }, { "epoch": 1.34, "learning_rate": 1.955282209443652e-05, "loss": 0.0125, "step": 93120 }, { "epoch": 1.34, "learning_rate": 1.9552774054698046e-05, "loss": 0.0129, "step": 93130 }, { "epoch": 1.34, "learning_rate": 1.9552726014959575e-05, "loss": 0.0128, "step": 93140 }, { "epoch": 1.34, "learning_rate": 1.9552677975221105e-05, "loss": 0.0112, "step": 93150 }, { "epoch": 1.34, "learning_rate": 1.955262993548263e-05, "loss": 0.0123, "step": 93160 }, { "epoch": 1.34, "learning_rate": 1.955258189574416e-05, "loss": 0.0097, "step": 93170 }, { "epoch": 1.34, "learning_rate": 1.955253385600569e-05, "loss": 0.0096, "step": 93180 }, { "epoch": 1.34, "learning_rate": 1.955248581626722e-05, "loss": 0.0107, "step": 93190 }, { "epoch": 1.34, "learning_rate": 1.9552437776528744e-05, "loss": 0.0103, "step": 93200 }, { "epoch": 1.34, "learning_rate": 1.9552389736790274e-05, "loss": 0.0118, "step": 93210 }, { "epoch": 1.34, "learning_rate": 1.9552341697051803e-05, "loss": 0.0122, "step": 93220 }, { "epoch": 1.34, "learning_rate": 1.9552293657313332e-05, "loss": 0.0148, "step": 93230 }, { "epoch": 1.34, "learning_rate": 1.9552245617574858e-05, "loss": 0.0109, "step": 93240 }, { "epoch": 1.34, "learning_rate": 1.9552197577836387e-05, "loss": 0.0094, "step": 93250 }, { "epoch": 1.34, "learning_rate": 1.9552149538097916e-05, "loss": 0.0149, "step": 93260 }, { "epoch": 1.34, "learning_rate": 1.9552101498359442e-05, "loss": 0.0133, "step": 93270 }, { "epoch": 1.34, "learning_rate": 1.955205345862097e-05, "loss": 0.012, "step": 93280 }, { "epoch": 1.34, "learning_rate": 1.95520054188825e-05, "loss": 0.0133, "step": 93290 }, { "epoch": 1.34, "learning_rate": 1.955195737914403e-05, "loss": 0.0116, "step": 93300 }, { "epoch": 1.34, "learning_rate": 1.9551909339405556e-05, "loss": 0.0108, "step": 93310 }, { "epoch": 1.34, "learning_rate": 1.9551861299667085e-05, "loss": 0.0153, "step": 93320 }, { "epoch": 1.35, "learning_rate": 1.9551813259928615e-05, "loss": 0.014, "step": 93330 }, { "epoch": 1.35, "learning_rate": 1.955176522019014e-05, "loss": 0.0118, "step": 93340 }, { "epoch": 1.35, "learning_rate": 1.955171718045167e-05, "loss": 0.0111, "step": 93350 }, { "epoch": 1.35, "learning_rate": 1.95516691407132e-05, "loss": 0.0136, "step": 93360 }, { "epoch": 1.35, "learning_rate": 1.9551621100974728e-05, "loss": 0.0091, "step": 93370 }, { "epoch": 1.35, "learning_rate": 1.9551573061236254e-05, "loss": 0.0143, "step": 93380 }, { "epoch": 1.35, "learning_rate": 1.9551525021497783e-05, "loss": 0.0121, "step": 93390 }, { "epoch": 1.35, "learning_rate": 1.9551476981759313e-05, "loss": 0.0136, "step": 93400 }, { "epoch": 1.35, "learning_rate": 1.9551428942020842e-05, "loss": 0.0097, "step": 93410 }, { "epoch": 1.35, "learning_rate": 1.9551380902282368e-05, "loss": 0.0096, "step": 93420 }, { "epoch": 1.35, "learning_rate": 1.9551332862543897e-05, "loss": 0.0087, "step": 93430 }, { "epoch": 1.35, "learning_rate": 1.9551284822805426e-05, "loss": 0.014, "step": 93440 }, { "epoch": 1.35, "learning_rate": 1.9551236783066952e-05, "loss": 0.014, "step": 93450 }, { "epoch": 1.35, "learning_rate": 1.955118874332848e-05, "loss": 0.0124, "step": 93460 }, { "epoch": 1.35, "learning_rate": 1.955114070359001e-05, "loss": 0.012, "step": 93470 }, { "epoch": 1.35, "learning_rate": 1.955109266385154e-05, "loss": 0.0118, "step": 93480 }, { "epoch": 1.35, "learning_rate": 1.9551044624113066e-05, "loss": 0.0152, "step": 93490 }, { "epoch": 1.35, "learning_rate": 1.9550996584374595e-05, "loss": 0.0096, "step": 93500 }, { "epoch": 1.35, "learning_rate": 1.9550948544636124e-05, "loss": 0.0117, "step": 93510 }, { "epoch": 1.35, "learning_rate": 1.955090050489765e-05, "loss": 0.0106, "step": 93520 }, { "epoch": 1.35, "learning_rate": 1.955085246515918e-05, "loss": 0.01, "step": 93530 }, { "epoch": 1.35, "learning_rate": 1.955080442542071e-05, "loss": 0.0208, "step": 93540 }, { "epoch": 1.35, "learning_rate": 1.9550756385682238e-05, "loss": 0.0077, "step": 93550 }, { "epoch": 1.35, "learning_rate": 1.9550708345943764e-05, "loss": 0.0117, "step": 93560 }, { "epoch": 1.35, "learning_rate": 1.9550660306205293e-05, "loss": 0.0155, "step": 93570 }, { "epoch": 1.35, "learning_rate": 1.9550612266466823e-05, "loss": 0.0075, "step": 93580 }, { "epoch": 1.35, "learning_rate": 1.9550564226728352e-05, "loss": 0.0174, "step": 93590 }, { "epoch": 1.35, "learning_rate": 1.9550516186989878e-05, "loss": 0.0079, "step": 93600 }, { "epoch": 1.35, "learning_rate": 1.955046814725141e-05, "loss": 0.018, "step": 93610 }, { "epoch": 1.35, "learning_rate": 1.9550420107512936e-05, "loss": 0.0128, "step": 93620 }, { "epoch": 1.35, "learning_rate": 1.9550372067774466e-05, "loss": 0.012, "step": 93630 }, { "epoch": 1.35, "learning_rate": 1.9550324028035995e-05, "loss": 0.012, "step": 93640 }, { "epoch": 1.35, "learning_rate": 1.955027598829752e-05, "loss": 0.0117, "step": 93650 }, { "epoch": 1.35, "learning_rate": 1.955022794855905e-05, "loss": 0.0098, "step": 93660 }, { "epoch": 1.35, "learning_rate": 1.955017990882058e-05, "loss": 0.0118, "step": 93670 }, { "epoch": 1.35, "learning_rate": 1.955013186908211e-05, "loss": 0.0101, "step": 93680 }, { "epoch": 1.35, "learning_rate": 1.9550083829343634e-05, "loss": 0.0128, "step": 93690 }, { "epoch": 1.35, "learning_rate": 1.9550035789605164e-05, "loss": 0.0079, "step": 93700 }, { "epoch": 1.35, "learning_rate": 1.9549987749866693e-05, "loss": 0.0145, "step": 93710 }, { "epoch": 1.35, "learning_rate": 1.9549939710128222e-05, "loss": 0.0085, "step": 93720 }, { "epoch": 1.35, "learning_rate": 1.9549891670389748e-05, "loss": 0.0126, "step": 93730 }, { "epoch": 1.35, "learning_rate": 1.9549843630651277e-05, "loss": 0.0139, "step": 93740 }, { "epoch": 1.35, "learning_rate": 1.9549795590912807e-05, "loss": 0.0112, "step": 93750 }, { "epoch": 1.35, "learning_rate": 1.9549747551174333e-05, "loss": 0.0107, "step": 93760 }, { "epoch": 1.35, "learning_rate": 1.9549699511435862e-05, "loss": 0.0084, "step": 93770 }, { "epoch": 1.35, "learning_rate": 1.954965147169739e-05, "loss": 0.0111, "step": 93780 }, { "epoch": 1.35, "learning_rate": 1.954960343195892e-05, "loss": 0.015, "step": 93790 }, { "epoch": 1.35, "learning_rate": 1.9549555392220446e-05, "loss": 0.0091, "step": 93800 }, { "epoch": 1.35, "learning_rate": 1.9549507352481975e-05, "loss": 0.0122, "step": 93810 }, { "epoch": 1.35, "learning_rate": 1.9549459312743505e-05, "loss": 0.0119, "step": 93820 }, { "epoch": 1.35, "learning_rate": 1.954941127300503e-05, "loss": 0.012, "step": 93830 }, { "epoch": 1.35, "learning_rate": 1.954936323326656e-05, "loss": 0.0134, "step": 93840 }, { "epoch": 1.35, "learning_rate": 1.954931519352809e-05, "loss": 0.0102, "step": 93850 }, { "epoch": 1.35, "learning_rate": 1.954926715378962e-05, "loss": 0.0137, "step": 93860 }, { "epoch": 1.35, "learning_rate": 1.9549219114051144e-05, "loss": 0.0093, "step": 93870 }, { "epoch": 1.35, "learning_rate": 1.9549171074312674e-05, "loss": 0.0104, "step": 93880 }, { "epoch": 1.35, "learning_rate": 1.9549123034574203e-05, "loss": 0.009, "step": 93890 }, { "epoch": 1.35, "learning_rate": 1.9549074994835732e-05, "loss": 0.01, "step": 93900 }, { "epoch": 1.35, "learning_rate": 1.9549026955097258e-05, "loss": 0.0129, "step": 93910 }, { "epoch": 1.35, "learning_rate": 1.9548978915358787e-05, "loss": 0.0091, "step": 93920 }, { "epoch": 1.35, "learning_rate": 1.9548930875620317e-05, "loss": 0.0113, "step": 93930 }, { "epoch": 1.35, "learning_rate": 1.9548882835881842e-05, "loss": 0.0106, "step": 93940 }, { "epoch": 1.35, "learning_rate": 1.9548834796143372e-05, "loss": 0.0132, "step": 93950 }, { "epoch": 1.35, "learning_rate": 1.95487867564049e-05, "loss": 0.0103, "step": 93960 }, { "epoch": 1.35, "learning_rate": 1.954873871666643e-05, "loss": 0.0123, "step": 93970 }, { "epoch": 1.35, "learning_rate": 1.9548690676927956e-05, "loss": 0.009, "step": 93980 }, { "epoch": 1.35, "learning_rate": 1.9548642637189485e-05, "loss": 0.0143, "step": 93990 }, { "epoch": 1.35, "learning_rate": 1.9548594597451015e-05, "loss": 0.011, "step": 94000 }, { "epoch": 1.35, "learning_rate": 1.954854655771254e-05, "loss": 0.0096, "step": 94010 }, { "epoch": 1.36, "learning_rate": 1.954849851797407e-05, "loss": 0.0084, "step": 94020 }, { "epoch": 1.36, "learning_rate": 1.95484504782356e-05, "loss": 0.0134, "step": 94030 }, { "epoch": 1.36, "learning_rate": 1.954840243849713e-05, "loss": 0.0123, "step": 94040 }, { "epoch": 1.36, "learning_rate": 1.9548354398758654e-05, "loss": 0.0106, "step": 94050 }, { "epoch": 1.36, "learning_rate": 1.9548306359020184e-05, "loss": 0.0089, "step": 94060 }, { "epoch": 1.36, "learning_rate": 1.9548258319281713e-05, "loss": 0.0114, "step": 94070 }, { "epoch": 1.36, "learning_rate": 1.9548210279543242e-05, "loss": 0.0117, "step": 94080 }, { "epoch": 1.36, "learning_rate": 1.9548162239804768e-05, "loss": 0.0122, "step": 94090 }, { "epoch": 1.36, "learning_rate": 1.9548114200066297e-05, "loss": 0.0095, "step": 94100 }, { "epoch": 1.36, "learning_rate": 1.9548066160327826e-05, "loss": 0.0114, "step": 94110 }, { "epoch": 1.36, "learning_rate": 1.9548018120589352e-05, "loss": 0.01, "step": 94120 }, { "epoch": 1.36, "learning_rate": 1.954797008085088e-05, "loss": 0.0121, "step": 94130 }, { "epoch": 1.36, "learning_rate": 1.954792204111241e-05, "loss": 0.0097, "step": 94140 }, { "epoch": 1.36, "learning_rate": 1.954787400137394e-05, "loss": 0.0154, "step": 94150 }, { "epoch": 1.36, "learning_rate": 1.9547825961635466e-05, "loss": 0.0123, "step": 94160 }, { "epoch": 1.36, "learning_rate": 1.9547777921896995e-05, "loss": 0.0124, "step": 94170 }, { "epoch": 1.36, "learning_rate": 1.9547729882158525e-05, "loss": 0.0088, "step": 94180 }, { "epoch": 1.36, "learning_rate": 1.954768184242005e-05, "loss": 0.0106, "step": 94190 }, { "epoch": 1.36, "learning_rate": 1.954763380268158e-05, "loss": 0.0109, "step": 94200 }, { "epoch": 1.36, "learning_rate": 1.954758576294311e-05, "loss": 0.0107, "step": 94210 }, { "epoch": 1.36, "learning_rate": 1.9547537723204638e-05, "loss": 0.0135, "step": 94220 }, { "epoch": 1.36, "learning_rate": 1.9547489683466164e-05, "loss": 0.016, "step": 94230 }, { "epoch": 1.36, "learning_rate": 1.9547441643727693e-05, "loss": 0.016, "step": 94240 }, { "epoch": 1.36, "learning_rate": 1.9547393603989223e-05, "loss": 0.0143, "step": 94250 }, { "epoch": 1.36, "learning_rate": 1.9547345564250752e-05, "loss": 0.0086, "step": 94260 }, { "epoch": 1.36, "learning_rate": 1.9547297524512278e-05, "loss": 0.0113, "step": 94270 }, { "epoch": 1.36, "learning_rate": 1.9547249484773807e-05, "loss": 0.0111, "step": 94280 }, { "epoch": 1.36, "learning_rate": 1.9547201445035336e-05, "loss": 0.0127, "step": 94290 }, { "epoch": 1.36, "learning_rate": 1.9547153405296862e-05, "loss": 0.0104, "step": 94300 }, { "epoch": 1.36, "learning_rate": 1.954710536555839e-05, "loss": 0.0111, "step": 94310 }, { "epoch": 1.36, "learning_rate": 1.954705732581992e-05, "loss": 0.0117, "step": 94320 }, { "epoch": 1.36, "learning_rate": 1.954700928608145e-05, "loss": 0.0139, "step": 94330 }, { "epoch": 1.36, "learning_rate": 1.9546961246342976e-05, "loss": 0.0123, "step": 94340 }, { "epoch": 1.36, "learning_rate": 1.9546913206604505e-05, "loss": 0.0127, "step": 94350 }, { "epoch": 1.36, "learning_rate": 1.9546865166866034e-05, "loss": 0.0102, "step": 94360 }, { "epoch": 1.36, "learning_rate": 1.954681712712756e-05, "loss": 0.0113, "step": 94370 }, { "epoch": 1.36, "learning_rate": 1.954676908738909e-05, "loss": 0.0103, "step": 94380 }, { "epoch": 1.36, "learning_rate": 1.954672104765062e-05, "loss": 0.0101, "step": 94390 }, { "epoch": 1.36, "learning_rate": 1.9546673007912148e-05, "loss": 0.0116, "step": 94400 }, { "epoch": 1.36, "learning_rate": 1.9546624968173674e-05, "loss": 0.0116, "step": 94410 }, { "epoch": 1.36, "learning_rate": 1.9546576928435203e-05, "loss": 0.0099, "step": 94420 }, { "epoch": 1.36, "learning_rate": 1.9546528888696733e-05, "loss": 0.0247, "step": 94430 }, { "epoch": 1.36, "learning_rate": 1.9546480848958262e-05, "loss": 0.0097, "step": 94440 }, { "epoch": 1.36, "learning_rate": 1.9546437613193637e-05, "loss": 0.011, "step": 94450 }, { "epoch": 1.36, "learning_rate": 1.9546389573455166e-05, "loss": 0.0131, "step": 94460 }, { "epoch": 1.36, "learning_rate": 1.954634153371669e-05, "loss": 0.012, "step": 94470 }, { "epoch": 1.36, "learning_rate": 1.954629349397822e-05, "loss": 0.0164, "step": 94480 }, { "epoch": 1.36, "learning_rate": 1.954624545423975e-05, "loss": 0.0186, "step": 94490 }, { "epoch": 1.36, "learning_rate": 1.954619741450128e-05, "loss": 0.009, "step": 94500 }, { "epoch": 1.36, "learning_rate": 1.9546149374762805e-05, "loss": 0.0147, "step": 94510 }, { "epoch": 1.36, "learning_rate": 1.9546101335024335e-05, "loss": 0.0163, "step": 94520 }, { "epoch": 1.36, "learning_rate": 1.9546053295285864e-05, "loss": 0.0104, "step": 94530 }, { "epoch": 1.36, "learning_rate": 1.954600525554739e-05, "loss": 0.0102, "step": 94540 }, { "epoch": 1.36, "learning_rate": 1.954595721580892e-05, "loss": 0.0141, "step": 94550 }, { "epoch": 1.36, "learning_rate": 1.954590917607045e-05, "loss": 0.0091, "step": 94560 }, { "epoch": 1.36, "learning_rate": 1.9545861136331978e-05, "loss": 0.0104, "step": 94570 }, { "epoch": 1.36, "learning_rate": 1.9545813096593503e-05, "loss": 0.0123, "step": 94580 }, { "epoch": 1.36, "learning_rate": 1.9545765056855033e-05, "loss": 0.0146, "step": 94590 }, { "epoch": 1.36, "learning_rate": 1.9545717017116562e-05, "loss": 0.01, "step": 94600 }, { "epoch": 1.36, "learning_rate": 1.9545668977378088e-05, "loss": 0.0106, "step": 94610 }, { "epoch": 1.36, "learning_rate": 1.9545620937639617e-05, "loss": 0.0112, "step": 94620 }, { "epoch": 1.36, "learning_rate": 1.9545572897901146e-05, "loss": 0.0147, "step": 94630 }, { "epoch": 1.36, "learning_rate": 1.9545524858162676e-05, "loss": 0.0078, "step": 94640 }, { "epoch": 1.36, "learning_rate": 1.95454768184242e-05, "loss": 0.0173, "step": 94650 }, { "epoch": 1.36, "learning_rate": 1.954542877868573e-05, "loss": 0.0128, "step": 94660 }, { "epoch": 1.36, "learning_rate": 1.954538073894726e-05, "loss": 0.0105, "step": 94670 }, { "epoch": 1.36, "learning_rate": 1.954533269920879e-05, "loss": 0.0114, "step": 94680 }, { "epoch": 1.36, "learning_rate": 1.9545284659470315e-05, "loss": 0.01, "step": 94690 }, { "epoch": 1.36, "learning_rate": 1.9545236619731845e-05, "loss": 0.0101, "step": 94700 }, { "epoch": 1.36, "learning_rate": 1.9545188579993374e-05, "loss": 0.0123, "step": 94710 }, { "epoch": 1.37, "learning_rate": 1.95451405402549e-05, "loss": 0.0102, "step": 94720 }, { "epoch": 1.37, "learning_rate": 1.954509250051643e-05, "loss": 0.0116, "step": 94730 }, { "epoch": 1.37, "learning_rate": 1.9545044460777958e-05, "loss": 0.0104, "step": 94740 }, { "epoch": 1.37, "learning_rate": 1.9544996421039488e-05, "loss": 0.0097, "step": 94750 }, { "epoch": 1.37, "learning_rate": 1.9544948381301013e-05, "loss": 0.0121, "step": 94760 }, { "epoch": 1.37, "learning_rate": 1.9544900341562543e-05, "loss": 0.0126, "step": 94770 }, { "epoch": 1.37, "learning_rate": 1.9544852301824072e-05, "loss": 0.0102, "step": 94780 }, { "epoch": 1.37, "learning_rate": 1.9544804262085598e-05, "loss": 0.0094, "step": 94790 }, { "epoch": 1.37, "learning_rate": 1.9544756222347127e-05, "loss": 0.0103, "step": 94800 }, { "epoch": 1.37, "learning_rate": 1.9544708182608656e-05, "loss": 0.0086, "step": 94810 }, { "epoch": 1.37, "learning_rate": 1.9544660142870186e-05, "loss": 0.0105, "step": 94820 }, { "epoch": 1.37, "learning_rate": 1.954461210313171e-05, "loss": 0.0101, "step": 94830 }, { "epoch": 1.37, "learning_rate": 1.954456406339324e-05, "loss": 0.0098, "step": 94840 }, { "epoch": 1.37, "learning_rate": 1.954451602365477e-05, "loss": 0.0129, "step": 94850 }, { "epoch": 1.37, "learning_rate": 1.95444679839163e-05, "loss": 0.0137, "step": 94860 }, { "epoch": 1.37, "learning_rate": 1.9544419944177825e-05, "loss": 0.0087, "step": 94870 }, { "epoch": 1.37, "learning_rate": 1.9544371904439354e-05, "loss": 0.012, "step": 94880 }, { "epoch": 1.37, "learning_rate": 1.9544323864700884e-05, "loss": 0.0113, "step": 94890 }, { "epoch": 1.37, "learning_rate": 1.954427582496241e-05, "loss": 0.0133, "step": 94900 }, { "epoch": 1.37, "learning_rate": 1.954422778522394e-05, "loss": 0.0111, "step": 94910 }, { "epoch": 1.37, "learning_rate": 1.9544179745485468e-05, "loss": 0.01, "step": 94920 }, { "epoch": 1.37, "learning_rate": 1.9544131705746997e-05, "loss": 0.01, "step": 94930 }, { "epoch": 1.37, "learning_rate": 1.9544083666008523e-05, "loss": 0.0092, "step": 94940 }, { "epoch": 1.37, "learning_rate": 1.9544035626270053e-05, "loss": 0.011, "step": 94950 }, { "epoch": 1.37, "learning_rate": 1.9543987586531582e-05, "loss": 0.0146, "step": 94960 }, { "epoch": 1.37, "learning_rate": 1.9543939546793108e-05, "loss": 0.0144, "step": 94970 }, { "epoch": 1.37, "learning_rate": 1.9543891507054637e-05, "loss": 0.0095, "step": 94980 }, { "epoch": 1.37, "learning_rate": 1.9543843467316166e-05, "loss": 0.0163, "step": 94990 }, { "epoch": 1.37, "learning_rate": 1.9543795427577696e-05, "loss": 0.0152, "step": 95000 }, { "epoch": 1.37, "learning_rate": 1.954374738783922e-05, "loss": 0.0074, "step": 95010 }, { "epoch": 1.37, "learning_rate": 1.954369934810075e-05, "loss": 0.0119, "step": 95020 }, { "epoch": 1.37, "learning_rate": 1.954365130836228e-05, "loss": 0.0103, "step": 95030 }, { "epoch": 1.37, "learning_rate": 1.9543603268623806e-05, "loss": 0.0107, "step": 95040 }, { "epoch": 1.37, "learning_rate": 1.9543555228885335e-05, "loss": 0.0139, "step": 95050 }, { "epoch": 1.37, "learning_rate": 1.9543507189146864e-05, "loss": 0.0119, "step": 95060 }, { "epoch": 1.37, "learning_rate": 1.9543459149408394e-05, "loss": 0.0118, "step": 95070 }, { "epoch": 1.37, "learning_rate": 1.954341110966992e-05, "loss": 0.0204, "step": 95080 }, { "epoch": 1.37, "learning_rate": 1.954336306993145e-05, "loss": 0.008, "step": 95090 }, { "epoch": 1.37, "learning_rate": 1.9543315030192978e-05, "loss": 0.0123, "step": 95100 }, { "epoch": 1.37, "learning_rate": 1.9543266990454507e-05, "loss": 0.0144, "step": 95110 }, { "epoch": 1.37, "learning_rate": 1.9543218950716033e-05, "loss": 0.0164, "step": 95120 }, { "epoch": 1.37, "learning_rate": 1.9543170910977562e-05, "loss": 0.0148, "step": 95130 }, { "epoch": 1.37, "learning_rate": 1.9543122871239092e-05, "loss": 0.0103, "step": 95140 }, { "epoch": 1.37, "learning_rate": 1.9543074831500618e-05, "loss": 0.0101, "step": 95150 }, { "epoch": 1.37, "learning_rate": 1.9543026791762147e-05, "loss": 0.0107, "step": 95160 }, { "epoch": 1.37, "learning_rate": 1.9542978752023676e-05, "loss": 0.0107, "step": 95170 }, { "epoch": 1.37, "learning_rate": 1.9542930712285205e-05, "loss": 0.0075, "step": 95180 }, { "epoch": 1.37, "learning_rate": 1.954288267254673e-05, "loss": 0.0173, "step": 95190 }, { "epoch": 1.37, "learning_rate": 1.954283463280826e-05, "loss": 0.0172, "step": 95200 }, { "epoch": 1.37, "learning_rate": 1.954278659306979e-05, "loss": 0.0127, "step": 95210 }, { "epoch": 1.37, "learning_rate": 1.9542738553331316e-05, "loss": 0.0081, "step": 95220 }, { "epoch": 1.37, "learning_rate": 1.9542690513592845e-05, "loss": 0.0147, "step": 95230 }, { "epoch": 1.37, "learning_rate": 1.9542642473854374e-05, "loss": 0.0116, "step": 95240 }, { "epoch": 1.37, "learning_rate": 1.9542594434115904e-05, "loss": 0.0144, "step": 95250 }, { "epoch": 1.37, "learning_rate": 1.954254639437743e-05, "loss": 0.0112, "step": 95260 }, { "epoch": 1.37, "learning_rate": 1.954249835463896e-05, "loss": 0.0108, "step": 95270 }, { "epoch": 1.37, "learning_rate": 1.9542450314900488e-05, "loss": 0.0102, "step": 95280 }, { "epoch": 1.37, "learning_rate": 1.9542402275162017e-05, "loss": 0.0096, "step": 95290 }, { "epoch": 1.37, "learning_rate": 1.9542354235423543e-05, "loss": 0.0118, "step": 95300 }, { "epoch": 1.37, "learning_rate": 1.9542306195685072e-05, "loss": 0.0078, "step": 95310 }, { "epoch": 1.37, "learning_rate": 1.95422581559466e-05, "loss": 0.015, "step": 95320 }, { "epoch": 1.37, "learning_rate": 1.9542210116208128e-05, "loss": 0.0129, "step": 95330 }, { "epoch": 1.37, "learning_rate": 1.9542162076469657e-05, "loss": 0.0113, "step": 95340 }, { "epoch": 1.37, "learning_rate": 1.9542114036731186e-05, "loss": 0.0092, "step": 95350 }, { "epoch": 1.37, "learning_rate": 1.9542065996992715e-05, "loss": 0.0094, "step": 95360 }, { "epoch": 1.37, "learning_rate": 1.954201795725424e-05, "loss": 0.0141, "step": 95370 }, { "epoch": 1.37, "learning_rate": 1.954196991751577e-05, "loss": 0.0104, "step": 95380 }, { "epoch": 1.37, "learning_rate": 1.95419218777773e-05, "loss": 0.0176, "step": 95390 }, { "epoch": 1.37, "learning_rate": 1.9541873838038826e-05, "loss": 0.0114, "step": 95400 }, { "epoch": 1.38, "learning_rate": 1.9541825798300355e-05, "loss": 0.0094, "step": 95410 }, { "epoch": 1.38, "learning_rate": 1.9541777758561884e-05, "loss": 0.0122, "step": 95420 }, { "epoch": 1.38, "learning_rate": 1.9541729718823413e-05, "loss": 0.0103, "step": 95430 }, { "epoch": 1.38, "learning_rate": 1.954168167908494e-05, "loss": 0.0116, "step": 95440 }, { "epoch": 1.38, "learning_rate": 1.954163363934647e-05, "loss": 0.0163, "step": 95450 }, { "epoch": 1.38, "learning_rate": 1.9541585599607998e-05, "loss": 0.0102, "step": 95460 }, { "epoch": 1.38, "learning_rate": 1.9541537559869527e-05, "loss": 0.0104, "step": 95470 }, { "epoch": 1.38, "learning_rate": 1.9541489520131053e-05, "loss": 0.0151, "step": 95480 }, { "epoch": 1.38, "learning_rate": 1.9541441480392582e-05, "loss": 0.0106, "step": 95490 }, { "epoch": 1.38, "learning_rate": 1.954139344065411e-05, "loss": 0.0128, "step": 95500 }, { "epoch": 1.38, "learning_rate": 1.9541345400915637e-05, "loss": 0.0138, "step": 95510 }, { "epoch": 1.38, "learning_rate": 1.9541297361177167e-05, "loss": 0.0122, "step": 95520 }, { "epoch": 1.38, "learning_rate": 1.9541249321438696e-05, "loss": 0.0112, "step": 95530 }, { "epoch": 1.38, "learning_rate": 1.9541201281700225e-05, "loss": 0.0104, "step": 95540 }, { "epoch": 1.38, "learning_rate": 1.954115324196175e-05, "loss": 0.0087, "step": 95550 }, { "epoch": 1.38, "learning_rate": 1.954110520222328e-05, "loss": 0.0114, "step": 95560 }, { "epoch": 1.38, "learning_rate": 1.954105716248481e-05, "loss": 0.01, "step": 95570 }, { "epoch": 1.38, "learning_rate": 1.9541009122746336e-05, "loss": 0.0128, "step": 95580 }, { "epoch": 1.38, "learning_rate": 1.9540961083007865e-05, "loss": 0.0101, "step": 95590 }, { "epoch": 1.38, "learning_rate": 1.9540913043269394e-05, "loss": 0.0164, "step": 95600 }, { "epoch": 1.38, "learning_rate": 1.9540865003530923e-05, "loss": 0.0092, "step": 95610 }, { "epoch": 1.38, "learning_rate": 1.954081696379245e-05, "loss": 0.0136, "step": 95620 }, { "epoch": 1.38, "learning_rate": 1.954076892405398e-05, "loss": 0.0119, "step": 95630 }, { "epoch": 1.38, "learning_rate": 1.9540720884315508e-05, "loss": 0.0117, "step": 95640 }, { "epoch": 1.38, "learning_rate": 1.9540672844577037e-05, "loss": 0.0097, "step": 95650 }, { "epoch": 1.38, "learning_rate": 1.9540624804838563e-05, "loss": 0.0099, "step": 95660 }, { "epoch": 1.38, "learning_rate": 1.9540576765100092e-05, "loss": 0.0125, "step": 95670 }, { "epoch": 1.38, "learning_rate": 1.954052872536162e-05, "loss": 0.0112, "step": 95680 }, { "epoch": 1.38, "learning_rate": 1.9540480685623147e-05, "loss": 0.0121, "step": 95690 }, { "epoch": 1.38, "learning_rate": 1.9540432645884677e-05, "loss": 0.0094, "step": 95700 }, { "epoch": 1.38, "learning_rate": 1.9540384606146206e-05, "loss": 0.0126, "step": 95710 }, { "epoch": 1.38, "learning_rate": 1.9540336566407735e-05, "loss": 0.0117, "step": 95720 }, { "epoch": 1.38, "learning_rate": 1.954028852666926e-05, "loss": 0.0125, "step": 95730 }, { "epoch": 1.38, "learning_rate": 1.954024048693079e-05, "loss": 0.0112, "step": 95740 }, { "epoch": 1.38, "learning_rate": 1.954019244719232e-05, "loss": 0.0127, "step": 95750 }, { "epoch": 1.38, "learning_rate": 1.9540144407453845e-05, "loss": 0.0097, "step": 95760 }, { "epoch": 1.38, "learning_rate": 1.9540096367715375e-05, "loss": 0.0103, "step": 95770 }, { "epoch": 1.38, "learning_rate": 1.9540048327976904e-05, "loss": 0.0075, "step": 95780 }, { "epoch": 1.38, "learning_rate": 1.9540000288238433e-05, "loss": 0.0138, "step": 95790 }, { "epoch": 1.38, "learning_rate": 1.953995224849996e-05, "loss": 0.0078, "step": 95800 }, { "epoch": 1.38, "learning_rate": 1.953990420876149e-05, "loss": 0.0106, "step": 95810 }, { "epoch": 1.38, "learning_rate": 1.9539856169023018e-05, "loss": 0.0097, "step": 95820 }, { "epoch": 1.38, "learning_rate": 1.9539808129284547e-05, "loss": 0.0086, "step": 95830 }, { "epoch": 1.38, "learning_rate": 1.9539760089546073e-05, "loss": 0.0114, "step": 95840 }, { "epoch": 1.38, "learning_rate": 1.9539712049807602e-05, "loss": 0.0152, "step": 95850 }, { "epoch": 1.38, "learning_rate": 1.953966401006913e-05, "loss": 0.0167, "step": 95860 }, { "epoch": 1.38, "learning_rate": 1.9539615970330657e-05, "loss": 0.0114, "step": 95870 }, { "epoch": 1.38, "learning_rate": 1.9539567930592187e-05, "loss": 0.0116, "step": 95880 }, { "epoch": 1.38, "learning_rate": 1.9539519890853716e-05, "loss": 0.0113, "step": 95890 }, { "epoch": 1.38, "learning_rate": 1.9539471851115245e-05, "loss": 0.0144, "step": 95900 }, { "epoch": 1.38, "learning_rate": 1.953942381137677e-05, "loss": 0.0088, "step": 95910 }, { "epoch": 1.38, "learning_rate": 1.95393757716383e-05, "loss": 0.01, "step": 95920 }, { "epoch": 1.38, "learning_rate": 1.953932773189983e-05, "loss": 0.0154, "step": 95930 }, { "epoch": 1.38, "learning_rate": 1.9539279692161355e-05, "loss": 0.0103, "step": 95940 }, { "epoch": 1.38, "learning_rate": 1.9539231652422885e-05, "loss": 0.011, "step": 95950 }, { "epoch": 1.38, "learning_rate": 1.9539183612684414e-05, "loss": 0.0084, "step": 95960 }, { "epoch": 1.38, "learning_rate": 1.9539135572945943e-05, "loss": 0.012, "step": 95970 }, { "epoch": 1.38, "learning_rate": 1.953908753320747e-05, "loss": 0.0117, "step": 95980 }, { "epoch": 1.38, "learning_rate": 1.9539039493469e-05, "loss": 0.0132, "step": 95990 }, { "epoch": 1.38, "learning_rate": 1.9538991453730528e-05, "loss": 0.0099, "step": 96000 }, { "epoch": 1.38, "learning_rate": 1.9538943413992057e-05, "loss": 0.0077, "step": 96010 }, { "epoch": 1.38, "learning_rate": 1.9538895374253583e-05, "loss": 0.0185, "step": 96020 }, { "epoch": 1.38, "learning_rate": 1.9538847334515112e-05, "loss": 0.0123, "step": 96030 }, { "epoch": 1.38, "learning_rate": 1.953879929477664e-05, "loss": 0.0138, "step": 96040 }, { "epoch": 1.38, "learning_rate": 1.9538751255038167e-05, "loss": 0.0095, "step": 96050 }, { "epoch": 1.38, "learning_rate": 1.9538703215299696e-05, "loss": 0.0124, "step": 96060 }, { "epoch": 1.38, "learning_rate": 1.9538655175561226e-05, "loss": 0.013, "step": 96070 }, { "epoch": 1.38, "learning_rate": 1.9538607135822755e-05, "loss": 0.0074, "step": 96080 }, { "epoch": 1.38, "learning_rate": 1.953855909608428e-05, "loss": 0.0075, "step": 96090 }, { "epoch": 1.38, "learning_rate": 1.953851105634581e-05, "loss": 0.0117, "step": 96100 }, { "epoch": 1.39, "learning_rate": 1.953846301660734e-05, "loss": 0.0099, "step": 96110 }, { "epoch": 1.39, "learning_rate": 1.9538414976868865e-05, "loss": 0.0114, "step": 96120 }, { "epoch": 1.39, "learning_rate": 1.9538366937130395e-05, "loss": 0.0099, "step": 96130 }, { "epoch": 1.39, "learning_rate": 1.9538318897391924e-05, "loss": 0.0103, "step": 96140 }, { "epoch": 1.39, "learning_rate": 1.9538270857653453e-05, "loss": 0.0079, "step": 96150 }, { "epoch": 1.39, "learning_rate": 1.953822281791498e-05, "loss": 0.0119, "step": 96160 }, { "epoch": 1.39, "learning_rate": 1.9538174778176508e-05, "loss": 0.0133, "step": 96170 }, { "epoch": 1.39, "learning_rate": 1.9538126738438038e-05, "loss": 0.0102, "step": 96180 }, { "epoch": 1.39, "learning_rate": 1.9538078698699567e-05, "loss": 0.0098, "step": 96190 }, { "epoch": 1.39, "learning_rate": 1.9538030658961093e-05, "loss": 0.0127, "step": 96200 }, { "epoch": 1.39, "learning_rate": 1.9537982619222622e-05, "loss": 0.013, "step": 96210 }, { "epoch": 1.39, "learning_rate": 1.953793457948415e-05, "loss": 0.0142, "step": 96220 }, { "epoch": 1.39, "learning_rate": 1.9537886539745677e-05, "loss": 0.0072, "step": 96230 }, { "epoch": 1.39, "learning_rate": 1.9537838500007206e-05, "loss": 0.0105, "step": 96240 }, { "epoch": 1.39, "learning_rate": 1.9537790460268736e-05, "loss": 0.0126, "step": 96250 }, { "epoch": 1.39, "learning_rate": 1.9537742420530265e-05, "loss": 0.0083, "step": 96260 }, { "epoch": 1.39, "learning_rate": 1.953769438079179e-05, "loss": 0.0111, "step": 96270 }, { "epoch": 1.39, "learning_rate": 1.953764634105332e-05, "loss": 0.0126, "step": 96280 }, { "epoch": 1.39, "learning_rate": 1.953759830131485e-05, "loss": 0.0111, "step": 96290 }, { "epoch": 1.39, "learning_rate": 1.9537550261576375e-05, "loss": 0.0108, "step": 96300 }, { "epoch": 1.39, "learning_rate": 1.9537502221837905e-05, "loss": 0.0124, "step": 96310 }, { "epoch": 1.39, "learning_rate": 1.9537454182099434e-05, "loss": 0.0122, "step": 96320 }, { "epoch": 1.39, "learning_rate": 1.9537406142360963e-05, "loss": 0.0122, "step": 96330 }, { "epoch": 1.39, "learning_rate": 1.953735810262249e-05, "loss": 0.0095, "step": 96340 }, { "epoch": 1.39, "learning_rate": 1.9537310062884018e-05, "loss": 0.011, "step": 96350 }, { "epoch": 1.39, "learning_rate": 1.9537262023145547e-05, "loss": 0.0134, "step": 96360 }, { "epoch": 1.39, "learning_rate": 1.9537213983407077e-05, "loss": 0.011, "step": 96370 }, { "epoch": 1.39, "learning_rate": 1.9537165943668603e-05, "loss": 0.0118, "step": 96380 }, { "epoch": 1.39, "learning_rate": 1.9537117903930132e-05, "loss": 0.0125, "step": 96390 }, { "epoch": 1.39, "learning_rate": 1.953706986419166e-05, "loss": 0.0114, "step": 96400 }, { "epoch": 1.39, "learning_rate": 1.9537021824453187e-05, "loss": 0.0114, "step": 96410 }, { "epoch": 1.39, "learning_rate": 1.9536973784714716e-05, "loss": 0.0122, "step": 96420 }, { "epoch": 1.39, "learning_rate": 1.9536925744976246e-05, "loss": 0.011, "step": 96430 }, { "epoch": 1.39, "learning_rate": 1.9536877705237775e-05, "loss": 0.0141, "step": 96440 }, { "epoch": 1.39, "learning_rate": 1.95368296654993e-05, "loss": 0.0097, "step": 96450 }, { "epoch": 1.39, "learning_rate": 1.953678162576083e-05, "loss": 0.0139, "step": 96460 }, { "epoch": 1.39, "learning_rate": 1.953673358602236e-05, "loss": 0.0118, "step": 96470 }, { "epoch": 1.39, "learning_rate": 1.9536685546283885e-05, "loss": 0.0137, "step": 96480 }, { "epoch": 1.39, "learning_rate": 1.9536637506545414e-05, "loss": 0.0131, "step": 96490 }, { "epoch": 1.39, "learning_rate": 1.9536589466806944e-05, "loss": 0.0106, "step": 96500 }, { "epoch": 1.39, "learning_rate": 1.9536541427068473e-05, "loss": 0.0125, "step": 96510 }, { "epoch": 1.39, "learning_rate": 1.953649338733e-05, "loss": 0.0136, "step": 96520 }, { "epoch": 1.39, "learning_rate": 1.9536445347591528e-05, "loss": 0.0125, "step": 96530 }, { "epoch": 1.39, "learning_rate": 1.9536397307853057e-05, "loss": 0.0104, "step": 96540 }, { "epoch": 1.39, "learning_rate": 1.9536349268114587e-05, "loss": 0.0175, "step": 96550 }, { "epoch": 1.39, "learning_rate": 1.9536301228376113e-05, "loss": 0.0141, "step": 96560 }, { "epoch": 1.39, "learning_rate": 1.9536253188637642e-05, "loss": 0.0104, "step": 96570 }, { "epoch": 1.39, "learning_rate": 1.953620514889917e-05, "loss": 0.0141, "step": 96580 }, { "epoch": 1.39, "learning_rate": 1.9536157109160697e-05, "loss": 0.0149, "step": 96590 }, { "epoch": 1.39, "learning_rate": 1.9536109069422226e-05, "loss": 0.0112, "step": 96600 }, { "epoch": 1.39, "learning_rate": 1.9536061029683755e-05, "loss": 0.0123, "step": 96610 }, { "epoch": 1.39, "learning_rate": 1.9536012989945285e-05, "loss": 0.0116, "step": 96620 }, { "epoch": 1.39, "learning_rate": 1.953596495020681e-05, "loss": 0.0124, "step": 96630 }, { "epoch": 1.39, "learning_rate": 1.953591691046834e-05, "loss": 0.0098, "step": 96640 }, { "epoch": 1.39, "learning_rate": 1.953586887072987e-05, "loss": 0.0112, "step": 96650 }, { "epoch": 1.39, "learning_rate": 1.9535820830991395e-05, "loss": 0.0124, "step": 96660 }, { "epoch": 1.39, "learning_rate": 1.9535772791252924e-05, "loss": 0.0129, "step": 96670 }, { "epoch": 1.39, "learning_rate": 1.9535724751514454e-05, "loss": 0.0136, "step": 96680 }, { "epoch": 1.39, "learning_rate": 1.9535676711775983e-05, "loss": 0.0148, "step": 96690 }, { "epoch": 1.39, "learning_rate": 1.9535628672037512e-05, "loss": 0.0112, "step": 96700 }, { "epoch": 1.39, "learning_rate": 1.953558063229904e-05, "loss": 0.0108, "step": 96710 }, { "epoch": 1.39, "learning_rate": 1.9535532592560567e-05, "loss": 0.0118, "step": 96720 }, { "epoch": 1.39, "learning_rate": 1.9535484552822097e-05, "loss": 0.0098, "step": 96730 }, { "epoch": 1.39, "learning_rate": 1.9535436513083626e-05, "loss": 0.0147, "step": 96740 }, { "epoch": 1.39, "learning_rate": 1.9535388473345155e-05, "loss": 0.0155, "step": 96750 }, { "epoch": 1.39, "learning_rate": 1.953534043360668e-05, "loss": 0.0114, "step": 96760 }, { "epoch": 1.39, "learning_rate": 1.953529239386821e-05, "loss": 0.0089, "step": 96770 }, { "epoch": 1.39, "learning_rate": 1.953524435412974e-05, "loss": 0.0137, "step": 96780 }, { "epoch": 1.39, "learning_rate": 1.9535196314391265e-05, "loss": 0.0085, "step": 96790 }, { "epoch": 1.4, "learning_rate": 1.9535148274652795e-05, "loss": 0.0112, "step": 96800 }, { "epoch": 1.4, "learning_rate": 1.9535100234914324e-05, "loss": 0.0135, "step": 96810 }, { "epoch": 1.4, "learning_rate": 1.9535052195175853e-05, "loss": 0.0121, "step": 96820 }, { "epoch": 1.4, "learning_rate": 1.953500415543738e-05, "loss": 0.0102, "step": 96830 }, { "epoch": 1.4, "learning_rate": 1.953495611569891e-05, "loss": 0.0114, "step": 96840 }, { "epoch": 1.4, "learning_rate": 1.9534908075960438e-05, "loss": 0.0086, "step": 96850 }, { "epoch": 1.4, "learning_rate": 1.9534860036221967e-05, "loss": 0.0225, "step": 96860 }, { "epoch": 1.4, "learning_rate": 1.9534811996483493e-05, "loss": 0.0133, "step": 96870 }, { "epoch": 1.4, "learning_rate": 1.9534763956745022e-05, "loss": 0.0096, "step": 96880 }, { "epoch": 1.4, "learning_rate": 1.953471591700655e-05, "loss": 0.0115, "step": 96890 }, { "epoch": 1.4, "learning_rate": 1.9534667877268077e-05, "loss": 0.0109, "step": 96900 }, { "epoch": 1.4, "learning_rate": 1.9534619837529606e-05, "loss": 0.0139, "step": 96910 }, { "epoch": 1.4, "learning_rate": 1.9534571797791136e-05, "loss": 0.0121, "step": 96920 }, { "epoch": 1.4, "learning_rate": 1.9534523758052665e-05, "loss": 0.0109, "step": 96930 }, { "epoch": 1.4, "learning_rate": 1.953447571831419e-05, "loss": 0.0092, "step": 96940 }, { "epoch": 1.4, "learning_rate": 1.953442767857572e-05, "loss": 0.0123, "step": 96950 }, { "epoch": 1.4, "learning_rate": 1.953437963883725e-05, "loss": 0.0089, "step": 96960 }, { "epoch": 1.4, "learning_rate": 1.9534331599098775e-05, "loss": 0.0128, "step": 96970 }, { "epoch": 1.4, "learning_rate": 1.9534283559360305e-05, "loss": 0.0128, "step": 96980 }, { "epoch": 1.4, "learning_rate": 1.9534235519621834e-05, "loss": 0.0103, "step": 96990 }, { "epoch": 1.4, "learning_rate": 1.9534187479883363e-05, "loss": 0.0126, "step": 97000 }, { "epoch": 1.4, "learning_rate": 1.953413944014489e-05, "loss": 0.0104, "step": 97010 }, { "epoch": 1.4, "learning_rate": 1.9534091400406418e-05, "loss": 0.0096, "step": 97020 }, { "epoch": 1.4, "learning_rate": 1.9534043360667948e-05, "loss": 0.0098, "step": 97030 }, { "epoch": 1.4, "learning_rate": 1.9533995320929477e-05, "loss": 0.0109, "step": 97040 }, { "epoch": 1.4, "learning_rate": 1.9533947281191003e-05, "loss": 0.0078, "step": 97050 }, { "epoch": 1.4, "learning_rate": 1.9533899241452532e-05, "loss": 0.0115, "step": 97060 }, { "epoch": 1.4, "learning_rate": 1.953385120171406e-05, "loss": 0.0122, "step": 97070 }, { "epoch": 1.4, "learning_rate": 1.9533803161975587e-05, "loss": 0.0096, "step": 97080 }, { "epoch": 1.4, "learning_rate": 1.9533755122237116e-05, "loss": 0.0118, "step": 97090 }, { "epoch": 1.4, "learning_rate": 1.9533707082498646e-05, "loss": 0.0115, "step": 97100 }, { "epoch": 1.4, "learning_rate": 1.9533659042760175e-05, "loss": 0.0137, "step": 97110 }, { "epoch": 1.4, "learning_rate": 1.95336110030217e-05, "loss": 0.0118, "step": 97120 }, { "epoch": 1.4, "learning_rate": 1.953356296328323e-05, "loss": 0.0103, "step": 97130 }, { "epoch": 1.4, "learning_rate": 1.953351492354476e-05, "loss": 0.0132, "step": 97140 }, { "epoch": 1.4, "learning_rate": 1.9533466883806285e-05, "loss": 0.0111, "step": 97150 }, { "epoch": 1.4, "learning_rate": 1.9533418844067815e-05, "loss": 0.0163, "step": 97160 }, { "epoch": 1.4, "learning_rate": 1.9533370804329344e-05, "loss": 0.0123, "step": 97170 }, { "epoch": 1.4, "learning_rate": 1.9533322764590873e-05, "loss": 0.0152, "step": 97180 }, { "epoch": 1.4, "learning_rate": 1.95332747248524e-05, "loss": 0.0093, "step": 97190 }, { "epoch": 1.4, "learning_rate": 1.9533226685113928e-05, "loss": 0.0126, "step": 97200 }, { "epoch": 1.4, "learning_rate": 1.9533178645375457e-05, "loss": 0.0104, "step": 97210 }, { "epoch": 1.4, "learning_rate": 1.9533130605636987e-05, "loss": 0.0113, "step": 97220 }, { "epoch": 1.4, "learning_rate": 1.9533082565898513e-05, "loss": 0.0161, "step": 97230 }, { "epoch": 1.4, "learning_rate": 1.9533034526160042e-05, "loss": 0.0121, "step": 97240 }, { "epoch": 1.4, "learning_rate": 1.953298648642157e-05, "loss": 0.0166, "step": 97250 }, { "epoch": 1.4, "learning_rate": 1.9532938446683097e-05, "loss": 0.0098, "step": 97260 }, { "epoch": 1.4, "learning_rate": 1.9532890406944626e-05, "loss": 0.0093, "step": 97270 }, { "epoch": 1.4, "learning_rate": 1.9532842367206156e-05, "loss": 0.0093, "step": 97280 }, { "epoch": 1.4, "learning_rate": 1.9532794327467685e-05, "loss": 0.0097, "step": 97290 }, { "epoch": 1.4, "learning_rate": 1.953274628772921e-05, "loss": 0.0156, "step": 97300 }, { "epoch": 1.4, "learning_rate": 1.953269824799074e-05, "loss": 0.0157, "step": 97310 }, { "epoch": 1.4, "learning_rate": 1.953265020825227e-05, "loss": 0.0121, "step": 97320 }, { "epoch": 1.4, "learning_rate": 1.9532602168513795e-05, "loss": 0.0106, "step": 97330 }, { "epoch": 1.4, "learning_rate": 1.9532554128775324e-05, "loss": 0.0102, "step": 97340 }, { "epoch": 1.4, "learning_rate": 1.9532506089036854e-05, "loss": 0.0141, "step": 97350 }, { "epoch": 1.4, "learning_rate": 1.9532458049298383e-05, "loss": 0.0117, "step": 97360 }, { "epoch": 1.4, "learning_rate": 1.953241000955991e-05, "loss": 0.014, "step": 97370 }, { "epoch": 1.4, "learning_rate": 1.9532361969821438e-05, "loss": 0.009, "step": 97380 }, { "epoch": 1.4, "learning_rate": 1.9532313930082967e-05, "loss": 0.0128, "step": 97390 }, { "epoch": 1.4, "learning_rate": 1.9532265890344497e-05, "loss": 0.0101, "step": 97400 }, { "epoch": 1.4, "learning_rate": 1.9532217850606023e-05, "loss": 0.0194, "step": 97410 }, { "epoch": 1.4, "learning_rate": 1.9532169810867552e-05, "loss": 0.0102, "step": 97420 }, { "epoch": 1.4, "learning_rate": 1.953212177112908e-05, "loss": 0.0127, "step": 97430 }, { "epoch": 1.4, "learning_rate": 1.9532073731390607e-05, "loss": 0.0103, "step": 97440 }, { "epoch": 1.4, "learning_rate": 1.9532025691652136e-05, "loss": 0.0068, "step": 97450 }, { "epoch": 1.4, "learning_rate": 1.9531977651913666e-05, "loss": 0.0104, "step": 97460 }, { "epoch": 1.4, "learning_rate": 1.9531929612175195e-05, "loss": 0.0132, "step": 97470 }, { "epoch": 1.4, "learning_rate": 1.953188157243672e-05, "loss": 0.0119, "step": 97480 }, { "epoch": 1.41, "learning_rate": 1.953183353269825e-05, "loss": 0.0104, "step": 97490 }, { "epoch": 1.41, "learning_rate": 1.953178549295978e-05, "loss": 0.0081, "step": 97500 }, { "epoch": 1.41, "learning_rate": 1.9531737453221305e-05, "loss": 0.0116, "step": 97510 }, { "epoch": 1.41, "learning_rate": 1.9531689413482834e-05, "loss": 0.0122, "step": 97520 }, { "epoch": 1.41, "learning_rate": 1.9531641373744364e-05, "loss": 0.0131, "step": 97530 }, { "epoch": 1.41, "learning_rate": 1.9531593334005893e-05, "loss": 0.0162, "step": 97540 }, { "epoch": 1.41, "learning_rate": 1.953154529426742e-05, "loss": 0.0109, "step": 97550 }, { "epoch": 1.41, "learning_rate": 1.9531497254528948e-05, "loss": 0.0088, "step": 97560 }, { "epoch": 1.41, "learning_rate": 1.9531449214790477e-05, "loss": 0.0154, "step": 97570 }, { "epoch": 1.41, "learning_rate": 1.9531401175052007e-05, "loss": 0.0087, "step": 97580 }, { "epoch": 1.41, "learning_rate": 1.9531353135313532e-05, "loss": 0.0157, "step": 97590 }, { "epoch": 1.41, "learning_rate": 1.9531305095575062e-05, "loss": 0.0096, "step": 97600 }, { "epoch": 1.41, "learning_rate": 1.953125705583659e-05, "loss": 0.007, "step": 97610 }, { "epoch": 1.41, "learning_rate": 1.9531209016098117e-05, "loss": 0.0078, "step": 97620 }, { "epoch": 1.41, "learning_rate": 1.9531160976359646e-05, "loss": 0.0113, "step": 97630 }, { "epoch": 1.41, "learning_rate": 1.9531112936621175e-05, "loss": 0.0121, "step": 97640 }, { "epoch": 1.41, "learning_rate": 1.9531064896882705e-05, "loss": 0.0091, "step": 97650 }, { "epoch": 1.41, "learning_rate": 1.953101685714423e-05, "loss": 0.0091, "step": 97660 }, { "epoch": 1.41, "learning_rate": 1.953096881740576e-05, "loss": 0.0096, "step": 97670 }, { "epoch": 1.41, "learning_rate": 1.953092077766729e-05, "loss": 0.0159, "step": 97680 }, { "epoch": 1.41, "learning_rate": 1.9530872737928815e-05, "loss": 0.0098, "step": 97690 }, { "epoch": 1.41, "learning_rate": 1.9530824698190344e-05, "loss": 0.0133, "step": 97700 }, { "epoch": 1.41, "learning_rate": 1.9530776658451874e-05, "loss": 0.0096, "step": 97710 }, { "epoch": 1.41, "learning_rate": 1.9530728618713403e-05, "loss": 0.0124, "step": 97720 }, { "epoch": 1.41, "learning_rate": 1.953068057897493e-05, "loss": 0.0118, "step": 97730 }, { "epoch": 1.41, "learning_rate": 1.9530632539236458e-05, "loss": 0.0126, "step": 97740 }, { "epoch": 1.41, "learning_rate": 1.9530584499497987e-05, "loss": 0.0128, "step": 97750 }, { "epoch": 1.41, "learning_rate": 1.9530536459759516e-05, "loss": 0.0127, "step": 97760 }, { "epoch": 1.41, "learning_rate": 1.9530488420021042e-05, "loss": 0.0171, "step": 97770 }, { "epoch": 1.41, "learning_rate": 1.953044038028257e-05, "loss": 0.0131, "step": 97780 }, { "epoch": 1.41, "learning_rate": 1.95303923405441e-05, "loss": 0.0091, "step": 97790 }, { "epoch": 1.41, "learning_rate": 1.9530344300805627e-05, "loss": 0.0132, "step": 97800 }, { "epoch": 1.41, "learning_rate": 1.9530296261067156e-05, "loss": 0.0101, "step": 97810 }, { "epoch": 1.41, "learning_rate": 1.9530248221328685e-05, "loss": 0.0099, "step": 97820 }, { "epoch": 1.41, "learning_rate": 1.9530200181590215e-05, "loss": 0.0105, "step": 97830 }, { "epoch": 1.41, "learning_rate": 1.953015214185174e-05, "loss": 0.0121, "step": 97840 }, { "epoch": 1.41, "learning_rate": 1.953010410211327e-05, "loss": 0.0109, "step": 97850 }, { "epoch": 1.41, "learning_rate": 1.95300560623748e-05, "loss": 0.0157, "step": 97860 }, { "epoch": 1.41, "learning_rate": 1.9530008022636325e-05, "loss": 0.0132, "step": 97870 }, { "epoch": 1.41, "learning_rate": 1.9529959982897854e-05, "loss": 0.0131, "step": 97880 }, { "epoch": 1.41, "learning_rate": 1.9529911943159383e-05, "loss": 0.0115, "step": 97890 }, { "epoch": 1.41, "learning_rate": 1.9529863903420913e-05, "loss": 0.0084, "step": 97900 }, { "epoch": 1.41, "learning_rate": 1.952981586368244e-05, "loss": 0.0097, "step": 97910 }, { "epoch": 1.41, "learning_rate": 1.9529767823943968e-05, "loss": 0.0089, "step": 97920 }, { "epoch": 1.41, "learning_rate": 1.9529719784205497e-05, "loss": 0.0132, "step": 97930 }, { "epoch": 1.41, "learning_rate": 1.9529671744467026e-05, "loss": 0.0158, "step": 97940 }, { "epoch": 1.41, "learning_rate": 1.9529623704728552e-05, "loss": 0.0127, "step": 97950 }, { "epoch": 1.41, "learning_rate": 1.952957566499008e-05, "loss": 0.0106, "step": 97960 }, { "epoch": 1.41, "learning_rate": 1.952952762525161e-05, "loss": 0.0115, "step": 97970 }, { "epoch": 1.41, "learning_rate": 1.9529479585513137e-05, "loss": 0.0138, "step": 97980 }, { "epoch": 1.41, "learning_rate": 1.9529431545774666e-05, "loss": 0.012, "step": 97990 }, { "epoch": 1.41, "learning_rate": 1.9529383506036195e-05, "loss": 0.0118, "step": 98000 }, { "epoch": 1.41, "learning_rate": 1.9529335466297725e-05, "loss": 0.0119, "step": 98010 }, { "epoch": 1.41, "learning_rate": 1.952928742655925e-05, "loss": 0.0101, "step": 98020 }, { "epoch": 1.41, "learning_rate": 1.952923938682078e-05, "loss": 0.0148, "step": 98030 }, { "epoch": 1.41, "learning_rate": 1.952919134708231e-05, "loss": 0.0112, "step": 98040 }, { "epoch": 1.41, "learning_rate": 1.9529143307343835e-05, "loss": 0.0135, "step": 98050 }, { "epoch": 1.41, "learning_rate": 1.9529095267605364e-05, "loss": 0.0143, "step": 98060 }, { "epoch": 1.41, "learning_rate": 1.9529047227866893e-05, "loss": 0.0107, "step": 98070 }, { "epoch": 1.41, "learning_rate": 1.9528999188128423e-05, "loss": 0.0123, "step": 98080 }, { "epoch": 1.41, "learning_rate": 1.952895114838995e-05, "loss": 0.0125, "step": 98090 }, { "epoch": 1.41, "learning_rate": 1.9528903108651478e-05, "loss": 0.0086, "step": 98100 }, { "epoch": 1.41, "learning_rate": 1.9528855068913007e-05, "loss": 0.0083, "step": 98110 }, { "epoch": 1.41, "learning_rate": 1.9528807029174536e-05, "loss": 0.0116, "step": 98120 }, { "epoch": 1.41, "learning_rate": 1.9528758989436062e-05, "loss": 0.011, "step": 98130 }, { "epoch": 1.41, "learning_rate": 1.952871094969759e-05, "loss": 0.014, "step": 98140 }, { "epoch": 1.41, "learning_rate": 1.952866290995912e-05, "loss": 0.0108, "step": 98150 }, { "epoch": 1.41, "learning_rate": 1.9528614870220647e-05, "loss": 0.0132, "step": 98160 }, { "epoch": 1.41, "learning_rate": 1.9528566830482176e-05, "loss": 0.0084, "step": 98170 }, { "epoch": 1.41, "learning_rate": 1.9528518790743705e-05, "loss": 0.0105, "step": 98180 }, { "epoch": 1.42, "learning_rate": 1.9528470751005234e-05, "loss": 0.0121, "step": 98190 }, { "epoch": 1.42, "learning_rate": 1.952842271126676e-05, "loss": 0.0101, "step": 98200 }, { "epoch": 1.42, "learning_rate": 1.952837467152829e-05, "loss": 0.0088, "step": 98210 }, { "epoch": 1.42, "learning_rate": 1.952832663178982e-05, "loss": 0.0112, "step": 98220 }, { "epoch": 1.42, "learning_rate": 1.9528278592051345e-05, "loss": 0.0128, "step": 98230 }, { "epoch": 1.42, "learning_rate": 1.9528230552312874e-05, "loss": 0.0144, "step": 98240 }, { "epoch": 1.42, "learning_rate": 1.9528182512574403e-05, "loss": 0.0118, "step": 98250 }, { "epoch": 1.42, "learning_rate": 1.9528134472835933e-05, "loss": 0.0127, "step": 98260 }, { "epoch": 1.42, "learning_rate": 1.952808643309746e-05, "loss": 0.01, "step": 98270 }, { "epoch": 1.42, "learning_rate": 1.9528038393358988e-05, "loss": 0.009, "step": 98280 }, { "epoch": 1.42, "learning_rate": 1.9527990353620517e-05, "loss": 0.0145, "step": 98290 }, { "epoch": 1.42, "learning_rate": 1.9527942313882043e-05, "loss": 0.0137, "step": 98300 }, { "epoch": 1.42, "learning_rate": 1.9527894274143572e-05, "loss": 0.0176, "step": 98310 }, { "epoch": 1.42, "learning_rate": 1.95278462344051e-05, "loss": 0.0098, "step": 98320 }, { "epoch": 1.42, "learning_rate": 1.952779819466663e-05, "loss": 0.0103, "step": 98330 }, { "epoch": 1.42, "learning_rate": 1.9527750154928157e-05, "loss": 0.0126, "step": 98340 }, { "epoch": 1.42, "learning_rate": 1.9527702115189686e-05, "loss": 0.016, "step": 98350 }, { "epoch": 1.42, "learning_rate": 1.9527654075451215e-05, "loss": 0.0115, "step": 98360 }, { "epoch": 1.42, "learning_rate": 1.9527606035712744e-05, "loss": 0.0105, "step": 98370 }, { "epoch": 1.42, "learning_rate": 1.952755799597427e-05, "loss": 0.011, "step": 98380 }, { "epoch": 1.42, "learning_rate": 1.95275099562358e-05, "loss": 0.0155, "step": 98390 }, { "epoch": 1.42, "learning_rate": 1.952746191649733e-05, "loss": 0.0123, "step": 98400 }, { "epoch": 1.42, "learning_rate": 1.9527413876758855e-05, "loss": 0.0135, "step": 98410 }, { "epoch": 1.42, "learning_rate": 1.9527365837020384e-05, "loss": 0.0132, "step": 98420 }, { "epoch": 1.42, "learning_rate": 1.9527317797281913e-05, "loss": 0.0159, "step": 98430 }, { "epoch": 1.42, "learning_rate": 1.9527269757543442e-05, "loss": 0.0129, "step": 98440 }, { "epoch": 1.42, "learning_rate": 1.952722171780497e-05, "loss": 0.0143, "step": 98450 }, { "epoch": 1.42, "learning_rate": 1.9527173678066498e-05, "loss": 0.0123, "step": 98460 }, { "epoch": 1.42, "learning_rate": 1.9527125638328027e-05, "loss": 0.012, "step": 98470 }, { "epoch": 1.42, "learning_rate": 1.9527077598589553e-05, "loss": 0.0143, "step": 98480 }, { "epoch": 1.42, "learning_rate": 1.9527029558851082e-05, "loss": 0.0138, "step": 98490 }, { "epoch": 1.42, "learning_rate": 1.952698151911261e-05, "loss": 0.0108, "step": 98500 }, { "epoch": 1.42, "learning_rate": 1.952693347937414e-05, "loss": 0.0129, "step": 98510 }, { "epoch": 1.42, "learning_rate": 1.9526885439635666e-05, "loss": 0.0122, "step": 98520 }, { "epoch": 1.42, "learning_rate": 1.9526837399897196e-05, "loss": 0.0122, "step": 98530 }, { "epoch": 1.42, "learning_rate": 1.9526789360158725e-05, "loss": 0.015, "step": 98540 }, { "epoch": 1.42, "learning_rate": 1.9526741320420254e-05, "loss": 0.009, "step": 98550 }, { "epoch": 1.42, "learning_rate": 1.952669328068178e-05, "loss": 0.012, "step": 98560 }, { "epoch": 1.42, "learning_rate": 1.952664524094331e-05, "loss": 0.0114, "step": 98570 }, { "epoch": 1.42, "learning_rate": 1.952659720120484e-05, "loss": 0.0112, "step": 98580 }, { "epoch": 1.42, "learning_rate": 1.9526549161466365e-05, "loss": 0.014, "step": 98590 }, { "epoch": 1.42, "learning_rate": 1.9526501121727894e-05, "loss": 0.0092, "step": 98600 }, { "epoch": 1.42, "learning_rate": 1.9526453081989423e-05, "loss": 0.0134, "step": 98610 }, { "epoch": 1.42, "learning_rate": 1.9526405042250952e-05, "loss": 0.0118, "step": 98620 }, { "epoch": 1.42, "learning_rate": 1.9526357002512478e-05, "loss": 0.0125, "step": 98630 }, { "epoch": 1.42, "learning_rate": 1.9526308962774008e-05, "loss": 0.0111, "step": 98640 }, { "epoch": 1.42, "learning_rate": 1.9526260923035537e-05, "loss": 0.0106, "step": 98650 }, { "epoch": 1.42, "learning_rate": 1.9526212883297063e-05, "loss": 0.01, "step": 98660 }, { "epoch": 1.42, "learning_rate": 1.9526164843558592e-05, "loss": 0.0091, "step": 98670 }, { "epoch": 1.42, "learning_rate": 1.952611680382012e-05, "loss": 0.0124, "step": 98680 }, { "epoch": 1.42, "learning_rate": 1.952606876408165e-05, "loss": 0.0079, "step": 98690 }, { "epoch": 1.42, "learning_rate": 1.9526020724343176e-05, "loss": 0.015, "step": 98700 }, { "epoch": 1.42, "learning_rate": 1.9525972684604706e-05, "loss": 0.0088, "step": 98710 }, { "epoch": 1.42, "learning_rate": 1.9525924644866235e-05, "loss": 0.0136, "step": 98720 }, { "epoch": 1.42, "learning_rate": 1.9525876605127764e-05, "loss": 0.0089, "step": 98730 }, { "epoch": 1.42, "learning_rate": 1.952582856538929e-05, "loss": 0.0085, "step": 98740 }, { "epoch": 1.42, "learning_rate": 1.952578052565082e-05, "loss": 0.0107, "step": 98750 }, { "epoch": 1.42, "learning_rate": 1.952573248591235e-05, "loss": 0.0125, "step": 98760 }, { "epoch": 1.42, "learning_rate": 1.9525684446173874e-05, "loss": 0.0114, "step": 98770 }, { "epoch": 1.42, "learning_rate": 1.9525636406435404e-05, "loss": 0.0125, "step": 98780 }, { "epoch": 1.42, "learning_rate": 1.9525588366696933e-05, "loss": 0.0119, "step": 98790 }, { "epoch": 1.42, "learning_rate": 1.9525540326958462e-05, "loss": 0.0136, "step": 98800 }, { "epoch": 1.42, "learning_rate": 1.9525492287219988e-05, "loss": 0.0142, "step": 98810 }, { "epoch": 1.42, "learning_rate": 1.9525444247481517e-05, "loss": 0.014, "step": 98820 }, { "epoch": 1.42, "learning_rate": 1.9525396207743047e-05, "loss": 0.0086, "step": 98830 }, { "epoch": 1.42, "learning_rate": 1.9525348168004573e-05, "loss": 0.0103, "step": 98840 }, { "epoch": 1.42, "learning_rate": 1.9525300128266102e-05, "loss": 0.0143, "step": 98850 }, { "epoch": 1.42, "learning_rate": 1.952525208852763e-05, "loss": 0.0125, "step": 98860 }, { "epoch": 1.42, "learning_rate": 1.952520404878916e-05, "loss": 0.0129, "step": 98870 }, { "epoch": 1.43, "learning_rate": 1.9525156009050686e-05, "loss": 0.01, "step": 98880 }, { "epoch": 1.43, "learning_rate": 1.9525107969312216e-05, "loss": 0.0141, "step": 98890 }, { "epoch": 1.43, "learning_rate": 1.952506473354759e-05, "loss": 0.0139, "step": 98900 }, { "epoch": 1.43, "learning_rate": 1.952501669380912e-05, "loss": 0.0088, "step": 98910 }, { "epoch": 1.43, "learning_rate": 1.952496865407065e-05, "loss": 0.0139, "step": 98920 }, { "epoch": 1.43, "learning_rate": 1.9524920614332178e-05, "loss": 0.0084, "step": 98930 }, { "epoch": 1.43, "learning_rate": 1.9524872574593704e-05, "loss": 0.0107, "step": 98940 }, { "epoch": 1.43, "learning_rate": 1.9524824534855233e-05, "loss": 0.0107, "step": 98950 }, { "epoch": 1.43, "learning_rate": 1.9524776495116762e-05, "loss": 0.0104, "step": 98960 }, { "epoch": 1.43, "learning_rate": 1.9524728455378292e-05, "loss": 0.0115, "step": 98970 }, { "epoch": 1.43, "learning_rate": 1.9524680415639818e-05, "loss": 0.0083, "step": 98980 }, { "epoch": 1.43, "learning_rate": 1.9524632375901347e-05, "loss": 0.0118, "step": 98990 }, { "epoch": 1.43, "learning_rate": 1.9524584336162876e-05, "loss": 0.011, "step": 99000 }, { "epoch": 1.43, "learning_rate": 1.9524536296424402e-05, "loss": 0.0149, "step": 99010 }, { "epoch": 1.43, "learning_rate": 1.952448825668593e-05, "loss": 0.0157, "step": 99020 }, { "epoch": 1.43, "learning_rate": 1.952444021694746e-05, "loss": 0.0145, "step": 99030 }, { "epoch": 1.43, "learning_rate": 1.952439217720899e-05, "loss": 0.0097, "step": 99040 }, { "epoch": 1.43, "learning_rate": 1.9524344137470516e-05, "loss": 0.0141, "step": 99050 }, { "epoch": 1.43, "learning_rate": 1.9524296097732045e-05, "loss": 0.0133, "step": 99060 }, { "epoch": 1.43, "learning_rate": 1.9524248057993574e-05, "loss": 0.0144, "step": 99070 }, { "epoch": 1.43, "learning_rate": 1.95242000182551e-05, "loss": 0.0089, "step": 99080 }, { "epoch": 1.43, "learning_rate": 1.952415197851663e-05, "loss": 0.0086, "step": 99090 }, { "epoch": 1.43, "learning_rate": 1.952410393877816e-05, "loss": 0.0108, "step": 99100 }, { "epoch": 1.43, "learning_rate": 1.9524055899039688e-05, "loss": 0.0104, "step": 99110 }, { "epoch": 1.43, "learning_rate": 1.9524007859301214e-05, "loss": 0.0113, "step": 99120 }, { "epoch": 1.43, "learning_rate": 1.9523959819562743e-05, "loss": 0.0095, "step": 99130 }, { "epoch": 1.43, "learning_rate": 1.9523911779824272e-05, "loss": 0.0163, "step": 99140 }, { "epoch": 1.43, "learning_rate": 1.95238637400858e-05, "loss": 0.0087, "step": 99150 }, { "epoch": 1.43, "learning_rate": 1.9523815700347327e-05, "loss": 0.0145, "step": 99160 }, { "epoch": 1.43, "learning_rate": 1.9523767660608857e-05, "loss": 0.0128, "step": 99170 }, { "epoch": 1.43, "learning_rate": 1.9523719620870386e-05, "loss": 0.012, "step": 99180 }, { "epoch": 1.43, "learning_rate": 1.9523671581131912e-05, "loss": 0.0122, "step": 99190 }, { "epoch": 1.43, "learning_rate": 1.952362354139344e-05, "loss": 0.0104, "step": 99200 }, { "epoch": 1.43, "learning_rate": 1.952357550165497e-05, "loss": 0.013, "step": 99210 }, { "epoch": 1.43, "learning_rate": 1.95235274619165e-05, "loss": 0.011, "step": 99220 }, { "epoch": 1.43, "learning_rate": 1.9523479422178026e-05, "loss": 0.0101, "step": 99230 }, { "epoch": 1.43, "learning_rate": 1.9523431382439555e-05, "loss": 0.0097, "step": 99240 }, { "epoch": 1.43, "learning_rate": 1.9523383342701084e-05, "loss": 0.0117, "step": 99250 }, { "epoch": 1.43, "learning_rate": 1.952333530296261e-05, "loss": 0.0132, "step": 99260 }, { "epoch": 1.43, "learning_rate": 1.952328726322414e-05, "loss": 0.0082, "step": 99270 }, { "epoch": 1.43, "learning_rate": 1.952323922348567e-05, "loss": 0.0095, "step": 99280 }, { "epoch": 1.43, "learning_rate": 1.9523191183747198e-05, "loss": 0.0112, "step": 99290 }, { "epoch": 1.43, "learning_rate": 1.9523143144008724e-05, "loss": 0.0088, "step": 99300 }, { "epoch": 1.43, "learning_rate": 1.9523095104270253e-05, "loss": 0.013, "step": 99310 }, { "epoch": 1.43, "learning_rate": 1.9523047064531782e-05, "loss": 0.011, "step": 99320 }, { "epoch": 1.43, "learning_rate": 1.952299902479331e-05, "loss": 0.009, "step": 99330 }, { "epoch": 1.43, "learning_rate": 1.9522950985054837e-05, "loss": 0.0087, "step": 99340 }, { "epoch": 1.43, "learning_rate": 1.9522902945316367e-05, "loss": 0.0149, "step": 99350 }, { "epoch": 1.43, "learning_rate": 1.9522854905577896e-05, "loss": 0.0125, "step": 99360 }, { "epoch": 1.43, "learning_rate": 1.9522806865839422e-05, "loss": 0.011, "step": 99370 }, { "epoch": 1.43, "learning_rate": 1.952275882610095e-05, "loss": 0.0088, "step": 99380 }, { "epoch": 1.43, "learning_rate": 1.952271078636248e-05, "loss": 0.0137, "step": 99390 }, { "epoch": 1.43, "learning_rate": 1.952266274662401e-05, "loss": 0.0118, "step": 99400 }, { "epoch": 1.43, "learning_rate": 1.9522614706885536e-05, "loss": 0.0138, "step": 99410 }, { "epoch": 1.43, "learning_rate": 1.9522566667147065e-05, "loss": 0.0151, "step": 99420 }, { "epoch": 1.43, "learning_rate": 1.9522518627408594e-05, "loss": 0.0122, "step": 99430 }, { "epoch": 1.43, "learning_rate": 1.952247058767012e-05, "loss": 0.0108, "step": 99440 }, { "epoch": 1.43, "learning_rate": 1.952242254793165e-05, "loss": 0.0144, "step": 99450 }, { "epoch": 1.43, "learning_rate": 1.952237450819318e-05, "loss": 0.0187, "step": 99460 }, { "epoch": 1.43, "learning_rate": 1.9522326468454708e-05, "loss": 0.0131, "step": 99470 }, { "epoch": 1.43, "learning_rate": 1.9522278428716234e-05, "loss": 0.0095, "step": 99480 }, { "epoch": 1.43, "learning_rate": 1.9522230388977763e-05, "loss": 0.0107, "step": 99490 }, { "epoch": 1.43, "learning_rate": 1.9522182349239292e-05, "loss": 0.0143, "step": 99500 }, { "epoch": 1.43, "learning_rate": 1.952213430950082e-05, "loss": 0.0097, "step": 99510 }, { "epoch": 1.43, "learning_rate": 1.9522086269762347e-05, "loss": 0.013, "step": 99520 }, { "epoch": 1.43, "learning_rate": 1.9522038230023877e-05, "loss": 0.01, "step": 99530 }, { "epoch": 1.43, "learning_rate": 1.9521990190285406e-05, "loss": 0.0122, "step": 99540 }, { "epoch": 1.43, "learning_rate": 1.9521942150546932e-05, "loss": 0.0121, "step": 99550 }, { "epoch": 1.43, "learning_rate": 1.952189411080846e-05, "loss": 0.0096, "step": 99560 }, { "epoch": 1.43, "learning_rate": 1.952184607106999e-05, "loss": 0.0116, "step": 99570 }, { "epoch": 1.44, "learning_rate": 1.952179803133152e-05, "loss": 0.01, "step": 99580 }, { "epoch": 1.44, "learning_rate": 1.9521749991593045e-05, "loss": 0.0146, "step": 99590 }, { "epoch": 1.44, "learning_rate": 1.9521701951854575e-05, "loss": 0.0137, "step": 99600 }, { "epoch": 1.44, "learning_rate": 1.9521653912116104e-05, "loss": 0.0098, "step": 99610 }, { "epoch": 1.44, "learning_rate": 1.952160587237763e-05, "loss": 0.0138, "step": 99620 }, { "epoch": 1.44, "learning_rate": 1.952155783263916e-05, "loss": 0.0088, "step": 99630 }, { "epoch": 1.44, "learning_rate": 1.952150979290069e-05, "loss": 0.0101, "step": 99640 }, { "epoch": 1.44, "learning_rate": 1.9521461753162218e-05, "loss": 0.0094, "step": 99650 }, { "epoch": 1.44, "learning_rate": 1.9521413713423744e-05, "loss": 0.0098, "step": 99660 }, { "epoch": 1.44, "learning_rate": 1.9521365673685273e-05, "loss": 0.0086, "step": 99670 }, { "epoch": 1.44, "learning_rate": 1.9521317633946802e-05, "loss": 0.0099, "step": 99680 }, { "epoch": 1.44, "learning_rate": 1.952126959420833e-05, "loss": 0.0133, "step": 99690 }, { "epoch": 1.44, "learning_rate": 1.9521221554469857e-05, "loss": 0.0151, "step": 99700 }, { "epoch": 1.44, "learning_rate": 1.9521173514731387e-05, "loss": 0.0106, "step": 99710 }, { "epoch": 1.44, "learning_rate": 1.9521125474992916e-05, "loss": 0.0122, "step": 99720 }, { "epoch": 1.44, "learning_rate": 1.952107743525444e-05, "loss": 0.0102, "step": 99730 }, { "epoch": 1.44, "learning_rate": 1.952102939551597e-05, "loss": 0.01, "step": 99740 }, { "epoch": 1.44, "learning_rate": 1.95209813557775e-05, "loss": 0.0104, "step": 99750 }, { "epoch": 1.44, "learning_rate": 1.952093331603903e-05, "loss": 0.0126, "step": 99760 }, { "epoch": 1.44, "learning_rate": 1.952088527630056e-05, "loss": 0.0092, "step": 99770 }, { "epoch": 1.44, "learning_rate": 1.9520837236562088e-05, "loss": 0.0113, "step": 99780 }, { "epoch": 1.44, "learning_rate": 1.9520789196823614e-05, "loss": 0.0099, "step": 99790 }, { "epoch": 1.44, "learning_rate": 1.9520741157085143e-05, "loss": 0.0129, "step": 99800 }, { "epoch": 1.44, "learning_rate": 1.9520693117346672e-05, "loss": 0.011, "step": 99810 }, { "epoch": 1.44, "learning_rate": 1.9520645077608202e-05, "loss": 0.0131, "step": 99820 }, { "epoch": 1.44, "learning_rate": 1.9520597037869728e-05, "loss": 0.0114, "step": 99830 }, { "epoch": 1.44, "learning_rate": 1.9520548998131257e-05, "loss": 0.0101, "step": 99840 }, { "epoch": 1.44, "learning_rate": 1.9520500958392786e-05, "loss": 0.0094, "step": 99850 }, { "epoch": 1.44, "learning_rate": 1.9520452918654312e-05, "loss": 0.0111, "step": 99860 }, { "epoch": 1.44, "learning_rate": 1.952040487891584e-05, "loss": 0.009, "step": 99870 }, { "epoch": 1.44, "learning_rate": 1.952035683917737e-05, "loss": 0.0087, "step": 99880 }, { "epoch": 1.44, "learning_rate": 1.95203087994389e-05, "loss": 0.0106, "step": 99890 }, { "epoch": 1.44, "learning_rate": 1.9520260759700426e-05, "loss": 0.0117, "step": 99900 }, { "epoch": 1.44, "learning_rate": 1.9520212719961955e-05, "loss": 0.0105, "step": 99910 }, { "epoch": 1.44, "learning_rate": 1.9520164680223484e-05, "loss": 0.0141, "step": 99920 }, { "epoch": 1.44, "learning_rate": 1.952011664048501e-05, "loss": 0.0138, "step": 99930 }, { "epoch": 1.44, "learning_rate": 1.952006860074654e-05, "loss": 0.011, "step": 99940 }, { "epoch": 1.44, "learning_rate": 1.952002056100807e-05, "loss": 0.0094, "step": 99950 }, { "epoch": 1.44, "learning_rate": 1.9519972521269598e-05, "loss": 0.0068, "step": 99960 }, { "epoch": 1.44, "learning_rate": 1.9519924481531124e-05, "loss": 0.0102, "step": 99970 }, { "epoch": 1.44, "learning_rate": 1.9519876441792653e-05, "loss": 0.0086, "step": 99980 }, { "epoch": 1.44, "learning_rate": 1.9519828402054182e-05, "loss": 0.0088, "step": 99990 }, { "epoch": 1.44, "learning_rate": 1.951978036231571e-05, "loss": 0.0107, "step": 100000 }, { "epoch": 1.44, "learning_rate": 1.9519732322577237e-05, "loss": 0.0127, "step": 100010 }, { "epoch": 1.44, "learning_rate": 1.9519684282838767e-05, "loss": 0.0096, "step": 100020 }, { "epoch": 1.44, "learning_rate": 1.9519636243100296e-05, "loss": 0.012, "step": 100030 }, { "epoch": 1.44, "learning_rate": 1.9519588203361822e-05, "loss": 0.014, "step": 100040 }, { "epoch": 1.44, "learning_rate": 1.951954016362335e-05, "loss": 0.0081, "step": 100050 }, { "epoch": 1.44, "learning_rate": 1.951949212388488e-05, "loss": 0.0155, "step": 100060 }, { "epoch": 1.44, "learning_rate": 1.951944408414641e-05, "loss": 0.0154, "step": 100070 }, { "epoch": 1.44, "learning_rate": 1.9519396044407936e-05, "loss": 0.0155, "step": 100080 }, { "epoch": 1.44, "learning_rate": 1.9519348004669465e-05, "loss": 0.0104, "step": 100090 }, { "epoch": 1.44, "learning_rate": 1.9519299964930994e-05, "loss": 0.0137, "step": 100100 }, { "epoch": 1.44, "learning_rate": 1.951925192519252e-05, "loss": 0.0098, "step": 100110 }, { "epoch": 1.44, "learning_rate": 1.951920388545405e-05, "loss": 0.0127, "step": 100120 }, { "epoch": 1.44, "learning_rate": 1.951915584571558e-05, "loss": 0.0105, "step": 100130 }, { "epoch": 1.44, "learning_rate": 1.9519107805977108e-05, "loss": 0.0163, "step": 100140 }, { "epoch": 1.44, "learning_rate": 1.9519059766238634e-05, "loss": 0.0102, "step": 100150 }, { "epoch": 1.44, "learning_rate": 1.9519011726500163e-05, "loss": 0.0116, "step": 100160 }, { "epoch": 1.44, "learning_rate": 1.9518963686761692e-05, "loss": 0.0079, "step": 100170 }, { "epoch": 1.44, "learning_rate": 1.951891564702322e-05, "loss": 0.0119, "step": 100180 }, { "epoch": 1.44, "learning_rate": 1.9518867607284747e-05, "loss": 0.0084, "step": 100190 }, { "epoch": 1.44, "learning_rate": 1.9518819567546277e-05, "loss": 0.0106, "step": 100200 }, { "epoch": 1.44, "learning_rate": 1.9518771527807806e-05, "loss": 0.0091, "step": 100210 }, { "epoch": 1.44, "learning_rate": 1.9518723488069332e-05, "loss": 0.0083, "step": 100220 }, { "epoch": 1.44, "learning_rate": 1.951867544833086e-05, "loss": 0.0111, "step": 100230 }, { "epoch": 1.44, "learning_rate": 1.951862740859239e-05, "loss": 0.0084, "step": 100240 }, { "epoch": 1.44, "learning_rate": 1.951857936885392e-05, "loss": 0.0092, "step": 100250 }, { "epoch": 1.44, "learning_rate": 1.9518531329115446e-05, "loss": 0.0114, "step": 100260 }, { "epoch": 1.45, "learning_rate": 1.9518483289376975e-05, "loss": 0.0141, "step": 100270 }, { "epoch": 1.45, "learning_rate": 1.9518435249638504e-05, "loss": 0.0167, "step": 100280 }, { "epoch": 1.45, "learning_rate": 1.951838720990003e-05, "loss": 0.0139, "step": 100290 }, { "epoch": 1.45, "learning_rate": 1.951833917016156e-05, "loss": 0.0094, "step": 100300 }, { "epoch": 1.45, "learning_rate": 1.951829113042309e-05, "loss": 0.0076, "step": 100310 }, { "epoch": 1.45, "learning_rate": 1.9518243090684618e-05, "loss": 0.0096, "step": 100320 }, { "epoch": 1.45, "learning_rate": 1.9518195050946144e-05, "loss": 0.0097, "step": 100330 }, { "epoch": 1.45, "learning_rate": 1.9518147011207673e-05, "loss": 0.0105, "step": 100340 }, { "epoch": 1.45, "learning_rate": 1.9518098971469202e-05, "loss": 0.013, "step": 100350 }, { "epoch": 1.45, "learning_rate": 1.951805093173073e-05, "loss": 0.0114, "step": 100360 }, { "epoch": 1.45, "learning_rate": 1.9518002891992257e-05, "loss": 0.0075, "step": 100370 }, { "epoch": 1.45, "learning_rate": 1.9517954852253787e-05, "loss": 0.0127, "step": 100380 }, { "epoch": 1.45, "learning_rate": 1.9517906812515316e-05, "loss": 0.0094, "step": 100390 }, { "epoch": 1.45, "learning_rate": 1.9517858772776842e-05, "loss": 0.0128, "step": 100400 }, { "epoch": 1.45, "learning_rate": 1.951781073303837e-05, "loss": 0.0131, "step": 100410 }, { "epoch": 1.45, "learning_rate": 1.95177626932999e-05, "loss": 0.0128, "step": 100420 }, { "epoch": 1.45, "learning_rate": 1.951771465356143e-05, "loss": 0.0122, "step": 100430 }, { "epoch": 1.45, "learning_rate": 1.9517666613822955e-05, "loss": 0.0071, "step": 100440 }, { "epoch": 1.45, "learning_rate": 1.9517618574084485e-05, "loss": 0.0144, "step": 100450 }, { "epoch": 1.45, "learning_rate": 1.9517570534346014e-05, "loss": 0.0123, "step": 100460 }, { "epoch": 1.45, "learning_rate": 1.951752249460754e-05, "loss": 0.0167, "step": 100470 }, { "epoch": 1.45, "learning_rate": 1.951747445486907e-05, "loss": 0.0143, "step": 100480 }, { "epoch": 1.45, "learning_rate": 1.95174264151306e-05, "loss": 0.0131, "step": 100490 }, { "epoch": 1.45, "learning_rate": 1.9517378375392128e-05, "loss": 0.012, "step": 100500 }, { "epoch": 1.45, "learning_rate": 1.9517330335653654e-05, "loss": 0.0081, "step": 100510 }, { "epoch": 1.45, "learning_rate": 1.9517282295915183e-05, "loss": 0.0153, "step": 100520 }, { "epoch": 1.45, "learning_rate": 1.9517234256176712e-05, "loss": 0.0106, "step": 100530 }, { "epoch": 1.45, "learning_rate": 1.951718621643824e-05, "loss": 0.0143, "step": 100540 }, { "epoch": 1.45, "learning_rate": 1.9517138176699767e-05, "loss": 0.0118, "step": 100550 }, { "epoch": 1.45, "learning_rate": 1.9517090136961297e-05, "loss": 0.0141, "step": 100560 }, { "epoch": 1.45, "learning_rate": 1.9517042097222826e-05, "loss": 0.0126, "step": 100570 }, { "epoch": 1.45, "learning_rate": 1.951699405748435e-05, "loss": 0.012, "step": 100580 }, { "epoch": 1.45, "learning_rate": 1.951694601774588e-05, "loss": 0.0098, "step": 100590 }, { "epoch": 1.45, "learning_rate": 1.951689797800741e-05, "loss": 0.0131, "step": 100600 }, { "epoch": 1.45, "learning_rate": 1.951684993826894e-05, "loss": 0.0127, "step": 100610 }, { "epoch": 1.45, "learning_rate": 1.9516801898530465e-05, "loss": 0.0137, "step": 100620 }, { "epoch": 1.45, "learning_rate": 1.9516753858791995e-05, "loss": 0.0121, "step": 100630 }, { "epoch": 1.45, "learning_rate": 1.9516705819053524e-05, "loss": 0.0117, "step": 100640 }, { "epoch": 1.45, "learning_rate": 1.951665777931505e-05, "loss": 0.0106, "step": 100650 }, { "epoch": 1.45, "learning_rate": 1.951660973957658e-05, "loss": 0.0095, "step": 100660 }, { "epoch": 1.45, "learning_rate": 1.951656169983811e-05, "loss": 0.0091, "step": 100670 }, { "epoch": 1.45, "learning_rate": 1.9516513660099638e-05, "loss": 0.0116, "step": 100680 }, { "epoch": 1.45, "learning_rate": 1.9516465620361163e-05, "loss": 0.01, "step": 100690 }, { "epoch": 1.45, "learning_rate": 1.9516417580622693e-05, "loss": 0.0111, "step": 100700 }, { "epoch": 1.45, "learning_rate": 1.9516369540884222e-05, "loss": 0.0118, "step": 100710 }, { "epoch": 1.45, "learning_rate": 1.951632150114575e-05, "loss": 0.015, "step": 100720 }, { "epoch": 1.45, "learning_rate": 1.9516273461407277e-05, "loss": 0.012, "step": 100730 }, { "epoch": 1.45, "learning_rate": 1.9516225421668806e-05, "loss": 0.0131, "step": 100740 }, { "epoch": 1.45, "learning_rate": 1.9516177381930336e-05, "loss": 0.0101, "step": 100750 }, { "epoch": 1.45, "learning_rate": 1.951612934219186e-05, "loss": 0.0144, "step": 100760 }, { "epoch": 1.45, "learning_rate": 1.951608130245339e-05, "loss": 0.0157, "step": 100770 }, { "epoch": 1.45, "learning_rate": 1.951603326271492e-05, "loss": 0.0142, "step": 100780 }, { "epoch": 1.45, "learning_rate": 1.951598522297645e-05, "loss": 0.0105, "step": 100790 }, { "epoch": 1.45, "learning_rate": 1.9515937183237975e-05, "loss": 0.0109, "step": 100800 }, { "epoch": 1.45, "learning_rate": 1.9515889143499505e-05, "loss": 0.0125, "step": 100810 }, { "epoch": 1.45, "learning_rate": 1.9515841103761034e-05, "loss": 0.0134, "step": 100820 }, { "epoch": 1.45, "learning_rate": 1.951579306402256e-05, "loss": 0.0092, "step": 100830 }, { "epoch": 1.45, "learning_rate": 1.951574502428409e-05, "loss": 0.0165, "step": 100840 }, { "epoch": 1.45, "learning_rate": 1.9515696984545618e-05, "loss": 0.013, "step": 100850 }, { "epoch": 1.45, "learning_rate": 1.9515648944807147e-05, "loss": 0.0112, "step": 100860 }, { "epoch": 1.45, "learning_rate": 1.9515600905068673e-05, "loss": 0.0105, "step": 100870 }, { "epoch": 1.45, "learning_rate": 1.9515552865330203e-05, "loss": 0.0131, "step": 100880 }, { "epoch": 1.45, "learning_rate": 1.9515504825591732e-05, "loss": 0.0115, "step": 100890 }, { "epoch": 1.45, "learning_rate": 1.951545678585326e-05, "loss": 0.0099, "step": 100900 }, { "epoch": 1.45, "learning_rate": 1.9515408746114787e-05, "loss": 0.0137, "step": 100910 }, { "epoch": 1.45, "learning_rate": 1.9515360706376316e-05, "loss": 0.0125, "step": 100920 }, { "epoch": 1.45, "learning_rate": 1.9515312666637846e-05, "loss": 0.0107, "step": 100930 }, { "epoch": 1.45, "learning_rate": 1.951526462689937e-05, "loss": 0.0137, "step": 100940 }, { "epoch": 1.45, "learning_rate": 1.95152165871609e-05, "loss": 0.0098, "step": 100950 }, { "epoch": 1.46, "learning_rate": 1.951516854742243e-05, "loss": 0.0143, "step": 100960 }, { "epoch": 1.46, "learning_rate": 1.951512050768396e-05, "loss": 0.0118, "step": 100970 }, { "epoch": 1.46, "learning_rate": 1.9515072467945485e-05, "loss": 0.0134, "step": 100980 }, { "epoch": 1.46, "learning_rate": 1.9515024428207014e-05, "loss": 0.0117, "step": 100990 }, { "epoch": 1.46, "learning_rate": 1.9514976388468544e-05, "loss": 0.0119, "step": 101000 }, { "epoch": 1.46, "learning_rate": 1.951492834873007e-05, "loss": 0.0113, "step": 101010 }, { "epoch": 1.46, "learning_rate": 1.95148803089916e-05, "loss": 0.0142, "step": 101020 }, { "epoch": 1.46, "learning_rate": 1.9514832269253128e-05, "loss": 0.0091, "step": 101030 }, { "epoch": 1.46, "learning_rate": 1.9514784229514657e-05, "loss": 0.0101, "step": 101040 }, { "epoch": 1.46, "learning_rate": 1.9514736189776183e-05, "loss": 0.0106, "step": 101050 }, { "epoch": 1.46, "learning_rate": 1.9514688150037713e-05, "loss": 0.0119, "step": 101060 }, { "epoch": 1.46, "learning_rate": 1.9514640110299242e-05, "loss": 0.0109, "step": 101070 }, { "epoch": 1.46, "learning_rate": 1.951459207056077e-05, "loss": 0.0104, "step": 101080 }, { "epoch": 1.46, "learning_rate": 1.9514544030822297e-05, "loss": 0.0117, "step": 101090 }, { "epoch": 1.46, "learning_rate": 1.9514495991083826e-05, "loss": 0.013, "step": 101100 }, { "epoch": 1.46, "learning_rate": 1.9514447951345356e-05, "loss": 0.0087, "step": 101110 }, { "epoch": 1.46, "learning_rate": 1.951439991160688e-05, "loss": 0.0127, "step": 101120 }, { "epoch": 1.46, "learning_rate": 1.951435187186841e-05, "loss": 0.0073, "step": 101130 }, { "epoch": 1.46, "learning_rate": 1.951430383212994e-05, "loss": 0.0104, "step": 101140 }, { "epoch": 1.46, "learning_rate": 1.951425579239147e-05, "loss": 0.0112, "step": 101150 }, { "epoch": 1.46, "learning_rate": 1.9514207752652995e-05, "loss": 0.0121, "step": 101160 }, { "epoch": 1.46, "learning_rate": 1.9514159712914524e-05, "loss": 0.0118, "step": 101170 }, { "epoch": 1.46, "learning_rate": 1.9514111673176054e-05, "loss": 0.011, "step": 101180 }, { "epoch": 1.46, "learning_rate": 1.951406363343758e-05, "loss": 0.0096, "step": 101190 }, { "epoch": 1.46, "learning_rate": 1.951401559369911e-05, "loss": 0.0088, "step": 101200 }, { "epoch": 1.46, "learning_rate": 1.9513967553960638e-05, "loss": 0.0141, "step": 101210 }, { "epoch": 1.46, "learning_rate": 1.9513919514222167e-05, "loss": 0.0142, "step": 101220 }, { "epoch": 1.46, "learning_rate": 1.9513871474483693e-05, "loss": 0.0096, "step": 101230 }, { "epoch": 1.46, "learning_rate": 1.9513823434745222e-05, "loss": 0.0119, "step": 101240 }, { "epoch": 1.46, "learning_rate": 1.9513775395006752e-05, "loss": 0.0146, "step": 101250 }, { "epoch": 1.46, "learning_rate": 1.951372735526828e-05, "loss": 0.0162, "step": 101260 }, { "epoch": 1.46, "learning_rate": 1.9513679315529807e-05, "loss": 0.011, "step": 101270 }, { "epoch": 1.46, "learning_rate": 1.9513631275791336e-05, "loss": 0.0096, "step": 101280 }, { "epoch": 1.46, "learning_rate": 1.9513583236052865e-05, "loss": 0.0145, "step": 101290 }, { "epoch": 1.46, "learning_rate": 1.951353519631439e-05, "loss": 0.0087, "step": 101300 }, { "epoch": 1.46, "learning_rate": 1.951348715657592e-05, "loss": 0.0122, "step": 101310 }, { "epoch": 1.46, "learning_rate": 1.951343911683745e-05, "loss": 0.0078, "step": 101320 }, { "epoch": 1.46, "learning_rate": 1.951339107709898e-05, "loss": 0.0123, "step": 101330 }, { "epoch": 1.46, "learning_rate": 1.9513343037360505e-05, "loss": 0.0103, "step": 101340 }, { "epoch": 1.46, "learning_rate": 1.9513294997622034e-05, "loss": 0.01, "step": 101350 }, { "epoch": 1.46, "learning_rate": 1.9513246957883564e-05, "loss": 0.0095, "step": 101360 }, { "epoch": 1.46, "learning_rate": 1.951319891814509e-05, "loss": 0.0063, "step": 101370 }, { "epoch": 1.46, "learning_rate": 1.951315087840662e-05, "loss": 0.0126, "step": 101380 }, { "epoch": 1.46, "learning_rate": 1.9513102838668148e-05, "loss": 0.0075, "step": 101390 }, { "epoch": 1.46, "learning_rate": 1.9513054798929677e-05, "loss": 0.0129, "step": 101400 }, { "epoch": 1.46, "learning_rate": 1.9513006759191203e-05, "loss": 0.0113, "step": 101410 }, { "epoch": 1.46, "learning_rate": 1.9512958719452732e-05, "loss": 0.0082, "step": 101420 }, { "epoch": 1.46, "learning_rate": 1.951291067971426e-05, "loss": 0.0109, "step": 101430 }, { "epoch": 1.46, "learning_rate": 1.9512862639975788e-05, "loss": 0.015, "step": 101440 }, { "epoch": 1.46, "learning_rate": 1.9512814600237317e-05, "loss": 0.0121, "step": 101450 }, { "epoch": 1.46, "learning_rate": 1.9512766560498846e-05, "loss": 0.0111, "step": 101460 }, { "epoch": 1.46, "learning_rate": 1.9512718520760375e-05, "loss": 0.0069, "step": 101470 }, { "epoch": 1.46, "learning_rate": 1.95126704810219e-05, "loss": 0.0079, "step": 101480 }, { "epoch": 1.46, "learning_rate": 1.951262244128343e-05, "loss": 0.0111, "step": 101490 }, { "epoch": 1.46, "learning_rate": 1.951257440154496e-05, "loss": 0.0095, "step": 101500 }, { "epoch": 1.46, "learning_rate": 1.951252636180649e-05, "loss": 0.0154, "step": 101510 }, { "epoch": 1.46, "learning_rate": 1.9512478322068015e-05, "loss": 0.0124, "step": 101520 }, { "epoch": 1.46, "learning_rate": 1.9512430282329544e-05, "loss": 0.0081, "step": 101530 }, { "epoch": 1.46, "learning_rate": 1.9512382242591073e-05, "loss": 0.0085, "step": 101540 }, { "epoch": 1.46, "learning_rate": 1.95123342028526e-05, "loss": 0.0161, "step": 101550 }, { "epoch": 1.46, "learning_rate": 1.951228616311413e-05, "loss": 0.0121, "step": 101560 }, { "epoch": 1.46, "learning_rate": 1.9512238123375658e-05, "loss": 0.0088, "step": 101570 }, { "epoch": 1.46, "learning_rate": 1.9512190083637187e-05, "loss": 0.0095, "step": 101580 }, { "epoch": 1.46, "learning_rate": 1.9512142043898713e-05, "loss": 0.0092, "step": 101590 }, { "epoch": 1.46, "learning_rate": 1.9512094004160242e-05, "loss": 0.0092, "step": 101600 }, { "epoch": 1.46, "learning_rate": 1.951204596442177e-05, "loss": 0.0121, "step": 101610 }, { "epoch": 1.46, "learning_rate": 1.9511997924683297e-05, "loss": 0.0083, "step": 101620 }, { "epoch": 1.46, "learning_rate": 1.9511949884944827e-05, "loss": 0.0122, "step": 101630 }, { "epoch": 1.46, "learning_rate": 1.9511901845206356e-05, "loss": 0.0144, "step": 101640 }, { "epoch": 1.46, "learning_rate": 1.9511853805467885e-05, "loss": 0.0116, "step": 101650 }, { "epoch": 1.47, "learning_rate": 1.951180576572941e-05, "loss": 0.01, "step": 101660 }, { "epoch": 1.47, "learning_rate": 1.951175772599094e-05, "loss": 0.0088, "step": 101670 }, { "epoch": 1.47, "learning_rate": 1.951170968625247e-05, "loss": 0.0093, "step": 101680 }, { "epoch": 1.47, "learning_rate": 1.9511661646514e-05, "loss": 0.0108, "step": 101690 }, { "epoch": 1.47, "learning_rate": 1.9511613606775525e-05, "loss": 0.0142, "step": 101700 }, { "epoch": 1.47, "learning_rate": 1.9511565567037054e-05, "loss": 0.0131, "step": 101710 }, { "epoch": 1.47, "learning_rate": 1.9511517527298583e-05, "loss": 0.0106, "step": 101720 }, { "epoch": 1.47, "learning_rate": 1.951146948756011e-05, "loss": 0.0085, "step": 101730 }, { "epoch": 1.47, "learning_rate": 1.951142144782164e-05, "loss": 0.0114, "step": 101740 }, { "epoch": 1.47, "learning_rate": 1.9511373408083168e-05, "loss": 0.0122, "step": 101750 }, { "epoch": 1.47, "learning_rate": 1.9511325368344697e-05, "loss": 0.0161, "step": 101760 }, { "epoch": 1.47, "learning_rate": 1.9511277328606223e-05, "loss": 0.0089, "step": 101770 }, { "epoch": 1.47, "learning_rate": 1.9511229288867752e-05, "loss": 0.0123, "step": 101780 }, { "epoch": 1.47, "learning_rate": 1.951118124912928e-05, "loss": 0.015, "step": 101790 }, { "epoch": 1.47, "learning_rate": 1.9511133209390807e-05, "loss": 0.0101, "step": 101800 }, { "epoch": 1.47, "learning_rate": 1.9511085169652337e-05, "loss": 0.0157, "step": 101810 }, { "epoch": 1.47, "learning_rate": 1.9511037129913866e-05, "loss": 0.0132, "step": 101820 }, { "epoch": 1.47, "learning_rate": 1.9510989090175395e-05, "loss": 0.0141, "step": 101830 }, { "epoch": 1.47, "learning_rate": 1.951094105043692e-05, "loss": 0.0101, "step": 101840 }, { "epoch": 1.47, "learning_rate": 1.951089301069845e-05, "loss": 0.0105, "step": 101850 }, { "epoch": 1.47, "learning_rate": 1.951084497095998e-05, "loss": 0.0126, "step": 101860 }, { "epoch": 1.47, "learning_rate": 1.951079693122151e-05, "loss": 0.0114, "step": 101870 }, { "epoch": 1.47, "learning_rate": 1.9510748891483035e-05, "loss": 0.0102, "step": 101880 }, { "epoch": 1.47, "learning_rate": 1.9510700851744564e-05, "loss": 0.0163, "step": 101890 }, { "epoch": 1.47, "learning_rate": 1.9510652812006093e-05, "loss": 0.0121, "step": 101900 }, { "epoch": 1.47, "learning_rate": 1.951060477226762e-05, "loss": 0.0095, "step": 101910 }, { "epoch": 1.47, "learning_rate": 1.951055673252915e-05, "loss": 0.0119, "step": 101920 }, { "epoch": 1.47, "learning_rate": 1.9510508692790678e-05, "loss": 0.0119, "step": 101930 }, { "epoch": 1.47, "learning_rate": 1.9510460653052207e-05, "loss": 0.0079, "step": 101940 }, { "epoch": 1.47, "learning_rate": 1.9510412613313733e-05, "loss": 0.0122, "step": 101950 }, { "epoch": 1.47, "learning_rate": 1.9510364573575262e-05, "loss": 0.0106, "step": 101960 }, { "epoch": 1.47, "learning_rate": 1.951031653383679e-05, "loss": 0.0135, "step": 101970 }, { "epoch": 1.47, "learning_rate": 1.9510268494098317e-05, "loss": 0.0153, "step": 101980 }, { "epoch": 1.47, "learning_rate": 1.9510220454359847e-05, "loss": 0.0139, "step": 101990 }, { "epoch": 1.47, "learning_rate": 1.9510172414621376e-05, "loss": 0.0093, "step": 102000 }, { "epoch": 1.47, "learning_rate": 1.9510124374882905e-05, "loss": 0.0075, "step": 102010 }, { "epoch": 1.47, "learning_rate": 1.951007633514443e-05, "loss": 0.009, "step": 102020 }, { "epoch": 1.47, "learning_rate": 1.951003309937981e-05, "loss": 0.0097, "step": 102030 }, { "epoch": 1.47, "learning_rate": 1.9509985059641335e-05, "loss": 0.0111, "step": 102040 }, { "epoch": 1.47, "learning_rate": 1.9509937019902864e-05, "loss": 0.0098, "step": 102050 }, { "epoch": 1.47, "learning_rate": 1.9509888980164393e-05, "loss": 0.0091, "step": 102060 }, { "epoch": 1.47, "learning_rate": 1.9509840940425923e-05, "loss": 0.0114, "step": 102070 }, { "epoch": 1.47, "learning_rate": 1.950979290068745e-05, "loss": 0.014, "step": 102080 }, { "epoch": 1.47, "learning_rate": 1.9509744860948978e-05, "loss": 0.0131, "step": 102090 }, { "epoch": 1.47, "learning_rate": 1.9509696821210507e-05, "loss": 0.01, "step": 102100 }, { "epoch": 1.47, "learning_rate": 1.9509648781472036e-05, "loss": 0.0125, "step": 102110 }, { "epoch": 1.47, "learning_rate": 1.9509600741733562e-05, "loss": 0.0147, "step": 102120 }, { "epoch": 1.47, "learning_rate": 1.950955270199509e-05, "loss": 0.0146, "step": 102130 }, { "epoch": 1.47, "learning_rate": 1.950950466225662e-05, "loss": 0.0141, "step": 102140 }, { "epoch": 1.47, "learning_rate": 1.9509456622518147e-05, "loss": 0.0072, "step": 102150 }, { "epoch": 1.47, "learning_rate": 1.9509408582779676e-05, "loss": 0.0149, "step": 102160 }, { "epoch": 1.47, "learning_rate": 1.9509360543041205e-05, "loss": 0.0118, "step": 102170 }, { "epoch": 1.47, "learning_rate": 1.9509312503302735e-05, "loss": 0.0107, "step": 102180 }, { "epoch": 1.47, "learning_rate": 1.950926446356426e-05, "loss": 0.0126, "step": 102190 }, { "epoch": 1.47, "learning_rate": 1.950921642382579e-05, "loss": 0.0089, "step": 102200 }, { "epoch": 1.47, "learning_rate": 1.950916838408732e-05, "loss": 0.0117, "step": 102210 }, { "epoch": 1.47, "learning_rate": 1.9509120344348845e-05, "loss": 0.0101, "step": 102220 }, { "epoch": 1.47, "learning_rate": 1.9509072304610374e-05, "loss": 0.0127, "step": 102230 }, { "epoch": 1.47, "learning_rate": 1.9509024264871903e-05, "loss": 0.0124, "step": 102240 }, { "epoch": 1.47, "learning_rate": 1.9508976225133433e-05, "loss": 0.01, "step": 102250 }, { "epoch": 1.47, "learning_rate": 1.950892818539496e-05, "loss": 0.0106, "step": 102260 }, { "epoch": 1.47, "learning_rate": 1.9508880145656488e-05, "loss": 0.0133, "step": 102270 }, { "epoch": 1.47, "learning_rate": 1.9508832105918017e-05, "loss": 0.0124, "step": 102280 }, { "epoch": 1.47, "learning_rate": 1.9508784066179546e-05, "loss": 0.0098, "step": 102290 }, { "epoch": 1.47, "learning_rate": 1.9508736026441072e-05, "loss": 0.0138, "step": 102300 }, { "epoch": 1.47, "learning_rate": 1.95086879867026e-05, "loss": 0.0144, "step": 102310 }, { "epoch": 1.47, "learning_rate": 1.950863994696413e-05, "loss": 0.0131, "step": 102320 }, { "epoch": 1.47, "learning_rate": 1.9508591907225657e-05, "loss": 0.0169, "step": 102330 }, { "epoch": 1.47, "learning_rate": 1.9508543867487186e-05, "loss": 0.0111, "step": 102340 }, { "epoch": 1.48, "learning_rate": 1.9508495827748715e-05, "loss": 0.0101, "step": 102350 }, { "epoch": 1.48, "learning_rate": 1.9508447788010244e-05, "loss": 0.0113, "step": 102360 }, { "epoch": 1.48, "learning_rate": 1.950839974827177e-05, "loss": 0.0123, "step": 102370 }, { "epoch": 1.48, "learning_rate": 1.95083517085333e-05, "loss": 0.0157, "step": 102380 }, { "epoch": 1.48, "learning_rate": 1.950830366879483e-05, "loss": 0.0116, "step": 102390 }, { "epoch": 1.48, "learning_rate": 1.9508255629056355e-05, "loss": 0.0109, "step": 102400 }, { "epoch": 1.48, "learning_rate": 1.9508207589317884e-05, "loss": 0.0093, "step": 102410 }, { "epoch": 1.48, "learning_rate": 1.9508159549579413e-05, "loss": 0.0188, "step": 102420 }, { "epoch": 1.48, "learning_rate": 1.9508111509840943e-05, "loss": 0.0137, "step": 102430 }, { "epoch": 1.48, "learning_rate": 1.950806347010247e-05, "loss": 0.013, "step": 102440 }, { "epoch": 1.48, "learning_rate": 1.9508015430363998e-05, "loss": 0.0114, "step": 102450 }, { "epoch": 1.48, "learning_rate": 1.9507967390625527e-05, "loss": 0.0095, "step": 102460 }, { "epoch": 1.48, "learning_rate": 1.9507919350887056e-05, "loss": 0.0139, "step": 102470 }, { "epoch": 1.48, "learning_rate": 1.9507871311148582e-05, "loss": 0.0116, "step": 102480 }, { "epoch": 1.48, "learning_rate": 1.950782327141011e-05, "loss": 0.0097, "step": 102490 }, { "epoch": 1.48, "learning_rate": 1.950777523167164e-05, "loss": 0.0139, "step": 102500 }, { "epoch": 1.48, "learning_rate": 1.9507727191933167e-05, "loss": 0.008, "step": 102510 }, { "epoch": 1.48, "learning_rate": 1.9507679152194696e-05, "loss": 0.0103, "step": 102520 }, { "epoch": 1.48, "learning_rate": 1.9507631112456225e-05, "loss": 0.0073, "step": 102530 }, { "epoch": 1.48, "learning_rate": 1.9507583072717754e-05, "loss": 0.0092, "step": 102540 }, { "epoch": 1.48, "learning_rate": 1.950753503297928e-05, "loss": 0.0103, "step": 102550 }, { "epoch": 1.48, "learning_rate": 1.950748699324081e-05, "loss": 0.0153, "step": 102560 }, { "epoch": 1.48, "learning_rate": 1.950743895350234e-05, "loss": 0.0103, "step": 102570 }, { "epoch": 1.48, "learning_rate": 1.9507390913763865e-05, "loss": 0.0118, "step": 102580 }, { "epoch": 1.48, "learning_rate": 1.9507342874025394e-05, "loss": 0.0092, "step": 102590 }, { "epoch": 1.48, "learning_rate": 1.9507294834286923e-05, "loss": 0.0075, "step": 102600 }, { "epoch": 1.48, "learning_rate": 1.9507246794548452e-05, "loss": 0.0107, "step": 102610 }, { "epoch": 1.48, "learning_rate": 1.950719875480998e-05, "loss": 0.0133, "step": 102620 }, { "epoch": 1.48, "learning_rate": 1.9507150715071508e-05, "loss": 0.0132, "step": 102630 }, { "epoch": 1.48, "learning_rate": 1.9507102675333037e-05, "loss": 0.013, "step": 102640 }, { "epoch": 1.48, "learning_rate": 1.9507054635594566e-05, "loss": 0.014, "step": 102650 }, { "epoch": 1.48, "learning_rate": 1.9507006595856092e-05, "loss": 0.0094, "step": 102660 }, { "epoch": 1.48, "learning_rate": 1.950695855611762e-05, "loss": 0.0117, "step": 102670 }, { "epoch": 1.48, "learning_rate": 1.950691051637915e-05, "loss": 0.0109, "step": 102680 }, { "epoch": 1.48, "learning_rate": 1.9506862476640676e-05, "loss": 0.0129, "step": 102690 }, { "epoch": 1.48, "learning_rate": 1.9506814436902206e-05, "loss": 0.0125, "step": 102700 }, { "epoch": 1.48, "learning_rate": 1.9506766397163735e-05, "loss": 0.0111, "step": 102710 }, { "epoch": 1.48, "learning_rate": 1.9506718357425264e-05, "loss": 0.01, "step": 102720 }, { "epoch": 1.48, "learning_rate": 1.950667031768679e-05, "loss": 0.0107, "step": 102730 }, { "epoch": 1.48, "learning_rate": 1.950662227794832e-05, "loss": 0.0132, "step": 102740 }, { "epoch": 1.48, "learning_rate": 1.950657423820985e-05, "loss": 0.0165, "step": 102750 }, { "epoch": 1.48, "learning_rate": 1.9506526198471375e-05, "loss": 0.009, "step": 102760 }, { "epoch": 1.48, "learning_rate": 1.9506478158732904e-05, "loss": 0.012, "step": 102770 }, { "epoch": 1.48, "learning_rate": 1.9506430118994433e-05, "loss": 0.0109, "step": 102780 }, { "epoch": 1.48, "learning_rate": 1.9506382079255962e-05, "loss": 0.0078, "step": 102790 }, { "epoch": 1.48, "learning_rate": 1.9506334039517488e-05, "loss": 0.0145, "step": 102800 }, { "epoch": 1.48, "learning_rate": 1.9506285999779018e-05, "loss": 0.0154, "step": 102810 }, { "epoch": 1.48, "learning_rate": 1.9506237960040547e-05, "loss": 0.0093, "step": 102820 }, { "epoch": 1.48, "learning_rate": 1.9506189920302076e-05, "loss": 0.0134, "step": 102830 }, { "epoch": 1.48, "learning_rate": 1.9506141880563605e-05, "loss": 0.013, "step": 102840 }, { "epoch": 1.48, "learning_rate": 1.9506093840825135e-05, "loss": 0.01, "step": 102850 }, { "epoch": 1.48, "learning_rate": 1.950604580108666e-05, "loss": 0.018, "step": 102860 }, { "epoch": 1.48, "learning_rate": 1.950599776134819e-05, "loss": 0.0086, "step": 102870 }, { "epoch": 1.48, "learning_rate": 1.950594972160972e-05, "loss": 0.0092, "step": 102880 }, { "epoch": 1.48, "learning_rate": 1.9505901681871245e-05, "loss": 0.0132, "step": 102890 }, { "epoch": 1.48, "learning_rate": 1.9505853642132774e-05, "loss": 0.0146, "step": 102900 }, { "epoch": 1.48, "learning_rate": 1.9505805602394303e-05, "loss": 0.0108, "step": 102910 }, { "epoch": 1.48, "learning_rate": 1.9505757562655833e-05, "loss": 0.0165, "step": 102920 }, { "epoch": 1.48, "learning_rate": 1.950570952291736e-05, "loss": 0.0085, "step": 102930 }, { "epoch": 1.48, "learning_rate": 1.9505661483178888e-05, "loss": 0.0088, "step": 102940 }, { "epoch": 1.48, "learning_rate": 1.9505613443440417e-05, "loss": 0.0075, "step": 102950 }, { "epoch": 1.48, "learning_rate": 1.9505565403701946e-05, "loss": 0.0116, "step": 102960 }, { "epoch": 1.48, "learning_rate": 1.9505517363963472e-05, "loss": 0.0168, "step": 102970 }, { "epoch": 1.48, "learning_rate": 1.9505469324225e-05, "loss": 0.0132, "step": 102980 }, { "epoch": 1.48, "learning_rate": 1.950542128448653e-05, "loss": 0.0125, "step": 102990 }, { "epoch": 1.48, "learning_rate": 1.9505373244748057e-05, "loss": 0.0087, "step": 103000 }, { "epoch": 1.48, "learning_rate": 1.9505325205009586e-05, "loss": 0.0114, "step": 103010 }, { "epoch": 1.48, "learning_rate": 1.9505277165271115e-05, "loss": 0.0118, "step": 103020 }, { "epoch": 1.48, "learning_rate": 1.9505229125532645e-05, "loss": 0.0123, "step": 103030 }, { "epoch": 1.49, "learning_rate": 1.950518108579417e-05, "loss": 0.0093, "step": 103040 }, { "epoch": 1.49, "learning_rate": 1.95051330460557e-05, "loss": 0.0096, "step": 103050 }, { "epoch": 1.49, "learning_rate": 1.950508500631723e-05, "loss": 0.0079, "step": 103060 }, { "epoch": 1.49, "learning_rate": 1.9505036966578755e-05, "loss": 0.0107, "step": 103070 }, { "epoch": 1.49, "learning_rate": 1.9504988926840284e-05, "loss": 0.0115, "step": 103080 }, { "epoch": 1.49, "learning_rate": 1.9504940887101813e-05, "loss": 0.0099, "step": 103090 }, { "epoch": 1.49, "learning_rate": 1.9504892847363343e-05, "loss": 0.0088, "step": 103100 }, { "epoch": 1.49, "learning_rate": 1.950484480762487e-05, "loss": 0.0108, "step": 103110 }, { "epoch": 1.49, "learning_rate": 1.9504796767886398e-05, "loss": 0.0123, "step": 103120 }, { "epoch": 1.49, "learning_rate": 1.9504748728147927e-05, "loss": 0.0113, "step": 103130 }, { "epoch": 1.49, "learning_rate": 1.9504700688409456e-05, "loss": 0.0108, "step": 103140 }, { "epoch": 1.49, "learning_rate": 1.9504652648670982e-05, "loss": 0.0068, "step": 103150 }, { "epoch": 1.49, "learning_rate": 1.950460460893251e-05, "loss": 0.0161, "step": 103160 }, { "epoch": 1.49, "learning_rate": 1.950455656919404e-05, "loss": 0.012, "step": 103170 }, { "epoch": 1.49, "learning_rate": 1.9504508529455567e-05, "loss": 0.0123, "step": 103180 }, { "epoch": 1.49, "learning_rate": 1.9504460489717096e-05, "loss": 0.0152, "step": 103190 }, { "epoch": 1.49, "learning_rate": 1.9504412449978625e-05, "loss": 0.0116, "step": 103200 }, { "epoch": 1.49, "learning_rate": 1.9504364410240154e-05, "loss": 0.0107, "step": 103210 }, { "epoch": 1.49, "learning_rate": 1.950431637050168e-05, "loss": 0.0216, "step": 103220 }, { "epoch": 1.49, "learning_rate": 1.950426833076321e-05, "loss": 0.0112, "step": 103230 }, { "epoch": 1.49, "learning_rate": 1.950422029102474e-05, "loss": 0.0102, "step": 103240 }, { "epoch": 1.49, "learning_rate": 1.9504172251286265e-05, "loss": 0.0155, "step": 103250 }, { "epoch": 1.49, "learning_rate": 1.9504124211547794e-05, "loss": 0.0107, "step": 103260 }, { "epoch": 1.49, "learning_rate": 1.9504076171809323e-05, "loss": 0.0121, "step": 103270 }, { "epoch": 1.49, "learning_rate": 1.9504028132070853e-05, "loss": 0.0079, "step": 103280 }, { "epoch": 1.49, "learning_rate": 1.950398009233238e-05, "loss": 0.0132, "step": 103290 }, { "epoch": 1.49, "learning_rate": 1.9503932052593908e-05, "loss": 0.0083, "step": 103300 }, { "epoch": 1.49, "learning_rate": 1.9503884012855437e-05, "loss": 0.0103, "step": 103310 }, { "epoch": 1.49, "learning_rate": 1.9503835973116966e-05, "loss": 0.0125, "step": 103320 }, { "epoch": 1.49, "learning_rate": 1.9503787933378492e-05, "loss": 0.0173, "step": 103330 }, { "epoch": 1.49, "learning_rate": 1.950373989364002e-05, "loss": 0.0095, "step": 103340 }, { "epoch": 1.49, "learning_rate": 1.950369185390155e-05, "loss": 0.0093, "step": 103350 }, { "epoch": 1.49, "learning_rate": 1.9503643814163077e-05, "loss": 0.0139, "step": 103360 }, { "epoch": 1.49, "learning_rate": 1.9503595774424606e-05, "loss": 0.0078, "step": 103370 }, { "epoch": 1.49, "learning_rate": 1.9503547734686135e-05, "loss": 0.0162, "step": 103380 }, { "epoch": 1.49, "learning_rate": 1.9503499694947664e-05, "loss": 0.0094, "step": 103390 }, { "epoch": 1.49, "learning_rate": 1.950345165520919e-05, "loss": 0.0098, "step": 103400 }, { "epoch": 1.49, "learning_rate": 1.950340361547072e-05, "loss": 0.0089, "step": 103410 }, { "epoch": 1.49, "learning_rate": 1.950335557573225e-05, "loss": 0.0155, "step": 103420 }, { "epoch": 1.49, "learning_rate": 1.9503307535993775e-05, "loss": 0.0113, "step": 103430 }, { "epoch": 1.49, "learning_rate": 1.9503259496255304e-05, "loss": 0.0102, "step": 103440 }, { "epoch": 1.49, "learning_rate": 1.9503211456516833e-05, "loss": 0.0111, "step": 103450 }, { "epoch": 1.49, "learning_rate": 1.9503163416778362e-05, "loss": 0.0098, "step": 103460 }, { "epoch": 1.49, "learning_rate": 1.950311537703989e-05, "loss": 0.011, "step": 103470 }, { "epoch": 1.49, "learning_rate": 1.9503067337301418e-05, "loss": 0.0086, "step": 103480 }, { "epoch": 1.49, "learning_rate": 1.9503019297562947e-05, "loss": 0.0126, "step": 103490 }, { "epoch": 1.49, "learning_rate": 1.9502971257824476e-05, "loss": 0.0075, "step": 103500 }, { "epoch": 1.49, "learning_rate": 1.9502923218086002e-05, "loss": 0.029, "step": 103510 }, { "epoch": 1.49, "learning_rate": 1.950287517834753e-05, "loss": 0.0107, "step": 103520 }, { "epoch": 1.49, "learning_rate": 1.950282713860906e-05, "loss": 0.0166, "step": 103530 }, { "epoch": 1.49, "learning_rate": 1.9502779098870586e-05, "loss": 0.0082, "step": 103540 }, { "epoch": 1.49, "learning_rate": 1.9502731059132116e-05, "loss": 0.0102, "step": 103550 }, { "epoch": 1.49, "learning_rate": 1.9502683019393645e-05, "loss": 0.0147, "step": 103560 }, { "epoch": 1.49, "learning_rate": 1.9502634979655174e-05, "loss": 0.0094, "step": 103570 }, { "epoch": 1.49, "learning_rate": 1.95025869399167e-05, "loss": 0.0096, "step": 103580 }, { "epoch": 1.49, "learning_rate": 1.950253890017823e-05, "loss": 0.009, "step": 103590 }, { "epoch": 1.49, "learning_rate": 1.950249086043976e-05, "loss": 0.0101, "step": 103600 }, { "epoch": 1.49, "learning_rate": 1.9502442820701285e-05, "loss": 0.0117, "step": 103610 }, { "epoch": 1.49, "learning_rate": 1.9502394780962814e-05, "loss": 0.0113, "step": 103620 }, { "epoch": 1.49, "learning_rate": 1.9502346741224343e-05, "loss": 0.0102, "step": 103630 }, { "epoch": 1.49, "learning_rate": 1.9502298701485872e-05, "loss": 0.0081, "step": 103640 }, { "epoch": 1.49, "learning_rate": 1.9502250661747398e-05, "loss": 0.0117, "step": 103650 }, { "epoch": 1.49, "learning_rate": 1.9502202622008928e-05, "loss": 0.0122, "step": 103660 }, { "epoch": 1.49, "learning_rate": 1.9502154582270457e-05, "loss": 0.0128, "step": 103670 }, { "epoch": 1.49, "learning_rate": 1.9502106542531986e-05, "loss": 0.0114, "step": 103680 }, { "epoch": 1.49, "learning_rate": 1.9502058502793512e-05, "loss": 0.0109, "step": 103690 }, { "epoch": 1.49, "learning_rate": 1.950201046305504e-05, "loss": 0.0077, "step": 103700 }, { "epoch": 1.49, "learning_rate": 1.950196242331657e-05, "loss": 0.011, "step": 103710 }, { "epoch": 1.49, "learning_rate": 1.9501914383578096e-05, "loss": 0.0116, "step": 103720 }, { "epoch": 1.49, "learning_rate": 1.9501866343839626e-05, "loss": 0.0124, "step": 103730 }, { "epoch": 1.5, "learning_rate": 1.9501818304101155e-05, "loss": 0.0095, "step": 103740 }, { "epoch": 1.5, "learning_rate": 1.9501770264362684e-05, "loss": 0.0187, "step": 103750 }, { "epoch": 1.5, "learning_rate": 1.950172222462421e-05, "loss": 0.011, "step": 103760 }, { "epoch": 1.5, "learning_rate": 1.950167418488574e-05, "loss": 0.0108, "step": 103770 }, { "epoch": 1.5, "learning_rate": 1.950162614514727e-05, "loss": 0.0121, "step": 103780 }, { "epoch": 1.5, "learning_rate": 1.9501578105408794e-05, "loss": 0.0078, "step": 103790 }, { "epoch": 1.5, "learning_rate": 1.9501530065670324e-05, "loss": 0.012, "step": 103800 }, { "epoch": 1.5, "learning_rate": 1.9501482025931853e-05, "loss": 0.014, "step": 103810 }, { "epoch": 1.5, "learning_rate": 1.9501433986193382e-05, "loss": 0.014, "step": 103820 }, { "epoch": 1.5, "learning_rate": 1.9501385946454908e-05, "loss": 0.0154, "step": 103830 }, { "epoch": 1.5, "learning_rate": 1.9501337906716437e-05, "loss": 0.0132, "step": 103840 }, { "epoch": 1.5, "learning_rate": 1.9501289866977967e-05, "loss": 0.0096, "step": 103850 }, { "epoch": 1.5, "learning_rate": 1.9501241827239496e-05, "loss": 0.0132, "step": 103860 }, { "epoch": 1.5, "learning_rate": 1.9501193787501022e-05, "loss": 0.0122, "step": 103870 }, { "epoch": 1.5, "learning_rate": 1.950114574776255e-05, "loss": 0.0082, "step": 103880 }, { "epoch": 1.5, "learning_rate": 1.950109770802408e-05, "loss": 0.0088, "step": 103890 }, { "epoch": 1.5, "learning_rate": 1.9501049668285606e-05, "loss": 0.0096, "step": 103900 }, { "epoch": 1.5, "learning_rate": 1.9501001628547136e-05, "loss": 0.0121, "step": 103910 }, { "epoch": 1.5, "learning_rate": 1.9500953588808665e-05, "loss": 0.0135, "step": 103920 }, { "epoch": 1.5, "learning_rate": 1.9500905549070194e-05, "loss": 0.0104, "step": 103930 }, { "epoch": 1.5, "learning_rate": 1.950085750933172e-05, "loss": 0.0119, "step": 103940 }, { "epoch": 1.5, "learning_rate": 1.950080946959325e-05, "loss": 0.0118, "step": 103950 }, { "epoch": 1.5, "learning_rate": 1.950076142985478e-05, "loss": 0.0076, "step": 103960 }, { "epoch": 1.5, "learning_rate": 1.9500713390116304e-05, "loss": 0.0111, "step": 103970 }, { "epoch": 1.5, "learning_rate": 1.9500665350377834e-05, "loss": 0.0107, "step": 103980 }, { "epoch": 1.5, "learning_rate": 1.9500617310639363e-05, "loss": 0.0122, "step": 103990 }, { "epoch": 1.5, "learning_rate": 1.9500569270900892e-05, "loss": 0.0081, "step": 104000 }, { "epoch": 1.5, "learning_rate": 1.9500521231162418e-05, "loss": 0.0101, "step": 104010 }, { "epoch": 1.5, "learning_rate": 1.9500473191423947e-05, "loss": 0.0135, "step": 104020 }, { "epoch": 1.5, "learning_rate": 1.9500425151685477e-05, "loss": 0.0102, "step": 104030 }, { "epoch": 1.5, "learning_rate": 1.9500377111947006e-05, "loss": 0.0122, "step": 104040 }, { "epoch": 1.5, "learning_rate": 1.9500329072208532e-05, "loss": 0.0134, "step": 104050 }, { "epoch": 1.5, "learning_rate": 1.950028103247006e-05, "loss": 0.0155, "step": 104060 }, { "epoch": 1.5, "learning_rate": 1.950023299273159e-05, "loss": 0.0089, "step": 104070 }, { "epoch": 1.5, "learning_rate": 1.9500184952993116e-05, "loss": 0.0117, "step": 104080 }, { "epoch": 1.5, "learning_rate": 1.9500136913254645e-05, "loss": 0.0105, "step": 104090 }, { "epoch": 1.5, "learning_rate": 1.9500088873516175e-05, "loss": 0.0094, "step": 104100 }, { "epoch": 1.5, "learning_rate": 1.9500040833777704e-05, "loss": 0.0058, "step": 104110 }, { "epoch": 1.5, "learning_rate": 1.949999279403923e-05, "loss": 0.0096, "step": 104120 }, { "epoch": 1.5, "learning_rate": 1.949994475430076e-05, "loss": 0.0124, "step": 104130 }, { "epoch": 1.5, "learning_rate": 1.949989671456229e-05, "loss": 0.0087, "step": 104140 }, { "epoch": 1.5, "learning_rate": 1.9499848674823814e-05, "loss": 0.0107, "step": 104150 }, { "epoch": 1.5, "learning_rate": 1.9499800635085344e-05, "loss": 0.0073, "step": 104160 }, { "epoch": 1.5, "learning_rate": 1.9499752595346873e-05, "loss": 0.014, "step": 104170 }, { "epoch": 1.5, "learning_rate": 1.9499704555608402e-05, "loss": 0.0102, "step": 104180 }, { "epoch": 1.5, "learning_rate": 1.9499656515869928e-05, "loss": 0.0099, "step": 104190 }, { "epoch": 1.5, "learning_rate": 1.9499608476131457e-05, "loss": 0.0109, "step": 104200 }, { "epoch": 1.5, "learning_rate": 1.9499560436392987e-05, "loss": 0.0103, "step": 104210 }, { "epoch": 1.5, "learning_rate": 1.9499512396654516e-05, "loss": 0.01, "step": 104220 }, { "epoch": 1.5, "learning_rate": 1.949946435691604e-05, "loss": 0.0112, "step": 104230 }, { "epoch": 1.5, "learning_rate": 1.949941631717757e-05, "loss": 0.0102, "step": 104240 }, { "epoch": 1.5, "learning_rate": 1.94993682774391e-05, "loss": 0.0072, "step": 104250 }, { "epoch": 1.5, "learning_rate": 1.9499320237700626e-05, "loss": 0.0076, "step": 104260 }, { "epoch": 1.5, "learning_rate": 1.9499272197962155e-05, "loss": 0.012, "step": 104270 }, { "epoch": 1.5, "learning_rate": 1.9499224158223685e-05, "loss": 0.013, "step": 104280 }, { "epoch": 1.5, "learning_rate": 1.9499176118485214e-05, "loss": 0.0125, "step": 104290 }, { "epoch": 1.5, "learning_rate": 1.949912807874674e-05, "loss": 0.0088, "step": 104300 }, { "epoch": 1.5, "learning_rate": 1.949908003900827e-05, "loss": 0.011, "step": 104310 }, { "epoch": 1.5, "learning_rate": 1.94990319992698e-05, "loss": 0.0113, "step": 104320 }, { "epoch": 1.5, "learning_rate": 1.9498983959531324e-05, "loss": 0.0075, "step": 104330 }, { "epoch": 1.5, "learning_rate": 1.9498935919792853e-05, "loss": 0.0112, "step": 104340 }, { "epoch": 1.5, "learning_rate": 1.9498887880054383e-05, "loss": 0.0106, "step": 104350 }, { "epoch": 1.5, "learning_rate": 1.9498839840315912e-05, "loss": 0.0159, "step": 104360 }, { "epoch": 1.5, "learning_rate": 1.9498791800577438e-05, "loss": 0.0113, "step": 104370 }, { "epoch": 1.5, "learning_rate": 1.9498743760838967e-05, "loss": 0.0095, "step": 104380 }, { "epoch": 1.5, "learning_rate": 1.9498695721100496e-05, "loss": 0.0066, "step": 104390 }, { "epoch": 1.5, "learning_rate": 1.9498647681362022e-05, "loss": 0.0114, "step": 104400 }, { "epoch": 1.5, "learning_rate": 1.949859964162355e-05, "loss": 0.0098, "step": 104410 }, { "epoch": 1.5, "learning_rate": 1.949855160188508e-05, "loss": 0.0066, "step": 104420 }, { "epoch": 1.51, "learning_rate": 1.949850356214661e-05, "loss": 0.0087, "step": 104430 }, { "epoch": 1.51, "learning_rate": 1.9498455522408136e-05, "loss": 0.0135, "step": 104440 }, { "epoch": 1.51, "learning_rate": 1.9498407482669665e-05, "loss": 0.0124, "step": 104450 }, { "epoch": 1.51, "learning_rate": 1.9498359442931195e-05, "loss": 0.0138, "step": 104460 }, { "epoch": 1.51, "learning_rate": 1.9498311403192724e-05, "loss": 0.0096, "step": 104470 }, { "epoch": 1.51, "learning_rate": 1.949826336345425e-05, "loss": 0.0138, "step": 104480 }, { "epoch": 1.51, "learning_rate": 1.949821532371578e-05, "loss": 0.0116, "step": 104490 }, { "epoch": 1.51, "learning_rate": 1.9498167283977308e-05, "loss": 0.0111, "step": 104500 }, { "epoch": 1.51, "learning_rate": 1.9498119244238834e-05, "loss": 0.0118, "step": 104510 }, { "epoch": 1.51, "learning_rate": 1.9498071204500363e-05, "loss": 0.0129, "step": 104520 }, { "epoch": 1.51, "learning_rate": 1.9498023164761893e-05, "loss": 0.012, "step": 104530 }, { "epoch": 1.51, "learning_rate": 1.9497975125023422e-05, "loss": 0.0103, "step": 104540 }, { "epoch": 1.51, "learning_rate": 1.9497927085284948e-05, "loss": 0.0118, "step": 104550 }, { "epoch": 1.51, "learning_rate": 1.9497879045546477e-05, "loss": 0.0137, "step": 104560 }, { "epoch": 1.51, "learning_rate": 1.9497831005808006e-05, "loss": 0.0134, "step": 104570 }, { "epoch": 1.51, "learning_rate": 1.9497782966069532e-05, "loss": 0.0099, "step": 104580 }, { "epoch": 1.51, "learning_rate": 1.949773492633106e-05, "loss": 0.0111, "step": 104590 }, { "epoch": 1.51, "learning_rate": 1.949768688659259e-05, "loss": 0.0106, "step": 104600 }, { "epoch": 1.51, "learning_rate": 1.949763884685412e-05, "loss": 0.0131, "step": 104610 }, { "epoch": 1.51, "learning_rate": 1.9497590807115646e-05, "loss": 0.0131, "step": 104620 }, { "epoch": 1.51, "learning_rate": 1.9497542767377175e-05, "loss": 0.0179, "step": 104630 }, { "epoch": 1.51, "learning_rate": 1.9497494727638704e-05, "loss": 0.0119, "step": 104640 }, { "epoch": 1.51, "learning_rate": 1.9497446687900234e-05, "loss": 0.0159, "step": 104650 }, { "epoch": 1.51, "learning_rate": 1.949739864816176e-05, "loss": 0.0118, "step": 104660 }, { "epoch": 1.51, "learning_rate": 1.949735060842329e-05, "loss": 0.0118, "step": 104670 }, { "epoch": 1.51, "learning_rate": 1.9497302568684818e-05, "loss": 0.0117, "step": 104680 }, { "epoch": 1.51, "learning_rate": 1.9497254528946344e-05, "loss": 0.0122, "step": 104690 }, { "epoch": 1.51, "learning_rate": 1.9497206489207873e-05, "loss": 0.0138, "step": 104700 }, { "epoch": 1.51, "learning_rate": 1.9497158449469403e-05, "loss": 0.0096, "step": 104710 }, { "epoch": 1.51, "learning_rate": 1.9497110409730932e-05, "loss": 0.0108, "step": 104720 }, { "epoch": 1.51, "learning_rate": 1.9497062369992458e-05, "loss": 0.0081, "step": 104730 }, { "epoch": 1.51, "learning_rate": 1.9497014330253987e-05, "loss": 0.0134, "step": 104740 }, { "epoch": 1.51, "learning_rate": 1.9496966290515516e-05, "loss": 0.0142, "step": 104750 }, { "epoch": 1.51, "learning_rate": 1.9496918250777042e-05, "loss": 0.0112, "step": 104760 }, { "epoch": 1.51, "learning_rate": 1.949687021103857e-05, "loss": 0.0116, "step": 104770 }, { "epoch": 1.51, "learning_rate": 1.94968221713001e-05, "loss": 0.0115, "step": 104780 }, { "epoch": 1.51, "learning_rate": 1.949677413156163e-05, "loss": 0.0182, "step": 104790 }, { "epoch": 1.51, "learning_rate": 1.9496726091823156e-05, "loss": 0.0134, "step": 104800 }, { "epoch": 1.51, "learning_rate": 1.9496678052084685e-05, "loss": 0.0142, "step": 104810 }, { "epoch": 1.51, "learning_rate": 1.9496630012346214e-05, "loss": 0.0102, "step": 104820 }, { "epoch": 1.51, "learning_rate": 1.9496581972607744e-05, "loss": 0.01, "step": 104830 }, { "epoch": 1.51, "learning_rate": 1.949653393286927e-05, "loss": 0.0106, "step": 104840 }, { "epoch": 1.51, "learning_rate": 1.94964858931308e-05, "loss": 0.0099, "step": 104850 }, { "epoch": 1.51, "learning_rate": 1.9496437853392328e-05, "loss": 0.0084, "step": 104860 }, { "epoch": 1.51, "learning_rate": 1.9496389813653854e-05, "loss": 0.0142, "step": 104870 }, { "epoch": 1.51, "learning_rate": 1.9496341773915383e-05, "loss": 0.0093, "step": 104880 }, { "epoch": 1.51, "learning_rate": 1.9496293734176913e-05, "loss": 0.0146, "step": 104890 }, { "epoch": 1.51, "learning_rate": 1.9496245694438442e-05, "loss": 0.0103, "step": 104900 }, { "epoch": 1.51, "learning_rate": 1.9496197654699968e-05, "loss": 0.0079, "step": 104910 }, { "epoch": 1.51, "learning_rate": 1.9496149614961497e-05, "loss": 0.0102, "step": 104920 }, { "epoch": 1.51, "learning_rate": 1.9496101575223026e-05, "loss": 0.0068, "step": 104930 }, { "epoch": 1.51, "learning_rate": 1.9496053535484552e-05, "loss": 0.0155, "step": 104940 }, { "epoch": 1.51, "learning_rate": 1.949600549574608e-05, "loss": 0.0112, "step": 104950 }, { "epoch": 1.51, "learning_rate": 1.949595745600761e-05, "loss": 0.0096, "step": 104960 }, { "epoch": 1.51, "learning_rate": 1.949590941626914e-05, "loss": 0.0101, "step": 104970 }, { "epoch": 1.51, "learning_rate": 1.9495861376530666e-05, "loss": 0.0119, "step": 104980 }, { "epoch": 1.51, "learning_rate": 1.9495813336792195e-05, "loss": 0.0155, "step": 104990 }, { "epoch": 1.51, "learning_rate": 1.9495765297053724e-05, "loss": 0.0127, "step": 105000 }, { "epoch": 1.51, "learning_rate": 1.9495717257315254e-05, "loss": 0.0126, "step": 105010 }, { "epoch": 1.51, "learning_rate": 1.949566921757678e-05, "loss": 0.0126, "step": 105020 }, { "epoch": 1.51, "learning_rate": 1.949562117783831e-05, "loss": 0.0108, "step": 105030 }, { "epoch": 1.51, "learning_rate": 1.9495573138099838e-05, "loss": 0.0112, "step": 105040 }, { "epoch": 1.51, "learning_rate": 1.9495525098361364e-05, "loss": 0.0127, "step": 105050 }, { "epoch": 1.51, "learning_rate": 1.9495477058622893e-05, "loss": 0.0119, "step": 105060 }, { "epoch": 1.51, "learning_rate": 1.9495429018884422e-05, "loss": 0.0127, "step": 105070 }, { "epoch": 1.51, "learning_rate": 1.949538097914595e-05, "loss": 0.0091, "step": 105080 }, { "epoch": 1.51, "learning_rate": 1.9495332939407478e-05, "loss": 0.0106, "step": 105090 }, { "epoch": 1.51, "learning_rate": 1.9495284899669007e-05, "loss": 0.0094, "step": 105100 }, { "epoch": 1.51, "learning_rate": 1.9495236859930536e-05, "loss": 0.0095, "step": 105110 }, { "epoch": 1.51, "learning_rate": 1.9495188820192062e-05, "loss": 0.0121, "step": 105120 }, { "epoch": 1.52, "learning_rate": 1.949514078045359e-05, "loss": 0.0136, "step": 105130 }, { "epoch": 1.52, "learning_rate": 1.949509274071512e-05, "loss": 0.0081, "step": 105140 }, { "epoch": 1.52, "learning_rate": 1.949504470097665e-05, "loss": 0.0126, "step": 105150 }, { "epoch": 1.52, "learning_rate": 1.9494996661238176e-05, "loss": 0.0225, "step": 105160 }, { "epoch": 1.52, "learning_rate": 1.9494948621499705e-05, "loss": 0.0099, "step": 105170 }, { "epoch": 1.52, "learning_rate": 1.9494900581761234e-05, "loss": 0.0122, "step": 105180 }, { "epoch": 1.52, "learning_rate": 1.9494852542022763e-05, "loss": 0.0123, "step": 105190 }, { "epoch": 1.52, "learning_rate": 1.949480450228429e-05, "loss": 0.0132, "step": 105200 }, { "epoch": 1.52, "learning_rate": 1.949475646254582e-05, "loss": 0.0074, "step": 105210 }, { "epoch": 1.52, "learning_rate": 1.9494708422807348e-05, "loss": 0.0147, "step": 105220 }, { "epoch": 1.52, "learning_rate": 1.9494665187042723e-05, "loss": 0.008, "step": 105230 }, { "epoch": 1.52, "learning_rate": 1.9494617147304252e-05, "loss": 0.01, "step": 105240 }, { "epoch": 1.52, "learning_rate": 1.949456910756578e-05, "loss": 0.0106, "step": 105250 }, { "epoch": 1.52, "learning_rate": 1.9494521067827307e-05, "loss": 0.013, "step": 105260 }, { "epoch": 1.52, "learning_rate": 1.9494473028088836e-05, "loss": 0.0151, "step": 105270 }, { "epoch": 1.52, "learning_rate": 1.9494424988350366e-05, "loss": 0.0111, "step": 105280 }, { "epoch": 1.52, "learning_rate": 1.949437694861189e-05, "loss": 0.0101, "step": 105290 }, { "epoch": 1.52, "learning_rate": 1.949432890887342e-05, "loss": 0.0103, "step": 105300 }, { "epoch": 1.52, "learning_rate": 1.949428086913495e-05, "loss": 0.0134, "step": 105310 }, { "epoch": 1.52, "learning_rate": 1.949423282939648e-05, "loss": 0.0093, "step": 105320 }, { "epoch": 1.52, "learning_rate": 1.9494184789658005e-05, "loss": 0.015, "step": 105330 }, { "epoch": 1.52, "learning_rate": 1.9494136749919534e-05, "loss": 0.0135, "step": 105340 }, { "epoch": 1.52, "learning_rate": 1.9494088710181064e-05, "loss": 0.0101, "step": 105350 }, { "epoch": 1.52, "learning_rate": 1.949404067044259e-05, "loss": 0.008, "step": 105360 }, { "epoch": 1.52, "learning_rate": 1.949399263070412e-05, "loss": 0.013, "step": 105370 }, { "epoch": 1.52, "learning_rate": 1.9493944590965648e-05, "loss": 0.0094, "step": 105380 }, { "epoch": 1.52, "learning_rate": 1.9493896551227177e-05, "loss": 0.008, "step": 105390 }, { "epoch": 1.52, "learning_rate": 1.9493848511488703e-05, "loss": 0.011, "step": 105400 }, { "epoch": 1.52, "learning_rate": 1.9493800471750232e-05, "loss": 0.0114, "step": 105410 }, { "epoch": 1.52, "learning_rate": 1.9493752432011762e-05, "loss": 0.0089, "step": 105420 }, { "epoch": 1.52, "learning_rate": 1.949370439227329e-05, "loss": 0.0087, "step": 105430 }, { "epoch": 1.52, "learning_rate": 1.9493656352534817e-05, "loss": 0.0142, "step": 105440 }, { "epoch": 1.52, "learning_rate": 1.9493608312796346e-05, "loss": 0.0129, "step": 105450 }, { "epoch": 1.52, "learning_rate": 1.9493560273057875e-05, "loss": 0.0124, "step": 105460 }, { "epoch": 1.52, "learning_rate": 1.94935122333194e-05, "loss": 0.0087, "step": 105470 }, { "epoch": 1.52, "learning_rate": 1.949346419358093e-05, "loss": 0.0084, "step": 105480 }, { "epoch": 1.52, "learning_rate": 1.949341615384246e-05, "loss": 0.0104, "step": 105490 }, { "epoch": 1.52, "learning_rate": 1.949336811410399e-05, "loss": 0.0114, "step": 105500 }, { "epoch": 1.52, "learning_rate": 1.9493320074365515e-05, "loss": 0.0107, "step": 105510 }, { "epoch": 1.52, "learning_rate": 1.9493272034627044e-05, "loss": 0.0129, "step": 105520 }, { "epoch": 1.52, "learning_rate": 1.9493223994888574e-05, "loss": 0.0085, "step": 105530 }, { "epoch": 1.52, "learning_rate": 1.94931759551501e-05, "loss": 0.0139, "step": 105540 }, { "epoch": 1.52, "learning_rate": 1.949312791541163e-05, "loss": 0.0105, "step": 105550 }, { "epoch": 1.52, "learning_rate": 1.9493079875673158e-05, "loss": 0.0129, "step": 105560 }, { "epoch": 1.52, "learning_rate": 1.9493031835934687e-05, "loss": 0.0109, "step": 105570 }, { "epoch": 1.52, "learning_rate": 1.9492983796196213e-05, "loss": 0.0148, "step": 105580 }, { "epoch": 1.52, "learning_rate": 1.9492935756457742e-05, "loss": 0.011, "step": 105590 }, { "epoch": 1.52, "learning_rate": 1.949288771671927e-05, "loss": 0.0111, "step": 105600 }, { "epoch": 1.52, "learning_rate": 1.94928396769808e-05, "loss": 0.0119, "step": 105610 }, { "epoch": 1.52, "learning_rate": 1.9492791637242327e-05, "loss": 0.0103, "step": 105620 }, { "epoch": 1.52, "learning_rate": 1.9492743597503856e-05, "loss": 0.0131, "step": 105630 }, { "epoch": 1.52, "learning_rate": 1.9492695557765385e-05, "loss": 0.0122, "step": 105640 }, { "epoch": 1.52, "learning_rate": 1.949264751802691e-05, "loss": 0.0144, "step": 105650 }, { "epoch": 1.52, "learning_rate": 1.949259947828844e-05, "loss": 0.0109, "step": 105660 }, { "epoch": 1.52, "learning_rate": 1.949255143854997e-05, "loss": 0.0093, "step": 105670 }, { "epoch": 1.52, "learning_rate": 1.94925033988115e-05, "loss": 0.013, "step": 105680 }, { "epoch": 1.52, "learning_rate": 1.9492455359073025e-05, "loss": 0.0093, "step": 105690 }, { "epoch": 1.52, "learning_rate": 1.9492407319334554e-05, "loss": 0.0118, "step": 105700 }, { "epoch": 1.52, "learning_rate": 1.9492359279596083e-05, "loss": 0.0169, "step": 105710 }, { "epoch": 1.52, "learning_rate": 1.949231123985761e-05, "loss": 0.0109, "step": 105720 }, { "epoch": 1.52, "learning_rate": 1.949226320011914e-05, "loss": 0.0123, "step": 105730 }, { "epoch": 1.52, "learning_rate": 1.9492215160380668e-05, "loss": 0.0091, "step": 105740 }, { "epoch": 1.52, "learning_rate": 1.9492167120642197e-05, "loss": 0.0084, "step": 105750 }, { "epoch": 1.52, "learning_rate": 1.9492119080903723e-05, "loss": 0.0131, "step": 105760 }, { "epoch": 1.52, "learning_rate": 1.9492071041165252e-05, "loss": 0.0125, "step": 105770 }, { "epoch": 1.52, "learning_rate": 1.949202300142678e-05, "loss": 0.0134, "step": 105780 }, { "epoch": 1.52, "learning_rate": 1.949197496168831e-05, "loss": 0.0124, "step": 105790 }, { "epoch": 1.52, "learning_rate": 1.9491926921949837e-05, "loss": 0.0149, "step": 105800 }, { "epoch": 1.52, "learning_rate": 1.9491878882211366e-05, "loss": 0.0162, "step": 105810 }, { "epoch": 1.53, "learning_rate": 1.9491830842472895e-05, "loss": 0.0104, "step": 105820 }, { "epoch": 1.53, "learning_rate": 1.949178280273442e-05, "loss": 0.0109, "step": 105830 }, { "epoch": 1.53, "learning_rate": 1.949173476299595e-05, "loss": 0.0131, "step": 105840 }, { "epoch": 1.53, "learning_rate": 1.949168672325748e-05, "loss": 0.0106, "step": 105850 }, { "epoch": 1.53, "learning_rate": 1.949163868351901e-05, "loss": 0.0133, "step": 105860 }, { "epoch": 1.53, "learning_rate": 1.9491590643780535e-05, "loss": 0.0096, "step": 105870 }, { "epoch": 1.53, "learning_rate": 1.9491542604042064e-05, "loss": 0.0108, "step": 105880 }, { "epoch": 1.53, "learning_rate": 1.9491494564303593e-05, "loss": 0.0113, "step": 105890 }, { "epoch": 1.53, "learning_rate": 1.949144652456512e-05, "loss": 0.0113, "step": 105900 }, { "epoch": 1.53, "learning_rate": 1.949139848482665e-05, "loss": 0.0083, "step": 105910 }, { "epoch": 1.53, "learning_rate": 1.949135044508818e-05, "loss": 0.0119, "step": 105920 }, { "epoch": 1.53, "learning_rate": 1.9491302405349707e-05, "loss": 0.0133, "step": 105930 }, { "epoch": 1.53, "learning_rate": 1.9491254365611236e-05, "loss": 0.0116, "step": 105940 }, { "epoch": 1.53, "learning_rate": 1.9491206325872766e-05, "loss": 0.011, "step": 105950 }, { "epoch": 1.53, "learning_rate": 1.949115828613429e-05, "loss": 0.0125, "step": 105960 }, { "epoch": 1.53, "learning_rate": 1.949111024639582e-05, "loss": 0.0119, "step": 105970 }, { "epoch": 1.53, "learning_rate": 1.949106220665735e-05, "loss": 0.013, "step": 105980 }, { "epoch": 1.53, "learning_rate": 1.949101416691888e-05, "loss": 0.0113, "step": 105990 }, { "epoch": 1.53, "learning_rate": 1.9490966127180405e-05, "loss": 0.014, "step": 106000 }, { "epoch": 1.53, "learning_rate": 1.9490918087441934e-05, "loss": 0.0138, "step": 106010 }, { "epoch": 1.53, "learning_rate": 1.9490870047703464e-05, "loss": 0.012, "step": 106020 }, { "epoch": 1.53, "learning_rate": 1.949082200796499e-05, "loss": 0.0131, "step": 106030 }, { "epoch": 1.53, "learning_rate": 1.949077396822652e-05, "loss": 0.0098, "step": 106040 }, { "epoch": 1.53, "learning_rate": 1.9490725928488048e-05, "loss": 0.0105, "step": 106050 }, { "epoch": 1.53, "learning_rate": 1.9490677888749577e-05, "loss": 0.0154, "step": 106060 }, { "epoch": 1.53, "learning_rate": 1.9490629849011103e-05, "loss": 0.0099, "step": 106070 }, { "epoch": 1.53, "learning_rate": 1.9490581809272633e-05, "loss": 0.0073, "step": 106080 }, { "epoch": 1.53, "learning_rate": 1.9490533769534162e-05, "loss": 0.0119, "step": 106090 }, { "epoch": 1.53, "learning_rate": 1.949048572979569e-05, "loss": 0.0089, "step": 106100 }, { "epoch": 1.53, "learning_rate": 1.9490437690057217e-05, "loss": 0.0107, "step": 106110 }, { "epoch": 1.53, "learning_rate": 1.9490389650318746e-05, "loss": 0.0097, "step": 106120 }, { "epoch": 1.53, "learning_rate": 1.9490341610580276e-05, "loss": 0.0153, "step": 106130 }, { "epoch": 1.53, "learning_rate": 1.94902935708418e-05, "loss": 0.0149, "step": 106140 }, { "epoch": 1.53, "learning_rate": 1.949024553110333e-05, "loss": 0.0116, "step": 106150 }, { "epoch": 1.53, "learning_rate": 1.949019749136486e-05, "loss": 0.0107, "step": 106160 }, { "epoch": 1.53, "learning_rate": 1.949014945162639e-05, "loss": 0.0122, "step": 106170 }, { "epoch": 1.53, "learning_rate": 1.9490101411887915e-05, "loss": 0.0144, "step": 106180 }, { "epoch": 1.53, "learning_rate": 1.9490053372149444e-05, "loss": 0.015, "step": 106190 }, { "epoch": 1.53, "learning_rate": 1.9490005332410974e-05, "loss": 0.0071, "step": 106200 }, { "epoch": 1.53, "learning_rate": 1.94899572926725e-05, "loss": 0.0122, "step": 106210 }, { "epoch": 1.53, "learning_rate": 1.948990925293403e-05, "loss": 0.0117, "step": 106220 }, { "epoch": 1.53, "learning_rate": 1.9489861213195558e-05, "loss": 0.0105, "step": 106230 }, { "epoch": 1.53, "learning_rate": 1.9489813173457087e-05, "loss": 0.0127, "step": 106240 }, { "epoch": 1.53, "learning_rate": 1.9489765133718613e-05, "loss": 0.0105, "step": 106250 }, { "epoch": 1.53, "learning_rate": 1.9489717093980142e-05, "loss": 0.0097, "step": 106260 }, { "epoch": 1.53, "learning_rate": 1.9489669054241672e-05, "loss": 0.012, "step": 106270 }, { "epoch": 1.53, "learning_rate": 1.94896210145032e-05, "loss": 0.0119, "step": 106280 }, { "epoch": 1.53, "learning_rate": 1.9489572974764727e-05, "loss": 0.0112, "step": 106290 }, { "epoch": 1.53, "learning_rate": 1.9489524935026256e-05, "loss": 0.0109, "step": 106300 }, { "epoch": 1.53, "learning_rate": 1.9489476895287785e-05, "loss": 0.0083, "step": 106310 }, { "epoch": 1.53, "learning_rate": 1.948942885554931e-05, "loss": 0.0126, "step": 106320 }, { "epoch": 1.53, "learning_rate": 1.948938081581084e-05, "loss": 0.0152, "step": 106330 }, { "epoch": 1.53, "learning_rate": 1.948933277607237e-05, "loss": 0.0087, "step": 106340 }, { "epoch": 1.53, "learning_rate": 1.94892847363339e-05, "loss": 0.0115, "step": 106350 }, { "epoch": 1.53, "learning_rate": 1.9489236696595425e-05, "loss": 0.0129, "step": 106360 }, { "epoch": 1.53, "learning_rate": 1.9489188656856954e-05, "loss": 0.0142, "step": 106370 }, { "epoch": 1.53, "learning_rate": 1.9489140617118484e-05, "loss": 0.0093, "step": 106380 }, { "epoch": 1.53, "learning_rate": 1.948909257738001e-05, "loss": 0.0087, "step": 106390 }, { "epoch": 1.53, "learning_rate": 1.948904453764154e-05, "loss": 0.0104, "step": 106400 }, { "epoch": 1.53, "learning_rate": 1.9488996497903068e-05, "loss": 0.0102, "step": 106410 }, { "epoch": 1.53, "learning_rate": 1.9488948458164597e-05, "loss": 0.0137, "step": 106420 }, { "epoch": 1.53, "learning_rate": 1.9488900418426123e-05, "loss": 0.0102, "step": 106430 }, { "epoch": 1.53, "learning_rate": 1.9488852378687652e-05, "loss": 0.0091, "step": 106440 }, { "epoch": 1.53, "learning_rate": 1.948880433894918e-05, "loss": 0.0095, "step": 106450 }, { "epoch": 1.53, "learning_rate": 1.948875629921071e-05, "loss": 0.0083, "step": 106460 }, { "epoch": 1.53, "learning_rate": 1.9488708259472237e-05, "loss": 0.0115, "step": 106470 }, { "epoch": 1.53, "learning_rate": 1.9488660219733766e-05, "loss": 0.0083, "step": 106480 }, { "epoch": 1.53, "learning_rate": 1.9488612179995295e-05, "loss": 0.0081, "step": 106490 }, { "epoch": 1.53, "learning_rate": 1.948856414025682e-05, "loss": 0.0087, "step": 106500 }, { "epoch": 1.54, "learning_rate": 1.948851610051835e-05, "loss": 0.0112, "step": 106510 }, { "epoch": 1.54, "learning_rate": 1.948846806077988e-05, "loss": 0.0082, "step": 106520 }, { "epoch": 1.54, "learning_rate": 1.948842002104141e-05, "loss": 0.0085, "step": 106530 }, { "epoch": 1.54, "learning_rate": 1.9488371981302935e-05, "loss": 0.0089, "step": 106540 }, { "epoch": 1.54, "learning_rate": 1.9488323941564464e-05, "loss": 0.0136, "step": 106550 }, { "epoch": 1.54, "learning_rate": 1.9488275901825993e-05, "loss": 0.0112, "step": 106560 }, { "epoch": 1.54, "learning_rate": 1.948822786208752e-05, "loss": 0.0103, "step": 106570 }, { "epoch": 1.54, "learning_rate": 1.948817982234905e-05, "loss": 0.0127, "step": 106580 }, { "epoch": 1.54, "learning_rate": 1.9488131782610578e-05, "loss": 0.0094, "step": 106590 }, { "epoch": 1.54, "learning_rate": 1.9488083742872107e-05, "loss": 0.0097, "step": 106600 }, { "epoch": 1.54, "learning_rate": 1.9488035703133633e-05, "loss": 0.0134, "step": 106610 }, { "epoch": 1.54, "learning_rate": 1.9487987663395162e-05, "loss": 0.0089, "step": 106620 }, { "epoch": 1.54, "learning_rate": 1.948793962365669e-05, "loss": 0.0121, "step": 106630 }, { "epoch": 1.54, "learning_rate": 1.948789158391822e-05, "loss": 0.0145, "step": 106640 }, { "epoch": 1.54, "learning_rate": 1.9487843544179747e-05, "loss": 0.0092, "step": 106650 }, { "epoch": 1.54, "learning_rate": 1.9487795504441276e-05, "loss": 0.014, "step": 106660 }, { "epoch": 1.54, "learning_rate": 1.9487747464702805e-05, "loss": 0.012, "step": 106670 }, { "epoch": 1.54, "learning_rate": 1.948769942496433e-05, "loss": 0.009, "step": 106680 }, { "epoch": 1.54, "learning_rate": 1.948765138522586e-05, "loss": 0.015, "step": 106690 }, { "epoch": 1.54, "learning_rate": 1.948760334548739e-05, "loss": 0.0158, "step": 106700 }, { "epoch": 1.54, "learning_rate": 1.948755530574892e-05, "loss": 0.0127, "step": 106710 }, { "epoch": 1.54, "learning_rate": 1.9487507266010445e-05, "loss": 0.0115, "step": 106720 }, { "epoch": 1.54, "learning_rate": 1.9487459226271974e-05, "loss": 0.0067, "step": 106730 }, { "epoch": 1.54, "learning_rate": 1.9487411186533503e-05, "loss": 0.0101, "step": 106740 }, { "epoch": 1.54, "learning_rate": 1.948736314679503e-05, "loss": 0.0122, "step": 106750 }, { "epoch": 1.54, "learning_rate": 1.948731510705656e-05, "loss": 0.0104, "step": 106760 }, { "epoch": 1.54, "learning_rate": 1.9487267067318088e-05, "loss": 0.0117, "step": 106770 }, { "epoch": 1.54, "learning_rate": 1.9487219027579617e-05, "loss": 0.0115, "step": 106780 }, { "epoch": 1.54, "learning_rate": 1.9487170987841143e-05, "loss": 0.0112, "step": 106790 }, { "epoch": 1.54, "learning_rate": 1.9487122948102672e-05, "loss": 0.0096, "step": 106800 }, { "epoch": 1.54, "learning_rate": 1.94870749083642e-05, "loss": 0.0106, "step": 106810 }, { "epoch": 1.54, "learning_rate": 1.948702686862573e-05, "loss": 0.0095, "step": 106820 }, { "epoch": 1.54, "learning_rate": 1.9486978828887257e-05, "loss": 0.0092, "step": 106830 }, { "epoch": 1.54, "learning_rate": 1.9486930789148786e-05, "loss": 0.0097, "step": 106840 }, { "epoch": 1.54, "learning_rate": 1.9486882749410315e-05, "loss": 0.0147, "step": 106850 }, { "epoch": 1.54, "learning_rate": 1.948683470967184e-05, "loss": 0.0101, "step": 106860 }, { "epoch": 1.54, "learning_rate": 1.948678666993337e-05, "loss": 0.018, "step": 106870 }, { "epoch": 1.54, "learning_rate": 1.94867386301949e-05, "loss": 0.012, "step": 106880 }, { "epoch": 1.54, "learning_rate": 1.948669059045643e-05, "loss": 0.0116, "step": 106890 }, { "epoch": 1.54, "learning_rate": 1.9486642550717955e-05, "loss": 0.0139, "step": 106900 }, { "epoch": 1.54, "learning_rate": 1.9486594510979484e-05, "loss": 0.0104, "step": 106910 }, { "epoch": 1.54, "learning_rate": 1.9486546471241013e-05, "loss": 0.0112, "step": 106920 }, { "epoch": 1.54, "learning_rate": 1.948649843150254e-05, "loss": 0.0114, "step": 106930 }, { "epoch": 1.54, "learning_rate": 1.948645039176407e-05, "loss": 0.0124, "step": 106940 }, { "epoch": 1.54, "learning_rate": 1.9486402352025598e-05, "loss": 0.0115, "step": 106950 }, { "epoch": 1.54, "learning_rate": 1.9486354312287127e-05, "loss": 0.0106, "step": 106960 }, { "epoch": 1.54, "learning_rate": 1.9486306272548653e-05, "loss": 0.0112, "step": 106970 }, { "epoch": 1.54, "learning_rate": 1.9486258232810182e-05, "loss": 0.0106, "step": 106980 }, { "epoch": 1.54, "learning_rate": 1.948621019307171e-05, "loss": 0.0115, "step": 106990 }, { "epoch": 1.54, "learning_rate": 1.948616215333324e-05, "loss": 0.0098, "step": 107000 }, { "epoch": 1.54, "learning_rate": 1.9486114113594767e-05, "loss": 0.0076, "step": 107010 }, { "epoch": 1.54, "learning_rate": 1.9486066073856296e-05, "loss": 0.0076, "step": 107020 }, { "epoch": 1.54, "learning_rate": 1.9486018034117825e-05, "loss": 0.0096, "step": 107030 }, { "epoch": 1.54, "learning_rate": 1.948596999437935e-05, "loss": 0.0148, "step": 107040 }, { "epoch": 1.54, "learning_rate": 1.948592195464088e-05, "loss": 0.0147, "step": 107050 }, { "epoch": 1.54, "learning_rate": 1.948587391490241e-05, "loss": 0.0127, "step": 107060 }, { "epoch": 1.54, "learning_rate": 1.948582587516394e-05, "loss": 0.0111, "step": 107070 }, { "epoch": 1.54, "learning_rate": 1.9485777835425465e-05, "loss": 0.0113, "step": 107080 }, { "epoch": 1.54, "learning_rate": 1.9485729795686994e-05, "loss": 0.0088, "step": 107090 }, { "epoch": 1.54, "learning_rate": 1.9485681755948523e-05, "loss": 0.0156, "step": 107100 }, { "epoch": 1.54, "learning_rate": 1.948563371621005e-05, "loss": 0.0141, "step": 107110 }, { "epoch": 1.54, "learning_rate": 1.948558567647158e-05, "loss": 0.0124, "step": 107120 }, { "epoch": 1.54, "learning_rate": 1.9485537636733108e-05, "loss": 0.0094, "step": 107130 }, { "epoch": 1.54, "learning_rate": 1.9485489596994637e-05, "loss": 0.0141, "step": 107140 }, { "epoch": 1.54, "learning_rate": 1.9485441557256163e-05, "loss": 0.0104, "step": 107150 }, { "epoch": 1.54, "learning_rate": 1.9485393517517692e-05, "loss": 0.0113, "step": 107160 }, { "epoch": 1.54, "learning_rate": 1.948534547777922e-05, "loss": 0.011, "step": 107170 }, { "epoch": 1.54, "learning_rate": 1.948529743804075e-05, "loss": 0.0102, "step": 107180 }, { "epoch": 1.54, "learning_rate": 1.9485249398302276e-05, "loss": 0.01, "step": 107190 }, { "epoch": 1.54, "learning_rate": 1.9485201358563806e-05, "loss": 0.0092, "step": 107200 }, { "epoch": 1.55, "learning_rate": 1.9485153318825335e-05, "loss": 0.0056, "step": 107210 }, { "epoch": 1.55, "learning_rate": 1.948510527908686e-05, "loss": 0.0094, "step": 107220 }, { "epoch": 1.55, "learning_rate": 1.948505723934839e-05, "loss": 0.008, "step": 107230 }, { "epoch": 1.55, "learning_rate": 1.948500919960992e-05, "loss": 0.0082, "step": 107240 }, { "epoch": 1.55, "learning_rate": 1.948496115987145e-05, "loss": 0.0107, "step": 107250 }, { "epoch": 1.55, "learning_rate": 1.9484913120132975e-05, "loss": 0.0107, "step": 107260 }, { "epoch": 1.55, "learning_rate": 1.9484865080394504e-05, "loss": 0.0087, "step": 107270 }, { "epoch": 1.55, "learning_rate": 1.9484817040656033e-05, "loss": 0.0095, "step": 107280 }, { "epoch": 1.55, "learning_rate": 1.948476900091756e-05, "loss": 0.0079, "step": 107290 }, { "epoch": 1.55, "learning_rate": 1.9484720961179088e-05, "loss": 0.0162, "step": 107300 }, { "epoch": 1.55, "learning_rate": 1.9484672921440618e-05, "loss": 0.0126, "step": 107310 }, { "epoch": 1.55, "learning_rate": 1.9484624881702147e-05, "loss": 0.0094, "step": 107320 }, { "epoch": 1.55, "learning_rate": 1.9484576841963673e-05, "loss": 0.0085, "step": 107330 }, { "epoch": 1.55, "learning_rate": 1.9484528802225202e-05, "loss": 0.0128, "step": 107340 }, { "epoch": 1.55, "learning_rate": 1.948448076248673e-05, "loss": 0.0092, "step": 107350 }, { "epoch": 1.55, "learning_rate": 1.9484432722748257e-05, "loss": 0.0089, "step": 107360 }, { "epoch": 1.55, "learning_rate": 1.9484384683009786e-05, "loss": 0.0129, "step": 107370 }, { "epoch": 1.55, "learning_rate": 1.9484336643271316e-05, "loss": 0.0092, "step": 107380 }, { "epoch": 1.55, "learning_rate": 1.9484288603532845e-05, "loss": 0.0089, "step": 107390 }, { "epoch": 1.55, "learning_rate": 1.948424056379437e-05, "loss": 0.0094, "step": 107400 }, { "epoch": 1.55, "learning_rate": 1.94841925240559e-05, "loss": 0.0167, "step": 107410 }, { "epoch": 1.55, "learning_rate": 1.948414448431743e-05, "loss": 0.013, "step": 107420 }, { "epoch": 1.55, "learning_rate": 1.948409644457896e-05, "loss": 0.007, "step": 107430 }, { "epoch": 1.55, "learning_rate": 1.9484048404840485e-05, "loss": 0.0108, "step": 107440 }, { "epoch": 1.55, "learning_rate": 1.9484000365102014e-05, "loss": 0.0132, "step": 107450 }, { "epoch": 1.55, "learning_rate": 1.9483952325363543e-05, "loss": 0.0108, "step": 107460 }, { "epoch": 1.55, "learning_rate": 1.948390428562507e-05, "loss": 0.0091, "step": 107470 }, { "epoch": 1.55, "learning_rate": 1.9483861049860447e-05, "loss": 0.0092, "step": 107480 }, { "epoch": 1.55, "learning_rate": 1.9483813010121976e-05, "loss": 0.0165, "step": 107490 }, { "epoch": 1.55, "learning_rate": 1.9483764970383502e-05, "loss": 0.0131, "step": 107500 }, { "epoch": 1.55, "learning_rate": 1.948371693064503e-05, "loss": 0.0138, "step": 107510 }, { "epoch": 1.55, "learning_rate": 1.948366889090656e-05, "loss": 0.0119, "step": 107520 }, { "epoch": 1.55, "learning_rate": 1.9483620851168087e-05, "loss": 0.011, "step": 107530 }, { "epoch": 1.55, "learning_rate": 1.9483572811429616e-05, "loss": 0.0115, "step": 107540 }, { "epoch": 1.55, "learning_rate": 1.9483524771691145e-05, "loss": 0.0113, "step": 107550 }, { "epoch": 1.55, "learning_rate": 1.9483476731952674e-05, "loss": 0.011, "step": 107560 }, { "epoch": 1.55, "learning_rate": 1.94834286922142e-05, "loss": 0.0077, "step": 107570 }, { "epoch": 1.55, "learning_rate": 1.948338065247573e-05, "loss": 0.0128, "step": 107580 }, { "epoch": 1.55, "learning_rate": 1.948333261273726e-05, "loss": 0.0079, "step": 107590 }, { "epoch": 1.55, "learning_rate": 1.9483284572998785e-05, "loss": 0.0112, "step": 107600 }, { "epoch": 1.55, "learning_rate": 1.9483236533260314e-05, "loss": 0.0102, "step": 107610 }, { "epoch": 1.55, "learning_rate": 1.9483188493521843e-05, "loss": 0.0113, "step": 107620 }, { "epoch": 1.55, "learning_rate": 1.9483140453783372e-05, "loss": 0.0105, "step": 107630 }, { "epoch": 1.55, "learning_rate": 1.94830924140449e-05, "loss": 0.0089, "step": 107640 }, { "epoch": 1.55, "learning_rate": 1.9483044374306428e-05, "loss": 0.0086, "step": 107650 }, { "epoch": 1.55, "learning_rate": 1.9482996334567957e-05, "loss": 0.0106, "step": 107660 }, { "epoch": 1.55, "learning_rate": 1.9482948294829486e-05, "loss": 0.0111, "step": 107670 }, { "epoch": 1.55, "learning_rate": 1.9482900255091012e-05, "loss": 0.0122, "step": 107680 }, { "epoch": 1.55, "learning_rate": 1.948285221535254e-05, "loss": 0.0075, "step": 107690 }, { "epoch": 1.55, "learning_rate": 1.948280417561407e-05, "loss": 0.0098, "step": 107700 }, { "epoch": 1.55, "learning_rate": 1.9482756135875596e-05, "loss": 0.0155, "step": 107710 }, { "epoch": 1.55, "learning_rate": 1.9482708096137126e-05, "loss": 0.0097, "step": 107720 }, { "epoch": 1.55, "learning_rate": 1.9482660056398655e-05, "loss": 0.0099, "step": 107730 }, { "epoch": 1.55, "learning_rate": 1.9482612016660184e-05, "loss": 0.0093, "step": 107740 }, { "epoch": 1.55, "learning_rate": 1.948256397692171e-05, "loss": 0.0138, "step": 107750 }, { "epoch": 1.55, "learning_rate": 1.948251593718324e-05, "loss": 0.0107, "step": 107760 }, { "epoch": 1.55, "learning_rate": 1.948246789744477e-05, "loss": 0.0088, "step": 107770 }, { "epoch": 1.55, "learning_rate": 1.9482419857706295e-05, "loss": 0.0116, "step": 107780 }, { "epoch": 1.55, "learning_rate": 1.9482371817967824e-05, "loss": 0.011, "step": 107790 }, { "epoch": 1.55, "learning_rate": 1.9482323778229353e-05, "loss": 0.0094, "step": 107800 }, { "epoch": 1.55, "learning_rate": 1.9482275738490882e-05, "loss": 0.01, "step": 107810 }, { "epoch": 1.55, "learning_rate": 1.9482227698752408e-05, "loss": 0.0101, "step": 107820 }, { "epoch": 1.55, "learning_rate": 1.9482179659013938e-05, "loss": 0.0131, "step": 107830 }, { "epoch": 1.55, "learning_rate": 1.9482131619275467e-05, "loss": 0.0116, "step": 107840 }, { "epoch": 1.55, "learning_rate": 1.9482083579536996e-05, "loss": 0.0098, "step": 107850 }, { "epoch": 1.55, "learning_rate": 1.9482035539798522e-05, "loss": 0.0131, "step": 107860 }, { "epoch": 1.55, "learning_rate": 1.948198750006005e-05, "loss": 0.013, "step": 107870 }, { "epoch": 1.55, "learning_rate": 1.948193946032158e-05, "loss": 0.0094, "step": 107880 }, { "epoch": 1.55, "learning_rate": 1.9481891420583106e-05, "loss": 0.0105, "step": 107890 }, { "epoch": 1.56, "learning_rate": 1.9481843380844636e-05, "loss": 0.0107, "step": 107900 }, { "epoch": 1.56, "learning_rate": 1.9481795341106165e-05, "loss": 0.0091, "step": 107910 }, { "epoch": 1.56, "learning_rate": 1.9481747301367694e-05, "loss": 0.0099, "step": 107920 }, { "epoch": 1.56, "learning_rate": 1.948169926162922e-05, "loss": 0.0092, "step": 107930 }, { "epoch": 1.56, "learning_rate": 1.948165122189075e-05, "loss": 0.0127, "step": 107940 }, { "epoch": 1.56, "learning_rate": 1.948160318215228e-05, "loss": 0.0123, "step": 107950 }, { "epoch": 1.56, "learning_rate": 1.9481555142413804e-05, "loss": 0.012, "step": 107960 }, { "epoch": 1.56, "learning_rate": 1.9481507102675334e-05, "loss": 0.0133, "step": 107970 }, { "epoch": 1.56, "learning_rate": 1.9481459062936863e-05, "loss": 0.011, "step": 107980 }, { "epoch": 1.56, "learning_rate": 1.9481411023198392e-05, "loss": 0.01, "step": 107990 }, { "epoch": 1.56, "learning_rate": 1.9481362983459918e-05, "loss": 0.009, "step": 108000 }, { "epoch": 1.56, "learning_rate": 1.9481314943721447e-05, "loss": 0.0129, "step": 108010 }, { "epoch": 1.56, "learning_rate": 1.9481266903982977e-05, "loss": 0.0079, "step": 108020 }, { "epoch": 1.56, "learning_rate": 1.9481218864244506e-05, "loss": 0.007, "step": 108030 }, { "epoch": 1.56, "learning_rate": 1.9481170824506032e-05, "loss": 0.0103, "step": 108040 }, { "epoch": 1.56, "learning_rate": 1.948112278476756e-05, "loss": 0.0124, "step": 108050 }, { "epoch": 1.56, "learning_rate": 1.948107474502909e-05, "loss": 0.0133, "step": 108060 }, { "epoch": 1.56, "learning_rate": 1.9481026705290616e-05, "loss": 0.0098, "step": 108070 }, { "epoch": 1.56, "learning_rate": 1.9480978665552146e-05, "loss": 0.0139, "step": 108080 }, { "epoch": 1.56, "learning_rate": 1.9480930625813675e-05, "loss": 0.0095, "step": 108090 }, { "epoch": 1.56, "learning_rate": 1.9480882586075204e-05, "loss": 0.0147, "step": 108100 }, { "epoch": 1.56, "learning_rate": 1.948083454633673e-05, "loss": 0.0126, "step": 108110 }, { "epoch": 1.56, "learning_rate": 1.948078650659826e-05, "loss": 0.0143, "step": 108120 }, { "epoch": 1.56, "learning_rate": 1.948073846685979e-05, "loss": 0.013, "step": 108130 }, { "epoch": 1.56, "learning_rate": 1.9480690427121314e-05, "loss": 0.0145, "step": 108140 }, { "epoch": 1.56, "learning_rate": 1.9480642387382844e-05, "loss": 0.0124, "step": 108150 }, { "epoch": 1.56, "learning_rate": 1.9480594347644373e-05, "loss": 0.0125, "step": 108160 }, { "epoch": 1.56, "learning_rate": 1.9480546307905902e-05, "loss": 0.0094, "step": 108170 }, { "epoch": 1.56, "learning_rate": 1.9480498268167428e-05, "loss": 0.0105, "step": 108180 }, { "epoch": 1.56, "learning_rate": 1.9480450228428957e-05, "loss": 0.0151, "step": 108190 }, { "epoch": 1.56, "learning_rate": 1.9480402188690487e-05, "loss": 0.0097, "step": 108200 }, { "epoch": 1.56, "learning_rate": 1.9480354148952016e-05, "loss": 0.0092, "step": 108210 }, { "epoch": 1.56, "learning_rate": 1.9480306109213542e-05, "loss": 0.0092, "step": 108220 }, { "epoch": 1.56, "learning_rate": 1.948025806947507e-05, "loss": 0.0162, "step": 108230 }, { "epoch": 1.56, "learning_rate": 1.94802100297366e-05, "loss": 0.0089, "step": 108240 }, { "epoch": 1.56, "learning_rate": 1.9480161989998126e-05, "loss": 0.0139, "step": 108250 }, { "epoch": 1.56, "learning_rate": 1.9480113950259655e-05, "loss": 0.0125, "step": 108260 }, { "epoch": 1.56, "learning_rate": 1.9480065910521185e-05, "loss": 0.0097, "step": 108270 }, { "epoch": 1.56, "learning_rate": 1.9480017870782714e-05, "loss": 0.0128, "step": 108280 }, { "epoch": 1.56, "learning_rate": 1.947996983104424e-05, "loss": 0.0087, "step": 108290 }, { "epoch": 1.56, "learning_rate": 1.947992179130577e-05, "loss": 0.0085, "step": 108300 }, { "epoch": 1.56, "learning_rate": 1.94798737515673e-05, "loss": 0.0138, "step": 108310 }, { "epoch": 1.56, "learning_rate": 1.9479825711828824e-05, "loss": 0.0111, "step": 108320 }, { "epoch": 1.56, "learning_rate": 1.9479777672090354e-05, "loss": 0.0125, "step": 108330 }, { "epoch": 1.56, "learning_rate": 1.9479729632351883e-05, "loss": 0.0107, "step": 108340 }, { "epoch": 1.56, "learning_rate": 1.9479681592613412e-05, "loss": 0.0114, "step": 108350 }, { "epoch": 1.56, "learning_rate": 1.9479633552874938e-05, "loss": 0.0082, "step": 108360 }, { "epoch": 1.56, "learning_rate": 1.9479585513136467e-05, "loss": 0.0119, "step": 108370 }, { "epoch": 1.56, "learning_rate": 1.9479537473397997e-05, "loss": 0.0127, "step": 108380 }, { "epoch": 1.56, "learning_rate": 1.9479489433659526e-05, "loss": 0.0078, "step": 108390 }, { "epoch": 1.56, "learning_rate": 1.947944139392105e-05, "loss": 0.0088, "step": 108400 }, { "epoch": 1.56, "learning_rate": 1.947939335418258e-05, "loss": 0.0092, "step": 108410 }, { "epoch": 1.56, "learning_rate": 1.947934531444411e-05, "loss": 0.0118, "step": 108420 }, { "epoch": 1.56, "learning_rate": 1.9479297274705636e-05, "loss": 0.0082, "step": 108430 }, { "epoch": 1.56, "learning_rate": 1.9479249234967165e-05, "loss": 0.0093, "step": 108440 }, { "epoch": 1.56, "learning_rate": 1.9479201195228695e-05, "loss": 0.0085, "step": 108450 }, { "epoch": 1.56, "learning_rate": 1.9479153155490224e-05, "loss": 0.0075, "step": 108460 }, { "epoch": 1.56, "learning_rate": 1.947910511575175e-05, "loss": 0.0104, "step": 108470 }, { "epoch": 1.56, "learning_rate": 1.947905707601328e-05, "loss": 0.0098, "step": 108480 }, { "epoch": 1.56, "learning_rate": 1.947900903627481e-05, "loss": 0.0109, "step": 108490 }, { "epoch": 1.56, "learning_rate": 1.9478960996536334e-05, "loss": 0.013, "step": 108500 }, { "epoch": 1.56, "learning_rate": 1.9478912956797863e-05, "loss": 0.012, "step": 108510 }, { "epoch": 1.56, "learning_rate": 1.9478864917059393e-05, "loss": 0.0134, "step": 108520 }, { "epoch": 1.56, "learning_rate": 1.9478816877320922e-05, "loss": 0.0131, "step": 108530 }, { "epoch": 1.56, "learning_rate": 1.9478768837582448e-05, "loss": 0.0112, "step": 108540 }, { "epoch": 1.56, "learning_rate": 1.9478720797843977e-05, "loss": 0.0087, "step": 108550 }, { "epoch": 1.56, "learning_rate": 1.9478672758105506e-05, "loss": 0.0112, "step": 108560 }, { "epoch": 1.56, "learning_rate": 1.9478624718367036e-05, "loss": 0.012, "step": 108570 }, { "epoch": 1.56, "learning_rate": 1.947857667862856e-05, "loss": 0.0107, "step": 108580 }, { "epoch": 1.56, "learning_rate": 1.947852863889009e-05, "loss": 0.0124, "step": 108590 }, { "epoch": 1.57, "learning_rate": 1.947848059915162e-05, "loss": 0.0136, "step": 108600 }, { "epoch": 1.57, "learning_rate": 1.9478432559413146e-05, "loss": 0.0102, "step": 108610 }, { "epoch": 1.57, "learning_rate": 1.9478384519674675e-05, "loss": 0.0122, "step": 108620 }, { "epoch": 1.57, "learning_rate": 1.9478336479936205e-05, "loss": 0.0121, "step": 108630 }, { "epoch": 1.57, "learning_rate": 1.9478288440197734e-05, "loss": 0.0135, "step": 108640 }, { "epoch": 1.57, "learning_rate": 1.947824040045926e-05, "loss": 0.0118, "step": 108650 }, { "epoch": 1.57, "learning_rate": 1.947819236072079e-05, "loss": 0.0116, "step": 108660 }, { "epoch": 1.57, "learning_rate": 1.9478144320982318e-05, "loss": 0.0113, "step": 108670 }, { "epoch": 1.57, "learning_rate": 1.9478096281243844e-05, "loss": 0.0107, "step": 108680 }, { "epoch": 1.57, "learning_rate": 1.9478048241505373e-05, "loss": 0.0105, "step": 108690 }, { "epoch": 1.57, "learning_rate": 1.9478000201766903e-05, "loss": 0.01, "step": 108700 }, { "epoch": 1.57, "learning_rate": 1.9477952162028432e-05, "loss": 0.0097, "step": 108710 }, { "epoch": 1.57, "learning_rate": 1.9477904122289958e-05, "loss": 0.0167, "step": 108720 }, { "epoch": 1.57, "learning_rate": 1.9477856082551487e-05, "loss": 0.0108, "step": 108730 }, { "epoch": 1.57, "learning_rate": 1.9477808042813016e-05, "loss": 0.0107, "step": 108740 }, { "epoch": 1.57, "learning_rate": 1.9477760003074546e-05, "loss": 0.0133, "step": 108750 }, { "epoch": 1.57, "learning_rate": 1.947771196333607e-05, "loss": 0.0104, "step": 108760 }, { "epoch": 1.57, "learning_rate": 1.94776639235976e-05, "loss": 0.0132, "step": 108770 }, { "epoch": 1.57, "learning_rate": 1.947761588385913e-05, "loss": 0.0098, "step": 108780 }, { "epoch": 1.57, "learning_rate": 1.9477567844120656e-05, "loss": 0.0129, "step": 108790 }, { "epoch": 1.57, "learning_rate": 1.9477519804382185e-05, "loss": 0.013, "step": 108800 }, { "epoch": 1.57, "learning_rate": 1.9477471764643714e-05, "loss": 0.0101, "step": 108810 }, { "epoch": 1.57, "learning_rate": 1.9477423724905244e-05, "loss": 0.0117, "step": 108820 }, { "epoch": 1.57, "learning_rate": 1.947737568516677e-05, "loss": 0.0097, "step": 108830 }, { "epoch": 1.57, "learning_rate": 1.94773276454283e-05, "loss": 0.0117, "step": 108840 }, { "epoch": 1.57, "learning_rate": 1.9477279605689828e-05, "loss": 0.0097, "step": 108850 }, { "epoch": 1.57, "learning_rate": 1.9477231565951354e-05, "loss": 0.0151, "step": 108860 }, { "epoch": 1.57, "learning_rate": 1.9477183526212883e-05, "loss": 0.013, "step": 108870 }, { "epoch": 1.57, "learning_rate": 1.9477135486474413e-05, "loss": 0.0111, "step": 108880 }, { "epoch": 1.57, "learning_rate": 1.9477087446735942e-05, "loss": 0.0099, "step": 108890 }, { "epoch": 1.57, "learning_rate": 1.9477039406997468e-05, "loss": 0.0139, "step": 108900 }, { "epoch": 1.57, "learning_rate": 1.9476991367258997e-05, "loss": 0.0101, "step": 108910 }, { "epoch": 1.57, "learning_rate": 1.9476943327520526e-05, "loss": 0.0101, "step": 108920 }, { "epoch": 1.57, "learning_rate": 1.9476895287782052e-05, "loss": 0.0113, "step": 108930 }, { "epoch": 1.57, "learning_rate": 1.947684724804358e-05, "loss": 0.0098, "step": 108940 }, { "epoch": 1.57, "learning_rate": 1.947679920830511e-05, "loss": 0.0116, "step": 108950 }, { "epoch": 1.57, "learning_rate": 1.947675116856664e-05, "loss": 0.0091, "step": 108960 }, { "epoch": 1.57, "learning_rate": 1.9476703128828166e-05, "loss": 0.0127, "step": 108970 }, { "epoch": 1.57, "learning_rate": 1.9476655089089695e-05, "loss": 0.0115, "step": 108980 }, { "epoch": 1.57, "learning_rate": 1.9476607049351224e-05, "loss": 0.0103, "step": 108990 }, { "epoch": 1.57, "learning_rate": 1.9476559009612754e-05, "loss": 0.0108, "step": 109000 }, { "epoch": 1.57, "learning_rate": 1.9476510969874283e-05, "loss": 0.0098, "step": 109010 }, { "epoch": 1.57, "learning_rate": 1.9476462930135812e-05, "loss": 0.0092, "step": 109020 }, { "epoch": 1.57, "learning_rate": 1.9476414890397338e-05, "loss": 0.0107, "step": 109030 }, { "epoch": 1.57, "learning_rate": 1.9476366850658867e-05, "loss": 0.0124, "step": 109040 }, { "epoch": 1.57, "learning_rate": 1.9476318810920397e-05, "loss": 0.0105, "step": 109050 }, { "epoch": 1.57, "learning_rate": 1.9476270771181926e-05, "loss": 0.0121, "step": 109060 }, { "epoch": 1.57, "learning_rate": 1.9476222731443452e-05, "loss": 0.0145, "step": 109070 }, { "epoch": 1.57, "learning_rate": 1.947617469170498e-05, "loss": 0.0101, "step": 109080 }, { "epoch": 1.57, "learning_rate": 1.947612665196651e-05, "loss": 0.0106, "step": 109090 }, { "epoch": 1.57, "learning_rate": 1.9476078612228036e-05, "loss": 0.0131, "step": 109100 }, { "epoch": 1.57, "learning_rate": 1.9476030572489565e-05, "loss": 0.0152, "step": 109110 }, { "epoch": 1.57, "learning_rate": 1.9475982532751095e-05, "loss": 0.0115, "step": 109120 }, { "epoch": 1.57, "learning_rate": 1.9475934493012624e-05, "loss": 0.0124, "step": 109130 }, { "epoch": 1.57, "learning_rate": 1.947588645327415e-05, "loss": 0.0098, "step": 109140 }, { "epoch": 1.57, "learning_rate": 1.947583841353568e-05, "loss": 0.0092, "step": 109150 }, { "epoch": 1.57, "learning_rate": 1.947579037379721e-05, "loss": 0.0119, "step": 109160 }, { "epoch": 1.57, "learning_rate": 1.9475742334058734e-05, "loss": 0.0113, "step": 109170 }, { "epoch": 1.57, "learning_rate": 1.9475694294320264e-05, "loss": 0.0109, "step": 109180 }, { "epoch": 1.57, "learning_rate": 1.9475646254581793e-05, "loss": 0.0101, "step": 109190 }, { "epoch": 1.57, "learning_rate": 1.9475598214843322e-05, "loss": 0.0079, "step": 109200 }, { "epoch": 1.57, "learning_rate": 1.9475550175104848e-05, "loss": 0.0108, "step": 109210 }, { "epoch": 1.57, "learning_rate": 1.9475502135366377e-05, "loss": 0.0085, "step": 109220 }, { "epoch": 1.57, "learning_rate": 1.9475454095627907e-05, "loss": 0.0104, "step": 109230 }, { "epoch": 1.57, "learning_rate": 1.9475406055889436e-05, "loss": 0.0128, "step": 109240 }, { "epoch": 1.57, "learning_rate": 1.947535801615096e-05, "loss": 0.0124, "step": 109250 }, { "epoch": 1.57, "learning_rate": 1.947530997641249e-05, "loss": 0.0106, "step": 109260 }, { "epoch": 1.57, "learning_rate": 1.947526193667402e-05, "loss": 0.0122, "step": 109270 }, { "epoch": 1.57, "learning_rate": 1.9475213896935546e-05, "loss": 0.0116, "step": 109280 }, { "epoch": 1.58, "learning_rate": 1.9475165857197075e-05, "loss": 0.0107, "step": 109290 }, { "epoch": 1.58, "learning_rate": 1.9475117817458605e-05, "loss": 0.0119, "step": 109300 }, { "epoch": 1.58, "learning_rate": 1.9475069777720134e-05, "loss": 0.0109, "step": 109310 }, { "epoch": 1.58, "learning_rate": 1.947502173798166e-05, "loss": 0.0067, "step": 109320 }, { "epoch": 1.58, "learning_rate": 1.947497369824319e-05, "loss": 0.0094, "step": 109330 }, { "epoch": 1.58, "learning_rate": 1.947492565850472e-05, "loss": 0.013, "step": 109340 }, { "epoch": 1.58, "learning_rate": 1.9474877618766244e-05, "loss": 0.008, "step": 109350 }, { "epoch": 1.58, "learning_rate": 1.9474829579027773e-05, "loss": 0.0097, "step": 109360 }, { "epoch": 1.58, "learning_rate": 1.9474781539289303e-05, "loss": 0.0097, "step": 109370 }, { "epoch": 1.58, "learning_rate": 1.9474733499550832e-05, "loss": 0.009, "step": 109380 }, { "epoch": 1.58, "learning_rate": 1.9474685459812358e-05, "loss": 0.0129, "step": 109390 }, { "epoch": 1.58, "learning_rate": 1.9474637420073887e-05, "loss": 0.0118, "step": 109400 }, { "epoch": 1.58, "learning_rate": 1.9474589380335416e-05, "loss": 0.0083, "step": 109410 }, { "epoch": 1.58, "learning_rate": 1.9474541340596946e-05, "loss": 0.0117, "step": 109420 }, { "epoch": 1.58, "learning_rate": 1.947449330085847e-05, "loss": 0.0115, "step": 109430 }, { "epoch": 1.58, "learning_rate": 1.947444526112e-05, "loss": 0.0102, "step": 109440 }, { "epoch": 1.58, "learning_rate": 1.947439722138153e-05, "loss": 0.0098, "step": 109450 }, { "epoch": 1.58, "learning_rate": 1.9474349181643056e-05, "loss": 0.0092, "step": 109460 }, { "epoch": 1.58, "learning_rate": 1.9474301141904585e-05, "loss": 0.0113, "step": 109470 }, { "epoch": 1.58, "learning_rate": 1.9474253102166115e-05, "loss": 0.0082, "step": 109480 }, { "epoch": 1.58, "learning_rate": 1.9474205062427644e-05, "loss": 0.0109, "step": 109490 }, { "epoch": 1.58, "learning_rate": 1.947415702268917e-05, "loss": 0.0073, "step": 109500 }, { "epoch": 1.58, "learning_rate": 1.94741089829507e-05, "loss": 0.0083, "step": 109510 }, { "epoch": 1.58, "learning_rate": 1.9474060943212228e-05, "loss": 0.0101, "step": 109520 }, { "epoch": 1.58, "learning_rate": 1.9474012903473754e-05, "loss": 0.0108, "step": 109530 }, { "epoch": 1.58, "learning_rate": 1.9473964863735283e-05, "loss": 0.0107, "step": 109540 }, { "epoch": 1.58, "learning_rate": 1.9473916823996813e-05, "loss": 0.0126, "step": 109550 }, { "epoch": 1.58, "learning_rate": 1.9473868784258342e-05, "loss": 0.0125, "step": 109560 }, { "epoch": 1.58, "learning_rate": 1.9473820744519868e-05, "loss": 0.0123, "step": 109570 }, { "epoch": 1.58, "learning_rate": 1.9473772704781397e-05, "loss": 0.0135, "step": 109580 }, { "epoch": 1.58, "learning_rate": 1.9473724665042926e-05, "loss": 0.0133, "step": 109590 }, { "epoch": 1.58, "learning_rate": 1.9473676625304456e-05, "loss": 0.0111, "step": 109600 }, { "epoch": 1.58, "learning_rate": 1.947362858556598e-05, "loss": 0.009, "step": 109610 }, { "epoch": 1.58, "learning_rate": 1.947358054582751e-05, "loss": 0.0108, "step": 109620 }, { "epoch": 1.58, "learning_rate": 1.947353250608904e-05, "loss": 0.0128, "step": 109630 }, { "epoch": 1.58, "learning_rate": 1.9473484466350566e-05, "loss": 0.0094, "step": 109640 }, { "epoch": 1.58, "learning_rate": 1.9473436426612095e-05, "loss": 0.0129, "step": 109650 }, { "epoch": 1.58, "learning_rate": 1.9473388386873624e-05, "loss": 0.0128, "step": 109660 }, { "epoch": 1.58, "learning_rate": 1.9473340347135154e-05, "loss": 0.0072, "step": 109670 }, { "epoch": 1.58, "learning_rate": 1.947329230739668e-05, "loss": 0.0093, "step": 109680 }, { "epoch": 1.58, "learning_rate": 1.947324426765821e-05, "loss": 0.0096, "step": 109690 }, { "epoch": 1.58, "learning_rate": 1.9473196227919738e-05, "loss": 0.0073, "step": 109700 }, { "epoch": 1.58, "learning_rate": 1.9473148188181264e-05, "loss": 0.0086, "step": 109710 }, { "epoch": 1.58, "learning_rate": 1.9473100148442793e-05, "loss": 0.0088, "step": 109720 }, { "epoch": 1.58, "learning_rate": 1.9473052108704323e-05, "loss": 0.0103, "step": 109730 }, { "epoch": 1.58, "learning_rate": 1.9473004068965852e-05, "loss": 0.0109, "step": 109740 }, { "epoch": 1.58, "learning_rate": 1.9472956029227378e-05, "loss": 0.0105, "step": 109750 }, { "epoch": 1.58, "learning_rate": 1.9472907989488907e-05, "loss": 0.0176, "step": 109760 }, { "epoch": 1.58, "learning_rate": 1.9472859949750436e-05, "loss": 0.0117, "step": 109770 }, { "epoch": 1.58, "learning_rate": 1.9472811910011966e-05, "loss": 0.0131, "step": 109780 }, { "epoch": 1.58, "learning_rate": 1.947276387027349e-05, "loss": 0.0099, "step": 109790 }, { "epoch": 1.58, "learning_rate": 1.947271583053502e-05, "loss": 0.0147, "step": 109800 }, { "epoch": 1.58, "learning_rate": 1.947266779079655e-05, "loss": 0.0153, "step": 109810 }, { "epoch": 1.58, "learning_rate": 1.9472619751058076e-05, "loss": 0.0098, "step": 109820 }, { "epoch": 1.58, "learning_rate": 1.9472571711319605e-05, "loss": 0.0091, "step": 109830 }, { "epoch": 1.58, "learning_rate": 1.9472523671581134e-05, "loss": 0.0146, "step": 109840 }, { "epoch": 1.58, "learning_rate": 1.9472475631842664e-05, "loss": 0.0081, "step": 109850 }, { "epoch": 1.58, "learning_rate": 1.947242759210419e-05, "loss": 0.0124, "step": 109860 }, { "epoch": 1.58, "learning_rate": 1.947237955236572e-05, "loss": 0.015, "step": 109870 }, { "epoch": 1.58, "learning_rate": 1.9472331512627248e-05, "loss": 0.0113, "step": 109880 }, { "epoch": 1.58, "learning_rate": 1.9472283472888774e-05, "loss": 0.0084, "step": 109890 }, { "epoch": 1.58, "learning_rate": 1.9472235433150303e-05, "loss": 0.0106, "step": 109900 }, { "epoch": 1.58, "learning_rate": 1.9472187393411833e-05, "loss": 0.0101, "step": 109910 }, { "epoch": 1.58, "learning_rate": 1.9472139353673362e-05, "loss": 0.01, "step": 109920 }, { "epoch": 1.58, "learning_rate": 1.9472091313934888e-05, "loss": 0.0118, "step": 109930 }, { "epoch": 1.58, "learning_rate": 1.9472043274196417e-05, "loss": 0.0087, "step": 109940 }, { "epoch": 1.58, "learning_rate": 1.9471995234457946e-05, "loss": 0.0087, "step": 109950 }, { "epoch": 1.58, "learning_rate": 1.9471947194719475e-05, "loss": 0.0125, "step": 109960 }, { "epoch": 1.58, "learning_rate": 1.9471899154981e-05, "loss": 0.0095, "step": 109970 }, { "epoch": 1.59, "learning_rate": 1.947185111524253e-05, "loss": 0.0103, "step": 109980 }, { "epoch": 1.59, "learning_rate": 1.947180307550406e-05, "loss": 0.0087, "step": 109990 }, { "epoch": 1.59, "learning_rate": 1.9471755035765586e-05, "loss": 0.0109, "step": 110000 }, { "epoch": 1.59, "learning_rate": 1.9471706996027115e-05, "loss": 0.0115, "step": 110010 }, { "epoch": 1.59, "learning_rate": 1.9471658956288644e-05, "loss": 0.0133, "step": 110020 }, { "epoch": 1.59, "learning_rate": 1.9471610916550174e-05, "loss": 0.0107, "step": 110030 }, { "epoch": 1.59, "learning_rate": 1.94715628768117e-05, "loss": 0.0098, "step": 110040 }, { "epoch": 1.59, "learning_rate": 1.947151483707323e-05, "loss": 0.012, "step": 110050 }, { "epoch": 1.59, "learning_rate": 1.9471466797334758e-05, "loss": 0.0087, "step": 110060 }, { "epoch": 1.59, "learning_rate": 1.9471418757596284e-05, "loss": 0.0098, "step": 110070 }, { "epoch": 1.59, "learning_rate": 1.9471370717857813e-05, "loss": 0.0094, "step": 110080 }, { "epoch": 1.59, "learning_rate": 1.9471322678119342e-05, "loss": 0.0102, "step": 110090 }, { "epoch": 1.59, "learning_rate": 1.947127463838087e-05, "loss": 0.013, "step": 110100 }, { "epoch": 1.59, "learning_rate": 1.9471226598642398e-05, "loss": 0.0123, "step": 110110 }, { "epoch": 1.59, "learning_rate": 1.9471178558903927e-05, "loss": 0.0117, "step": 110120 }, { "epoch": 1.59, "learning_rate": 1.9471130519165456e-05, "loss": 0.01, "step": 110130 }, { "epoch": 1.59, "learning_rate": 1.9471082479426985e-05, "loss": 0.0114, "step": 110140 }, { "epoch": 1.59, "learning_rate": 1.947103443968851e-05, "loss": 0.0114, "step": 110150 }, { "epoch": 1.59, "learning_rate": 1.947098639995004e-05, "loss": 0.0142, "step": 110160 }, { "epoch": 1.59, "learning_rate": 1.947093836021157e-05, "loss": 0.0108, "step": 110170 }, { "epoch": 1.59, "learning_rate": 1.9470890320473096e-05, "loss": 0.0106, "step": 110180 }, { "epoch": 1.59, "learning_rate": 1.9470842280734625e-05, "loss": 0.0105, "step": 110190 }, { "epoch": 1.59, "learning_rate": 1.9470794240996154e-05, "loss": 0.0099, "step": 110200 }, { "epoch": 1.59, "learning_rate": 1.9470746201257683e-05, "loss": 0.0117, "step": 110210 }, { "epoch": 1.59, "learning_rate": 1.947069816151921e-05, "loss": 0.0108, "step": 110220 }, { "epoch": 1.59, "learning_rate": 1.947065012178074e-05, "loss": 0.0103, "step": 110230 }, { "epoch": 1.59, "learning_rate": 1.9470606886016113e-05, "loss": 0.0108, "step": 110240 }, { "epoch": 1.59, "learning_rate": 1.9470558846277643e-05, "loss": 0.0116, "step": 110250 }, { "epoch": 1.59, "learning_rate": 1.9470510806539172e-05, "loss": 0.0115, "step": 110260 }, { "epoch": 1.59, "learning_rate": 1.94704627668007e-05, "loss": 0.0121, "step": 110270 }, { "epoch": 1.59, "learning_rate": 1.9470414727062227e-05, "loss": 0.0118, "step": 110280 }, { "epoch": 1.59, "learning_rate": 1.9470366687323756e-05, "loss": 0.011, "step": 110290 }, { "epoch": 1.59, "learning_rate": 1.9470318647585286e-05, "loss": 0.0121, "step": 110300 }, { "epoch": 1.59, "learning_rate": 1.947027060784681e-05, "loss": 0.0102, "step": 110310 }, { "epoch": 1.59, "learning_rate": 1.947022256810834e-05, "loss": 0.0163, "step": 110320 }, { "epoch": 1.59, "learning_rate": 1.947017452836987e-05, "loss": 0.0131, "step": 110330 }, { "epoch": 1.59, "learning_rate": 1.94701264886314e-05, "loss": 0.0099, "step": 110340 }, { "epoch": 1.59, "learning_rate": 1.9470078448892925e-05, "loss": 0.0134, "step": 110350 }, { "epoch": 1.59, "learning_rate": 1.9470030409154454e-05, "loss": 0.0121, "step": 110360 }, { "epoch": 1.59, "learning_rate": 1.9469982369415984e-05, "loss": 0.0134, "step": 110370 }, { "epoch": 1.59, "learning_rate": 1.946993432967751e-05, "loss": 0.0087, "step": 110380 }, { "epoch": 1.59, "learning_rate": 1.946988628993904e-05, "loss": 0.0081, "step": 110390 }, { "epoch": 1.59, "learning_rate": 1.9469838250200568e-05, "loss": 0.0066, "step": 110400 }, { "epoch": 1.59, "learning_rate": 1.9469790210462097e-05, "loss": 0.0112, "step": 110410 }, { "epoch": 1.59, "learning_rate": 1.9469742170723623e-05, "loss": 0.0162, "step": 110420 }, { "epoch": 1.59, "learning_rate": 1.9469694130985152e-05, "loss": 0.0112, "step": 110430 }, { "epoch": 1.59, "learning_rate": 1.9469646091246682e-05, "loss": 0.0113, "step": 110440 }, { "epoch": 1.59, "learning_rate": 1.946959805150821e-05, "loss": 0.0126, "step": 110450 }, { "epoch": 1.59, "learning_rate": 1.9469550011769737e-05, "loss": 0.0104, "step": 110460 }, { "epoch": 1.59, "learning_rate": 1.9469501972031266e-05, "loss": 0.0099, "step": 110470 }, { "epoch": 1.59, "learning_rate": 1.9469453932292795e-05, "loss": 0.0093, "step": 110480 }, { "epoch": 1.59, "learning_rate": 1.946940589255432e-05, "loss": 0.0117, "step": 110490 }, { "epoch": 1.59, "learning_rate": 1.946935785281585e-05, "loss": 0.0107, "step": 110500 }, { "epoch": 1.59, "learning_rate": 1.946930981307738e-05, "loss": 0.0084, "step": 110510 }, { "epoch": 1.59, "learning_rate": 1.946926177333891e-05, "loss": 0.0131, "step": 110520 }, { "epoch": 1.59, "learning_rate": 1.9469213733600435e-05, "loss": 0.0126, "step": 110530 }, { "epoch": 1.59, "learning_rate": 1.9469165693861964e-05, "loss": 0.0128, "step": 110540 }, { "epoch": 1.59, "learning_rate": 1.9469117654123494e-05, "loss": 0.0111, "step": 110550 }, { "epoch": 1.59, "learning_rate": 1.946906961438502e-05, "loss": 0.012, "step": 110560 }, { "epoch": 1.59, "learning_rate": 1.946902157464655e-05, "loss": 0.013, "step": 110570 }, { "epoch": 1.59, "learning_rate": 1.9468973534908078e-05, "loss": 0.0086, "step": 110580 }, { "epoch": 1.59, "learning_rate": 1.9468925495169607e-05, "loss": 0.0095, "step": 110590 }, { "epoch": 1.59, "learning_rate": 1.9468877455431133e-05, "loss": 0.0101, "step": 110600 }, { "epoch": 1.59, "learning_rate": 1.9468829415692662e-05, "loss": 0.0093, "step": 110610 }, { "epoch": 1.59, "learning_rate": 1.946878137595419e-05, "loss": 0.0105, "step": 110620 }, { "epoch": 1.59, "learning_rate": 1.946873333621572e-05, "loss": 0.0108, "step": 110630 }, { "epoch": 1.59, "learning_rate": 1.9468685296477247e-05, "loss": 0.014, "step": 110640 }, { "epoch": 1.59, "learning_rate": 1.9468637256738776e-05, "loss": 0.0102, "step": 110650 }, { "epoch": 1.59, "learning_rate": 1.9468589217000305e-05, "loss": 0.0089, "step": 110660 }, { "epoch": 1.59, "learning_rate": 1.946854117726183e-05, "loss": 0.0097, "step": 110670 }, { "epoch": 1.6, "learning_rate": 1.946849313752336e-05, "loss": 0.0086, "step": 110680 }, { "epoch": 1.6, "learning_rate": 1.946844509778489e-05, "loss": 0.0119, "step": 110690 }, { "epoch": 1.6, "learning_rate": 1.946839705804642e-05, "loss": 0.009, "step": 110700 }, { "epoch": 1.6, "learning_rate": 1.9468349018307945e-05, "loss": 0.0098, "step": 110710 }, { "epoch": 1.6, "learning_rate": 1.9468300978569474e-05, "loss": 0.0082, "step": 110720 }, { "epoch": 1.6, "learning_rate": 1.9468252938831003e-05, "loss": 0.014, "step": 110730 }, { "epoch": 1.6, "learning_rate": 1.946820489909253e-05, "loss": 0.0108, "step": 110740 }, { "epoch": 1.6, "learning_rate": 1.946815685935406e-05, "loss": 0.0116, "step": 110750 }, { "epoch": 1.6, "learning_rate": 1.9468108819615588e-05, "loss": 0.0122, "step": 110760 }, { "epoch": 1.6, "learning_rate": 1.9468060779877117e-05, "loss": 0.0128, "step": 110770 }, { "epoch": 1.6, "learning_rate": 1.9468012740138643e-05, "loss": 0.0098, "step": 110780 }, { "epoch": 1.6, "learning_rate": 1.9467964700400172e-05, "loss": 0.0111, "step": 110790 }, { "epoch": 1.6, "learning_rate": 1.94679166606617e-05, "loss": 0.0135, "step": 110800 }, { "epoch": 1.6, "learning_rate": 1.946786862092323e-05, "loss": 0.0122, "step": 110810 }, { "epoch": 1.6, "learning_rate": 1.9467820581184757e-05, "loss": 0.008, "step": 110820 }, { "epoch": 1.6, "learning_rate": 1.9467772541446286e-05, "loss": 0.0109, "step": 110830 }, { "epoch": 1.6, "learning_rate": 1.9467724501707815e-05, "loss": 0.0093, "step": 110840 }, { "epoch": 1.6, "learning_rate": 1.946767646196934e-05, "loss": 0.011, "step": 110850 }, { "epoch": 1.6, "learning_rate": 1.946762842223087e-05, "loss": 0.0129, "step": 110860 }, { "epoch": 1.6, "learning_rate": 1.94675803824924e-05, "loss": 0.0082, "step": 110870 }, { "epoch": 1.6, "learning_rate": 1.946753234275393e-05, "loss": 0.0134, "step": 110880 }, { "epoch": 1.6, "learning_rate": 1.9467484303015455e-05, "loss": 0.0141, "step": 110890 }, { "epoch": 1.6, "learning_rate": 1.9467436263276984e-05, "loss": 0.0087, "step": 110900 }, { "epoch": 1.6, "learning_rate": 1.9467388223538513e-05, "loss": 0.0151, "step": 110910 }, { "epoch": 1.6, "learning_rate": 1.946734018380004e-05, "loss": 0.0095, "step": 110920 }, { "epoch": 1.6, "learning_rate": 1.946729214406157e-05, "loss": 0.0146, "step": 110930 }, { "epoch": 1.6, "learning_rate": 1.9467244104323098e-05, "loss": 0.0122, "step": 110940 }, { "epoch": 1.6, "learning_rate": 1.9467196064584627e-05, "loss": 0.0128, "step": 110950 }, { "epoch": 1.6, "learning_rate": 1.9467148024846153e-05, "loss": 0.0094, "step": 110960 }, { "epoch": 1.6, "learning_rate": 1.9467099985107682e-05, "loss": 0.008, "step": 110970 }, { "epoch": 1.6, "learning_rate": 1.946705194536921e-05, "loss": 0.0111, "step": 110980 }, { "epoch": 1.6, "learning_rate": 1.946700390563074e-05, "loss": 0.01, "step": 110990 }, { "epoch": 1.6, "learning_rate": 1.9466955865892267e-05, "loss": 0.009, "step": 111000 }, { "epoch": 1.6, "learning_rate": 1.9466907826153796e-05, "loss": 0.0094, "step": 111010 }, { "epoch": 1.6, "learning_rate": 1.9466859786415325e-05, "loss": 0.0153, "step": 111020 }, { "epoch": 1.6, "learning_rate": 1.946681174667685e-05, "loss": 0.0123, "step": 111030 }, { "epoch": 1.6, "learning_rate": 1.946676370693838e-05, "loss": 0.0103, "step": 111040 }, { "epoch": 1.6, "learning_rate": 1.946671566719991e-05, "loss": 0.014, "step": 111050 }, { "epoch": 1.6, "learning_rate": 1.946666762746144e-05, "loss": 0.009, "step": 111060 }, { "epoch": 1.6, "learning_rate": 1.9466619587722965e-05, "loss": 0.0106, "step": 111070 }, { "epoch": 1.6, "learning_rate": 1.9466571547984494e-05, "loss": 0.0082, "step": 111080 }, { "epoch": 1.6, "learning_rate": 1.9466523508246023e-05, "loss": 0.0157, "step": 111090 }, { "epoch": 1.6, "learning_rate": 1.946647546850755e-05, "loss": 0.0096, "step": 111100 }, { "epoch": 1.6, "learning_rate": 1.946642742876908e-05, "loss": 0.011, "step": 111110 }, { "epoch": 1.6, "learning_rate": 1.9466379389030608e-05, "loss": 0.0096, "step": 111120 }, { "epoch": 1.6, "learning_rate": 1.9466331349292137e-05, "loss": 0.0119, "step": 111130 }, { "epoch": 1.6, "learning_rate": 1.9466283309553663e-05, "loss": 0.0099, "step": 111140 }, { "epoch": 1.6, "learning_rate": 1.9466235269815192e-05, "loss": 0.0104, "step": 111150 }, { "epoch": 1.6, "learning_rate": 1.946618723007672e-05, "loss": 0.0125, "step": 111160 }, { "epoch": 1.6, "learning_rate": 1.946613919033825e-05, "loss": 0.016, "step": 111170 }, { "epoch": 1.6, "learning_rate": 1.9466091150599777e-05, "loss": 0.0109, "step": 111180 }, { "epoch": 1.6, "learning_rate": 1.9466043110861306e-05, "loss": 0.015, "step": 111190 }, { "epoch": 1.6, "learning_rate": 1.9465995071122835e-05, "loss": 0.0056, "step": 111200 }, { "epoch": 1.6, "learning_rate": 1.946594703138436e-05, "loss": 0.0093, "step": 111210 }, { "epoch": 1.6, "learning_rate": 1.946589899164589e-05, "loss": 0.011, "step": 111220 }, { "epoch": 1.6, "learning_rate": 1.946585095190742e-05, "loss": 0.0157, "step": 111230 }, { "epoch": 1.6, "learning_rate": 1.946580291216895e-05, "loss": 0.0108, "step": 111240 }, { "epoch": 1.6, "learning_rate": 1.9465754872430475e-05, "loss": 0.0123, "step": 111250 }, { "epoch": 1.6, "learning_rate": 1.9465706832692004e-05, "loss": 0.0115, "step": 111260 }, { "epoch": 1.6, "learning_rate": 1.9465658792953533e-05, "loss": 0.012, "step": 111270 }, { "epoch": 1.6, "learning_rate": 1.946561075321506e-05, "loss": 0.009, "step": 111280 }, { "epoch": 1.6, "learning_rate": 1.946556271347659e-05, "loss": 0.0125, "step": 111290 }, { "epoch": 1.6, "learning_rate": 1.9465514673738118e-05, "loss": 0.013, "step": 111300 }, { "epoch": 1.6, "learning_rate": 1.9465466633999647e-05, "loss": 0.0136, "step": 111310 }, { "epoch": 1.6, "learning_rate": 1.9465418594261173e-05, "loss": 0.0094, "step": 111320 }, { "epoch": 1.6, "learning_rate": 1.9465370554522702e-05, "loss": 0.0081, "step": 111330 }, { "epoch": 1.6, "learning_rate": 1.946532251478423e-05, "loss": 0.0111, "step": 111340 }, { "epoch": 1.6, "learning_rate": 1.946527447504576e-05, "loss": 0.0086, "step": 111350 }, { "epoch": 1.6, "learning_rate": 1.9465226435307286e-05, "loss": 0.0086, "step": 111360 }, { "epoch": 1.61, "learning_rate": 1.9465178395568816e-05, "loss": 0.0091, "step": 111370 }, { "epoch": 1.61, "learning_rate": 1.9465130355830345e-05, "loss": 0.0122, "step": 111380 }, { "epoch": 1.61, "learning_rate": 1.946508231609187e-05, "loss": 0.0078, "step": 111390 }, { "epoch": 1.61, "learning_rate": 1.94650342763534e-05, "loss": 0.0105, "step": 111400 }, { "epoch": 1.61, "learning_rate": 1.946498623661493e-05, "loss": 0.0094, "step": 111410 }, { "epoch": 1.61, "learning_rate": 1.946493819687646e-05, "loss": 0.0106, "step": 111420 }, { "epoch": 1.61, "learning_rate": 1.9464890157137985e-05, "loss": 0.0085, "step": 111430 }, { "epoch": 1.61, "learning_rate": 1.9464842117399514e-05, "loss": 0.0138, "step": 111440 }, { "epoch": 1.61, "learning_rate": 1.9464794077661043e-05, "loss": 0.0086, "step": 111450 }, { "epoch": 1.61, "learning_rate": 1.946474603792257e-05, "loss": 0.0105, "step": 111460 }, { "epoch": 1.61, "learning_rate": 1.9464697998184098e-05, "loss": 0.0113, "step": 111470 }, { "epoch": 1.61, "learning_rate": 1.9464649958445628e-05, "loss": 0.0122, "step": 111480 }, { "epoch": 1.61, "learning_rate": 1.9464601918707157e-05, "loss": 0.0104, "step": 111490 }, { "epoch": 1.61, "learning_rate": 1.9464553878968683e-05, "loss": 0.0108, "step": 111500 }, { "epoch": 1.61, "learning_rate": 1.9464505839230212e-05, "loss": 0.0075, "step": 111510 }, { "epoch": 1.61, "learning_rate": 1.946445779949174e-05, "loss": 0.014, "step": 111520 }, { "epoch": 1.61, "learning_rate": 1.946440975975327e-05, "loss": 0.0123, "step": 111530 }, { "epoch": 1.61, "learning_rate": 1.9464361720014796e-05, "loss": 0.0147, "step": 111540 }, { "epoch": 1.61, "learning_rate": 1.9464313680276326e-05, "loss": 0.0088, "step": 111550 }, { "epoch": 1.61, "learning_rate": 1.9464265640537855e-05, "loss": 0.0114, "step": 111560 }, { "epoch": 1.61, "learning_rate": 1.946421760079938e-05, "loss": 0.0134, "step": 111570 }, { "epoch": 1.61, "learning_rate": 1.946416956106091e-05, "loss": 0.0091, "step": 111580 }, { "epoch": 1.61, "learning_rate": 1.946412152132244e-05, "loss": 0.0126, "step": 111590 }, { "epoch": 1.61, "learning_rate": 1.946407348158397e-05, "loss": 0.0098, "step": 111600 }, { "epoch": 1.61, "learning_rate": 1.9464025441845494e-05, "loss": 0.0186, "step": 111610 }, { "epoch": 1.61, "learning_rate": 1.9463977402107024e-05, "loss": 0.0103, "step": 111620 }, { "epoch": 1.61, "learning_rate": 1.9463929362368553e-05, "loss": 0.0101, "step": 111630 }, { "epoch": 1.61, "learning_rate": 1.946388132263008e-05, "loss": 0.0092, "step": 111640 }, { "epoch": 1.61, "learning_rate": 1.9463833282891608e-05, "loss": 0.0164, "step": 111650 }, { "epoch": 1.61, "learning_rate": 1.9463785243153137e-05, "loss": 0.012, "step": 111660 }, { "epoch": 1.61, "learning_rate": 1.9463737203414667e-05, "loss": 0.0098, "step": 111670 }, { "epoch": 1.61, "learning_rate": 1.9463689163676193e-05, "loss": 0.0082, "step": 111680 }, { "epoch": 1.61, "learning_rate": 1.9463641123937722e-05, "loss": 0.0102, "step": 111690 }, { "epoch": 1.61, "learning_rate": 1.946359308419925e-05, "loss": 0.0105, "step": 111700 }, { "epoch": 1.61, "learning_rate": 1.946354504446078e-05, "loss": 0.0105, "step": 111710 }, { "epoch": 1.61, "learning_rate": 1.9463497004722306e-05, "loss": 0.0134, "step": 111720 }, { "epoch": 1.61, "learning_rate": 1.9463448964983836e-05, "loss": 0.009, "step": 111730 }, { "epoch": 1.61, "learning_rate": 1.9463400925245365e-05, "loss": 0.0102, "step": 111740 }, { "epoch": 1.61, "learning_rate": 1.946335288550689e-05, "loss": 0.0121, "step": 111750 }, { "epoch": 1.61, "learning_rate": 1.946330484576842e-05, "loss": 0.0137, "step": 111760 }, { "epoch": 1.61, "learning_rate": 1.946325680602995e-05, "loss": 0.0086, "step": 111770 }, { "epoch": 1.61, "learning_rate": 1.946320876629148e-05, "loss": 0.0102, "step": 111780 }, { "epoch": 1.61, "learning_rate": 1.9463160726553004e-05, "loss": 0.0105, "step": 111790 }, { "epoch": 1.61, "learning_rate": 1.9463112686814534e-05, "loss": 0.0095, "step": 111800 }, { "epoch": 1.61, "learning_rate": 1.9463064647076063e-05, "loss": 0.0082, "step": 111810 }, { "epoch": 1.61, "learning_rate": 1.946301660733759e-05, "loss": 0.0124, "step": 111820 }, { "epoch": 1.61, "learning_rate": 1.9462968567599118e-05, "loss": 0.0101, "step": 111830 }, { "epoch": 1.61, "learning_rate": 1.9462920527860647e-05, "loss": 0.0124, "step": 111840 }, { "epoch": 1.61, "learning_rate": 1.9462872488122177e-05, "loss": 0.0138, "step": 111850 }, { "epoch": 1.61, "learning_rate": 1.9462824448383703e-05, "loss": 0.0074, "step": 111860 }, { "epoch": 1.61, "learning_rate": 1.9462776408645232e-05, "loss": 0.0114, "step": 111870 }, { "epoch": 1.61, "learning_rate": 1.946272836890676e-05, "loss": 0.0078, "step": 111880 }, { "epoch": 1.61, "learning_rate": 1.946268032916829e-05, "loss": 0.0088, "step": 111890 }, { "epoch": 1.61, "learning_rate": 1.9462632289429816e-05, "loss": 0.0097, "step": 111900 }, { "epoch": 1.61, "learning_rate": 1.9462584249691345e-05, "loss": 0.0243, "step": 111910 }, { "epoch": 1.61, "learning_rate": 1.9462536209952875e-05, "loss": 0.0079, "step": 111920 }, { "epoch": 1.61, "learning_rate": 1.94624881702144e-05, "loss": 0.0125, "step": 111930 }, { "epoch": 1.61, "learning_rate": 1.946244013047593e-05, "loss": 0.0073, "step": 111940 }, { "epoch": 1.61, "learning_rate": 1.946239209073746e-05, "loss": 0.0112, "step": 111950 }, { "epoch": 1.61, "learning_rate": 1.946234405099899e-05, "loss": 0.0129, "step": 111960 }, { "epoch": 1.61, "learning_rate": 1.9462296011260514e-05, "loss": 0.0105, "step": 111970 }, { "epoch": 1.61, "learning_rate": 1.9462247971522044e-05, "loss": 0.0077, "step": 111980 }, { "epoch": 1.61, "learning_rate": 1.9462199931783573e-05, "loss": 0.009, "step": 111990 }, { "epoch": 1.61, "learning_rate": 1.94621518920451e-05, "loss": 0.01, "step": 112000 }, { "epoch": 1.61, "learning_rate": 1.9462103852306628e-05, "loss": 0.01, "step": 112010 }, { "epoch": 1.61, "learning_rate": 1.9462055812568157e-05, "loss": 0.0099, "step": 112020 }, { "epoch": 1.61, "learning_rate": 1.9462007772829687e-05, "loss": 0.0115, "step": 112030 }, { "epoch": 1.61, "learning_rate": 1.9461959733091212e-05, "loss": 0.0095, "step": 112040 }, { "epoch": 1.61, "learning_rate": 1.9461911693352742e-05, "loss": 0.0113, "step": 112050 }, { "epoch": 1.61, "learning_rate": 1.946186365361427e-05, "loss": 0.0128, "step": 112060 }, { "epoch": 1.62, "learning_rate": 1.94618156138758e-05, "loss": 0.0109, "step": 112070 }, { "epoch": 1.62, "learning_rate": 1.946176757413733e-05, "loss": 0.0088, "step": 112080 }, { "epoch": 1.62, "learning_rate": 1.946171953439886e-05, "loss": 0.0104, "step": 112090 }, { "epoch": 1.62, "learning_rate": 1.9461671494660385e-05, "loss": 0.0077, "step": 112100 }, { "epoch": 1.62, "learning_rate": 1.9461623454921914e-05, "loss": 0.0099, "step": 112110 }, { "epoch": 1.62, "learning_rate": 1.9461575415183443e-05, "loss": 0.0109, "step": 112120 }, { "epoch": 1.62, "learning_rate": 1.946152737544497e-05, "loss": 0.0099, "step": 112130 }, { "epoch": 1.62, "learning_rate": 1.94614793357065e-05, "loss": 0.011, "step": 112140 }, { "epoch": 1.62, "learning_rate": 1.9461431295968028e-05, "loss": 0.0144, "step": 112150 }, { "epoch": 1.62, "learning_rate": 1.9461383256229557e-05, "loss": 0.0101, "step": 112160 }, { "epoch": 1.62, "learning_rate": 1.9461335216491083e-05, "loss": 0.0127, "step": 112170 }, { "epoch": 1.62, "learning_rate": 1.9461287176752612e-05, "loss": 0.0116, "step": 112180 }, { "epoch": 1.62, "learning_rate": 1.946123913701414e-05, "loss": 0.0078, "step": 112190 }, { "epoch": 1.62, "learning_rate": 1.946119109727567e-05, "loss": 0.0105, "step": 112200 }, { "epoch": 1.62, "learning_rate": 1.9461143057537196e-05, "loss": 0.0116, "step": 112210 }, { "epoch": 1.62, "learning_rate": 1.9461095017798726e-05, "loss": 0.011, "step": 112220 }, { "epoch": 1.62, "learning_rate": 1.9461046978060255e-05, "loss": 0.0082, "step": 112230 }, { "epoch": 1.62, "learning_rate": 1.946099893832178e-05, "loss": 0.0088, "step": 112240 }, { "epoch": 1.62, "learning_rate": 1.946095089858331e-05, "loss": 0.0123, "step": 112250 }, { "epoch": 1.62, "learning_rate": 1.946090285884484e-05, "loss": 0.0092, "step": 112260 }, { "epoch": 1.62, "learning_rate": 1.946085481910637e-05, "loss": 0.0118, "step": 112270 }, { "epoch": 1.62, "learning_rate": 1.9460806779367895e-05, "loss": 0.0101, "step": 112280 }, { "epoch": 1.62, "learning_rate": 1.9460758739629424e-05, "loss": 0.0116, "step": 112290 }, { "epoch": 1.62, "learning_rate": 1.9460710699890953e-05, "loss": 0.0095, "step": 112300 }, { "epoch": 1.62, "learning_rate": 1.946066266015248e-05, "loss": 0.0093, "step": 112310 }, { "epoch": 1.62, "learning_rate": 1.9460614620414008e-05, "loss": 0.0118, "step": 112320 }, { "epoch": 1.62, "learning_rate": 1.9460566580675538e-05, "loss": 0.0117, "step": 112330 }, { "epoch": 1.62, "learning_rate": 1.9460518540937067e-05, "loss": 0.0076, "step": 112340 }, { "epoch": 1.62, "learning_rate": 1.9460470501198593e-05, "loss": 0.0136, "step": 112350 }, { "epoch": 1.62, "learning_rate": 1.9460422461460122e-05, "loss": 0.0121, "step": 112360 }, { "epoch": 1.62, "learning_rate": 1.946037442172165e-05, "loss": 0.0105, "step": 112370 }, { "epoch": 1.62, "learning_rate": 1.946032638198318e-05, "loss": 0.01, "step": 112380 }, { "epoch": 1.62, "learning_rate": 1.9460278342244706e-05, "loss": 0.0134, "step": 112390 }, { "epoch": 1.62, "learning_rate": 1.9460230302506236e-05, "loss": 0.009, "step": 112400 }, { "epoch": 1.62, "learning_rate": 1.9460182262767765e-05, "loss": 0.0147, "step": 112410 }, { "epoch": 1.62, "learning_rate": 1.946013422302929e-05, "loss": 0.0075, "step": 112420 }, { "epoch": 1.62, "learning_rate": 1.946008618329082e-05, "loss": 0.0096, "step": 112430 }, { "epoch": 1.62, "learning_rate": 1.946003814355235e-05, "loss": 0.0117, "step": 112440 }, { "epoch": 1.62, "learning_rate": 1.945999010381388e-05, "loss": 0.012, "step": 112450 }, { "epoch": 1.62, "learning_rate": 1.9459942064075404e-05, "loss": 0.0108, "step": 112460 }, { "epoch": 1.62, "learning_rate": 1.9459894024336934e-05, "loss": 0.0084, "step": 112470 }, { "epoch": 1.62, "learning_rate": 1.9459845984598463e-05, "loss": 0.0101, "step": 112480 }, { "epoch": 1.62, "learning_rate": 1.945979794485999e-05, "loss": 0.0105, "step": 112490 }, { "epoch": 1.62, "learning_rate": 1.9459749905121518e-05, "loss": 0.0113, "step": 112500 }, { "epoch": 1.62, "learning_rate": 1.9459701865383047e-05, "loss": 0.0085, "step": 112510 }, { "epoch": 1.62, "learning_rate": 1.9459653825644577e-05, "loss": 0.0115, "step": 112520 }, { "epoch": 1.62, "learning_rate": 1.9459605785906103e-05, "loss": 0.0124, "step": 112530 }, { "epoch": 1.62, "learning_rate": 1.9459557746167632e-05, "loss": 0.0109, "step": 112540 }, { "epoch": 1.62, "learning_rate": 1.945950970642916e-05, "loss": 0.0096, "step": 112550 }, { "epoch": 1.62, "learning_rate": 1.945946166669069e-05, "loss": 0.0134, "step": 112560 }, { "epoch": 1.62, "learning_rate": 1.9459413626952216e-05, "loss": 0.0132, "step": 112570 }, { "epoch": 1.62, "learning_rate": 1.9459365587213746e-05, "loss": 0.0079, "step": 112580 }, { "epoch": 1.62, "learning_rate": 1.9459317547475275e-05, "loss": 0.0094, "step": 112590 }, { "epoch": 1.62, "learning_rate": 1.94592695077368e-05, "loss": 0.0101, "step": 112600 }, { "epoch": 1.62, "learning_rate": 1.945922146799833e-05, "loss": 0.0135, "step": 112610 }, { "epoch": 1.62, "learning_rate": 1.945917342825986e-05, "loss": 0.0102, "step": 112620 }, { "epoch": 1.62, "learning_rate": 1.945912538852139e-05, "loss": 0.0117, "step": 112630 }, { "epoch": 1.62, "learning_rate": 1.9459077348782914e-05, "loss": 0.0094, "step": 112640 }, { "epoch": 1.62, "learning_rate": 1.9459029309044444e-05, "loss": 0.0097, "step": 112650 }, { "epoch": 1.62, "learning_rate": 1.9458981269305973e-05, "loss": 0.0105, "step": 112660 }, { "epoch": 1.62, "learning_rate": 1.94589332295675e-05, "loss": 0.0112, "step": 112670 }, { "epoch": 1.62, "learning_rate": 1.9458885189829028e-05, "loss": 0.0126, "step": 112680 }, { "epoch": 1.62, "learning_rate": 1.9458837150090557e-05, "loss": 0.0131, "step": 112690 }, { "epoch": 1.62, "learning_rate": 1.9458789110352087e-05, "loss": 0.0116, "step": 112700 }, { "epoch": 1.62, "learning_rate": 1.9458741070613613e-05, "loss": 0.0137, "step": 112710 }, { "epoch": 1.62, "learning_rate": 1.9458693030875142e-05, "loss": 0.0133, "step": 112720 }, { "epoch": 1.62, "learning_rate": 1.945864499113667e-05, "loss": 0.0148, "step": 112730 }, { "epoch": 1.62, "learning_rate": 1.94585969513982e-05, "loss": 0.0115, "step": 112740 }, { "epoch": 1.62, "learning_rate": 1.9458548911659726e-05, "loss": 0.0127, "step": 112750 }, { "epoch": 1.63, "learning_rate": 1.9458500871921255e-05, "loss": 0.0113, "step": 112760 }, { "epoch": 1.63, "learning_rate": 1.9458452832182785e-05, "loss": 0.0073, "step": 112770 }, { "epoch": 1.63, "learning_rate": 1.945840479244431e-05, "loss": 0.0121, "step": 112780 }, { "epoch": 1.63, "learning_rate": 1.945835675270584e-05, "loss": 0.008, "step": 112790 }, { "epoch": 1.63, "learning_rate": 1.945830871296737e-05, "loss": 0.0074, "step": 112800 }, { "epoch": 1.63, "learning_rate": 1.94582606732289e-05, "loss": 0.0087, "step": 112810 }, { "epoch": 1.63, "learning_rate": 1.9458212633490424e-05, "loss": 0.0107, "step": 112820 }, { "epoch": 1.63, "learning_rate": 1.9458164593751954e-05, "loss": 0.0086, "step": 112830 }, { "epoch": 1.63, "learning_rate": 1.9458116554013483e-05, "loss": 0.0124, "step": 112840 }, { "epoch": 1.63, "learning_rate": 1.945806851427501e-05, "loss": 0.0112, "step": 112850 }, { "epoch": 1.63, "learning_rate": 1.9458020474536538e-05, "loss": 0.0107, "step": 112860 }, { "epoch": 1.63, "learning_rate": 1.9457972434798067e-05, "loss": 0.0086, "step": 112870 }, { "epoch": 1.63, "learning_rate": 1.9457924395059597e-05, "loss": 0.0099, "step": 112880 }, { "epoch": 1.63, "learning_rate": 1.9457876355321122e-05, "loss": 0.019, "step": 112890 }, { "epoch": 1.63, "learning_rate": 1.9457828315582652e-05, "loss": 0.0098, "step": 112900 }, { "epoch": 1.63, "learning_rate": 1.945778027584418e-05, "loss": 0.0125, "step": 112910 }, { "epoch": 1.63, "learning_rate": 1.945773223610571e-05, "loss": 0.0083, "step": 112920 }, { "epoch": 1.63, "learning_rate": 1.9457684196367236e-05, "loss": 0.0096, "step": 112930 }, { "epoch": 1.63, "learning_rate": 1.9457636156628765e-05, "loss": 0.0104, "step": 112940 }, { "epoch": 1.63, "learning_rate": 1.9457588116890295e-05, "loss": 0.0097, "step": 112950 }, { "epoch": 1.63, "learning_rate": 1.945754007715182e-05, "loss": 0.0137, "step": 112960 }, { "epoch": 1.63, "learning_rate": 1.945749203741335e-05, "loss": 0.0143, "step": 112970 }, { "epoch": 1.63, "learning_rate": 1.945744399767488e-05, "loss": 0.0102, "step": 112980 }, { "epoch": 1.63, "learning_rate": 1.945739595793641e-05, "loss": 0.0091, "step": 112990 }, { "epoch": 1.63, "learning_rate": 1.9457347918197934e-05, "loss": 0.0099, "step": 113000 }, { "epoch": 1.63, "learning_rate": 1.9457299878459464e-05, "loss": 0.0143, "step": 113010 }, { "epoch": 1.63, "learning_rate": 1.9457251838720993e-05, "loss": 0.0124, "step": 113020 }, { "epoch": 1.63, "learning_rate": 1.945720379898252e-05, "loss": 0.01, "step": 113030 }, { "epoch": 1.63, "learning_rate": 1.9457155759244048e-05, "loss": 0.0106, "step": 113040 }, { "epoch": 1.63, "learning_rate": 1.9457107719505577e-05, "loss": 0.0077, "step": 113050 }, { "epoch": 1.63, "learning_rate": 1.9457059679767106e-05, "loss": 0.0108, "step": 113060 }, { "epoch": 1.63, "learning_rate": 1.9457011640028632e-05, "loss": 0.0123, "step": 113070 }, { "epoch": 1.63, "learning_rate": 1.945696360029016e-05, "loss": 0.0108, "step": 113080 }, { "epoch": 1.63, "learning_rate": 1.945691556055169e-05, "loss": 0.0146, "step": 113090 }, { "epoch": 1.63, "learning_rate": 1.945686752081322e-05, "loss": 0.0101, "step": 113100 }, { "epoch": 1.63, "learning_rate": 1.9456819481074746e-05, "loss": 0.0117, "step": 113110 }, { "epoch": 1.63, "learning_rate": 1.9456771441336275e-05, "loss": 0.0081, "step": 113120 }, { "epoch": 1.63, "learning_rate": 1.9456723401597805e-05, "loss": 0.0121, "step": 113130 }, { "epoch": 1.63, "learning_rate": 1.945667536185933e-05, "loss": 0.0135, "step": 113140 }, { "epoch": 1.63, "learning_rate": 1.945662732212086e-05, "loss": 0.0145, "step": 113150 }, { "epoch": 1.63, "learning_rate": 1.945657928238239e-05, "loss": 0.0116, "step": 113160 }, { "epoch": 1.63, "learning_rate": 1.9456531242643918e-05, "loss": 0.0089, "step": 113170 }, { "epoch": 1.63, "learning_rate": 1.9456483202905444e-05, "loss": 0.0124, "step": 113180 }, { "epoch": 1.63, "learning_rate": 1.9456435163166973e-05, "loss": 0.0117, "step": 113190 }, { "epoch": 1.63, "learning_rate": 1.9456387123428503e-05, "loss": 0.0147, "step": 113200 }, { "epoch": 1.63, "learning_rate": 1.945633908369003e-05, "loss": 0.0083, "step": 113210 }, { "epoch": 1.63, "learning_rate": 1.9456291043951558e-05, "loss": 0.0127, "step": 113220 }, { "epoch": 1.63, "learning_rate": 1.9456243004213087e-05, "loss": 0.013, "step": 113230 }, { "epoch": 1.63, "learning_rate": 1.9456194964474616e-05, "loss": 0.0128, "step": 113240 }, { "epoch": 1.63, "learning_rate": 1.9456146924736142e-05, "loss": 0.0125, "step": 113250 }, { "epoch": 1.63, "learning_rate": 1.945609888499767e-05, "loss": 0.0099, "step": 113260 }, { "epoch": 1.63, "learning_rate": 1.94560508452592e-05, "loss": 0.0113, "step": 113270 }, { "epoch": 1.63, "learning_rate": 1.945600280552073e-05, "loss": 0.0098, "step": 113280 }, { "epoch": 1.63, "learning_rate": 1.9455954765782256e-05, "loss": 0.0091, "step": 113290 }, { "epoch": 1.63, "learning_rate": 1.9455906726043785e-05, "loss": 0.0144, "step": 113300 }, { "epoch": 1.63, "learning_rate": 1.9455858686305315e-05, "loss": 0.0093, "step": 113310 }, { "epoch": 1.63, "learning_rate": 1.945581064656684e-05, "loss": 0.0093, "step": 113320 }, { "epoch": 1.63, "learning_rate": 1.945576260682837e-05, "loss": 0.0106, "step": 113330 }, { "epoch": 1.63, "learning_rate": 1.94557145670899e-05, "loss": 0.0115, "step": 113340 }, { "epoch": 1.63, "learning_rate": 1.9455666527351428e-05, "loss": 0.0077, "step": 113350 }, { "epoch": 1.63, "learning_rate": 1.9455618487612954e-05, "loss": 0.0092, "step": 113360 }, { "epoch": 1.63, "learning_rate": 1.9455570447874483e-05, "loss": 0.0109, "step": 113370 }, { "epoch": 1.63, "learning_rate": 1.9455522408136013e-05, "loss": 0.01, "step": 113380 }, { "epoch": 1.63, "learning_rate": 1.945547436839754e-05, "loss": 0.0142, "step": 113390 }, { "epoch": 1.63, "learning_rate": 1.9455426328659068e-05, "loss": 0.0108, "step": 113400 }, { "epoch": 1.63, "learning_rate": 1.9455378288920597e-05, "loss": 0.0106, "step": 113410 }, { "epoch": 1.63, "learning_rate": 1.9455330249182126e-05, "loss": 0.0103, "step": 113420 }, { "epoch": 1.63, "learning_rate": 1.9455282209443652e-05, "loss": 0.0093, "step": 113430 }, { "epoch": 1.63, "learning_rate": 1.945523416970518e-05, "loss": 0.0099, "step": 113440 }, { "epoch": 1.64, "learning_rate": 1.945518612996671e-05, "loss": 0.009, "step": 113450 }, { "epoch": 1.64, "learning_rate": 1.9455138090228237e-05, "loss": 0.0167, "step": 113460 }, { "epoch": 1.64, "learning_rate": 1.9455090050489766e-05, "loss": 0.0089, "step": 113470 }, { "epoch": 1.64, "learning_rate": 1.9455042010751295e-05, "loss": 0.0119, "step": 113480 }, { "epoch": 1.64, "learning_rate": 1.9454993971012824e-05, "loss": 0.0098, "step": 113490 }, { "epoch": 1.64, "learning_rate": 1.945494593127435e-05, "loss": 0.0158, "step": 113500 }, { "epoch": 1.64, "learning_rate": 1.945489789153588e-05, "loss": 0.0089, "step": 113510 }, { "epoch": 1.64, "learning_rate": 1.945484985179741e-05, "loss": 0.0135, "step": 113520 }, { "epoch": 1.64, "learning_rate": 1.9454801812058938e-05, "loss": 0.0145, "step": 113530 }, { "epoch": 1.64, "learning_rate": 1.9454753772320464e-05, "loss": 0.0075, "step": 113540 }, { "epoch": 1.64, "learning_rate": 1.9454705732581993e-05, "loss": 0.0093, "step": 113550 }, { "epoch": 1.64, "learning_rate": 1.9454657692843523e-05, "loss": 0.0095, "step": 113560 }, { "epoch": 1.64, "learning_rate": 1.945460965310505e-05, "loss": 0.0149, "step": 113570 }, { "epoch": 1.64, "learning_rate": 1.9454561613366578e-05, "loss": 0.0109, "step": 113580 }, { "epoch": 1.64, "learning_rate": 1.9454513573628107e-05, "loss": 0.0167, "step": 113590 }, { "epoch": 1.64, "learning_rate": 1.9454465533889636e-05, "loss": 0.013, "step": 113600 }, { "epoch": 1.64, "learning_rate": 1.9454417494151162e-05, "loss": 0.011, "step": 113610 }, { "epoch": 1.64, "learning_rate": 1.945436945441269e-05, "loss": 0.0112, "step": 113620 }, { "epoch": 1.64, "learning_rate": 1.945432141467422e-05, "loss": 0.0113, "step": 113630 }, { "epoch": 1.64, "learning_rate": 1.9454273374935747e-05, "loss": 0.0112, "step": 113640 }, { "epoch": 1.64, "learning_rate": 1.9454225335197276e-05, "loss": 0.0107, "step": 113650 }, { "epoch": 1.64, "learning_rate": 1.9454177295458805e-05, "loss": 0.009, "step": 113660 }, { "epoch": 1.64, "learning_rate": 1.9454129255720334e-05, "loss": 0.0128, "step": 113670 }, { "epoch": 1.64, "learning_rate": 1.945408121598186e-05, "loss": 0.0103, "step": 113680 }, { "epoch": 1.64, "learning_rate": 1.945403317624339e-05, "loss": 0.0082, "step": 113690 }, { "epoch": 1.64, "learning_rate": 1.945398513650492e-05, "loss": 0.0118, "step": 113700 }, { "epoch": 1.64, "learning_rate": 1.9453937096766448e-05, "loss": 0.0176, "step": 113710 }, { "epoch": 1.64, "learning_rate": 1.9453889057027974e-05, "loss": 0.0109, "step": 113720 }, { "epoch": 1.64, "learning_rate": 1.9453841017289503e-05, "loss": 0.0122, "step": 113730 }, { "epoch": 1.64, "learning_rate": 1.9453792977551032e-05, "loss": 0.014, "step": 113740 }, { "epoch": 1.64, "learning_rate": 1.945374493781256e-05, "loss": 0.0127, "step": 113750 }, { "epoch": 1.64, "learning_rate": 1.9453696898074088e-05, "loss": 0.0115, "step": 113760 }, { "epoch": 1.64, "learning_rate": 1.9453648858335617e-05, "loss": 0.0136, "step": 113770 }, { "epoch": 1.64, "learning_rate": 1.9453600818597146e-05, "loss": 0.0118, "step": 113780 }, { "epoch": 1.64, "learning_rate": 1.9453552778858672e-05, "loss": 0.0095, "step": 113790 }, { "epoch": 1.64, "learning_rate": 1.94535047391202e-05, "loss": 0.0074, "step": 113800 }, { "epoch": 1.64, "learning_rate": 1.945345669938173e-05, "loss": 0.0097, "step": 113810 }, { "epoch": 1.64, "learning_rate": 1.9453408659643256e-05, "loss": 0.0161, "step": 113820 }, { "epoch": 1.64, "learning_rate": 1.9453360619904786e-05, "loss": 0.0077, "step": 113830 }, { "epoch": 1.64, "learning_rate": 1.9453312580166315e-05, "loss": 0.0102, "step": 113840 }, { "epoch": 1.64, "learning_rate": 1.9453264540427844e-05, "loss": 0.0071, "step": 113850 }, { "epoch": 1.64, "learning_rate": 1.945321650068937e-05, "loss": 0.011, "step": 113860 }, { "epoch": 1.64, "learning_rate": 1.94531684609509e-05, "loss": 0.0107, "step": 113870 }, { "epoch": 1.64, "learning_rate": 1.945312042121243e-05, "loss": 0.0096, "step": 113880 }, { "epoch": 1.64, "learning_rate": 1.9453072381473958e-05, "loss": 0.0116, "step": 113890 }, { "epoch": 1.64, "learning_rate": 1.9453024341735484e-05, "loss": 0.0121, "step": 113900 }, { "epoch": 1.64, "learning_rate": 1.9452976301997013e-05, "loss": 0.012, "step": 113910 }, { "epoch": 1.64, "learning_rate": 1.9452928262258542e-05, "loss": 0.0117, "step": 113920 }, { "epoch": 1.64, "learning_rate": 1.9452880222520068e-05, "loss": 0.0134, "step": 113930 }, { "epoch": 1.64, "learning_rate": 1.9452832182781598e-05, "loss": 0.0132, "step": 113940 }, { "epoch": 1.64, "learning_rate": 1.9452784143043127e-05, "loss": 0.0099, "step": 113950 }, { "epoch": 1.64, "learning_rate": 1.9452736103304656e-05, "loss": 0.0182, "step": 113960 }, { "epoch": 1.64, "learning_rate": 1.9452688063566182e-05, "loss": 0.0117, "step": 113970 }, { "epoch": 1.64, "learning_rate": 1.945264002382771e-05, "loss": 0.0098, "step": 113980 }, { "epoch": 1.64, "learning_rate": 1.945259198408924e-05, "loss": 0.0104, "step": 113990 }, { "epoch": 1.64, "learning_rate": 1.9452543944350766e-05, "loss": 0.0103, "step": 114000 }, { "epoch": 1.64, "learning_rate": 1.9452495904612296e-05, "loss": 0.0087, "step": 114010 }, { "epoch": 1.64, "learning_rate": 1.9452447864873825e-05, "loss": 0.0115, "step": 114020 }, { "epoch": 1.64, "learning_rate": 1.9452399825135354e-05, "loss": 0.0084, "step": 114030 }, { "epoch": 1.64, "learning_rate": 1.945235178539688e-05, "loss": 0.0114, "step": 114040 }, { "epoch": 1.64, "learning_rate": 1.945230374565841e-05, "loss": 0.0149, "step": 114050 }, { "epoch": 1.64, "learning_rate": 1.945225570591994e-05, "loss": 0.0099, "step": 114060 }, { "epoch": 1.64, "learning_rate": 1.9452207666181468e-05, "loss": 0.0088, "step": 114070 }, { "epoch": 1.64, "learning_rate": 1.9452159626442994e-05, "loss": 0.0109, "step": 114080 }, { "epoch": 1.64, "learning_rate": 1.9452111586704523e-05, "loss": 0.0098, "step": 114090 }, { "epoch": 1.64, "learning_rate": 1.9452063546966052e-05, "loss": 0.0102, "step": 114100 }, { "epoch": 1.64, "learning_rate": 1.9452015507227578e-05, "loss": 0.0115, "step": 114110 }, { "epoch": 1.64, "learning_rate": 1.9451967467489107e-05, "loss": 0.0096, "step": 114120 }, { "epoch": 1.64, "learning_rate": 1.9451919427750637e-05, "loss": 0.0104, "step": 114130 }, { "epoch": 1.64, "learning_rate": 1.9451871388012166e-05, "loss": 0.0115, "step": 114140 }, { "epoch": 1.65, "learning_rate": 1.9451823348273692e-05, "loss": 0.0077, "step": 114150 }, { "epoch": 1.65, "learning_rate": 1.945177530853522e-05, "loss": 0.0165, "step": 114160 }, { "epoch": 1.65, "learning_rate": 1.945172726879675e-05, "loss": 0.014, "step": 114170 }, { "epoch": 1.65, "learning_rate": 1.9451679229058276e-05, "loss": 0.0109, "step": 114180 }, { "epoch": 1.65, "learning_rate": 1.9451631189319806e-05, "loss": 0.0108, "step": 114190 }, { "epoch": 1.65, "learning_rate": 1.9451583149581335e-05, "loss": 0.0112, "step": 114200 }, { "epoch": 1.65, "learning_rate": 1.9451535109842864e-05, "loss": 0.0096, "step": 114210 }, { "epoch": 1.65, "learning_rate": 1.945148707010439e-05, "loss": 0.0065, "step": 114220 }, { "epoch": 1.65, "learning_rate": 1.945143903036592e-05, "loss": 0.0115, "step": 114230 }, { "epoch": 1.65, "learning_rate": 1.945139099062745e-05, "loss": 0.0101, "step": 114240 }, { "epoch": 1.65, "learning_rate": 1.9451342950888978e-05, "loss": 0.01, "step": 114250 }, { "epoch": 1.65, "learning_rate": 1.9451294911150504e-05, "loss": 0.0099, "step": 114260 }, { "epoch": 1.65, "learning_rate": 1.9451246871412033e-05, "loss": 0.0108, "step": 114270 }, { "epoch": 1.65, "learning_rate": 1.9451198831673562e-05, "loss": 0.016, "step": 114280 }, { "epoch": 1.65, "learning_rate": 1.9451150791935088e-05, "loss": 0.0074, "step": 114290 }, { "epoch": 1.65, "learning_rate": 1.9451102752196617e-05, "loss": 0.0105, "step": 114300 }, { "epoch": 1.65, "learning_rate": 1.9451054712458147e-05, "loss": 0.01, "step": 114310 }, { "epoch": 1.65, "learning_rate": 1.945101147669352e-05, "loss": 0.0115, "step": 114320 }, { "epoch": 1.65, "learning_rate": 1.945096343695505e-05, "loss": 0.0094, "step": 114330 }, { "epoch": 1.65, "learning_rate": 1.945091539721658e-05, "loss": 0.0077, "step": 114340 }, { "epoch": 1.65, "learning_rate": 1.9450867357478106e-05, "loss": 0.0108, "step": 114350 }, { "epoch": 1.65, "learning_rate": 1.9450819317739635e-05, "loss": 0.0102, "step": 114360 }, { "epoch": 1.65, "learning_rate": 1.9450771278001164e-05, "loss": 0.0096, "step": 114370 }, { "epoch": 1.65, "learning_rate": 1.9450723238262693e-05, "loss": 0.0113, "step": 114380 }, { "epoch": 1.65, "learning_rate": 1.945067519852422e-05, "loss": 0.0121, "step": 114390 }, { "epoch": 1.65, "learning_rate": 1.945062715878575e-05, "loss": 0.01, "step": 114400 }, { "epoch": 1.65, "learning_rate": 1.9450579119047278e-05, "loss": 0.0148, "step": 114410 }, { "epoch": 1.65, "learning_rate": 1.9450531079308804e-05, "loss": 0.0094, "step": 114420 }, { "epoch": 1.65, "learning_rate": 1.9450483039570333e-05, "loss": 0.0106, "step": 114430 }, { "epoch": 1.65, "learning_rate": 1.9450434999831862e-05, "loss": 0.0146, "step": 114440 }, { "epoch": 1.65, "learning_rate": 1.945038696009339e-05, "loss": 0.0105, "step": 114450 }, { "epoch": 1.65, "learning_rate": 1.9450338920354917e-05, "loss": 0.0105, "step": 114460 }, { "epoch": 1.65, "learning_rate": 1.9450290880616447e-05, "loss": 0.0128, "step": 114470 }, { "epoch": 1.65, "learning_rate": 1.9450242840877976e-05, "loss": 0.0096, "step": 114480 }, { "epoch": 1.65, "learning_rate": 1.9450194801139505e-05, "loss": 0.0113, "step": 114490 }, { "epoch": 1.65, "learning_rate": 1.945014676140103e-05, "loss": 0.0117, "step": 114500 }, { "epoch": 1.65, "learning_rate": 1.945009872166256e-05, "loss": 0.0089, "step": 114510 }, { "epoch": 1.65, "learning_rate": 1.945005068192409e-05, "loss": 0.0123, "step": 114520 }, { "epoch": 1.65, "learning_rate": 1.9450002642185616e-05, "loss": 0.0096, "step": 114530 }, { "epoch": 1.65, "learning_rate": 1.9449954602447145e-05, "loss": 0.0088, "step": 114540 }, { "epoch": 1.65, "learning_rate": 1.9449906562708674e-05, "loss": 0.0094, "step": 114550 }, { "epoch": 1.65, "learning_rate": 1.9449858522970203e-05, "loss": 0.0132, "step": 114560 }, { "epoch": 1.65, "learning_rate": 1.944981048323173e-05, "loss": 0.0122, "step": 114570 }, { "epoch": 1.65, "learning_rate": 1.944976244349326e-05, "loss": 0.0148, "step": 114580 }, { "epoch": 1.65, "learning_rate": 1.9449714403754788e-05, "loss": 0.0099, "step": 114590 }, { "epoch": 1.65, "learning_rate": 1.9449666364016314e-05, "loss": 0.0111, "step": 114600 }, { "epoch": 1.65, "learning_rate": 1.9449618324277843e-05, "loss": 0.0146, "step": 114610 }, { "epoch": 1.65, "learning_rate": 1.9449570284539372e-05, "loss": 0.0106, "step": 114620 }, { "epoch": 1.65, "learning_rate": 1.94495222448009e-05, "loss": 0.0127, "step": 114630 }, { "epoch": 1.65, "learning_rate": 1.9449474205062427e-05, "loss": 0.0092, "step": 114640 }, { "epoch": 1.65, "learning_rate": 1.9449426165323957e-05, "loss": 0.0098, "step": 114650 }, { "epoch": 1.65, "learning_rate": 1.9449378125585486e-05, "loss": 0.008, "step": 114660 }, { "epoch": 1.65, "learning_rate": 1.9449330085847015e-05, "loss": 0.0151, "step": 114670 }, { "epoch": 1.65, "learning_rate": 1.944928204610854e-05, "loss": 0.0127, "step": 114680 }, { "epoch": 1.65, "learning_rate": 1.944923400637007e-05, "loss": 0.007, "step": 114690 }, { "epoch": 1.65, "learning_rate": 1.94491859666316e-05, "loss": 0.0091, "step": 114700 }, { "epoch": 1.65, "learning_rate": 1.9449137926893126e-05, "loss": 0.0071, "step": 114710 }, { "epoch": 1.65, "learning_rate": 1.9449089887154655e-05, "loss": 0.011, "step": 114720 }, { "epoch": 1.65, "learning_rate": 1.9449041847416184e-05, "loss": 0.012, "step": 114730 }, { "epoch": 1.65, "learning_rate": 1.9448993807677713e-05, "loss": 0.015, "step": 114740 }, { "epoch": 1.65, "learning_rate": 1.944894576793924e-05, "loss": 0.0094, "step": 114750 }, { "epoch": 1.65, "learning_rate": 1.944889772820077e-05, "loss": 0.0149, "step": 114760 }, { "epoch": 1.65, "learning_rate": 1.9448849688462298e-05, "loss": 0.0101, "step": 114770 }, { "epoch": 1.65, "learning_rate": 1.9448801648723824e-05, "loss": 0.0132, "step": 114780 }, { "epoch": 1.65, "learning_rate": 1.9448753608985353e-05, "loss": 0.0096, "step": 114790 }, { "epoch": 1.65, "learning_rate": 1.9448705569246882e-05, "loss": 0.0104, "step": 114800 }, { "epoch": 1.65, "learning_rate": 1.944865752950841e-05, "loss": 0.0082, "step": 114810 }, { "epoch": 1.65, "learning_rate": 1.9448609489769937e-05, "loss": 0.0142, "step": 114820 }, { "epoch": 1.65, "learning_rate": 1.9448561450031467e-05, "loss": 0.0093, "step": 114830 }, { "epoch": 1.66, "learning_rate": 1.9448513410292996e-05, "loss": 0.0074, "step": 114840 }, { "epoch": 1.66, "learning_rate": 1.9448465370554525e-05, "loss": 0.0121, "step": 114850 }, { "epoch": 1.66, "learning_rate": 1.944841733081605e-05, "loss": 0.0108, "step": 114860 }, { "epoch": 1.66, "learning_rate": 1.944836929107758e-05, "loss": 0.0082, "step": 114870 }, { "epoch": 1.66, "learning_rate": 1.944832125133911e-05, "loss": 0.0079, "step": 114880 }, { "epoch": 1.66, "learning_rate": 1.9448273211600635e-05, "loss": 0.0066, "step": 114890 }, { "epoch": 1.66, "learning_rate": 1.9448225171862165e-05, "loss": 0.0117, "step": 114900 }, { "epoch": 1.66, "learning_rate": 1.9448177132123694e-05, "loss": 0.0101, "step": 114910 }, { "epoch": 1.66, "learning_rate": 1.9448129092385223e-05, "loss": 0.0073, "step": 114920 }, { "epoch": 1.66, "learning_rate": 1.944808105264675e-05, "loss": 0.0081, "step": 114930 }, { "epoch": 1.66, "learning_rate": 1.944803301290828e-05, "loss": 0.0126, "step": 114940 }, { "epoch": 1.66, "learning_rate": 1.9447984973169808e-05, "loss": 0.0122, "step": 114950 }, { "epoch": 1.66, "learning_rate": 1.9447936933431334e-05, "loss": 0.0127, "step": 114960 }, { "epoch": 1.66, "learning_rate": 1.9447888893692863e-05, "loss": 0.0093, "step": 114970 }, { "epoch": 1.66, "learning_rate": 1.9447840853954392e-05, "loss": 0.0115, "step": 114980 }, { "epoch": 1.66, "learning_rate": 1.944779281421592e-05, "loss": 0.0128, "step": 114990 }, { "epoch": 1.66, "learning_rate": 1.9447744774477447e-05, "loss": 0.0106, "step": 115000 }, { "epoch": 1.66, "learning_rate": 1.9447696734738976e-05, "loss": 0.0094, "step": 115010 }, { "epoch": 1.66, "learning_rate": 1.9447648695000506e-05, "loss": 0.0081, "step": 115020 }, { "epoch": 1.66, "learning_rate": 1.944760065526203e-05, "loss": 0.0121, "step": 115030 }, { "epoch": 1.66, "learning_rate": 1.944755261552356e-05, "loss": 0.0121, "step": 115040 }, { "epoch": 1.66, "learning_rate": 1.944750457578509e-05, "loss": 0.0113, "step": 115050 }, { "epoch": 1.66, "learning_rate": 1.944745653604662e-05, "loss": 0.0101, "step": 115060 }, { "epoch": 1.66, "learning_rate": 1.9447408496308145e-05, "loss": 0.0085, "step": 115070 }, { "epoch": 1.66, "learning_rate": 1.9447360456569675e-05, "loss": 0.0099, "step": 115080 }, { "epoch": 1.66, "learning_rate": 1.9447312416831204e-05, "loss": 0.0108, "step": 115090 }, { "epoch": 1.66, "learning_rate": 1.9447264377092733e-05, "loss": 0.0128, "step": 115100 }, { "epoch": 1.66, "learning_rate": 1.944721633735426e-05, "loss": 0.0084, "step": 115110 }, { "epoch": 1.66, "learning_rate": 1.9447168297615788e-05, "loss": 0.0112, "step": 115120 }, { "epoch": 1.66, "learning_rate": 1.9447120257877318e-05, "loss": 0.0114, "step": 115130 }, { "epoch": 1.66, "learning_rate": 1.9447072218138843e-05, "loss": 0.0091, "step": 115140 }, { "epoch": 1.66, "learning_rate": 1.9447024178400376e-05, "loss": 0.0183, "step": 115150 }, { "epoch": 1.66, "learning_rate": 1.9446976138661905e-05, "loss": 0.0124, "step": 115160 }, { "epoch": 1.66, "learning_rate": 1.944692809892343e-05, "loss": 0.0121, "step": 115170 }, { "epoch": 1.66, "learning_rate": 1.944688005918496e-05, "loss": 0.0096, "step": 115180 }, { "epoch": 1.66, "learning_rate": 1.944683201944649e-05, "loss": 0.0107, "step": 115190 }, { "epoch": 1.66, "learning_rate": 1.9446783979708016e-05, "loss": 0.0108, "step": 115200 }, { "epoch": 1.66, "learning_rate": 1.9446735939969545e-05, "loss": 0.0093, "step": 115210 }, { "epoch": 1.66, "learning_rate": 1.9446687900231074e-05, "loss": 0.0074, "step": 115220 }, { "epoch": 1.66, "learning_rate": 1.9446639860492603e-05, "loss": 0.0097, "step": 115230 }, { "epoch": 1.66, "learning_rate": 1.944659182075413e-05, "loss": 0.0107, "step": 115240 }, { "epoch": 1.66, "learning_rate": 1.944654378101566e-05, "loss": 0.0148, "step": 115250 }, { "epoch": 1.66, "learning_rate": 1.9446495741277188e-05, "loss": 0.0124, "step": 115260 }, { "epoch": 1.66, "learning_rate": 1.9446447701538714e-05, "loss": 0.0082, "step": 115270 }, { "epoch": 1.66, "learning_rate": 1.9446399661800243e-05, "loss": 0.0089, "step": 115280 }, { "epoch": 1.66, "learning_rate": 1.9446351622061772e-05, "loss": 0.0117, "step": 115290 }, { "epoch": 1.66, "learning_rate": 1.94463035823233e-05, "loss": 0.0149, "step": 115300 }, { "epoch": 1.66, "learning_rate": 1.9446255542584827e-05, "loss": 0.0096, "step": 115310 }, { "epoch": 1.66, "learning_rate": 1.9446207502846357e-05, "loss": 0.0092, "step": 115320 }, { "epoch": 1.66, "learning_rate": 1.9446159463107886e-05, "loss": 0.0097, "step": 115330 }, { "epoch": 1.66, "learning_rate": 1.9446111423369415e-05, "loss": 0.0162, "step": 115340 }, { "epoch": 1.66, "learning_rate": 1.944606338363094e-05, "loss": 0.0172, "step": 115350 }, { "epoch": 1.66, "learning_rate": 1.944601534389247e-05, "loss": 0.0115, "step": 115360 }, { "epoch": 1.66, "learning_rate": 1.9445967304154e-05, "loss": 0.0077, "step": 115370 }, { "epoch": 1.66, "learning_rate": 1.9445919264415526e-05, "loss": 0.01, "step": 115380 }, { "epoch": 1.66, "learning_rate": 1.9445871224677055e-05, "loss": 0.0119, "step": 115390 }, { "epoch": 1.66, "learning_rate": 1.9445823184938584e-05, "loss": 0.0088, "step": 115400 }, { "epoch": 1.66, "learning_rate": 1.9445775145200113e-05, "loss": 0.0093, "step": 115410 }, { "epoch": 1.66, "learning_rate": 1.944572710546164e-05, "loss": 0.0083, "step": 115420 }, { "epoch": 1.66, "learning_rate": 1.944567906572317e-05, "loss": 0.0113, "step": 115430 }, { "epoch": 1.66, "learning_rate": 1.9445631025984698e-05, "loss": 0.0089, "step": 115440 }, { "epoch": 1.66, "learning_rate": 1.9445582986246224e-05, "loss": 0.0098, "step": 115450 }, { "epoch": 1.66, "learning_rate": 1.9445534946507753e-05, "loss": 0.0079, "step": 115460 }, { "epoch": 1.66, "learning_rate": 1.9445486906769282e-05, "loss": 0.012, "step": 115470 }, { "epoch": 1.66, "learning_rate": 1.944543886703081e-05, "loss": 0.009, "step": 115480 }, { "epoch": 1.66, "learning_rate": 1.9445390827292337e-05, "loss": 0.0114, "step": 115490 }, { "epoch": 1.66, "learning_rate": 1.9445342787553867e-05, "loss": 0.0079, "step": 115500 }, { "epoch": 1.66, "learning_rate": 1.9445294747815396e-05, "loss": 0.0122, "step": 115510 }, { "epoch": 1.66, "learning_rate": 1.9445246708076925e-05, "loss": 0.0072, "step": 115520 }, { "epoch": 1.67, "learning_rate": 1.944519866833845e-05, "loss": 0.0141, "step": 115530 }, { "epoch": 1.67, "learning_rate": 1.944515062859998e-05, "loss": 0.0108, "step": 115540 }, { "epoch": 1.67, "learning_rate": 1.944510258886151e-05, "loss": 0.0125, "step": 115550 }, { "epoch": 1.67, "learning_rate": 1.9445054549123036e-05, "loss": 0.0117, "step": 115560 }, { "epoch": 1.67, "learning_rate": 1.9445006509384565e-05, "loss": 0.0088, "step": 115570 }, { "epoch": 1.67, "learning_rate": 1.9444958469646094e-05, "loss": 0.0141, "step": 115580 }, { "epoch": 1.67, "learning_rate": 1.9444910429907623e-05, "loss": 0.009, "step": 115590 }, { "epoch": 1.67, "learning_rate": 1.944486239016915e-05, "loss": 0.0107, "step": 115600 }, { "epoch": 1.67, "learning_rate": 1.944481435043068e-05, "loss": 0.0098, "step": 115610 }, { "epoch": 1.67, "learning_rate": 1.9444766310692208e-05, "loss": 0.0089, "step": 115620 }, { "epoch": 1.67, "learning_rate": 1.9444718270953734e-05, "loss": 0.0105, "step": 115630 }, { "epoch": 1.67, "learning_rate": 1.9444670231215263e-05, "loss": 0.0085, "step": 115640 }, { "epoch": 1.67, "learning_rate": 1.9444622191476792e-05, "loss": 0.0125, "step": 115650 }, { "epoch": 1.67, "learning_rate": 1.944457415173832e-05, "loss": 0.0117, "step": 115660 }, { "epoch": 1.67, "learning_rate": 1.9444526111999847e-05, "loss": 0.0124, "step": 115670 }, { "epoch": 1.67, "learning_rate": 1.9444478072261377e-05, "loss": 0.0125, "step": 115680 }, { "epoch": 1.67, "learning_rate": 1.9444430032522906e-05, "loss": 0.0093, "step": 115690 }, { "epoch": 1.67, "learning_rate": 1.9444381992784435e-05, "loss": 0.0065, "step": 115700 }, { "epoch": 1.67, "learning_rate": 1.944433395304596e-05, "loss": 0.0147, "step": 115710 }, { "epoch": 1.67, "learning_rate": 1.944428591330749e-05, "loss": 0.0153, "step": 115720 }, { "epoch": 1.67, "learning_rate": 1.944423787356902e-05, "loss": 0.0096, "step": 115730 }, { "epoch": 1.67, "learning_rate": 1.9444189833830545e-05, "loss": 0.0099, "step": 115740 }, { "epoch": 1.67, "learning_rate": 1.9444141794092075e-05, "loss": 0.0115, "step": 115750 }, { "epoch": 1.67, "learning_rate": 1.9444093754353604e-05, "loss": 0.0089, "step": 115760 }, { "epoch": 1.67, "learning_rate": 1.9444045714615133e-05, "loss": 0.0079, "step": 115770 }, { "epoch": 1.67, "learning_rate": 1.944399767487666e-05, "loss": 0.0099, "step": 115780 }, { "epoch": 1.67, "learning_rate": 1.944394963513819e-05, "loss": 0.0106, "step": 115790 }, { "epoch": 1.67, "learning_rate": 1.9443901595399718e-05, "loss": 0.0082, "step": 115800 }, { "epoch": 1.67, "learning_rate": 1.9443853555661244e-05, "loss": 0.016, "step": 115810 }, { "epoch": 1.67, "learning_rate": 1.9443805515922773e-05, "loss": 0.0084, "step": 115820 }, { "epoch": 1.67, "learning_rate": 1.9443757476184302e-05, "loss": 0.0112, "step": 115830 }, { "epoch": 1.67, "learning_rate": 1.944370943644583e-05, "loss": 0.0113, "step": 115840 }, { "epoch": 1.67, "learning_rate": 1.9443661396707357e-05, "loss": 0.0084, "step": 115850 }, { "epoch": 1.67, "learning_rate": 1.9443613356968886e-05, "loss": 0.0124, "step": 115860 }, { "epoch": 1.67, "learning_rate": 1.9443565317230416e-05, "loss": 0.0111, "step": 115870 }, { "epoch": 1.67, "learning_rate": 1.9443517277491945e-05, "loss": 0.0104, "step": 115880 }, { "epoch": 1.67, "learning_rate": 1.944346923775347e-05, "loss": 0.0123, "step": 115890 }, { "epoch": 1.67, "learning_rate": 1.9443421198015e-05, "loss": 0.007, "step": 115900 }, { "epoch": 1.67, "learning_rate": 1.944337315827653e-05, "loss": 0.0112, "step": 115910 }, { "epoch": 1.67, "learning_rate": 1.9443325118538055e-05, "loss": 0.0056, "step": 115920 }, { "epoch": 1.67, "learning_rate": 1.9443277078799585e-05, "loss": 0.0151, "step": 115930 }, { "epoch": 1.67, "learning_rate": 1.9443229039061114e-05, "loss": 0.0093, "step": 115940 }, { "epoch": 1.67, "learning_rate": 1.9443180999322643e-05, "loss": 0.0097, "step": 115950 }, { "epoch": 1.67, "learning_rate": 1.944313295958417e-05, "loss": 0.0078, "step": 115960 }, { "epoch": 1.67, "learning_rate": 1.9443084919845698e-05, "loss": 0.0121, "step": 115970 }, { "epoch": 1.67, "learning_rate": 1.9443036880107228e-05, "loss": 0.0101, "step": 115980 }, { "epoch": 1.67, "learning_rate": 1.9442988840368753e-05, "loss": 0.0107, "step": 115990 }, { "epoch": 1.67, "learning_rate": 1.9442940800630283e-05, "loss": 0.017, "step": 116000 }, { "epoch": 1.67, "learning_rate": 1.9442892760891812e-05, "loss": 0.0149, "step": 116010 }, { "epoch": 1.67, "learning_rate": 1.944284472115334e-05, "loss": 0.0115, "step": 116020 }, { "epoch": 1.67, "learning_rate": 1.9442796681414867e-05, "loss": 0.0131, "step": 116030 }, { "epoch": 1.67, "learning_rate": 1.9442748641676396e-05, "loss": 0.0119, "step": 116040 }, { "epoch": 1.67, "learning_rate": 1.9442700601937926e-05, "loss": 0.0084, "step": 116050 }, { "epoch": 1.67, "learning_rate": 1.9442652562199455e-05, "loss": 0.0097, "step": 116060 }, { "epoch": 1.67, "learning_rate": 1.944260452246098e-05, "loss": 0.0101, "step": 116070 }, { "epoch": 1.67, "learning_rate": 1.944255648272251e-05, "loss": 0.0114, "step": 116080 }, { "epoch": 1.67, "learning_rate": 1.944250844298404e-05, "loss": 0.0089, "step": 116090 }, { "epoch": 1.67, "learning_rate": 1.9442460403245565e-05, "loss": 0.0088, "step": 116100 }, { "epoch": 1.67, "learning_rate": 1.9442412363507095e-05, "loss": 0.0116, "step": 116110 }, { "epoch": 1.67, "learning_rate": 1.9442364323768624e-05, "loss": 0.0096, "step": 116120 }, { "epoch": 1.67, "learning_rate": 1.9442316284030153e-05, "loss": 0.0111, "step": 116130 }, { "epoch": 1.67, "learning_rate": 1.944226824429168e-05, "loss": 0.0088, "step": 116140 }, { "epoch": 1.67, "learning_rate": 1.9442220204553208e-05, "loss": 0.0117, "step": 116150 }, { "epoch": 1.67, "learning_rate": 1.9442172164814737e-05, "loss": 0.0078, "step": 116160 }, { "epoch": 1.67, "learning_rate": 1.9442124125076263e-05, "loss": 0.0091, "step": 116170 }, { "epoch": 1.67, "learning_rate": 1.9442076085337793e-05, "loss": 0.0105, "step": 116180 }, { "epoch": 1.67, "learning_rate": 1.9442028045599322e-05, "loss": 0.0143, "step": 116190 }, { "epoch": 1.67, "learning_rate": 1.944198000586085e-05, "loss": 0.0132, "step": 116200 }, { "epoch": 1.67, "learning_rate": 1.9441931966122377e-05, "loss": 0.0122, "step": 116210 }, { "epoch": 1.67, "learning_rate": 1.9441883926383906e-05, "loss": 0.0143, "step": 116220 }, { "epoch": 1.68, "learning_rate": 1.9441835886645436e-05, "loss": 0.0099, "step": 116230 }, { "epoch": 1.68, "learning_rate": 1.9441787846906965e-05, "loss": 0.0115, "step": 116240 }, { "epoch": 1.68, "learning_rate": 1.944173980716849e-05, "loss": 0.0117, "step": 116250 }, { "epoch": 1.68, "learning_rate": 1.944169176743002e-05, "loss": 0.0086, "step": 116260 }, { "epoch": 1.68, "learning_rate": 1.944164372769155e-05, "loss": 0.0113, "step": 116270 }, { "epoch": 1.68, "learning_rate": 1.9441595687953075e-05, "loss": 0.0097, "step": 116280 }, { "epoch": 1.68, "learning_rate": 1.9441547648214604e-05, "loss": 0.0097, "step": 116290 }, { "epoch": 1.68, "learning_rate": 1.9441499608476134e-05, "loss": 0.0117, "step": 116300 }, { "epoch": 1.68, "learning_rate": 1.9441451568737663e-05, "loss": 0.0086, "step": 116310 }, { "epoch": 1.68, "learning_rate": 1.944140352899919e-05, "loss": 0.0093, "step": 116320 }, { "epoch": 1.68, "learning_rate": 1.9441355489260718e-05, "loss": 0.0112, "step": 116330 }, { "epoch": 1.68, "learning_rate": 1.9441307449522247e-05, "loss": 0.0079, "step": 116340 }, { "epoch": 1.68, "learning_rate": 1.9441259409783773e-05, "loss": 0.009, "step": 116350 }, { "epoch": 1.68, "learning_rate": 1.9441211370045303e-05, "loss": 0.0095, "step": 116360 }, { "epoch": 1.68, "learning_rate": 1.9441163330306832e-05, "loss": 0.0082, "step": 116370 }, { "epoch": 1.68, "learning_rate": 1.944111529056836e-05, "loss": 0.0083, "step": 116380 }, { "epoch": 1.68, "learning_rate": 1.9441067250829887e-05, "loss": 0.0131, "step": 116390 }, { "epoch": 1.68, "learning_rate": 1.9441019211091416e-05, "loss": 0.0116, "step": 116400 }, { "epoch": 1.68, "learning_rate": 1.9440971171352946e-05, "loss": 0.011, "step": 116410 }, { "epoch": 1.68, "learning_rate": 1.9440923131614475e-05, "loss": 0.012, "step": 116420 }, { "epoch": 1.68, "learning_rate": 1.9440875091876e-05, "loss": 0.0113, "step": 116430 }, { "epoch": 1.68, "learning_rate": 1.944082705213753e-05, "loss": 0.0104, "step": 116440 }, { "epoch": 1.68, "learning_rate": 1.944077901239906e-05, "loss": 0.0087, "step": 116450 }, { "epoch": 1.68, "learning_rate": 1.9440730972660585e-05, "loss": 0.0079, "step": 116460 }, { "epoch": 1.68, "learning_rate": 1.9440682932922114e-05, "loss": 0.0165, "step": 116470 }, { "epoch": 1.68, "learning_rate": 1.9440634893183644e-05, "loss": 0.0098, "step": 116480 }, { "epoch": 1.68, "learning_rate": 1.9440586853445173e-05, "loss": 0.0091, "step": 116490 }, { "epoch": 1.68, "learning_rate": 1.94405388137067e-05, "loss": 0.0073, "step": 116500 }, { "epoch": 1.68, "learning_rate": 1.9440490773968228e-05, "loss": 0.0085, "step": 116510 }, { "epoch": 1.68, "learning_rate": 1.9440442734229757e-05, "loss": 0.0115, "step": 116520 }, { "epoch": 1.68, "learning_rate": 1.9440394694491283e-05, "loss": 0.0125, "step": 116530 }, { "epoch": 1.68, "learning_rate": 1.9440346654752812e-05, "loss": 0.0128, "step": 116540 }, { "epoch": 1.68, "learning_rate": 1.9440298615014342e-05, "loss": 0.0087, "step": 116550 }, { "epoch": 1.68, "learning_rate": 1.944025057527587e-05, "loss": 0.0097, "step": 116560 }, { "epoch": 1.68, "learning_rate": 1.9440202535537397e-05, "loss": 0.011, "step": 116570 }, { "epoch": 1.68, "learning_rate": 1.9440154495798926e-05, "loss": 0.0096, "step": 116580 }, { "epoch": 1.68, "learning_rate": 1.9440106456060455e-05, "loss": 0.0131, "step": 116590 }, { "epoch": 1.68, "learning_rate": 1.944005841632198e-05, "loss": 0.0118, "step": 116600 }, { "epoch": 1.68, "learning_rate": 1.944001037658351e-05, "loss": 0.0114, "step": 116610 }, { "epoch": 1.68, "learning_rate": 1.943996233684504e-05, "loss": 0.0094, "step": 116620 }, { "epoch": 1.68, "learning_rate": 1.943991429710657e-05, "loss": 0.0102, "step": 116630 }, { "epoch": 1.68, "learning_rate": 1.9439866257368095e-05, "loss": 0.0097, "step": 116640 }, { "epoch": 1.68, "learning_rate": 1.9439818217629624e-05, "loss": 0.0092, "step": 116650 }, { "epoch": 1.68, "learning_rate": 1.9439770177891154e-05, "loss": 0.0104, "step": 116660 }, { "epoch": 1.68, "learning_rate": 1.9439722138152683e-05, "loss": 0.0111, "step": 116670 }, { "epoch": 1.68, "learning_rate": 1.943967409841421e-05, "loss": 0.0091, "step": 116680 }, { "epoch": 1.68, "learning_rate": 1.9439626058675738e-05, "loss": 0.0157, "step": 116690 }, { "epoch": 1.68, "learning_rate": 1.9439578018937267e-05, "loss": 0.016, "step": 116700 }, { "epoch": 1.68, "learning_rate": 1.9439529979198793e-05, "loss": 0.0117, "step": 116710 }, { "epoch": 1.68, "learning_rate": 1.9439481939460322e-05, "loss": 0.0146, "step": 116720 }, { "epoch": 1.68, "learning_rate": 1.943943389972185e-05, "loss": 0.0155, "step": 116730 }, { "epoch": 1.68, "learning_rate": 1.943938585998338e-05, "loss": 0.0117, "step": 116740 }, { "epoch": 1.68, "learning_rate": 1.9439337820244907e-05, "loss": 0.0099, "step": 116750 }, { "epoch": 1.68, "learning_rate": 1.9439289780506436e-05, "loss": 0.012, "step": 116760 }, { "epoch": 1.68, "learning_rate": 1.9439241740767965e-05, "loss": 0.0105, "step": 116770 }, { "epoch": 1.68, "learning_rate": 1.943919370102949e-05, "loss": 0.0104, "step": 116780 }, { "epoch": 1.68, "learning_rate": 1.943914566129102e-05, "loss": 0.008, "step": 116790 }, { "epoch": 1.68, "learning_rate": 1.943909762155255e-05, "loss": 0.0106, "step": 116800 }, { "epoch": 1.68, "learning_rate": 1.943904958181408e-05, "loss": 0.0113, "step": 116810 }, { "epoch": 1.68, "learning_rate": 1.9439001542075605e-05, "loss": 0.0111, "step": 116820 }, { "epoch": 1.68, "learning_rate": 1.9438953502337134e-05, "loss": 0.0133, "step": 116830 }, { "epoch": 1.68, "learning_rate": 1.9438905462598663e-05, "loss": 0.0105, "step": 116840 }, { "epoch": 1.68, "learning_rate": 1.9438857422860193e-05, "loss": 0.0101, "step": 116850 }, { "epoch": 1.68, "learning_rate": 1.943880938312172e-05, "loss": 0.0121, "step": 116860 }, { "epoch": 1.68, "learning_rate": 1.9438761343383248e-05, "loss": 0.0088, "step": 116870 }, { "epoch": 1.68, "learning_rate": 1.9438713303644777e-05, "loss": 0.0111, "step": 116880 }, { "epoch": 1.68, "learning_rate": 1.9438665263906303e-05, "loss": 0.0104, "step": 116890 }, { "epoch": 1.68, "learning_rate": 1.9438617224167832e-05, "loss": 0.0117, "step": 116900 }, { "epoch": 1.68, "learning_rate": 1.943856918442936e-05, "loss": 0.0117, "step": 116910 }, { "epoch": 1.69, "learning_rate": 1.943852114469089e-05, "loss": 0.0084, "step": 116920 }, { "epoch": 1.69, "learning_rate": 1.9438473104952417e-05, "loss": 0.0113, "step": 116930 }, { "epoch": 1.69, "learning_rate": 1.9438425065213946e-05, "loss": 0.0107, "step": 116940 }, { "epoch": 1.69, "learning_rate": 1.9438377025475475e-05, "loss": 0.0136, "step": 116950 }, { "epoch": 1.69, "learning_rate": 1.9438328985737e-05, "loss": 0.0094, "step": 116960 }, { "epoch": 1.69, "learning_rate": 1.943828094599853e-05, "loss": 0.0106, "step": 116970 }, { "epoch": 1.69, "learning_rate": 1.943823290626006e-05, "loss": 0.0104, "step": 116980 }, { "epoch": 1.69, "learning_rate": 1.943818486652159e-05, "loss": 0.0087, "step": 116990 }, { "epoch": 1.69, "learning_rate": 1.9438136826783115e-05, "loss": 0.0134, "step": 117000 }, { "epoch": 1.69, "learning_rate": 1.9438088787044644e-05, "loss": 0.0111, "step": 117010 }, { "epoch": 1.69, "learning_rate": 1.9438040747306173e-05, "loss": 0.0096, "step": 117020 }, { "epoch": 1.69, "learning_rate": 1.9437992707567703e-05, "loss": 0.0123, "step": 117030 }, { "epoch": 1.69, "learning_rate": 1.943794466782923e-05, "loss": 0.0102, "step": 117040 }, { "epoch": 1.69, "learning_rate": 1.9437896628090758e-05, "loss": 0.0088, "step": 117050 }, { "epoch": 1.69, "learning_rate": 1.9437848588352287e-05, "loss": 0.0138, "step": 117060 }, { "epoch": 1.69, "learning_rate": 1.9437800548613813e-05, "loss": 0.0119, "step": 117070 }, { "epoch": 1.69, "learning_rate": 1.9437752508875342e-05, "loss": 0.0078, "step": 117080 }, { "epoch": 1.69, "learning_rate": 1.943770446913687e-05, "loss": 0.0148, "step": 117090 }, { "epoch": 1.69, "learning_rate": 1.94376564293984e-05, "loss": 0.0104, "step": 117100 }, { "epoch": 1.69, "learning_rate": 1.9437608389659927e-05, "loss": 0.0096, "step": 117110 }, { "epoch": 1.69, "learning_rate": 1.9437560349921456e-05, "loss": 0.007, "step": 117120 }, { "epoch": 1.69, "learning_rate": 1.9437512310182985e-05, "loss": 0.0115, "step": 117130 }, { "epoch": 1.69, "learning_rate": 1.943746427044451e-05, "loss": 0.0098, "step": 117140 }, { "epoch": 1.69, "learning_rate": 1.943741623070604e-05, "loss": 0.0094, "step": 117150 }, { "epoch": 1.69, "learning_rate": 1.943736819096757e-05, "loss": 0.0076, "step": 117160 }, { "epoch": 1.69, "learning_rate": 1.94373201512291e-05, "loss": 0.0111, "step": 117170 }, { "epoch": 1.69, "learning_rate": 1.9437272111490625e-05, "loss": 0.0075, "step": 117180 }, { "epoch": 1.69, "learning_rate": 1.9437224071752154e-05, "loss": 0.0108, "step": 117190 }, { "epoch": 1.69, "learning_rate": 1.9437176032013683e-05, "loss": 0.0121, "step": 117200 }, { "epoch": 1.69, "learning_rate": 1.9437127992275213e-05, "loss": 0.0077, "step": 117210 }, { "epoch": 1.69, "learning_rate": 1.943707995253674e-05, "loss": 0.0154, "step": 117220 }, { "epoch": 1.69, "learning_rate": 1.9437031912798268e-05, "loss": 0.0097, "step": 117230 }, { "epoch": 1.69, "learning_rate": 1.9436983873059797e-05, "loss": 0.0096, "step": 117240 }, { "epoch": 1.69, "learning_rate": 1.943694063729517e-05, "loss": 0.0135, "step": 117250 }, { "epoch": 1.69, "learning_rate": 1.94368925975567e-05, "loss": 0.0092, "step": 117260 }, { "epoch": 1.69, "learning_rate": 1.943684455781823e-05, "loss": 0.0122, "step": 117270 }, { "epoch": 1.69, "learning_rate": 1.9436796518079756e-05, "loss": 0.0103, "step": 117280 }, { "epoch": 1.69, "learning_rate": 1.9436748478341285e-05, "loss": 0.0081, "step": 117290 }, { "epoch": 1.69, "learning_rate": 1.9436700438602815e-05, "loss": 0.0123, "step": 117300 }, { "epoch": 1.69, "learning_rate": 1.943665239886434e-05, "loss": 0.0114, "step": 117310 }, { "epoch": 1.69, "learning_rate": 1.943660435912587e-05, "loss": 0.013, "step": 117320 }, { "epoch": 1.69, "learning_rate": 1.94365563193874e-05, "loss": 0.0123, "step": 117330 }, { "epoch": 1.69, "learning_rate": 1.9436508279648928e-05, "loss": 0.0135, "step": 117340 }, { "epoch": 1.69, "learning_rate": 1.9436460239910454e-05, "loss": 0.012, "step": 117350 }, { "epoch": 1.69, "learning_rate": 1.9436412200171983e-05, "loss": 0.0083, "step": 117360 }, { "epoch": 1.69, "learning_rate": 1.9436364160433513e-05, "loss": 0.0103, "step": 117370 }, { "epoch": 1.69, "learning_rate": 1.943631612069504e-05, "loss": 0.0135, "step": 117380 }, { "epoch": 1.69, "learning_rate": 1.9436268080956568e-05, "loss": 0.0101, "step": 117390 }, { "epoch": 1.69, "learning_rate": 1.9436220041218097e-05, "loss": 0.0117, "step": 117400 }, { "epoch": 1.69, "learning_rate": 1.9436172001479626e-05, "loss": 0.0092, "step": 117410 }, { "epoch": 1.69, "learning_rate": 1.9436123961741152e-05, "loss": 0.0083, "step": 117420 }, { "epoch": 1.69, "learning_rate": 1.943607592200268e-05, "loss": 0.0077, "step": 117430 }, { "epoch": 1.69, "learning_rate": 1.943602788226421e-05, "loss": 0.013, "step": 117440 }, { "epoch": 1.69, "learning_rate": 1.943597984252574e-05, "loss": 0.0144, "step": 117450 }, { "epoch": 1.69, "learning_rate": 1.9435931802787266e-05, "loss": 0.0079, "step": 117460 }, { "epoch": 1.69, "learning_rate": 1.9435883763048795e-05, "loss": 0.0107, "step": 117470 }, { "epoch": 1.69, "learning_rate": 1.9435835723310324e-05, "loss": 0.0091, "step": 117480 }, { "epoch": 1.69, "learning_rate": 1.943578768357185e-05, "loss": 0.0115, "step": 117490 }, { "epoch": 1.69, "learning_rate": 1.943573964383338e-05, "loss": 0.0077, "step": 117500 }, { "epoch": 1.69, "learning_rate": 1.943569160409491e-05, "loss": 0.009, "step": 117510 }, { "epoch": 1.69, "learning_rate": 1.9435643564356438e-05, "loss": 0.007, "step": 117520 }, { "epoch": 1.69, "learning_rate": 1.9435595524617964e-05, "loss": 0.0103, "step": 117530 }, { "epoch": 1.69, "learning_rate": 1.9435547484879493e-05, "loss": 0.0091, "step": 117540 }, { "epoch": 1.69, "learning_rate": 1.9435499445141023e-05, "loss": 0.0103, "step": 117550 }, { "epoch": 1.69, "learning_rate": 1.943545140540255e-05, "loss": 0.0077, "step": 117560 }, { "epoch": 1.69, "learning_rate": 1.9435403365664078e-05, "loss": 0.0133, "step": 117570 }, { "epoch": 1.69, "learning_rate": 1.9435355325925607e-05, "loss": 0.0132, "step": 117580 }, { "epoch": 1.69, "learning_rate": 1.9435307286187136e-05, "loss": 0.0103, "step": 117590 }, { "epoch": 1.69, "learning_rate": 1.9435259246448662e-05, "loss": 0.0076, "step": 117600 }, { "epoch": 1.69, "learning_rate": 1.943521120671019e-05, "loss": 0.0095, "step": 117610 }, { "epoch": 1.7, "learning_rate": 1.943516316697172e-05, "loss": 0.0109, "step": 117620 }, { "epoch": 1.7, "learning_rate": 1.943511512723325e-05, "loss": 0.0074, "step": 117630 }, { "epoch": 1.7, "learning_rate": 1.9435067087494776e-05, "loss": 0.0126, "step": 117640 }, { "epoch": 1.7, "learning_rate": 1.9435019047756305e-05, "loss": 0.0078, "step": 117650 }, { "epoch": 1.7, "learning_rate": 1.9434971008017834e-05, "loss": 0.0107, "step": 117660 }, { "epoch": 1.7, "learning_rate": 1.943492296827936e-05, "loss": 0.0123, "step": 117670 }, { "epoch": 1.7, "learning_rate": 1.943487492854089e-05, "loss": 0.0065, "step": 117680 }, { "epoch": 1.7, "learning_rate": 1.943482688880242e-05, "loss": 0.01, "step": 117690 }, { "epoch": 1.7, "learning_rate": 1.9434778849063948e-05, "loss": 0.0131, "step": 117700 }, { "epoch": 1.7, "learning_rate": 1.9434730809325474e-05, "loss": 0.0117, "step": 117710 }, { "epoch": 1.7, "learning_rate": 1.9434682769587003e-05, "loss": 0.0132, "step": 117720 }, { "epoch": 1.7, "learning_rate": 1.9434634729848533e-05, "loss": 0.0096, "step": 117730 }, { "epoch": 1.7, "learning_rate": 1.943458669011006e-05, "loss": 0.0097, "step": 117740 }, { "epoch": 1.7, "learning_rate": 1.9434538650371588e-05, "loss": 0.0114, "step": 117750 }, { "epoch": 1.7, "learning_rate": 1.9434490610633117e-05, "loss": 0.0109, "step": 117760 }, { "epoch": 1.7, "learning_rate": 1.9434442570894646e-05, "loss": 0.0107, "step": 117770 }, { "epoch": 1.7, "learning_rate": 1.9434394531156172e-05, "loss": 0.011, "step": 117780 }, { "epoch": 1.7, "learning_rate": 1.94343464914177e-05, "loss": 0.0104, "step": 117790 }, { "epoch": 1.7, "learning_rate": 1.943429845167923e-05, "loss": 0.0095, "step": 117800 }, { "epoch": 1.7, "learning_rate": 1.943425041194076e-05, "loss": 0.0111, "step": 117810 }, { "epoch": 1.7, "learning_rate": 1.9434202372202286e-05, "loss": 0.0126, "step": 117820 }, { "epoch": 1.7, "learning_rate": 1.9434154332463815e-05, "loss": 0.0092, "step": 117830 }, { "epoch": 1.7, "learning_rate": 1.9434106292725344e-05, "loss": 0.0135, "step": 117840 }, { "epoch": 1.7, "learning_rate": 1.943405825298687e-05, "loss": 0.0104, "step": 117850 }, { "epoch": 1.7, "learning_rate": 1.94340102132484e-05, "loss": 0.0106, "step": 117860 }, { "epoch": 1.7, "learning_rate": 1.943396217350993e-05, "loss": 0.0118, "step": 117870 }, { "epoch": 1.7, "learning_rate": 1.9433914133771458e-05, "loss": 0.0133, "step": 117880 }, { "epoch": 1.7, "learning_rate": 1.9433866094032984e-05, "loss": 0.0144, "step": 117890 }, { "epoch": 1.7, "learning_rate": 1.9433818054294513e-05, "loss": 0.0151, "step": 117900 }, { "epoch": 1.7, "learning_rate": 1.9433770014556042e-05, "loss": 0.0098, "step": 117910 }, { "epoch": 1.7, "learning_rate": 1.943372197481757e-05, "loss": 0.0142, "step": 117920 }, { "epoch": 1.7, "learning_rate": 1.9433673935079098e-05, "loss": 0.0137, "step": 117930 }, { "epoch": 1.7, "learning_rate": 1.9433625895340627e-05, "loss": 0.0124, "step": 117940 }, { "epoch": 1.7, "learning_rate": 1.9433577855602156e-05, "loss": 0.0097, "step": 117950 }, { "epoch": 1.7, "learning_rate": 1.9433529815863682e-05, "loss": 0.0094, "step": 117960 }, { "epoch": 1.7, "learning_rate": 1.943348177612521e-05, "loss": 0.0187, "step": 117970 }, { "epoch": 1.7, "learning_rate": 1.943343373638674e-05, "loss": 0.0105, "step": 117980 }, { "epoch": 1.7, "learning_rate": 1.943338569664827e-05, "loss": 0.0126, "step": 117990 }, { "epoch": 1.7, "learning_rate": 1.9433337656909796e-05, "loss": 0.0094, "step": 118000 }, { "epoch": 1.7, "learning_rate": 1.9433289617171325e-05, "loss": 0.0108, "step": 118010 }, { "epoch": 1.7, "learning_rate": 1.9433241577432854e-05, "loss": 0.0077, "step": 118020 }, { "epoch": 1.7, "learning_rate": 1.943319353769438e-05, "loss": 0.0083, "step": 118030 }, { "epoch": 1.7, "learning_rate": 1.943314549795591e-05, "loss": 0.0085, "step": 118040 }, { "epoch": 1.7, "learning_rate": 1.943309745821744e-05, "loss": 0.0099, "step": 118050 }, { "epoch": 1.7, "learning_rate": 1.9433049418478968e-05, "loss": 0.011, "step": 118060 }, { "epoch": 1.7, "learning_rate": 1.9433001378740494e-05, "loss": 0.0103, "step": 118070 }, { "epoch": 1.7, "learning_rate": 1.9432953339002023e-05, "loss": 0.0086, "step": 118080 }, { "epoch": 1.7, "learning_rate": 1.9432905299263552e-05, "loss": 0.0074, "step": 118090 }, { "epoch": 1.7, "learning_rate": 1.9432857259525078e-05, "loss": 0.0099, "step": 118100 }, { "epoch": 1.7, "learning_rate": 1.9432809219786608e-05, "loss": 0.0104, "step": 118110 }, { "epoch": 1.7, "learning_rate": 1.9432761180048137e-05, "loss": 0.0073, "step": 118120 }, { "epoch": 1.7, "learning_rate": 1.9432713140309666e-05, "loss": 0.0137, "step": 118130 }, { "epoch": 1.7, "learning_rate": 1.9432665100571192e-05, "loss": 0.0122, "step": 118140 }, { "epoch": 1.7, "learning_rate": 1.943261706083272e-05, "loss": 0.0098, "step": 118150 }, { "epoch": 1.7, "learning_rate": 1.943256902109425e-05, "loss": 0.0102, "step": 118160 }, { "epoch": 1.7, "learning_rate": 1.9432520981355776e-05, "loss": 0.0085, "step": 118170 }, { "epoch": 1.7, "learning_rate": 1.9432472941617306e-05, "loss": 0.0104, "step": 118180 }, { "epoch": 1.7, "learning_rate": 1.9432424901878835e-05, "loss": 0.0086, "step": 118190 }, { "epoch": 1.7, "learning_rate": 1.9432376862140364e-05, "loss": 0.0087, "step": 118200 }, { "epoch": 1.7, "learning_rate": 1.943232882240189e-05, "loss": 0.0088, "step": 118210 }, { "epoch": 1.7, "learning_rate": 1.943228078266342e-05, "loss": 0.0106, "step": 118220 }, { "epoch": 1.7, "learning_rate": 1.943223274292495e-05, "loss": 0.0071, "step": 118230 }, { "epoch": 1.7, "learning_rate": 1.9432184703186478e-05, "loss": 0.0125, "step": 118240 }, { "epoch": 1.7, "learning_rate": 1.9432136663448007e-05, "loss": 0.0085, "step": 118250 }, { "epoch": 1.7, "learning_rate": 1.9432088623709536e-05, "loss": 0.0097, "step": 118260 }, { "epoch": 1.7, "learning_rate": 1.9432040583971062e-05, "loss": 0.0117, "step": 118270 }, { "epoch": 1.7, "learning_rate": 1.943199254423259e-05, "loss": 0.009, "step": 118280 }, { "epoch": 1.7, "learning_rate": 1.943194450449412e-05, "loss": 0.0119, "step": 118290 }, { "epoch": 1.7, "learning_rate": 1.943189646475565e-05, "loss": 0.0083, "step": 118300 }, { "epoch": 1.71, "learning_rate": 1.9431848425017176e-05, "loss": 0.0145, "step": 118310 }, { "epoch": 1.71, "learning_rate": 1.9431800385278705e-05, "loss": 0.0085, "step": 118320 }, { "epoch": 1.71, "learning_rate": 1.9431752345540234e-05, "loss": 0.008, "step": 118330 }, { "epoch": 1.71, "learning_rate": 1.943170430580176e-05, "loss": 0.0099, "step": 118340 }, { "epoch": 1.71, "learning_rate": 1.943165626606329e-05, "loss": 0.0111, "step": 118350 }, { "epoch": 1.71, "learning_rate": 1.943160822632482e-05, "loss": 0.0084, "step": 118360 }, { "epoch": 1.71, "learning_rate": 1.9431560186586348e-05, "loss": 0.0142, "step": 118370 }, { "epoch": 1.71, "learning_rate": 1.9431512146847874e-05, "loss": 0.0106, "step": 118380 }, { "epoch": 1.71, "learning_rate": 1.9431464107109403e-05, "loss": 0.013, "step": 118390 }, { "epoch": 1.71, "learning_rate": 1.9431416067370933e-05, "loss": 0.0117, "step": 118400 }, { "epoch": 1.71, "learning_rate": 1.943136802763246e-05, "loss": 0.0095, "step": 118410 }, { "epoch": 1.71, "learning_rate": 1.9431319987893988e-05, "loss": 0.015, "step": 118420 }, { "epoch": 1.71, "learning_rate": 1.9431271948155517e-05, "loss": 0.0087, "step": 118430 }, { "epoch": 1.71, "learning_rate": 1.9431223908417046e-05, "loss": 0.0123, "step": 118440 }, { "epoch": 1.71, "learning_rate": 1.9431175868678572e-05, "loss": 0.0118, "step": 118450 }, { "epoch": 1.71, "learning_rate": 1.94311278289401e-05, "loss": 0.0091, "step": 118460 }, { "epoch": 1.71, "learning_rate": 1.943107978920163e-05, "loss": 0.0093, "step": 118470 }, { "epoch": 1.71, "learning_rate": 1.943103174946316e-05, "loss": 0.0079, "step": 118480 }, { "epoch": 1.71, "learning_rate": 1.9430983709724686e-05, "loss": 0.0128, "step": 118490 }, { "epoch": 1.71, "learning_rate": 1.9430935669986215e-05, "loss": 0.0132, "step": 118500 }, { "epoch": 1.71, "learning_rate": 1.9430887630247744e-05, "loss": 0.0108, "step": 118510 }, { "epoch": 1.71, "learning_rate": 1.943083959050927e-05, "loss": 0.0088, "step": 118520 }, { "epoch": 1.71, "learning_rate": 1.94307915507708e-05, "loss": 0.0093, "step": 118530 }, { "epoch": 1.71, "learning_rate": 1.943074351103233e-05, "loss": 0.0105, "step": 118540 }, { "epoch": 1.71, "learning_rate": 1.9430695471293858e-05, "loss": 0.0085, "step": 118550 }, { "epoch": 1.71, "learning_rate": 1.9430647431555384e-05, "loss": 0.0092, "step": 118560 }, { "epoch": 1.71, "learning_rate": 1.9430599391816913e-05, "loss": 0.0111, "step": 118570 }, { "epoch": 1.71, "learning_rate": 1.9430551352078443e-05, "loss": 0.0055, "step": 118580 }, { "epoch": 1.71, "learning_rate": 1.943050331233997e-05, "loss": 0.0106, "step": 118590 }, { "epoch": 1.71, "learning_rate": 1.9430460076575343e-05, "loss": 0.0092, "step": 118600 }, { "epoch": 1.71, "learning_rate": 1.9430412036836872e-05, "loss": 0.01, "step": 118610 }, { "epoch": 1.71, "learning_rate": 1.94303639970984e-05, "loss": 0.0086, "step": 118620 }, { "epoch": 1.71, "learning_rate": 1.9430315957359927e-05, "loss": 0.0119, "step": 118630 }, { "epoch": 1.71, "learning_rate": 1.9430267917621457e-05, "loss": 0.0107, "step": 118640 }, { "epoch": 1.71, "learning_rate": 1.9430219877882986e-05, "loss": 0.0115, "step": 118650 }, { "epoch": 1.71, "learning_rate": 1.9430171838144515e-05, "loss": 0.0102, "step": 118660 }, { "epoch": 1.71, "learning_rate": 1.943012379840604e-05, "loss": 0.012, "step": 118670 }, { "epoch": 1.71, "learning_rate": 1.943007575866757e-05, "loss": 0.0107, "step": 118680 }, { "epoch": 1.71, "learning_rate": 1.94300277189291e-05, "loss": 0.0076, "step": 118690 }, { "epoch": 1.71, "learning_rate": 1.9429979679190626e-05, "loss": 0.0078, "step": 118700 }, { "epoch": 1.71, "learning_rate": 1.9429931639452155e-05, "loss": 0.0128, "step": 118710 }, { "epoch": 1.71, "learning_rate": 1.9429888403687533e-05, "loss": 0.01, "step": 118720 }, { "epoch": 1.71, "learning_rate": 1.942984036394906e-05, "loss": 0.0098, "step": 118730 }, { "epoch": 1.71, "learning_rate": 1.9429792324210588e-05, "loss": 0.0096, "step": 118740 }, { "epoch": 1.71, "learning_rate": 1.9429744284472117e-05, "loss": 0.01, "step": 118750 }, { "epoch": 1.71, "learning_rate": 1.9429696244733643e-05, "loss": 0.0113, "step": 118760 }, { "epoch": 1.71, "learning_rate": 1.9429648204995172e-05, "loss": 0.0072, "step": 118770 }, { "epoch": 1.71, "learning_rate": 1.9429600165256702e-05, "loss": 0.0109, "step": 118780 }, { "epoch": 1.71, "learning_rate": 1.942955212551823e-05, "loss": 0.0081, "step": 118790 }, { "epoch": 1.71, "learning_rate": 1.9429504085779757e-05, "loss": 0.0088, "step": 118800 }, { "epoch": 1.71, "learning_rate": 1.9429456046041286e-05, "loss": 0.0095, "step": 118810 }, { "epoch": 1.71, "learning_rate": 1.9429408006302815e-05, "loss": 0.0093, "step": 118820 }, { "epoch": 1.71, "learning_rate": 1.942935996656434e-05, "loss": 0.0074, "step": 118830 }, { "epoch": 1.71, "learning_rate": 1.942931192682587e-05, "loss": 0.0101, "step": 118840 }, { "epoch": 1.71, "learning_rate": 1.94292638870874e-05, "loss": 0.0092, "step": 118850 }, { "epoch": 1.71, "learning_rate": 1.942921584734893e-05, "loss": 0.0091, "step": 118860 }, { "epoch": 1.71, "learning_rate": 1.9429167807610455e-05, "loss": 0.0109, "step": 118870 }, { "epoch": 1.71, "learning_rate": 1.9429119767871984e-05, "loss": 0.0096, "step": 118880 }, { "epoch": 1.71, "learning_rate": 1.9429071728133514e-05, "loss": 0.0135, "step": 118890 }, { "epoch": 1.71, "learning_rate": 1.9429023688395043e-05, "loss": 0.0088, "step": 118900 }, { "epoch": 1.71, "learning_rate": 1.942897564865657e-05, "loss": 0.0104, "step": 118910 }, { "epoch": 1.71, "learning_rate": 1.9428927608918098e-05, "loss": 0.0124, "step": 118920 }, { "epoch": 1.71, "learning_rate": 1.9428879569179627e-05, "loss": 0.0125, "step": 118930 }, { "epoch": 1.71, "learning_rate": 1.9428831529441153e-05, "loss": 0.0125, "step": 118940 }, { "epoch": 1.71, "learning_rate": 1.9428783489702682e-05, "loss": 0.0095, "step": 118950 }, { "epoch": 1.71, "learning_rate": 1.942873544996421e-05, "loss": 0.0113, "step": 118960 }, { "epoch": 1.71, "learning_rate": 1.942868741022574e-05, "loss": 0.0115, "step": 118970 }, { "epoch": 1.71, "learning_rate": 1.9428639370487267e-05, "loss": 0.0135, "step": 118980 }, { "epoch": 1.71, "learning_rate": 1.9428591330748796e-05, "loss": 0.0091, "step": 118990 }, { "epoch": 1.72, "learning_rate": 1.9428543291010325e-05, "loss": 0.009, "step": 119000 }, { "epoch": 1.72, "learning_rate": 1.942849525127185e-05, "loss": 0.0134, "step": 119010 }, { "epoch": 1.72, "learning_rate": 1.942844721153338e-05, "loss": 0.0092, "step": 119020 }, { "epoch": 1.72, "learning_rate": 1.942839917179491e-05, "loss": 0.0108, "step": 119030 }, { "epoch": 1.72, "learning_rate": 1.942835113205644e-05, "loss": 0.012, "step": 119040 }, { "epoch": 1.72, "learning_rate": 1.9428303092317965e-05, "loss": 0.0068, "step": 119050 }, { "epoch": 1.72, "learning_rate": 1.9428255052579494e-05, "loss": 0.0109, "step": 119060 }, { "epoch": 1.72, "learning_rate": 1.9428207012841023e-05, "loss": 0.0103, "step": 119070 }, { "epoch": 1.72, "learning_rate": 1.9428158973102553e-05, "loss": 0.0093, "step": 119080 }, { "epoch": 1.72, "learning_rate": 1.942811093336408e-05, "loss": 0.0125, "step": 119090 }, { "epoch": 1.72, "learning_rate": 1.9428062893625608e-05, "loss": 0.008, "step": 119100 }, { "epoch": 1.72, "learning_rate": 1.9428014853887137e-05, "loss": 0.009, "step": 119110 }, { "epoch": 1.72, "learning_rate": 1.9427966814148663e-05, "loss": 0.0089, "step": 119120 }, { "epoch": 1.72, "learning_rate": 1.9427918774410192e-05, "loss": 0.0076, "step": 119130 }, { "epoch": 1.72, "learning_rate": 1.942787073467172e-05, "loss": 0.0127, "step": 119140 }, { "epoch": 1.72, "learning_rate": 1.942782269493325e-05, "loss": 0.0075, "step": 119150 }, { "epoch": 1.72, "learning_rate": 1.9427774655194777e-05, "loss": 0.0086, "step": 119160 }, { "epoch": 1.72, "learning_rate": 1.9427726615456306e-05, "loss": 0.0072, "step": 119170 }, { "epoch": 1.72, "learning_rate": 1.9427678575717835e-05, "loss": 0.0118, "step": 119180 }, { "epoch": 1.72, "learning_rate": 1.942763053597936e-05, "loss": 0.0102, "step": 119190 }, { "epoch": 1.72, "learning_rate": 1.942758249624089e-05, "loss": 0.011, "step": 119200 }, { "epoch": 1.72, "learning_rate": 1.942753445650242e-05, "loss": 0.0089, "step": 119210 }, { "epoch": 1.72, "learning_rate": 1.942748641676395e-05, "loss": 0.0095, "step": 119220 }, { "epoch": 1.72, "learning_rate": 1.9427438377025475e-05, "loss": 0.0072, "step": 119230 }, { "epoch": 1.72, "learning_rate": 1.9427390337287004e-05, "loss": 0.0086, "step": 119240 }, { "epoch": 1.72, "learning_rate": 1.9427342297548533e-05, "loss": 0.0082, "step": 119250 }, { "epoch": 1.72, "learning_rate": 1.9427294257810063e-05, "loss": 0.0112, "step": 119260 }, { "epoch": 1.72, "learning_rate": 1.9427246218071592e-05, "loss": 0.0082, "step": 119270 }, { "epoch": 1.72, "learning_rate": 1.942719817833312e-05, "loss": 0.0134, "step": 119280 }, { "epoch": 1.72, "learning_rate": 1.9427150138594647e-05, "loss": 0.0071, "step": 119290 }, { "epoch": 1.72, "learning_rate": 1.9427102098856176e-05, "loss": 0.0129, "step": 119300 }, { "epoch": 1.72, "learning_rate": 1.9427054059117706e-05, "loss": 0.0068, "step": 119310 }, { "epoch": 1.72, "learning_rate": 1.942700601937923e-05, "loss": 0.0091, "step": 119320 }, { "epoch": 1.72, "learning_rate": 1.942695797964076e-05, "loss": 0.0139, "step": 119330 }, { "epoch": 1.72, "learning_rate": 1.942690993990229e-05, "loss": 0.0222, "step": 119340 }, { "epoch": 1.72, "learning_rate": 1.942686190016382e-05, "loss": 0.0098, "step": 119350 }, { "epoch": 1.72, "learning_rate": 1.9426813860425345e-05, "loss": 0.01, "step": 119360 }, { "epoch": 1.72, "learning_rate": 1.9426765820686874e-05, "loss": 0.0131, "step": 119370 }, { "epoch": 1.72, "learning_rate": 1.9426717780948404e-05, "loss": 0.0141, "step": 119380 }, { "epoch": 1.72, "learning_rate": 1.9426669741209933e-05, "loss": 0.0084, "step": 119390 }, { "epoch": 1.72, "learning_rate": 1.942662170147146e-05, "loss": 0.0106, "step": 119400 }, { "epoch": 1.72, "learning_rate": 1.9426573661732988e-05, "loss": 0.0137, "step": 119410 }, { "epoch": 1.72, "learning_rate": 1.9426525621994517e-05, "loss": 0.011, "step": 119420 }, { "epoch": 1.72, "learning_rate": 1.9426477582256043e-05, "loss": 0.0107, "step": 119430 }, { "epoch": 1.72, "learning_rate": 1.9426429542517573e-05, "loss": 0.0088, "step": 119440 }, { "epoch": 1.72, "learning_rate": 1.9426381502779102e-05, "loss": 0.0087, "step": 119450 }, { "epoch": 1.72, "learning_rate": 1.942633346304063e-05, "loss": 0.0096, "step": 119460 }, { "epoch": 1.72, "learning_rate": 1.9426285423302157e-05, "loss": 0.0099, "step": 119470 }, { "epoch": 1.72, "learning_rate": 1.9426237383563686e-05, "loss": 0.0105, "step": 119480 }, { "epoch": 1.72, "learning_rate": 1.9426189343825216e-05, "loss": 0.009, "step": 119490 }, { "epoch": 1.72, "learning_rate": 1.942614130408674e-05, "loss": 0.0114, "step": 119500 }, { "epoch": 1.72, "learning_rate": 1.942609326434827e-05, "loss": 0.0121, "step": 119510 }, { "epoch": 1.72, "learning_rate": 1.94260452246098e-05, "loss": 0.0092, "step": 119520 }, { "epoch": 1.72, "learning_rate": 1.942599718487133e-05, "loss": 0.0117, "step": 119530 }, { "epoch": 1.72, "learning_rate": 1.9425949145132855e-05, "loss": 0.0091, "step": 119540 }, { "epoch": 1.72, "learning_rate": 1.9425901105394384e-05, "loss": 0.0114, "step": 119550 }, { "epoch": 1.72, "learning_rate": 1.9425853065655914e-05, "loss": 0.0125, "step": 119560 }, { "epoch": 1.72, "learning_rate": 1.9425805025917443e-05, "loss": 0.0085, "step": 119570 }, { "epoch": 1.72, "learning_rate": 1.942575698617897e-05, "loss": 0.0111, "step": 119580 }, { "epoch": 1.72, "learning_rate": 1.9425708946440498e-05, "loss": 0.011, "step": 119590 }, { "epoch": 1.72, "learning_rate": 1.9425660906702027e-05, "loss": 0.0113, "step": 119600 }, { "epoch": 1.72, "learning_rate": 1.9425612866963553e-05, "loss": 0.0096, "step": 119610 }, { "epoch": 1.72, "learning_rate": 1.9425564827225082e-05, "loss": 0.009, "step": 119620 }, { "epoch": 1.72, "learning_rate": 1.9425516787486612e-05, "loss": 0.0138, "step": 119630 }, { "epoch": 1.72, "learning_rate": 1.942546874774814e-05, "loss": 0.0108, "step": 119640 }, { "epoch": 1.72, "learning_rate": 1.9425420708009667e-05, "loss": 0.0111, "step": 119650 }, { "epoch": 1.72, "learning_rate": 1.9425372668271196e-05, "loss": 0.0111, "step": 119660 }, { "epoch": 1.72, "learning_rate": 1.9425324628532725e-05, "loss": 0.0091, "step": 119670 }, { "epoch": 1.72, "learning_rate": 1.942527658879425e-05, "loss": 0.0077, "step": 119680 }, { "epoch": 1.72, "learning_rate": 1.942522854905578e-05, "loss": 0.0087, "step": 119690 }, { "epoch": 1.73, "learning_rate": 1.942518050931731e-05, "loss": 0.01, "step": 119700 }, { "epoch": 1.73, "learning_rate": 1.942513246957884e-05, "loss": 0.0121, "step": 119710 }, { "epoch": 1.73, "learning_rate": 1.9425084429840365e-05, "loss": 0.0135, "step": 119720 }, { "epoch": 1.73, "learning_rate": 1.9425036390101894e-05, "loss": 0.0177, "step": 119730 }, { "epoch": 1.73, "learning_rate": 1.9424988350363424e-05, "loss": 0.0128, "step": 119740 }, { "epoch": 1.73, "learning_rate": 1.9424940310624953e-05, "loss": 0.0114, "step": 119750 }, { "epoch": 1.73, "learning_rate": 1.942489227088648e-05, "loss": 0.0105, "step": 119760 }, { "epoch": 1.73, "learning_rate": 1.9424844231148008e-05, "loss": 0.0105, "step": 119770 }, { "epoch": 1.73, "learning_rate": 1.9424796191409537e-05, "loss": 0.0087, "step": 119780 }, { "epoch": 1.73, "learning_rate": 1.9424748151671063e-05, "loss": 0.0062, "step": 119790 }, { "epoch": 1.73, "learning_rate": 1.9424700111932592e-05, "loss": 0.0118, "step": 119800 }, { "epoch": 1.73, "learning_rate": 1.942465207219412e-05, "loss": 0.0084, "step": 119810 }, { "epoch": 1.73, "learning_rate": 1.942460403245565e-05, "loss": 0.0111, "step": 119820 }, { "epoch": 1.73, "learning_rate": 1.9424555992717177e-05, "loss": 0.0084, "step": 119830 }, { "epoch": 1.73, "learning_rate": 1.9424507952978706e-05, "loss": 0.0081, "step": 119840 }, { "epoch": 1.73, "learning_rate": 1.9424459913240235e-05, "loss": 0.0131, "step": 119850 }, { "epoch": 1.73, "learning_rate": 1.942441187350176e-05, "loss": 0.0127, "step": 119860 }, { "epoch": 1.73, "learning_rate": 1.942436383376329e-05, "loss": 0.0084, "step": 119870 }, { "epoch": 1.73, "learning_rate": 1.942431579402482e-05, "loss": 0.0106, "step": 119880 }, { "epoch": 1.73, "learning_rate": 1.942426775428635e-05, "loss": 0.0112, "step": 119890 }, { "epoch": 1.73, "learning_rate": 1.9424219714547875e-05, "loss": 0.0129, "step": 119900 }, { "epoch": 1.73, "learning_rate": 1.9424171674809404e-05, "loss": 0.0092, "step": 119910 }, { "epoch": 1.73, "learning_rate": 1.9424123635070933e-05, "loss": 0.0115, "step": 119920 }, { "epoch": 1.73, "learning_rate": 1.9424075595332463e-05, "loss": 0.0127, "step": 119930 }, { "epoch": 1.73, "learning_rate": 1.942402755559399e-05, "loss": 0.0092, "step": 119940 }, { "epoch": 1.73, "learning_rate": 1.9423979515855518e-05, "loss": 0.0098, "step": 119950 }, { "epoch": 1.73, "learning_rate": 1.9423931476117047e-05, "loss": 0.0106, "step": 119960 }, { "epoch": 1.73, "learning_rate": 1.9423883436378573e-05, "loss": 0.01, "step": 119970 }, { "epoch": 1.73, "learning_rate": 1.9423835396640102e-05, "loss": 0.0104, "step": 119980 }, { "epoch": 1.73, "learning_rate": 1.942378735690163e-05, "loss": 0.0126, "step": 119990 }, { "epoch": 1.73, "learning_rate": 1.942373931716316e-05, "loss": 0.0081, "step": 120000 }, { "epoch": 1.73, "learning_rate": 1.9423691277424687e-05, "loss": 0.0127, "step": 120010 }, { "epoch": 1.73, "learning_rate": 1.9423643237686216e-05, "loss": 0.0102, "step": 120020 }, { "epoch": 1.73, "learning_rate": 1.9423595197947745e-05, "loss": 0.0151, "step": 120030 }, { "epoch": 1.73, "learning_rate": 1.942354715820927e-05, "loss": 0.016, "step": 120040 }, { "epoch": 1.73, "learning_rate": 1.94234991184708e-05, "loss": 0.0084, "step": 120050 }, { "epoch": 1.73, "learning_rate": 1.942345107873233e-05, "loss": 0.0162, "step": 120060 }, { "epoch": 1.73, "learning_rate": 1.942340303899386e-05, "loss": 0.0093, "step": 120070 }, { "epoch": 1.73, "learning_rate": 1.9423354999255385e-05, "loss": 0.0075, "step": 120080 }, { "epoch": 1.73, "learning_rate": 1.9423306959516914e-05, "loss": 0.0106, "step": 120090 }, { "epoch": 1.73, "learning_rate": 1.9423258919778443e-05, "loss": 0.0111, "step": 120100 }, { "epoch": 1.73, "learning_rate": 1.9423210880039973e-05, "loss": 0.0136, "step": 120110 }, { "epoch": 1.73, "learning_rate": 1.94231628403015e-05, "loss": 0.0126, "step": 120120 }, { "epoch": 1.73, "learning_rate": 1.9423114800563028e-05, "loss": 0.0114, "step": 120130 }, { "epoch": 1.73, "learning_rate": 1.9423066760824557e-05, "loss": 0.0101, "step": 120140 }, { "epoch": 1.73, "learning_rate": 1.9423018721086083e-05, "loss": 0.0089, "step": 120150 }, { "epoch": 1.73, "learning_rate": 1.9422970681347612e-05, "loss": 0.0095, "step": 120160 }, { "epoch": 1.73, "learning_rate": 1.942292264160914e-05, "loss": 0.0105, "step": 120170 }, { "epoch": 1.73, "learning_rate": 1.942287460187067e-05, "loss": 0.0107, "step": 120180 }, { "epoch": 1.73, "learning_rate": 1.9422826562132197e-05, "loss": 0.0114, "step": 120190 }, { "epoch": 1.73, "learning_rate": 1.9422778522393726e-05, "loss": 0.0113, "step": 120200 }, { "epoch": 1.73, "learning_rate": 1.9422730482655255e-05, "loss": 0.0113, "step": 120210 }, { "epoch": 1.73, "learning_rate": 1.942268244291678e-05, "loss": 0.0086, "step": 120220 }, { "epoch": 1.73, "learning_rate": 1.942263440317831e-05, "loss": 0.011, "step": 120230 }, { "epoch": 1.73, "learning_rate": 1.942258636343984e-05, "loss": 0.0094, "step": 120240 }, { "epoch": 1.73, "learning_rate": 1.942253832370137e-05, "loss": 0.012, "step": 120250 }, { "epoch": 1.73, "learning_rate": 1.9422490283962895e-05, "loss": 0.0095, "step": 120260 }, { "epoch": 1.73, "learning_rate": 1.9422442244224424e-05, "loss": 0.0093, "step": 120270 }, { "epoch": 1.73, "learning_rate": 1.9422394204485953e-05, "loss": 0.0116, "step": 120280 }, { "epoch": 1.73, "learning_rate": 1.9422346164747483e-05, "loss": 0.0098, "step": 120290 }, { "epoch": 1.73, "learning_rate": 1.942229812500901e-05, "loss": 0.0092, "step": 120300 }, { "epoch": 1.73, "learning_rate": 1.9422250085270538e-05, "loss": 0.0072, "step": 120310 }, { "epoch": 1.73, "learning_rate": 1.9422202045532067e-05, "loss": 0.0146, "step": 120320 }, { "epoch": 1.73, "learning_rate": 1.9422154005793593e-05, "loss": 0.0105, "step": 120330 }, { "epoch": 1.73, "learning_rate": 1.9422105966055122e-05, "loss": 0.01, "step": 120340 }, { "epoch": 1.73, "learning_rate": 1.942205792631665e-05, "loss": 0.012, "step": 120350 }, { "epoch": 1.73, "learning_rate": 1.942200988657818e-05, "loss": 0.0084, "step": 120360 }, { "epoch": 1.73, "learning_rate": 1.9421961846839707e-05, "loss": 0.01, "step": 120370 }, { "epoch": 1.73, "learning_rate": 1.9421913807101236e-05, "loss": 0.0134, "step": 120380 }, { "epoch": 1.74, "learning_rate": 1.9421865767362765e-05, "loss": 0.008, "step": 120390 }, { "epoch": 1.74, "learning_rate": 1.942181772762429e-05, "loss": 0.0111, "step": 120400 }, { "epoch": 1.74, "learning_rate": 1.942176968788582e-05, "loss": 0.0087, "step": 120410 }, { "epoch": 1.74, "learning_rate": 1.942172164814735e-05, "loss": 0.0144, "step": 120420 }, { "epoch": 1.74, "learning_rate": 1.942167360840888e-05, "loss": 0.0111, "step": 120430 }, { "epoch": 1.74, "learning_rate": 1.9421625568670405e-05, "loss": 0.0109, "step": 120440 }, { "epoch": 1.74, "learning_rate": 1.9421577528931934e-05, "loss": 0.0133, "step": 120450 }, { "epoch": 1.74, "learning_rate": 1.9421529489193463e-05, "loss": 0.0117, "step": 120460 }, { "epoch": 1.74, "learning_rate": 1.9421481449454992e-05, "loss": 0.011, "step": 120470 }, { "epoch": 1.74, "learning_rate": 1.942143340971652e-05, "loss": 0.0078, "step": 120480 }, { "epoch": 1.74, "learning_rate": 1.9421385369978048e-05, "loss": 0.0099, "step": 120490 }, { "epoch": 1.74, "learning_rate": 1.9421337330239577e-05, "loss": 0.0101, "step": 120500 }, { "epoch": 1.74, "learning_rate": 1.9421289290501103e-05, "loss": 0.0094, "step": 120510 }, { "epoch": 1.74, "learning_rate": 1.9421241250762632e-05, "loss": 0.0119, "step": 120520 }, { "epoch": 1.74, "learning_rate": 1.942119321102416e-05, "loss": 0.0092, "step": 120530 }, { "epoch": 1.74, "learning_rate": 1.942114517128569e-05, "loss": 0.0112, "step": 120540 }, { "epoch": 1.74, "learning_rate": 1.9421097131547216e-05, "loss": 0.009, "step": 120550 }, { "epoch": 1.74, "learning_rate": 1.9421049091808746e-05, "loss": 0.0061, "step": 120560 }, { "epoch": 1.74, "learning_rate": 1.9421001052070275e-05, "loss": 0.0066, "step": 120570 }, { "epoch": 1.74, "learning_rate": 1.94209530123318e-05, "loss": 0.0131, "step": 120580 }, { "epoch": 1.74, "learning_rate": 1.942090497259333e-05, "loss": 0.0098, "step": 120590 }, { "epoch": 1.74, "learning_rate": 1.942085693285486e-05, "loss": 0.0107, "step": 120600 }, { "epoch": 1.74, "learning_rate": 1.942080889311639e-05, "loss": 0.0097, "step": 120610 }, { "epoch": 1.74, "learning_rate": 1.9420760853377915e-05, "loss": 0.007, "step": 120620 }, { "epoch": 1.74, "learning_rate": 1.9420712813639444e-05, "loss": 0.0125, "step": 120630 }, { "epoch": 1.74, "learning_rate": 1.9420664773900973e-05, "loss": 0.0084, "step": 120640 }, { "epoch": 1.74, "learning_rate": 1.9420616734162502e-05, "loss": 0.0105, "step": 120650 }, { "epoch": 1.74, "learning_rate": 1.9420568694424028e-05, "loss": 0.0113, "step": 120660 }, { "epoch": 1.74, "learning_rate": 1.9420520654685558e-05, "loss": 0.0081, "step": 120670 }, { "epoch": 1.74, "learning_rate": 1.9420472614947087e-05, "loss": 0.012, "step": 120680 }, { "epoch": 1.74, "learning_rate": 1.9420424575208613e-05, "loss": 0.0079, "step": 120690 }, { "epoch": 1.74, "learning_rate": 1.9420376535470142e-05, "loss": 0.0072, "step": 120700 }, { "epoch": 1.74, "learning_rate": 1.942032849573167e-05, "loss": 0.0077, "step": 120710 }, { "epoch": 1.74, "learning_rate": 1.94202804559932e-05, "loss": 0.01, "step": 120720 }, { "epoch": 1.74, "learning_rate": 1.9420232416254726e-05, "loss": 0.0165, "step": 120730 }, { "epoch": 1.74, "learning_rate": 1.9420184376516256e-05, "loss": 0.0115, "step": 120740 }, { "epoch": 1.74, "learning_rate": 1.9420136336777785e-05, "loss": 0.0134, "step": 120750 }, { "epoch": 1.74, "learning_rate": 1.942008829703931e-05, "loss": 0.0095, "step": 120760 }, { "epoch": 1.74, "learning_rate": 1.942004025730084e-05, "loss": 0.0111, "step": 120770 }, { "epoch": 1.74, "learning_rate": 1.941999221756237e-05, "loss": 0.0119, "step": 120780 }, { "epoch": 1.74, "learning_rate": 1.94199441778239e-05, "loss": 0.0092, "step": 120790 }, { "epoch": 1.74, "learning_rate": 1.9419896138085424e-05, "loss": 0.0102, "step": 120800 }, { "epoch": 1.74, "learning_rate": 1.9419848098346954e-05, "loss": 0.0099, "step": 120810 }, { "epoch": 1.74, "learning_rate": 1.9419800058608483e-05, "loss": 0.0114, "step": 120820 }, { "epoch": 1.74, "learning_rate": 1.941975201887001e-05, "loss": 0.0101, "step": 120830 }, { "epoch": 1.74, "learning_rate": 1.9419703979131538e-05, "loss": 0.0078, "step": 120840 }, { "epoch": 1.74, "learning_rate": 1.9419655939393067e-05, "loss": 0.0084, "step": 120850 }, { "epoch": 1.74, "learning_rate": 1.9419607899654597e-05, "loss": 0.0089, "step": 120860 }, { "epoch": 1.74, "learning_rate": 1.9419559859916123e-05, "loss": 0.0135, "step": 120870 }, { "epoch": 1.74, "learning_rate": 1.9419511820177652e-05, "loss": 0.0079, "step": 120880 }, { "epoch": 1.74, "learning_rate": 1.941946378043918e-05, "loss": 0.0065, "step": 120890 }, { "epoch": 1.74, "learning_rate": 1.941941574070071e-05, "loss": 0.0103, "step": 120900 }, { "epoch": 1.74, "learning_rate": 1.9419367700962236e-05, "loss": 0.0118, "step": 120910 }, { "epoch": 1.74, "learning_rate": 1.9419319661223766e-05, "loss": 0.012, "step": 120920 }, { "epoch": 1.74, "learning_rate": 1.9419271621485295e-05, "loss": 0.0075, "step": 120930 }, { "epoch": 1.74, "learning_rate": 1.941922358174682e-05, "loss": 0.0099, "step": 120940 }, { "epoch": 1.74, "learning_rate": 1.941917554200835e-05, "loss": 0.0127, "step": 120950 }, { "epoch": 1.74, "learning_rate": 1.941912750226988e-05, "loss": 0.0079, "step": 120960 }, { "epoch": 1.74, "learning_rate": 1.941907946253141e-05, "loss": 0.009, "step": 120970 }, { "epoch": 1.74, "learning_rate": 1.9419031422792934e-05, "loss": 0.0103, "step": 120980 }, { "epoch": 1.74, "learning_rate": 1.9418983383054464e-05, "loss": 0.0109, "step": 120990 }, { "epoch": 1.74, "learning_rate": 1.9418935343315993e-05, "loss": 0.0136, "step": 121000 }, { "epoch": 1.74, "learning_rate": 1.941888730357752e-05, "loss": 0.0111, "step": 121010 }, { "epoch": 1.74, "learning_rate": 1.9418839263839048e-05, "loss": 0.0109, "step": 121020 }, { "epoch": 1.74, "learning_rate": 1.9418791224100577e-05, "loss": 0.0102, "step": 121030 }, { "epoch": 1.74, "learning_rate": 1.9418743184362107e-05, "loss": 0.0089, "step": 121040 }, { "epoch": 1.74, "learning_rate": 1.9418695144623633e-05, "loss": 0.0089, "step": 121050 }, { "epoch": 1.74, "learning_rate": 1.9418647104885162e-05, "loss": 0.0132, "step": 121060 }, { "epoch": 1.74, "learning_rate": 1.941859906514669e-05, "loss": 0.0108, "step": 121070 }, { "epoch": 1.74, "learning_rate": 1.941855102540822e-05, "loss": 0.0105, "step": 121080 }, { "epoch": 1.75, "learning_rate": 1.9418502985669746e-05, "loss": 0.0101, "step": 121090 }, { "epoch": 1.75, "learning_rate": 1.9418454945931275e-05, "loss": 0.0099, "step": 121100 }, { "epoch": 1.75, "learning_rate": 1.9418406906192805e-05, "loss": 0.0072, "step": 121110 }, { "epoch": 1.75, "learning_rate": 1.941835886645433e-05, "loss": 0.0092, "step": 121120 }, { "epoch": 1.75, "learning_rate": 1.941831082671586e-05, "loss": 0.0077, "step": 121130 }, { "epoch": 1.75, "learning_rate": 1.941826278697739e-05, "loss": 0.0081, "step": 121140 }, { "epoch": 1.75, "learning_rate": 1.941821474723892e-05, "loss": 0.0137, "step": 121150 }, { "epoch": 1.75, "learning_rate": 1.9418166707500444e-05, "loss": 0.0072, "step": 121160 }, { "epoch": 1.75, "learning_rate": 1.9418118667761974e-05, "loss": 0.0089, "step": 121170 }, { "epoch": 1.75, "learning_rate": 1.9418070628023503e-05, "loss": 0.0111, "step": 121180 }, { "epoch": 1.75, "learning_rate": 1.941802258828503e-05, "loss": 0.0133, "step": 121190 }, { "epoch": 1.75, "learning_rate": 1.9417974548546558e-05, "loss": 0.0091, "step": 121200 }, { "epoch": 1.75, "learning_rate": 1.9417926508808087e-05, "loss": 0.0109, "step": 121210 }, { "epoch": 1.75, "learning_rate": 1.9417878469069617e-05, "loss": 0.0091, "step": 121220 }, { "epoch": 1.75, "learning_rate": 1.9417830429331142e-05, "loss": 0.0138, "step": 121230 }, { "epoch": 1.75, "learning_rate": 1.9417782389592672e-05, "loss": 0.0085, "step": 121240 }, { "epoch": 1.75, "learning_rate": 1.94177343498542e-05, "loss": 0.0119, "step": 121250 }, { "epoch": 1.75, "learning_rate": 1.941768631011573e-05, "loss": 0.0078, "step": 121260 }, { "epoch": 1.75, "learning_rate": 1.9417638270377256e-05, "loss": 0.0084, "step": 121270 }, { "epoch": 1.75, "learning_rate": 1.9417590230638785e-05, "loss": 0.0096, "step": 121280 }, { "epoch": 1.75, "learning_rate": 1.9417542190900315e-05, "loss": 0.0123, "step": 121290 }, { "epoch": 1.75, "learning_rate": 1.941749415116184e-05, "loss": 0.0162, "step": 121300 }, { "epoch": 1.75, "learning_rate": 1.941744611142337e-05, "loss": 0.0124, "step": 121310 }, { "epoch": 1.75, "learning_rate": 1.94173980716849e-05, "loss": 0.0115, "step": 121320 }, { "epoch": 1.75, "learning_rate": 1.941735003194643e-05, "loss": 0.0107, "step": 121330 }, { "epoch": 1.75, "learning_rate": 1.9417301992207954e-05, "loss": 0.0091, "step": 121340 }, { "epoch": 1.75, "learning_rate": 1.9417253952469484e-05, "loss": 0.0108, "step": 121350 }, { "epoch": 1.75, "learning_rate": 1.9417205912731013e-05, "loss": 0.0136, "step": 121360 }, { "epoch": 1.75, "learning_rate": 1.941715787299254e-05, "loss": 0.0102, "step": 121370 }, { "epoch": 1.75, "learning_rate": 1.9417109833254068e-05, "loss": 0.0104, "step": 121380 }, { "epoch": 1.75, "learning_rate": 1.9417061793515597e-05, "loss": 0.0095, "step": 121390 }, { "epoch": 1.75, "learning_rate": 1.9417013753777126e-05, "loss": 0.0123, "step": 121400 }, { "epoch": 1.75, "learning_rate": 1.9416965714038652e-05, "loss": 0.0086, "step": 121410 }, { "epoch": 1.75, "learning_rate": 1.941692247827403e-05, "loss": 0.0137, "step": 121420 }, { "epoch": 1.75, "learning_rate": 1.9416874438535556e-05, "loss": 0.0134, "step": 121430 }, { "epoch": 1.75, "learning_rate": 1.9416826398797086e-05, "loss": 0.0078, "step": 121440 }, { "epoch": 1.75, "learning_rate": 1.9416778359058615e-05, "loss": 0.0121, "step": 121450 }, { "epoch": 1.75, "learning_rate": 1.9416730319320144e-05, "loss": 0.0113, "step": 121460 }, { "epoch": 1.75, "learning_rate": 1.941668227958167e-05, "loss": 0.0112, "step": 121470 }, { "epoch": 1.75, "learning_rate": 1.94166342398432e-05, "loss": 0.0099, "step": 121480 }, { "epoch": 1.75, "learning_rate": 1.941658620010473e-05, "loss": 0.012, "step": 121490 }, { "epoch": 1.75, "learning_rate": 1.9416538160366258e-05, "loss": 0.0083, "step": 121500 }, { "epoch": 1.75, "learning_rate": 1.9416490120627784e-05, "loss": 0.0112, "step": 121510 }, { "epoch": 1.75, "learning_rate": 1.9416442080889313e-05, "loss": 0.0135, "step": 121520 }, { "epoch": 1.75, "learning_rate": 1.9416394041150842e-05, "loss": 0.0112, "step": 121530 }, { "epoch": 1.75, "learning_rate": 1.9416346001412368e-05, "loss": 0.0132, "step": 121540 }, { "epoch": 1.75, "learning_rate": 1.9416297961673897e-05, "loss": 0.0081, "step": 121550 }, { "epoch": 1.75, "learning_rate": 1.9416249921935427e-05, "loss": 0.0101, "step": 121560 }, { "epoch": 1.75, "learning_rate": 1.9416201882196956e-05, "loss": 0.0129, "step": 121570 }, { "epoch": 1.75, "learning_rate": 1.9416153842458482e-05, "loss": 0.0094, "step": 121580 }, { "epoch": 1.75, "learning_rate": 1.941610580272001e-05, "loss": 0.0095, "step": 121590 }, { "epoch": 1.75, "learning_rate": 1.941605776298154e-05, "loss": 0.0119, "step": 121600 }, { "epoch": 1.75, "learning_rate": 1.9416009723243066e-05, "loss": 0.0098, "step": 121610 }, { "epoch": 1.75, "learning_rate": 1.9415961683504595e-05, "loss": 0.0071, "step": 121620 }, { "epoch": 1.75, "learning_rate": 1.9415913643766125e-05, "loss": 0.0099, "step": 121630 }, { "epoch": 1.75, "learning_rate": 1.9415865604027654e-05, "loss": 0.0073, "step": 121640 }, { "epoch": 1.75, "learning_rate": 1.941581756428918e-05, "loss": 0.0059, "step": 121650 }, { "epoch": 1.75, "learning_rate": 1.941576952455071e-05, "loss": 0.0172, "step": 121660 }, { "epoch": 1.75, "learning_rate": 1.941572148481224e-05, "loss": 0.0108, "step": 121670 }, { "epoch": 1.75, "learning_rate": 1.9415673445073768e-05, "loss": 0.0086, "step": 121680 }, { "epoch": 1.75, "learning_rate": 1.9415625405335294e-05, "loss": 0.0087, "step": 121690 }, { "epoch": 1.75, "learning_rate": 1.9415577365596823e-05, "loss": 0.0087, "step": 121700 }, { "epoch": 1.75, "learning_rate": 1.9415529325858352e-05, "loss": 0.0095, "step": 121710 }, { "epoch": 1.75, "learning_rate": 1.9415481286119878e-05, "loss": 0.0137, "step": 121720 }, { "epoch": 1.75, "learning_rate": 1.9415433246381407e-05, "loss": 0.0094, "step": 121730 }, { "epoch": 1.75, "learning_rate": 1.9415385206642937e-05, "loss": 0.0096, "step": 121740 }, { "epoch": 1.75, "learning_rate": 1.9415337166904466e-05, "loss": 0.015, "step": 121750 }, { "epoch": 1.75, "learning_rate": 1.941528912716599e-05, "loss": 0.0092, "step": 121760 }, { "epoch": 1.75, "learning_rate": 1.941524108742752e-05, "loss": 0.0082, "step": 121770 }, { "epoch": 1.76, "learning_rate": 1.941519304768905e-05, "loss": 0.012, "step": 121780 }, { "epoch": 1.76, "learning_rate": 1.9415145007950576e-05, "loss": 0.0115, "step": 121790 }, { "epoch": 1.76, "learning_rate": 1.9415096968212105e-05, "loss": 0.01, "step": 121800 }, { "epoch": 1.76, "learning_rate": 1.9415048928473635e-05, "loss": 0.0156, "step": 121810 }, { "epoch": 1.76, "learning_rate": 1.9415000888735164e-05, "loss": 0.011, "step": 121820 }, { "epoch": 1.76, "learning_rate": 1.941495284899669e-05, "loss": 0.009, "step": 121830 }, { "epoch": 1.76, "learning_rate": 1.941490480925822e-05, "loss": 0.0111, "step": 121840 }, { "epoch": 1.76, "learning_rate": 1.941485676951975e-05, "loss": 0.0115, "step": 121850 }, { "epoch": 1.76, "learning_rate": 1.9414808729781278e-05, "loss": 0.0109, "step": 121860 }, { "epoch": 1.76, "learning_rate": 1.9414760690042803e-05, "loss": 0.0107, "step": 121870 }, { "epoch": 1.76, "learning_rate": 1.9414712650304333e-05, "loss": 0.0091, "step": 121880 }, { "epoch": 1.76, "learning_rate": 1.9414664610565862e-05, "loss": 0.011, "step": 121890 }, { "epoch": 1.76, "learning_rate": 1.9414616570827388e-05, "loss": 0.0072, "step": 121900 }, { "epoch": 1.76, "learning_rate": 1.9414568531088917e-05, "loss": 0.0098, "step": 121910 }, { "epoch": 1.76, "learning_rate": 1.9414520491350446e-05, "loss": 0.0075, "step": 121920 }, { "epoch": 1.76, "learning_rate": 1.9414472451611976e-05, "loss": 0.0083, "step": 121930 }, { "epoch": 1.76, "learning_rate": 1.94144244118735e-05, "loss": 0.0098, "step": 121940 }, { "epoch": 1.76, "learning_rate": 1.941437637213503e-05, "loss": 0.0088, "step": 121950 }, { "epoch": 1.76, "learning_rate": 1.941432833239656e-05, "loss": 0.0114, "step": 121960 }, { "epoch": 1.76, "learning_rate": 1.9414280292658086e-05, "loss": 0.0081, "step": 121970 }, { "epoch": 1.76, "learning_rate": 1.9414232252919615e-05, "loss": 0.0117, "step": 121980 }, { "epoch": 1.76, "learning_rate": 1.9414184213181145e-05, "loss": 0.0094, "step": 121990 }, { "epoch": 1.76, "learning_rate": 1.9414136173442674e-05, "loss": 0.0132, "step": 122000 }, { "epoch": 1.76, "learning_rate": 1.94140881337042e-05, "loss": 0.0084, "step": 122010 }, { "epoch": 1.76, "learning_rate": 1.941404009396573e-05, "loss": 0.0105, "step": 122020 }, { "epoch": 1.76, "learning_rate": 1.9413992054227258e-05, "loss": 0.0118, "step": 122030 }, { "epoch": 1.76, "learning_rate": 1.9413944014488788e-05, "loss": 0.0118, "step": 122040 }, { "epoch": 1.76, "learning_rate": 1.9413895974750313e-05, "loss": 0.0152, "step": 122050 }, { "epoch": 1.76, "learning_rate": 1.9413847935011843e-05, "loss": 0.0096, "step": 122060 }, { "epoch": 1.76, "learning_rate": 1.9413799895273372e-05, "loss": 0.0119, "step": 122070 }, { "epoch": 1.76, "learning_rate": 1.9413751855534898e-05, "loss": 0.0121, "step": 122080 }, { "epoch": 1.76, "learning_rate": 1.9413703815796427e-05, "loss": 0.0101, "step": 122090 }, { "epoch": 1.76, "learning_rate": 1.9413655776057956e-05, "loss": 0.0118, "step": 122100 }, { "epoch": 1.76, "learning_rate": 1.9413607736319486e-05, "loss": 0.0106, "step": 122110 }, { "epoch": 1.76, "learning_rate": 1.941355969658101e-05, "loss": 0.0067, "step": 122120 }, { "epoch": 1.76, "learning_rate": 1.941351165684254e-05, "loss": 0.0084, "step": 122130 }, { "epoch": 1.76, "learning_rate": 1.941346361710407e-05, "loss": 0.0073, "step": 122140 }, { "epoch": 1.76, "learning_rate": 1.9413415577365596e-05, "loss": 0.0119, "step": 122150 }, { "epoch": 1.76, "learning_rate": 1.9413367537627125e-05, "loss": 0.0091, "step": 122160 }, { "epoch": 1.76, "learning_rate": 1.9413319497888654e-05, "loss": 0.0071, "step": 122170 }, { "epoch": 1.76, "learning_rate": 1.9413271458150184e-05, "loss": 0.0142, "step": 122180 }, { "epoch": 1.76, "learning_rate": 1.941322341841171e-05, "loss": 0.0129, "step": 122190 }, { "epoch": 1.76, "learning_rate": 1.941317537867324e-05, "loss": 0.011, "step": 122200 }, { "epoch": 1.76, "learning_rate": 1.9413127338934768e-05, "loss": 0.0082, "step": 122210 }, { "epoch": 1.76, "learning_rate": 1.9413079299196297e-05, "loss": 0.008, "step": 122220 }, { "epoch": 1.76, "learning_rate": 1.9413031259457823e-05, "loss": 0.0106, "step": 122230 }, { "epoch": 1.76, "learning_rate": 1.9412983219719353e-05, "loss": 0.0088, "step": 122240 }, { "epoch": 1.76, "learning_rate": 1.9412935179980882e-05, "loss": 0.0106, "step": 122250 }, { "epoch": 1.76, "learning_rate": 1.9412887140242408e-05, "loss": 0.0085, "step": 122260 }, { "epoch": 1.76, "learning_rate": 1.9412839100503937e-05, "loss": 0.0091, "step": 122270 }, { "epoch": 1.76, "learning_rate": 1.9412791060765466e-05, "loss": 0.0094, "step": 122280 }, { "epoch": 1.76, "learning_rate": 1.9412743021026996e-05, "loss": 0.0133, "step": 122290 }, { "epoch": 1.76, "learning_rate": 1.941269498128852e-05, "loss": 0.0081, "step": 122300 }, { "epoch": 1.76, "learning_rate": 1.941264694155005e-05, "loss": 0.0098, "step": 122310 }, { "epoch": 1.76, "learning_rate": 1.941259890181158e-05, "loss": 0.0062, "step": 122320 }, { "epoch": 1.76, "learning_rate": 1.941255086207311e-05, "loss": 0.0102, "step": 122330 }, { "epoch": 1.76, "learning_rate": 1.941250282233464e-05, "loss": 0.015, "step": 122340 }, { "epoch": 1.76, "learning_rate": 1.9412454782596168e-05, "loss": 0.0064, "step": 122350 }, { "epoch": 1.76, "learning_rate": 1.9412406742857694e-05, "loss": 0.0089, "step": 122360 }, { "epoch": 1.76, "learning_rate": 1.9412358703119223e-05, "loss": 0.0089, "step": 122370 }, { "epoch": 1.76, "learning_rate": 1.9412310663380752e-05, "loss": 0.0093, "step": 122380 }, { "epoch": 1.76, "learning_rate": 1.9412262623642278e-05, "loss": 0.01, "step": 122390 }, { "epoch": 1.76, "learning_rate": 1.9412214583903807e-05, "loss": 0.0135, "step": 122400 }, { "epoch": 1.76, "learning_rate": 1.9412166544165337e-05, "loss": 0.0081, "step": 122410 }, { "epoch": 1.76, "learning_rate": 1.9412118504426866e-05, "loss": 0.0111, "step": 122420 }, { "epoch": 1.76, "learning_rate": 1.9412070464688392e-05, "loss": 0.0102, "step": 122430 }, { "epoch": 1.76, "learning_rate": 1.941202242494992e-05, "loss": 0.0055, "step": 122440 }, { "epoch": 1.76, "learning_rate": 1.941197438521145e-05, "loss": 0.0084, "step": 122450 }, { "epoch": 1.76, "learning_rate": 1.9411926345472976e-05, "loss": 0.008, "step": 122460 }, { "epoch": 1.77, "learning_rate": 1.9411878305734505e-05, "loss": 0.0122, "step": 122470 }, { "epoch": 1.77, "learning_rate": 1.9411830265996035e-05, "loss": 0.0145, "step": 122480 }, { "epoch": 1.77, "learning_rate": 1.9411782226257564e-05, "loss": 0.0091, "step": 122490 }, { "epoch": 1.77, "learning_rate": 1.941173418651909e-05, "loss": 0.0117, "step": 122500 }, { "epoch": 1.77, "learning_rate": 1.941168614678062e-05, "loss": 0.013, "step": 122510 }, { "epoch": 1.77, "learning_rate": 1.941163810704215e-05, "loss": 0.0097, "step": 122520 }, { "epoch": 1.77, "learning_rate": 1.9411590067303678e-05, "loss": 0.01, "step": 122530 }, { "epoch": 1.77, "learning_rate": 1.9411542027565204e-05, "loss": 0.0093, "step": 122540 }, { "epoch": 1.77, "learning_rate": 1.9411493987826733e-05, "loss": 0.0086, "step": 122550 }, { "epoch": 1.77, "learning_rate": 1.9411445948088262e-05, "loss": 0.0085, "step": 122560 }, { "epoch": 1.77, "learning_rate": 1.9411397908349788e-05, "loss": 0.0131, "step": 122570 }, { "epoch": 1.77, "learning_rate": 1.9411349868611317e-05, "loss": 0.0094, "step": 122580 }, { "epoch": 1.77, "learning_rate": 1.9411301828872847e-05, "loss": 0.0095, "step": 122590 }, { "epoch": 1.77, "learning_rate": 1.9411253789134376e-05, "loss": 0.0114, "step": 122600 }, { "epoch": 1.77, "learning_rate": 1.94112057493959e-05, "loss": 0.0074, "step": 122610 }, { "epoch": 1.77, "learning_rate": 1.941115770965743e-05, "loss": 0.0089, "step": 122620 }, { "epoch": 1.77, "learning_rate": 1.941110966991896e-05, "loss": 0.0094, "step": 122630 }, { "epoch": 1.77, "learning_rate": 1.9411061630180486e-05, "loss": 0.0134, "step": 122640 }, { "epoch": 1.77, "learning_rate": 1.9411013590442015e-05, "loss": 0.0059, "step": 122650 }, { "epoch": 1.77, "learning_rate": 1.9410965550703545e-05, "loss": 0.0099, "step": 122660 }, { "epoch": 1.77, "learning_rate": 1.9410917510965074e-05, "loss": 0.0081, "step": 122670 }, { "epoch": 1.77, "learning_rate": 1.94108694712266e-05, "loss": 0.0127, "step": 122680 }, { "epoch": 1.77, "learning_rate": 1.941082143148813e-05, "loss": 0.0108, "step": 122690 }, { "epoch": 1.77, "learning_rate": 1.941077339174966e-05, "loss": 0.0075, "step": 122700 }, { "epoch": 1.77, "learning_rate": 1.9410725352011188e-05, "loss": 0.0088, "step": 122710 }, { "epoch": 1.77, "learning_rate": 1.9410677312272713e-05, "loss": 0.0068, "step": 122720 }, { "epoch": 1.77, "learning_rate": 1.9410629272534243e-05, "loss": 0.0114, "step": 122730 }, { "epoch": 1.77, "learning_rate": 1.9410581232795772e-05, "loss": 0.0077, "step": 122740 }, { "epoch": 1.77, "learning_rate": 1.9410533193057298e-05, "loss": 0.0108, "step": 122750 }, { "epoch": 1.77, "learning_rate": 1.9410485153318827e-05, "loss": 0.007, "step": 122760 }, { "epoch": 1.77, "learning_rate": 1.9410437113580356e-05, "loss": 0.0111, "step": 122770 }, { "epoch": 1.77, "learning_rate": 1.9410389073841886e-05, "loss": 0.0076, "step": 122780 }, { "epoch": 1.77, "learning_rate": 1.941034103410341e-05, "loss": 0.0112, "step": 122790 }, { "epoch": 1.77, "learning_rate": 1.941029299436494e-05, "loss": 0.0068, "step": 122800 }, { "epoch": 1.77, "learning_rate": 1.941024495462647e-05, "loss": 0.0104, "step": 122810 }, { "epoch": 1.77, "learning_rate": 1.9410196914887996e-05, "loss": 0.0106, "step": 122820 }, { "epoch": 1.77, "learning_rate": 1.9410148875149525e-05, "loss": 0.0117, "step": 122830 }, { "epoch": 1.77, "learning_rate": 1.9410100835411055e-05, "loss": 0.0099, "step": 122840 }, { "epoch": 1.77, "learning_rate": 1.9410052795672584e-05, "loss": 0.008, "step": 122850 }, { "epoch": 1.77, "learning_rate": 1.941000475593411e-05, "loss": 0.0098, "step": 122860 }, { "epoch": 1.77, "learning_rate": 1.940995671619564e-05, "loss": 0.0077, "step": 122870 }, { "epoch": 1.77, "learning_rate": 1.9409908676457168e-05, "loss": 0.0116, "step": 122880 }, { "epoch": 1.77, "learning_rate": 1.9409860636718698e-05, "loss": 0.0115, "step": 122890 }, { "epoch": 1.77, "learning_rate": 1.9409812596980223e-05, "loss": 0.0138, "step": 122900 }, { "epoch": 1.77, "learning_rate": 1.9409764557241753e-05, "loss": 0.0104, "step": 122910 }, { "epoch": 1.77, "learning_rate": 1.9409716517503282e-05, "loss": 0.0116, "step": 122920 }, { "epoch": 1.77, "learning_rate": 1.9409668477764808e-05, "loss": 0.0104, "step": 122930 }, { "epoch": 1.77, "learning_rate": 1.9409620438026337e-05, "loss": 0.0118, "step": 122940 }, { "epoch": 1.77, "learning_rate": 1.9409572398287866e-05, "loss": 0.0129, "step": 122950 }, { "epoch": 1.77, "learning_rate": 1.9409524358549396e-05, "loss": 0.0095, "step": 122960 }, { "epoch": 1.77, "learning_rate": 1.940947631881092e-05, "loss": 0.0174, "step": 122970 }, { "epoch": 1.77, "learning_rate": 1.940942827907245e-05, "loss": 0.0094, "step": 122980 }, { "epoch": 1.77, "learning_rate": 1.940938023933398e-05, "loss": 0.0112, "step": 122990 }, { "epoch": 1.77, "learning_rate": 1.9409332199595506e-05, "loss": 0.0107, "step": 123000 }, { "epoch": 1.77, "learning_rate": 1.9409284159857035e-05, "loss": 0.0122, "step": 123010 }, { "epoch": 1.77, "learning_rate": 1.9409236120118564e-05, "loss": 0.0118, "step": 123020 }, { "epoch": 1.77, "learning_rate": 1.9409188080380094e-05, "loss": 0.0096, "step": 123030 }, { "epoch": 1.77, "learning_rate": 1.940914004064162e-05, "loss": 0.0102, "step": 123040 }, { "epoch": 1.77, "learning_rate": 1.940909200090315e-05, "loss": 0.0098, "step": 123050 }, { "epoch": 1.77, "learning_rate": 1.9409043961164678e-05, "loss": 0.0067, "step": 123060 }, { "epoch": 1.77, "learning_rate": 1.9408995921426207e-05, "loss": 0.0103, "step": 123070 }, { "epoch": 1.77, "learning_rate": 1.9408947881687733e-05, "loss": 0.0089, "step": 123080 }, { "epoch": 1.77, "learning_rate": 1.9408899841949263e-05, "loss": 0.0089, "step": 123090 }, { "epoch": 1.77, "learning_rate": 1.9408851802210792e-05, "loss": 0.0087, "step": 123100 }, { "epoch": 1.77, "learning_rate": 1.9408803762472318e-05, "loss": 0.0091, "step": 123110 }, { "epoch": 1.77, "learning_rate": 1.9408755722733847e-05, "loss": 0.0127, "step": 123120 }, { "epoch": 1.77, "learning_rate": 1.9408707682995376e-05, "loss": 0.0132, "step": 123130 }, { "epoch": 1.77, "learning_rate": 1.9408659643256906e-05, "loss": 0.0099, "step": 123140 }, { "epoch": 1.77, "learning_rate": 1.940861160351843e-05, "loss": 0.0098, "step": 123150 }, { "epoch": 1.77, "learning_rate": 1.940856356377996e-05, "loss": 0.0106, "step": 123160 }, { "epoch": 1.78, "learning_rate": 1.940851552404149e-05, "loss": 0.0103, "step": 123170 }, { "epoch": 1.78, "learning_rate": 1.9408467484303016e-05, "loss": 0.0064, "step": 123180 }, { "epoch": 1.78, "learning_rate": 1.9408419444564545e-05, "loss": 0.0092, "step": 123190 }, { "epoch": 1.78, "learning_rate": 1.9408371404826074e-05, "loss": 0.0077, "step": 123200 }, { "epoch": 1.78, "learning_rate": 1.9408323365087604e-05, "loss": 0.0106, "step": 123210 }, { "epoch": 1.78, "learning_rate": 1.940827532534913e-05, "loss": 0.0094, "step": 123220 }, { "epoch": 1.78, "learning_rate": 1.940822728561066e-05, "loss": 0.0124, "step": 123230 }, { "epoch": 1.78, "learning_rate": 1.9408179245872188e-05, "loss": 0.0098, "step": 123240 }, { "epoch": 1.78, "learning_rate": 1.9408131206133717e-05, "loss": 0.0067, "step": 123250 }, { "epoch": 1.78, "learning_rate": 1.9408083166395243e-05, "loss": 0.0104, "step": 123260 }, { "epoch": 1.78, "learning_rate": 1.9408035126656772e-05, "loss": 0.0087, "step": 123270 }, { "epoch": 1.78, "learning_rate": 1.9407987086918302e-05, "loss": 0.0091, "step": 123280 }, { "epoch": 1.78, "learning_rate": 1.9407939047179828e-05, "loss": 0.0087, "step": 123290 }, { "epoch": 1.78, "learning_rate": 1.9407891007441357e-05, "loss": 0.0092, "step": 123300 }, { "epoch": 1.78, "learning_rate": 1.9407842967702886e-05, "loss": 0.008, "step": 123310 }, { "epoch": 1.78, "learning_rate": 1.9407794927964415e-05, "loss": 0.0134, "step": 123320 }, { "epoch": 1.78, "learning_rate": 1.940774688822594e-05, "loss": 0.0141, "step": 123330 }, { "epoch": 1.78, "learning_rate": 1.940769884848747e-05, "loss": 0.0123, "step": 123340 }, { "epoch": 1.78, "learning_rate": 1.9407650808749e-05, "loss": 0.0113, "step": 123350 }, { "epoch": 1.78, "learning_rate": 1.9407602769010526e-05, "loss": 0.0111, "step": 123360 }, { "epoch": 1.78, "learning_rate": 1.9407554729272055e-05, "loss": 0.0125, "step": 123370 }, { "epoch": 1.78, "learning_rate": 1.9407506689533584e-05, "loss": 0.0114, "step": 123380 }, { "epoch": 1.78, "learning_rate": 1.9407458649795114e-05, "loss": 0.0076, "step": 123390 }, { "epoch": 1.78, "learning_rate": 1.940741061005664e-05, "loss": 0.0104, "step": 123400 }, { "epoch": 1.78, "learning_rate": 1.940736257031817e-05, "loss": 0.0098, "step": 123410 }, { "epoch": 1.78, "learning_rate": 1.9407314530579698e-05, "loss": 0.0102, "step": 123420 }, { "epoch": 1.78, "learning_rate": 1.9407266490841227e-05, "loss": 0.0153, "step": 123430 }, { "epoch": 1.78, "learning_rate": 1.9407218451102753e-05, "loss": 0.008, "step": 123440 }, { "epoch": 1.78, "learning_rate": 1.9407170411364282e-05, "loss": 0.007, "step": 123450 }, { "epoch": 1.78, "learning_rate": 1.940712237162581e-05, "loss": 0.0078, "step": 123460 }, { "epoch": 1.78, "learning_rate": 1.9407074331887338e-05, "loss": 0.0084, "step": 123470 }, { "epoch": 1.78, "learning_rate": 1.9407026292148867e-05, "loss": 0.0106, "step": 123480 }, { "epoch": 1.78, "learning_rate": 1.9406978252410396e-05, "loss": 0.0129, "step": 123490 }, { "epoch": 1.78, "learning_rate": 1.9406930212671925e-05, "loss": 0.0126, "step": 123500 }, { "epoch": 1.78, "learning_rate": 1.940688217293345e-05, "loss": 0.0103, "step": 123510 }, { "epoch": 1.78, "learning_rate": 1.940683413319498e-05, "loss": 0.0122, "step": 123520 }, { "epoch": 1.78, "learning_rate": 1.940678609345651e-05, "loss": 0.0098, "step": 123530 }, { "epoch": 1.78, "learning_rate": 1.9406738053718036e-05, "loss": 0.0079, "step": 123540 }, { "epoch": 1.78, "learning_rate": 1.9406690013979565e-05, "loss": 0.0085, "step": 123550 }, { "epoch": 1.78, "learning_rate": 1.9406641974241094e-05, "loss": 0.0118, "step": 123560 }, { "epoch": 1.78, "learning_rate": 1.9406593934502623e-05, "loss": 0.0101, "step": 123570 }, { "epoch": 1.78, "learning_rate": 1.940654589476415e-05, "loss": 0.0108, "step": 123580 }, { "epoch": 1.78, "learning_rate": 1.940649785502568e-05, "loss": 0.0095, "step": 123590 }, { "epoch": 1.78, "learning_rate": 1.9406449815287208e-05, "loss": 0.0096, "step": 123600 }, { "epoch": 1.78, "learning_rate": 1.9406401775548737e-05, "loss": 0.0092, "step": 123610 }, { "epoch": 1.78, "learning_rate": 1.9406353735810263e-05, "loss": 0.0103, "step": 123620 }, { "epoch": 1.78, "learning_rate": 1.9406305696071792e-05, "loss": 0.007, "step": 123630 }, { "epoch": 1.78, "learning_rate": 1.940625765633332e-05, "loss": 0.0137, "step": 123640 }, { "epoch": 1.78, "learning_rate": 1.9406209616594847e-05, "loss": 0.0113, "step": 123650 }, { "epoch": 1.78, "learning_rate": 1.9406161576856377e-05, "loss": 0.0124, "step": 123660 }, { "epoch": 1.78, "learning_rate": 1.9406113537117906e-05, "loss": 0.0076, "step": 123670 }, { "epoch": 1.78, "learning_rate": 1.9406065497379435e-05, "loss": 0.0083, "step": 123680 }, { "epoch": 1.78, "learning_rate": 1.940601745764096e-05, "loss": 0.0121, "step": 123690 }, { "epoch": 1.78, "learning_rate": 1.940596941790249e-05, "loss": 0.009, "step": 123700 }, { "epoch": 1.78, "learning_rate": 1.940592137816402e-05, "loss": 0.0066, "step": 123710 }, { "epoch": 1.78, "learning_rate": 1.9405873338425546e-05, "loss": 0.0124, "step": 123720 }, { "epoch": 1.78, "learning_rate": 1.9405825298687075e-05, "loss": 0.0116, "step": 123730 }, { "epoch": 1.78, "learning_rate": 1.9405777258948604e-05, "loss": 0.01, "step": 123740 }, { "epoch": 1.78, "learning_rate": 1.9405729219210133e-05, "loss": 0.0093, "step": 123750 }, { "epoch": 1.78, "learning_rate": 1.940568117947166e-05, "loss": 0.0101, "step": 123760 }, { "epoch": 1.78, "learning_rate": 1.940563313973319e-05, "loss": 0.011, "step": 123770 }, { "epoch": 1.78, "learning_rate": 1.9405585099994718e-05, "loss": 0.0099, "step": 123780 }, { "epoch": 1.78, "learning_rate": 1.9405537060256247e-05, "loss": 0.0088, "step": 123790 }, { "epoch": 1.78, "learning_rate": 1.9405489020517773e-05, "loss": 0.0089, "step": 123800 }, { "epoch": 1.78, "learning_rate": 1.9405440980779302e-05, "loss": 0.008, "step": 123810 }, { "epoch": 1.78, "learning_rate": 1.940539294104083e-05, "loss": 0.0095, "step": 123820 }, { "epoch": 1.78, "learning_rate": 1.9405344901302357e-05, "loss": 0.0103, "step": 123830 }, { "epoch": 1.78, "learning_rate": 1.9405296861563887e-05, "loss": 0.0134, "step": 123840 }, { "epoch": 1.78, "learning_rate": 1.9405248821825416e-05, "loss": 0.0079, "step": 123850 }, { "epoch": 1.79, "learning_rate": 1.9405200782086945e-05, "loss": 0.012, "step": 123860 }, { "epoch": 1.79, "learning_rate": 1.940515274234847e-05, "loss": 0.0124, "step": 123870 }, { "epoch": 1.79, "learning_rate": 1.940510470261e-05, "loss": 0.0072, "step": 123880 }, { "epoch": 1.79, "learning_rate": 1.940505666287153e-05, "loss": 0.0084, "step": 123890 }, { "epoch": 1.79, "learning_rate": 1.9405008623133056e-05, "loss": 0.0103, "step": 123900 }, { "epoch": 1.79, "learning_rate": 1.9404960583394585e-05, "loss": 0.0134, "step": 123910 }, { "epoch": 1.79, "learning_rate": 1.9404912543656114e-05, "loss": 0.0109, "step": 123920 }, { "epoch": 1.79, "learning_rate": 1.9404864503917643e-05, "loss": 0.0106, "step": 123930 }, { "epoch": 1.79, "learning_rate": 1.940481646417917e-05, "loss": 0.0123, "step": 123940 }, { "epoch": 1.79, "learning_rate": 1.94047684244407e-05, "loss": 0.0086, "step": 123950 }, { "epoch": 1.79, "learning_rate": 1.9404720384702228e-05, "loss": 0.0149, "step": 123960 }, { "epoch": 1.79, "learning_rate": 1.9404672344963754e-05, "loss": 0.0119, "step": 123970 }, { "epoch": 1.79, "learning_rate": 1.9404624305225283e-05, "loss": 0.0105, "step": 123980 }, { "epoch": 1.79, "learning_rate": 1.9404576265486812e-05, "loss": 0.0102, "step": 123990 }, { "epoch": 1.79, "learning_rate": 1.940452822574834e-05, "loss": 0.008, "step": 124000 }, { "epoch": 1.79, "learning_rate": 1.9404480186009867e-05, "loss": 0.009, "step": 124010 }, { "epoch": 1.79, "learning_rate": 1.9404432146271397e-05, "loss": 0.0111, "step": 124020 }, { "epoch": 1.79, "learning_rate": 1.9404384106532926e-05, "loss": 0.0127, "step": 124030 }, { "epoch": 1.79, "learning_rate": 1.9404336066794455e-05, "loss": 0.0105, "step": 124040 }, { "epoch": 1.79, "learning_rate": 1.940428802705598e-05, "loss": 0.0081, "step": 124050 }, { "epoch": 1.79, "learning_rate": 1.940423998731751e-05, "loss": 0.0108, "step": 124060 }, { "epoch": 1.79, "learning_rate": 1.940419194757904e-05, "loss": 0.0099, "step": 124070 }, { "epoch": 1.79, "learning_rate": 1.9404143907840565e-05, "loss": 0.0097, "step": 124080 }, { "epoch": 1.79, "learning_rate": 1.9404095868102095e-05, "loss": 0.0102, "step": 124090 }, { "epoch": 1.79, "learning_rate": 1.9404047828363624e-05, "loss": 0.0101, "step": 124100 }, { "epoch": 1.79, "learning_rate": 1.9403999788625153e-05, "loss": 0.01, "step": 124110 }, { "epoch": 1.79, "learning_rate": 1.940395174888668e-05, "loss": 0.0151, "step": 124120 }, { "epoch": 1.79, "learning_rate": 1.940390370914821e-05, "loss": 0.0093, "step": 124130 }, { "epoch": 1.79, "learning_rate": 1.9403855669409738e-05, "loss": 0.0142, "step": 124140 }, { "epoch": 1.79, "learning_rate": 1.9403807629671264e-05, "loss": 0.0087, "step": 124150 }, { "epoch": 1.79, "learning_rate": 1.9403759589932793e-05, "loss": 0.0072, "step": 124160 }, { "epoch": 1.79, "learning_rate": 1.9403711550194322e-05, "loss": 0.0103, "step": 124170 }, { "epoch": 1.79, "learning_rate": 1.940366351045585e-05, "loss": 0.0108, "step": 124180 }, { "epoch": 1.79, "learning_rate": 1.9403615470717377e-05, "loss": 0.0114, "step": 124190 }, { "epoch": 1.79, "learning_rate": 1.9403567430978906e-05, "loss": 0.011, "step": 124200 }, { "epoch": 1.79, "learning_rate": 1.9403519391240436e-05, "loss": 0.0083, "step": 124210 }, { "epoch": 1.79, "learning_rate": 1.9403471351501965e-05, "loss": 0.0113, "step": 124220 }, { "epoch": 1.79, "learning_rate": 1.940342331176349e-05, "loss": 0.0085, "step": 124230 }, { "epoch": 1.79, "learning_rate": 1.940337527202502e-05, "loss": 0.0109, "step": 124240 }, { "epoch": 1.79, "learning_rate": 1.940332723228655e-05, "loss": 0.0097, "step": 124250 }, { "epoch": 1.79, "learning_rate": 1.9403279192548075e-05, "loss": 0.0114, "step": 124260 }, { "epoch": 1.79, "learning_rate": 1.9403231152809605e-05, "loss": 0.0095, "step": 124270 }, { "epoch": 1.79, "learning_rate": 1.9403183113071134e-05, "loss": 0.0111, "step": 124280 }, { "epoch": 1.79, "learning_rate": 1.9403135073332663e-05, "loss": 0.012, "step": 124290 }, { "epoch": 1.79, "learning_rate": 1.940308703359419e-05, "loss": 0.0155, "step": 124300 }, { "epoch": 1.79, "learning_rate": 1.9403038993855718e-05, "loss": 0.0101, "step": 124310 }, { "epoch": 1.79, "learning_rate": 1.9402990954117248e-05, "loss": 0.0091, "step": 124320 }, { "epoch": 1.79, "learning_rate": 1.9402942914378773e-05, "loss": 0.0076, "step": 124330 }, { "epoch": 1.79, "learning_rate": 1.9402894874640303e-05, "loss": 0.0109, "step": 124340 }, { "epoch": 1.79, "learning_rate": 1.9402846834901832e-05, "loss": 0.009, "step": 124350 }, { "epoch": 1.79, "learning_rate": 1.940279879516336e-05, "loss": 0.0117, "step": 124360 }, { "epoch": 1.79, "learning_rate": 1.9402750755424887e-05, "loss": 0.012, "step": 124370 }, { "epoch": 1.79, "learning_rate": 1.9402702715686416e-05, "loss": 0.0099, "step": 124380 }, { "epoch": 1.79, "learning_rate": 1.9402654675947946e-05, "loss": 0.0094, "step": 124390 }, { "epoch": 1.79, "learning_rate": 1.9402606636209475e-05, "loss": 0.0075, "step": 124400 }, { "epoch": 1.79, "learning_rate": 1.9402558596471e-05, "loss": 0.012, "step": 124410 }, { "epoch": 1.79, "learning_rate": 1.940251055673253e-05, "loss": 0.0102, "step": 124420 }, { "epoch": 1.79, "learning_rate": 1.940246251699406e-05, "loss": 0.0096, "step": 124430 }, { "epoch": 1.79, "learning_rate": 1.9402414477255585e-05, "loss": 0.0097, "step": 124440 }, { "epoch": 1.79, "learning_rate": 1.9402366437517115e-05, "loss": 0.0096, "step": 124450 }, { "epoch": 1.79, "learning_rate": 1.9402318397778644e-05, "loss": 0.0075, "step": 124460 }, { "epoch": 1.79, "learning_rate": 1.9402270358040173e-05, "loss": 0.0106, "step": 124470 }, { "epoch": 1.79, "learning_rate": 1.94022223183017e-05, "loss": 0.0089, "step": 124480 }, { "epoch": 1.79, "learning_rate": 1.9402174278563228e-05, "loss": 0.0078, "step": 124490 }, { "epoch": 1.79, "learning_rate": 1.9402126238824757e-05, "loss": 0.0121, "step": 124500 }, { "epoch": 1.79, "learning_rate": 1.9402078199086283e-05, "loss": 0.0105, "step": 124510 }, { "epoch": 1.79, "learning_rate": 1.9402030159347813e-05, "loss": 0.0132, "step": 124520 }, { "epoch": 1.79, "learning_rate": 1.9401982119609342e-05, "loss": 0.0111, "step": 124530 }, { "epoch": 1.79, "learning_rate": 1.940193407987087e-05, "loss": 0.0078, "step": 124540 }, { "epoch": 1.8, "learning_rate": 1.9401886040132397e-05, "loss": 0.0119, "step": 124550 }, { "epoch": 1.8, "learning_rate": 1.9401838000393926e-05, "loss": 0.0101, "step": 124560 }, { "epoch": 1.8, "learning_rate": 1.9401789960655456e-05, "loss": 0.0099, "step": 124570 }, { "epoch": 1.8, "learning_rate": 1.9401741920916985e-05, "loss": 0.0108, "step": 124580 }, { "epoch": 1.8, "learning_rate": 1.940169388117851e-05, "loss": 0.0114, "step": 124590 }, { "epoch": 1.8, "learning_rate": 1.940164584144004e-05, "loss": 0.01, "step": 124600 }, { "epoch": 1.8, "learning_rate": 1.940159780170157e-05, "loss": 0.0116, "step": 124610 }, { "epoch": 1.8, "learning_rate": 1.9401549761963095e-05, "loss": 0.0084, "step": 124620 }, { "epoch": 1.8, "learning_rate": 1.9401501722224624e-05, "loss": 0.0099, "step": 124630 }, { "epoch": 1.8, "learning_rate": 1.9401453682486154e-05, "loss": 0.0074, "step": 124640 }, { "epoch": 1.8, "learning_rate": 1.9401405642747683e-05, "loss": 0.0097, "step": 124650 }, { "epoch": 1.8, "learning_rate": 1.940135760300921e-05, "loss": 0.011, "step": 124660 }, { "epoch": 1.8, "learning_rate": 1.9401309563270738e-05, "loss": 0.0082, "step": 124670 }, { "epoch": 1.8, "learning_rate": 1.9401261523532267e-05, "loss": 0.0102, "step": 124680 }, { "epoch": 1.8, "learning_rate": 1.9401213483793793e-05, "loss": 0.0112, "step": 124690 }, { "epoch": 1.8, "learning_rate": 1.9401165444055323e-05, "loss": 0.0088, "step": 124700 }, { "epoch": 1.8, "learning_rate": 1.9401117404316852e-05, "loss": 0.0081, "step": 124710 }, { "epoch": 1.8, "learning_rate": 1.940106936457838e-05, "loss": 0.01, "step": 124720 }, { "epoch": 1.8, "learning_rate": 1.9401021324839907e-05, "loss": 0.0127, "step": 124730 }, { "epoch": 1.8, "learning_rate": 1.9400973285101436e-05, "loss": 0.0101, "step": 124740 }, { "epoch": 1.8, "learning_rate": 1.9400925245362966e-05, "loss": 0.0102, "step": 124750 }, { "epoch": 1.8, "learning_rate": 1.9400877205624495e-05, "loss": 0.0091, "step": 124760 }, { "epoch": 1.8, "learning_rate": 1.940082916588602e-05, "loss": 0.0095, "step": 124770 }, { "epoch": 1.8, "learning_rate": 1.940078112614755e-05, "loss": 0.0072, "step": 124780 }, { "epoch": 1.8, "learning_rate": 1.940073308640908e-05, "loss": 0.0097, "step": 124790 }, { "epoch": 1.8, "learning_rate": 1.9400685046670605e-05, "loss": 0.0086, "step": 124800 }, { "epoch": 1.8, "learning_rate": 1.9400637006932134e-05, "loss": 0.0115, "step": 124810 }, { "epoch": 1.8, "learning_rate": 1.9400588967193664e-05, "loss": 0.0092, "step": 124820 }, { "epoch": 1.8, "learning_rate": 1.9400540927455193e-05, "loss": 0.0112, "step": 124830 }, { "epoch": 1.8, "learning_rate": 1.940049288771672e-05, "loss": 0.0105, "step": 124840 }, { "epoch": 1.8, "learning_rate": 1.9400444847978248e-05, "loss": 0.0106, "step": 124850 }, { "epoch": 1.8, "learning_rate": 1.9400396808239777e-05, "loss": 0.0122, "step": 124860 }, { "epoch": 1.8, "learning_rate": 1.9400348768501303e-05, "loss": 0.0079, "step": 124870 }, { "epoch": 1.8, "learning_rate": 1.9400300728762832e-05, "loss": 0.0085, "step": 124880 }, { "epoch": 1.8, "learning_rate": 1.9400252689024362e-05, "loss": 0.0104, "step": 124890 }, { "epoch": 1.8, "learning_rate": 1.940020464928589e-05, "loss": 0.0094, "step": 124900 }, { "epoch": 1.8, "learning_rate": 1.940015660954742e-05, "loss": 0.009, "step": 124910 }, { "epoch": 1.8, "learning_rate": 1.940010856980895e-05, "loss": 0.0101, "step": 124920 }, { "epoch": 1.8, "learning_rate": 1.9400060530070475e-05, "loss": 0.0063, "step": 124930 }, { "epoch": 1.8, "learning_rate": 1.9400012490332005e-05, "loss": 0.0104, "step": 124940 }, { "epoch": 1.8, "learning_rate": 1.9399964450593534e-05, "loss": 0.0091, "step": 124950 }, { "epoch": 1.8, "learning_rate": 1.9399916410855063e-05, "loss": 0.0121, "step": 124960 }, { "epoch": 1.8, "learning_rate": 1.939986837111659e-05, "loss": 0.0096, "step": 124970 }, { "epoch": 1.8, "learning_rate": 1.939982033137812e-05, "loss": 0.0093, "step": 124980 }, { "epoch": 1.8, "learning_rate": 1.9399772291639648e-05, "loss": 0.01, "step": 124990 }, { "epoch": 1.8, "learning_rate": 1.9399724251901177e-05, "loss": 0.0083, "step": 125000 }, { "epoch": 1.8, "learning_rate": 1.9399676212162703e-05, "loss": 0.0173, "step": 125010 }, { "epoch": 1.8, "learning_rate": 1.9399628172424232e-05, "loss": 0.0106, "step": 125020 }, { "epoch": 1.8, "learning_rate": 1.939958013268576e-05, "loss": 0.0108, "step": 125030 }, { "epoch": 1.8, "learning_rate": 1.9399532092947287e-05, "loss": 0.0094, "step": 125040 }, { "epoch": 1.8, "learning_rate": 1.9399484053208816e-05, "loss": 0.0128, "step": 125050 }, { "epoch": 1.8, "learning_rate": 1.9399436013470346e-05, "loss": 0.0113, "step": 125060 }, { "epoch": 1.8, "learning_rate": 1.9399387973731875e-05, "loss": 0.0091, "step": 125070 }, { "epoch": 1.8, "learning_rate": 1.93993399339934e-05, "loss": 0.0101, "step": 125080 }, { "epoch": 1.8, "learning_rate": 1.939929189425493e-05, "loss": 0.0147, "step": 125090 }, { "epoch": 1.8, "learning_rate": 1.939924385451646e-05, "loss": 0.0078, "step": 125100 }, { "epoch": 1.8, "learning_rate": 1.9399195814777985e-05, "loss": 0.0084, "step": 125110 }, { "epoch": 1.8, "learning_rate": 1.9399147775039515e-05, "loss": 0.0078, "step": 125120 }, { "epoch": 1.8, "learning_rate": 1.9399099735301044e-05, "loss": 0.0095, "step": 125130 }, { "epoch": 1.8, "learning_rate": 1.9399051695562573e-05, "loss": 0.0098, "step": 125140 }, { "epoch": 1.8, "learning_rate": 1.93990036558241e-05, "loss": 0.0076, "step": 125150 }, { "epoch": 1.8, "learning_rate": 1.9398955616085628e-05, "loss": 0.0144, "step": 125160 }, { "epoch": 1.8, "learning_rate": 1.9398907576347158e-05, "loss": 0.0083, "step": 125170 }, { "epoch": 1.8, "learning_rate": 1.9398859536608687e-05, "loss": 0.0101, "step": 125180 }, { "epoch": 1.8, "learning_rate": 1.9398811496870213e-05, "loss": 0.011, "step": 125190 }, { "epoch": 1.8, "learning_rate": 1.9398763457131742e-05, "loss": 0.0103, "step": 125200 }, { "epoch": 1.8, "learning_rate": 1.939871541739327e-05, "loss": 0.0077, "step": 125210 }, { "epoch": 1.8, "learning_rate": 1.9398667377654797e-05, "loss": 0.0096, "step": 125220 }, { "epoch": 1.8, "learning_rate": 1.9398619337916326e-05, "loss": 0.0116, "step": 125230 }, { "epoch": 1.8, "learning_rate": 1.9398571298177856e-05, "loss": 0.012, "step": 125240 }, { "epoch": 1.81, "learning_rate": 1.9398523258439385e-05, "loss": 0.0078, "step": 125250 }, { "epoch": 1.81, "learning_rate": 1.939847521870091e-05, "loss": 0.0095, "step": 125260 }, { "epoch": 1.81, "learning_rate": 1.939842717896244e-05, "loss": 0.0083, "step": 125270 }, { "epoch": 1.81, "learning_rate": 1.939837913922397e-05, "loss": 0.0133, "step": 125280 }, { "epoch": 1.81, "learning_rate": 1.9398331099485495e-05, "loss": 0.0098, "step": 125290 }, { "epoch": 1.81, "learning_rate": 1.9398283059747025e-05, "loss": 0.0089, "step": 125300 }, { "epoch": 1.81, "learning_rate": 1.9398235020008554e-05, "loss": 0.01, "step": 125310 }, { "epoch": 1.81, "learning_rate": 1.9398186980270083e-05, "loss": 0.0132, "step": 125320 }, { "epoch": 1.81, "learning_rate": 1.939813894053161e-05, "loss": 0.0084, "step": 125330 }, { "epoch": 1.81, "learning_rate": 1.9398090900793138e-05, "loss": 0.014, "step": 125340 }, { "epoch": 1.81, "learning_rate": 1.9398042861054667e-05, "loss": 0.0156, "step": 125350 }, { "epoch": 1.81, "learning_rate": 1.9397994821316193e-05, "loss": 0.0086, "step": 125360 }, { "epoch": 1.81, "learning_rate": 1.9397946781577723e-05, "loss": 0.0103, "step": 125370 }, { "epoch": 1.81, "learning_rate": 1.9397898741839252e-05, "loss": 0.013, "step": 125380 }, { "epoch": 1.81, "learning_rate": 1.939785070210078e-05, "loss": 0.0114, "step": 125390 }, { "epoch": 1.81, "learning_rate": 1.9397802662362307e-05, "loss": 0.0075, "step": 125400 }, { "epoch": 1.81, "learning_rate": 1.9397754622623836e-05, "loss": 0.0108, "step": 125410 }, { "epoch": 1.81, "learning_rate": 1.9397706582885366e-05, "loss": 0.0141, "step": 125420 }, { "epoch": 1.81, "learning_rate": 1.9397658543146895e-05, "loss": 0.0087, "step": 125430 }, { "epoch": 1.81, "learning_rate": 1.939761050340842e-05, "loss": 0.0133, "step": 125440 }, { "epoch": 1.81, "learning_rate": 1.939756246366995e-05, "loss": 0.0089, "step": 125450 }, { "epoch": 1.81, "learning_rate": 1.939751442393148e-05, "loss": 0.0151, "step": 125460 }, { "epoch": 1.81, "learning_rate": 1.9397466384193005e-05, "loss": 0.0068, "step": 125470 }, { "epoch": 1.81, "learning_rate": 1.9397418344454534e-05, "loss": 0.009, "step": 125480 }, { "epoch": 1.81, "learning_rate": 1.9397370304716064e-05, "loss": 0.0098, "step": 125490 }, { "epoch": 1.81, "learning_rate": 1.9397322264977593e-05, "loss": 0.0081, "step": 125500 }, { "epoch": 1.81, "learning_rate": 1.939727422523912e-05, "loss": 0.0085, "step": 125510 }, { "epoch": 1.81, "learning_rate": 1.9397226185500648e-05, "loss": 0.0125, "step": 125520 }, { "epoch": 1.81, "learning_rate": 1.9397178145762177e-05, "loss": 0.0133, "step": 125530 }, { "epoch": 1.81, "learning_rate": 1.9397130106023703e-05, "loss": 0.0123, "step": 125540 }, { "epoch": 1.81, "learning_rate": 1.9397082066285233e-05, "loss": 0.0131, "step": 125550 }, { "epoch": 1.81, "learning_rate": 1.9397034026546762e-05, "loss": 0.0082, "step": 125560 }, { "epoch": 1.81, "learning_rate": 1.939698598680829e-05, "loss": 0.0106, "step": 125570 }, { "epoch": 1.81, "learning_rate": 1.9396937947069817e-05, "loss": 0.0092, "step": 125580 }, { "epoch": 1.81, "learning_rate": 1.9396889907331346e-05, "loss": 0.01, "step": 125590 }, { "epoch": 1.81, "learning_rate": 1.9396841867592876e-05, "loss": 0.0083, "step": 125600 }, { "epoch": 1.81, "learning_rate": 1.9396793827854405e-05, "loss": 0.0087, "step": 125610 }, { "epoch": 1.81, "learning_rate": 1.939674578811593e-05, "loss": 0.0139, "step": 125620 }, { "epoch": 1.81, "learning_rate": 1.939669774837746e-05, "loss": 0.0099, "step": 125630 }, { "epoch": 1.81, "learning_rate": 1.939664970863899e-05, "loss": 0.0097, "step": 125640 }, { "epoch": 1.81, "learning_rate": 1.9396601668900515e-05, "loss": 0.0104, "step": 125650 }, { "epoch": 1.81, "learning_rate": 1.9396553629162044e-05, "loss": 0.0167, "step": 125660 }, { "epoch": 1.81, "learning_rate": 1.9396505589423574e-05, "loss": 0.0082, "step": 125670 }, { "epoch": 1.81, "learning_rate": 1.9396457549685103e-05, "loss": 0.0088, "step": 125680 }, { "epoch": 1.81, "learning_rate": 1.939640950994663e-05, "loss": 0.012, "step": 125690 }, { "epoch": 1.81, "learning_rate": 1.9396361470208158e-05, "loss": 0.012, "step": 125700 }, { "epoch": 1.81, "learning_rate": 1.9396313430469687e-05, "loss": 0.0074, "step": 125710 }, { "epoch": 1.81, "learning_rate": 1.9396265390731213e-05, "loss": 0.009, "step": 125720 }, { "epoch": 1.81, "learning_rate": 1.9396217350992742e-05, "loss": 0.012, "step": 125730 }, { "epoch": 1.81, "learning_rate": 1.9396169311254272e-05, "loss": 0.0074, "step": 125740 }, { "epoch": 1.81, "learning_rate": 1.93961212715158e-05, "loss": 0.0083, "step": 125750 }, { "epoch": 1.81, "learning_rate": 1.9396073231777327e-05, "loss": 0.0157, "step": 125760 }, { "epoch": 1.81, "learning_rate": 1.9396025192038856e-05, "loss": 0.0097, "step": 125770 }, { "epoch": 1.81, "learning_rate": 1.9395977152300385e-05, "loss": 0.0123, "step": 125780 }, { "epoch": 1.81, "learning_rate": 1.9395929112561915e-05, "loss": 0.0106, "step": 125790 }, { "epoch": 1.81, "learning_rate": 1.939588107282344e-05, "loss": 0.0096, "step": 125800 }, { "epoch": 1.81, "learning_rate": 1.939583303308497e-05, "loss": 0.011, "step": 125810 }, { "epoch": 1.81, "learning_rate": 1.93957849933465e-05, "loss": 0.01, "step": 125820 }, { "epoch": 1.81, "learning_rate": 1.9395736953608025e-05, "loss": 0.0127, "step": 125830 }, { "epoch": 1.81, "learning_rate": 1.9395688913869554e-05, "loss": 0.0076, "step": 125840 }, { "epoch": 1.81, "learning_rate": 1.9395640874131084e-05, "loss": 0.011, "step": 125850 }, { "epoch": 1.81, "learning_rate": 1.9395592834392613e-05, "loss": 0.0085, "step": 125860 }, { "epoch": 1.81, "learning_rate": 1.939554479465414e-05, "loss": 0.0088, "step": 125870 }, { "epoch": 1.81, "learning_rate": 1.9395496754915668e-05, "loss": 0.0121, "step": 125880 }, { "epoch": 1.81, "learning_rate": 1.9395448715177197e-05, "loss": 0.0091, "step": 125890 }, { "epoch": 1.81, "learning_rate": 1.9395400675438723e-05, "loss": 0.0102, "step": 125900 }, { "epoch": 1.81, "learning_rate": 1.9395352635700252e-05, "loss": 0.0083, "step": 125910 }, { "epoch": 1.81, "learning_rate": 1.939530459596178e-05, "loss": 0.0082, "step": 125920 }, { "epoch": 1.81, "learning_rate": 1.939525655622331e-05, "loss": 0.0116, "step": 125930 }, { "epoch": 1.82, "learning_rate": 1.9395208516484837e-05, "loss": 0.0086, "step": 125940 }, { "epoch": 1.82, "learning_rate": 1.9395160476746366e-05, "loss": 0.0076, "step": 125950 }, { "epoch": 1.82, "learning_rate": 1.9395112437007895e-05, "loss": 0.0086, "step": 125960 }, { "epoch": 1.82, "learning_rate": 1.9395064397269425e-05, "loss": 0.0087, "step": 125970 }, { "epoch": 1.82, "learning_rate": 1.939501635753095e-05, "loss": 0.0145, "step": 125980 }, { "epoch": 1.82, "learning_rate": 1.939496831779248e-05, "loss": 0.0082, "step": 125990 }, { "epoch": 1.82, "learning_rate": 1.939492027805401e-05, "loss": 0.009, "step": 126000 }, { "epoch": 1.82, "learning_rate": 1.9394872238315535e-05, "loss": 0.0091, "step": 126010 }, { "epoch": 1.82, "learning_rate": 1.9394824198577064e-05, "loss": 0.0111, "step": 126020 }, { "epoch": 1.82, "learning_rate": 1.9394776158838593e-05, "loss": 0.0096, "step": 126030 }, { "epoch": 1.82, "learning_rate": 1.9394728119100123e-05, "loss": 0.0082, "step": 126040 }, { "epoch": 1.82, "learning_rate": 1.939468007936165e-05, "loss": 0.0108, "step": 126050 }, { "epoch": 1.82, "learning_rate": 1.9394632039623178e-05, "loss": 0.0104, "step": 126060 }, { "epoch": 1.82, "learning_rate": 1.9394583999884707e-05, "loss": 0.0094, "step": 126070 }, { "epoch": 1.82, "learning_rate": 1.9394535960146233e-05, "loss": 0.008, "step": 126080 }, { "epoch": 1.82, "learning_rate": 1.9394487920407762e-05, "loss": 0.0084, "step": 126090 }, { "epoch": 1.82, "learning_rate": 1.939443988066929e-05, "loss": 0.0075, "step": 126100 }, { "epoch": 1.82, "learning_rate": 1.939439184093082e-05, "loss": 0.009, "step": 126110 }, { "epoch": 1.82, "learning_rate": 1.9394343801192347e-05, "loss": 0.01, "step": 126120 }, { "epoch": 1.82, "learning_rate": 1.9394295761453876e-05, "loss": 0.0107, "step": 126130 }, { "epoch": 1.82, "learning_rate": 1.9394247721715405e-05, "loss": 0.0111, "step": 126140 }, { "epoch": 1.82, "learning_rate": 1.9394199681976935e-05, "loss": 0.0081, "step": 126150 }, { "epoch": 1.82, "learning_rate": 1.939415164223846e-05, "loss": 0.0124, "step": 126160 }, { "epoch": 1.82, "learning_rate": 1.939410360249999e-05, "loss": 0.0126, "step": 126170 }, { "epoch": 1.82, "learning_rate": 1.939405556276152e-05, "loss": 0.011, "step": 126180 }, { "epoch": 1.82, "learning_rate": 1.9394007523023045e-05, "loss": 0.0097, "step": 126190 }, { "epoch": 1.82, "learning_rate": 1.9393959483284574e-05, "loss": 0.0083, "step": 126200 }, { "epoch": 1.82, "learning_rate": 1.9393911443546103e-05, "loss": 0.0112, "step": 126210 }, { "epoch": 1.82, "learning_rate": 1.9393863403807633e-05, "loss": 0.0102, "step": 126220 }, { "epoch": 1.82, "learning_rate": 1.939381536406916e-05, "loss": 0.0108, "step": 126230 }, { "epoch": 1.82, "learning_rate": 1.9393767324330688e-05, "loss": 0.0096, "step": 126240 }, { "epoch": 1.82, "learning_rate": 1.9393719284592217e-05, "loss": 0.0115, "step": 126250 }, { "epoch": 1.82, "learning_rate": 1.9393671244853743e-05, "loss": 0.0092, "step": 126260 }, { "epoch": 1.82, "learning_rate": 1.9393623205115272e-05, "loss": 0.0085, "step": 126270 }, { "epoch": 1.82, "learning_rate": 1.93935751653768e-05, "loss": 0.0089, "step": 126280 }, { "epoch": 1.82, "learning_rate": 1.939352712563833e-05, "loss": 0.0118, "step": 126290 }, { "epoch": 1.82, "learning_rate": 1.9393479085899857e-05, "loss": 0.0121, "step": 126300 }, { "epoch": 1.82, "learning_rate": 1.9393431046161386e-05, "loss": 0.0091, "step": 126310 }, { "epoch": 1.82, "learning_rate": 1.9393383006422915e-05, "loss": 0.0099, "step": 126320 }, { "epoch": 1.82, "learning_rate": 1.9393334966684444e-05, "loss": 0.011, "step": 126330 }, { "epoch": 1.82, "learning_rate": 1.939328692694597e-05, "loss": 0.0107, "step": 126340 }, { "epoch": 1.82, "learning_rate": 1.93932388872075e-05, "loss": 0.0123, "step": 126350 }, { "epoch": 1.82, "learning_rate": 1.939319084746903e-05, "loss": 0.0138, "step": 126360 }, { "epoch": 1.82, "learning_rate": 1.9393142807730555e-05, "loss": 0.008, "step": 126370 }, { "epoch": 1.82, "learning_rate": 1.9393094767992084e-05, "loss": 0.0077, "step": 126380 }, { "epoch": 1.82, "learning_rate": 1.9393046728253613e-05, "loss": 0.0129, "step": 126390 }, { "epoch": 1.82, "learning_rate": 1.9392998688515143e-05, "loss": 0.012, "step": 126400 }, { "epoch": 1.82, "learning_rate": 1.939295064877667e-05, "loss": 0.0089, "step": 126410 }, { "epoch": 1.82, "learning_rate": 1.9392902609038198e-05, "loss": 0.009, "step": 126420 }, { "epoch": 1.82, "learning_rate": 1.9392854569299727e-05, "loss": 0.01, "step": 126430 }, { "epoch": 1.82, "learning_rate": 1.9392806529561253e-05, "loss": 0.0099, "step": 126440 }, { "epoch": 1.82, "learning_rate": 1.9392758489822782e-05, "loss": 0.0104, "step": 126450 }, { "epoch": 1.82, "learning_rate": 1.939271045008431e-05, "loss": 0.0108, "step": 126460 }, { "epoch": 1.82, "learning_rate": 1.939266241034584e-05, "loss": 0.0077, "step": 126470 }, { "epoch": 1.82, "learning_rate": 1.9392614370607367e-05, "loss": 0.0115, "step": 126480 }, { "epoch": 1.82, "learning_rate": 1.9392566330868896e-05, "loss": 0.0081, "step": 126490 }, { "epoch": 1.82, "learning_rate": 1.9392518291130425e-05, "loss": 0.0106, "step": 126500 }, { "epoch": 1.82, "learning_rate": 1.9392470251391954e-05, "loss": 0.0109, "step": 126510 }, { "epoch": 1.82, "learning_rate": 1.939242221165348e-05, "loss": 0.0104, "step": 126520 }, { "epoch": 1.82, "learning_rate": 1.939237417191501e-05, "loss": 0.0106, "step": 126530 }, { "epoch": 1.82, "learning_rate": 1.939232613217654e-05, "loss": 0.013, "step": 126540 }, { "epoch": 1.82, "learning_rate": 1.9392278092438065e-05, "loss": 0.0079, "step": 126550 }, { "epoch": 1.82, "learning_rate": 1.9392230052699594e-05, "loss": 0.0112, "step": 126560 }, { "epoch": 1.82, "learning_rate": 1.9392182012961123e-05, "loss": 0.0099, "step": 126570 }, { "epoch": 1.82, "learning_rate": 1.9392133973222652e-05, "loss": 0.0124, "step": 126580 }, { "epoch": 1.82, "learning_rate": 1.939208593348418e-05, "loss": 0.0144, "step": 126590 }, { "epoch": 1.82, "learning_rate": 1.9392037893745708e-05, "loss": 0.0099, "step": 126600 }, { "epoch": 1.82, "learning_rate": 1.9391989854007237e-05, "loss": 0.0077, "step": 126610 }, { "epoch": 1.82, "learning_rate": 1.9391941814268763e-05, "loss": 0.01, "step": 126620 }, { "epoch": 1.82, "learning_rate": 1.9391893774530292e-05, "loss": 0.0086, "step": 126630 }, { "epoch": 1.83, "learning_rate": 1.939184573479182e-05, "loss": 0.0136, "step": 126640 }, { "epoch": 1.83, "learning_rate": 1.939179769505335e-05, "loss": 0.0085, "step": 126650 }, { "epoch": 1.83, "learning_rate": 1.9391749655314876e-05, "loss": 0.0146, "step": 126660 }, { "epoch": 1.83, "learning_rate": 1.9391701615576406e-05, "loss": 0.0149, "step": 126670 }, { "epoch": 1.83, "learning_rate": 1.9391653575837935e-05, "loss": 0.0075, "step": 126680 }, { "epoch": 1.83, "learning_rate": 1.9391605536099464e-05, "loss": 0.0089, "step": 126690 }, { "epoch": 1.83, "learning_rate": 1.939155749636099e-05, "loss": 0.015, "step": 126700 }, { "epoch": 1.83, "learning_rate": 1.939150945662252e-05, "loss": 0.0116, "step": 126710 }, { "epoch": 1.83, "learning_rate": 1.939146141688405e-05, "loss": 0.0072, "step": 126720 }, { "epoch": 1.83, "learning_rate": 1.9391413377145575e-05, "loss": 0.0125, "step": 126730 }, { "epoch": 1.83, "learning_rate": 1.9391365337407104e-05, "loss": 0.009, "step": 126740 }, { "epoch": 1.83, "learning_rate": 1.9391322101642482e-05, "loss": 0.0089, "step": 126750 }, { "epoch": 1.83, "learning_rate": 1.9391274061904008e-05, "loss": 0.0081, "step": 126760 }, { "epoch": 1.83, "learning_rate": 1.9391226022165537e-05, "loss": 0.0153, "step": 126770 }, { "epoch": 1.83, "learning_rate": 1.9391177982427066e-05, "loss": 0.0083, "step": 126780 }, { "epoch": 1.83, "learning_rate": 1.9391129942688592e-05, "loss": 0.0128, "step": 126790 }, { "epoch": 1.83, "learning_rate": 1.939108190295012e-05, "loss": 0.0116, "step": 126800 }, { "epoch": 1.83, "learning_rate": 1.939103386321165e-05, "loss": 0.0078, "step": 126810 }, { "epoch": 1.83, "learning_rate": 1.939098582347318e-05, "loss": 0.0109, "step": 126820 }, { "epoch": 1.83, "learning_rate": 1.9390937783734706e-05, "loss": 0.0102, "step": 126830 }, { "epoch": 1.83, "learning_rate": 1.9390889743996235e-05, "loss": 0.0143, "step": 126840 }, { "epoch": 1.83, "learning_rate": 1.9390841704257764e-05, "loss": 0.011, "step": 126850 }, { "epoch": 1.83, "learning_rate": 1.939079366451929e-05, "loss": 0.0132, "step": 126860 }, { "epoch": 1.83, "learning_rate": 1.939074562478082e-05, "loss": 0.0082, "step": 126870 }, { "epoch": 1.83, "learning_rate": 1.939069758504235e-05, "loss": 0.0101, "step": 126880 }, { "epoch": 1.83, "learning_rate": 1.9390649545303878e-05, "loss": 0.0114, "step": 126890 }, { "epoch": 1.83, "learning_rate": 1.9390601505565404e-05, "loss": 0.0084, "step": 126900 }, { "epoch": 1.83, "learning_rate": 1.9390553465826933e-05, "loss": 0.0097, "step": 126910 }, { "epoch": 1.83, "learning_rate": 1.9390505426088463e-05, "loss": 0.0099, "step": 126920 }, { "epoch": 1.83, "learning_rate": 1.939045738634999e-05, "loss": 0.0129, "step": 126930 }, { "epoch": 1.83, "learning_rate": 1.9390409346611518e-05, "loss": 0.0098, "step": 126940 }, { "epoch": 1.83, "learning_rate": 1.9390361306873047e-05, "loss": 0.01, "step": 126950 }, { "epoch": 1.83, "learning_rate": 1.9390313267134576e-05, "loss": 0.0076, "step": 126960 }, { "epoch": 1.83, "learning_rate": 1.9390265227396102e-05, "loss": 0.0117, "step": 126970 }, { "epoch": 1.83, "learning_rate": 1.939021718765763e-05, "loss": 0.0125, "step": 126980 }, { "epoch": 1.83, "learning_rate": 1.939016914791916e-05, "loss": 0.0117, "step": 126990 }, { "epoch": 1.83, "learning_rate": 1.939012110818069e-05, "loss": 0.0096, "step": 127000 }, { "epoch": 1.83, "learning_rate": 1.9390073068442216e-05, "loss": 0.01, "step": 127010 }, { "epoch": 1.83, "learning_rate": 1.9390025028703745e-05, "loss": 0.0126, "step": 127020 }, { "epoch": 1.83, "learning_rate": 1.9389976988965274e-05, "loss": 0.008, "step": 127030 }, { "epoch": 1.83, "learning_rate": 1.93899289492268e-05, "loss": 0.0092, "step": 127040 }, { "epoch": 1.83, "learning_rate": 1.938988090948833e-05, "loss": 0.013, "step": 127050 }, { "epoch": 1.83, "learning_rate": 1.938983286974986e-05, "loss": 0.0081, "step": 127060 }, { "epoch": 1.83, "learning_rate": 1.9389784830011388e-05, "loss": 0.0092, "step": 127070 }, { "epoch": 1.83, "learning_rate": 1.9389736790272914e-05, "loss": 0.0107, "step": 127080 }, { "epoch": 1.83, "learning_rate": 1.9389688750534443e-05, "loss": 0.0118, "step": 127090 }, { "epoch": 1.83, "learning_rate": 1.9389640710795972e-05, "loss": 0.0068, "step": 127100 }, { "epoch": 1.83, "learning_rate": 1.93895926710575e-05, "loss": 0.0102, "step": 127110 }, { "epoch": 1.83, "learning_rate": 1.9389544631319028e-05, "loss": 0.0091, "step": 127120 }, { "epoch": 1.83, "learning_rate": 1.9389496591580557e-05, "loss": 0.0077, "step": 127130 }, { "epoch": 1.83, "learning_rate": 1.9389448551842086e-05, "loss": 0.0092, "step": 127140 }, { "epoch": 1.83, "learning_rate": 1.9389400512103612e-05, "loss": 0.0122, "step": 127150 }, { "epoch": 1.83, "learning_rate": 1.938935247236514e-05, "loss": 0.0096, "step": 127160 }, { "epoch": 1.83, "learning_rate": 1.938930443262667e-05, "loss": 0.0123, "step": 127170 }, { "epoch": 1.83, "learning_rate": 1.93892563928882e-05, "loss": 0.0079, "step": 127180 }, { "epoch": 1.83, "learning_rate": 1.9389208353149726e-05, "loss": 0.007, "step": 127190 }, { "epoch": 1.83, "learning_rate": 1.9389160313411255e-05, "loss": 0.0109, "step": 127200 }, { "epoch": 1.83, "learning_rate": 1.9389112273672784e-05, "loss": 0.0089, "step": 127210 }, { "epoch": 1.83, "learning_rate": 1.938906423393431e-05, "loss": 0.0086, "step": 127220 }, { "epoch": 1.83, "learning_rate": 1.938901619419584e-05, "loss": 0.0117, "step": 127230 }, { "epoch": 1.83, "learning_rate": 1.938896815445737e-05, "loss": 0.0091, "step": 127240 }, { "epoch": 1.83, "learning_rate": 1.9388920114718898e-05, "loss": 0.0107, "step": 127250 }, { "epoch": 1.83, "learning_rate": 1.9388872074980424e-05, "loss": 0.0081, "step": 127260 }, { "epoch": 1.83, "learning_rate": 1.9388824035241953e-05, "loss": 0.0079, "step": 127270 }, { "epoch": 1.83, "learning_rate": 1.9388775995503482e-05, "loss": 0.0047, "step": 127280 }, { "epoch": 1.83, "learning_rate": 1.9388727955765008e-05, "loss": 0.0089, "step": 127290 }, { "epoch": 1.83, "learning_rate": 1.9388679916026537e-05, "loss": 0.0118, "step": 127300 }, { "epoch": 1.83, "learning_rate": 1.9388631876288067e-05, "loss": 0.0098, "step": 127310 }, { "epoch": 1.83, "learning_rate": 1.9388583836549596e-05, "loss": 0.0085, "step": 127320 }, { "epoch": 1.84, "learning_rate": 1.9388535796811122e-05, "loss": 0.0082, "step": 127330 }, { "epoch": 1.84, "learning_rate": 1.938848775707265e-05, "loss": 0.0065, "step": 127340 }, { "epoch": 1.84, "learning_rate": 1.938843971733418e-05, "loss": 0.0071, "step": 127350 }, { "epoch": 1.84, "learning_rate": 1.938839167759571e-05, "loss": 0.0133, "step": 127360 }, { "epoch": 1.84, "learning_rate": 1.9388343637857236e-05, "loss": 0.01, "step": 127370 }, { "epoch": 1.84, "learning_rate": 1.9388295598118765e-05, "loss": 0.0083, "step": 127380 }, { "epoch": 1.84, "learning_rate": 1.9388247558380294e-05, "loss": 0.0122, "step": 127390 }, { "epoch": 1.84, "learning_rate": 1.938819951864182e-05, "loss": 0.0075, "step": 127400 }, { "epoch": 1.84, "learning_rate": 1.938815147890335e-05, "loss": 0.0096, "step": 127410 }, { "epoch": 1.84, "learning_rate": 1.938810343916488e-05, "loss": 0.007, "step": 127420 }, { "epoch": 1.84, "learning_rate": 1.9388055399426408e-05, "loss": 0.0066, "step": 127430 }, { "epoch": 1.84, "learning_rate": 1.9388007359687934e-05, "loss": 0.0098, "step": 127440 }, { "epoch": 1.84, "learning_rate": 1.9387959319949463e-05, "loss": 0.0102, "step": 127450 }, { "epoch": 1.84, "learning_rate": 1.9387911280210992e-05, "loss": 0.0104, "step": 127460 }, { "epoch": 1.84, "learning_rate": 1.9387863240472518e-05, "loss": 0.0111, "step": 127470 }, { "epoch": 1.84, "learning_rate": 1.9387815200734047e-05, "loss": 0.0102, "step": 127480 }, { "epoch": 1.84, "learning_rate": 1.9387767160995577e-05, "loss": 0.0106, "step": 127490 }, { "epoch": 1.84, "learning_rate": 1.9387719121257106e-05, "loss": 0.0094, "step": 127500 }, { "epoch": 1.84, "learning_rate": 1.9387671081518632e-05, "loss": 0.013, "step": 127510 }, { "epoch": 1.84, "learning_rate": 1.938762304178016e-05, "loss": 0.0081, "step": 127520 }, { "epoch": 1.84, "learning_rate": 1.938757500204169e-05, "loss": 0.0096, "step": 127530 }, { "epoch": 1.84, "learning_rate": 1.938752696230322e-05, "loss": 0.0083, "step": 127540 }, { "epoch": 1.84, "learning_rate": 1.9387478922564746e-05, "loss": 0.0139, "step": 127550 }, { "epoch": 1.84, "learning_rate": 1.9387430882826275e-05, "loss": 0.0135, "step": 127560 }, { "epoch": 1.84, "learning_rate": 1.9387382843087804e-05, "loss": 0.0123, "step": 127570 }, { "epoch": 1.84, "learning_rate": 1.938733480334933e-05, "loss": 0.0089, "step": 127580 }, { "epoch": 1.84, "learning_rate": 1.938728676361086e-05, "loss": 0.0098, "step": 127590 }, { "epoch": 1.84, "learning_rate": 1.938723872387239e-05, "loss": 0.0091, "step": 127600 }, { "epoch": 1.84, "learning_rate": 1.9387190684133918e-05, "loss": 0.017, "step": 127610 }, { "epoch": 1.84, "learning_rate": 1.9387142644395444e-05, "loss": 0.0138, "step": 127620 }, { "epoch": 1.84, "learning_rate": 1.9387094604656973e-05, "loss": 0.0109, "step": 127630 }, { "epoch": 1.84, "learning_rate": 1.9387046564918502e-05, "loss": 0.0071, "step": 127640 }, { "epoch": 1.84, "learning_rate": 1.9386998525180028e-05, "loss": 0.0078, "step": 127650 }, { "epoch": 1.84, "learning_rate": 1.9386950485441557e-05, "loss": 0.0103, "step": 127660 }, { "epoch": 1.84, "learning_rate": 1.9386902445703087e-05, "loss": 0.0088, "step": 127670 }, { "epoch": 1.84, "learning_rate": 1.9386854405964616e-05, "loss": 0.007, "step": 127680 }, { "epoch": 1.84, "learning_rate": 1.9386806366226142e-05, "loss": 0.0099, "step": 127690 }, { "epoch": 1.84, "learning_rate": 1.938675832648767e-05, "loss": 0.0085, "step": 127700 }, { "epoch": 1.84, "learning_rate": 1.93867102867492e-05, "loss": 0.0101, "step": 127710 }, { "epoch": 1.84, "learning_rate": 1.938666224701073e-05, "loss": 0.0114, "step": 127720 }, { "epoch": 1.84, "learning_rate": 1.9386614207272255e-05, "loss": 0.007, "step": 127730 }, { "epoch": 1.84, "learning_rate": 1.9386566167533785e-05, "loss": 0.0116, "step": 127740 }, { "epoch": 1.84, "learning_rate": 1.9386518127795314e-05, "loss": 0.009, "step": 127750 }, { "epoch": 1.84, "learning_rate": 1.938647008805684e-05, "loss": 0.0119, "step": 127760 }, { "epoch": 1.84, "learning_rate": 1.938642204831837e-05, "loss": 0.0114, "step": 127770 }, { "epoch": 1.84, "learning_rate": 1.93863740085799e-05, "loss": 0.009, "step": 127780 }, { "epoch": 1.84, "learning_rate": 1.9386325968841428e-05, "loss": 0.0139, "step": 127790 }, { "epoch": 1.84, "learning_rate": 1.9386277929102954e-05, "loss": 0.0112, "step": 127800 }, { "epoch": 1.84, "learning_rate": 1.9386229889364483e-05, "loss": 0.0092, "step": 127810 }, { "epoch": 1.84, "learning_rate": 1.9386181849626012e-05, "loss": 0.0081, "step": 127820 }, { "epoch": 1.84, "learning_rate": 1.9386133809887538e-05, "loss": 0.0114, "step": 127830 }, { "epoch": 1.84, "learning_rate": 1.9386085770149067e-05, "loss": 0.0096, "step": 127840 }, { "epoch": 1.84, "learning_rate": 1.9386037730410597e-05, "loss": 0.0083, "step": 127850 }, { "epoch": 1.84, "learning_rate": 1.9385989690672126e-05, "loss": 0.0106, "step": 127860 }, { "epoch": 1.84, "learning_rate": 1.938594165093365e-05, "loss": 0.0111, "step": 127870 }, { "epoch": 1.84, "learning_rate": 1.938589361119518e-05, "loss": 0.0102, "step": 127880 }, { "epoch": 1.84, "learning_rate": 1.938584557145671e-05, "loss": 0.0132, "step": 127890 }, { "epoch": 1.84, "learning_rate": 1.938579753171824e-05, "loss": 0.0102, "step": 127900 }, { "epoch": 1.84, "learning_rate": 1.9385749491979765e-05, "loss": 0.012, "step": 127910 }, { "epoch": 1.84, "learning_rate": 1.9385701452241295e-05, "loss": 0.0109, "step": 127920 }, { "epoch": 1.84, "learning_rate": 1.9385653412502824e-05, "loss": 0.0084, "step": 127930 }, { "epoch": 1.84, "learning_rate": 1.938560537276435e-05, "loss": 0.0089, "step": 127940 }, { "epoch": 1.84, "learning_rate": 1.938555733302588e-05, "loss": 0.0105, "step": 127950 }, { "epoch": 1.84, "learning_rate": 1.938550929328741e-05, "loss": 0.0099, "step": 127960 }, { "epoch": 1.84, "learning_rate": 1.9385461253548938e-05, "loss": 0.0088, "step": 127970 }, { "epoch": 1.84, "learning_rate": 1.9385413213810467e-05, "loss": 0.0089, "step": 127980 }, { "epoch": 1.84, "learning_rate": 1.9385365174071996e-05, "loss": 0.0096, "step": 127990 }, { "epoch": 1.84, "learning_rate": 1.9385317134333522e-05, "loss": 0.007, "step": 128000 }, { "epoch": 1.84, "learning_rate": 1.938526909459505e-05, "loss": 0.0089, "step": 128010 }, { "epoch": 1.85, "learning_rate": 1.938522105485658e-05, "loss": 0.0076, "step": 128020 }, { "epoch": 1.85, "learning_rate": 1.938517301511811e-05, "loss": 0.0127, "step": 128030 }, { "epoch": 1.85, "learning_rate": 1.9385124975379636e-05, "loss": 0.0103, "step": 128040 }, { "epoch": 1.85, "learning_rate": 1.9385076935641165e-05, "loss": 0.0138, "step": 128050 }, { "epoch": 1.85, "learning_rate": 1.9385028895902694e-05, "loss": 0.0077, "step": 128060 }, { "epoch": 1.85, "learning_rate": 1.938498085616422e-05, "loss": 0.0093, "step": 128070 }, { "epoch": 1.85, "learning_rate": 1.938493281642575e-05, "loss": 0.0107, "step": 128080 }, { "epoch": 1.85, "learning_rate": 1.938488477668728e-05, "loss": 0.0139, "step": 128090 }, { "epoch": 1.85, "learning_rate": 1.9384836736948808e-05, "loss": 0.0081, "step": 128100 }, { "epoch": 1.85, "learning_rate": 1.9384788697210334e-05, "loss": 0.007, "step": 128110 }, { "epoch": 1.85, "learning_rate": 1.9384740657471863e-05, "loss": 0.0091, "step": 128120 }, { "epoch": 1.85, "learning_rate": 1.9384692617733392e-05, "loss": 0.0099, "step": 128130 }, { "epoch": 1.85, "learning_rate": 1.938464457799492e-05, "loss": 0.0122, "step": 128140 }, { "epoch": 1.85, "learning_rate": 1.9384596538256448e-05, "loss": 0.0093, "step": 128150 }, { "epoch": 1.85, "learning_rate": 1.9384548498517977e-05, "loss": 0.0083, "step": 128160 }, { "epoch": 1.85, "learning_rate": 1.9384500458779506e-05, "loss": 0.0135, "step": 128170 }, { "epoch": 1.85, "learning_rate": 1.9384452419041032e-05, "loss": 0.0093, "step": 128180 }, { "epoch": 1.85, "learning_rate": 1.938440437930256e-05, "loss": 0.0104, "step": 128190 }, { "epoch": 1.85, "learning_rate": 1.938435633956409e-05, "loss": 0.0128, "step": 128200 }, { "epoch": 1.85, "learning_rate": 1.938430829982562e-05, "loss": 0.0077, "step": 128210 }, { "epoch": 1.85, "learning_rate": 1.9384260260087146e-05, "loss": 0.0074, "step": 128220 }, { "epoch": 1.85, "learning_rate": 1.9384212220348675e-05, "loss": 0.0088, "step": 128230 }, { "epoch": 1.85, "learning_rate": 1.9384164180610204e-05, "loss": 0.0089, "step": 128240 }, { "epoch": 1.85, "learning_rate": 1.938411614087173e-05, "loss": 0.0114, "step": 128250 }, { "epoch": 1.85, "learning_rate": 1.938406810113326e-05, "loss": 0.0101, "step": 128260 }, { "epoch": 1.85, "learning_rate": 1.938402006139479e-05, "loss": 0.0096, "step": 128270 }, { "epoch": 1.85, "learning_rate": 1.9383972021656318e-05, "loss": 0.0077, "step": 128280 }, { "epoch": 1.85, "learning_rate": 1.9383923981917844e-05, "loss": 0.0095, "step": 128290 }, { "epoch": 1.85, "learning_rate": 1.9383875942179373e-05, "loss": 0.0093, "step": 128300 }, { "epoch": 1.85, "learning_rate": 1.9383827902440902e-05, "loss": 0.0075, "step": 128310 }, { "epoch": 1.85, "learning_rate": 1.9383779862702428e-05, "loss": 0.0077, "step": 128320 }, { "epoch": 1.85, "learning_rate": 1.9383731822963957e-05, "loss": 0.0125, "step": 128330 }, { "epoch": 1.85, "learning_rate": 1.9383683783225487e-05, "loss": 0.0087, "step": 128340 }, { "epoch": 1.85, "learning_rate": 1.9383635743487016e-05, "loss": 0.009, "step": 128350 }, { "epoch": 1.85, "learning_rate": 1.9383587703748542e-05, "loss": 0.0089, "step": 128360 }, { "epoch": 1.85, "learning_rate": 1.938353966401007e-05, "loss": 0.012, "step": 128370 }, { "epoch": 1.85, "learning_rate": 1.93834916242716e-05, "loss": 0.0085, "step": 128380 }, { "epoch": 1.85, "learning_rate": 1.938344358453313e-05, "loss": 0.0096, "step": 128390 }, { "epoch": 1.85, "learning_rate": 1.9383395544794656e-05, "loss": 0.0151, "step": 128400 }, { "epoch": 1.85, "learning_rate": 1.9383347505056185e-05, "loss": 0.0091, "step": 128410 }, { "epoch": 1.85, "learning_rate": 1.9383299465317714e-05, "loss": 0.009, "step": 128420 }, { "epoch": 1.85, "learning_rate": 1.938325142557924e-05, "loss": 0.0098, "step": 128430 }, { "epoch": 1.85, "learning_rate": 1.938320338584077e-05, "loss": 0.0106, "step": 128440 }, { "epoch": 1.85, "learning_rate": 1.93831553461023e-05, "loss": 0.0098, "step": 128450 }, { "epoch": 1.85, "learning_rate": 1.9383107306363828e-05, "loss": 0.0115, "step": 128460 }, { "epoch": 1.85, "learning_rate": 1.9383059266625354e-05, "loss": 0.008, "step": 128470 }, { "epoch": 1.85, "learning_rate": 1.9383011226886883e-05, "loss": 0.0099, "step": 128480 }, { "epoch": 1.85, "learning_rate": 1.9382963187148412e-05, "loss": 0.0157, "step": 128490 }, { "epoch": 1.85, "learning_rate": 1.9382915147409938e-05, "loss": 0.0099, "step": 128500 }, { "epoch": 1.85, "learning_rate": 1.9382867107671467e-05, "loss": 0.008, "step": 128510 }, { "epoch": 1.85, "learning_rate": 1.9382819067932997e-05, "loss": 0.0068, "step": 128520 }, { "epoch": 1.85, "learning_rate": 1.9382771028194526e-05, "loss": 0.0088, "step": 128530 }, { "epoch": 1.85, "learning_rate": 1.9382722988456052e-05, "loss": 0.009, "step": 128540 }, { "epoch": 1.85, "learning_rate": 1.938267494871758e-05, "loss": 0.0075, "step": 128550 }, { "epoch": 1.85, "learning_rate": 1.938262690897911e-05, "loss": 0.0104, "step": 128560 }, { "epoch": 1.85, "learning_rate": 1.938257886924064e-05, "loss": 0.0108, "step": 128570 }, { "epoch": 1.85, "learning_rate": 1.9382530829502165e-05, "loss": 0.0159, "step": 128580 }, { "epoch": 1.85, "learning_rate": 1.9382482789763695e-05, "loss": 0.0118, "step": 128590 }, { "epoch": 1.85, "learning_rate": 1.9382434750025224e-05, "loss": 0.0073, "step": 128600 }, { "epoch": 1.85, "learning_rate": 1.938238671028675e-05, "loss": 0.0071, "step": 128610 }, { "epoch": 1.85, "learning_rate": 1.938233867054828e-05, "loss": 0.009, "step": 128620 }, { "epoch": 1.85, "learning_rate": 1.9382295434783657e-05, "loss": 0.0137, "step": 128630 }, { "epoch": 1.85, "learning_rate": 1.9382247395045183e-05, "loss": 0.0114, "step": 128640 }, { "epoch": 1.85, "learning_rate": 1.9382199355306712e-05, "loss": 0.0125, "step": 128650 }, { "epoch": 1.85, "learning_rate": 1.938215131556824e-05, "loss": 0.0091, "step": 128660 }, { "epoch": 1.85, "learning_rate": 1.9382103275829767e-05, "loss": 0.0077, "step": 128670 }, { "epoch": 1.85, "learning_rate": 1.9382055236091297e-05, "loss": 0.0084, "step": 128680 }, { "epoch": 1.85, "learning_rate": 1.9382007196352826e-05, "loss": 0.0095, "step": 128690 }, { "epoch": 1.85, "learning_rate": 1.9381959156614355e-05, "loss": 0.0072, "step": 128700 }, { "epoch": 1.85, "learning_rate": 1.938191111687588e-05, "loss": 0.0089, "step": 128710 }, { "epoch": 1.86, "learning_rate": 1.938186307713741e-05, "loss": 0.0093, "step": 128720 }, { "epoch": 1.86, "learning_rate": 1.938181503739894e-05, "loss": 0.0074, "step": 128730 }, { "epoch": 1.86, "learning_rate": 1.938177180163431e-05, "loss": 0.011, "step": 128740 }, { "epoch": 1.86, "learning_rate": 1.938172376189584e-05, "loss": 0.0086, "step": 128750 }, { "epoch": 1.86, "learning_rate": 1.938167572215737e-05, "loss": 0.0131, "step": 128760 }, { "epoch": 1.86, "learning_rate": 1.93816276824189e-05, "loss": 0.0112, "step": 128770 }, { "epoch": 1.86, "learning_rate": 1.9381579642680425e-05, "loss": 0.0113, "step": 128780 }, { "epoch": 1.86, "learning_rate": 1.9381531602941954e-05, "loss": 0.0131, "step": 128790 }, { "epoch": 1.86, "learning_rate": 1.9381483563203483e-05, "loss": 0.0106, "step": 128800 }, { "epoch": 1.86, "learning_rate": 1.9381435523465012e-05, "loss": 0.0132, "step": 128810 }, { "epoch": 1.86, "learning_rate": 1.938138748372654e-05, "loss": 0.0108, "step": 128820 }, { "epoch": 1.86, "learning_rate": 1.9381339443988068e-05, "loss": 0.0081, "step": 128830 }, { "epoch": 1.86, "learning_rate": 1.9381291404249597e-05, "loss": 0.0098, "step": 128840 }, { "epoch": 1.86, "learning_rate": 1.9381243364511123e-05, "loss": 0.0094, "step": 128850 }, { "epoch": 1.86, "learning_rate": 1.9381195324772652e-05, "loss": 0.011, "step": 128860 }, { "epoch": 1.86, "learning_rate": 1.938114728503418e-05, "loss": 0.0102, "step": 128870 }, { "epoch": 1.86, "learning_rate": 1.938109924529571e-05, "loss": 0.0092, "step": 128880 }, { "epoch": 1.86, "learning_rate": 1.9381051205557236e-05, "loss": 0.0108, "step": 128890 }, { "epoch": 1.86, "learning_rate": 1.9381003165818766e-05, "loss": 0.0119, "step": 128900 }, { "epoch": 1.86, "learning_rate": 1.9380955126080295e-05, "loss": 0.0106, "step": 128910 }, { "epoch": 1.86, "learning_rate": 1.938090708634182e-05, "loss": 0.0121, "step": 128920 }, { "epoch": 1.86, "learning_rate": 1.938085904660335e-05, "loss": 0.0087, "step": 128930 }, { "epoch": 1.86, "learning_rate": 1.938081100686488e-05, "loss": 0.0096, "step": 128940 }, { "epoch": 1.86, "learning_rate": 1.938076296712641e-05, "loss": 0.0098, "step": 128950 }, { "epoch": 1.86, "learning_rate": 1.9380714927387935e-05, "loss": 0.0091, "step": 128960 }, { "epoch": 1.86, "learning_rate": 1.9380666887649464e-05, "loss": 0.0096, "step": 128970 }, { "epoch": 1.86, "learning_rate": 1.9380618847910993e-05, "loss": 0.0074, "step": 128980 }, { "epoch": 1.86, "learning_rate": 1.9380570808172522e-05, "loss": 0.0078, "step": 128990 }, { "epoch": 1.86, "learning_rate": 1.938052276843405e-05, "loss": 0.0089, "step": 129000 }, { "epoch": 1.86, "learning_rate": 1.938047472869558e-05, "loss": 0.0073, "step": 129010 }, { "epoch": 1.86, "learning_rate": 1.9380426688957107e-05, "loss": 0.0087, "step": 129020 }, { "epoch": 1.86, "learning_rate": 1.9380378649218636e-05, "loss": 0.0104, "step": 129030 }, { "epoch": 1.86, "learning_rate": 1.9380330609480165e-05, "loss": 0.0102, "step": 129040 }, { "epoch": 1.86, "learning_rate": 1.9380282569741695e-05, "loss": 0.0067, "step": 129050 }, { "epoch": 1.86, "learning_rate": 1.938023453000322e-05, "loss": 0.009, "step": 129060 }, { "epoch": 1.86, "learning_rate": 1.938018649026475e-05, "loss": 0.009, "step": 129070 }, { "epoch": 1.86, "learning_rate": 1.938013845052628e-05, "loss": 0.0188, "step": 129080 }, { "epoch": 1.86, "learning_rate": 1.9380090410787805e-05, "loss": 0.013, "step": 129090 }, { "epoch": 1.86, "learning_rate": 1.9380042371049334e-05, "loss": 0.0087, "step": 129100 }, { "epoch": 1.86, "learning_rate": 1.9379994331310863e-05, "loss": 0.0112, "step": 129110 }, { "epoch": 1.86, "learning_rate": 1.9379946291572393e-05, "loss": 0.0058, "step": 129120 }, { "epoch": 1.86, "learning_rate": 1.937989825183392e-05, "loss": 0.0117, "step": 129130 }, { "epoch": 1.86, "learning_rate": 1.9379850212095448e-05, "loss": 0.0065, "step": 129140 }, { "epoch": 1.86, "learning_rate": 1.9379802172356977e-05, "loss": 0.0094, "step": 129150 }, { "epoch": 1.86, "learning_rate": 1.9379754132618503e-05, "loss": 0.0111, "step": 129160 }, { "epoch": 1.86, "learning_rate": 1.9379706092880032e-05, "loss": 0.0112, "step": 129170 }, { "epoch": 1.86, "learning_rate": 1.937965805314156e-05, "loss": 0.0084, "step": 129180 }, { "epoch": 1.86, "learning_rate": 1.937961001340309e-05, "loss": 0.0085, "step": 129190 }, { "epoch": 1.86, "learning_rate": 1.9379561973664617e-05, "loss": 0.0108, "step": 129200 }, { "epoch": 1.86, "learning_rate": 1.9379513933926146e-05, "loss": 0.0077, "step": 129210 }, { "epoch": 1.86, "learning_rate": 1.9379465894187675e-05, "loss": 0.0068, "step": 129220 }, { "epoch": 1.86, "learning_rate": 1.9379417854449205e-05, "loss": 0.009, "step": 129230 }, { "epoch": 1.86, "learning_rate": 1.937936981471073e-05, "loss": 0.0054, "step": 129240 }, { "epoch": 1.86, "learning_rate": 1.937932177497226e-05, "loss": 0.0097, "step": 129250 }, { "epoch": 1.86, "learning_rate": 1.937927373523379e-05, "loss": 0.0075, "step": 129260 }, { "epoch": 1.86, "learning_rate": 1.9379225695495315e-05, "loss": 0.0087, "step": 129270 }, { "epoch": 1.86, "learning_rate": 1.9379177655756844e-05, "loss": 0.007, "step": 129280 }, { "epoch": 1.86, "learning_rate": 1.9379129616018373e-05, "loss": 0.0114, "step": 129290 }, { "epoch": 1.86, "learning_rate": 1.9379081576279903e-05, "loss": 0.0116, "step": 129300 }, { "epoch": 1.86, "learning_rate": 1.937903353654143e-05, "loss": 0.0101, "step": 129310 }, { "epoch": 1.86, "learning_rate": 1.9378985496802958e-05, "loss": 0.0077, "step": 129320 }, { "epoch": 1.86, "learning_rate": 1.9378937457064487e-05, "loss": 0.0067, "step": 129330 }, { "epoch": 1.86, "learning_rate": 1.9378889417326013e-05, "loss": 0.0147, "step": 129340 }, { "epoch": 1.86, "learning_rate": 1.9378841377587542e-05, "loss": 0.0102, "step": 129350 }, { "epoch": 1.86, "learning_rate": 1.937879333784907e-05, "loss": 0.0097, "step": 129360 }, { "epoch": 1.86, "learning_rate": 1.93787452981106e-05, "loss": 0.0107, "step": 129370 }, { "epoch": 1.86, "learning_rate": 1.9378697258372127e-05, "loss": 0.0101, "step": 129380 }, { "epoch": 1.86, "learning_rate": 1.9378649218633656e-05, "loss": 0.0081, "step": 129390 }, { "epoch": 1.86, "learning_rate": 1.9378601178895185e-05, "loss": 0.0103, "step": 129400 }, { "epoch": 1.87, "learning_rate": 1.9378553139156714e-05, "loss": 0.0083, "step": 129410 }, { "epoch": 1.87, "learning_rate": 1.937850509941824e-05, "loss": 0.0075, "step": 129420 }, { "epoch": 1.87, "learning_rate": 1.937845705967977e-05, "loss": 0.0066, "step": 129430 }, { "epoch": 1.87, "learning_rate": 1.93784090199413e-05, "loss": 0.0157, "step": 129440 }, { "epoch": 1.87, "learning_rate": 1.9378360980202825e-05, "loss": 0.0061, "step": 129450 }, { "epoch": 1.87, "learning_rate": 1.9378312940464354e-05, "loss": 0.0103, "step": 129460 }, { "epoch": 1.87, "learning_rate": 1.9378264900725883e-05, "loss": 0.0066, "step": 129470 }, { "epoch": 1.87, "learning_rate": 1.9378216860987413e-05, "loss": 0.0144, "step": 129480 }, { "epoch": 1.87, "learning_rate": 1.937816882124894e-05, "loss": 0.013, "step": 129490 }, { "epoch": 1.87, "learning_rate": 1.9378120781510468e-05, "loss": 0.0127, "step": 129500 }, { "epoch": 1.87, "learning_rate": 1.9378072741771997e-05, "loss": 0.0073, "step": 129510 }, { "epoch": 1.87, "learning_rate": 1.9378024702033523e-05, "loss": 0.0089, "step": 129520 }, { "epoch": 1.87, "learning_rate": 1.9377976662295052e-05, "loss": 0.0167, "step": 129530 }, { "epoch": 1.87, "learning_rate": 1.937792862255658e-05, "loss": 0.0147, "step": 129540 }, { "epoch": 1.87, "learning_rate": 1.937788058281811e-05, "loss": 0.0125, "step": 129550 }, { "epoch": 1.87, "learning_rate": 1.9377832543079637e-05, "loss": 0.0095, "step": 129560 }, { "epoch": 1.87, "learning_rate": 1.9377784503341166e-05, "loss": 0.0103, "step": 129570 }, { "epoch": 1.87, "learning_rate": 1.9377736463602695e-05, "loss": 0.0127, "step": 129580 }, { "epoch": 1.87, "learning_rate": 1.9377688423864224e-05, "loss": 0.0089, "step": 129590 }, { "epoch": 1.87, "learning_rate": 1.937764038412575e-05, "loss": 0.0101, "step": 129600 }, { "epoch": 1.87, "learning_rate": 1.937759234438728e-05, "loss": 0.0103, "step": 129610 }, { "epoch": 1.87, "learning_rate": 1.937754430464881e-05, "loss": 0.0104, "step": 129620 }, { "epoch": 1.87, "learning_rate": 1.9377496264910335e-05, "loss": 0.0084, "step": 129630 }, { "epoch": 1.87, "learning_rate": 1.9377448225171864e-05, "loss": 0.0157, "step": 129640 }, { "epoch": 1.87, "learning_rate": 1.9377400185433393e-05, "loss": 0.0076, "step": 129650 }, { "epoch": 1.87, "learning_rate": 1.9377352145694922e-05, "loss": 0.0104, "step": 129660 }, { "epoch": 1.87, "learning_rate": 1.937730410595645e-05, "loss": 0.0082, "step": 129670 }, { "epoch": 1.87, "learning_rate": 1.9377256066217978e-05, "loss": 0.0099, "step": 129680 }, { "epoch": 1.87, "learning_rate": 1.9377208026479507e-05, "loss": 0.0104, "step": 129690 }, { "epoch": 1.87, "learning_rate": 1.9377159986741033e-05, "loss": 0.0104, "step": 129700 }, { "epoch": 1.87, "learning_rate": 1.9377111947002562e-05, "loss": 0.0116, "step": 129710 }, { "epoch": 1.87, "learning_rate": 1.937706390726409e-05, "loss": 0.008, "step": 129720 }, { "epoch": 1.87, "learning_rate": 1.937701586752562e-05, "loss": 0.0081, "step": 129730 }, { "epoch": 1.87, "learning_rate": 1.9376967827787146e-05, "loss": 0.0082, "step": 129740 }, { "epoch": 1.87, "learning_rate": 1.9376919788048676e-05, "loss": 0.0099, "step": 129750 }, { "epoch": 1.87, "learning_rate": 1.9376871748310205e-05, "loss": 0.0127, "step": 129760 }, { "epoch": 1.87, "learning_rate": 1.937682370857173e-05, "loss": 0.0078, "step": 129770 }, { "epoch": 1.87, "learning_rate": 1.937677566883326e-05, "loss": 0.009, "step": 129780 }, { "epoch": 1.87, "learning_rate": 1.937672762909479e-05, "loss": 0.0093, "step": 129790 }, { "epoch": 1.87, "learning_rate": 1.937667958935632e-05, "loss": 0.0082, "step": 129800 }, { "epoch": 1.87, "learning_rate": 1.9376631549617845e-05, "loss": 0.0067, "step": 129810 }, { "epoch": 1.87, "learning_rate": 1.9376583509879374e-05, "loss": 0.007, "step": 129820 }, { "epoch": 1.87, "learning_rate": 1.9376535470140903e-05, "loss": 0.0078, "step": 129830 }, { "epoch": 1.87, "learning_rate": 1.9376487430402432e-05, "loss": 0.0106, "step": 129840 }, { "epoch": 1.87, "learning_rate": 1.9376439390663958e-05, "loss": 0.01, "step": 129850 }, { "epoch": 1.87, "learning_rate": 1.9376391350925488e-05, "loss": 0.0108, "step": 129860 }, { "epoch": 1.87, "learning_rate": 1.9376343311187017e-05, "loss": 0.0103, "step": 129870 }, { "epoch": 1.87, "learning_rate": 1.9376295271448543e-05, "loss": 0.0106, "step": 129880 }, { "epoch": 1.87, "learning_rate": 1.9376247231710072e-05, "loss": 0.0091, "step": 129890 }, { "epoch": 1.87, "learning_rate": 1.93761991919716e-05, "loss": 0.0085, "step": 129900 }, { "epoch": 1.87, "learning_rate": 1.937615115223313e-05, "loss": 0.0142, "step": 129910 }, { "epoch": 1.87, "learning_rate": 1.9376103112494656e-05, "loss": 0.0061, "step": 129920 }, { "epoch": 1.87, "learning_rate": 1.9376055072756186e-05, "loss": 0.0102, "step": 129930 }, { "epoch": 1.87, "learning_rate": 1.9376007033017715e-05, "loss": 0.0096, "step": 129940 }, { "epoch": 1.87, "learning_rate": 1.937595899327924e-05, "loss": 0.0053, "step": 129950 }, { "epoch": 1.87, "learning_rate": 1.937591095354077e-05, "loss": 0.0083, "step": 129960 }, { "epoch": 1.87, "learning_rate": 1.93758629138023e-05, "loss": 0.0081, "step": 129970 }, { "epoch": 1.87, "learning_rate": 1.937581487406383e-05, "loss": 0.0096, "step": 129980 }, { "epoch": 1.87, "learning_rate": 1.9375766834325354e-05, "loss": 0.0098, "step": 129990 }, { "epoch": 1.87, "learning_rate": 1.9375718794586884e-05, "loss": 0.0107, "step": 130000 }, { "epoch": 1.87, "learning_rate": 1.9375670754848413e-05, "loss": 0.0102, "step": 130010 }, { "epoch": 1.87, "learning_rate": 1.9375622715109942e-05, "loss": 0.0075, "step": 130020 }, { "epoch": 1.87, "learning_rate": 1.9375574675371468e-05, "loss": 0.0061, "step": 130030 }, { "epoch": 1.87, "learning_rate": 1.9375526635632997e-05, "loss": 0.0102, "step": 130040 }, { "epoch": 1.87, "learning_rate": 1.9375478595894527e-05, "loss": 0.0114, "step": 130050 }, { "epoch": 1.87, "learning_rate": 1.9375430556156053e-05, "loss": 0.0154, "step": 130060 }, { "epoch": 1.87, "learning_rate": 1.9375382516417582e-05, "loss": 0.009, "step": 130070 }, { "epoch": 1.87, "learning_rate": 1.937533447667911e-05, "loss": 0.0064, "step": 130080 }, { "epoch": 1.87, "learning_rate": 1.937528643694064e-05, "loss": 0.0092, "step": 130090 }, { "epoch": 1.87, "learning_rate": 1.9375238397202166e-05, "loss": 0.0091, "step": 130100 }, { "epoch": 1.88, "learning_rate": 1.9375190357463696e-05, "loss": 0.0095, "step": 130110 }, { "epoch": 1.88, "learning_rate": 1.9375142317725225e-05, "loss": 0.0113, "step": 130120 }, { "epoch": 1.88, "learning_rate": 1.937509427798675e-05, "loss": 0.0072, "step": 130130 }, { "epoch": 1.88, "learning_rate": 1.937504623824828e-05, "loss": 0.0132, "step": 130140 }, { "epoch": 1.88, "learning_rate": 1.937499819850981e-05, "loss": 0.01, "step": 130150 }, { "epoch": 1.88, "learning_rate": 1.937495015877134e-05, "loss": 0.0109, "step": 130160 }, { "epoch": 1.88, "learning_rate": 1.9374902119032864e-05, "loss": 0.0112, "step": 130170 }, { "epoch": 1.88, "learning_rate": 1.9374854079294394e-05, "loss": 0.0107, "step": 130180 }, { "epoch": 1.88, "learning_rate": 1.9374806039555923e-05, "loss": 0.009, "step": 130190 }, { "epoch": 1.88, "learning_rate": 1.9374757999817452e-05, "loss": 0.0056, "step": 130200 }, { "epoch": 1.88, "learning_rate": 1.9374709960078978e-05, "loss": 0.0096, "step": 130210 }, { "epoch": 1.88, "learning_rate": 1.9374661920340507e-05, "loss": 0.0069, "step": 130220 }, { "epoch": 1.88, "learning_rate": 1.9374613880602037e-05, "loss": 0.0097, "step": 130230 }, { "epoch": 1.88, "learning_rate": 1.9374565840863563e-05, "loss": 0.0116, "step": 130240 }, { "epoch": 1.88, "learning_rate": 1.9374517801125092e-05, "loss": 0.0086, "step": 130250 }, { "epoch": 1.88, "learning_rate": 1.937446976138662e-05, "loss": 0.0091, "step": 130260 }, { "epoch": 1.88, "learning_rate": 1.937442172164815e-05, "loss": 0.011, "step": 130270 }, { "epoch": 1.88, "learning_rate": 1.9374373681909676e-05, "loss": 0.012, "step": 130280 }, { "epoch": 1.88, "learning_rate": 1.9374325642171205e-05, "loss": 0.0101, "step": 130290 }, { "epoch": 1.88, "learning_rate": 1.9374277602432735e-05, "loss": 0.0079, "step": 130300 }, { "epoch": 1.88, "learning_rate": 1.937422956269426e-05, "loss": 0.0119, "step": 130310 }, { "epoch": 1.88, "learning_rate": 1.937418152295579e-05, "loss": 0.0101, "step": 130320 }, { "epoch": 1.88, "learning_rate": 1.937413348321732e-05, "loss": 0.0091, "step": 130330 }, { "epoch": 1.88, "learning_rate": 1.937408544347885e-05, "loss": 0.0087, "step": 130340 }, { "epoch": 1.88, "learning_rate": 1.9374037403740374e-05, "loss": 0.0117, "step": 130350 }, { "epoch": 1.88, "learning_rate": 1.9373989364001904e-05, "loss": 0.007, "step": 130360 }, { "epoch": 1.88, "learning_rate": 1.9373941324263433e-05, "loss": 0.0109, "step": 130370 }, { "epoch": 1.88, "learning_rate": 1.9373893284524962e-05, "loss": 0.0074, "step": 130380 }, { "epoch": 1.88, "learning_rate": 1.9373845244786488e-05, "loss": 0.0092, "step": 130390 }, { "epoch": 1.88, "learning_rate": 1.9373797205048017e-05, "loss": 0.0087, "step": 130400 }, { "epoch": 1.88, "learning_rate": 1.9373749165309547e-05, "loss": 0.0117, "step": 130410 }, { "epoch": 1.88, "learning_rate": 1.9373701125571072e-05, "loss": 0.009, "step": 130420 }, { "epoch": 1.88, "learning_rate": 1.9373653085832602e-05, "loss": 0.0083, "step": 130430 }, { "epoch": 1.88, "learning_rate": 1.937360504609413e-05, "loss": 0.0107, "step": 130440 }, { "epoch": 1.88, "learning_rate": 1.937355700635566e-05, "loss": 0.008, "step": 130450 }, { "epoch": 1.88, "learning_rate": 1.9373508966617186e-05, "loss": 0.0087, "step": 130460 }, { "epoch": 1.88, "learning_rate": 1.9373460926878715e-05, "loss": 0.0084, "step": 130470 }, { "epoch": 1.88, "learning_rate": 1.9373412887140245e-05, "loss": 0.0093, "step": 130480 }, { "epoch": 1.88, "learning_rate": 1.937336484740177e-05, "loss": 0.0117, "step": 130490 }, { "epoch": 1.88, "learning_rate": 1.93733168076633e-05, "loss": 0.0083, "step": 130500 }, { "epoch": 1.88, "learning_rate": 1.937326876792483e-05, "loss": 0.0088, "step": 130510 }, { "epoch": 1.88, "learning_rate": 1.937322072818636e-05, "loss": 0.012, "step": 130520 }, { "epoch": 1.88, "learning_rate": 1.9373172688447884e-05, "loss": 0.0082, "step": 130530 }, { "epoch": 1.88, "learning_rate": 1.9373124648709414e-05, "loss": 0.0078, "step": 130540 }, { "epoch": 1.88, "learning_rate": 1.9373076608970943e-05, "loss": 0.012, "step": 130550 }, { "epoch": 1.88, "learning_rate": 1.9373028569232472e-05, "loss": 0.009, "step": 130560 }, { "epoch": 1.88, "learning_rate": 1.9372980529493998e-05, "loss": 0.0129, "step": 130570 }, { "epoch": 1.88, "learning_rate": 1.9372932489755527e-05, "loss": 0.008, "step": 130580 }, { "epoch": 1.88, "learning_rate": 1.9372884450017056e-05, "loss": 0.0165, "step": 130590 }, { "epoch": 1.88, "learning_rate": 1.9372836410278582e-05, "loss": 0.0099, "step": 130600 }, { "epoch": 1.88, "learning_rate": 1.937278837054011e-05, "loss": 0.0105, "step": 130610 }, { "epoch": 1.88, "learning_rate": 1.937274033080164e-05, "loss": 0.0098, "step": 130620 }, { "epoch": 1.88, "learning_rate": 1.937269229106317e-05, "loss": 0.0093, "step": 130630 }, { "epoch": 1.88, "learning_rate": 1.9372644251324696e-05, "loss": 0.0083, "step": 130640 }, { "epoch": 1.88, "learning_rate": 1.9372596211586225e-05, "loss": 0.0127, "step": 130650 }, { "epoch": 1.88, "learning_rate": 1.9372548171847755e-05, "loss": 0.0093, "step": 130660 }, { "epoch": 1.88, "learning_rate": 1.937250013210928e-05, "loss": 0.0066, "step": 130670 }, { "epoch": 1.88, "learning_rate": 1.937245209237081e-05, "loss": 0.0102, "step": 130680 }, { "epoch": 1.88, "learning_rate": 1.937240405263234e-05, "loss": 0.0069, "step": 130690 }, { "epoch": 1.88, "learning_rate": 1.9372356012893868e-05, "loss": 0.0154, "step": 130700 }, { "epoch": 1.88, "learning_rate": 1.9372307973155394e-05, "loss": 0.0089, "step": 130710 }, { "epoch": 1.88, "learning_rate": 1.9372259933416923e-05, "loss": 0.0078, "step": 130720 }, { "epoch": 1.88, "learning_rate": 1.9372211893678453e-05, "loss": 0.012, "step": 130730 }, { "epoch": 1.88, "learning_rate": 1.9372163853939982e-05, "loss": 0.0094, "step": 130740 }, { "epoch": 1.88, "learning_rate": 1.9372115814201508e-05, "loss": 0.0074, "step": 130750 }, { "epoch": 1.88, "learning_rate": 1.9372067774463037e-05, "loss": 0.0106, "step": 130760 }, { "epoch": 1.88, "learning_rate": 1.9372019734724566e-05, "loss": 0.0088, "step": 130770 }, { "epoch": 1.88, "learning_rate": 1.9371971694986092e-05, "loss": 0.0119, "step": 130780 }, { "epoch": 1.88, "learning_rate": 1.937192365524762e-05, "loss": 0.0112, "step": 130790 }, { "epoch": 1.89, "learning_rate": 1.937187561550915e-05, "loss": 0.0104, "step": 130800 }, { "epoch": 1.89, "learning_rate": 1.937182757577068e-05, "loss": 0.0096, "step": 130810 }, { "epoch": 1.89, "learning_rate": 1.9371779536032206e-05, "loss": 0.0147, "step": 130820 }, { "epoch": 1.89, "learning_rate": 1.9371731496293735e-05, "loss": 0.0096, "step": 130830 }, { "epoch": 1.89, "learning_rate": 1.9371683456555264e-05, "loss": 0.0128, "step": 130840 }, { "epoch": 1.89, "learning_rate": 1.937163541681679e-05, "loss": 0.0119, "step": 130850 }, { "epoch": 1.89, "learning_rate": 1.937158737707832e-05, "loss": 0.0143, "step": 130860 }, { "epoch": 1.89, "learning_rate": 1.937153933733985e-05, "loss": 0.0104, "step": 130870 }, { "epoch": 1.89, "learning_rate": 1.9371491297601378e-05, "loss": 0.0102, "step": 130880 }, { "epoch": 1.89, "learning_rate": 1.9371443257862904e-05, "loss": 0.0084, "step": 130890 }, { "epoch": 1.89, "learning_rate": 1.9371395218124433e-05, "loss": 0.0092, "step": 130900 }, { "epoch": 1.89, "learning_rate": 1.9371347178385963e-05, "loss": 0.0112, "step": 130910 }, { "epoch": 1.89, "learning_rate": 1.9371299138647492e-05, "loss": 0.0095, "step": 130920 }, { "epoch": 1.89, "learning_rate": 1.9371251098909018e-05, "loss": 0.0076, "step": 130930 }, { "epoch": 1.89, "learning_rate": 1.9371203059170547e-05, "loss": 0.0103, "step": 130940 }, { "epoch": 1.89, "learning_rate": 1.9371155019432076e-05, "loss": 0.0085, "step": 130950 }, { "epoch": 1.89, "learning_rate": 1.9371106979693602e-05, "loss": 0.0107, "step": 130960 }, { "epoch": 1.89, "learning_rate": 1.937105893995513e-05, "loss": 0.01, "step": 130970 }, { "epoch": 1.89, "learning_rate": 1.937101090021666e-05, "loss": 0.0094, "step": 130980 }, { "epoch": 1.89, "learning_rate": 1.937096286047819e-05, "loss": 0.0108, "step": 130990 }, { "epoch": 1.89, "learning_rate": 1.9370914820739716e-05, "loss": 0.0087, "step": 131000 }, { "epoch": 1.89, "learning_rate": 1.9370866781001245e-05, "loss": 0.0103, "step": 131010 }, { "epoch": 1.89, "learning_rate": 1.9370818741262774e-05, "loss": 0.0098, "step": 131020 }, { "epoch": 1.89, "learning_rate": 1.93707707015243e-05, "loss": 0.0086, "step": 131030 }, { "epoch": 1.89, "learning_rate": 1.937072266178583e-05, "loss": 0.0091, "step": 131040 }, { "epoch": 1.89, "learning_rate": 1.937067462204736e-05, "loss": 0.0145, "step": 131050 }, { "epoch": 1.89, "learning_rate": 1.9370626582308888e-05, "loss": 0.0104, "step": 131060 }, { "epoch": 1.89, "learning_rate": 1.9370578542570414e-05, "loss": 0.009, "step": 131070 }, { "epoch": 1.89, "learning_rate": 1.9370530502831943e-05, "loss": 0.0074, "step": 131080 }, { "epoch": 1.89, "learning_rate": 1.9370482463093473e-05, "loss": 0.0078, "step": 131090 }, { "epoch": 1.89, "learning_rate": 1.9370434423355002e-05, "loss": 0.0104, "step": 131100 }, { "epoch": 1.89, "learning_rate": 1.9370386383616528e-05, "loss": 0.0061, "step": 131110 }, { "epoch": 1.89, "learning_rate": 1.9370338343878057e-05, "loss": 0.0126, "step": 131120 }, { "epoch": 1.89, "learning_rate": 1.9370290304139586e-05, "loss": 0.0126, "step": 131130 }, { "epoch": 1.89, "learning_rate": 1.9370242264401112e-05, "loss": 0.0098, "step": 131140 }, { "epoch": 1.89, "learning_rate": 1.937019422466264e-05, "loss": 0.0051, "step": 131150 }, { "epoch": 1.89, "learning_rate": 1.937014618492417e-05, "loss": 0.0114, "step": 131160 }, { "epoch": 1.89, "learning_rate": 1.93700981451857e-05, "loss": 0.0123, "step": 131170 }, { "epoch": 1.89, "learning_rate": 1.9370050105447226e-05, "loss": 0.0079, "step": 131180 }, { "epoch": 1.89, "learning_rate": 1.9370002065708755e-05, "loss": 0.0111, "step": 131190 }, { "epoch": 1.89, "learning_rate": 1.9369954025970284e-05, "loss": 0.01, "step": 131200 }, { "epoch": 1.89, "learning_rate": 1.936990598623181e-05, "loss": 0.0101, "step": 131210 }, { "epoch": 1.89, "learning_rate": 1.936985794649334e-05, "loss": 0.0099, "step": 131220 }, { "epoch": 1.89, "learning_rate": 1.936980990675487e-05, "loss": 0.0055, "step": 131230 }, { "epoch": 1.89, "learning_rate": 1.9369761867016398e-05, "loss": 0.0076, "step": 131240 }, { "epoch": 1.89, "learning_rate": 1.9369713827277924e-05, "loss": 0.0083, "step": 131250 }, { "epoch": 1.89, "learning_rate": 1.9369665787539453e-05, "loss": 0.0109, "step": 131260 }, { "epoch": 1.89, "learning_rate": 1.9369617747800982e-05, "loss": 0.0056, "step": 131270 }, { "epoch": 1.89, "learning_rate": 1.9369569708062512e-05, "loss": 0.0127, "step": 131280 }, { "epoch": 1.89, "learning_rate": 1.9369521668324038e-05, "loss": 0.0106, "step": 131290 }, { "epoch": 1.89, "learning_rate": 1.9369473628585567e-05, "loss": 0.0087, "step": 131300 }, { "epoch": 1.89, "learning_rate": 1.9369425588847096e-05, "loss": 0.0113, "step": 131310 }, { "epoch": 1.89, "learning_rate": 1.9369377549108622e-05, "loss": 0.0084, "step": 131320 }, { "epoch": 1.89, "learning_rate": 1.936932950937015e-05, "loss": 0.0132, "step": 131330 }, { "epoch": 1.89, "learning_rate": 1.936928146963168e-05, "loss": 0.0109, "step": 131340 }, { "epoch": 1.89, "learning_rate": 1.936923342989321e-05, "loss": 0.0093, "step": 131350 }, { "epoch": 1.89, "learning_rate": 1.9369185390154736e-05, "loss": 0.011, "step": 131360 }, { "epoch": 1.89, "learning_rate": 1.9369137350416265e-05, "loss": 0.009, "step": 131370 }, { "epoch": 1.89, "learning_rate": 1.9369089310677794e-05, "loss": 0.0047, "step": 131380 }, { "epoch": 1.89, "learning_rate": 1.936904127093932e-05, "loss": 0.0135, "step": 131390 }, { "epoch": 1.89, "learning_rate": 1.936899323120085e-05, "loss": 0.0087, "step": 131400 }, { "epoch": 1.89, "learning_rate": 1.936894519146238e-05, "loss": 0.0149, "step": 131410 }, { "epoch": 1.89, "learning_rate": 1.9368897151723908e-05, "loss": 0.0102, "step": 131420 }, { "epoch": 1.89, "learning_rate": 1.9368849111985434e-05, "loss": 0.0108, "step": 131430 }, { "epoch": 1.89, "learning_rate": 1.9368801072246963e-05, "loss": 0.0091, "step": 131440 }, { "epoch": 1.89, "learning_rate": 1.9368753032508492e-05, "loss": 0.0092, "step": 131450 }, { "epoch": 1.89, "learning_rate": 1.9368704992770018e-05, "loss": 0.013, "step": 131460 }, { "epoch": 1.89, "learning_rate": 1.9368656953031547e-05, "loss": 0.008, "step": 131470 }, { "epoch": 1.89, "learning_rate": 1.9368608913293077e-05, "loss": 0.0093, "step": 131480 }, { "epoch": 1.9, "learning_rate": 1.9368560873554606e-05, "loss": 0.0091, "step": 131490 }, { "epoch": 1.9, "learning_rate": 1.9368512833816132e-05, "loss": 0.0096, "step": 131500 }, { "epoch": 1.9, "learning_rate": 1.936846479407766e-05, "loss": 0.009, "step": 131510 }, { "epoch": 1.9, "learning_rate": 1.936841675433919e-05, "loss": 0.0096, "step": 131520 }, { "epoch": 1.9, "learning_rate": 1.936836871460072e-05, "loss": 0.0085, "step": 131530 }, { "epoch": 1.9, "learning_rate": 1.9368320674862246e-05, "loss": 0.0098, "step": 131540 }, { "epoch": 1.9, "learning_rate": 1.9368272635123775e-05, "loss": 0.0113, "step": 131550 }, { "epoch": 1.9, "learning_rate": 1.9368224595385304e-05, "loss": 0.0084, "step": 131560 }, { "epoch": 1.9, "learning_rate": 1.9368176555646833e-05, "loss": 0.014, "step": 131570 }, { "epoch": 1.9, "learning_rate": 1.9368128515908363e-05, "loss": 0.0075, "step": 131580 }, { "epoch": 1.9, "learning_rate": 1.9368080476169892e-05, "loss": 0.0106, "step": 131590 }, { "epoch": 1.9, "learning_rate": 1.9368032436431418e-05, "loss": 0.0104, "step": 131600 }, { "epoch": 1.9, "learning_rate": 1.9367984396692947e-05, "loss": 0.0088, "step": 131610 }, { "epoch": 1.9, "learning_rate": 1.9367936356954476e-05, "loss": 0.01, "step": 131620 }, { "epoch": 1.9, "learning_rate": 1.9367888317216002e-05, "loss": 0.012, "step": 131630 }, { "epoch": 1.9, "learning_rate": 1.936784027747753e-05, "loss": 0.0098, "step": 131640 }, { "epoch": 1.9, "learning_rate": 1.936779223773906e-05, "loss": 0.0088, "step": 131650 }, { "epoch": 1.9, "learning_rate": 1.936774419800059e-05, "loss": 0.008, "step": 131660 }, { "epoch": 1.9, "learning_rate": 1.9367696158262116e-05, "loss": 0.0085, "step": 131670 }, { "epoch": 1.9, "learning_rate": 1.9367648118523645e-05, "loss": 0.0108, "step": 131680 }, { "epoch": 1.9, "learning_rate": 1.9367600078785174e-05, "loss": 0.0117, "step": 131690 }, { "epoch": 1.9, "learning_rate": 1.93675520390467e-05, "loss": 0.0109, "step": 131700 }, { "epoch": 1.9, "learning_rate": 1.936750399930823e-05, "loss": 0.0063, "step": 131710 }, { "epoch": 1.9, "learning_rate": 1.936745595956976e-05, "loss": 0.009, "step": 131720 }, { "epoch": 1.9, "learning_rate": 1.9367407919831288e-05, "loss": 0.0087, "step": 131730 }, { "epoch": 1.9, "learning_rate": 1.9367359880092814e-05, "loss": 0.0081, "step": 131740 }, { "epoch": 1.9, "learning_rate": 1.9367311840354343e-05, "loss": 0.0124, "step": 131750 }, { "epoch": 1.9, "learning_rate": 1.9367263800615873e-05, "loss": 0.0106, "step": 131760 }, { "epoch": 1.9, "learning_rate": 1.9367215760877402e-05, "loss": 0.0093, "step": 131770 }, { "epoch": 1.9, "learning_rate": 1.9367167721138928e-05, "loss": 0.0061, "step": 131780 }, { "epoch": 1.9, "learning_rate": 1.9367119681400457e-05, "loss": 0.0101, "step": 131790 }, { "epoch": 1.9, "learning_rate": 1.9367071641661986e-05, "loss": 0.0077, "step": 131800 }, { "epoch": 1.9, "learning_rate": 1.9367023601923512e-05, "loss": 0.0106, "step": 131810 }, { "epoch": 1.9, "learning_rate": 1.936697556218504e-05, "loss": 0.0103, "step": 131820 }, { "epoch": 1.9, "learning_rate": 1.936692752244657e-05, "loss": 0.0099, "step": 131830 }, { "epoch": 1.9, "learning_rate": 1.93668794827081e-05, "loss": 0.0082, "step": 131840 }, { "epoch": 1.9, "learning_rate": 1.9366831442969626e-05, "loss": 0.0086, "step": 131850 }, { "epoch": 1.9, "learning_rate": 1.9366783403231155e-05, "loss": 0.0118, "step": 131860 }, { "epoch": 1.9, "learning_rate": 1.9366735363492684e-05, "loss": 0.0082, "step": 131870 }, { "epoch": 1.9, "learning_rate": 1.936668732375421e-05, "loss": 0.0069, "step": 131880 }, { "epoch": 1.9, "learning_rate": 1.936663928401574e-05, "loss": 0.0099, "step": 131890 }, { "epoch": 1.9, "learning_rate": 1.936659124427727e-05, "loss": 0.0099, "step": 131900 }, { "epoch": 1.9, "learning_rate": 1.9366543204538798e-05, "loss": 0.0098, "step": 131910 }, { "epoch": 1.9, "learning_rate": 1.9366495164800324e-05, "loss": 0.0087, "step": 131920 }, { "epoch": 1.9, "learning_rate": 1.9366447125061853e-05, "loss": 0.0104, "step": 131930 }, { "epoch": 1.9, "learning_rate": 1.9366399085323383e-05, "loss": 0.008, "step": 131940 }, { "epoch": 1.9, "learning_rate": 1.9366351045584912e-05, "loss": 0.0101, "step": 131950 }, { "epoch": 1.9, "learning_rate": 1.9366303005846438e-05, "loss": 0.0111, "step": 131960 }, { "epoch": 1.9, "learning_rate": 1.9366254966107967e-05, "loss": 0.0079, "step": 131970 }, { "epoch": 1.9, "learning_rate": 1.9366206926369496e-05, "loss": 0.0091, "step": 131980 }, { "epoch": 1.9, "learning_rate": 1.9366158886631022e-05, "loss": 0.0061, "step": 131990 }, { "epoch": 1.9, "learning_rate": 1.936611084689255e-05, "loss": 0.0221, "step": 132000 }, { "epoch": 1.9, "learning_rate": 1.936606280715408e-05, "loss": 0.0081, "step": 132010 }, { "epoch": 1.9, "learning_rate": 1.936601476741561e-05, "loss": 0.012, "step": 132020 }, { "epoch": 1.9, "learning_rate": 1.9365966727677136e-05, "loss": 0.0147, "step": 132030 }, { "epoch": 1.9, "learning_rate": 1.9365918687938665e-05, "loss": 0.013, "step": 132040 }, { "epoch": 1.9, "learning_rate": 1.9365870648200194e-05, "loss": 0.008, "step": 132050 }, { "epoch": 1.9, "learning_rate": 1.936582260846172e-05, "loss": 0.0085, "step": 132060 }, { "epoch": 1.9, "learning_rate": 1.936577456872325e-05, "loss": 0.0169, "step": 132070 }, { "epoch": 1.9, "learning_rate": 1.936572652898478e-05, "loss": 0.008, "step": 132080 }, { "epoch": 1.9, "learning_rate": 1.9365678489246308e-05, "loss": 0.0111, "step": 132090 }, { "epoch": 1.9, "learning_rate": 1.9365630449507834e-05, "loss": 0.01, "step": 132100 }, { "epoch": 1.9, "learning_rate": 1.9365582409769363e-05, "loss": 0.0083, "step": 132110 }, { "epoch": 1.9, "learning_rate": 1.9365534370030892e-05, "loss": 0.0092, "step": 132120 }, { "epoch": 1.9, "learning_rate": 1.9365486330292422e-05, "loss": 0.0114, "step": 132130 }, { "epoch": 1.9, "learning_rate": 1.9365438290553948e-05, "loss": 0.0095, "step": 132140 }, { "epoch": 1.9, "learning_rate": 1.9365390250815477e-05, "loss": 0.0142, "step": 132150 }, { "epoch": 1.9, "learning_rate": 1.9365342211077006e-05, "loss": 0.0095, "step": 132160 }, { "epoch": 1.9, "learning_rate": 1.9365294171338532e-05, "loss": 0.0111, "step": 132170 }, { "epoch": 1.9, "learning_rate": 1.936524613160006e-05, "loss": 0.0091, "step": 132180 }, { "epoch": 1.91, "learning_rate": 1.936519809186159e-05, "loss": 0.0098, "step": 132190 }, { "epoch": 1.91, "learning_rate": 1.936515005212312e-05, "loss": 0.0088, "step": 132200 }, { "epoch": 1.91, "learning_rate": 1.9365102012384646e-05, "loss": 0.0085, "step": 132210 }, { "epoch": 1.91, "learning_rate": 1.9365053972646175e-05, "loss": 0.0097, "step": 132220 }, { "epoch": 1.91, "learning_rate": 1.9365005932907704e-05, "loss": 0.0079, "step": 132230 }, { "epoch": 1.91, "learning_rate": 1.936495789316923e-05, "loss": 0.0101, "step": 132240 }, { "epoch": 1.91, "learning_rate": 1.936490985343076e-05, "loss": 0.0109, "step": 132250 }, { "epoch": 1.91, "learning_rate": 1.936486181369229e-05, "loss": 0.0098, "step": 132260 }, { "epoch": 1.91, "learning_rate": 1.9364813773953818e-05, "loss": 0.0084, "step": 132270 }, { "epoch": 1.91, "learning_rate": 1.9364765734215344e-05, "loss": 0.0103, "step": 132280 }, { "epoch": 1.91, "learning_rate": 1.9364717694476873e-05, "loss": 0.013, "step": 132290 }, { "epoch": 1.91, "learning_rate": 1.9364669654738402e-05, "loss": 0.0142, "step": 132300 }, { "epoch": 1.91, "learning_rate": 1.936462161499993e-05, "loss": 0.0122, "step": 132310 }, { "epoch": 1.91, "learning_rate": 1.9364573575261457e-05, "loss": 0.0087, "step": 132320 }, { "epoch": 1.91, "learning_rate": 1.9364525535522987e-05, "loss": 0.0098, "step": 132330 }, { "epoch": 1.91, "learning_rate": 1.9364477495784516e-05, "loss": 0.0109, "step": 132340 }, { "epoch": 1.91, "learning_rate": 1.9364429456046042e-05, "loss": 0.0119, "step": 132350 }, { "epoch": 1.91, "learning_rate": 1.936438141630757e-05, "loss": 0.0109, "step": 132360 }, { "epoch": 1.91, "learning_rate": 1.93643333765691e-05, "loss": 0.0074, "step": 132370 }, { "epoch": 1.91, "learning_rate": 1.936428533683063e-05, "loss": 0.0117, "step": 132380 }, { "epoch": 1.91, "learning_rate": 1.9364237297092156e-05, "loss": 0.0131, "step": 132390 }, { "epoch": 1.91, "learning_rate": 1.9364189257353685e-05, "loss": 0.0076, "step": 132400 }, { "epoch": 1.91, "learning_rate": 1.9364141217615214e-05, "loss": 0.0091, "step": 132410 }, { "epoch": 1.91, "learning_rate": 1.936409317787674e-05, "loss": 0.0104, "step": 132420 }, { "epoch": 1.91, "learning_rate": 1.936404513813827e-05, "loss": 0.0106, "step": 132430 }, { "epoch": 1.91, "learning_rate": 1.93639970983998e-05, "loss": 0.0082, "step": 132440 }, { "epoch": 1.91, "learning_rate": 1.9363949058661328e-05, "loss": 0.0101, "step": 132450 }, { "epoch": 1.91, "learning_rate": 1.9363901018922854e-05, "loss": 0.0075, "step": 132460 }, { "epoch": 1.91, "learning_rate": 1.9363852979184383e-05, "loss": 0.0094, "step": 132470 }, { "epoch": 1.91, "learning_rate": 1.9363804939445912e-05, "loss": 0.0059, "step": 132480 }, { "epoch": 1.91, "learning_rate": 1.936375689970744e-05, "loss": 0.0104, "step": 132490 }, { "epoch": 1.91, "learning_rate": 1.9363708859968967e-05, "loss": 0.0108, "step": 132500 }, { "epoch": 1.91, "learning_rate": 1.9363660820230497e-05, "loss": 0.0098, "step": 132510 }, { "epoch": 1.91, "learning_rate": 1.9363612780492026e-05, "loss": 0.0089, "step": 132520 }, { "epoch": 1.91, "learning_rate": 1.9363564740753552e-05, "loss": 0.0092, "step": 132530 }, { "epoch": 1.91, "learning_rate": 1.936351670101508e-05, "loss": 0.0085, "step": 132540 }, { "epoch": 1.91, "learning_rate": 1.936346866127661e-05, "loss": 0.0071, "step": 132550 }, { "epoch": 1.91, "learning_rate": 1.936342062153814e-05, "loss": 0.0112, "step": 132560 }, { "epoch": 1.91, "learning_rate": 1.9363372581799666e-05, "loss": 0.0118, "step": 132570 }, { "epoch": 1.91, "learning_rate": 1.9363324542061195e-05, "loss": 0.008, "step": 132580 }, { "epoch": 1.91, "learning_rate": 1.9363276502322724e-05, "loss": 0.0096, "step": 132590 }, { "epoch": 1.91, "learning_rate": 1.936322846258425e-05, "loss": 0.009, "step": 132600 }, { "epoch": 1.91, "learning_rate": 1.936318042284578e-05, "loss": 0.009, "step": 132610 }, { "epoch": 1.91, "learning_rate": 1.936313238310731e-05, "loss": 0.0091, "step": 132620 }, { "epoch": 1.91, "learning_rate": 1.9363084343368838e-05, "loss": 0.0179, "step": 132630 }, { "epoch": 1.91, "learning_rate": 1.9363036303630364e-05, "loss": 0.0094, "step": 132640 }, { "epoch": 1.91, "learning_rate": 1.9362988263891893e-05, "loss": 0.0084, "step": 132650 }, { "epoch": 1.91, "learning_rate": 1.9362940224153422e-05, "loss": 0.0116, "step": 132660 }, { "epoch": 1.91, "learning_rate": 1.936289218441495e-05, "loss": 0.0108, "step": 132670 }, { "epoch": 1.91, "learning_rate": 1.9362844144676477e-05, "loss": 0.0131, "step": 132680 }, { "epoch": 1.91, "learning_rate": 1.9362796104938007e-05, "loss": 0.0079, "step": 132690 }, { "epoch": 1.91, "learning_rate": 1.9362748065199536e-05, "loss": 0.0073, "step": 132700 }, { "epoch": 1.91, "learning_rate": 1.9362700025461062e-05, "loss": 0.0059, "step": 132710 }, { "epoch": 1.91, "learning_rate": 1.936265198572259e-05, "loss": 0.0086, "step": 132720 }, { "epoch": 1.91, "learning_rate": 1.936260394598412e-05, "loss": 0.0101, "step": 132730 }, { "epoch": 1.91, "learning_rate": 1.936255590624565e-05, "loss": 0.0097, "step": 132740 }, { "epoch": 1.91, "learning_rate": 1.9362507866507175e-05, "loss": 0.0107, "step": 132750 }, { "epoch": 1.91, "learning_rate": 1.9362459826768705e-05, "loss": 0.0085, "step": 132760 }, { "epoch": 1.91, "learning_rate": 1.9362411787030234e-05, "loss": 0.0112, "step": 132770 }, { "epoch": 1.91, "learning_rate": 1.936236374729176e-05, "loss": 0.0117, "step": 132780 }, { "epoch": 1.91, "learning_rate": 1.936231570755329e-05, "loss": 0.008, "step": 132790 }, { "epoch": 1.91, "learning_rate": 1.936226766781482e-05, "loss": 0.0069, "step": 132800 }, { "epoch": 1.91, "learning_rate": 1.9362219628076348e-05, "loss": 0.0072, "step": 132810 }, { "epoch": 1.91, "learning_rate": 1.9362171588337874e-05, "loss": 0.012, "step": 132820 }, { "epoch": 1.91, "learning_rate": 1.9362123548599403e-05, "loss": 0.0113, "step": 132830 }, { "epoch": 1.91, "learning_rate": 1.9362075508860932e-05, "loss": 0.0129, "step": 132840 }, { "epoch": 1.91, "learning_rate": 1.936202746912246e-05, "loss": 0.0092, "step": 132850 }, { "epoch": 1.91, "learning_rate": 1.9361979429383987e-05, "loss": 0.011, "step": 132860 }, { "epoch": 1.91, "learning_rate": 1.9361931389645517e-05, "loss": 0.0091, "step": 132870 }, { "epoch": 1.92, "learning_rate": 1.9361883349907046e-05, "loss": 0.0135, "step": 132880 }, { "epoch": 1.92, "learning_rate": 1.936183531016857e-05, "loss": 0.0122, "step": 132890 }, { "epoch": 1.92, "learning_rate": 1.93617872704301e-05, "loss": 0.009, "step": 132900 }, { "epoch": 1.92, "learning_rate": 1.936173923069163e-05, "loss": 0.0087, "step": 132910 }, { "epoch": 1.92, "learning_rate": 1.936169119095316e-05, "loss": 0.0118, "step": 132920 }, { "epoch": 1.92, "learning_rate": 1.9361643151214685e-05, "loss": 0.0107, "step": 132930 }, { "epoch": 1.92, "learning_rate": 1.9361595111476215e-05, "loss": 0.0085, "step": 132940 }, { "epoch": 1.92, "learning_rate": 1.9361547071737744e-05, "loss": 0.0083, "step": 132950 }, { "epoch": 1.92, "learning_rate": 1.936149903199927e-05, "loss": 0.0094, "step": 132960 }, { "epoch": 1.92, "learning_rate": 1.93614509922608e-05, "loss": 0.0129, "step": 132970 }, { "epoch": 1.92, "learning_rate": 1.936140295252233e-05, "loss": 0.0088, "step": 132980 }, { "epoch": 1.92, "learning_rate": 1.9361354912783858e-05, "loss": 0.0091, "step": 132990 }, { "epoch": 1.92, "learning_rate": 1.9361306873045383e-05, "loss": 0.0105, "step": 133000 }, { "epoch": 1.92, "learning_rate": 1.9361258833306913e-05, "loss": 0.0135, "step": 133010 }, { "epoch": 1.92, "learning_rate": 1.9361210793568442e-05, "loss": 0.008, "step": 133020 }, { "epoch": 1.92, "learning_rate": 1.9361162753829968e-05, "loss": 0.0071, "step": 133030 }, { "epoch": 1.92, "learning_rate": 1.9361114714091497e-05, "loss": 0.0121, "step": 133040 }, { "epoch": 1.92, "learning_rate": 1.9361066674353026e-05, "loss": 0.0149, "step": 133050 }, { "epoch": 1.92, "learning_rate": 1.9361018634614556e-05, "loss": 0.0098, "step": 133060 }, { "epoch": 1.92, "learning_rate": 1.936097059487608e-05, "loss": 0.0109, "step": 133070 }, { "epoch": 1.92, "learning_rate": 1.936092255513761e-05, "loss": 0.0089, "step": 133080 }, { "epoch": 1.92, "learning_rate": 1.936087451539914e-05, "loss": 0.0112, "step": 133090 }, { "epoch": 1.92, "learning_rate": 1.936082647566067e-05, "loss": 0.0117, "step": 133100 }, { "epoch": 1.92, "learning_rate": 1.9360778435922195e-05, "loss": 0.0076, "step": 133110 }, { "epoch": 1.92, "learning_rate": 1.9360730396183725e-05, "loss": 0.0101, "step": 133120 }, { "epoch": 1.92, "learning_rate": 1.9360682356445254e-05, "loss": 0.0084, "step": 133130 }, { "epoch": 1.92, "learning_rate": 1.936063431670678e-05, "loss": 0.0081, "step": 133140 }, { "epoch": 1.92, "learning_rate": 1.936058627696831e-05, "loss": 0.0086, "step": 133150 }, { "epoch": 1.92, "learning_rate": 1.9360538237229838e-05, "loss": 0.0084, "step": 133160 }, { "epoch": 1.92, "learning_rate": 1.9360490197491367e-05, "loss": 0.0135, "step": 133170 }, { "epoch": 1.92, "learning_rate": 1.9360442157752893e-05, "loss": 0.0146, "step": 133180 }, { "epoch": 1.92, "learning_rate": 1.9360394118014423e-05, "loss": 0.008, "step": 133190 }, { "epoch": 1.92, "learning_rate": 1.9360346078275952e-05, "loss": 0.0064, "step": 133200 }, { "epoch": 1.92, "learning_rate": 1.9360298038537478e-05, "loss": 0.0085, "step": 133210 }, { "epoch": 1.92, "learning_rate": 1.9360249998799007e-05, "loss": 0.0119, "step": 133220 }, { "epoch": 1.92, "learning_rate": 1.9360201959060536e-05, "loss": 0.0064, "step": 133230 }, { "epoch": 1.92, "learning_rate": 1.9360153919322066e-05, "loss": 0.01, "step": 133240 }, { "epoch": 1.92, "learning_rate": 1.936010587958359e-05, "loss": 0.0132, "step": 133250 }, { "epoch": 1.92, "learning_rate": 1.936005783984512e-05, "loss": 0.0082, "step": 133260 }, { "epoch": 1.92, "learning_rate": 1.936000980010665e-05, "loss": 0.0104, "step": 133270 }, { "epoch": 1.92, "learning_rate": 1.935996176036818e-05, "loss": 0.0147, "step": 133280 }, { "epoch": 1.92, "learning_rate": 1.9359913720629705e-05, "loss": 0.0103, "step": 133290 }, { "epoch": 1.92, "learning_rate": 1.9359865680891234e-05, "loss": 0.0101, "step": 133300 }, { "epoch": 1.92, "learning_rate": 1.9359817641152764e-05, "loss": 0.0121, "step": 133310 }, { "epoch": 1.92, "learning_rate": 1.935976960141429e-05, "loss": 0.0089, "step": 133320 }, { "epoch": 1.92, "learning_rate": 1.935972156167582e-05, "loss": 0.0088, "step": 133330 }, { "epoch": 1.92, "learning_rate": 1.9359673521937348e-05, "loss": 0.005, "step": 133340 }, { "epoch": 1.92, "learning_rate": 1.9359625482198877e-05, "loss": 0.0134, "step": 133350 }, { "epoch": 1.92, "learning_rate": 1.9359577442460403e-05, "loss": 0.0105, "step": 133360 }, { "epoch": 1.92, "learning_rate": 1.9359529402721933e-05, "loss": 0.0087, "step": 133370 }, { "epoch": 1.92, "learning_rate": 1.9359481362983462e-05, "loss": 0.0107, "step": 133380 }, { "epoch": 1.92, "learning_rate": 1.9359433323244988e-05, "loss": 0.01, "step": 133390 }, { "epoch": 1.92, "learning_rate": 1.9359385283506517e-05, "loss": 0.012, "step": 133400 }, { "epoch": 1.92, "learning_rate": 1.9359337243768046e-05, "loss": 0.0108, "step": 133410 }, { "epoch": 1.92, "learning_rate": 1.9359289204029576e-05, "loss": 0.0086, "step": 133420 }, { "epoch": 1.92, "learning_rate": 1.93592411642911e-05, "loss": 0.0064, "step": 133430 }, { "epoch": 1.92, "learning_rate": 1.935919312455263e-05, "loss": 0.0085, "step": 133440 }, { "epoch": 1.92, "learning_rate": 1.935914508481416e-05, "loss": 0.0079, "step": 133450 }, { "epoch": 1.92, "learning_rate": 1.935909704507569e-05, "loss": 0.0096, "step": 133460 }, { "epoch": 1.92, "learning_rate": 1.9359049005337215e-05, "loss": 0.0086, "step": 133470 }, { "epoch": 1.92, "learning_rate": 1.9359000965598744e-05, "loss": 0.0091, "step": 133480 }, { "epoch": 1.92, "learning_rate": 1.9358952925860274e-05, "loss": 0.0109, "step": 133490 }, { "epoch": 1.92, "learning_rate": 1.93589048861218e-05, "loss": 0.0094, "step": 133500 }, { "epoch": 1.92, "learning_rate": 1.935885684638333e-05, "loss": 0.0088, "step": 133510 }, { "epoch": 1.92, "learning_rate": 1.9358808806644858e-05, "loss": 0.0089, "step": 133520 }, { "epoch": 1.92, "learning_rate": 1.9358760766906387e-05, "loss": 0.0082, "step": 133530 }, { "epoch": 1.92, "learning_rate": 1.9358712727167913e-05, "loss": 0.0114, "step": 133540 }, { "epoch": 1.92, "learning_rate": 1.9358664687429442e-05, "loss": 0.0077, "step": 133550 }, { "epoch": 1.92, "learning_rate": 1.9358616647690972e-05, "loss": 0.0092, "step": 133560 }, { "epoch": 1.93, "learning_rate": 1.9358568607952498e-05, "loss": 0.0084, "step": 133570 }, { "epoch": 1.93, "learning_rate": 1.9358520568214027e-05, "loss": 0.0101, "step": 133580 }, { "epoch": 1.93, "learning_rate": 1.9358472528475556e-05, "loss": 0.0089, "step": 133590 }, { "epoch": 1.93, "learning_rate": 1.9358424488737085e-05, "loss": 0.008, "step": 133600 }, { "epoch": 1.93, "learning_rate": 1.935837644899861e-05, "loss": 0.0113, "step": 133610 }, { "epoch": 1.93, "learning_rate": 1.935832840926014e-05, "loss": 0.0097, "step": 133620 }, { "epoch": 1.93, "learning_rate": 1.935828036952167e-05, "loss": 0.0094, "step": 133630 }, { "epoch": 1.93, "learning_rate": 1.93582323297832e-05, "loss": 0.0064, "step": 133640 }, { "epoch": 1.93, "learning_rate": 1.9358184290044725e-05, "loss": 0.0129, "step": 133650 }, { "epoch": 1.93, "learning_rate": 1.9358136250306254e-05, "loss": 0.0081, "step": 133660 }, { "epoch": 1.93, "learning_rate": 1.9358088210567784e-05, "loss": 0.0084, "step": 133670 }, { "epoch": 1.93, "learning_rate": 1.935804017082931e-05, "loss": 0.0112, "step": 133680 }, { "epoch": 1.93, "learning_rate": 1.935799213109084e-05, "loss": 0.0152, "step": 133690 }, { "epoch": 1.93, "learning_rate": 1.9357944091352368e-05, "loss": 0.0076, "step": 133700 }, { "epoch": 1.93, "learning_rate": 1.9357896051613897e-05, "loss": 0.0085, "step": 133710 }, { "epoch": 1.93, "learning_rate": 1.9357848011875423e-05, "loss": 0.0084, "step": 133720 }, { "epoch": 1.93, "learning_rate": 1.9357799972136952e-05, "loss": 0.0101, "step": 133730 }, { "epoch": 1.93, "learning_rate": 1.935775193239848e-05, "loss": 0.011, "step": 133740 }, { "epoch": 1.93, "learning_rate": 1.9357703892660008e-05, "loss": 0.0106, "step": 133750 }, { "epoch": 1.93, "learning_rate": 1.9357655852921537e-05, "loss": 0.0111, "step": 133760 }, { "epoch": 1.93, "learning_rate": 1.9357607813183066e-05, "loss": 0.0107, "step": 133770 }, { "epoch": 1.93, "learning_rate": 1.9357559773444595e-05, "loss": 0.0092, "step": 133780 }, { "epoch": 1.93, "learning_rate": 1.935751173370612e-05, "loss": 0.0075, "step": 133790 }, { "epoch": 1.93, "learning_rate": 1.935746369396765e-05, "loss": 0.0124, "step": 133800 }, { "epoch": 1.93, "learning_rate": 1.935741565422918e-05, "loss": 0.0141, "step": 133810 }, { "epoch": 1.93, "learning_rate": 1.935736761449071e-05, "loss": 0.0107, "step": 133820 }, { "epoch": 1.93, "learning_rate": 1.9357319574752235e-05, "loss": 0.0118, "step": 133830 }, { "epoch": 1.93, "learning_rate": 1.9357271535013764e-05, "loss": 0.01, "step": 133840 }, { "epoch": 1.93, "learning_rate": 1.9357223495275293e-05, "loss": 0.0083, "step": 133850 }, { "epoch": 1.93, "learning_rate": 1.935717545553682e-05, "loss": 0.0095, "step": 133860 }, { "epoch": 1.93, "learning_rate": 1.935712741579835e-05, "loss": 0.0092, "step": 133870 }, { "epoch": 1.93, "learning_rate": 1.9357079376059878e-05, "loss": 0.0071, "step": 133880 }, { "epoch": 1.93, "learning_rate": 1.9357031336321407e-05, "loss": 0.011, "step": 133890 }, { "epoch": 1.93, "learning_rate": 1.9356983296582933e-05, "loss": 0.0095, "step": 133900 }, { "epoch": 1.93, "learning_rate": 1.9356935256844462e-05, "loss": 0.0111, "step": 133910 }, { "epoch": 1.93, "learning_rate": 1.935688721710599e-05, "loss": 0.0076, "step": 133920 }, { "epoch": 1.93, "learning_rate": 1.9356839177367517e-05, "loss": 0.011, "step": 133930 }, { "epoch": 1.93, "learning_rate": 1.9356791137629047e-05, "loss": 0.011, "step": 133940 }, { "epoch": 1.93, "learning_rate": 1.9356743097890576e-05, "loss": 0.0108, "step": 133950 }, { "epoch": 1.93, "learning_rate": 1.9356695058152105e-05, "loss": 0.0093, "step": 133960 }, { "epoch": 1.93, "learning_rate": 1.935664701841363e-05, "loss": 0.0168, "step": 133970 }, { "epoch": 1.93, "learning_rate": 1.935659897867516e-05, "loss": 0.0067, "step": 133980 }, { "epoch": 1.93, "learning_rate": 1.935655093893669e-05, "loss": 0.0099, "step": 133990 }, { "epoch": 1.93, "learning_rate": 1.935650289919822e-05, "loss": 0.011, "step": 134000 }, { "epoch": 1.93, "learning_rate": 1.9356454859459745e-05, "loss": 0.0107, "step": 134010 }, { "epoch": 1.93, "learning_rate": 1.9356406819721274e-05, "loss": 0.0087, "step": 134020 }, { "epoch": 1.93, "learning_rate": 1.9356358779982803e-05, "loss": 0.0091, "step": 134030 }, { "epoch": 1.93, "learning_rate": 1.935631074024433e-05, "loss": 0.0077, "step": 134040 }, { "epoch": 1.93, "learning_rate": 1.935626270050586e-05, "loss": 0.0085, "step": 134050 }, { "epoch": 1.93, "learning_rate": 1.9356214660767388e-05, "loss": 0.0104, "step": 134060 }, { "epoch": 1.93, "learning_rate": 1.9356166621028917e-05, "loss": 0.0078, "step": 134070 }, { "epoch": 1.93, "learning_rate": 1.9356118581290443e-05, "loss": 0.0077, "step": 134080 }, { "epoch": 1.93, "learning_rate": 1.9356070541551972e-05, "loss": 0.0111, "step": 134090 }, { "epoch": 1.93, "learning_rate": 1.93560225018135e-05, "loss": 0.0078, "step": 134100 }, { "epoch": 1.93, "learning_rate": 1.9355974462075027e-05, "loss": 0.0116, "step": 134110 }, { "epoch": 1.93, "learning_rate": 1.9355926422336557e-05, "loss": 0.0114, "step": 134120 }, { "epoch": 1.93, "learning_rate": 1.935587838259809e-05, "loss": 0.0104, "step": 134130 }, { "epoch": 1.93, "learning_rate": 1.9355830342859615e-05, "loss": 0.0096, "step": 134140 }, { "epoch": 1.93, "learning_rate": 1.9355782303121144e-05, "loss": 0.0099, "step": 134150 }, { "epoch": 1.93, "learning_rate": 1.9355734263382674e-05, "loss": 0.0099, "step": 134160 }, { "epoch": 1.93, "learning_rate": 1.93556862236442e-05, "loss": 0.0108, "step": 134170 }, { "epoch": 1.93, "learning_rate": 1.935563818390573e-05, "loss": 0.0094, "step": 134180 }, { "epoch": 1.93, "learning_rate": 1.9355590144167258e-05, "loss": 0.0102, "step": 134190 }, { "epoch": 1.93, "learning_rate": 1.9355542104428787e-05, "loss": 0.0102, "step": 134200 }, { "epoch": 1.93, "learning_rate": 1.9355494064690313e-05, "loss": 0.0119, "step": 134210 }, { "epoch": 1.93, "learning_rate": 1.9355446024951843e-05, "loss": 0.0076, "step": 134220 }, { "epoch": 1.93, "learning_rate": 1.9355397985213372e-05, "loss": 0.0118, "step": 134230 }, { "epoch": 1.93, "learning_rate": 1.93553499454749e-05, "loss": 0.0104, "step": 134240 }, { "epoch": 1.93, "learning_rate": 1.9355301905736427e-05, "loss": 0.0097, "step": 134250 }, { "epoch": 1.93, "learning_rate": 1.9355253865997956e-05, "loss": 0.0139, "step": 134260 }, { "epoch": 1.94, "learning_rate": 1.9355205826259486e-05, "loss": 0.0101, "step": 134270 }, { "epoch": 1.94, "learning_rate": 1.935515778652101e-05, "loss": 0.0076, "step": 134280 }, { "epoch": 1.94, "learning_rate": 1.935510974678254e-05, "loss": 0.0113, "step": 134290 }, { "epoch": 1.94, "learning_rate": 1.935506170704407e-05, "loss": 0.012, "step": 134300 }, { "epoch": 1.94, "learning_rate": 1.93550136673056e-05, "loss": 0.011, "step": 134310 }, { "epoch": 1.94, "learning_rate": 1.9354965627567125e-05, "loss": 0.0092, "step": 134320 }, { "epoch": 1.94, "learning_rate": 1.9354917587828654e-05, "loss": 0.0115, "step": 134330 }, { "epoch": 1.94, "learning_rate": 1.9354869548090184e-05, "loss": 0.0081, "step": 134340 }, { "epoch": 1.94, "learning_rate": 1.935482150835171e-05, "loss": 0.0081, "step": 134350 }, { "epoch": 1.94, "learning_rate": 1.935477346861324e-05, "loss": 0.008, "step": 134360 }, { "epoch": 1.94, "learning_rate": 1.9354725428874768e-05, "loss": 0.0092, "step": 134370 }, { "epoch": 1.94, "learning_rate": 1.9354677389136297e-05, "loss": 0.0123, "step": 134380 }, { "epoch": 1.94, "learning_rate": 1.9354629349397823e-05, "loss": 0.0179, "step": 134390 }, { "epoch": 1.94, "learning_rate": 1.9354581309659352e-05, "loss": 0.009, "step": 134400 }, { "epoch": 1.94, "learning_rate": 1.9354533269920882e-05, "loss": 0.0125, "step": 134410 }, { "epoch": 1.94, "learning_rate": 1.9354485230182408e-05, "loss": 0.0147, "step": 134420 }, { "epoch": 1.94, "learning_rate": 1.9354437190443937e-05, "loss": 0.0116, "step": 134430 }, { "epoch": 1.94, "learning_rate": 1.9354389150705466e-05, "loss": 0.0103, "step": 134440 }, { "epoch": 1.94, "learning_rate": 1.9354341110966995e-05, "loss": 0.0106, "step": 134450 }, { "epoch": 1.94, "learning_rate": 1.935429307122852e-05, "loss": 0.0096, "step": 134460 }, { "epoch": 1.94, "learning_rate": 1.935424503149005e-05, "loss": 0.0102, "step": 134470 }, { "epoch": 1.94, "learning_rate": 1.935419699175158e-05, "loss": 0.008, "step": 134480 }, { "epoch": 1.94, "learning_rate": 1.935414895201311e-05, "loss": 0.0082, "step": 134490 }, { "epoch": 1.94, "learning_rate": 1.9354100912274635e-05, "loss": 0.0102, "step": 134500 }, { "epoch": 1.94, "learning_rate": 1.9354052872536164e-05, "loss": 0.0097, "step": 134510 }, { "epoch": 1.94, "learning_rate": 1.9354004832797694e-05, "loss": 0.0103, "step": 134520 }, { "epoch": 1.94, "learning_rate": 1.935395679305922e-05, "loss": 0.0095, "step": 134530 }, { "epoch": 1.94, "learning_rate": 1.935390875332075e-05, "loss": 0.0054, "step": 134540 }, { "epoch": 1.94, "learning_rate": 1.9353860713582278e-05, "loss": 0.0073, "step": 134550 }, { "epoch": 1.94, "learning_rate": 1.9353812673843807e-05, "loss": 0.0122, "step": 134560 }, { "epoch": 1.94, "learning_rate": 1.9353764634105333e-05, "loss": 0.0097, "step": 134570 }, { "epoch": 1.94, "learning_rate": 1.9353716594366862e-05, "loss": 0.0091, "step": 134580 }, { "epoch": 1.94, "learning_rate": 1.935366855462839e-05, "loss": 0.0076, "step": 134590 }, { "epoch": 1.94, "learning_rate": 1.9353620514889918e-05, "loss": 0.0074, "step": 134600 }, { "epoch": 1.94, "learning_rate": 1.9353572475151447e-05, "loss": 0.01, "step": 134610 }, { "epoch": 1.94, "learning_rate": 1.9353524435412976e-05, "loss": 0.0126, "step": 134620 }, { "epoch": 1.94, "learning_rate": 1.9353476395674505e-05, "loss": 0.0123, "step": 134630 }, { "epoch": 1.94, "learning_rate": 1.935342835593603e-05, "loss": 0.0084, "step": 134640 }, { "epoch": 1.94, "learning_rate": 1.935338031619756e-05, "loss": 0.0114, "step": 134650 }, { "epoch": 1.94, "learning_rate": 1.935333227645909e-05, "loss": 0.0101, "step": 134660 }, { "epoch": 1.94, "learning_rate": 1.935328423672062e-05, "loss": 0.0122, "step": 134670 }, { "epoch": 1.94, "learning_rate": 1.9353236196982145e-05, "loss": 0.0086, "step": 134680 }, { "epoch": 1.94, "learning_rate": 1.9353188157243674e-05, "loss": 0.0067, "step": 134690 }, { "epoch": 1.94, "learning_rate": 1.9353140117505203e-05, "loss": 0.0071, "step": 134700 }, { "epoch": 1.94, "learning_rate": 1.935309207776673e-05, "loss": 0.0074, "step": 134710 }, { "epoch": 1.94, "learning_rate": 1.935304403802826e-05, "loss": 0.0127, "step": 134720 }, { "epoch": 1.94, "learning_rate": 1.9352995998289788e-05, "loss": 0.0098, "step": 134730 }, { "epoch": 1.94, "learning_rate": 1.9352947958551317e-05, "loss": 0.0088, "step": 134740 }, { "epoch": 1.94, "learning_rate": 1.9352899918812843e-05, "loss": 0.0095, "step": 134750 }, { "epoch": 1.94, "learning_rate": 1.9352851879074372e-05, "loss": 0.0067, "step": 134760 }, { "epoch": 1.94, "learning_rate": 1.93528038393359e-05, "loss": 0.0075, "step": 134770 }, { "epoch": 1.94, "learning_rate": 1.9352755799597427e-05, "loss": 0.0093, "step": 134780 }, { "epoch": 1.94, "learning_rate": 1.9352707759858957e-05, "loss": 0.0104, "step": 134790 }, { "epoch": 1.94, "learning_rate": 1.9352659720120486e-05, "loss": 0.0105, "step": 134800 }, { "epoch": 1.94, "learning_rate": 1.9352611680382015e-05, "loss": 0.0094, "step": 134810 }, { "epoch": 1.94, "learning_rate": 1.935256364064354e-05, "loss": 0.0099, "step": 134820 }, { "epoch": 1.94, "learning_rate": 1.935251560090507e-05, "loss": 0.0078, "step": 134830 }, { "epoch": 1.94, "learning_rate": 1.93524675611666e-05, "loss": 0.009, "step": 134840 }, { "epoch": 1.94, "learning_rate": 1.935241952142813e-05, "loss": 0.0104, "step": 134850 }, { "epoch": 1.94, "learning_rate": 1.9352371481689655e-05, "loss": 0.0076, "step": 134860 }, { "epoch": 1.94, "learning_rate": 1.9352323441951184e-05, "loss": 0.0092, "step": 134870 }, { "epoch": 1.94, "learning_rate": 1.9352275402212713e-05, "loss": 0.0104, "step": 134880 }, { "epoch": 1.94, "learning_rate": 1.935222736247424e-05, "loss": 0.0099, "step": 134890 }, { "epoch": 1.94, "learning_rate": 1.935217932273577e-05, "loss": 0.0089, "step": 134900 }, { "epoch": 1.94, "learning_rate": 1.9352131282997298e-05, "loss": 0.0073, "step": 134910 }, { "epoch": 1.94, "learning_rate": 1.9352083243258827e-05, "loss": 0.0114, "step": 134920 }, { "epoch": 1.94, "learning_rate": 1.9352035203520353e-05, "loss": 0.0099, "step": 134930 }, { "epoch": 1.94, "learning_rate": 1.9351987163781882e-05, "loss": 0.011, "step": 134940 }, { "epoch": 1.94, "learning_rate": 1.935193912404341e-05, "loss": 0.0094, "step": 134950 }, { "epoch": 1.95, "learning_rate": 1.9351891084304937e-05, "loss": 0.0126, "step": 134960 }, { "epoch": 1.95, "learning_rate": 1.9351843044566467e-05, "loss": 0.0089, "step": 134970 }, { "epoch": 1.95, "learning_rate": 1.9351795004827996e-05, "loss": 0.0089, "step": 134980 }, { "epoch": 1.95, "learning_rate": 1.9351746965089525e-05, "loss": 0.0108, "step": 134990 }, { "epoch": 1.95, "learning_rate": 1.935169892535105e-05, "loss": 0.0078, "step": 135000 }, { "epoch": 1.95, "learning_rate": 1.935165088561258e-05, "loss": 0.0083, "step": 135010 }, { "epoch": 1.95, "learning_rate": 1.935160284587411e-05, "loss": 0.0106, "step": 135020 }, { "epoch": 1.95, "learning_rate": 1.935155480613564e-05, "loss": 0.0067, "step": 135030 }, { "epoch": 1.95, "learning_rate": 1.9351506766397165e-05, "loss": 0.0082, "step": 135040 }, { "epoch": 1.95, "learning_rate": 1.9351458726658694e-05, "loss": 0.0079, "step": 135050 }, { "epoch": 1.95, "learning_rate": 1.9351410686920223e-05, "loss": 0.0098, "step": 135060 }, { "epoch": 1.95, "learning_rate": 1.935136264718175e-05, "loss": 0.0087, "step": 135070 }, { "epoch": 1.95, "learning_rate": 1.935131460744328e-05, "loss": 0.0108, "step": 135080 }, { "epoch": 1.95, "learning_rate": 1.9351266567704808e-05, "loss": 0.0092, "step": 135090 }, { "epoch": 1.95, "learning_rate": 1.9351218527966337e-05, "loss": 0.0094, "step": 135100 }, { "epoch": 1.95, "learning_rate": 1.9351170488227863e-05, "loss": 0.0116, "step": 135110 }, { "epoch": 1.95, "learning_rate": 1.9351122448489392e-05, "loss": 0.0087, "step": 135120 }, { "epoch": 1.95, "learning_rate": 1.935107440875092e-05, "loss": 0.0076, "step": 135130 }, { "epoch": 1.95, "learning_rate": 1.9351026369012447e-05, "loss": 0.0093, "step": 135140 }, { "epoch": 1.95, "learning_rate": 1.9350978329273977e-05, "loss": 0.0071, "step": 135150 }, { "epoch": 1.95, "learning_rate": 1.9350930289535506e-05, "loss": 0.0081, "step": 135160 }, { "epoch": 1.95, "learning_rate": 1.9350882249797035e-05, "loss": 0.0083, "step": 135170 }, { "epoch": 1.95, "learning_rate": 1.935083421005856e-05, "loss": 0.008, "step": 135180 }, { "epoch": 1.95, "learning_rate": 1.935078617032009e-05, "loss": 0.0101, "step": 135190 }, { "epoch": 1.95, "learning_rate": 1.935073813058162e-05, "loss": 0.0119, "step": 135200 }, { "epoch": 1.95, "learning_rate": 1.935069009084315e-05, "loss": 0.0105, "step": 135210 }, { "epoch": 1.95, "learning_rate": 1.9350642051104675e-05, "loss": 0.008, "step": 135220 }, { "epoch": 1.95, "learning_rate": 1.9350594011366204e-05, "loss": 0.0079, "step": 135230 }, { "epoch": 1.95, "learning_rate": 1.9350545971627733e-05, "loss": 0.0093, "step": 135240 }, { "epoch": 1.95, "learning_rate": 1.935049793188926e-05, "loss": 0.0104, "step": 135250 }, { "epoch": 1.95, "learning_rate": 1.935044989215079e-05, "loss": 0.0084, "step": 135260 }, { "epoch": 1.95, "learning_rate": 1.9350401852412318e-05, "loss": 0.0093, "step": 135270 }, { "epoch": 1.95, "learning_rate": 1.9350353812673847e-05, "loss": 0.0068, "step": 135280 }, { "epoch": 1.95, "learning_rate": 1.9350305772935373e-05, "loss": 0.0115, "step": 135290 }, { "epoch": 1.95, "learning_rate": 1.9350257733196902e-05, "loss": 0.0104, "step": 135300 }, { "epoch": 1.95, "learning_rate": 1.935020969345843e-05, "loss": 0.0101, "step": 135310 }, { "epoch": 1.95, "learning_rate": 1.9350161653719957e-05, "loss": 0.0122, "step": 135320 }, { "epoch": 1.95, "learning_rate": 1.9350113613981486e-05, "loss": 0.0116, "step": 135330 }, { "epoch": 1.95, "learning_rate": 1.9350065574243016e-05, "loss": 0.009, "step": 135340 }, { "epoch": 1.95, "learning_rate": 1.9350017534504545e-05, "loss": 0.0093, "step": 135350 }, { "epoch": 1.95, "learning_rate": 1.934996949476607e-05, "loss": 0.0074, "step": 135360 }, { "epoch": 1.95, "learning_rate": 1.93499214550276e-05, "loss": 0.0073, "step": 135370 }, { "epoch": 1.95, "learning_rate": 1.934987341528913e-05, "loss": 0.0099, "step": 135380 }, { "epoch": 1.95, "learning_rate": 1.934982537555066e-05, "loss": 0.0096, "step": 135390 }, { "epoch": 1.95, "learning_rate": 1.9349777335812185e-05, "loss": 0.0104, "step": 135400 }, { "epoch": 1.95, "learning_rate": 1.9349729296073714e-05, "loss": 0.0081, "step": 135410 }, { "epoch": 1.95, "learning_rate": 1.9349681256335243e-05, "loss": 0.0067, "step": 135420 }, { "epoch": 1.95, "learning_rate": 1.934963321659677e-05, "loss": 0.0119, "step": 135430 }, { "epoch": 1.95, "learning_rate": 1.9349585176858298e-05, "loss": 0.0086, "step": 135440 }, { "epoch": 1.95, "learning_rate": 1.9349537137119828e-05, "loss": 0.0119, "step": 135450 }, { "epoch": 1.95, "learning_rate": 1.9349489097381357e-05, "loss": 0.0093, "step": 135460 }, { "epoch": 1.95, "learning_rate": 1.9349441057642883e-05, "loss": 0.0089, "step": 135470 }, { "epoch": 1.95, "learning_rate": 1.9349393017904412e-05, "loss": 0.0101, "step": 135480 }, { "epoch": 1.95, "learning_rate": 1.934934497816594e-05, "loss": 0.0101, "step": 135490 }, { "epoch": 1.95, "learning_rate": 1.9349296938427467e-05, "loss": 0.0114, "step": 135500 }, { "epoch": 1.95, "learning_rate": 1.9349248898688996e-05, "loss": 0.0104, "step": 135510 }, { "epoch": 1.95, "learning_rate": 1.9349200858950526e-05, "loss": 0.0101, "step": 135520 }, { "epoch": 1.95, "learning_rate": 1.9349152819212055e-05, "loss": 0.0108, "step": 135530 }, { "epoch": 1.95, "learning_rate": 1.934910477947358e-05, "loss": 0.0094, "step": 135540 }, { "epoch": 1.95, "learning_rate": 1.934905673973511e-05, "loss": 0.0093, "step": 135550 }, { "epoch": 1.95, "learning_rate": 1.934900869999664e-05, "loss": 0.0114, "step": 135560 }, { "epoch": 1.95, "learning_rate": 1.934896066025817e-05, "loss": 0.0102, "step": 135570 }, { "epoch": 1.95, "learning_rate": 1.9348912620519695e-05, "loss": 0.0091, "step": 135580 }, { "epoch": 1.95, "learning_rate": 1.9348864580781224e-05, "loss": 0.0094, "step": 135590 }, { "epoch": 1.95, "learning_rate": 1.9348816541042753e-05, "loss": 0.0079, "step": 135600 }, { "epoch": 1.95, "learning_rate": 1.934876850130428e-05, "loss": 0.0138, "step": 135610 }, { "epoch": 1.95, "learning_rate": 1.9348720461565808e-05, "loss": 0.0077, "step": 135620 }, { "epoch": 1.95, "learning_rate": 1.9348672421827337e-05, "loss": 0.0078, "step": 135630 }, { "epoch": 1.95, "learning_rate": 1.9348624382088867e-05, "loss": 0.0094, "step": 135640 }, { "epoch": 1.95, "learning_rate": 1.9348576342350393e-05, "loss": 0.0106, "step": 135650 }, { "epoch": 1.96, "learning_rate": 1.9348528302611922e-05, "loss": 0.0084, "step": 135660 }, { "epoch": 1.96, "learning_rate": 1.934848026287345e-05, "loss": 0.0121, "step": 135670 }, { "epoch": 1.96, "learning_rate": 1.9348432223134977e-05, "loss": 0.0115, "step": 135680 }, { "epoch": 1.96, "learning_rate": 1.9348388987370355e-05, "loss": 0.0102, "step": 135690 }, { "epoch": 1.96, "learning_rate": 1.9348340947631884e-05, "loss": 0.01, "step": 135700 }, { "epoch": 1.96, "learning_rate": 1.934829290789341e-05, "loss": 0.0115, "step": 135710 }, { "epoch": 1.96, "learning_rate": 1.934824486815494e-05, "loss": 0.0132, "step": 135720 }, { "epoch": 1.96, "learning_rate": 1.934819682841647e-05, "loss": 0.0105, "step": 135730 }, { "epoch": 1.96, "learning_rate": 1.9348148788677995e-05, "loss": 0.009, "step": 135740 }, { "epoch": 1.96, "learning_rate": 1.9348100748939524e-05, "loss": 0.0096, "step": 135750 }, { "epoch": 1.96, "learning_rate": 1.9348052709201053e-05, "loss": 0.0108, "step": 135760 }, { "epoch": 1.96, "learning_rate": 1.9348004669462582e-05, "loss": 0.0081, "step": 135770 }, { "epoch": 1.96, "learning_rate": 1.934795662972411e-05, "loss": 0.0099, "step": 135780 }, { "epoch": 1.96, "learning_rate": 1.9347908589985638e-05, "loss": 0.0076, "step": 135790 }, { "epoch": 1.96, "learning_rate": 1.9347860550247167e-05, "loss": 0.0078, "step": 135800 }, { "epoch": 1.96, "learning_rate": 1.9347812510508696e-05, "loss": 0.0085, "step": 135810 }, { "epoch": 1.96, "learning_rate": 1.9347764470770222e-05, "loss": 0.0076, "step": 135820 }, { "epoch": 1.96, "learning_rate": 1.934771643103175e-05, "loss": 0.0126, "step": 135830 }, { "epoch": 1.96, "learning_rate": 1.934766839129328e-05, "loss": 0.008, "step": 135840 }, { "epoch": 1.96, "learning_rate": 1.9347620351554806e-05, "loss": 0.0097, "step": 135850 }, { "epoch": 1.96, "learning_rate": 1.9347572311816336e-05, "loss": 0.0094, "step": 135860 }, { "epoch": 1.96, "learning_rate": 1.9347524272077865e-05, "loss": 0.0099, "step": 135870 }, { "epoch": 1.96, "learning_rate": 1.9347476232339394e-05, "loss": 0.0065, "step": 135880 }, { "epoch": 1.96, "learning_rate": 1.934742819260092e-05, "loss": 0.0086, "step": 135890 }, { "epoch": 1.96, "learning_rate": 1.934738015286245e-05, "loss": 0.0105, "step": 135900 }, { "epoch": 1.96, "learning_rate": 1.934733211312398e-05, "loss": 0.0057, "step": 135910 }, { "epoch": 1.96, "learning_rate": 1.9347284073385505e-05, "loss": 0.0092, "step": 135920 }, { "epoch": 1.96, "learning_rate": 1.9347236033647034e-05, "loss": 0.01, "step": 135930 }, { "epoch": 1.96, "learning_rate": 1.9347187993908563e-05, "loss": 0.0111, "step": 135940 }, { "epoch": 1.96, "learning_rate": 1.9347139954170092e-05, "loss": 0.0094, "step": 135950 }, { "epoch": 1.96, "learning_rate": 1.9347091914431618e-05, "loss": 0.0076, "step": 135960 }, { "epoch": 1.96, "learning_rate": 1.9347043874693148e-05, "loss": 0.0115, "step": 135970 }, { "epoch": 1.96, "learning_rate": 1.9346995834954677e-05, "loss": 0.0112, "step": 135980 }, { "epoch": 1.96, "learning_rate": 1.9346947795216203e-05, "loss": 0.0097, "step": 135990 }, { "epoch": 1.96, "learning_rate": 1.9346899755477732e-05, "loss": 0.0091, "step": 136000 }, { "epoch": 1.96, "learning_rate": 1.934685171573926e-05, "loss": 0.0104, "step": 136010 }, { "epoch": 1.96, "learning_rate": 1.934680367600079e-05, "loss": 0.0094, "step": 136020 }, { "epoch": 1.96, "learning_rate": 1.9346755636262316e-05, "loss": 0.0072, "step": 136030 }, { "epoch": 1.96, "learning_rate": 1.9346707596523846e-05, "loss": 0.0087, "step": 136040 }, { "epoch": 1.96, "learning_rate": 1.9346659556785375e-05, "loss": 0.0118, "step": 136050 }, { "epoch": 1.96, "learning_rate": 1.9346611517046904e-05, "loss": 0.0097, "step": 136060 }, { "epoch": 1.96, "learning_rate": 1.934656347730843e-05, "loss": 0.0067, "step": 136070 }, { "epoch": 1.96, "learning_rate": 1.934651543756996e-05, "loss": 0.0083, "step": 136080 }, { "epoch": 1.96, "learning_rate": 1.934646739783149e-05, "loss": 0.0107, "step": 136090 }, { "epoch": 1.96, "learning_rate": 1.9346419358093014e-05, "loss": 0.0094, "step": 136100 }, { "epoch": 1.96, "learning_rate": 1.9346371318354544e-05, "loss": 0.0073, "step": 136110 }, { "epoch": 1.96, "learning_rate": 1.9346323278616073e-05, "loss": 0.0097, "step": 136120 }, { "epoch": 1.96, "learning_rate": 1.9346275238877602e-05, "loss": 0.0136, "step": 136130 }, { "epoch": 1.96, "learning_rate": 1.9346227199139128e-05, "loss": 0.0103, "step": 136140 }, { "epoch": 1.96, "learning_rate": 1.9346179159400657e-05, "loss": 0.011, "step": 136150 }, { "epoch": 1.96, "learning_rate": 1.9346131119662187e-05, "loss": 0.0115, "step": 136160 }, { "epoch": 1.96, "learning_rate": 1.9346083079923713e-05, "loss": 0.0065, "step": 136170 }, { "epoch": 1.96, "learning_rate": 1.9346035040185242e-05, "loss": 0.0109, "step": 136180 }, { "epoch": 1.96, "learning_rate": 1.934598700044677e-05, "loss": 0.0087, "step": 136190 }, { "epoch": 1.96, "learning_rate": 1.93459389607083e-05, "loss": 0.0057, "step": 136200 }, { "epoch": 1.96, "learning_rate": 1.9345890920969826e-05, "loss": 0.0091, "step": 136210 }, { "epoch": 1.96, "learning_rate": 1.9345842881231356e-05, "loss": 0.0125, "step": 136220 }, { "epoch": 1.96, "learning_rate": 1.9345794841492885e-05, "loss": 0.01, "step": 136230 }, { "epoch": 1.96, "learning_rate": 1.9345746801754414e-05, "loss": 0.0066, "step": 136240 }, { "epoch": 1.96, "learning_rate": 1.934569876201594e-05, "loss": 0.0088, "step": 136250 }, { "epoch": 1.96, "learning_rate": 1.934565072227747e-05, "loss": 0.0086, "step": 136260 }, { "epoch": 1.96, "learning_rate": 1.9345602682539e-05, "loss": 0.0073, "step": 136270 }, { "epoch": 1.96, "learning_rate": 1.9345554642800524e-05, "loss": 0.0104, "step": 136280 }, { "epoch": 1.96, "learning_rate": 1.9345506603062054e-05, "loss": 0.0086, "step": 136290 }, { "epoch": 1.96, "learning_rate": 1.9345458563323583e-05, "loss": 0.0129, "step": 136300 }, { "epoch": 1.96, "learning_rate": 1.9345410523585112e-05, "loss": 0.0088, "step": 136310 }, { "epoch": 1.96, "learning_rate": 1.9345362483846638e-05, "loss": 0.0078, "step": 136320 }, { "epoch": 1.96, "learning_rate": 1.9345314444108167e-05, "loss": 0.0092, "step": 136330 }, { "epoch": 1.96, "learning_rate": 1.9345266404369697e-05, "loss": 0.0072, "step": 136340 }, { "epoch": 1.97, "learning_rate": 1.9345218364631223e-05, "loss": 0.0109, "step": 136350 }, { "epoch": 1.97, "learning_rate": 1.9345170324892752e-05, "loss": 0.0116, "step": 136360 }, { "epoch": 1.97, "learning_rate": 1.934512228515428e-05, "loss": 0.0078, "step": 136370 }, { "epoch": 1.97, "learning_rate": 1.934507424541581e-05, "loss": 0.009, "step": 136380 }, { "epoch": 1.97, "learning_rate": 1.9345026205677336e-05, "loss": 0.0065, "step": 136390 }, { "epoch": 1.97, "learning_rate": 1.9344978165938865e-05, "loss": 0.0115, "step": 136400 }, { "epoch": 1.97, "learning_rate": 1.9344930126200395e-05, "loss": 0.0124, "step": 136410 }, { "epoch": 1.97, "learning_rate": 1.9344882086461924e-05, "loss": 0.0114, "step": 136420 }, { "epoch": 1.97, "learning_rate": 1.934483404672345e-05, "loss": 0.0123, "step": 136430 }, { "epoch": 1.97, "learning_rate": 1.934478600698498e-05, "loss": 0.0121, "step": 136440 }, { "epoch": 1.97, "learning_rate": 1.934473796724651e-05, "loss": 0.0085, "step": 136450 }, { "epoch": 1.97, "learning_rate": 1.9344689927508034e-05, "loss": 0.0143, "step": 136460 }, { "epoch": 1.97, "learning_rate": 1.9344641887769564e-05, "loss": 0.0079, "step": 136470 }, { "epoch": 1.97, "learning_rate": 1.9344593848031093e-05, "loss": 0.0101, "step": 136480 }, { "epoch": 1.97, "learning_rate": 1.9344545808292622e-05, "loss": 0.0071, "step": 136490 }, { "epoch": 1.97, "learning_rate": 1.9344497768554148e-05, "loss": 0.0094, "step": 136500 }, { "epoch": 1.97, "learning_rate": 1.9344449728815677e-05, "loss": 0.0227, "step": 136510 }, { "epoch": 1.97, "learning_rate": 1.9344401689077207e-05, "loss": 0.0089, "step": 136520 }, { "epoch": 1.97, "learning_rate": 1.9344353649338732e-05, "loss": 0.0084, "step": 136530 }, { "epoch": 1.97, "learning_rate": 1.934430560960026e-05, "loss": 0.0082, "step": 136540 }, { "epoch": 1.97, "learning_rate": 1.934425756986179e-05, "loss": 0.0124, "step": 136550 }, { "epoch": 1.97, "learning_rate": 1.934420953012332e-05, "loss": 0.0095, "step": 136560 }, { "epoch": 1.97, "learning_rate": 1.9344161490384846e-05, "loss": 0.0074, "step": 136570 }, { "epoch": 1.97, "learning_rate": 1.9344113450646375e-05, "loss": 0.0082, "step": 136580 }, { "epoch": 1.97, "learning_rate": 1.9344065410907905e-05, "loss": 0.011, "step": 136590 }, { "epoch": 1.97, "learning_rate": 1.9344017371169434e-05, "loss": 0.0125, "step": 136600 }, { "epoch": 1.97, "learning_rate": 1.934396933143096e-05, "loss": 0.0108, "step": 136610 }, { "epoch": 1.97, "learning_rate": 1.934392129169249e-05, "loss": 0.008, "step": 136620 }, { "epoch": 1.97, "learning_rate": 1.934387325195402e-05, "loss": 0.0082, "step": 136630 }, { "epoch": 1.97, "learning_rate": 1.9343825212215544e-05, "loss": 0.0073, "step": 136640 }, { "epoch": 1.97, "learning_rate": 1.9343777172477073e-05, "loss": 0.0105, "step": 136650 }, { "epoch": 1.97, "learning_rate": 1.9343729132738603e-05, "loss": 0.0073, "step": 136660 }, { "epoch": 1.97, "learning_rate": 1.9343681093000132e-05, "loss": 0.0098, "step": 136670 }, { "epoch": 1.97, "learning_rate": 1.9343633053261658e-05, "loss": 0.0061, "step": 136680 }, { "epoch": 1.97, "learning_rate": 1.9343585013523187e-05, "loss": 0.0118, "step": 136690 }, { "epoch": 1.97, "learning_rate": 1.9343536973784716e-05, "loss": 0.011, "step": 136700 }, { "epoch": 1.97, "learning_rate": 1.9343488934046242e-05, "loss": 0.0075, "step": 136710 }, { "epoch": 1.97, "learning_rate": 1.934344089430777e-05, "loss": 0.0081, "step": 136720 }, { "epoch": 1.97, "learning_rate": 1.93433928545693e-05, "loss": 0.0094, "step": 136730 }, { "epoch": 1.97, "learning_rate": 1.934334481483083e-05, "loss": 0.0086, "step": 136740 }, { "epoch": 1.97, "learning_rate": 1.9343296775092356e-05, "loss": 0.0088, "step": 136750 }, { "epoch": 1.97, "learning_rate": 1.9343248735353885e-05, "loss": 0.0101, "step": 136760 }, { "epoch": 1.97, "learning_rate": 1.9343200695615415e-05, "loss": 0.0096, "step": 136770 }, { "epoch": 1.97, "learning_rate": 1.9343152655876944e-05, "loss": 0.0097, "step": 136780 }, { "epoch": 1.97, "learning_rate": 1.934310461613847e-05, "loss": 0.0056, "step": 136790 }, { "epoch": 1.97, "learning_rate": 1.93430565764e-05, "loss": 0.0091, "step": 136800 }, { "epoch": 1.97, "learning_rate": 1.9343008536661528e-05, "loss": 0.0119, "step": 136810 }, { "epoch": 1.97, "learning_rate": 1.9342960496923054e-05, "loss": 0.0061, "step": 136820 }, { "epoch": 1.97, "learning_rate": 1.9342912457184583e-05, "loss": 0.0073, "step": 136830 }, { "epoch": 1.97, "learning_rate": 1.9342864417446113e-05, "loss": 0.0059, "step": 136840 }, { "epoch": 1.97, "learning_rate": 1.9342816377707642e-05, "loss": 0.0075, "step": 136850 }, { "epoch": 1.97, "learning_rate": 1.9342768337969168e-05, "loss": 0.0089, "step": 136860 }, { "epoch": 1.97, "learning_rate": 1.9342720298230697e-05, "loss": 0.0128, "step": 136870 }, { "epoch": 1.97, "learning_rate": 1.9342672258492226e-05, "loss": 0.0105, "step": 136880 }, { "epoch": 1.97, "learning_rate": 1.9342624218753752e-05, "loss": 0.0089, "step": 136890 }, { "epoch": 1.97, "learning_rate": 1.934257617901528e-05, "loss": 0.008, "step": 136900 }, { "epoch": 1.97, "learning_rate": 1.934252813927681e-05, "loss": 0.0076, "step": 136910 }, { "epoch": 1.97, "learning_rate": 1.934248009953834e-05, "loss": 0.0129, "step": 136920 }, { "epoch": 1.97, "learning_rate": 1.9342432059799866e-05, "loss": 0.0119, "step": 136930 }, { "epoch": 1.97, "learning_rate": 1.9342384020061395e-05, "loss": 0.0127, "step": 136940 }, { "epoch": 1.97, "learning_rate": 1.9342335980322924e-05, "loss": 0.0132, "step": 136950 }, { "epoch": 1.97, "learning_rate": 1.9342287940584454e-05, "loss": 0.0081, "step": 136960 }, { "epoch": 1.97, "learning_rate": 1.934223990084598e-05, "loss": 0.013, "step": 136970 }, { "epoch": 1.97, "learning_rate": 1.934219186110751e-05, "loss": 0.0096, "step": 136980 }, { "epoch": 1.97, "learning_rate": 1.9342143821369038e-05, "loss": 0.0067, "step": 136990 }, { "epoch": 1.97, "learning_rate": 1.9342095781630564e-05, "loss": 0.0103, "step": 137000 }, { "epoch": 1.97, "learning_rate": 1.9342047741892093e-05, "loss": 0.0101, "step": 137010 }, { "epoch": 1.97, "learning_rate": 1.9341999702153623e-05, "loss": 0.0125, "step": 137020 }, { "epoch": 1.97, "learning_rate": 1.9341951662415152e-05, "loss": 0.01, "step": 137030 }, { "epoch": 1.98, "learning_rate": 1.9341903622676678e-05, "loss": 0.0149, "step": 137040 }, { "epoch": 1.98, "learning_rate": 1.9341855582938207e-05, "loss": 0.0081, "step": 137050 }, { "epoch": 1.98, "learning_rate": 1.9341807543199736e-05, "loss": 0.0096, "step": 137060 }, { "epoch": 1.98, "learning_rate": 1.9341759503461262e-05, "loss": 0.009, "step": 137070 }, { "epoch": 1.98, "learning_rate": 1.934171146372279e-05, "loss": 0.0103, "step": 137080 }, { "epoch": 1.98, "learning_rate": 1.934166342398432e-05, "loss": 0.0098, "step": 137090 }, { "epoch": 1.98, "learning_rate": 1.934161538424585e-05, "loss": 0.0107, "step": 137100 }, { "epoch": 1.98, "learning_rate": 1.9341567344507376e-05, "loss": 0.0132, "step": 137110 }, { "epoch": 1.98, "learning_rate": 1.9341519304768905e-05, "loss": 0.0104, "step": 137120 }, { "epoch": 1.98, "learning_rate": 1.9341471265030434e-05, "loss": 0.0095, "step": 137130 }, { "epoch": 1.98, "learning_rate": 1.9341423225291964e-05, "loss": 0.0073, "step": 137140 }, { "epoch": 1.98, "learning_rate": 1.934137518555349e-05, "loss": 0.0079, "step": 137150 }, { "epoch": 1.98, "learning_rate": 1.934132714581502e-05, "loss": 0.0147, "step": 137160 }, { "epoch": 1.98, "learning_rate": 1.9341279106076548e-05, "loss": 0.0135, "step": 137170 }, { "epoch": 1.98, "learning_rate": 1.9341231066338074e-05, "loss": 0.0079, "step": 137180 }, { "epoch": 1.98, "learning_rate": 1.9341183026599603e-05, "loss": 0.008, "step": 137190 }, { "epoch": 1.98, "learning_rate": 1.9341134986861133e-05, "loss": 0.0099, "step": 137200 }, { "epoch": 1.98, "learning_rate": 1.9341086947122662e-05, "loss": 0.011, "step": 137210 }, { "epoch": 1.98, "learning_rate": 1.934103890738419e-05, "loss": 0.0093, "step": 137220 }, { "epoch": 1.98, "learning_rate": 1.934099086764572e-05, "loss": 0.0071, "step": 137230 }, { "epoch": 1.98, "learning_rate": 1.9340942827907246e-05, "loss": 0.0084, "step": 137240 }, { "epoch": 1.98, "learning_rate": 1.9340894788168775e-05, "loss": 0.0052, "step": 137250 }, { "epoch": 1.98, "learning_rate": 1.9340846748430305e-05, "loss": 0.0079, "step": 137260 }, { "epoch": 1.98, "learning_rate": 1.9340798708691834e-05, "loss": 0.0104, "step": 137270 }, { "epoch": 1.98, "learning_rate": 1.934075066895336e-05, "loss": 0.0082, "step": 137280 }, { "epoch": 1.98, "learning_rate": 1.934070262921489e-05, "loss": 0.0081, "step": 137290 }, { "epoch": 1.98, "learning_rate": 1.934065458947642e-05, "loss": 0.0102, "step": 137300 }, { "epoch": 1.98, "learning_rate": 1.9340606549737944e-05, "loss": 0.012, "step": 137310 }, { "epoch": 1.98, "learning_rate": 1.9340558509999474e-05, "loss": 0.0114, "step": 137320 }, { "epoch": 1.98, "learning_rate": 1.9340510470261003e-05, "loss": 0.0097, "step": 137330 }, { "epoch": 1.98, "learning_rate": 1.9340462430522532e-05, "loss": 0.0103, "step": 137340 }, { "epoch": 1.98, "learning_rate": 1.9340414390784058e-05, "loss": 0.0081, "step": 137350 }, { "epoch": 1.98, "learning_rate": 1.9340366351045587e-05, "loss": 0.0089, "step": 137360 }, { "epoch": 1.98, "learning_rate": 1.9340318311307117e-05, "loss": 0.0095, "step": 137370 }, { "epoch": 1.98, "learning_rate": 1.9340270271568646e-05, "loss": 0.007, "step": 137380 }, { "epoch": 1.98, "learning_rate": 1.934022223183017e-05, "loss": 0.0117, "step": 137390 }, { "epoch": 1.98, "learning_rate": 1.93401741920917e-05, "loss": 0.0111, "step": 137400 }, { "epoch": 1.98, "learning_rate": 1.934012615235323e-05, "loss": 0.0111, "step": 137410 }, { "epoch": 1.98, "learning_rate": 1.9340078112614756e-05, "loss": 0.011, "step": 137420 }, { "epoch": 1.98, "learning_rate": 1.9340030072876285e-05, "loss": 0.0073, "step": 137430 }, { "epoch": 1.98, "learning_rate": 1.9339982033137815e-05, "loss": 0.009, "step": 137440 }, { "epoch": 1.98, "learning_rate": 1.9339933993399344e-05, "loss": 0.0091, "step": 137450 }, { "epoch": 1.98, "learning_rate": 1.933988595366087e-05, "loss": 0.0089, "step": 137460 }, { "epoch": 1.98, "learning_rate": 1.93398379139224e-05, "loss": 0.0097, "step": 137470 }, { "epoch": 1.98, "learning_rate": 1.933978987418393e-05, "loss": 0.0106, "step": 137480 }, { "epoch": 1.98, "learning_rate": 1.9339741834445454e-05, "loss": 0.0083, "step": 137490 }, { "epoch": 1.98, "learning_rate": 1.9339693794706983e-05, "loss": 0.0107, "step": 137500 }, { "epoch": 1.98, "learning_rate": 1.9339645754968513e-05, "loss": 0.0113, "step": 137510 }, { "epoch": 1.98, "learning_rate": 1.9339597715230042e-05, "loss": 0.0071, "step": 137520 }, { "epoch": 1.98, "learning_rate": 1.9339549675491568e-05, "loss": 0.0099, "step": 137530 }, { "epoch": 1.98, "learning_rate": 1.9339501635753097e-05, "loss": 0.009, "step": 137540 }, { "epoch": 1.98, "learning_rate": 1.9339453596014626e-05, "loss": 0.0093, "step": 137550 }, { "epoch": 1.98, "learning_rate": 1.9339405556276152e-05, "loss": 0.0111, "step": 137560 }, { "epoch": 1.98, "learning_rate": 1.933935751653768e-05, "loss": 0.0084, "step": 137570 }, { "epoch": 1.98, "learning_rate": 1.933930947679921e-05, "loss": 0.0072, "step": 137580 }, { "epoch": 1.98, "learning_rate": 1.933926143706074e-05, "loss": 0.0152, "step": 137590 }, { "epoch": 1.98, "learning_rate": 1.9339213397322266e-05, "loss": 0.008, "step": 137600 }, { "epoch": 1.98, "learning_rate": 1.9339165357583795e-05, "loss": 0.0085, "step": 137610 }, { "epoch": 1.98, "learning_rate": 1.9339117317845325e-05, "loss": 0.0097, "step": 137620 }, { "epoch": 1.98, "learning_rate": 1.9339069278106854e-05, "loss": 0.0077, "step": 137630 }, { "epoch": 1.98, "learning_rate": 1.933902123836838e-05, "loss": 0.0107, "step": 137640 }, { "epoch": 1.98, "learning_rate": 1.933897319862991e-05, "loss": 0.0083, "step": 137650 }, { "epoch": 1.98, "learning_rate": 1.9338925158891438e-05, "loss": 0.0108, "step": 137660 }, { "epoch": 1.98, "learning_rate": 1.9338877119152964e-05, "loss": 0.0104, "step": 137670 }, { "epoch": 1.98, "learning_rate": 1.9338829079414493e-05, "loss": 0.0095, "step": 137680 }, { "epoch": 1.98, "learning_rate": 1.9338781039676023e-05, "loss": 0.0083, "step": 137690 }, { "epoch": 1.98, "learning_rate": 1.9338732999937552e-05, "loss": 0.0085, "step": 137700 }, { "epoch": 1.98, "learning_rate": 1.9338684960199078e-05, "loss": 0.0072, "step": 137710 }, { "epoch": 1.98, "learning_rate": 1.9338636920460607e-05, "loss": 0.0087, "step": 137720 }, { "epoch": 1.98, "learning_rate": 1.9338588880722136e-05, "loss": 0.0118, "step": 137730 }, { "epoch": 1.99, "learning_rate": 1.9338540840983662e-05, "loss": 0.0091, "step": 137740 }, { "epoch": 1.99, "learning_rate": 1.933849280124519e-05, "loss": 0.0161, "step": 137750 }, { "epoch": 1.99, "learning_rate": 1.933844476150672e-05, "loss": 0.0061, "step": 137760 }, { "epoch": 1.99, "learning_rate": 1.933839672176825e-05, "loss": 0.0083, "step": 137770 }, { "epoch": 1.99, "learning_rate": 1.9338348682029776e-05, "loss": 0.0113, "step": 137780 }, { "epoch": 1.99, "learning_rate": 1.9338300642291305e-05, "loss": 0.0076, "step": 137790 }, { "epoch": 1.99, "learning_rate": 1.9338252602552834e-05, "loss": 0.0093, "step": 137800 }, { "epoch": 1.99, "learning_rate": 1.9338204562814364e-05, "loss": 0.0084, "step": 137810 }, { "epoch": 1.99, "learning_rate": 1.933815652307589e-05, "loss": 0.0072, "step": 137820 }, { "epoch": 1.99, "learning_rate": 1.933810848333742e-05, "loss": 0.0076, "step": 137830 }, { "epoch": 1.99, "learning_rate": 1.9338060443598948e-05, "loss": 0.0073, "step": 137840 }, { "epoch": 1.99, "learning_rate": 1.9338012403860474e-05, "loss": 0.0079, "step": 137850 }, { "epoch": 1.99, "learning_rate": 1.9337964364122003e-05, "loss": 0.0089, "step": 137860 }, { "epoch": 1.99, "learning_rate": 1.9337916324383533e-05, "loss": 0.0116, "step": 137870 }, { "epoch": 1.99, "learning_rate": 1.9337868284645062e-05, "loss": 0.0099, "step": 137880 }, { "epoch": 1.99, "learning_rate": 1.9337820244906588e-05, "loss": 0.0089, "step": 137890 }, { "epoch": 1.99, "learning_rate": 1.9337772205168117e-05, "loss": 0.0095, "step": 137900 }, { "epoch": 1.99, "learning_rate": 1.9337724165429646e-05, "loss": 0.0084, "step": 137910 }, { "epoch": 1.99, "learning_rate": 1.9337676125691172e-05, "loss": 0.0091, "step": 137920 }, { "epoch": 1.99, "learning_rate": 1.93376280859527e-05, "loss": 0.0073, "step": 137930 }, { "epoch": 1.99, "learning_rate": 1.933758004621423e-05, "loss": 0.0135, "step": 137940 }, { "epoch": 1.99, "learning_rate": 1.933753200647576e-05, "loss": 0.0085, "step": 137950 }, { "epoch": 1.99, "learning_rate": 1.9337483966737286e-05, "loss": 0.0096, "step": 137960 }, { "epoch": 1.99, "learning_rate": 1.9337435926998815e-05, "loss": 0.01, "step": 137970 }, { "epoch": 1.99, "learning_rate": 1.9337387887260344e-05, "loss": 0.0106, "step": 137980 }, { "epoch": 1.99, "learning_rate": 1.9337339847521874e-05, "loss": 0.0095, "step": 137990 }, { "epoch": 1.99, "learning_rate": 1.93372918077834e-05, "loss": 0.007, "step": 138000 }, { "epoch": 1.99, "learning_rate": 1.933724376804493e-05, "loss": 0.0152, "step": 138010 }, { "epoch": 1.99, "learning_rate": 1.9337195728306458e-05, "loss": 0.0074, "step": 138020 }, { "epoch": 1.99, "learning_rate": 1.9337147688567984e-05, "loss": 0.0086, "step": 138030 }, { "epoch": 1.99, "learning_rate": 1.9337099648829513e-05, "loss": 0.0066, "step": 138040 }, { "epoch": 1.99, "learning_rate": 1.9337051609091043e-05, "loss": 0.0104, "step": 138050 }, { "epoch": 1.99, "learning_rate": 1.9337003569352572e-05, "loss": 0.0047, "step": 138060 }, { "epoch": 1.99, "learning_rate": 1.9336955529614098e-05, "loss": 0.0083, "step": 138070 }, { "epoch": 1.99, "learning_rate": 1.9336907489875627e-05, "loss": 0.013, "step": 138080 }, { "epoch": 1.99, "learning_rate": 1.9336859450137156e-05, "loss": 0.0094, "step": 138090 }, { "epoch": 1.99, "learning_rate": 1.9336811410398682e-05, "loss": 0.0105, "step": 138100 }, { "epoch": 1.99, "learning_rate": 1.933676337066021e-05, "loss": 0.0089, "step": 138110 }, { "epoch": 1.99, "learning_rate": 1.933671533092174e-05, "loss": 0.01, "step": 138120 }, { "epoch": 1.99, "learning_rate": 1.933666729118327e-05, "loss": 0.0079, "step": 138130 }, { "epoch": 1.99, "learning_rate": 1.9336619251444796e-05, "loss": 0.0114, "step": 138140 }, { "epoch": 1.99, "learning_rate": 1.9336571211706325e-05, "loss": 0.0085, "step": 138150 }, { "epoch": 1.99, "learning_rate": 1.9336523171967854e-05, "loss": 0.0128, "step": 138160 }, { "epoch": 1.99, "learning_rate": 1.9336475132229384e-05, "loss": 0.0063, "step": 138170 }, { "epoch": 1.99, "learning_rate": 1.933642709249091e-05, "loss": 0.0115, "step": 138180 }, { "epoch": 1.99, "learning_rate": 1.933637905275244e-05, "loss": 0.0092, "step": 138190 }, { "epoch": 1.99, "learning_rate": 1.9336331013013968e-05, "loss": 0.0057, "step": 138200 }, { "epoch": 1.99, "learning_rate": 1.9336282973275494e-05, "loss": 0.0072, "step": 138210 }, { "epoch": 1.99, "learning_rate": 1.9336234933537023e-05, "loss": 0.0123, "step": 138220 }, { "epoch": 1.99, "learning_rate": 1.9336186893798552e-05, "loss": 0.0097, "step": 138230 }, { "epoch": 1.99, "learning_rate": 1.933613885406008e-05, "loss": 0.0084, "step": 138240 }, { "epoch": 1.99, "learning_rate": 1.9336090814321608e-05, "loss": 0.0076, "step": 138250 }, { "epoch": 1.99, "learning_rate": 1.9336042774583137e-05, "loss": 0.0123, "step": 138260 }, { "epoch": 1.99, "learning_rate": 1.9335994734844666e-05, "loss": 0.0085, "step": 138270 }, { "epoch": 1.99, "learning_rate": 1.9335946695106192e-05, "loss": 0.0105, "step": 138280 }, { "epoch": 1.99, "learning_rate": 1.933589865536772e-05, "loss": 0.0099, "step": 138290 }, { "epoch": 1.99, "learning_rate": 1.933585061562925e-05, "loss": 0.0099, "step": 138300 }, { "epoch": 1.99, "learning_rate": 1.933580257589078e-05, "loss": 0.0111, "step": 138310 }, { "epoch": 1.99, "learning_rate": 1.9335754536152306e-05, "loss": 0.0097, "step": 138320 }, { "epoch": 1.99, "learning_rate": 1.9335706496413835e-05, "loss": 0.0097, "step": 138330 }, { "epoch": 1.99, "learning_rate": 1.9335658456675364e-05, "loss": 0.0116, "step": 138340 }, { "epoch": 1.99, "learning_rate": 1.9335610416936893e-05, "loss": 0.009, "step": 138350 }, { "epoch": 1.99, "learning_rate": 1.933556237719842e-05, "loss": 0.0076, "step": 138360 }, { "epoch": 1.99, "learning_rate": 1.933551433745995e-05, "loss": 0.0061, "step": 138370 }, { "epoch": 1.99, "learning_rate": 1.9335466297721478e-05, "loss": 0.0114, "step": 138380 }, { "epoch": 1.99, "learning_rate": 1.9335418257983004e-05, "loss": 0.012, "step": 138390 }, { "epoch": 1.99, "learning_rate": 1.9335370218244533e-05, "loss": 0.0093, "step": 138400 }, { "epoch": 1.99, "learning_rate": 1.9335322178506062e-05, "loss": 0.0085, "step": 138410 }, { "epoch": 1.99, "learning_rate": 1.933527413876759e-05, "loss": 0.0079, "step": 138420 }, { "epoch": 2.0, "learning_rate": 1.9335226099029117e-05, "loss": 0.0076, "step": 138430 }, { "epoch": 2.0, "learning_rate": 1.9335178059290647e-05, "loss": 0.0125, "step": 138440 }, { "epoch": 2.0, "learning_rate": 1.9335130019552176e-05, "loss": 0.0101, "step": 138450 }, { "epoch": 2.0, "learning_rate": 1.9335081979813702e-05, "loss": 0.0111, "step": 138460 }, { "epoch": 2.0, "learning_rate": 1.933503394007523e-05, "loss": 0.0102, "step": 138470 }, { "epoch": 2.0, "learning_rate": 1.933498590033676e-05, "loss": 0.0103, "step": 138480 }, { "epoch": 2.0, "learning_rate": 1.933493786059829e-05, "loss": 0.0096, "step": 138490 }, { "epoch": 2.0, "learning_rate": 1.9334889820859816e-05, "loss": 0.012, "step": 138500 }, { "epoch": 2.0, "learning_rate": 1.9334841781121345e-05, "loss": 0.0068, "step": 138510 }, { "epoch": 2.0, "learning_rate": 1.9334793741382874e-05, "loss": 0.0139, "step": 138520 }, { "epoch": 2.0, "learning_rate": 1.9334745701644403e-05, "loss": 0.009, "step": 138530 }, { "epoch": 2.0, "learning_rate": 1.933469766190593e-05, "loss": 0.0124, "step": 138540 }, { "epoch": 2.0, "learning_rate": 1.933464962216746e-05, "loss": 0.0084, "step": 138550 }, { "epoch": 2.0, "learning_rate": 1.9334601582428988e-05, "loss": 0.0067, "step": 138560 }, { "epoch": 2.0, "learning_rate": 1.9334553542690514e-05, "loss": 0.0072, "step": 138570 }, { "epoch": 2.0, "learning_rate": 1.9334505502952043e-05, "loss": 0.0141, "step": 138580 }, { "epoch": 2.0, "learning_rate": 1.9334457463213572e-05, "loss": 0.0095, "step": 138590 }, { "epoch": 2.0, "learning_rate": 1.93344094234751e-05, "loss": 0.0094, "step": 138600 }, { "epoch": 2.0, "learning_rate": 1.9334361383736627e-05, "loss": 0.0085, "step": 138610 }, { "epoch": 2.0, "learning_rate": 1.9334313343998157e-05, "loss": 0.0081, "step": 138620 }, { "epoch": 2.0, "learning_rate": 1.9334265304259686e-05, "loss": 0.0099, "step": 138630 }, { "epoch": 2.0, "learning_rate": 1.9334217264521212e-05, "loss": 0.0081, "step": 138640 }, { "epoch": 2.0, "learning_rate": 1.933416922478274e-05, "loss": 0.0073, "step": 138650 }, { "epoch": 2.0, "learning_rate": 1.933412118504427e-05, "loss": 0.0089, "step": 138660 }, { "epoch": 2.0, "learning_rate": 1.93340731453058e-05, "loss": 0.0066, "step": 138670 }, { "epoch": 2.0, "learning_rate": 1.9334025105567326e-05, "loss": 0.0095, "step": 138680 }, { "epoch": 2.0, "learning_rate": 1.9333977065828855e-05, "loss": 0.008, "step": 138690 }, { "epoch": 2.0, "learning_rate": 1.9333929026090384e-05, "loss": 0.0083, "step": 138700 }, { "epoch": 2.0, "learning_rate": 1.9333880986351913e-05, "loss": 0.0054, "step": 138710 }, { "epoch": 2.0, "learning_rate": 1.933383294661344e-05, "loss": 0.0108, "step": 138720 }, { "epoch": 2.0, "learning_rate": 1.933378490687497e-05, "loss": 0.0079, "step": 138730 }, { "epoch": 2.0, "learning_rate": 1.9333736867136498e-05, "loss": 0.0074, "step": 138740 }, { "epoch": 2.0, "learning_rate": 1.9333688827398024e-05, "loss": 0.0073, "step": 138750 }, { "epoch": 2.0, "learning_rate": 1.9333640787659553e-05, "loss": 0.0108, "step": 138760 }, { "epoch": 2.0, "learning_rate": 1.9333592747921082e-05, "loss": 0.0063, "step": 138770 }, { "epoch": 2.0, "learning_rate": 1.933354470818261e-05, "loss": 0.0091, "step": 138780 }, { "epoch": 2.0, "learning_rate": 1.9333496668444137e-05, "loss": 0.0072, "step": 138790 }, { "epoch": 2.0, "learning_rate": 1.9333448628705667e-05, "loss": 0.006, "step": 138800 }, { "epoch": 2.0, "learning_rate": 1.9333400588967196e-05, "loss": 0.0124, "step": 138810 }, { "epoch": 2.0, "learning_rate": 1.9333352549228722e-05, "loss": 0.0091, "step": 138820 }, { "epoch": 2.0, "learning_rate": 1.933330450949025e-05, "loss": 0.0079, "step": 138830 }, { "epoch": 2.0, "learning_rate": 1.933325646975178e-05, "loss": 0.0062, "step": 138840 }, { "epoch": 2.0, "learning_rate": 1.933320843001331e-05, "loss": 0.0084, "step": 138850 }, { "epoch": 2.0, "learning_rate": 1.9333160390274835e-05, "loss": 0.007, "step": 138860 }, { "epoch": 2.0, "learning_rate": 1.9333112350536365e-05, "loss": 0.0067, "step": 138870 }, { "epoch": 2.0, "learning_rate": 1.9333064310797894e-05, "loss": 0.0108, "step": 138880 }, { "epoch": 2.0, "learning_rate": 1.9333016271059423e-05, "loss": 0.0055, "step": 138890 }, { "epoch": 2.0, "learning_rate": 1.933296823132095e-05, "loss": 0.0078, "step": 138900 }, { "epoch": 2.0, "learning_rate": 1.933292019158248e-05, "loss": 0.0099, "step": 138910 }, { "epoch": 2.0, "learning_rate": 1.9332872151844008e-05, "loss": 0.0099, "step": 138920 }, { "epoch": 2.0, "learning_rate": 1.9332824112105534e-05, "loss": 0.0088, "step": 138930 }, { "epoch": 2.0, "learning_rate": 1.9332776072367063e-05, "loss": 0.0093, "step": 138940 }, { "epoch": 2.0, "learning_rate": 1.9332728032628592e-05, "loss": 0.0066, "step": 138950 }, { "epoch": 2.0, "learning_rate": 1.933267999289012e-05, "loss": 0.0065, "step": 138960 }, { "epoch": 2.0, "learning_rate": 1.9332631953151647e-05, "loss": 0.0087, "step": 138970 }, { "epoch": 2.0, "learning_rate": 1.9332583913413177e-05, "loss": 0.0103, "step": 138980 }, { "epoch": 2.0, "learning_rate": 1.9332535873674706e-05, "loss": 0.0071, "step": 138990 }, { "epoch": 2.0, "learning_rate": 1.933248783393623e-05, "loss": 0.0078, "step": 139000 }, { "epoch": 2.0, "learning_rate": 1.933243979419776e-05, "loss": 0.0069, "step": 139010 }, { "epoch": 2.0, "learning_rate": 1.933239175445929e-05, "loss": 0.0082, "step": 139020 }, { "epoch": 2.0, "learning_rate": 1.933234371472082e-05, "loss": 0.0059, "step": 139030 }, { "epoch": 2.0, "learning_rate": 1.9332295674982345e-05, "loss": 0.0103, "step": 139040 }, { "epoch": 2.0, "learning_rate": 1.9332247635243875e-05, "loss": 0.0092, "step": 139050 }, { "epoch": 2.0, "learning_rate": 1.9332199595505404e-05, "loss": 0.0065, "step": 139060 }, { "epoch": 2.0, "learning_rate": 1.9332151555766933e-05, "loss": 0.0078, "step": 139070 }, { "epoch": 2.0, "learning_rate": 1.933210351602846e-05, "loss": 0.0077, "step": 139080 }, { "epoch": 2.0, "learning_rate": 1.9332055476289988e-05, "loss": 0.0085, "step": 139090 }, { "epoch": 2.0, "learning_rate": 1.9332007436551518e-05, "loss": 0.0101, "step": 139100 }, { "epoch": 2.0, "learning_rate": 1.9331959396813043e-05, "loss": 0.0075, "step": 139110 }, { "epoch": 2.0, "learning_rate": 1.9331911357074573e-05, "loss": 0.0048, "step": 139120 }, { "epoch": 2.01, "learning_rate": 1.9331863317336102e-05, "loss": 0.0069, "step": 139130 }, { "epoch": 2.01, "learning_rate": 1.933181527759763e-05, "loss": 0.0056, "step": 139140 }, { "epoch": 2.01, "learning_rate": 1.9331767237859157e-05, "loss": 0.0054, "step": 139150 }, { "epoch": 2.01, "learning_rate": 1.9331719198120686e-05, "loss": 0.0085, "step": 139160 }, { "epoch": 2.01, "learning_rate": 1.9331671158382216e-05, "loss": 0.0084, "step": 139170 }, { "epoch": 2.01, "learning_rate": 1.933162311864374e-05, "loss": 0.0094, "step": 139180 }, { "epoch": 2.01, "learning_rate": 1.933157507890527e-05, "loss": 0.0058, "step": 139190 }, { "epoch": 2.01, "learning_rate": 1.93315270391668e-05, "loss": 0.0077, "step": 139200 }, { "epoch": 2.01, "learning_rate": 1.933147899942833e-05, "loss": 0.0069, "step": 139210 }, { "epoch": 2.01, "learning_rate": 1.9331430959689855e-05, "loss": 0.0066, "step": 139220 }, { "epoch": 2.01, "learning_rate": 1.9331382919951385e-05, "loss": 0.006, "step": 139230 }, { "epoch": 2.01, "learning_rate": 1.9331334880212914e-05, "loss": 0.006, "step": 139240 }, { "epoch": 2.01, "learning_rate": 1.933128684047444e-05, "loss": 0.0076, "step": 139250 }, { "epoch": 2.01, "learning_rate": 1.933123880073597e-05, "loss": 0.0101, "step": 139260 }, { "epoch": 2.01, "learning_rate": 1.9331190760997498e-05, "loss": 0.0076, "step": 139270 }, { "epoch": 2.01, "learning_rate": 1.9331142721259027e-05, "loss": 0.0092, "step": 139280 }, { "epoch": 2.01, "learning_rate": 1.9331094681520553e-05, "loss": 0.0084, "step": 139290 }, { "epoch": 2.01, "learning_rate": 1.9331046641782083e-05, "loss": 0.007, "step": 139300 }, { "epoch": 2.01, "learning_rate": 1.9330998602043612e-05, "loss": 0.0092, "step": 139310 }, { "epoch": 2.01, "learning_rate": 1.933095056230514e-05, "loss": 0.0064, "step": 139320 }, { "epoch": 2.01, "learning_rate": 1.9330902522566667e-05, "loss": 0.0069, "step": 139330 }, { "epoch": 2.01, "learning_rate": 1.9330854482828196e-05, "loss": 0.007, "step": 139340 }, { "epoch": 2.01, "learning_rate": 1.9330806443089726e-05, "loss": 0.0101, "step": 139350 }, { "epoch": 2.01, "learning_rate": 1.933075840335125e-05, "loss": 0.0083, "step": 139360 }, { "epoch": 2.01, "learning_rate": 1.933071036361278e-05, "loss": 0.008, "step": 139370 }, { "epoch": 2.01, "learning_rate": 1.933066232387431e-05, "loss": 0.0072, "step": 139380 }, { "epoch": 2.01, "learning_rate": 1.933061428413584e-05, "loss": 0.0091, "step": 139390 }, { "epoch": 2.01, "learning_rate": 1.9330566244397365e-05, "loss": 0.0089, "step": 139400 }, { "epoch": 2.01, "learning_rate": 1.9330518204658894e-05, "loss": 0.0056, "step": 139410 }, { "epoch": 2.01, "learning_rate": 1.9330470164920424e-05, "loss": 0.0064, "step": 139420 }, { "epoch": 2.01, "learning_rate": 1.933042212518195e-05, "loss": 0.0061, "step": 139430 }, { "epoch": 2.01, "learning_rate": 1.933037408544348e-05, "loss": 0.0134, "step": 139440 }, { "epoch": 2.01, "learning_rate": 1.9330326045705008e-05, "loss": 0.0064, "step": 139450 }, { "epoch": 2.01, "learning_rate": 1.9330278005966537e-05, "loss": 0.0125, "step": 139460 }, { "epoch": 2.01, "learning_rate": 1.9330229966228063e-05, "loss": 0.0069, "step": 139470 }, { "epoch": 2.01, "learning_rate": 1.9330181926489593e-05, "loss": 0.0093, "step": 139480 }, { "epoch": 2.01, "learning_rate": 1.9330133886751122e-05, "loss": 0.0059, "step": 139490 }, { "epoch": 2.01, "learning_rate": 1.933008584701265e-05, "loss": 0.0089, "step": 139500 }, { "epoch": 2.01, "learning_rate": 1.9330037807274177e-05, "loss": 0.0063, "step": 139510 }, { "epoch": 2.01, "learning_rate": 1.9329989767535706e-05, "loss": 0.0112, "step": 139520 }, { "epoch": 2.01, "learning_rate": 1.9329941727797236e-05, "loss": 0.0085, "step": 139530 }, { "epoch": 2.01, "learning_rate": 1.932989368805876e-05, "loss": 0.0077, "step": 139540 }, { "epoch": 2.01, "learning_rate": 1.932984564832029e-05, "loss": 0.0053, "step": 139550 }, { "epoch": 2.01, "learning_rate": 1.932979760858182e-05, "loss": 0.0076, "step": 139560 }, { "epoch": 2.01, "learning_rate": 1.932974956884335e-05, "loss": 0.0074, "step": 139570 }, { "epoch": 2.01, "learning_rate": 1.9329701529104875e-05, "loss": 0.0057, "step": 139580 }, { "epoch": 2.01, "learning_rate": 1.9329653489366404e-05, "loss": 0.0086, "step": 139590 }, { "epoch": 2.01, "learning_rate": 1.9329605449627934e-05, "loss": 0.0081, "step": 139600 }, { "epoch": 2.01, "learning_rate": 1.932955740988946e-05, "loss": 0.0055, "step": 139610 }, { "epoch": 2.01, "learning_rate": 1.932950937015099e-05, "loss": 0.0058, "step": 139620 }, { "epoch": 2.01, "learning_rate": 1.9329461330412518e-05, "loss": 0.0064, "step": 139630 }, { "epoch": 2.01, "learning_rate": 1.9329413290674047e-05, "loss": 0.0051, "step": 139640 }, { "epoch": 2.01, "learning_rate": 1.9329365250935573e-05, "loss": 0.0076, "step": 139650 }, { "epoch": 2.01, "learning_rate": 1.9329317211197102e-05, "loss": 0.0064, "step": 139660 }, { "epoch": 2.01, "learning_rate": 1.9329269171458632e-05, "loss": 0.0077, "step": 139670 }, { "epoch": 2.01, "learning_rate": 1.932922113172016e-05, "loss": 0.0085, "step": 139680 }, { "epoch": 2.01, "learning_rate": 1.9329173091981687e-05, "loss": 0.0097, "step": 139690 }, { "epoch": 2.01, "learning_rate": 1.9329125052243216e-05, "loss": 0.0086, "step": 139700 }, { "epoch": 2.01, "learning_rate": 1.9329077012504745e-05, "loss": 0.0058, "step": 139710 }, { "epoch": 2.01, "learning_rate": 1.932902897276627e-05, "loss": 0.0097, "step": 139720 }, { "epoch": 2.01, "learning_rate": 1.93289809330278e-05, "loss": 0.0049, "step": 139730 }, { "epoch": 2.01, "learning_rate": 1.932893289328933e-05, "loss": 0.0059, "step": 139740 }, { "epoch": 2.01, "learning_rate": 1.932888485355086e-05, "loss": 0.008, "step": 139750 }, { "epoch": 2.01, "learning_rate": 1.9328836813812385e-05, "loss": 0.0092, "step": 139760 }, { "epoch": 2.01, "learning_rate": 1.9328788774073918e-05, "loss": 0.0082, "step": 139770 }, { "epoch": 2.01, "learning_rate": 1.9328740734335444e-05, "loss": 0.008, "step": 139780 }, { "epoch": 2.01, "learning_rate": 1.9328692694596973e-05, "loss": 0.008, "step": 139790 }, { "epoch": 2.01, "learning_rate": 1.9328644654858502e-05, "loss": 0.0059, "step": 139800 }, { "epoch": 2.01, "learning_rate": 1.932859661512003e-05, "loss": 0.0083, "step": 139810 }, { "epoch": 2.02, "learning_rate": 1.9328548575381557e-05, "loss": 0.0063, "step": 139820 }, { "epoch": 2.02, "learning_rate": 1.9328500535643087e-05, "loss": 0.0096, "step": 139830 }, { "epoch": 2.02, "learning_rate": 1.9328452495904616e-05, "loss": 0.0107, "step": 139840 }, { "epoch": 2.02, "learning_rate": 1.932840445616614e-05, "loss": 0.0077, "step": 139850 }, { "epoch": 2.02, "learning_rate": 1.932835641642767e-05, "loss": 0.0069, "step": 139860 }, { "epoch": 2.02, "learning_rate": 1.93283083766892e-05, "loss": 0.0039, "step": 139870 }, { "epoch": 2.02, "learning_rate": 1.932826033695073e-05, "loss": 0.0078, "step": 139880 }, { "epoch": 2.02, "learning_rate": 1.9328212297212255e-05, "loss": 0.0088, "step": 139890 }, { "epoch": 2.02, "learning_rate": 1.9328164257473785e-05, "loss": 0.0115, "step": 139900 }, { "epoch": 2.02, "learning_rate": 1.9328116217735314e-05, "loss": 0.0064, "step": 139910 }, { "epoch": 2.02, "learning_rate": 1.9328068177996843e-05, "loss": 0.0071, "step": 139920 }, { "epoch": 2.02, "learning_rate": 1.932802013825837e-05, "loss": 0.0084, "step": 139930 }, { "epoch": 2.02, "learning_rate": 1.93279720985199e-05, "loss": 0.0061, "step": 139940 }, { "epoch": 2.02, "learning_rate": 1.9327924058781428e-05, "loss": 0.0071, "step": 139950 }, { "epoch": 2.02, "learning_rate": 1.9327876019042953e-05, "loss": 0.0105, "step": 139960 }, { "epoch": 2.02, "learning_rate": 1.9327827979304483e-05, "loss": 0.0097, "step": 139970 }, { "epoch": 2.02, "learning_rate": 1.9327779939566012e-05, "loss": 0.0084, "step": 139980 }, { "epoch": 2.02, "learning_rate": 1.932773189982754e-05, "loss": 0.0078, "step": 139990 }, { "epoch": 2.02, "learning_rate": 1.9327683860089067e-05, "loss": 0.0058, "step": 140000 }, { "epoch": 2.02, "learning_rate": 1.9327635820350596e-05, "loss": 0.0072, "step": 140010 }, { "epoch": 2.02, "learning_rate": 1.9327587780612126e-05, "loss": 0.0069, "step": 140020 }, { "epoch": 2.02, "learning_rate": 1.932753974087365e-05, "loss": 0.0085, "step": 140030 }, { "epoch": 2.02, "learning_rate": 1.932749170113518e-05, "loss": 0.0066, "step": 140040 }, { "epoch": 2.02, "learning_rate": 1.932744366139671e-05, "loss": 0.0077, "step": 140050 }, { "epoch": 2.02, "learning_rate": 1.932739562165824e-05, "loss": 0.0051, "step": 140060 }, { "epoch": 2.02, "learning_rate": 1.9327347581919765e-05, "loss": 0.0113, "step": 140070 }, { "epoch": 2.02, "learning_rate": 1.932730434615514e-05, "loss": 0.0102, "step": 140080 }, { "epoch": 2.02, "learning_rate": 1.932725630641667e-05, "loss": 0.0087, "step": 140090 }, { "epoch": 2.02, "learning_rate": 1.93272082666782e-05, "loss": 0.0083, "step": 140100 }, { "epoch": 2.02, "learning_rate": 1.9327160226939724e-05, "loss": 0.0085, "step": 140110 }, { "epoch": 2.02, "learning_rate": 1.9327112187201254e-05, "loss": 0.0072, "step": 140120 }, { "epoch": 2.02, "learning_rate": 1.9327064147462783e-05, "loss": 0.0073, "step": 140130 }, { "epoch": 2.02, "learning_rate": 1.932701610772431e-05, "loss": 0.0072, "step": 140140 }, { "epoch": 2.02, "learning_rate": 1.9326968067985838e-05, "loss": 0.0118, "step": 140150 }, { "epoch": 2.02, "learning_rate": 1.9326920028247367e-05, "loss": 0.0086, "step": 140160 }, { "epoch": 2.02, "learning_rate": 1.9326871988508897e-05, "loss": 0.0055, "step": 140170 }, { "epoch": 2.02, "learning_rate": 1.9326823948770422e-05, "loss": 0.0086, "step": 140180 }, { "epoch": 2.02, "learning_rate": 1.9326775909031952e-05, "loss": 0.008, "step": 140190 }, { "epoch": 2.02, "learning_rate": 1.932672786929348e-05, "loss": 0.0092, "step": 140200 }, { "epoch": 2.02, "learning_rate": 1.9326679829555007e-05, "loss": 0.0087, "step": 140210 }, { "epoch": 2.02, "learning_rate": 1.9326631789816536e-05, "loss": 0.0048, "step": 140220 }, { "epoch": 2.02, "learning_rate": 1.9326583750078065e-05, "loss": 0.0078, "step": 140230 }, { "epoch": 2.02, "learning_rate": 1.9326535710339595e-05, "loss": 0.0076, "step": 140240 }, { "epoch": 2.02, "learning_rate": 1.932648767060112e-05, "loss": 0.0057, "step": 140250 }, { "epoch": 2.02, "learning_rate": 1.932643963086265e-05, "loss": 0.0088, "step": 140260 }, { "epoch": 2.02, "learning_rate": 1.932639159112418e-05, "loss": 0.0082, "step": 140270 }, { "epoch": 2.02, "learning_rate": 1.932634355138571e-05, "loss": 0.0086, "step": 140280 }, { "epoch": 2.02, "learning_rate": 1.9326295511647238e-05, "loss": 0.0071, "step": 140290 }, { "epoch": 2.02, "learning_rate": 1.9326247471908767e-05, "loss": 0.0085, "step": 140300 }, { "epoch": 2.02, "learning_rate": 1.9326199432170293e-05, "loss": 0.0098, "step": 140310 }, { "epoch": 2.02, "learning_rate": 1.9326151392431822e-05, "loss": 0.0056, "step": 140320 }, { "epoch": 2.02, "learning_rate": 1.932610335269335e-05, "loss": 0.0053, "step": 140330 }, { "epoch": 2.02, "learning_rate": 1.932605531295488e-05, "loss": 0.0105, "step": 140340 }, { "epoch": 2.02, "learning_rate": 1.9326007273216406e-05, "loss": 0.0065, "step": 140350 }, { "epoch": 2.02, "learning_rate": 1.9325959233477936e-05, "loss": 0.0067, "step": 140360 }, { "epoch": 2.02, "learning_rate": 1.9325911193739465e-05, "loss": 0.0078, "step": 140370 }, { "epoch": 2.02, "learning_rate": 1.932586315400099e-05, "loss": 0.0072, "step": 140380 }, { "epoch": 2.02, "learning_rate": 1.9325819918236366e-05, "loss": 0.0116, "step": 140390 }, { "epoch": 2.02, "learning_rate": 1.9325771878497895e-05, "loss": 0.0098, "step": 140400 }, { "epoch": 2.02, "learning_rate": 1.9325723838759424e-05, "loss": 0.008, "step": 140410 }, { "epoch": 2.02, "learning_rate": 1.932567579902095e-05, "loss": 0.0075, "step": 140420 }, { "epoch": 2.02, "learning_rate": 1.932562775928248e-05, "loss": 0.0091, "step": 140430 }, { "epoch": 2.02, "learning_rate": 1.932557971954401e-05, "loss": 0.0073, "step": 140440 }, { "epoch": 2.02, "learning_rate": 1.9325531679805534e-05, "loss": 0.0097, "step": 140450 }, { "epoch": 2.02, "learning_rate": 1.9325483640067064e-05, "loss": 0.0077, "step": 140460 }, { "epoch": 2.02, "learning_rate": 1.9325435600328593e-05, "loss": 0.0072, "step": 140470 }, { "epoch": 2.02, "learning_rate": 1.9325387560590122e-05, "loss": 0.0058, "step": 140480 }, { "epoch": 2.02, "learning_rate": 1.9325339520851648e-05, "loss": 0.0072, "step": 140490 }, { "epoch": 2.02, "learning_rate": 1.9325291481113177e-05, "loss": 0.008, "step": 140500 }, { "epoch": 2.03, "learning_rate": 1.9325243441374707e-05, "loss": 0.0088, "step": 140510 }, { "epoch": 2.03, "learning_rate": 1.9325195401636236e-05, "loss": 0.0111, "step": 140520 }, { "epoch": 2.03, "learning_rate": 1.9325147361897762e-05, "loss": 0.0061, "step": 140530 }, { "epoch": 2.03, "learning_rate": 1.932509932215929e-05, "loss": 0.0075, "step": 140540 }, { "epoch": 2.03, "learning_rate": 1.932505128242082e-05, "loss": 0.0067, "step": 140550 }, { "epoch": 2.03, "learning_rate": 1.9325003242682346e-05, "loss": 0.0077, "step": 140560 }, { "epoch": 2.03, "learning_rate": 1.9324955202943875e-05, "loss": 0.0097, "step": 140570 }, { "epoch": 2.03, "learning_rate": 1.9324907163205405e-05, "loss": 0.007, "step": 140580 }, { "epoch": 2.03, "learning_rate": 1.9324859123466934e-05, "loss": 0.0064, "step": 140590 }, { "epoch": 2.03, "learning_rate": 1.932481108372846e-05, "loss": 0.007, "step": 140600 }, { "epoch": 2.03, "learning_rate": 1.932476304398999e-05, "loss": 0.0083, "step": 140610 }, { "epoch": 2.03, "learning_rate": 1.932471500425152e-05, "loss": 0.0087, "step": 140620 }, { "epoch": 2.03, "learning_rate": 1.9324666964513044e-05, "loss": 0.0121, "step": 140630 }, { "epoch": 2.03, "learning_rate": 1.9324618924774574e-05, "loss": 0.0093, "step": 140640 }, { "epoch": 2.03, "learning_rate": 1.9324570885036103e-05, "loss": 0.0085, "step": 140650 }, { "epoch": 2.03, "learning_rate": 1.9324522845297632e-05, "loss": 0.0069, "step": 140660 }, { "epoch": 2.03, "learning_rate": 1.9324474805559158e-05, "loss": 0.0069, "step": 140670 }, { "epoch": 2.03, "learning_rate": 1.9324426765820687e-05, "loss": 0.0089, "step": 140680 }, { "epoch": 2.03, "learning_rate": 1.9324378726082217e-05, "loss": 0.0082, "step": 140690 }, { "epoch": 2.03, "learning_rate": 1.9324330686343742e-05, "loss": 0.007, "step": 140700 }, { "epoch": 2.03, "learning_rate": 1.932428264660527e-05, "loss": 0.0078, "step": 140710 }, { "epoch": 2.03, "learning_rate": 1.93242346068668e-05, "loss": 0.0055, "step": 140720 }, { "epoch": 2.03, "learning_rate": 1.932418656712833e-05, "loss": 0.0077, "step": 140730 }, { "epoch": 2.03, "learning_rate": 1.9324138527389856e-05, "loss": 0.0065, "step": 140740 }, { "epoch": 2.03, "learning_rate": 1.9324090487651385e-05, "loss": 0.0093, "step": 140750 }, { "epoch": 2.03, "learning_rate": 1.9324042447912915e-05, "loss": 0.01, "step": 140760 }, { "epoch": 2.03, "learning_rate": 1.9323994408174444e-05, "loss": 0.0066, "step": 140770 }, { "epoch": 2.03, "learning_rate": 1.932394636843597e-05, "loss": 0.0082, "step": 140780 }, { "epoch": 2.03, "learning_rate": 1.93238983286975e-05, "loss": 0.0085, "step": 140790 }, { "epoch": 2.03, "learning_rate": 1.932385028895903e-05, "loss": 0.0069, "step": 140800 }, { "epoch": 2.03, "learning_rate": 1.9323802249220558e-05, "loss": 0.0125, "step": 140810 }, { "epoch": 2.03, "learning_rate": 1.9323754209482087e-05, "loss": 0.0088, "step": 140820 }, { "epoch": 2.03, "learning_rate": 1.9323706169743616e-05, "loss": 0.0073, "step": 140830 }, { "epoch": 2.03, "learning_rate": 1.9323658130005142e-05, "loss": 0.0081, "step": 140840 }, { "epoch": 2.03, "learning_rate": 1.932361009026667e-05, "loss": 0.0062, "step": 140850 }, { "epoch": 2.03, "learning_rate": 1.93235620505282e-05, "loss": 0.0095, "step": 140860 }, { "epoch": 2.03, "learning_rate": 1.9323514010789726e-05, "loss": 0.01, "step": 140870 }, { "epoch": 2.03, "learning_rate": 1.9323465971051256e-05, "loss": 0.007, "step": 140880 }, { "epoch": 2.03, "learning_rate": 1.9323417931312785e-05, "loss": 0.0082, "step": 140890 }, { "epoch": 2.03, "learning_rate": 1.9323369891574314e-05, "loss": 0.0087, "step": 140900 }, { "epoch": 2.03, "learning_rate": 1.932332185183584e-05, "loss": 0.008, "step": 140910 }, { "epoch": 2.03, "learning_rate": 1.932327381209737e-05, "loss": 0.0088, "step": 140920 }, { "epoch": 2.03, "learning_rate": 1.93232257723589e-05, "loss": 0.0061, "step": 140930 }, { "epoch": 2.03, "learning_rate": 1.9323177732620425e-05, "loss": 0.0094, "step": 140940 }, { "epoch": 2.03, "learning_rate": 1.9323129692881954e-05, "loss": 0.0096, "step": 140950 }, { "epoch": 2.03, "learning_rate": 1.9323081653143483e-05, "loss": 0.0098, "step": 140960 }, { "epoch": 2.03, "learning_rate": 1.9323033613405012e-05, "loss": 0.0075, "step": 140970 }, { "epoch": 2.03, "learning_rate": 1.9322985573666538e-05, "loss": 0.009, "step": 140980 }, { "epoch": 2.03, "learning_rate": 1.9322937533928068e-05, "loss": 0.0092, "step": 140990 }, { "epoch": 2.03, "learning_rate": 1.9322889494189597e-05, "loss": 0.0083, "step": 141000 }, { "epoch": 2.03, "learning_rate": 1.9322841454451126e-05, "loss": 0.0064, "step": 141010 }, { "epoch": 2.03, "learning_rate": 1.9322793414712652e-05, "loss": 0.007, "step": 141020 }, { "epoch": 2.03, "learning_rate": 1.932274537497418e-05, "loss": 0.0121, "step": 141030 }, { "epoch": 2.03, "learning_rate": 1.932269733523571e-05, "loss": 0.0083, "step": 141040 }, { "epoch": 2.03, "learning_rate": 1.9322649295497236e-05, "loss": 0.0118, "step": 141050 }, { "epoch": 2.03, "learning_rate": 1.9322601255758766e-05, "loss": 0.0088, "step": 141060 }, { "epoch": 2.03, "learning_rate": 1.9322553216020295e-05, "loss": 0.0078, "step": 141070 }, { "epoch": 2.03, "learning_rate": 1.9322505176281824e-05, "loss": 0.0082, "step": 141080 }, { "epoch": 2.03, "learning_rate": 1.932245713654335e-05, "loss": 0.0081, "step": 141090 }, { "epoch": 2.03, "learning_rate": 1.932240909680488e-05, "loss": 0.0097, "step": 141100 }, { "epoch": 2.03, "learning_rate": 1.932236105706641e-05, "loss": 0.0122, "step": 141110 }, { "epoch": 2.03, "learning_rate": 1.9322313017327934e-05, "loss": 0.0107, "step": 141120 }, { "epoch": 2.03, "learning_rate": 1.9322264977589464e-05, "loss": 0.0067, "step": 141130 }, { "epoch": 2.03, "learning_rate": 1.9322216937850993e-05, "loss": 0.0046, "step": 141140 }, { "epoch": 2.03, "learning_rate": 1.9322168898112522e-05, "loss": 0.0103, "step": 141150 }, { "epoch": 2.03, "learning_rate": 1.9322120858374048e-05, "loss": 0.0064, "step": 141160 }, { "epoch": 2.03, "learning_rate": 1.9322072818635577e-05, "loss": 0.0063, "step": 141170 }, { "epoch": 2.03, "learning_rate": 1.9322024778897107e-05, "loss": 0.0074, "step": 141180 }, { "epoch": 2.03, "learning_rate": 1.9321976739158636e-05, "loss": 0.0105, "step": 141190 }, { "epoch": 2.03, "learning_rate": 1.9321928699420162e-05, "loss": 0.008, "step": 141200 }, { "epoch": 2.04, "learning_rate": 1.932188065968169e-05, "loss": 0.0062, "step": 141210 }, { "epoch": 2.04, "learning_rate": 1.932183261994322e-05, "loss": 0.007, "step": 141220 }, { "epoch": 2.04, "learning_rate": 1.9321784580204746e-05, "loss": 0.0062, "step": 141230 }, { "epoch": 2.04, "learning_rate": 1.9321736540466276e-05, "loss": 0.0109, "step": 141240 }, { "epoch": 2.04, "learning_rate": 1.9321688500727805e-05, "loss": 0.0069, "step": 141250 }, { "epoch": 2.04, "learning_rate": 1.9321640460989334e-05, "loss": 0.0099, "step": 141260 }, { "epoch": 2.04, "learning_rate": 1.932159242125086e-05, "loss": 0.0086, "step": 141270 }, { "epoch": 2.04, "learning_rate": 1.932154438151239e-05, "loss": 0.0063, "step": 141280 }, { "epoch": 2.04, "learning_rate": 1.932149634177392e-05, "loss": 0.0095, "step": 141290 }, { "epoch": 2.04, "learning_rate": 1.9321448302035444e-05, "loss": 0.0078, "step": 141300 }, { "epoch": 2.04, "learning_rate": 1.9321400262296974e-05, "loss": 0.0085, "step": 141310 }, { "epoch": 2.04, "learning_rate": 1.9321352222558503e-05, "loss": 0.0077, "step": 141320 }, { "epoch": 2.04, "learning_rate": 1.9321304182820032e-05, "loss": 0.008, "step": 141330 }, { "epoch": 2.04, "learning_rate": 1.9321256143081558e-05, "loss": 0.0088, "step": 141340 }, { "epoch": 2.04, "learning_rate": 1.9321208103343087e-05, "loss": 0.0071, "step": 141350 }, { "epoch": 2.04, "learning_rate": 1.9321160063604617e-05, "loss": 0.0085, "step": 141360 }, { "epoch": 2.04, "learning_rate": 1.9321112023866146e-05, "loss": 0.0079, "step": 141370 }, { "epoch": 2.04, "learning_rate": 1.9321063984127672e-05, "loss": 0.0081, "step": 141380 }, { "epoch": 2.04, "learning_rate": 1.93210159443892e-05, "loss": 0.0078, "step": 141390 }, { "epoch": 2.04, "learning_rate": 1.932096790465073e-05, "loss": 0.0097, "step": 141400 }, { "epoch": 2.04, "learning_rate": 1.9320919864912256e-05, "loss": 0.0075, "step": 141410 }, { "epoch": 2.04, "learning_rate": 1.9320871825173785e-05, "loss": 0.0079, "step": 141420 }, { "epoch": 2.04, "learning_rate": 1.9320823785435315e-05, "loss": 0.007, "step": 141430 }, { "epoch": 2.04, "learning_rate": 1.9320775745696844e-05, "loss": 0.0063, "step": 141440 }, { "epoch": 2.04, "learning_rate": 1.932072770595837e-05, "loss": 0.0058, "step": 141450 }, { "epoch": 2.04, "learning_rate": 1.93206796662199e-05, "loss": 0.0101, "step": 141460 }, { "epoch": 2.04, "learning_rate": 1.932063162648143e-05, "loss": 0.0067, "step": 141470 }, { "epoch": 2.04, "learning_rate": 1.9320583586742954e-05, "loss": 0.0085, "step": 141480 }, { "epoch": 2.04, "learning_rate": 1.9320535547004484e-05, "loss": 0.0077, "step": 141490 }, { "epoch": 2.04, "learning_rate": 1.9320487507266013e-05, "loss": 0.0064, "step": 141500 }, { "epoch": 2.04, "learning_rate": 1.9320439467527542e-05, "loss": 0.0074, "step": 141510 }, { "epoch": 2.04, "learning_rate": 1.9320391427789068e-05, "loss": 0.0075, "step": 141520 }, { "epoch": 2.04, "learning_rate": 1.9320343388050597e-05, "loss": 0.0071, "step": 141530 }, { "epoch": 2.04, "learning_rate": 1.9320295348312127e-05, "loss": 0.0054, "step": 141540 }, { "epoch": 2.04, "learning_rate": 1.9320247308573656e-05, "loss": 0.0082, "step": 141550 }, { "epoch": 2.04, "learning_rate": 1.932019926883518e-05, "loss": 0.0087, "step": 141560 }, { "epoch": 2.04, "learning_rate": 1.932015122909671e-05, "loss": 0.0083, "step": 141570 }, { "epoch": 2.04, "learning_rate": 1.932010318935824e-05, "loss": 0.008, "step": 141580 }, { "epoch": 2.04, "learning_rate": 1.9320055149619766e-05, "loss": 0.0121, "step": 141590 }, { "epoch": 2.04, "learning_rate": 1.9320007109881295e-05, "loss": 0.0054, "step": 141600 }, { "epoch": 2.04, "learning_rate": 1.9319959070142825e-05, "loss": 0.0054, "step": 141610 }, { "epoch": 2.04, "learning_rate": 1.9319911030404354e-05, "loss": 0.0074, "step": 141620 }, { "epoch": 2.04, "learning_rate": 1.931986299066588e-05, "loss": 0.0053, "step": 141630 }, { "epoch": 2.04, "learning_rate": 1.931981495092741e-05, "loss": 0.0089, "step": 141640 }, { "epoch": 2.04, "learning_rate": 1.931976691118894e-05, "loss": 0.005, "step": 141650 }, { "epoch": 2.04, "learning_rate": 1.9319718871450464e-05, "loss": 0.0096, "step": 141660 }, { "epoch": 2.04, "learning_rate": 1.9319670831711993e-05, "loss": 0.0059, "step": 141670 }, { "epoch": 2.04, "learning_rate": 1.9319622791973523e-05, "loss": 0.0063, "step": 141680 }, { "epoch": 2.04, "learning_rate": 1.9319574752235052e-05, "loss": 0.0066, "step": 141690 }, { "epoch": 2.04, "learning_rate": 1.9319526712496578e-05, "loss": 0.0085, "step": 141700 }, { "epoch": 2.04, "learning_rate": 1.9319478672758107e-05, "loss": 0.0059, "step": 141710 }, { "epoch": 2.04, "learning_rate": 1.9319430633019636e-05, "loss": 0.0063, "step": 141720 }, { "epoch": 2.04, "learning_rate": 1.9319382593281166e-05, "loss": 0.012, "step": 141730 }, { "epoch": 2.04, "learning_rate": 1.931933455354269e-05, "loss": 0.0076, "step": 141740 }, { "epoch": 2.04, "learning_rate": 1.931928651380422e-05, "loss": 0.0064, "step": 141750 }, { "epoch": 2.04, "learning_rate": 1.931923847406575e-05, "loss": 0.0087, "step": 141760 }, { "epoch": 2.04, "learning_rate": 1.9319190434327276e-05, "loss": 0.0107, "step": 141770 }, { "epoch": 2.04, "learning_rate": 1.9319142394588805e-05, "loss": 0.0093, "step": 141780 }, { "epoch": 2.04, "learning_rate": 1.9319094354850335e-05, "loss": 0.0056, "step": 141790 }, { "epoch": 2.04, "learning_rate": 1.9319046315111864e-05, "loss": 0.0071, "step": 141800 }, { "epoch": 2.04, "learning_rate": 1.931899827537339e-05, "loss": 0.0055, "step": 141810 }, { "epoch": 2.04, "learning_rate": 1.931895023563492e-05, "loss": 0.009, "step": 141820 }, { "epoch": 2.04, "learning_rate": 1.9318902195896448e-05, "loss": 0.0065, "step": 141830 }, { "epoch": 2.04, "learning_rate": 1.9318854156157974e-05, "loss": 0.0095, "step": 141840 }, { "epoch": 2.04, "learning_rate": 1.9318806116419503e-05, "loss": 0.0087, "step": 141850 }, { "epoch": 2.04, "learning_rate": 1.9318758076681033e-05, "loss": 0.0077, "step": 141860 }, { "epoch": 2.04, "learning_rate": 1.9318710036942562e-05, "loss": 0.0088, "step": 141870 }, { "epoch": 2.04, "learning_rate": 1.9318661997204088e-05, "loss": 0.0061, "step": 141880 }, { "epoch": 2.04, "learning_rate": 1.9318613957465617e-05, "loss": 0.0086, "step": 141890 }, { "epoch": 2.05, "learning_rate": 1.9318565917727146e-05, "loss": 0.008, "step": 141900 }, { "epoch": 2.05, "learning_rate": 1.9318517877988676e-05, "loss": 0.0053, "step": 141910 }, { "epoch": 2.05, "learning_rate": 1.93184698382502e-05, "loss": 0.0082, "step": 141920 }, { "epoch": 2.05, "learning_rate": 1.931842179851173e-05, "loss": 0.0095, "step": 141930 }, { "epoch": 2.05, "learning_rate": 1.931837375877326e-05, "loss": 0.0065, "step": 141940 }, { "epoch": 2.05, "learning_rate": 1.9318325719034786e-05, "loss": 0.0079, "step": 141950 }, { "epoch": 2.05, "learning_rate": 1.9318277679296315e-05, "loss": 0.0064, "step": 141960 }, { "epoch": 2.05, "learning_rate": 1.9318229639557844e-05, "loss": 0.006, "step": 141970 }, { "epoch": 2.05, "learning_rate": 1.9318181599819374e-05, "loss": 0.0072, "step": 141980 }, { "epoch": 2.05, "learning_rate": 1.93181335600809e-05, "loss": 0.0086, "step": 141990 }, { "epoch": 2.05, "learning_rate": 1.931808552034243e-05, "loss": 0.0088, "step": 142000 }, { "epoch": 2.05, "learning_rate": 1.9318037480603958e-05, "loss": 0.0085, "step": 142010 }, { "epoch": 2.05, "learning_rate": 1.9317989440865484e-05, "loss": 0.0069, "step": 142020 }, { "epoch": 2.05, "learning_rate": 1.9317941401127013e-05, "loss": 0.0065, "step": 142030 }, { "epoch": 2.05, "learning_rate": 1.9317893361388543e-05, "loss": 0.0065, "step": 142040 }, { "epoch": 2.05, "learning_rate": 1.9317845321650072e-05, "loss": 0.011, "step": 142050 }, { "epoch": 2.05, "learning_rate": 1.9317797281911598e-05, "loss": 0.0059, "step": 142060 }, { "epoch": 2.05, "learning_rate": 1.9317749242173127e-05, "loss": 0.0062, "step": 142070 }, { "epoch": 2.05, "learning_rate": 1.9317701202434656e-05, "loss": 0.0087, "step": 142080 }, { "epoch": 2.05, "learning_rate": 1.9317653162696182e-05, "loss": 0.0074, "step": 142090 }, { "epoch": 2.05, "learning_rate": 1.931760512295771e-05, "loss": 0.0105, "step": 142100 }, { "epoch": 2.05, "learning_rate": 1.931755708321924e-05, "loss": 0.0091, "step": 142110 }, { "epoch": 2.05, "learning_rate": 1.931750904348077e-05, "loss": 0.0083, "step": 142120 }, { "epoch": 2.05, "learning_rate": 1.9317461003742296e-05, "loss": 0.0056, "step": 142130 }, { "epoch": 2.05, "learning_rate": 1.9317412964003825e-05, "loss": 0.0045, "step": 142140 }, { "epoch": 2.05, "learning_rate": 1.9317364924265354e-05, "loss": 0.0086, "step": 142150 }, { "epoch": 2.05, "learning_rate": 1.9317316884526884e-05, "loss": 0.007, "step": 142160 }, { "epoch": 2.05, "learning_rate": 1.931726884478841e-05, "loss": 0.0059, "step": 142170 }, { "epoch": 2.05, "learning_rate": 1.931722080504994e-05, "loss": 0.0083, "step": 142180 }, { "epoch": 2.05, "learning_rate": 1.9317172765311468e-05, "loss": 0.008, "step": 142190 }, { "epoch": 2.05, "learning_rate": 1.9317124725572994e-05, "loss": 0.0089, "step": 142200 }, { "epoch": 2.05, "learning_rate": 1.9317076685834523e-05, "loss": 0.0052, "step": 142210 }, { "epoch": 2.05, "learning_rate": 1.9317028646096053e-05, "loss": 0.0093, "step": 142220 }, { "epoch": 2.05, "learning_rate": 1.9316980606357582e-05, "loss": 0.0075, "step": 142230 }, { "epoch": 2.05, "learning_rate": 1.9316932566619108e-05, "loss": 0.0063, "step": 142240 }, { "epoch": 2.05, "learning_rate": 1.9316884526880637e-05, "loss": 0.0083, "step": 142250 }, { "epoch": 2.05, "learning_rate": 1.9316836487142166e-05, "loss": 0.0093, "step": 142260 }, { "epoch": 2.05, "learning_rate": 1.9316788447403692e-05, "loss": 0.0072, "step": 142270 }, { "epoch": 2.05, "learning_rate": 1.931674040766522e-05, "loss": 0.0084, "step": 142280 }, { "epoch": 2.05, "learning_rate": 1.931669236792675e-05, "loss": 0.0075, "step": 142290 }, { "epoch": 2.05, "learning_rate": 1.931664432818828e-05, "loss": 0.0095, "step": 142300 }, { "epoch": 2.05, "learning_rate": 1.9316596288449806e-05, "loss": 0.0072, "step": 142310 }, { "epoch": 2.05, "learning_rate": 1.9316548248711335e-05, "loss": 0.006, "step": 142320 }, { "epoch": 2.05, "learning_rate": 1.9316500208972864e-05, "loss": 0.0079, "step": 142330 }, { "epoch": 2.05, "learning_rate": 1.9316452169234394e-05, "loss": 0.0057, "step": 142340 }, { "epoch": 2.05, "learning_rate": 1.931640412949592e-05, "loss": 0.0121, "step": 142350 }, { "epoch": 2.05, "learning_rate": 1.931635608975745e-05, "loss": 0.0057, "step": 142360 }, { "epoch": 2.05, "learning_rate": 1.9316308050018978e-05, "loss": 0.0089, "step": 142370 }, { "epoch": 2.05, "learning_rate": 1.9316260010280504e-05, "loss": 0.0054, "step": 142380 }, { "epoch": 2.05, "learning_rate": 1.9316211970542033e-05, "loss": 0.0096, "step": 142390 }, { "epoch": 2.05, "learning_rate": 1.9316163930803562e-05, "loss": 0.0069, "step": 142400 }, { "epoch": 2.05, "learning_rate": 1.931611589106509e-05, "loss": 0.0075, "step": 142410 }, { "epoch": 2.05, "learning_rate": 1.9316067851326618e-05, "loss": 0.0083, "step": 142420 }, { "epoch": 2.05, "learning_rate": 1.9316019811588147e-05, "loss": 0.008, "step": 142430 }, { "epoch": 2.05, "learning_rate": 1.9315971771849676e-05, "loss": 0.0098, "step": 142440 }, { "epoch": 2.05, "learning_rate": 1.9315923732111202e-05, "loss": 0.0082, "step": 142450 }, { "epoch": 2.05, "learning_rate": 1.931587569237273e-05, "loss": 0.0128, "step": 142460 }, { "epoch": 2.05, "learning_rate": 1.931582765263426e-05, "loss": 0.0077, "step": 142470 }, { "epoch": 2.05, "learning_rate": 1.931577961289579e-05, "loss": 0.0066, "step": 142480 }, { "epoch": 2.05, "learning_rate": 1.9315731573157316e-05, "loss": 0.0106, "step": 142490 }, { "epoch": 2.05, "learning_rate": 1.9315683533418845e-05, "loss": 0.0071, "step": 142500 }, { "epoch": 2.05, "learning_rate": 1.9315635493680374e-05, "loss": 0.0059, "step": 142510 }, { "epoch": 2.05, "learning_rate": 1.9315587453941903e-05, "loss": 0.0086, "step": 142520 }, { "epoch": 2.05, "learning_rate": 1.931553941420343e-05, "loss": 0.0059, "step": 142530 }, { "epoch": 2.05, "learning_rate": 1.931549137446496e-05, "loss": 0.0102, "step": 142540 }, { "epoch": 2.05, "learning_rate": 1.9315443334726488e-05, "loss": 0.0098, "step": 142550 }, { "epoch": 2.05, "learning_rate": 1.9315395294988014e-05, "loss": 0.0059, "step": 142560 }, { "epoch": 2.05, "learning_rate": 1.9315347255249543e-05, "loss": 0.0088, "step": 142570 }, { "epoch": 2.05, "learning_rate": 1.9315299215511072e-05, "loss": 0.005, "step": 142580 }, { "epoch": 2.05, "learning_rate": 1.93152511757726e-05, "loss": 0.0082, "step": 142590 }, { "epoch": 2.06, "learning_rate": 1.9315203136034127e-05, "loss": 0.0049, "step": 142600 }, { "epoch": 2.06, "learning_rate": 1.9315155096295657e-05, "loss": 0.0064, "step": 142610 }, { "epoch": 2.06, "learning_rate": 1.9315107056557186e-05, "loss": 0.0044, "step": 142620 }, { "epoch": 2.06, "learning_rate": 1.9315059016818712e-05, "loss": 0.0117, "step": 142630 }, { "epoch": 2.06, "learning_rate": 1.931501097708024e-05, "loss": 0.0081, "step": 142640 }, { "epoch": 2.06, "learning_rate": 1.931496293734177e-05, "loss": 0.0118, "step": 142650 }, { "epoch": 2.06, "learning_rate": 1.93149148976033e-05, "loss": 0.0067, "step": 142660 }, { "epoch": 2.06, "learning_rate": 1.9314866857864826e-05, "loss": 0.0062, "step": 142670 }, { "epoch": 2.06, "learning_rate": 1.9314818818126355e-05, "loss": 0.0056, "step": 142680 }, { "epoch": 2.06, "learning_rate": 1.9314770778387884e-05, "loss": 0.0062, "step": 142690 }, { "epoch": 2.06, "learning_rate": 1.9314722738649413e-05, "loss": 0.0087, "step": 142700 }, { "epoch": 2.06, "learning_rate": 1.931467469891094e-05, "loss": 0.0094, "step": 142710 }, { "epoch": 2.06, "learning_rate": 1.931462665917247e-05, "loss": 0.0052, "step": 142720 }, { "epoch": 2.06, "learning_rate": 1.9314578619433998e-05, "loss": 0.0052, "step": 142730 }, { "epoch": 2.06, "learning_rate": 1.9314530579695524e-05, "loss": 0.0095, "step": 142740 }, { "epoch": 2.06, "learning_rate": 1.9314482539957053e-05, "loss": 0.0067, "step": 142750 }, { "epoch": 2.06, "learning_rate": 1.9314434500218582e-05, "loss": 0.0048, "step": 142760 }, { "epoch": 2.06, "learning_rate": 1.931438646048011e-05, "loss": 0.0071, "step": 142770 }, { "epoch": 2.06, "learning_rate": 1.9314338420741637e-05, "loss": 0.009, "step": 142780 }, { "epoch": 2.06, "learning_rate": 1.9314290381003167e-05, "loss": 0.0085, "step": 142790 }, { "epoch": 2.06, "learning_rate": 1.9314242341264696e-05, "loss": 0.0067, "step": 142800 }, { "epoch": 2.06, "learning_rate": 1.9314194301526222e-05, "loss": 0.0093, "step": 142810 }, { "epoch": 2.06, "learning_rate": 1.931414626178775e-05, "loss": 0.0078, "step": 142820 }, { "epoch": 2.06, "learning_rate": 1.931409822204928e-05, "loss": 0.0086, "step": 142830 }, { "epoch": 2.06, "learning_rate": 1.931405018231081e-05, "loss": 0.0091, "step": 142840 }, { "epoch": 2.06, "learning_rate": 1.9314002142572336e-05, "loss": 0.0081, "step": 142850 }, { "epoch": 2.06, "learning_rate": 1.9313954102833865e-05, "loss": 0.0076, "step": 142860 }, { "epoch": 2.06, "learning_rate": 1.9313906063095394e-05, "loss": 0.0067, "step": 142870 }, { "epoch": 2.06, "learning_rate": 1.9313858023356923e-05, "loss": 0.0049, "step": 142880 }, { "epoch": 2.06, "learning_rate": 1.931380998361845e-05, "loss": 0.0091, "step": 142890 }, { "epoch": 2.06, "learning_rate": 1.931376194387998e-05, "loss": 0.008, "step": 142900 }, { "epoch": 2.06, "learning_rate": 1.9313713904141508e-05, "loss": 0.006, "step": 142910 }, { "epoch": 2.06, "learning_rate": 1.9313665864403034e-05, "loss": 0.0085, "step": 142920 }, { "epoch": 2.06, "learning_rate": 1.9313617824664563e-05, "loss": 0.0082, "step": 142930 }, { "epoch": 2.06, "learning_rate": 1.9313569784926092e-05, "loss": 0.0143, "step": 142940 }, { "epoch": 2.06, "learning_rate": 1.931352174518762e-05, "loss": 0.0065, "step": 142950 }, { "epoch": 2.06, "learning_rate": 1.9313473705449147e-05, "loss": 0.0123, "step": 142960 }, { "epoch": 2.06, "learning_rate": 1.9313425665710677e-05, "loss": 0.0062, "step": 142970 }, { "epoch": 2.06, "learning_rate": 1.9313377625972206e-05, "loss": 0.0125, "step": 142980 }, { "epoch": 2.06, "learning_rate": 1.9313329586233732e-05, "loss": 0.0071, "step": 142990 }, { "epoch": 2.06, "learning_rate": 1.931328154649526e-05, "loss": 0.0085, "step": 143000 }, { "epoch": 2.06, "learning_rate": 1.931323350675679e-05, "loss": 0.0089, "step": 143010 }, { "epoch": 2.06, "learning_rate": 1.931318546701832e-05, "loss": 0.0088, "step": 143020 }, { "epoch": 2.06, "learning_rate": 1.9313137427279845e-05, "loss": 0.0055, "step": 143030 }, { "epoch": 2.06, "learning_rate": 1.9313089387541375e-05, "loss": 0.0095, "step": 143040 }, { "epoch": 2.06, "learning_rate": 1.9313041347802904e-05, "loss": 0.0092, "step": 143050 }, { "epoch": 2.06, "learning_rate": 1.9312993308064433e-05, "loss": 0.0056, "step": 143060 }, { "epoch": 2.06, "learning_rate": 1.931294526832596e-05, "loss": 0.0103, "step": 143070 }, { "epoch": 2.06, "learning_rate": 1.931289722858749e-05, "loss": 0.0074, "step": 143080 }, { "epoch": 2.06, "learning_rate": 1.9312849188849018e-05, "loss": 0.0082, "step": 143090 }, { "epoch": 2.06, "learning_rate": 1.9312801149110544e-05, "loss": 0.0052, "step": 143100 }, { "epoch": 2.06, "learning_rate": 1.9312753109372073e-05, "loss": 0.0068, "step": 143110 }, { "epoch": 2.06, "learning_rate": 1.9312705069633602e-05, "loss": 0.0061, "step": 143120 }, { "epoch": 2.06, "learning_rate": 1.931265702989513e-05, "loss": 0.0093, "step": 143130 }, { "epoch": 2.06, "learning_rate": 1.9312608990156657e-05, "loss": 0.0075, "step": 143140 }, { "epoch": 2.06, "learning_rate": 1.9312560950418186e-05, "loss": 0.0073, "step": 143150 }, { "epoch": 2.06, "learning_rate": 1.9312512910679716e-05, "loss": 0.0065, "step": 143160 }, { "epoch": 2.06, "learning_rate": 1.931246487094124e-05, "loss": 0.0074, "step": 143170 }, { "epoch": 2.06, "learning_rate": 1.931241683120277e-05, "loss": 0.0092, "step": 143180 }, { "epoch": 2.06, "learning_rate": 1.93123687914643e-05, "loss": 0.0098, "step": 143190 }, { "epoch": 2.06, "learning_rate": 1.931232075172583e-05, "loss": 0.006, "step": 143200 }, { "epoch": 2.06, "learning_rate": 1.9312272711987355e-05, "loss": 0.0081, "step": 143210 }, { "epoch": 2.06, "learning_rate": 1.9312224672248885e-05, "loss": 0.0051, "step": 143220 }, { "epoch": 2.06, "learning_rate": 1.9312176632510414e-05, "loss": 0.0066, "step": 143230 }, { "epoch": 2.06, "learning_rate": 1.9312128592771943e-05, "loss": 0.0082, "step": 143240 }, { "epoch": 2.06, "learning_rate": 1.931208055303347e-05, "loss": 0.0067, "step": 143250 }, { "epoch": 2.06, "learning_rate": 1.9312032513294998e-05, "loss": 0.0084, "step": 143260 }, { "epoch": 2.06, "learning_rate": 1.9311984473556528e-05, "loss": 0.0077, "step": 143270 }, { "epoch": 2.06, "learning_rate": 1.9311936433818053e-05, "loss": 0.008, "step": 143280 }, { "epoch": 2.07, "learning_rate": 1.9311888394079583e-05, "loss": 0.009, "step": 143290 }, { "epoch": 2.07, "learning_rate": 1.9311840354341112e-05, "loss": 0.0101, "step": 143300 }, { "epoch": 2.07, "learning_rate": 1.931179231460264e-05, "loss": 0.0073, "step": 143310 }, { "epoch": 2.07, "learning_rate": 1.9311744274864167e-05, "loss": 0.0063, "step": 143320 }, { "epoch": 2.07, "learning_rate": 1.9311696235125696e-05, "loss": 0.0082, "step": 143330 }, { "epoch": 2.07, "learning_rate": 1.9311648195387226e-05, "loss": 0.009, "step": 143340 }, { "epoch": 2.07, "learning_rate": 1.931160015564875e-05, "loss": 0.0089, "step": 143350 }, { "epoch": 2.07, "learning_rate": 1.9311552115910284e-05, "loss": 0.0068, "step": 143360 }, { "epoch": 2.07, "learning_rate": 1.9311504076171813e-05, "loss": 0.0094, "step": 143370 }, { "epoch": 2.07, "learning_rate": 1.931145603643334e-05, "loss": 0.0075, "step": 143380 }, { "epoch": 2.07, "learning_rate": 1.931140799669487e-05, "loss": 0.0058, "step": 143390 }, { "epoch": 2.07, "learning_rate": 1.9311359956956398e-05, "loss": 0.0078, "step": 143400 }, { "epoch": 2.07, "learning_rate": 1.9311311917217924e-05, "loss": 0.0087, "step": 143410 }, { "epoch": 2.07, "learning_rate": 1.9311263877479453e-05, "loss": 0.0086, "step": 143420 }, { "epoch": 2.07, "learning_rate": 1.9311215837740982e-05, "loss": 0.0081, "step": 143430 }, { "epoch": 2.07, "learning_rate": 1.931116779800251e-05, "loss": 0.0059, "step": 143440 }, { "epoch": 2.07, "learning_rate": 1.9311119758264037e-05, "loss": 0.007, "step": 143450 }, { "epoch": 2.07, "learning_rate": 1.9311071718525567e-05, "loss": 0.0071, "step": 143460 }, { "epoch": 2.07, "learning_rate": 1.9311023678787096e-05, "loss": 0.01, "step": 143470 }, { "epoch": 2.07, "learning_rate": 1.9310975639048622e-05, "loss": 0.008, "step": 143480 }, { "epoch": 2.07, "learning_rate": 1.931092759931015e-05, "loss": 0.0078, "step": 143490 }, { "epoch": 2.07, "learning_rate": 1.931087955957168e-05, "loss": 0.0069, "step": 143500 }, { "epoch": 2.07, "learning_rate": 1.931083151983321e-05, "loss": 0.0094, "step": 143510 }, { "epoch": 2.07, "learning_rate": 1.9310783480094736e-05, "loss": 0.0064, "step": 143520 }, { "epoch": 2.07, "learning_rate": 1.9310735440356265e-05, "loss": 0.0074, "step": 143530 }, { "epoch": 2.07, "learning_rate": 1.9310687400617794e-05, "loss": 0.0074, "step": 143540 }, { "epoch": 2.07, "learning_rate": 1.9310639360879323e-05, "loss": 0.0084, "step": 143550 }, { "epoch": 2.07, "learning_rate": 1.931059132114085e-05, "loss": 0.0093, "step": 143560 }, { "epoch": 2.07, "learning_rate": 1.931054328140238e-05, "loss": 0.0089, "step": 143570 }, { "epoch": 2.07, "learning_rate": 1.9310495241663908e-05, "loss": 0.0084, "step": 143580 }, { "epoch": 2.07, "learning_rate": 1.9310447201925434e-05, "loss": 0.0057, "step": 143590 }, { "epoch": 2.07, "learning_rate": 1.9310399162186963e-05, "loss": 0.0051, "step": 143600 }, { "epoch": 2.07, "learning_rate": 1.9310351122448492e-05, "loss": 0.0087, "step": 143610 }, { "epoch": 2.07, "learning_rate": 1.931030308271002e-05, "loss": 0.0063, "step": 143620 }, { "epoch": 2.07, "learning_rate": 1.9310255042971547e-05, "loss": 0.0086, "step": 143630 }, { "epoch": 2.07, "learning_rate": 1.9310207003233077e-05, "loss": 0.0079, "step": 143640 }, { "epoch": 2.07, "learning_rate": 1.9310158963494606e-05, "loss": 0.0065, "step": 143650 }, { "epoch": 2.07, "learning_rate": 1.9310110923756132e-05, "loss": 0.0063, "step": 143660 }, { "epoch": 2.07, "learning_rate": 1.931006288401766e-05, "loss": 0.0097, "step": 143670 }, { "epoch": 2.07, "learning_rate": 1.931001484427919e-05, "loss": 0.0085, "step": 143680 }, { "epoch": 2.07, "learning_rate": 1.930996680454072e-05, "loss": 0.0134, "step": 143690 }, { "epoch": 2.07, "learning_rate": 1.9309918764802246e-05, "loss": 0.0095, "step": 143700 }, { "epoch": 2.07, "learning_rate": 1.9309870725063775e-05, "loss": 0.0063, "step": 143710 }, { "epoch": 2.07, "learning_rate": 1.9309822685325304e-05, "loss": 0.0086, "step": 143720 }, { "epoch": 2.07, "learning_rate": 1.9309774645586833e-05, "loss": 0.0081, "step": 143730 }, { "epoch": 2.07, "learning_rate": 1.930972660584836e-05, "loss": 0.0066, "step": 143740 }, { "epoch": 2.07, "learning_rate": 1.930967856610989e-05, "loss": 0.0095, "step": 143750 }, { "epoch": 2.07, "learning_rate": 1.9309630526371418e-05, "loss": 0.0066, "step": 143760 }, { "epoch": 2.07, "learning_rate": 1.9309582486632944e-05, "loss": 0.0066, "step": 143770 }, { "epoch": 2.07, "learning_rate": 1.9309534446894473e-05, "loss": 0.0082, "step": 143780 }, { "epoch": 2.07, "learning_rate": 1.9309486407156002e-05, "loss": 0.0073, "step": 143790 }, { "epoch": 2.07, "learning_rate": 1.930943836741753e-05, "loss": 0.0121, "step": 143800 }, { "epoch": 2.07, "learning_rate": 1.9309390327679057e-05, "loss": 0.0055, "step": 143810 }, { "epoch": 2.07, "learning_rate": 1.9309342287940587e-05, "loss": 0.0068, "step": 143820 }, { "epoch": 2.07, "learning_rate": 1.9309294248202116e-05, "loss": 0.0066, "step": 143830 }, { "epoch": 2.07, "learning_rate": 1.9309246208463642e-05, "loss": 0.0062, "step": 143840 }, { "epoch": 2.07, "learning_rate": 1.9309202972699016e-05, "loss": 0.0051, "step": 143850 }, { "epoch": 2.07, "learning_rate": 1.9309154932960546e-05, "loss": 0.0085, "step": 143860 }, { "epoch": 2.07, "learning_rate": 1.9309106893222075e-05, "loss": 0.0073, "step": 143870 }, { "epoch": 2.07, "learning_rate": 1.9309058853483604e-05, "loss": 0.0071, "step": 143880 }, { "epoch": 2.07, "learning_rate": 1.9309010813745133e-05, "loss": 0.0072, "step": 143890 }, { "epoch": 2.07, "learning_rate": 1.930896277400666e-05, "loss": 0.0101, "step": 143900 }, { "epoch": 2.07, "learning_rate": 1.930891473426819e-05, "loss": 0.0088, "step": 143910 }, { "epoch": 2.07, "learning_rate": 1.9308866694529718e-05, "loss": 0.0078, "step": 143920 }, { "epoch": 2.07, "learning_rate": 1.9308818654791247e-05, "loss": 0.0072, "step": 143930 }, { "epoch": 2.07, "learning_rate": 1.9308770615052773e-05, "loss": 0.0063, "step": 143940 }, { "epoch": 2.07, "learning_rate": 1.9308722575314302e-05, "loss": 0.0074, "step": 143950 }, { "epoch": 2.07, "learning_rate": 1.930867453557583e-05, "loss": 0.0086, "step": 143960 }, { "epoch": 2.07, "learning_rate": 1.930862649583736e-05, "loss": 0.0065, "step": 143970 }, { "epoch": 2.08, "learning_rate": 1.9308578456098887e-05, "loss": 0.0053, "step": 143980 }, { "epoch": 2.08, "learning_rate": 1.9308530416360416e-05, "loss": 0.0067, "step": 143990 }, { "epoch": 2.08, "learning_rate": 1.9308482376621945e-05, "loss": 0.0065, "step": 144000 }, { "epoch": 2.08, "learning_rate": 1.930843433688347e-05, "loss": 0.0067, "step": 144010 }, { "epoch": 2.08, "learning_rate": 1.9308386297145e-05, "loss": 0.008, "step": 144020 }, { "epoch": 2.08, "learning_rate": 1.930833825740653e-05, "loss": 0.0065, "step": 144030 }, { "epoch": 2.08, "learning_rate": 1.930829021766806e-05, "loss": 0.0056, "step": 144040 }, { "epoch": 2.08, "learning_rate": 1.9308242177929585e-05, "loss": 0.0087, "step": 144050 }, { "epoch": 2.08, "learning_rate": 1.9308194138191114e-05, "loss": 0.0078, "step": 144060 }, { "epoch": 2.08, "learning_rate": 1.9308146098452643e-05, "loss": 0.0063, "step": 144070 }, { "epoch": 2.08, "learning_rate": 1.930809805871417e-05, "loss": 0.0103, "step": 144080 }, { "epoch": 2.08, "learning_rate": 1.93080500189757e-05, "loss": 0.0073, "step": 144090 }, { "epoch": 2.08, "learning_rate": 1.9308001979237228e-05, "loss": 0.0077, "step": 144100 }, { "epoch": 2.08, "learning_rate": 1.9307953939498757e-05, "loss": 0.007, "step": 144110 }, { "epoch": 2.08, "learning_rate": 1.9307905899760283e-05, "loss": 0.0079, "step": 144120 }, { "epoch": 2.08, "learning_rate": 1.9307857860021812e-05, "loss": 0.006, "step": 144130 }, { "epoch": 2.08, "learning_rate": 1.930780982028334e-05, "loss": 0.0082, "step": 144140 }, { "epoch": 2.08, "learning_rate": 1.930776178054487e-05, "loss": 0.0095, "step": 144150 }, { "epoch": 2.08, "learning_rate": 1.9307713740806397e-05, "loss": 0.0065, "step": 144160 }, { "epoch": 2.08, "learning_rate": 1.9307665701067926e-05, "loss": 0.0071, "step": 144170 }, { "epoch": 2.08, "learning_rate": 1.9307617661329455e-05, "loss": 0.0066, "step": 144180 }, { "epoch": 2.08, "learning_rate": 1.930756962159098e-05, "loss": 0.0094, "step": 144190 }, { "epoch": 2.08, "learning_rate": 1.930752158185251e-05, "loss": 0.0081, "step": 144200 }, { "epoch": 2.08, "learning_rate": 1.930747354211404e-05, "loss": 0.0069, "step": 144210 }, { "epoch": 2.08, "learning_rate": 1.930742550237557e-05, "loss": 0.0096, "step": 144220 }, { "epoch": 2.08, "learning_rate": 1.9307377462637095e-05, "loss": 0.0072, "step": 144230 }, { "epoch": 2.08, "learning_rate": 1.9307329422898624e-05, "loss": 0.0087, "step": 144240 }, { "epoch": 2.08, "learning_rate": 1.9307281383160153e-05, "loss": 0.0056, "step": 144250 }, { "epoch": 2.08, "learning_rate": 1.930723334342168e-05, "loss": 0.0056, "step": 144260 }, { "epoch": 2.08, "learning_rate": 1.930718530368321e-05, "loss": 0.0083, "step": 144270 }, { "epoch": 2.08, "learning_rate": 1.9307137263944738e-05, "loss": 0.0114, "step": 144280 }, { "epoch": 2.08, "learning_rate": 1.9307089224206267e-05, "loss": 0.0062, "step": 144290 }, { "epoch": 2.08, "learning_rate": 1.9307041184467793e-05, "loss": 0.0085, "step": 144300 }, { "epoch": 2.08, "learning_rate": 1.9306993144729322e-05, "loss": 0.0074, "step": 144310 }, { "epoch": 2.08, "learning_rate": 1.930694510499085e-05, "loss": 0.0058, "step": 144320 }, { "epoch": 2.08, "learning_rate": 1.930689706525238e-05, "loss": 0.0101, "step": 144330 }, { "epoch": 2.08, "learning_rate": 1.9306849025513907e-05, "loss": 0.0108, "step": 144340 }, { "epoch": 2.08, "learning_rate": 1.9306800985775436e-05, "loss": 0.0063, "step": 144350 }, { "epoch": 2.08, "learning_rate": 1.9306752946036965e-05, "loss": 0.0073, "step": 144360 }, { "epoch": 2.08, "learning_rate": 1.930670490629849e-05, "loss": 0.0067, "step": 144370 }, { "epoch": 2.08, "learning_rate": 1.930665686656002e-05, "loss": 0.0053, "step": 144380 }, { "epoch": 2.08, "learning_rate": 1.930660882682155e-05, "loss": 0.0112, "step": 144390 }, { "epoch": 2.08, "learning_rate": 1.930656078708308e-05, "loss": 0.0107, "step": 144400 }, { "epoch": 2.08, "learning_rate": 1.9306512747344605e-05, "loss": 0.0054, "step": 144410 }, { "epoch": 2.08, "learning_rate": 1.9306464707606134e-05, "loss": 0.0093, "step": 144420 }, { "epoch": 2.08, "learning_rate": 1.9306416667867663e-05, "loss": 0.0083, "step": 144430 }, { "epoch": 2.08, "learning_rate": 1.930636862812919e-05, "loss": 0.0096, "step": 144440 }, { "epoch": 2.08, "learning_rate": 1.930632058839072e-05, "loss": 0.01, "step": 144450 }, { "epoch": 2.08, "learning_rate": 1.9306272548652248e-05, "loss": 0.0085, "step": 144460 }, { "epoch": 2.08, "learning_rate": 1.9306224508913777e-05, "loss": 0.0073, "step": 144470 }, { "epoch": 2.08, "learning_rate": 1.9306176469175303e-05, "loss": 0.0095, "step": 144480 }, { "epoch": 2.08, "learning_rate": 1.9306128429436832e-05, "loss": 0.0108, "step": 144490 }, { "epoch": 2.08, "learning_rate": 1.930608038969836e-05, "loss": 0.006, "step": 144500 }, { "epoch": 2.08, "learning_rate": 1.930603234995989e-05, "loss": 0.0066, "step": 144510 }, { "epoch": 2.08, "learning_rate": 1.9305984310221416e-05, "loss": 0.0061, "step": 144520 }, { "epoch": 2.08, "learning_rate": 1.9305936270482946e-05, "loss": 0.0077, "step": 144530 }, { "epoch": 2.08, "learning_rate": 1.9305888230744475e-05, "loss": 0.0091, "step": 144540 }, { "epoch": 2.08, "learning_rate": 1.9305840191006e-05, "loss": 0.0076, "step": 144550 }, { "epoch": 2.08, "learning_rate": 1.930579215126753e-05, "loss": 0.0095, "step": 144560 }, { "epoch": 2.08, "learning_rate": 1.930574411152906e-05, "loss": 0.0085, "step": 144570 }, { "epoch": 2.08, "learning_rate": 1.930569607179059e-05, "loss": 0.0064, "step": 144580 }, { "epoch": 2.08, "learning_rate": 1.9305648032052115e-05, "loss": 0.0071, "step": 144590 }, { "epoch": 2.08, "learning_rate": 1.9305599992313644e-05, "loss": 0.0083, "step": 144600 }, { "epoch": 2.08, "learning_rate": 1.9305551952575173e-05, "loss": 0.0076, "step": 144610 }, { "epoch": 2.08, "learning_rate": 1.93055039128367e-05, "loss": 0.0081, "step": 144620 }, { "epoch": 2.08, "learning_rate": 1.9305455873098228e-05, "loss": 0.0059, "step": 144630 }, { "epoch": 2.08, "learning_rate": 1.9305407833359758e-05, "loss": 0.0078, "step": 144640 }, { "epoch": 2.08, "learning_rate": 1.9305359793621287e-05, "loss": 0.008, "step": 144650 }, { "epoch": 2.08, "learning_rate": 1.9305311753882813e-05, "loss": 0.008, "step": 144660 }, { "epoch": 2.08, "learning_rate": 1.9305263714144342e-05, "loss": 0.0069, "step": 144670 }, { "epoch": 2.09, "learning_rate": 1.930521567440587e-05, "loss": 0.005, "step": 144680 }, { "epoch": 2.09, "learning_rate": 1.93051676346674e-05, "loss": 0.0074, "step": 144690 }, { "epoch": 2.09, "learning_rate": 1.9305119594928926e-05, "loss": 0.0052, "step": 144700 }, { "epoch": 2.09, "learning_rate": 1.9305071555190456e-05, "loss": 0.0081, "step": 144710 }, { "epoch": 2.09, "learning_rate": 1.9305023515451985e-05, "loss": 0.0049, "step": 144720 }, { "epoch": 2.09, "learning_rate": 1.930497547571351e-05, "loss": 0.0112, "step": 144730 }, { "epoch": 2.09, "learning_rate": 1.930492743597504e-05, "loss": 0.0088, "step": 144740 }, { "epoch": 2.09, "learning_rate": 1.930487939623657e-05, "loss": 0.0117, "step": 144750 }, { "epoch": 2.09, "learning_rate": 1.93048313564981e-05, "loss": 0.007, "step": 144760 }, { "epoch": 2.09, "learning_rate": 1.9304783316759624e-05, "loss": 0.0109, "step": 144770 }, { "epoch": 2.09, "learning_rate": 1.9304735277021154e-05, "loss": 0.0083, "step": 144780 }, { "epoch": 2.09, "learning_rate": 1.9304687237282683e-05, "loss": 0.0094, "step": 144790 }, { "epoch": 2.09, "learning_rate": 1.930463919754421e-05, "loss": 0.009, "step": 144800 }, { "epoch": 2.09, "learning_rate": 1.9304591157805738e-05, "loss": 0.0041, "step": 144810 }, { "epoch": 2.09, "learning_rate": 1.9304543118067267e-05, "loss": 0.0074, "step": 144820 }, { "epoch": 2.09, "learning_rate": 1.9304495078328797e-05, "loss": 0.0063, "step": 144830 }, { "epoch": 2.09, "learning_rate": 1.9304447038590323e-05, "loss": 0.0093, "step": 144840 }, { "epoch": 2.09, "learning_rate": 1.9304398998851852e-05, "loss": 0.01, "step": 144850 }, { "epoch": 2.09, "learning_rate": 1.930435095911338e-05, "loss": 0.0073, "step": 144860 }, { "epoch": 2.09, "learning_rate": 1.930430291937491e-05, "loss": 0.0079, "step": 144870 }, { "epoch": 2.09, "learning_rate": 1.9304254879636436e-05, "loss": 0.0064, "step": 144880 }, { "epoch": 2.09, "learning_rate": 1.9304206839897966e-05, "loss": 0.0076, "step": 144890 }, { "epoch": 2.09, "learning_rate": 1.9304158800159495e-05, "loss": 0.0058, "step": 144900 }, { "epoch": 2.09, "learning_rate": 1.930411076042102e-05, "loss": 0.0082, "step": 144910 }, { "epoch": 2.09, "learning_rate": 1.930406272068255e-05, "loss": 0.0075, "step": 144920 }, { "epoch": 2.09, "learning_rate": 1.930401468094408e-05, "loss": 0.0071, "step": 144930 }, { "epoch": 2.09, "learning_rate": 1.930396664120561e-05, "loss": 0.0086, "step": 144940 }, { "epoch": 2.09, "learning_rate": 1.9303918601467134e-05, "loss": 0.0067, "step": 144950 }, { "epoch": 2.09, "learning_rate": 1.9303870561728664e-05, "loss": 0.0074, "step": 144960 }, { "epoch": 2.09, "learning_rate": 1.9303822521990193e-05, "loss": 0.008, "step": 144970 }, { "epoch": 2.09, "learning_rate": 1.930377448225172e-05, "loss": 0.0085, "step": 144980 }, { "epoch": 2.09, "learning_rate": 1.9303726442513248e-05, "loss": 0.0091, "step": 144990 }, { "epoch": 2.09, "learning_rate": 1.9303678402774777e-05, "loss": 0.0112, "step": 145000 }, { "epoch": 2.09, "learning_rate": 1.9303630363036307e-05, "loss": 0.0064, "step": 145010 }, { "epoch": 2.09, "learning_rate": 1.9303582323297833e-05, "loss": 0.0099, "step": 145020 }, { "epoch": 2.09, "learning_rate": 1.9303534283559362e-05, "loss": 0.0086, "step": 145030 }, { "epoch": 2.09, "learning_rate": 1.930348624382089e-05, "loss": 0.0086, "step": 145040 }, { "epoch": 2.09, "learning_rate": 1.9303438204082417e-05, "loss": 0.0067, "step": 145050 }, { "epoch": 2.09, "learning_rate": 1.9303390164343946e-05, "loss": 0.0065, "step": 145060 }, { "epoch": 2.09, "learning_rate": 1.9303342124605475e-05, "loss": 0.0089, "step": 145070 }, { "epoch": 2.09, "learning_rate": 1.9303294084867005e-05, "loss": 0.0076, "step": 145080 }, { "epoch": 2.09, "learning_rate": 1.930324604512853e-05, "loss": 0.0055, "step": 145090 }, { "epoch": 2.09, "learning_rate": 1.930319800539006e-05, "loss": 0.0064, "step": 145100 }, { "epoch": 2.09, "learning_rate": 1.930314996565159e-05, "loss": 0.0064, "step": 145110 }, { "epoch": 2.09, "learning_rate": 1.930310192591312e-05, "loss": 0.0079, "step": 145120 }, { "epoch": 2.09, "learning_rate": 1.9303053886174644e-05, "loss": 0.0069, "step": 145130 }, { "epoch": 2.09, "learning_rate": 1.9303005846436174e-05, "loss": 0.0086, "step": 145140 }, { "epoch": 2.09, "learning_rate": 1.9302957806697703e-05, "loss": 0.0044, "step": 145150 }, { "epoch": 2.09, "learning_rate": 1.930290976695923e-05, "loss": 0.0078, "step": 145160 }, { "epoch": 2.09, "learning_rate": 1.9302861727220758e-05, "loss": 0.0047, "step": 145170 }, { "epoch": 2.09, "learning_rate": 1.9302813687482287e-05, "loss": 0.0073, "step": 145180 }, { "epoch": 2.09, "learning_rate": 1.9302765647743817e-05, "loss": 0.0074, "step": 145190 }, { "epoch": 2.09, "learning_rate": 1.9302717608005342e-05, "loss": 0.0103, "step": 145200 }, { "epoch": 2.09, "learning_rate": 1.9302669568266872e-05, "loss": 0.0069, "step": 145210 }, { "epoch": 2.09, "learning_rate": 1.93026215285284e-05, "loss": 0.0085, "step": 145220 }, { "epoch": 2.09, "learning_rate": 1.9302573488789927e-05, "loss": 0.0088, "step": 145230 }, { "epoch": 2.09, "learning_rate": 1.9302525449051456e-05, "loss": 0.0081, "step": 145240 }, { "epoch": 2.09, "learning_rate": 1.9302477409312985e-05, "loss": 0.0095, "step": 145250 }, { "epoch": 2.09, "learning_rate": 1.9302429369574515e-05, "loss": 0.0086, "step": 145260 }, { "epoch": 2.09, "learning_rate": 1.930238132983604e-05, "loss": 0.0117, "step": 145270 }, { "epoch": 2.09, "learning_rate": 1.930233329009757e-05, "loss": 0.0085, "step": 145280 }, { "epoch": 2.09, "learning_rate": 1.93022852503591e-05, "loss": 0.0099, "step": 145290 }, { "epoch": 2.09, "learning_rate": 1.930223721062063e-05, "loss": 0.0094, "step": 145300 }, { "epoch": 2.09, "learning_rate": 1.9302189170882154e-05, "loss": 0.0069, "step": 145310 }, { "epoch": 2.09, "learning_rate": 1.9302141131143684e-05, "loss": 0.0076, "step": 145320 }, { "epoch": 2.09, "learning_rate": 1.9302093091405213e-05, "loss": 0.0064, "step": 145330 }, { "epoch": 2.09, "learning_rate": 1.930204505166674e-05, "loss": 0.0086, "step": 145340 }, { "epoch": 2.09, "learning_rate": 1.9301997011928268e-05, "loss": 0.0122, "step": 145350 }, { "epoch": 2.09, "learning_rate": 1.9301948972189797e-05, "loss": 0.0077, "step": 145360 }, { "epoch": 2.1, "learning_rate": 1.9301900932451326e-05, "loss": 0.0096, "step": 145370 }, { "epoch": 2.1, "learning_rate": 1.9301852892712852e-05, "loss": 0.0085, "step": 145380 }, { "epoch": 2.1, "learning_rate": 1.930180485297438e-05, "loss": 0.0087, "step": 145390 }, { "epoch": 2.1, "learning_rate": 1.930175681323591e-05, "loss": 0.0101, "step": 145400 }, { "epoch": 2.1, "learning_rate": 1.9301708773497437e-05, "loss": 0.0093, "step": 145410 }, { "epoch": 2.1, "learning_rate": 1.9301660733758966e-05, "loss": 0.0069, "step": 145420 }, { "epoch": 2.1, "learning_rate": 1.9301612694020495e-05, "loss": 0.0079, "step": 145430 }, { "epoch": 2.1, "learning_rate": 1.9301564654282025e-05, "loss": 0.0091, "step": 145440 }, { "epoch": 2.1, "learning_rate": 1.930151661454355e-05, "loss": 0.0082, "step": 145450 }, { "epoch": 2.1, "learning_rate": 1.930146857480508e-05, "loss": 0.0096, "step": 145460 }, { "epoch": 2.1, "learning_rate": 1.930142053506661e-05, "loss": 0.0094, "step": 145470 }, { "epoch": 2.1, "learning_rate": 1.9301372495328138e-05, "loss": 0.0066, "step": 145480 }, { "epoch": 2.1, "learning_rate": 1.9301324455589664e-05, "loss": 0.0058, "step": 145490 }, { "epoch": 2.1, "learning_rate": 1.9301276415851193e-05, "loss": 0.008, "step": 145500 }, { "epoch": 2.1, "learning_rate": 1.9301228376112723e-05, "loss": 0.0088, "step": 145510 }, { "epoch": 2.1, "learning_rate": 1.930118033637425e-05, "loss": 0.008, "step": 145520 }, { "epoch": 2.1, "learning_rate": 1.9301132296635778e-05, "loss": 0.0065, "step": 145530 }, { "epoch": 2.1, "learning_rate": 1.9301084256897307e-05, "loss": 0.0099, "step": 145540 }, { "epoch": 2.1, "learning_rate": 1.9301036217158836e-05, "loss": 0.0072, "step": 145550 }, { "epoch": 2.1, "learning_rate": 1.9300988177420362e-05, "loss": 0.0096, "step": 145560 }, { "epoch": 2.1, "learning_rate": 1.930094013768189e-05, "loss": 0.0055, "step": 145570 }, { "epoch": 2.1, "learning_rate": 1.930089209794342e-05, "loss": 0.0103, "step": 145580 }, { "epoch": 2.1, "learning_rate": 1.9300844058204947e-05, "loss": 0.0063, "step": 145590 }, { "epoch": 2.1, "learning_rate": 1.9300796018466476e-05, "loss": 0.0088, "step": 145600 }, { "epoch": 2.1, "learning_rate": 1.9300747978728005e-05, "loss": 0.0069, "step": 145610 }, { "epoch": 2.1, "learning_rate": 1.9300699938989535e-05, "loss": 0.0099, "step": 145620 }, { "epoch": 2.1, "learning_rate": 1.930065189925106e-05, "loss": 0.0075, "step": 145630 }, { "epoch": 2.1, "learning_rate": 1.930060385951259e-05, "loss": 0.0081, "step": 145640 }, { "epoch": 2.1, "learning_rate": 1.930055581977412e-05, "loss": 0.0088, "step": 145650 }, { "epoch": 2.1, "learning_rate": 1.9300507780035648e-05, "loss": 0.0053, "step": 145660 }, { "epoch": 2.1, "learning_rate": 1.9300459740297174e-05, "loss": 0.0044, "step": 145670 }, { "epoch": 2.1, "learning_rate": 1.9300411700558703e-05, "loss": 0.0101, "step": 145680 }, { "epoch": 2.1, "learning_rate": 1.9300363660820233e-05, "loss": 0.0082, "step": 145690 }, { "epoch": 2.1, "learning_rate": 1.930031562108176e-05, "loss": 0.0069, "step": 145700 }, { "epoch": 2.1, "learning_rate": 1.9300267581343288e-05, "loss": 0.0065, "step": 145710 }, { "epoch": 2.1, "learning_rate": 1.9300219541604817e-05, "loss": 0.0115, "step": 145720 }, { "epoch": 2.1, "learning_rate": 1.9300171501866346e-05, "loss": 0.0065, "step": 145730 }, { "epoch": 2.1, "learning_rate": 1.9300123462127872e-05, "loss": 0.0083, "step": 145740 }, { "epoch": 2.1, "learning_rate": 1.93000754223894e-05, "loss": 0.0087, "step": 145750 }, { "epoch": 2.1, "learning_rate": 1.930002738265093e-05, "loss": 0.0126, "step": 145760 }, { "epoch": 2.1, "learning_rate": 1.9299979342912457e-05, "loss": 0.0053, "step": 145770 }, { "epoch": 2.1, "learning_rate": 1.9299931303173986e-05, "loss": 0.008, "step": 145780 }, { "epoch": 2.1, "learning_rate": 1.9299883263435515e-05, "loss": 0.0056, "step": 145790 }, { "epoch": 2.1, "learning_rate": 1.9299835223697044e-05, "loss": 0.0054, "step": 145800 }, { "epoch": 2.1, "learning_rate": 1.929978718395857e-05, "loss": 0.0082, "step": 145810 }, { "epoch": 2.1, "learning_rate": 1.92997391442201e-05, "loss": 0.0088, "step": 145820 }, { "epoch": 2.1, "learning_rate": 1.929969110448163e-05, "loss": 0.0095, "step": 145830 }, { "epoch": 2.1, "learning_rate": 1.9299643064743158e-05, "loss": 0.0069, "step": 145840 }, { "epoch": 2.1, "learning_rate": 1.9299595025004684e-05, "loss": 0.0062, "step": 145850 }, { "epoch": 2.1, "learning_rate": 1.9299546985266213e-05, "loss": 0.0077, "step": 145860 }, { "epoch": 2.1, "learning_rate": 1.9299498945527743e-05, "loss": 0.0101, "step": 145870 }, { "epoch": 2.1, "learning_rate": 1.929945090578927e-05, "loss": 0.0083, "step": 145880 }, { "epoch": 2.1, "learning_rate": 1.9299402866050798e-05, "loss": 0.0073, "step": 145890 }, { "epoch": 2.1, "learning_rate": 1.9299354826312327e-05, "loss": 0.0072, "step": 145900 }, { "epoch": 2.1, "learning_rate": 1.9299306786573856e-05, "loss": 0.01, "step": 145910 }, { "epoch": 2.1, "learning_rate": 1.9299258746835382e-05, "loss": 0.0066, "step": 145920 }, { "epoch": 2.1, "learning_rate": 1.929921070709691e-05, "loss": 0.005, "step": 145930 }, { "epoch": 2.1, "learning_rate": 1.929916266735844e-05, "loss": 0.0085, "step": 145940 }, { "epoch": 2.1, "learning_rate": 1.9299114627619967e-05, "loss": 0.0071, "step": 145950 }, { "epoch": 2.1, "learning_rate": 1.9299066587881496e-05, "loss": 0.0072, "step": 145960 }, { "epoch": 2.1, "learning_rate": 1.9299018548143025e-05, "loss": 0.0082, "step": 145970 }, { "epoch": 2.1, "learning_rate": 1.9298970508404554e-05, "loss": 0.0084, "step": 145980 }, { "epoch": 2.1, "learning_rate": 1.929892246866608e-05, "loss": 0.0116, "step": 145990 }, { "epoch": 2.1, "learning_rate": 1.929887442892761e-05, "loss": 0.0096, "step": 146000 }, { "epoch": 2.1, "learning_rate": 1.929882638918914e-05, "loss": 0.0096, "step": 146010 }, { "epoch": 2.1, "learning_rate": 1.9298778349450668e-05, "loss": 0.0076, "step": 146020 }, { "epoch": 2.1, "learning_rate": 1.9298730309712194e-05, "loss": 0.0086, "step": 146030 }, { "epoch": 2.1, "learning_rate": 1.9298682269973723e-05, "loss": 0.0075, "step": 146040 }, { "epoch": 2.1, "learning_rate": 1.9298634230235252e-05, "loss": 0.0103, "step": 146050 }, { "epoch": 2.11, "learning_rate": 1.929858619049678e-05, "loss": 0.0095, "step": 146060 }, { "epoch": 2.11, "learning_rate": 1.9298538150758308e-05, "loss": 0.0086, "step": 146070 }, { "epoch": 2.11, "learning_rate": 1.9298490111019837e-05, "loss": 0.0087, "step": 146080 }, { "epoch": 2.11, "learning_rate": 1.9298442071281366e-05, "loss": 0.0082, "step": 146090 }, { "epoch": 2.11, "learning_rate": 1.9298394031542892e-05, "loss": 0.0088, "step": 146100 }, { "epoch": 2.11, "learning_rate": 1.929834599180442e-05, "loss": 0.0075, "step": 146110 }, { "epoch": 2.11, "learning_rate": 1.929829795206595e-05, "loss": 0.0068, "step": 146120 }, { "epoch": 2.11, "learning_rate": 1.9298249912327476e-05, "loss": 0.0104, "step": 146130 }, { "epoch": 2.11, "learning_rate": 1.9298201872589006e-05, "loss": 0.0084, "step": 146140 }, { "epoch": 2.11, "learning_rate": 1.9298153832850535e-05, "loss": 0.0068, "step": 146150 }, { "epoch": 2.11, "learning_rate": 1.9298105793112064e-05, "loss": 0.0064, "step": 146160 }, { "epoch": 2.11, "learning_rate": 1.929805775337359e-05, "loss": 0.0107, "step": 146170 }, { "epoch": 2.11, "learning_rate": 1.929800971363512e-05, "loss": 0.008, "step": 146180 }, { "epoch": 2.11, "learning_rate": 1.929796167389665e-05, "loss": 0.0076, "step": 146190 }, { "epoch": 2.11, "learning_rate": 1.9297913634158178e-05, "loss": 0.0083, "step": 146200 }, { "epoch": 2.11, "learning_rate": 1.9297865594419704e-05, "loss": 0.0065, "step": 146210 }, { "epoch": 2.11, "learning_rate": 1.9297817554681233e-05, "loss": 0.0079, "step": 146220 }, { "epoch": 2.11, "learning_rate": 1.9297769514942762e-05, "loss": 0.0058, "step": 146230 }, { "epoch": 2.11, "learning_rate": 1.9297721475204288e-05, "loss": 0.0073, "step": 146240 }, { "epoch": 2.11, "learning_rate": 1.9297673435465818e-05, "loss": 0.0057, "step": 146250 }, { "epoch": 2.11, "learning_rate": 1.9297625395727347e-05, "loss": 0.0073, "step": 146260 }, { "epoch": 2.11, "learning_rate": 1.9297577355988876e-05, "loss": 0.0096, "step": 146270 }, { "epoch": 2.11, "learning_rate": 1.9297529316250402e-05, "loss": 0.0048, "step": 146280 }, { "epoch": 2.11, "learning_rate": 1.929748127651193e-05, "loss": 0.0059, "step": 146290 }, { "epoch": 2.11, "learning_rate": 1.929743323677346e-05, "loss": 0.0085, "step": 146300 }, { "epoch": 2.11, "learning_rate": 1.9297385197034986e-05, "loss": 0.0071, "step": 146310 }, { "epoch": 2.11, "learning_rate": 1.9297337157296516e-05, "loss": 0.0068, "step": 146320 }, { "epoch": 2.11, "learning_rate": 1.9297289117558045e-05, "loss": 0.0088, "step": 146330 }, { "epoch": 2.11, "learning_rate": 1.9297241077819574e-05, "loss": 0.0085, "step": 146340 }, { "epoch": 2.11, "learning_rate": 1.92971930380811e-05, "loss": 0.0063, "step": 146350 }, { "epoch": 2.11, "learning_rate": 1.929714499834263e-05, "loss": 0.0093, "step": 146360 }, { "epoch": 2.11, "learning_rate": 1.929709695860416e-05, "loss": 0.0073, "step": 146370 }, { "epoch": 2.11, "learning_rate": 1.9297048918865688e-05, "loss": 0.0072, "step": 146380 }, { "epoch": 2.11, "learning_rate": 1.9297000879127214e-05, "loss": 0.0074, "step": 146390 }, { "epoch": 2.11, "learning_rate": 1.9296952839388743e-05, "loss": 0.0078, "step": 146400 }, { "epoch": 2.11, "learning_rate": 1.9296904799650272e-05, "loss": 0.0057, "step": 146410 }, { "epoch": 2.11, "learning_rate": 1.9296856759911798e-05, "loss": 0.0049, "step": 146420 }, { "epoch": 2.11, "learning_rate": 1.9296808720173327e-05, "loss": 0.0084, "step": 146430 }, { "epoch": 2.11, "learning_rate": 1.929676068043486e-05, "loss": 0.0093, "step": 146440 }, { "epoch": 2.11, "learning_rate": 1.9296712640696386e-05, "loss": 0.0112, "step": 146450 }, { "epoch": 2.11, "learning_rate": 1.9296664600957915e-05, "loss": 0.0107, "step": 146460 }, { "epoch": 2.11, "learning_rate": 1.9296616561219445e-05, "loss": 0.0046, "step": 146470 }, { "epoch": 2.11, "learning_rate": 1.929656852148097e-05, "loss": 0.0078, "step": 146480 }, { "epoch": 2.11, "learning_rate": 1.92965204817425e-05, "loss": 0.0075, "step": 146490 }, { "epoch": 2.11, "learning_rate": 1.929647244200403e-05, "loss": 0.0115, "step": 146500 }, { "epoch": 2.11, "learning_rate": 1.9296424402265558e-05, "loss": 0.0089, "step": 146510 }, { "epoch": 2.11, "learning_rate": 1.9296376362527084e-05, "loss": 0.0118, "step": 146520 }, { "epoch": 2.11, "learning_rate": 1.9296328322788613e-05, "loss": 0.0061, "step": 146530 }, { "epoch": 2.11, "learning_rate": 1.9296280283050143e-05, "loss": 0.0068, "step": 146540 }, { "epoch": 2.11, "learning_rate": 1.929623224331167e-05, "loss": 0.0079, "step": 146550 }, { "epoch": 2.11, "learning_rate": 1.9296184203573198e-05, "loss": 0.0085, "step": 146560 }, { "epoch": 2.11, "learning_rate": 1.9296136163834727e-05, "loss": 0.0091, "step": 146570 }, { "epoch": 2.11, "learning_rate": 1.9296088124096256e-05, "loss": 0.0095, "step": 146580 }, { "epoch": 2.11, "learning_rate": 1.9296040084357782e-05, "loss": 0.0065, "step": 146590 }, { "epoch": 2.11, "learning_rate": 1.929599204461931e-05, "loss": 0.012, "step": 146600 }, { "epoch": 2.11, "learning_rate": 1.929594400488084e-05, "loss": 0.0117, "step": 146610 }, { "epoch": 2.11, "learning_rate": 1.9295895965142367e-05, "loss": 0.0063, "step": 146620 }, { "epoch": 2.11, "learning_rate": 1.9295847925403896e-05, "loss": 0.0059, "step": 146630 }, { "epoch": 2.11, "learning_rate": 1.9295799885665425e-05, "loss": 0.0102, "step": 146640 }, { "epoch": 2.11, "learning_rate": 1.9295751845926954e-05, "loss": 0.0089, "step": 146650 }, { "epoch": 2.11, "learning_rate": 1.929570380618848e-05, "loss": 0.0081, "step": 146660 }, { "epoch": 2.11, "learning_rate": 1.929565576645001e-05, "loss": 0.0069, "step": 146670 }, { "epoch": 2.11, "learning_rate": 1.9295612530685384e-05, "loss": 0.0087, "step": 146680 }, { "epoch": 2.11, "learning_rate": 1.9295564490946913e-05, "loss": 0.0086, "step": 146690 }, { "epoch": 2.11, "learning_rate": 1.929551645120844e-05, "loss": 0.0059, "step": 146700 }, { "epoch": 2.11, "learning_rate": 1.929546841146997e-05, "loss": 0.0053, "step": 146710 }, { "epoch": 2.11, "learning_rate": 1.9295420371731498e-05, "loss": 0.0086, "step": 146720 }, { "epoch": 2.11, "learning_rate": 1.9295372331993024e-05, "loss": 0.0066, "step": 146730 }, { "epoch": 2.11, "learning_rate": 1.9295324292254553e-05, "loss": 0.0072, "step": 146740 }, { "epoch": 2.11, "learning_rate": 1.9295276252516082e-05, "loss": 0.0051, "step": 146750 }, { "epoch": 2.12, "learning_rate": 1.929522821277761e-05, "loss": 0.008, "step": 146760 }, { "epoch": 2.12, "learning_rate": 1.9295180173039137e-05, "loss": 0.0066, "step": 146770 }, { "epoch": 2.12, "learning_rate": 1.9295132133300667e-05, "loss": 0.0068, "step": 146780 }, { "epoch": 2.12, "learning_rate": 1.9295084093562196e-05, "loss": 0.0094, "step": 146790 }, { "epoch": 2.12, "learning_rate": 1.9295036053823722e-05, "loss": 0.0066, "step": 146800 }, { "epoch": 2.12, "learning_rate": 1.929498801408525e-05, "loss": 0.0077, "step": 146810 }, { "epoch": 2.12, "learning_rate": 1.929493997434678e-05, "loss": 0.0084, "step": 146820 }, { "epoch": 2.12, "learning_rate": 1.929489193460831e-05, "loss": 0.008, "step": 146830 }, { "epoch": 2.12, "learning_rate": 1.9294843894869836e-05, "loss": 0.0223, "step": 146840 }, { "epoch": 2.12, "learning_rate": 1.9294795855131365e-05, "loss": 0.0087, "step": 146850 }, { "epoch": 2.12, "learning_rate": 1.9294747815392894e-05, "loss": 0.0054, "step": 146860 }, { "epoch": 2.12, "learning_rate": 1.9294699775654423e-05, "loss": 0.0066, "step": 146870 }, { "epoch": 2.12, "learning_rate": 1.929465173591595e-05, "loss": 0.006, "step": 146880 }, { "epoch": 2.12, "learning_rate": 1.929460369617748e-05, "loss": 0.0106, "step": 146890 }, { "epoch": 2.12, "learning_rate": 1.9294555656439008e-05, "loss": 0.0109, "step": 146900 }, { "epoch": 2.12, "learning_rate": 1.9294507616700534e-05, "loss": 0.011, "step": 146910 }, { "epoch": 2.12, "learning_rate": 1.9294459576962063e-05, "loss": 0.0079, "step": 146920 }, { "epoch": 2.12, "learning_rate": 1.9294411537223592e-05, "loss": 0.0079, "step": 146930 }, { "epoch": 2.12, "learning_rate": 1.929436349748512e-05, "loss": 0.0077, "step": 146940 }, { "epoch": 2.12, "learning_rate": 1.929431545774665e-05, "loss": 0.0073, "step": 146950 }, { "epoch": 2.12, "learning_rate": 1.929426741800818e-05, "loss": 0.0084, "step": 146960 }, { "epoch": 2.12, "learning_rate": 1.9294219378269706e-05, "loss": 0.0055, "step": 146970 }, { "epoch": 2.12, "learning_rate": 1.9294171338531235e-05, "loss": 0.008, "step": 146980 }, { "epoch": 2.12, "learning_rate": 1.9294123298792764e-05, "loss": 0.008, "step": 146990 }, { "epoch": 2.12, "learning_rate": 1.9294075259054294e-05, "loss": 0.0122, "step": 147000 }, { "epoch": 2.12, "learning_rate": 1.929402721931582e-05, "loss": 0.0119, "step": 147010 }, { "epoch": 2.12, "learning_rate": 1.929397917957735e-05, "loss": 0.0126, "step": 147020 }, { "epoch": 2.12, "learning_rate": 1.9293931139838878e-05, "loss": 0.01, "step": 147030 }, { "epoch": 2.12, "learning_rate": 1.9293883100100404e-05, "loss": 0.0052, "step": 147040 }, { "epoch": 2.12, "learning_rate": 1.9293835060361933e-05, "loss": 0.0087, "step": 147050 }, { "epoch": 2.12, "learning_rate": 1.9293787020623463e-05, "loss": 0.0113, "step": 147060 }, { "epoch": 2.12, "learning_rate": 1.9293738980884992e-05, "loss": 0.0057, "step": 147070 }, { "epoch": 2.12, "learning_rate": 1.9293690941146518e-05, "loss": 0.0072, "step": 147080 }, { "epoch": 2.12, "learning_rate": 1.9293642901408047e-05, "loss": 0.0084, "step": 147090 }, { "epoch": 2.12, "learning_rate": 1.9293594861669576e-05, "loss": 0.007, "step": 147100 }, { "epoch": 2.12, "learning_rate": 1.9293546821931106e-05, "loss": 0.0083, "step": 147110 }, { "epoch": 2.12, "learning_rate": 1.929349878219263e-05, "loss": 0.0083, "step": 147120 }, { "epoch": 2.12, "learning_rate": 1.929345074245416e-05, "loss": 0.0065, "step": 147130 }, { "epoch": 2.12, "learning_rate": 1.929340270271569e-05, "loss": 0.0071, "step": 147140 }, { "epoch": 2.12, "learning_rate": 1.9293354662977216e-05, "loss": 0.0095, "step": 147150 }, { "epoch": 2.12, "learning_rate": 1.9293306623238745e-05, "loss": 0.0072, "step": 147160 }, { "epoch": 2.12, "learning_rate": 1.9293258583500274e-05, "loss": 0.0098, "step": 147170 }, { "epoch": 2.12, "learning_rate": 1.9293210543761804e-05, "loss": 0.0095, "step": 147180 }, { "epoch": 2.12, "learning_rate": 1.929316250402333e-05, "loss": 0.009, "step": 147190 }, { "epoch": 2.12, "learning_rate": 1.929311446428486e-05, "loss": 0.0103, "step": 147200 }, { "epoch": 2.12, "learning_rate": 1.9293066424546388e-05, "loss": 0.0094, "step": 147210 }, { "epoch": 2.12, "learning_rate": 1.9293018384807914e-05, "loss": 0.006, "step": 147220 }, { "epoch": 2.12, "learning_rate": 1.9292970345069443e-05, "loss": 0.007, "step": 147230 }, { "epoch": 2.12, "learning_rate": 1.9292922305330973e-05, "loss": 0.0062, "step": 147240 }, { "epoch": 2.12, "learning_rate": 1.9292874265592502e-05, "loss": 0.0075, "step": 147250 }, { "epoch": 2.12, "learning_rate": 1.9292826225854028e-05, "loss": 0.0085, "step": 147260 }, { "epoch": 2.12, "learning_rate": 1.9292778186115557e-05, "loss": 0.0063, "step": 147270 }, { "epoch": 2.12, "learning_rate": 1.9292730146377086e-05, "loss": 0.0082, "step": 147280 }, { "epoch": 2.12, "learning_rate": 1.9292682106638615e-05, "loss": 0.0096, "step": 147290 }, { "epoch": 2.12, "learning_rate": 1.929263406690014e-05, "loss": 0.0069, "step": 147300 }, { "epoch": 2.12, "learning_rate": 1.929258602716167e-05, "loss": 0.0071, "step": 147310 }, { "epoch": 2.12, "learning_rate": 1.92925379874232e-05, "loss": 0.0065, "step": 147320 }, { "epoch": 2.12, "learning_rate": 1.9292489947684726e-05, "loss": 0.008, "step": 147330 }, { "epoch": 2.12, "learning_rate": 1.9292441907946255e-05, "loss": 0.014, "step": 147340 }, { "epoch": 2.12, "learning_rate": 1.9292393868207784e-05, "loss": 0.0086, "step": 147350 }, { "epoch": 2.12, "learning_rate": 1.9292345828469314e-05, "loss": 0.0103, "step": 147360 }, { "epoch": 2.12, "learning_rate": 1.929229778873084e-05, "loss": 0.0052, "step": 147370 }, { "epoch": 2.12, "learning_rate": 1.929224974899237e-05, "loss": 0.0084, "step": 147380 }, { "epoch": 2.12, "learning_rate": 1.9292201709253898e-05, "loss": 0.0083, "step": 147390 }, { "epoch": 2.12, "learning_rate": 1.9292153669515424e-05, "loss": 0.0081, "step": 147400 }, { "epoch": 2.12, "learning_rate": 1.9292105629776953e-05, "loss": 0.0106, "step": 147410 }, { "epoch": 2.12, "learning_rate": 1.9292057590038482e-05, "loss": 0.0099, "step": 147420 }, { "epoch": 2.12, "learning_rate": 1.929200955030001e-05, "loss": 0.0082, "step": 147430 }, { "epoch": 2.12, "learning_rate": 1.9291961510561538e-05, "loss": 0.0082, "step": 147440 }, { "epoch": 2.13, "learning_rate": 1.9291913470823067e-05, "loss": 0.0067, "step": 147450 }, { "epoch": 2.13, "learning_rate": 1.9291865431084596e-05, "loss": 0.0064, "step": 147460 }, { "epoch": 2.13, "learning_rate": 1.9291817391346125e-05, "loss": 0.0104, "step": 147470 }, { "epoch": 2.13, "learning_rate": 1.929176935160765e-05, "loss": 0.0083, "step": 147480 }, { "epoch": 2.13, "learning_rate": 1.929172131186918e-05, "loss": 0.0062, "step": 147490 }, { "epoch": 2.13, "learning_rate": 1.929167327213071e-05, "loss": 0.0104, "step": 147500 }, { "epoch": 2.13, "learning_rate": 1.9291625232392236e-05, "loss": 0.008, "step": 147510 }, { "epoch": 2.13, "learning_rate": 1.9291577192653765e-05, "loss": 0.0137, "step": 147520 }, { "epoch": 2.13, "learning_rate": 1.9291529152915294e-05, "loss": 0.007, "step": 147530 }, { "epoch": 2.13, "learning_rate": 1.9291481113176823e-05, "loss": 0.007, "step": 147540 }, { "epoch": 2.13, "learning_rate": 1.929143307343835e-05, "loss": 0.0091, "step": 147550 }, { "epoch": 2.13, "learning_rate": 1.929138503369988e-05, "loss": 0.0056, "step": 147560 }, { "epoch": 2.13, "learning_rate": 1.9291336993961408e-05, "loss": 0.0086, "step": 147570 }, { "epoch": 2.13, "learning_rate": 1.9291288954222934e-05, "loss": 0.0119, "step": 147580 }, { "epoch": 2.13, "learning_rate": 1.9291240914484463e-05, "loss": 0.0099, "step": 147590 }, { "epoch": 2.13, "learning_rate": 1.9291192874745992e-05, "loss": 0.0092, "step": 147600 }, { "epoch": 2.13, "learning_rate": 1.929114483500752e-05, "loss": 0.0095, "step": 147610 }, { "epoch": 2.13, "learning_rate": 1.9291096795269047e-05, "loss": 0.0082, "step": 147620 }, { "epoch": 2.13, "learning_rate": 1.9291048755530577e-05, "loss": 0.0068, "step": 147630 }, { "epoch": 2.13, "learning_rate": 1.9291000715792106e-05, "loss": 0.0074, "step": 147640 }, { "epoch": 2.13, "learning_rate": 1.9290952676053635e-05, "loss": 0.0066, "step": 147650 }, { "epoch": 2.13, "learning_rate": 1.929090463631516e-05, "loss": 0.0071, "step": 147660 }, { "epoch": 2.13, "learning_rate": 1.929085659657669e-05, "loss": 0.0088, "step": 147670 }, { "epoch": 2.13, "learning_rate": 1.929080855683822e-05, "loss": 0.0086, "step": 147680 }, { "epoch": 2.13, "learning_rate": 1.9290760517099746e-05, "loss": 0.0074, "step": 147690 }, { "epoch": 2.13, "learning_rate": 1.9290712477361275e-05, "loss": 0.0108, "step": 147700 }, { "epoch": 2.13, "learning_rate": 1.9290664437622804e-05, "loss": 0.009, "step": 147710 }, { "epoch": 2.13, "learning_rate": 1.9290616397884333e-05, "loss": 0.008, "step": 147720 }, { "epoch": 2.13, "learning_rate": 1.929056835814586e-05, "loss": 0.0094, "step": 147730 }, { "epoch": 2.13, "learning_rate": 1.929052031840739e-05, "loss": 0.0089, "step": 147740 }, { "epoch": 2.13, "learning_rate": 1.9290472278668918e-05, "loss": 0.0108, "step": 147750 }, { "epoch": 2.13, "learning_rate": 1.9290424238930444e-05, "loss": 0.0057, "step": 147760 }, { "epoch": 2.13, "learning_rate": 1.9290376199191973e-05, "loss": 0.0064, "step": 147770 }, { "epoch": 2.13, "learning_rate": 1.9290328159453502e-05, "loss": 0.0075, "step": 147780 }, { "epoch": 2.13, "learning_rate": 1.929028011971503e-05, "loss": 0.0079, "step": 147790 }, { "epoch": 2.13, "learning_rate": 1.9290232079976557e-05, "loss": 0.007, "step": 147800 }, { "epoch": 2.13, "learning_rate": 1.9290184040238087e-05, "loss": 0.0054, "step": 147810 }, { "epoch": 2.13, "learning_rate": 1.9290136000499616e-05, "loss": 0.0064, "step": 147820 }, { "epoch": 2.13, "learning_rate": 1.9290087960761145e-05, "loss": 0.0092, "step": 147830 }, { "epoch": 2.13, "learning_rate": 1.929003992102267e-05, "loss": 0.0059, "step": 147840 }, { "epoch": 2.13, "learning_rate": 1.92899918812842e-05, "loss": 0.0104, "step": 147850 }, { "epoch": 2.13, "learning_rate": 1.928994384154573e-05, "loss": 0.0105, "step": 147860 }, { "epoch": 2.13, "learning_rate": 1.9289895801807256e-05, "loss": 0.0105, "step": 147870 }, { "epoch": 2.13, "learning_rate": 1.9289847762068785e-05, "loss": 0.0069, "step": 147880 }, { "epoch": 2.13, "learning_rate": 1.9289799722330314e-05, "loss": 0.0077, "step": 147890 }, { "epoch": 2.13, "learning_rate": 1.9289751682591843e-05, "loss": 0.0074, "step": 147900 }, { "epoch": 2.13, "learning_rate": 1.928970364285337e-05, "loss": 0.0071, "step": 147910 }, { "epoch": 2.13, "learning_rate": 1.92896556031149e-05, "loss": 0.0062, "step": 147920 }, { "epoch": 2.13, "learning_rate": 1.9289607563376428e-05, "loss": 0.0056, "step": 147930 }, { "epoch": 2.13, "learning_rate": 1.9289559523637954e-05, "loss": 0.0086, "step": 147940 }, { "epoch": 2.13, "learning_rate": 1.9289511483899483e-05, "loss": 0.0075, "step": 147950 }, { "epoch": 2.13, "learning_rate": 1.9289463444161012e-05, "loss": 0.0102, "step": 147960 }, { "epoch": 2.13, "learning_rate": 1.928941540442254e-05, "loss": 0.0039, "step": 147970 }, { "epoch": 2.13, "learning_rate": 1.9289367364684067e-05, "loss": 0.011, "step": 147980 }, { "epoch": 2.13, "learning_rate": 1.9289319324945597e-05, "loss": 0.0067, "step": 147990 }, { "epoch": 2.13, "learning_rate": 1.9289271285207126e-05, "loss": 0.0077, "step": 148000 }, { "epoch": 2.13, "learning_rate": 1.9289223245468655e-05, "loss": 0.0078, "step": 148010 }, { "epoch": 2.13, "learning_rate": 1.928917520573018e-05, "loss": 0.0065, "step": 148020 }, { "epoch": 2.13, "learning_rate": 1.928912716599171e-05, "loss": 0.0073, "step": 148030 }, { "epoch": 2.13, "learning_rate": 1.928907912625324e-05, "loss": 0.0103, "step": 148040 }, { "epoch": 2.13, "learning_rate": 1.9289031086514765e-05, "loss": 0.0079, "step": 148050 }, { "epoch": 2.13, "learning_rate": 1.9288983046776295e-05, "loss": 0.0075, "step": 148060 }, { "epoch": 2.13, "learning_rate": 1.9288935007037824e-05, "loss": 0.0049, "step": 148070 }, { "epoch": 2.13, "learning_rate": 1.9288886967299353e-05, "loss": 0.0064, "step": 148080 }, { "epoch": 2.13, "learning_rate": 1.928883892756088e-05, "loss": 0.0042, "step": 148090 }, { "epoch": 2.13, "learning_rate": 1.928879088782241e-05, "loss": 0.0093, "step": 148100 }, { "epoch": 2.13, "learning_rate": 1.9288742848083938e-05, "loss": 0.0082, "step": 148110 }, { "epoch": 2.13, "learning_rate": 1.9288694808345464e-05, "loss": 0.0105, "step": 148120 }, { "epoch": 2.13, "learning_rate": 1.9288646768606993e-05, "loss": 0.0065, "step": 148130 }, { "epoch": 2.13, "learning_rate": 1.9288598728868522e-05, "loss": 0.0106, "step": 148140 }, { "epoch": 2.14, "learning_rate": 1.928855068913005e-05, "loss": 0.0089, "step": 148150 }, { "epoch": 2.14, "learning_rate": 1.9288502649391577e-05, "loss": 0.01, "step": 148160 }, { "epoch": 2.14, "learning_rate": 1.9288454609653106e-05, "loss": 0.0075, "step": 148170 }, { "epoch": 2.14, "learning_rate": 1.9288406569914636e-05, "loss": 0.0052, "step": 148180 }, { "epoch": 2.14, "learning_rate": 1.928835853017616e-05, "loss": 0.0106, "step": 148190 }, { "epoch": 2.14, "learning_rate": 1.928831049043769e-05, "loss": 0.0085, "step": 148200 }, { "epoch": 2.14, "learning_rate": 1.928826245069922e-05, "loss": 0.008, "step": 148210 }, { "epoch": 2.14, "learning_rate": 1.928821441096075e-05, "loss": 0.0065, "step": 148220 }, { "epoch": 2.14, "learning_rate": 1.9288166371222275e-05, "loss": 0.0073, "step": 148230 }, { "epoch": 2.14, "learning_rate": 1.9288118331483805e-05, "loss": 0.0073, "step": 148240 }, { "epoch": 2.14, "learning_rate": 1.9288070291745334e-05, "loss": 0.008, "step": 148250 }, { "epoch": 2.14, "learning_rate": 1.9288022252006863e-05, "loss": 0.006, "step": 148260 }, { "epoch": 2.14, "learning_rate": 1.928797421226839e-05, "loss": 0.0088, "step": 148270 }, { "epoch": 2.14, "learning_rate": 1.9287926172529918e-05, "loss": 0.007, "step": 148280 }, { "epoch": 2.14, "learning_rate": 1.9287878132791448e-05, "loss": 0.0076, "step": 148290 }, { "epoch": 2.14, "learning_rate": 1.9287830093052973e-05, "loss": 0.0087, "step": 148300 }, { "epoch": 2.14, "learning_rate": 1.9287782053314503e-05, "loss": 0.0077, "step": 148310 }, { "epoch": 2.14, "learning_rate": 1.9287734013576032e-05, "loss": 0.0097, "step": 148320 }, { "epoch": 2.14, "learning_rate": 1.928768597383756e-05, "loss": 0.0096, "step": 148330 }, { "epoch": 2.14, "learning_rate": 1.9287637934099087e-05, "loss": 0.0067, "step": 148340 }, { "epoch": 2.14, "learning_rate": 1.9287589894360616e-05, "loss": 0.0086, "step": 148350 }, { "epoch": 2.14, "learning_rate": 1.9287541854622146e-05, "loss": 0.0094, "step": 148360 }, { "epoch": 2.14, "learning_rate": 1.928749381488367e-05, "loss": 0.009, "step": 148370 }, { "epoch": 2.14, "learning_rate": 1.92874457751452e-05, "loss": 0.0117, "step": 148380 }, { "epoch": 2.14, "learning_rate": 1.928739773540673e-05, "loss": 0.0106, "step": 148390 }, { "epoch": 2.14, "learning_rate": 1.928734969566826e-05, "loss": 0.0069, "step": 148400 }, { "epoch": 2.14, "learning_rate": 1.9287301655929785e-05, "loss": 0.0052, "step": 148410 }, { "epoch": 2.14, "learning_rate": 1.9287253616191315e-05, "loss": 0.0089, "step": 148420 }, { "epoch": 2.14, "learning_rate": 1.9287205576452844e-05, "loss": 0.0084, "step": 148430 }, { "epoch": 2.14, "learning_rate": 1.9287157536714373e-05, "loss": 0.0043, "step": 148440 }, { "epoch": 2.14, "learning_rate": 1.92871094969759e-05, "loss": 0.0089, "step": 148450 }, { "epoch": 2.14, "learning_rate": 1.9287061457237428e-05, "loss": 0.0115, "step": 148460 }, { "epoch": 2.14, "learning_rate": 1.9287013417498957e-05, "loss": 0.0108, "step": 148470 }, { "epoch": 2.14, "learning_rate": 1.9286965377760483e-05, "loss": 0.0065, "step": 148480 }, { "epoch": 2.14, "learning_rate": 1.9286917338022013e-05, "loss": 0.0092, "step": 148490 }, { "epoch": 2.14, "learning_rate": 1.9286869298283542e-05, "loss": 0.008, "step": 148500 }, { "epoch": 2.14, "learning_rate": 1.928682125854507e-05, "loss": 0.0063, "step": 148510 }, { "epoch": 2.14, "learning_rate": 1.9286773218806597e-05, "loss": 0.0072, "step": 148520 }, { "epoch": 2.14, "learning_rate": 1.9286725179068126e-05, "loss": 0.0105, "step": 148530 }, { "epoch": 2.14, "learning_rate": 1.9286677139329656e-05, "loss": 0.0074, "step": 148540 }, { "epoch": 2.14, "learning_rate": 1.928662909959118e-05, "loss": 0.0073, "step": 148550 }, { "epoch": 2.14, "learning_rate": 1.928658105985271e-05, "loss": 0.0054, "step": 148560 }, { "epoch": 2.14, "learning_rate": 1.928653302011424e-05, "loss": 0.0107, "step": 148570 }, { "epoch": 2.14, "learning_rate": 1.928648498037577e-05, "loss": 0.0073, "step": 148580 }, { "epoch": 2.14, "learning_rate": 1.9286436940637295e-05, "loss": 0.0103, "step": 148590 }, { "epoch": 2.14, "learning_rate": 1.9286388900898824e-05, "loss": 0.0081, "step": 148600 }, { "epoch": 2.14, "learning_rate": 1.9286340861160354e-05, "loss": 0.0087, "step": 148610 }, { "epoch": 2.14, "learning_rate": 1.9286292821421883e-05, "loss": 0.0057, "step": 148620 }, { "epoch": 2.14, "learning_rate": 1.928624478168341e-05, "loss": 0.0081, "step": 148630 }, { "epoch": 2.14, "learning_rate": 1.9286196741944938e-05, "loss": 0.012, "step": 148640 }, { "epoch": 2.14, "learning_rate": 1.9286148702206467e-05, "loss": 0.007, "step": 148650 }, { "epoch": 2.14, "learning_rate": 1.9286100662467993e-05, "loss": 0.0062, "step": 148660 }, { "epoch": 2.14, "learning_rate": 1.9286052622729523e-05, "loss": 0.0114, "step": 148670 }, { "epoch": 2.14, "learning_rate": 1.9286004582991052e-05, "loss": 0.0081, "step": 148680 }, { "epoch": 2.14, "learning_rate": 1.928595654325258e-05, "loss": 0.0066, "step": 148690 }, { "epoch": 2.14, "learning_rate": 1.9285908503514107e-05, "loss": 0.0078, "step": 148700 }, { "epoch": 2.14, "learning_rate": 1.9285860463775636e-05, "loss": 0.0088, "step": 148710 }, { "epoch": 2.14, "learning_rate": 1.9285812424037166e-05, "loss": 0.0059, "step": 148720 }, { "epoch": 2.14, "learning_rate": 1.928576918827254e-05, "loss": 0.0094, "step": 148730 }, { "epoch": 2.14, "learning_rate": 1.928572114853407e-05, "loss": 0.0081, "step": 148740 }, { "epoch": 2.14, "learning_rate": 1.92856731087956e-05, "loss": 0.0092, "step": 148750 }, { "epoch": 2.14, "learning_rate": 1.9285625069057125e-05, "loss": 0.0112, "step": 148760 }, { "epoch": 2.14, "learning_rate": 1.9285577029318654e-05, "loss": 0.0072, "step": 148770 }, { "epoch": 2.14, "learning_rate": 1.9285528989580183e-05, "loss": 0.0061, "step": 148780 }, { "epoch": 2.14, "learning_rate": 1.928548094984171e-05, "loss": 0.0069, "step": 148790 }, { "epoch": 2.14, "learning_rate": 1.9285432910103238e-05, "loss": 0.0085, "step": 148800 }, { "epoch": 2.14, "learning_rate": 1.9285384870364768e-05, "loss": 0.0051, "step": 148810 }, { "epoch": 2.14, "learning_rate": 1.9285336830626297e-05, "loss": 0.0101, "step": 148820 }, { "epoch": 2.14, "learning_rate": 1.9285288790887823e-05, "loss": 0.0057, "step": 148830 }, { "epoch": 2.15, "learning_rate": 1.9285240751149352e-05, "loss": 0.0102, "step": 148840 }, { "epoch": 2.15, "learning_rate": 1.928519271141088e-05, "loss": 0.0087, "step": 148850 }, { "epoch": 2.15, "learning_rate": 1.928514467167241e-05, "loss": 0.0083, "step": 148860 }, { "epoch": 2.15, "learning_rate": 1.9285096631933936e-05, "loss": 0.0069, "step": 148870 }, { "epoch": 2.15, "learning_rate": 1.9285048592195466e-05, "loss": 0.0074, "step": 148880 }, { "epoch": 2.15, "learning_rate": 1.9285000552456995e-05, "loss": 0.0077, "step": 148890 }, { "epoch": 2.15, "learning_rate": 1.928495251271852e-05, "loss": 0.0098, "step": 148900 }, { "epoch": 2.15, "learning_rate": 1.928490447298005e-05, "loss": 0.0086, "step": 148910 }, { "epoch": 2.15, "learning_rate": 1.928485643324158e-05, "loss": 0.0107, "step": 148920 }, { "epoch": 2.15, "learning_rate": 1.928480839350311e-05, "loss": 0.008, "step": 148930 }, { "epoch": 2.15, "learning_rate": 1.9284760353764634e-05, "loss": 0.0084, "step": 148940 }, { "epoch": 2.15, "learning_rate": 1.9284712314026164e-05, "loss": 0.0049, "step": 148950 }, { "epoch": 2.15, "learning_rate": 1.9284664274287693e-05, "loss": 0.0096, "step": 148960 }, { "epoch": 2.15, "learning_rate": 1.928461623454922e-05, "loss": 0.0087, "step": 148970 }, { "epoch": 2.15, "learning_rate": 1.9284568194810748e-05, "loss": 0.0087, "step": 148980 }, { "epoch": 2.15, "learning_rate": 1.9284520155072277e-05, "loss": 0.0068, "step": 148990 }, { "epoch": 2.15, "learning_rate": 1.9284472115333807e-05, "loss": 0.0104, "step": 149000 }, { "epoch": 2.15, "learning_rate": 1.9284424075595333e-05, "loss": 0.0071, "step": 149010 }, { "epoch": 2.15, "learning_rate": 1.9284376035856862e-05, "loss": 0.0095, "step": 149020 }, { "epoch": 2.15, "learning_rate": 1.928432799611839e-05, "loss": 0.0068, "step": 149030 }, { "epoch": 2.15, "learning_rate": 1.928427995637992e-05, "loss": 0.0085, "step": 149040 }, { "epoch": 2.15, "learning_rate": 1.9284231916641446e-05, "loss": 0.0076, "step": 149050 }, { "epoch": 2.15, "learning_rate": 1.9284183876902976e-05, "loss": 0.0097, "step": 149060 }, { "epoch": 2.15, "learning_rate": 1.9284135837164505e-05, "loss": 0.01, "step": 149070 }, { "epoch": 2.15, "learning_rate": 1.928408779742603e-05, "loss": 0.0075, "step": 149080 }, { "epoch": 2.15, "learning_rate": 1.928403975768756e-05, "loss": 0.0073, "step": 149090 }, { "epoch": 2.15, "learning_rate": 1.928399171794909e-05, "loss": 0.0081, "step": 149100 }, { "epoch": 2.15, "learning_rate": 1.928394367821062e-05, "loss": 0.0059, "step": 149110 }, { "epoch": 2.15, "learning_rate": 1.9283895638472144e-05, "loss": 0.006, "step": 149120 }, { "epoch": 2.15, "learning_rate": 1.9283847598733674e-05, "loss": 0.006, "step": 149130 }, { "epoch": 2.15, "learning_rate": 1.9283799558995203e-05, "loss": 0.008, "step": 149140 }, { "epoch": 2.15, "learning_rate": 1.928375151925673e-05, "loss": 0.0056, "step": 149150 }, { "epoch": 2.15, "learning_rate": 1.9283703479518258e-05, "loss": 0.0046, "step": 149160 }, { "epoch": 2.15, "learning_rate": 1.9283655439779787e-05, "loss": 0.0076, "step": 149170 }, { "epoch": 2.15, "learning_rate": 1.9283607400041317e-05, "loss": 0.0085, "step": 149180 }, { "epoch": 2.15, "learning_rate": 1.9283559360302843e-05, "loss": 0.0095, "step": 149190 }, { "epoch": 2.15, "learning_rate": 1.9283511320564372e-05, "loss": 0.0069, "step": 149200 }, { "epoch": 2.15, "learning_rate": 1.92834632808259e-05, "loss": 0.0084, "step": 149210 }, { "epoch": 2.15, "learning_rate": 1.928341524108743e-05, "loss": 0.0067, "step": 149220 }, { "epoch": 2.15, "learning_rate": 1.9283367201348956e-05, "loss": 0.0069, "step": 149230 }, { "epoch": 2.15, "learning_rate": 1.9283319161610485e-05, "loss": 0.0093, "step": 149240 }, { "epoch": 2.15, "learning_rate": 1.9283271121872015e-05, "loss": 0.0104, "step": 149250 }, { "epoch": 2.15, "learning_rate": 1.928322308213354e-05, "loss": 0.0069, "step": 149260 }, { "epoch": 2.15, "learning_rate": 1.928317504239507e-05, "loss": 0.0091, "step": 149270 }, { "epoch": 2.15, "learning_rate": 1.92831270026566e-05, "loss": 0.0081, "step": 149280 }, { "epoch": 2.15, "learning_rate": 1.928307896291813e-05, "loss": 0.0082, "step": 149290 }, { "epoch": 2.15, "learning_rate": 1.9283030923179654e-05, "loss": 0.0072, "step": 149300 }, { "epoch": 2.15, "learning_rate": 1.9282982883441184e-05, "loss": 0.0059, "step": 149310 }, { "epoch": 2.15, "learning_rate": 1.9282934843702713e-05, "loss": 0.01, "step": 149320 }, { "epoch": 2.15, "learning_rate": 1.928288680396424e-05, "loss": 0.0067, "step": 149330 }, { "epoch": 2.15, "learning_rate": 1.9282838764225768e-05, "loss": 0.0068, "step": 149340 }, { "epoch": 2.15, "learning_rate": 1.9282790724487297e-05, "loss": 0.0102, "step": 149350 }, { "epoch": 2.15, "learning_rate": 1.9282742684748827e-05, "loss": 0.0103, "step": 149360 }, { "epoch": 2.15, "learning_rate": 1.9282694645010352e-05, "loss": 0.0053, "step": 149370 }, { "epoch": 2.15, "learning_rate": 1.9282646605271882e-05, "loss": 0.0084, "step": 149380 }, { "epoch": 2.15, "learning_rate": 1.928259856553341e-05, "loss": 0.0079, "step": 149390 }, { "epoch": 2.15, "learning_rate": 1.928255052579494e-05, "loss": 0.0089, "step": 149400 }, { "epoch": 2.15, "learning_rate": 1.9282502486056466e-05, "loss": 0.0075, "step": 149410 }, { "epoch": 2.15, "learning_rate": 1.9282454446317995e-05, "loss": 0.0079, "step": 149420 }, { "epoch": 2.15, "learning_rate": 1.9282406406579525e-05, "loss": 0.0081, "step": 149430 }, { "epoch": 2.15, "learning_rate": 1.928235836684105e-05, "loss": 0.009, "step": 149440 }, { "epoch": 2.15, "learning_rate": 1.928231032710258e-05, "loss": 0.0076, "step": 149450 }, { "epoch": 2.15, "learning_rate": 1.928226228736411e-05, "loss": 0.0064, "step": 149460 }, { "epoch": 2.15, "learning_rate": 1.928221424762564e-05, "loss": 0.011, "step": 149470 }, { "epoch": 2.15, "learning_rate": 1.9282166207887164e-05, "loss": 0.0088, "step": 149480 }, { "epoch": 2.15, "learning_rate": 1.9282118168148694e-05, "loss": 0.0067, "step": 149490 }, { "epoch": 2.15, "learning_rate": 1.9282070128410223e-05, "loss": 0.0094, "step": 149500 }, { "epoch": 2.15, "learning_rate": 1.928202208867175e-05, "loss": 0.0096, "step": 149510 }, { "epoch": 2.15, "learning_rate": 1.9281974048933278e-05, "loss": 0.0073, "step": 149520 }, { "epoch": 2.16, "learning_rate": 1.9281926009194807e-05, "loss": 0.0106, "step": 149530 }, { "epoch": 2.16, "learning_rate": 1.9281877969456336e-05, "loss": 0.0072, "step": 149540 }, { "epoch": 2.16, "learning_rate": 1.9281829929717862e-05, "loss": 0.0071, "step": 149550 }, { "epoch": 2.16, "learning_rate": 1.928178188997939e-05, "loss": 0.0082, "step": 149560 }, { "epoch": 2.16, "learning_rate": 1.928173385024092e-05, "loss": 0.0079, "step": 149570 }, { "epoch": 2.16, "learning_rate": 1.928168581050245e-05, "loss": 0.0055, "step": 149580 }, { "epoch": 2.16, "learning_rate": 1.9281637770763976e-05, "loss": 0.0067, "step": 149590 }, { "epoch": 2.16, "learning_rate": 1.9281589731025505e-05, "loss": 0.0103, "step": 149600 }, { "epoch": 2.16, "learning_rate": 1.9281541691287035e-05, "loss": 0.0091, "step": 149610 }, { "epoch": 2.16, "learning_rate": 1.928149365154856e-05, "loss": 0.007, "step": 149620 }, { "epoch": 2.16, "learning_rate": 1.928144561181009e-05, "loss": 0.008, "step": 149630 }, { "epoch": 2.16, "learning_rate": 1.928139757207162e-05, "loss": 0.0083, "step": 149640 }, { "epoch": 2.16, "learning_rate": 1.9281349532333148e-05, "loss": 0.0116, "step": 149650 }, { "epoch": 2.16, "learning_rate": 1.9281301492594674e-05, "loss": 0.0081, "step": 149660 }, { "epoch": 2.16, "learning_rate": 1.9281253452856203e-05, "loss": 0.0072, "step": 149670 }, { "epoch": 2.16, "learning_rate": 1.9281205413117733e-05, "loss": 0.0072, "step": 149680 }, { "epoch": 2.16, "learning_rate": 1.928115737337926e-05, "loss": 0.0072, "step": 149690 }, { "epoch": 2.16, "learning_rate": 1.9281109333640788e-05, "loss": 0.0069, "step": 149700 }, { "epoch": 2.16, "learning_rate": 1.9281061293902317e-05, "loss": 0.0087, "step": 149710 }, { "epoch": 2.16, "learning_rate": 1.9281013254163846e-05, "loss": 0.0094, "step": 149720 }, { "epoch": 2.16, "learning_rate": 1.9280965214425372e-05, "loss": 0.0064, "step": 149730 }, { "epoch": 2.16, "learning_rate": 1.92809171746869e-05, "loss": 0.0088, "step": 149740 }, { "epoch": 2.16, "learning_rate": 1.928086913494843e-05, "loss": 0.0088, "step": 149750 }, { "epoch": 2.16, "learning_rate": 1.9280821095209957e-05, "loss": 0.0082, "step": 149760 }, { "epoch": 2.16, "learning_rate": 1.9280773055471486e-05, "loss": 0.0076, "step": 149770 }, { "epoch": 2.16, "learning_rate": 1.9280725015733015e-05, "loss": 0.0109, "step": 149780 }, { "epoch": 2.16, "learning_rate": 1.9280676975994544e-05, "loss": 0.0106, "step": 149790 }, { "epoch": 2.16, "learning_rate": 1.928062893625607e-05, "loss": 0.0082, "step": 149800 }, { "epoch": 2.16, "learning_rate": 1.92805808965176e-05, "loss": 0.0083, "step": 149810 }, { "epoch": 2.16, "learning_rate": 1.928053285677913e-05, "loss": 0.0081, "step": 149820 }, { "epoch": 2.16, "learning_rate": 1.9280484817040658e-05, "loss": 0.0091, "step": 149830 }, { "epoch": 2.16, "learning_rate": 1.9280436777302184e-05, "loss": 0.0074, "step": 149840 }, { "epoch": 2.16, "learning_rate": 1.9280388737563713e-05, "loss": 0.0079, "step": 149850 }, { "epoch": 2.16, "learning_rate": 1.9280340697825243e-05, "loss": 0.0074, "step": 149860 }, { "epoch": 2.16, "learning_rate": 1.928029265808677e-05, "loss": 0.0098, "step": 149870 }, { "epoch": 2.16, "learning_rate": 1.9280244618348298e-05, "loss": 0.0086, "step": 149880 }, { "epoch": 2.16, "learning_rate": 1.9280196578609827e-05, "loss": 0.0098, "step": 149890 }, { "epoch": 2.16, "learning_rate": 1.9280148538871356e-05, "loss": 0.007, "step": 149900 }, { "epoch": 2.16, "learning_rate": 1.9280100499132882e-05, "loss": 0.0089, "step": 149910 }, { "epoch": 2.16, "learning_rate": 1.928005245939441e-05, "loss": 0.007, "step": 149920 }, { "epoch": 2.16, "learning_rate": 1.928000441965594e-05, "loss": 0.0057, "step": 149930 }, { "epoch": 2.16, "learning_rate": 1.9279956379917467e-05, "loss": 0.0093, "step": 149940 }, { "epoch": 2.16, "learning_rate": 1.9279908340178996e-05, "loss": 0.0054, "step": 149950 }, { "epoch": 2.16, "learning_rate": 1.9279860300440525e-05, "loss": 0.008, "step": 149960 }, { "epoch": 2.16, "learning_rate": 1.9279812260702054e-05, "loss": 0.0057, "step": 149970 }, { "epoch": 2.16, "learning_rate": 1.927976422096358e-05, "loss": 0.0095, "step": 149980 }, { "epoch": 2.16, "learning_rate": 1.927971618122511e-05, "loss": 0.0064, "step": 149990 }, { "epoch": 2.16, "learning_rate": 1.927966814148664e-05, "loss": 0.0088, "step": 150000 }, { "epoch": 2.16, "learning_rate": 1.9279620101748168e-05, "loss": 0.006, "step": 150010 }, { "epoch": 2.16, "learning_rate": 1.9279572062009694e-05, "loss": 0.0079, "step": 150020 }, { "epoch": 2.16, "learning_rate": 1.9279524022271227e-05, "loss": 0.0062, "step": 150030 }, { "epoch": 2.16, "learning_rate": 1.9279475982532753e-05, "loss": 0.0075, "step": 150040 }, { "epoch": 2.16, "learning_rate": 1.9279427942794282e-05, "loss": 0.0072, "step": 150050 }, { "epoch": 2.16, "learning_rate": 1.927937990305581e-05, "loss": 0.009, "step": 150060 }, { "epoch": 2.16, "learning_rate": 1.927933186331734e-05, "loss": 0.0086, "step": 150070 }, { "epoch": 2.16, "learning_rate": 1.9279283823578866e-05, "loss": 0.0057, "step": 150080 }, { "epoch": 2.16, "learning_rate": 1.9279235783840395e-05, "loss": 0.0093, "step": 150090 }, { "epoch": 2.16, "learning_rate": 1.9279187744101925e-05, "loss": 0.0072, "step": 150100 }, { "epoch": 2.16, "learning_rate": 1.927913970436345e-05, "loss": 0.0069, "step": 150110 }, { "epoch": 2.16, "learning_rate": 1.927909166462498e-05, "loss": 0.0095, "step": 150120 }, { "epoch": 2.16, "learning_rate": 1.927904362488651e-05, "loss": 0.0086, "step": 150130 }, { "epoch": 2.16, "learning_rate": 1.927899558514804e-05, "loss": 0.0097, "step": 150140 }, { "epoch": 2.16, "learning_rate": 1.9278947545409564e-05, "loss": 0.0101, "step": 150150 }, { "epoch": 2.16, "learning_rate": 1.9278899505671094e-05, "loss": 0.0117, "step": 150160 }, { "epoch": 2.16, "learning_rate": 1.9278851465932623e-05, "loss": 0.0089, "step": 150170 }, { "epoch": 2.16, "learning_rate": 1.927880342619415e-05, "loss": 0.0071, "step": 150180 }, { "epoch": 2.16, "learning_rate": 1.9278755386455678e-05, "loss": 0.0099, "step": 150190 }, { "epoch": 2.16, "learning_rate": 1.9278707346717207e-05, "loss": 0.0076, "step": 150200 }, { "epoch": 2.16, "learning_rate": 1.9278659306978737e-05, "loss": 0.0105, "step": 150210 }, { "epoch": 2.16, "learning_rate": 1.9278611267240262e-05, "loss": 0.0066, "step": 150220 }, { "epoch": 2.17, "learning_rate": 1.9278563227501792e-05, "loss": 0.007, "step": 150230 }, { "epoch": 2.17, "learning_rate": 1.927851518776332e-05, "loss": 0.0081, "step": 150240 }, { "epoch": 2.17, "learning_rate": 1.927846714802485e-05, "loss": 0.009, "step": 150250 }, { "epoch": 2.17, "learning_rate": 1.9278419108286376e-05, "loss": 0.0075, "step": 150260 }, { "epoch": 2.17, "learning_rate": 1.9278371068547905e-05, "loss": 0.0057, "step": 150270 }, { "epoch": 2.17, "learning_rate": 1.9278323028809435e-05, "loss": 0.0111, "step": 150280 }, { "epoch": 2.17, "learning_rate": 1.927827498907096e-05, "loss": 0.0088, "step": 150290 }, { "epoch": 2.17, "learning_rate": 1.927822694933249e-05, "loss": 0.0078, "step": 150300 }, { "epoch": 2.17, "learning_rate": 1.927817890959402e-05, "loss": 0.008, "step": 150310 }, { "epoch": 2.17, "learning_rate": 1.927813086985555e-05, "loss": 0.0094, "step": 150320 }, { "epoch": 2.17, "learning_rate": 1.9278082830117074e-05, "loss": 0.0074, "step": 150330 }, { "epoch": 2.17, "learning_rate": 1.9278034790378604e-05, "loss": 0.0059, "step": 150340 }, { "epoch": 2.17, "learning_rate": 1.9277986750640133e-05, "loss": 0.0065, "step": 150350 }, { "epoch": 2.17, "learning_rate": 1.927793871090166e-05, "loss": 0.0098, "step": 150360 }, { "epoch": 2.17, "learning_rate": 1.9277890671163188e-05, "loss": 0.0076, "step": 150370 }, { "epoch": 2.17, "learning_rate": 1.9277842631424717e-05, "loss": 0.0072, "step": 150380 }, { "epoch": 2.17, "learning_rate": 1.9277794591686246e-05, "loss": 0.0067, "step": 150390 }, { "epoch": 2.17, "learning_rate": 1.9277746551947772e-05, "loss": 0.0064, "step": 150400 }, { "epoch": 2.17, "learning_rate": 1.92776985122093e-05, "loss": 0.01, "step": 150410 }, { "epoch": 2.17, "learning_rate": 1.927765047247083e-05, "loss": 0.0086, "step": 150420 }, { "epoch": 2.17, "learning_rate": 1.927760243273236e-05, "loss": 0.0091, "step": 150430 }, { "epoch": 2.17, "learning_rate": 1.9277554392993886e-05, "loss": 0.0074, "step": 150440 }, { "epoch": 2.17, "learning_rate": 1.9277506353255415e-05, "loss": 0.0056, "step": 150450 }, { "epoch": 2.17, "learning_rate": 1.9277458313516945e-05, "loss": 0.0088, "step": 150460 }, { "epoch": 2.17, "learning_rate": 1.927741027377847e-05, "loss": 0.0088, "step": 150470 }, { "epoch": 2.17, "learning_rate": 1.927736223404e-05, "loss": 0.0061, "step": 150480 }, { "epoch": 2.17, "learning_rate": 1.927731419430153e-05, "loss": 0.006, "step": 150490 }, { "epoch": 2.17, "learning_rate": 1.9277266154563058e-05, "loss": 0.0072, "step": 150500 }, { "epoch": 2.17, "learning_rate": 1.9277218114824584e-05, "loss": 0.0079, "step": 150510 }, { "epoch": 2.17, "learning_rate": 1.9277170075086113e-05, "loss": 0.006, "step": 150520 }, { "epoch": 2.17, "learning_rate": 1.9277122035347643e-05, "loss": 0.0054, "step": 150530 }, { "epoch": 2.17, "learning_rate": 1.927707399560917e-05, "loss": 0.0108, "step": 150540 }, { "epoch": 2.17, "learning_rate": 1.9277025955870698e-05, "loss": 0.0057, "step": 150550 }, { "epoch": 2.17, "learning_rate": 1.9276977916132227e-05, "loss": 0.0073, "step": 150560 }, { "epoch": 2.17, "learning_rate": 1.9276929876393756e-05, "loss": 0.0082, "step": 150570 }, { "epoch": 2.17, "learning_rate": 1.9276881836655282e-05, "loss": 0.0052, "step": 150580 }, { "epoch": 2.17, "learning_rate": 1.927683379691681e-05, "loss": 0.0074, "step": 150590 }, { "epoch": 2.17, "learning_rate": 1.927678575717834e-05, "loss": 0.0078, "step": 150600 }, { "epoch": 2.17, "learning_rate": 1.927673771743987e-05, "loss": 0.0073, "step": 150610 }, { "epoch": 2.17, "learning_rate": 1.9276689677701396e-05, "loss": 0.0069, "step": 150620 }, { "epoch": 2.17, "learning_rate": 1.9276641637962925e-05, "loss": 0.0096, "step": 150630 }, { "epoch": 2.17, "learning_rate": 1.9276593598224454e-05, "loss": 0.0099, "step": 150640 }, { "epoch": 2.17, "learning_rate": 1.927654555848598e-05, "loss": 0.0102, "step": 150650 }, { "epoch": 2.17, "learning_rate": 1.927649751874751e-05, "loss": 0.01, "step": 150660 }, { "epoch": 2.17, "learning_rate": 1.927644947900904e-05, "loss": 0.0065, "step": 150670 }, { "epoch": 2.17, "learning_rate": 1.9276401439270568e-05, "loss": 0.0086, "step": 150680 }, { "epoch": 2.17, "learning_rate": 1.9276353399532094e-05, "loss": 0.0076, "step": 150690 }, { "epoch": 2.17, "learning_rate": 1.9276305359793623e-05, "loss": 0.0067, "step": 150700 }, { "epoch": 2.17, "learning_rate": 1.9276257320055153e-05, "loss": 0.0078, "step": 150710 }, { "epoch": 2.17, "learning_rate": 1.927620928031668e-05, "loss": 0.0081, "step": 150720 }, { "epoch": 2.17, "learning_rate": 1.9276161240578208e-05, "loss": 0.0056, "step": 150730 }, { "epoch": 2.17, "learning_rate": 1.9276113200839737e-05, "loss": 0.0064, "step": 150740 }, { "epoch": 2.17, "learning_rate": 1.9276065161101266e-05, "loss": 0.0064, "step": 150750 }, { "epoch": 2.17, "learning_rate": 1.9276017121362792e-05, "loss": 0.007, "step": 150760 }, { "epoch": 2.17, "learning_rate": 1.927596908162432e-05, "loss": 0.0072, "step": 150770 }, { "epoch": 2.17, "learning_rate": 1.927592104188585e-05, "loss": 0.0105, "step": 150780 }, { "epoch": 2.17, "learning_rate": 1.927587300214738e-05, "loss": 0.0054, "step": 150790 }, { "epoch": 2.17, "learning_rate": 1.9275824962408906e-05, "loss": 0.0106, "step": 150800 }, { "epoch": 2.17, "learning_rate": 1.9275776922670435e-05, "loss": 0.0059, "step": 150810 }, { "epoch": 2.17, "learning_rate": 1.9275728882931964e-05, "loss": 0.0076, "step": 150820 }, { "epoch": 2.17, "learning_rate": 1.927568084319349e-05, "loss": 0.0063, "step": 150830 }, { "epoch": 2.17, "learning_rate": 1.927563280345502e-05, "loss": 0.0069, "step": 150840 }, { "epoch": 2.17, "learning_rate": 1.927558476371655e-05, "loss": 0.0075, "step": 150850 }, { "epoch": 2.17, "learning_rate": 1.9275536723978078e-05, "loss": 0.0067, "step": 150860 }, { "epoch": 2.17, "learning_rate": 1.9275488684239604e-05, "loss": 0.0078, "step": 150870 }, { "epoch": 2.17, "learning_rate": 1.9275440644501133e-05, "loss": 0.0091, "step": 150880 }, { "epoch": 2.17, "learning_rate": 1.9275392604762663e-05, "loss": 0.0081, "step": 150890 }, { "epoch": 2.17, "learning_rate": 1.927534456502419e-05, "loss": 0.011, "step": 150900 }, { "epoch": 2.17, "learning_rate": 1.9275296525285718e-05, "loss": 0.0065, "step": 150910 }, { "epoch": 2.18, "learning_rate": 1.9275248485547247e-05, "loss": 0.0085, "step": 150920 }, { "epoch": 2.18, "learning_rate": 1.9275200445808776e-05, "loss": 0.0086, "step": 150930 }, { "epoch": 2.18, "learning_rate": 1.9275152406070302e-05, "loss": 0.0055, "step": 150940 }, { "epoch": 2.18, "learning_rate": 1.927510436633183e-05, "loss": 0.0056, "step": 150950 }, { "epoch": 2.18, "learning_rate": 1.927505632659336e-05, "loss": 0.011, "step": 150960 }, { "epoch": 2.18, "learning_rate": 1.927500828685489e-05, "loss": 0.0049, "step": 150970 }, { "epoch": 2.18, "learning_rate": 1.9274960247116416e-05, "loss": 0.0068, "step": 150980 }, { "epoch": 2.18, "learning_rate": 1.9274912207377945e-05, "loss": 0.0091, "step": 150990 }, { "epoch": 2.18, "learning_rate": 1.9274864167639474e-05, "loss": 0.0067, "step": 151000 }, { "epoch": 2.18, "learning_rate": 1.9274816127901e-05, "loss": 0.0064, "step": 151010 }, { "epoch": 2.18, "learning_rate": 1.927476808816253e-05, "loss": 0.0082, "step": 151020 }, { "epoch": 2.18, "learning_rate": 1.927472004842406e-05, "loss": 0.0064, "step": 151030 }, { "epoch": 2.18, "learning_rate": 1.9274672008685588e-05, "loss": 0.0081, "step": 151040 }, { "epoch": 2.18, "learning_rate": 1.9274623968947114e-05, "loss": 0.0075, "step": 151050 }, { "epoch": 2.18, "learning_rate": 1.9274575929208643e-05, "loss": 0.0065, "step": 151060 }, { "epoch": 2.18, "learning_rate": 1.9274527889470172e-05, "loss": 0.0108, "step": 151070 }, { "epoch": 2.18, "learning_rate": 1.92744798497317e-05, "loss": 0.0074, "step": 151080 }, { "epoch": 2.18, "learning_rate": 1.9274431809993228e-05, "loss": 0.008, "step": 151090 }, { "epoch": 2.18, "learning_rate": 1.9274383770254757e-05, "loss": 0.0097, "step": 151100 }, { "epoch": 2.18, "learning_rate": 1.9274335730516286e-05, "loss": 0.0115, "step": 151110 }, { "epoch": 2.18, "learning_rate": 1.9274287690777812e-05, "loss": 0.0059, "step": 151120 }, { "epoch": 2.18, "learning_rate": 1.927423965103934e-05, "loss": 0.0081, "step": 151130 }, { "epoch": 2.18, "learning_rate": 1.927419161130087e-05, "loss": 0.0072, "step": 151140 }, { "epoch": 2.18, "learning_rate": 1.9274143571562396e-05, "loss": 0.0079, "step": 151150 }, { "epoch": 2.18, "learning_rate": 1.9274095531823926e-05, "loss": 0.011, "step": 151160 }, { "epoch": 2.18, "learning_rate": 1.9274047492085455e-05, "loss": 0.0057, "step": 151170 }, { "epoch": 2.18, "learning_rate": 1.9273999452346984e-05, "loss": 0.0094, "step": 151180 }, { "epoch": 2.18, "learning_rate": 1.927395141260851e-05, "loss": 0.0065, "step": 151190 }, { "epoch": 2.18, "learning_rate": 1.927390337287004e-05, "loss": 0.0092, "step": 151200 }, { "epoch": 2.18, "learning_rate": 1.927385533313157e-05, "loss": 0.0105, "step": 151210 }, { "epoch": 2.18, "learning_rate": 1.9273807293393098e-05, "loss": 0.009, "step": 151220 }, { "epoch": 2.18, "learning_rate": 1.9273759253654624e-05, "loss": 0.0083, "step": 151230 }, { "epoch": 2.18, "learning_rate": 1.9273711213916153e-05, "loss": 0.0097, "step": 151240 }, { "epoch": 2.18, "learning_rate": 1.9273663174177682e-05, "loss": 0.0073, "step": 151250 }, { "epoch": 2.18, "learning_rate": 1.9273615134439208e-05, "loss": 0.0064, "step": 151260 }, { "epoch": 2.18, "learning_rate": 1.9273567094700738e-05, "loss": 0.0074, "step": 151270 }, { "epoch": 2.18, "learning_rate": 1.9273519054962267e-05, "loss": 0.0099, "step": 151280 }, { "epoch": 2.18, "learning_rate": 1.9273471015223796e-05, "loss": 0.0067, "step": 151290 }, { "epoch": 2.18, "learning_rate": 1.9273422975485322e-05, "loss": 0.0063, "step": 151300 }, { "epoch": 2.18, "learning_rate": 1.927337493574685e-05, "loss": 0.0071, "step": 151310 }, { "epoch": 2.18, "learning_rate": 1.927332689600838e-05, "loss": 0.0075, "step": 151320 }, { "epoch": 2.18, "learning_rate": 1.9273278856269906e-05, "loss": 0.0079, "step": 151330 }, { "epoch": 2.18, "learning_rate": 1.9273230816531436e-05, "loss": 0.0102, "step": 151340 }, { "epoch": 2.18, "learning_rate": 1.9273182776792965e-05, "loss": 0.0074, "step": 151350 }, { "epoch": 2.18, "learning_rate": 1.9273134737054494e-05, "loss": 0.0091, "step": 151360 }, { "epoch": 2.18, "learning_rate": 1.927308669731602e-05, "loss": 0.0094, "step": 151370 }, { "epoch": 2.18, "learning_rate": 1.927303865757755e-05, "loss": 0.0091, "step": 151380 }, { "epoch": 2.18, "learning_rate": 1.927299061783908e-05, "loss": 0.006, "step": 151390 }, { "epoch": 2.18, "learning_rate": 1.9272942578100608e-05, "loss": 0.0133, "step": 151400 }, { "epoch": 2.18, "learning_rate": 1.9272894538362134e-05, "loss": 0.007, "step": 151410 }, { "epoch": 2.18, "learning_rate": 1.9272846498623663e-05, "loss": 0.0063, "step": 151420 }, { "epoch": 2.18, "learning_rate": 1.9272798458885192e-05, "loss": 0.0089, "step": 151430 }, { "epoch": 2.18, "learning_rate": 1.9272750419146718e-05, "loss": 0.0078, "step": 151440 }, { "epoch": 2.18, "learning_rate": 1.9272702379408247e-05, "loss": 0.0046, "step": 151450 }, { "epoch": 2.18, "learning_rate": 1.9272654339669777e-05, "loss": 0.0064, "step": 151460 }, { "epoch": 2.18, "learning_rate": 1.9272606299931306e-05, "loss": 0.0106, "step": 151470 }, { "epoch": 2.18, "learning_rate": 1.9272558260192832e-05, "loss": 0.0108, "step": 151480 }, { "epoch": 2.18, "learning_rate": 1.927251022045436e-05, "loss": 0.01, "step": 151490 }, { "epoch": 2.18, "learning_rate": 1.927246218071589e-05, "loss": 0.0091, "step": 151500 }, { "epoch": 2.18, "learning_rate": 1.9272414140977416e-05, "loss": 0.0079, "step": 151510 }, { "epoch": 2.18, "learning_rate": 1.9272366101238946e-05, "loss": 0.0086, "step": 151520 }, { "epoch": 2.18, "learning_rate": 1.9272318061500475e-05, "loss": 0.0055, "step": 151530 }, { "epoch": 2.18, "learning_rate": 1.9272270021762004e-05, "loss": 0.0089, "step": 151540 }, { "epoch": 2.18, "learning_rate": 1.927222198202353e-05, "loss": 0.007, "step": 151550 }, { "epoch": 2.18, "learning_rate": 1.927217394228506e-05, "loss": 0.0097, "step": 151560 }, { "epoch": 2.18, "learning_rate": 1.927212590254659e-05, "loss": 0.0053, "step": 151570 }, { "epoch": 2.18, "learning_rate": 1.9272077862808118e-05, "loss": 0.0067, "step": 151580 }, { "epoch": 2.18, "learning_rate": 1.9272029823069644e-05, "loss": 0.0067, "step": 151590 }, { "epoch": 2.18, "learning_rate": 1.9271981783331173e-05, "loss": 0.0082, "step": 151600 }, { "epoch": 2.18, "learning_rate": 1.9271933743592702e-05, "loss": 0.0088, "step": 151610 }, { "epoch": 2.19, "learning_rate": 1.9271885703854228e-05, "loss": 0.009, "step": 151620 }, { "epoch": 2.19, "learning_rate": 1.9271837664115757e-05, "loss": 0.0085, "step": 151630 }, { "epoch": 2.19, "learning_rate": 1.9271789624377287e-05, "loss": 0.0097, "step": 151640 }, { "epoch": 2.19, "learning_rate": 1.9271741584638816e-05, "loss": 0.0078, "step": 151650 }, { "epoch": 2.19, "learning_rate": 1.9271693544900342e-05, "loss": 0.0083, "step": 151660 }, { "epoch": 2.19, "learning_rate": 1.927164550516187e-05, "loss": 0.0074, "step": 151670 }, { "epoch": 2.19, "learning_rate": 1.92715974654234e-05, "loss": 0.0069, "step": 151680 }, { "epoch": 2.19, "learning_rate": 1.9271549425684926e-05, "loss": 0.0158, "step": 151690 }, { "epoch": 2.19, "learning_rate": 1.9271501385946455e-05, "loss": 0.0074, "step": 151700 }, { "epoch": 2.19, "learning_rate": 1.9271453346207985e-05, "loss": 0.0109, "step": 151710 }, { "epoch": 2.19, "learning_rate": 1.9271405306469514e-05, "loss": 0.0097, "step": 151720 }, { "epoch": 2.19, "learning_rate": 1.927135726673104e-05, "loss": 0.0088, "step": 151730 }, { "epoch": 2.19, "learning_rate": 1.927130922699257e-05, "loss": 0.007, "step": 151740 }, { "epoch": 2.19, "learning_rate": 1.92712611872541e-05, "loss": 0.0089, "step": 151750 }, { "epoch": 2.19, "learning_rate": 1.9271213147515628e-05, "loss": 0.0058, "step": 151760 }, { "epoch": 2.19, "learning_rate": 1.9271165107777154e-05, "loss": 0.0074, "step": 151770 }, { "epoch": 2.19, "learning_rate": 1.9271117068038683e-05, "loss": 0.0111, "step": 151780 }, { "epoch": 2.19, "learning_rate": 1.9271069028300212e-05, "loss": 0.0074, "step": 151790 }, { "epoch": 2.19, "learning_rate": 1.9271020988561738e-05, "loss": 0.0062, "step": 151800 }, { "epoch": 2.19, "learning_rate": 1.9270972948823267e-05, "loss": 0.0073, "step": 151810 }, { "epoch": 2.19, "learning_rate": 1.9270924909084797e-05, "loss": 0.01, "step": 151820 }, { "epoch": 2.19, "learning_rate": 1.9270876869346326e-05, "loss": 0.0053, "step": 151830 }, { "epoch": 2.19, "learning_rate": 1.927082882960785e-05, "loss": 0.0107, "step": 151840 }, { "epoch": 2.19, "learning_rate": 1.927078078986938e-05, "loss": 0.0094, "step": 151850 }, { "epoch": 2.19, "learning_rate": 1.927073275013091e-05, "loss": 0.0054, "step": 151860 }, { "epoch": 2.19, "learning_rate": 1.9270684710392436e-05, "loss": 0.0085, "step": 151870 }, { "epoch": 2.19, "learning_rate": 1.9270636670653965e-05, "loss": 0.0085, "step": 151880 }, { "epoch": 2.19, "learning_rate": 1.9270588630915495e-05, "loss": 0.0089, "step": 151890 }, { "epoch": 2.19, "learning_rate": 1.9270540591177024e-05, "loss": 0.0087, "step": 151900 }, { "epoch": 2.19, "learning_rate": 1.927049255143855e-05, "loss": 0.0059, "step": 151910 }, { "epoch": 2.19, "learning_rate": 1.927044451170008e-05, "loss": 0.0103, "step": 151920 }, { "epoch": 2.19, "learning_rate": 1.927039647196161e-05, "loss": 0.0074, "step": 151930 }, { "epoch": 2.19, "learning_rate": 1.9270348432223138e-05, "loss": 0.0108, "step": 151940 }, { "epoch": 2.19, "learning_rate": 1.9270300392484663e-05, "loss": 0.0048, "step": 151950 }, { "epoch": 2.19, "learning_rate": 1.9270252352746193e-05, "loss": 0.0095, "step": 151960 }, { "epoch": 2.19, "learning_rate": 1.9270204313007722e-05, "loss": 0.0078, "step": 151970 }, { "epoch": 2.19, "learning_rate": 1.9270156273269248e-05, "loss": 0.009, "step": 151980 }, { "epoch": 2.19, "learning_rate": 1.9270108233530777e-05, "loss": 0.008, "step": 151990 }, { "epoch": 2.19, "learning_rate": 1.9270060193792306e-05, "loss": 0.0066, "step": 152000 }, { "epoch": 2.19, "learning_rate": 1.9270012154053836e-05, "loss": 0.0082, "step": 152010 }, { "epoch": 2.19, "learning_rate": 1.926996411431536e-05, "loss": 0.0075, "step": 152020 }, { "epoch": 2.19, "learning_rate": 1.926991607457689e-05, "loss": 0.0064, "step": 152030 }, { "epoch": 2.19, "learning_rate": 1.926986803483842e-05, "loss": 0.0077, "step": 152040 }, { "epoch": 2.19, "learning_rate": 1.9269819995099946e-05, "loss": 0.0069, "step": 152050 }, { "epoch": 2.19, "learning_rate": 1.9269771955361475e-05, "loss": 0.0086, "step": 152060 }, { "epoch": 2.19, "learning_rate": 1.9269723915623005e-05, "loss": 0.0078, "step": 152070 }, { "epoch": 2.19, "learning_rate": 1.9269675875884534e-05, "loss": 0.0065, "step": 152080 }, { "epoch": 2.19, "learning_rate": 1.926962783614606e-05, "loss": 0.0068, "step": 152090 }, { "epoch": 2.19, "learning_rate": 1.926957979640759e-05, "loss": 0.0084, "step": 152100 }, { "epoch": 2.19, "learning_rate": 1.9269531756669118e-05, "loss": 0.0063, "step": 152110 }, { "epoch": 2.19, "learning_rate": 1.9269483716930648e-05, "loss": 0.0064, "step": 152120 }, { "epoch": 2.19, "learning_rate": 1.9269435677192173e-05, "loss": 0.0087, "step": 152130 }, { "epoch": 2.19, "learning_rate": 1.9269387637453703e-05, "loss": 0.007, "step": 152140 }, { "epoch": 2.19, "learning_rate": 1.9269339597715232e-05, "loss": 0.0093, "step": 152150 }, { "epoch": 2.19, "learning_rate": 1.9269291557976758e-05, "loss": 0.0051, "step": 152160 }, { "epoch": 2.19, "learning_rate": 1.9269243518238287e-05, "loss": 0.0088, "step": 152170 }, { "epoch": 2.19, "learning_rate": 1.9269195478499816e-05, "loss": 0.0072, "step": 152180 }, { "epoch": 2.19, "learning_rate": 1.9269147438761346e-05, "loss": 0.0077, "step": 152190 }, { "epoch": 2.19, "learning_rate": 1.926909939902287e-05, "loss": 0.0062, "step": 152200 }, { "epoch": 2.19, "learning_rate": 1.92690513592844e-05, "loss": 0.0071, "step": 152210 }, { "epoch": 2.19, "learning_rate": 1.926900331954593e-05, "loss": 0.0069, "step": 152220 }, { "epoch": 2.19, "learning_rate": 1.9268955279807456e-05, "loss": 0.0087, "step": 152230 }, { "epoch": 2.19, "learning_rate": 1.9268907240068985e-05, "loss": 0.0078, "step": 152240 }, { "epoch": 2.19, "learning_rate": 1.9268859200330514e-05, "loss": 0.0064, "step": 152250 }, { "epoch": 2.19, "learning_rate": 1.9268811160592044e-05, "loss": 0.0071, "step": 152260 }, { "epoch": 2.19, "learning_rate": 1.926876312085357e-05, "loss": 0.008, "step": 152270 }, { "epoch": 2.19, "learning_rate": 1.92687150811151e-05, "loss": 0.0091, "step": 152280 }, { "epoch": 2.19, "learning_rate": 1.9268667041376628e-05, "loss": 0.011, "step": 152290 }, { "epoch": 2.19, "learning_rate": 1.9268619001638157e-05, "loss": 0.0063, "step": 152300 }, { "epoch": 2.2, "learning_rate": 1.9268570961899683e-05, "loss": 0.0073, "step": 152310 }, { "epoch": 2.2, "learning_rate": 1.9268522922161213e-05, "loss": 0.0052, "step": 152320 }, { "epoch": 2.2, "learning_rate": 1.9268474882422742e-05, "loss": 0.0087, "step": 152330 }, { "epoch": 2.2, "learning_rate": 1.9268426842684268e-05, "loss": 0.0072, "step": 152340 }, { "epoch": 2.2, "learning_rate": 1.9268378802945797e-05, "loss": 0.0097, "step": 152350 }, { "epoch": 2.2, "learning_rate": 1.9268330763207326e-05, "loss": 0.0067, "step": 152360 }, { "epoch": 2.2, "learning_rate": 1.9268282723468856e-05, "loss": 0.0062, "step": 152370 }, { "epoch": 2.2, "learning_rate": 1.926823468373038e-05, "loss": 0.0082, "step": 152380 }, { "epoch": 2.2, "learning_rate": 1.926818664399191e-05, "loss": 0.0095, "step": 152390 }, { "epoch": 2.2, "learning_rate": 1.926813860425344e-05, "loss": 0.0063, "step": 152400 }, { "epoch": 2.2, "learning_rate": 1.9268090564514966e-05, "loss": 0.0087, "step": 152410 }, { "epoch": 2.2, "learning_rate": 1.9268042524776495e-05, "loss": 0.0131, "step": 152420 }, { "epoch": 2.2, "learning_rate": 1.9267994485038024e-05, "loss": 0.0082, "step": 152430 }, { "epoch": 2.2, "learning_rate": 1.9267946445299554e-05, "loss": 0.0092, "step": 152440 }, { "epoch": 2.2, "learning_rate": 1.926789840556108e-05, "loss": 0.0067, "step": 152450 }, { "epoch": 2.2, "learning_rate": 1.926785036582261e-05, "loss": 0.0093, "step": 152460 }, { "epoch": 2.2, "learning_rate": 1.9267802326084138e-05, "loss": 0.0064, "step": 152470 }, { "epoch": 2.2, "learning_rate": 1.9267754286345667e-05, "loss": 0.0071, "step": 152480 }, { "epoch": 2.2, "learning_rate": 1.9267706246607193e-05, "loss": 0.0114, "step": 152490 }, { "epoch": 2.2, "learning_rate": 1.9267658206868722e-05, "loss": 0.0084, "step": 152500 }, { "epoch": 2.2, "learning_rate": 1.9267610167130252e-05, "loss": 0.0077, "step": 152510 }, { "epoch": 2.2, "learning_rate": 1.9267562127391778e-05, "loss": 0.0062, "step": 152520 }, { "epoch": 2.2, "learning_rate": 1.9267514087653307e-05, "loss": 0.0072, "step": 152530 }, { "epoch": 2.2, "learning_rate": 1.9267466047914836e-05, "loss": 0.0103, "step": 152540 }, { "epoch": 2.2, "learning_rate": 1.9267418008176365e-05, "loss": 0.0048, "step": 152550 }, { "epoch": 2.2, "learning_rate": 1.926736996843789e-05, "loss": 0.0089, "step": 152560 }, { "epoch": 2.2, "learning_rate": 1.926732192869942e-05, "loss": 0.0106, "step": 152570 }, { "epoch": 2.2, "learning_rate": 1.926727388896095e-05, "loss": 0.0099, "step": 152580 }, { "epoch": 2.2, "learning_rate": 1.926722584922248e-05, "loss": 0.0079, "step": 152590 }, { "epoch": 2.2, "learning_rate": 1.926717780948401e-05, "loss": 0.0089, "step": 152600 }, { "epoch": 2.2, "learning_rate": 1.9267129769745538e-05, "loss": 0.0088, "step": 152610 }, { "epoch": 2.2, "learning_rate": 1.9267081730007064e-05, "loss": 0.0068, "step": 152620 }, { "epoch": 2.2, "learning_rate": 1.9267033690268593e-05, "loss": 0.0105, "step": 152630 }, { "epoch": 2.2, "learning_rate": 1.9266985650530122e-05, "loss": 0.0057, "step": 152640 }, { "epoch": 2.2, "learning_rate": 1.9266937610791648e-05, "loss": 0.0075, "step": 152650 }, { "epoch": 2.2, "learning_rate": 1.9266889571053177e-05, "loss": 0.007, "step": 152660 }, { "epoch": 2.2, "learning_rate": 1.9266846335288552e-05, "loss": 0.0057, "step": 152670 }, { "epoch": 2.2, "learning_rate": 1.926679829555008e-05, "loss": 0.0074, "step": 152680 }, { "epoch": 2.2, "learning_rate": 1.9266750255811607e-05, "loss": 0.0082, "step": 152690 }, { "epoch": 2.2, "learning_rate": 1.9266702216073136e-05, "loss": 0.0073, "step": 152700 }, { "epoch": 2.2, "learning_rate": 1.9266654176334666e-05, "loss": 0.0097, "step": 152710 }, { "epoch": 2.2, "learning_rate": 1.926660613659619e-05, "loss": 0.01, "step": 152720 }, { "epoch": 2.2, "learning_rate": 1.926655809685772e-05, "loss": 0.005, "step": 152730 }, { "epoch": 2.2, "learning_rate": 1.926651005711925e-05, "loss": 0.0063, "step": 152740 }, { "epoch": 2.2, "learning_rate": 1.926646201738078e-05, "loss": 0.0075, "step": 152750 }, { "epoch": 2.2, "learning_rate": 1.9266413977642305e-05, "loss": 0.005, "step": 152760 }, { "epoch": 2.2, "learning_rate": 1.9266365937903834e-05, "loss": 0.0079, "step": 152770 }, { "epoch": 2.2, "learning_rate": 1.9266317898165364e-05, "loss": 0.0072, "step": 152780 }, { "epoch": 2.2, "learning_rate": 1.9266269858426893e-05, "loss": 0.0059, "step": 152790 }, { "epoch": 2.2, "learning_rate": 1.926622181868842e-05, "loss": 0.0097, "step": 152800 }, { "epoch": 2.2, "learning_rate": 1.9266173778949948e-05, "loss": 0.0063, "step": 152810 }, { "epoch": 2.2, "learning_rate": 1.9266125739211477e-05, "loss": 0.01, "step": 152820 }, { "epoch": 2.2, "learning_rate": 1.9266077699473003e-05, "loss": 0.0071, "step": 152830 }, { "epoch": 2.2, "learning_rate": 1.9266029659734533e-05, "loss": 0.0073, "step": 152840 }, { "epoch": 2.2, "learning_rate": 1.9265981619996062e-05, "loss": 0.0077, "step": 152850 }, { "epoch": 2.2, "learning_rate": 1.926593358025759e-05, "loss": 0.0136, "step": 152860 }, { "epoch": 2.2, "learning_rate": 1.9265885540519117e-05, "loss": 0.0077, "step": 152870 }, { "epoch": 2.2, "learning_rate": 1.9265837500780646e-05, "loss": 0.0076, "step": 152880 }, { "epoch": 2.2, "learning_rate": 1.9265789461042176e-05, "loss": 0.0111, "step": 152890 }, { "epoch": 2.2, "learning_rate": 1.92657414213037e-05, "loss": 0.0096, "step": 152900 }, { "epoch": 2.2, "learning_rate": 1.926569338156523e-05, "loss": 0.0068, "step": 152910 }, { "epoch": 2.2, "learning_rate": 1.926564534182676e-05, "loss": 0.0075, "step": 152920 }, { "epoch": 2.2, "learning_rate": 1.926559730208829e-05, "loss": 0.0061, "step": 152930 }, { "epoch": 2.2, "learning_rate": 1.9265549262349815e-05, "loss": 0.0078, "step": 152940 }, { "epoch": 2.2, "learning_rate": 1.9265501222611344e-05, "loss": 0.0101, "step": 152950 }, { "epoch": 2.2, "learning_rate": 1.9265453182872874e-05, "loss": 0.0055, "step": 152960 }, { "epoch": 2.2, "learning_rate": 1.9265405143134403e-05, "loss": 0.0091, "step": 152970 }, { "epoch": 2.2, "learning_rate": 1.926535710339593e-05, "loss": 0.0065, "step": 152980 }, { "epoch": 2.2, "learning_rate": 1.9265309063657458e-05, "loss": 0.008, "step": 152990 }, { "epoch": 2.21, "learning_rate": 1.9265261023918987e-05, "loss": 0.0072, "step": 153000 }, { "epoch": 2.21, "learning_rate": 1.9265212984180513e-05, "loss": 0.0079, "step": 153010 }, { "epoch": 2.21, "learning_rate": 1.9265164944442042e-05, "loss": 0.0083, "step": 153020 }, { "epoch": 2.21, "learning_rate": 1.9265116904703572e-05, "loss": 0.0064, "step": 153030 }, { "epoch": 2.21, "learning_rate": 1.92650688649651e-05, "loss": 0.0097, "step": 153040 }, { "epoch": 2.21, "learning_rate": 1.9265020825226627e-05, "loss": 0.0092, "step": 153050 }, { "epoch": 2.21, "learning_rate": 1.9264972785488156e-05, "loss": 0.0085, "step": 153060 }, { "epoch": 2.21, "learning_rate": 1.9264924745749685e-05, "loss": 0.0084, "step": 153070 }, { "epoch": 2.21, "learning_rate": 1.926487670601121e-05, "loss": 0.0068, "step": 153080 }, { "epoch": 2.21, "learning_rate": 1.926482866627274e-05, "loss": 0.0049, "step": 153090 }, { "epoch": 2.21, "learning_rate": 1.926478062653427e-05, "loss": 0.0055, "step": 153100 }, { "epoch": 2.21, "learning_rate": 1.92647325867958e-05, "loss": 0.0056, "step": 153110 }, { "epoch": 2.21, "learning_rate": 1.926468454705733e-05, "loss": 0.0079, "step": 153120 }, { "epoch": 2.21, "learning_rate": 1.9264636507318858e-05, "loss": 0.0067, "step": 153130 }, { "epoch": 2.21, "learning_rate": 1.9264588467580384e-05, "loss": 0.0064, "step": 153140 }, { "epoch": 2.21, "learning_rate": 1.9264540427841913e-05, "loss": 0.0088, "step": 153150 }, { "epoch": 2.21, "learning_rate": 1.9264492388103442e-05, "loss": 0.0079, "step": 153160 }, { "epoch": 2.21, "learning_rate": 1.926444434836497e-05, "loss": 0.0086, "step": 153170 }, { "epoch": 2.21, "learning_rate": 1.9264396308626497e-05, "loss": 0.0068, "step": 153180 }, { "epoch": 2.21, "learning_rate": 1.9264348268888026e-05, "loss": 0.0052, "step": 153190 }, { "epoch": 2.21, "learning_rate": 1.9264300229149556e-05, "loss": 0.0083, "step": 153200 }, { "epoch": 2.21, "learning_rate": 1.9264252189411085e-05, "loss": 0.0059, "step": 153210 }, { "epoch": 2.21, "learning_rate": 1.926420414967261e-05, "loss": 0.0072, "step": 153220 }, { "epoch": 2.21, "learning_rate": 1.926415610993414e-05, "loss": 0.0127, "step": 153230 }, { "epoch": 2.21, "learning_rate": 1.926410807019567e-05, "loss": 0.006, "step": 153240 }, { "epoch": 2.21, "learning_rate": 1.9264060030457195e-05, "loss": 0.0065, "step": 153250 }, { "epoch": 2.21, "learning_rate": 1.9264011990718725e-05, "loss": 0.0078, "step": 153260 }, { "epoch": 2.21, "learning_rate": 1.9263963950980254e-05, "loss": 0.0076, "step": 153270 }, { "epoch": 2.21, "learning_rate": 1.9263915911241783e-05, "loss": 0.0086, "step": 153280 }, { "epoch": 2.21, "learning_rate": 1.926386787150331e-05, "loss": 0.0098, "step": 153290 }, { "epoch": 2.21, "learning_rate": 1.9263819831764838e-05, "loss": 0.0068, "step": 153300 }, { "epoch": 2.21, "learning_rate": 1.9263771792026368e-05, "loss": 0.0061, "step": 153310 }, { "epoch": 2.21, "learning_rate": 1.9263723752287893e-05, "loss": 0.0091, "step": 153320 }, { "epoch": 2.21, "learning_rate": 1.9263675712549423e-05, "loss": 0.0043, "step": 153330 }, { "epoch": 2.21, "learning_rate": 1.9263627672810952e-05, "loss": 0.0067, "step": 153340 }, { "epoch": 2.21, "learning_rate": 1.926357963307248e-05, "loss": 0.006, "step": 153350 }, { "epoch": 2.21, "learning_rate": 1.9263531593334007e-05, "loss": 0.0098, "step": 153360 }, { "epoch": 2.21, "learning_rate": 1.9263483553595536e-05, "loss": 0.0048, "step": 153370 }, { "epoch": 2.21, "learning_rate": 1.9263435513857066e-05, "loss": 0.0107, "step": 153380 }, { "epoch": 2.21, "learning_rate": 1.9263387474118595e-05, "loss": 0.0109, "step": 153390 }, { "epoch": 2.21, "learning_rate": 1.926333943438012e-05, "loss": 0.0071, "step": 153400 }, { "epoch": 2.21, "learning_rate": 1.926329139464165e-05, "loss": 0.0078, "step": 153410 }, { "epoch": 2.21, "learning_rate": 1.926324335490318e-05, "loss": 0.0105, "step": 153420 }, { "epoch": 2.21, "learning_rate": 1.9263195315164705e-05, "loss": 0.0088, "step": 153430 }, { "epoch": 2.21, "learning_rate": 1.9263147275426235e-05, "loss": 0.0096, "step": 153440 }, { "epoch": 2.21, "learning_rate": 1.9263099235687764e-05, "loss": 0.0107, "step": 153450 }, { "epoch": 2.21, "learning_rate": 1.9263051195949293e-05, "loss": 0.0132, "step": 153460 }, { "epoch": 2.21, "learning_rate": 1.926300315621082e-05, "loss": 0.0061, "step": 153470 }, { "epoch": 2.21, "learning_rate": 1.9262955116472348e-05, "loss": 0.0091, "step": 153480 }, { "epoch": 2.21, "learning_rate": 1.9262907076733877e-05, "loss": 0.0077, "step": 153490 }, { "epoch": 2.21, "learning_rate": 1.9262859036995403e-05, "loss": 0.0097, "step": 153500 }, { "epoch": 2.21, "learning_rate": 1.9262810997256933e-05, "loss": 0.004, "step": 153510 }, { "epoch": 2.21, "learning_rate": 1.9262762957518462e-05, "loss": 0.0095, "step": 153520 }, { "epoch": 2.21, "learning_rate": 1.926271491777999e-05, "loss": 0.0079, "step": 153530 }, { "epoch": 2.21, "learning_rate": 1.9262666878041517e-05, "loss": 0.0056, "step": 153540 }, { "epoch": 2.21, "learning_rate": 1.9262618838303046e-05, "loss": 0.0084, "step": 153550 }, { "epoch": 2.21, "learning_rate": 1.9262570798564576e-05, "loss": 0.0094, "step": 153560 }, { "epoch": 2.21, "learning_rate": 1.9262522758826105e-05, "loss": 0.0119, "step": 153570 }, { "epoch": 2.21, "learning_rate": 1.926247471908763e-05, "loss": 0.006, "step": 153580 }, { "epoch": 2.21, "learning_rate": 1.926242667934916e-05, "loss": 0.0079, "step": 153590 }, { "epoch": 2.21, "learning_rate": 1.926237863961069e-05, "loss": 0.008, "step": 153600 }, { "epoch": 2.21, "learning_rate": 1.9262330599872215e-05, "loss": 0.009, "step": 153610 }, { "epoch": 2.21, "learning_rate": 1.9262282560133744e-05, "loss": 0.0052, "step": 153620 }, { "epoch": 2.21, "learning_rate": 1.9262234520395274e-05, "loss": 0.0084, "step": 153630 }, { "epoch": 2.21, "learning_rate": 1.9262186480656803e-05, "loss": 0.0047, "step": 153640 }, { "epoch": 2.21, "learning_rate": 1.926213844091833e-05, "loss": 0.0065, "step": 153650 }, { "epoch": 2.21, "learning_rate": 1.9262090401179858e-05, "loss": 0.0076, "step": 153660 }, { "epoch": 2.21, "learning_rate": 1.9262042361441387e-05, "loss": 0.0068, "step": 153670 }, { "epoch": 2.21, "learning_rate": 1.9261994321702913e-05, "loss": 0.0076, "step": 153680 }, { "epoch": 2.21, "learning_rate": 1.9261946281964443e-05, "loss": 0.0081, "step": 153690 }, { "epoch": 2.22, "learning_rate": 1.9261898242225972e-05, "loss": 0.0088, "step": 153700 }, { "epoch": 2.22, "learning_rate": 1.92618502024875e-05, "loss": 0.0122, "step": 153710 }, { "epoch": 2.22, "learning_rate": 1.9261802162749027e-05, "loss": 0.0081, "step": 153720 }, { "epoch": 2.22, "learning_rate": 1.9261754123010556e-05, "loss": 0.0111, "step": 153730 }, { "epoch": 2.22, "learning_rate": 1.9261706083272086e-05, "loss": 0.0083, "step": 153740 }, { "epoch": 2.22, "learning_rate": 1.9261658043533615e-05, "loss": 0.0066, "step": 153750 }, { "epoch": 2.22, "learning_rate": 1.926161000379514e-05, "loss": 0.0084, "step": 153760 }, { "epoch": 2.22, "learning_rate": 1.926156196405667e-05, "loss": 0.0112, "step": 153770 }, { "epoch": 2.22, "learning_rate": 1.92615139243182e-05, "loss": 0.0066, "step": 153780 }, { "epoch": 2.22, "learning_rate": 1.9261465884579725e-05, "loss": 0.0068, "step": 153790 }, { "epoch": 2.22, "learning_rate": 1.9261417844841254e-05, "loss": 0.0064, "step": 153800 }, { "epoch": 2.22, "learning_rate": 1.9261369805102784e-05, "loss": 0.0079, "step": 153810 }, { "epoch": 2.22, "learning_rate": 1.9261321765364313e-05, "loss": 0.0079, "step": 153820 }, { "epoch": 2.22, "learning_rate": 1.926127372562584e-05, "loss": 0.0073, "step": 153830 }, { "epoch": 2.22, "learning_rate": 1.9261225685887368e-05, "loss": 0.0094, "step": 153840 }, { "epoch": 2.22, "learning_rate": 1.9261177646148897e-05, "loss": 0.0066, "step": 153850 }, { "epoch": 2.22, "learning_rate": 1.9261129606410423e-05, "loss": 0.0085, "step": 153860 }, { "epoch": 2.22, "learning_rate": 1.9261081566671952e-05, "loss": 0.0074, "step": 153870 }, { "epoch": 2.22, "learning_rate": 1.9261033526933482e-05, "loss": 0.0103, "step": 153880 }, { "epoch": 2.22, "learning_rate": 1.926098548719501e-05, "loss": 0.006, "step": 153890 }, { "epoch": 2.22, "learning_rate": 1.9260937447456537e-05, "loss": 0.0058, "step": 153900 }, { "epoch": 2.22, "learning_rate": 1.9260889407718066e-05, "loss": 0.0071, "step": 153910 }, { "epoch": 2.22, "learning_rate": 1.9260841367979595e-05, "loss": 0.0064, "step": 153920 }, { "epoch": 2.22, "learning_rate": 1.9260793328241125e-05, "loss": 0.0084, "step": 153930 }, { "epoch": 2.22, "learning_rate": 1.926074528850265e-05, "loss": 0.0085, "step": 153940 }, { "epoch": 2.22, "learning_rate": 1.926069724876418e-05, "loss": 0.0071, "step": 153950 }, { "epoch": 2.22, "learning_rate": 1.926064920902571e-05, "loss": 0.0086, "step": 153960 }, { "epoch": 2.22, "learning_rate": 1.9260601169287235e-05, "loss": 0.007, "step": 153970 }, { "epoch": 2.22, "learning_rate": 1.9260553129548764e-05, "loss": 0.0054, "step": 153980 }, { "epoch": 2.22, "learning_rate": 1.9260505089810294e-05, "loss": 0.0114, "step": 153990 }, { "epoch": 2.22, "learning_rate": 1.9260457050071823e-05, "loss": 0.0071, "step": 154000 }, { "epoch": 2.22, "learning_rate": 1.926040901033335e-05, "loss": 0.0052, "step": 154010 }, { "epoch": 2.22, "learning_rate": 1.9260360970594878e-05, "loss": 0.0089, "step": 154020 }, { "epoch": 2.22, "learning_rate": 1.9260312930856407e-05, "loss": 0.0078, "step": 154030 }, { "epoch": 2.22, "learning_rate": 1.9260264891117933e-05, "loss": 0.0078, "step": 154040 }, { "epoch": 2.22, "learning_rate": 1.9260216851379462e-05, "loss": 0.0077, "step": 154050 }, { "epoch": 2.22, "learning_rate": 1.926016881164099e-05, "loss": 0.0082, "step": 154060 }, { "epoch": 2.22, "learning_rate": 1.926012077190252e-05, "loss": 0.011, "step": 154070 }, { "epoch": 2.22, "learning_rate": 1.9260072732164047e-05, "loss": 0.0072, "step": 154080 }, { "epoch": 2.22, "learning_rate": 1.9260024692425576e-05, "loss": 0.0061, "step": 154090 }, { "epoch": 2.22, "learning_rate": 1.9259976652687105e-05, "loss": 0.0101, "step": 154100 }, { "epoch": 2.22, "learning_rate": 1.9259928612948635e-05, "loss": 0.0081, "step": 154110 }, { "epoch": 2.22, "learning_rate": 1.925988057321016e-05, "loss": 0.01, "step": 154120 }, { "epoch": 2.22, "learning_rate": 1.925983253347169e-05, "loss": 0.0097, "step": 154130 }, { "epoch": 2.22, "learning_rate": 1.925978449373322e-05, "loss": 0.0097, "step": 154140 }, { "epoch": 2.22, "learning_rate": 1.9259736453994745e-05, "loss": 0.0062, "step": 154150 }, { "epoch": 2.22, "learning_rate": 1.9259688414256274e-05, "loss": 0.0072, "step": 154160 }, { "epoch": 2.22, "learning_rate": 1.9259640374517803e-05, "loss": 0.0076, "step": 154170 }, { "epoch": 2.22, "learning_rate": 1.9259592334779333e-05, "loss": 0.0085, "step": 154180 }, { "epoch": 2.22, "learning_rate": 1.925954429504086e-05, "loss": 0.0098, "step": 154190 }, { "epoch": 2.22, "learning_rate": 1.9259496255302388e-05, "loss": 0.0072, "step": 154200 }, { "epoch": 2.22, "learning_rate": 1.9259448215563917e-05, "loss": 0.0062, "step": 154210 }, { "epoch": 2.22, "learning_rate": 1.9259400175825443e-05, "loss": 0.0052, "step": 154220 }, { "epoch": 2.22, "learning_rate": 1.9259352136086972e-05, "loss": 0.0058, "step": 154230 }, { "epoch": 2.22, "learning_rate": 1.92593040963485e-05, "loss": 0.0066, "step": 154240 }, { "epoch": 2.22, "learning_rate": 1.925925605661003e-05, "loss": 0.0079, "step": 154250 }, { "epoch": 2.22, "learning_rate": 1.9259208016871557e-05, "loss": 0.0103, "step": 154260 }, { "epoch": 2.22, "learning_rate": 1.9259159977133086e-05, "loss": 0.0099, "step": 154270 }, { "epoch": 2.22, "learning_rate": 1.9259111937394615e-05, "loss": 0.0067, "step": 154280 }, { "epoch": 2.22, "learning_rate": 1.925906389765614e-05, "loss": 0.0085, "step": 154290 }, { "epoch": 2.22, "learning_rate": 1.925901585791767e-05, "loss": 0.0078, "step": 154300 }, { "epoch": 2.22, "learning_rate": 1.92589678181792e-05, "loss": 0.0083, "step": 154310 }, { "epoch": 2.22, "learning_rate": 1.925891977844073e-05, "loss": 0.0083, "step": 154320 }, { "epoch": 2.22, "learning_rate": 1.9258871738702255e-05, "loss": 0.0081, "step": 154330 }, { "epoch": 2.22, "learning_rate": 1.9258823698963784e-05, "loss": 0.0064, "step": 154340 }, { "epoch": 2.22, "learning_rate": 1.9258775659225313e-05, "loss": 0.009, "step": 154350 }, { "epoch": 2.22, "learning_rate": 1.9258727619486843e-05, "loss": 0.0072, "step": 154360 }, { "epoch": 2.22, "learning_rate": 1.925867957974837e-05, "loss": 0.008, "step": 154370 }, { "epoch": 2.22, "learning_rate": 1.9258631540009898e-05, "loss": 0.0066, "step": 154380 }, { "epoch": 2.23, "learning_rate": 1.9258583500271427e-05, "loss": 0.0095, "step": 154390 }, { "epoch": 2.23, "learning_rate": 1.9258535460532953e-05, "loss": 0.0076, "step": 154400 }, { "epoch": 2.23, "learning_rate": 1.9258487420794482e-05, "loss": 0.0086, "step": 154410 }, { "epoch": 2.23, "learning_rate": 1.925843938105601e-05, "loss": 0.0063, "step": 154420 }, { "epoch": 2.23, "learning_rate": 1.925839134131754e-05, "loss": 0.0079, "step": 154430 }, { "epoch": 2.23, "learning_rate": 1.9258343301579067e-05, "loss": 0.0083, "step": 154440 }, { "epoch": 2.23, "learning_rate": 1.9258295261840596e-05, "loss": 0.0085, "step": 154450 }, { "epoch": 2.23, "learning_rate": 1.9258247222102125e-05, "loss": 0.004, "step": 154460 }, { "epoch": 2.23, "learning_rate": 1.925819918236365e-05, "loss": 0.01, "step": 154470 }, { "epoch": 2.23, "learning_rate": 1.925815114262518e-05, "loss": 0.0078, "step": 154480 }, { "epoch": 2.23, "learning_rate": 1.925810310288671e-05, "loss": 0.0073, "step": 154490 }, { "epoch": 2.23, "learning_rate": 1.925805506314824e-05, "loss": 0.0071, "step": 154500 }, { "epoch": 2.23, "learning_rate": 1.9258007023409765e-05, "loss": 0.0108, "step": 154510 }, { "epoch": 2.23, "learning_rate": 1.9257958983671294e-05, "loss": 0.008, "step": 154520 }, { "epoch": 2.23, "learning_rate": 1.9257910943932823e-05, "loss": 0.0099, "step": 154530 }, { "epoch": 2.23, "learning_rate": 1.9257862904194353e-05, "loss": 0.0046, "step": 154540 }, { "epoch": 2.23, "learning_rate": 1.925781486445588e-05, "loss": 0.0112, "step": 154550 }, { "epoch": 2.23, "learning_rate": 1.9257766824717408e-05, "loss": 0.0084, "step": 154560 }, { "epoch": 2.23, "learning_rate": 1.9257718784978937e-05, "loss": 0.006, "step": 154570 }, { "epoch": 2.23, "learning_rate": 1.9257670745240463e-05, "loss": 0.0094, "step": 154580 }, { "epoch": 2.23, "learning_rate": 1.9257622705501992e-05, "loss": 0.0071, "step": 154590 }, { "epoch": 2.23, "learning_rate": 1.925757466576352e-05, "loss": 0.0062, "step": 154600 }, { "epoch": 2.23, "learning_rate": 1.925752662602505e-05, "loss": 0.0103, "step": 154610 }, { "epoch": 2.23, "learning_rate": 1.9257478586286577e-05, "loss": 0.0069, "step": 154620 }, { "epoch": 2.23, "learning_rate": 1.9257430546548106e-05, "loss": 0.0089, "step": 154630 }, { "epoch": 2.23, "learning_rate": 1.9257382506809635e-05, "loss": 0.0059, "step": 154640 }, { "epoch": 2.23, "learning_rate": 1.925733446707116e-05, "loss": 0.0084, "step": 154650 }, { "epoch": 2.23, "learning_rate": 1.925728642733269e-05, "loss": 0.009, "step": 154660 }, { "epoch": 2.23, "learning_rate": 1.925723838759422e-05, "loss": 0.0067, "step": 154670 }, { "epoch": 2.23, "learning_rate": 1.925719034785575e-05, "loss": 0.0054, "step": 154680 }, { "epoch": 2.23, "learning_rate": 1.9257142308117275e-05, "loss": 0.0086, "step": 154690 }, { "epoch": 2.23, "learning_rate": 1.9257094268378804e-05, "loss": 0.0062, "step": 154700 }, { "epoch": 2.23, "learning_rate": 1.9257046228640333e-05, "loss": 0.0066, "step": 154710 }, { "epoch": 2.23, "learning_rate": 1.9256998188901862e-05, "loss": 0.0084, "step": 154720 }, { "epoch": 2.23, "learning_rate": 1.925695014916339e-05, "loss": 0.007, "step": 154730 }, { "epoch": 2.23, "learning_rate": 1.9256902109424918e-05, "loss": 0.0089, "step": 154740 }, { "epoch": 2.23, "learning_rate": 1.9256854069686447e-05, "loss": 0.0078, "step": 154750 }, { "epoch": 2.23, "learning_rate": 1.9256806029947973e-05, "loss": 0.007, "step": 154760 }, { "epoch": 2.23, "learning_rate": 1.9256757990209502e-05, "loss": 0.0096, "step": 154770 }, { "epoch": 2.23, "learning_rate": 1.925670995047103e-05, "loss": 0.0067, "step": 154780 }, { "epoch": 2.23, "learning_rate": 1.925666191073256e-05, "loss": 0.0088, "step": 154790 }, { "epoch": 2.23, "learning_rate": 1.9256613870994086e-05, "loss": 0.0087, "step": 154800 }, { "epoch": 2.23, "learning_rate": 1.9256565831255616e-05, "loss": 0.0063, "step": 154810 }, { "epoch": 2.23, "learning_rate": 1.9256517791517145e-05, "loss": 0.0088, "step": 154820 }, { "epoch": 2.23, "learning_rate": 1.925646975177867e-05, "loss": 0.0058, "step": 154830 }, { "epoch": 2.23, "learning_rate": 1.92564217120402e-05, "loss": 0.0072, "step": 154840 }, { "epoch": 2.23, "learning_rate": 1.925637367230173e-05, "loss": 0.0065, "step": 154850 }, { "epoch": 2.23, "learning_rate": 1.925632563256326e-05, "loss": 0.0113, "step": 154860 }, { "epoch": 2.23, "learning_rate": 1.9256277592824785e-05, "loss": 0.0067, "step": 154870 }, { "epoch": 2.23, "learning_rate": 1.9256229553086314e-05, "loss": 0.0051, "step": 154880 }, { "epoch": 2.23, "learning_rate": 1.9256181513347843e-05, "loss": 0.0098, "step": 154890 }, { "epoch": 2.23, "learning_rate": 1.9256133473609372e-05, "loss": 0.0102, "step": 154900 }, { "epoch": 2.23, "learning_rate": 1.9256085433870898e-05, "loss": 0.0071, "step": 154910 }, { "epoch": 2.23, "learning_rate": 1.9256037394132428e-05, "loss": 0.0105, "step": 154920 }, { "epoch": 2.23, "learning_rate": 1.9255989354393957e-05, "loss": 0.0064, "step": 154930 }, { "epoch": 2.23, "learning_rate": 1.9255941314655483e-05, "loss": 0.0068, "step": 154940 }, { "epoch": 2.23, "learning_rate": 1.9255893274917012e-05, "loss": 0.0062, "step": 154950 }, { "epoch": 2.23, "learning_rate": 1.925584523517854e-05, "loss": 0.0095, "step": 154960 }, { "epoch": 2.23, "learning_rate": 1.925579719544007e-05, "loss": 0.0077, "step": 154970 }, { "epoch": 2.23, "learning_rate": 1.9255749155701596e-05, "loss": 0.0061, "step": 154980 }, { "epoch": 2.23, "learning_rate": 1.9255701115963126e-05, "loss": 0.0076, "step": 154990 }, { "epoch": 2.23, "learning_rate": 1.9255653076224655e-05, "loss": 0.0081, "step": 155000 }, { "epoch": 2.23, "learning_rate": 1.925560503648618e-05, "loss": 0.0102, "step": 155010 }, { "epoch": 2.23, "learning_rate": 1.925555699674771e-05, "loss": 0.0112, "step": 155020 }, { "epoch": 2.23, "learning_rate": 1.925550895700924e-05, "loss": 0.0063, "step": 155030 }, { "epoch": 2.23, "learning_rate": 1.925546091727077e-05, "loss": 0.0076, "step": 155040 }, { "epoch": 2.23, "learning_rate": 1.9255412877532294e-05, "loss": 0.0097, "step": 155050 }, { "epoch": 2.23, "learning_rate": 1.9255364837793824e-05, "loss": 0.0079, "step": 155060 }, { "epoch": 2.23, "learning_rate": 1.9255316798055353e-05, "loss": 0.0094, "step": 155070 }, { "epoch": 2.24, "learning_rate": 1.9255268758316882e-05, "loss": 0.0071, "step": 155080 }, { "epoch": 2.24, "learning_rate": 1.9255220718578408e-05, "loss": 0.011, "step": 155090 }, { "epoch": 2.24, "learning_rate": 1.9255172678839937e-05, "loss": 0.0064, "step": 155100 }, { "epoch": 2.24, "learning_rate": 1.9255124639101467e-05, "loss": 0.0099, "step": 155110 }, { "epoch": 2.24, "learning_rate": 1.9255076599362993e-05, "loss": 0.0064, "step": 155120 }, { "epoch": 2.24, "learning_rate": 1.9255028559624522e-05, "loss": 0.0062, "step": 155130 }, { "epoch": 2.24, "learning_rate": 1.925498051988605e-05, "loss": 0.0083, "step": 155140 }, { "epoch": 2.24, "learning_rate": 1.925493248014758e-05, "loss": 0.0108, "step": 155150 }, { "epoch": 2.24, "learning_rate": 1.9254884440409106e-05, "loss": 0.007, "step": 155160 }, { "epoch": 2.24, "learning_rate": 1.9254836400670636e-05, "loss": 0.0068, "step": 155170 }, { "epoch": 2.24, "learning_rate": 1.9254788360932165e-05, "loss": 0.0061, "step": 155180 }, { "epoch": 2.24, "learning_rate": 1.925474032119369e-05, "loss": 0.0076, "step": 155190 }, { "epoch": 2.24, "learning_rate": 1.925469228145522e-05, "loss": 0.0056, "step": 155200 }, { "epoch": 2.24, "learning_rate": 1.925464424171675e-05, "loss": 0.0064, "step": 155210 }, { "epoch": 2.24, "learning_rate": 1.925459620197828e-05, "loss": 0.0095, "step": 155220 }, { "epoch": 2.24, "learning_rate": 1.9254548162239804e-05, "loss": 0.0092, "step": 155230 }, { "epoch": 2.24, "learning_rate": 1.9254500122501334e-05, "loss": 0.0052, "step": 155240 }, { "epoch": 2.24, "learning_rate": 1.9254452082762863e-05, "loss": 0.0101, "step": 155250 }, { "epoch": 2.24, "learning_rate": 1.9254404043024392e-05, "loss": 0.0068, "step": 155260 }, { "epoch": 2.24, "learning_rate": 1.9254356003285918e-05, "loss": 0.0091, "step": 155270 }, { "epoch": 2.24, "learning_rate": 1.9254307963547447e-05, "loss": 0.0065, "step": 155280 }, { "epoch": 2.24, "learning_rate": 1.9254259923808977e-05, "loss": 0.0064, "step": 155290 }, { "epoch": 2.24, "learning_rate": 1.9254211884070503e-05, "loss": 0.01, "step": 155300 }, { "epoch": 2.24, "learning_rate": 1.9254163844332032e-05, "loss": 0.0099, "step": 155310 }, { "epoch": 2.24, "learning_rate": 1.925411580459356e-05, "loss": 0.0096, "step": 155320 }, { "epoch": 2.24, "learning_rate": 1.925406776485509e-05, "loss": 0.0075, "step": 155330 }, { "epoch": 2.24, "learning_rate": 1.9254019725116616e-05, "loss": 0.0117, "step": 155340 }, { "epoch": 2.24, "learning_rate": 1.9253971685378145e-05, "loss": 0.0085, "step": 155350 }, { "epoch": 2.24, "learning_rate": 1.9253923645639675e-05, "loss": 0.0072, "step": 155360 }, { "epoch": 2.24, "learning_rate": 1.92538756059012e-05, "loss": 0.0082, "step": 155370 }, { "epoch": 2.24, "learning_rate": 1.925382756616273e-05, "loss": 0.0074, "step": 155380 }, { "epoch": 2.24, "learning_rate": 1.925377952642426e-05, "loss": 0.0075, "step": 155390 }, { "epoch": 2.24, "learning_rate": 1.925373148668579e-05, "loss": 0.0078, "step": 155400 }, { "epoch": 2.24, "learning_rate": 1.9253683446947314e-05, "loss": 0.0077, "step": 155410 }, { "epoch": 2.24, "learning_rate": 1.9253635407208844e-05, "loss": 0.0078, "step": 155420 }, { "epoch": 2.24, "learning_rate": 1.9253587367470373e-05, "loss": 0.0065, "step": 155430 }, { "epoch": 2.24, "learning_rate": 1.9253539327731902e-05, "loss": 0.0088, "step": 155440 }, { "epoch": 2.24, "learning_rate": 1.9253491287993428e-05, "loss": 0.0079, "step": 155450 }, { "epoch": 2.24, "learning_rate": 1.9253443248254957e-05, "loss": 0.0073, "step": 155460 }, { "epoch": 2.24, "learning_rate": 1.9253395208516487e-05, "loss": 0.0081, "step": 155470 }, { "epoch": 2.24, "learning_rate": 1.9253347168778012e-05, "loss": 0.0088, "step": 155480 }, { "epoch": 2.24, "learning_rate": 1.9253299129039542e-05, "loss": 0.0069, "step": 155490 }, { "epoch": 2.24, "learning_rate": 1.925325108930107e-05, "loss": 0.0065, "step": 155500 }, { "epoch": 2.24, "learning_rate": 1.92532030495626e-05, "loss": 0.0108, "step": 155510 }, { "epoch": 2.24, "learning_rate": 1.9253155009824126e-05, "loss": 0.0051, "step": 155520 }, { "epoch": 2.24, "learning_rate": 1.9253106970085655e-05, "loss": 0.0131, "step": 155530 }, { "epoch": 2.24, "learning_rate": 1.9253058930347185e-05, "loss": 0.0084, "step": 155540 }, { "epoch": 2.24, "learning_rate": 1.925301089060871e-05, "loss": 0.009, "step": 155550 }, { "epoch": 2.24, "learning_rate": 1.925296285087024e-05, "loss": 0.0087, "step": 155560 }, { "epoch": 2.24, "learning_rate": 1.925291481113177e-05, "loss": 0.0093, "step": 155570 }, { "epoch": 2.24, "learning_rate": 1.92528667713933e-05, "loss": 0.0068, "step": 155580 }, { "epoch": 2.24, "learning_rate": 1.9252818731654824e-05, "loss": 0.0057, "step": 155590 }, { "epoch": 2.24, "learning_rate": 1.9252770691916354e-05, "loss": 0.0064, "step": 155600 }, { "epoch": 2.24, "learning_rate": 1.9252722652177883e-05, "loss": 0.006, "step": 155610 }, { "epoch": 2.24, "learning_rate": 1.9252674612439412e-05, "loss": 0.0077, "step": 155620 }, { "epoch": 2.24, "learning_rate": 1.9252626572700938e-05, "loss": 0.0058, "step": 155630 }, { "epoch": 2.24, "learning_rate": 1.9252578532962467e-05, "loss": 0.01, "step": 155640 }, { "epoch": 2.24, "learning_rate": 1.9252530493223996e-05, "loss": 0.0067, "step": 155650 }, { "epoch": 2.24, "learning_rate": 1.9252482453485522e-05, "loss": 0.0057, "step": 155660 }, { "epoch": 2.24, "learning_rate": 1.9252434413747055e-05, "loss": 0.0074, "step": 155670 }, { "epoch": 2.24, "learning_rate": 1.925238637400858e-05, "loss": 0.0056, "step": 155680 }, { "epoch": 2.24, "learning_rate": 1.925233833427011e-05, "loss": 0.0081, "step": 155690 }, { "epoch": 2.24, "learning_rate": 1.925229029453164e-05, "loss": 0.0064, "step": 155700 }, { "epoch": 2.24, "learning_rate": 1.9252247058767014e-05, "loss": 0.0071, "step": 155710 }, { "epoch": 2.24, "learning_rate": 1.925219901902854e-05, "loss": 0.0086, "step": 155720 }, { "epoch": 2.24, "learning_rate": 1.925215097929007e-05, "loss": 0.0122, "step": 155730 }, { "epoch": 2.24, "learning_rate": 1.92521029395516e-05, "loss": 0.0082, "step": 155740 }, { "epoch": 2.24, "learning_rate": 1.9252054899813128e-05, "loss": 0.0095, "step": 155750 }, { "epoch": 2.24, "learning_rate": 1.9252006860074654e-05, "loss": 0.0083, "step": 155760 }, { "epoch": 2.24, "learning_rate": 1.9251958820336183e-05, "loss": 0.0063, "step": 155770 }, { "epoch": 2.25, "learning_rate": 1.9251910780597712e-05, "loss": 0.0065, "step": 155780 }, { "epoch": 2.25, "learning_rate": 1.9251862740859238e-05, "loss": 0.006, "step": 155790 }, { "epoch": 2.25, "learning_rate": 1.9251814701120767e-05, "loss": 0.0066, "step": 155800 }, { "epoch": 2.25, "learning_rate": 1.9251766661382297e-05, "loss": 0.0115, "step": 155810 }, { "epoch": 2.25, "learning_rate": 1.9251718621643826e-05, "loss": 0.0093, "step": 155820 }, { "epoch": 2.25, "learning_rate": 1.9251670581905352e-05, "loss": 0.01, "step": 155830 }, { "epoch": 2.25, "learning_rate": 1.925162254216688e-05, "loss": 0.008, "step": 155840 }, { "epoch": 2.25, "learning_rate": 1.925157450242841e-05, "loss": 0.0075, "step": 155850 }, { "epoch": 2.25, "learning_rate": 1.9251526462689936e-05, "loss": 0.0066, "step": 155860 }, { "epoch": 2.25, "learning_rate": 1.9251478422951465e-05, "loss": 0.0091, "step": 155870 }, { "epoch": 2.25, "learning_rate": 1.9251430383212995e-05, "loss": 0.0059, "step": 155880 }, { "epoch": 2.25, "learning_rate": 1.9251382343474524e-05, "loss": 0.0065, "step": 155890 }, { "epoch": 2.25, "learning_rate": 1.925133430373605e-05, "loss": 0.0047, "step": 155900 }, { "epoch": 2.25, "learning_rate": 1.925128626399758e-05, "loss": 0.0082, "step": 155910 }, { "epoch": 2.25, "learning_rate": 1.925123822425911e-05, "loss": 0.0088, "step": 155920 }, { "epoch": 2.25, "learning_rate": 1.9251190184520638e-05, "loss": 0.0104, "step": 155930 }, { "epoch": 2.25, "learning_rate": 1.9251142144782164e-05, "loss": 0.0078, "step": 155940 }, { "epoch": 2.25, "learning_rate": 1.9251094105043693e-05, "loss": 0.0087, "step": 155950 }, { "epoch": 2.25, "learning_rate": 1.9251046065305222e-05, "loss": 0.0097, "step": 155960 }, { "epoch": 2.25, "learning_rate": 1.9250998025566748e-05, "loss": 0.0043, "step": 155970 }, { "epoch": 2.25, "learning_rate": 1.9250949985828277e-05, "loss": 0.0069, "step": 155980 }, { "epoch": 2.25, "learning_rate": 1.9250901946089807e-05, "loss": 0.0087, "step": 155990 }, { "epoch": 2.25, "learning_rate": 1.9250853906351336e-05, "loss": 0.0087, "step": 156000 }, { "epoch": 2.25, "learning_rate": 1.925080586661286e-05, "loss": 0.0109, "step": 156010 }, { "epoch": 2.25, "learning_rate": 1.925075782687439e-05, "loss": 0.0087, "step": 156020 }, { "epoch": 2.25, "learning_rate": 1.925070978713592e-05, "loss": 0.0066, "step": 156030 }, { "epoch": 2.25, "learning_rate": 1.9250661747397446e-05, "loss": 0.0096, "step": 156040 }, { "epoch": 2.25, "learning_rate": 1.9250613707658975e-05, "loss": 0.0073, "step": 156050 }, { "epoch": 2.25, "learning_rate": 1.9250565667920505e-05, "loss": 0.0085, "step": 156060 }, { "epoch": 2.25, "learning_rate": 1.9250517628182034e-05, "loss": 0.0058, "step": 156070 }, { "epoch": 2.25, "learning_rate": 1.925046958844356e-05, "loss": 0.0089, "step": 156080 }, { "epoch": 2.25, "learning_rate": 1.925042154870509e-05, "loss": 0.006, "step": 156090 }, { "epoch": 2.25, "learning_rate": 1.925037350896662e-05, "loss": 0.009, "step": 156100 }, { "epoch": 2.25, "learning_rate": 1.9250325469228148e-05, "loss": 0.0086, "step": 156110 }, { "epoch": 2.25, "learning_rate": 1.9250277429489673e-05, "loss": 0.0078, "step": 156120 }, { "epoch": 2.25, "learning_rate": 1.9250229389751203e-05, "loss": 0.0073, "step": 156130 }, { "epoch": 2.25, "learning_rate": 1.9250181350012732e-05, "loss": 0.0055, "step": 156140 }, { "epoch": 2.25, "learning_rate": 1.9250138114248107e-05, "loss": 0.0077, "step": 156150 }, { "epoch": 2.25, "learning_rate": 1.9250090074509636e-05, "loss": 0.007, "step": 156160 }, { "epoch": 2.25, "learning_rate": 1.9250042034771165e-05, "loss": 0.0079, "step": 156170 }, { "epoch": 2.25, "learning_rate": 1.924999399503269e-05, "loss": 0.009, "step": 156180 }, { "epoch": 2.25, "learning_rate": 1.924994595529422e-05, "loss": 0.0069, "step": 156190 }, { "epoch": 2.25, "learning_rate": 1.924989791555575e-05, "loss": 0.0057, "step": 156200 }, { "epoch": 2.25, "learning_rate": 1.9249849875817276e-05, "loss": 0.0078, "step": 156210 }, { "epoch": 2.25, "learning_rate": 1.9249801836078805e-05, "loss": 0.0076, "step": 156220 }, { "epoch": 2.25, "learning_rate": 1.9249753796340334e-05, "loss": 0.0078, "step": 156230 }, { "epoch": 2.25, "learning_rate": 1.9249705756601863e-05, "loss": 0.0113, "step": 156240 }, { "epoch": 2.25, "learning_rate": 1.924965771686339e-05, "loss": 0.0078, "step": 156250 }, { "epoch": 2.25, "learning_rate": 1.924960967712492e-05, "loss": 0.0107, "step": 156260 }, { "epoch": 2.25, "learning_rate": 1.9249561637386448e-05, "loss": 0.0084, "step": 156270 }, { "epoch": 2.25, "learning_rate": 1.9249513597647974e-05, "loss": 0.0039, "step": 156280 }, { "epoch": 2.25, "learning_rate": 1.9249465557909503e-05, "loss": 0.0047, "step": 156290 }, { "epoch": 2.25, "learning_rate": 1.9249417518171032e-05, "loss": 0.0085, "step": 156300 }, { "epoch": 2.25, "learning_rate": 1.924936947843256e-05, "loss": 0.0086, "step": 156310 }, { "epoch": 2.25, "learning_rate": 1.9249321438694087e-05, "loss": 0.0067, "step": 156320 }, { "epoch": 2.25, "learning_rate": 1.9249273398955617e-05, "loss": 0.0061, "step": 156330 }, { "epoch": 2.25, "learning_rate": 1.9249225359217146e-05, "loss": 0.0074, "step": 156340 }, { "epoch": 2.25, "learning_rate": 1.9249177319478675e-05, "loss": 0.0069, "step": 156350 }, { "epoch": 2.25, "learning_rate": 1.92491292797402e-05, "loss": 0.0071, "step": 156360 }, { "epoch": 2.25, "learning_rate": 1.924908124000173e-05, "loss": 0.0065, "step": 156370 }, { "epoch": 2.25, "learning_rate": 1.924903320026326e-05, "loss": 0.0093, "step": 156380 }, { "epoch": 2.25, "learning_rate": 1.9248985160524785e-05, "loss": 0.0081, "step": 156390 }, { "epoch": 2.25, "learning_rate": 1.9248937120786315e-05, "loss": 0.0097, "step": 156400 }, { "epoch": 2.25, "learning_rate": 1.9248889081047844e-05, "loss": 0.0064, "step": 156410 }, { "epoch": 2.25, "learning_rate": 1.9248841041309373e-05, "loss": 0.0087, "step": 156420 }, { "epoch": 2.25, "learning_rate": 1.92487930015709e-05, "loss": 0.0065, "step": 156430 }, { "epoch": 2.25, "learning_rate": 1.924874496183243e-05, "loss": 0.0051, "step": 156440 }, { "epoch": 2.25, "learning_rate": 1.9248696922093958e-05, "loss": 0.0067, "step": 156450 }, { "epoch": 2.25, "learning_rate": 1.9248648882355484e-05, "loss": 0.0074, "step": 156460 }, { "epoch": 2.26, "learning_rate": 1.9248600842617013e-05, "loss": 0.0074, "step": 156470 }, { "epoch": 2.26, "learning_rate": 1.9248552802878542e-05, "loss": 0.0088, "step": 156480 }, { "epoch": 2.26, "learning_rate": 1.924850476314007e-05, "loss": 0.0085, "step": 156490 }, { "epoch": 2.26, "learning_rate": 1.9248456723401597e-05, "loss": 0.0064, "step": 156500 }, { "epoch": 2.26, "learning_rate": 1.9248408683663126e-05, "loss": 0.0061, "step": 156510 }, { "epoch": 2.26, "learning_rate": 1.9248360643924656e-05, "loss": 0.0085, "step": 156520 }, { "epoch": 2.26, "learning_rate": 1.9248312604186185e-05, "loss": 0.0068, "step": 156530 }, { "epoch": 2.26, "learning_rate": 1.924826456444771e-05, "loss": 0.0101, "step": 156540 }, { "epoch": 2.26, "learning_rate": 1.924821652470924e-05, "loss": 0.0074, "step": 156550 }, { "epoch": 2.26, "learning_rate": 1.924816848497077e-05, "loss": 0.0065, "step": 156560 }, { "epoch": 2.26, "learning_rate": 1.9248120445232295e-05, "loss": 0.0063, "step": 156570 }, { "epoch": 2.26, "learning_rate": 1.9248072405493825e-05, "loss": 0.0087, "step": 156580 }, { "epoch": 2.26, "learning_rate": 1.9248024365755354e-05, "loss": 0.0065, "step": 156590 }, { "epoch": 2.26, "learning_rate": 1.9247976326016883e-05, "loss": 0.0082, "step": 156600 }, { "epoch": 2.26, "learning_rate": 1.924792828627841e-05, "loss": 0.0059, "step": 156610 }, { "epoch": 2.26, "learning_rate": 1.9247880246539938e-05, "loss": 0.0077, "step": 156620 }, { "epoch": 2.26, "learning_rate": 1.9247832206801468e-05, "loss": 0.0103, "step": 156630 }, { "epoch": 2.26, "learning_rate": 1.9247784167062993e-05, "loss": 0.0078, "step": 156640 }, { "epoch": 2.26, "learning_rate": 1.9247736127324523e-05, "loss": 0.0064, "step": 156650 }, { "epoch": 2.26, "learning_rate": 1.9247688087586052e-05, "loss": 0.0098, "step": 156660 }, { "epoch": 2.26, "learning_rate": 1.924764004784758e-05, "loss": 0.0068, "step": 156670 }, { "epoch": 2.26, "learning_rate": 1.9247592008109107e-05, "loss": 0.0079, "step": 156680 }, { "epoch": 2.26, "learning_rate": 1.9247543968370636e-05, "loss": 0.009, "step": 156690 }, { "epoch": 2.26, "learning_rate": 1.9247495928632166e-05, "loss": 0.0088, "step": 156700 }, { "epoch": 2.26, "learning_rate": 1.9247447888893695e-05, "loss": 0.0103, "step": 156710 }, { "epoch": 2.26, "learning_rate": 1.9247399849155224e-05, "loss": 0.0093, "step": 156720 }, { "epoch": 2.26, "learning_rate": 1.9247351809416753e-05, "loss": 0.0087, "step": 156730 }, { "epoch": 2.26, "learning_rate": 1.924730376967828e-05, "loss": 0.0092, "step": 156740 }, { "epoch": 2.26, "learning_rate": 1.924725572993981e-05, "loss": 0.0084, "step": 156750 }, { "epoch": 2.26, "learning_rate": 1.9247207690201338e-05, "loss": 0.0066, "step": 156760 }, { "epoch": 2.26, "learning_rate": 1.9247159650462867e-05, "loss": 0.0073, "step": 156770 }, { "epoch": 2.26, "learning_rate": 1.9247111610724393e-05, "loss": 0.0107, "step": 156780 }, { "epoch": 2.26, "learning_rate": 1.9247063570985922e-05, "loss": 0.0106, "step": 156790 }, { "epoch": 2.26, "learning_rate": 1.924701553124745e-05, "loss": 0.0076, "step": 156800 }, { "epoch": 2.26, "learning_rate": 1.9246967491508977e-05, "loss": 0.0083, "step": 156810 }, { "epoch": 2.26, "learning_rate": 1.9246919451770507e-05, "loss": 0.0073, "step": 156820 }, { "epoch": 2.26, "learning_rate": 1.9246871412032036e-05, "loss": 0.0066, "step": 156830 }, { "epoch": 2.26, "learning_rate": 1.9246823372293565e-05, "loss": 0.0077, "step": 156840 }, { "epoch": 2.26, "learning_rate": 1.924677533255509e-05, "loss": 0.007, "step": 156850 }, { "epoch": 2.26, "learning_rate": 1.924672729281662e-05, "loss": 0.0119, "step": 156860 }, { "epoch": 2.26, "learning_rate": 1.924667925307815e-05, "loss": 0.012, "step": 156870 }, { "epoch": 2.26, "learning_rate": 1.9246631213339676e-05, "loss": 0.0078, "step": 156880 }, { "epoch": 2.26, "learning_rate": 1.9246583173601205e-05, "loss": 0.0079, "step": 156890 }, { "epoch": 2.26, "learning_rate": 1.9246535133862734e-05, "loss": 0.0085, "step": 156900 }, { "epoch": 2.26, "learning_rate": 1.9246487094124263e-05, "loss": 0.0107, "step": 156910 }, { "epoch": 2.26, "learning_rate": 1.924643905438579e-05, "loss": 0.0084, "step": 156920 }, { "epoch": 2.26, "learning_rate": 1.924639101464732e-05, "loss": 0.0079, "step": 156930 }, { "epoch": 2.26, "learning_rate": 1.9246342974908848e-05, "loss": 0.009, "step": 156940 }, { "epoch": 2.26, "learning_rate": 1.9246294935170374e-05, "loss": 0.0099, "step": 156950 }, { "epoch": 2.26, "learning_rate": 1.9246246895431903e-05, "loss": 0.0074, "step": 156960 }, { "epoch": 2.26, "learning_rate": 1.9246198855693432e-05, "loss": 0.0096, "step": 156970 }, { "epoch": 2.26, "learning_rate": 1.924615081595496e-05, "loss": 0.0071, "step": 156980 }, { "epoch": 2.26, "learning_rate": 1.9246102776216487e-05, "loss": 0.0082, "step": 156990 }, { "epoch": 2.26, "learning_rate": 1.9246054736478017e-05, "loss": 0.0068, "step": 157000 }, { "epoch": 2.26, "learning_rate": 1.9246006696739546e-05, "loss": 0.0046, "step": 157010 }, { "epoch": 2.26, "learning_rate": 1.9245958657001075e-05, "loss": 0.0061, "step": 157020 }, { "epoch": 2.26, "learning_rate": 1.92459106172626e-05, "loss": 0.0075, "step": 157030 }, { "epoch": 2.26, "learning_rate": 1.924586257752413e-05, "loss": 0.0115, "step": 157040 }, { "epoch": 2.26, "learning_rate": 1.924581453778566e-05, "loss": 0.0082, "step": 157050 }, { "epoch": 2.26, "learning_rate": 1.9245766498047186e-05, "loss": 0.0061, "step": 157060 }, { "epoch": 2.26, "learning_rate": 1.9245718458308715e-05, "loss": 0.0093, "step": 157070 }, { "epoch": 2.26, "learning_rate": 1.9245670418570244e-05, "loss": 0.0073, "step": 157080 }, { "epoch": 2.26, "learning_rate": 1.9245622378831773e-05, "loss": 0.0071, "step": 157090 }, { "epoch": 2.26, "learning_rate": 1.92455743390933e-05, "loss": 0.0072, "step": 157100 }, { "epoch": 2.26, "learning_rate": 1.924552629935483e-05, "loss": 0.0047, "step": 157110 }, { "epoch": 2.26, "learning_rate": 1.9245478259616358e-05, "loss": 0.0094, "step": 157120 }, { "epoch": 2.26, "learning_rate": 1.9245430219877884e-05, "loss": 0.006, "step": 157130 }, { "epoch": 2.26, "learning_rate": 1.9245382180139413e-05, "loss": 0.0079, "step": 157140 }, { "epoch": 2.26, "learning_rate": 1.9245334140400942e-05, "loss": 0.0075, "step": 157150 }, { "epoch": 2.26, "learning_rate": 1.924528610066247e-05, "loss": 0.0093, "step": 157160 }, { "epoch": 2.27, "learning_rate": 1.9245238060923997e-05, "loss": 0.0066, "step": 157170 }, { "epoch": 2.27, "learning_rate": 1.9245190021185527e-05, "loss": 0.0048, "step": 157180 }, { "epoch": 2.27, "learning_rate": 1.9245141981447056e-05, "loss": 0.0079, "step": 157190 }, { "epoch": 2.27, "learning_rate": 1.9245093941708585e-05, "loss": 0.0083, "step": 157200 }, { "epoch": 2.27, "learning_rate": 1.924504590197011e-05, "loss": 0.0081, "step": 157210 }, { "epoch": 2.27, "learning_rate": 1.924499786223164e-05, "loss": 0.0086, "step": 157220 }, { "epoch": 2.27, "learning_rate": 1.924494982249317e-05, "loss": 0.0075, "step": 157230 }, { "epoch": 2.27, "learning_rate": 1.9244901782754695e-05, "loss": 0.011, "step": 157240 }, { "epoch": 2.27, "learning_rate": 1.9244853743016225e-05, "loss": 0.0087, "step": 157250 }, { "epoch": 2.27, "learning_rate": 1.9244805703277754e-05, "loss": 0.008, "step": 157260 }, { "epoch": 2.27, "learning_rate": 1.9244757663539283e-05, "loss": 0.0102, "step": 157270 }, { "epoch": 2.27, "learning_rate": 1.924470962380081e-05, "loss": 0.0097, "step": 157280 }, { "epoch": 2.27, "learning_rate": 1.924466158406234e-05, "loss": 0.0068, "step": 157290 }, { "epoch": 2.27, "learning_rate": 1.9244613544323868e-05, "loss": 0.0079, "step": 157300 }, { "epoch": 2.27, "learning_rate": 1.9244565504585394e-05, "loss": 0.0085, "step": 157310 }, { "epoch": 2.27, "learning_rate": 1.9244517464846923e-05, "loss": 0.0082, "step": 157320 }, { "epoch": 2.27, "learning_rate": 1.9244469425108452e-05, "loss": 0.0075, "step": 157330 }, { "epoch": 2.27, "learning_rate": 1.924442138536998e-05, "loss": 0.008, "step": 157340 }, { "epoch": 2.27, "learning_rate": 1.9244373345631507e-05, "loss": 0.0058, "step": 157350 }, { "epoch": 2.27, "learning_rate": 1.9244325305893036e-05, "loss": 0.008, "step": 157360 }, { "epoch": 2.27, "learning_rate": 1.9244277266154566e-05, "loss": 0.013, "step": 157370 }, { "epoch": 2.27, "learning_rate": 1.9244229226416095e-05, "loss": 0.0085, "step": 157380 }, { "epoch": 2.27, "learning_rate": 1.924418118667762e-05, "loss": 0.008, "step": 157390 }, { "epoch": 2.27, "learning_rate": 1.924413314693915e-05, "loss": 0.0087, "step": 157400 }, { "epoch": 2.27, "learning_rate": 1.924408510720068e-05, "loss": 0.0098, "step": 157410 }, { "epoch": 2.27, "learning_rate": 1.9244037067462205e-05, "loss": 0.0084, "step": 157420 }, { "epoch": 2.27, "learning_rate": 1.9243989027723735e-05, "loss": 0.0213, "step": 157430 }, { "epoch": 2.27, "learning_rate": 1.9243940987985264e-05, "loss": 0.0112, "step": 157440 }, { "epoch": 2.27, "learning_rate": 1.9243892948246793e-05, "loss": 0.0075, "step": 157450 }, { "epoch": 2.27, "learning_rate": 1.924384490850832e-05, "loss": 0.0089, "step": 157460 }, { "epoch": 2.27, "learning_rate": 1.9243796868769848e-05, "loss": 0.0066, "step": 157470 }, { "epoch": 2.27, "learning_rate": 1.9243748829031378e-05, "loss": 0.0071, "step": 157480 }, { "epoch": 2.27, "learning_rate": 1.9243700789292903e-05, "loss": 0.0097, "step": 157490 }, { "epoch": 2.27, "learning_rate": 1.9243652749554433e-05, "loss": 0.008, "step": 157500 }, { "epoch": 2.27, "learning_rate": 1.9243604709815962e-05, "loss": 0.0062, "step": 157510 }, { "epoch": 2.27, "learning_rate": 1.924355667007749e-05, "loss": 0.0074, "step": 157520 }, { "epoch": 2.27, "learning_rate": 1.9243508630339017e-05, "loss": 0.0104, "step": 157530 }, { "epoch": 2.27, "learning_rate": 1.9243460590600546e-05, "loss": 0.0067, "step": 157540 }, { "epoch": 2.27, "learning_rate": 1.9243412550862076e-05, "loss": 0.0074, "step": 157550 }, { "epoch": 2.27, "learning_rate": 1.9243364511123605e-05, "loss": 0.008, "step": 157560 }, { "epoch": 2.27, "learning_rate": 1.924331647138513e-05, "loss": 0.0073, "step": 157570 }, { "epoch": 2.27, "learning_rate": 1.924326843164666e-05, "loss": 0.0096, "step": 157580 }, { "epoch": 2.27, "learning_rate": 1.924322039190819e-05, "loss": 0.0077, "step": 157590 }, { "epoch": 2.27, "learning_rate": 1.9243172352169715e-05, "loss": 0.0129, "step": 157600 }, { "epoch": 2.27, "learning_rate": 1.9243124312431245e-05, "loss": 0.0065, "step": 157610 }, { "epoch": 2.27, "learning_rate": 1.9243076272692774e-05, "loss": 0.0074, "step": 157620 }, { "epoch": 2.27, "learning_rate": 1.9243028232954303e-05, "loss": 0.0075, "step": 157630 }, { "epoch": 2.27, "learning_rate": 1.924298019321583e-05, "loss": 0.0094, "step": 157640 }, { "epoch": 2.27, "learning_rate": 1.9242932153477358e-05, "loss": 0.0095, "step": 157650 }, { "epoch": 2.27, "learning_rate": 1.9242884113738887e-05, "loss": 0.0077, "step": 157660 }, { "epoch": 2.27, "learning_rate": 1.9242836074000413e-05, "loss": 0.0072, "step": 157670 }, { "epoch": 2.27, "learning_rate": 1.9242788034261943e-05, "loss": 0.007, "step": 157680 }, { "epoch": 2.27, "learning_rate": 1.9242739994523472e-05, "loss": 0.0046, "step": 157690 }, { "epoch": 2.27, "learning_rate": 1.9242691954785e-05, "loss": 0.0051, "step": 157700 }, { "epoch": 2.27, "learning_rate": 1.9242643915046527e-05, "loss": 0.0083, "step": 157710 }, { "epoch": 2.27, "learning_rate": 1.9242595875308056e-05, "loss": 0.0078, "step": 157720 }, { "epoch": 2.27, "learning_rate": 1.9242547835569586e-05, "loss": 0.0087, "step": 157730 }, { "epoch": 2.27, "learning_rate": 1.9242499795831115e-05, "loss": 0.0073, "step": 157740 }, { "epoch": 2.27, "learning_rate": 1.924245175609264e-05, "loss": 0.0076, "step": 157750 }, { "epoch": 2.27, "learning_rate": 1.924240371635417e-05, "loss": 0.0052, "step": 157760 }, { "epoch": 2.27, "learning_rate": 1.92423556766157e-05, "loss": 0.0097, "step": 157770 }, { "epoch": 2.27, "learning_rate": 1.9242307636877225e-05, "loss": 0.0077, "step": 157780 }, { "epoch": 2.27, "learning_rate": 1.9242259597138754e-05, "loss": 0.0047, "step": 157790 }, { "epoch": 2.27, "learning_rate": 1.9242211557400284e-05, "loss": 0.0073, "step": 157800 }, { "epoch": 2.27, "learning_rate": 1.9242163517661813e-05, "loss": 0.0096, "step": 157810 }, { "epoch": 2.27, "learning_rate": 1.924211547792334e-05, "loss": 0.01, "step": 157820 }, { "epoch": 2.27, "learning_rate": 1.9242067438184868e-05, "loss": 0.007, "step": 157830 }, { "epoch": 2.27, "learning_rate": 1.9242019398446397e-05, "loss": 0.0077, "step": 157840 }, { "epoch": 2.27, "learning_rate": 1.9241971358707923e-05, "loss": 0.0089, "step": 157850 }, { "epoch": 2.28, "learning_rate": 1.9241923318969453e-05, "loss": 0.0061, "step": 157860 }, { "epoch": 2.28, "learning_rate": 1.9241875279230982e-05, "loss": 0.0093, "step": 157870 }, { "epoch": 2.28, "learning_rate": 1.924182723949251e-05, "loss": 0.0079, "step": 157880 }, { "epoch": 2.28, "learning_rate": 1.9241779199754037e-05, "loss": 0.008, "step": 157890 }, { "epoch": 2.28, "learning_rate": 1.9241731160015566e-05, "loss": 0.0108, "step": 157900 }, { "epoch": 2.28, "learning_rate": 1.9241683120277096e-05, "loss": 0.0083, "step": 157910 }, { "epoch": 2.28, "learning_rate": 1.9241635080538625e-05, "loss": 0.0078, "step": 157920 }, { "epoch": 2.28, "learning_rate": 1.924158704080015e-05, "loss": 0.0089, "step": 157930 }, { "epoch": 2.28, "learning_rate": 1.924153900106168e-05, "loss": 0.0064, "step": 157940 }, { "epoch": 2.28, "learning_rate": 1.924149096132321e-05, "loss": 0.0101, "step": 157950 }, { "epoch": 2.28, "learning_rate": 1.9241442921584735e-05, "loss": 0.0086, "step": 157960 }, { "epoch": 2.28, "learning_rate": 1.9241394881846264e-05, "loss": 0.0056, "step": 157970 }, { "epoch": 2.28, "learning_rate": 1.9241346842107794e-05, "loss": 0.0061, "step": 157980 }, { "epoch": 2.28, "learning_rate": 1.9241298802369323e-05, "loss": 0.011, "step": 157990 }, { "epoch": 2.28, "learning_rate": 1.924125076263085e-05, "loss": 0.008, "step": 158000 }, { "epoch": 2.28, "learning_rate": 1.9241202722892378e-05, "loss": 0.0097, "step": 158010 }, { "epoch": 2.28, "learning_rate": 1.9241154683153907e-05, "loss": 0.0086, "step": 158020 }, { "epoch": 2.28, "learning_rate": 1.9241106643415433e-05, "loss": 0.0096, "step": 158030 }, { "epoch": 2.28, "learning_rate": 1.9241058603676962e-05, "loss": 0.0075, "step": 158040 }, { "epoch": 2.28, "learning_rate": 1.9241010563938492e-05, "loss": 0.0157, "step": 158050 }, { "epoch": 2.28, "learning_rate": 1.924096252420002e-05, "loss": 0.0109, "step": 158060 }, { "epoch": 2.28, "learning_rate": 1.9240914484461547e-05, "loss": 0.0083, "step": 158070 }, { "epoch": 2.28, "learning_rate": 1.9240866444723076e-05, "loss": 0.0052, "step": 158080 }, { "epoch": 2.28, "learning_rate": 1.9240818404984605e-05, "loss": 0.0066, "step": 158090 }, { "epoch": 2.28, "learning_rate": 1.9240770365246135e-05, "loss": 0.0059, "step": 158100 }, { "epoch": 2.28, "learning_rate": 1.924072232550766e-05, "loss": 0.0111, "step": 158110 }, { "epoch": 2.28, "learning_rate": 1.924067428576919e-05, "loss": 0.0079, "step": 158120 }, { "epoch": 2.28, "learning_rate": 1.924062624603072e-05, "loss": 0.0077, "step": 158130 }, { "epoch": 2.28, "learning_rate": 1.9240578206292245e-05, "loss": 0.0069, "step": 158140 }, { "epoch": 2.28, "learning_rate": 1.9240530166553774e-05, "loss": 0.0079, "step": 158150 }, { "epoch": 2.28, "learning_rate": 1.9240482126815304e-05, "loss": 0.0098, "step": 158160 }, { "epoch": 2.28, "learning_rate": 1.9240434087076833e-05, "loss": 0.0063, "step": 158170 }, { "epoch": 2.28, "learning_rate": 1.924038604733836e-05, "loss": 0.0056, "step": 158180 }, { "epoch": 2.28, "learning_rate": 1.9240338007599888e-05, "loss": 0.0062, "step": 158190 }, { "epoch": 2.28, "learning_rate": 1.9240289967861417e-05, "loss": 0.0082, "step": 158200 }, { "epoch": 2.28, "learning_rate": 1.9240241928122943e-05, "loss": 0.0088, "step": 158210 }, { "epoch": 2.28, "learning_rate": 1.9240193888384472e-05, "loss": 0.012, "step": 158220 }, { "epoch": 2.28, "learning_rate": 1.9240145848646e-05, "loss": 0.0065, "step": 158230 }, { "epoch": 2.28, "learning_rate": 1.924009780890753e-05, "loss": 0.0101, "step": 158240 }, { "epoch": 2.28, "learning_rate": 1.9240049769169057e-05, "loss": 0.0074, "step": 158250 }, { "epoch": 2.28, "learning_rate": 1.9240001729430586e-05, "loss": 0.0113, "step": 158260 }, { "epoch": 2.28, "learning_rate": 1.9239953689692115e-05, "loss": 0.0085, "step": 158270 }, { "epoch": 2.28, "learning_rate": 1.9239905649953645e-05, "loss": 0.0057, "step": 158280 }, { "epoch": 2.28, "learning_rate": 1.923985761021517e-05, "loss": 0.0073, "step": 158290 }, { "epoch": 2.28, "learning_rate": 1.92398095704767e-05, "loss": 0.013, "step": 158300 }, { "epoch": 2.28, "learning_rate": 1.923976153073823e-05, "loss": 0.0083, "step": 158310 }, { "epoch": 2.28, "learning_rate": 1.9239713490999755e-05, "loss": 0.0068, "step": 158320 }, { "epoch": 2.28, "learning_rate": 1.9239665451261284e-05, "loss": 0.0089, "step": 158330 }, { "epoch": 2.28, "learning_rate": 1.9239617411522813e-05, "loss": 0.0051, "step": 158340 }, { "epoch": 2.28, "learning_rate": 1.9239569371784343e-05, "loss": 0.0069, "step": 158350 }, { "epoch": 2.28, "learning_rate": 1.923952133204587e-05, "loss": 0.0093, "step": 158360 }, { "epoch": 2.28, "learning_rate": 1.9239473292307398e-05, "loss": 0.0064, "step": 158370 }, { "epoch": 2.28, "learning_rate": 1.9239425252568927e-05, "loss": 0.0063, "step": 158380 }, { "epoch": 2.28, "learning_rate": 1.9239377212830453e-05, "loss": 0.0086, "step": 158390 }, { "epoch": 2.28, "learning_rate": 1.9239329173091982e-05, "loss": 0.008, "step": 158400 }, { "epoch": 2.28, "learning_rate": 1.923928113335351e-05, "loss": 0.0086, "step": 158410 }, { "epoch": 2.28, "learning_rate": 1.923923309361504e-05, "loss": 0.0045, "step": 158420 }, { "epoch": 2.28, "learning_rate": 1.9239185053876567e-05, "loss": 0.0067, "step": 158430 }, { "epoch": 2.28, "learning_rate": 1.9239137014138096e-05, "loss": 0.0087, "step": 158440 }, { "epoch": 2.28, "learning_rate": 1.9239088974399625e-05, "loss": 0.0061, "step": 158450 }, { "epoch": 2.28, "learning_rate": 1.9239040934661155e-05, "loss": 0.007, "step": 158460 }, { "epoch": 2.28, "learning_rate": 1.923899289492268e-05, "loss": 0.0082, "step": 158470 }, { "epoch": 2.28, "learning_rate": 1.923894485518421e-05, "loss": 0.0097, "step": 158480 }, { "epoch": 2.28, "learning_rate": 1.923889681544574e-05, "loss": 0.0095, "step": 158490 }, { "epoch": 2.28, "learning_rate": 1.9238848775707265e-05, "loss": 0.0062, "step": 158500 }, { "epoch": 2.28, "learning_rate": 1.9238800735968794e-05, "loss": 0.0101, "step": 158510 }, { "epoch": 2.28, "learning_rate": 1.9238752696230323e-05, "loss": 0.0065, "step": 158520 }, { "epoch": 2.28, "learning_rate": 1.9238704656491853e-05, "loss": 0.0096, "step": 158530 }, { "epoch": 2.28, "learning_rate": 1.923865661675338e-05, "loss": 0.0065, "step": 158540 }, { "epoch": 2.29, "learning_rate": 1.9238608577014908e-05, "loss": 0.0093, "step": 158550 }, { "epoch": 2.29, "learning_rate": 1.9238560537276437e-05, "loss": 0.0062, "step": 158560 }, { "epoch": 2.29, "learning_rate": 1.9238512497537963e-05, "loss": 0.0093, "step": 158570 }, { "epoch": 2.29, "learning_rate": 1.9238464457799492e-05, "loss": 0.0078, "step": 158580 }, { "epoch": 2.29, "learning_rate": 1.923841641806102e-05, "loss": 0.0054, "step": 158590 }, { "epoch": 2.29, "learning_rate": 1.923836837832255e-05, "loss": 0.0093, "step": 158600 }, { "epoch": 2.29, "learning_rate": 1.9238320338584077e-05, "loss": 0.0084, "step": 158610 }, { "epoch": 2.29, "learning_rate": 1.9238272298845606e-05, "loss": 0.0097, "step": 158620 }, { "epoch": 2.29, "learning_rate": 1.9238224259107135e-05, "loss": 0.0045, "step": 158630 }, { "epoch": 2.29, "learning_rate": 1.9238176219368664e-05, "loss": 0.0081, "step": 158640 }, { "epoch": 2.29, "learning_rate": 1.923812817963019e-05, "loss": 0.0072, "step": 158650 }, { "epoch": 2.29, "learning_rate": 1.923808013989172e-05, "loss": 0.0073, "step": 158660 }, { "epoch": 2.29, "learning_rate": 1.923803210015325e-05, "loss": 0.007, "step": 158670 }, { "epoch": 2.29, "learning_rate": 1.9237984060414775e-05, "loss": 0.0074, "step": 158680 }, { "epoch": 2.29, "learning_rate": 1.9237936020676304e-05, "loss": 0.0097, "step": 158690 }, { "epoch": 2.29, "learning_rate": 1.9237887980937833e-05, "loss": 0.0078, "step": 158700 }, { "epoch": 2.29, "learning_rate": 1.9237839941199363e-05, "loss": 0.0091, "step": 158710 }, { "epoch": 2.29, "learning_rate": 1.923779190146089e-05, "loss": 0.0093, "step": 158720 }, { "epoch": 2.29, "learning_rate": 1.9237743861722418e-05, "loss": 0.0103, "step": 158730 }, { "epoch": 2.29, "learning_rate": 1.9237695821983947e-05, "loss": 0.0068, "step": 158740 }, { "epoch": 2.29, "learning_rate": 1.9237647782245473e-05, "loss": 0.0067, "step": 158750 }, { "epoch": 2.29, "learning_rate": 1.9237599742507002e-05, "loss": 0.0084, "step": 158760 }, { "epoch": 2.29, "learning_rate": 1.923755170276853e-05, "loss": 0.0075, "step": 158770 }, { "epoch": 2.29, "learning_rate": 1.923750366303006e-05, "loss": 0.0091, "step": 158780 }, { "epoch": 2.29, "learning_rate": 1.9237455623291587e-05, "loss": 0.0108, "step": 158790 }, { "epoch": 2.29, "learning_rate": 1.9237407583553116e-05, "loss": 0.0068, "step": 158800 }, { "epoch": 2.29, "learning_rate": 1.9237359543814645e-05, "loss": 0.008, "step": 158810 }, { "epoch": 2.29, "learning_rate": 1.923731150407617e-05, "loss": 0.0092, "step": 158820 }, { "epoch": 2.29, "learning_rate": 1.92372634643377e-05, "loss": 0.0076, "step": 158830 }, { "epoch": 2.29, "learning_rate": 1.923721542459923e-05, "loss": 0.0059, "step": 158840 }, { "epoch": 2.29, "learning_rate": 1.923716738486076e-05, "loss": 0.0099, "step": 158850 }, { "epoch": 2.29, "learning_rate": 1.9237119345122285e-05, "loss": 0.0117, "step": 158860 }, { "epoch": 2.29, "learning_rate": 1.9237071305383814e-05, "loss": 0.0081, "step": 158870 }, { "epoch": 2.29, "learning_rate": 1.9237023265645343e-05, "loss": 0.0087, "step": 158880 }, { "epoch": 2.29, "learning_rate": 1.9236975225906872e-05, "loss": 0.0076, "step": 158890 }, { "epoch": 2.29, "learning_rate": 1.92369271861684e-05, "loss": 0.0058, "step": 158900 }, { "epoch": 2.29, "learning_rate": 1.9236879146429928e-05, "loss": 0.0069, "step": 158910 }, { "epoch": 2.29, "learning_rate": 1.9236831106691457e-05, "loss": 0.0072, "step": 158920 }, { "epoch": 2.29, "learning_rate": 1.9236783066952983e-05, "loss": 0.0068, "step": 158930 }, { "epoch": 2.29, "learning_rate": 1.9236735027214512e-05, "loss": 0.0061, "step": 158940 }, { "epoch": 2.29, "learning_rate": 1.923668698747604e-05, "loss": 0.0067, "step": 158950 }, { "epoch": 2.29, "learning_rate": 1.923663894773757e-05, "loss": 0.0135, "step": 158960 }, { "epoch": 2.29, "learning_rate": 1.9236590907999096e-05, "loss": 0.0083, "step": 158970 }, { "epoch": 2.29, "learning_rate": 1.9236542868260626e-05, "loss": 0.0124, "step": 158980 }, { "epoch": 2.29, "learning_rate": 1.9236494828522155e-05, "loss": 0.0084, "step": 158990 }, { "epoch": 2.29, "learning_rate": 1.923644678878368e-05, "loss": 0.0068, "step": 159000 }, { "epoch": 2.29, "learning_rate": 1.923639874904521e-05, "loss": 0.0062, "step": 159010 }, { "epoch": 2.29, "learning_rate": 1.923635070930674e-05, "loss": 0.0092, "step": 159020 }, { "epoch": 2.29, "learning_rate": 1.923630266956827e-05, "loss": 0.0097, "step": 159030 }, { "epoch": 2.29, "learning_rate": 1.9236254629829795e-05, "loss": 0.0109, "step": 159040 }, { "epoch": 2.29, "learning_rate": 1.9236206590091324e-05, "loss": 0.0111, "step": 159050 }, { "epoch": 2.29, "learning_rate": 1.9236158550352853e-05, "loss": 0.0081, "step": 159060 }, { "epoch": 2.29, "learning_rate": 1.9236110510614382e-05, "loss": 0.0048, "step": 159070 }, { "epoch": 2.29, "learning_rate": 1.9236062470875908e-05, "loss": 0.0067, "step": 159080 }, { "epoch": 2.29, "learning_rate": 1.9236014431137438e-05, "loss": 0.0073, "step": 159090 }, { "epoch": 2.29, "learning_rate": 1.9235966391398967e-05, "loss": 0.0216, "step": 159100 }, { "epoch": 2.29, "learning_rate": 1.9235918351660493e-05, "loss": 0.0059, "step": 159110 }, { "epoch": 2.29, "learning_rate": 1.9235870311922022e-05, "loss": 0.007, "step": 159120 }, { "epoch": 2.29, "learning_rate": 1.923582227218355e-05, "loss": 0.0067, "step": 159130 }, { "epoch": 2.29, "learning_rate": 1.923577423244508e-05, "loss": 0.0101, "step": 159140 }, { "epoch": 2.29, "learning_rate": 1.9235726192706606e-05, "loss": 0.006, "step": 159150 }, { "epoch": 2.29, "learning_rate": 1.9235678152968136e-05, "loss": 0.0085, "step": 159160 }, { "epoch": 2.29, "learning_rate": 1.9235630113229665e-05, "loss": 0.0095, "step": 159170 }, { "epoch": 2.29, "learning_rate": 1.923558207349119e-05, "loss": 0.0092, "step": 159180 }, { "epoch": 2.29, "learning_rate": 1.923553403375272e-05, "loss": 0.0083, "step": 159190 }, { "epoch": 2.29, "learning_rate": 1.923548599401425e-05, "loss": 0.0064, "step": 159200 }, { "epoch": 2.29, "learning_rate": 1.923543795427578e-05, "loss": 0.0051, "step": 159210 }, { "epoch": 2.29, "learning_rate": 1.9235389914537304e-05, "loss": 0.0097, "step": 159220 }, { "epoch": 2.29, "learning_rate": 1.9235341874798834e-05, "loss": 0.0075, "step": 159230 }, { "epoch": 2.29, "learning_rate": 1.9235293835060363e-05, "loss": 0.0076, "step": 159240 }, { "epoch": 2.3, "learning_rate": 1.9235245795321892e-05, "loss": 0.0047, "step": 159250 }, { "epoch": 2.3, "learning_rate": 1.923519775558342e-05, "loss": 0.0077, "step": 159260 }, { "epoch": 2.3, "learning_rate": 1.923514971584495e-05, "loss": 0.0076, "step": 159270 }, { "epoch": 2.3, "learning_rate": 1.9235101676106477e-05, "loss": 0.0121, "step": 159280 }, { "epoch": 2.3, "learning_rate": 1.9235053636368006e-05, "loss": 0.0084, "step": 159290 }, { "epoch": 2.3, "learning_rate": 1.9235005596629535e-05, "loss": 0.0049, "step": 159300 }, { "epoch": 2.3, "learning_rate": 1.9234957556891065e-05, "loss": 0.0072, "step": 159310 }, { "epoch": 2.3, "learning_rate": 1.923490951715259e-05, "loss": 0.0077, "step": 159320 }, { "epoch": 2.3, "learning_rate": 1.923486147741412e-05, "loss": 0.0067, "step": 159330 }, { "epoch": 2.3, "learning_rate": 1.923481343767565e-05, "loss": 0.0089, "step": 159340 }, { "epoch": 2.3, "learning_rate": 1.9234765397937175e-05, "loss": 0.0089, "step": 159350 }, { "epoch": 2.3, "learning_rate": 1.9234717358198704e-05, "loss": 0.0063, "step": 159360 }, { "epoch": 2.3, "learning_rate": 1.9234669318460233e-05, "loss": 0.0095, "step": 159370 }, { "epoch": 2.3, "learning_rate": 1.9234621278721763e-05, "loss": 0.0073, "step": 159380 }, { "epoch": 2.3, "learning_rate": 1.923457323898329e-05, "loss": 0.0061, "step": 159390 }, { "epoch": 2.3, "learning_rate": 1.9234525199244818e-05, "loss": 0.01, "step": 159400 }, { "epoch": 2.3, "learning_rate": 1.9234477159506347e-05, "loss": 0.0076, "step": 159410 }, { "epoch": 2.3, "learning_rate": 1.9234429119767873e-05, "loss": 0.0073, "step": 159420 }, { "epoch": 2.3, "learning_rate": 1.9234381080029402e-05, "loss": 0.007, "step": 159430 }, { "epoch": 2.3, "learning_rate": 1.923433304029093e-05, "loss": 0.008, "step": 159440 }, { "epoch": 2.3, "learning_rate": 1.923428500055246e-05, "loss": 0.0055, "step": 159450 }, { "epoch": 2.3, "learning_rate": 1.9234236960813987e-05, "loss": 0.0056, "step": 159460 }, { "epoch": 2.3, "learning_rate": 1.9234188921075516e-05, "loss": 0.0059, "step": 159470 }, { "epoch": 2.3, "learning_rate": 1.9234140881337045e-05, "loss": 0.0081, "step": 159480 }, { "epoch": 2.3, "learning_rate": 1.9234092841598574e-05, "loss": 0.0063, "step": 159490 }, { "epoch": 2.3, "learning_rate": 1.92340448018601e-05, "loss": 0.0053, "step": 159500 }, { "epoch": 2.3, "learning_rate": 1.923399676212163e-05, "loss": 0.0122, "step": 159510 }, { "epoch": 2.3, "learning_rate": 1.923394872238316e-05, "loss": 0.0095, "step": 159520 }, { "epoch": 2.3, "learning_rate": 1.9233900682644685e-05, "loss": 0.0117, "step": 159530 }, { "epoch": 2.3, "learning_rate": 1.9233852642906214e-05, "loss": 0.0088, "step": 159540 }, { "epoch": 2.3, "learning_rate": 1.9233804603167743e-05, "loss": 0.0078, "step": 159550 }, { "epoch": 2.3, "learning_rate": 1.9233756563429273e-05, "loss": 0.0091, "step": 159560 }, { "epoch": 2.3, "learning_rate": 1.92337085236908e-05, "loss": 0.0079, "step": 159570 }, { "epoch": 2.3, "learning_rate": 1.9233660483952328e-05, "loss": 0.0051, "step": 159580 }, { "epoch": 2.3, "learning_rate": 1.9233612444213857e-05, "loss": 0.007, "step": 159590 }, { "epoch": 2.3, "learning_rate": 1.9233564404475383e-05, "loss": 0.0065, "step": 159600 }, { "epoch": 2.3, "learning_rate": 1.9233516364736912e-05, "loss": 0.0086, "step": 159610 }, { "epoch": 2.3, "learning_rate": 1.923346832499844e-05, "loss": 0.0102, "step": 159620 }, { "epoch": 2.3, "learning_rate": 1.923342028525997e-05, "loss": 0.0075, "step": 159630 }, { "epoch": 2.3, "learning_rate": 1.9233372245521497e-05, "loss": 0.0058, "step": 159640 }, { "epoch": 2.3, "learning_rate": 1.9233324205783026e-05, "loss": 0.0061, "step": 159650 }, { "epoch": 2.3, "learning_rate": 1.9233276166044555e-05, "loss": 0.0108, "step": 159660 }, { "epoch": 2.3, "learning_rate": 1.9233228126306084e-05, "loss": 0.0081, "step": 159670 }, { "epoch": 2.3, "learning_rate": 1.923318008656761e-05, "loss": 0.0073, "step": 159680 }, { "epoch": 2.3, "learning_rate": 1.923313204682914e-05, "loss": 0.0084, "step": 159690 }, { "epoch": 2.3, "learning_rate": 1.923308400709067e-05, "loss": 0.0079, "step": 159700 }, { "epoch": 2.3, "learning_rate": 1.9233035967352195e-05, "loss": 0.0063, "step": 159710 }, { "epoch": 2.3, "learning_rate": 1.9232987927613724e-05, "loss": 0.0084, "step": 159720 }, { "epoch": 2.3, "learning_rate": 1.9232939887875253e-05, "loss": 0.0092, "step": 159730 }, { "epoch": 2.3, "learning_rate": 1.9232891848136782e-05, "loss": 0.0092, "step": 159740 }, { "epoch": 2.3, "learning_rate": 1.923284380839831e-05, "loss": 0.0108, "step": 159750 }, { "epoch": 2.3, "learning_rate": 1.9232795768659838e-05, "loss": 0.01, "step": 159760 }, { "epoch": 2.3, "learning_rate": 1.9232747728921367e-05, "loss": 0.0093, "step": 159770 }, { "epoch": 2.3, "learning_rate": 1.9232699689182893e-05, "loss": 0.006, "step": 159780 }, { "epoch": 2.3, "learning_rate": 1.9232651649444422e-05, "loss": 0.005, "step": 159790 }, { "epoch": 2.3, "learning_rate": 1.923260360970595e-05, "loss": 0.0075, "step": 159800 }, { "epoch": 2.3, "learning_rate": 1.923255556996748e-05, "loss": 0.0084, "step": 159810 }, { "epoch": 2.3, "learning_rate": 1.9232507530229006e-05, "loss": 0.0101, "step": 159820 }, { "epoch": 2.3, "learning_rate": 1.9232459490490536e-05, "loss": 0.0081, "step": 159830 }, { "epoch": 2.3, "learning_rate": 1.9232411450752065e-05, "loss": 0.0067, "step": 159840 }, { "epoch": 2.3, "learning_rate": 1.9232363411013594e-05, "loss": 0.0083, "step": 159850 }, { "epoch": 2.3, "learning_rate": 1.923231537127512e-05, "loss": 0.0067, "step": 159860 }, { "epoch": 2.3, "learning_rate": 1.923226733153665e-05, "loss": 0.0075, "step": 159870 }, { "epoch": 2.3, "learning_rate": 1.923221929179818e-05, "loss": 0.0058, "step": 159880 }, { "epoch": 2.3, "learning_rate": 1.9232171252059705e-05, "loss": 0.0082, "step": 159890 }, { "epoch": 2.3, "learning_rate": 1.9232123212321234e-05, "loss": 0.008, "step": 159900 }, { "epoch": 2.3, "learning_rate": 1.9232075172582763e-05, "loss": 0.0083, "step": 159910 }, { "epoch": 2.3, "learning_rate": 1.9232027132844292e-05, "loss": 0.0081, "step": 159920 }, { "epoch": 2.3, "learning_rate": 1.9231979093105818e-05, "loss": 0.0084, "step": 159930 }, { "epoch": 2.31, "learning_rate": 1.9231931053367348e-05, "loss": 0.0081, "step": 159940 }, { "epoch": 2.31, "learning_rate": 1.9231883013628877e-05, "loss": 0.0082, "step": 159950 }, { "epoch": 2.31, "learning_rate": 1.9231834973890403e-05, "loss": 0.0058, "step": 159960 }, { "epoch": 2.31, "learning_rate": 1.9231786934151932e-05, "loss": 0.0079, "step": 159970 }, { "epoch": 2.31, "learning_rate": 1.923173889441346e-05, "loss": 0.0093, "step": 159980 }, { "epoch": 2.31, "learning_rate": 1.923169085467499e-05, "loss": 0.0075, "step": 159990 }, { "epoch": 2.31, "learning_rate": 1.9231642814936516e-05, "loss": 0.007, "step": 160000 }, { "epoch": 2.31, "learning_rate": 1.9231594775198046e-05, "loss": 0.0085, "step": 160010 }, { "epoch": 2.31, "learning_rate": 1.9231546735459575e-05, "loss": 0.0071, "step": 160020 }, { "epoch": 2.31, "learning_rate": 1.9231498695721104e-05, "loss": 0.007, "step": 160030 }, { "epoch": 2.31, "learning_rate": 1.923145065598263e-05, "loss": 0.0089, "step": 160040 }, { "epoch": 2.31, "learning_rate": 1.923140261624416e-05, "loss": 0.0096, "step": 160050 }, { "epoch": 2.31, "learning_rate": 1.923135457650569e-05, "loss": 0.0067, "step": 160060 }, { "epoch": 2.31, "learning_rate": 1.9231306536767214e-05, "loss": 0.0082, "step": 160070 }, { "epoch": 2.31, "learning_rate": 1.9231258497028744e-05, "loss": 0.0096, "step": 160080 }, { "epoch": 2.31, "learning_rate": 1.9231210457290273e-05, "loss": 0.0059, "step": 160090 }, { "epoch": 2.31, "learning_rate": 1.9231162417551802e-05, "loss": 0.0069, "step": 160100 }, { "epoch": 2.31, "learning_rate": 1.9231114377813328e-05, "loss": 0.0092, "step": 160110 }, { "epoch": 2.31, "learning_rate": 1.9231066338074857e-05, "loss": 0.0079, "step": 160120 }, { "epoch": 2.31, "learning_rate": 1.9231018298336387e-05, "loss": 0.0077, "step": 160130 }, { "epoch": 2.31, "learning_rate": 1.9230970258597913e-05, "loss": 0.008, "step": 160140 }, { "epoch": 2.31, "learning_rate": 1.9230922218859442e-05, "loss": 0.0124, "step": 160150 }, { "epoch": 2.31, "learning_rate": 1.923087417912097e-05, "loss": 0.0099, "step": 160160 }, { "epoch": 2.31, "learning_rate": 1.92308261393825e-05, "loss": 0.0079, "step": 160170 }, { "epoch": 2.31, "learning_rate": 1.9230778099644026e-05, "loss": 0.0061, "step": 160180 }, { "epoch": 2.31, "learning_rate": 1.9230730059905556e-05, "loss": 0.0084, "step": 160190 }, { "epoch": 2.31, "learning_rate": 1.9230682020167085e-05, "loss": 0.01, "step": 160200 }, { "epoch": 2.31, "learning_rate": 1.9230633980428614e-05, "loss": 0.0074, "step": 160210 }, { "epoch": 2.31, "learning_rate": 1.923058594069014e-05, "loss": 0.0061, "step": 160220 }, { "epoch": 2.31, "learning_rate": 1.923053790095167e-05, "loss": 0.0068, "step": 160230 }, { "epoch": 2.31, "learning_rate": 1.92304898612132e-05, "loss": 0.0078, "step": 160240 }, { "epoch": 2.31, "learning_rate": 1.9230441821474724e-05, "loss": 0.0057, "step": 160250 }, { "epoch": 2.31, "learning_rate": 1.9230393781736254e-05, "loss": 0.0058, "step": 160260 }, { "epoch": 2.31, "learning_rate": 1.9230345741997783e-05, "loss": 0.006, "step": 160270 }, { "epoch": 2.31, "learning_rate": 1.9230297702259312e-05, "loss": 0.011, "step": 160280 }, { "epoch": 2.31, "learning_rate": 1.9230249662520838e-05, "loss": 0.0062, "step": 160290 }, { "epoch": 2.31, "learning_rate": 1.9230201622782367e-05, "loss": 0.0073, "step": 160300 }, { "epoch": 2.31, "learning_rate": 1.9230153583043897e-05, "loss": 0.0087, "step": 160310 }, { "epoch": 2.31, "learning_rate": 1.9230105543305423e-05, "loss": 0.0095, "step": 160320 }, { "epoch": 2.31, "learning_rate": 1.9230057503566952e-05, "loss": 0.0069, "step": 160330 }, { "epoch": 2.31, "learning_rate": 1.923000946382848e-05, "loss": 0.0072, "step": 160340 }, { "epoch": 2.31, "learning_rate": 1.922996142409001e-05, "loss": 0.0101, "step": 160350 }, { "epoch": 2.31, "learning_rate": 1.9229913384351536e-05, "loss": 0.0081, "step": 160360 }, { "epoch": 2.31, "learning_rate": 1.9229865344613065e-05, "loss": 0.0091, "step": 160370 }, { "epoch": 2.31, "learning_rate": 1.9229817304874595e-05, "loss": 0.0107, "step": 160380 }, { "epoch": 2.31, "learning_rate": 1.922976926513612e-05, "loss": 0.0096, "step": 160390 }, { "epoch": 2.31, "learning_rate": 1.922972122539765e-05, "loss": 0.0117, "step": 160400 }, { "epoch": 2.31, "learning_rate": 1.922967318565918e-05, "loss": 0.0096, "step": 160410 }, { "epoch": 2.31, "learning_rate": 1.922962514592071e-05, "loss": 0.0065, "step": 160420 }, { "epoch": 2.31, "learning_rate": 1.9229577106182234e-05, "loss": 0.0085, "step": 160430 }, { "epoch": 2.31, "learning_rate": 1.9229529066443764e-05, "loss": 0.0083, "step": 160440 }, { "epoch": 2.31, "learning_rate": 1.9229481026705293e-05, "loss": 0.0088, "step": 160450 }, { "epoch": 2.31, "learning_rate": 1.9229432986966822e-05, "loss": 0.0092, "step": 160460 }, { "epoch": 2.31, "learning_rate": 1.9229384947228348e-05, "loss": 0.0075, "step": 160470 }, { "epoch": 2.31, "learning_rate": 1.9229336907489877e-05, "loss": 0.01, "step": 160480 }, { "epoch": 2.31, "learning_rate": 1.9229288867751407e-05, "loss": 0.0077, "step": 160490 }, { "epoch": 2.31, "learning_rate": 1.9229240828012932e-05, "loss": 0.0063, "step": 160500 }, { "epoch": 2.31, "learning_rate": 1.9229192788274462e-05, "loss": 0.0084, "step": 160510 }, { "epoch": 2.31, "learning_rate": 1.922914474853599e-05, "loss": 0.0048, "step": 160520 }, { "epoch": 2.31, "learning_rate": 1.922909670879752e-05, "loss": 0.0063, "step": 160530 }, { "epoch": 2.31, "learning_rate": 1.9229048669059046e-05, "loss": 0.0064, "step": 160540 }, { "epoch": 2.31, "learning_rate": 1.9229000629320575e-05, "loss": 0.0071, "step": 160550 }, { "epoch": 2.31, "learning_rate": 1.9228952589582105e-05, "loss": 0.007, "step": 160560 }, { "epoch": 2.31, "learning_rate": 1.922890454984363e-05, "loss": 0.0084, "step": 160570 }, { "epoch": 2.31, "learning_rate": 1.922885651010516e-05, "loss": 0.0058, "step": 160580 }, { "epoch": 2.31, "learning_rate": 1.922880847036669e-05, "loss": 0.0082, "step": 160590 }, { "epoch": 2.31, "learning_rate": 1.922876043062822e-05, "loss": 0.0095, "step": 160600 }, { "epoch": 2.31, "learning_rate": 1.9228712390889744e-05, "loss": 0.0072, "step": 160610 }, { "epoch": 2.31, "learning_rate": 1.9228664351151273e-05, "loss": 0.0092, "step": 160620 }, { "epoch": 2.31, "learning_rate": 1.9228616311412803e-05, "loss": 0.0068, "step": 160630 }, { "epoch": 2.32, "learning_rate": 1.9228568271674332e-05, "loss": 0.0098, "step": 160640 }, { "epoch": 2.32, "learning_rate": 1.9228520231935858e-05, "loss": 0.0084, "step": 160650 }, { "epoch": 2.32, "learning_rate": 1.9228472192197387e-05, "loss": 0.0063, "step": 160660 }, { "epoch": 2.32, "learning_rate": 1.9228424152458916e-05, "loss": 0.0088, "step": 160670 }, { "epoch": 2.32, "learning_rate": 1.9228376112720442e-05, "loss": 0.0099, "step": 160680 }, { "epoch": 2.32, "learning_rate": 1.922832807298197e-05, "loss": 0.0056, "step": 160690 }, { "epoch": 2.32, "learning_rate": 1.92282800332435e-05, "loss": 0.0057, "step": 160700 }, { "epoch": 2.32, "learning_rate": 1.922823199350503e-05, "loss": 0.0099, "step": 160710 }, { "epoch": 2.32, "learning_rate": 1.9228183953766556e-05, "loss": 0.0049, "step": 160720 }, { "epoch": 2.32, "learning_rate": 1.9228135914028085e-05, "loss": 0.0068, "step": 160730 }, { "epoch": 2.32, "learning_rate": 1.9228087874289615e-05, "loss": 0.0091, "step": 160740 }, { "epoch": 2.32, "learning_rate": 1.922803983455114e-05, "loss": 0.0063, "step": 160750 }, { "epoch": 2.32, "learning_rate": 1.922799179481267e-05, "loss": 0.0062, "step": 160760 }, { "epoch": 2.32, "learning_rate": 1.92279437550742e-05, "loss": 0.0112, "step": 160770 }, { "epoch": 2.32, "learning_rate": 1.9227895715335728e-05, "loss": 0.0106, "step": 160780 }, { "epoch": 2.32, "learning_rate": 1.9227847675597254e-05, "loss": 0.0087, "step": 160790 }, { "epoch": 2.32, "learning_rate": 1.9227799635858783e-05, "loss": 0.0057, "step": 160800 }, { "epoch": 2.32, "learning_rate": 1.9227751596120313e-05, "loss": 0.0056, "step": 160810 }, { "epoch": 2.32, "learning_rate": 1.9227703556381842e-05, "loss": 0.0059, "step": 160820 }, { "epoch": 2.32, "learning_rate": 1.9227655516643368e-05, "loss": 0.0049, "step": 160830 }, { "epoch": 2.32, "learning_rate": 1.9227607476904897e-05, "loss": 0.0051, "step": 160840 }, { "epoch": 2.32, "learning_rate": 1.9227559437166426e-05, "loss": 0.0049, "step": 160850 }, { "epoch": 2.32, "learning_rate": 1.9227511397427952e-05, "loss": 0.0093, "step": 160860 }, { "epoch": 2.32, "learning_rate": 1.922746335768948e-05, "loss": 0.0083, "step": 160870 }, { "epoch": 2.32, "learning_rate": 1.922741531795101e-05, "loss": 0.0079, "step": 160880 }, { "epoch": 2.32, "learning_rate": 1.922736727821254e-05, "loss": 0.0076, "step": 160890 }, { "epoch": 2.32, "learning_rate": 1.9227319238474066e-05, "loss": 0.0083, "step": 160900 }, { "epoch": 2.32, "learning_rate": 1.9227271198735595e-05, "loss": 0.0068, "step": 160910 }, { "epoch": 2.32, "learning_rate": 1.9227223158997124e-05, "loss": 0.0081, "step": 160920 }, { "epoch": 2.32, "learning_rate": 1.922717511925865e-05, "loss": 0.0076, "step": 160930 }, { "epoch": 2.32, "learning_rate": 1.922712707952018e-05, "loss": 0.0062, "step": 160940 }, { "epoch": 2.32, "learning_rate": 1.922707903978171e-05, "loss": 0.0077, "step": 160950 }, { "epoch": 2.32, "learning_rate": 1.9227031000043238e-05, "loss": 0.0055, "step": 160960 }, { "epoch": 2.32, "learning_rate": 1.9226982960304764e-05, "loss": 0.0063, "step": 160970 }, { "epoch": 2.32, "learning_rate": 1.9226934920566293e-05, "loss": 0.0075, "step": 160980 }, { "epoch": 2.32, "learning_rate": 1.9226886880827823e-05, "loss": 0.0072, "step": 160990 }, { "epoch": 2.32, "learning_rate": 1.9226838841089352e-05, "loss": 0.0063, "step": 161000 }, { "epoch": 2.32, "learning_rate": 1.9226790801350878e-05, "loss": 0.0082, "step": 161010 }, { "epoch": 2.32, "learning_rate": 1.9226742761612407e-05, "loss": 0.0073, "step": 161020 }, { "epoch": 2.32, "learning_rate": 1.9226694721873936e-05, "loss": 0.0069, "step": 161030 }, { "epoch": 2.32, "learning_rate": 1.9226646682135462e-05, "loss": 0.0079, "step": 161040 }, { "epoch": 2.32, "learning_rate": 1.922659864239699e-05, "loss": 0.0097, "step": 161050 }, { "epoch": 2.32, "learning_rate": 1.922655060265852e-05, "loss": 0.0054, "step": 161060 }, { "epoch": 2.32, "learning_rate": 1.922650256292005e-05, "loss": 0.0055, "step": 161070 }, { "epoch": 2.32, "learning_rate": 1.9226454523181576e-05, "loss": 0.0071, "step": 161080 }, { "epoch": 2.32, "learning_rate": 1.9226406483443105e-05, "loss": 0.0101, "step": 161090 }, { "epoch": 2.32, "learning_rate": 1.9226358443704634e-05, "loss": 0.0061, "step": 161100 }, { "epoch": 2.32, "learning_rate": 1.922631040396616e-05, "loss": 0.0079, "step": 161110 }, { "epoch": 2.32, "learning_rate": 1.922626236422769e-05, "loss": 0.0085, "step": 161120 }, { "epoch": 2.32, "learning_rate": 1.922621432448922e-05, "loss": 0.0073, "step": 161130 }, { "epoch": 2.32, "learning_rate": 1.9226166284750748e-05, "loss": 0.0099, "step": 161140 }, { "epoch": 2.32, "learning_rate": 1.9226118245012274e-05, "loss": 0.0071, "step": 161150 }, { "epoch": 2.32, "learning_rate": 1.9226070205273803e-05, "loss": 0.0099, "step": 161160 }, { "epoch": 2.32, "learning_rate": 1.9226022165535333e-05, "loss": 0.0082, "step": 161170 }, { "epoch": 2.32, "learning_rate": 1.9225974125796862e-05, "loss": 0.0059, "step": 161180 }, { "epoch": 2.32, "learning_rate": 1.9225926086058388e-05, "loss": 0.0063, "step": 161190 }, { "epoch": 2.32, "learning_rate": 1.9225878046319917e-05, "loss": 0.0075, "step": 161200 }, { "epoch": 2.32, "learning_rate": 1.9225830006581446e-05, "loss": 0.0072, "step": 161210 }, { "epoch": 2.32, "learning_rate": 1.9225781966842972e-05, "loss": 0.0076, "step": 161220 }, { "epoch": 2.32, "learning_rate": 1.92257339271045e-05, "loss": 0.0056, "step": 161230 }, { "epoch": 2.32, "learning_rate": 1.922568588736603e-05, "loss": 0.0087, "step": 161240 }, { "epoch": 2.32, "learning_rate": 1.922563784762756e-05, "loss": 0.0082, "step": 161250 }, { "epoch": 2.32, "learning_rate": 1.9225589807889086e-05, "loss": 0.0065, "step": 161260 }, { "epoch": 2.32, "learning_rate": 1.9225541768150615e-05, "loss": 0.007, "step": 161270 }, { "epoch": 2.32, "learning_rate": 1.9225493728412144e-05, "loss": 0.0139, "step": 161280 }, { "epoch": 2.32, "learning_rate": 1.922544568867367e-05, "loss": 0.0071, "step": 161290 }, { "epoch": 2.32, "learning_rate": 1.92253976489352e-05, "loss": 0.0106, "step": 161300 }, { "epoch": 2.32, "learning_rate": 1.922534960919673e-05, "loss": 0.0099, "step": 161310 }, { "epoch": 2.32, "learning_rate": 1.9225301569458258e-05, "loss": 0.0078, "step": 161320 }, { "epoch": 2.33, "learning_rate": 1.9225253529719784e-05, "loss": 0.0076, "step": 161330 }, { "epoch": 2.33, "learning_rate": 1.9225205489981313e-05, "loss": 0.0069, "step": 161340 }, { "epoch": 2.33, "learning_rate": 1.9225157450242842e-05, "loss": 0.0079, "step": 161350 }, { "epoch": 2.33, "learning_rate": 1.9225109410504372e-05, "loss": 0.009, "step": 161360 }, { "epoch": 2.33, "learning_rate": 1.9225061370765898e-05, "loss": 0.0107, "step": 161370 }, { "epoch": 2.33, "learning_rate": 1.9225013331027427e-05, "loss": 0.0059, "step": 161380 }, { "epoch": 2.33, "learning_rate": 1.9224965291288956e-05, "loss": 0.0079, "step": 161390 }, { "epoch": 2.33, "learning_rate": 1.9224917251550482e-05, "loss": 0.0082, "step": 161400 }, { "epoch": 2.33, "learning_rate": 1.922486921181201e-05, "loss": 0.0167, "step": 161410 }, { "epoch": 2.33, "learning_rate": 1.922482117207354e-05, "loss": 0.0095, "step": 161420 }, { "epoch": 2.33, "learning_rate": 1.922477313233507e-05, "loss": 0.0074, "step": 161430 }, { "epoch": 2.33, "learning_rate": 1.9224725092596596e-05, "loss": 0.0063, "step": 161440 }, { "epoch": 2.33, "learning_rate": 1.9224677052858125e-05, "loss": 0.0077, "step": 161450 }, { "epoch": 2.33, "learning_rate": 1.9224629013119654e-05, "loss": 0.0069, "step": 161460 }, { "epoch": 2.33, "learning_rate": 1.922458577735503e-05, "loss": 0.0077, "step": 161470 }, { "epoch": 2.33, "learning_rate": 1.9224537737616558e-05, "loss": 0.0055, "step": 161480 }, { "epoch": 2.33, "learning_rate": 1.9224489697878087e-05, "loss": 0.0098, "step": 161490 }, { "epoch": 2.33, "learning_rate": 1.9224441658139613e-05, "loss": 0.0077, "step": 161500 }, { "epoch": 2.33, "learning_rate": 1.9224393618401143e-05, "loss": 0.0072, "step": 161510 }, { "epoch": 2.33, "learning_rate": 1.9224345578662672e-05, "loss": 0.0086, "step": 161520 }, { "epoch": 2.33, "learning_rate": 1.9224297538924198e-05, "loss": 0.0072, "step": 161530 }, { "epoch": 2.33, "learning_rate": 1.9224249499185727e-05, "loss": 0.0062, "step": 161540 }, { "epoch": 2.33, "learning_rate": 1.9224201459447256e-05, "loss": 0.0082, "step": 161550 }, { "epoch": 2.33, "learning_rate": 1.9224153419708786e-05, "loss": 0.0081, "step": 161560 }, { "epoch": 2.33, "learning_rate": 1.922410537997031e-05, "loss": 0.0097, "step": 161570 }, { "epoch": 2.33, "learning_rate": 1.922405734023184e-05, "loss": 0.0084, "step": 161580 }, { "epoch": 2.33, "learning_rate": 1.922400930049337e-05, "loss": 0.0064, "step": 161590 }, { "epoch": 2.33, "learning_rate": 1.92239612607549e-05, "loss": 0.0062, "step": 161600 }, { "epoch": 2.33, "learning_rate": 1.9223913221016425e-05, "loss": 0.0081, "step": 161610 }, { "epoch": 2.33, "learning_rate": 1.9223865181277954e-05, "loss": 0.0069, "step": 161620 }, { "epoch": 2.33, "learning_rate": 1.9223817141539484e-05, "loss": 0.0075, "step": 161630 }, { "epoch": 2.33, "learning_rate": 1.922376910180101e-05, "loss": 0.0091, "step": 161640 }, { "epoch": 2.33, "learning_rate": 1.922372106206254e-05, "loss": 0.0097, "step": 161650 }, { "epoch": 2.33, "learning_rate": 1.9223673022324068e-05, "loss": 0.0066, "step": 161660 }, { "epoch": 2.33, "learning_rate": 1.9223624982585597e-05, "loss": 0.007, "step": 161670 }, { "epoch": 2.33, "learning_rate": 1.9223576942847123e-05, "loss": 0.0055, "step": 161680 }, { "epoch": 2.33, "learning_rate": 1.9223528903108652e-05, "loss": 0.0103, "step": 161690 }, { "epoch": 2.33, "learning_rate": 1.9223480863370182e-05, "loss": 0.0063, "step": 161700 }, { "epoch": 2.33, "learning_rate": 1.9223432823631708e-05, "loss": 0.0081, "step": 161710 }, { "epoch": 2.33, "learning_rate": 1.9223384783893237e-05, "loss": 0.0095, "step": 161720 }, { "epoch": 2.33, "learning_rate": 1.9223336744154766e-05, "loss": 0.0056, "step": 161730 }, { "epoch": 2.33, "learning_rate": 1.9223288704416295e-05, "loss": 0.0069, "step": 161740 }, { "epoch": 2.33, "learning_rate": 1.922324066467782e-05, "loss": 0.0079, "step": 161750 }, { "epoch": 2.33, "learning_rate": 1.922319262493935e-05, "loss": 0.0055, "step": 161760 }, { "epoch": 2.33, "learning_rate": 1.922314458520088e-05, "loss": 0.0063, "step": 161770 }, { "epoch": 2.33, "learning_rate": 1.922309654546241e-05, "loss": 0.0068, "step": 161780 }, { "epoch": 2.33, "learning_rate": 1.9223048505723935e-05, "loss": 0.0057, "step": 161790 }, { "epoch": 2.33, "learning_rate": 1.9223000465985464e-05, "loss": 0.0087, "step": 161800 }, { "epoch": 2.33, "learning_rate": 1.9222952426246994e-05, "loss": 0.011, "step": 161810 }, { "epoch": 2.33, "learning_rate": 1.922290438650852e-05, "loss": 0.0055, "step": 161820 }, { "epoch": 2.33, "learning_rate": 1.922285634677005e-05, "loss": 0.0066, "step": 161830 }, { "epoch": 2.33, "learning_rate": 1.9222808307031578e-05, "loss": 0.006, "step": 161840 }, { "epoch": 2.33, "learning_rate": 1.9222760267293107e-05, "loss": 0.0079, "step": 161850 }, { "epoch": 2.33, "learning_rate": 1.9222712227554633e-05, "loss": 0.0046, "step": 161860 }, { "epoch": 2.33, "learning_rate": 1.9222664187816162e-05, "loss": 0.0067, "step": 161870 }, { "epoch": 2.33, "learning_rate": 1.922261614807769e-05, "loss": 0.0072, "step": 161880 }, { "epoch": 2.33, "learning_rate": 1.9222568108339218e-05, "loss": 0.0055, "step": 161890 }, { "epoch": 2.33, "learning_rate": 1.9222520068600747e-05, "loss": 0.0057, "step": 161900 }, { "epoch": 2.33, "learning_rate": 1.9222472028862276e-05, "loss": 0.0064, "step": 161910 }, { "epoch": 2.33, "learning_rate": 1.9222423989123805e-05, "loss": 0.0096, "step": 161920 }, { "epoch": 2.33, "learning_rate": 1.922237594938533e-05, "loss": 0.0057, "step": 161930 }, { "epoch": 2.33, "learning_rate": 1.922232790964686e-05, "loss": 0.011, "step": 161940 }, { "epoch": 2.33, "learning_rate": 1.922227986990839e-05, "loss": 0.0055, "step": 161950 }, { "epoch": 2.33, "learning_rate": 1.9222231830169916e-05, "loss": 0.0102, "step": 161960 }, { "epoch": 2.33, "learning_rate": 1.9222183790431445e-05, "loss": 0.0083, "step": 161970 }, { "epoch": 2.33, "learning_rate": 1.9222135750692974e-05, "loss": 0.0085, "step": 161980 }, { "epoch": 2.33, "learning_rate": 1.9222087710954503e-05, "loss": 0.0093, "step": 161990 }, { "epoch": 2.33, "learning_rate": 1.922203967121603e-05, "loss": 0.0073, "step": 162000 }, { "epoch": 2.33, "learning_rate": 1.922199163147756e-05, "loss": 0.0056, "step": 162010 }, { "epoch": 2.34, "learning_rate": 1.9221943591739088e-05, "loss": 0.0085, "step": 162020 }, { "epoch": 2.34, "learning_rate": 1.9221895552000617e-05, "loss": 0.0048, "step": 162030 }, { "epoch": 2.34, "learning_rate": 1.9221847512262143e-05, "loss": 0.0056, "step": 162040 }, { "epoch": 2.34, "learning_rate": 1.9221799472523672e-05, "loss": 0.008, "step": 162050 }, { "epoch": 2.34, "learning_rate": 1.92217514327852e-05, "loss": 0.0079, "step": 162060 }, { "epoch": 2.34, "learning_rate": 1.9221703393046727e-05, "loss": 0.0092, "step": 162070 }, { "epoch": 2.34, "learning_rate": 1.9221655353308257e-05, "loss": 0.0061, "step": 162080 }, { "epoch": 2.34, "learning_rate": 1.9221607313569786e-05, "loss": 0.0063, "step": 162090 }, { "epoch": 2.34, "learning_rate": 1.9221559273831315e-05, "loss": 0.0061, "step": 162100 }, { "epoch": 2.34, "learning_rate": 1.922151123409284e-05, "loss": 0.01, "step": 162110 }, { "epoch": 2.34, "learning_rate": 1.922146319435437e-05, "loss": 0.0101, "step": 162120 }, { "epoch": 2.34, "learning_rate": 1.92214151546159e-05, "loss": 0.0086, "step": 162130 }, { "epoch": 2.34, "learning_rate": 1.9221367114877426e-05, "loss": 0.0071, "step": 162140 }, { "epoch": 2.34, "learning_rate": 1.9221319075138955e-05, "loss": 0.0069, "step": 162150 }, { "epoch": 2.34, "learning_rate": 1.9221271035400484e-05, "loss": 0.0094, "step": 162160 }, { "epoch": 2.34, "learning_rate": 1.9221222995662013e-05, "loss": 0.0047, "step": 162170 }, { "epoch": 2.34, "learning_rate": 1.922117495592354e-05, "loss": 0.0064, "step": 162180 }, { "epoch": 2.34, "learning_rate": 1.922112691618507e-05, "loss": 0.0082, "step": 162190 }, { "epoch": 2.34, "learning_rate": 1.9221078876446598e-05, "loss": 0.0102, "step": 162200 }, { "epoch": 2.34, "learning_rate": 1.9221030836708127e-05, "loss": 0.0087, "step": 162210 }, { "epoch": 2.34, "learning_rate": 1.9220982796969653e-05, "loss": 0.0082, "step": 162220 }, { "epoch": 2.34, "learning_rate": 1.9220934757231182e-05, "loss": 0.0077, "step": 162230 }, { "epoch": 2.34, "learning_rate": 1.922088671749271e-05, "loss": 0.0138, "step": 162240 }, { "epoch": 2.34, "learning_rate": 1.9220838677754237e-05, "loss": 0.0074, "step": 162250 }, { "epoch": 2.34, "learning_rate": 1.9220790638015767e-05, "loss": 0.0099, "step": 162260 }, { "epoch": 2.34, "learning_rate": 1.9220742598277296e-05, "loss": 0.0068, "step": 162270 }, { "epoch": 2.34, "learning_rate": 1.9220694558538825e-05, "loss": 0.0073, "step": 162280 }, { "epoch": 2.34, "learning_rate": 1.922064651880035e-05, "loss": 0.006, "step": 162290 }, { "epoch": 2.34, "learning_rate": 1.922059847906188e-05, "loss": 0.0115, "step": 162300 }, { "epoch": 2.34, "learning_rate": 1.922055043932341e-05, "loss": 0.0082, "step": 162310 }, { "epoch": 2.34, "learning_rate": 1.9220502399584935e-05, "loss": 0.0079, "step": 162320 }, { "epoch": 2.34, "learning_rate": 1.9220454359846465e-05, "loss": 0.0079, "step": 162330 }, { "epoch": 2.34, "learning_rate": 1.9220406320107997e-05, "loss": 0.01, "step": 162340 }, { "epoch": 2.34, "learning_rate": 1.9220358280369523e-05, "loss": 0.0081, "step": 162350 }, { "epoch": 2.34, "learning_rate": 1.9220310240631053e-05, "loss": 0.012, "step": 162360 }, { "epoch": 2.34, "learning_rate": 1.9220262200892582e-05, "loss": 0.0087, "step": 162370 }, { "epoch": 2.34, "learning_rate": 1.9220214161154108e-05, "loss": 0.0095, "step": 162380 }, { "epoch": 2.34, "learning_rate": 1.9220166121415637e-05, "loss": 0.0079, "step": 162390 }, { "epoch": 2.34, "learning_rate": 1.9220118081677166e-05, "loss": 0.0079, "step": 162400 }, { "epoch": 2.34, "learning_rate": 1.9220070041938696e-05, "loss": 0.0082, "step": 162410 }, { "epoch": 2.34, "learning_rate": 1.922002200220022e-05, "loss": 0.007, "step": 162420 }, { "epoch": 2.34, "learning_rate": 1.921997396246175e-05, "loss": 0.0064, "step": 162430 }, { "epoch": 2.34, "learning_rate": 1.921992592272328e-05, "loss": 0.0074, "step": 162440 }, { "epoch": 2.34, "learning_rate": 1.921987788298481e-05, "loss": 0.0076, "step": 162450 }, { "epoch": 2.34, "learning_rate": 1.9219829843246335e-05, "loss": 0.0063, "step": 162460 }, { "epoch": 2.34, "learning_rate": 1.9219781803507864e-05, "loss": 0.0069, "step": 162470 }, { "epoch": 2.34, "learning_rate": 1.9219733763769394e-05, "loss": 0.0072, "step": 162480 }, { "epoch": 2.34, "learning_rate": 1.921968572403092e-05, "loss": 0.006, "step": 162490 }, { "epoch": 2.34, "learning_rate": 1.921963768429245e-05, "loss": 0.009, "step": 162500 }, { "epoch": 2.34, "learning_rate": 1.9219589644553978e-05, "loss": 0.0074, "step": 162510 }, { "epoch": 2.34, "learning_rate": 1.9219541604815507e-05, "loss": 0.0049, "step": 162520 }, { "epoch": 2.34, "learning_rate": 1.9219493565077033e-05, "loss": 0.0079, "step": 162530 }, { "epoch": 2.34, "learning_rate": 1.9219445525338562e-05, "loss": 0.008, "step": 162540 }, { "epoch": 2.34, "learning_rate": 1.9219397485600092e-05, "loss": 0.0094, "step": 162550 }, { "epoch": 2.34, "learning_rate": 1.9219349445861618e-05, "loss": 0.007, "step": 162560 }, { "epoch": 2.34, "learning_rate": 1.9219301406123147e-05, "loss": 0.008, "step": 162570 }, { "epoch": 2.34, "learning_rate": 1.9219253366384676e-05, "loss": 0.0087, "step": 162580 }, { "epoch": 2.34, "learning_rate": 1.9219205326646205e-05, "loss": 0.0103, "step": 162590 }, { "epoch": 2.34, "learning_rate": 1.921915728690773e-05, "loss": 0.0073, "step": 162600 }, { "epoch": 2.34, "learning_rate": 1.921910924716926e-05, "loss": 0.0078, "step": 162610 }, { "epoch": 2.34, "learning_rate": 1.921906120743079e-05, "loss": 0.0063, "step": 162620 }, { "epoch": 2.34, "learning_rate": 1.921901316769232e-05, "loss": 0.0045, "step": 162630 }, { "epoch": 2.34, "learning_rate": 1.9218965127953845e-05, "loss": 0.0086, "step": 162640 }, { "epoch": 2.34, "learning_rate": 1.9218917088215374e-05, "loss": 0.0061, "step": 162650 }, { "epoch": 2.34, "learning_rate": 1.9218869048476904e-05, "loss": 0.0077, "step": 162660 }, { "epoch": 2.34, "learning_rate": 1.921882100873843e-05, "loss": 0.0097, "step": 162670 }, { "epoch": 2.34, "learning_rate": 1.921877296899996e-05, "loss": 0.0084, "step": 162680 }, { "epoch": 2.34, "learning_rate": 1.9218724929261488e-05, "loss": 0.0063, "step": 162690 }, { "epoch": 2.34, "learning_rate": 1.9218676889523017e-05, "loss": 0.0075, "step": 162700 }, { "epoch": 2.34, "learning_rate": 1.9218628849784543e-05, "loss": 0.0076, "step": 162710 }, { "epoch": 2.35, "learning_rate": 1.9218580810046072e-05, "loss": 0.0075, "step": 162720 }, { "epoch": 2.35, "learning_rate": 1.92185327703076e-05, "loss": 0.0049, "step": 162730 }, { "epoch": 2.35, "learning_rate": 1.9218484730569128e-05, "loss": 0.0063, "step": 162740 }, { "epoch": 2.35, "learning_rate": 1.9218436690830657e-05, "loss": 0.0084, "step": 162750 }, { "epoch": 2.35, "learning_rate": 1.9218388651092186e-05, "loss": 0.0088, "step": 162760 }, { "epoch": 2.35, "learning_rate": 1.9218340611353715e-05, "loss": 0.0092, "step": 162770 }, { "epoch": 2.35, "learning_rate": 1.921829257161524e-05, "loss": 0.0068, "step": 162780 }, { "epoch": 2.35, "learning_rate": 1.921824453187677e-05, "loss": 0.0088, "step": 162790 }, { "epoch": 2.35, "learning_rate": 1.92181964921383e-05, "loss": 0.0065, "step": 162800 }, { "epoch": 2.35, "learning_rate": 1.921814845239983e-05, "loss": 0.0079, "step": 162810 }, { "epoch": 2.35, "learning_rate": 1.9218100412661355e-05, "loss": 0.0076, "step": 162820 }, { "epoch": 2.35, "learning_rate": 1.9218052372922884e-05, "loss": 0.0068, "step": 162830 }, { "epoch": 2.35, "learning_rate": 1.9218004333184413e-05, "loss": 0.0066, "step": 162840 }, { "epoch": 2.35, "learning_rate": 1.921795629344594e-05, "loss": 0.0103, "step": 162850 }, { "epoch": 2.35, "learning_rate": 1.921790825370747e-05, "loss": 0.0074, "step": 162860 }, { "epoch": 2.35, "learning_rate": 1.9217860213968998e-05, "loss": 0.0047, "step": 162870 }, { "epoch": 2.35, "learning_rate": 1.9217812174230527e-05, "loss": 0.0067, "step": 162880 }, { "epoch": 2.35, "learning_rate": 1.9217764134492053e-05, "loss": 0.0076, "step": 162890 }, { "epoch": 2.35, "learning_rate": 1.9217716094753582e-05, "loss": 0.0073, "step": 162900 }, { "epoch": 2.35, "learning_rate": 1.921766805501511e-05, "loss": 0.0065, "step": 162910 }, { "epoch": 2.35, "learning_rate": 1.9217620015276637e-05, "loss": 0.0045, "step": 162920 }, { "epoch": 2.35, "learning_rate": 1.9217571975538167e-05, "loss": 0.0058, "step": 162930 }, { "epoch": 2.35, "learning_rate": 1.9217523935799696e-05, "loss": 0.0075, "step": 162940 }, { "epoch": 2.35, "learning_rate": 1.9217475896061225e-05, "loss": 0.0048, "step": 162950 }, { "epoch": 2.35, "learning_rate": 1.921742785632275e-05, "loss": 0.0084, "step": 162960 }, { "epoch": 2.35, "learning_rate": 1.921737981658428e-05, "loss": 0.0032, "step": 162970 }, { "epoch": 2.35, "learning_rate": 1.921733177684581e-05, "loss": 0.0096, "step": 162980 }, { "epoch": 2.35, "learning_rate": 1.921728373710734e-05, "loss": 0.007, "step": 162990 }, { "epoch": 2.35, "learning_rate": 1.9217235697368865e-05, "loss": 0.0084, "step": 163000 }, { "epoch": 2.35, "learning_rate": 1.9217187657630394e-05, "loss": 0.0089, "step": 163010 }, { "epoch": 2.35, "learning_rate": 1.9217139617891923e-05, "loss": 0.009, "step": 163020 }, { "epoch": 2.35, "learning_rate": 1.921709157815345e-05, "loss": 0.0062, "step": 163030 }, { "epoch": 2.35, "learning_rate": 1.921704353841498e-05, "loss": 0.0081, "step": 163040 }, { "epoch": 2.35, "learning_rate": 1.9216995498676508e-05, "loss": 0.0122, "step": 163050 }, { "epoch": 2.35, "learning_rate": 1.9216947458938037e-05, "loss": 0.0068, "step": 163060 }, { "epoch": 2.35, "learning_rate": 1.9216899419199563e-05, "loss": 0.009, "step": 163070 }, { "epoch": 2.35, "learning_rate": 1.9216851379461092e-05, "loss": 0.0065, "step": 163080 }, { "epoch": 2.35, "learning_rate": 1.921680333972262e-05, "loss": 0.0062, "step": 163090 }, { "epoch": 2.35, "learning_rate": 1.9216755299984147e-05, "loss": 0.0097, "step": 163100 }, { "epoch": 2.35, "learning_rate": 1.9216707260245677e-05, "loss": 0.0084, "step": 163110 }, { "epoch": 2.35, "learning_rate": 1.9216659220507206e-05, "loss": 0.0079, "step": 163120 }, { "epoch": 2.35, "learning_rate": 1.9216611180768735e-05, "loss": 0.0075, "step": 163130 }, { "epoch": 2.35, "learning_rate": 1.921656314103026e-05, "loss": 0.0066, "step": 163140 }, { "epoch": 2.35, "learning_rate": 1.921651510129179e-05, "loss": 0.0074, "step": 163150 }, { "epoch": 2.35, "learning_rate": 1.921646706155332e-05, "loss": 0.0082, "step": 163160 }, { "epoch": 2.35, "learning_rate": 1.921641902181485e-05, "loss": 0.007, "step": 163170 }, { "epoch": 2.35, "learning_rate": 1.9216370982076375e-05, "loss": 0.0093, "step": 163180 }, { "epoch": 2.35, "learning_rate": 1.9216322942337904e-05, "loss": 0.0077, "step": 163190 }, { "epoch": 2.35, "learning_rate": 1.921627970657328e-05, "loss": 0.0092, "step": 163200 }, { "epoch": 2.35, "learning_rate": 1.9216231666834808e-05, "loss": 0.0079, "step": 163210 }, { "epoch": 2.35, "learning_rate": 1.9216183627096337e-05, "loss": 0.0064, "step": 163220 }, { "epoch": 2.35, "learning_rate": 1.9216135587357863e-05, "loss": 0.0075, "step": 163230 }, { "epoch": 2.35, "learning_rate": 1.9216087547619392e-05, "loss": 0.0101, "step": 163240 }, { "epoch": 2.35, "learning_rate": 1.921603950788092e-05, "loss": 0.0091, "step": 163250 }, { "epoch": 2.35, "learning_rate": 1.921599146814245e-05, "loss": 0.0079, "step": 163260 }, { "epoch": 2.35, "learning_rate": 1.9215943428403977e-05, "loss": 0.0056, "step": 163270 }, { "epoch": 2.35, "learning_rate": 1.9215895388665506e-05, "loss": 0.0081, "step": 163280 }, { "epoch": 2.35, "learning_rate": 1.9215847348927035e-05, "loss": 0.0059, "step": 163290 }, { "epoch": 2.35, "learning_rate": 1.9215799309188565e-05, "loss": 0.0077, "step": 163300 }, { "epoch": 2.35, "learning_rate": 1.921575126945009e-05, "loss": 0.0096, "step": 163310 }, { "epoch": 2.35, "learning_rate": 1.921570322971162e-05, "loss": 0.0093, "step": 163320 }, { "epoch": 2.35, "learning_rate": 1.921565518997315e-05, "loss": 0.0079, "step": 163330 }, { "epoch": 2.35, "learning_rate": 1.9215607150234675e-05, "loss": 0.0075, "step": 163340 }, { "epoch": 2.35, "learning_rate": 1.9215559110496204e-05, "loss": 0.0076, "step": 163350 }, { "epoch": 2.35, "learning_rate": 1.9215511070757733e-05, "loss": 0.0065, "step": 163360 }, { "epoch": 2.35, "learning_rate": 1.9215463031019263e-05, "loss": 0.0073, "step": 163370 }, { "epoch": 2.35, "learning_rate": 1.921541499128079e-05, "loss": 0.0063, "step": 163380 }, { "epoch": 2.35, "learning_rate": 1.9215366951542318e-05, "loss": 0.0075, "step": 163390 }, { "epoch": 2.35, "learning_rate": 1.9215318911803847e-05, "loss": 0.0066, "step": 163400 }, { "epoch": 2.36, "learning_rate": 1.9215270872065373e-05, "loss": 0.007, "step": 163410 }, { "epoch": 2.36, "learning_rate": 1.9215222832326902e-05, "loss": 0.0073, "step": 163420 }, { "epoch": 2.36, "learning_rate": 1.921517479258843e-05, "loss": 0.0048, "step": 163430 }, { "epoch": 2.36, "learning_rate": 1.921512675284996e-05, "loss": 0.0061, "step": 163440 }, { "epoch": 2.36, "learning_rate": 1.9215078713111487e-05, "loss": 0.0051, "step": 163450 }, { "epoch": 2.36, "learning_rate": 1.9215030673373016e-05, "loss": 0.0063, "step": 163460 }, { "epoch": 2.36, "learning_rate": 1.9214982633634545e-05, "loss": 0.0113, "step": 163470 }, { "epoch": 2.36, "learning_rate": 1.9214934593896075e-05, "loss": 0.0065, "step": 163480 }, { "epoch": 2.36, "learning_rate": 1.92148865541576e-05, "loss": 0.009, "step": 163490 }, { "epoch": 2.36, "learning_rate": 1.921483851441913e-05, "loss": 0.0059, "step": 163500 }, { "epoch": 2.36, "learning_rate": 1.921479047468066e-05, "loss": 0.006, "step": 163510 }, { "epoch": 2.36, "learning_rate": 1.9214742434942185e-05, "loss": 0.0077, "step": 163520 }, { "epoch": 2.36, "learning_rate": 1.9214694395203714e-05, "loss": 0.0076, "step": 163530 }, { "epoch": 2.36, "learning_rate": 1.9214646355465243e-05, "loss": 0.0101, "step": 163540 }, { "epoch": 2.36, "learning_rate": 1.9214598315726773e-05, "loss": 0.008, "step": 163550 }, { "epoch": 2.36, "learning_rate": 1.92145502759883e-05, "loss": 0.009, "step": 163560 }, { "epoch": 2.36, "learning_rate": 1.9214502236249828e-05, "loss": 0.0108, "step": 163570 }, { "epoch": 2.36, "learning_rate": 1.9214454196511357e-05, "loss": 0.0084, "step": 163580 }, { "epoch": 2.36, "learning_rate": 1.9214406156772883e-05, "loss": 0.0062, "step": 163590 }, { "epoch": 2.36, "learning_rate": 1.9214358117034412e-05, "loss": 0.0086, "step": 163600 }, { "epoch": 2.36, "learning_rate": 1.921431007729594e-05, "loss": 0.0075, "step": 163610 }, { "epoch": 2.36, "learning_rate": 1.921426203755747e-05, "loss": 0.0071, "step": 163620 }, { "epoch": 2.36, "learning_rate": 1.9214213997818997e-05, "loss": 0.0062, "step": 163630 }, { "epoch": 2.36, "learning_rate": 1.9214165958080526e-05, "loss": 0.0047, "step": 163640 }, { "epoch": 2.36, "learning_rate": 1.9214117918342055e-05, "loss": 0.0097, "step": 163650 }, { "epoch": 2.36, "learning_rate": 1.9214069878603584e-05, "loss": 0.0072, "step": 163660 }, { "epoch": 2.36, "learning_rate": 1.921402183886511e-05, "loss": 0.0062, "step": 163670 }, { "epoch": 2.36, "learning_rate": 1.921397379912664e-05, "loss": 0.0077, "step": 163680 }, { "epoch": 2.36, "learning_rate": 1.921392575938817e-05, "loss": 0.0062, "step": 163690 }, { "epoch": 2.36, "learning_rate": 1.9213877719649695e-05, "loss": 0.0089, "step": 163700 }, { "epoch": 2.36, "learning_rate": 1.9213829679911224e-05, "loss": 0.0081, "step": 163710 }, { "epoch": 2.36, "learning_rate": 1.9213781640172753e-05, "loss": 0.0064, "step": 163720 }, { "epoch": 2.36, "learning_rate": 1.9213733600434283e-05, "loss": 0.0092, "step": 163730 }, { "epoch": 2.36, "learning_rate": 1.921368556069581e-05, "loss": 0.0077, "step": 163740 }, { "epoch": 2.36, "learning_rate": 1.9213637520957338e-05, "loss": 0.0057, "step": 163750 }, { "epoch": 2.36, "learning_rate": 1.9213589481218867e-05, "loss": 0.0076, "step": 163760 }, { "epoch": 2.36, "learning_rate": 1.9213541441480393e-05, "loss": 0.0052, "step": 163770 }, { "epoch": 2.36, "learning_rate": 1.9213493401741922e-05, "loss": 0.0072, "step": 163780 }, { "epoch": 2.36, "learning_rate": 1.921344536200345e-05, "loss": 0.0058, "step": 163790 }, { "epoch": 2.36, "learning_rate": 1.921339732226498e-05, "loss": 0.0087, "step": 163800 }, { "epoch": 2.36, "learning_rate": 1.9213349282526507e-05, "loss": 0.0076, "step": 163810 }, { "epoch": 2.36, "learning_rate": 1.9213301242788036e-05, "loss": 0.0097, "step": 163820 }, { "epoch": 2.36, "learning_rate": 1.9213253203049565e-05, "loss": 0.0067, "step": 163830 }, { "epoch": 2.36, "learning_rate": 1.9213205163311094e-05, "loss": 0.0088, "step": 163840 }, { "epoch": 2.36, "learning_rate": 1.921315712357262e-05, "loss": 0.0077, "step": 163850 }, { "epoch": 2.36, "learning_rate": 1.921310908383415e-05, "loss": 0.0091, "step": 163860 }, { "epoch": 2.36, "learning_rate": 1.921306104409568e-05, "loss": 0.0073, "step": 163870 }, { "epoch": 2.36, "learning_rate": 1.9213013004357205e-05, "loss": 0.0075, "step": 163880 }, { "epoch": 2.36, "learning_rate": 1.9212964964618734e-05, "loss": 0.0094, "step": 163890 }, { "epoch": 2.36, "learning_rate": 1.9212916924880263e-05, "loss": 0.008, "step": 163900 }, { "epoch": 2.36, "learning_rate": 1.9212868885141792e-05, "loss": 0.0094, "step": 163910 }, { "epoch": 2.36, "learning_rate": 1.921282084540332e-05, "loss": 0.0099, "step": 163920 }, { "epoch": 2.36, "learning_rate": 1.9212772805664848e-05, "loss": 0.007, "step": 163930 }, { "epoch": 2.36, "learning_rate": 1.9212724765926377e-05, "loss": 0.0069, "step": 163940 }, { "epoch": 2.36, "learning_rate": 1.9212676726187903e-05, "loss": 0.0068, "step": 163950 }, { "epoch": 2.36, "learning_rate": 1.9212628686449432e-05, "loss": 0.0073, "step": 163960 }, { "epoch": 2.36, "learning_rate": 1.921258064671096e-05, "loss": 0.0064, "step": 163970 }, { "epoch": 2.36, "learning_rate": 1.921253260697249e-05, "loss": 0.0048, "step": 163980 }, { "epoch": 2.36, "learning_rate": 1.9212484567234016e-05, "loss": 0.0059, "step": 163990 }, { "epoch": 2.36, "learning_rate": 1.9212436527495546e-05, "loss": 0.0092, "step": 164000 }, { "epoch": 2.36, "learning_rate": 1.9212388487757075e-05, "loss": 0.0087, "step": 164010 }, { "epoch": 2.36, "learning_rate": 1.9212340448018604e-05, "loss": 0.0061, "step": 164020 }, { "epoch": 2.36, "learning_rate": 1.921229240828013e-05, "loss": 0.0065, "step": 164030 }, { "epoch": 2.36, "learning_rate": 1.921224436854166e-05, "loss": 0.0072, "step": 164040 }, { "epoch": 2.36, "learning_rate": 1.921219632880319e-05, "loss": 0.008, "step": 164050 }, { "epoch": 2.36, "learning_rate": 1.9212148289064715e-05, "loss": 0.0072, "step": 164060 }, { "epoch": 2.36, "learning_rate": 1.9212100249326244e-05, "loss": 0.0062, "step": 164070 }, { "epoch": 2.36, "learning_rate": 1.9212052209587773e-05, "loss": 0.0069, "step": 164080 }, { "epoch": 2.36, "learning_rate": 1.9212004169849302e-05, "loss": 0.0073, "step": 164090 }, { "epoch": 2.36, "learning_rate": 1.9211956130110828e-05, "loss": 0.0065, "step": 164100 }, { "epoch": 2.37, "learning_rate": 1.9211908090372358e-05, "loss": 0.0104, "step": 164110 }, { "epoch": 2.37, "learning_rate": 1.9211860050633887e-05, "loss": 0.0071, "step": 164120 }, { "epoch": 2.37, "learning_rate": 1.9211812010895413e-05, "loss": 0.0055, "step": 164130 }, { "epoch": 2.37, "learning_rate": 1.9211763971156942e-05, "loss": 0.0063, "step": 164140 }, { "epoch": 2.37, "learning_rate": 1.921171593141847e-05, "loss": 0.0086, "step": 164150 }, { "epoch": 2.37, "learning_rate": 1.921166789168e-05, "loss": 0.0073, "step": 164160 }, { "epoch": 2.37, "learning_rate": 1.9211619851941526e-05, "loss": 0.0083, "step": 164170 }, { "epoch": 2.37, "learning_rate": 1.9211571812203056e-05, "loss": 0.0075, "step": 164180 }, { "epoch": 2.37, "learning_rate": 1.9211523772464585e-05, "loss": 0.0074, "step": 164190 }, { "epoch": 2.37, "learning_rate": 1.9211475732726114e-05, "loss": 0.0069, "step": 164200 }, { "epoch": 2.37, "learning_rate": 1.921142769298764e-05, "loss": 0.0084, "step": 164210 }, { "epoch": 2.37, "learning_rate": 1.921137965324917e-05, "loss": 0.0083, "step": 164220 }, { "epoch": 2.37, "learning_rate": 1.92113316135107e-05, "loss": 0.0061, "step": 164230 }, { "epoch": 2.37, "learning_rate": 1.9211283573772224e-05, "loss": 0.0093, "step": 164240 }, { "epoch": 2.37, "learning_rate": 1.9211235534033754e-05, "loss": 0.0053, "step": 164250 }, { "epoch": 2.37, "learning_rate": 1.9211187494295283e-05, "loss": 0.0087, "step": 164260 }, { "epoch": 2.37, "learning_rate": 1.9211139454556812e-05, "loss": 0.0053, "step": 164270 }, { "epoch": 2.37, "learning_rate": 1.9211091414818338e-05, "loss": 0.009, "step": 164280 }, { "epoch": 2.37, "learning_rate": 1.9211043375079867e-05, "loss": 0.0066, "step": 164290 }, { "epoch": 2.37, "learning_rate": 1.9210995335341397e-05, "loss": 0.0059, "step": 164300 }, { "epoch": 2.37, "learning_rate": 1.9210947295602923e-05, "loss": 0.0057, "step": 164310 }, { "epoch": 2.37, "learning_rate": 1.9210899255864452e-05, "loss": 0.0041, "step": 164320 }, { "epoch": 2.37, "learning_rate": 1.921085121612598e-05, "loss": 0.0092, "step": 164330 }, { "epoch": 2.37, "learning_rate": 1.921080317638751e-05, "loss": 0.0092, "step": 164340 }, { "epoch": 2.37, "learning_rate": 1.9210755136649036e-05, "loss": 0.009, "step": 164350 }, { "epoch": 2.37, "learning_rate": 1.9210707096910566e-05, "loss": 0.0098, "step": 164360 }, { "epoch": 2.37, "learning_rate": 1.9210659057172095e-05, "loss": 0.0081, "step": 164370 }, { "epoch": 2.37, "learning_rate": 1.9210611017433624e-05, "loss": 0.006, "step": 164380 }, { "epoch": 2.37, "learning_rate": 1.921056297769515e-05, "loss": 0.0084, "step": 164390 }, { "epoch": 2.37, "learning_rate": 1.921051493795668e-05, "loss": 0.007, "step": 164400 }, { "epoch": 2.37, "learning_rate": 1.921046689821821e-05, "loss": 0.0047, "step": 164410 }, { "epoch": 2.37, "learning_rate": 1.9210418858479734e-05, "loss": 0.005, "step": 164420 }, { "epoch": 2.37, "learning_rate": 1.9210370818741264e-05, "loss": 0.0079, "step": 164430 }, { "epoch": 2.37, "learning_rate": 1.9210322779002793e-05, "loss": 0.0052, "step": 164440 }, { "epoch": 2.37, "learning_rate": 1.9210274739264322e-05, "loss": 0.0053, "step": 164450 }, { "epoch": 2.37, "learning_rate": 1.9210226699525848e-05, "loss": 0.0059, "step": 164460 }, { "epoch": 2.37, "learning_rate": 1.9210178659787377e-05, "loss": 0.0122, "step": 164470 }, { "epoch": 2.37, "learning_rate": 1.9210130620048907e-05, "loss": 0.0116, "step": 164480 }, { "epoch": 2.37, "learning_rate": 1.9210082580310433e-05, "loss": 0.0064, "step": 164490 }, { "epoch": 2.37, "learning_rate": 1.9210034540571962e-05, "loss": 0.0079, "step": 164500 }, { "epoch": 2.37, "learning_rate": 1.920998650083349e-05, "loss": 0.007, "step": 164510 }, { "epoch": 2.37, "learning_rate": 1.920993846109502e-05, "loss": 0.004, "step": 164520 }, { "epoch": 2.37, "learning_rate": 1.9209890421356546e-05, "loss": 0.0076, "step": 164530 }, { "epoch": 2.37, "learning_rate": 1.9209842381618075e-05, "loss": 0.0079, "step": 164540 }, { "epoch": 2.37, "learning_rate": 1.9209794341879605e-05, "loss": 0.0069, "step": 164550 }, { "epoch": 2.37, "learning_rate": 1.9209746302141134e-05, "loss": 0.0072, "step": 164560 }, { "epoch": 2.37, "learning_rate": 1.920969826240266e-05, "loss": 0.0076, "step": 164570 }, { "epoch": 2.37, "learning_rate": 1.920965022266419e-05, "loss": 0.009, "step": 164580 }, { "epoch": 2.37, "learning_rate": 1.920960218292572e-05, "loss": 0.0092, "step": 164590 }, { "epoch": 2.37, "learning_rate": 1.9209554143187244e-05, "loss": 0.0085, "step": 164600 }, { "epoch": 2.37, "learning_rate": 1.9209506103448774e-05, "loss": 0.0091, "step": 164610 }, { "epoch": 2.37, "learning_rate": 1.9209458063710303e-05, "loss": 0.0067, "step": 164620 }, { "epoch": 2.37, "learning_rate": 1.9209410023971832e-05, "loss": 0.0077, "step": 164630 }, { "epoch": 2.37, "learning_rate": 1.9209361984233358e-05, "loss": 0.0075, "step": 164640 }, { "epoch": 2.37, "learning_rate": 1.9209313944494887e-05, "loss": 0.0073, "step": 164650 }, { "epoch": 2.37, "learning_rate": 1.9209265904756417e-05, "loss": 0.0093, "step": 164660 }, { "epoch": 2.37, "learning_rate": 1.9209217865017942e-05, "loss": 0.0062, "step": 164670 }, { "epoch": 2.37, "learning_rate": 1.920916982527947e-05, "loss": 0.0073, "step": 164680 }, { "epoch": 2.37, "learning_rate": 1.9209121785541e-05, "loss": 0.0044, "step": 164690 }, { "epoch": 2.37, "learning_rate": 1.920907374580253e-05, "loss": 0.0054, "step": 164700 }, { "epoch": 2.37, "learning_rate": 1.9209025706064056e-05, "loss": 0.0093, "step": 164710 }, { "epoch": 2.37, "learning_rate": 1.9208977666325585e-05, "loss": 0.0071, "step": 164720 }, { "epoch": 2.37, "learning_rate": 1.9208929626587115e-05, "loss": 0.0072, "step": 164730 }, { "epoch": 2.37, "learning_rate": 1.9208881586848644e-05, "loss": 0.0058, "step": 164740 }, { "epoch": 2.37, "learning_rate": 1.920883354711017e-05, "loss": 0.0071, "step": 164750 }, { "epoch": 2.37, "learning_rate": 1.92087855073717e-05, "loss": 0.0059, "step": 164760 }, { "epoch": 2.37, "learning_rate": 1.920873746763323e-05, "loss": 0.0079, "step": 164770 }, { "epoch": 2.37, "learning_rate": 1.9208689427894754e-05, "loss": 0.0079, "step": 164780 }, { "epoch": 2.37, "learning_rate": 1.9208641388156283e-05, "loss": 0.012, "step": 164790 }, { "epoch": 2.38, "learning_rate": 1.9208593348417813e-05, "loss": 0.0146, "step": 164800 }, { "epoch": 2.38, "learning_rate": 1.9208545308679342e-05, "loss": 0.0078, "step": 164810 }, { "epoch": 2.38, "learning_rate": 1.9208497268940868e-05, "loss": 0.0082, "step": 164820 }, { "epoch": 2.38, "learning_rate": 1.9208449229202397e-05, "loss": 0.0046, "step": 164830 }, { "epoch": 2.38, "learning_rate": 1.9208401189463926e-05, "loss": 0.0079, "step": 164840 }, { "epoch": 2.38, "learning_rate": 1.9208353149725452e-05, "loss": 0.0062, "step": 164850 }, { "epoch": 2.38, "learning_rate": 1.920830510998698e-05, "loss": 0.0087, "step": 164860 }, { "epoch": 2.38, "learning_rate": 1.920825707024851e-05, "loss": 0.0101, "step": 164870 }, { "epoch": 2.38, "learning_rate": 1.920820903051004e-05, "loss": 0.0046, "step": 164880 }, { "epoch": 2.38, "learning_rate": 1.9208160990771566e-05, "loss": 0.0046, "step": 164890 }, { "epoch": 2.38, "learning_rate": 1.9208112951033095e-05, "loss": 0.0088, "step": 164900 }, { "epoch": 2.38, "learning_rate": 1.9208064911294625e-05, "loss": 0.0064, "step": 164910 }, { "epoch": 2.38, "learning_rate": 1.920801687155615e-05, "loss": 0.0079, "step": 164920 }, { "epoch": 2.38, "learning_rate": 1.920796883181768e-05, "loss": 0.0083, "step": 164930 }, { "epoch": 2.38, "learning_rate": 1.920792079207921e-05, "loss": 0.0069, "step": 164940 }, { "epoch": 2.38, "learning_rate": 1.9207872752340738e-05, "loss": 0.0089, "step": 164950 }, { "epoch": 2.38, "learning_rate": 1.9207824712602264e-05, "loss": 0.0067, "step": 164960 }, { "epoch": 2.38, "learning_rate": 1.9207776672863793e-05, "loss": 0.0126, "step": 164970 }, { "epoch": 2.38, "learning_rate": 1.9207728633125323e-05, "loss": 0.0086, "step": 164980 }, { "epoch": 2.38, "learning_rate": 1.9207680593386852e-05, "loss": 0.0109, "step": 164990 }, { "epoch": 2.38, "learning_rate": 1.9207632553648378e-05, "loss": 0.0074, "step": 165000 }, { "epoch": 2.38, "learning_rate": 1.9207584513909907e-05, "loss": 0.0073, "step": 165010 }, { "epoch": 2.38, "learning_rate": 1.9207536474171436e-05, "loss": 0.0077, "step": 165020 }, { "epoch": 2.38, "learning_rate": 1.9207488434432962e-05, "loss": 0.0053, "step": 165030 }, { "epoch": 2.38, "learning_rate": 1.920744039469449e-05, "loss": 0.0088, "step": 165040 }, { "epoch": 2.38, "learning_rate": 1.920739235495602e-05, "loss": 0.007, "step": 165050 }, { "epoch": 2.38, "learning_rate": 1.920734431521755e-05, "loss": 0.0089, "step": 165060 }, { "epoch": 2.38, "learning_rate": 1.9207296275479076e-05, "loss": 0.0073, "step": 165070 }, { "epoch": 2.38, "learning_rate": 1.9207248235740605e-05, "loss": 0.0059, "step": 165080 }, { "epoch": 2.38, "learning_rate": 1.9207200196002134e-05, "loss": 0.0057, "step": 165090 }, { "epoch": 2.38, "learning_rate": 1.920715215626366e-05, "loss": 0.0045, "step": 165100 }, { "epoch": 2.38, "learning_rate": 1.920710411652519e-05, "loss": 0.005, "step": 165110 }, { "epoch": 2.38, "learning_rate": 1.920705607678672e-05, "loss": 0.0094, "step": 165120 }, { "epoch": 2.38, "learning_rate": 1.9207008037048248e-05, "loss": 0.0063, "step": 165130 }, { "epoch": 2.38, "learning_rate": 1.9206959997309774e-05, "loss": 0.0153, "step": 165140 }, { "epoch": 2.38, "learning_rate": 1.9206911957571303e-05, "loss": 0.0113, "step": 165150 }, { "epoch": 2.38, "learning_rate": 1.9206863917832833e-05, "loss": 0.0072, "step": 165160 }, { "epoch": 2.38, "learning_rate": 1.9206815878094362e-05, "loss": 0.0054, "step": 165170 }, { "epoch": 2.38, "learning_rate": 1.9206767838355888e-05, "loss": 0.0045, "step": 165180 }, { "epoch": 2.38, "learning_rate": 1.9206719798617417e-05, "loss": 0.0097, "step": 165190 }, { "epoch": 2.38, "learning_rate": 1.9206671758878946e-05, "loss": 0.007, "step": 165200 }, { "epoch": 2.38, "learning_rate": 1.9206623719140472e-05, "loss": 0.0056, "step": 165210 }, { "epoch": 2.38, "learning_rate": 1.9206575679402e-05, "loss": 0.0063, "step": 165220 }, { "epoch": 2.38, "learning_rate": 1.920652763966353e-05, "loss": 0.009, "step": 165230 }, { "epoch": 2.38, "learning_rate": 1.920647959992506e-05, "loss": 0.006, "step": 165240 }, { "epoch": 2.38, "learning_rate": 1.9206431560186586e-05, "loss": 0.0053, "step": 165250 }, { "epoch": 2.38, "learning_rate": 1.9206383520448115e-05, "loss": 0.0068, "step": 165260 }, { "epoch": 2.38, "learning_rate": 1.9206335480709644e-05, "loss": 0.0057, "step": 165270 }, { "epoch": 2.38, "learning_rate": 1.920628744097117e-05, "loss": 0.0091, "step": 165280 }, { "epoch": 2.38, "learning_rate": 1.92062394012327e-05, "loss": 0.0059, "step": 165290 }, { "epoch": 2.38, "learning_rate": 1.920619136149423e-05, "loss": 0.0081, "step": 165300 }, { "epoch": 2.38, "learning_rate": 1.9206143321755758e-05, "loss": 0.0107, "step": 165310 }, { "epoch": 2.38, "learning_rate": 1.9206095282017284e-05, "loss": 0.0069, "step": 165320 }, { "epoch": 2.38, "learning_rate": 1.9206047242278813e-05, "loss": 0.0052, "step": 165330 }, { "epoch": 2.38, "learning_rate": 1.9205999202540343e-05, "loss": 0.0135, "step": 165340 }, { "epoch": 2.38, "learning_rate": 1.9205951162801872e-05, "loss": 0.007, "step": 165350 }, { "epoch": 2.38, "learning_rate": 1.9205903123063398e-05, "loss": 0.0085, "step": 165360 }, { "epoch": 2.38, "learning_rate": 1.9205855083324927e-05, "loss": 0.0072, "step": 165370 }, { "epoch": 2.38, "learning_rate": 1.9205807043586456e-05, "loss": 0.0077, "step": 165380 }, { "epoch": 2.38, "learning_rate": 1.9205759003847982e-05, "loss": 0.0076, "step": 165390 }, { "epoch": 2.38, "learning_rate": 1.920571096410951e-05, "loss": 0.0073, "step": 165400 }, { "epoch": 2.38, "learning_rate": 1.9205662924371044e-05, "loss": 0.0082, "step": 165410 }, { "epoch": 2.38, "learning_rate": 1.920561488463257e-05, "loss": 0.0086, "step": 165420 }, { "epoch": 2.38, "learning_rate": 1.92055668448941e-05, "loss": 0.0096, "step": 165430 }, { "epoch": 2.38, "learning_rate": 1.920551880515563e-05, "loss": 0.0065, "step": 165440 }, { "epoch": 2.38, "learning_rate": 1.9205470765417154e-05, "loss": 0.0046, "step": 165450 }, { "epoch": 2.38, "learning_rate": 1.9205422725678684e-05, "loss": 0.0075, "step": 165460 }, { "epoch": 2.38, "learning_rate": 1.9205374685940213e-05, "loss": 0.0116, "step": 165470 }, { "epoch": 2.38, "learning_rate": 1.9205326646201742e-05, "loss": 0.0082, "step": 165480 }, { "epoch": 2.39, "learning_rate": 1.9205278606463268e-05, "loss": 0.0049, "step": 165490 }, { "epoch": 2.39, "learning_rate": 1.9205230566724797e-05, "loss": 0.0084, "step": 165500 }, { "epoch": 2.39, "learning_rate": 1.9205182526986327e-05, "loss": 0.0077, "step": 165510 }, { "epoch": 2.39, "learning_rate": 1.9205134487247852e-05, "loss": 0.0068, "step": 165520 }, { "epoch": 2.39, "learning_rate": 1.920508644750938e-05, "loss": 0.0104, "step": 165530 }, { "epoch": 2.39, "learning_rate": 1.920503840777091e-05, "loss": 0.0084, "step": 165540 }, { "epoch": 2.39, "learning_rate": 1.920499036803244e-05, "loss": 0.0067, "step": 165550 }, { "epoch": 2.39, "learning_rate": 1.9204942328293966e-05, "loss": 0.0066, "step": 165560 }, { "epoch": 2.39, "learning_rate": 1.9204894288555495e-05, "loss": 0.0137, "step": 165570 }, { "epoch": 2.39, "learning_rate": 1.9204846248817025e-05, "loss": 0.0093, "step": 165580 }, { "epoch": 2.39, "learning_rate": 1.9204798209078554e-05, "loss": 0.0081, "step": 165590 }, { "epoch": 2.39, "learning_rate": 1.920475016934008e-05, "loss": 0.0082, "step": 165600 }, { "epoch": 2.39, "learning_rate": 1.920470212960161e-05, "loss": 0.0088, "step": 165610 }, { "epoch": 2.39, "learning_rate": 1.920465408986314e-05, "loss": 0.0065, "step": 165620 }, { "epoch": 2.39, "learning_rate": 1.9204606050124664e-05, "loss": 0.0081, "step": 165630 }, { "epoch": 2.39, "learning_rate": 1.9204558010386193e-05, "loss": 0.0079, "step": 165640 }, { "epoch": 2.39, "learning_rate": 1.9204509970647723e-05, "loss": 0.0068, "step": 165650 }, { "epoch": 2.39, "learning_rate": 1.9204461930909252e-05, "loss": 0.0069, "step": 165660 }, { "epoch": 2.39, "learning_rate": 1.9204413891170778e-05, "loss": 0.0126, "step": 165670 }, { "epoch": 2.39, "learning_rate": 1.9204365851432307e-05, "loss": 0.0056, "step": 165680 }, { "epoch": 2.39, "learning_rate": 1.9204317811693836e-05, "loss": 0.0087, "step": 165690 }, { "epoch": 2.39, "learning_rate": 1.9204269771955362e-05, "loss": 0.0075, "step": 165700 }, { "epoch": 2.39, "learning_rate": 1.920422173221689e-05, "loss": 0.0073, "step": 165710 }, { "epoch": 2.39, "learning_rate": 1.920417369247842e-05, "loss": 0.0069, "step": 165720 }, { "epoch": 2.39, "learning_rate": 1.920412565273995e-05, "loss": 0.0113, "step": 165730 }, { "epoch": 2.39, "learning_rate": 1.9204077613001476e-05, "loss": 0.0055, "step": 165740 }, { "epoch": 2.39, "learning_rate": 1.9204029573263005e-05, "loss": 0.0049, "step": 165750 }, { "epoch": 2.39, "learning_rate": 1.9203981533524535e-05, "loss": 0.0058, "step": 165760 }, { "epoch": 2.39, "learning_rate": 1.9203933493786064e-05, "loss": 0.0068, "step": 165770 }, { "epoch": 2.39, "learning_rate": 1.920388545404759e-05, "loss": 0.0063, "step": 165780 }, { "epoch": 2.39, "learning_rate": 1.920383741430912e-05, "loss": 0.0086, "step": 165790 }, { "epoch": 2.39, "learning_rate": 1.9203789374570648e-05, "loss": 0.006, "step": 165800 }, { "epoch": 2.39, "learning_rate": 1.9203741334832174e-05, "loss": 0.0078, "step": 165810 }, { "epoch": 2.39, "learning_rate": 1.9203693295093703e-05, "loss": 0.0073, "step": 165820 }, { "epoch": 2.39, "learning_rate": 1.9203645255355233e-05, "loss": 0.0075, "step": 165830 }, { "epoch": 2.39, "learning_rate": 1.9203597215616762e-05, "loss": 0.0052, "step": 165840 }, { "epoch": 2.39, "learning_rate": 1.9203549175878288e-05, "loss": 0.0114, "step": 165850 }, { "epoch": 2.39, "learning_rate": 1.9203501136139817e-05, "loss": 0.0071, "step": 165860 }, { "epoch": 2.39, "learning_rate": 1.9203453096401346e-05, "loss": 0.007, "step": 165870 }, { "epoch": 2.39, "learning_rate": 1.9203405056662872e-05, "loss": 0.0082, "step": 165880 }, { "epoch": 2.39, "learning_rate": 1.92033570169244e-05, "loss": 0.0081, "step": 165890 }, { "epoch": 2.39, "learning_rate": 1.920330897718593e-05, "loss": 0.0096, "step": 165900 }, { "epoch": 2.39, "learning_rate": 1.920326093744746e-05, "loss": 0.0098, "step": 165910 }, { "epoch": 2.39, "learning_rate": 1.9203212897708986e-05, "loss": 0.0075, "step": 165920 }, { "epoch": 2.39, "learning_rate": 1.9203164857970515e-05, "loss": 0.0081, "step": 165930 }, { "epoch": 2.39, "learning_rate": 1.9203116818232044e-05, "loss": 0.0078, "step": 165940 }, { "epoch": 2.39, "learning_rate": 1.9203068778493574e-05, "loss": 0.0078, "step": 165950 }, { "epoch": 2.39, "learning_rate": 1.92030207387551e-05, "loss": 0.0133, "step": 165960 }, { "epoch": 2.39, "learning_rate": 1.920297269901663e-05, "loss": 0.008, "step": 165970 }, { "epoch": 2.39, "learning_rate": 1.9202924659278158e-05, "loss": 0.0073, "step": 165980 }, { "epoch": 2.39, "learning_rate": 1.9202876619539684e-05, "loss": 0.0062, "step": 165990 }, { "epoch": 2.39, "learning_rate": 1.9202828579801213e-05, "loss": 0.0076, "step": 166000 }, { "epoch": 2.39, "learning_rate": 1.9202780540062743e-05, "loss": 0.0075, "step": 166010 }, { "epoch": 2.39, "learning_rate": 1.9202732500324272e-05, "loss": 0.0046, "step": 166020 }, { "epoch": 2.39, "learning_rate": 1.9202684460585798e-05, "loss": 0.0069, "step": 166030 }, { "epoch": 2.39, "learning_rate": 1.9202636420847327e-05, "loss": 0.0065, "step": 166040 }, { "epoch": 2.39, "learning_rate": 1.9202588381108856e-05, "loss": 0.0082, "step": 166050 }, { "epoch": 2.39, "learning_rate": 1.9202540341370382e-05, "loss": 0.0082, "step": 166060 }, { "epoch": 2.39, "learning_rate": 1.920249230163191e-05, "loss": 0.0058, "step": 166070 }, { "epoch": 2.39, "learning_rate": 1.920244426189344e-05, "loss": 0.0059, "step": 166080 }, { "epoch": 2.39, "learning_rate": 1.920239622215497e-05, "loss": 0.0085, "step": 166090 }, { "epoch": 2.39, "learning_rate": 1.9202348182416496e-05, "loss": 0.0091, "step": 166100 }, { "epoch": 2.39, "learning_rate": 1.9202300142678025e-05, "loss": 0.0066, "step": 166110 }, { "epoch": 2.39, "learning_rate": 1.9202252102939554e-05, "loss": 0.0081, "step": 166120 }, { "epoch": 2.39, "learning_rate": 1.9202204063201084e-05, "loss": 0.0115, "step": 166130 }, { "epoch": 2.39, "learning_rate": 1.920215602346261e-05, "loss": 0.0061, "step": 166140 }, { "epoch": 2.39, "learning_rate": 1.920210798372414e-05, "loss": 0.0062, "step": 166150 }, { "epoch": 2.39, "learning_rate": 1.9202059943985668e-05, "loss": 0.0096, "step": 166160 }, { "epoch": 2.39, "learning_rate": 1.9202011904247194e-05, "loss": 0.0068, "step": 166170 }, { "epoch": 2.39, "learning_rate": 1.9201963864508723e-05, "loss": 0.0049, "step": 166180 }, { "epoch": 2.4, "learning_rate": 1.9201915824770253e-05, "loss": 0.0058, "step": 166190 }, { "epoch": 2.4, "learning_rate": 1.9201867785031782e-05, "loss": 0.0084, "step": 166200 }, { "epoch": 2.4, "learning_rate": 1.9201819745293308e-05, "loss": 0.0074, "step": 166210 }, { "epoch": 2.4, "learning_rate": 1.9201771705554837e-05, "loss": 0.0094, "step": 166220 }, { "epoch": 2.4, "learning_rate": 1.9201723665816366e-05, "loss": 0.0065, "step": 166230 }, { "epoch": 2.4, "learning_rate": 1.9201675626077892e-05, "loss": 0.0073, "step": 166240 }, { "epoch": 2.4, "learning_rate": 1.920162758633942e-05, "loss": 0.0066, "step": 166250 }, { "epoch": 2.4, "learning_rate": 1.920157954660095e-05, "loss": 0.0053, "step": 166260 }, { "epoch": 2.4, "learning_rate": 1.920153150686248e-05, "loss": 0.008, "step": 166270 }, { "epoch": 2.4, "learning_rate": 1.9201483467124006e-05, "loss": 0.0076, "step": 166280 }, { "epoch": 2.4, "learning_rate": 1.9201435427385535e-05, "loss": 0.0056, "step": 166290 }, { "epoch": 2.4, "learning_rate": 1.9201387387647064e-05, "loss": 0.006, "step": 166300 }, { "epoch": 2.4, "learning_rate": 1.920133934790859e-05, "loss": 0.0074, "step": 166310 }, { "epoch": 2.4, "learning_rate": 1.920129130817012e-05, "loss": 0.0096, "step": 166320 }, { "epoch": 2.4, "learning_rate": 1.920124326843165e-05, "loss": 0.0129, "step": 166330 }, { "epoch": 2.4, "learning_rate": 1.9201195228693178e-05, "loss": 0.0086, "step": 166340 }, { "epoch": 2.4, "learning_rate": 1.9201147188954704e-05, "loss": 0.0086, "step": 166350 }, { "epoch": 2.4, "learning_rate": 1.9201099149216233e-05, "loss": 0.0084, "step": 166360 }, { "epoch": 2.4, "learning_rate": 1.9201051109477762e-05, "loss": 0.0103, "step": 166370 }, { "epoch": 2.4, "learning_rate": 1.9201003069739292e-05, "loss": 0.0078, "step": 166380 }, { "epoch": 2.4, "learning_rate": 1.9200955030000818e-05, "loss": 0.0084, "step": 166390 }, { "epoch": 2.4, "learning_rate": 1.9200906990262347e-05, "loss": 0.0075, "step": 166400 }, { "epoch": 2.4, "learning_rate": 1.9200858950523876e-05, "loss": 0.0085, "step": 166410 }, { "epoch": 2.4, "learning_rate": 1.9200810910785402e-05, "loss": 0.0067, "step": 166420 }, { "epoch": 2.4, "learning_rate": 1.920076287104693e-05, "loss": 0.0111, "step": 166430 }, { "epoch": 2.4, "learning_rate": 1.920071483130846e-05, "loss": 0.0075, "step": 166440 }, { "epoch": 2.4, "learning_rate": 1.920066679156999e-05, "loss": 0.0063, "step": 166450 }, { "epoch": 2.4, "learning_rate": 1.9200618751831516e-05, "loss": 0.0101, "step": 166460 }, { "epoch": 2.4, "learning_rate": 1.9200570712093045e-05, "loss": 0.0088, "step": 166470 }, { "epoch": 2.4, "learning_rate": 1.9200522672354574e-05, "loss": 0.0075, "step": 166480 }, { "epoch": 2.4, "learning_rate": 1.92004746326161e-05, "loss": 0.0074, "step": 166490 }, { "epoch": 2.4, "learning_rate": 1.920042659287763e-05, "loss": 0.0081, "step": 166500 }, { "epoch": 2.4, "learning_rate": 1.920037855313916e-05, "loss": 0.0095, "step": 166510 }, { "epoch": 2.4, "learning_rate": 1.9200330513400688e-05, "loss": 0.0139, "step": 166520 }, { "epoch": 2.4, "learning_rate": 1.9200282473662214e-05, "loss": 0.007, "step": 166530 }, { "epoch": 2.4, "learning_rate": 1.9200234433923743e-05, "loss": 0.0088, "step": 166540 }, { "epoch": 2.4, "learning_rate": 1.9200186394185272e-05, "loss": 0.0076, "step": 166550 }, { "epoch": 2.4, "learning_rate": 1.92001383544468e-05, "loss": 0.0096, "step": 166560 }, { "epoch": 2.4, "learning_rate": 1.9200090314708327e-05, "loss": 0.0082, "step": 166570 }, { "epoch": 2.4, "learning_rate": 1.9200042274969857e-05, "loss": 0.0078, "step": 166580 }, { "epoch": 2.4, "learning_rate": 1.9199994235231386e-05, "loss": 0.0082, "step": 166590 }, { "epoch": 2.4, "learning_rate": 1.9199946195492912e-05, "loss": 0.0069, "step": 166600 }, { "epoch": 2.4, "learning_rate": 1.919989815575444e-05, "loss": 0.0068, "step": 166610 }, { "epoch": 2.4, "learning_rate": 1.919985011601597e-05, "loss": 0.0078, "step": 166620 }, { "epoch": 2.4, "learning_rate": 1.91998020762775e-05, "loss": 0.0053, "step": 166630 }, { "epoch": 2.4, "learning_rate": 1.9199754036539026e-05, "loss": 0.0088, "step": 166640 }, { "epoch": 2.4, "learning_rate": 1.9199705996800555e-05, "loss": 0.0076, "step": 166650 }, { "epoch": 2.4, "learning_rate": 1.9199657957062084e-05, "loss": 0.007, "step": 166660 }, { "epoch": 2.4, "learning_rate": 1.919960991732361e-05, "loss": 0.0064, "step": 166670 }, { "epoch": 2.4, "learning_rate": 1.919956187758514e-05, "loss": 0.0053, "step": 166680 }, { "epoch": 2.4, "learning_rate": 1.919951383784667e-05, "loss": 0.0051, "step": 166690 }, { "epoch": 2.4, "learning_rate": 1.9199465798108198e-05, "loss": 0.0082, "step": 166700 }, { "epoch": 2.4, "learning_rate": 1.9199417758369724e-05, "loss": 0.0072, "step": 166710 }, { "epoch": 2.4, "learning_rate": 1.9199369718631253e-05, "loss": 0.0043, "step": 166720 }, { "epoch": 2.4, "learning_rate": 1.9199321678892782e-05, "loss": 0.0065, "step": 166730 }, { "epoch": 2.4, "learning_rate": 1.919927363915431e-05, "loss": 0.007, "step": 166740 }, { "epoch": 2.4, "learning_rate": 1.9199225599415837e-05, "loss": 0.0067, "step": 166750 }, { "epoch": 2.4, "learning_rate": 1.9199177559677367e-05, "loss": 0.0045, "step": 166760 }, { "epoch": 2.4, "learning_rate": 1.9199129519938896e-05, "loss": 0.0094, "step": 166770 }, { "epoch": 2.4, "learning_rate": 1.9199081480200422e-05, "loss": 0.0077, "step": 166780 }, { "epoch": 2.4, "learning_rate": 1.919903344046195e-05, "loss": 0.0074, "step": 166790 }, { "epoch": 2.4, "learning_rate": 1.919898540072348e-05, "loss": 0.0084, "step": 166800 }, { "epoch": 2.4, "learning_rate": 1.919893736098501e-05, "loss": 0.0076, "step": 166810 }, { "epoch": 2.4, "learning_rate": 1.9198889321246536e-05, "loss": 0.0083, "step": 166820 }, { "epoch": 2.4, "learning_rate": 1.9198841281508065e-05, "loss": 0.007, "step": 166830 }, { "epoch": 2.4, "learning_rate": 1.9198793241769594e-05, "loss": 0.0102, "step": 166840 }, { "epoch": 2.4, "learning_rate": 1.919874520203112e-05, "loss": 0.0071, "step": 166850 }, { "epoch": 2.4, "learning_rate": 1.919869716229265e-05, "loss": 0.0066, "step": 166860 }, { "epoch": 2.4, "learning_rate": 1.919864912255418e-05, "loss": 0.0089, "step": 166870 }, { "epoch": 2.41, "learning_rate": 1.9198601082815708e-05, "loss": 0.0089, "step": 166880 }, { "epoch": 2.41, "learning_rate": 1.9198553043077234e-05, "loss": 0.0098, "step": 166890 }, { "epoch": 2.41, "learning_rate": 1.9198505003338763e-05, "loss": 0.0073, "step": 166900 }, { "epoch": 2.41, "learning_rate": 1.9198456963600292e-05, "loss": 0.0089, "step": 166910 }, { "epoch": 2.41, "learning_rate": 1.919840892386182e-05, "loss": 0.0075, "step": 166920 }, { "epoch": 2.41, "learning_rate": 1.9198360884123347e-05, "loss": 0.0081, "step": 166930 }, { "epoch": 2.41, "learning_rate": 1.9198312844384877e-05, "loss": 0.0088, "step": 166940 }, { "epoch": 2.41, "learning_rate": 1.9198264804646406e-05, "loss": 0.0088, "step": 166950 }, { "epoch": 2.41, "learning_rate": 1.9198216764907932e-05, "loss": 0.0064, "step": 166960 }, { "epoch": 2.41, "learning_rate": 1.919816872516946e-05, "loss": 0.0062, "step": 166970 }, { "epoch": 2.41, "learning_rate": 1.919812068543099e-05, "loss": 0.006, "step": 166980 }, { "epoch": 2.41, "learning_rate": 1.919807264569252e-05, "loss": 0.0128, "step": 166990 }, { "epoch": 2.41, "learning_rate": 1.9198024605954045e-05, "loss": 0.0055, "step": 167000 }, { "epoch": 2.41, "learning_rate": 1.9197976566215575e-05, "loss": 0.008, "step": 167010 }, { "epoch": 2.41, "learning_rate": 1.9197928526477104e-05, "loss": 0.0103, "step": 167020 }, { "epoch": 2.41, "learning_rate": 1.919788048673863e-05, "loss": 0.0096, "step": 167030 }, { "epoch": 2.41, "learning_rate": 1.919783244700016e-05, "loss": 0.008, "step": 167040 }, { "epoch": 2.41, "learning_rate": 1.919778440726169e-05, "loss": 0.0082, "step": 167050 }, { "epoch": 2.41, "learning_rate": 1.9197736367523218e-05, "loss": 0.0084, "step": 167060 }, { "epoch": 2.41, "learning_rate": 1.9197688327784744e-05, "loss": 0.0078, "step": 167070 }, { "epoch": 2.41, "learning_rate": 1.9197640288046273e-05, "loss": 0.0071, "step": 167080 }, { "epoch": 2.41, "learning_rate": 1.9197592248307802e-05, "loss": 0.0047, "step": 167090 }, { "epoch": 2.41, "learning_rate": 1.919754420856933e-05, "loss": 0.0051, "step": 167100 }, { "epoch": 2.41, "learning_rate": 1.9197496168830857e-05, "loss": 0.0129, "step": 167110 }, { "epoch": 2.41, "learning_rate": 1.9197448129092387e-05, "loss": 0.0075, "step": 167120 }, { "epoch": 2.41, "learning_rate": 1.9197400089353916e-05, "loss": 0.006, "step": 167130 }, { "epoch": 2.41, "learning_rate": 1.919735204961544e-05, "loss": 0.0054, "step": 167140 }, { "epoch": 2.41, "learning_rate": 1.919730881385082e-05, "loss": 0.0072, "step": 167150 }, { "epoch": 2.41, "learning_rate": 1.919726077411235e-05, "loss": 0.0057, "step": 167160 }, { "epoch": 2.41, "learning_rate": 1.9197212734373875e-05, "loss": 0.0055, "step": 167170 }, { "epoch": 2.41, "learning_rate": 1.9197164694635404e-05, "loss": 0.0068, "step": 167180 }, { "epoch": 2.41, "learning_rate": 1.9197116654896933e-05, "loss": 0.0063, "step": 167190 }, { "epoch": 2.41, "learning_rate": 1.919706861515846e-05, "loss": 0.011, "step": 167200 }, { "epoch": 2.41, "learning_rate": 1.919702057541999e-05, "loss": 0.0064, "step": 167210 }, { "epoch": 2.41, "learning_rate": 1.9196972535681518e-05, "loss": 0.0077, "step": 167220 }, { "epoch": 2.41, "learning_rate": 1.9196924495943047e-05, "loss": 0.008, "step": 167230 }, { "epoch": 2.41, "learning_rate": 1.9196876456204573e-05, "loss": 0.0089, "step": 167240 }, { "epoch": 2.41, "learning_rate": 1.9196828416466102e-05, "loss": 0.0082, "step": 167250 }, { "epoch": 2.41, "learning_rate": 1.919678037672763e-05, "loss": 0.0061, "step": 167260 }, { "epoch": 2.41, "learning_rate": 1.9196732336989157e-05, "loss": 0.0078, "step": 167270 }, { "epoch": 2.41, "learning_rate": 1.9196684297250687e-05, "loss": 0.0088, "step": 167280 }, { "epoch": 2.41, "learning_rate": 1.9196636257512216e-05, "loss": 0.0079, "step": 167290 }, { "epoch": 2.41, "learning_rate": 1.9196588217773745e-05, "loss": 0.0068, "step": 167300 }, { "epoch": 2.41, "learning_rate": 1.919654017803527e-05, "loss": 0.0089, "step": 167310 }, { "epoch": 2.41, "learning_rate": 1.91964921382968e-05, "loss": 0.0061, "step": 167320 }, { "epoch": 2.41, "learning_rate": 1.919644409855833e-05, "loss": 0.008, "step": 167330 }, { "epoch": 2.41, "learning_rate": 1.919639605881986e-05, "loss": 0.0089, "step": 167340 }, { "epoch": 2.41, "learning_rate": 1.9196348019081385e-05, "loss": 0.0089, "step": 167350 }, { "epoch": 2.41, "learning_rate": 1.9196299979342914e-05, "loss": 0.0083, "step": 167360 }, { "epoch": 2.41, "learning_rate": 1.9196251939604443e-05, "loss": 0.0063, "step": 167370 }, { "epoch": 2.41, "learning_rate": 1.919620389986597e-05, "loss": 0.0074, "step": 167380 }, { "epoch": 2.41, "learning_rate": 1.91961558601275e-05, "loss": 0.0098, "step": 167390 }, { "epoch": 2.41, "learning_rate": 1.9196107820389028e-05, "loss": 0.0097, "step": 167400 }, { "epoch": 2.41, "learning_rate": 1.9196059780650557e-05, "loss": 0.0108, "step": 167410 }, { "epoch": 2.41, "learning_rate": 1.9196011740912083e-05, "loss": 0.0071, "step": 167420 }, { "epoch": 2.41, "learning_rate": 1.9195963701173612e-05, "loss": 0.0096, "step": 167430 }, { "epoch": 2.41, "learning_rate": 1.919591566143514e-05, "loss": 0.0068, "step": 167440 }, { "epoch": 2.41, "learning_rate": 1.9195867621696667e-05, "loss": 0.0071, "step": 167450 }, { "epoch": 2.41, "learning_rate": 1.9195819581958197e-05, "loss": 0.0068, "step": 167460 }, { "epoch": 2.41, "learning_rate": 1.9195771542219726e-05, "loss": 0.0083, "step": 167470 }, { "epoch": 2.41, "learning_rate": 1.9195723502481255e-05, "loss": 0.0062, "step": 167480 }, { "epoch": 2.41, "learning_rate": 1.919567546274278e-05, "loss": 0.0093, "step": 167490 }, { "epoch": 2.41, "learning_rate": 1.919562742300431e-05, "loss": 0.008, "step": 167500 }, { "epoch": 2.41, "learning_rate": 1.919557938326584e-05, "loss": 0.0123, "step": 167510 }, { "epoch": 2.41, "learning_rate": 1.919553134352737e-05, "loss": 0.0083, "step": 167520 }, { "epoch": 2.41, "learning_rate": 1.9195483303788895e-05, "loss": 0.0071, "step": 167530 }, { "epoch": 2.41, "learning_rate": 1.9195435264050424e-05, "loss": 0.0074, "step": 167540 }, { "epoch": 2.41, "learning_rate": 1.9195387224311953e-05, "loss": 0.0073, "step": 167550 }, { "epoch": 2.41, "learning_rate": 1.919533918457348e-05, "loss": 0.0069, "step": 167560 }, { "epoch": 2.42, "learning_rate": 1.919529114483501e-05, "loss": 0.0068, "step": 167570 }, { "epoch": 2.42, "learning_rate": 1.9195243105096538e-05, "loss": 0.006, "step": 167580 }, { "epoch": 2.42, "learning_rate": 1.9195195065358067e-05, "loss": 0.0069, "step": 167590 }, { "epoch": 2.42, "learning_rate": 1.9195147025619593e-05, "loss": 0.0091, "step": 167600 }, { "epoch": 2.42, "learning_rate": 1.9195098985881122e-05, "loss": 0.0079, "step": 167610 }, { "epoch": 2.42, "learning_rate": 1.919505094614265e-05, "loss": 0.0067, "step": 167620 }, { "epoch": 2.42, "learning_rate": 1.9195002906404177e-05, "loss": 0.006, "step": 167630 }, { "epoch": 2.42, "learning_rate": 1.9194954866665706e-05, "loss": 0.0104, "step": 167640 }, { "epoch": 2.42, "learning_rate": 1.9194906826927236e-05, "loss": 0.0111, "step": 167650 }, { "epoch": 2.42, "learning_rate": 1.9194858787188765e-05, "loss": 0.0063, "step": 167660 }, { "epoch": 2.42, "learning_rate": 1.919481074745029e-05, "loss": 0.0092, "step": 167670 }, { "epoch": 2.42, "learning_rate": 1.919476270771182e-05, "loss": 0.0085, "step": 167680 }, { "epoch": 2.42, "learning_rate": 1.919471466797335e-05, "loss": 0.0113, "step": 167690 }, { "epoch": 2.42, "learning_rate": 1.919466662823488e-05, "loss": 0.0056, "step": 167700 }, { "epoch": 2.42, "learning_rate": 1.9194618588496405e-05, "loss": 0.0068, "step": 167710 }, { "epoch": 2.42, "learning_rate": 1.9194570548757934e-05, "loss": 0.0073, "step": 167720 }, { "epoch": 2.42, "learning_rate": 1.9194522509019463e-05, "loss": 0.0088, "step": 167730 }, { "epoch": 2.42, "learning_rate": 1.919447446928099e-05, "loss": 0.0057, "step": 167740 }, { "epoch": 2.42, "learning_rate": 1.9194426429542518e-05, "loss": 0.0072, "step": 167750 }, { "epoch": 2.42, "learning_rate": 1.9194378389804048e-05, "loss": 0.0067, "step": 167760 }, { "epoch": 2.42, "learning_rate": 1.9194330350065577e-05, "loss": 0.0055, "step": 167770 }, { "epoch": 2.42, "learning_rate": 1.9194282310327103e-05, "loss": 0.011, "step": 167780 }, { "epoch": 2.42, "learning_rate": 1.9194234270588632e-05, "loss": 0.0081, "step": 167790 }, { "epoch": 2.42, "learning_rate": 1.919418623085016e-05, "loss": 0.0099, "step": 167800 }, { "epoch": 2.42, "learning_rate": 1.9194138191111687e-05, "loss": 0.0098, "step": 167810 }, { "epoch": 2.42, "learning_rate": 1.9194090151373216e-05, "loss": 0.007, "step": 167820 }, { "epoch": 2.42, "learning_rate": 1.9194042111634746e-05, "loss": 0.0064, "step": 167830 }, { "epoch": 2.42, "learning_rate": 1.9193994071896275e-05, "loss": 0.0081, "step": 167840 }, { "epoch": 2.42, "learning_rate": 1.91939460321578e-05, "loss": 0.007, "step": 167850 }, { "epoch": 2.42, "learning_rate": 1.919389799241933e-05, "loss": 0.0104, "step": 167860 }, { "epoch": 2.42, "learning_rate": 1.919384995268086e-05, "loss": 0.0069, "step": 167870 }, { "epoch": 2.42, "learning_rate": 1.9193801912942385e-05, "loss": 0.0077, "step": 167880 }, { "epoch": 2.42, "learning_rate": 1.9193753873203915e-05, "loss": 0.0102, "step": 167890 }, { "epoch": 2.42, "learning_rate": 1.9193705833465444e-05, "loss": 0.0074, "step": 167900 }, { "epoch": 2.42, "learning_rate": 1.9193657793726973e-05, "loss": 0.0076, "step": 167910 }, { "epoch": 2.42, "learning_rate": 1.91936097539885e-05, "loss": 0.0065, "step": 167920 }, { "epoch": 2.42, "learning_rate": 1.9193561714250028e-05, "loss": 0.0098, "step": 167930 }, { "epoch": 2.42, "learning_rate": 1.9193513674511557e-05, "loss": 0.0037, "step": 167940 }, { "epoch": 2.42, "learning_rate": 1.9193465634773087e-05, "loss": 0.0054, "step": 167950 }, { "epoch": 2.42, "learning_rate": 1.9193417595034613e-05, "loss": 0.0095, "step": 167960 }, { "epoch": 2.42, "learning_rate": 1.9193369555296142e-05, "loss": 0.0081, "step": 167970 }, { "epoch": 2.42, "learning_rate": 1.919332151555767e-05, "loss": 0.0096, "step": 167980 }, { "epoch": 2.42, "learning_rate": 1.9193273475819197e-05, "loss": 0.0073, "step": 167990 }, { "epoch": 2.42, "learning_rate": 1.9193225436080726e-05, "loss": 0.0051, "step": 168000 }, { "epoch": 2.42, "learning_rate": 1.9193177396342256e-05, "loss": 0.0092, "step": 168010 }, { "epoch": 2.42, "learning_rate": 1.9193129356603785e-05, "loss": 0.0064, "step": 168020 }, { "epoch": 2.42, "learning_rate": 1.919308131686531e-05, "loss": 0.009, "step": 168030 }, { "epoch": 2.42, "learning_rate": 1.919303327712684e-05, "loss": 0.01, "step": 168040 }, { "epoch": 2.42, "learning_rate": 1.919298523738837e-05, "loss": 0.0055, "step": 168050 }, { "epoch": 2.42, "learning_rate": 1.9192937197649895e-05, "loss": 0.0063, "step": 168060 }, { "epoch": 2.42, "learning_rate": 1.9192889157911424e-05, "loss": 0.0068, "step": 168070 }, { "epoch": 2.42, "learning_rate": 1.9192841118172954e-05, "loss": 0.0069, "step": 168080 }, { "epoch": 2.42, "learning_rate": 1.9192793078434483e-05, "loss": 0.0072, "step": 168090 }, { "epoch": 2.42, "learning_rate": 1.919274503869601e-05, "loss": 0.0059, "step": 168100 }, { "epoch": 2.42, "learning_rate": 1.9192696998957538e-05, "loss": 0.0087, "step": 168110 }, { "epoch": 2.42, "learning_rate": 1.9192648959219067e-05, "loss": 0.009, "step": 168120 }, { "epoch": 2.42, "learning_rate": 1.9192600919480597e-05, "loss": 0.0053, "step": 168130 }, { "epoch": 2.42, "learning_rate": 1.919255768371597e-05, "loss": 0.006, "step": 168140 }, { "epoch": 2.42, "learning_rate": 1.91925096439775e-05, "loss": 0.01, "step": 168150 }, { "epoch": 2.42, "learning_rate": 1.9192461604239026e-05, "loss": 0.0061, "step": 168160 }, { "epoch": 2.42, "learning_rate": 1.9192413564500556e-05, "loss": 0.0086, "step": 168170 }, { "epoch": 2.42, "learning_rate": 1.9192365524762085e-05, "loss": 0.0089, "step": 168180 }, { "epoch": 2.42, "learning_rate": 1.9192317485023614e-05, "loss": 0.0056, "step": 168190 }, { "epoch": 2.42, "learning_rate": 1.919226944528514e-05, "loss": 0.009, "step": 168200 }, { "epoch": 2.42, "learning_rate": 1.919222140554667e-05, "loss": 0.0069, "step": 168210 }, { "epoch": 2.42, "learning_rate": 1.91921733658082e-05, "loss": 0.0088, "step": 168220 }, { "epoch": 2.42, "learning_rate": 1.9192125326069725e-05, "loss": 0.0065, "step": 168230 }, { "epoch": 2.42, "learning_rate": 1.9192077286331254e-05, "loss": 0.0076, "step": 168240 }, { "epoch": 2.42, "learning_rate": 1.9192029246592783e-05, "loss": 0.0084, "step": 168250 }, { "epoch": 2.42, "learning_rate": 1.9191981206854312e-05, "loss": 0.0084, "step": 168260 }, { "epoch": 2.43, "learning_rate": 1.9191933167115838e-05, "loss": 0.0081, "step": 168270 }, { "epoch": 2.43, "learning_rate": 1.9191885127377368e-05, "loss": 0.0116, "step": 168280 }, { "epoch": 2.43, "learning_rate": 1.9191837087638897e-05, "loss": 0.0092, "step": 168290 }, { "epoch": 2.43, "learning_rate": 1.9191789047900423e-05, "loss": 0.0063, "step": 168300 }, { "epoch": 2.43, "learning_rate": 1.9191741008161952e-05, "loss": 0.0077, "step": 168310 }, { "epoch": 2.43, "learning_rate": 1.919169296842348e-05, "loss": 0.0049, "step": 168320 }, { "epoch": 2.43, "learning_rate": 1.919164492868501e-05, "loss": 0.0079, "step": 168330 }, { "epoch": 2.43, "learning_rate": 1.9191596888946536e-05, "loss": 0.0074, "step": 168340 }, { "epoch": 2.43, "learning_rate": 1.9191548849208066e-05, "loss": 0.0053, "step": 168350 }, { "epoch": 2.43, "learning_rate": 1.9191500809469595e-05, "loss": 0.0088, "step": 168360 }, { "epoch": 2.43, "learning_rate": 1.9191452769731124e-05, "loss": 0.0072, "step": 168370 }, { "epoch": 2.43, "learning_rate": 1.919140472999265e-05, "loss": 0.0078, "step": 168380 }, { "epoch": 2.43, "learning_rate": 1.919135669025418e-05, "loss": 0.0042, "step": 168390 }, { "epoch": 2.43, "learning_rate": 1.919130865051571e-05, "loss": 0.0078, "step": 168400 }, { "epoch": 2.43, "learning_rate": 1.9191260610777234e-05, "loss": 0.0076, "step": 168410 }, { "epoch": 2.43, "learning_rate": 1.9191212571038764e-05, "loss": 0.005, "step": 168420 }, { "epoch": 2.43, "learning_rate": 1.9191164531300293e-05, "loss": 0.0078, "step": 168430 }, { "epoch": 2.43, "learning_rate": 1.9191116491561822e-05, "loss": 0.0058, "step": 168440 }, { "epoch": 2.43, "learning_rate": 1.9191068451823348e-05, "loss": 0.0089, "step": 168450 }, { "epoch": 2.43, "learning_rate": 1.9191020412084877e-05, "loss": 0.0055, "step": 168460 }, { "epoch": 2.43, "learning_rate": 1.9190972372346407e-05, "loss": 0.0053, "step": 168470 }, { "epoch": 2.43, "learning_rate": 1.9190924332607933e-05, "loss": 0.0091, "step": 168480 }, { "epoch": 2.43, "learning_rate": 1.9190876292869462e-05, "loss": 0.0069, "step": 168490 }, { "epoch": 2.43, "learning_rate": 1.919082825313099e-05, "loss": 0.0092, "step": 168500 }, { "epoch": 2.43, "learning_rate": 1.919078021339252e-05, "loss": 0.0066, "step": 168510 }, { "epoch": 2.43, "learning_rate": 1.9190732173654046e-05, "loss": 0.0077, "step": 168520 }, { "epoch": 2.43, "learning_rate": 1.9190684133915576e-05, "loss": 0.008, "step": 168530 }, { "epoch": 2.43, "learning_rate": 1.9190636094177105e-05, "loss": 0.006, "step": 168540 }, { "epoch": 2.43, "learning_rate": 1.9190588054438634e-05, "loss": 0.0074, "step": 168550 }, { "epoch": 2.43, "learning_rate": 1.919054001470016e-05, "loss": 0.0056, "step": 168560 }, { "epoch": 2.43, "learning_rate": 1.919049197496169e-05, "loss": 0.0069, "step": 168570 }, { "epoch": 2.43, "learning_rate": 1.919044393522322e-05, "loss": 0.0079, "step": 168580 }, { "epoch": 2.43, "learning_rate": 1.9190395895484744e-05, "loss": 0.0098, "step": 168590 }, { "epoch": 2.43, "learning_rate": 1.9190347855746274e-05, "loss": 0.0102, "step": 168600 }, { "epoch": 2.43, "learning_rate": 1.9190299816007803e-05, "loss": 0.0074, "step": 168610 }, { "epoch": 2.43, "learning_rate": 1.9190251776269332e-05, "loss": 0.0056, "step": 168620 }, { "epoch": 2.43, "learning_rate": 1.9190203736530858e-05, "loss": 0.0086, "step": 168630 }, { "epoch": 2.43, "learning_rate": 1.9190155696792387e-05, "loss": 0.0085, "step": 168640 }, { "epoch": 2.43, "learning_rate": 1.9190107657053917e-05, "loss": 0.0077, "step": 168650 }, { "epoch": 2.43, "learning_rate": 1.9190059617315443e-05, "loss": 0.0054, "step": 168660 }, { "epoch": 2.43, "learning_rate": 1.9190011577576972e-05, "loss": 0.007, "step": 168670 }, { "epoch": 2.43, "learning_rate": 1.91899635378385e-05, "loss": 0.0064, "step": 168680 }, { "epoch": 2.43, "learning_rate": 1.918991549810003e-05, "loss": 0.0102, "step": 168690 }, { "epoch": 2.43, "learning_rate": 1.9189867458361556e-05, "loss": 0.0084, "step": 168700 }, { "epoch": 2.43, "learning_rate": 1.9189819418623085e-05, "loss": 0.0063, "step": 168710 }, { "epoch": 2.43, "learning_rate": 1.9189771378884615e-05, "loss": 0.0056, "step": 168720 }, { "epoch": 2.43, "learning_rate": 1.9189723339146144e-05, "loss": 0.0087, "step": 168730 }, { "epoch": 2.43, "learning_rate": 1.918967529940767e-05, "loss": 0.0071, "step": 168740 }, { "epoch": 2.43, "learning_rate": 1.91896272596692e-05, "loss": 0.0066, "step": 168750 }, { "epoch": 2.43, "learning_rate": 1.918957921993073e-05, "loss": 0.0195, "step": 168760 }, { "epoch": 2.43, "learning_rate": 1.9189531180192254e-05, "loss": 0.0088, "step": 168770 }, { "epoch": 2.43, "learning_rate": 1.9189483140453784e-05, "loss": 0.0077, "step": 168780 }, { "epoch": 2.43, "learning_rate": 1.9189435100715313e-05, "loss": 0.005, "step": 168790 }, { "epoch": 2.43, "learning_rate": 1.9189387060976842e-05, "loss": 0.0069, "step": 168800 }, { "epoch": 2.43, "learning_rate": 1.9189339021238368e-05, "loss": 0.0067, "step": 168810 }, { "epoch": 2.43, "learning_rate": 1.9189290981499897e-05, "loss": 0.0068, "step": 168820 }, { "epoch": 2.43, "learning_rate": 1.9189242941761427e-05, "loss": 0.0057, "step": 168830 }, { "epoch": 2.43, "learning_rate": 1.9189194902022952e-05, "loss": 0.0065, "step": 168840 }, { "epoch": 2.43, "learning_rate": 1.918914686228448e-05, "loss": 0.0064, "step": 168850 }, { "epoch": 2.43, "learning_rate": 1.918909882254601e-05, "loss": 0.0061, "step": 168860 }, { "epoch": 2.43, "learning_rate": 1.918905078280754e-05, "loss": 0.0087, "step": 168870 }, { "epoch": 2.43, "learning_rate": 1.9189002743069066e-05, "loss": 0.0076, "step": 168880 }, { "epoch": 2.43, "learning_rate": 1.9188954703330595e-05, "loss": 0.01, "step": 168890 }, { "epoch": 2.43, "learning_rate": 1.9188906663592125e-05, "loss": 0.0085, "step": 168900 }, { "epoch": 2.43, "learning_rate": 1.9188858623853654e-05, "loss": 0.0069, "step": 168910 }, { "epoch": 2.43, "learning_rate": 1.918881058411518e-05, "loss": 0.0062, "step": 168920 }, { "epoch": 2.43, "learning_rate": 1.918876254437671e-05, "loss": 0.0082, "step": 168930 }, { "epoch": 2.43, "learning_rate": 1.918871450463824e-05, "loss": 0.0145, "step": 168940 }, { "epoch": 2.43, "learning_rate": 1.9188666464899764e-05, "loss": 0.0082, "step": 168950 }, { "epoch": 2.44, "learning_rate": 1.9188618425161293e-05, "loss": 0.0077, "step": 168960 }, { "epoch": 2.44, "learning_rate": 1.9188570385422823e-05, "loss": 0.0087, "step": 168970 }, { "epoch": 2.44, "learning_rate": 1.9188522345684352e-05, "loss": 0.0078, "step": 168980 }, { "epoch": 2.44, "learning_rate": 1.9188474305945878e-05, "loss": 0.0064, "step": 168990 }, { "epoch": 2.44, "learning_rate": 1.9188426266207407e-05, "loss": 0.0058, "step": 169000 }, { "epoch": 2.44, "learning_rate": 1.9188378226468936e-05, "loss": 0.0069, "step": 169010 }, { "epoch": 2.44, "learning_rate": 1.9188330186730466e-05, "loss": 0.0091, "step": 169020 }, { "epoch": 2.44, "learning_rate": 1.9188282146991995e-05, "loss": 0.0132, "step": 169030 }, { "epoch": 2.44, "learning_rate": 1.9188234107253524e-05, "loss": 0.0049, "step": 169040 }, { "epoch": 2.44, "learning_rate": 1.918818606751505e-05, "loss": 0.0072, "step": 169050 }, { "epoch": 2.44, "learning_rate": 1.918813802777658e-05, "loss": 0.0069, "step": 169060 }, { "epoch": 2.44, "learning_rate": 1.918808998803811e-05, "loss": 0.0074, "step": 169070 }, { "epoch": 2.44, "learning_rate": 1.9188041948299635e-05, "loss": 0.0095, "step": 169080 }, { "epoch": 2.44, "learning_rate": 1.9187993908561164e-05, "loss": 0.0075, "step": 169090 }, { "epoch": 2.44, "learning_rate": 1.9187945868822693e-05, "loss": 0.0072, "step": 169100 }, { "epoch": 2.44, "learning_rate": 1.9187897829084222e-05, "loss": 0.0076, "step": 169110 }, { "epoch": 2.44, "learning_rate": 1.9187849789345748e-05, "loss": 0.0069, "step": 169120 }, { "epoch": 2.44, "learning_rate": 1.9187801749607278e-05, "loss": 0.0069, "step": 169130 }, { "epoch": 2.44, "learning_rate": 1.9187753709868807e-05, "loss": 0.0071, "step": 169140 }, { "epoch": 2.44, "learning_rate": 1.9187705670130333e-05, "loss": 0.0099, "step": 169150 }, { "epoch": 2.44, "learning_rate": 1.9187657630391862e-05, "loss": 0.0075, "step": 169160 }, { "epoch": 2.44, "learning_rate": 1.918760959065339e-05, "loss": 0.0068, "step": 169170 }, { "epoch": 2.44, "learning_rate": 1.918756155091492e-05, "loss": 0.0078, "step": 169180 }, { "epoch": 2.44, "learning_rate": 1.9187513511176446e-05, "loss": 0.0051, "step": 169190 }, { "epoch": 2.44, "learning_rate": 1.9187465471437976e-05, "loss": 0.0073, "step": 169200 }, { "epoch": 2.44, "learning_rate": 1.9187417431699505e-05, "loss": 0.0064, "step": 169210 }, { "epoch": 2.44, "learning_rate": 1.9187369391961034e-05, "loss": 0.0072, "step": 169220 }, { "epoch": 2.44, "learning_rate": 1.918732135222256e-05, "loss": 0.0107, "step": 169230 }, { "epoch": 2.44, "learning_rate": 1.918727331248409e-05, "loss": 0.0078, "step": 169240 }, { "epoch": 2.44, "learning_rate": 1.918722527274562e-05, "loss": 0.0075, "step": 169250 }, { "epoch": 2.44, "learning_rate": 1.9187177233007144e-05, "loss": 0.0086, "step": 169260 }, { "epoch": 2.44, "learning_rate": 1.9187129193268674e-05, "loss": 0.0092, "step": 169270 }, { "epoch": 2.44, "learning_rate": 1.9187081153530203e-05, "loss": 0.0084, "step": 169280 }, { "epoch": 2.44, "learning_rate": 1.9187033113791732e-05, "loss": 0.0088, "step": 169290 }, { "epoch": 2.44, "learning_rate": 1.9186985074053258e-05, "loss": 0.0083, "step": 169300 }, { "epoch": 2.44, "learning_rate": 1.9186937034314787e-05, "loss": 0.0055, "step": 169310 }, { "epoch": 2.44, "learning_rate": 1.9186888994576317e-05, "loss": 0.0081, "step": 169320 }, { "epoch": 2.44, "learning_rate": 1.9186840954837843e-05, "loss": 0.007, "step": 169330 }, { "epoch": 2.44, "learning_rate": 1.9186792915099372e-05, "loss": 0.0068, "step": 169340 }, { "epoch": 2.44, "learning_rate": 1.91867448753609e-05, "loss": 0.0092, "step": 169350 }, { "epoch": 2.44, "learning_rate": 1.918669683562243e-05, "loss": 0.0042, "step": 169360 }, { "epoch": 2.44, "learning_rate": 1.9186648795883956e-05, "loss": 0.0091, "step": 169370 }, { "epoch": 2.44, "learning_rate": 1.9186600756145486e-05, "loss": 0.01, "step": 169380 }, { "epoch": 2.44, "learning_rate": 1.9186552716407015e-05, "loss": 0.0099, "step": 169390 }, { "epoch": 2.44, "learning_rate": 1.9186504676668544e-05, "loss": 0.0086, "step": 169400 }, { "epoch": 2.44, "learning_rate": 1.918645663693007e-05, "loss": 0.0066, "step": 169410 }, { "epoch": 2.44, "learning_rate": 1.91864085971916e-05, "loss": 0.0089, "step": 169420 }, { "epoch": 2.44, "learning_rate": 1.918636055745313e-05, "loss": 0.006, "step": 169430 }, { "epoch": 2.44, "learning_rate": 1.9186312517714654e-05, "loss": 0.0059, "step": 169440 }, { "epoch": 2.44, "learning_rate": 1.9186264477976184e-05, "loss": 0.0065, "step": 169450 }, { "epoch": 2.44, "learning_rate": 1.9186216438237713e-05, "loss": 0.005, "step": 169460 }, { "epoch": 2.44, "learning_rate": 1.9186168398499242e-05, "loss": 0.0068, "step": 169470 }, { "epoch": 2.44, "learning_rate": 1.9186120358760768e-05, "loss": 0.0087, "step": 169480 }, { "epoch": 2.44, "learning_rate": 1.9186072319022297e-05, "loss": 0.0068, "step": 169490 }, { "epoch": 2.44, "learning_rate": 1.9186024279283827e-05, "loss": 0.012, "step": 169500 }, { "epoch": 2.44, "learning_rate": 1.9185976239545353e-05, "loss": 0.0089, "step": 169510 }, { "epoch": 2.44, "learning_rate": 1.9185928199806882e-05, "loss": 0.0085, "step": 169520 }, { "epoch": 2.44, "learning_rate": 1.918588016006841e-05, "loss": 0.0087, "step": 169530 }, { "epoch": 2.44, "learning_rate": 1.918583212032994e-05, "loss": 0.0066, "step": 169540 }, { "epoch": 2.44, "learning_rate": 1.9185784080591466e-05, "loss": 0.0075, "step": 169550 }, { "epoch": 2.44, "learning_rate": 1.9185736040852995e-05, "loss": 0.0104, "step": 169560 }, { "epoch": 2.44, "learning_rate": 1.9185688001114525e-05, "loss": 0.0095, "step": 169570 }, { "epoch": 2.44, "learning_rate": 1.9185639961376054e-05, "loss": 0.0075, "step": 169580 }, { "epoch": 2.44, "learning_rate": 1.918559192163758e-05, "loss": 0.0092, "step": 169590 }, { "epoch": 2.44, "learning_rate": 1.918554388189911e-05, "loss": 0.0072, "step": 169600 }, { "epoch": 2.44, "learning_rate": 1.918549584216064e-05, "loss": 0.0076, "step": 169610 }, { "epoch": 2.44, "learning_rate": 1.9185447802422164e-05, "loss": 0.0108, "step": 169620 }, { "epoch": 2.44, "learning_rate": 1.9185399762683694e-05, "loss": 0.0091, "step": 169630 }, { "epoch": 2.44, "learning_rate": 1.9185351722945223e-05, "loss": 0.0085, "step": 169640 }, { "epoch": 2.44, "learning_rate": 1.9185303683206752e-05, "loss": 0.0059, "step": 169650 }, { "epoch": 2.45, "learning_rate": 1.9185255643468278e-05, "loss": 0.0045, "step": 169660 }, { "epoch": 2.45, "learning_rate": 1.9185207603729807e-05, "loss": 0.0063, "step": 169670 }, { "epoch": 2.45, "learning_rate": 1.9185159563991337e-05, "loss": 0.0074, "step": 169680 }, { "epoch": 2.45, "learning_rate": 1.9185111524252862e-05, "loss": 0.0143, "step": 169690 }, { "epoch": 2.45, "learning_rate": 1.918506348451439e-05, "loss": 0.0102, "step": 169700 }, { "epoch": 2.45, "learning_rate": 1.918501544477592e-05, "loss": 0.0092, "step": 169710 }, { "epoch": 2.45, "learning_rate": 1.918496740503745e-05, "loss": 0.0078, "step": 169720 }, { "epoch": 2.45, "learning_rate": 1.9184919365298976e-05, "loss": 0.0064, "step": 169730 }, { "epoch": 2.45, "learning_rate": 1.9184871325560505e-05, "loss": 0.0095, "step": 169740 }, { "epoch": 2.45, "learning_rate": 1.9184823285822035e-05, "loss": 0.0095, "step": 169750 }, { "epoch": 2.45, "learning_rate": 1.9184775246083564e-05, "loss": 0.0065, "step": 169760 }, { "epoch": 2.45, "learning_rate": 1.918472720634509e-05, "loss": 0.0064, "step": 169770 }, { "epoch": 2.45, "learning_rate": 1.918467916660662e-05, "loss": 0.0047, "step": 169780 }, { "epoch": 2.45, "learning_rate": 1.918463112686815e-05, "loss": 0.0087, "step": 169790 }, { "epoch": 2.45, "learning_rate": 1.9184583087129674e-05, "loss": 0.0072, "step": 169800 }, { "epoch": 2.45, "learning_rate": 1.9184535047391203e-05, "loss": 0.0055, "step": 169810 }, { "epoch": 2.45, "learning_rate": 1.9184487007652733e-05, "loss": 0.0061, "step": 169820 }, { "epoch": 2.45, "learning_rate": 1.9184438967914262e-05, "loss": 0.0075, "step": 169830 }, { "epoch": 2.45, "learning_rate": 1.9184390928175788e-05, "loss": 0.0079, "step": 169840 }, { "epoch": 2.45, "learning_rate": 1.9184342888437317e-05, "loss": 0.0074, "step": 169850 }, { "epoch": 2.45, "learning_rate": 1.9184294848698846e-05, "loss": 0.0069, "step": 169860 }, { "epoch": 2.45, "learning_rate": 1.9184246808960372e-05, "loss": 0.0068, "step": 169870 }, { "epoch": 2.45, "learning_rate": 1.91841987692219e-05, "loss": 0.0098, "step": 169880 }, { "epoch": 2.45, "learning_rate": 1.918415072948343e-05, "loss": 0.0062, "step": 169890 }, { "epoch": 2.45, "learning_rate": 1.918410268974496e-05, "loss": 0.0065, "step": 169900 }, { "epoch": 2.45, "learning_rate": 1.9184054650006486e-05, "loss": 0.0092, "step": 169910 }, { "epoch": 2.45, "learning_rate": 1.9184006610268015e-05, "loss": 0.0077, "step": 169920 }, { "epoch": 2.45, "learning_rate": 1.9183958570529545e-05, "loss": 0.0071, "step": 169930 }, { "epoch": 2.45, "learning_rate": 1.9183910530791074e-05, "loss": 0.0067, "step": 169940 }, { "epoch": 2.45, "learning_rate": 1.91838624910526e-05, "loss": 0.0086, "step": 169950 }, { "epoch": 2.45, "learning_rate": 1.918381445131413e-05, "loss": 0.0091, "step": 169960 }, { "epoch": 2.45, "learning_rate": 1.9183766411575658e-05, "loss": 0.0065, "step": 169970 }, { "epoch": 2.45, "learning_rate": 1.9183718371837184e-05, "loss": 0.006, "step": 169980 }, { "epoch": 2.45, "learning_rate": 1.9183670332098713e-05, "loss": 0.0046, "step": 169990 }, { "epoch": 2.45, "learning_rate": 1.9183622292360243e-05, "loss": 0.0098, "step": 170000 }, { "epoch": 2.45, "learning_rate": 1.9183574252621772e-05, "loss": 0.0089, "step": 170010 }, { "epoch": 2.45, "learning_rate": 1.9183526212883298e-05, "loss": 0.0103, "step": 170020 }, { "epoch": 2.45, "learning_rate": 1.9183478173144827e-05, "loss": 0.0061, "step": 170030 }, { "epoch": 2.45, "learning_rate": 1.9183430133406356e-05, "loss": 0.0066, "step": 170040 }, { "epoch": 2.45, "learning_rate": 1.9183382093667882e-05, "loss": 0.008, "step": 170050 }, { "epoch": 2.45, "learning_rate": 1.918333405392941e-05, "loss": 0.0057, "step": 170060 }, { "epoch": 2.45, "learning_rate": 1.918328601419094e-05, "loss": 0.0058, "step": 170070 }, { "epoch": 2.45, "learning_rate": 1.918323797445247e-05, "loss": 0.0045, "step": 170080 }, { "epoch": 2.45, "learning_rate": 1.9183189934713996e-05, "loss": 0.0107, "step": 170090 }, { "epoch": 2.45, "learning_rate": 1.9183141894975525e-05, "loss": 0.0083, "step": 170100 }, { "epoch": 2.45, "learning_rate": 1.9183093855237054e-05, "loss": 0.0091, "step": 170110 }, { "epoch": 2.45, "learning_rate": 1.9183045815498584e-05, "loss": 0.0087, "step": 170120 }, { "epoch": 2.45, "learning_rate": 1.918299777576011e-05, "loss": 0.0084, "step": 170130 }, { "epoch": 2.45, "learning_rate": 1.918294973602164e-05, "loss": 0.0049, "step": 170140 }, { "epoch": 2.45, "learning_rate": 1.9182901696283168e-05, "loss": 0.0071, "step": 170150 }, { "epoch": 2.45, "learning_rate": 1.9182853656544694e-05, "loss": 0.006, "step": 170160 }, { "epoch": 2.45, "learning_rate": 1.9182805616806223e-05, "loss": 0.009, "step": 170170 }, { "epoch": 2.45, "learning_rate": 1.9182757577067753e-05, "loss": 0.0069, "step": 170180 }, { "epoch": 2.45, "learning_rate": 1.9182709537329282e-05, "loss": 0.0057, "step": 170190 }, { "epoch": 2.45, "learning_rate": 1.9182661497590808e-05, "loss": 0.0124, "step": 170200 }, { "epoch": 2.45, "learning_rate": 1.9182613457852337e-05, "loss": 0.0063, "step": 170210 }, { "epoch": 2.45, "learning_rate": 1.9182565418113866e-05, "loss": 0.007, "step": 170220 }, { "epoch": 2.45, "learning_rate": 1.9182517378375392e-05, "loss": 0.008, "step": 170230 }, { "epoch": 2.45, "learning_rate": 1.918246933863692e-05, "loss": 0.0101, "step": 170240 }, { "epoch": 2.45, "learning_rate": 1.918242129889845e-05, "loss": 0.0084, "step": 170250 }, { "epoch": 2.45, "learning_rate": 1.918237325915998e-05, "loss": 0.0079, "step": 170260 }, { "epoch": 2.45, "learning_rate": 1.9182325219421506e-05, "loss": 0.0075, "step": 170270 }, { "epoch": 2.45, "learning_rate": 1.9182277179683035e-05, "loss": 0.0068, "step": 170280 }, { "epoch": 2.45, "learning_rate": 1.9182229139944564e-05, "loss": 0.0089, "step": 170290 }, { "epoch": 2.45, "learning_rate": 1.9182181100206094e-05, "loss": 0.0089, "step": 170300 }, { "epoch": 2.45, "learning_rate": 1.918213306046762e-05, "loss": 0.0066, "step": 170310 }, { "epoch": 2.45, "learning_rate": 1.918208502072915e-05, "loss": 0.0091, "step": 170320 }, { "epoch": 2.45, "learning_rate": 1.9182036980990678e-05, "loss": 0.0065, "step": 170330 }, { "epoch": 2.45, "learning_rate": 1.9181988941252204e-05, "loss": 0.0071, "step": 170340 }, { "epoch": 2.46, "learning_rate": 1.9181940901513733e-05, "loss": 0.0072, "step": 170350 }, { "epoch": 2.46, "learning_rate": 1.9181892861775263e-05, "loss": 0.008, "step": 170360 }, { "epoch": 2.46, "learning_rate": 1.9181844822036792e-05, "loss": 0.0084, "step": 170370 }, { "epoch": 2.46, "learning_rate": 1.9181796782298318e-05, "loss": 0.0112, "step": 170380 }, { "epoch": 2.46, "learning_rate": 1.9181748742559847e-05, "loss": 0.0066, "step": 170390 }, { "epoch": 2.46, "learning_rate": 1.9181700702821376e-05, "loss": 0.0072, "step": 170400 }, { "epoch": 2.46, "learning_rate": 1.9181652663082902e-05, "loss": 0.0073, "step": 170410 }, { "epoch": 2.46, "learning_rate": 1.918160462334443e-05, "loss": 0.0074, "step": 170420 }, { "epoch": 2.46, "learning_rate": 1.918155658360596e-05, "loss": 0.0085, "step": 170430 }, { "epoch": 2.46, "learning_rate": 1.918150854386749e-05, "loss": 0.006, "step": 170440 }, { "epoch": 2.46, "learning_rate": 1.9181460504129016e-05, "loss": 0.0098, "step": 170450 }, { "epoch": 2.46, "learning_rate": 1.9181412464390545e-05, "loss": 0.0055, "step": 170460 }, { "epoch": 2.46, "learning_rate": 1.9181364424652074e-05, "loss": 0.0073, "step": 170470 }, { "epoch": 2.46, "learning_rate": 1.9181316384913604e-05, "loss": 0.0083, "step": 170480 }, { "epoch": 2.46, "learning_rate": 1.918126834517513e-05, "loss": 0.009, "step": 170490 }, { "epoch": 2.46, "learning_rate": 1.918122030543666e-05, "loss": 0.0056, "step": 170500 }, { "epoch": 2.46, "learning_rate": 1.9181172265698188e-05, "loss": 0.0062, "step": 170510 }, { "epoch": 2.46, "learning_rate": 1.9181124225959714e-05, "loss": 0.0086, "step": 170520 }, { "epoch": 2.46, "learning_rate": 1.9181076186221243e-05, "loss": 0.0055, "step": 170530 }, { "epoch": 2.46, "learning_rate": 1.9181028146482772e-05, "loss": 0.0106, "step": 170540 }, { "epoch": 2.46, "learning_rate": 1.91809801067443e-05, "loss": 0.0104, "step": 170550 }, { "epoch": 2.46, "learning_rate": 1.9180932067005828e-05, "loss": 0.0062, "step": 170560 }, { "epoch": 2.46, "learning_rate": 1.9180884027267357e-05, "loss": 0.0053, "step": 170570 }, { "epoch": 2.46, "learning_rate": 1.9180835987528886e-05, "loss": 0.006, "step": 170580 }, { "epoch": 2.46, "learning_rate": 1.9180787947790412e-05, "loss": 0.0072, "step": 170590 }, { "epoch": 2.46, "learning_rate": 1.918073990805194e-05, "loss": 0.0054, "step": 170600 }, { "epoch": 2.46, "learning_rate": 1.918069186831347e-05, "loss": 0.0068, "step": 170610 }, { "epoch": 2.46, "learning_rate": 1.9180643828575e-05, "loss": 0.0073, "step": 170620 }, { "epoch": 2.46, "learning_rate": 1.9180595788836526e-05, "loss": 0.0071, "step": 170630 }, { "epoch": 2.46, "learning_rate": 1.9180547749098055e-05, "loss": 0.0067, "step": 170640 }, { "epoch": 2.46, "learning_rate": 1.9180499709359584e-05, "loss": 0.0092, "step": 170650 }, { "epoch": 2.46, "learning_rate": 1.9180451669621113e-05, "loss": 0.0047, "step": 170660 }, { "epoch": 2.46, "learning_rate": 1.918040362988264e-05, "loss": 0.0065, "step": 170670 }, { "epoch": 2.46, "learning_rate": 1.918035559014417e-05, "loss": 0.0074, "step": 170680 }, { "epoch": 2.46, "learning_rate": 1.9180307550405698e-05, "loss": 0.0074, "step": 170690 }, { "epoch": 2.46, "learning_rate": 1.9180259510667224e-05, "loss": 0.0051, "step": 170700 }, { "epoch": 2.46, "learning_rate": 1.9180211470928753e-05, "loss": 0.0091, "step": 170710 }, { "epoch": 2.46, "learning_rate": 1.9180163431190282e-05, "loss": 0.0063, "step": 170720 }, { "epoch": 2.46, "learning_rate": 1.918011539145181e-05, "loss": 0.0071, "step": 170730 }, { "epoch": 2.46, "learning_rate": 1.9180067351713337e-05, "loss": 0.009, "step": 170740 }, { "epoch": 2.46, "learning_rate": 1.9180019311974867e-05, "loss": 0.0094, "step": 170750 }, { "epoch": 2.46, "learning_rate": 1.9179971272236396e-05, "loss": 0.0065, "step": 170760 }, { "epoch": 2.46, "learning_rate": 1.9179923232497922e-05, "loss": 0.0063, "step": 170770 }, { "epoch": 2.46, "learning_rate": 1.917987519275945e-05, "loss": 0.0064, "step": 170780 }, { "epoch": 2.46, "learning_rate": 1.917982715302098e-05, "loss": 0.0059, "step": 170790 }, { "epoch": 2.46, "learning_rate": 1.917977911328251e-05, "loss": 0.0075, "step": 170800 }, { "epoch": 2.46, "learning_rate": 1.9179731073544036e-05, "loss": 0.0099, "step": 170810 }, { "epoch": 2.46, "learning_rate": 1.9179683033805565e-05, "loss": 0.0089, "step": 170820 }, { "epoch": 2.46, "learning_rate": 1.9179634994067094e-05, "loss": 0.0106, "step": 170830 }, { "epoch": 2.46, "learning_rate": 1.9179586954328623e-05, "loss": 0.007, "step": 170840 }, { "epoch": 2.46, "learning_rate": 1.917953891459015e-05, "loss": 0.0066, "step": 170850 }, { "epoch": 2.46, "learning_rate": 1.917949087485168e-05, "loss": 0.0056, "step": 170860 }, { "epoch": 2.46, "learning_rate": 1.9179442835113208e-05, "loss": 0.0067, "step": 170870 }, { "epoch": 2.46, "learning_rate": 1.9179394795374734e-05, "loss": 0.0071, "step": 170880 }, { "epoch": 2.46, "learning_rate": 1.9179346755636263e-05, "loss": 0.0064, "step": 170890 }, { "epoch": 2.46, "learning_rate": 1.9179298715897792e-05, "loss": 0.0089, "step": 170900 }, { "epoch": 2.46, "learning_rate": 1.917925067615932e-05, "loss": 0.0087, "step": 170910 }, { "epoch": 2.46, "learning_rate": 1.9179202636420847e-05, "loss": 0.0075, "step": 170920 }, { "epoch": 2.46, "learning_rate": 1.9179154596682377e-05, "loss": 0.0087, "step": 170930 }, { "epoch": 2.46, "learning_rate": 1.9179106556943906e-05, "loss": 0.0047, "step": 170940 }, { "epoch": 2.46, "learning_rate": 1.9179058517205432e-05, "loss": 0.0063, "step": 170950 }, { "epoch": 2.46, "learning_rate": 1.917901047746696e-05, "loss": 0.0053, "step": 170960 }, { "epoch": 2.46, "learning_rate": 1.917896243772849e-05, "loss": 0.0067, "step": 170970 }, { "epoch": 2.46, "learning_rate": 1.917891439799002e-05, "loss": 0.0056, "step": 170980 }, { "epoch": 2.46, "learning_rate": 1.9178866358251546e-05, "loss": 0.0074, "step": 170990 }, { "epoch": 2.46, "learning_rate": 1.9178818318513075e-05, "loss": 0.005, "step": 171000 }, { "epoch": 2.46, "learning_rate": 1.9178770278774604e-05, "loss": 0.0101, "step": 171010 }, { "epoch": 2.46, "learning_rate": 1.917872223903613e-05, "loss": 0.0097, "step": 171020 }, { "epoch": 2.46, "learning_rate": 1.917867419929766e-05, "loss": 0.0064, "step": 171030 }, { "epoch": 2.47, "learning_rate": 1.917862615955919e-05, "loss": 0.0062, "step": 171040 }, { "epoch": 2.47, "learning_rate": 1.9178578119820718e-05, "loss": 0.0074, "step": 171050 }, { "epoch": 2.47, "learning_rate": 1.9178530080082244e-05, "loss": 0.0067, "step": 171060 }, { "epoch": 2.47, "learning_rate": 1.9178482040343773e-05, "loss": 0.0055, "step": 171070 }, { "epoch": 2.47, "learning_rate": 1.9178434000605302e-05, "loss": 0.0055, "step": 171080 }, { "epoch": 2.47, "learning_rate": 1.917838596086683e-05, "loss": 0.0059, "step": 171090 }, { "epoch": 2.47, "learning_rate": 1.9178337921128357e-05, "loss": 0.007, "step": 171100 }, { "epoch": 2.47, "learning_rate": 1.9178289881389887e-05, "loss": 0.008, "step": 171110 }, { "epoch": 2.47, "learning_rate": 1.9178241841651416e-05, "loss": 0.009, "step": 171120 }, { "epoch": 2.47, "learning_rate": 1.9178193801912942e-05, "loss": 0.0112, "step": 171130 }, { "epoch": 2.47, "learning_rate": 1.917814576217447e-05, "loss": 0.0117, "step": 171140 }, { "epoch": 2.47, "learning_rate": 1.9178097722436e-05, "loss": 0.008, "step": 171150 }, { "epoch": 2.47, "learning_rate": 1.917804968269753e-05, "loss": 0.0075, "step": 171160 }, { "epoch": 2.47, "learning_rate": 1.9178001642959055e-05, "loss": 0.0067, "step": 171170 }, { "epoch": 2.47, "learning_rate": 1.9177953603220585e-05, "loss": 0.0037, "step": 171180 }, { "epoch": 2.47, "learning_rate": 1.9177905563482114e-05, "loss": 0.0088, "step": 171190 }, { "epoch": 2.47, "learning_rate": 1.917785752374364e-05, "loss": 0.0074, "step": 171200 }, { "epoch": 2.47, "learning_rate": 1.917780948400517e-05, "loss": 0.0099, "step": 171210 }, { "epoch": 2.47, "learning_rate": 1.91777614442667e-05, "loss": 0.0098, "step": 171220 }, { "epoch": 2.47, "learning_rate": 1.9177713404528228e-05, "loss": 0.0086, "step": 171230 }, { "epoch": 2.47, "learning_rate": 1.9177665364789754e-05, "loss": 0.0082, "step": 171240 }, { "epoch": 2.47, "learning_rate": 1.9177617325051283e-05, "loss": 0.0065, "step": 171250 }, { "epoch": 2.47, "learning_rate": 1.9177569285312812e-05, "loss": 0.0072, "step": 171260 }, { "epoch": 2.47, "learning_rate": 1.917752124557434e-05, "loss": 0.0081, "step": 171270 }, { "epoch": 2.47, "learning_rate": 1.9177473205835867e-05, "loss": 0.0076, "step": 171280 }, { "epoch": 2.47, "learning_rate": 1.9177425166097397e-05, "loss": 0.0087, "step": 171290 }, { "epoch": 2.47, "learning_rate": 1.9177377126358926e-05, "loss": 0.0056, "step": 171300 }, { "epoch": 2.47, "learning_rate": 1.917732908662045e-05, "loss": 0.0061, "step": 171310 }, { "epoch": 2.47, "learning_rate": 1.917728104688198e-05, "loss": 0.0074, "step": 171320 }, { "epoch": 2.47, "learning_rate": 1.917723300714351e-05, "loss": 0.0078, "step": 171330 }, { "epoch": 2.47, "learning_rate": 1.917718496740504e-05, "loss": 0.0086, "step": 171340 }, { "epoch": 2.47, "learning_rate": 1.9177136927666565e-05, "loss": 0.009, "step": 171350 }, { "epoch": 2.47, "learning_rate": 1.9177088887928095e-05, "loss": 0.0082, "step": 171360 }, { "epoch": 2.47, "learning_rate": 1.9177040848189624e-05, "loss": 0.0081, "step": 171370 }, { "epoch": 2.47, "learning_rate": 1.917699280845115e-05, "loss": 0.0077, "step": 171380 }, { "epoch": 2.47, "learning_rate": 1.917694476871268e-05, "loss": 0.0088, "step": 171390 }, { "epoch": 2.47, "learning_rate": 1.9176896728974208e-05, "loss": 0.0068, "step": 171400 }, { "epoch": 2.47, "learning_rate": 1.9176848689235738e-05, "loss": 0.0057, "step": 171410 }, { "epoch": 2.47, "learning_rate": 1.9176800649497263e-05, "loss": 0.0067, "step": 171420 }, { "epoch": 2.47, "learning_rate": 1.9176752609758793e-05, "loss": 0.0064, "step": 171430 }, { "epoch": 2.47, "learning_rate": 1.9176704570020322e-05, "loss": 0.0087, "step": 171440 }, { "epoch": 2.47, "learning_rate": 1.917665653028185e-05, "loss": 0.0061, "step": 171450 }, { "epoch": 2.47, "learning_rate": 1.9176608490543377e-05, "loss": 0.0086, "step": 171460 }, { "epoch": 2.47, "learning_rate": 1.9176560450804906e-05, "loss": 0.006, "step": 171470 }, { "epoch": 2.47, "learning_rate": 1.9176512411066436e-05, "loss": 0.0076, "step": 171480 }, { "epoch": 2.47, "learning_rate": 1.917646437132796e-05, "loss": 0.008, "step": 171490 }, { "epoch": 2.47, "learning_rate": 1.917641633158949e-05, "loss": 0.0054, "step": 171500 }, { "epoch": 2.47, "learning_rate": 1.917636829185102e-05, "loss": 0.0057, "step": 171510 }, { "epoch": 2.47, "learning_rate": 1.917632025211255e-05, "loss": 0.0064, "step": 171520 }, { "epoch": 2.47, "learning_rate": 1.9176272212374075e-05, "loss": 0.0065, "step": 171530 }, { "epoch": 2.47, "learning_rate": 1.9176224172635605e-05, "loss": 0.0053, "step": 171540 }, { "epoch": 2.47, "learning_rate": 1.9176176132897134e-05, "loss": 0.0079, "step": 171550 }, { "epoch": 2.47, "learning_rate": 1.917612809315866e-05, "loss": 0.0047, "step": 171560 }, { "epoch": 2.47, "learning_rate": 1.9176080053420192e-05, "loss": 0.0077, "step": 171570 }, { "epoch": 2.47, "learning_rate": 1.917603201368172e-05, "loss": 0.008, "step": 171580 }, { "epoch": 2.47, "learning_rate": 1.9175983973943247e-05, "loss": 0.0048, "step": 171590 }, { "epoch": 2.47, "learning_rate": 1.9175935934204777e-05, "loss": 0.008, "step": 171600 }, { "epoch": 2.47, "learning_rate": 1.9175887894466306e-05, "loss": 0.0072, "step": 171610 }, { "epoch": 2.47, "learning_rate": 1.9175839854727832e-05, "loss": 0.0077, "step": 171620 }, { "epoch": 2.47, "learning_rate": 1.917579181498936e-05, "loss": 0.0082, "step": 171630 }, { "epoch": 2.47, "learning_rate": 1.917574377525089e-05, "loss": 0.0073, "step": 171640 }, { "epoch": 2.47, "learning_rate": 1.917569573551242e-05, "loss": 0.0082, "step": 171650 }, { "epoch": 2.47, "learning_rate": 1.9175647695773946e-05, "loss": 0.0066, "step": 171660 }, { "epoch": 2.47, "learning_rate": 1.9175599656035475e-05, "loss": 0.0097, "step": 171670 }, { "epoch": 2.47, "learning_rate": 1.9175551616297004e-05, "loss": 0.0092, "step": 171680 }, { "epoch": 2.47, "learning_rate": 1.9175503576558533e-05, "loss": 0.014, "step": 171690 }, { "epoch": 2.47, "learning_rate": 1.917545553682006e-05, "loss": 0.0056, "step": 171700 }, { "epoch": 2.47, "learning_rate": 1.917540749708159e-05, "loss": 0.0088, "step": 171710 }, { "epoch": 2.47, "learning_rate": 1.9175359457343118e-05, "loss": 0.0076, "step": 171720 }, { "epoch": 2.47, "learning_rate": 1.9175311417604644e-05, "loss": 0.0081, "step": 171730 }, { "epoch": 2.48, "learning_rate": 1.9175263377866173e-05, "loss": 0.0065, "step": 171740 }, { "epoch": 2.48, "learning_rate": 1.9175215338127702e-05, "loss": 0.0116, "step": 171750 }, { "epoch": 2.48, "learning_rate": 1.917516729838923e-05, "loss": 0.0093, "step": 171760 }, { "epoch": 2.48, "learning_rate": 1.9175119258650757e-05, "loss": 0.0064, "step": 171770 }, { "epoch": 2.48, "learning_rate": 1.9175071218912287e-05, "loss": 0.0067, "step": 171780 }, { "epoch": 2.48, "learning_rate": 1.9175023179173816e-05, "loss": 0.0058, "step": 171790 }, { "epoch": 2.48, "learning_rate": 1.9174975139435342e-05, "loss": 0.0057, "step": 171800 }, { "epoch": 2.48, "learning_rate": 1.917492709969687e-05, "loss": 0.0077, "step": 171810 }, { "epoch": 2.48, "learning_rate": 1.91748790599584e-05, "loss": 0.0059, "step": 171820 }, { "epoch": 2.48, "learning_rate": 1.917483102021993e-05, "loss": 0.0058, "step": 171830 }, { "epoch": 2.48, "learning_rate": 1.9174782980481456e-05, "loss": 0.006, "step": 171840 }, { "epoch": 2.48, "learning_rate": 1.9174734940742985e-05, "loss": 0.0115, "step": 171850 }, { "epoch": 2.48, "learning_rate": 1.9174686901004514e-05, "loss": 0.0053, "step": 171860 }, { "epoch": 2.48, "learning_rate": 1.9174638861266043e-05, "loss": 0.0082, "step": 171870 }, { "epoch": 2.48, "learning_rate": 1.917459082152757e-05, "loss": 0.006, "step": 171880 }, { "epoch": 2.48, "learning_rate": 1.91745427817891e-05, "loss": 0.0083, "step": 171890 }, { "epoch": 2.48, "learning_rate": 1.9174494742050628e-05, "loss": 0.013, "step": 171900 }, { "epoch": 2.48, "learning_rate": 1.9174446702312154e-05, "loss": 0.0098, "step": 171910 }, { "epoch": 2.48, "learning_rate": 1.9174398662573683e-05, "loss": 0.0078, "step": 171920 }, { "epoch": 2.48, "learning_rate": 1.9174350622835212e-05, "loss": 0.0096, "step": 171930 }, { "epoch": 2.48, "learning_rate": 1.917430258309674e-05, "loss": 0.0063, "step": 171940 }, { "epoch": 2.48, "learning_rate": 1.9174254543358267e-05, "loss": 0.0095, "step": 171950 }, { "epoch": 2.48, "learning_rate": 1.9174206503619797e-05, "loss": 0.0088, "step": 171960 }, { "epoch": 2.48, "learning_rate": 1.9174158463881326e-05, "loss": 0.0082, "step": 171970 }, { "epoch": 2.48, "learning_rate": 1.9174110424142852e-05, "loss": 0.006, "step": 171980 }, { "epoch": 2.48, "learning_rate": 1.917406238440438e-05, "loss": 0.0063, "step": 171990 }, { "epoch": 2.48, "learning_rate": 1.917401434466591e-05, "loss": 0.0072, "step": 172000 }, { "epoch": 2.48, "learning_rate": 1.917396630492744e-05, "loss": 0.0076, "step": 172010 }, { "epoch": 2.48, "learning_rate": 1.9173918265188965e-05, "loss": 0.0115, "step": 172020 }, { "epoch": 2.48, "learning_rate": 1.9173870225450495e-05, "loss": 0.0063, "step": 172030 }, { "epoch": 2.48, "learning_rate": 1.9173822185712024e-05, "loss": 0.0072, "step": 172040 }, { "epoch": 2.48, "learning_rate": 1.9173774145973553e-05, "loss": 0.0083, "step": 172050 }, { "epoch": 2.48, "learning_rate": 1.917372610623508e-05, "loss": 0.0066, "step": 172060 }, { "epoch": 2.48, "learning_rate": 1.917367806649661e-05, "loss": 0.0064, "step": 172070 }, { "epoch": 2.48, "learning_rate": 1.9173630026758138e-05, "loss": 0.0081, "step": 172080 }, { "epoch": 2.48, "learning_rate": 1.9173581987019664e-05, "loss": 0.0089, "step": 172090 }, { "epoch": 2.48, "learning_rate": 1.9173533947281193e-05, "loss": 0.0071, "step": 172100 }, { "epoch": 2.48, "learning_rate": 1.9173485907542722e-05, "loss": 0.0063, "step": 172110 }, { "epoch": 2.48, "learning_rate": 1.917343786780425e-05, "loss": 0.0085, "step": 172120 }, { "epoch": 2.48, "learning_rate": 1.9173389828065777e-05, "loss": 0.0077, "step": 172130 }, { "epoch": 2.48, "learning_rate": 1.9173341788327307e-05, "loss": 0.0054, "step": 172140 }, { "epoch": 2.48, "learning_rate": 1.9173293748588836e-05, "loss": 0.0067, "step": 172150 }, { "epoch": 2.48, "learning_rate": 1.917324570885036e-05, "loss": 0.0067, "step": 172160 }, { "epoch": 2.48, "learning_rate": 1.917319766911189e-05, "loss": 0.0075, "step": 172170 }, { "epoch": 2.48, "learning_rate": 1.917314962937342e-05, "loss": 0.0076, "step": 172180 }, { "epoch": 2.48, "learning_rate": 1.917310158963495e-05, "loss": 0.006, "step": 172190 }, { "epoch": 2.48, "learning_rate": 1.9173053549896475e-05, "loss": 0.0096, "step": 172200 }, { "epoch": 2.48, "learning_rate": 1.9173005510158005e-05, "loss": 0.0096, "step": 172210 }, { "epoch": 2.48, "learning_rate": 1.9172957470419534e-05, "loss": 0.0081, "step": 172220 }, { "epoch": 2.48, "learning_rate": 1.9172909430681063e-05, "loss": 0.0079, "step": 172230 }, { "epoch": 2.48, "learning_rate": 1.917286139094259e-05, "loss": 0.0068, "step": 172240 }, { "epoch": 2.48, "learning_rate": 1.917281335120412e-05, "loss": 0.0052, "step": 172250 }, { "epoch": 2.48, "learning_rate": 1.9172765311465648e-05, "loss": 0.0066, "step": 172260 }, { "epoch": 2.48, "learning_rate": 1.9172717271727173e-05, "loss": 0.0118, "step": 172270 }, { "epoch": 2.48, "learning_rate": 1.9172669231988703e-05, "loss": 0.0056, "step": 172280 }, { "epoch": 2.48, "learning_rate": 1.9172621192250232e-05, "loss": 0.007, "step": 172290 }, { "epoch": 2.48, "learning_rate": 1.917257315251176e-05, "loss": 0.0063, "step": 172300 }, { "epoch": 2.48, "learning_rate": 1.9172525112773287e-05, "loss": 0.0069, "step": 172310 }, { "epoch": 2.48, "learning_rate": 1.9172477073034816e-05, "loss": 0.0113, "step": 172320 }, { "epoch": 2.48, "learning_rate": 1.9172429033296346e-05, "loss": 0.005, "step": 172330 }, { "epoch": 2.48, "learning_rate": 1.917238099355787e-05, "loss": 0.0064, "step": 172340 }, { "epoch": 2.48, "learning_rate": 1.91723329538194e-05, "loss": 0.0087, "step": 172350 }, { "epoch": 2.48, "learning_rate": 1.917228491408093e-05, "loss": 0.0076, "step": 172360 }, { "epoch": 2.48, "learning_rate": 1.917223687434246e-05, "loss": 0.0075, "step": 172370 }, { "epoch": 2.48, "learning_rate": 1.9172188834603985e-05, "loss": 0.0085, "step": 172380 }, { "epoch": 2.48, "learning_rate": 1.9172140794865515e-05, "loss": 0.0075, "step": 172390 }, { "epoch": 2.48, "learning_rate": 1.9172092755127044e-05, "loss": 0.0089, "step": 172400 }, { "epoch": 2.48, "learning_rate": 1.917204471538857e-05, "loss": 0.007, "step": 172410 }, { "epoch": 2.48, "learning_rate": 1.91719966756501e-05, "loss": 0.0056, "step": 172420 }, { "epoch": 2.49, "learning_rate": 1.9171948635911628e-05, "loss": 0.0061, "step": 172430 }, { "epoch": 2.49, "learning_rate": 1.9171900596173157e-05, "loss": 0.0059, "step": 172440 }, { "epoch": 2.49, "learning_rate": 1.9171852556434683e-05, "loss": 0.0074, "step": 172450 }, { "epoch": 2.49, "learning_rate": 1.9171804516696213e-05, "loss": 0.0098, "step": 172460 }, { "epoch": 2.49, "learning_rate": 1.9171756476957742e-05, "loss": 0.0081, "step": 172470 }, { "epoch": 2.49, "learning_rate": 1.917170843721927e-05, "loss": 0.004, "step": 172480 }, { "epoch": 2.49, "learning_rate": 1.9171660397480797e-05, "loss": 0.0068, "step": 172490 }, { "epoch": 2.49, "learning_rate": 1.9171612357742326e-05, "loss": 0.0089, "step": 172500 }, { "epoch": 2.49, "learning_rate": 1.9171564318003856e-05, "loss": 0.0089, "step": 172510 }, { "epoch": 2.49, "learning_rate": 1.917151627826538e-05, "loss": 0.0052, "step": 172520 }, { "epoch": 2.49, "learning_rate": 1.917146823852691e-05, "loss": 0.0079, "step": 172530 }, { "epoch": 2.49, "learning_rate": 1.917142019878844e-05, "loss": 0.0064, "step": 172540 }, { "epoch": 2.49, "learning_rate": 1.917137215904997e-05, "loss": 0.0082, "step": 172550 }, { "epoch": 2.49, "learning_rate": 1.9171324119311495e-05, "loss": 0.0095, "step": 172560 }, { "epoch": 2.49, "learning_rate": 1.9171276079573024e-05, "loss": 0.0083, "step": 172570 }, { "epoch": 2.49, "learning_rate": 1.9171228039834554e-05, "loss": 0.0094, "step": 172580 }, { "epoch": 2.49, "learning_rate": 1.917118000009608e-05, "loss": 0.0065, "step": 172590 }, { "epoch": 2.49, "learning_rate": 1.917113196035761e-05, "loss": 0.0075, "step": 172600 }, { "epoch": 2.49, "learning_rate": 1.9171083920619138e-05, "loss": 0.0084, "step": 172610 }, { "epoch": 2.49, "learning_rate": 1.9171035880880667e-05, "loss": 0.0061, "step": 172620 }, { "epoch": 2.49, "learning_rate": 1.9170987841142193e-05, "loss": 0.0103, "step": 172630 }, { "epoch": 2.49, "learning_rate": 1.9170939801403723e-05, "loss": 0.0094, "step": 172640 }, { "epoch": 2.49, "learning_rate": 1.9170891761665252e-05, "loss": 0.007, "step": 172650 }, { "epoch": 2.49, "learning_rate": 1.917084372192678e-05, "loss": 0.006, "step": 172660 }, { "epoch": 2.49, "learning_rate": 1.9170795682188307e-05, "loss": 0.0085, "step": 172670 }, { "epoch": 2.49, "learning_rate": 1.9170747642449836e-05, "loss": 0.0094, "step": 172680 }, { "epoch": 2.49, "learning_rate": 1.9170699602711366e-05, "loss": 0.0082, "step": 172690 }, { "epoch": 2.49, "learning_rate": 1.917065156297289e-05, "loss": 0.007, "step": 172700 }, { "epoch": 2.49, "learning_rate": 1.917060352323442e-05, "loss": 0.0083, "step": 172710 }, { "epoch": 2.49, "learning_rate": 1.917055548349595e-05, "loss": 0.0071, "step": 172720 }, { "epoch": 2.49, "learning_rate": 1.917050744375748e-05, "loss": 0.0074, "step": 172730 }, { "epoch": 2.49, "learning_rate": 1.9170459404019005e-05, "loss": 0.0107, "step": 172740 }, { "epoch": 2.49, "learning_rate": 1.9170411364280534e-05, "loss": 0.007, "step": 172750 }, { "epoch": 2.49, "learning_rate": 1.9170363324542064e-05, "loss": 0.0065, "step": 172760 }, { "epoch": 2.49, "learning_rate": 1.917031528480359e-05, "loss": 0.0048, "step": 172770 }, { "epoch": 2.49, "learning_rate": 1.917026724506512e-05, "loss": 0.0045, "step": 172780 }, { "epoch": 2.49, "learning_rate": 1.9170219205326648e-05, "loss": 0.0056, "step": 172790 }, { "epoch": 2.49, "learning_rate": 1.9170171165588177e-05, "loss": 0.0066, "step": 172800 }, { "epoch": 2.49, "learning_rate": 1.9170123125849703e-05, "loss": 0.0041, "step": 172810 }, { "epoch": 2.49, "learning_rate": 1.9170075086111232e-05, "loss": 0.0073, "step": 172820 }, { "epoch": 2.49, "learning_rate": 1.9170027046372762e-05, "loss": 0.0083, "step": 172830 }, { "epoch": 2.49, "learning_rate": 1.916997900663429e-05, "loss": 0.0068, "step": 172840 }, { "epoch": 2.49, "learning_rate": 1.9169930966895817e-05, "loss": 0.0092, "step": 172850 }, { "epoch": 2.49, "learning_rate": 1.9169882927157346e-05, "loss": 0.0084, "step": 172860 }, { "epoch": 2.49, "learning_rate": 1.9169834887418875e-05, "loss": 0.0079, "step": 172870 }, { "epoch": 2.49, "learning_rate": 1.91697868476804e-05, "loss": 0.0073, "step": 172880 }, { "epoch": 2.49, "learning_rate": 1.916973880794193e-05, "loss": 0.0089, "step": 172890 }, { "epoch": 2.49, "learning_rate": 1.916969076820346e-05, "loss": 0.0068, "step": 172900 }, { "epoch": 2.49, "learning_rate": 1.916964272846499e-05, "loss": 0.009, "step": 172910 }, { "epoch": 2.49, "learning_rate": 1.9169594688726515e-05, "loss": 0.006, "step": 172920 }, { "epoch": 2.49, "learning_rate": 1.9169546648988044e-05, "loss": 0.0086, "step": 172930 }, { "epoch": 2.49, "learning_rate": 1.9169498609249574e-05, "loss": 0.0056, "step": 172940 }, { "epoch": 2.49, "learning_rate": 1.91694505695111e-05, "loss": 0.008, "step": 172950 }, { "epoch": 2.49, "learning_rate": 1.916940252977263e-05, "loss": 0.005, "step": 172960 }, { "epoch": 2.49, "learning_rate": 1.9169354490034158e-05, "loss": 0.0074, "step": 172970 }, { "epoch": 2.49, "learning_rate": 1.9169306450295687e-05, "loss": 0.007, "step": 172980 }, { "epoch": 2.49, "learning_rate": 1.9169258410557213e-05, "loss": 0.0077, "step": 172990 }, { "epoch": 2.49, "learning_rate": 1.9169210370818742e-05, "loss": 0.0066, "step": 173000 }, { "epoch": 2.49, "learning_rate": 1.916916233108027e-05, "loss": 0.0081, "step": 173010 }, { "epoch": 2.49, "learning_rate": 1.91691142913418e-05, "loss": 0.0065, "step": 173020 }, { "epoch": 2.49, "learning_rate": 1.9169066251603327e-05, "loss": 0.005, "step": 173030 }, { "epoch": 2.49, "learning_rate": 1.9169018211864856e-05, "loss": 0.0064, "step": 173040 }, { "epoch": 2.49, "learning_rate": 1.9168970172126385e-05, "loss": 0.0058, "step": 173050 }, { "epoch": 2.49, "learning_rate": 1.916892213238791e-05, "loss": 0.0091, "step": 173060 }, { "epoch": 2.49, "learning_rate": 1.916887409264944e-05, "loss": 0.0086, "step": 173070 }, { "epoch": 2.49, "learning_rate": 1.916882605291097e-05, "loss": 0.0072, "step": 173080 }, { "epoch": 2.49, "learning_rate": 1.91687780131725e-05, "loss": 0.0068, "step": 173090 }, { "epoch": 2.49, "learning_rate": 1.9168729973434025e-05, "loss": 0.0076, "step": 173100 }, { "epoch": 2.49, "learning_rate": 1.9168681933695554e-05, "loss": 0.0072, "step": 173110 }, { "epoch": 2.49, "learning_rate": 1.9168633893957083e-05, "loss": 0.0091, "step": 173120 }, { "epoch": 2.5, "learning_rate": 1.916858585421861e-05, "loss": 0.0056, "step": 173130 }, { "epoch": 2.5, "learning_rate": 1.916853781448014e-05, "loss": 0.008, "step": 173140 }, { "epoch": 2.5, "learning_rate": 1.9168489774741668e-05, "loss": 0.0076, "step": 173150 }, { "epoch": 2.5, "learning_rate": 1.9168441735003197e-05, "loss": 0.0076, "step": 173160 }, { "epoch": 2.5, "learning_rate": 1.9168393695264723e-05, "loss": 0.0086, "step": 173170 }, { "epoch": 2.5, "learning_rate": 1.9168345655526252e-05, "loss": 0.0059, "step": 173180 }, { "epoch": 2.5, "learning_rate": 1.916829761578778e-05, "loss": 0.0081, "step": 173190 }, { "epoch": 2.5, "learning_rate": 1.916824957604931e-05, "loss": 0.0092, "step": 173200 }, { "epoch": 2.5, "learning_rate": 1.9168201536310837e-05, "loss": 0.0076, "step": 173210 }, { "epoch": 2.5, "learning_rate": 1.9168153496572366e-05, "loss": 0.005, "step": 173220 }, { "epoch": 2.5, "learning_rate": 1.9168105456833895e-05, "loss": 0.0075, "step": 173230 }, { "epoch": 2.5, "learning_rate": 1.916805741709542e-05, "loss": 0.0104, "step": 173240 }, { "epoch": 2.5, "learning_rate": 1.916800937735695e-05, "loss": 0.0098, "step": 173250 }, { "epoch": 2.5, "learning_rate": 1.916796133761848e-05, "loss": 0.0094, "step": 173260 }, { "epoch": 2.5, "learning_rate": 1.916791329788001e-05, "loss": 0.0059, "step": 173270 }, { "epoch": 2.5, "learning_rate": 1.9167865258141535e-05, "loss": 0.0073, "step": 173280 }, { "epoch": 2.5, "learning_rate": 1.9167817218403064e-05, "loss": 0.005, "step": 173290 }, { "epoch": 2.5, "learning_rate": 1.9167769178664593e-05, "loss": 0.0058, "step": 173300 }, { "epoch": 2.5, "learning_rate": 1.916772113892612e-05, "loss": 0.0042, "step": 173310 }, { "epoch": 2.5, "learning_rate": 1.916767309918765e-05, "loss": 0.0086, "step": 173320 }, { "epoch": 2.5, "learning_rate": 1.9167625059449178e-05, "loss": 0.0075, "step": 173330 }, { "epoch": 2.5, "learning_rate": 1.9167577019710707e-05, "loss": 0.0089, "step": 173340 }, { "epoch": 2.5, "learning_rate": 1.9167528979972233e-05, "loss": 0.0078, "step": 173350 }, { "epoch": 2.5, "learning_rate": 1.9167480940233762e-05, "loss": 0.0082, "step": 173360 }, { "epoch": 2.5, "learning_rate": 1.916743290049529e-05, "loss": 0.0063, "step": 173370 }, { "epoch": 2.5, "learning_rate": 1.916738486075682e-05, "loss": 0.0071, "step": 173380 }, { "epoch": 2.5, "learning_rate": 1.9167336821018347e-05, "loss": 0.0064, "step": 173390 }, { "epoch": 2.5, "learning_rate": 1.9167288781279876e-05, "loss": 0.008, "step": 173400 }, { "epoch": 2.5, "learning_rate": 1.9167240741541405e-05, "loss": 0.0109, "step": 173410 }, { "epoch": 2.5, "learning_rate": 1.916719270180293e-05, "loss": 0.0077, "step": 173420 }, { "epoch": 2.5, "learning_rate": 1.916714466206446e-05, "loss": 0.0072, "step": 173430 }, { "epoch": 2.5, "learning_rate": 1.916709662232599e-05, "loss": 0.0065, "step": 173440 }, { "epoch": 2.5, "learning_rate": 1.916704858258752e-05, "loss": 0.0109, "step": 173450 }, { "epoch": 2.5, "learning_rate": 1.9167000542849045e-05, "loss": 0.0069, "step": 173460 }, { "epoch": 2.5, "learning_rate": 1.9166952503110574e-05, "loss": 0.0076, "step": 173470 }, { "epoch": 2.5, "learning_rate": 1.9166904463372103e-05, "loss": 0.0061, "step": 173480 }, { "epoch": 2.5, "learning_rate": 1.916685642363363e-05, "loss": 0.0076, "step": 173490 }, { "epoch": 2.5, "learning_rate": 1.916680838389516e-05, "loss": 0.0105, "step": 173500 }, { "epoch": 2.5, "learning_rate": 1.9166760344156688e-05, "loss": 0.0087, "step": 173510 }, { "epoch": 2.5, "learning_rate": 1.9166712304418217e-05, "loss": 0.0079, "step": 173520 }, { "epoch": 2.5, "learning_rate": 1.9166664264679743e-05, "loss": 0.0068, "step": 173530 }, { "epoch": 2.5, "learning_rate": 1.9166616224941272e-05, "loss": 0.0115, "step": 173540 }, { "epoch": 2.5, "learning_rate": 1.91665681852028e-05, "loss": 0.0092, "step": 173550 }, { "epoch": 2.5, "learning_rate": 1.916652014546433e-05, "loss": 0.007, "step": 173560 }, { "epoch": 2.5, "learning_rate": 1.9166472105725857e-05, "loss": 0.0076, "step": 173570 }, { "epoch": 2.5, "learning_rate": 1.9166424065987386e-05, "loss": 0.0063, "step": 173580 }, { "epoch": 2.5, "learning_rate": 1.9166376026248915e-05, "loss": 0.0077, "step": 173590 }, { "epoch": 2.5, "learning_rate": 1.916632798651044e-05, "loss": 0.0052, "step": 173600 }, { "epoch": 2.5, "learning_rate": 1.916627994677197e-05, "loss": 0.0095, "step": 173610 }, { "epoch": 2.5, "learning_rate": 1.91662319070335e-05, "loss": 0.0064, "step": 173620 }, { "epoch": 2.5, "learning_rate": 1.916618386729503e-05, "loss": 0.0082, "step": 173630 }, { "epoch": 2.5, "learning_rate": 1.9166135827556555e-05, "loss": 0.0067, "step": 173640 }, { "epoch": 2.5, "learning_rate": 1.9166087787818084e-05, "loss": 0.0074, "step": 173650 }, { "epoch": 2.5, "learning_rate": 1.9166039748079613e-05, "loss": 0.0055, "step": 173660 }, { "epoch": 2.5, "learning_rate": 1.916599170834114e-05, "loss": 0.0066, "step": 173670 }, { "epoch": 2.5, "learning_rate": 1.916594366860267e-05, "loss": 0.0081, "step": 173680 }, { "epoch": 2.5, "learning_rate": 1.9165895628864198e-05, "loss": 0.0064, "step": 173690 }, { "epoch": 2.5, "learning_rate": 1.9165847589125727e-05, "loss": 0.0067, "step": 173700 }, { "epoch": 2.5, "learning_rate": 1.9165799549387253e-05, "loss": 0.0078, "step": 173710 }, { "epoch": 2.5, "learning_rate": 1.9165751509648782e-05, "loss": 0.0042, "step": 173720 }, { "epoch": 2.5, "learning_rate": 1.916570346991031e-05, "loss": 0.009, "step": 173730 }, { "epoch": 2.5, "learning_rate": 1.916565543017184e-05, "loss": 0.0084, "step": 173740 }, { "epoch": 2.5, "learning_rate": 1.9165607390433366e-05, "loss": 0.0074, "step": 173750 }, { "epoch": 2.5, "learning_rate": 1.9165559350694896e-05, "loss": 0.0072, "step": 173760 }, { "epoch": 2.5, "learning_rate": 1.9165511310956425e-05, "loss": 0.0061, "step": 173770 }, { "epoch": 2.5, "learning_rate": 1.916546327121795e-05, "loss": 0.0074, "step": 173780 }, { "epoch": 2.5, "learning_rate": 1.916541523147948e-05, "loss": 0.008, "step": 173790 }, { "epoch": 2.5, "learning_rate": 1.916536719174101e-05, "loss": 0.0045, "step": 173800 }, { "epoch": 2.5, "learning_rate": 1.916531915200254e-05, "loss": 0.0071, "step": 173810 }, { "epoch": 2.51, "learning_rate": 1.9165271112264065e-05, "loss": 0.0072, "step": 173820 }, { "epoch": 2.51, "learning_rate": 1.9165223072525594e-05, "loss": 0.011, "step": 173830 }, { "epoch": 2.51, "learning_rate": 1.9165175032787123e-05, "loss": 0.0061, "step": 173840 }, { "epoch": 2.51, "learning_rate": 1.916512699304865e-05, "loss": 0.0095, "step": 173850 }, { "epoch": 2.51, "learning_rate": 1.9165078953310178e-05, "loss": 0.0061, "step": 173860 }, { "epoch": 2.51, "learning_rate": 1.9165030913571708e-05, "loss": 0.0076, "step": 173870 }, { "epoch": 2.51, "learning_rate": 1.9164982873833237e-05, "loss": 0.0065, "step": 173880 }, { "epoch": 2.51, "learning_rate": 1.9164934834094763e-05, "loss": 0.0072, "step": 173890 }, { "epoch": 2.51, "learning_rate": 1.9164886794356292e-05, "loss": 0.0085, "step": 173900 }, { "epoch": 2.51, "learning_rate": 1.916483875461782e-05, "loss": 0.0064, "step": 173910 }, { "epoch": 2.51, "learning_rate": 1.916479071487935e-05, "loss": 0.0069, "step": 173920 }, { "epoch": 2.51, "learning_rate": 1.9164742675140876e-05, "loss": 0.0057, "step": 173930 }, { "epoch": 2.51, "learning_rate": 1.9164694635402406e-05, "loss": 0.0071, "step": 173940 }, { "epoch": 2.51, "learning_rate": 1.9164646595663935e-05, "loss": 0.009, "step": 173950 }, { "epoch": 2.51, "learning_rate": 1.916459855592546e-05, "loss": 0.006, "step": 173960 }, { "epoch": 2.51, "learning_rate": 1.916455051618699e-05, "loss": 0.0088, "step": 173970 }, { "epoch": 2.51, "learning_rate": 1.916450247644852e-05, "loss": 0.0089, "step": 173980 }, { "epoch": 2.51, "learning_rate": 1.916445443671005e-05, "loss": 0.0077, "step": 173990 }, { "epoch": 2.51, "learning_rate": 1.9164406396971574e-05, "loss": 0.0055, "step": 174000 }, { "epoch": 2.51, "learning_rate": 1.9164358357233104e-05, "loss": 0.0061, "step": 174010 }, { "epoch": 2.51, "learning_rate": 1.9164310317494633e-05, "loss": 0.0085, "step": 174020 }, { "epoch": 2.51, "learning_rate": 1.916426227775616e-05, "loss": 0.0052, "step": 174030 }, { "epoch": 2.51, "learning_rate": 1.9164214238017688e-05, "loss": 0.0067, "step": 174040 }, { "epoch": 2.51, "learning_rate": 1.9164166198279217e-05, "loss": 0.0049, "step": 174050 }, { "epoch": 2.51, "learning_rate": 1.9164122962514592e-05, "loss": 0.0067, "step": 174060 }, { "epoch": 2.51, "learning_rate": 1.916407492277612e-05, "loss": 0.0069, "step": 174070 }, { "epoch": 2.51, "learning_rate": 1.916402688303765e-05, "loss": 0.0073, "step": 174080 }, { "epoch": 2.51, "learning_rate": 1.9163978843299177e-05, "loss": 0.0068, "step": 174090 }, { "epoch": 2.51, "learning_rate": 1.9163930803560706e-05, "loss": 0.006, "step": 174100 }, { "epoch": 2.51, "learning_rate": 1.9163882763822235e-05, "loss": 0.0053, "step": 174110 }, { "epoch": 2.51, "learning_rate": 1.9163834724083764e-05, "loss": 0.0073, "step": 174120 }, { "epoch": 2.51, "learning_rate": 1.916378668434529e-05, "loss": 0.0072, "step": 174130 }, { "epoch": 2.51, "learning_rate": 1.916373864460682e-05, "loss": 0.0075, "step": 174140 }, { "epoch": 2.51, "learning_rate": 1.916369060486835e-05, "loss": 0.0098, "step": 174150 }, { "epoch": 2.51, "learning_rate": 1.9163642565129875e-05, "loss": 0.0078, "step": 174160 }, { "epoch": 2.51, "learning_rate": 1.9163594525391404e-05, "loss": 0.0081, "step": 174170 }, { "epoch": 2.51, "learning_rate": 1.9163546485652933e-05, "loss": 0.0052, "step": 174180 }, { "epoch": 2.51, "learning_rate": 1.9163498445914462e-05, "loss": 0.005, "step": 174190 }, { "epoch": 2.51, "learning_rate": 1.916345040617599e-05, "loss": 0.0081, "step": 174200 }, { "epoch": 2.51, "learning_rate": 1.9163402366437518e-05, "loss": 0.0061, "step": 174210 }, { "epoch": 2.51, "learning_rate": 1.9163354326699047e-05, "loss": 0.0069, "step": 174220 }, { "epoch": 2.51, "learning_rate": 1.9163306286960576e-05, "loss": 0.0046, "step": 174230 }, { "epoch": 2.51, "learning_rate": 1.9163258247222102e-05, "loss": 0.0108, "step": 174240 }, { "epoch": 2.51, "learning_rate": 1.916321020748363e-05, "loss": 0.0095, "step": 174250 }, { "epoch": 2.51, "learning_rate": 1.916316216774516e-05, "loss": 0.0063, "step": 174260 }, { "epoch": 2.51, "learning_rate": 1.9163114128006686e-05, "loss": 0.0083, "step": 174270 }, { "epoch": 2.51, "learning_rate": 1.9163066088268216e-05, "loss": 0.0073, "step": 174280 }, { "epoch": 2.51, "learning_rate": 1.9163018048529745e-05, "loss": 0.0069, "step": 174290 }, { "epoch": 2.51, "learning_rate": 1.9162970008791274e-05, "loss": 0.0065, "step": 174300 }, { "epoch": 2.51, "learning_rate": 1.91629219690528e-05, "loss": 0.0058, "step": 174310 }, { "epoch": 2.51, "learning_rate": 1.916287392931433e-05, "loss": 0.0105, "step": 174320 }, { "epoch": 2.51, "learning_rate": 1.916282588957586e-05, "loss": 0.0071, "step": 174330 }, { "epoch": 2.51, "learning_rate": 1.9162777849837385e-05, "loss": 0.005, "step": 174340 }, { "epoch": 2.51, "learning_rate": 1.9162729810098914e-05, "loss": 0.0065, "step": 174350 }, { "epoch": 2.51, "learning_rate": 1.9162681770360443e-05, "loss": 0.0075, "step": 174360 }, { "epoch": 2.51, "learning_rate": 1.9162633730621972e-05, "loss": 0.006, "step": 174370 }, { "epoch": 2.51, "learning_rate": 1.9162585690883498e-05, "loss": 0.0073, "step": 174380 }, { "epoch": 2.51, "learning_rate": 1.9162537651145028e-05, "loss": 0.0091, "step": 174390 }, { "epoch": 2.51, "learning_rate": 1.9162489611406557e-05, "loss": 0.0111, "step": 174400 }, { "epoch": 2.51, "learning_rate": 1.9162441571668086e-05, "loss": 0.0085, "step": 174410 }, { "epoch": 2.51, "learning_rate": 1.9162393531929612e-05, "loss": 0.0049, "step": 174420 }, { "epoch": 2.51, "learning_rate": 1.916234549219114e-05, "loss": 0.0072, "step": 174430 }, { "epoch": 2.51, "learning_rate": 1.916229745245267e-05, "loss": 0.0055, "step": 174440 }, { "epoch": 2.51, "learning_rate": 1.9162249412714196e-05, "loss": 0.0072, "step": 174450 }, { "epoch": 2.51, "learning_rate": 1.9162201372975726e-05, "loss": 0.0095, "step": 174460 }, { "epoch": 2.51, "learning_rate": 1.9162153333237255e-05, "loss": 0.0088, "step": 174470 }, { "epoch": 2.51, "learning_rate": 1.9162105293498784e-05, "loss": 0.0075, "step": 174480 }, { "epoch": 2.51, "learning_rate": 1.916205725376031e-05, "loss": 0.0067, "step": 174490 }, { "epoch": 2.51, "learning_rate": 1.916200921402184e-05, "loss": 0.0065, "step": 174500 }, { "epoch": 2.52, "learning_rate": 1.916196117428337e-05, "loss": 0.0083, "step": 174510 }, { "epoch": 2.52, "learning_rate": 1.9161913134544894e-05, "loss": 0.0096, "step": 174520 }, { "epoch": 2.52, "learning_rate": 1.9161865094806424e-05, "loss": 0.014, "step": 174530 }, { "epoch": 2.52, "learning_rate": 1.9161817055067953e-05, "loss": 0.0077, "step": 174540 }, { "epoch": 2.52, "learning_rate": 1.9161769015329482e-05, "loss": 0.0052, "step": 174550 }, { "epoch": 2.52, "learning_rate": 1.9161720975591008e-05, "loss": 0.0068, "step": 174560 }, { "epoch": 2.52, "learning_rate": 1.9161672935852537e-05, "loss": 0.007, "step": 174570 }, { "epoch": 2.52, "learning_rate": 1.9161624896114067e-05, "loss": 0.0082, "step": 174580 }, { "epoch": 2.52, "learning_rate": 1.9161576856375596e-05, "loss": 0.0142, "step": 174590 }, { "epoch": 2.52, "learning_rate": 1.9161528816637122e-05, "loss": 0.0075, "step": 174600 }, { "epoch": 2.52, "learning_rate": 1.916148077689865e-05, "loss": 0.0066, "step": 174610 }, { "epoch": 2.52, "learning_rate": 1.916143273716018e-05, "loss": 0.0088, "step": 174620 }, { "epoch": 2.52, "learning_rate": 1.9161384697421706e-05, "loss": 0.0049, "step": 174630 }, { "epoch": 2.52, "learning_rate": 1.9161336657683236e-05, "loss": 0.0091, "step": 174640 }, { "epoch": 2.52, "learning_rate": 1.9161288617944768e-05, "loss": 0.0062, "step": 174650 }, { "epoch": 2.52, "learning_rate": 1.9161240578206294e-05, "loss": 0.0089, "step": 174660 }, { "epoch": 2.52, "learning_rate": 1.9161192538467823e-05, "loss": 0.0085, "step": 174670 }, { "epoch": 2.52, "learning_rate": 1.9161144498729353e-05, "loss": 0.007, "step": 174680 }, { "epoch": 2.52, "learning_rate": 1.916109645899088e-05, "loss": 0.0058, "step": 174690 }, { "epoch": 2.52, "learning_rate": 1.9161048419252408e-05, "loss": 0.0095, "step": 174700 }, { "epoch": 2.52, "learning_rate": 1.9161000379513937e-05, "loss": 0.0075, "step": 174710 }, { "epoch": 2.52, "learning_rate": 1.9160952339775466e-05, "loss": 0.0083, "step": 174720 }, { "epoch": 2.52, "learning_rate": 1.9160904300036992e-05, "loss": 0.0103, "step": 174730 }, { "epoch": 2.52, "learning_rate": 1.916085626029852e-05, "loss": 0.0053, "step": 174740 }, { "epoch": 2.52, "learning_rate": 1.916080822056005e-05, "loss": 0.0087, "step": 174750 }, { "epoch": 2.52, "learning_rate": 1.9160760180821577e-05, "loss": 0.0077, "step": 174760 }, { "epoch": 2.52, "learning_rate": 1.9160712141083106e-05, "loss": 0.0057, "step": 174770 }, { "epoch": 2.52, "learning_rate": 1.9160664101344635e-05, "loss": 0.0074, "step": 174780 }, { "epoch": 2.52, "learning_rate": 1.9160616061606164e-05, "loss": 0.011, "step": 174790 }, { "epoch": 2.52, "learning_rate": 1.916056802186769e-05, "loss": 0.007, "step": 174800 }, { "epoch": 2.52, "learning_rate": 1.916051998212922e-05, "loss": 0.0084, "step": 174810 }, { "epoch": 2.52, "learning_rate": 1.916047194239075e-05, "loss": 0.0049, "step": 174820 }, { "epoch": 2.52, "learning_rate": 1.9160423902652278e-05, "loss": 0.0059, "step": 174830 }, { "epoch": 2.52, "learning_rate": 1.9160375862913804e-05, "loss": 0.0066, "step": 174840 }, { "epoch": 2.52, "learning_rate": 1.9160327823175333e-05, "loss": 0.0108, "step": 174850 }, { "epoch": 2.52, "learning_rate": 1.9160279783436863e-05, "loss": 0.0095, "step": 174860 }, { "epoch": 2.52, "learning_rate": 1.916023174369839e-05, "loss": 0.0097, "step": 174870 }, { "epoch": 2.52, "learning_rate": 1.9160183703959918e-05, "loss": 0.0047, "step": 174880 }, { "epoch": 2.52, "learning_rate": 1.9160135664221447e-05, "loss": 0.0062, "step": 174890 }, { "epoch": 2.52, "learning_rate": 1.9160087624482976e-05, "loss": 0.0097, "step": 174900 }, { "epoch": 2.52, "learning_rate": 1.9160039584744502e-05, "loss": 0.0073, "step": 174910 }, { "epoch": 2.52, "learning_rate": 1.915999154500603e-05, "loss": 0.0074, "step": 174920 }, { "epoch": 2.52, "learning_rate": 1.915994350526756e-05, "loss": 0.0085, "step": 174930 }, { "epoch": 2.52, "learning_rate": 1.9159895465529087e-05, "loss": 0.0067, "step": 174940 }, { "epoch": 2.52, "learning_rate": 1.9159847425790616e-05, "loss": 0.0049, "step": 174950 }, { "epoch": 2.52, "learning_rate": 1.9159799386052145e-05, "loss": 0.0074, "step": 174960 }, { "epoch": 2.52, "learning_rate": 1.9159751346313674e-05, "loss": 0.0051, "step": 174970 }, { "epoch": 2.52, "learning_rate": 1.91597033065752e-05, "loss": 0.0076, "step": 174980 }, { "epoch": 2.52, "learning_rate": 1.915965526683673e-05, "loss": 0.0106, "step": 174990 }, { "epoch": 2.52, "learning_rate": 1.915960722709826e-05, "loss": 0.0075, "step": 175000 }, { "epoch": 2.52, "learning_rate": 1.9159559187359788e-05, "loss": 0.0071, "step": 175010 }, { "epoch": 2.52, "learning_rate": 1.9159511147621314e-05, "loss": 0.0075, "step": 175020 }, { "epoch": 2.52, "learning_rate": 1.9159463107882843e-05, "loss": 0.0081, "step": 175030 }, { "epoch": 2.52, "learning_rate": 1.9159415068144372e-05, "loss": 0.0057, "step": 175040 }, { "epoch": 2.52, "learning_rate": 1.91593670284059e-05, "loss": 0.0083, "step": 175050 }, { "epoch": 2.52, "learning_rate": 1.9159318988667428e-05, "loss": 0.0086, "step": 175060 }, { "epoch": 2.52, "learning_rate": 1.9159270948928957e-05, "loss": 0.0069, "step": 175070 }, { "epoch": 2.52, "learning_rate": 1.9159222909190486e-05, "loss": 0.0087, "step": 175080 }, { "epoch": 2.52, "learning_rate": 1.9159174869452012e-05, "loss": 0.0066, "step": 175090 }, { "epoch": 2.52, "learning_rate": 1.915912682971354e-05, "loss": 0.0139, "step": 175100 }, { "epoch": 2.52, "learning_rate": 1.915907878997507e-05, "loss": 0.0084, "step": 175110 }, { "epoch": 2.52, "learning_rate": 1.9159030750236596e-05, "loss": 0.0054, "step": 175120 }, { "epoch": 2.52, "learning_rate": 1.9158982710498126e-05, "loss": 0.0069, "step": 175130 }, { "epoch": 2.52, "learning_rate": 1.9158934670759655e-05, "loss": 0.0059, "step": 175140 }, { "epoch": 2.52, "learning_rate": 1.9158886631021184e-05, "loss": 0.0094, "step": 175150 }, { "epoch": 2.52, "learning_rate": 1.915883859128271e-05, "loss": 0.0064, "step": 175160 }, { "epoch": 2.52, "learning_rate": 1.915879055154424e-05, "loss": 0.0065, "step": 175170 }, { "epoch": 2.52, "learning_rate": 1.915874251180577e-05, "loss": 0.0083, "step": 175180 }, { "epoch": 2.52, "learning_rate": 1.9158694472067298e-05, "loss": 0.0083, "step": 175190 }, { "epoch": 2.52, "learning_rate": 1.9158646432328824e-05, "loss": 0.0062, "step": 175200 }, { "epoch": 2.53, "learning_rate": 1.9158598392590353e-05, "loss": 0.0069, "step": 175210 }, { "epoch": 2.53, "learning_rate": 1.9158550352851882e-05, "loss": 0.0071, "step": 175220 }, { "epoch": 2.53, "learning_rate": 1.9158502313113408e-05, "loss": 0.0089, "step": 175230 }, { "epoch": 2.53, "learning_rate": 1.9158454273374938e-05, "loss": 0.0068, "step": 175240 }, { "epoch": 2.53, "learning_rate": 1.9158406233636467e-05, "loss": 0.0104, "step": 175250 }, { "epoch": 2.53, "learning_rate": 1.9158358193897996e-05, "loss": 0.0092, "step": 175260 }, { "epoch": 2.53, "learning_rate": 1.9158310154159522e-05, "loss": 0.0095, "step": 175270 }, { "epoch": 2.53, "learning_rate": 1.915826211442105e-05, "loss": 0.0057, "step": 175280 }, { "epoch": 2.53, "learning_rate": 1.915821407468258e-05, "loss": 0.0036, "step": 175290 }, { "epoch": 2.53, "learning_rate": 1.9158166034944106e-05, "loss": 0.0083, "step": 175300 }, { "epoch": 2.53, "learning_rate": 1.9158117995205636e-05, "loss": 0.008, "step": 175310 }, { "epoch": 2.53, "learning_rate": 1.9158069955467165e-05, "loss": 0.006, "step": 175320 }, { "epoch": 2.53, "learning_rate": 1.9158021915728694e-05, "loss": 0.0051, "step": 175330 }, { "epoch": 2.53, "learning_rate": 1.915797387599022e-05, "loss": 0.0073, "step": 175340 }, { "epoch": 2.53, "learning_rate": 1.915792583625175e-05, "loss": 0.0074, "step": 175350 }, { "epoch": 2.53, "learning_rate": 1.915787779651328e-05, "loss": 0.0061, "step": 175360 }, { "epoch": 2.53, "learning_rate": 1.9157829756774808e-05, "loss": 0.0081, "step": 175370 }, { "epoch": 2.53, "learning_rate": 1.9157781717036334e-05, "loss": 0.0048, "step": 175380 }, { "epoch": 2.53, "learning_rate": 1.9157733677297863e-05, "loss": 0.0063, "step": 175390 }, { "epoch": 2.53, "learning_rate": 1.9157685637559392e-05, "loss": 0.0086, "step": 175400 }, { "epoch": 2.53, "learning_rate": 1.9157637597820918e-05, "loss": 0.0058, "step": 175410 }, { "epoch": 2.53, "learning_rate": 1.9157589558082447e-05, "loss": 0.0081, "step": 175420 }, { "epoch": 2.53, "learning_rate": 1.9157541518343977e-05, "loss": 0.0079, "step": 175430 }, { "epoch": 2.53, "learning_rate": 1.9157493478605506e-05, "loss": 0.0059, "step": 175440 }, { "epoch": 2.53, "learning_rate": 1.9157445438867032e-05, "loss": 0.0068, "step": 175450 }, { "epoch": 2.53, "learning_rate": 1.915739739912856e-05, "loss": 0.0066, "step": 175460 }, { "epoch": 2.53, "learning_rate": 1.915734935939009e-05, "loss": 0.0093, "step": 175470 }, { "epoch": 2.53, "learning_rate": 1.9157301319651616e-05, "loss": 0.0057, "step": 175480 }, { "epoch": 2.53, "learning_rate": 1.9157253279913146e-05, "loss": 0.0088, "step": 175490 }, { "epoch": 2.53, "learning_rate": 1.9157205240174675e-05, "loss": 0.0068, "step": 175500 }, { "epoch": 2.53, "learning_rate": 1.9157157200436204e-05, "loss": 0.0071, "step": 175510 }, { "epoch": 2.53, "learning_rate": 1.915710916069773e-05, "loss": 0.0081, "step": 175520 }, { "epoch": 2.53, "learning_rate": 1.915706112095926e-05, "loss": 0.0062, "step": 175530 }, { "epoch": 2.53, "learning_rate": 1.915701308122079e-05, "loss": 0.0077, "step": 175540 }, { "epoch": 2.53, "learning_rate": 1.9156965041482314e-05, "loss": 0.0075, "step": 175550 }, { "epoch": 2.53, "learning_rate": 1.9156917001743844e-05, "loss": 0.0067, "step": 175560 }, { "epoch": 2.53, "learning_rate": 1.9156868962005373e-05, "loss": 0.0042, "step": 175570 }, { "epoch": 2.53, "learning_rate": 1.9156820922266902e-05, "loss": 0.0056, "step": 175580 }, { "epoch": 2.53, "learning_rate": 1.9156772882528428e-05, "loss": 0.0098, "step": 175590 }, { "epoch": 2.53, "learning_rate": 1.9156724842789957e-05, "loss": 0.0085, "step": 175600 }, { "epoch": 2.53, "learning_rate": 1.9156676803051487e-05, "loss": 0.0063, "step": 175610 }, { "epoch": 2.53, "learning_rate": 1.9156628763313016e-05, "loss": 0.0094, "step": 175620 }, { "epoch": 2.53, "learning_rate": 1.9156580723574542e-05, "loss": 0.0087, "step": 175630 }, { "epoch": 2.53, "learning_rate": 1.915653268383607e-05, "loss": 0.0072, "step": 175640 }, { "epoch": 2.53, "learning_rate": 1.91564846440976e-05, "loss": 0.0054, "step": 175650 }, { "epoch": 2.53, "learning_rate": 1.9156436604359126e-05, "loss": 0.0061, "step": 175660 }, { "epoch": 2.53, "learning_rate": 1.9156388564620655e-05, "loss": 0.0092, "step": 175670 }, { "epoch": 2.53, "learning_rate": 1.9156340524882185e-05, "loss": 0.0047, "step": 175680 }, { "epoch": 2.53, "learning_rate": 1.9156292485143714e-05, "loss": 0.0097, "step": 175690 }, { "epoch": 2.53, "learning_rate": 1.915624444540524e-05, "loss": 0.0067, "step": 175700 }, { "epoch": 2.53, "learning_rate": 1.915619640566677e-05, "loss": 0.0071, "step": 175710 }, { "epoch": 2.53, "learning_rate": 1.91561483659283e-05, "loss": 0.0059, "step": 175720 }, { "epoch": 2.53, "learning_rate": 1.9156100326189824e-05, "loss": 0.0056, "step": 175730 }, { "epoch": 2.53, "learning_rate": 1.9156052286451354e-05, "loss": 0.01, "step": 175740 }, { "epoch": 2.53, "learning_rate": 1.9156004246712883e-05, "loss": 0.0087, "step": 175750 }, { "epoch": 2.53, "learning_rate": 1.9155956206974412e-05, "loss": 0.0052, "step": 175760 }, { "epoch": 2.53, "learning_rate": 1.9155908167235938e-05, "loss": 0.0064, "step": 175770 }, { "epoch": 2.53, "learning_rate": 1.9155860127497467e-05, "loss": 0.0092, "step": 175780 }, { "epoch": 2.53, "learning_rate": 1.9155812087758997e-05, "loss": 0.0064, "step": 175790 }, { "epoch": 2.53, "learning_rate": 1.9155764048020526e-05, "loss": 0.0076, "step": 175800 }, { "epoch": 2.53, "learning_rate": 1.915571600828205e-05, "loss": 0.006, "step": 175810 }, { "epoch": 2.53, "learning_rate": 1.915566796854358e-05, "loss": 0.0048, "step": 175820 }, { "epoch": 2.53, "learning_rate": 1.915561992880511e-05, "loss": 0.0056, "step": 175830 }, { "epoch": 2.53, "learning_rate": 1.9155571889066636e-05, "loss": 0.008, "step": 175840 }, { "epoch": 2.53, "learning_rate": 1.9155523849328165e-05, "loss": 0.0055, "step": 175850 }, { "epoch": 2.53, "learning_rate": 1.9155475809589695e-05, "loss": 0.0083, "step": 175860 }, { "epoch": 2.53, "learning_rate": 1.9155427769851224e-05, "loss": 0.0083, "step": 175870 }, { "epoch": 2.53, "learning_rate": 1.915537973011275e-05, "loss": 0.0078, "step": 175880 }, { "epoch": 2.53, "learning_rate": 1.915533169037428e-05, "loss": 0.0053, "step": 175890 }, { "epoch": 2.54, "learning_rate": 1.915528365063581e-05, "loss": 0.0066, "step": 175900 }, { "epoch": 2.54, "learning_rate": 1.9155235610897334e-05, "loss": 0.0075, "step": 175910 }, { "epoch": 2.54, "learning_rate": 1.9155187571158863e-05, "loss": 0.0059, "step": 175920 }, { "epoch": 2.54, "learning_rate": 1.9155139531420393e-05, "loss": 0.0065, "step": 175930 }, { "epoch": 2.54, "learning_rate": 1.9155091491681922e-05, "loss": 0.0084, "step": 175940 }, { "epoch": 2.54, "learning_rate": 1.9155043451943448e-05, "loss": 0.0051, "step": 175950 }, { "epoch": 2.54, "learning_rate": 1.9154995412204977e-05, "loss": 0.0099, "step": 175960 }, { "epoch": 2.54, "learning_rate": 1.9154947372466506e-05, "loss": 0.0078, "step": 175970 }, { "epoch": 2.54, "learning_rate": 1.9154899332728036e-05, "loss": 0.0068, "step": 175980 }, { "epoch": 2.54, "learning_rate": 1.915485129298956e-05, "loss": 0.0078, "step": 175990 }, { "epoch": 2.54, "learning_rate": 1.915480325325109e-05, "loss": 0.0059, "step": 176000 }, { "epoch": 2.54, "learning_rate": 1.915475521351262e-05, "loss": 0.005, "step": 176010 }, { "epoch": 2.54, "learning_rate": 1.9154707173774146e-05, "loss": 0.0076, "step": 176020 }, { "epoch": 2.54, "learning_rate": 1.9154659134035675e-05, "loss": 0.0095, "step": 176030 }, { "epoch": 2.54, "learning_rate": 1.9154611094297205e-05, "loss": 0.0068, "step": 176040 }, { "epoch": 2.54, "learning_rate": 1.9154563054558734e-05, "loss": 0.0088, "step": 176050 }, { "epoch": 2.54, "learning_rate": 1.915451501482026e-05, "loss": 0.0084, "step": 176060 }, { "epoch": 2.54, "learning_rate": 1.915446697508179e-05, "loss": 0.007, "step": 176070 }, { "epoch": 2.54, "learning_rate": 1.9154418935343318e-05, "loss": 0.006, "step": 176080 }, { "epoch": 2.54, "learning_rate": 1.9154370895604844e-05, "loss": 0.0088, "step": 176090 }, { "epoch": 2.54, "learning_rate": 1.9154322855866373e-05, "loss": 0.0099, "step": 176100 }, { "epoch": 2.54, "learning_rate": 1.9154274816127903e-05, "loss": 0.006, "step": 176110 }, { "epoch": 2.54, "learning_rate": 1.9154226776389432e-05, "loss": 0.0089, "step": 176120 }, { "epoch": 2.54, "learning_rate": 1.9154178736650958e-05, "loss": 0.0089, "step": 176130 }, { "epoch": 2.54, "learning_rate": 1.9154130696912487e-05, "loss": 0.0048, "step": 176140 }, { "epoch": 2.54, "learning_rate": 1.9154082657174016e-05, "loss": 0.009, "step": 176150 }, { "epoch": 2.54, "learning_rate": 1.9154034617435546e-05, "loss": 0.0048, "step": 176160 }, { "epoch": 2.54, "learning_rate": 1.915398657769707e-05, "loss": 0.0104, "step": 176170 }, { "epoch": 2.54, "learning_rate": 1.91539385379586e-05, "loss": 0.0106, "step": 176180 }, { "epoch": 2.54, "learning_rate": 1.915389049822013e-05, "loss": 0.0095, "step": 176190 }, { "epoch": 2.54, "learning_rate": 1.9153842458481656e-05, "loss": 0.0086, "step": 176200 }, { "epoch": 2.54, "learning_rate": 1.9153794418743185e-05, "loss": 0.0066, "step": 176210 }, { "epoch": 2.54, "learning_rate": 1.9153746379004714e-05, "loss": 0.0071, "step": 176220 }, { "epoch": 2.54, "learning_rate": 1.9153698339266244e-05, "loss": 0.0051, "step": 176230 }, { "epoch": 2.54, "learning_rate": 1.915365029952777e-05, "loss": 0.0111, "step": 176240 }, { "epoch": 2.54, "learning_rate": 1.91536022597893e-05, "loss": 0.0077, "step": 176250 }, { "epoch": 2.54, "learning_rate": 1.9153554220050828e-05, "loss": 0.0068, "step": 176260 }, { "epoch": 2.54, "learning_rate": 1.9153506180312354e-05, "loss": 0.0065, "step": 176270 }, { "epoch": 2.54, "learning_rate": 1.9153458140573883e-05, "loss": 0.0056, "step": 176280 }, { "epoch": 2.54, "learning_rate": 1.9153410100835413e-05, "loss": 0.0062, "step": 176290 }, { "epoch": 2.54, "learning_rate": 1.9153362061096942e-05, "loss": 0.0063, "step": 176300 }, { "epoch": 2.54, "learning_rate": 1.9153314021358468e-05, "loss": 0.0086, "step": 176310 }, { "epoch": 2.54, "learning_rate": 1.9153265981619997e-05, "loss": 0.0058, "step": 176320 }, { "epoch": 2.54, "learning_rate": 1.9153217941881526e-05, "loss": 0.0068, "step": 176330 }, { "epoch": 2.54, "learning_rate": 1.9153169902143056e-05, "loss": 0.0124, "step": 176340 }, { "epoch": 2.54, "learning_rate": 1.915312186240458e-05, "loss": 0.0091, "step": 176350 }, { "epoch": 2.54, "learning_rate": 1.915307382266611e-05, "loss": 0.0072, "step": 176360 }, { "epoch": 2.54, "learning_rate": 1.915302578292764e-05, "loss": 0.011, "step": 176370 }, { "epoch": 2.54, "learning_rate": 1.9152977743189166e-05, "loss": 0.0111, "step": 176380 }, { "epoch": 2.54, "learning_rate": 1.9152929703450695e-05, "loss": 0.011, "step": 176390 }, { "epoch": 2.54, "learning_rate": 1.9152881663712224e-05, "loss": 0.006, "step": 176400 }, { "epoch": 2.54, "learning_rate": 1.9152833623973754e-05, "loss": 0.0085, "step": 176410 }, { "epoch": 2.54, "learning_rate": 1.915278558423528e-05, "loss": 0.009, "step": 176420 }, { "epoch": 2.54, "learning_rate": 1.915273754449681e-05, "loss": 0.0078, "step": 176430 }, { "epoch": 2.54, "learning_rate": 1.9152689504758338e-05, "loss": 0.0056, "step": 176440 }, { "epoch": 2.54, "learning_rate": 1.9152641465019864e-05, "loss": 0.007, "step": 176450 }, { "epoch": 2.54, "learning_rate": 1.9152593425281393e-05, "loss": 0.0081, "step": 176460 }, { "epoch": 2.54, "learning_rate": 1.9152545385542922e-05, "loss": 0.0047, "step": 176470 }, { "epoch": 2.54, "learning_rate": 1.9152497345804452e-05, "loss": 0.0094, "step": 176480 }, { "epoch": 2.54, "learning_rate": 1.9152449306065978e-05, "loss": 0.0059, "step": 176490 }, { "epoch": 2.54, "learning_rate": 1.9152401266327507e-05, "loss": 0.0068, "step": 176500 }, { "epoch": 2.54, "learning_rate": 1.9152353226589036e-05, "loss": 0.0056, "step": 176510 }, { "epoch": 2.54, "learning_rate": 1.9152305186850565e-05, "loss": 0.0068, "step": 176520 }, { "epoch": 2.54, "learning_rate": 1.915225714711209e-05, "loss": 0.0044, "step": 176530 }, { "epoch": 2.54, "learning_rate": 1.915220910737362e-05, "loss": 0.0065, "step": 176540 }, { "epoch": 2.54, "learning_rate": 1.915216106763515e-05, "loss": 0.01, "step": 176550 }, { "epoch": 2.54, "learning_rate": 1.9152113027896676e-05, "loss": 0.0071, "step": 176560 }, { "epoch": 2.54, "learning_rate": 1.9152064988158205e-05, "loss": 0.0065, "step": 176570 }, { "epoch": 2.54, "learning_rate": 1.9152016948419734e-05, "loss": 0.011, "step": 176580 }, { "epoch": 2.55, "learning_rate": 1.9151968908681264e-05, "loss": 0.0062, "step": 176590 }, { "epoch": 2.55, "learning_rate": 1.915192086894279e-05, "loss": 0.0062, "step": 176600 }, { "epoch": 2.55, "learning_rate": 1.915187282920432e-05, "loss": 0.0048, "step": 176610 }, { "epoch": 2.55, "learning_rate": 1.9151824789465848e-05, "loss": 0.0073, "step": 176620 }, { "epoch": 2.55, "learning_rate": 1.9151776749727374e-05, "loss": 0.0074, "step": 176630 }, { "epoch": 2.55, "learning_rate": 1.9151728709988903e-05, "loss": 0.0068, "step": 176640 }, { "epoch": 2.55, "learning_rate": 1.9151680670250432e-05, "loss": 0.0118, "step": 176650 }, { "epoch": 2.55, "learning_rate": 1.915163263051196e-05, "loss": 0.0053, "step": 176660 }, { "epoch": 2.55, "learning_rate": 1.9151584590773488e-05, "loss": 0.0047, "step": 176670 }, { "epoch": 2.55, "learning_rate": 1.9151536551035017e-05, "loss": 0.0094, "step": 176680 }, { "epoch": 2.55, "learning_rate": 1.9151488511296546e-05, "loss": 0.0095, "step": 176690 }, { "epoch": 2.55, "learning_rate": 1.9151440471558075e-05, "loss": 0.0113, "step": 176700 }, { "epoch": 2.55, "learning_rate": 1.915139723579345e-05, "loss": 0.0055, "step": 176710 }, { "epoch": 2.55, "learning_rate": 1.915134919605498e-05, "loss": 0.0064, "step": 176720 }, { "epoch": 2.55, "learning_rate": 1.9151301156316505e-05, "loss": 0.011, "step": 176730 }, { "epoch": 2.55, "learning_rate": 1.9151253116578034e-05, "loss": 0.0052, "step": 176740 }, { "epoch": 2.55, "learning_rate": 1.9151205076839564e-05, "loss": 0.0077, "step": 176750 }, { "epoch": 2.55, "learning_rate": 1.9151157037101093e-05, "loss": 0.0092, "step": 176760 }, { "epoch": 2.55, "learning_rate": 1.915110899736262e-05, "loss": 0.0079, "step": 176770 }, { "epoch": 2.55, "learning_rate": 1.9151060957624148e-05, "loss": 0.0079, "step": 176780 }, { "epoch": 2.55, "learning_rate": 1.9151012917885677e-05, "loss": 0.0082, "step": 176790 }, { "epoch": 2.55, "learning_rate": 1.9150964878147203e-05, "loss": 0.0061, "step": 176800 }, { "epoch": 2.55, "learning_rate": 1.9150916838408733e-05, "loss": 0.0086, "step": 176810 }, { "epoch": 2.55, "learning_rate": 1.9150868798670262e-05, "loss": 0.0076, "step": 176820 }, { "epoch": 2.55, "learning_rate": 1.915082075893179e-05, "loss": 0.007, "step": 176830 }, { "epoch": 2.55, "learning_rate": 1.9150772719193317e-05, "loss": 0.0059, "step": 176840 }, { "epoch": 2.55, "learning_rate": 1.9150724679454846e-05, "loss": 0.0084, "step": 176850 }, { "epoch": 2.55, "learning_rate": 1.9150676639716376e-05, "loss": 0.0057, "step": 176860 }, { "epoch": 2.55, "learning_rate": 1.91506285999779e-05, "loss": 0.0075, "step": 176870 }, { "epoch": 2.55, "learning_rate": 1.915058056023943e-05, "loss": 0.0069, "step": 176880 }, { "epoch": 2.55, "learning_rate": 1.915053252050096e-05, "loss": 0.0086, "step": 176890 }, { "epoch": 2.55, "learning_rate": 1.915048448076249e-05, "loss": 0.0047, "step": 176900 }, { "epoch": 2.55, "learning_rate": 1.9150436441024015e-05, "loss": 0.0063, "step": 176910 }, { "epoch": 2.55, "learning_rate": 1.9150388401285544e-05, "loss": 0.0094, "step": 176920 }, { "epoch": 2.55, "learning_rate": 1.9150340361547074e-05, "loss": 0.0062, "step": 176930 }, { "epoch": 2.55, "learning_rate": 1.9150292321808603e-05, "loss": 0.0084, "step": 176940 }, { "epoch": 2.55, "learning_rate": 1.915024428207013e-05, "loss": 0.0052, "step": 176950 }, { "epoch": 2.55, "learning_rate": 1.9150196242331658e-05, "loss": 0.0042, "step": 176960 }, { "epoch": 2.55, "learning_rate": 1.9150148202593187e-05, "loss": 0.0051, "step": 176970 }, { "epoch": 2.55, "learning_rate": 1.9150100162854713e-05, "loss": 0.0042, "step": 176980 }, { "epoch": 2.55, "learning_rate": 1.9150052123116242e-05, "loss": 0.0063, "step": 176990 }, { "epoch": 2.55, "learning_rate": 1.9150004083377772e-05, "loss": 0.0085, "step": 177000 }, { "epoch": 2.55, "learning_rate": 1.91499560436393e-05, "loss": 0.0057, "step": 177010 }, { "epoch": 2.55, "learning_rate": 1.9149908003900827e-05, "loss": 0.0081, "step": 177020 }, { "epoch": 2.55, "learning_rate": 1.9149859964162356e-05, "loss": 0.0074, "step": 177030 }, { "epoch": 2.55, "learning_rate": 1.9149811924423885e-05, "loss": 0.0076, "step": 177040 }, { "epoch": 2.55, "learning_rate": 1.914976388468541e-05, "loss": 0.0067, "step": 177050 }, { "epoch": 2.55, "learning_rate": 1.914971584494694e-05, "loss": 0.0061, "step": 177060 }, { "epoch": 2.55, "learning_rate": 1.914966780520847e-05, "loss": 0.0084, "step": 177070 }, { "epoch": 2.55, "learning_rate": 1.914961976547e-05, "loss": 0.0055, "step": 177080 }, { "epoch": 2.55, "learning_rate": 1.9149571725731525e-05, "loss": 0.0088, "step": 177090 }, { "epoch": 2.55, "learning_rate": 1.9149523685993054e-05, "loss": 0.0061, "step": 177100 }, { "epoch": 2.55, "learning_rate": 1.9149475646254584e-05, "loss": 0.0085, "step": 177110 }, { "epoch": 2.55, "learning_rate": 1.914942760651611e-05, "loss": 0.0066, "step": 177120 }, { "epoch": 2.55, "learning_rate": 1.914937956677764e-05, "loss": 0.0064, "step": 177130 }, { "epoch": 2.55, "learning_rate": 1.9149331527039168e-05, "loss": 0.0073, "step": 177140 }, { "epoch": 2.55, "learning_rate": 1.9149283487300697e-05, "loss": 0.0074, "step": 177150 }, { "epoch": 2.55, "learning_rate": 1.9149235447562223e-05, "loss": 0.0067, "step": 177160 }, { "epoch": 2.55, "learning_rate": 1.9149187407823752e-05, "loss": 0.0076, "step": 177170 }, { "epoch": 2.55, "learning_rate": 1.914913936808528e-05, "loss": 0.007, "step": 177180 }, { "epoch": 2.55, "learning_rate": 1.914909132834681e-05, "loss": 0.0072, "step": 177190 }, { "epoch": 2.55, "learning_rate": 1.9149043288608337e-05, "loss": 0.0056, "step": 177200 }, { "epoch": 2.55, "learning_rate": 1.9148995248869866e-05, "loss": 0.006, "step": 177210 }, { "epoch": 2.55, "learning_rate": 1.9148947209131395e-05, "loss": 0.0072, "step": 177220 }, { "epoch": 2.55, "learning_rate": 1.914889916939292e-05, "loss": 0.0093, "step": 177230 }, { "epoch": 2.55, "learning_rate": 1.914885112965445e-05, "loss": 0.0076, "step": 177240 }, { "epoch": 2.55, "learning_rate": 1.914880308991598e-05, "loss": 0.0068, "step": 177250 }, { "epoch": 2.55, "learning_rate": 1.914875505017751e-05, "loss": 0.0073, "step": 177260 }, { "epoch": 2.55, "learning_rate": 1.9148707010439035e-05, "loss": 0.005, "step": 177270 }, { "epoch": 2.55, "learning_rate": 1.9148658970700564e-05, "loss": 0.0096, "step": 177280 }, { "epoch": 2.56, "learning_rate": 1.9148610930962093e-05, "loss": 0.007, "step": 177290 }, { "epoch": 2.56, "learning_rate": 1.914856289122362e-05, "loss": 0.0061, "step": 177300 }, { "epoch": 2.56, "learning_rate": 1.914851485148515e-05, "loss": 0.0086, "step": 177310 }, { "epoch": 2.56, "learning_rate": 1.9148466811746678e-05, "loss": 0.0093, "step": 177320 }, { "epoch": 2.56, "learning_rate": 1.9148418772008207e-05, "loss": 0.0052, "step": 177330 }, { "epoch": 2.56, "learning_rate": 1.9148370732269733e-05, "loss": 0.0085, "step": 177340 }, { "epoch": 2.56, "learning_rate": 1.9148322692531262e-05, "loss": 0.0063, "step": 177350 }, { "epoch": 2.56, "learning_rate": 1.914827465279279e-05, "loss": 0.0071, "step": 177360 }, { "epoch": 2.56, "learning_rate": 1.914822661305432e-05, "loss": 0.0056, "step": 177370 }, { "epoch": 2.56, "learning_rate": 1.9148178573315847e-05, "loss": 0.0083, "step": 177380 }, { "epoch": 2.56, "learning_rate": 1.9148130533577376e-05, "loss": 0.0073, "step": 177390 }, { "epoch": 2.56, "learning_rate": 1.9148082493838905e-05, "loss": 0.0058, "step": 177400 }, { "epoch": 2.56, "learning_rate": 1.914803445410043e-05, "loss": 0.0088, "step": 177410 }, { "epoch": 2.56, "learning_rate": 1.914798641436196e-05, "loss": 0.0062, "step": 177420 }, { "epoch": 2.56, "learning_rate": 1.914793837462349e-05, "loss": 0.0062, "step": 177430 }, { "epoch": 2.56, "learning_rate": 1.914789033488502e-05, "loss": 0.006, "step": 177440 }, { "epoch": 2.56, "learning_rate": 1.9147842295146545e-05, "loss": 0.0049, "step": 177450 }, { "epoch": 2.56, "learning_rate": 1.9147794255408074e-05, "loss": 0.0064, "step": 177460 }, { "epoch": 2.56, "learning_rate": 1.9147746215669603e-05, "loss": 0.0068, "step": 177470 }, { "epoch": 2.56, "learning_rate": 1.914769817593113e-05, "loss": 0.0086, "step": 177480 }, { "epoch": 2.56, "learning_rate": 1.914765013619266e-05, "loss": 0.0076, "step": 177490 }, { "epoch": 2.56, "learning_rate": 1.9147602096454188e-05, "loss": 0.0049, "step": 177500 }, { "epoch": 2.56, "learning_rate": 1.9147554056715717e-05, "loss": 0.0098, "step": 177510 }, { "epoch": 2.56, "learning_rate": 1.9147506016977243e-05, "loss": 0.0075, "step": 177520 }, { "epoch": 2.56, "learning_rate": 1.9147457977238772e-05, "loss": 0.0052, "step": 177530 }, { "epoch": 2.56, "learning_rate": 1.91474099375003e-05, "loss": 0.01, "step": 177540 }, { "epoch": 2.56, "learning_rate": 1.914736189776183e-05, "loss": 0.009, "step": 177550 }, { "epoch": 2.56, "learning_rate": 1.9147313858023357e-05, "loss": 0.0095, "step": 177560 }, { "epoch": 2.56, "learning_rate": 1.9147265818284886e-05, "loss": 0.0079, "step": 177570 }, { "epoch": 2.56, "learning_rate": 1.9147217778546415e-05, "loss": 0.0064, "step": 177580 }, { "epoch": 2.56, "learning_rate": 1.914716973880794e-05, "loss": 0.0093, "step": 177590 }, { "epoch": 2.56, "learning_rate": 1.914712169906947e-05, "loss": 0.0063, "step": 177600 }, { "epoch": 2.56, "learning_rate": 1.9147073659331e-05, "loss": 0.007, "step": 177610 }, { "epoch": 2.56, "learning_rate": 1.914702561959253e-05, "loss": 0.0081, "step": 177620 }, { "epoch": 2.56, "learning_rate": 1.9146977579854055e-05, "loss": 0.0089, "step": 177630 }, { "epoch": 2.56, "learning_rate": 1.9146929540115584e-05, "loss": 0.0078, "step": 177640 }, { "epoch": 2.56, "learning_rate": 1.9146881500377113e-05, "loss": 0.0071, "step": 177650 }, { "epoch": 2.56, "learning_rate": 1.914683346063864e-05, "loss": 0.0051, "step": 177660 }, { "epoch": 2.56, "learning_rate": 1.914678542090017e-05, "loss": 0.0091, "step": 177670 }, { "epoch": 2.56, "learning_rate": 1.9146737381161698e-05, "loss": 0.0092, "step": 177680 }, { "epoch": 2.56, "learning_rate": 1.9146689341423227e-05, "loss": 0.0081, "step": 177690 }, { "epoch": 2.56, "learning_rate": 1.9146641301684753e-05, "loss": 0.0074, "step": 177700 }, { "epoch": 2.56, "learning_rate": 1.9146593261946282e-05, "loss": 0.0065, "step": 177710 }, { "epoch": 2.56, "learning_rate": 1.914654522220781e-05, "loss": 0.0065, "step": 177720 }, { "epoch": 2.56, "learning_rate": 1.914649718246934e-05, "loss": 0.0068, "step": 177730 }, { "epoch": 2.56, "learning_rate": 1.914644914273087e-05, "loss": 0.0048, "step": 177740 }, { "epoch": 2.56, "learning_rate": 1.91464011029924e-05, "loss": 0.0082, "step": 177750 }, { "epoch": 2.56, "learning_rate": 1.9146353063253925e-05, "loss": 0.0096, "step": 177760 }, { "epoch": 2.56, "learning_rate": 1.9146305023515454e-05, "loss": 0.0054, "step": 177770 }, { "epoch": 2.56, "learning_rate": 1.9146256983776984e-05, "loss": 0.007, "step": 177780 }, { "epoch": 2.56, "learning_rate": 1.9146208944038513e-05, "loss": 0.0068, "step": 177790 }, { "epoch": 2.56, "learning_rate": 1.914616090430004e-05, "loss": 0.009, "step": 177800 }, { "epoch": 2.56, "learning_rate": 1.9146112864561568e-05, "loss": 0.0047, "step": 177810 }, { "epoch": 2.56, "learning_rate": 1.9146064824823097e-05, "loss": 0.0059, "step": 177820 }, { "epoch": 2.56, "learning_rate": 1.9146016785084623e-05, "loss": 0.0042, "step": 177830 }, { "epoch": 2.56, "learning_rate": 1.9145968745346152e-05, "loss": 0.0051, "step": 177840 }, { "epoch": 2.56, "learning_rate": 1.9145920705607682e-05, "loss": 0.0055, "step": 177850 }, { "epoch": 2.56, "learning_rate": 1.914587266586921e-05, "loss": 0.0078, "step": 177860 }, { "epoch": 2.56, "learning_rate": 1.9145824626130737e-05, "loss": 0.0071, "step": 177870 }, { "epoch": 2.56, "learning_rate": 1.9145776586392266e-05, "loss": 0.0061, "step": 177880 }, { "epoch": 2.56, "learning_rate": 1.9145728546653795e-05, "loss": 0.0074, "step": 177890 }, { "epoch": 2.56, "learning_rate": 1.914568050691532e-05, "loss": 0.0069, "step": 177900 }, { "epoch": 2.56, "learning_rate": 1.914563246717685e-05, "loss": 0.008, "step": 177910 }, { "epoch": 2.56, "learning_rate": 1.914558442743838e-05, "loss": 0.0073, "step": 177920 }, { "epoch": 2.56, "learning_rate": 1.914553638769991e-05, "loss": 0.0077, "step": 177930 }, { "epoch": 2.56, "learning_rate": 1.9145488347961435e-05, "loss": 0.0078, "step": 177940 }, { "epoch": 2.56, "learning_rate": 1.9145440308222964e-05, "loss": 0.0073, "step": 177950 }, { "epoch": 2.56, "learning_rate": 1.9145392268484494e-05, "loss": 0.0063, "step": 177960 }, { "epoch": 2.56, "learning_rate": 1.9145344228746023e-05, "loss": 0.0084, "step": 177970 }, { "epoch": 2.57, "learning_rate": 1.914529618900755e-05, "loss": 0.0066, "step": 177980 }, { "epoch": 2.57, "learning_rate": 1.9145248149269078e-05, "loss": 0.0057, "step": 177990 }, { "epoch": 2.57, "learning_rate": 1.9145200109530607e-05, "loss": 0.0091, "step": 178000 }, { "epoch": 2.57, "learning_rate": 1.9145152069792133e-05, "loss": 0.0058, "step": 178010 }, { "epoch": 2.57, "learning_rate": 1.9145104030053662e-05, "loss": 0.0077, "step": 178020 }, { "epoch": 2.57, "learning_rate": 1.914505599031519e-05, "loss": 0.0101, "step": 178030 }, { "epoch": 2.57, "learning_rate": 1.914500795057672e-05, "loss": 0.0064, "step": 178040 }, { "epoch": 2.57, "learning_rate": 1.9144959910838247e-05, "loss": 0.0079, "step": 178050 }, { "epoch": 2.57, "learning_rate": 1.9144911871099776e-05, "loss": 0.0078, "step": 178060 }, { "epoch": 2.57, "learning_rate": 1.9144863831361305e-05, "loss": 0.0095, "step": 178070 }, { "epoch": 2.57, "learning_rate": 1.914481579162283e-05, "loss": 0.0059, "step": 178080 }, { "epoch": 2.57, "learning_rate": 1.914476775188436e-05, "loss": 0.006, "step": 178090 }, { "epoch": 2.57, "learning_rate": 1.914471971214589e-05, "loss": 0.0064, "step": 178100 }, { "epoch": 2.57, "learning_rate": 1.914467167240742e-05, "loss": 0.007, "step": 178110 }, { "epoch": 2.57, "learning_rate": 1.9144623632668945e-05, "loss": 0.0061, "step": 178120 }, { "epoch": 2.57, "learning_rate": 1.9144575592930474e-05, "loss": 0.0071, "step": 178130 }, { "epoch": 2.57, "learning_rate": 1.9144527553192003e-05, "loss": 0.0048, "step": 178140 }, { "epoch": 2.57, "learning_rate": 1.9144479513453533e-05, "loss": 0.0055, "step": 178150 }, { "epoch": 2.57, "learning_rate": 1.914443147371506e-05, "loss": 0.0074, "step": 178160 }, { "epoch": 2.57, "learning_rate": 1.9144383433976588e-05, "loss": 0.0067, "step": 178170 }, { "epoch": 2.57, "learning_rate": 1.9144335394238117e-05, "loss": 0.0048, "step": 178180 }, { "epoch": 2.57, "learning_rate": 1.9144287354499643e-05, "loss": 0.0068, "step": 178190 }, { "epoch": 2.57, "learning_rate": 1.9144239314761172e-05, "loss": 0.0083, "step": 178200 }, { "epoch": 2.57, "learning_rate": 1.91441912750227e-05, "loss": 0.0082, "step": 178210 }, { "epoch": 2.57, "learning_rate": 1.914414323528423e-05, "loss": 0.0077, "step": 178220 }, { "epoch": 2.57, "learning_rate": 1.9144095195545757e-05, "loss": 0.007, "step": 178230 }, { "epoch": 2.57, "learning_rate": 1.9144047155807286e-05, "loss": 0.0099, "step": 178240 }, { "epoch": 2.57, "learning_rate": 1.9143999116068815e-05, "loss": 0.008, "step": 178250 }, { "epoch": 2.57, "learning_rate": 1.914395107633034e-05, "loss": 0.008, "step": 178260 }, { "epoch": 2.57, "learning_rate": 1.914390303659187e-05, "loss": 0.0087, "step": 178270 }, { "epoch": 2.57, "learning_rate": 1.91438549968534e-05, "loss": 0.0079, "step": 178280 }, { "epoch": 2.57, "learning_rate": 1.914380695711493e-05, "loss": 0.0068, "step": 178290 }, { "epoch": 2.57, "learning_rate": 1.9143758917376455e-05, "loss": 0.0071, "step": 178300 }, { "epoch": 2.57, "learning_rate": 1.9143710877637984e-05, "loss": 0.0089, "step": 178310 }, { "epoch": 2.57, "learning_rate": 1.9143662837899513e-05, "loss": 0.0075, "step": 178320 }, { "epoch": 2.57, "learning_rate": 1.9143614798161043e-05, "loss": 0.0053, "step": 178330 }, { "epoch": 2.57, "learning_rate": 1.914356675842257e-05, "loss": 0.0072, "step": 178340 }, { "epoch": 2.57, "learning_rate": 1.9143518718684098e-05, "loss": 0.0084, "step": 178350 }, { "epoch": 2.57, "learning_rate": 1.9143470678945627e-05, "loss": 0.0061, "step": 178360 }, { "epoch": 2.57, "learning_rate": 1.9143422639207153e-05, "loss": 0.0093, "step": 178370 }, { "epoch": 2.57, "learning_rate": 1.9143374599468682e-05, "loss": 0.009, "step": 178380 }, { "epoch": 2.57, "learning_rate": 1.914332655973021e-05, "loss": 0.0066, "step": 178390 }, { "epoch": 2.57, "learning_rate": 1.914327851999174e-05, "loss": 0.0077, "step": 178400 }, { "epoch": 2.57, "learning_rate": 1.9143230480253267e-05, "loss": 0.0082, "step": 178410 }, { "epoch": 2.57, "learning_rate": 1.9143182440514796e-05, "loss": 0.0047, "step": 178420 }, { "epoch": 2.57, "learning_rate": 1.9143134400776325e-05, "loss": 0.0088, "step": 178430 }, { "epoch": 2.57, "learning_rate": 1.914308636103785e-05, "loss": 0.0095, "step": 178440 }, { "epoch": 2.57, "learning_rate": 1.914303832129938e-05, "loss": 0.0067, "step": 178450 }, { "epoch": 2.57, "learning_rate": 1.914299028156091e-05, "loss": 0.0057, "step": 178460 }, { "epoch": 2.57, "learning_rate": 1.914294224182244e-05, "loss": 0.0059, "step": 178470 }, { "epoch": 2.57, "learning_rate": 1.9142894202083965e-05, "loss": 0.0066, "step": 178480 }, { "epoch": 2.57, "learning_rate": 1.9142846162345494e-05, "loss": 0.0059, "step": 178490 }, { "epoch": 2.57, "learning_rate": 1.9142798122607023e-05, "loss": 0.004, "step": 178500 }, { "epoch": 2.57, "learning_rate": 1.914275008286855e-05, "loss": 0.0055, "step": 178510 }, { "epoch": 2.57, "learning_rate": 1.914270204313008e-05, "loss": 0.0063, "step": 178520 }, { "epoch": 2.57, "learning_rate": 1.9142654003391608e-05, "loss": 0.008, "step": 178530 }, { "epoch": 2.57, "learning_rate": 1.9142605963653137e-05, "loss": 0.0064, "step": 178540 }, { "epoch": 2.57, "learning_rate": 1.9142557923914663e-05, "loss": 0.0062, "step": 178550 }, { "epoch": 2.57, "learning_rate": 1.9142509884176192e-05, "loss": 0.008, "step": 178560 }, { "epoch": 2.57, "learning_rate": 1.914246184443772e-05, "loss": 0.006, "step": 178570 }, { "epoch": 2.57, "learning_rate": 1.914241380469925e-05, "loss": 0.0058, "step": 178580 }, { "epoch": 2.57, "learning_rate": 1.9142365764960777e-05, "loss": 0.0096, "step": 178590 }, { "epoch": 2.57, "learning_rate": 1.9142317725222306e-05, "loss": 0.0085, "step": 178600 }, { "epoch": 2.57, "learning_rate": 1.9142269685483835e-05, "loss": 0.0092, "step": 178610 }, { "epoch": 2.57, "learning_rate": 1.914222164574536e-05, "loss": 0.0078, "step": 178620 }, { "epoch": 2.57, "learning_rate": 1.914217360600689e-05, "loss": 0.0079, "step": 178630 }, { "epoch": 2.57, "learning_rate": 1.914212556626842e-05, "loss": 0.0057, "step": 178640 }, { "epoch": 2.57, "learning_rate": 1.914207752652995e-05, "loss": 0.0098, "step": 178650 }, { "epoch": 2.57, "learning_rate": 1.9142029486791475e-05, "loss": 0.0053, "step": 178660 }, { "epoch": 2.57, "learning_rate": 1.9141981447053004e-05, "loss": 0.0073, "step": 178670 }, { "epoch": 2.58, "learning_rate": 1.9141933407314533e-05, "loss": 0.0053, "step": 178680 }, { "epoch": 2.58, "learning_rate": 1.914188536757606e-05, "loss": 0.0067, "step": 178690 }, { "epoch": 2.58, "learning_rate": 1.914183732783759e-05, "loss": 0.0057, "step": 178700 }, { "epoch": 2.58, "learning_rate": 1.9141789288099118e-05, "loss": 0.0069, "step": 178710 }, { "epoch": 2.58, "learning_rate": 1.9141741248360647e-05, "loss": 0.0063, "step": 178720 }, { "epoch": 2.58, "learning_rate": 1.9141693208622173e-05, "loss": 0.0056, "step": 178730 }, { "epoch": 2.58, "learning_rate": 1.9141645168883702e-05, "loss": 0.0066, "step": 178740 }, { "epoch": 2.58, "learning_rate": 1.914159712914523e-05, "loss": 0.0068, "step": 178750 }, { "epoch": 2.58, "learning_rate": 1.914154908940676e-05, "loss": 0.0057, "step": 178760 }, { "epoch": 2.58, "learning_rate": 1.9141501049668286e-05, "loss": 0.0074, "step": 178770 }, { "epoch": 2.58, "learning_rate": 1.9141453009929816e-05, "loss": 0.0102, "step": 178780 }, { "epoch": 2.58, "learning_rate": 1.9141404970191345e-05, "loss": 0.0097, "step": 178790 }, { "epoch": 2.58, "learning_rate": 1.914135693045287e-05, "loss": 0.0075, "step": 178800 }, { "epoch": 2.58, "learning_rate": 1.91413088907144e-05, "loss": 0.0052, "step": 178810 }, { "epoch": 2.58, "learning_rate": 1.914126085097593e-05, "loss": 0.0082, "step": 178820 }, { "epoch": 2.58, "learning_rate": 1.914121281123746e-05, "loss": 0.0053, "step": 178830 }, { "epoch": 2.58, "learning_rate": 1.9141164771498985e-05, "loss": 0.0104, "step": 178840 }, { "epoch": 2.58, "learning_rate": 1.9141116731760514e-05, "loss": 0.0107, "step": 178850 }, { "epoch": 2.58, "learning_rate": 1.9141068692022043e-05, "loss": 0.0064, "step": 178860 }, { "epoch": 2.58, "learning_rate": 1.914102065228357e-05, "loss": 0.0092, "step": 178870 }, { "epoch": 2.58, "learning_rate": 1.9140972612545098e-05, "loss": 0.01, "step": 178880 }, { "epoch": 2.58, "learning_rate": 1.9140929376780476e-05, "loss": 0.0077, "step": 178890 }, { "epoch": 2.58, "learning_rate": 1.9140881337042002e-05, "loss": 0.0072, "step": 178900 }, { "epoch": 2.58, "learning_rate": 1.914083329730353e-05, "loss": 0.0101, "step": 178910 }, { "epoch": 2.58, "learning_rate": 1.914078525756506e-05, "loss": 0.0066, "step": 178920 }, { "epoch": 2.58, "learning_rate": 1.9140737217826587e-05, "loss": 0.008, "step": 178930 }, { "epoch": 2.58, "learning_rate": 1.9140689178088116e-05, "loss": 0.0056, "step": 178940 }, { "epoch": 2.58, "learning_rate": 1.9140641138349645e-05, "loss": 0.0071, "step": 178950 }, { "epoch": 2.58, "learning_rate": 1.9140593098611174e-05, "loss": 0.0095, "step": 178960 }, { "epoch": 2.58, "learning_rate": 1.91405450588727e-05, "loss": 0.0074, "step": 178970 }, { "epoch": 2.58, "learning_rate": 1.914049701913423e-05, "loss": 0.0058, "step": 178980 }, { "epoch": 2.58, "learning_rate": 1.914044897939576e-05, "loss": 0.0062, "step": 178990 }, { "epoch": 2.58, "learning_rate": 1.9140400939657288e-05, "loss": 0.01, "step": 179000 }, { "epoch": 2.58, "learning_rate": 1.9140352899918814e-05, "loss": 0.0049, "step": 179010 }, { "epoch": 2.58, "learning_rate": 1.9140304860180343e-05, "loss": 0.0077, "step": 179020 }, { "epoch": 2.58, "learning_rate": 1.9140256820441873e-05, "loss": 0.0056, "step": 179030 }, { "epoch": 2.58, "learning_rate": 1.91402087807034e-05, "loss": 0.0079, "step": 179040 }, { "epoch": 2.58, "learning_rate": 1.9140160740964928e-05, "loss": 0.0051, "step": 179050 }, { "epoch": 2.58, "learning_rate": 1.9140112701226457e-05, "loss": 0.007, "step": 179060 }, { "epoch": 2.58, "learning_rate": 1.9140064661487986e-05, "loss": 0.0116, "step": 179070 }, { "epoch": 2.58, "learning_rate": 1.9140016621749512e-05, "loss": 0.0083, "step": 179080 }, { "epoch": 2.58, "learning_rate": 1.913996858201104e-05, "loss": 0.0054, "step": 179090 }, { "epoch": 2.58, "learning_rate": 1.913992054227257e-05, "loss": 0.0071, "step": 179100 }, { "epoch": 2.58, "learning_rate": 1.9139872502534097e-05, "loss": 0.0091, "step": 179110 }, { "epoch": 2.58, "learning_rate": 1.9139824462795626e-05, "loss": 0.0072, "step": 179120 }, { "epoch": 2.58, "learning_rate": 1.9139776423057155e-05, "loss": 0.0061, "step": 179130 }, { "epoch": 2.58, "learning_rate": 1.9139728383318684e-05, "loss": 0.0086, "step": 179140 }, { "epoch": 2.58, "learning_rate": 1.913968034358021e-05, "loss": 0.0081, "step": 179150 }, { "epoch": 2.58, "learning_rate": 1.913963230384174e-05, "loss": 0.0076, "step": 179160 }, { "epoch": 2.58, "learning_rate": 1.913958426410327e-05, "loss": 0.0129, "step": 179170 }, { "epoch": 2.58, "learning_rate": 1.9139536224364798e-05, "loss": 0.0052, "step": 179180 }, { "epoch": 2.58, "learning_rate": 1.9139488184626324e-05, "loss": 0.0067, "step": 179190 }, { "epoch": 2.58, "learning_rate": 1.9139440144887853e-05, "loss": 0.01, "step": 179200 }, { "epoch": 2.58, "learning_rate": 1.9139392105149382e-05, "loss": 0.0079, "step": 179210 }, { "epoch": 2.58, "learning_rate": 1.913934406541091e-05, "loss": 0.0091, "step": 179220 }, { "epoch": 2.58, "learning_rate": 1.9139296025672438e-05, "loss": 0.0076, "step": 179230 }, { "epoch": 2.58, "learning_rate": 1.9139247985933967e-05, "loss": 0.0102, "step": 179240 }, { "epoch": 2.58, "learning_rate": 1.9139199946195496e-05, "loss": 0.0102, "step": 179250 }, { "epoch": 2.58, "learning_rate": 1.9139151906457022e-05, "loss": 0.0063, "step": 179260 }, { "epoch": 2.58, "learning_rate": 1.913910386671855e-05, "loss": 0.0049, "step": 179270 }, { "epoch": 2.58, "learning_rate": 1.913905582698008e-05, "loss": 0.0093, "step": 179280 }, { "epoch": 2.58, "learning_rate": 1.9139007787241606e-05, "loss": 0.0072, "step": 179290 }, { "epoch": 2.58, "learning_rate": 1.9138959747503136e-05, "loss": 0.0132, "step": 179300 }, { "epoch": 2.58, "learning_rate": 1.9138911707764665e-05, "loss": 0.0061, "step": 179310 }, { "epoch": 2.58, "learning_rate": 1.9138863668026194e-05, "loss": 0.0063, "step": 179320 }, { "epoch": 2.58, "learning_rate": 1.913881562828772e-05, "loss": 0.0092, "step": 179330 }, { "epoch": 2.58, "learning_rate": 1.913876758854925e-05, "loss": 0.0092, "step": 179340 }, { "epoch": 2.58, "learning_rate": 1.913871954881078e-05, "loss": 0.0077, "step": 179350 }, { "epoch": 2.58, "learning_rate": 1.9138671509072308e-05, "loss": 0.009, "step": 179360 }, { "epoch": 2.59, "learning_rate": 1.9138623469333834e-05, "loss": 0.0065, "step": 179370 }, { "epoch": 2.59, "learning_rate": 1.9138575429595363e-05, "loss": 0.01, "step": 179380 }, { "epoch": 2.59, "learning_rate": 1.9138527389856892e-05, "loss": 0.0082, "step": 179390 }, { "epoch": 2.59, "learning_rate": 1.9138479350118418e-05, "loss": 0.0038, "step": 179400 }, { "epoch": 2.59, "learning_rate": 1.9138431310379948e-05, "loss": 0.0076, "step": 179410 }, { "epoch": 2.59, "learning_rate": 1.9138383270641477e-05, "loss": 0.0087, "step": 179420 }, { "epoch": 2.59, "learning_rate": 1.9138335230903006e-05, "loss": 0.0074, "step": 179430 }, { "epoch": 2.59, "learning_rate": 1.9138287191164532e-05, "loss": 0.0052, "step": 179440 }, { "epoch": 2.59, "learning_rate": 1.913823915142606e-05, "loss": 0.0062, "step": 179450 }, { "epoch": 2.59, "learning_rate": 1.913819111168759e-05, "loss": 0.0081, "step": 179460 }, { "epoch": 2.59, "learning_rate": 1.9138143071949116e-05, "loss": 0.0078, "step": 179470 }, { "epoch": 2.59, "learning_rate": 1.9138095032210646e-05, "loss": 0.0064, "step": 179480 }, { "epoch": 2.59, "learning_rate": 1.9138046992472175e-05, "loss": 0.0047, "step": 179490 }, { "epoch": 2.59, "learning_rate": 1.9137998952733704e-05, "loss": 0.0083, "step": 179500 }, { "epoch": 2.59, "learning_rate": 1.913795091299523e-05, "loss": 0.0083, "step": 179510 }, { "epoch": 2.59, "learning_rate": 1.913790287325676e-05, "loss": 0.0085, "step": 179520 }, { "epoch": 2.59, "learning_rate": 1.913785483351829e-05, "loss": 0.0065, "step": 179530 }, { "epoch": 2.59, "learning_rate": 1.9137806793779818e-05, "loss": 0.0073, "step": 179540 }, { "epoch": 2.59, "learning_rate": 1.9137758754041344e-05, "loss": 0.0048, "step": 179550 }, { "epoch": 2.59, "learning_rate": 1.9137710714302873e-05, "loss": 0.0115, "step": 179560 }, { "epoch": 2.59, "learning_rate": 1.9137662674564402e-05, "loss": 0.0075, "step": 179570 }, { "epoch": 2.59, "learning_rate": 1.9137614634825928e-05, "loss": 0.0078, "step": 179580 }, { "epoch": 2.59, "learning_rate": 1.9137566595087457e-05, "loss": 0.0091, "step": 179590 }, { "epoch": 2.59, "learning_rate": 1.9137518555348987e-05, "loss": 0.0096, "step": 179600 }, { "epoch": 2.59, "learning_rate": 1.9137470515610516e-05, "loss": 0.0094, "step": 179610 }, { "epoch": 2.59, "learning_rate": 1.9137422475872042e-05, "loss": 0.0083, "step": 179620 }, { "epoch": 2.59, "learning_rate": 1.913737443613357e-05, "loss": 0.0056, "step": 179630 }, { "epoch": 2.59, "learning_rate": 1.91373263963951e-05, "loss": 0.0077, "step": 179640 }, { "epoch": 2.59, "learning_rate": 1.9137278356656626e-05, "loss": 0.0065, "step": 179650 }, { "epoch": 2.59, "learning_rate": 1.9137230316918156e-05, "loss": 0.0069, "step": 179660 }, { "epoch": 2.59, "learning_rate": 1.9137182277179685e-05, "loss": 0.0094, "step": 179670 }, { "epoch": 2.59, "learning_rate": 1.9137134237441214e-05, "loss": 0.0088, "step": 179680 }, { "epoch": 2.59, "learning_rate": 1.913708619770274e-05, "loss": 0.0048, "step": 179690 }, { "epoch": 2.59, "learning_rate": 1.913703815796427e-05, "loss": 0.0064, "step": 179700 }, { "epoch": 2.59, "learning_rate": 1.91369901182258e-05, "loss": 0.0083, "step": 179710 }, { "epoch": 2.59, "learning_rate": 1.9136942078487328e-05, "loss": 0.007, "step": 179720 }, { "epoch": 2.59, "learning_rate": 1.9136894038748854e-05, "loss": 0.0083, "step": 179730 }, { "epoch": 2.59, "learning_rate": 1.9136845999010383e-05, "loss": 0.0084, "step": 179740 }, { "epoch": 2.59, "learning_rate": 1.9136797959271912e-05, "loss": 0.0058, "step": 179750 }, { "epoch": 2.59, "learning_rate": 1.9136749919533438e-05, "loss": 0.0135, "step": 179760 }, { "epoch": 2.59, "learning_rate": 1.9136701879794967e-05, "loss": 0.0056, "step": 179770 }, { "epoch": 2.59, "learning_rate": 1.9136653840056497e-05, "loss": 0.0082, "step": 179780 }, { "epoch": 2.59, "learning_rate": 1.9136605800318026e-05, "loss": 0.0058, "step": 179790 }, { "epoch": 2.59, "learning_rate": 1.9136557760579552e-05, "loss": 0.0053, "step": 179800 }, { "epoch": 2.59, "learning_rate": 1.913650972084108e-05, "loss": 0.0063, "step": 179810 }, { "epoch": 2.59, "learning_rate": 1.913646168110261e-05, "loss": 0.0062, "step": 179820 }, { "epoch": 2.59, "learning_rate": 1.9136413641364136e-05, "loss": 0.0074, "step": 179830 }, { "epoch": 2.59, "learning_rate": 1.9136365601625665e-05, "loss": 0.0066, "step": 179840 }, { "epoch": 2.59, "learning_rate": 1.9136317561887195e-05, "loss": 0.0081, "step": 179850 }, { "epoch": 2.59, "learning_rate": 1.9136269522148724e-05, "loss": 0.0069, "step": 179860 }, { "epoch": 2.59, "learning_rate": 1.913622148241025e-05, "loss": 0.0071, "step": 179870 }, { "epoch": 2.59, "learning_rate": 1.913617344267178e-05, "loss": 0.0075, "step": 179880 }, { "epoch": 2.59, "learning_rate": 1.913612540293331e-05, "loss": 0.0064, "step": 179890 }, { "epoch": 2.59, "learning_rate": 1.9136077363194838e-05, "loss": 0.0086, "step": 179900 }, { "epoch": 2.59, "learning_rate": 1.9136029323456364e-05, "loss": 0.0062, "step": 179910 }, { "epoch": 2.59, "learning_rate": 1.9135981283717893e-05, "loss": 0.006, "step": 179920 }, { "epoch": 2.59, "learning_rate": 1.9135933243979422e-05, "loss": 0.0092, "step": 179930 }, { "epoch": 2.59, "learning_rate": 1.9135885204240948e-05, "loss": 0.0087, "step": 179940 }, { "epoch": 2.59, "learning_rate": 1.9135837164502477e-05, "loss": 0.0078, "step": 179950 }, { "epoch": 2.59, "learning_rate": 1.9135789124764007e-05, "loss": 0.0048, "step": 179960 }, { "epoch": 2.59, "learning_rate": 1.9135741085025536e-05, "loss": 0.0051, "step": 179970 }, { "epoch": 2.59, "learning_rate": 1.913569304528706e-05, "loss": 0.0073, "step": 179980 }, { "epoch": 2.59, "learning_rate": 1.913564500554859e-05, "loss": 0.0049, "step": 179990 }, { "epoch": 2.59, "learning_rate": 1.913559696581012e-05, "loss": 0.008, "step": 180000 }, { "epoch": 2.59, "learning_rate": 1.9135548926071646e-05, "loss": 0.0068, "step": 180010 }, { "epoch": 2.59, "learning_rate": 1.9135500886333175e-05, "loss": 0.0101, "step": 180020 }, { "epoch": 2.59, "learning_rate": 1.9135452846594705e-05, "loss": 0.0071, "step": 180030 }, { "epoch": 2.59, "learning_rate": 1.9135404806856234e-05, "loss": 0.0048, "step": 180040 }, { "epoch": 2.59, "learning_rate": 1.913535676711776e-05, "loss": 0.01, "step": 180050 }, { "epoch": 2.6, "learning_rate": 1.913530872737929e-05, "loss": 0.0073, "step": 180060 }, { "epoch": 2.6, "learning_rate": 1.913526068764082e-05, "loss": 0.0074, "step": 180070 }, { "epoch": 2.6, "learning_rate": 1.9135212647902344e-05, "loss": 0.0074, "step": 180080 }, { "epoch": 2.6, "learning_rate": 1.9135164608163873e-05, "loss": 0.0083, "step": 180090 }, { "epoch": 2.6, "learning_rate": 1.9135116568425403e-05, "loss": 0.0068, "step": 180100 }, { "epoch": 2.6, "learning_rate": 1.9135068528686932e-05, "loss": 0.006, "step": 180110 }, { "epoch": 2.6, "learning_rate": 1.9135020488948458e-05, "loss": 0.0061, "step": 180120 }, { "epoch": 2.6, "learning_rate": 1.9134972449209987e-05, "loss": 0.0075, "step": 180130 }, { "epoch": 2.6, "learning_rate": 1.9134924409471516e-05, "loss": 0.0067, "step": 180140 }, { "epoch": 2.6, "learning_rate": 1.9134876369733046e-05, "loss": 0.0064, "step": 180150 }, { "epoch": 2.6, "learning_rate": 1.913482832999457e-05, "loss": 0.0065, "step": 180160 }, { "epoch": 2.6, "learning_rate": 1.91347802902561e-05, "loss": 0.0043, "step": 180170 }, { "epoch": 2.6, "learning_rate": 1.913473225051763e-05, "loss": 0.0073, "step": 180180 }, { "epoch": 2.6, "learning_rate": 1.9134684210779156e-05, "loss": 0.0099, "step": 180190 }, { "epoch": 2.6, "learning_rate": 1.9134636171040685e-05, "loss": 0.0061, "step": 180200 }, { "epoch": 2.6, "learning_rate": 1.9134588131302215e-05, "loss": 0.0085, "step": 180210 }, { "epoch": 2.6, "learning_rate": 1.9134540091563744e-05, "loss": 0.0063, "step": 180220 }, { "epoch": 2.6, "learning_rate": 1.913449205182527e-05, "loss": 0.0053, "step": 180230 }, { "epoch": 2.6, "learning_rate": 1.91344440120868e-05, "loss": 0.0087, "step": 180240 }, { "epoch": 2.6, "learning_rate": 1.9134395972348328e-05, "loss": 0.0083, "step": 180250 }, { "epoch": 2.6, "learning_rate": 1.9134347932609854e-05, "loss": 0.0093, "step": 180260 }, { "epoch": 2.6, "learning_rate": 1.9134299892871383e-05, "loss": 0.0052, "step": 180270 }, { "epoch": 2.6, "learning_rate": 1.9134251853132913e-05, "loss": 0.0048, "step": 180280 }, { "epoch": 2.6, "learning_rate": 1.9134203813394442e-05, "loss": 0.009, "step": 180290 }, { "epoch": 2.6, "learning_rate": 1.9134155773655968e-05, "loss": 0.0046, "step": 180300 }, { "epoch": 2.6, "learning_rate": 1.9134107733917497e-05, "loss": 0.0056, "step": 180310 }, { "epoch": 2.6, "learning_rate": 1.9134059694179026e-05, "loss": 0.005, "step": 180320 }, { "epoch": 2.6, "learning_rate": 1.9134011654440556e-05, "loss": 0.0049, "step": 180330 }, { "epoch": 2.6, "learning_rate": 1.913396361470208e-05, "loss": 0.0045, "step": 180340 }, { "epoch": 2.6, "learning_rate": 1.913391557496361e-05, "loss": 0.0073, "step": 180350 }, { "epoch": 2.6, "learning_rate": 1.913386753522514e-05, "loss": 0.0097, "step": 180360 }, { "epoch": 2.6, "learning_rate": 1.9133819495486666e-05, "loss": 0.0096, "step": 180370 }, { "epoch": 2.6, "learning_rate": 1.9133771455748195e-05, "loss": 0.0063, "step": 180380 }, { "epoch": 2.6, "learning_rate": 1.9133723416009724e-05, "loss": 0.0062, "step": 180390 }, { "epoch": 2.6, "learning_rate": 1.9133675376271254e-05, "loss": 0.009, "step": 180400 }, { "epoch": 2.6, "learning_rate": 1.913362733653278e-05, "loss": 0.0043, "step": 180410 }, { "epoch": 2.6, "learning_rate": 1.913357929679431e-05, "loss": 0.0087, "step": 180420 }, { "epoch": 2.6, "learning_rate": 1.9133531257055838e-05, "loss": 0.0056, "step": 180430 }, { "epoch": 2.6, "learning_rate": 1.9133483217317364e-05, "loss": 0.0064, "step": 180440 }, { "epoch": 2.6, "learning_rate": 1.9133435177578893e-05, "loss": 0.0056, "step": 180450 }, { "epoch": 2.6, "learning_rate": 1.9133387137840423e-05, "loss": 0.005, "step": 180460 }, { "epoch": 2.6, "learning_rate": 1.9133339098101952e-05, "loss": 0.0122, "step": 180470 }, { "epoch": 2.6, "learning_rate": 1.9133291058363478e-05, "loss": 0.0068, "step": 180480 }, { "epoch": 2.6, "learning_rate": 1.9133243018625007e-05, "loss": 0.0085, "step": 180490 }, { "epoch": 2.6, "learning_rate": 1.9133194978886536e-05, "loss": 0.0086, "step": 180500 }, { "epoch": 2.6, "learning_rate": 1.9133146939148066e-05, "loss": 0.009, "step": 180510 }, { "epoch": 2.6, "learning_rate": 1.913309889940959e-05, "loss": 0.0069, "step": 180520 }, { "epoch": 2.6, "learning_rate": 1.913305085967112e-05, "loss": 0.0101, "step": 180530 }, { "epoch": 2.6, "learning_rate": 1.913300281993265e-05, "loss": 0.007, "step": 180540 }, { "epoch": 2.6, "learning_rate": 1.9132954780194176e-05, "loss": 0.0066, "step": 180550 }, { "epoch": 2.6, "learning_rate": 1.9132906740455705e-05, "loss": 0.0056, "step": 180560 }, { "epoch": 2.6, "learning_rate": 1.9132858700717234e-05, "loss": 0.0103, "step": 180570 }, { "epoch": 2.6, "learning_rate": 1.9132810660978764e-05, "loss": 0.007, "step": 180580 }, { "epoch": 2.6, "learning_rate": 1.913276262124029e-05, "loss": 0.0079, "step": 180590 }, { "epoch": 2.6, "learning_rate": 1.913271458150182e-05, "loss": 0.006, "step": 180600 }, { "epoch": 2.6, "learning_rate": 1.9132666541763348e-05, "loss": 0.007, "step": 180610 }, { "epoch": 2.6, "learning_rate": 1.9132618502024874e-05, "loss": 0.0163, "step": 180620 }, { "epoch": 2.6, "learning_rate": 1.9132570462286403e-05, "loss": 0.0066, "step": 180630 }, { "epoch": 2.6, "learning_rate": 1.9132522422547932e-05, "loss": 0.0069, "step": 180640 }, { "epoch": 2.6, "learning_rate": 1.9132474382809462e-05, "loss": 0.0065, "step": 180650 }, { "epoch": 2.6, "learning_rate": 1.9132426343070988e-05, "loss": 0.0065, "step": 180660 }, { "epoch": 2.6, "learning_rate": 1.9132378303332517e-05, "loss": 0.0062, "step": 180670 }, { "epoch": 2.6, "learning_rate": 1.9132330263594046e-05, "loss": 0.0083, "step": 180680 }, { "epoch": 2.6, "learning_rate": 1.9132282223855575e-05, "loss": 0.0064, "step": 180690 }, { "epoch": 2.6, "learning_rate": 1.91322341841171e-05, "loss": 0.0059, "step": 180700 }, { "epoch": 2.6, "learning_rate": 1.913218614437863e-05, "loss": 0.0068, "step": 180710 }, { "epoch": 2.6, "learning_rate": 1.913213810464016e-05, "loss": 0.0082, "step": 180720 }, { "epoch": 2.6, "learning_rate": 1.9132090064901686e-05, "loss": 0.0055, "step": 180730 }, { "epoch": 2.6, "learning_rate": 1.9132042025163215e-05, "loss": 0.008, "step": 180740 }, { "epoch": 2.6, "learning_rate": 1.9131993985424744e-05, "loss": 0.0063, "step": 180750 }, { "epoch": 2.61, "learning_rate": 1.9131945945686274e-05, "loss": 0.0071, "step": 180760 }, { "epoch": 2.61, "learning_rate": 1.91318979059478e-05, "loss": 0.0065, "step": 180770 }, { "epoch": 2.61, "learning_rate": 1.913184986620933e-05, "loss": 0.003, "step": 180780 }, { "epoch": 2.61, "learning_rate": 1.9131801826470858e-05, "loss": 0.0085, "step": 180790 }, { "epoch": 2.61, "learning_rate": 1.9131753786732387e-05, "loss": 0.0073, "step": 180800 }, { "epoch": 2.61, "learning_rate": 1.9131705746993917e-05, "loss": 0.0075, "step": 180810 }, { "epoch": 2.61, "learning_rate": 1.9131657707255446e-05, "loss": 0.0043, "step": 180820 }, { "epoch": 2.61, "learning_rate": 1.913160966751697e-05, "loss": 0.0062, "step": 180830 }, { "epoch": 2.61, "learning_rate": 1.91315616277785e-05, "loss": 0.0053, "step": 180840 }, { "epoch": 2.61, "learning_rate": 1.913151358804003e-05, "loss": 0.0073, "step": 180850 }, { "epoch": 2.61, "learning_rate": 1.9131465548301556e-05, "loss": 0.005, "step": 180860 }, { "epoch": 2.61, "learning_rate": 1.9131417508563085e-05, "loss": 0.0095, "step": 180870 }, { "epoch": 2.61, "learning_rate": 1.9131369468824615e-05, "loss": 0.0076, "step": 180880 }, { "epoch": 2.61, "learning_rate": 1.9131321429086144e-05, "loss": 0.0059, "step": 180890 }, { "epoch": 2.61, "learning_rate": 1.913127338934767e-05, "loss": 0.0087, "step": 180900 }, { "epoch": 2.61, "learning_rate": 1.91312253496092e-05, "loss": 0.0057, "step": 180910 }, { "epoch": 2.61, "learning_rate": 1.913117730987073e-05, "loss": 0.009, "step": 180920 }, { "epoch": 2.61, "learning_rate": 1.9131129270132258e-05, "loss": 0.0071, "step": 180930 }, { "epoch": 2.61, "learning_rate": 1.9131081230393783e-05, "loss": 0.0062, "step": 180940 }, { "epoch": 2.61, "learning_rate": 1.9131033190655313e-05, "loss": 0.0073, "step": 180950 }, { "epoch": 2.61, "learning_rate": 1.9130985150916842e-05, "loss": 0.0075, "step": 180960 }, { "epoch": 2.61, "learning_rate": 1.9130937111178368e-05, "loss": 0.006, "step": 180970 }, { "epoch": 2.61, "learning_rate": 1.9130889071439897e-05, "loss": 0.0074, "step": 180980 }, { "epoch": 2.61, "learning_rate": 1.9130841031701426e-05, "loss": 0.0058, "step": 180990 }, { "epoch": 2.61, "learning_rate": 1.9130792991962956e-05, "loss": 0.0073, "step": 181000 }, { "epoch": 2.61, "learning_rate": 1.913074495222448e-05, "loss": 0.0084, "step": 181010 }, { "epoch": 2.61, "learning_rate": 1.913069691248601e-05, "loss": 0.0054, "step": 181020 }, { "epoch": 2.61, "learning_rate": 1.913064887274754e-05, "loss": 0.0086, "step": 181030 }, { "epoch": 2.61, "learning_rate": 1.9130600833009066e-05, "loss": 0.0088, "step": 181040 }, { "epoch": 2.61, "learning_rate": 1.9130552793270595e-05, "loss": 0.0064, "step": 181050 }, { "epoch": 2.61, "learning_rate": 1.9130504753532125e-05, "loss": 0.0089, "step": 181060 }, { "epoch": 2.61, "learning_rate": 1.9130456713793654e-05, "loss": 0.0059, "step": 181070 }, { "epoch": 2.61, "learning_rate": 1.913040867405518e-05, "loss": 0.0068, "step": 181080 }, { "epoch": 2.61, "learning_rate": 1.913036063431671e-05, "loss": 0.0058, "step": 181090 }, { "epoch": 2.61, "learning_rate": 1.9130312594578238e-05, "loss": 0.0105, "step": 181100 }, { "epoch": 2.61, "learning_rate": 1.9130264554839768e-05, "loss": 0.0078, "step": 181110 }, { "epoch": 2.61, "learning_rate": 1.9130216515101293e-05, "loss": 0.0089, "step": 181120 }, { "epoch": 2.61, "learning_rate": 1.9130168475362823e-05, "loss": 0.0065, "step": 181130 }, { "epoch": 2.61, "learning_rate": 1.9130120435624352e-05, "loss": 0.0066, "step": 181140 }, { "epoch": 2.61, "learning_rate": 1.9130072395885878e-05, "loss": 0.0103, "step": 181150 }, { "epoch": 2.61, "learning_rate": 1.9130024356147407e-05, "loss": 0.007, "step": 181160 }, { "epoch": 2.61, "learning_rate": 1.9129976316408936e-05, "loss": 0.0045, "step": 181170 }, { "epoch": 2.61, "learning_rate": 1.9129928276670466e-05, "loss": 0.0071, "step": 181180 }, { "epoch": 2.61, "learning_rate": 1.912988023693199e-05, "loss": 0.0082, "step": 181190 }, { "epoch": 2.61, "learning_rate": 1.912983219719352e-05, "loss": 0.008, "step": 181200 }, { "epoch": 2.61, "learning_rate": 1.912978415745505e-05, "loss": 0.0127, "step": 181210 }, { "epoch": 2.61, "learning_rate": 1.9129736117716576e-05, "loss": 0.0045, "step": 181220 }, { "epoch": 2.61, "learning_rate": 1.9129688077978105e-05, "loss": 0.0089, "step": 181230 }, { "epoch": 2.61, "learning_rate": 1.9129640038239634e-05, "loss": 0.0059, "step": 181240 }, { "epoch": 2.61, "learning_rate": 1.9129591998501164e-05, "loss": 0.0069, "step": 181250 }, { "epoch": 2.61, "learning_rate": 1.912954395876269e-05, "loss": 0.0065, "step": 181260 }, { "epoch": 2.61, "learning_rate": 1.912949591902422e-05, "loss": 0.0057, "step": 181270 }, { "epoch": 2.61, "learning_rate": 1.9129447879285748e-05, "loss": 0.006, "step": 181280 }, { "epoch": 2.61, "learning_rate": 1.9129399839547277e-05, "loss": 0.0057, "step": 181290 }, { "epoch": 2.61, "learning_rate": 1.9129351799808803e-05, "loss": 0.0072, "step": 181300 }, { "epoch": 2.61, "learning_rate": 1.9129303760070333e-05, "loss": 0.0077, "step": 181310 }, { "epoch": 2.61, "learning_rate": 1.9129255720331862e-05, "loss": 0.0065, "step": 181320 }, { "epoch": 2.61, "learning_rate": 1.9129207680593388e-05, "loss": 0.0049, "step": 181330 }, { "epoch": 2.61, "learning_rate": 1.9129159640854917e-05, "loss": 0.0065, "step": 181340 }, { "epoch": 2.61, "learning_rate": 1.9129111601116446e-05, "loss": 0.0099, "step": 181350 }, { "epoch": 2.61, "learning_rate": 1.9129063561377976e-05, "loss": 0.0077, "step": 181360 }, { "epoch": 2.61, "learning_rate": 1.91290155216395e-05, "loss": 0.0107, "step": 181370 }, { "epoch": 2.61, "learning_rate": 1.912896748190103e-05, "loss": 0.0058, "step": 181380 }, { "epoch": 2.61, "learning_rate": 1.912891944216256e-05, "loss": 0.0069, "step": 181390 }, { "epoch": 2.61, "learning_rate": 1.9128871402424086e-05, "loss": 0.0056, "step": 181400 }, { "epoch": 2.61, "learning_rate": 1.9128823362685615e-05, "loss": 0.0081, "step": 181410 }, { "epoch": 2.61, "learning_rate": 1.9128775322947144e-05, "loss": 0.0058, "step": 181420 }, { "epoch": 2.61, "learning_rate": 1.9128727283208674e-05, "loss": 0.0078, "step": 181430 }, { "epoch": 2.61, "learning_rate": 1.91286792434702e-05, "loss": 0.0071, "step": 181440 }, { "epoch": 2.62, "learning_rate": 1.912863120373173e-05, "loss": 0.0071, "step": 181450 }, { "epoch": 2.62, "learning_rate": 1.9128583163993258e-05, "loss": 0.0081, "step": 181460 }, { "epoch": 2.62, "learning_rate": 1.9128535124254784e-05, "loss": 0.0062, "step": 181470 }, { "epoch": 2.62, "learning_rate": 1.9128487084516313e-05, "loss": 0.008, "step": 181480 }, { "epoch": 2.62, "learning_rate": 1.9128439044777842e-05, "loss": 0.0074, "step": 181490 }, { "epoch": 2.62, "learning_rate": 1.9128391005039372e-05, "loss": 0.0109, "step": 181500 }, { "epoch": 2.62, "learning_rate": 1.9128342965300898e-05, "loss": 0.0077, "step": 181510 }, { "epoch": 2.62, "learning_rate": 1.9128294925562427e-05, "loss": 0.0063, "step": 181520 }, { "epoch": 2.62, "learning_rate": 1.9128246885823956e-05, "loss": 0.0055, "step": 181530 }, { "epoch": 2.62, "learning_rate": 1.9128198846085485e-05, "loss": 0.0069, "step": 181540 }, { "epoch": 2.62, "learning_rate": 1.912815080634701e-05, "loss": 0.0058, "step": 181550 }, { "epoch": 2.62, "learning_rate": 1.912810276660854e-05, "loss": 0.0063, "step": 181560 }, { "epoch": 2.62, "learning_rate": 1.912805472687007e-05, "loss": 0.0066, "step": 181570 }, { "epoch": 2.62, "learning_rate": 1.9128006687131596e-05, "loss": 0.0065, "step": 181580 }, { "epoch": 2.62, "learning_rate": 1.9127958647393125e-05, "loss": 0.0059, "step": 181590 }, { "epoch": 2.62, "learning_rate": 1.9127910607654654e-05, "loss": 0.0082, "step": 181600 }, { "epoch": 2.62, "learning_rate": 1.9127862567916184e-05, "loss": 0.007, "step": 181610 }, { "epoch": 2.62, "learning_rate": 1.912781452817771e-05, "loss": 0.0061, "step": 181620 }, { "epoch": 2.62, "learning_rate": 1.912776648843924e-05, "loss": 0.0073, "step": 181630 }, { "epoch": 2.62, "learning_rate": 1.9127718448700768e-05, "loss": 0.0062, "step": 181640 }, { "epoch": 2.62, "learning_rate": 1.9127670408962294e-05, "loss": 0.007, "step": 181650 }, { "epoch": 2.62, "learning_rate": 1.9127622369223823e-05, "loss": 0.0086, "step": 181660 }, { "epoch": 2.62, "learning_rate": 1.9127574329485352e-05, "loss": 0.0075, "step": 181670 }, { "epoch": 2.62, "learning_rate": 1.912752628974688e-05, "loss": 0.0056, "step": 181680 }, { "epoch": 2.62, "learning_rate": 1.9127478250008408e-05, "loss": 0.0091, "step": 181690 }, { "epoch": 2.62, "learning_rate": 1.9127430210269937e-05, "loss": 0.009, "step": 181700 }, { "epoch": 2.62, "learning_rate": 1.9127382170531466e-05, "loss": 0.0075, "step": 181710 }, { "epoch": 2.62, "learning_rate": 1.9127334130792995e-05, "loss": 0.0066, "step": 181720 }, { "epoch": 2.62, "learning_rate": 1.912728609105452e-05, "loss": 0.0061, "step": 181730 }, { "epoch": 2.62, "learning_rate": 1.912723805131605e-05, "loss": 0.0065, "step": 181740 }, { "epoch": 2.62, "learning_rate": 1.912719001157758e-05, "loss": 0.0061, "step": 181750 }, { "epoch": 2.62, "learning_rate": 1.9127141971839106e-05, "loss": 0.0087, "step": 181760 }, { "epoch": 2.62, "learning_rate": 1.9127093932100635e-05, "loss": 0.0065, "step": 181770 }, { "epoch": 2.62, "learning_rate": 1.9127045892362164e-05, "loss": 0.0081, "step": 181780 }, { "epoch": 2.62, "learning_rate": 1.9126997852623693e-05, "loss": 0.0067, "step": 181790 }, { "epoch": 2.62, "learning_rate": 1.912694981288522e-05, "loss": 0.0062, "step": 181800 }, { "epoch": 2.62, "learning_rate": 1.912690177314675e-05, "loss": 0.0059, "step": 181810 }, { "epoch": 2.62, "learning_rate": 1.9126853733408278e-05, "loss": 0.0064, "step": 181820 }, { "epoch": 2.62, "learning_rate": 1.9126805693669804e-05, "loss": 0.007, "step": 181830 }, { "epoch": 2.62, "learning_rate": 1.9126757653931333e-05, "loss": 0.0068, "step": 181840 }, { "epoch": 2.62, "learning_rate": 1.9126709614192862e-05, "loss": 0.0068, "step": 181850 }, { "epoch": 2.62, "learning_rate": 1.912666157445439e-05, "loss": 0.01, "step": 181860 }, { "epoch": 2.62, "learning_rate": 1.9126613534715917e-05, "loss": 0.0081, "step": 181870 }, { "epoch": 2.62, "learning_rate": 1.9126565494977447e-05, "loss": 0.0078, "step": 181880 }, { "epoch": 2.62, "learning_rate": 1.9126517455238976e-05, "loss": 0.0054, "step": 181890 }, { "epoch": 2.62, "learning_rate": 1.9126469415500505e-05, "loss": 0.0073, "step": 181900 }, { "epoch": 2.62, "learning_rate": 1.912642137576203e-05, "loss": 0.0055, "step": 181910 }, { "epoch": 2.62, "learning_rate": 1.912637333602356e-05, "loss": 0.007, "step": 181920 }, { "epoch": 2.62, "learning_rate": 1.912632529628509e-05, "loss": 0.0087, "step": 181930 }, { "epoch": 2.62, "learning_rate": 1.9126277256546616e-05, "loss": 0.0072, "step": 181940 }, { "epoch": 2.62, "learning_rate": 1.9126229216808145e-05, "loss": 0.0081, "step": 181950 }, { "epoch": 2.62, "learning_rate": 1.9126181177069674e-05, "loss": 0.0051, "step": 181960 }, { "epoch": 2.62, "learning_rate": 1.9126133137331203e-05, "loss": 0.0119, "step": 181970 }, { "epoch": 2.62, "learning_rate": 1.912608509759273e-05, "loss": 0.0077, "step": 181980 }, { "epoch": 2.62, "learning_rate": 1.912603705785426e-05, "loss": 0.0072, "step": 181990 }, { "epoch": 2.62, "learning_rate": 1.9125989018115788e-05, "loss": 0.0066, "step": 182000 }, { "epoch": 2.62, "learning_rate": 1.9125940978377314e-05, "loss": 0.0076, "step": 182010 }, { "epoch": 2.62, "learning_rate": 1.9125892938638843e-05, "loss": 0.0067, "step": 182020 }, { "epoch": 2.62, "learning_rate": 1.9125844898900372e-05, "loss": 0.0089, "step": 182030 }, { "epoch": 2.62, "learning_rate": 1.91257968591619e-05, "loss": 0.0104, "step": 182040 }, { "epoch": 2.62, "learning_rate": 1.9125748819423427e-05, "loss": 0.0078, "step": 182050 }, { "epoch": 2.62, "learning_rate": 1.9125700779684957e-05, "loss": 0.0049, "step": 182060 }, { "epoch": 2.62, "learning_rate": 1.9125652739946486e-05, "loss": 0.0058, "step": 182070 }, { "epoch": 2.62, "learning_rate": 1.9125604700208015e-05, "loss": 0.0093, "step": 182080 }, { "epoch": 2.62, "learning_rate": 1.912555666046954e-05, "loss": 0.0079, "step": 182090 }, { "epoch": 2.62, "learning_rate": 1.912550862073107e-05, "loss": 0.0068, "step": 182100 }, { "epoch": 2.62, "learning_rate": 1.91254605809926e-05, "loss": 0.0084, "step": 182110 }, { "epoch": 2.62, "learning_rate": 1.9125412541254126e-05, "loss": 0.0081, "step": 182120 }, { "epoch": 2.62, "learning_rate": 1.9125364501515655e-05, "loss": 0.0049, "step": 182130 }, { "epoch": 2.62, "learning_rate": 1.9125316461777184e-05, "loss": 0.0103, "step": 182140 }, { "epoch": 2.63, "learning_rate": 1.9125268422038713e-05, "loss": 0.0063, "step": 182150 }, { "epoch": 2.63, "learning_rate": 1.912522038230024e-05, "loss": 0.0082, "step": 182160 }, { "epoch": 2.63, "learning_rate": 1.912517234256177e-05, "loss": 0.0085, "step": 182170 }, { "epoch": 2.63, "learning_rate": 1.9125124302823298e-05, "loss": 0.0111, "step": 182180 }, { "epoch": 2.63, "learning_rate": 1.9125076263084824e-05, "loss": 0.0069, "step": 182190 }, { "epoch": 2.63, "learning_rate": 1.9125028223346353e-05, "loss": 0.0092, "step": 182200 }, { "epoch": 2.63, "learning_rate": 1.9124980183607882e-05, "loss": 0.0074, "step": 182210 }, { "epoch": 2.63, "learning_rate": 1.912493214386941e-05, "loss": 0.0082, "step": 182220 }, { "epoch": 2.63, "learning_rate": 1.9124884104130937e-05, "loss": 0.004, "step": 182230 }, { "epoch": 2.63, "learning_rate": 1.9124836064392467e-05, "loss": 0.0106, "step": 182240 }, { "epoch": 2.63, "learning_rate": 1.9124788024653996e-05, "loss": 0.0092, "step": 182250 }, { "epoch": 2.63, "learning_rate": 1.9124739984915525e-05, "loss": 0.0075, "step": 182260 }, { "epoch": 2.63, "learning_rate": 1.912469194517705e-05, "loss": 0.0117, "step": 182270 }, { "epoch": 2.63, "learning_rate": 1.912464390543858e-05, "loss": 0.0069, "step": 182280 }, { "epoch": 2.63, "learning_rate": 1.912459586570011e-05, "loss": 0.0073, "step": 182290 }, { "epoch": 2.63, "learning_rate": 1.9124547825961635e-05, "loss": 0.0088, "step": 182300 }, { "epoch": 2.63, "learning_rate": 1.9124499786223165e-05, "loss": 0.0075, "step": 182310 }, { "epoch": 2.63, "learning_rate": 1.9124451746484694e-05, "loss": 0.0064, "step": 182320 }, { "epoch": 2.63, "learning_rate": 1.9124403706746223e-05, "loss": 0.0063, "step": 182330 }, { "epoch": 2.63, "learning_rate": 1.912435566700775e-05, "loss": 0.0071, "step": 182340 }, { "epoch": 2.63, "learning_rate": 1.912430762726928e-05, "loss": 0.0052, "step": 182350 }, { "epoch": 2.63, "learning_rate": 1.9124259587530808e-05, "loss": 0.0062, "step": 182360 }, { "epoch": 2.63, "learning_rate": 1.9124211547792334e-05, "loss": 0.0054, "step": 182370 }, { "epoch": 2.63, "learning_rate": 1.9124163508053863e-05, "loss": 0.0069, "step": 182380 }, { "epoch": 2.63, "learning_rate": 1.9124115468315392e-05, "loss": 0.0085, "step": 182390 }, { "epoch": 2.63, "learning_rate": 1.912406742857692e-05, "loss": 0.0073, "step": 182400 }, { "epoch": 2.63, "learning_rate": 1.9124019388838447e-05, "loss": 0.0046, "step": 182410 }, { "epoch": 2.63, "learning_rate": 1.9123971349099976e-05, "loss": 0.0062, "step": 182420 }, { "epoch": 2.63, "learning_rate": 1.9123923309361506e-05, "loss": 0.0053, "step": 182430 }, { "epoch": 2.63, "learning_rate": 1.9123875269623035e-05, "loss": 0.0064, "step": 182440 }, { "epoch": 2.63, "learning_rate": 1.912382722988456e-05, "loss": 0.0058, "step": 182450 }, { "epoch": 2.63, "learning_rate": 1.912377919014609e-05, "loss": 0.0111, "step": 182460 }, { "epoch": 2.63, "learning_rate": 1.912373115040762e-05, "loss": 0.0089, "step": 182470 }, { "epoch": 2.63, "learning_rate": 1.9123683110669145e-05, "loss": 0.007, "step": 182480 }, { "epoch": 2.63, "learning_rate": 1.9123635070930675e-05, "loss": 0.009, "step": 182490 }, { "epoch": 2.63, "learning_rate": 1.9123587031192204e-05, "loss": 0.0057, "step": 182500 }, { "epoch": 2.63, "learning_rate": 1.9123538991453733e-05, "loss": 0.0079, "step": 182510 }, { "epoch": 2.63, "learning_rate": 1.912349095171526e-05, "loss": 0.0084, "step": 182520 }, { "epoch": 2.63, "learning_rate": 1.9123442911976788e-05, "loss": 0.0047, "step": 182530 }, { "epoch": 2.63, "learning_rate": 1.9123394872238318e-05, "loss": 0.008, "step": 182540 }, { "epoch": 2.63, "learning_rate": 1.9123346832499843e-05, "loss": 0.0064, "step": 182550 }, { "epoch": 2.63, "learning_rate": 1.9123298792761373e-05, "loss": 0.0069, "step": 182560 }, { "epoch": 2.63, "learning_rate": 1.9123250753022902e-05, "loss": 0.0082, "step": 182570 }, { "epoch": 2.63, "learning_rate": 1.912320271328443e-05, "loss": 0.0041, "step": 182580 }, { "epoch": 2.63, "learning_rate": 1.9123154673545957e-05, "loss": 0.0084, "step": 182590 }, { "epoch": 2.63, "learning_rate": 1.9123106633807486e-05, "loss": 0.0058, "step": 182600 }, { "epoch": 2.63, "learning_rate": 1.9123058594069016e-05, "loss": 0.009, "step": 182610 }, { "epoch": 2.63, "learning_rate": 1.9123010554330545e-05, "loss": 0.006, "step": 182620 }, { "epoch": 2.63, "learning_rate": 1.912296251459207e-05, "loss": 0.0063, "step": 182630 }, { "epoch": 2.63, "learning_rate": 1.91229144748536e-05, "loss": 0.006, "step": 182640 }, { "epoch": 2.63, "learning_rate": 1.912286643511513e-05, "loss": 0.0036, "step": 182650 }, { "epoch": 2.63, "learning_rate": 1.9122818395376655e-05, "loss": 0.0088, "step": 182660 }, { "epoch": 2.63, "learning_rate": 1.9122770355638185e-05, "loss": 0.0076, "step": 182670 }, { "epoch": 2.63, "learning_rate": 1.9122722315899714e-05, "loss": 0.0074, "step": 182680 }, { "epoch": 2.63, "learning_rate": 1.9122674276161243e-05, "loss": 0.0082, "step": 182690 }, { "epoch": 2.63, "learning_rate": 1.912262623642277e-05, "loss": 0.0074, "step": 182700 }, { "epoch": 2.63, "learning_rate": 1.9122578196684298e-05, "loss": 0.0109, "step": 182710 }, { "epoch": 2.63, "learning_rate": 1.9122530156945827e-05, "loss": 0.0062, "step": 182720 }, { "epoch": 2.63, "learning_rate": 1.9122482117207353e-05, "loss": 0.0059, "step": 182730 }, { "epoch": 2.63, "learning_rate": 1.9122434077468883e-05, "loss": 0.0091, "step": 182740 }, { "epoch": 2.63, "learning_rate": 1.9122386037730412e-05, "loss": 0.009, "step": 182750 }, { "epoch": 2.63, "learning_rate": 1.912233799799194e-05, "loss": 0.009, "step": 182760 }, { "epoch": 2.63, "learning_rate": 1.9122289958253467e-05, "loss": 0.0093, "step": 182770 }, { "epoch": 2.63, "learning_rate": 1.9122241918514996e-05, "loss": 0.0073, "step": 182780 }, { "epoch": 2.63, "learning_rate": 1.9122193878776526e-05, "loss": 0.0065, "step": 182790 }, { "epoch": 2.63, "learning_rate": 1.9122145839038055e-05, "loss": 0.0083, "step": 182800 }, { "epoch": 2.63, "learning_rate": 1.912209779929958e-05, "loss": 0.0074, "step": 182810 }, { "epoch": 2.63, "learning_rate": 1.912204975956111e-05, "loss": 0.0073, "step": 182820 }, { "epoch": 2.63, "learning_rate": 1.912200171982264e-05, "loss": 0.0063, "step": 182830 }, { "epoch": 2.64, "learning_rate": 1.9121953680084165e-05, "loss": 0.0072, "step": 182840 }, { "epoch": 2.64, "learning_rate": 1.9121905640345694e-05, "loss": 0.008, "step": 182850 }, { "epoch": 2.64, "learning_rate": 1.9121857600607224e-05, "loss": 0.0074, "step": 182860 }, { "epoch": 2.64, "learning_rate": 1.9121809560868753e-05, "loss": 0.007, "step": 182870 }, { "epoch": 2.64, "learning_rate": 1.912176152113028e-05, "loss": 0.0096, "step": 182880 }, { "epoch": 2.64, "learning_rate": 1.9121713481391808e-05, "loss": 0.0088, "step": 182890 }, { "epoch": 2.64, "learning_rate": 1.9121665441653337e-05, "loss": 0.0067, "step": 182900 }, { "epoch": 2.64, "learning_rate": 1.9121617401914863e-05, "loss": 0.0106, "step": 182910 }, { "epoch": 2.64, "learning_rate": 1.9121569362176393e-05, "loss": 0.0047, "step": 182920 }, { "epoch": 2.64, "learning_rate": 1.9121521322437922e-05, "loss": 0.009, "step": 182930 }, { "epoch": 2.64, "learning_rate": 1.912147328269945e-05, "loss": 0.0067, "step": 182940 }, { "epoch": 2.64, "learning_rate": 1.9121425242960977e-05, "loss": 0.0097, "step": 182950 }, { "epoch": 2.64, "learning_rate": 1.9121377203222506e-05, "loss": 0.0088, "step": 182960 }, { "epoch": 2.64, "learning_rate": 1.9121329163484036e-05, "loss": 0.0079, "step": 182970 }, { "epoch": 2.64, "learning_rate": 1.9121281123745565e-05, "loss": 0.0064, "step": 182980 }, { "epoch": 2.64, "learning_rate": 1.912123308400709e-05, "loss": 0.0087, "step": 182990 }, { "epoch": 2.64, "learning_rate": 1.912118504426862e-05, "loss": 0.0064, "step": 183000 }, { "epoch": 2.64, "learning_rate": 1.912113700453015e-05, "loss": 0.009, "step": 183010 }, { "epoch": 2.64, "learning_rate": 1.9121088964791675e-05, "loss": 0.0081, "step": 183020 }, { "epoch": 2.64, "learning_rate": 1.9121040925053204e-05, "loss": 0.0077, "step": 183030 }, { "epoch": 2.64, "learning_rate": 1.9120992885314734e-05, "loss": 0.0075, "step": 183040 }, { "epoch": 2.64, "learning_rate": 1.9120944845576263e-05, "loss": 0.0075, "step": 183050 }, { "epoch": 2.64, "learning_rate": 1.912089680583779e-05, "loss": 0.005, "step": 183060 }, { "epoch": 2.64, "learning_rate": 1.9120848766099318e-05, "loss": 0.0075, "step": 183070 }, { "epoch": 2.64, "learning_rate": 1.9120800726360847e-05, "loss": 0.0065, "step": 183080 }, { "epoch": 2.64, "learning_rate": 1.9120752686622373e-05, "loss": 0.0081, "step": 183090 }, { "epoch": 2.64, "learning_rate": 1.9120704646883902e-05, "loss": 0.0073, "step": 183100 }, { "epoch": 2.64, "learning_rate": 1.9120656607145432e-05, "loss": 0.0075, "step": 183110 }, { "epoch": 2.64, "learning_rate": 1.912060856740696e-05, "loss": 0.0073, "step": 183120 }, { "epoch": 2.64, "learning_rate": 1.9120560527668487e-05, "loss": 0.0079, "step": 183130 }, { "epoch": 2.64, "learning_rate": 1.9120512487930016e-05, "loss": 0.0058, "step": 183140 }, { "epoch": 2.64, "learning_rate": 1.9120464448191545e-05, "loss": 0.008, "step": 183150 }, { "epoch": 2.64, "learning_rate": 1.9120416408453075e-05, "loss": 0.0074, "step": 183160 }, { "epoch": 2.64, "learning_rate": 1.91203683687146e-05, "loss": 0.0085, "step": 183170 }, { "epoch": 2.64, "learning_rate": 1.912032032897613e-05, "loss": 0.0091, "step": 183180 }, { "epoch": 2.64, "learning_rate": 1.912027228923766e-05, "loss": 0.0054, "step": 183190 }, { "epoch": 2.64, "learning_rate": 1.9120224249499185e-05, "loss": 0.0069, "step": 183200 }, { "epoch": 2.64, "learning_rate": 1.9120176209760714e-05, "loss": 0.0057, "step": 183210 }, { "epoch": 2.64, "learning_rate": 1.9120128170022244e-05, "loss": 0.0078, "step": 183220 }, { "epoch": 2.64, "learning_rate": 1.9120080130283773e-05, "loss": 0.0076, "step": 183230 }, { "epoch": 2.64, "learning_rate": 1.91200320905453e-05, "loss": 0.0092, "step": 183240 }, { "epoch": 2.64, "learning_rate": 1.9119984050806828e-05, "loss": 0.0075, "step": 183250 }, { "epoch": 2.64, "learning_rate": 1.9119936011068357e-05, "loss": 0.0076, "step": 183260 }, { "epoch": 2.64, "learning_rate": 1.9119887971329883e-05, "loss": 0.0057, "step": 183270 }, { "epoch": 2.64, "learning_rate": 1.9119839931591412e-05, "loss": 0.0089, "step": 183280 }, { "epoch": 2.64, "learning_rate": 1.911979189185294e-05, "loss": 0.0074, "step": 183290 }, { "epoch": 2.64, "learning_rate": 1.911974385211447e-05, "loss": 0.0045, "step": 183300 }, { "epoch": 2.64, "learning_rate": 1.9119695812375997e-05, "loss": 0.0074, "step": 183310 }, { "epoch": 2.64, "learning_rate": 1.9119647772637526e-05, "loss": 0.008, "step": 183320 }, { "epoch": 2.64, "learning_rate": 1.9119599732899055e-05, "loss": 0.0053, "step": 183330 }, { "epoch": 2.64, "learning_rate": 1.911955169316058e-05, "loss": 0.0071, "step": 183340 }, { "epoch": 2.64, "learning_rate": 1.911950365342211e-05, "loss": 0.0083, "step": 183350 }, { "epoch": 2.64, "learning_rate": 1.9119455613683643e-05, "loss": 0.0068, "step": 183360 }, { "epoch": 2.64, "learning_rate": 1.911940757394517e-05, "loss": 0.0067, "step": 183370 }, { "epoch": 2.64, "learning_rate": 1.9119359534206698e-05, "loss": 0.0066, "step": 183380 }, { "epoch": 2.64, "learning_rate": 1.9119311494468228e-05, "loss": 0.0063, "step": 183390 }, { "epoch": 2.64, "learning_rate": 1.9119263454729753e-05, "loss": 0.0058, "step": 183400 }, { "epoch": 2.64, "learning_rate": 1.9119215414991283e-05, "loss": 0.0076, "step": 183410 }, { "epoch": 2.64, "learning_rate": 1.9119167375252812e-05, "loss": 0.0057, "step": 183420 }, { "epoch": 2.64, "learning_rate": 1.911911933551434e-05, "loss": 0.006, "step": 183430 }, { "epoch": 2.64, "learning_rate": 1.9119071295775867e-05, "loss": 0.0061, "step": 183440 }, { "epoch": 2.64, "learning_rate": 1.9119023256037396e-05, "loss": 0.0047, "step": 183450 }, { "epoch": 2.64, "learning_rate": 1.9118975216298926e-05, "loss": 0.0065, "step": 183460 }, { "epoch": 2.64, "learning_rate": 1.9118927176560455e-05, "loss": 0.0085, "step": 183470 }, { "epoch": 2.64, "learning_rate": 1.911887913682198e-05, "loss": 0.0082, "step": 183480 }, { "epoch": 2.64, "learning_rate": 1.911883109708351e-05, "loss": 0.0087, "step": 183490 }, { "epoch": 2.64, "learning_rate": 1.911878305734504e-05, "loss": 0.0067, "step": 183500 }, { "epoch": 2.64, "learning_rate": 1.9118735017606565e-05, "loss": 0.0069, "step": 183510 }, { "epoch": 2.64, "learning_rate": 1.9118686977868095e-05, "loss": 0.0077, "step": 183520 }, { "epoch": 2.65, "learning_rate": 1.9118638938129624e-05, "loss": 0.0075, "step": 183530 }, { "epoch": 2.65, "learning_rate": 1.9118590898391153e-05, "loss": 0.0074, "step": 183540 }, { "epoch": 2.65, "learning_rate": 1.911854285865268e-05, "loss": 0.0081, "step": 183550 }, { "epoch": 2.65, "learning_rate": 1.9118494818914208e-05, "loss": 0.011, "step": 183560 }, { "epoch": 2.65, "learning_rate": 1.9118446779175737e-05, "loss": 0.0076, "step": 183570 }, { "epoch": 2.65, "learning_rate": 1.9118398739437263e-05, "loss": 0.0079, "step": 183580 }, { "epoch": 2.65, "learning_rate": 1.9118350699698793e-05, "loss": 0.0078, "step": 183590 }, { "epoch": 2.65, "learning_rate": 1.9118302659960322e-05, "loss": 0.0062, "step": 183600 }, { "epoch": 2.65, "learning_rate": 1.911825462022185e-05, "loss": 0.0074, "step": 183610 }, { "epoch": 2.65, "learning_rate": 1.9118206580483377e-05, "loss": 0.0078, "step": 183620 }, { "epoch": 2.65, "learning_rate": 1.9118158540744906e-05, "loss": 0.0061, "step": 183630 }, { "epoch": 2.65, "learning_rate": 1.9118110501006436e-05, "loss": 0.0079, "step": 183640 }, { "epoch": 2.65, "learning_rate": 1.9118062461267965e-05, "loss": 0.0074, "step": 183650 }, { "epoch": 2.65, "learning_rate": 1.911801442152949e-05, "loss": 0.0073, "step": 183660 }, { "epoch": 2.65, "learning_rate": 1.911796638179102e-05, "loss": 0.0075, "step": 183670 }, { "epoch": 2.65, "learning_rate": 1.911791834205255e-05, "loss": 0.0059, "step": 183680 }, { "epoch": 2.65, "learning_rate": 1.9117870302314075e-05, "loss": 0.007, "step": 183690 }, { "epoch": 2.65, "learning_rate": 1.9117822262575604e-05, "loss": 0.0092, "step": 183700 }, { "epoch": 2.65, "learning_rate": 1.9117774222837134e-05, "loss": 0.0079, "step": 183710 }, { "epoch": 2.65, "learning_rate": 1.9117726183098663e-05, "loss": 0.0059, "step": 183720 }, { "epoch": 2.65, "learning_rate": 1.911767814336019e-05, "loss": 0.0076, "step": 183730 }, { "epoch": 2.65, "learning_rate": 1.9117630103621718e-05, "loss": 0.0036, "step": 183740 }, { "epoch": 2.65, "learning_rate": 1.9117582063883247e-05, "loss": 0.0084, "step": 183750 }, { "epoch": 2.65, "learning_rate": 1.9117534024144773e-05, "loss": 0.0071, "step": 183760 }, { "epoch": 2.65, "learning_rate": 1.9117485984406303e-05, "loss": 0.0069, "step": 183770 }, { "epoch": 2.65, "learning_rate": 1.9117437944667832e-05, "loss": 0.0043, "step": 183780 }, { "epoch": 2.65, "learning_rate": 1.911738990492936e-05, "loss": 0.0057, "step": 183790 }, { "epoch": 2.65, "learning_rate": 1.9117341865190887e-05, "loss": 0.0112, "step": 183800 }, { "epoch": 2.65, "learning_rate": 1.9117293825452416e-05, "loss": 0.0066, "step": 183810 }, { "epoch": 2.65, "learning_rate": 1.9117245785713946e-05, "loss": 0.0067, "step": 183820 }, { "epoch": 2.65, "learning_rate": 1.9117197745975475e-05, "loss": 0.0098, "step": 183830 }, { "epoch": 2.65, "learning_rate": 1.9117149706237e-05, "loss": 0.0073, "step": 183840 }, { "epoch": 2.65, "learning_rate": 1.911710166649853e-05, "loss": 0.008, "step": 183850 }, { "epoch": 2.65, "learning_rate": 1.911705362676006e-05, "loss": 0.0055, "step": 183860 }, { "epoch": 2.65, "learning_rate": 1.9117005587021585e-05, "loss": 0.0059, "step": 183870 }, { "epoch": 2.65, "learning_rate": 1.9116957547283114e-05, "loss": 0.0075, "step": 183880 }, { "epoch": 2.65, "learning_rate": 1.9116909507544644e-05, "loss": 0.0076, "step": 183890 }, { "epoch": 2.65, "learning_rate": 1.9116861467806173e-05, "loss": 0.0057, "step": 183900 }, { "epoch": 2.65, "learning_rate": 1.91168134280677e-05, "loss": 0.0069, "step": 183910 }, { "epoch": 2.65, "learning_rate": 1.9116765388329228e-05, "loss": 0.0068, "step": 183920 }, { "epoch": 2.65, "learning_rate": 1.9116717348590757e-05, "loss": 0.0079, "step": 183930 }, { "epoch": 2.65, "learning_rate": 1.9116669308852283e-05, "loss": 0.0045, "step": 183940 }, { "epoch": 2.65, "learning_rate": 1.9116621269113812e-05, "loss": 0.0052, "step": 183950 }, { "epoch": 2.65, "learning_rate": 1.9116573229375342e-05, "loss": 0.0091, "step": 183960 }, { "epoch": 2.65, "learning_rate": 1.911652518963687e-05, "loss": 0.0081, "step": 183970 }, { "epoch": 2.65, "learning_rate": 1.9116477149898397e-05, "loss": 0.0052, "step": 183980 }, { "epoch": 2.65, "learning_rate": 1.9116429110159926e-05, "loss": 0.0077, "step": 183990 }, { "epoch": 2.65, "learning_rate": 1.9116381070421455e-05, "loss": 0.0089, "step": 184000 }, { "epoch": 2.65, "learning_rate": 1.9116333030682985e-05, "loss": 0.0077, "step": 184010 }, { "epoch": 2.65, "learning_rate": 1.911628499094451e-05, "loss": 0.0051, "step": 184020 }, { "epoch": 2.65, "learning_rate": 1.911623695120604e-05, "loss": 0.011, "step": 184030 }, { "epoch": 2.65, "learning_rate": 1.911618891146757e-05, "loss": 0.0111, "step": 184040 }, { "epoch": 2.65, "learning_rate": 1.9116140871729095e-05, "loss": 0.0074, "step": 184050 }, { "epoch": 2.65, "learning_rate": 1.9116092831990624e-05, "loss": 0.0087, "step": 184060 }, { "epoch": 2.65, "learning_rate": 1.9116044792252154e-05, "loss": 0.0043, "step": 184070 }, { "epoch": 2.65, "learning_rate": 1.9115996752513683e-05, "loss": 0.0152, "step": 184080 }, { "epoch": 2.65, "learning_rate": 1.911594871277521e-05, "loss": 0.0096, "step": 184090 }, { "epoch": 2.65, "learning_rate": 1.9115900673036738e-05, "loss": 0.0052, "step": 184100 }, { "epoch": 2.65, "learning_rate": 1.9115852633298267e-05, "loss": 0.0066, "step": 184110 }, { "epoch": 2.65, "learning_rate": 1.9115804593559793e-05, "loss": 0.0073, "step": 184120 }, { "epoch": 2.65, "learning_rate": 1.9115756553821322e-05, "loss": 0.0059, "step": 184130 }, { "epoch": 2.65, "learning_rate": 1.911570851408285e-05, "loss": 0.0057, "step": 184140 }, { "epoch": 2.65, "learning_rate": 1.911566047434438e-05, "loss": 0.0063, "step": 184150 }, { "epoch": 2.65, "learning_rate": 1.9115612434605907e-05, "loss": 0.0044, "step": 184160 }, { "epoch": 2.65, "learning_rate": 1.9115564394867436e-05, "loss": 0.0095, "step": 184170 }, { "epoch": 2.65, "learning_rate": 1.9115516355128965e-05, "loss": 0.0074, "step": 184180 }, { "epoch": 2.65, "learning_rate": 1.9115468315390495e-05, "loss": 0.0069, "step": 184190 }, { "epoch": 2.65, "learning_rate": 1.911542027565202e-05, "loss": 0.0068, "step": 184200 }, { "epoch": 2.65, "learning_rate": 1.911537223591355e-05, "loss": 0.0037, "step": 184210 }, { "epoch": 2.65, "learning_rate": 1.911532419617508e-05, "loss": 0.0045, "step": 184220 }, { "epoch": 2.66, "learning_rate": 1.9115276156436605e-05, "loss": 0.0054, "step": 184230 }, { "epoch": 2.66, "learning_rate": 1.9115228116698134e-05, "loss": 0.0058, "step": 184240 }, { "epoch": 2.66, "learning_rate": 1.9115180076959663e-05, "loss": 0.0084, "step": 184250 }, { "epoch": 2.66, "learning_rate": 1.9115132037221193e-05, "loss": 0.0074, "step": 184260 }, { "epoch": 2.66, "learning_rate": 1.911508399748272e-05, "loss": 0.004, "step": 184270 }, { "epoch": 2.66, "learning_rate": 1.9115035957744248e-05, "loss": 0.0066, "step": 184280 }, { "epoch": 2.66, "learning_rate": 1.9114987918005777e-05, "loss": 0.006, "step": 184290 }, { "epoch": 2.66, "learning_rate": 1.9114939878267303e-05, "loss": 0.0072, "step": 184300 }, { "epoch": 2.66, "learning_rate": 1.9114891838528832e-05, "loss": 0.0069, "step": 184310 }, { "epoch": 2.66, "learning_rate": 1.911484379879036e-05, "loss": 0.0093, "step": 184320 }, { "epoch": 2.66, "learning_rate": 1.911479575905189e-05, "loss": 0.0065, "step": 184330 }, { "epoch": 2.66, "learning_rate": 1.9114747719313417e-05, "loss": 0.0075, "step": 184340 }, { "epoch": 2.66, "learning_rate": 1.9114699679574946e-05, "loss": 0.0076, "step": 184350 }, { "epoch": 2.66, "learning_rate": 1.9114651639836475e-05, "loss": 0.0053, "step": 184360 }, { "epoch": 2.66, "learning_rate": 1.9114603600098005e-05, "loss": 0.0081, "step": 184370 }, { "epoch": 2.66, "learning_rate": 1.911455556035953e-05, "loss": 0.0057, "step": 184380 }, { "epoch": 2.66, "learning_rate": 1.911450752062106e-05, "loss": 0.0086, "step": 184390 }, { "epoch": 2.66, "learning_rate": 1.911445948088259e-05, "loss": 0.0095, "step": 184400 }, { "epoch": 2.66, "learning_rate": 1.9114411441144115e-05, "loss": 0.006, "step": 184410 }, { "epoch": 2.66, "learning_rate": 1.9114363401405644e-05, "loss": 0.0089, "step": 184420 }, { "epoch": 2.66, "learning_rate": 1.9114315361667173e-05, "loss": 0.0043, "step": 184430 }, { "epoch": 2.66, "learning_rate": 1.9114267321928703e-05, "loss": 0.0055, "step": 184440 }, { "epoch": 2.66, "learning_rate": 1.911421928219023e-05, "loss": 0.0079, "step": 184450 }, { "epoch": 2.66, "learning_rate": 1.9114171242451758e-05, "loss": 0.0053, "step": 184460 }, { "epoch": 2.66, "learning_rate": 1.9114123202713287e-05, "loss": 0.0066, "step": 184470 }, { "epoch": 2.66, "learning_rate": 1.9114075162974813e-05, "loss": 0.0067, "step": 184480 }, { "epoch": 2.66, "learning_rate": 1.9114027123236342e-05, "loss": 0.0075, "step": 184490 }, { "epoch": 2.66, "learning_rate": 1.911397908349787e-05, "loss": 0.0065, "step": 184500 }, { "epoch": 2.66, "learning_rate": 1.91139310437594e-05, "loss": 0.0089, "step": 184510 }, { "epoch": 2.66, "learning_rate": 1.9113883004020927e-05, "loss": 0.0057, "step": 184520 }, { "epoch": 2.66, "learning_rate": 1.9113834964282456e-05, "loss": 0.007, "step": 184530 }, { "epoch": 2.66, "learning_rate": 1.9113786924543985e-05, "loss": 0.0056, "step": 184540 }, { "epoch": 2.66, "learning_rate": 1.9113738884805514e-05, "loss": 0.0096, "step": 184550 }, { "epoch": 2.66, "learning_rate": 1.911369084506704e-05, "loss": 0.0065, "step": 184560 }, { "epoch": 2.66, "learning_rate": 1.911364280532857e-05, "loss": 0.0065, "step": 184570 }, { "epoch": 2.66, "learning_rate": 1.91135947655901e-05, "loss": 0.0069, "step": 184580 }, { "epoch": 2.66, "learning_rate": 1.9113546725851625e-05, "loss": 0.0041, "step": 184590 }, { "epoch": 2.66, "learning_rate": 1.9113498686113154e-05, "loss": 0.0084, "step": 184600 }, { "epoch": 2.66, "learning_rate": 1.9113450646374683e-05, "loss": 0.0074, "step": 184610 }, { "epoch": 2.66, "learning_rate": 1.9113402606636213e-05, "loss": 0.0043, "step": 184620 }, { "epoch": 2.66, "learning_rate": 1.911335456689774e-05, "loss": 0.0061, "step": 184630 }, { "epoch": 2.66, "learning_rate": 1.9113306527159268e-05, "loss": 0.0075, "step": 184640 }, { "epoch": 2.66, "learning_rate": 1.9113258487420797e-05, "loss": 0.0088, "step": 184650 }, { "epoch": 2.66, "learning_rate": 1.9113210447682323e-05, "loss": 0.0057, "step": 184660 }, { "epoch": 2.66, "learning_rate": 1.9113162407943852e-05, "loss": 0.0091, "step": 184670 }, { "epoch": 2.66, "learning_rate": 1.911311436820538e-05, "loss": 0.006, "step": 184680 }, { "epoch": 2.66, "learning_rate": 1.911306632846691e-05, "loss": 0.0062, "step": 184690 }, { "epoch": 2.66, "learning_rate": 1.9113018288728437e-05, "loss": 0.0069, "step": 184700 }, { "epoch": 2.66, "learning_rate": 1.9112970248989966e-05, "loss": 0.0079, "step": 184710 }, { "epoch": 2.66, "learning_rate": 1.9112922209251495e-05, "loss": 0.0068, "step": 184720 }, { "epoch": 2.66, "learning_rate": 1.9112874169513024e-05, "loss": 0.0073, "step": 184730 }, { "epoch": 2.66, "learning_rate": 1.911282612977455e-05, "loss": 0.0072, "step": 184740 }, { "epoch": 2.66, "learning_rate": 1.911277809003608e-05, "loss": 0.0092, "step": 184750 }, { "epoch": 2.66, "learning_rate": 1.911273005029761e-05, "loss": 0.0068, "step": 184760 }, { "epoch": 2.66, "learning_rate": 1.9112682010559135e-05, "loss": 0.0065, "step": 184770 }, { "epoch": 2.66, "learning_rate": 1.9112633970820664e-05, "loss": 0.0053, "step": 184780 }, { "epoch": 2.66, "learning_rate": 1.9112585931082193e-05, "loss": 0.0104, "step": 184790 }, { "epoch": 2.66, "learning_rate": 1.9112537891343722e-05, "loss": 0.0071, "step": 184800 }, { "epoch": 2.66, "learning_rate": 1.911248985160525e-05, "loss": 0.0095, "step": 184810 }, { "epoch": 2.66, "learning_rate": 1.9112441811866778e-05, "loss": 0.0075, "step": 184820 }, { "epoch": 2.66, "learning_rate": 1.9112393772128307e-05, "loss": 0.0073, "step": 184830 }, { "epoch": 2.66, "learning_rate": 1.9112345732389833e-05, "loss": 0.008, "step": 184840 }, { "epoch": 2.66, "learning_rate": 1.9112297692651362e-05, "loss": 0.007, "step": 184850 }, { "epoch": 2.66, "learning_rate": 1.911224965291289e-05, "loss": 0.0045, "step": 184860 }, { "epoch": 2.66, "learning_rate": 1.911220161317442e-05, "loss": 0.0091, "step": 184870 }, { "epoch": 2.66, "learning_rate": 1.9112153573435946e-05, "loss": 0.0087, "step": 184880 }, { "epoch": 2.66, "learning_rate": 1.9112105533697476e-05, "loss": 0.0067, "step": 184890 }, { "epoch": 2.66, "learning_rate": 1.9112057493959005e-05, "loss": 0.0059, "step": 184900 }, { "epoch": 2.66, "learning_rate": 1.911200945422053e-05, "loss": 0.0081, "step": 184910 }, { "epoch": 2.67, "learning_rate": 1.911196141448206e-05, "loss": 0.0081, "step": 184920 }, { "epoch": 2.67, "learning_rate": 1.911191337474359e-05, "loss": 0.0066, "step": 184930 }, { "epoch": 2.67, "learning_rate": 1.911186533500512e-05, "loss": 0.0066, "step": 184940 }, { "epoch": 2.67, "learning_rate": 1.9111817295266645e-05, "loss": 0.0141, "step": 184950 }, { "epoch": 2.67, "learning_rate": 1.9111769255528174e-05, "loss": 0.0072, "step": 184960 }, { "epoch": 2.67, "learning_rate": 1.9111721215789703e-05, "loss": 0.006, "step": 184970 }, { "epoch": 2.67, "learning_rate": 1.9111673176051232e-05, "loss": 0.0062, "step": 184980 }, { "epoch": 2.67, "learning_rate": 1.9111625136312758e-05, "loss": 0.0071, "step": 184990 }, { "epoch": 2.67, "learning_rate": 1.9111577096574288e-05, "loss": 0.0089, "step": 185000 }, { "epoch": 2.67, "learning_rate": 1.9111529056835817e-05, "loss": 0.0055, "step": 185010 }, { "epoch": 2.67, "learning_rate": 1.9111481017097343e-05, "loss": 0.0071, "step": 185020 }, { "epoch": 2.67, "learning_rate": 1.9111432977358872e-05, "loss": 0.0076, "step": 185030 }, { "epoch": 2.67, "learning_rate": 1.91113849376204e-05, "loss": 0.0054, "step": 185040 }, { "epoch": 2.67, "learning_rate": 1.911133689788193e-05, "loss": 0.0059, "step": 185050 }, { "epoch": 2.67, "learning_rate": 1.9111288858143456e-05, "loss": 0.0066, "step": 185060 }, { "epoch": 2.67, "learning_rate": 1.9111240818404986e-05, "loss": 0.0091, "step": 185070 }, { "epoch": 2.67, "learning_rate": 1.9111192778666515e-05, "loss": 0.0059, "step": 185080 }, { "epoch": 2.67, "learning_rate": 1.911114473892804e-05, "loss": 0.0085, "step": 185090 }, { "epoch": 2.67, "learning_rate": 1.911109669918957e-05, "loss": 0.009, "step": 185100 }, { "epoch": 2.67, "learning_rate": 1.91110486594511e-05, "loss": 0.0079, "step": 185110 }, { "epoch": 2.67, "learning_rate": 1.911100061971263e-05, "loss": 0.0055, "step": 185120 }, { "epoch": 2.67, "learning_rate": 1.9110952579974154e-05, "loss": 0.006, "step": 185130 }, { "epoch": 2.67, "learning_rate": 1.9110904540235684e-05, "loss": 0.006, "step": 185140 }, { "epoch": 2.67, "learning_rate": 1.9110856500497213e-05, "loss": 0.0054, "step": 185150 }, { "epoch": 2.67, "learning_rate": 1.9110808460758742e-05, "loss": 0.0071, "step": 185160 }, { "epoch": 2.67, "learning_rate": 1.9110760421020268e-05, "loss": 0.0061, "step": 185170 }, { "epoch": 2.67, "learning_rate": 1.9110712381281797e-05, "loss": 0.0057, "step": 185180 }, { "epoch": 2.67, "learning_rate": 1.9110664341543327e-05, "loss": 0.0052, "step": 185190 }, { "epoch": 2.67, "learning_rate": 1.9110616301804853e-05, "loss": 0.0053, "step": 185200 }, { "epoch": 2.67, "learning_rate": 1.9110568262066382e-05, "loss": 0.0076, "step": 185210 }, { "epoch": 2.67, "learning_rate": 1.911052022232791e-05, "loss": 0.0054, "step": 185220 }, { "epoch": 2.67, "learning_rate": 1.911047218258944e-05, "loss": 0.0063, "step": 185230 }, { "epoch": 2.67, "learning_rate": 1.9110424142850966e-05, "loss": 0.0101, "step": 185240 }, { "epoch": 2.67, "learning_rate": 1.9110376103112496e-05, "loss": 0.0065, "step": 185250 }, { "epoch": 2.67, "learning_rate": 1.9110328063374025e-05, "loss": 0.0079, "step": 185260 }, { "epoch": 2.67, "learning_rate": 1.911028002363555e-05, "loss": 0.0056, "step": 185270 }, { "epoch": 2.67, "learning_rate": 1.911023198389708e-05, "loss": 0.0077, "step": 185280 }, { "epoch": 2.67, "learning_rate": 1.911018394415861e-05, "loss": 0.0075, "step": 185290 }, { "epoch": 2.67, "learning_rate": 1.9110140708393984e-05, "loss": 0.005, "step": 185300 }, { "epoch": 2.67, "learning_rate": 1.9110092668655513e-05, "loss": 0.0047, "step": 185310 }, { "epoch": 2.67, "learning_rate": 1.9110044628917042e-05, "loss": 0.0081, "step": 185320 }, { "epoch": 2.67, "learning_rate": 1.910999658917857e-05, "loss": 0.0115, "step": 185330 }, { "epoch": 2.67, "learning_rate": 1.9109948549440098e-05, "loss": 0.0067, "step": 185340 }, { "epoch": 2.67, "learning_rate": 1.9109900509701627e-05, "loss": 0.0111, "step": 185350 }, { "epoch": 2.67, "learning_rate": 1.9109852469963156e-05, "loss": 0.006, "step": 185360 }, { "epoch": 2.67, "learning_rate": 1.9109804430224682e-05, "loss": 0.0049, "step": 185370 }, { "epoch": 2.67, "learning_rate": 1.910975639048621e-05, "loss": 0.0052, "step": 185380 }, { "epoch": 2.67, "learning_rate": 1.910970835074774e-05, "loss": 0.0065, "step": 185390 }, { "epoch": 2.67, "learning_rate": 1.910966031100927e-05, "loss": 0.0073, "step": 185400 }, { "epoch": 2.67, "learning_rate": 1.9109612271270796e-05, "loss": 0.0052, "step": 185410 }, { "epoch": 2.67, "learning_rate": 1.9109564231532325e-05, "loss": 0.0052, "step": 185420 }, { "epoch": 2.67, "learning_rate": 1.9109516191793854e-05, "loss": 0.0071, "step": 185430 }, { "epoch": 2.67, "learning_rate": 1.910946815205538e-05, "loss": 0.0062, "step": 185440 }, { "epoch": 2.67, "learning_rate": 1.910942011231691e-05, "loss": 0.0062, "step": 185450 }, { "epoch": 2.67, "learning_rate": 1.910937207257844e-05, "loss": 0.0084, "step": 185460 }, { "epoch": 2.67, "learning_rate": 1.9109324032839968e-05, "loss": 0.0074, "step": 185470 }, { "epoch": 2.67, "learning_rate": 1.9109275993101494e-05, "loss": 0.0063, "step": 185480 }, { "epoch": 2.67, "learning_rate": 1.9109227953363023e-05, "loss": 0.0047, "step": 185490 }, { "epoch": 2.67, "learning_rate": 1.9109179913624552e-05, "loss": 0.0081, "step": 185500 }, { "epoch": 2.67, "learning_rate": 1.9109131873886078e-05, "loss": 0.0106, "step": 185510 }, { "epoch": 2.67, "learning_rate": 1.9109083834147608e-05, "loss": 0.0102, "step": 185520 }, { "epoch": 2.67, "learning_rate": 1.9109035794409137e-05, "loss": 0.0071, "step": 185530 }, { "epoch": 2.67, "learning_rate": 1.9108987754670666e-05, "loss": 0.0075, "step": 185540 }, { "epoch": 2.67, "learning_rate": 1.9108939714932192e-05, "loss": 0.0065, "step": 185550 }, { "epoch": 2.67, "learning_rate": 1.910889167519372e-05, "loss": 0.0097, "step": 185560 }, { "epoch": 2.67, "learning_rate": 1.910884363545525e-05, "loss": 0.0074, "step": 185570 }, { "epoch": 2.67, "learning_rate": 1.910879559571678e-05, "loss": 0.0082, "step": 185580 }, { "epoch": 2.67, "learning_rate": 1.9108747555978306e-05, "loss": 0.0062, "step": 185590 }, { "epoch": 2.67, "learning_rate": 1.9108699516239835e-05, "loss": 0.0052, "step": 185600 }, { "epoch": 2.67, "learning_rate": 1.9108651476501364e-05, "loss": 0.0057, "step": 185610 }, { "epoch": 2.68, "learning_rate": 1.910860343676289e-05, "loss": 0.0049, "step": 185620 }, { "epoch": 2.68, "learning_rate": 1.910855539702442e-05, "loss": 0.0049, "step": 185630 }, { "epoch": 2.68, "learning_rate": 1.910850735728595e-05, "loss": 0.0062, "step": 185640 }, { "epoch": 2.68, "learning_rate": 1.9108459317547478e-05, "loss": 0.0061, "step": 185650 }, { "epoch": 2.68, "learning_rate": 1.9108411277809004e-05, "loss": 0.0086, "step": 185660 }, { "epoch": 2.68, "learning_rate": 1.9108363238070533e-05, "loss": 0.0082, "step": 185670 }, { "epoch": 2.68, "learning_rate": 1.9108315198332062e-05, "loss": 0.0096, "step": 185680 }, { "epoch": 2.68, "learning_rate": 1.9108267158593588e-05, "loss": 0.0068, "step": 185690 }, { "epoch": 2.68, "learning_rate": 1.9108219118855117e-05, "loss": 0.0048, "step": 185700 }, { "epoch": 2.68, "learning_rate": 1.9108171079116647e-05, "loss": 0.0082, "step": 185710 }, { "epoch": 2.68, "learning_rate": 1.9108123039378176e-05, "loss": 0.0036, "step": 185720 }, { "epoch": 2.68, "learning_rate": 1.9108074999639702e-05, "loss": 0.0068, "step": 185730 }, { "epoch": 2.68, "learning_rate": 1.910802695990123e-05, "loss": 0.0039, "step": 185740 }, { "epoch": 2.68, "learning_rate": 1.910797892016276e-05, "loss": 0.0064, "step": 185750 }, { "epoch": 2.68, "learning_rate": 1.910793088042429e-05, "loss": 0.0063, "step": 185760 }, { "epoch": 2.68, "learning_rate": 1.9107882840685816e-05, "loss": 0.0073, "step": 185770 }, { "epoch": 2.68, "learning_rate": 1.9107834800947345e-05, "loss": 0.0059, "step": 185780 }, { "epoch": 2.68, "learning_rate": 1.9107786761208874e-05, "loss": 0.0066, "step": 185790 }, { "epoch": 2.68, "learning_rate": 1.91077387214704e-05, "loss": 0.0079, "step": 185800 }, { "epoch": 2.68, "learning_rate": 1.910769068173193e-05, "loss": 0.0075, "step": 185810 }, { "epoch": 2.68, "learning_rate": 1.910764264199346e-05, "loss": 0.0048, "step": 185820 }, { "epoch": 2.68, "learning_rate": 1.9107594602254988e-05, "loss": 0.0074, "step": 185830 }, { "epoch": 2.68, "learning_rate": 1.9107546562516514e-05, "loss": 0.0078, "step": 185840 }, { "epoch": 2.68, "learning_rate": 1.9107498522778043e-05, "loss": 0.008, "step": 185850 }, { "epoch": 2.68, "learning_rate": 1.9107450483039572e-05, "loss": 0.0059, "step": 185860 }, { "epoch": 2.68, "learning_rate": 1.9107402443301098e-05, "loss": 0.0055, "step": 185870 }, { "epoch": 2.68, "learning_rate": 1.9107354403562627e-05, "loss": 0.0074, "step": 185880 }, { "epoch": 2.68, "learning_rate": 1.9107306363824157e-05, "loss": 0.0063, "step": 185890 }, { "epoch": 2.68, "learning_rate": 1.9107258324085686e-05, "loss": 0.0091, "step": 185900 }, { "epoch": 2.68, "learning_rate": 1.9107210284347212e-05, "loss": 0.0084, "step": 185910 }, { "epoch": 2.68, "learning_rate": 1.910716224460874e-05, "loss": 0.0047, "step": 185920 }, { "epoch": 2.68, "learning_rate": 1.910711420487027e-05, "loss": 0.0081, "step": 185930 }, { "epoch": 2.68, "learning_rate": 1.91070661651318e-05, "loss": 0.0052, "step": 185940 }, { "epoch": 2.68, "learning_rate": 1.9107018125393325e-05, "loss": 0.0084, "step": 185950 }, { "epoch": 2.68, "learning_rate": 1.9106970085654855e-05, "loss": 0.0056, "step": 185960 }, { "epoch": 2.68, "learning_rate": 1.9106922045916384e-05, "loss": 0.0052, "step": 185970 }, { "epoch": 2.68, "learning_rate": 1.910687400617791e-05, "loss": 0.0036, "step": 185980 }, { "epoch": 2.68, "learning_rate": 1.910682596643944e-05, "loss": 0.0075, "step": 185990 }, { "epoch": 2.68, "learning_rate": 1.910677792670097e-05, "loss": 0.0051, "step": 186000 }, { "epoch": 2.68, "learning_rate": 1.9106729886962498e-05, "loss": 0.0065, "step": 186010 }, { "epoch": 2.68, "learning_rate": 1.9106681847224024e-05, "loss": 0.0037, "step": 186020 }, { "epoch": 2.68, "learning_rate": 1.9106633807485553e-05, "loss": 0.0077, "step": 186030 }, { "epoch": 2.68, "learning_rate": 1.9106585767747082e-05, "loss": 0.0098, "step": 186040 }, { "epoch": 2.68, "learning_rate": 1.9106537728008608e-05, "loss": 0.0085, "step": 186050 }, { "epoch": 2.68, "learning_rate": 1.9106489688270137e-05, "loss": 0.0072, "step": 186060 }, { "epoch": 2.68, "learning_rate": 1.9106441648531667e-05, "loss": 0.0059, "step": 186070 }, { "epoch": 2.68, "learning_rate": 1.9106393608793196e-05, "loss": 0.0078, "step": 186080 }, { "epoch": 2.68, "learning_rate": 1.910634556905472e-05, "loss": 0.0058, "step": 186090 }, { "epoch": 2.68, "learning_rate": 1.910629752931625e-05, "loss": 0.0072, "step": 186100 }, { "epoch": 2.68, "learning_rate": 1.910624948957778e-05, "loss": 0.0067, "step": 186110 }, { "epoch": 2.68, "learning_rate": 1.910620144983931e-05, "loss": 0.006, "step": 186120 }, { "epoch": 2.68, "learning_rate": 1.9106153410100835e-05, "loss": 0.0105, "step": 186130 }, { "epoch": 2.68, "learning_rate": 1.9106105370362365e-05, "loss": 0.0048, "step": 186140 }, { "epoch": 2.68, "learning_rate": 1.9106057330623894e-05, "loss": 0.0085, "step": 186150 }, { "epoch": 2.68, "learning_rate": 1.910600929088542e-05, "loss": 0.0075, "step": 186160 }, { "epoch": 2.68, "learning_rate": 1.910596125114695e-05, "loss": 0.0069, "step": 186170 }, { "epoch": 2.68, "learning_rate": 1.910591321140848e-05, "loss": 0.0071, "step": 186180 }, { "epoch": 2.68, "learning_rate": 1.9105865171670008e-05, "loss": 0.0069, "step": 186190 }, { "epoch": 2.68, "learning_rate": 1.9105817131931533e-05, "loss": 0.0091, "step": 186200 }, { "epoch": 2.68, "learning_rate": 1.9105769092193063e-05, "loss": 0.0056, "step": 186210 }, { "epoch": 2.68, "learning_rate": 1.9105721052454592e-05, "loss": 0.0085, "step": 186220 }, { "epoch": 2.68, "learning_rate": 1.9105673012716118e-05, "loss": 0.0059, "step": 186230 }, { "epoch": 2.68, "learning_rate": 1.9105624972977647e-05, "loss": 0.0054, "step": 186240 }, { "epoch": 2.68, "learning_rate": 1.9105576933239176e-05, "loss": 0.0063, "step": 186250 }, { "epoch": 2.68, "learning_rate": 1.9105528893500706e-05, "loss": 0.0038, "step": 186260 }, { "epoch": 2.68, "learning_rate": 1.910548085376223e-05, "loss": 0.006, "step": 186270 }, { "epoch": 2.68, "learning_rate": 1.910543281402376e-05, "loss": 0.0099, "step": 186280 }, { "epoch": 2.68, "learning_rate": 1.910538477428529e-05, "loss": 0.0054, "step": 186290 }, { "epoch": 2.68, "learning_rate": 1.910533673454682e-05, "loss": 0.0091, "step": 186300 }, { "epoch": 2.69, "learning_rate": 1.9105288694808345e-05, "loss": 0.0071, "step": 186310 }, { "epoch": 2.69, "learning_rate": 1.9105240655069875e-05, "loss": 0.0083, "step": 186320 }, { "epoch": 2.69, "learning_rate": 1.9105192615331404e-05, "loss": 0.0047, "step": 186330 }, { "epoch": 2.69, "learning_rate": 1.910514457559293e-05, "loss": 0.006, "step": 186340 }, { "epoch": 2.69, "learning_rate": 1.910509653585446e-05, "loss": 0.0054, "step": 186350 }, { "epoch": 2.69, "learning_rate": 1.9105048496115988e-05, "loss": 0.0064, "step": 186360 }, { "epoch": 2.69, "learning_rate": 1.9105000456377518e-05, "loss": 0.0061, "step": 186370 }, { "epoch": 2.69, "learning_rate": 1.9104952416639043e-05, "loss": 0.0075, "step": 186380 }, { "epoch": 2.69, "learning_rate": 1.9104904376900573e-05, "loss": 0.0062, "step": 186390 }, { "epoch": 2.69, "learning_rate": 1.9104856337162102e-05, "loss": 0.004, "step": 186400 }, { "epoch": 2.69, "learning_rate": 1.9104808297423628e-05, "loss": 0.0052, "step": 186410 }, { "epoch": 2.69, "learning_rate": 1.9104760257685157e-05, "loss": 0.0064, "step": 186420 }, { "epoch": 2.69, "learning_rate": 1.9104712217946686e-05, "loss": 0.008, "step": 186430 }, { "epoch": 2.69, "learning_rate": 1.9104664178208216e-05, "loss": 0.0065, "step": 186440 }, { "epoch": 2.69, "learning_rate": 1.9104616138469745e-05, "loss": 0.0072, "step": 186450 }, { "epoch": 2.69, "learning_rate": 1.9104568098731274e-05, "loss": 0.0085, "step": 186460 }, { "epoch": 2.69, "learning_rate": 1.91045200589928e-05, "loss": 0.0058, "step": 186470 }, { "epoch": 2.69, "learning_rate": 1.910447201925433e-05, "loss": 0.0071, "step": 186480 }, { "epoch": 2.69, "learning_rate": 1.910442397951586e-05, "loss": 0.005, "step": 186490 }, { "epoch": 2.69, "learning_rate": 1.9104375939777388e-05, "loss": 0.0095, "step": 186500 }, { "epoch": 2.69, "learning_rate": 1.9104327900038914e-05, "loss": 0.0052, "step": 186510 }, { "epoch": 2.69, "learning_rate": 1.9104279860300443e-05, "loss": 0.0075, "step": 186520 }, { "epoch": 2.69, "learning_rate": 1.9104231820561972e-05, "loss": 0.0075, "step": 186530 }, { "epoch": 2.69, "learning_rate": 1.9104183780823498e-05, "loss": 0.0071, "step": 186540 }, { "epoch": 2.69, "learning_rate": 1.9104135741085027e-05, "loss": 0.0079, "step": 186550 }, { "epoch": 2.69, "learning_rate": 1.9104087701346557e-05, "loss": 0.0057, "step": 186560 }, { "epoch": 2.69, "learning_rate": 1.9104039661608086e-05, "loss": 0.0078, "step": 186570 }, { "epoch": 2.69, "learning_rate": 1.9103991621869612e-05, "loss": 0.0076, "step": 186580 }, { "epoch": 2.69, "learning_rate": 1.910394358213114e-05, "loss": 0.0069, "step": 186590 }, { "epoch": 2.69, "learning_rate": 1.910389554239267e-05, "loss": 0.0052, "step": 186600 }, { "epoch": 2.69, "learning_rate": 1.91038475026542e-05, "loss": 0.0064, "step": 186610 }, { "epoch": 2.69, "learning_rate": 1.9103799462915726e-05, "loss": 0.0068, "step": 186620 }, { "epoch": 2.69, "learning_rate": 1.9103751423177255e-05, "loss": 0.0083, "step": 186630 }, { "epoch": 2.69, "learning_rate": 1.9103703383438784e-05, "loss": 0.0051, "step": 186640 }, { "epoch": 2.69, "learning_rate": 1.910365534370031e-05, "loss": 0.0073, "step": 186650 }, { "epoch": 2.69, "learning_rate": 1.910360730396184e-05, "loss": 0.0054, "step": 186660 }, { "epoch": 2.69, "learning_rate": 1.910355926422337e-05, "loss": 0.0076, "step": 186670 }, { "epoch": 2.69, "learning_rate": 1.9103511224484898e-05, "loss": 0.0049, "step": 186680 }, { "epoch": 2.69, "learning_rate": 1.9103463184746424e-05, "loss": 0.0048, "step": 186690 }, { "epoch": 2.69, "learning_rate": 1.9103415145007953e-05, "loss": 0.0075, "step": 186700 }, { "epoch": 2.69, "learning_rate": 1.9103367105269482e-05, "loss": 0.0093, "step": 186710 }, { "epoch": 2.69, "learning_rate": 1.9103319065531008e-05, "loss": 0.0068, "step": 186720 }, { "epoch": 2.69, "learning_rate": 1.9103271025792537e-05, "loss": 0.0066, "step": 186730 }, { "epoch": 2.69, "learning_rate": 1.9103222986054067e-05, "loss": 0.0059, "step": 186740 }, { "epoch": 2.69, "learning_rate": 1.9103174946315596e-05, "loss": 0.0062, "step": 186750 }, { "epoch": 2.69, "learning_rate": 1.9103126906577122e-05, "loss": 0.0055, "step": 186760 }, { "epoch": 2.69, "learning_rate": 1.910307886683865e-05, "loss": 0.0086, "step": 186770 }, { "epoch": 2.69, "learning_rate": 1.910303082710018e-05, "loss": 0.0065, "step": 186780 }, { "epoch": 2.69, "learning_rate": 1.910298278736171e-05, "loss": 0.0049, "step": 186790 }, { "epoch": 2.69, "learning_rate": 1.9102934747623235e-05, "loss": 0.0057, "step": 186800 }, { "epoch": 2.69, "learning_rate": 1.9102886707884765e-05, "loss": 0.006, "step": 186810 }, { "epoch": 2.69, "learning_rate": 1.9102838668146294e-05, "loss": 0.0113, "step": 186820 }, { "epoch": 2.69, "learning_rate": 1.910279062840782e-05, "loss": 0.0075, "step": 186830 }, { "epoch": 2.69, "learning_rate": 1.910274258866935e-05, "loss": 0.006, "step": 186840 }, { "epoch": 2.69, "learning_rate": 1.910269454893088e-05, "loss": 0.0066, "step": 186850 }, { "epoch": 2.69, "learning_rate": 1.9102646509192408e-05, "loss": 0.0061, "step": 186860 }, { "epoch": 2.69, "learning_rate": 1.9102598469453934e-05, "loss": 0.0067, "step": 186870 }, { "epoch": 2.69, "learning_rate": 1.9102550429715463e-05, "loss": 0.0064, "step": 186880 }, { "epoch": 2.69, "learning_rate": 1.9102502389976992e-05, "loss": 0.006, "step": 186890 }, { "epoch": 2.69, "learning_rate": 1.9102454350238518e-05, "loss": 0.007, "step": 186900 }, { "epoch": 2.69, "learning_rate": 1.9102406310500047e-05, "loss": 0.009, "step": 186910 }, { "epoch": 2.69, "learning_rate": 1.9102358270761577e-05, "loss": 0.0068, "step": 186920 }, { "epoch": 2.69, "learning_rate": 1.9102310231023106e-05, "loss": 0.006, "step": 186930 }, { "epoch": 2.69, "learning_rate": 1.910226219128463e-05, "loss": 0.0088, "step": 186940 }, { "epoch": 2.69, "learning_rate": 1.910221415154616e-05, "loss": 0.0082, "step": 186950 }, { "epoch": 2.69, "learning_rate": 1.910216611180769e-05, "loss": 0.0047, "step": 186960 }, { "epoch": 2.69, "learning_rate": 1.910211807206922e-05, "loss": 0.0086, "step": 186970 }, { "epoch": 2.69, "learning_rate": 1.9102070032330745e-05, "loss": 0.0068, "step": 186980 }, { "epoch": 2.69, "learning_rate": 1.9102021992592275e-05, "loss": 0.0097, "step": 186990 }, { "epoch": 2.7, "learning_rate": 1.9101973952853804e-05, "loss": 0.006, "step": 187000 }, { "epoch": 2.7, "learning_rate": 1.910192591311533e-05, "loss": 0.0086, "step": 187010 }, { "epoch": 2.7, "learning_rate": 1.910187787337686e-05, "loss": 0.0076, "step": 187020 }, { "epoch": 2.7, "learning_rate": 1.910182983363839e-05, "loss": 0.0099, "step": 187030 }, { "epoch": 2.7, "learning_rate": 1.9101781793899918e-05, "loss": 0.0111, "step": 187040 }, { "epoch": 2.7, "learning_rate": 1.9101733754161443e-05, "loss": 0.0076, "step": 187050 }, { "epoch": 2.7, "learning_rate": 1.9101685714422973e-05, "loss": 0.0086, "step": 187060 }, { "epoch": 2.7, "learning_rate": 1.9101637674684502e-05, "loss": 0.008, "step": 187070 }, { "epoch": 2.7, "learning_rate": 1.9101589634946028e-05, "loss": 0.0099, "step": 187080 }, { "epoch": 2.7, "learning_rate": 1.9101541595207557e-05, "loss": 0.0099, "step": 187090 }, { "epoch": 2.7, "learning_rate": 1.9101493555469086e-05, "loss": 0.0066, "step": 187100 }, { "epoch": 2.7, "learning_rate": 1.9101445515730616e-05, "loss": 0.0077, "step": 187110 }, { "epoch": 2.7, "learning_rate": 1.910139747599214e-05, "loss": 0.0074, "step": 187120 }, { "epoch": 2.7, "learning_rate": 1.910134943625367e-05, "loss": 0.0077, "step": 187130 }, { "epoch": 2.7, "learning_rate": 1.91013013965152e-05, "loss": 0.0077, "step": 187140 }, { "epoch": 2.7, "learning_rate": 1.910125335677673e-05, "loss": 0.005, "step": 187150 }, { "epoch": 2.7, "learning_rate": 1.9101205317038255e-05, "loss": 0.0049, "step": 187160 }, { "epoch": 2.7, "learning_rate": 1.9101157277299785e-05, "loss": 0.0077, "step": 187170 }, { "epoch": 2.7, "learning_rate": 1.9101109237561314e-05, "loss": 0.0053, "step": 187180 }, { "epoch": 2.7, "learning_rate": 1.910106119782284e-05, "loss": 0.0082, "step": 187190 }, { "epoch": 2.7, "learning_rate": 1.910101315808437e-05, "loss": 0.0039, "step": 187200 }, { "epoch": 2.7, "learning_rate": 1.9100965118345898e-05, "loss": 0.0069, "step": 187210 }, { "epoch": 2.7, "learning_rate": 1.9100917078607428e-05, "loss": 0.0063, "step": 187220 }, { "epoch": 2.7, "learning_rate": 1.9100869038868953e-05, "loss": 0.0038, "step": 187230 }, { "epoch": 2.7, "learning_rate": 1.9100820999130483e-05, "loss": 0.0062, "step": 187240 }, { "epoch": 2.7, "learning_rate": 1.9100772959392012e-05, "loss": 0.0065, "step": 187250 }, { "epoch": 2.7, "learning_rate": 1.9100724919653538e-05, "loss": 0.0107, "step": 187260 }, { "epoch": 2.7, "learning_rate": 1.9100676879915067e-05, "loss": 0.0069, "step": 187270 }, { "epoch": 2.7, "learning_rate": 1.9100628840176596e-05, "loss": 0.007, "step": 187280 }, { "epoch": 2.7, "learning_rate": 1.9100580800438126e-05, "loss": 0.0082, "step": 187290 }, { "epoch": 2.7, "learning_rate": 1.910053276069965e-05, "loss": 0.0106, "step": 187300 }, { "epoch": 2.7, "learning_rate": 1.910048472096118e-05, "loss": 0.0066, "step": 187310 }, { "epoch": 2.7, "learning_rate": 1.910043668122271e-05, "loss": 0.0082, "step": 187320 }, { "epoch": 2.7, "learning_rate": 1.910038864148424e-05, "loss": 0.0053, "step": 187330 }, { "epoch": 2.7, "learning_rate": 1.9100340601745765e-05, "loss": 0.0065, "step": 187340 }, { "epoch": 2.7, "learning_rate": 1.9100292562007294e-05, "loss": 0.0062, "step": 187350 }, { "epoch": 2.7, "learning_rate": 1.9100244522268824e-05, "loss": 0.0068, "step": 187360 }, { "epoch": 2.7, "learning_rate": 1.910019648253035e-05, "loss": 0.0068, "step": 187370 }, { "epoch": 2.7, "learning_rate": 1.910014844279188e-05, "loss": 0.0062, "step": 187380 }, { "epoch": 2.7, "learning_rate": 1.9100100403053408e-05, "loss": 0.0059, "step": 187390 }, { "epoch": 2.7, "learning_rate": 1.9100052363314937e-05, "loss": 0.009, "step": 187400 }, { "epoch": 2.7, "learning_rate": 1.9100004323576463e-05, "loss": 0.0082, "step": 187410 }, { "epoch": 2.7, "learning_rate": 1.9099956283837993e-05, "loss": 0.01, "step": 187420 }, { "epoch": 2.7, "learning_rate": 1.9099908244099522e-05, "loss": 0.0076, "step": 187430 }, { "epoch": 2.7, "learning_rate": 1.9099860204361048e-05, "loss": 0.0082, "step": 187440 }, { "epoch": 2.7, "learning_rate": 1.9099816968596426e-05, "loss": 0.0058, "step": 187450 }, { "epoch": 2.7, "learning_rate": 1.9099768928857955e-05, "loss": 0.0048, "step": 187460 }, { "epoch": 2.7, "learning_rate": 1.909972088911948e-05, "loss": 0.0045, "step": 187470 }, { "epoch": 2.7, "learning_rate": 1.909967284938101e-05, "loss": 0.0069, "step": 187480 }, { "epoch": 2.7, "learning_rate": 1.909962480964254e-05, "loss": 0.007, "step": 187490 }, { "epoch": 2.7, "learning_rate": 1.9099576769904065e-05, "loss": 0.0101, "step": 187500 }, { "epoch": 2.7, "learning_rate": 1.9099528730165595e-05, "loss": 0.0083, "step": 187510 }, { "epoch": 2.7, "learning_rate": 1.9099480690427124e-05, "loss": 0.0055, "step": 187520 }, { "epoch": 2.7, "learning_rate": 1.9099432650688653e-05, "loss": 0.0079, "step": 187530 }, { "epoch": 2.7, "learning_rate": 1.909938461095018e-05, "loss": 0.0067, "step": 187540 }, { "epoch": 2.7, "learning_rate": 1.9099336571211708e-05, "loss": 0.0073, "step": 187550 }, { "epoch": 2.7, "learning_rate": 1.9099288531473238e-05, "loss": 0.0056, "step": 187560 }, { "epoch": 2.7, "learning_rate": 1.9099240491734763e-05, "loss": 0.0054, "step": 187570 }, { "epoch": 2.7, "learning_rate": 1.9099192451996293e-05, "loss": 0.0078, "step": 187580 }, { "epoch": 2.7, "learning_rate": 1.9099144412257822e-05, "loss": 0.0101, "step": 187590 }, { "epoch": 2.7, "learning_rate": 1.909909637251935e-05, "loss": 0.0076, "step": 187600 }, { "epoch": 2.7, "learning_rate": 1.9099048332780877e-05, "loss": 0.0074, "step": 187610 }, { "epoch": 2.7, "learning_rate": 1.9099000293042406e-05, "loss": 0.0057, "step": 187620 }, { "epoch": 2.7, "learning_rate": 1.9098952253303936e-05, "loss": 0.0067, "step": 187630 }, { "epoch": 2.7, "learning_rate": 1.9098904213565465e-05, "loss": 0.0076, "step": 187640 }, { "epoch": 2.7, "learning_rate": 1.909885617382699e-05, "loss": 0.0075, "step": 187650 }, { "epoch": 2.7, "learning_rate": 1.909880813408852e-05, "loss": 0.007, "step": 187660 }, { "epoch": 2.7, "learning_rate": 1.909876009435005e-05, "loss": 0.0065, "step": 187670 }, { "epoch": 2.7, "learning_rate": 1.9098712054611575e-05, "loss": 0.0063, "step": 187680 }, { "epoch": 2.7, "learning_rate": 1.9098664014873105e-05, "loss": 0.0052, "step": 187690 }, { "epoch": 2.71, "learning_rate": 1.9098615975134634e-05, "loss": 0.0052, "step": 187700 }, { "epoch": 2.71, "learning_rate": 1.9098567935396163e-05, "loss": 0.0058, "step": 187710 }, { "epoch": 2.71, "learning_rate": 1.909851989565769e-05, "loss": 0.0077, "step": 187720 }, { "epoch": 2.71, "learning_rate": 1.9098471855919218e-05, "loss": 0.0068, "step": 187730 }, { "epoch": 2.71, "learning_rate": 1.9098423816180747e-05, "loss": 0.0084, "step": 187740 }, { "epoch": 2.71, "learning_rate": 1.9098375776442273e-05, "loss": 0.0066, "step": 187750 }, { "epoch": 2.71, "learning_rate": 1.9098327736703803e-05, "loss": 0.0049, "step": 187760 }, { "epoch": 2.71, "learning_rate": 1.9098279696965332e-05, "loss": 0.0065, "step": 187770 }, { "epoch": 2.71, "learning_rate": 1.909823165722686e-05, "loss": 0.0063, "step": 187780 }, { "epoch": 2.71, "learning_rate": 1.9098183617488387e-05, "loss": 0.0069, "step": 187790 }, { "epoch": 2.71, "learning_rate": 1.9098135577749916e-05, "loss": 0.0084, "step": 187800 }, { "epoch": 2.71, "learning_rate": 1.9098087538011446e-05, "loss": 0.0082, "step": 187810 }, { "epoch": 2.71, "learning_rate": 1.9098039498272975e-05, "loss": 0.0055, "step": 187820 }, { "epoch": 2.71, "learning_rate": 1.90979914585345e-05, "loss": 0.0076, "step": 187830 }, { "epoch": 2.71, "learning_rate": 1.909794341879603e-05, "loss": 0.0055, "step": 187840 }, { "epoch": 2.71, "learning_rate": 1.909789537905756e-05, "loss": 0.0074, "step": 187850 }, { "epoch": 2.71, "learning_rate": 1.9097847339319085e-05, "loss": 0.0083, "step": 187860 }, { "epoch": 2.71, "learning_rate": 1.9097799299580614e-05, "loss": 0.0062, "step": 187870 }, { "epoch": 2.71, "learning_rate": 1.9097751259842144e-05, "loss": 0.0051, "step": 187880 }, { "epoch": 2.71, "learning_rate": 1.9097703220103673e-05, "loss": 0.0047, "step": 187890 }, { "epoch": 2.71, "learning_rate": 1.90976551803652e-05, "loss": 0.0072, "step": 187900 }, { "epoch": 2.71, "learning_rate": 1.9097607140626728e-05, "loss": 0.0058, "step": 187910 }, { "epoch": 2.71, "learning_rate": 1.9097559100888257e-05, "loss": 0.0073, "step": 187920 }, { "epoch": 2.71, "learning_rate": 1.9097511061149783e-05, "loss": 0.0064, "step": 187930 }, { "epoch": 2.71, "learning_rate": 1.9097463021411313e-05, "loss": 0.0085, "step": 187940 }, { "epoch": 2.71, "learning_rate": 1.9097414981672842e-05, "loss": 0.0086, "step": 187950 }, { "epoch": 2.71, "learning_rate": 1.909736694193437e-05, "loss": 0.0087, "step": 187960 }, { "epoch": 2.71, "learning_rate": 1.9097318902195897e-05, "loss": 0.0065, "step": 187970 }, { "epoch": 2.71, "learning_rate": 1.9097270862457426e-05, "loss": 0.0098, "step": 187980 }, { "epoch": 2.71, "learning_rate": 1.9097222822718956e-05, "loss": 0.008, "step": 187990 }, { "epoch": 2.71, "learning_rate": 1.9097174782980485e-05, "loss": 0.007, "step": 188000 }, { "epoch": 2.71, "learning_rate": 1.909712674324201e-05, "loss": 0.0081, "step": 188010 }, { "epoch": 2.71, "learning_rate": 1.909707870350354e-05, "loss": 0.0065, "step": 188020 }, { "epoch": 2.71, "learning_rate": 1.909703066376507e-05, "loss": 0.0083, "step": 188030 }, { "epoch": 2.71, "learning_rate": 1.9096982624026595e-05, "loss": 0.0085, "step": 188040 }, { "epoch": 2.71, "learning_rate": 1.9096934584288124e-05, "loss": 0.0083, "step": 188050 }, { "epoch": 2.71, "learning_rate": 1.9096886544549654e-05, "loss": 0.007, "step": 188060 }, { "epoch": 2.71, "learning_rate": 1.9096838504811183e-05, "loss": 0.0055, "step": 188070 }, { "epoch": 2.71, "learning_rate": 1.909679046507271e-05, "loss": 0.008, "step": 188080 }, { "epoch": 2.71, "learning_rate": 1.9096742425334238e-05, "loss": 0.0083, "step": 188090 }, { "epoch": 2.71, "learning_rate": 1.9096694385595767e-05, "loss": 0.0065, "step": 188100 }, { "epoch": 2.71, "learning_rate": 1.9096646345857293e-05, "loss": 0.0063, "step": 188110 }, { "epoch": 2.71, "learning_rate": 1.9096598306118822e-05, "loss": 0.0045, "step": 188120 }, { "epoch": 2.71, "learning_rate": 1.9096550266380352e-05, "loss": 0.0053, "step": 188130 }, { "epoch": 2.71, "learning_rate": 1.909650222664188e-05, "loss": 0.0115, "step": 188140 }, { "epoch": 2.71, "learning_rate": 1.9096454186903407e-05, "loss": 0.0063, "step": 188150 }, { "epoch": 2.71, "learning_rate": 1.9096406147164936e-05, "loss": 0.0068, "step": 188160 }, { "epoch": 2.71, "learning_rate": 1.9096358107426465e-05, "loss": 0.0052, "step": 188170 }, { "epoch": 2.71, "learning_rate": 1.9096310067687995e-05, "loss": 0.0053, "step": 188180 }, { "epoch": 2.71, "learning_rate": 1.909626202794952e-05, "loss": 0.0088, "step": 188190 }, { "epoch": 2.71, "learning_rate": 1.909621398821105e-05, "loss": 0.0078, "step": 188200 }, { "epoch": 2.71, "learning_rate": 1.909616594847258e-05, "loss": 0.0069, "step": 188210 }, { "epoch": 2.71, "learning_rate": 1.9096117908734105e-05, "loss": 0.006, "step": 188220 }, { "epoch": 2.71, "learning_rate": 1.9096069868995634e-05, "loss": 0.007, "step": 188230 }, { "epoch": 2.71, "learning_rate": 1.9096021829257164e-05, "loss": 0.0067, "step": 188240 }, { "epoch": 2.71, "learning_rate": 1.9095973789518693e-05, "loss": 0.0051, "step": 188250 }, { "epoch": 2.71, "learning_rate": 1.909592574978022e-05, "loss": 0.0071, "step": 188260 }, { "epoch": 2.71, "learning_rate": 1.9095877710041748e-05, "loss": 0.0072, "step": 188270 }, { "epoch": 2.71, "learning_rate": 1.9095829670303277e-05, "loss": 0.006, "step": 188280 }, { "epoch": 2.71, "learning_rate": 1.9095781630564803e-05, "loss": 0.0098, "step": 188290 }, { "epoch": 2.71, "learning_rate": 1.9095733590826332e-05, "loss": 0.0068, "step": 188300 }, { "epoch": 2.71, "learning_rate": 1.909568555108786e-05, "loss": 0.0073, "step": 188310 }, { "epoch": 2.71, "learning_rate": 1.909563751134939e-05, "loss": 0.0085, "step": 188320 }, { "epoch": 2.71, "learning_rate": 1.9095589471610917e-05, "loss": 0.0097, "step": 188330 }, { "epoch": 2.71, "learning_rate": 1.9095541431872446e-05, "loss": 0.0072, "step": 188340 }, { "epoch": 2.71, "learning_rate": 1.9095493392133975e-05, "loss": 0.0098, "step": 188350 }, { "epoch": 2.71, "learning_rate": 1.9095445352395505e-05, "loss": 0.0046, "step": 188360 }, { "epoch": 2.71, "learning_rate": 1.909539731265703e-05, "loss": 0.0066, "step": 188370 }, { "epoch": 2.71, "learning_rate": 1.909534927291856e-05, "loss": 0.0082, "step": 188380 }, { "epoch": 2.72, "learning_rate": 1.909530123318009e-05, "loss": 0.0078, "step": 188390 }, { "epoch": 2.72, "learning_rate": 1.9095253193441615e-05, "loss": 0.0089, "step": 188400 }, { "epoch": 2.72, "learning_rate": 1.9095205153703144e-05, "loss": 0.007, "step": 188410 }, { "epoch": 2.72, "learning_rate": 1.9095157113964673e-05, "loss": 0.0164, "step": 188420 }, { "epoch": 2.72, "learning_rate": 1.9095109074226203e-05, "loss": 0.0072, "step": 188430 }, { "epoch": 2.72, "learning_rate": 1.909506103448773e-05, "loss": 0.0095, "step": 188440 }, { "epoch": 2.72, "learning_rate": 1.9095012994749258e-05, "loss": 0.0063, "step": 188450 }, { "epoch": 2.72, "learning_rate": 1.9094964955010787e-05, "loss": 0.0077, "step": 188460 }, { "epoch": 2.72, "learning_rate": 1.9094916915272313e-05, "loss": 0.0066, "step": 188470 }, { "epoch": 2.72, "learning_rate": 1.9094868875533842e-05, "loss": 0.0054, "step": 188480 }, { "epoch": 2.72, "learning_rate": 1.909482083579537e-05, "loss": 0.0102, "step": 188490 }, { "epoch": 2.72, "learning_rate": 1.90947727960569e-05, "loss": 0.0082, "step": 188500 }, { "epoch": 2.72, "learning_rate": 1.9094724756318427e-05, "loss": 0.0057, "step": 188510 }, { "epoch": 2.72, "learning_rate": 1.9094676716579956e-05, "loss": 0.0119, "step": 188520 }, { "epoch": 2.72, "learning_rate": 1.9094628676841485e-05, "loss": 0.0085, "step": 188530 }, { "epoch": 2.72, "learning_rate": 1.9094580637103015e-05, "loss": 0.0048, "step": 188540 }, { "epoch": 2.72, "learning_rate": 1.909453259736454e-05, "loss": 0.0057, "step": 188550 }, { "epoch": 2.72, "learning_rate": 1.909448455762607e-05, "loss": 0.0047, "step": 188560 }, { "epoch": 2.72, "learning_rate": 1.90944365178876e-05, "loss": 0.0105, "step": 188570 }, { "epoch": 2.72, "learning_rate": 1.9094388478149125e-05, "loss": 0.0101, "step": 188580 }, { "epoch": 2.72, "learning_rate": 1.9094340438410654e-05, "loss": 0.0062, "step": 188590 }, { "epoch": 2.72, "learning_rate": 1.9094292398672183e-05, "loss": 0.0057, "step": 188600 }, { "epoch": 2.72, "learning_rate": 1.9094244358933713e-05, "loss": 0.008, "step": 188610 }, { "epoch": 2.72, "learning_rate": 1.909419631919524e-05, "loss": 0.0103, "step": 188620 }, { "epoch": 2.72, "learning_rate": 1.9094148279456768e-05, "loss": 0.0105, "step": 188630 }, { "epoch": 2.72, "learning_rate": 1.9094100239718297e-05, "loss": 0.0104, "step": 188640 }, { "epoch": 2.72, "learning_rate": 1.9094052199979823e-05, "loss": 0.0081, "step": 188650 }, { "epoch": 2.72, "learning_rate": 1.9094004160241352e-05, "loss": 0.0062, "step": 188660 }, { "epoch": 2.72, "learning_rate": 1.909395612050288e-05, "loss": 0.0052, "step": 188670 }, { "epoch": 2.72, "learning_rate": 1.909390808076441e-05, "loss": 0.0067, "step": 188680 }, { "epoch": 2.72, "learning_rate": 1.9093860041025937e-05, "loss": 0.0066, "step": 188690 }, { "epoch": 2.72, "learning_rate": 1.9093812001287466e-05, "loss": 0.006, "step": 188700 }, { "epoch": 2.72, "learning_rate": 1.9093763961548995e-05, "loss": 0.006, "step": 188710 }, { "epoch": 2.72, "learning_rate": 1.9093715921810524e-05, "loss": 0.0049, "step": 188720 }, { "epoch": 2.72, "learning_rate": 1.909366788207205e-05, "loss": 0.0084, "step": 188730 }, { "epoch": 2.72, "learning_rate": 1.909361984233358e-05, "loss": 0.0057, "step": 188740 }, { "epoch": 2.72, "learning_rate": 1.909357180259511e-05, "loss": 0.0049, "step": 188750 }, { "epoch": 2.72, "learning_rate": 1.9093523762856635e-05, "loss": 0.0071, "step": 188760 }, { "epoch": 2.72, "learning_rate": 1.9093475723118164e-05, "loss": 0.0044, "step": 188770 }, { "epoch": 2.72, "learning_rate": 1.9093427683379693e-05, "loss": 0.0075, "step": 188780 }, { "epoch": 2.72, "learning_rate": 1.9093379643641223e-05, "loss": 0.0051, "step": 188790 }, { "epoch": 2.72, "learning_rate": 1.909333160390275e-05, "loss": 0.0057, "step": 188800 }, { "epoch": 2.72, "learning_rate": 1.9093283564164278e-05, "loss": 0.0092, "step": 188810 }, { "epoch": 2.72, "learning_rate": 1.9093235524425807e-05, "loss": 0.0069, "step": 188820 }, { "epoch": 2.72, "learning_rate": 1.9093187484687333e-05, "loss": 0.0074, "step": 188830 }, { "epoch": 2.72, "learning_rate": 1.9093139444948862e-05, "loss": 0.0053, "step": 188840 }, { "epoch": 2.72, "learning_rate": 1.909309140521039e-05, "loss": 0.0063, "step": 188850 }, { "epoch": 2.72, "learning_rate": 1.909304336547192e-05, "loss": 0.0078, "step": 188860 }, { "epoch": 2.72, "learning_rate": 1.9092995325733447e-05, "loss": 0.0095, "step": 188870 }, { "epoch": 2.72, "learning_rate": 1.9092947285994976e-05, "loss": 0.0055, "step": 188880 }, { "epoch": 2.72, "learning_rate": 1.9092899246256505e-05, "loss": 0.0084, "step": 188890 }, { "epoch": 2.72, "learning_rate": 1.9092851206518034e-05, "loss": 0.0067, "step": 188900 }, { "epoch": 2.72, "learning_rate": 1.909280316677956e-05, "loss": 0.0072, "step": 188910 }, { "epoch": 2.72, "learning_rate": 1.909275512704109e-05, "loss": 0.0068, "step": 188920 }, { "epoch": 2.72, "learning_rate": 1.909270708730262e-05, "loss": 0.0064, "step": 188930 }, { "epoch": 2.72, "learning_rate": 1.9092659047564145e-05, "loss": 0.0068, "step": 188940 }, { "epoch": 2.72, "learning_rate": 1.9092611007825674e-05, "loss": 0.0059, "step": 188950 }, { "epoch": 2.72, "learning_rate": 1.9092562968087203e-05, "loss": 0.0076, "step": 188960 }, { "epoch": 2.72, "learning_rate": 1.9092514928348732e-05, "loss": 0.0079, "step": 188970 }, { "epoch": 2.72, "learning_rate": 1.909246688861026e-05, "loss": 0.0049, "step": 188980 }, { "epoch": 2.72, "learning_rate": 1.9092418848871788e-05, "loss": 0.0062, "step": 188990 }, { "epoch": 2.72, "learning_rate": 1.9092370809133317e-05, "loss": 0.0067, "step": 189000 }, { "epoch": 2.72, "learning_rate": 1.9092322769394843e-05, "loss": 0.007, "step": 189010 }, { "epoch": 2.72, "learning_rate": 1.9092274729656372e-05, "loss": 0.0058, "step": 189020 }, { "epoch": 2.72, "learning_rate": 1.90922266899179e-05, "loss": 0.0048, "step": 189030 }, { "epoch": 2.72, "learning_rate": 1.909217865017943e-05, "loss": 0.0076, "step": 189040 }, { "epoch": 2.72, "learning_rate": 1.9092130610440956e-05, "loss": 0.0058, "step": 189050 }, { "epoch": 2.72, "learning_rate": 1.9092082570702486e-05, "loss": 0.0085, "step": 189060 }, { "epoch": 2.72, "learning_rate": 1.9092034530964015e-05, "loss": 0.0083, "step": 189070 }, { "epoch": 2.73, "learning_rate": 1.9091986491225544e-05, "loss": 0.0063, "step": 189080 }, { "epoch": 2.73, "learning_rate": 1.909193845148707e-05, "loss": 0.0052, "step": 189090 }, { "epoch": 2.73, "learning_rate": 1.90918904117486e-05, "loss": 0.0052, "step": 189100 }, { "epoch": 2.73, "learning_rate": 1.909184237201013e-05, "loss": 0.0105, "step": 189110 }, { "epoch": 2.73, "learning_rate": 1.9091794332271655e-05, "loss": 0.0092, "step": 189120 }, { "epoch": 2.73, "learning_rate": 1.9091746292533184e-05, "loss": 0.0056, "step": 189130 }, { "epoch": 2.73, "learning_rate": 1.9091698252794713e-05, "loss": 0.0108, "step": 189140 }, { "epoch": 2.73, "learning_rate": 1.9091650213056242e-05, "loss": 0.0083, "step": 189150 }, { "epoch": 2.73, "learning_rate": 1.9091602173317768e-05, "loss": 0.0067, "step": 189160 }, { "epoch": 2.73, "learning_rate": 1.9091554133579298e-05, "loss": 0.0079, "step": 189170 }, { "epoch": 2.73, "learning_rate": 1.9091506093840827e-05, "loss": 0.0065, "step": 189180 }, { "epoch": 2.73, "learning_rate": 1.9091458054102353e-05, "loss": 0.0062, "step": 189190 }, { "epoch": 2.73, "learning_rate": 1.9091410014363882e-05, "loss": 0.0097, "step": 189200 }, { "epoch": 2.73, "learning_rate": 1.909136197462541e-05, "loss": 0.009, "step": 189210 }, { "epoch": 2.73, "learning_rate": 1.909131393488694e-05, "loss": 0.0096, "step": 189220 }, { "epoch": 2.73, "learning_rate": 1.9091265895148466e-05, "loss": 0.0064, "step": 189230 }, { "epoch": 2.73, "learning_rate": 1.9091217855409996e-05, "loss": 0.008, "step": 189240 }, { "epoch": 2.73, "learning_rate": 1.9091169815671525e-05, "loss": 0.0083, "step": 189250 }, { "epoch": 2.73, "learning_rate": 1.9091121775933054e-05, "loss": 0.0074, "step": 189260 }, { "epoch": 2.73, "learning_rate": 1.909107373619458e-05, "loss": 0.007, "step": 189270 }, { "epoch": 2.73, "learning_rate": 1.909102569645611e-05, "loss": 0.0076, "step": 189280 }, { "epoch": 2.73, "learning_rate": 1.909097765671764e-05, "loss": 0.0064, "step": 189290 }, { "epoch": 2.73, "learning_rate": 1.9090929616979164e-05, "loss": 0.0094, "step": 189300 }, { "epoch": 2.73, "learning_rate": 1.9090881577240694e-05, "loss": 0.0053, "step": 189310 }, { "epoch": 2.73, "learning_rate": 1.9090833537502223e-05, "loss": 0.0104, "step": 189320 }, { "epoch": 2.73, "learning_rate": 1.9090785497763752e-05, "loss": 0.0056, "step": 189330 }, { "epoch": 2.73, "learning_rate": 1.9090737458025278e-05, "loss": 0.0057, "step": 189340 }, { "epoch": 2.73, "learning_rate": 1.9090689418286807e-05, "loss": 0.0097, "step": 189350 }, { "epoch": 2.73, "learning_rate": 1.9090641378548337e-05, "loss": 0.0068, "step": 189360 }, { "epoch": 2.73, "learning_rate": 1.9090593338809863e-05, "loss": 0.0057, "step": 189370 }, { "epoch": 2.73, "learning_rate": 1.9090545299071392e-05, "loss": 0.009, "step": 189380 }, { "epoch": 2.73, "learning_rate": 1.909049725933292e-05, "loss": 0.0047, "step": 189390 }, { "epoch": 2.73, "learning_rate": 1.909044921959445e-05, "loss": 0.006, "step": 189400 }, { "epoch": 2.73, "learning_rate": 1.9090401179855976e-05, "loss": 0.0078, "step": 189410 }, { "epoch": 2.73, "learning_rate": 1.9090353140117506e-05, "loss": 0.0074, "step": 189420 }, { "epoch": 2.73, "learning_rate": 1.9090305100379035e-05, "loss": 0.0073, "step": 189430 }, { "epoch": 2.73, "learning_rate": 1.909025706064056e-05, "loss": 0.0076, "step": 189440 }, { "epoch": 2.73, "learning_rate": 1.909020902090209e-05, "loss": 0.008, "step": 189450 }, { "epoch": 2.73, "learning_rate": 1.909016098116362e-05, "loss": 0.0079, "step": 189460 }, { "epoch": 2.73, "learning_rate": 1.909011294142515e-05, "loss": 0.0065, "step": 189470 }, { "epoch": 2.73, "learning_rate": 1.9090064901686674e-05, "loss": 0.0086, "step": 189480 }, { "epoch": 2.73, "learning_rate": 1.9090016861948204e-05, "loss": 0.0058, "step": 189490 }, { "epoch": 2.73, "learning_rate": 1.9089968822209733e-05, "loss": 0.0078, "step": 189500 }, { "epoch": 2.73, "learning_rate": 1.9089920782471262e-05, "loss": 0.0078, "step": 189510 }, { "epoch": 2.73, "learning_rate": 1.908987274273279e-05, "loss": 0.0072, "step": 189520 }, { "epoch": 2.73, "learning_rate": 1.908982470299432e-05, "loss": 0.0051, "step": 189530 }, { "epoch": 2.73, "learning_rate": 1.9089776663255847e-05, "loss": 0.0069, "step": 189540 }, { "epoch": 2.73, "learning_rate": 1.9089728623517376e-05, "loss": 0.0061, "step": 189550 }, { "epoch": 2.73, "learning_rate": 1.9089680583778905e-05, "loss": 0.0082, "step": 189560 }, { "epoch": 2.73, "learning_rate": 1.9089632544040434e-05, "loss": 0.0087, "step": 189570 }, { "epoch": 2.73, "learning_rate": 1.908958450430196e-05, "loss": 0.0061, "step": 189580 }, { "epoch": 2.73, "learning_rate": 1.908953646456349e-05, "loss": 0.0084, "step": 189590 }, { "epoch": 2.73, "learning_rate": 1.908948842482502e-05, "loss": 0.0112, "step": 189600 }, { "epoch": 2.73, "learning_rate": 1.9089440385086545e-05, "loss": 0.0069, "step": 189610 }, { "epoch": 2.73, "learning_rate": 1.9089392345348074e-05, "loss": 0.0106, "step": 189620 }, { "epoch": 2.73, "learning_rate": 1.9089344305609603e-05, "loss": 0.0075, "step": 189630 }, { "epoch": 2.73, "learning_rate": 1.9089296265871133e-05, "loss": 0.0066, "step": 189640 }, { "epoch": 2.73, "learning_rate": 1.908924822613266e-05, "loss": 0.0051, "step": 189650 }, { "epoch": 2.73, "learning_rate": 1.9089200186394188e-05, "loss": 0.0057, "step": 189660 }, { "epoch": 2.73, "learning_rate": 1.9089152146655717e-05, "loss": 0.0088, "step": 189670 }, { "epoch": 2.73, "learning_rate": 1.9089104106917243e-05, "loss": 0.0083, "step": 189680 }, { "epoch": 2.73, "learning_rate": 1.9089056067178772e-05, "loss": 0.0055, "step": 189690 }, { "epoch": 2.73, "learning_rate": 1.90890080274403e-05, "loss": 0.0059, "step": 189700 }, { "epoch": 2.73, "learning_rate": 1.908895998770183e-05, "loss": 0.0105, "step": 189710 }, { "epoch": 2.73, "learning_rate": 1.9088911947963357e-05, "loss": 0.0091, "step": 189720 }, { "epoch": 2.73, "learning_rate": 1.9088863908224886e-05, "loss": 0.0073, "step": 189730 }, { "epoch": 2.73, "learning_rate": 1.9088815868486415e-05, "loss": 0.0059, "step": 189740 }, { "epoch": 2.73, "learning_rate": 1.9088767828747944e-05, "loss": 0.0081, "step": 189750 }, { "epoch": 2.73, "learning_rate": 1.908871978900947e-05, "loss": 0.0088, "step": 189760 }, { "epoch": 2.73, "learning_rate": 1.9088671749271e-05, "loss": 0.01, "step": 189770 }, { "epoch": 2.74, "learning_rate": 1.908862370953253e-05, "loss": 0.009, "step": 189780 }, { "epoch": 2.74, "learning_rate": 1.9088575669794055e-05, "loss": 0.0061, "step": 189790 }, { "epoch": 2.74, "learning_rate": 1.9088527630055584e-05, "loss": 0.0077, "step": 189800 }, { "epoch": 2.74, "learning_rate": 1.9088479590317113e-05, "loss": 0.0061, "step": 189810 }, { "epoch": 2.74, "learning_rate": 1.9088431550578642e-05, "loss": 0.0102, "step": 189820 }, { "epoch": 2.74, "learning_rate": 1.908838351084017e-05, "loss": 0.0093, "step": 189830 }, { "epoch": 2.74, "learning_rate": 1.9088335471101698e-05, "loss": 0.0058, "step": 189840 }, { "epoch": 2.74, "learning_rate": 1.9088287431363227e-05, "loss": 0.0059, "step": 189850 }, { "epoch": 2.74, "learning_rate": 1.9088239391624753e-05, "loss": 0.0068, "step": 189860 }, { "epoch": 2.74, "learning_rate": 1.9088191351886282e-05, "loss": 0.0048, "step": 189870 }, { "epoch": 2.74, "learning_rate": 1.908814331214781e-05, "loss": 0.0071, "step": 189880 }, { "epoch": 2.74, "learning_rate": 1.908809527240934e-05, "loss": 0.0066, "step": 189890 }, { "epoch": 2.74, "learning_rate": 1.9088047232670866e-05, "loss": 0.0122, "step": 189900 }, { "epoch": 2.74, "learning_rate": 1.9087999192932396e-05, "loss": 0.0079, "step": 189910 }, { "epoch": 2.74, "learning_rate": 1.908795595716777e-05, "loss": 0.0112, "step": 189920 }, { "epoch": 2.74, "learning_rate": 1.90879079174293e-05, "loss": 0.0063, "step": 189930 }, { "epoch": 2.74, "learning_rate": 1.9087859877690826e-05, "loss": 0.0129, "step": 189940 }, { "epoch": 2.74, "learning_rate": 1.9087811837952355e-05, "loss": 0.0057, "step": 189950 }, { "epoch": 2.74, "learning_rate": 1.9087763798213884e-05, "loss": 0.0073, "step": 189960 }, { "epoch": 2.74, "learning_rate": 1.908771575847541e-05, "loss": 0.0039, "step": 189970 }, { "epoch": 2.74, "learning_rate": 1.908766771873694e-05, "loss": 0.0063, "step": 189980 }, { "epoch": 2.74, "learning_rate": 1.908761967899847e-05, "loss": 0.0052, "step": 189990 }, { "epoch": 2.74, "learning_rate": 1.9087571639259998e-05, "loss": 0.008, "step": 190000 }, { "epoch": 2.74, "learning_rate": 1.9087523599521524e-05, "loss": 0.007, "step": 190010 }, { "epoch": 2.74, "learning_rate": 1.9087475559783053e-05, "loss": 0.0079, "step": 190020 }, { "epoch": 2.74, "learning_rate": 1.9087427520044582e-05, "loss": 0.0053, "step": 190030 }, { "epoch": 2.74, "learning_rate": 1.908737948030611e-05, "loss": 0.0047, "step": 190040 }, { "epoch": 2.74, "learning_rate": 1.908733144056764e-05, "loss": 0.0083, "step": 190050 }, { "epoch": 2.74, "learning_rate": 1.908728340082917e-05, "loss": 0.0075, "step": 190060 }, { "epoch": 2.74, "learning_rate": 1.9087235361090696e-05, "loss": 0.0087, "step": 190070 }, { "epoch": 2.74, "learning_rate": 1.9087187321352225e-05, "loss": 0.0103, "step": 190080 }, { "epoch": 2.74, "learning_rate": 1.9087139281613754e-05, "loss": 0.0065, "step": 190090 }, { "epoch": 2.74, "learning_rate": 1.908709124187528e-05, "loss": 0.0094, "step": 190100 }, { "epoch": 2.74, "learning_rate": 1.908704320213681e-05, "loss": 0.0079, "step": 190110 }, { "epoch": 2.74, "learning_rate": 1.908699516239834e-05, "loss": 0.01, "step": 190120 }, { "epoch": 2.74, "learning_rate": 1.9086947122659868e-05, "loss": 0.0057, "step": 190130 }, { "epoch": 2.74, "learning_rate": 1.9086899082921394e-05, "loss": 0.0054, "step": 190140 }, { "epoch": 2.74, "learning_rate": 1.9086851043182923e-05, "loss": 0.007, "step": 190150 }, { "epoch": 2.74, "learning_rate": 1.9086803003444453e-05, "loss": 0.0097, "step": 190160 }, { "epoch": 2.74, "learning_rate": 1.9086754963705982e-05, "loss": 0.0048, "step": 190170 }, { "epoch": 2.74, "learning_rate": 1.9086706923967508e-05, "loss": 0.0066, "step": 190180 }, { "epoch": 2.74, "learning_rate": 1.9086658884229037e-05, "loss": 0.0085, "step": 190190 }, { "epoch": 2.74, "learning_rate": 1.9086610844490566e-05, "loss": 0.0063, "step": 190200 }, { "epoch": 2.74, "learning_rate": 1.9086562804752092e-05, "loss": 0.0079, "step": 190210 }, { "epoch": 2.74, "learning_rate": 1.908651476501362e-05, "loss": 0.0048, "step": 190220 }, { "epoch": 2.74, "learning_rate": 1.908646672527515e-05, "loss": 0.0062, "step": 190230 }, { "epoch": 2.74, "learning_rate": 1.908641868553668e-05, "loss": 0.0078, "step": 190240 }, { "epoch": 2.74, "learning_rate": 1.9086370645798206e-05, "loss": 0.0048, "step": 190250 }, { "epoch": 2.74, "learning_rate": 1.9086322606059735e-05, "loss": 0.0086, "step": 190260 }, { "epoch": 2.74, "learning_rate": 1.9086274566321264e-05, "loss": 0.0079, "step": 190270 }, { "epoch": 2.74, "learning_rate": 1.908622652658279e-05, "loss": 0.0065, "step": 190280 }, { "epoch": 2.74, "learning_rate": 1.908617848684432e-05, "loss": 0.0086, "step": 190290 }, { "epoch": 2.74, "learning_rate": 1.908613044710585e-05, "loss": 0.007, "step": 190300 }, { "epoch": 2.74, "learning_rate": 1.9086082407367378e-05, "loss": 0.0057, "step": 190310 }, { "epoch": 2.74, "learning_rate": 1.9086034367628904e-05, "loss": 0.0054, "step": 190320 }, { "epoch": 2.74, "learning_rate": 1.9085986327890433e-05, "loss": 0.0068, "step": 190330 }, { "epoch": 2.74, "learning_rate": 1.9085938288151962e-05, "loss": 0.0114, "step": 190340 }, { "epoch": 2.74, "learning_rate": 1.9085890248413492e-05, "loss": 0.0078, "step": 190350 }, { "epoch": 2.74, "learning_rate": 1.9085842208675018e-05, "loss": 0.0079, "step": 190360 }, { "epoch": 2.74, "learning_rate": 1.9085794168936547e-05, "loss": 0.0046, "step": 190370 }, { "epoch": 2.74, "learning_rate": 1.9085746129198076e-05, "loss": 0.0094, "step": 190380 }, { "epoch": 2.74, "learning_rate": 1.9085698089459602e-05, "loss": 0.0064, "step": 190390 }, { "epoch": 2.74, "learning_rate": 1.908565004972113e-05, "loss": 0.0058, "step": 190400 }, { "epoch": 2.74, "learning_rate": 1.908560200998266e-05, "loss": 0.0067, "step": 190410 }, { "epoch": 2.74, "learning_rate": 1.908555397024419e-05, "loss": 0.0105, "step": 190420 }, { "epoch": 2.74, "learning_rate": 1.9085505930505716e-05, "loss": 0.0066, "step": 190430 }, { "epoch": 2.74, "learning_rate": 1.9085457890767245e-05, "loss": 0.0051, "step": 190440 }, { "epoch": 2.74, "learning_rate": 1.9085409851028774e-05, "loss": 0.0062, "step": 190450 }, { "epoch": 2.74, "learning_rate": 1.9085366615264145e-05, "loss": 0.014, "step": 190460 }, { "epoch": 2.75, "learning_rate": 1.9085318575525675e-05, "loss": 0.0058, "step": 190470 }, { "epoch": 2.75, "learning_rate": 1.9085270535787204e-05, "loss": 0.0082, "step": 190480 }, { "epoch": 2.75, "learning_rate": 1.9085222496048733e-05, "loss": 0.0064, "step": 190490 }, { "epoch": 2.75, "learning_rate": 1.908517445631026e-05, "loss": 0.0076, "step": 190500 }, { "epoch": 2.75, "learning_rate": 1.908512641657179e-05, "loss": 0.006, "step": 190510 }, { "epoch": 2.75, "learning_rate": 1.9085078376833318e-05, "loss": 0.0059, "step": 190520 }, { "epoch": 2.75, "learning_rate": 1.9085030337094847e-05, "loss": 0.007, "step": 190530 }, { "epoch": 2.75, "learning_rate": 1.9084982297356373e-05, "loss": 0.0054, "step": 190540 }, { "epoch": 2.75, "learning_rate": 1.9084934257617906e-05, "loss": 0.0084, "step": 190550 }, { "epoch": 2.75, "learning_rate": 1.908488621787943e-05, "loss": 0.0049, "step": 190560 }, { "epoch": 2.75, "learning_rate": 1.908483817814096e-05, "loss": 0.0074, "step": 190570 }, { "epoch": 2.75, "learning_rate": 1.908479013840249e-05, "loss": 0.0041, "step": 190580 }, { "epoch": 2.75, "learning_rate": 1.9084742098664016e-05, "loss": 0.0061, "step": 190590 }, { "epoch": 2.75, "learning_rate": 1.9084694058925545e-05, "loss": 0.0087, "step": 190600 }, { "epoch": 2.75, "learning_rate": 1.9084646019187074e-05, "loss": 0.0056, "step": 190610 }, { "epoch": 2.75, "learning_rate": 1.9084597979448604e-05, "loss": 0.0063, "step": 190620 }, { "epoch": 2.75, "learning_rate": 1.908454993971013e-05, "loss": 0.0078, "step": 190630 }, { "epoch": 2.75, "learning_rate": 1.908450189997166e-05, "loss": 0.0063, "step": 190640 }, { "epoch": 2.75, "learning_rate": 1.9084453860233188e-05, "loss": 0.0102, "step": 190650 }, { "epoch": 2.75, "learning_rate": 1.9084405820494717e-05, "loss": 0.009, "step": 190660 }, { "epoch": 2.75, "learning_rate": 1.9084357780756243e-05, "loss": 0.0067, "step": 190670 }, { "epoch": 2.75, "learning_rate": 1.9084309741017772e-05, "loss": 0.0064, "step": 190680 }, { "epoch": 2.75, "learning_rate": 1.9084261701279302e-05, "loss": 0.0056, "step": 190690 }, { "epoch": 2.75, "learning_rate": 1.9084213661540828e-05, "loss": 0.0056, "step": 190700 }, { "epoch": 2.75, "learning_rate": 1.9084165621802357e-05, "loss": 0.0073, "step": 190710 }, { "epoch": 2.75, "learning_rate": 1.9084117582063886e-05, "loss": 0.0062, "step": 190720 }, { "epoch": 2.75, "learning_rate": 1.9084069542325415e-05, "loss": 0.0053, "step": 190730 }, { "epoch": 2.75, "learning_rate": 1.908402150258694e-05, "loss": 0.0043, "step": 190740 }, { "epoch": 2.75, "learning_rate": 1.908397346284847e-05, "loss": 0.0065, "step": 190750 }, { "epoch": 2.75, "learning_rate": 1.908392542311e-05, "loss": 0.0062, "step": 190760 }, { "epoch": 2.75, "learning_rate": 1.9083877383371526e-05, "loss": 0.0105, "step": 190770 }, { "epoch": 2.75, "learning_rate": 1.9083829343633055e-05, "loss": 0.0065, "step": 190780 }, { "epoch": 2.75, "learning_rate": 1.9083781303894584e-05, "loss": 0.0066, "step": 190790 }, { "epoch": 2.75, "learning_rate": 1.9083733264156114e-05, "loss": 0.0042, "step": 190800 }, { "epoch": 2.75, "learning_rate": 1.908368522441764e-05, "loss": 0.0045, "step": 190810 }, { "epoch": 2.75, "learning_rate": 1.908363718467917e-05, "loss": 0.0062, "step": 190820 }, { "epoch": 2.75, "learning_rate": 1.9083589144940698e-05, "loss": 0.0075, "step": 190830 }, { "epoch": 2.75, "learning_rate": 1.9083541105202227e-05, "loss": 0.0079, "step": 190840 }, { "epoch": 2.75, "learning_rate": 1.9083493065463753e-05, "loss": 0.0068, "step": 190850 }, { "epoch": 2.75, "learning_rate": 1.9083445025725282e-05, "loss": 0.008, "step": 190860 }, { "epoch": 2.75, "learning_rate": 1.908339698598681e-05, "loss": 0.0083, "step": 190870 }, { "epoch": 2.75, "learning_rate": 1.9083348946248338e-05, "loss": 0.0076, "step": 190880 }, { "epoch": 2.75, "learning_rate": 1.9083300906509867e-05, "loss": 0.0097, "step": 190890 }, { "epoch": 2.75, "learning_rate": 1.9083252866771396e-05, "loss": 0.0056, "step": 190900 }, { "epoch": 2.75, "learning_rate": 1.9083204827032925e-05, "loss": 0.0071, "step": 190910 }, { "epoch": 2.75, "learning_rate": 1.908315678729445e-05, "loss": 0.0048, "step": 190920 }, { "epoch": 2.75, "learning_rate": 1.908310874755598e-05, "loss": 0.008, "step": 190930 }, { "epoch": 2.75, "learning_rate": 1.908306070781751e-05, "loss": 0.0076, "step": 190940 }, { "epoch": 2.75, "learning_rate": 1.9083012668079036e-05, "loss": 0.0082, "step": 190950 }, { "epoch": 2.75, "learning_rate": 1.9082964628340565e-05, "loss": 0.0076, "step": 190960 }, { "epoch": 2.75, "learning_rate": 1.9082916588602094e-05, "loss": 0.0089, "step": 190970 }, { "epoch": 2.75, "learning_rate": 1.9082868548863623e-05, "loss": 0.011, "step": 190980 }, { "epoch": 2.75, "learning_rate": 1.908282050912515e-05, "loss": 0.0088, "step": 190990 }, { "epoch": 2.75, "learning_rate": 1.908277246938668e-05, "loss": 0.0064, "step": 191000 }, { "epoch": 2.75, "learning_rate": 1.9082724429648208e-05, "loss": 0.0053, "step": 191010 }, { "epoch": 2.75, "learning_rate": 1.9082676389909737e-05, "loss": 0.0041, "step": 191020 }, { "epoch": 2.75, "learning_rate": 1.9082628350171263e-05, "loss": 0.0092, "step": 191030 }, { "epoch": 2.75, "learning_rate": 1.9082580310432792e-05, "loss": 0.007, "step": 191040 }, { "epoch": 2.75, "learning_rate": 1.908253227069432e-05, "loss": 0.0069, "step": 191050 }, { "epoch": 2.75, "learning_rate": 1.9082484230955847e-05, "loss": 0.0052, "step": 191060 }, { "epoch": 2.75, "learning_rate": 1.9082436191217377e-05, "loss": 0.0072, "step": 191070 }, { "epoch": 2.75, "learning_rate": 1.9082388151478906e-05, "loss": 0.0074, "step": 191080 }, { "epoch": 2.75, "learning_rate": 1.9082340111740435e-05, "loss": 0.0083, "step": 191090 }, { "epoch": 2.75, "learning_rate": 1.908229207200196e-05, "loss": 0.005, "step": 191100 }, { "epoch": 2.75, "learning_rate": 1.908224403226349e-05, "loss": 0.0062, "step": 191110 }, { "epoch": 2.75, "learning_rate": 1.908219599252502e-05, "loss": 0.0078, "step": 191120 }, { "epoch": 2.75, "learning_rate": 1.9082147952786546e-05, "loss": 0.0061, "step": 191130 }, { "epoch": 2.75, "learning_rate": 1.9082099913048075e-05, "loss": 0.0065, "step": 191140 }, { "epoch": 2.75, "learning_rate": 1.9082051873309604e-05, "loss": 0.0055, "step": 191150 }, { "epoch": 2.75, "learning_rate": 1.9082003833571133e-05, "loss": 0.0054, "step": 191160 }, { "epoch": 2.76, "learning_rate": 1.908195579383266e-05, "loss": 0.0084, "step": 191170 }, { "epoch": 2.76, "learning_rate": 1.908190775409419e-05, "loss": 0.0044, "step": 191180 }, { "epoch": 2.76, "learning_rate": 1.9081859714355718e-05, "loss": 0.0057, "step": 191190 }, { "epoch": 2.76, "learning_rate": 1.9081811674617247e-05, "loss": 0.0043, "step": 191200 }, { "epoch": 2.76, "learning_rate": 1.9081763634878773e-05, "loss": 0.0069, "step": 191210 }, { "epoch": 2.76, "learning_rate": 1.9081715595140302e-05, "loss": 0.0082, "step": 191220 }, { "epoch": 2.76, "learning_rate": 1.908166755540183e-05, "loss": 0.009, "step": 191230 }, { "epoch": 2.76, "learning_rate": 1.9081619515663357e-05, "loss": 0.0065, "step": 191240 }, { "epoch": 2.76, "learning_rate": 1.9081571475924887e-05, "loss": 0.0074, "step": 191250 }, { "epoch": 2.76, "learning_rate": 1.9081523436186416e-05, "loss": 0.0089, "step": 191260 }, { "epoch": 2.76, "learning_rate": 1.9081475396447945e-05, "loss": 0.0082, "step": 191270 }, { "epoch": 2.76, "learning_rate": 1.908142735670947e-05, "loss": 0.0065, "step": 191280 }, { "epoch": 2.76, "learning_rate": 1.9081379316971e-05, "loss": 0.0079, "step": 191290 }, { "epoch": 2.76, "learning_rate": 1.908133127723253e-05, "loss": 0.0073, "step": 191300 }, { "epoch": 2.76, "learning_rate": 1.9081283237494055e-05, "loss": 0.008, "step": 191310 }, { "epoch": 2.76, "learning_rate": 1.9081235197755585e-05, "loss": 0.0055, "step": 191320 }, { "epoch": 2.76, "learning_rate": 1.9081187158017114e-05, "loss": 0.0061, "step": 191330 }, { "epoch": 2.76, "learning_rate": 1.9081139118278643e-05, "loss": 0.0071, "step": 191340 }, { "epoch": 2.76, "learning_rate": 1.908109107854017e-05, "loss": 0.0071, "step": 191350 }, { "epoch": 2.76, "learning_rate": 1.90810430388017e-05, "loss": 0.0058, "step": 191360 }, { "epoch": 2.76, "learning_rate": 1.9080994999063228e-05, "loss": 0.0063, "step": 191370 }, { "epoch": 2.76, "learning_rate": 1.9080946959324757e-05, "loss": 0.006, "step": 191380 }, { "epoch": 2.76, "learning_rate": 1.9080898919586283e-05, "loss": 0.011, "step": 191390 }, { "epoch": 2.76, "learning_rate": 1.9080850879847812e-05, "loss": 0.0065, "step": 191400 }, { "epoch": 2.76, "learning_rate": 1.908080284010934e-05, "loss": 0.0127, "step": 191410 }, { "epoch": 2.76, "learning_rate": 1.9080754800370867e-05, "loss": 0.0078, "step": 191420 }, { "epoch": 2.76, "learning_rate": 1.9080706760632397e-05, "loss": 0.0065, "step": 191430 }, { "epoch": 2.76, "learning_rate": 1.9080658720893926e-05, "loss": 0.0112, "step": 191440 }, { "epoch": 2.76, "learning_rate": 1.9080610681155455e-05, "loss": 0.0112, "step": 191450 }, { "epoch": 2.76, "learning_rate": 1.908056264141698e-05, "loss": 0.0048, "step": 191460 }, { "epoch": 2.76, "learning_rate": 1.908051460167851e-05, "loss": 0.01, "step": 191470 }, { "epoch": 2.76, "learning_rate": 1.908046656194004e-05, "loss": 0.0081, "step": 191480 }, { "epoch": 2.76, "learning_rate": 1.9080418522201565e-05, "loss": 0.006, "step": 191490 }, { "epoch": 2.76, "learning_rate": 1.9080370482463095e-05, "loss": 0.006, "step": 191500 }, { "epoch": 2.76, "learning_rate": 1.9080322442724624e-05, "loss": 0.0094, "step": 191510 }, { "epoch": 2.76, "learning_rate": 1.9080274402986153e-05, "loss": 0.0067, "step": 191520 }, { "epoch": 2.76, "learning_rate": 1.908022636324768e-05, "loss": 0.0079, "step": 191530 }, { "epoch": 2.76, "learning_rate": 1.908017832350921e-05, "loss": 0.0038, "step": 191540 }, { "epoch": 2.76, "learning_rate": 1.9080130283770738e-05, "loss": 0.0051, "step": 191550 }, { "epoch": 2.76, "learning_rate": 1.9080082244032267e-05, "loss": 0.0083, "step": 191560 }, { "epoch": 2.76, "learning_rate": 1.9080034204293793e-05, "loss": 0.0054, "step": 191570 }, { "epoch": 2.76, "learning_rate": 1.9079986164555322e-05, "loss": 0.0052, "step": 191580 }, { "epoch": 2.76, "learning_rate": 1.907993812481685e-05, "loss": 0.0066, "step": 191590 }, { "epoch": 2.76, "learning_rate": 1.9079890085078377e-05, "loss": 0.007, "step": 191600 }, { "epoch": 2.76, "learning_rate": 1.9079842045339906e-05, "loss": 0.0065, "step": 191610 }, { "epoch": 2.76, "learning_rate": 1.9079794005601436e-05, "loss": 0.0064, "step": 191620 }, { "epoch": 2.76, "learning_rate": 1.9079745965862965e-05, "loss": 0.0058, "step": 191630 }, { "epoch": 2.76, "learning_rate": 1.907969792612449e-05, "loss": 0.0061, "step": 191640 }, { "epoch": 2.76, "learning_rate": 1.907964988638602e-05, "loss": 0.0077, "step": 191650 }, { "epoch": 2.76, "learning_rate": 1.907960184664755e-05, "loss": 0.0076, "step": 191660 }, { "epoch": 2.76, "learning_rate": 1.9079553806909075e-05, "loss": 0.0081, "step": 191670 }, { "epoch": 2.76, "learning_rate": 1.9079505767170605e-05, "loss": 0.008, "step": 191680 }, { "epoch": 2.76, "learning_rate": 1.9079457727432134e-05, "loss": 0.0088, "step": 191690 }, { "epoch": 2.76, "learning_rate": 1.9079409687693663e-05, "loss": 0.0073, "step": 191700 }, { "epoch": 2.76, "learning_rate": 1.907936164795519e-05, "loss": 0.006, "step": 191710 }, { "epoch": 2.76, "learning_rate": 1.9079313608216718e-05, "loss": 0.004, "step": 191720 }, { "epoch": 2.76, "learning_rate": 1.9079265568478248e-05, "loss": 0.0062, "step": 191730 }, { "epoch": 2.76, "learning_rate": 1.9079217528739777e-05, "loss": 0.0085, "step": 191740 }, { "epoch": 2.76, "learning_rate": 1.9079169489001303e-05, "loss": 0.0084, "step": 191750 }, { "epoch": 2.76, "learning_rate": 1.9079121449262832e-05, "loss": 0.0076, "step": 191760 }, { "epoch": 2.76, "learning_rate": 1.907907340952436e-05, "loss": 0.0048, "step": 191770 }, { "epoch": 2.76, "learning_rate": 1.9079025369785887e-05, "loss": 0.0092, "step": 191780 }, { "epoch": 2.76, "learning_rate": 1.9078977330047416e-05, "loss": 0.0077, "step": 191790 }, { "epoch": 2.76, "learning_rate": 1.9078929290308946e-05, "loss": 0.0061, "step": 191800 }, { "epoch": 2.76, "learning_rate": 1.9078881250570475e-05, "loss": 0.01, "step": 191810 }, { "epoch": 2.76, "learning_rate": 1.9078833210832e-05, "loss": 0.005, "step": 191820 }, { "epoch": 2.76, "learning_rate": 1.907878517109353e-05, "loss": 0.0063, "step": 191830 }, { "epoch": 2.76, "learning_rate": 1.907873713135506e-05, "loss": 0.0078, "step": 191840 }, { "epoch": 2.76, "learning_rate": 1.9078689091616585e-05, "loss": 0.0056, "step": 191850 }, { "epoch": 2.77, "learning_rate": 1.9078641051878115e-05, "loss": 0.0068, "step": 191860 }, { "epoch": 2.77, "learning_rate": 1.9078593012139644e-05, "loss": 0.0045, "step": 191870 }, { "epoch": 2.77, "learning_rate": 1.9078544972401173e-05, "loss": 0.0053, "step": 191880 }, { "epoch": 2.77, "learning_rate": 1.90784969326627e-05, "loss": 0.0067, "step": 191890 }, { "epoch": 2.77, "learning_rate": 1.9078448892924228e-05, "loss": 0.0056, "step": 191900 }, { "epoch": 2.77, "learning_rate": 1.9078400853185757e-05, "loss": 0.0042, "step": 191910 }, { "epoch": 2.77, "learning_rate": 1.9078352813447287e-05, "loss": 0.0057, "step": 191920 }, { "epoch": 2.77, "learning_rate": 1.9078304773708813e-05, "loss": 0.0062, "step": 191930 }, { "epoch": 2.77, "learning_rate": 1.9078256733970342e-05, "loss": 0.0055, "step": 191940 }, { "epoch": 2.77, "learning_rate": 1.907820869423187e-05, "loss": 0.007, "step": 191950 }, { "epoch": 2.77, "learning_rate": 1.9078160654493397e-05, "loss": 0.0061, "step": 191960 }, { "epoch": 2.77, "learning_rate": 1.9078112614754926e-05, "loss": 0.0068, "step": 191970 }, { "epoch": 2.77, "learning_rate": 1.9078064575016456e-05, "loss": 0.0078, "step": 191980 }, { "epoch": 2.77, "learning_rate": 1.9078016535277985e-05, "loss": 0.0084, "step": 191990 }, { "epoch": 2.77, "learning_rate": 1.907796849553951e-05, "loss": 0.0056, "step": 192000 }, { "epoch": 2.77, "learning_rate": 1.907792045580104e-05, "loss": 0.0062, "step": 192010 }, { "epoch": 2.77, "learning_rate": 1.907787241606257e-05, "loss": 0.0069, "step": 192020 }, { "epoch": 2.77, "learning_rate": 1.9077824376324095e-05, "loss": 0.0049, "step": 192030 }, { "epoch": 2.77, "learning_rate": 1.9077776336585624e-05, "loss": 0.0056, "step": 192040 }, { "epoch": 2.77, "learning_rate": 1.9077728296847154e-05, "loss": 0.0049, "step": 192050 }, { "epoch": 2.77, "learning_rate": 1.9077680257108683e-05, "loss": 0.006, "step": 192060 }, { "epoch": 2.77, "learning_rate": 1.907763221737021e-05, "loss": 0.0069, "step": 192070 }, { "epoch": 2.77, "learning_rate": 1.9077584177631738e-05, "loss": 0.0073, "step": 192080 }, { "epoch": 2.77, "learning_rate": 1.9077536137893267e-05, "loss": 0.0062, "step": 192090 }, { "epoch": 2.77, "learning_rate": 1.9077488098154797e-05, "loss": 0.0064, "step": 192100 }, { "epoch": 2.77, "learning_rate": 1.9077440058416323e-05, "loss": 0.0078, "step": 192110 }, { "epoch": 2.77, "learning_rate": 1.9077392018677852e-05, "loss": 0.0058, "step": 192120 }, { "epoch": 2.77, "learning_rate": 1.907734397893938e-05, "loss": 0.0042, "step": 192130 }, { "epoch": 2.77, "learning_rate": 1.9077295939200907e-05, "loss": 0.0065, "step": 192140 }, { "epoch": 2.77, "learning_rate": 1.9077247899462436e-05, "loss": 0.0081, "step": 192150 }, { "epoch": 2.77, "learning_rate": 1.9077199859723966e-05, "loss": 0.0056, "step": 192160 }, { "epoch": 2.77, "learning_rate": 1.9077151819985495e-05, "loss": 0.0063, "step": 192170 }, { "epoch": 2.77, "learning_rate": 1.907710378024702e-05, "loss": 0.0091, "step": 192180 }, { "epoch": 2.77, "learning_rate": 1.907705574050855e-05, "loss": 0.005, "step": 192190 }, { "epoch": 2.77, "learning_rate": 1.907700770077008e-05, "loss": 0.0091, "step": 192200 }, { "epoch": 2.77, "learning_rate": 1.9076959661031605e-05, "loss": 0.0054, "step": 192210 }, { "epoch": 2.77, "learning_rate": 1.9076911621293134e-05, "loss": 0.0061, "step": 192220 }, { "epoch": 2.77, "learning_rate": 1.9076863581554664e-05, "loss": 0.0064, "step": 192230 }, { "epoch": 2.77, "learning_rate": 1.9076815541816193e-05, "loss": 0.0075, "step": 192240 }, { "epoch": 2.77, "learning_rate": 1.907676750207772e-05, "loss": 0.0062, "step": 192250 }, { "epoch": 2.77, "learning_rate": 1.9076719462339248e-05, "loss": 0.0066, "step": 192260 }, { "epoch": 2.77, "learning_rate": 1.9076671422600777e-05, "loss": 0.0102, "step": 192270 }, { "epoch": 2.77, "learning_rate": 1.9076623382862303e-05, "loss": 0.0051, "step": 192280 }, { "epoch": 2.77, "learning_rate": 1.9076575343123832e-05, "loss": 0.008, "step": 192290 }, { "epoch": 2.77, "learning_rate": 1.9076527303385362e-05, "loss": 0.0069, "step": 192300 }, { "epoch": 2.77, "learning_rate": 1.907647926364689e-05, "loss": 0.0057, "step": 192310 }, { "epoch": 2.77, "learning_rate": 1.9076431223908417e-05, "loss": 0.0074, "step": 192320 }, { "epoch": 2.77, "learning_rate": 1.9076383184169946e-05, "loss": 0.0082, "step": 192330 }, { "epoch": 2.77, "learning_rate": 1.9076335144431475e-05, "loss": 0.0098, "step": 192340 }, { "epoch": 2.77, "learning_rate": 1.9076287104693005e-05, "loss": 0.0088, "step": 192350 }, { "epoch": 2.77, "learning_rate": 1.907623906495453e-05, "loss": 0.0066, "step": 192360 }, { "epoch": 2.77, "learning_rate": 1.907619102521606e-05, "loss": 0.008, "step": 192370 }, { "epoch": 2.77, "learning_rate": 1.907614298547759e-05, "loss": 0.0074, "step": 192380 }, { "epoch": 2.77, "learning_rate": 1.9076094945739115e-05, "loss": 0.0068, "step": 192390 }, { "epoch": 2.77, "learning_rate": 1.9076046906000644e-05, "loss": 0.0099, "step": 192400 }, { "epoch": 2.77, "learning_rate": 1.9075998866262174e-05, "loss": 0.0079, "step": 192410 }, { "epoch": 2.77, "learning_rate": 1.9075950826523703e-05, "loss": 0.0082, "step": 192420 }, { "epoch": 2.77, "learning_rate": 1.907590278678523e-05, "loss": 0.0052, "step": 192430 }, { "epoch": 2.77, "learning_rate": 1.9075854747046758e-05, "loss": 0.0064, "step": 192440 }, { "epoch": 2.77, "learning_rate": 1.9075806707308287e-05, "loss": 0.0071, "step": 192450 }, { "epoch": 2.77, "learning_rate": 1.9075758667569813e-05, "loss": 0.0054, "step": 192460 }, { "epoch": 2.77, "learning_rate": 1.9075710627831342e-05, "loss": 0.0065, "step": 192470 }, { "epoch": 2.77, "learning_rate": 1.907566258809287e-05, "loss": 0.0064, "step": 192480 }, { "epoch": 2.77, "learning_rate": 1.90756145483544e-05, "loss": 0.0083, "step": 192490 }, { "epoch": 2.77, "learning_rate": 1.9075566508615927e-05, "loss": 0.0063, "step": 192500 }, { "epoch": 2.77, "learning_rate": 1.9075518468877456e-05, "loss": 0.008, "step": 192510 }, { "epoch": 2.77, "learning_rate": 1.9075470429138985e-05, "loss": 0.0074, "step": 192520 }, { "epoch": 2.77, "learning_rate": 1.9075422389400515e-05, "loss": 0.0076, "step": 192530 }, { "epoch": 2.77, "learning_rate": 1.907537434966204e-05, "loss": 0.0035, "step": 192540 }, { "epoch": 2.78, "learning_rate": 1.907532630992357e-05, "loss": 0.0085, "step": 192550 }, { "epoch": 2.78, "learning_rate": 1.90752782701851e-05, "loss": 0.0078, "step": 192560 }, { "epoch": 2.78, "learning_rate": 1.9075230230446625e-05, "loss": 0.008, "step": 192570 }, { "epoch": 2.78, "learning_rate": 1.9075182190708154e-05, "loss": 0.0053, "step": 192580 }, { "epoch": 2.78, "learning_rate": 1.9075134150969683e-05, "loss": 0.0049, "step": 192590 }, { "epoch": 2.78, "learning_rate": 1.9075086111231213e-05, "loss": 0.0055, "step": 192600 }, { "epoch": 2.78, "learning_rate": 1.907503807149274e-05, "loss": 0.0073, "step": 192610 }, { "epoch": 2.78, "learning_rate": 1.9074990031754268e-05, "loss": 0.0067, "step": 192620 }, { "epoch": 2.78, "learning_rate": 1.9074941992015797e-05, "loss": 0.0052, "step": 192630 }, { "epoch": 2.78, "learning_rate": 1.9074893952277323e-05, "loss": 0.0088, "step": 192640 }, { "epoch": 2.78, "learning_rate": 1.9074845912538852e-05, "loss": 0.006, "step": 192650 }, { "epoch": 2.78, "learning_rate": 1.907479787280038e-05, "loss": 0.0061, "step": 192660 }, { "epoch": 2.78, "learning_rate": 1.907474983306191e-05, "loss": 0.0051, "step": 192670 }, { "epoch": 2.78, "learning_rate": 1.9074701793323437e-05, "loss": 0.0056, "step": 192680 }, { "epoch": 2.78, "learning_rate": 1.9074653753584966e-05, "loss": 0.0072, "step": 192690 }, { "epoch": 2.78, "learning_rate": 1.9074605713846495e-05, "loss": 0.0066, "step": 192700 }, { "epoch": 2.78, "learning_rate": 1.9074557674108025e-05, "loss": 0.0078, "step": 192710 }, { "epoch": 2.78, "learning_rate": 1.907450963436955e-05, "loss": 0.0055, "step": 192720 }, { "epoch": 2.78, "learning_rate": 1.907446159463108e-05, "loss": 0.006, "step": 192730 }, { "epoch": 2.78, "learning_rate": 1.907441355489261e-05, "loss": 0.0115, "step": 192740 }, { "epoch": 2.78, "learning_rate": 1.9074365515154135e-05, "loss": 0.0052, "step": 192750 }, { "epoch": 2.78, "learning_rate": 1.9074317475415664e-05, "loss": 0.0069, "step": 192760 }, { "epoch": 2.78, "learning_rate": 1.9074269435677193e-05, "loss": 0.0083, "step": 192770 }, { "epoch": 2.78, "learning_rate": 1.9074221395938723e-05, "loss": 0.0071, "step": 192780 }, { "epoch": 2.78, "learning_rate": 1.907417335620025e-05, "loss": 0.0063, "step": 192790 }, { "epoch": 2.78, "learning_rate": 1.9074125316461778e-05, "loss": 0.0077, "step": 192800 }, { "epoch": 2.78, "learning_rate": 1.9074077276723307e-05, "loss": 0.0051, "step": 192810 }, { "epoch": 2.78, "learning_rate": 1.9074029236984833e-05, "loss": 0.0053, "step": 192820 }, { "epoch": 2.78, "learning_rate": 1.9073981197246362e-05, "loss": 0.0135, "step": 192830 }, { "epoch": 2.78, "learning_rate": 1.907393315750789e-05, "loss": 0.0074, "step": 192840 }, { "epoch": 2.78, "learning_rate": 1.907388511776942e-05, "loss": 0.0091, "step": 192850 }, { "epoch": 2.78, "learning_rate": 1.9073837078030947e-05, "loss": 0.0055, "step": 192860 }, { "epoch": 2.78, "learning_rate": 1.9073789038292476e-05, "loss": 0.0081, "step": 192870 }, { "epoch": 2.78, "learning_rate": 1.9073740998554005e-05, "loss": 0.0078, "step": 192880 }, { "epoch": 2.78, "learning_rate": 1.9073692958815534e-05, "loss": 0.0068, "step": 192890 }, { "epoch": 2.78, "learning_rate": 1.907364491907706e-05, "loss": 0.0053, "step": 192900 }, { "epoch": 2.78, "learning_rate": 1.907359687933859e-05, "loss": 0.0052, "step": 192910 }, { "epoch": 2.78, "learning_rate": 1.907354883960012e-05, "loss": 0.0074, "step": 192920 }, { "epoch": 2.78, "learning_rate": 1.9073500799861645e-05, "loss": 0.0061, "step": 192930 }, { "epoch": 2.78, "learning_rate": 1.9073452760123174e-05, "loss": 0.0062, "step": 192940 }, { "epoch": 2.78, "learning_rate": 1.9073404720384703e-05, "loss": 0.0048, "step": 192950 }, { "epoch": 2.78, "learning_rate": 1.9073356680646233e-05, "loss": 0.0087, "step": 192960 }, { "epoch": 2.78, "learning_rate": 1.907330864090776e-05, "loss": 0.0067, "step": 192970 }, { "epoch": 2.78, "learning_rate": 1.9073260601169288e-05, "loss": 0.0081, "step": 192980 }, { "epoch": 2.78, "learning_rate": 1.9073212561430817e-05, "loss": 0.0073, "step": 192990 }, { "epoch": 2.78, "learning_rate": 1.9073164521692343e-05, "loss": 0.0065, "step": 193000 }, { "epoch": 2.78, "learning_rate": 1.9073116481953872e-05, "loss": 0.0098, "step": 193010 }, { "epoch": 2.78, "learning_rate": 1.90730684422154e-05, "loss": 0.0068, "step": 193020 }, { "epoch": 2.78, "learning_rate": 1.907302040247693e-05, "loss": 0.0053, "step": 193030 }, { "epoch": 2.78, "learning_rate": 1.9072972362738457e-05, "loss": 0.0061, "step": 193040 }, { "epoch": 2.78, "learning_rate": 1.9072924322999986e-05, "loss": 0.004, "step": 193050 }, { "epoch": 2.78, "learning_rate": 1.9072876283261515e-05, "loss": 0.0054, "step": 193060 }, { "epoch": 2.78, "learning_rate": 1.9072828243523044e-05, "loss": 0.0053, "step": 193070 }, { "epoch": 2.78, "learning_rate": 1.907278020378457e-05, "loss": 0.0052, "step": 193080 }, { "epoch": 2.78, "learning_rate": 1.90727321640461e-05, "loss": 0.0061, "step": 193090 }, { "epoch": 2.78, "learning_rate": 1.907268412430763e-05, "loss": 0.0056, "step": 193100 }, { "epoch": 2.78, "learning_rate": 1.9072636084569158e-05, "loss": 0.0069, "step": 193110 }, { "epoch": 2.78, "learning_rate": 1.9072588044830687e-05, "loss": 0.0062, "step": 193120 }, { "epoch": 2.78, "learning_rate": 1.9072540005092217e-05, "loss": 0.0067, "step": 193130 }, { "epoch": 2.78, "learning_rate": 1.9072491965353742e-05, "loss": 0.0069, "step": 193140 }, { "epoch": 2.78, "learning_rate": 1.9072443925615272e-05, "loss": 0.0102, "step": 193150 }, { "epoch": 2.78, "learning_rate": 1.90723958858768e-05, "loss": 0.0049, "step": 193160 }, { "epoch": 2.78, "learning_rate": 1.9072347846138327e-05, "loss": 0.0061, "step": 193170 }, { "epoch": 2.78, "learning_rate": 1.9072299806399856e-05, "loss": 0.0053, "step": 193180 }, { "epoch": 2.78, "learning_rate": 1.9072251766661385e-05, "loss": 0.0053, "step": 193190 }, { "epoch": 2.78, "learning_rate": 1.9072203726922915e-05, "loss": 0.0048, "step": 193200 }, { "epoch": 2.78, "learning_rate": 1.907215568718444e-05, "loss": 0.0041, "step": 193210 }, { "epoch": 2.78, "learning_rate": 1.907210764744597e-05, "loss": 0.0076, "step": 193220 }, { "epoch": 2.78, "learning_rate": 1.90720596077075e-05, "loss": 0.0057, "step": 193230 }, { "epoch": 2.78, "learning_rate": 1.9072011567969025e-05, "loss": 0.0044, "step": 193240 }, { "epoch": 2.79, "learning_rate": 1.9071963528230554e-05, "loss": 0.0066, "step": 193250 }, { "epoch": 2.79, "learning_rate": 1.9071915488492084e-05, "loss": 0.0065, "step": 193260 }, { "epoch": 2.79, "learning_rate": 1.9071867448753613e-05, "loss": 0.0074, "step": 193270 }, { "epoch": 2.79, "learning_rate": 1.907181940901514e-05, "loss": 0.0092, "step": 193280 }, { "epoch": 2.79, "learning_rate": 1.9071771369276668e-05, "loss": 0.0056, "step": 193290 }, { "epoch": 2.79, "learning_rate": 1.9071723329538197e-05, "loss": 0.0063, "step": 193300 }, { "epoch": 2.79, "learning_rate": 1.9071675289799726e-05, "loss": 0.0086, "step": 193310 }, { "epoch": 2.79, "learning_rate": 1.9071627250061252e-05, "loss": 0.0058, "step": 193320 }, { "epoch": 2.79, "learning_rate": 1.907157921032278e-05, "loss": 0.0065, "step": 193330 }, { "epoch": 2.79, "learning_rate": 1.907153117058431e-05, "loss": 0.0059, "step": 193340 }, { "epoch": 2.79, "learning_rate": 1.9071483130845837e-05, "loss": 0.0061, "step": 193350 }, { "epoch": 2.79, "learning_rate": 1.9071435091107366e-05, "loss": 0.0055, "step": 193360 }, { "epoch": 2.79, "learning_rate": 1.9071387051368895e-05, "loss": 0.0059, "step": 193370 }, { "epoch": 2.79, "learning_rate": 1.9071339011630425e-05, "loss": 0.007, "step": 193380 }, { "epoch": 2.79, "learning_rate": 1.907129097189195e-05, "loss": 0.0103, "step": 193390 }, { "epoch": 2.79, "learning_rate": 1.907124293215348e-05, "loss": 0.0085, "step": 193400 }, { "epoch": 2.79, "learning_rate": 1.907119489241501e-05, "loss": 0.0059, "step": 193410 }, { "epoch": 2.79, "learning_rate": 1.9071146852676535e-05, "loss": 0.0096, "step": 193420 }, { "epoch": 2.79, "learning_rate": 1.9071098812938064e-05, "loss": 0.0091, "step": 193430 }, { "epoch": 2.79, "learning_rate": 1.9071050773199593e-05, "loss": 0.0071, "step": 193440 }, { "epoch": 2.79, "learning_rate": 1.9071002733461123e-05, "loss": 0.0049, "step": 193450 }, { "epoch": 2.79, "learning_rate": 1.907095469372265e-05, "loss": 0.0063, "step": 193460 }, { "epoch": 2.79, "learning_rate": 1.9070906653984178e-05, "loss": 0.0077, "step": 193470 }, { "epoch": 2.79, "learning_rate": 1.9070858614245707e-05, "loss": 0.0072, "step": 193480 }, { "epoch": 2.79, "learning_rate": 1.9070810574507236e-05, "loss": 0.0069, "step": 193490 }, { "epoch": 2.79, "learning_rate": 1.9070762534768762e-05, "loss": 0.0077, "step": 193500 }, { "epoch": 2.79, "learning_rate": 1.907071449503029e-05, "loss": 0.0072, "step": 193510 }, { "epoch": 2.79, "learning_rate": 1.907066645529182e-05, "loss": 0.008, "step": 193520 }, { "epoch": 2.79, "learning_rate": 1.9070618415553347e-05, "loss": 0.0062, "step": 193530 }, { "epoch": 2.79, "learning_rate": 1.9070570375814876e-05, "loss": 0.0056, "step": 193540 }, { "epoch": 2.79, "learning_rate": 1.9070522336076405e-05, "loss": 0.0056, "step": 193550 }, { "epoch": 2.79, "learning_rate": 1.9070474296337935e-05, "loss": 0.0091, "step": 193560 }, { "epoch": 2.79, "learning_rate": 1.907042625659946e-05, "loss": 0.0059, "step": 193570 }, { "epoch": 2.79, "learning_rate": 1.907037821686099e-05, "loss": 0.0095, "step": 193580 }, { "epoch": 2.79, "learning_rate": 1.907033017712252e-05, "loss": 0.0057, "step": 193590 }, { "epoch": 2.79, "learning_rate": 1.9070282137384045e-05, "loss": 0.0104, "step": 193600 }, { "epoch": 2.79, "learning_rate": 1.9070234097645574e-05, "loss": 0.0058, "step": 193610 }, { "epoch": 2.79, "learning_rate": 1.9070186057907103e-05, "loss": 0.0072, "step": 193620 }, { "epoch": 2.79, "learning_rate": 1.9070138018168633e-05, "loss": 0.0068, "step": 193630 }, { "epoch": 2.79, "learning_rate": 1.907008997843016e-05, "loss": 0.0057, "step": 193640 }, { "epoch": 2.79, "learning_rate": 1.9070041938691688e-05, "loss": 0.0079, "step": 193650 }, { "epoch": 2.79, "learning_rate": 1.9069993898953217e-05, "loss": 0.0062, "step": 193660 }, { "epoch": 2.79, "learning_rate": 1.9069945859214743e-05, "loss": 0.0082, "step": 193670 }, { "epoch": 2.79, "learning_rate": 1.9069897819476272e-05, "loss": 0.007, "step": 193680 }, { "epoch": 2.79, "learning_rate": 1.90698497797378e-05, "loss": 0.0079, "step": 193690 }, { "epoch": 2.79, "learning_rate": 1.906980173999933e-05, "loss": 0.004, "step": 193700 }, { "epoch": 2.79, "learning_rate": 1.9069753700260857e-05, "loss": 0.0057, "step": 193710 }, { "epoch": 2.79, "learning_rate": 1.9069705660522386e-05, "loss": 0.0059, "step": 193720 }, { "epoch": 2.79, "learning_rate": 1.9069657620783915e-05, "loss": 0.0054, "step": 193730 }, { "epoch": 2.79, "learning_rate": 1.9069609581045444e-05, "loss": 0.0086, "step": 193740 }, { "epoch": 2.79, "learning_rate": 1.906956154130697e-05, "loss": 0.0071, "step": 193750 }, { "epoch": 2.79, "learning_rate": 1.90695135015685e-05, "loss": 0.0074, "step": 193760 }, { "epoch": 2.79, "learning_rate": 1.906946546183003e-05, "loss": 0.0062, "step": 193770 }, { "epoch": 2.79, "learning_rate": 1.9069417422091555e-05, "loss": 0.0073, "step": 193780 }, { "epoch": 2.79, "learning_rate": 1.9069369382353084e-05, "loss": 0.0063, "step": 193790 }, { "epoch": 2.79, "learning_rate": 1.9069321342614613e-05, "loss": 0.0108, "step": 193800 }, { "epoch": 2.79, "learning_rate": 1.9069273302876143e-05, "loss": 0.0051, "step": 193810 }, { "epoch": 2.79, "learning_rate": 1.906922526313767e-05, "loss": 0.0078, "step": 193820 }, { "epoch": 2.79, "learning_rate": 1.9069177223399198e-05, "loss": 0.0094, "step": 193830 }, { "epoch": 2.79, "learning_rate": 1.9069129183660727e-05, "loss": 0.0055, "step": 193840 }, { "epoch": 2.79, "learning_rate": 1.9069081143922253e-05, "loss": 0.0064, "step": 193850 }, { "epoch": 2.79, "learning_rate": 1.9069033104183782e-05, "loss": 0.0059, "step": 193860 }, { "epoch": 2.79, "learning_rate": 1.906898506444531e-05, "loss": 0.0074, "step": 193870 }, { "epoch": 2.79, "learning_rate": 1.906893702470684e-05, "loss": 0.0078, "step": 193880 }, { "epoch": 2.79, "learning_rate": 1.9068888984968367e-05, "loss": 0.0061, "step": 193890 }, { "epoch": 2.79, "learning_rate": 1.9068840945229896e-05, "loss": 0.0078, "step": 193900 }, { "epoch": 2.79, "learning_rate": 1.9068792905491425e-05, "loss": 0.0092, "step": 193910 }, { "epoch": 2.79, "learning_rate": 1.9068744865752954e-05, "loss": 0.0054, "step": 193920 }, { "epoch": 2.79, "learning_rate": 1.906869682601448e-05, "loss": 0.0093, "step": 193930 }, { "epoch": 2.8, "learning_rate": 1.906864878627601e-05, "loss": 0.0067, "step": 193940 }, { "epoch": 2.8, "learning_rate": 1.906860074653754e-05, "loss": 0.0053, "step": 193950 }, { "epoch": 2.8, "learning_rate": 1.9068552706799065e-05, "loss": 0.0116, "step": 193960 }, { "epoch": 2.8, "learning_rate": 1.9068504667060594e-05, "loss": 0.0047, "step": 193970 }, { "epoch": 2.8, "learning_rate": 1.9068456627322123e-05, "loss": 0.0062, "step": 193980 }, { "epoch": 2.8, "learning_rate": 1.9068408587583652e-05, "loss": 0.0084, "step": 193990 }, { "epoch": 2.8, "learning_rate": 1.906836054784518e-05, "loss": 0.0074, "step": 194000 }, { "epoch": 2.8, "learning_rate": 1.9068312508106708e-05, "loss": 0.0069, "step": 194010 }, { "epoch": 2.8, "learning_rate": 1.9068264468368237e-05, "loss": 0.0058, "step": 194020 }, { "epoch": 2.8, "learning_rate": 1.9068216428629763e-05, "loss": 0.0057, "step": 194030 }, { "epoch": 2.8, "learning_rate": 1.9068168388891292e-05, "loss": 0.0075, "step": 194040 }, { "epoch": 2.8, "learning_rate": 1.906812034915282e-05, "loss": 0.0064, "step": 194050 }, { "epoch": 2.8, "learning_rate": 1.906807230941435e-05, "loss": 0.0068, "step": 194060 }, { "epoch": 2.8, "learning_rate": 1.9068024269675876e-05, "loss": 0.0084, "step": 194070 }, { "epoch": 2.8, "learning_rate": 1.9067976229937406e-05, "loss": 0.008, "step": 194080 }, { "epoch": 2.8, "learning_rate": 1.9067928190198935e-05, "loss": 0.0059, "step": 194090 }, { "epoch": 2.8, "learning_rate": 1.9067880150460464e-05, "loss": 0.0049, "step": 194100 }, { "epoch": 2.8, "learning_rate": 1.906783211072199e-05, "loss": 0.0066, "step": 194110 }, { "epoch": 2.8, "learning_rate": 1.906778407098352e-05, "loss": 0.0048, "step": 194120 }, { "epoch": 2.8, "learning_rate": 1.906773603124505e-05, "loss": 0.0073, "step": 194130 }, { "epoch": 2.8, "learning_rate": 1.9067687991506575e-05, "loss": 0.0097, "step": 194140 }, { "epoch": 2.8, "learning_rate": 1.9067639951768104e-05, "loss": 0.0039, "step": 194150 }, { "epoch": 2.8, "learning_rate": 1.9067591912029633e-05, "loss": 0.0051, "step": 194160 }, { "epoch": 2.8, "learning_rate": 1.9067543872291162e-05, "loss": 0.009, "step": 194170 }, { "epoch": 2.8, "learning_rate": 1.9067495832552688e-05, "loss": 0.0042, "step": 194180 }, { "epoch": 2.8, "learning_rate": 1.9067447792814218e-05, "loss": 0.0076, "step": 194190 }, { "epoch": 2.8, "learning_rate": 1.9067399753075747e-05, "loss": 0.0103, "step": 194200 }, { "epoch": 2.8, "learning_rate": 1.9067351713337273e-05, "loss": 0.0041, "step": 194210 }, { "epoch": 2.8, "learning_rate": 1.9067303673598802e-05, "loss": 0.0048, "step": 194220 }, { "epoch": 2.8, "learning_rate": 1.906725563386033e-05, "loss": 0.0072, "step": 194230 }, { "epoch": 2.8, "learning_rate": 1.906720759412186e-05, "loss": 0.0075, "step": 194240 }, { "epoch": 2.8, "learning_rate": 1.9067159554383386e-05, "loss": 0.01, "step": 194250 }, { "epoch": 2.8, "learning_rate": 1.9067111514644916e-05, "loss": 0.0109, "step": 194260 }, { "epoch": 2.8, "learning_rate": 1.9067063474906445e-05, "loss": 0.0077, "step": 194270 }, { "epoch": 2.8, "learning_rate": 1.9067015435167974e-05, "loss": 0.0044, "step": 194280 }, { "epoch": 2.8, "learning_rate": 1.90669673954295e-05, "loss": 0.007, "step": 194290 }, { "epoch": 2.8, "learning_rate": 1.906691935569103e-05, "loss": 0.0063, "step": 194300 }, { "epoch": 2.8, "learning_rate": 1.906687131595256e-05, "loss": 0.0064, "step": 194310 }, { "epoch": 2.8, "learning_rate": 1.9066823276214084e-05, "loss": 0.0059, "step": 194320 }, { "epoch": 2.8, "learning_rate": 1.9066775236475614e-05, "loss": 0.0134, "step": 194330 }, { "epoch": 2.8, "learning_rate": 1.9066727196737143e-05, "loss": 0.007, "step": 194340 }, { "epoch": 2.8, "learning_rate": 1.9066679156998672e-05, "loss": 0.006, "step": 194350 }, { "epoch": 2.8, "learning_rate": 1.9066631117260198e-05, "loss": 0.006, "step": 194360 }, { "epoch": 2.8, "learning_rate": 1.9066583077521727e-05, "loss": 0.0083, "step": 194370 }, { "epoch": 2.8, "learning_rate": 1.9066535037783257e-05, "loss": 0.0064, "step": 194380 }, { "epoch": 2.8, "learning_rate": 1.9066486998044783e-05, "loss": 0.0066, "step": 194390 }, { "epoch": 2.8, "learning_rate": 1.9066438958306312e-05, "loss": 0.0086, "step": 194400 }, { "epoch": 2.8, "learning_rate": 1.906639091856784e-05, "loss": 0.0107, "step": 194410 }, { "epoch": 2.8, "learning_rate": 1.906634287882937e-05, "loss": 0.0099, "step": 194420 }, { "epoch": 2.8, "learning_rate": 1.9066294839090896e-05, "loss": 0.0042, "step": 194430 }, { "epoch": 2.8, "learning_rate": 1.9066246799352426e-05, "loss": 0.0088, "step": 194440 }, { "epoch": 2.8, "learning_rate": 1.9066198759613955e-05, "loss": 0.0056, "step": 194450 }, { "epoch": 2.8, "learning_rate": 1.9066150719875484e-05, "loss": 0.006, "step": 194460 }, { "epoch": 2.8, "learning_rate": 1.906610268013701e-05, "loss": 0.0067, "step": 194470 }, { "epoch": 2.8, "learning_rate": 1.906605464039854e-05, "loss": 0.0106, "step": 194480 }, { "epoch": 2.8, "learning_rate": 1.906600660066007e-05, "loss": 0.0081, "step": 194490 }, { "epoch": 2.8, "learning_rate": 1.9065958560921594e-05, "loss": 0.0048, "step": 194500 }, { "epoch": 2.8, "learning_rate": 1.9065910521183124e-05, "loss": 0.0085, "step": 194510 }, { "epoch": 2.8, "learning_rate": 1.9065867285418502e-05, "loss": 0.0083, "step": 194520 }, { "epoch": 2.8, "learning_rate": 1.9065819245680028e-05, "loss": 0.0064, "step": 194530 }, { "epoch": 2.8, "learning_rate": 1.9065771205941557e-05, "loss": 0.0091, "step": 194540 }, { "epoch": 2.8, "learning_rate": 1.9065723166203086e-05, "loss": 0.007, "step": 194550 }, { "epoch": 2.8, "learning_rate": 1.9065675126464612e-05, "loss": 0.0057, "step": 194560 }, { "epoch": 2.8, "learning_rate": 1.906562708672614e-05, "loss": 0.0054, "step": 194570 }, { "epoch": 2.8, "learning_rate": 1.906557904698767e-05, "loss": 0.0064, "step": 194580 }, { "epoch": 2.8, "learning_rate": 1.90655310072492e-05, "loss": 0.0045, "step": 194590 }, { "epoch": 2.8, "learning_rate": 1.9065482967510726e-05, "loss": 0.0069, "step": 194600 }, { "epoch": 2.8, "learning_rate": 1.9065434927772255e-05, "loss": 0.0054, "step": 194610 }, { "epoch": 2.8, "learning_rate": 1.9065386888033784e-05, "loss": 0.0109, "step": 194620 }, { "epoch": 2.8, "learning_rate": 1.906533884829531e-05, "loss": 0.0036, "step": 194630 }, { "epoch": 2.81, "learning_rate": 1.906529080855684e-05, "loss": 0.0068, "step": 194640 }, { "epoch": 2.81, "learning_rate": 1.906524276881837e-05, "loss": 0.0084, "step": 194650 }, { "epoch": 2.81, "learning_rate": 1.9065194729079898e-05, "loss": 0.0084, "step": 194660 }, { "epoch": 2.81, "learning_rate": 1.9065146689341424e-05, "loss": 0.0056, "step": 194670 }, { "epoch": 2.81, "learning_rate": 1.9065098649602953e-05, "loss": 0.0059, "step": 194680 }, { "epoch": 2.81, "learning_rate": 1.9065050609864482e-05, "loss": 0.0058, "step": 194690 }, { "epoch": 2.81, "learning_rate": 1.906500257012601e-05, "loss": 0.0075, "step": 194700 }, { "epoch": 2.81, "learning_rate": 1.9064954530387537e-05, "loss": 0.0085, "step": 194710 }, { "epoch": 2.81, "learning_rate": 1.9064906490649067e-05, "loss": 0.0046, "step": 194720 }, { "epoch": 2.81, "learning_rate": 1.9064858450910596e-05, "loss": 0.0072, "step": 194730 }, { "epoch": 2.81, "learning_rate": 1.9064810411172122e-05, "loss": 0.006, "step": 194740 }, { "epoch": 2.81, "learning_rate": 1.906476237143365e-05, "loss": 0.009, "step": 194750 }, { "epoch": 2.81, "learning_rate": 1.906471433169518e-05, "loss": 0.0059, "step": 194760 }, { "epoch": 2.81, "learning_rate": 1.906466629195671e-05, "loss": 0.0067, "step": 194770 }, { "epoch": 2.81, "learning_rate": 1.9064618252218236e-05, "loss": 0.0072, "step": 194780 }, { "epoch": 2.81, "learning_rate": 1.9064570212479765e-05, "loss": 0.0048, "step": 194790 }, { "epoch": 2.81, "learning_rate": 1.9064522172741294e-05, "loss": 0.0093, "step": 194800 }, { "epoch": 2.81, "learning_rate": 1.906447413300282e-05, "loss": 0.0068, "step": 194810 }, { "epoch": 2.81, "learning_rate": 1.906442609326435e-05, "loss": 0.0064, "step": 194820 }, { "epoch": 2.81, "learning_rate": 1.906437805352588e-05, "loss": 0.0067, "step": 194830 }, { "epoch": 2.81, "learning_rate": 1.9064330013787408e-05, "loss": 0.0048, "step": 194840 }, { "epoch": 2.81, "learning_rate": 1.9064281974048934e-05, "loss": 0.0057, "step": 194850 }, { "epoch": 2.81, "learning_rate": 1.9064233934310463e-05, "loss": 0.0065, "step": 194860 }, { "epoch": 2.81, "learning_rate": 1.9064185894571992e-05, "loss": 0.0079, "step": 194870 }, { "epoch": 2.81, "learning_rate": 1.906413785483352e-05, "loss": 0.0069, "step": 194880 }, { "epoch": 2.81, "learning_rate": 1.9064089815095047e-05, "loss": 0.0065, "step": 194890 }, { "epoch": 2.81, "learning_rate": 1.9064041775356577e-05, "loss": 0.0053, "step": 194900 }, { "epoch": 2.81, "learning_rate": 1.9063993735618106e-05, "loss": 0.0075, "step": 194910 }, { "epoch": 2.81, "learning_rate": 1.9063945695879632e-05, "loss": 0.0063, "step": 194920 }, { "epoch": 2.81, "learning_rate": 1.906389765614116e-05, "loss": 0.0057, "step": 194930 }, { "epoch": 2.81, "learning_rate": 1.906384961640269e-05, "loss": 0.0056, "step": 194940 }, { "epoch": 2.81, "learning_rate": 1.906380157666422e-05, "loss": 0.0042, "step": 194950 }, { "epoch": 2.81, "learning_rate": 1.9063753536925746e-05, "loss": 0.0079, "step": 194960 }, { "epoch": 2.81, "learning_rate": 1.9063705497187275e-05, "loss": 0.005, "step": 194970 }, { "epoch": 2.81, "learning_rate": 1.9063657457448804e-05, "loss": 0.0072, "step": 194980 }, { "epoch": 2.81, "learning_rate": 1.906360941771033e-05, "loss": 0.0061, "step": 194990 }, { "epoch": 2.81, "learning_rate": 1.906356137797186e-05, "loss": 0.0038, "step": 195000 }, { "epoch": 2.81, "learning_rate": 1.906351333823339e-05, "loss": 0.006, "step": 195010 }, { "epoch": 2.81, "learning_rate": 1.9063465298494918e-05, "loss": 0.0044, "step": 195020 }, { "epoch": 2.81, "learning_rate": 1.9063417258756444e-05, "loss": 0.0071, "step": 195030 }, { "epoch": 2.81, "learning_rate": 1.9063369219017973e-05, "loss": 0.0092, "step": 195040 }, { "epoch": 2.81, "learning_rate": 1.9063321179279502e-05, "loss": 0.0061, "step": 195050 }, { "epoch": 2.81, "learning_rate": 1.906327313954103e-05, "loss": 0.0073, "step": 195060 }, { "epoch": 2.81, "learning_rate": 1.9063225099802557e-05, "loss": 0.0056, "step": 195070 }, { "epoch": 2.81, "learning_rate": 1.9063177060064087e-05, "loss": 0.0065, "step": 195080 }, { "epoch": 2.81, "learning_rate": 1.9063129020325616e-05, "loss": 0.0057, "step": 195090 }, { "epoch": 2.81, "learning_rate": 1.9063080980587142e-05, "loss": 0.0067, "step": 195100 }, { "epoch": 2.81, "learning_rate": 1.906303294084867e-05, "loss": 0.0079, "step": 195110 }, { "epoch": 2.81, "learning_rate": 1.90629849011102e-05, "loss": 0.007, "step": 195120 }, { "epoch": 2.81, "learning_rate": 1.906293686137173e-05, "loss": 0.0074, "step": 195130 }, { "epoch": 2.81, "learning_rate": 1.9062888821633255e-05, "loss": 0.0074, "step": 195140 }, { "epoch": 2.81, "learning_rate": 1.9062840781894785e-05, "loss": 0.0077, "step": 195150 }, { "epoch": 2.81, "learning_rate": 1.9062792742156314e-05, "loss": 0.0078, "step": 195160 }, { "epoch": 2.81, "learning_rate": 1.906274470241784e-05, "loss": 0.0085, "step": 195170 }, { "epoch": 2.81, "learning_rate": 1.906269666267937e-05, "loss": 0.0089, "step": 195180 }, { "epoch": 2.81, "learning_rate": 1.90626486229409e-05, "loss": 0.0056, "step": 195190 }, { "epoch": 2.81, "learning_rate": 1.9062600583202428e-05, "loss": 0.006, "step": 195200 }, { "epoch": 2.81, "learning_rate": 1.9062552543463954e-05, "loss": 0.0057, "step": 195210 }, { "epoch": 2.81, "learning_rate": 1.9062504503725483e-05, "loss": 0.0057, "step": 195220 }, { "epoch": 2.81, "learning_rate": 1.9062456463987012e-05, "loss": 0.0096, "step": 195230 }, { "epoch": 2.81, "learning_rate": 1.9062408424248538e-05, "loss": 0.007, "step": 195240 }, { "epoch": 2.81, "learning_rate": 1.9062360384510067e-05, "loss": 0.005, "step": 195250 }, { "epoch": 2.81, "learning_rate": 1.9062312344771597e-05, "loss": 0.0069, "step": 195260 }, { "epoch": 2.81, "learning_rate": 1.9062264305033126e-05, "loss": 0.0066, "step": 195270 }, { "epoch": 2.81, "learning_rate": 1.906221626529465e-05, "loss": 0.0067, "step": 195280 }, { "epoch": 2.81, "learning_rate": 1.906216822555618e-05, "loss": 0.0091, "step": 195290 }, { "epoch": 2.81, "learning_rate": 1.906212018581771e-05, "loss": 0.0052, "step": 195300 }, { "epoch": 2.81, "learning_rate": 1.906207214607924e-05, "loss": 0.0058, "step": 195310 }, { "epoch": 2.81, "learning_rate": 1.9062024106340765e-05, "loss": 0.0068, "step": 195320 }, { "epoch": 2.82, "learning_rate": 1.9061976066602295e-05, "loss": 0.0064, "step": 195330 }, { "epoch": 2.82, "learning_rate": 1.9061928026863824e-05, "loss": 0.0081, "step": 195340 }, { "epoch": 2.82, "learning_rate": 1.906187998712535e-05, "loss": 0.0051, "step": 195350 }, { "epoch": 2.82, "learning_rate": 1.906183194738688e-05, "loss": 0.0093, "step": 195360 }, { "epoch": 2.82, "learning_rate": 1.906178390764841e-05, "loss": 0.0078, "step": 195370 }, { "epoch": 2.82, "learning_rate": 1.9061735867909938e-05, "loss": 0.0149, "step": 195380 }, { "epoch": 2.82, "learning_rate": 1.9061687828171463e-05, "loss": 0.0069, "step": 195390 }, { "epoch": 2.82, "learning_rate": 1.9061639788432993e-05, "loss": 0.0069, "step": 195400 }, { "epoch": 2.82, "learning_rate": 1.9061591748694522e-05, "loss": 0.0083, "step": 195410 }, { "epoch": 2.82, "learning_rate": 1.9061543708956048e-05, "loss": 0.0096, "step": 195420 }, { "epoch": 2.82, "learning_rate": 1.9061495669217577e-05, "loss": 0.0081, "step": 195430 }, { "epoch": 2.82, "learning_rate": 1.9061447629479106e-05, "loss": 0.0045, "step": 195440 }, { "epoch": 2.82, "learning_rate": 1.9061399589740636e-05, "loss": 0.0062, "step": 195450 }, { "epoch": 2.82, "learning_rate": 1.906135155000216e-05, "loss": 0.0041, "step": 195460 }, { "epoch": 2.82, "learning_rate": 1.906130351026369e-05, "loss": 0.0042, "step": 195470 }, { "epoch": 2.82, "learning_rate": 1.906125547052522e-05, "loss": 0.01, "step": 195480 }, { "epoch": 2.82, "learning_rate": 1.906120743078675e-05, "loss": 0.005, "step": 195490 }, { "epoch": 2.82, "learning_rate": 1.9061159391048275e-05, "loss": 0.0054, "step": 195500 }, { "epoch": 2.82, "learning_rate": 1.9061111351309805e-05, "loss": 0.0045, "step": 195510 }, { "epoch": 2.82, "learning_rate": 1.9061063311571334e-05, "loss": 0.0054, "step": 195520 }, { "epoch": 2.82, "learning_rate": 1.906101527183286e-05, "loss": 0.0074, "step": 195530 }, { "epoch": 2.82, "learning_rate": 1.906096723209439e-05, "loss": 0.0061, "step": 195540 }, { "epoch": 2.82, "learning_rate": 1.9060919192355918e-05, "loss": 0.0071, "step": 195550 }, { "epoch": 2.82, "learning_rate": 1.9060871152617447e-05, "loss": 0.0081, "step": 195560 }, { "epoch": 2.82, "learning_rate": 1.9060823112878973e-05, "loss": 0.0063, "step": 195570 }, { "epoch": 2.82, "learning_rate": 1.9060775073140503e-05, "loss": 0.0051, "step": 195580 }, { "epoch": 2.82, "learning_rate": 1.9060727033402032e-05, "loss": 0.0065, "step": 195590 }, { "epoch": 2.82, "learning_rate": 1.9060678993663558e-05, "loss": 0.0076, "step": 195600 }, { "epoch": 2.82, "learning_rate": 1.9060630953925087e-05, "loss": 0.0078, "step": 195610 }, { "epoch": 2.82, "learning_rate": 1.9060582914186616e-05, "loss": 0.0078, "step": 195620 }, { "epoch": 2.82, "learning_rate": 1.9060534874448146e-05, "loss": 0.0045, "step": 195630 }, { "epoch": 2.82, "learning_rate": 1.906048683470967e-05, "loss": 0.008, "step": 195640 }, { "epoch": 2.82, "learning_rate": 1.90604387949712e-05, "loss": 0.0075, "step": 195650 }, { "epoch": 2.82, "learning_rate": 1.906039075523273e-05, "loss": 0.0082, "step": 195660 }, { "epoch": 2.82, "learning_rate": 1.906034271549426e-05, "loss": 0.0079, "step": 195670 }, { "epoch": 2.82, "learning_rate": 1.9060294675755785e-05, "loss": 0.0081, "step": 195680 }, { "epoch": 2.82, "learning_rate": 1.9060246636017314e-05, "loss": 0.007, "step": 195690 }, { "epoch": 2.82, "learning_rate": 1.9060198596278844e-05, "loss": 0.006, "step": 195700 }, { "epoch": 2.82, "learning_rate": 1.906015055654037e-05, "loss": 0.0072, "step": 195710 }, { "epoch": 2.82, "learning_rate": 1.90601025168019e-05, "loss": 0.0086, "step": 195720 }, { "epoch": 2.82, "learning_rate": 1.9060054477063428e-05, "loss": 0.0095, "step": 195730 }, { "epoch": 2.82, "learning_rate": 1.9060006437324957e-05, "loss": 0.0072, "step": 195740 }, { "epoch": 2.82, "learning_rate": 1.9059958397586483e-05, "loss": 0.0054, "step": 195750 }, { "epoch": 2.82, "learning_rate": 1.9059910357848013e-05, "loss": 0.0056, "step": 195760 }, { "epoch": 2.82, "learning_rate": 1.9059862318109542e-05, "loss": 0.0065, "step": 195770 }, { "epoch": 2.82, "learning_rate": 1.9059814278371068e-05, "loss": 0.0041, "step": 195780 }, { "epoch": 2.82, "learning_rate": 1.9059766238632597e-05, "loss": 0.0076, "step": 195790 }, { "epoch": 2.82, "learning_rate": 1.9059718198894126e-05, "loss": 0.0075, "step": 195800 }, { "epoch": 2.82, "learning_rate": 1.9059670159155656e-05, "loss": 0.0081, "step": 195810 }, { "epoch": 2.82, "learning_rate": 1.905962211941718e-05, "loss": 0.007, "step": 195820 }, { "epoch": 2.82, "learning_rate": 1.905957407967871e-05, "loss": 0.0091, "step": 195830 }, { "epoch": 2.82, "learning_rate": 1.905952603994024e-05, "loss": 0.0045, "step": 195840 }, { "epoch": 2.82, "learning_rate": 1.905947800020177e-05, "loss": 0.0079, "step": 195850 }, { "epoch": 2.82, "learning_rate": 1.9059429960463295e-05, "loss": 0.0101, "step": 195860 }, { "epoch": 2.82, "learning_rate": 1.9059381920724824e-05, "loss": 0.005, "step": 195870 }, { "epoch": 2.82, "learning_rate": 1.9059333880986354e-05, "loss": 0.0074, "step": 195880 }, { "epoch": 2.82, "learning_rate": 1.905928584124788e-05, "loss": 0.0061, "step": 195890 }, { "epoch": 2.82, "learning_rate": 1.905923780150941e-05, "loss": 0.0077, "step": 195900 }, { "epoch": 2.82, "learning_rate": 1.9059189761770938e-05, "loss": 0.0063, "step": 195910 }, { "epoch": 2.82, "learning_rate": 1.9059141722032467e-05, "loss": 0.0055, "step": 195920 }, { "epoch": 2.82, "learning_rate": 1.9059093682293993e-05, "loss": 0.007, "step": 195930 }, { "epoch": 2.82, "learning_rate": 1.9059045642555522e-05, "loss": 0.0067, "step": 195940 }, { "epoch": 2.82, "learning_rate": 1.9058997602817052e-05, "loss": 0.0089, "step": 195950 }, { "epoch": 2.82, "learning_rate": 1.9058949563078578e-05, "loss": 0.0079, "step": 195960 }, { "epoch": 2.82, "learning_rate": 1.9058901523340107e-05, "loss": 0.0171, "step": 195970 }, { "epoch": 2.82, "learning_rate": 1.9058853483601636e-05, "loss": 0.0079, "step": 195980 }, { "epoch": 2.82, "learning_rate": 1.9058805443863165e-05, "loss": 0.0047, "step": 195990 }, { "epoch": 2.82, "learning_rate": 1.905875740412469e-05, "loss": 0.0074, "step": 196000 }, { "epoch": 2.82, "learning_rate": 1.905870936438622e-05, "loss": 0.0059, "step": 196010 }, { "epoch": 2.83, "learning_rate": 1.905866132464775e-05, "loss": 0.0069, "step": 196020 }, { "epoch": 2.83, "learning_rate": 1.905861328490928e-05, "loss": 0.004, "step": 196030 }, { "epoch": 2.83, "learning_rate": 1.9058565245170805e-05, "loss": 0.0066, "step": 196040 }, { "epoch": 2.83, "learning_rate": 1.9058517205432334e-05, "loss": 0.0053, "step": 196050 }, { "epoch": 2.83, "learning_rate": 1.9058469165693864e-05, "loss": 0.0033, "step": 196060 }, { "epoch": 2.83, "learning_rate": 1.905842112595539e-05, "loss": 0.0065, "step": 196070 }, { "epoch": 2.83, "learning_rate": 1.905837308621692e-05, "loss": 0.0088, "step": 196080 }, { "epoch": 2.83, "learning_rate": 1.9058325046478448e-05, "loss": 0.0052, "step": 196090 }, { "epoch": 2.83, "learning_rate": 1.9058277006739977e-05, "loss": 0.0075, "step": 196100 }, { "epoch": 2.83, "learning_rate": 1.9058228967001503e-05, "loss": 0.0078, "step": 196110 }, { "epoch": 2.83, "learning_rate": 1.9058180927263032e-05, "loss": 0.0037, "step": 196120 }, { "epoch": 2.83, "learning_rate": 1.905813288752456e-05, "loss": 0.0065, "step": 196130 }, { "epoch": 2.83, "learning_rate": 1.9058084847786088e-05, "loss": 0.0045, "step": 196140 }, { "epoch": 2.83, "learning_rate": 1.9058036808047617e-05, "loss": 0.0078, "step": 196150 }, { "epoch": 2.83, "learning_rate": 1.9057988768309146e-05, "loss": 0.0119, "step": 196160 }, { "epoch": 2.83, "learning_rate": 1.9057940728570675e-05, "loss": 0.0202, "step": 196170 }, { "epoch": 2.83, "learning_rate": 1.90578926888322e-05, "loss": 0.0076, "step": 196180 }, { "epoch": 2.83, "learning_rate": 1.9057844649093734e-05, "loss": 0.0067, "step": 196190 }, { "epoch": 2.83, "learning_rate": 1.905779660935526e-05, "loss": 0.0061, "step": 196200 }, { "epoch": 2.83, "learning_rate": 1.905774856961679e-05, "loss": 0.0085, "step": 196210 }, { "epoch": 2.83, "learning_rate": 1.905770052987832e-05, "loss": 0.008, "step": 196220 }, { "epoch": 2.83, "learning_rate": 1.9057652490139848e-05, "loss": 0.0064, "step": 196230 }, { "epoch": 2.83, "learning_rate": 1.9057604450401373e-05, "loss": 0.0076, "step": 196240 }, { "epoch": 2.83, "learning_rate": 1.9057556410662903e-05, "loss": 0.0056, "step": 196250 }, { "epoch": 2.83, "learning_rate": 1.9057508370924432e-05, "loss": 0.008, "step": 196260 }, { "epoch": 2.83, "learning_rate": 1.905746033118596e-05, "loss": 0.0066, "step": 196270 }, { "epoch": 2.83, "learning_rate": 1.9057412291447487e-05, "loss": 0.0073, "step": 196280 }, { "epoch": 2.83, "learning_rate": 1.9057364251709016e-05, "loss": 0.0079, "step": 196290 }, { "epoch": 2.83, "learning_rate": 1.9057316211970546e-05, "loss": 0.0084, "step": 196300 }, { "epoch": 2.83, "learning_rate": 1.905726817223207e-05, "loss": 0.0054, "step": 196310 }, { "epoch": 2.83, "learning_rate": 1.90572201324936e-05, "loss": 0.0058, "step": 196320 }, { "epoch": 2.83, "learning_rate": 1.905717209275513e-05, "loss": 0.0059, "step": 196330 }, { "epoch": 2.83, "learning_rate": 1.905712405301666e-05, "loss": 0.0042, "step": 196340 }, { "epoch": 2.83, "learning_rate": 1.9057076013278185e-05, "loss": 0.0075, "step": 196350 }, { "epoch": 2.83, "learning_rate": 1.9057027973539715e-05, "loss": 0.0061, "step": 196360 }, { "epoch": 2.83, "learning_rate": 1.9056979933801244e-05, "loss": 0.0069, "step": 196370 }, { "epoch": 2.83, "learning_rate": 1.905693189406277e-05, "loss": 0.007, "step": 196380 }, { "epoch": 2.83, "learning_rate": 1.90568838543243e-05, "loss": 0.0063, "step": 196390 }, { "epoch": 2.83, "learning_rate": 1.9056835814585828e-05, "loss": 0.0049, "step": 196400 }, { "epoch": 2.83, "learning_rate": 1.9056787774847357e-05, "loss": 0.0047, "step": 196410 }, { "epoch": 2.83, "learning_rate": 1.9056739735108883e-05, "loss": 0.0056, "step": 196420 }, { "epoch": 2.83, "learning_rate": 1.9056691695370413e-05, "loss": 0.0047, "step": 196430 }, { "epoch": 2.83, "learning_rate": 1.9056643655631942e-05, "loss": 0.0089, "step": 196440 }, { "epoch": 2.83, "learning_rate": 1.905659561589347e-05, "loss": 0.0074, "step": 196450 }, { "epoch": 2.83, "learning_rate": 1.9056547576154997e-05, "loss": 0.0092, "step": 196460 }, { "epoch": 2.83, "learning_rate": 1.9056499536416526e-05, "loss": 0.0051, "step": 196470 }, { "epoch": 2.83, "learning_rate": 1.9056451496678056e-05, "loss": 0.005, "step": 196480 }, { "epoch": 2.83, "learning_rate": 1.905640345693958e-05, "loss": 0.0082, "step": 196490 }, { "epoch": 2.83, "learning_rate": 1.905635541720111e-05, "loss": 0.0079, "step": 196500 }, { "epoch": 2.83, "learning_rate": 1.905630737746264e-05, "loss": 0.0076, "step": 196510 }, { "epoch": 2.83, "learning_rate": 1.905625933772417e-05, "loss": 0.0049, "step": 196520 }, { "epoch": 2.83, "learning_rate": 1.9056211297985695e-05, "loss": 0.0044, "step": 196530 }, { "epoch": 2.83, "learning_rate": 1.9056163258247224e-05, "loss": 0.0063, "step": 196540 }, { "epoch": 2.83, "learning_rate": 1.9056115218508754e-05, "loss": 0.0052, "step": 196550 }, { "epoch": 2.83, "learning_rate": 1.905606717877028e-05, "loss": 0.0098, "step": 196560 }, { "epoch": 2.83, "learning_rate": 1.905601913903181e-05, "loss": 0.0068, "step": 196570 }, { "epoch": 2.83, "learning_rate": 1.9055971099293338e-05, "loss": 0.0066, "step": 196580 }, { "epoch": 2.83, "learning_rate": 1.9055923059554867e-05, "loss": 0.008, "step": 196590 }, { "epoch": 2.83, "learning_rate": 1.9055875019816393e-05, "loss": 0.0086, "step": 196600 }, { "epoch": 2.83, "learning_rate": 1.9055826980077923e-05, "loss": 0.0082, "step": 196610 }, { "epoch": 2.83, "learning_rate": 1.9055778940339452e-05, "loss": 0.0057, "step": 196620 }, { "epoch": 2.83, "learning_rate": 1.9055730900600978e-05, "loss": 0.007, "step": 196630 }, { "epoch": 2.83, "learning_rate": 1.9055682860862507e-05, "loss": 0.0101, "step": 196640 }, { "epoch": 2.83, "learning_rate": 1.9055634821124036e-05, "loss": 0.0077, "step": 196650 }, { "epoch": 2.83, "learning_rate": 1.9055586781385566e-05, "loss": 0.0063, "step": 196660 }, { "epoch": 2.83, "learning_rate": 1.905553874164709e-05, "loss": 0.0087, "step": 196670 }, { "epoch": 2.83, "learning_rate": 1.905549070190862e-05, "loss": 0.0058, "step": 196680 }, { "epoch": 2.83, "learning_rate": 1.905544266217015e-05, "loss": 0.0058, "step": 196690 }, { "epoch": 2.83, "learning_rate": 1.905539462243168e-05, "loss": 0.0054, "step": 196700 }, { "epoch": 2.83, "learning_rate": 1.9055346582693205e-05, "loss": 0.0053, "step": 196710 }, { "epoch": 2.84, "learning_rate": 1.9055298542954734e-05, "loss": 0.0076, "step": 196720 }, { "epoch": 2.84, "learning_rate": 1.9055250503216264e-05, "loss": 0.0062, "step": 196730 }, { "epoch": 2.84, "learning_rate": 1.905520246347779e-05, "loss": 0.0071, "step": 196740 }, { "epoch": 2.84, "learning_rate": 1.905515442373932e-05, "loss": 0.0032, "step": 196750 }, { "epoch": 2.84, "learning_rate": 1.9055106384000848e-05, "loss": 0.0071, "step": 196760 }, { "epoch": 2.84, "learning_rate": 1.9055058344262377e-05, "loss": 0.0085, "step": 196770 }, { "epoch": 2.84, "learning_rate": 1.9055010304523903e-05, "loss": 0.0066, "step": 196780 }, { "epoch": 2.84, "learning_rate": 1.9054962264785432e-05, "loss": 0.0055, "step": 196790 }, { "epoch": 2.84, "learning_rate": 1.9054914225046962e-05, "loss": 0.0046, "step": 196800 }, { "epoch": 2.84, "learning_rate": 1.9054866185308488e-05, "loss": 0.0059, "step": 196810 }, { "epoch": 2.84, "learning_rate": 1.9054818145570017e-05, "loss": 0.0048, "step": 196820 }, { "epoch": 2.84, "learning_rate": 1.9054770105831546e-05, "loss": 0.0063, "step": 196830 }, { "epoch": 2.84, "learning_rate": 1.9054722066093075e-05, "loss": 0.0071, "step": 196840 }, { "epoch": 2.84, "learning_rate": 1.90546740263546e-05, "loss": 0.0083, "step": 196850 }, { "epoch": 2.84, "learning_rate": 1.905462598661613e-05, "loss": 0.0059, "step": 196860 }, { "epoch": 2.84, "learning_rate": 1.905457794687766e-05, "loss": 0.009, "step": 196870 }, { "epoch": 2.84, "learning_rate": 1.905452990713919e-05, "loss": 0.0066, "step": 196880 }, { "epoch": 2.84, "learning_rate": 1.9054481867400715e-05, "loss": 0.0085, "step": 196890 }, { "epoch": 2.84, "learning_rate": 1.9054433827662244e-05, "loss": 0.0057, "step": 196900 }, { "epoch": 2.84, "learning_rate": 1.9054385787923774e-05, "loss": 0.0062, "step": 196910 }, { "epoch": 2.84, "learning_rate": 1.90543377481853e-05, "loss": 0.0118, "step": 196920 }, { "epoch": 2.84, "learning_rate": 1.905428970844683e-05, "loss": 0.0059, "step": 196930 }, { "epoch": 2.84, "learning_rate": 1.9054241668708358e-05, "loss": 0.0079, "step": 196940 }, { "epoch": 2.84, "learning_rate": 1.9054193628969887e-05, "loss": 0.0057, "step": 196950 }, { "epoch": 2.84, "learning_rate": 1.9054145589231413e-05, "loss": 0.0065, "step": 196960 }, { "epoch": 2.84, "learning_rate": 1.9054097549492942e-05, "loss": 0.005, "step": 196970 }, { "epoch": 2.84, "learning_rate": 1.905404950975447e-05, "loss": 0.007, "step": 196980 }, { "epoch": 2.84, "learning_rate": 1.9054001470015998e-05, "loss": 0.0067, "step": 196990 }, { "epoch": 2.84, "learning_rate": 1.9053953430277527e-05, "loss": 0.0064, "step": 197000 }, { "epoch": 2.84, "learning_rate": 1.9053905390539056e-05, "loss": 0.0065, "step": 197010 }, { "epoch": 2.84, "learning_rate": 1.9053857350800585e-05, "loss": 0.0062, "step": 197020 }, { "epoch": 2.84, "learning_rate": 1.905380931106211e-05, "loss": 0.0047, "step": 197030 }, { "epoch": 2.84, "learning_rate": 1.905376127132364e-05, "loss": 0.0079, "step": 197040 }, { "epoch": 2.84, "learning_rate": 1.905371323158517e-05, "loss": 0.006, "step": 197050 }, { "epoch": 2.84, "learning_rate": 1.90536651918467e-05, "loss": 0.0077, "step": 197060 }, { "epoch": 2.84, "learning_rate": 1.9053617152108225e-05, "loss": 0.0071, "step": 197070 }, { "epoch": 2.84, "learning_rate": 1.9053573916343603e-05, "loss": 0.0045, "step": 197080 }, { "epoch": 2.84, "learning_rate": 1.905352587660513e-05, "loss": 0.0059, "step": 197090 }, { "epoch": 2.84, "learning_rate": 1.9053477836866658e-05, "loss": 0.0057, "step": 197100 }, { "epoch": 2.84, "learning_rate": 1.9053429797128187e-05, "loss": 0.0051, "step": 197110 }, { "epoch": 2.84, "learning_rate": 1.9053381757389717e-05, "loss": 0.0045, "step": 197120 }, { "epoch": 2.84, "learning_rate": 1.9053333717651243e-05, "loss": 0.0074, "step": 197130 }, { "epoch": 2.84, "learning_rate": 1.9053285677912772e-05, "loss": 0.0075, "step": 197140 }, { "epoch": 2.84, "learning_rate": 1.90532376381743e-05, "loss": 0.0104, "step": 197150 }, { "epoch": 2.84, "learning_rate": 1.9053189598435827e-05, "loss": 0.0062, "step": 197160 }, { "epoch": 2.84, "learning_rate": 1.9053141558697356e-05, "loss": 0.0057, "step": 197170 }, { "epoch": 2.84, "learning_rate": 1.9053093518958885e-05, "loss": 0.0065, "step": 197180 }, { "epoch": 2.84, "learning_rate": 1.9053045479220415e-05, "loss": 0.0049, "step": 197190 }, { "epoch": 2.84, "learning_rate": 1.905299743948194e-05, "loss": 0.0079, "step": 197200 }, { "epoch": 2.84, "learning_rate": 1.905294939974347e-05, "loss": 0.0072, "step": 197210 }, { "epoch": 2.84, "learning_rate": 1.9052901360005e-05, "loss": 0.0107, "step": 197220 }, { "epoch": 2.84, "learning_rate": 1.9052853320266525e-05, "loss": 0.008, "step": 197230 }, { "epoch": 2.84, "learning_rate": 1.9052805280528054e-05, "loss": 0.0058, "step": 197240 }, { "epoch": 2.84, "learning_rate": 1.9052757240789584e-05, "loss": 0.0057, "step": 197250 }, { "epoch": 2.84, "learning_rate": 1.9052709201051113e-05, "loss": 0.0045, "step": 197260 }, { "epoch": 2.84, "learning_rate": 1.905266116131264e-05, "loss": 0.0072, "step": 197270 }, { "epoch": 2.84, "learning_rate": 1.9052613121574168e-05, "loss": 0.0094, "step": 197280 }, { "epoch": 2.84, "learning_rate": 1.9052569885809543e-05, "loss": 0.0058, "step": 197290 }, { "epoch": 2.84, "learning_rate": 1.9052521846071072e-05, "loss": 0.0068, "step": 197300 }, { "epoch": 2.84, "learning_rate": 1.90524738063326e-05, "loss": 0.0066, "step": 197310 }, { "epoch": 2.84, "learning_rate": 1.905242576659413e-05, "loss": 0.0058, "step": 197320 }, { "epoch": 2.84, "learning_rate": 1.9052377726855656e-05, "loss": 0.0057, "step": 197330 }, { "epoch": 2.84, "learning_rate": 1.9052329687117186e-05, "loss": 0.0084, "step": 197340 }, { "epoch": 2.84, "learning_rate": 1.9052281647378715e-05, "loss": 0.0085, "step": 197350 }, { "epoch": 2.84, "learning_rate": 1.9052233607640244e-05, "loss": 0.007, "step": 197360 }, { "epoch": 2.84, "learning_rate": 1.905218556790177e-05, "loss": 0.0047, "step": 197370 }, { "epoch": 2.84, "learning_rate": 1.90521375281633e-05, "loss": 0.0071, "step": 197380 }, { "epoch": 2.84, "learning_rate": 1.905208948842483e-05, "loss": 0.0066, "step": 197390 }, { "epoch": 2.84, "learning_rate": 1.9052041448686354e-05, "loss": 0.0089, "step": 197400 }, { "epoch": 2.85, "learning_rate": 1.9051993408947884e-05, "loss": 0.0052, "step": 197410 }, { "epoch": 2.85, "learning_rate": 1.9051945369209413e-05, "loss": 0.006, "step": 197420 }, { "epoch": 2.85, "learning_rate": 1.9051897329470942e-05, "loss": 0.0061, "step": 197430 }, { "epoch": 2.85, "learning_rate": 1.9051849289732468e-05, "loss": 0.005, "step": 197440 }, { "epoch": 2.85, "learning_rate": 1.9051801249993997e-05, "loss": 0.0046, "step": 197450 }, { "epoch": 2.85, "learning_rate": 1.9051753210255527e-05, "loss": 0.0096, "step": 197460 }, { "epoch": 2.85, "learning_rate": 1.9051705170517053e-05, "loss": 0.0065, "step": 197470 }, { "epoch": 2.85, "learning_rate": 1.9051657130778582e-05, "loss": 0.0054, "step": 197480 }, { "epoch": 2.85, "learning_rate": 1.905160909104011e-05, "loss": 0.0066, "step": 197490 }, { "epoch": 2.85, "learning_rate": 1.905156105130164e-05, "loss": 0.0061, "step": 197500 }, { "epoch": 2.85, "learning_rate": 1.9051513011563166e-05, "loss": 0.0053, "step": 197510 }, { "epoch": 2.85, "learning_rate": 1.9051464971824696e-05, "loss": 0.0051, "step": 197520 }, { "epoch": 2.85, "learning_rate": 1.9051416932086225e-05, "loss": 0.0049, "step": 197530 }, { "epoch": 2.85, "learning_rate": 1.9051368892347754e-05, "loss": 0.0065, "step": 197540 }, { "epoch": 2.85, "learning_rate": 1.905132085260928e-05, "loss": 0.0068, "step": 197550 }, { "epoch": 2.85, "learning_rate": 1.905127281287081e-05, "loss": 0.0063, "step": 197560 }, { "epoch": 2.85, "learning_rate": 1.905122477313234e-05, "loss": 0.0089, "step": 197570 }, { "epoch": 2.85, "learning_rate": 1.9051176733393864e-05, "loss": 0.008, "step": 197580 }, { "epoch": 2.85, "learning_rate": 1.9051128693655394e-05, "loss": 0.0053, "step": 197590 }, { "epoch": 2.85, "learning_rate": 1.9051080653916923e-05, "loss": 0.0057, "step": 197600 }, { "epoch": 2.85, "learning_rate": 1.9051032614178452e-05, "loss": 0.0082, "step": 197610 }, { "epoch": 2.85, "learning_rate": 1.9050984574439978e-05, "loss": 0.004, "step": 197620 }, { "epoch": 2.85, "learning_rate": 1.9050936534701507e-05, "loss": 0.0052, "step": 197630 }, { "epoch": 2.85, "learning_rate": 1.9050888494963037e-05, "loss": 0.0054, "step": 197640 }, { "epoch": 2.85, "learning_rate": 1.9050840455224563e-05, "loss": 0.0073, "step": 197650 }, { "epoch": 2.85, "learning_rate": 1.9050792415486092e-05, "loss": 0.0091, "step": 197660 }, { "epoch": 2.85, "learning_rate": 1.905074437574762e-05, "loss": 0.005, "step": 197670 }, { "epoch": 2.85, "learning_rate": 1.905069633600915e-05, "loss": 0.0064, "step": 197680 }, { "epoch": 2.85, "learning_rate": 1.9050648296270676e-05, "loss": 0.008, "step": 197690 }, { "epoch": 2.85, "learning_rate": 1.9050600256532205e-05, "loss": 0.0096, "step": 197700 }, { "epoch": 2.85, "learning_rate": 1.9050552216793735e-05, "loss": 0.0053, "step": 197710 }, { "epoch": 2.85, "learning_rate": 1.9050504177055264e-05, "loss": 0.006, "step": 197720 }, { "epoch": 2.85, "learning_rate": 1.905045613731679e-05, "loss": 0.0053, "step": 197730 }, { "epoch": 2.85, "learning_rate": 1.905040809757832e-05, "loss": 0.0062, "step": 197740 }, { "epoch": 2.85, "learning_rate": 1.905036005783985e-05, "loss": 0.0064, "step": 197750 }, { "epoch": 2.85, "learning_rate": 1.9050312018101374e-05, "loss": 0.0078, "step": 197760 }, { "epoch": 2.85, "learning_rate": 1.9050263978362904e-05, "loss": 0.0065, "step": 197770 }, { "epoch": 2.85, "learning_rate": 1.9050215938624433e-05, "loss": 0.0072, "step": 197780 }, { "epoch": 2.85, "learning_rate": 1.9050167898885962e-05, "loss": 0.0055, "step": 197790 }, { "epoch": 2.85, "learning_rate": 1.9050119859147488e-05, "loss": 0.0066, "step": 197800 }, { "epoch": 2.85, "learning_rate": 1.9050071819409017e-05, "loss": 0.0084, "step": 197810 }, { "epoch": 2.85, "learning_rate": 1.9050023779670547e-05, "loss": 0.0072, "step": 197820 }, { "epoch": 2.85, "learning_rate": 1.9049975739932072e-05, "loss": 0.004, "step": 197830 }, { "epoch": 2.85, "learning_rate": 1.9049927700193602e-05, "loss": 0.0089, "step": 197840 }, { "epoch": 2.85, "learning_rate": 1.904987966045513e-05, "loss": 0.0077, "step": 197850 }, { "epoch": 2.85, "learning_rate": 1.904983162071666e-05, "loss": 0.0051, "step": 197860 }, { "epoch": 2.85, "learning_rate": 1.9049783580978186e-05, "loss": 0.007, "step": 197870 }, { "epoch": 2.85, "learning_rate": 1.9049735541239715e-05, "loss": 0.0066, "step": 197880 }, { "epoch": 2.85, "learning_rate": 1.9049687501501245e-05, "loss": 0.0069, "step": 197890 }, { "epoch": 2.85, "learning_rate": 1.9049639461762774e-05, "loss": 0.0081, "step": 197900 }, { "epoch": 2.85, "learning_rate": 1.90495914220243e-05, "loss": 0.0055, "step": 197910 }, { "epoch": 2.85, "learning_rate": 1.904954338228583e-05, "loss": 0.0058, "step": 197920 }, { "epoch": 2.85, "learning_rate": 1.904949534254736e-05, "loss": 0.0079, "step": 197930 }, { "epoch": 2.85, "learning_rate": 1.9049447302808884e-05, "loss": 0.0047, "step": 197940 }, { "epoch": 2.85, "learning_rate": 1.9049399263070413e-05, "loss": 0.0092, "step": 197950 }, { "epoch": 2.85, "learning_rate": 1.9049351223331943e-05, "loss": 0.0084, "step": 197960 }, { "epoch": 2.85, "learning_rate": 1.9049303183593472e-05, "loss": 0.008, "step": 197970 }, { "epoch": 2.85, "learning_rate": 1.9049255143854998e-05, "loss": 0.0055, "step": 197980 }, { "epoch": 2.85, "learning_rate": 1.9049207104116527e-05, "loss": 0.0064, "step": 197990 }, { "epoch": 2.85, "learning_rate": 1.9049159064378056e-05, "loss": 0.0064, "step": 198000 }, { "epoch": 2.85, "learning_rate": 1.9049111024639582e-05, "loss": 0.0079, "step": 198010 }, { "epoch": 2.85, "learning_rate": 1.904906298490111e-05, "loss": 0.0081, "step": 198020 }, { "epoch": 2.85, "learning_rate": 1.904901494516264e-05, "loss": 0.009, "step": 198030 }, { "epoch": 2.85, "learning_rate": 1.904896690542417e-05, "loss": 0.0074, "step": 198040 }, { "epoch": 2.85, "learning_rate": 1.9048918865685696e-05, "loss": 0.0051, "step": 198050 }, { "epoch": 2.85, "learning_rate": 1.9048870825947225e-05, "loss": 0.0053, "step": 198060 }, { "epoch": 2.85, "learning_rate": 1.9048822786208755e-05, "loss": 0.0069, "step": 198070 }, { "epoch": 2.85, "learning_rate": 1.904877474647028e-05, "loss": 0.0076, "step": 198080 }, { "epoch": 2.85, "learning_rate": 1.904872670673181e-05, "loss": 0.0065, "step": 198090 }, { "epoch": 2.86, "learning_rate": 1.904867866699334e-05, "loss": 0.0054, "step": 198100 }, { "epoch": 2.86, "learning_rate": 1.9048630627254868e-05, "loss": 0.007, "step": 198110 }, { "epoch": 2.86, "learning_rate": 1.9048582587516394e-05, "loss": 0.0066, "step": 198120 }, { "epoch": 2.86, "learning_rate": 1.9048534547777923e-05, "loss": 0.0113, "step": 198130 }, { "epoch": 2.86, "learning_rate": 1.9048486508039453e-05, "loss": 0.004, "step": 198140 }, { "epoch": 2.86, "learning_rate": 1.9048438468300982e-05, "loss": 0.0073, "step": 198150 }, { "epoch": 2.86, "learning_rate": 1.9048390428562508e-05, "loss": 0.0074, "step": 198160 }, { "epoch": 2.86, "learning_rate": 1.9048342388824037e-05, "loss": 0.0057, "step": 198170 }, { "epoch": 2.86, "learning_rate": 1.9048294349085566e-05, "loss": 0.0065, "step": 198180 }, { "epoch": 2.86, "learning_rate": 1.9048246309347092e-05, "loss": 0.0053, "step": 198190 }, { "epoch": 2.86, "learning_rate": 1.904819826960862e-05, "loss": 0.0051, "step": 198200 }, { "epoch": 2.86, "learning_rate": 1.904815022987015e-05, "loss": 0.0101, "step": 198210 }, { "epoch": 2.86, "learning_rate": 1.904810219013168e-05, "loss": 0.0093, "step": 198220 }, { "epoch": 2.86, "learning_rate": 1.9048054150393206e-05, "loss": 0.0081, "step": 198230 }, { "epoch": 2.86, "learning_rate": 1.9048006110654735e-05, "loss": 0.0062, "step": 198240 }, { "epoch": 2.86, "learning_rate": 1.9047958070916264e-05, "loss": 0.0074, "step": 198250 }, { "epoch": 2.86, "learning_rate": 1.904791003117779e-05, "loss": 0.0059, "step": 198260 }, { "epoch": 2.86, "learning_rate": 1.904786199143932e-05, "loss": 0.0058, "step": 198270 }, { "epoch": 2.86, "learning_rate": 1.904781395170085e-05, "loss": 0.0072, "step": 198280 }, { "epoch": 2.86, "learning_rate": 1.9047765911962378e-05, "loss": 0.0074, "step": 198290 }, { "epoch": 2.86, "learning_rate": 1.9047717872223904e-05, "loss": 0.0052, "step": 198300 }, { "epoch": 2.86, "learning_rate": 1.9047669832485433e-05, "loss": 0.0086, "step": 198310 }, { "epoch": 2.86, "learning_rate": 1.9047621792746963e-05, "loss": 0.007, "step": 198320 }, { "epoch": 2.86, "learning_rate": 1.9047573753008492e-05, "loss": 0.0067, "step": 198330 }, { "epoch": 2.86, "learning_rate": 1.9047525713270018e-05, "loss": 0.0079, "step": 198340 }, { "epoch": 2.86, "learning_rate": 1.9047477673531547e-05, "loss": 0.0049, "step": 198350 }, { "epoch": 2.86, "learning_rate": 1.9047429633793076e-05, "loss": 0.0074, "step": 198360 }, { "epoch": 2.86, "learning_rate": 1.9047381594054602e-05, "loss": 0.0046, "step": 198370 }, { "epoch": 2.86, "learning_rate": 1.904733355431613e-05, "loss": 0.0041, "step": 198380 }, { "epoch": 2.86, "learning_rate": 1.904729031855151e-05, "loss": 0.0071, "step": 198390 }, { "epoch": 2.86, "learning_rate": 1.9047242278813035e-05, "loss": 0.0062, "step": 198400 }, { "epoch": 2.86, "learning_rate": 1.9047194239074565e-05, "loss": 0.0081, "step": 198410 }, { "epoch": 2.86, "learning_rate": 1.9047146199336094e-05, "loss": 0.0067, "step": 198420 }, { "epoch": 2.86, "learning_rate": 1.904709815959762e-05, "loss": 0.0049, "step": 198430 }, { "epoch": 2.86, "learning_rate": 1.904705011985915e-05, "loss": 0.0086, "step": 198440 }, { "epoch": 2.86, "learning_rate": 1.904700208012068e-05, "loss": 0.0058, "step": 198450 }, { "epoch": 2.86, "learning_rate": 1.9046954040382208e-05, "loss": 0.0063, "step": 198460 }, { "epoch": 2.86, "learning_rate": 1.9046906000643733e-05, "loss": 0.0068, "step": 198470 }, { "epoch": 2.86, "learning_rate": 1.9046857960905263e-05, "loss": 0.0085, "step": 198480 }, { "epoch": 2.86, "learning_rate": 1.9046809921166792e-05, "loss": 0.0058, "step": 198490 }, { "epoch": 2.86, "learning_rate": 1.9046761881428318e-05, "loss": 0.0056, "step": 198500 }, { "epoch": 2.86, "learning_rate": 1.9046713841689847e-05, "loss": 0.0059, "step": 198510 }, { "epoch": 2.86, "learning_rate": 1.9046665801951376e-05, "loss": 0.009, "step": 198520 }, { "epoch": 2.86, "learning_rate": 1.9046617762212906e-05, "loss": 0.0078, "step": 198530 }, { "epoch": 2.86, "learning_rate": 1.904656972247443e-05, "loss": 0.0045, "step": 198540 }, { "epoch": 2.86, "learning_rate": 1.904652168273596e-05, "loss": 0.0063, "step": 198550 }, { "epoch": 2.86, "learning_rate": 1.904647364299749e-05, "loss": 0.008, "step": 198560 }, { "epoch": 2.86, "learning_rate": 1.904642560325902e-05, "loss": 0.0043, "step": 198570 }, { "epoch": 2.86, "learning_rate": 1.9046377563520545e-05, "loss": 0.0069, "step": 198580 }, { "epoch": 2.86, "learning_rate": 1.9046329523782075e-05, "loss": 0.0121, "step": 198590 }, { "epoch": 2.86, "learning_rate": 1.9046281484043604e-05, "loss": 0.0056, "step": 198600 }, { "epoch": 2.86, "learning_rate": 1.904623344430513e-05, "loss": 0.0064, "step": 198610 }, { "epoch": 2.86, "learning_rate": 1.904618540456666e-05, "loss": 0.0045, "step": 198620 }, { "epoch": 2.86, "learning_rate": 1.9046137364828188e-05, "loss": 0.0081, "step": 198630 }, { "epoch": 2.86, "learning_rate": 1.9046089325089718e-05, "loss": 0.0061, "step": 198640 }, { "epoch": 2.86, "learning_rate": 1.9046041285351243e-05, "loss": 0.0042, "step": 198650 }, { "epoch": 2.86, "learning_rate": 1.9045993245612773e-05, "loss": 0.0066, "step": 198660 }, { "epoch": 2.86, "learning_rate": 1.9045945205874302e-05, "loss": 0.0057, "step": 198670 }, { "epoch": 2.86, "learning_rate": 1.9045897166135828e-05, "loss": 0.0038, "step": 198680 }, { "epoch": 2.86, "learning_rate": 1.9045849126397357e-05, "loss": 0.0059, "step": 198690 }, { "epoch": 2.86, "learning_rate": 1.9045801086658886e-05, "loss": 0.0062, "step": 198700 }, { "epoch": 2.86, "learning_rate": 1.9045753046920416e-05, "loss": 0.0069, "step": 198710 }, { "epoch": 2.86, "learning_rate": 1.904570500718194e-05, "loss": 0.0063, "step": 198720 }, { "epoch": 2.86, "learning_rate": 1.904565696744347e-05, "loss": 0.0051, "step": 198730 }, { "epoch": 2.86, "learning_rate": 1.9045608927705e-05, "loss": 0.0048, "step": 198740 }, { "epoch": 2.86, "learning_rate": 1.904556088796653e-05, "loss": 0.0068, "step": 198750 }, { "epoch": 2.86, "learning_rate": 1.9045512848228055e-05, "loss": 0.0059, "step": 198760 }, { "epoch": 2.86, "learning_rate": 1.9045464808489584e-05, "loss": 0.0051, "step": 198770 }, { "epoch": 2.86, "learning_rate": 1.9045416768751114e-05, "loss": 0.0068, "step": 198780 }, { "epoch": 2.86, "learning_rate": 1.904536872901264e-05, "loss": 0.0075, "step": 198790 }, { "epoch": 2.87, "learning_rate": 1.904532068927417e-05, "loss": 0.0065, "step": 198800 }, { "epoch": 2.87, "learning_rate": 1.9045272649535698e-05, "loss": 0.008, "step": 198810 }, { "epoch": 2.87, "learning_rate": 1.9045224609797227e-05, "loss": 0.0064, "step": 198820 }, { "epoch": 2.87, "learning_rate": 1.9045176570058753e-05, "loss": 0.0048, "step": 198830 }, { "epoch": 2.87, "learning_rate": 1.9045128530320283e-05, "loss": 0.0108, "step": 198840 }, { "epoch": 2.87, "learning_rate": 1.9045080490581812e-05, "loss": 0.0071, "step": 198850 }, { "epoch": 2.87, "learning_rate": 1.9045032450843338e-05, "loss": 0.009, "step": 198860 }, { "epoch": 2.87, "learning_rate": 1.9044984411104867e-05, "loss": 0.0106, "step": 198870 }, { "epoch": 2.87, "learning_rate": 1.9044936371366396e-05, "loss": 0.0073, "step": 198880 }, { "epoch": 2.87, "learning_rate": 1.9044888331627926e-05, "loss": 0.0064, "step": 198890 }, { "epoch": 2.87, "learning_rate": 1.904484029188945e-05, "loss": 0.0082, "step": 198900 }, { "epoch": 2.87, "learning_rate": 1.904479225215098e-05, "loss": 0.0068, "step": 198910 }, { "epoch": 2.87, "learning_rate": 1.904474421241251e-05, "loss": 0.008, "step": 198920 }, { "epoch": 2.87, "learning_rate": 1.904469617267404e-05, "loss": 0.0085, "step": 198930 }, { "epoch": 2.87, "learning_rate": 1.9044648132935565e-05, "loss": 0.0065, "step": 198940 }, { "epoch": 2.87, "learning_rate": 1.9044600093197094e-05, "loss": 0.0062, "step": 198950 }, { "epoch": 2.87, "learning_rate": 1.9044552053458624e-05, "loss": 0.0041, "step": 198960 }, { "epoch": 2.87, "learning_rate": 1.904450401372015e-05, "loss": 0.0041, "step": 198970 }, { "epoch": 2.87, "learning_rate": 1.904445597398168e-05, "loss": 0.0081, "step": 198980 }, { "epoch": 2.87, "learning_rate": 1.9044407934243208e-05, "loss": 0.0092, "step": 198990 }, { "epoch": 2.87, "learning_rate": 1.9044359894504737e-05, "loss": 0.0059, "step": 199000 }, { "epoch": 2.87, "learning_rate": 1.9044311854766263e-05, "loss": 0.0046, "step": 199010 }, { "epoch": 2.87, "learning_rate": 1.9044263815027792e-05, "loss": 0.0064, "step": 199020 }, { "epoch": 2.87, "learning_rate": 1.9044215775289322e-05, "loss": 0.0067, "step": 199030 }, { "epoch": 2.87, "learning_rate": 1.9044167735550848e-05, "loss": 0.0054, "step": 199040 }, { "epoch": 2.87, "learning_rate": 1.9044119695812377e-05, "loss": 0.0057, "step": 199050 }, { "epoch": 2.87, "learning_rate": 1.9044071656073906e-05, "loss": 0.0067, "step": 199060 }, { "epoch": 2.87, "learning_rate": 1.9044023616335435e-05, "loss": 0.0055, "step": 199070 }, { "epoch": 2.87, "learning_rate": 1.904397557659696e-05, "loss": 0.0043, "step": 199080 }, { "epoch": 2.87, "learning_rate": 1.904392753685849e-05, "loss": 0.0047, "step": 199090 }, { "epoch": 2.87, "learning_rate": 1.904387949712002e-05, "loss": 0.0043, "step": 199100 }, { "epoch": 2.87, "learning_rate": 1.904383145738155e-05, "loss": 0.0043, "step": 199110 }, { "epoch": 2.87, "learning_rate": 1.9043783417643075e-05, "loss": 0.0088, "step": 199120 }, { "epoch": 2.87, "learning_rate": 1.9043735377904604e-05, "loss": 0.0058, "step": 199130 }, { "epoch": 2.87, "learning_rate": 1.9043687338166134e-05, "loss": 0.0068, "step": 199140 }, { "epoch": 2.87, "learning_rate": 1.904363929842766e-05, "loss": 0.0059, "step": 199150 }, { "epoch": 2.87, "learning_rate": 1.904359125868919e-05, "loss": 0.0073, "step": 199160 }, { "epoch": 2.87, "learning_rate": 1.9043543218950718e-05, "loss": 0.0052, "step": 199170 }, { "epoch": 2.87, "learning_rate": 1.9043495179212247e-05, "loss": 0.0053, "step": 199180 }, { "epoch": 2.87, "learning_rate": 1.9043447139473773e-05, "loss": 0.0052, "step": 199190 }, { "epoch": 2.87, "learning_rate": 1.9043399099735302e-05, "loss": 0.0101, "step": 199200 }, { "epoch": 2.87, "learning_rate": 1.904335105999683e-05, "loss": 0.0065, "step": 199210 }, { "epoch": 2.87, "learning_rate": 1.9043303020258358e-05, "loss": 0.0065, "step": 199220 }, { "epoch": 2.87, "learning_rate": 1.9043254980519887e-05, "loss": 0.0055, "step": 199230 }, { "epoch": 2.87, "learning_rate": 1.9043206940781416e-05, "loss": 0.0071, "step": 199240 }, { "epoch": 2.87, "learning_rate": 1.9043158901042945e-05, "loss": 0.0108, "step": 199250 }, { "epoch": 2.87, "learning_rate": 1.904311086130447e-05, "loss": 0.0053, "step": 199260 }, { "epoch": 2.87, "learning_rate": 1.9043062821566e-05, "loss": 0.0077, "step": 199270 }, { "epoch": 2.87, "learning_rate": 1.904301478182753e-05, "loss": 0.0075, "step": 199280 }, { "epoch": 2.87, "learning_rate": 1.904296674208906e-05, "loss": 0.0047, "step": 199290 }, { "epoch": 2.87, "learning_rate": 1.9042918702350585e-05, "loss": 0.0053, "step": 199300 }, { "epoch": 2.87, "learning_rate": 1.9042870662612114e-05, "loss": 0.005, "step": 199310 }, { "epoch": 2.87, "learning_rate": 1.9042822622873643e-05, "loss": 0.005, "step": 199320 }, { "epoch": 2.87, "learning_rate": 1.904277458313517e-05, "loss": 0.0035, "step": 199330 }, { "epoch": 2.87, "learning_rate": 1.90427265433967e-05, "loss": 0.0055, "step": 199340 }, { "epoch": 2.87, "learning_rate": 1.9042678503658228e-05, "loss": 0.0051, "step": 199350 }, { "epoch": 2.87, "learning_rate": 1.9042630463919757e-05, "loss": 0.0049, "step": 199360 }, { "epoch": 2.87, "learning_rate": 1.9042582424181283e-05, "loss": 0.0073, "step": 199370 }, { "epoch": 2.87, "learning_rate": 1.9042534384442812e-05, "loss": 0.0093, "step": 199380 }, { "epoch": 2.87, "learning_rate": 1.904248634470434e-05, "loss": 0.0164, "step": 199390 }, { "epoch": 2.87, "learning_rate": 1.9042438304965867e-05, "loss": 0.0091, "step": 199400 }, { "epoch": 2.87, "learning_rate": 1.9042390265227397e-05, "loss": 0.0082, "step": 199410 }, { "epoch": 2.87, "learning_rate": 1.9042342225488926e-05, "loss": 0.009, "step": 199420 }, { "epoch": 2.87, "learning_rate": 1.9042294185750455e-05, "loss": 0.0075, "step": 199430 }, { "epoch": 2.87, "learning_rate": 1.904224614601198e-05, "loss": 0.0048, "step": 199440 }, { "epoch": 2.87, "learning_rate": 1.904219810627351e-05, "loss": 0.0077, "step": 199450 }, { "epoch": 2.87, "learning_rate": 1.904215006653504e-05, "loss": 0.007, "step": 199460 }, { "epoch": 2.87, "learning_rate": 1.904210202679657e-05, "loss": 0.0064, "step": 199470 }, { "epoch": 2.87, "learning_rate": 1.9042053987058095e-05, "loss": 0.0055, "step": 199480 }, { "epoch": 2.88, "learning_rate": 1.9042005947319624e-05, "loss": 0.0082, "step": 199490 }, { "epoch": 2.88, "learning_rate": 1.9041957907581153e-05, "loss": 0.0072, "step": 199500 }, { "epoch": 2.88, "learning_rate": 1.904190986784268e-05, "loss": 0.0092, "step": 199510 }, { "epoch": 2.88, "learning_rate": 1.904186182810421e-05, "loss": 0.0057, "step": 199520 }, { "epoch": 2.88, "learning_rate": 1.9041813788365738e-05, "loss": 0.0034, "step": 199530 }, { "epoch": 2.88, "learning_rate": 1.9041765748627267e-05, "loss": 0.0071, "step": 199540 }, { "epoch": 2.88, "learning_rate": 1.9041717708888793e-05, "loss": 0.0089, "step": 199550 }, { "epoch": 2.88, "learning_rate": 1.9041669669150322e-05, "loss": 0.0063, "step": 199560 }, { "epoch": 2.88, "learning_rate": 1.904162162941185e-05, "loss": 0.0085, "step": 199570 }, { "epoch": 2.88, "learning_rate": 1.9041573589673377e-05, "loss": 0.0063, "step": 199580 }, { "epoch": 2.88, "learning_rate": 1.9041525549934907e-05, "loss": 0.0074, "step": 199590 }, { "epoch": 2.88, "learning_rate": 1.9041477510196436e-05, "loss": 0.005, "step": 199600 }, { "epoch": 2.88, "learning_rate": 1.9041429470457965e-05, "loss": 0.008, "step": 199610 }, { "epoch": 2.88, "learning_rate": 1.904138143071949e-05, "loss": 0.0046, "step": 199620 }, { "epoch": 2.88, "learning_rate": 1.904133339098102e-05, "loss": 0.0056, "step": 199630 }, { "epoch": 2.88, "learning_rate": 1.904128535124255e-05, "loss": 0.007, "step": 199640 }, { "epoch": 2.88, "learning_rate": 1.9041237311504075e-05, "loss": 0.0057, "step": 199650 }, { "epoch": 2.88, "learning_rate": 1.9041189271765605e-05, "loss": 0.0117, "step": 199660 }, { "epoch": 2.88, "learning_rate": 1.9041141232027134e-05, "loss": 0.0097, "step": 199670 }, { "epoch": 2.88, "learning_rate": 1.9041093192288663e-05, "loss": 0.0058, "step": 199680 }, { "epoch": 2.88, "learning_rate": 1.904104515255019e-05, "loss": 0.0053, "step": 199690 }, { "epoch": 2.88, "learning_rate": 1.904099711281172e-05, "loss": 0.0084, "step": 199700 }, { "epoch": 2.88, "learning_rate": 1.9040949073073248e-05, "loss": 0.0069, "step": 199710 }, { "epoch": 2.88, "learning_rate": 1.9040901033334777e-05, "loss": 0.0066, "step": 199720 }, { "epoch": 2.88, "learning_rate": 1.9040852993596303e-05, "loss": 0.0063, "step": 199730 }, { "epoch": 2.88, "learning_rate": 1.9040804953857832e-05, "loss": 0.0087, "step": 199740 }, { "epoch": 2.88, "learning_rate": 1.904075691411936e-05, "loss": 0.0073, "step": 199750 }, { "epoch": 2.88, "learning_rate": 1.9040708874380887e-05, "loss": 0.0079, "step": 199760 }, { "epoch": 2.88, "learning_rate": 1.9040660834642417e-05, "loss": 0.0077, "step": 199770 }, { "epoch": 2.88, "learning_rate": 1.9040612794903946e-05, "loss": 0.0076, "step": 199780 }, { "epoch": 2.88, "learning_rate": 1.9040564755165475e-05, "loss": 0.0073, "step": 199790 }, { "epoch": 2.88, "learning_rate": 1.9040516715427e-05, "loss": 0.0081, "step": 199800 }, { "epoch": 2.88, "learning_rate": 1.904046867568853e-05, "loss": 0.0072, "step": 199810 }, { "epoch": 2.88, "learning_rate": 1.904042063595006e-05, "loss": 0.0069, "step": 199820 }, { "epoch": 2.88, "learning_rate": 1.9040372596211585e-05, "loss": 0.0064, "step": 199830 }, { "epoch": 2.88, "learning_rate": 1.9040324556473115e-05, "loss": 0.0038, "step": 199840 }, { "epoch": 2.88, "learning_rate": 1.9040276516734644e-05, "loss": 0.0037, "step": 199850 }, { "epoch": 2.88, "learning_rate": 1.9040228476996173e-05, "loss": 0.0043, "step": 199860 }, { "epoch": 2.88, "learning_rate": 1.90401804372577e-05, "loss": 0.0068, "step": 199870 }, { "epoch": 2.88, "learning_rate": 1.904013239751923e-05, "loss": 0.0093, "step": 199880 }, { "epoch": 2.88, "learning_rate": 1.9040084357780758e-05, "loss": 0.0056, "step": 199890 }, { "epoch": 2.88, "learning_rate": 1.9040036318042287e-05, "loss": 0.0046, "step": 199900 }, { "epoch": 2.88, "learning_rate": 1.9039988278303813e-05, "loss": 0.0049, "step": 199910 }, { "epoch": 2.88, "learning_rate": 1.9039940238565342e-05, "loss": 0.0081, "step": 199920 }, { "epoch": 2.88, "learning_rate": 1.903989219882687e-05, "loss": 0.0056, "step": 199930 }, { "epoch": 2.88, "learning_rate": 1.9039844159088397e-05, "loss": 0.0056, "step": 199940 }, { "epoch": 2.88, "learning_rate": 1.9039796119349926e-05, "loss": 0.0105, "step": 199950 }, { "epoch": 2.88, "learning_rate": 1.9039748079611456e-05, "loss": 0.0093, "step": 199960 }, { "epoch": 2.88, "learning_rate": 1.9039700039872985e-05, "loss": 0.0053, "step": 199970 }, { "epoch": 2.88, "learning_rate": 1.903965200013451e-05, "loss": 0.0071, "step": 199980 }, { "epoch": 2.88, "learning_rate": 1.903960396039604e-05, "loss": 0.0036, "step": 199990 }, { "epoch": 2.88, "learning_rate": 1.903955592065757e-05, "loss": 0.004, "step": 200000 } ], "max_steps": 4163220, "num_train_epochs": 60, "total_flos": 1.2542511339243725e+18, "trial_name": null, "trial_params": null }