{"current_steps": 1, "total_steps": 113, "loss": 0.9875, "lr": 4.999033893736386e-05, "epoch": 0.008830022075055188, "percentage": 0.88, "elapsed_time": "0:02:59", "remaining_time": "5:34:56", "throughput": 11687.78, "total_tokens": 2097152} {"current_steps": 2, "total_steps": 113, "loss": 0.944, "lr": 4.99613632163459e-05, "epoch": 0.017660044150110375, "percentage": 1.77, "elapsed_time": "0:05:53", "remaining_time": "5:27:13", "throughput": 11856.46, "total_tokens": 4194304} {"current_steps": 3, "total_steps": 113, "loss": 0.904, "lr": 4.991309523184661e-05, "epoch": 0.026490066225165563, "percentage": 2.65, "elapsed_time": "0:08:43", "remaining_time": "5:20:09", "throughput": 12009.19, "total_tokens": 6291456} {"current_steps": 4, "total_steps": 113, "loss": 0.8913, "lr": 4.98455722894677e-05, "epoch": 0.03532008830022075, "percentage": 3.54, "elapsed_time": "0:11:34", "remaining_time": "5:15:26", "throughput": 12077.74, "total_tokens": 8388608} {"current_steps": 5, "total_steps": 113, "loss": 0.8511, "lr": 4.975884657667922e-05, "epoch": 0.04415011037527594, "percentage": 4.42, "elapsed_time": "0:14:24", "remaining_time": "5:11:10", "throughput": 12131.05, "total_tokens": 10485760} {"current_steps": 6, "total_steps": 113, "loss": 0.8311, "lr": 4.965298512248466e-05, "epoch": 0.052980132450331126, "percentage": 5.31, "elapsed_time": "0:17:14", "remaining_time": "5:07:33", "throughput": 12160.16, "total_tokens": 12582912} {"current_steps": 7, "total_steps": 113, "loss": 0.838, "lr": 4.952806974561518e-05, "epoch": 0.06181015452538632, "percentage": 6.19, "elapsed_time": "0:20:05", "remaining_time": "5:04:07", "throughput": 12182.29, "total_tokens": 14680064} {"current_steps": 8, "total_steps": 113, "loss": 0.8468, "lr": 4.9384196991293205e-05, "epoch": 0.0706401766004415, "percentage": 7.08, "elapsed_time": "0:22:54", "remaining_time": "5:00:41", "throughput": 12205.11, "total_tokens": 16777216} {"current_steps": 9, "total_steps": 113, "loss": 0.7884, "lr": 4.922147805661402e-05, "epoch": 0.07947019867549669, "percentage": 7.96, "elapsed_time": "0:25:44", "remaining_time": "4:57:22", "throughput": 12224.04, "total_tokens": 18874368} {"current_steps": 10, "total_steps": 113, "loss": 0.8009, "lr": 4.904003870460323e-05, "epoch": 0.08830022075055188, "percentage": 8.85, "elapsed_time": "0:28:34", "remaining_time": "4:54:16", "throughput": 12233.96, "total_tokens": 20971520} {"current_steps": 11, "total_steps": 113, "loss": 0.7764, "lr": 4.884001916701639e-05, "epoch": 0.09713024282560706, "percentage": 9.73, "elapsed_time": "0:31:23", "remaining_time": "4:51:08", "throughput": 12245.4, "total_tokens": 23068672} {"current_steps": 12, "total_steps": 113, "loss": 0.7774, "lr": 4.862157403595598e-05, "epoch": 0.10596026490066225, "percentage": 10.62, "elapsed_time": "0:34:14", "remaining_time": "4:48:13", "throughput": 12248.38, "total_tokens": 25165824} {"current_steps": 13, "total_steps": 113, "loss": 0.7808, "lr": 4.838487214438951e-05, "epoch": 0.11479028697571744, "percentage": 11.5, "elapsed_time": "0:37:04", "remaining_time": "4:45:15", "throughput": 12253.12, "total_tokens": 27262976} {"current_steps": 14, "total_steps": 113, "loss": 0.8111, "lr": 4.813009643566101e-05, "epoch": 0.12362030905077263, "percentage": 12.39, "elapsed_time": "0:39:54", "remaining_time": "4:42:15", "throughput": 12259.37, "total_tokens": 29360128} {"current_steps": 15, "total_steps": 113, "loss": 0.7997, "lr": 4.7857443822096905e-05, "epoch": 0.13245033112582782, "percentage": 13.27, "elapsed_time": "0:42:45", "remaining_time": "4:39:21", "throughput": 12261.52, "total_tokens": 31457280} {"current_steps": 16, "total_steps": 113, "loss": 0.7537, "lr": 4.7567125032815394e-05, "epoch": 0.141280353200883, "percentage": 14.16, "elapsed_time": "0:45:35", "remaining_time": "4:36:21", "throughput": 12267.81, "total_tokens": 33554432} {"current_steps": 17, "total_steps": 113, "loss": 0.7645, "lr": 4.7259364450857096e-05, "epoch": 0.15011037527593818, "percentage": 15.04, "elapsed_time": "0:48:25", "remaining_time": "4:33:27", "throughput": 12270.65, "total_tokens": 35651584} {"current_steps": 18, "total_steps": 113, "loss": 0.7712, "lr": 4.6934399939762746e-05, "epoch": 0.15894039735099338, "percentage": 15.93, "elapsed_time": "0:51:15", "remaining_time": "4:30:33", "throughput": 12272.81, "total_tokens": 37748736} {"current_steps": 19, "total_steps": 113, "loss": 0.74, "lr": 4.659248265973205e-05, "epoch": 0.16777041942604856, "percentage": 16.81, "elapsed_time": "0:54:05", "remaining_time": "4:27:38", "throughput": 12275.77, "total_tokens": 39845888} {"current_steps": 20, "total_steps": 113, "loss": 0.777, "lr": 4.6233876873505694e-05, "epoch": 0.17660044150110377, "percentage": 17.7, "elapsed_time": "0:56:55", "remaining_time": "4:24:43", "throughput": 12279.48, "total_tokens": 41943040} {"current_steps": 21, "total_steps": 113, "loss": 0.7537, "lr": 4.585885974212068e-05, "epoch": 0.18543046357615894, "percentage": 18.58, "elapsed_time": "0:59:44", "remaining_time": "4:21:45", "throughput": 12284.78, "total_tokens": 44040192} {"current_steps": 22, "total_steps": 113, "loss": 0.7453, "lr": 4.5467721110696685e-05, "epoch": 0.19426048565121412, "percentage": 19.47, "elapsed_time": "1:02:34", "remaining_time": "4:18:50", "throughput": 12288.21, "total_tokens": 46137344} {"current_steps": 23, "total_steps": 113, "loss": 0.7573, "lr": 4.5060763284419114e-05, "epoch": 0.20309050772626933, "percentage": 20.35, "elapsed_time": "1:05:24", "remaining_time": "4:15:56", "throughput": 12290.92, "total_tokens": 48234496} {"current_steps": 24, "total_steps": 113, "loss": 0.7626, "lr": 4.463830079489196e-05, "epoch": 0.2119205298013245, "percentage": 21.24, "elapsed_time": "1:08:13", "remaining_time": "4:13:01", "throughput": 12294.4, "total_tokens": 50331648} {"current_steps": 25, "total_steps": 113, "loss": 0.7558, "lr": 4.420066015704105e-05, "epoch": 0.22075055187637968, "percentage": 22.12, "elapsed_time": "1:11:03", "remaining_time": "4:10:08", "throughput": 12296.47, "total_tokens": 52428800} {"current_steps": 26, "total_steps": 113, "loss": 0.7654, "lr": 4.374817961675553e-05, "epoch": 0.22958057395143489, "percentage": 23.01, "elapsed_time": "1:13:53", "remaining_time": "4:07:15", "throughput": 12298.04, "total_tokens": 54525952} {"current_steps": 27, "total_steps": 113, "loss": 0.7363, "lr": 4.3281208889462715e-05, "epoch": 0.23841059602649006, "percentage": 23.89, "elapsed_time": "1:16:43", "remaining_time": "4:04:22", "throughput": 12300.77, "total_tokens": 56623104} {"current_steps": 28, "total_steps": 113, "loss": 0.7503, "lr": 4.2800108889838244e-05, "epoch": 0.24724061810154527, "percentage": 24.78, "elapsed_time": "1:19:33", "remaining_time": "4:01:29", "throughput": 12302.45, "total_tokens": 58720256} {"current_steps": 29, "total_steps": 113, "loss": 0.7474, "lr": 4.230525145286057e-05, "epoch": 0.2560706401766004, "percentage": 25.66, "elapsed_time": "1:22:22", "remaining_time": "3:58:35", "throughput": 12305.37, "total_tokens": 60817408} {"current_steps": 30, "total_steps": 113, "loss": 0.7442, "lr": 4.1797019046425264e-05, "epoch": 0.26490066225165565, "percentage": 26.55, "elapsed_time": "1:25:12", "remaining_time": "3:55:44", "throughput": 12306.4, "total_tokens": 62914560} {"current_steps": 31, "total_steps": 113, "loss": 0.7492, "lr": 4.127580447574131e-05, "epoch": 0.2737306843267108, "percentage": 27.43, "elapsed_time": "1:28:01", "remaining_time": "3:52:51", "throughput": 12308.37, "total_tokens": 65011712} {"current_steps": 32, "total_steps": 113, "loss": 0.7601, "lr": 4.0742010579737855e-05, "epoch": 0.282560706401766, "percentage": 28.32, "elapsed_time": "1:30:51", "remaining_time": "3:49:59", "throughput": 12309.6, "total_tokens": 67108864} {"current_steps": 33, "total_steps": 113, "loss": 0.7381, "lr": 4.0196049919716004e-05, "epoch": 0.2913907284768212, "percentage": 29.2, "elapsed_time": "1:33:41", "remaining_time": "3:47:07", "throughput": 12311.56, "total_tokens": 69206016} {"current_steps": 34, "total_steps": 113, "loss": 0.7406, "lr": 3.963834446048644e-05, "epoch": 0.30022075055187636, "percentage": 30.09, "elapsed_time": "1:36:31", "remaining_time": "3:44:16", "throughput": 12312.23, "total_tokens": 71303168} {"current_steps": 35, "total_steps": 113, "loss": 0.7573, "lr": 3.9069325244239095e-05, "epoch": 0.3090507726269316, "percentage": 30.97, "elapsed_time": "1:39:20", "remaining_time": "3:41:23", "throughput": 12313.97, "total_tokens": 73400320} {"current_steps": 36, "total_steps": 113, "loss": 0.7419, "lr": 3.848943205739711e-05, "epoch": 0.31788079470198677, "percentage": 31.86, "elapsed_time": "1:42:10", "remaining_time": "3:38:32", "throughput": 12315.1, "total_tokens": 75497472} {"current_steps": 37, "total_steps": 113, "loss": 0.7357, "lr": 3.7899113090712526e-05, "epoch": 0.32671081677704195, "percentage": 32.74, "elapsed_time": "1:45:00", "remaining_time": "3:35:40", "throughput": 12316.24, "total_tokens": 77594624} {"current_steps": 38, "total_steps": 113, "loss": 0.7346, "lr": 3.729882459286632e-05, "epoch": 0.3355408388520971, "percentage": 33.63, "elapsed_time": "1:47:49", "remaining_time": "3:32:49", "throughput": 12317.13, "total_tokens": 79691776} {"current_steps": 39, "total_steps": 113, "loss": 0.7437, "lr": 3.66890305178407e-05, "epoch": 0.3443708609271523, "percentage": 34.51, "elapsed_time": "1:50:39", "remaining_time": "3:29:58", "throughput": 12318.14, "total_tokens": 81788928} {"current_steps": 40, "total_steps": 113, "loss": 0.742, "lr": 3.607020216633599e-05, "epoch": 0.35320088300220753, "percentage": 35.4, "elapsed_time": "1:53:29", "remaining_time": "3:27:08", "throughput": 12318.13, "total_tokens": 83886080} {"current_steps": 41, "total_steps": 113, "loss": 0.7136, "lr": 3.544281782150936e-05, "epoch": 0.3620309050772627, "percentage": 36.28, "elapsed_time": "1:56:20", "remaining_time": "3:24:17", "throughput": 12318.44, "total_tokens": 85983232} {"current_steps": 42, "total_steps": 113, "loss": 0.7417, "lr": 3.4807362379317025e-05, "epoch": 0.3708609271523179, "percentage": 37.17, "elapsed_time": "1:59:10", "remaining_time": "3:21:27", "throughput": 12318.8, "total_tokens": 88080384} {"current_steps": 43, "total_steps": 113, "loss": 0.7102, "lr": 3.416432697374533e-05, "epoch": 0.37969094922737306, "percentage": 38.05, "elapsed_time": "2:01:59", "remaining_time": "3:18:36", "throughput": 12319.37, "total_tokens": 90177536} {"current_steps": 44, "total_steps": 113, "loss": 0.7685, "lr": 3.3514208597220705e-05, "epoch": 0.38852097130242824, "percentage": 38.94, "elapsed_time": "2:04:49", "remaining_time": "3:15:44", "throughput": 12320.63, "total_tokens": 92274688} {"current_steps": 45, "total_steps": 113, "loss": 0.7332, "lr": 3.285750971649167e-05, "epoch": 0.3973509933774834, "percentage": 39.82, "elapsed_time": "2:07:40", "remaining_time": "3:12:55", "throughput": 12319.92, "total_tokens": 94371840} {"current_steps": 46, "total_steps": 113, "loss": 0.7387, "lr": 3.219473788427984e-05, "epoch": 0.40618101545253865, "percentage": 40.71, "elapsed_time": "2:10:30", "remaining_time": "3:10:05", "throughput": 12319.21, "total_tokens": 96468992} {"current_steps": 47, "total_steps": 113, "loss": 0.7096, "lr": 3.1526405346999946e-05, "epoch": 0.41501103752759383, "percentage": 41.59, "elapsed_time": "2:13:20", "remaining_time": "3:07:15", "throughput": 12319.45, "total_tokens": 98566144} {"current_steps": 48, "total_steps": 113, "loss": 0.7242, "lr": 3.085302864885235e-05, "epoch": 0.423841059602649, "percentage": 42.48, "elapsed_time": "2:16:10", "remaining_time": "3:04:24", "throughput": 12319.97, "total_tokens": 100663296} {"current_steps": 49, "total_steps": 113, "loss": 0.7338, "lr": 3.017512823259373e-05, "epoch": 0.4326710816777042, "percentage": 43.36, "elapsed_time": "2:19:00", "remaining_time": "3:01:33", "throughput": 12320.62, "total_tokens": 102760448} {"current_steps": 50, "total_steps": 113, "loss": 0.7494, "lr": 2.9493228037294702e-05, "epoch": 0.44150110375275936, "percentage": 44.25, "elapsed_time": "2:21:50", "remaining_time": "2:58:43", "throughput": 12321.04, "total_tokens": 104857600} {"current_steps": 51, "total_steps": 113, "loss": 0.7272, "lr": 2.8807855093395126e-05, "epoch": 0.4503311258278146, "percentage": 45.13, "elapsed_time": "2:24:41", "remaining_time": "2:55:53", "throughput": 12320.02, "total_tokens": 106954752} {"current_steps": 52, "total_steps": 113, "loss": 0.7447, "lr": 2.8119539115370218e-05, "epoch": 0.45916114790286977, "percentage": 46.02, "elapsed_time": "2:27:29", "remaining_time": "2:53:00", "throughput": 12323.37, "total_tokens": 109051904} {"current_steps": 53, "total_steps": 113, "loss": 0.7219, "lr": 2.742881209232215e-05, "epoch": 0.46799116997792495, "percentage": 46.9, "elapsed_time": "2:30:17", "remaining_time": "2:50:08", "throughput": 12325.84, "total_tokens": 111149056} {"current_steps": 54, "total_steps": 113, "loss": 0.7484, "lr": 2.6736207876813646e-05, "epoch": 0.4768211920529801, "percentage": 47.79, "elapsed_time": "2:33:05", "remaining_time": "2:47:15", "throughput": 12328.88, "total_tokens": 113246208} {"current_steps": 55, "total_steps": 113, "loss": 0.7352, "lr": 2.604226177226137e-05, "epoch": 0.4856512141280353, "percentage": 48.67, "elapsed_time": "2:35:54", "remaining_time": "2:44:24", "throughput": 12330.83, "total_tokens": 115343360} {"current_steps": 56, "total_steps": 113, "loss": 0.7254, "lr": 2.5347510119207878e-05, "epoch": 0.49448123620309054, "percentage": 49.56, "elapsed_time": "2:38:43", "remaining_time": "2:41:33", "throughput": 12331.8, "total_tokens": 117440512} {"current_steps": 57, "total_steps": 113, "loss": 0.724, "lr": 2.4652489880792128e-05, "epoch": 0.5033112582781457, "percentage": 50.44, "elapsed_time": "2:41:32", "remaining_time": "2:38:42", "throughput": 12333.18, "total_tokens": 119537664} {"current_steps": 58, "total_steps": 113, "loss": 0.747, "lr": 2.395773822773863e-05, "epoch": 0.5121412803532008, "percentage": 51.33, "elapsed_time": "2:44:19", "remaining_time": "2:35:49", "throughput": 12336.23, "total_tokens": 121634816} {"current_steps": 59, "total_steps": 113, "loss": 0.7246, "lr": 2.3263792123186353e-05, "epoch": 0.5209713024282561, "percentage": 52.21, "elapsed_time": "2:47:08", "remaining_time": "2:32:58", "throughput": 12338.13, "total_tokens": 123731968} {"current_steps": 60, "total_steps": 113, "loss": 0.7424, "lr": 2.2571187907677853e-05, "epoch": 0.5298013245033113, "percentage": 53.1, "elapsed_time": "2:49:57", "remaining_time": "2:30:07", "throughput": 12339.8, "total_tokens": 125829120} {"current_steps": 61, "total_steps": 113, "loss": 0.7422, "lr": 2.188046088462979e-05, "epoch": 0.5386313465783664, "percentage": 53.98, "elapsed_time": "2:52:45", "remaining_time": "2:27:16", "throughput": 12341.13, "total_tokens": 127926272} {"current_steps": 62, "total_steps": 113, "loss": 0.7166, "lr": 2.1192144906604876e-05, "epoch": 0.5474613686534217, "percentage": 54.87, "elapsed_time": "2:55:33", "remaining_time": "2:24:25", "throughput": 12343.22, "total_tokens": 130023424} {"current_steps": 63, "total_steps": 113, "loss": 0.7564, "lr": 2.0506771962705304e-05, "epoch": 0.5562913907284768, "percentage": 55.75, "elapsed_time": "2:58:21", "remaining_time": "2:21:33", "throughput": 12346.02, "total_tokens": 132120576} {"current_steps": 64, "total_steps": 113, "loss": 0.744, "lr": 1.982487176740627e-05, "epoch": 0.565121412803532, "percentage": 56.64, "elapsed_time": "3:01:10", "remaining_time": "2:18:42", "throughput": 12347.51, "total_tokens": 134217728} {"current_steps": 65, "total_steps": 113, "loss": 0.7523, "lr": 1.9146971351147655e-05, "epoch": 0.5739514348785872, "percentage": 57.52, "elapsed_time": "3:03:57", "remaining_time": "2:15:51", "throughput": 12349.65, "total_tokens": 136314880} {"current_steps": 66, "total_steps": 113, "loss": 0.7274, "lr": 1.847359465300006e-05, "epoch": 0.5827814569536424, "percentage": 58.41, "elapsed_time": "3:06:46", "remaining_time": "2:13:00", "throughput": 12351.39, "total_tokens": 138412032} {"current_steps": 67, "total_steps": 113, "loss": 0.746, "lr": 1.780526211572016e-05, "epoch": 0.5916114790286976, "percentage": 59.29, "elapsed_time": "3:09:34", "remaining_time": "2:10:09", "throughput": 12353.19, "total_tokens": 140509184} {"current_steps": 68, "total_steps": 113, "loss": 0.7423, "lr": 1.7142490283508324e-05, "epoch": 0.6004415011037527, "percentage": 60.18, "elapsed_time": "3:12:21", "remaining_time": "2:07:18", "throughput": 12355.43, "total_tokens": 142606336} {"current_steps": 69, "total_steps": 113, "loss": 0.7234, "lr": 1.648579140277931e-05, "epoch": 0.609271523178808, "percentage": 61.06, "elapsed_time": "3:15:09", "remaining_time": "2:04:26", "throughput": 12357.73, "total_tokens": 144703488} {"current_steps": 70, "total_steps": 113, "loss": 0.7495, "lr": 1.583567302625469e-05, "epoch": 0.6181015452538632, "percentage": 61.95, "elapsed_time": "3:17:57", "remaining_time": "2:01:35", "throughput": 12359.87, "total_tokens": 146800640} {"current_steps": 71, "total_steps": 113, "loss": 0.7227, "lr": 1.5192637620682981e-05, "epoch": 0.6269315673289183, "percentage": 62.83, "elapsed_time": "3:20:45", "remaining_time": "1:58:45", "throughput": 12361.65, "total_tokens": 148897792} {"current_steps": 72, "total_steps": 113, "loss": 0.7607, "lr": 1.4557182178490636e-05, "epoch": 0.6357615894039735, "percentage": 63.72, "elapsed_time": "3:23:32", "remaining_time": "1:55:54", "throughput": 12363.6, "total_tokens": 150994944} {"current_steps": 73, "total_steps": 113, "loss": 0.7296, "lr": 1.3929797833664013e-05, "epoch": 0.6445916114790287, "percentage": 64.6, "elapsed_time": "3:26:21", "remaining_time": "1:53:04", "throughput": 12364.6, "total_tokens": 153092096} {"current_steps": 74, "total_steps": 113, "loss": 0.7361, "lr": 1.3310969482159297e-05, "epoch": 0.6534216335540839, "percentage": 65.49, "elapsed_time": "3:29:09", "remaining_time": "1:50:13", "throughput": 12366.65, "total_tokens": 155189248} {"current_steps": 75, "total_steps": 113, "loss": 0.7379, "lr": 1.270117540713368e-05, "epoch": 0.6622516556291391, "percentage": 66.37, "elapsed_time": "3:31:57", "remaining_time": "1:47:23", "throughput": 12368.13, "total_tokens": 157286400} {"current_steps": 76, "total_steps": 113, "loss": 0.7351, "lr": 1.2100886909287478e-05, "epoch": 0.6710816777041942, "percentage": 67.26, "elapsed_time": "3:34:44", "remaining_time": "1:44:32", "throughput": 12369.85, "total_tokens": 159383552} {"current_steps": 77, "total_steps": 113, "loss": 0.7295, "lr": 1.151056794260289e-05, "epoch": 0.6799116997792495, "percentage": 68.14, "elapsed_time": "3:37:32", "remaining_time": "1:41:42", "throughput": 12371.69, "total_tokens": 161480704} {"current_steps": 78, "total_steps": 113, "loss": 0.7333, "lr": 1.0930674755760908e-05, "epoch": 0.6887417218543046, "percentage": 69.03, "elapsed_time": "3:40:20", "remaining_time": "1:38:52", "throughput": 12373.07, "total_tokens": 163577856} {"current_steps": 79, "total_steps": 113, "loss": 0.7334, "lr": 1.0361655539513565e-05, "epoch": 0.6975717439293598, "percentage": 69.91, "elapsed_time": "3:43:08", "remaining_time": "1:36:02", "throughput": 12374.64, "total_tokens": 165675008} {"current_steps": 80, "total_steps": 113, "loss": 0.7437, "lr": 9.803950080284005e-06, "epoch": 0.7064017660044151, "percentage": 70.8, "elapsed_time": "3:45:56", "remaining_time": "1:33:12", "throughput": 12375.68, "total_tokens": 167772160} {"current_steps": 81, "total_steps": 113, "loss": 0.7133, "lr": 9.257989420262151e-06, "epoch": 0.7152317880794702, "percentage": 71.68, "elapsed_time": "3:48:44", "remaining_time": "1:30:21", "throughput": 12377.37, "total_tokens": 169869312} {"current_steps": 82, "total_steps": 113, "loss": 0.7415, "lr": 8.724195524258688e-06, "epoch": 0.7240618101545254, "percentage": 72.57, "elapsed_time": "3:51:31", "remaining_time": "1:27:31", "throughput": 12379.17, "total_tokens": 171966464} {"current_steps": 83, "total_steps": 113, "loss": 0.7423, "lr": 8.202980953574735e-06, "epoch": 0.7328918322295805, "percentage": 73.45, "elapsed_time": "3:54:19", "remaining_time": "1:24:41", "throughput": 12380.31, "total_tokens": 174063616} {"current_steps": 84, "total_steps": 113, "loss": 0.7125, "lr": 7.69474854713943e-06, "epoch": 0.7417218543046358, "percentage": 74.34, "elapsed_time": "3:57:08", "remaining_time": "1:21:52", "throughput": 12381.1, "total_tokens": 176160768} {"current_steps": 85, "total_steps": 113, "loss": 0.7346, "lr": 7.1998911101617575e-06, "epoch": 0.7505518763796909, "percentage": 75.22, "elapsed_time": "3:59:56", "remaining_time": "1:19:02", "throughput": 12382.4, "total_tokens": 178257920} {"current_steps": 86, "total_steps": 113, "loss": 0.7235, "lr": 6.718791110537287e-06, "epoch": 0.7593818984547461, "percentage": 76.11, "elapsed_time": "4:02:44", "remaining_time": "1:16:12", "throughput": 12383.21, "total_tokens": 180355072} {"current_steps": 87, "total_steps": 113, "loss": 0.7268, "lr": 6.25182038324447e-06, "epoch": 0.7682119205298014, "percentage": 76.99, "elapsed_time": "4:05:32", "remaining_time": "1:13:22", "throughput": 12384.33, "total_tokens": 182452224} {"current_steps": 88, "total_steps": 113, "loss": 0.7251, "lr": 5.7993398429589506e-06, "epoch": 0.7770419426048565, "percentage": 77.88, "elapsed_time": "4:08:20", "remaining_time": "1:10:33", "throughput": 12385.44, "total_tokens": 184549376} {"current_steps": 89, "total_steps": 113, "loss": 0.7216, "lr": 5.361699205108042e-06, "epoch": 0.7858719646799117, "percentage": 78.76, "elapsed_time": "4:11:08", "remaining_time": "1:07:43", "throughput": 12386.47, "total_tokens": 186646528} {"current_steps": 90, "total_steps": 113, "loss": 0.7386, "lr": 4.939236715580884e-06, "epoch": 0.7947019867549668, "percentage": 79.65, "elapsed_time": "4:13:57", "remaining_time": "1:04:53", "throughput": 12387.18, "total_tokens": 188743680} {"current_steps": 91, "total_steps": 113, "loss": 0.734, "lr": 4.5322788893033155e-06, "epoch": 0.8035320088300221, "percentage": 80.53, "elapsed_time": "4:16:45", "remaining_time": "1:02:04", "throughput": 12387.88, "total_tokens": 190840832} {"current_steps": 92, "total_steps": 113, "loss": 0.7519, "lr": 4.14114025787932e-06, "epoch": 0.8123620309050773, "percentage": 81.42, "elapsed_time": "4:19:33", "remaining_time": "0:59:14", "throughput": 12389.08, "total_tokens": 192937984} {"current_steps": 93, "total_steps": 113, "loss": 0.7194, "lr": 3.7661231264943086e-06, "epoch": 0.8211920529801324, "percentage": 82.3, "elapsed_time": "4:22:21", "remaining_time": "0:56:25", "throughput": 12389.85, "total_tokens": 195035136} {"current_steps": 94, "total_steps": 113, "loss": 0.7263, "lr": 3.4075173402679574e-06, "epoch": 0.8300220750551877, "percentage": 83.19, "elapsed_time": "4:25:10", "remaining_time": "0:53:35", "throughput": 12390.35, "total_tokens": 197132288} {"current_steps": 95, "total_steps": 113, "loss": 0.7093, "lr": 3.0656000602372558e-06, "epoch": 0.8388520971302428, "percentage": 84.07, "elapsed_time": "4:27:58", "remaining_time": "0:50:46", "throughput": 12391.05, "total_tokens": 199229440} {"current_steps": 96, "total_steps": 113, "loss": 0.7654, "lr": 2.7406355491429086e-06, "epoch": 0.847682119205298, "percentage": 84.96, "elapsed_time": "4:30:47", "remaining_time": "0:47:57", "throughput": 12391.45, "total_tokens": 201326592} {"current_steps": 97, "total_steps": 113, "loss": 0.7365, "lr": 2.4328749671846116e-06, "epoch": 0.8565121412803532, "percentage": 85.84, "elapsed_time": "4:33:35", "remaining_time": "0:45:07", "throughput": 12392.15, "total_tokens": 203423744} {"current_steps": 98, "total_steps": 113, "loss": 0.7468, "lr": 2.142556177903096e-06, "epoch": 0.8653421633554084, "percentage": 86.73, "elapsed_time": "4:36:23", "remaining_time": "0:42:18", "throughput": 12393.07, "total_tokens": 205520896} {"current_steps": 99, "total_steps": 113, "loss": 0.7264, "lr": 1.8699035643389928e-06, "epoch": 0.8741721854304636, "percentage": 87.61, "elapsed_time": "4:39:11", "remaining_time": "0:39:28", "throughput": 12394.01, "total_tokens": 207618048} {"current_steps": 100, "total_steps": 113, "loss": 0.7392, "lr": 1.615127855610496e-06, "epoch": 0.8830022075055187, "percentage": 88.5, "elapsed_time": "4:41:59", "remaining_time": "0:36:39", "throughput": 12395.06, "total_tokens": 209715200} {"current_steps": 101, "total_steps": 113, "loss": 0.7378, "lr": 1.3784259640440279e-06, "epoch": 0.891832229580574, "percentage": 89.38, "elapsed_time": "4:44:47", "remaining_time": "0:33:50", "throughput": 12396.1, "total_tokens": 211812352} {"current_steps": 102, "total_steps": 113, "loss": 0.7384, "lr": 1.1599808329836177e-06, "epoch": 0.9006622516556292, "percentage": 90.27, "elapsed_time": "4:47:34", "remaining_time": "0:31:00", "throughput": 12397.09, "total_tokens": 213909504} {"current_steps": 103, "total_steps": 113, "loss": 0.7326, "lr": 9.599612953967746e-07, "epoch": 0.9094922737306843, "percentage": 91.15, "elapsed_time": "4:50:23", "remaining_time": "0:28:11", "throughput": 12397.55, "total_tokens": 216006656} {"current_steps": 104, "total_steps": 113, "loss": 0.7319, "lr": 7.785219433859847e-07, "epoch": 0.9183222958057395, "percentage": 92.04, "elapsed_time": "4:53:11", "remaining_time": "0:25:22", "throughput": 12398.3, "total_tokens": 218103808} {"current_steps": 105, "total_steps": 113, "loss": 0.7365, "lr": 6.158030087068001e-07, "epoch": 0.9271523178807947, "percentage": 92.92, "elapsed_time": "4:55:59", "remaining_time": "0:22:33", "throughput": 12399.3, "total_tokens": 220200960} {"current_steps": 106, "total_steps": 113, "loss": 0.75, "lr": 4.719302543848225e-07, "epoch": 0.9359823399558499, "percentage": 93.81, "elapsed_time": "4:58:46", "remaining_time": "0:19:43", "throughput": 12400.52, "total_tokens": 222298112} {"current_steps": 107, "total_steps": 113, "loss": 0.7468, "lr": 3.470148775153448e-07, "epoch": 0.9448123620309051, "percentage": 94.69, "elapsed_time": "5:01:34", "remaining_time": "0:16:54", "throughput": 12401.53, "total_tokens": 224395264} {"current_steps": 108, "total_steps": 113, "loss": 0.7425, "lr": 2.4115342332078074e-07, "epoch": 0.9536423841059603, "percentage": 95.58, "elapsed_time": "5:04:21", "remaining_time": "0:14:05", "throughput": 12402.6, "total_tokens": 226492416} {"current_steps": 109, "total_steps": 113, "loss": 0.7314, "lr": 1.5442771053230665e-07, "epoch": 0.9624724061810155, "percentage": 96.46, "elapsed_time": "5:07:14", "remaining_time": "0:11:16", "throughput": 12399.84, "total_tokens": 228589568} {"current_steps": 110, "total_steps": 113, "loss": 0.7407, "lr": 8.690476815339244e-08, "epoch": 0.9713024282560706, "percentage": 97.35, "elapsed_time": "5:10:04", "remaining_time": "0:08:27", "throughput": 12399.79, "total_tokens": 230686720} {"current_steps": 111, "total_steps": 113, "loss": 0.729, "lr": 3.8636783654100174e-08, "epoch": 0.9801324503311258, "percentage": 98.23, "elapsed_time": "5:12:51", "remaining_time": "0:05:38", "throughput": 12400.69, "total_tokens": 232783872} {"current_steps": 112, "total_steps": 113, "loss": 0.7333, "lr": 9.661062636148744e-09, "epoch": 0.9889624724061811, "percentage": 99.12, "elapsed_time": "5:15:40", "remaining_time": "0:02:49", "throughput": 12401.32, "total_tokens": 234881024} {"current_steps": 113, "total_steps": 113, "loss": 0.7217, "lr": 0.0, "epoch": 0.9977924944812362, "percentage": 100.0, "elapsed_time": "5:18:28", "remaining_time": "0:00:00", "throughput": 12401.67, "total_tokens": 236978176} {"current_steps": 113, "total_steps": 113, "epoch": 0.9977924944812362, "percentage": 100.0, "elapsed_time": "5:18:52", "remaining_time": "0:00:00", "throughput": 12385.92, "total_tokens": 236978176}