{"current_steps": 1, "total_steps": 103, "loss": 1.2542, "lr": 4.998837209058379e-05, "epoch": 0.00963855421686747, "percentage": 0.97, "elapsed_time": "0:02:53", "remaining_time": "4:55:31", "throughput": 12063.73, "total_tokens": 2097152} {"current_steps": 2, "total_steps": 103, "loss": 1.2368, "lr": 4.9953499178997346e-05, "epoch": 0.01927710843373494, "percentage": 1.94, "elapsed_time": "0:05:41", "remaining_time": "4:47:02", "throughput": 12298.53, "total_tokens": 4194304} {"current_steps": 3, "total_steps": 103, "loss": 1.1874, "lr": 4.9895413705165234e-05, "epoch": 0.02891566265060241, "percentage": 2.91, "elapsed_time": "0:08:28", "remaining_time": "4:42:24", "throughput": 12376.74, "total_tokens": 6291456} {"current_steps": 4, "total_steps": 103, "loss": 1.1094, "lr": 4.98141697020977e-05, "epoch": 0.03855421686746988, "percentage": 3.88, "elapsed_time": "0:11:15", "remaining_time": "4:38:41", "throughput": 12416.4, "total_tokens": 8388608} {"current_steps": 5, "total_steps": 103, "loss": 1.0771, "lr": 4.970984274562741e-05, "epoch": 0.04819277108433735, "percentage": 4.85, "elapsed_time": "0:14:02", "remaining_time": "4:35:17", "throughput": 12442.52, "total_tokens": 10485760} {"current_steps": 6, "total_steps": 103, "loss": 1.0465, "lr": 4.958252988410631e-05, "epoch": 0.05783132530120482, "percentage": 5.83, "elapsed_time": "0:16:49", "remaining_time": "4:32:03", "throughput": 12462.24, "total_tokens": 12582912} {"current_steps": 7, "total_steps": 103, "loss": 1.0828, "lr": 4.9432349548128124e-05, "epoch": 0.06746987951807229, "percentage": 6.8, "elapsed_time": "0:19:36", "remaining_time": "4:29:01", "throughput": 12472.99, "total_tokens": 14680064} {"current_steps": 8, "total_steps": 103, "loss": 1.0584, "lr": 4.925944144036026e-05, "epoch": 0.07710843373493977, "percentage": 7.77, "elapsed_time": "0:22:23", "remaining_time": "4:25:59", "throughput": 12483.46, "total_tokens": 16777216} {"current_steps": 9, "total_steps": 103, "loss": 1.0203, "lr": 4.90639664055879e-05, "epoch": 0.08674698795180723, "percentage": 8.74, "elapsed_time": "0:25:11", "remaining_time": "4:23:01", "throughput": 12491.03, "total_tokens": 18874368} {"current_steps": 10, "total_steps": 103, "loss": 1.0074, "lr": 4.884610628109082e-05, "epoch": 0.0963855421686747, "percentage": 9.71, "elapsed_time": "0:27:58", "remaining_time": "4:20:09", "throughput": 12494.73, "total_tokens": 20971520} {"current_steps": 11, "total_steps": 103, "loss": 1.0076, "lr": 4.860606372749247e-05, "epoch": 0.10602409638554217, "percentage": 10.68, "elapsed_time": "0:30:45", "remaining_time": "4:17:16", "throughput": 12498.8, "total_tokens": 23068672} {"current_steps": 12, "total_steps": 103, "loss": 0.9358, "lr": 4.8344062040238395e-05, "epoch": 0.11566265060240964, "percentage": 11.65, "elapsed_time": "0:33:33", "remaining_time": "4:14:30", "throughput": 12497.6, "total_tokens": 25165824} {"current_steps": 13, "total_steps": 103, "loss": 0.9963, "lr": 4.806034494187949e-05, "epoch": 0.12530120481927712, "percentage": 12.62, "elapsed_time": "0:36:22", "remaining_time": "4:11:48", "throughput": 12492.58, "total_tokens": 27262976} {"current_steps": 14, "total_steps": 103, "loss": 0.9646, "lr": 4.775517635535332e-05, "epoch": 0.13493975903614458, "percentage": 13.59, "elapsed_time": "0:39:09", "remaining_time": "4:08:57", "throughput": 12495.22, "total_tokens": 29360128} {"current_steps": 15, "total_steps": 103, "loss": 0.9749, "lr": 4.742884015847436e-05, "epoch": 0.14457831325301204, "percentage": 14.56, "elapsed_time": "0:41:57", "remaining_time": "4:06:10", "throughput": 12494.34, "total_tokens": 31457280} {"current_steps": 16, "total_steps": 103, "loss": 0.9222, "lr": 4.708163991986152e-05, "epoch": 0.15421686746987953, "percentage": 15.53, "elapsed_time": "0:44:45", "remaining_time": "4:03:23", "throughput": 12493.86, "total_tokens": 33554432} {"current_steps": 17, "total_steps": 103, "loss": 0.9341, "lr": 4.6713898616548724e-05, "epoch": 0.163855421686747, "percentage": 16.5, "elapsed_time": "0:47:33", "remaining_time": "4:00:35", "throughput": 12494.19, "total_tokens": 35651584} {"current_steps": 18, "total_steps": 103, "loss": 0.9262, "lr": 4.6325958333541044e-05, "epoch": 0.17349397590361446, "percentage": 17.48, "elapsed_time": "0:50:20", "remaining_time": "3:57:44", "throughput": 12496.39, "total_tokens": 37748736} {"current_steps": 19, "total_steps": 103, "loss": 0.9563, "lr": 4.591817994559605e-05, "epoch": 0.18313253012048192, "percentage": 18.45, "elapsed_time": "0:53:13", "remaining_time": "3:55:16", "throughput": 12478.68, "total_tokens": 39845888} {"current_steps": 20, "total_steps": 103, "loss": 0.9378, "lr": 4.5490942781526316e-05, "epoch": 0.1927710843373494, "percentage": 19.42, "elapsed_time": "0:56:00", "remaining_time": "3:52:26", "throughput": 12481.2, "total_tokens": 41943040} {"current_steps": 21, "total_steps": 103, "loss": 0.9421, "lr": 4.504464427133527e-05, "epoch": 0.20240963855421687, "percentage": 20.39, "elapsed_time": "0:58:47", "remaining_time": "3:49:35", "throughput": 12483.12, "total_tokens": 44040192} {"current_steps": 22, "total_steps": 103, "loss": 0.9219, "lr": 4.457969957651484e-05, "epoch": 0.21204819277108433, "percentage": 21.36, "elapsed_time": "1:01:35", "remaining_time": "3:46:47", "throughput": 12483.76, "total_tokens": 46137344} {"current_steps": 23, "total_steps": 103, "loss": 0.9108, "lr": 4.409654120384862e-05, "epoch": 0.2216867469879518, "percentage": 22.33, "elapsed_time": "1:04:27", "remaining_time": "3:44:13", "throughput": 12470.41, "total_tokens": 48234496} {"current_steps": 24, "total_steps": 103, "loss": 0.9331, "lr": 4.35956186030799e-05, "epoch": 0.23132530120481928, "percentage": 23.3, "elapsed_time": "1:07:18", "remaining_time": "3:41:32", "throughput": 12464.13, "total_tokens": 50331648} {"current_steps": 25, "total_steps": 103, "loss": 0.9405, "lr": 4.307739774881878e-05, "epoch": 0.24096385542168675, "percentage": 24.27, "elapsed_time": "1:10:05", "remaining_time": "3:38:40", "throughput": 12467.02, "total_tokens": 52428800} {"current_steps": 26, "total_steps": 103, "loss": 0.9667, "lr": 4.254236070707733e-05, "epoch": 0.25060240963855424, "percentage": 25.24, "elapsed_time": "1:12:52", "remaining_time": "3:35:50", "throughput": 12469.48, "total_tokens": 54525952} {"current_steps": 27, "total_steps": 103, "loss": 0.935, "lr": 4.1991005186836005e-05, "epoch": 0.26024096385542167, "percentage": 26.21, "elapsed_time": "1:15:40", "remaining_time": "3:32:59", "throughput": 12471.33, "total_tokens": 56623104} {"current_steps": 28, "total_steps": 103, "loss": 0.8985, "lr": 4.142384407705846e-05, "epoch": 0.26987951807228916, "percentage": 27.18, "elapsed_time": "1:18:27", "remaining_time": "3:30:09", "throughput": 12473.52, "total_tokens": 58720256} {"current_steps": 29, "total_steps": 103, "loss": 0.8879, "lr": 4.084140496958538e-05, "epoch": 0.27951807228915665, "percentage": 28.16, "elapsed_time": "1:21:15", "remaining_time": "3:27:20", "throughput": 12474.78, "total_tokens": 60817408} {"current_steps": 30, "total_steps": 103, "loss": 0.9086, "lr": 4.024422966835136e-05, "epoch": 0.2891566265060241, "percentage": 29.13, "elapsed_time": "1:24:02", "remaining_time": "3:24:30", "throughput": 12475.93, "total_tokens": 62914560} {"current_steps": 31, "total_steps": 103, "loss": 0.9437, "lr": 3.963287368538106e-05, "epoch": 0.2987951807228916, "percentage": 30.1, "elapsed_time": "1:26:50", "remaining_time": "3:21:40", "throughput": 12478.25, "total_tokens": 65011712} {"current_steps": 32, "total_steps": 103, "loss": 0.916, "lr": 3.900790572403376e-05, "epoch": 0.30843373493975906, "percentage": 31.07, "elapsed_time": "1:29:37", "remaining_time": "3:18:51", "throughput": 12479.52, "total_tokens": 67108864} {"current_steps": 33, "total_steps": 103, "loss": 0.9433, "lr": 3.836990714997686e-05, "epoch": 0.3180722891566265, "percentage": 32.04, "elapsed_time": "1:32:24", "remaining_time": "3:16:00", "throughput": 12482.06, "total_tokens": 69206016} {"current_steps": 34, "total_steps": 103, "loss": 0.9276, "lr": 3.7719471450380514e-05, "epoch": 0.327710843373494, "percentage": 33.01, "elapsed_time": "1:35:11", "remaining_time": "3:13:10", "throughput": 12484.67, "total_tokens": 71303168} {"current_steps": 35, "total_steps": 103, "loss": 0.918, "lr": 3.7057203681836406e-05, "epoch": 0.3373493975903614, "percentage": 33.98, "elapsed_time": "1:37:58", "remaining_time": "3:10:20", "throughput": 12486.49, "total_tokens": 73400320} {"current_steps": 36, "total_steps": 103, "loss": 0.8979, "lr": 3.638371990751428e-05, "epoch": 0.3469879518072289, "percentage": 34.95, "elapsed_time": "1:40:45", "remaining_time": "3:07:31", "throughput": 12488.19, "total_tokens": 75497472} {"current_steps": 37, "total_steps": 103, "loss": 0.9065, "lr": 3.569964662407983e-05, "epoch": 0.3566265060240964, "percentage": 35.92, "elapsed_time": "1:43:32", "remaining_time": "3:04:42", "throughput": 12489.21, "total_tokens": 77594624} {"current_steps": 38, "total_steps": 103, "loss": 0.9405, "lr": 3.500562017890695e-05, "epoch": 0.36626506024096384, "percentage": 36.89, "elapsed_time": "1:46:20", "remaining_time": "3:01:53", "throughput": 12490.78, "total_tokens": 79691776} {"current_steps": 39, "total_steps": 103, "loss": 0.9263, "lr": 3.430228617812661e-05, "epoch": 0.3759036144578313, "percentage": 37.86, "elapsed_time": "1:49:07", "remaining_time": "2:59:04", "throughput": 12492.31, "total_tokens": 81788928} {"current_steps": 40, "total_steps": 103, "loss": 0.9243, "lr": 3.3590298886062833e-05, "epoch": 0.3855421686746988, "percentage": 38.83, "elapsed_time": "1:51:54", "remaining_time": "2:56:14", "throughput": 12493.77, "total_tokens": 83886080} {"current_steps": 41, "total_steps": 103, "loss": 0.9201, "lr": 3.2870320616614626e-05, "epoch": 0.39518072289156625, "percentage": 39.81, "elapsed_time": "1:54:41", "remaining_time": "2:53:26", "throughput": 12494.83, "total_tokens": 85983232} {"current_steps": 42, "total_steps": 103, "loss": 0.9015, "lr": 3.21430211171499e-05, "epoch": 0.40481927710843374, "percentage": 40.78, "elapsed_time": "1:57:28", "remaining_time": "2:50:37", "throughput": 12495.51, "total_tokens": 88080384} {"current_steps": 43, "total_steps": 103, "loss": 0.9104, "lr": 3.140907694548451e-05, "epoch": 0.41445783132530123, "percentage": 41.75, "elapsed_time": "2:00:16", "remaining_time": "2:47:49", "throughput": 12496.2, "total_tokens": 90177536} {"current_steps": 44, "total_steps": 103, "loss": 0.9194, "lr": 3.066917084052603e-05, "epoch": 0.42409638554216866, "percentage": 42.72, "elapsed_time": "2:03:03", "remaining_time": "2:45:00", "throughput": 12497.21, "total_tokens": 92274688} {"current_steps": 45, "total_steps": 103, "loss": 0.9575, "lr": 2.9923991087167658e-05, "epoch": 0.43373493975903615, "percentage": 43.69, "elapsed_time": "2:05:51", "remaining_time": "2:42:12", "throughput": 12497.84, "total_tokens": 94371840} {"current_steps": 46, "total_steps": 103, "loss": 0.8922, "lr": 2.9174230876023058e-05, "epoch": 0.4433734939759036, "percentage": 44.66, "elapsed_time": "2:08:38", "remaining_time": "2:39:24", "throughput": 12498.21, "total_tokens": 96468992} {"current_steps": 47, "total_steps": 103, "loss": 0.9125, "lr": 2.8420587658597757e-05, "epoch": 0.4530120481927711, "percentage": 45.63, "elapsed_time": "2:11:26", "remaining_time": "2:36:36", "throughput": 12498.66, "total_tokens": 98566144} {"current_steps": 48, "total_steps": 103, "loss": 0.8989, "lr": 2.7663762498496905e-05, "epoch": 0.46265060240963857, "percentage": 46.6, "elapsed_time": "2:14:13", "remaining_time": "2:33:48", "throughput": 12498.85, "total_tokens": 100663296} {"current_steps": 49, "total_steps": 103, "loss": 0.8719, "lr": 2.6904459419272955e-05, "epoch": 0.472289156626506, "percentage": 47.57, "elapsed_time": "2:17:01", "remaining_time": "2:31:00", "throughput": 12499.07, "total_tokens": 102760448} {"current_steps": 50, "total_steps": 103, "loss": 0.9074, "lr": 2.6143384749519866e-05, "epoch": 0.4819277108433735, "percentage": 48.54, "elapsed_time": "2:19:49", "remaining_time": "2:28:12", "throughput": 12499.4, "total_tokens": 104857600} {"current_steps": 51, "total_steps": 103, "loss": 0.8911, "lr": 2.538124646582315e-05, "epoch": 0.491566265060241, "percentage": 49.51, "elapsed_time": "2:22:36", "remaining_time": "2:25:24", "throughput": 12499.72, "total_tokens": 106954752} {"current_steps": 52, "total_steps": 103, "loss": 0.9314, "lr": 2.4618753534176856e-05, "epoch": 0.5012048192771085, "percentage": 50.49, "elapsed_time": "2:25:24", "remaining_time": "2:22:36", "throughput": 12499.98, "total_tokens": 109051904} {"current_steps": 53, "total_steps": 103, "loss": 0.9104, "lr": 2.385661525048014e-05, "epoch": 0.5108433734939759, "percentage": 51.46, "elapsed_time": "2:28:11", "remaining_time": "2:19:48", "throughput": 12500.38, "total_tokens": 111149056} {"current_steps": 54, "total_steps": 103, "loss": 0.8854, "lr": 2.3095540580727055e-05, "epoch": 0.5204819277108433, "percentage": 52.43, "elapsed_time": "2:30:59", "remaining_time": "2:17:00", "throughput": 12500.53, "total_tokens": 113246208} {"current_steps": 55, "total_steps": 103, "loss": 0.8827, "lr": 2.23362375015031e-05, "epoch": 0.5301204819277109, "percentage": 53.4, "elapsed_time": "2:33:47", "remaining_time": "2:14:12", "throughput": 12500.44, "total_tokens": 115343360} {"current_steps": 56, "total_steps": 103, "loss": 0.9197, "lr": 2.157941234140225e-05, "epoch": 0.5397590361445783, "percentage": 54.37, "elapsed_time": "2:36:35", "remaining_time": "2:11:25", "throughput": 12500.3, "total_tokens": 117440512} {"current_steps": 57, "total_steps": 103, "loss": 0.9112, "lr": 2.082576912397695e-05, "epoch": 0.5493975903614458, "percentage": 55.34, "elapsed_time": "2:39:22", "remaining_time": "2:08:37", "throughput": 12500.37, "total_tokens": 119537664} {"current_steps": 58, "total_steps": 103, "loss": 0.8954, "lr": 2.0076008912832355e-05, "epoch": 0.5590361445783133, "percentage": 56.31, "elapsed_time": "2:42:10", "remaining_time": "2:05:49", "throughput": 12500.44, "total_tokens": 121634816} {"current_steps": 59, "total_steps": 103, "loss": 0.8575, "lr": 1.933082915947398e-05, "epoch": 0.5686746987951807, "percentage": 57.28, "elapsed_time": "2:44:58", "remaining_time": "2:03:01", "throughput": 12500.3, "total_tokens": 123731968} {"current_steps": 60, "total_steps": 103, "loss": 0.8983, "lr": 1.8590923054515503e-05, "epoch": 0.5783132530120482, "percentage": 58.25, "elapsed_time": "2:47:46", "remaining_time": "2:00:14", "throughput": 12500.29, "total_tokens": 125829120} {"current_steps": 61, "total_steps": 103, "loss": 0.8819, "lr": 1.7856978882850113e-05, "epoch": 0.5879518072289157, "percentage": 59.22, "elapsed_time": "2:50:33", "remaining_time": "1:57:26", "throughput": 12500.38, "total_tokens": 127926272} {"current_steps": 62, "total_steps": 103, "loss": 0.9067, "lr": 1.7129679383385383e-05, "epoch": 0.5975903614457831, "percentage": 60.19, "elapsed_time": "2:53:21", "remaining_time": "1:54:38", "throughput": 12500.36, "total_tokens": 130023424} {"current_steps": 63, "total_steps": 103, "loss": 0.9054, "lr": 1.6409701113937183e-05, "epoch": 0.6072289156626506, "percentage": 61.17, "elapsed_time": "2:56:09", "remaining_time": "1:51:50", "throughput": 12500.52, "total_tokens": 132120576} {"current_steps": 64, "total_steps": 103, "loss": 0.8938, "lr": 1.5697713821873398e-05, "epoch": 0.6168674698795181, "percentage": 62.14, "elapsed_time": "2:58:56", "remaining_time": "1:49:02", "throughput": 12500.72, "total_tokens": 134217728} {"current_steps": 65, "total_steps": 103, "loss": 0.8964, "lr": 1.4994379821093049e-05, "epoch": 0.6265060240963856, "percentage": 63.11, "elapsed_time": "3:01:44", "remaining_time": "1:46:14", "throughput": 12500.8, "total_tokens": 136314880} {"current_steps": 66, "total_steps": 103, "loss": 0.8979, "lr": 1.430035337592018e-05, "epoch": 0.636144578313253, "percentage": 64.08, "elapsed_time": "3:04:32", "remaining_time": "1:43:27", "throughput": 12500.8, "total_tokens": 138412032} {"current_steps": 67, "total_steps": 103, "loss": 0.9085, "lr": 1.3616280092485717e-05, "epoch": 0.6457831325301204, "percentage": 65.05, "elapsed_time": "3:07:20", "remaining_time": "1:40:39", "throughput": 12500.64, "total_tokens": 140509184} {"current_steps": 68, "total_steps": 103, "loss": 0.9091, "lr": 1.2942796318163595e-05, "epoch": 0.655421686746988, "percentage": 66.02, "elapsed_time": "3:10:08", "remaining_time": "1:37:51", "throughput": 12500.46, "total_tokens": 142606336} {"current_steps": 69, "total_steps": 103, "loss": 0.8615, "lr": 1.2280528549619485e-05, "epoch": 0.6650602409638554, "percentage": 66.99, "elapsed_time": "3:12:55", "remaining_time": "1:35:04", "throughput": 12500.31, "total_tokens": 144703488} {"current_steps": 70, "total_steps": 103, "loss": 0.8873, "lr": 1.1630092850023147e-05, "epoch": 0.6746987951807228, "percentage": 67.96, "elapsed_time": "3:15:44", "remaining_time": "1:32:16", "throughput": 12499.75, "total_tokens": 146800640} {"current_steps": 71, "total_steps": 103, "loss": 0.8958, "lr": 1.0992094275966256e-05, "epoch": 0.6843373493975904, "percentage": 68.93, "elapsed_time": "3:18:32", "remaining_time": "1:29:29", "throughput": 12499.08, "total_tokens": 148897792} {"current_steps": 72, "total_steps": 103, "loss": 0.9171, "lr": 1.0367126314618947e-05, "epoch": 0.6939759036144578, "percentage": 69.9, "elapsed_time": "3:21:20", "remaining_time": "1:26:41", "throughput": 12498.68, "total_tokens": 150994944} {"current_steps": 73, "total_steps": 103, "loss": 0.9064, "lr": 9.755770331648642e-06, "epoch": 0.7036144578313253, "percentage": 70.87, "elapsed_time": "3:24:08", "remaining_time": "1:23:53", "throughput": 12498.57, "total_tokens": 153092096} {"current_steps": 74, "total_steps": 103, "loss": 0.9176, "lr": 9.15859503041462e-06, "epoch": 0.7132530120481928, "percentage": 71.84, "elapsed_time": "3:26:56", "remaining_time": "1:21:06", "throughput": 12498.23, "total_tokens": 155189248} {"current_steps": 75, "total_steps": 103, "loss": 0.8882, "lr": 8.576155922941548e-06, "epoch": 0.7228915662650602, "percentage": 72.82, "elapsed_time": "3:29:45", "remaining_time": "1:18:18", "throughput": 12497.44, "total_tokens": 157286400} {"current_steps": 76, "total_steps": 103, "loss": 0.9081, "lr": 8.008994813163995e-06, "epoch": 0.7325301204819277, "percentage": 73.79, "elapsed_time": "3:32:34", "remaining_time": "1:15:31", "throughput": 12496.38, "total_tokens": 159383552} {"current_steps": 77, "total_steps": 103, "loss": 0.8861, "lr": 7.457639292922675e-06, "epoch": 0.7421686746987952, "percentage": 74.76, "elapsed_time": "3:35:21", "remaining_time": "1:12:43", "throughput": 12496.81, "total_tokens": 161480704} {"current_steps": 78, "total_steps": 103, "loss": 0.8766, "lr": 6.92260225118122e-06, "epoch": 0.7518072289156627, "percentage": 75.73, "elapsed_time": "3:38:10", "remaining_time": "1:09:55", "throughput": 12496.11, "total_tokens": 163577856} {"current_steps": 79, "total_steps": 103, "loss": 0.8789, "lr": 6.4043813969201004e-06, "epoch": 0.7614457831325301, "percentage": 76.7, "elapsed_time": "3:40:58", "remaining_time": "1:07:08", "throughput": 12495.36, "total_tokens": 165675008} {"current_steps": 80, "total_steps": 103, "loss": 0.8952, "lr": 5.903458796151381e-06, "epoch": 0.7710843373493976, "percentage": 77.67, "elapsed_time": "3:43:47", "remaining_time": "1:04:20", "throughput": 12495.06, "total_tokens": 167772160} {"current_steps": 81, "total_steps": 103, "loss": 0.8847, "lr": 5.420300423485167e-06, "epoch": 0.7807228915662651, "percentage": 78.64, "elapsed_time": "3:46:35", "remaining_time": "1:01:32", "throughput": 12494.12, "total_tokens": 169869312} {"current_steps": 82, "total_steps": 103, "loss": 0.8848, "lr": 4.95535572866474e-06, "epoch": 0.7903614457831325, "percentage": 79.61, "elapsed_time": "3:49:24", "remaining_time": "0:58:45", "throughput": 12493.19, "total_tokens": 171966464} {"current_steps": 83, "total_steps": 103, "loss": 0.8884, "lr": 4.5090572184736864e-06, "epoch": 0.8, "percentage": 80.58, "elapsed_time": "3:52:13", "remaining_time": "0:55:57", "throughput": 12492.26, "total_tokens": 174063616} {"current_steps": 84, "total_steps": 103, "loss": 0.8885, "lr": 4.081820054403948e-06, "epoch": 0.8096385542168675, "percentage": 81.55, "elapsed_time": "3:55:02", "remaining_time": "0:53:09", "throughput": 12491.51, "total_tokens": 176160768} {"current_steps": 85, "total_steps": 103, "loss": 0.8821, "lr": 3.674041666458963e-06, "epoch": 0.8192771084337349, "percentage": 82.52, "elapsed_time": "3:57:50", "remaining_time": "0:50:21", "throughput": 12491.34, "total_tokens": 178257920} {"current_steps": 86, "total_steps": 103, "loss": 0.9095, "lr": 3.2861013834512846e-06, "epoch": 0.8289156626506025, "percentage": 83.5, "elapsed_time": "4:00:39", "remaining_time": "0:47:34", "throughput": 12490.8, "total_tokens": 180355072} {"current_steps": 87, "total_steps": 103, "loss": 0.8505, "lr": 2.918360080138485e-06, "epoch": 0.8385542168674699, "percentage": 84.47, "elapsed_time": "4:03:26", "remaining_time": "0:44:46", "throughput": 12490.77, "total_tokens": 182452224} {"current_steps": 88, "total_steps": 103, "loss": 0.8776, "lr": 2.57115984152565e-06, "epoch": 0.8481927710843373, "percentage": 85.44, "elapsed_time": "4:06:15", "remaining_time": "0:41:58", "throughput": 12490.59, "total_tokens": 184549376} {"current_steps": 89, "total_steps": 103, "loss": 0.8932, "lr": 2.2448236446466846e-06, "epoch": 0.8578313253012049, "percentage": 86.41, "elapsed_time": "4:09:03", "remaining_time": "0:39:10", "throughput": 12490.33, "total_tokens": 186646528} {"current_steps": 90, "total_steps": 103, "loss": 0.8887, "lr": 1.939655058120521e-06, "epoch": 0.8674698795180723, "percentage": 87.38, "elapsed_time": "4:11:51", "remaining_time": "0:36:22", "throughput": 12489.73, "total_tokens": 188743680} {"current_steps": 91, "total_steps": 103, "loss": 0.8613, "lr": 1.6559379597616137e-06, "epoch": 0.8771084337349397, "percentage": 88.35, "elapsed_time": "4:14:39", "remaining_time": "0:33:34", "throughput": 12489.75, "total_tokens": 190840832} {"current_steps": 92, "total_steps": 103, "loss": 0.9218, "lr": 1.3939362725075345e-06, "epoch": 0.8867469879518072, "percentage": 89.32, "elapsed_time": "4:17:28", "remaining_time": "0:30:47", "throughput": 12489.1, "total_tokens": 192937984} {"current_steps": 93, "total_steps": 103, "loss": 0.9037, "lr": 1.1538937189091825e-06, "epoch": 0.8963855421686747, "percentage": 90.29, "elapsed_time": "4:20:16", "remaining_time": "0:27:59", "throughput": 12489.14, "total_tokens": 195035136} {"current_steps": 94, "total_steps": 103, "loss": 0.8971, "lr": 9.360335944121029e-07, "epoch": 0.9060240963855422, "percentage": 91.26, "elapsed_time": "4:23:05", "remaining_time": "0:25:11", "throughput": 12488.37, "total_tokens": 197132288} {"current_steps": 95, "total_steps": 103, "loss": 0.9131, "lr": 7.405585596397313e-07, "epoch": 0.9156626506024096, "percentage": 92.23, "elapsed_time": "4:25:53", "remaining_time": "0:22:23", "throughput": 12488.09, "total_tokens": 199229440} {"current_steps": 96, "total_steps": 103, "loss": 0.9085, "lr": 5.676504518718761e-07, "epoch": 0.9253012048192771, "percentage": 93.2, "elapsed_time": "4:28:41", "remaining_time": "0:19:35", "throughput": 12488.43, "total_tokens": 201326592} {"current_steps": 97, "total_steps": 103, "loss": 0.8804, "lr": 4.1747011589368947e-07, "epoch": 0.9349397590361446, "percentage": 94.17, "elapsed_time": "4:31:28", "remaining_time": "0:16:47", "throughput": 12488.47, "total_tokens": 203423744} {"current_steps": 98, "total_steps": 103, "loss": 0.8935, "lr": 2.9015725437259724e-07, "epoch": 0.944578313253012, "percentage": 95.15, "elapsed_time": "4:34:16", "remaining_time": "0:13:59", "throughput": 12488.79, "total_tokens": 205520896} {"current_steps": 99, "total_steps": 103, "loss": 0.8984, "lr": 1.8583029790230355e-07, "epoch": 0.9542168674698795, "percentage": 96.12, "elapsed_time": "4:37:04", "remaining_time": "0:11:11", "throughput": 12488.8, "total_tokens": 207618048} {"current_steps": 100, "total_steps": 103, "loss": 0.9129, "lr": 1.0458629483476867e-07, "epoch": 0.963855421686747, "percentage": 97.09, "elapsed_time": "4:39:52", "remaining_time": "0:08:23", "throughput": 12488.69, "total_tokens": 209715200} {"current_steps": 101, "total_steps": 103, "loss": 0.9183, "lr": 4.650082100265407e-08, "epoch": 0.9734939759036144, "percentage": 98.06, "elapsed_time": "4:42:39", "remaining_time": "0:05:35", "throughput": 12489.13, "total_tokens": 211812352} {"current_steps": 102, "total_steps": 103, "loss": 0.8792, "lr": 1.1627909416211947e-08, "epoch": 0.983132530120482, "percentage": 99.03, "elapsed_time": "4:45:27", "remaining_time": "0:02:47", "throughput": 12489.25, "total_tokens": 213909504} {"current_steps": 103, "total_steps": 103, "loss": 0.8806, "lr": 0.0, "epoch": 0.9927710843373494, "percentage": 100.0, "elapsed_time": "4:48:15", "remaining_time": "0:00:00", "throughput": 12489.23, "total_tokens": 216006656} {"current_steps": 103, "total_steps": 103, "epoch": 0.9927710843373494, "percentage": 100.0, "elapsed_time": "4:48:39", "remaining_time": "0:00:00", "throughput": 12471.66, "total_tokens": 216006656}