{"current_steps": 10, "total_steps": 23217, "loss": 1.186, "learning_rate": 4.999997711254574e-05, "epoch": 0.001292156609381057, "percentage": 0.04, "elapsed_time": "0:01:01", "remaining_time": "1 day, 15:20:31", "throughput": "1342.30", "total_tokens": 81920} {"current_steps": 20, "total_steps": 23217, "loss": 1.557, "learning_rate": 4.999990845022488e-05, "epoch": 0.002584313218762114, "percentage": 0.09, "elapsed_time": "0:01:52", "remaining_time": "1 day, 12:15:49", "throughput": "1455.61", "total_tokens": 163840} {"current_steps": 30, "total_steps": 23217, "loss": 1.2102, "learning_rate": 4.999979401316311e-05, "epoch": 0.003876469828143171, "percentage": 0.13, "elapsed_time": "0:02:44", "remaining_time": "1 day, 11:17:52", "throughput": "1494.80", "total_tokens": 245760} {"current_steps": 40, "total_steps": 23217, "loss": 1.1901, "learning_rate": 4.999963380156999e-05, "epoch": 0.005168626437524228, "percentage": 0.17, "elapsed_time": "0:03:34", "remaining_time": "1 day, 10:34:04", "throughput": "1525.71", "total_tokens": 327680} {"current_steps": 50, "total_steps": 23217, "loss": 1.0801, "learning_rate": 4.9999427815738856e-05, "epoch": 0.006460783046905285, "percentage": 0.22, "elapsed_time": "0:04:24", "remaining_time": "1 day, 9:59:03", "throughput": "1551.25", "total_tokens": 409600} {"current_steps": 60, "total_steps": 23217, "loss": 1.039, "learning_rate": 4.999917605604688e-05, "epoch": 0.007752939656286342, "percentage": 0.26, "elapsed_time": "0:05:13", "remaining_time": "1 day, 9:35:09", "throughput": "1568.96", "total_tokens": 491520} {"current_steps": 70, "total_steps": 23217, "loss": 1.1476, "learning_rate": 4.999887852295502e-05, "epoch": 0.009045096265667399, "percentage": 0.3, "elapsed_time": "0:06:03", "remaining_time": "1 day, 9:21:39", "throughput": "1578.86", "total_tokens": 573440} {"current_steps": 80, "total_steps": 23217, "loss": 0.8873, "learning_rate": 4.9998535217008054e-05, "epoch": 0.010337252875048455, "percentage": 0.34, "elapsed_time": "0:06:52", "remaining_time": "1 day, 9:07:25", "throughput": "1589.48", "total_tokens": 655360} {"current_steps": 90, "total_steps": 23217, "loss": 0.959, "learning_rate": 4.999814613883459e-05, "epoch": 0.011629409484429512, "percentage": 0.39, "elapsed_time": "0:07:41", "remaining_time": "1 day, 8:56:48", "throughput": "1597.32", "total_tokens": 737280} {"current_steps": 100, "total_steps": 23217, "loss": 1.0245, "learning_rate": 4.999771128914701e-05, "epoch": 0.01292156609381057, "percentage": 0.43, "elapsed_time": "0:08:31", "remaining_time": "1 day, 8:52:04", "throughput": "1600.46", "total_tokens": 819200} {"current_steps": 110, "total_steps": 23217, "loss": 1.0335, "learning_rate": 4.999723066874154e-05, "epoch": 0.014213722703191626, "percentage": 0.47, "elapsed_time": "0:09:22", "remaining_time": "1 day, 8:48:52", "throughput": "1602.38", "total_tokens": 901120} {"current_steps": 120, "total_steps": 23217, "loss": 1.224, "learning_rate": 4.9996704278498185e-05, "epoch": 0.015505879312572683, "percentage": 0.52, "elapsed_time": "0:10:12", "remaining_time": "1 day, 8:45:56", "throughput": "1604.07", "total_tokens": 983040} {"current_steps": 130, "total_steps": 23217, "loss": 1.2653, "learning_rate": 4.9996132119380764e-05, "epoch": 0.016798035921953742, "percentage": 0.56, "elapsed_time": "0:11:03", "remaining_time": "1 day, 8:43:29", "throughput": "1605.37", "total_tokens": 1064960} {"current_steps": 140, "total_steps": 23217, "loss": 1.152, "learning_rate": 4.999551419243691e-05, "epoch": 0.018090192531334797, "percentage": 0.6, "elapsed_time": "0:11:53", "remaining_time": "1 day, 8:41:02", "throughput": "1606.69", "total_tokens": 1146880} {"current_steps": 150, "total_steps": 23217, "loss": 1.1498, "learning_rate": 4.9994850498798026e-05, "epoch": 0.019382349140715856, "percentage": 0.65, "elapsed_time": "0:12:44", "remaining_time": "1 day, 8:39:42", "throughput": "1607.08", "total_tokens": 1228800} {"current_steps": 160, "total_steps": 23217, "loss": 0.9303, "learning_rate": 4.999414103967934e-05, "epoch": 0.02067450575009691, "percentage": 0.69, "elapsed_time": "0:13:35", "remaining_time": "1 day, 8:38:26", "throughput": "1607.42", "total_tokens": 1310720} {"current_steps": 170, "total_steps": 23217, "loss": 0.9473, "learning_rate": 4.9993385816379876e-05, "epoch": 0.02196666235947797, "percentage": 0.73, "elapsed_time": "0:14:26", "remaining_time": "1 day, 8:36:46", "throughput": "1608.10", "total_tokens": 1392640} {"current_steps": 180, "total_steps": 23217, "loss": 1.0698, "learning_rate": 4.999258483028243e-05, "epoch": 0.023258818968859025, "percentage": 0.78, "elapsed_time": "0:15:16", "remaining_time": "1 day, 8:35:29", "throughput": "1608.45", "total_tokens": 1474560} {"current_steps": 190, "total_steps": 23217, "loss": 1.1219, "learning_rate": 4.999173808285362e-05, "epoch": 0.024550975578240083, "percentage": 0.82, "elapsed_time": "0:16:07", "remaining_time": "1 day, 8:34:04", "throughput": "1608.92", "total_tokens": 1556480} {"current_steps": 200, "total_steps": 23217, "loss": 1.3272, "learning_rate": 4.999084557564383e-05, "epoch": 0.02584313218762114, "percentage": 0.86, "elapsed_time": "0:16:57", "remaining_time": "1 day, 8:32:25", "throughput": "1609.59", "total_tokens": 1638400} {"current_steps": 210, "total_steps": 23217, "loss": 1.1947, "learning_rate": 4.9989907310287243e-05, "epoch": 0.027135288797002197, "percentage": 0.9, "elapsed_time": "0:17:48", "remaining_time": "1 day, 8:30:44", "throughput": "1610.27", "total_tokens": 1720320} {"current_steps": 220, "total_steps": 23217, "loss": 1.2172, "learning_rate": 4.998892328850181e-05, "epoch": 0.028427445406383253, "percentage": 0.95, "elapsed_time": "0:18:39", "remaining_time": "1 day, 8:31:15", "throughput": "1609.15", "total_tokens": 1802240} {"current_steps": 230, "total_steps": 23217, "loss": 1.3311, "learning_rate": 4.9987893512089276e-05, "epoch": 0.02971960201576431, "percentage": 0.99, "elapsed_time": "0:19:37", "remaining_time": "1 day, 8:41:55", "throughput": "1599.70", "total_tokens": 1884160} {"current_steps": 10, "total_steps": 23217, "loss": 1.1858, "learning_rate": 4.999997711254574e-05, "epoch": 0.001292156609381057, "percentage": 0.04, "elapsed_time": "0:00:56", "remaining_time": "1 day, 12:12:11", "throughput": "1458.68", "total_tokens": 81920} {"current_steps": 20, "total_steps": 23217, "loss": 1.5568, "learning_rate": 4.999990845022488e-05, "epoch": 0.002584313218762114, "percentage": 0.09, "elapsed_time": "0:01:46", "remaining_time": "1 day, 10:22:50", "throughput": "1535.34", "total_tokens": 163840} {"current_steps": 30, "total_steps": 23217, "loss": 1.2099, "learning_rate": 4.999979401316311e-05, "epoch": 0.003876469828143171, "percentage": 0.13, "elapsed_time": "0:02:46", "remaining_time": "1 day, 11:46:29", "throughput": "1474.87", "total_tokens": 245760} {"current_steps": 40, "total_steps": 23217, "loss": 1.1902, "learning_rate": 4.999963380156999e-05, "epoch": 0.005168626437524228, "percentage": 0.17, "elapsed_time": "0:03:45", "remaining_time": "1 day, 12:14:32", "throughput": "1455.22", "total_tokens": 327680} {"current_steps": 50, "total_steps": 23217, "loss": 1.0802, "learning_rate": 4.9999427815738856e-05, "epoch": 0.006460783046905285, "percentage": 0.22, "elapsed_time": "0:04:43", "remaining_time": "1 day, 12:30:48", "throughput": "1443.79", "total_tokens": 409600} {"current_steps": 60, "total_steps": 23217, "loss": 1.0393, "learning_rate": 4.999917605604688e-05, "epoch": 0.007752939656286342, "percentage": 0.26, "elapsed_time": "0:05:41", "remaining_time": "1 day, 12:33:44", "throughput": "1441.24", "total_tokens": 491520} {"current_steps": 70, "total_steps": 23217, "loss": 1.1473, "learning_rate": 4.999887852295502e-05, "epoch": 0.009045096265667399, "percentage": 0.3, "elapsed_time": "0:06:38", "remaining_time": "1 day, 12:34:58", "throughput": "1439.81", "total_tokens": 573440} {"current_steps": 80, "total_steps": 23217, "loss": 0.8868, "learning_rate": 4.9998535217008054e-05, "epoch": 0.010337252875048455, "percentage": 0.34, "elapsed_time": "0:07:34", "remaining_time": "1 day, 12:29:52", "throughput": "1442.54", "total_tokens": 655360} {"current_steps": 90, "total_steps": 23217, "loss": 0.9585, "learning_rate": 4.999814613883459e-05, "epoch": 0.011629409484429512, "percentage": 0.39, "elapsed_time": "0:08:29", "remaining_time": "1 day, 12:22:58", "throughput": "1446.47", "total_tokens": 737280} {"current_steps": 100, "total_steps": 23217, "loss": 1.0241, "learning_rate": 4.999771128914701e-05, "epoch": 0.01292156609381057, "percentage": 0.43, "elapsed_time": "0:09:25", "remaining_time": "1 day, 12:18:39", "throughput": "1448.71", "total_tokens": 819200} {"current_steps": 110, "total_steps": 23217, "loss": 1.034, "learning_rate": 4.999723066874154e-05, "epoch": 0.014213722703191626, "percentage": 0.47, "elapsed_time": "0:10:21", "remaining_time": "1 day, 12:14:26", "throughput": "1450.89", "total_tokens": 901120} {"current_steps": 120, "total_steps": 23217, "loss": 1.2244, "learning_rate": 4.9996704278498185e-05, "epoch": 0.015505879312572683, "percentage": 0.52, "elapsed_time": "0:11:17", "remaining_time": "1 day, 12:12:50", "throughput": "1451.32", "total_tokens": 983040} {"current_steps": 130, "total_steps": 23217, "loss": 1.266, "learning_rate": 4.9996132119380764e-05, "epoch": 0.016798035921953742, "percentage": 0.56, "elapsed_time": "0:12:15", "remaining_time": "1 day, 12:16:46", "throughput": "1448.08", "total_tokens": 1064960} {"current_steps": 140, "total_steps": 23217, "loss": 1.1523, "learning_rate": 4.999551419243691e-05, "epoch": 0.018090192531334797, "percentage": 0.6, "elapsed_time": "0:13:12", "remaining_time": "1 day, 12:18:31", "throughput": "1446.29", "total_tokens": 1146880} {"current_steps": 150, "total_steps": 23217, "loss": 1.1496, "learning_rate": 4.9994850498798026e-05, "epoch": 0.019382349140715856, "percentage": 0.65, "elapsed_time": "0:14:11", "remaining_time": "1 day, 12:21:34", "throughput": "1443.64", "total_tokens": 1228800} {"current_steps": 160, "total_steps": 23217, "loss": 0.9302, "learning_rate": 4.999414103967934e-05, "epoch": 0.02067450575009691, "percentage": 0.69, "elapsed_time": "0:15:10", "remaining_time": "1 day, 12:25:50", "throughput": "1440.20", "total_tokens": 1310720} {"current_steps": 170, "total_steps": 23217, "loss": 0.9475, "learning_rate": 4.9993385816379876e-05, "epoch": 0.02196666235947797, "percentage": 0.73, "elapsed_time": "0:16:18", "remaining_time": "1 day, 12:51:37", "throughput": "1422.80", "total_tokens": 1392640} {"current_steps": 180, "total_steps": 23217, "loss": 1.0703, "learning_rate": 4.999258483028243e-05, "epoch": 0.023258818968859025, "percentage": 0.78, "elapsed_time": "0:17:21", "remaining_time": "1 day, 13:00:38", "throughput": "1416.40", "total_tokens": 1474560} {"current_steps": 190, "total_steps": 23217, "loss": 1.1235, "learning_rate": 4.999173808285362e-05, "epoch": 0.024550975578240083, "percentage": 0.82, "elapsed_time": "0:18:54", "remaining_time": "1 day, 14:10:35", "throughput": "1372.55", "total_tokens": 1556480} {"current_steps": 200, "total_steps": 23217, "loss": 1.3278, "learning_rate": 4.999084557564383e-05, "epoch": 0.02584313218762114, "percentage": 0.86, "elapsed_time": "0:20:27", "remaining_time": "1 day, 15:14:26", "throughput": "1334.75", "total_tokens": 1638400} {"current_steps": 210, "total_steps": 23217, "loss": 1.1928, "learning_rate": 4.9989907310287243e-05, "epoch": 0.027135288797002197, "percentage": 0.9, "elapsed_time": "0:22:00", "remaining_time": "1 day, 16:10:23", "throughput": "1303.20", "total_tokens": 1720320} {"current_steps": 220, "total_steps": 23217, "loss": 1.215, "learning_rate": 4.998892328850181e-05, "epoch": 0.028427445406383253, "percentage": 0.95, "elapsed_time": "0:23:33", "remaining_time": "1 day, 17:02:37", "throughput": "1275.01", "total_tokens": 1802240} {"current_steps": 230, "total_steps": 23217, "loss": 1.3318, "learning_rate": 4.9987893512089276e-05, "epoch": 0.02971960201576431, "percentage": 0.99, "elapsed_time": "0:24:43", "remaining_time": "1 day, 17:11:32", "throughput": "1269.86", "total_tokens": 1884160} {"current_steps": 240, "total_steps": 23217, "loss": 1.3226, "learning_rate": 4.998681798293516e-05, "epoch": 0.031011758625145366, "percentage": 1.03, "elapsed_time": "0:25:31", "remaining_time": "1 day, 16:43:20", "throughput": "1283.95", "total_tokens": 1966080} {"current_steps": 250, "total_steps": 23217, "loss": 1.1795, "learning_rate": 4.998569670300876e-05, "epoch": 0.03230391523452642, "percentage": 1.08, "elapsed_time": "0:26:18", "remaining_time": "1 day, 16:17:22", "throughput": "1297.18", "total_tokens": 2048000} {"current_steps": 260, "total_steps": 23217, "loss": 0.9646, "learning_rate": 4.9984529674363114e-05, "epoch": 0.033596071843907484, "percentage": 1.12, "elapsed_time": "0:27:06", "remaining_time": "1 day, 15:53:19", "throughput": "1309.64", "total_tokens": 2129920} {"current_steps": 270, "total_steps": 23217, "loss": 1.1236, "learning_rate": 4.998331689913506e-05, "epoch": 0.03488822845328854, "percentage": 1.16, "elapsed_time": "0:27:53", "remaining_time": "1 day, 15:30:53", "throughput": "1321.46", "total_tokens": 2211840} {"current_steps": 280, "total_steps": 23217, "loss": 0.9761, "learning_rate": 4.998205837954518e-05, "epoch": 0.036180385062669594, "percentage": 1.21, "elapsed_time": "0:28:41", "remaining_time": "1 day, 15:10:03", "throughput": "1332.59", "total_tokens": 2293760} {"current_steps": 290, "total_steps": 23217, "loss": 1.0846, "learning_rate": 4.998075411789783e-05, "epoch": 0.03747254167205065, "percentage": 1.25, "elapsed_time": "0:29:28", "remaining_time": "1 day, 14:50:39", "throughput": "1343.09", "total_tokens": 2375680} {"current_steps": 300, "total_steps": 23217, "loss": 0.9604, "learning_rate": 4.9979404116581104e-05, "epoch": 0.03876469828143171, "percentage": 1.29, "elapsed_time": "0:30:16", "remaining_time": "1 day, 14:32:31", "throughput": "1353.04", "total_tokens": 2457600} {"current_steps": 310, "total_steps": 23217, "loss": 1.135, "learning_rate": 4.9978008378066844e-05, "epoch": 0.04005685489081277, "percentage": 1.34, "elapsed_time": "0:31:03", "remaining_time": "1 day, 14:15:31", "throughput": "1362.46", "total_tokens": 2539520} {"current_steps": 320, "total_steps": 23217, "loss": 1.0162, "learning_rate": 4.997656690491064e-05, "epoch": 0.04134901150019382, "percentage": 1.38, "elapsed_time": "0:31:51", "remaining_time": "1 day, 13:59:27", "throughput": "1371.46", "total_tokens": 2621440} {"current_steps": 330, "total_steps": 23217, "loss": 1.0928, "learning_rate": 4.9975079699751825e-05, "epoch": 0.04264116810957488, "percentage": 1.42, "elapsed_time": "0:32:38", "remaining_time": "1 day, 13:44:23", "throughput": "1379.99", "total_tokens": 2703360} {"current_steps": 340, "total_steps": 23217, "loss": 1.4001, "learning_rate": 4.997354676531348e-05, "epoch": 0.04393332471895594, "percentage": 1.46, "elapsed_time": "0:33:26", "remaining_time": "1 day, 13:30:06", "throughput": "1388.14", "total_tokens": 2785280} {"current_steps": 350, "total_steps": 23217, "loss": 1.2969, "learning_rate": 4.997196810440239e-05, "epoch": 0.045225481328336994, "percentage": 1.51, "elapsed_time": "0:34:14", "remaining_time": "1 day, 13:16:36", "throughput": "1395.91", "total_tokens": 2867200} {"current_steps": 360, "total_steps": 23217, "loss": 1.0298, "learning_rate": 4.997034371990907e-05, "epoch": 0.04651763793771805, "percentage": 1.55, "elapsed_time": "0:35:01", "remaining_time": "1 day, 13:03:47", "throughput": "1403.34", "total_tokens": 2949120} {"current_steps": 370, "total_steps": 23217, "loss": 1.1618, "learning_rate": 4.9968673614807787e-05, "epoch": 0.04780979454709911, "percentage": 1.59, "elapsed_time": "0:35:48", "remaining_time": "1 day, 12:51:37", "throughput": "1410.45", "total_tokens": 3031040} {"current_steps": 380, "total_steps": 23217, "loss": 0.8982, "learning_rate": 4.9966957792156475e-05, "epoch": 0.04910195115648017, "percentage": 1.64, "elapsed_time": "0:36:36", "remaining_time": "1 day, 12:40:01", "throughput": "1417.26", "total_tokens": 3112960} {"current_steps": 390, "total_steps": 23217, "loss": 1.15, "learning_rate": 4.99651962550968e-05, "epoch": 0.05039410776586122, "percentage": 1.68, "elapsed_time": "0:37:23", "remaining_time": "1 day, 12:29:02", "throughput": "1423.75", "total_tokens": 3194880} {"current_steps": 400, "total_steps": 23217, "loss": 1.3498, "learning_rate": 4.996338900685414e-05, "epoch": 0.05168626437524228, "percentage": 1.72, "elapsed_time": "0:38:11", "remaining_time": "1 day, 12:18:34", "throughput": "1429.96", "total_tokens": 3276800} {"current_steps": 410, "total_steps": 23217, "loss": 0.8624, "learning_rate": 4.996153605073756e-05, "epoch": 0.05297842098462334, "percentage": 1.77, "elapsed_time": "0:38:59", "remaining_time": "1 day, 12:08:35", "throughput": "1435.92", "total_tokens": 3358720} {"current_steps": 420, "total_steps": 23217, "loss": 1.1246, "learning_rate": 4.9959637390139814e-05, "epoch": 0.054270577594004395, "percentage": 1.81, "elapsed_time": "0:39:46", "remaining_time": "1 day, 11:59:02", "throughput": "1441.64", "total_tokens": 3440640} {"current_steps": 430, "total_steps": 23217, "loss": 0.8941, "learning_rate": 4.995769302853733e-05, "epoch": 0.05556273420338545, "percentage": 1.85, "elapsed_time": "0:40:34", "remaining_time": "1 day, 11:49:53", "throughput": "1447.13", "total_tokens": 3522560} {"current_steps": 440, "total_steps": 23217, "loss": 1.1223, "learning_rate": 4.995570296949024e-05, "epoch": 0.056854890812766505, "percentage": 1.9, "elapsed_time": "0:41:21", "remaining_time": "1 day, 11:41:03", "throughput": "1452.47", "total_tokens": 3604480} {"current_steps": 450, "total_steps": 23217, "loss": 0.7063, "learning_rate": 4.995366721664234e-05, "epoch": 0.05814704742214757, "percentage": 1.94, "elapsed_time": "0:42:09", "remaining_time": "1 day, 11:32:38", "throughput": "1457.56", "total_tokens": 3686400} {"current_steps": 460, "total_steps": 23217, "loss": 0.8703, "learning_rate": 4.995158577372107e-05, "epoch": 0.05943920403152862, "percentage": 1.98, "elapsed_time": "0:42:56", "remaining_time": "1 day, 11:24:29", "throughput": "1462.51", "total_tokens": 3768320} {"current_steps": 470, "total_steps": 23217, "loss": 0.8798, "learning_rate": 4.9949458644537556e-05, "epoch": 0.06073136064090968, "percentage": 2.02, "elapsed_time": "0:43:44", "remaining_time": "1 day, 11:16:40", "throughput": "1467.27", "total_tokens": 3850240} {"current_steps": 480, "total_steps": 23217, "loss": 1.154, "learning_rate": 4.9947285832986553e-05, "epoch": 0.06202351725029073, "percentage": 2.07, "elapsed_time": "0:44:31", "remaining_time": "1 day, 11:09:11", "throughput": "1471.82", "total_tokens": 3932160} {"current_steps": 490, "total_steps": 23217, "loss": 1.179, "learning_rate": 4.9945067343046494e-05, "epoch": 0.0633156738596718, "percentage": 2.11, "elapsed_time": "0:45:19", "remaining_time": "1 day, 11:01:57", "throughput": "1476.24", "total_tokens": 4014080} {"current_steps": 500, "total_steps": 23217, "loss": 1.3203, "learning_rate": 4.9942803178779396e-05, "epoch": 0.06460783046905284, "percentage": 2.15, "elapsed_time": "0:46:06", "remaining_time": "1 day, 10:54:59", "throughput": "1480.49", "total_tokens": 4096000} {"current_steps": 510, "total_steps": 23217, "loss": 0.95, "learning_rate": 4.994049334433095e-05, "epoch": 0.0658999870784339, "percentage": 2.2, "elapsed_time": "0:46:54", "remaining_time": "1 day, 10:48:16", "throughput": "1484.60", "total_tokens": 4177920} {"current_steps": 520, "total_steps": 23217, "loss": 0.721, "learning_rate": 4.9938137843930466e-05, "epoch": 0.06719214368781497, "percentage": 2.24, "elapsed_time": "0:47:41", "remaining_time": "1 day, 10:41:47", "throughput": "1488.57", "total_tokens": 4259840} {"current_steps": 530, "total_steps": 23217, "loss": 1.1505, "learning_rate": 4.993573668189083e-05, "epoch": 0.06848430029719602, "percentage": 2.28, "elapsed_time": "0:48:29", "remaining_time": "1 day, 10:35:30", "throughput": "1492.42", "total_tokens": 4341760} {"current_steps": 540, "total_steps": 23217, "loss": 1.1169, "learning_rate": 4.9933289862608584e-05, "epoch": 0.06977645690657708, "percentage": 2.33, "elapsed_time": "0:49:16", "remaining_time": "1 day, 10:29:25", "throughput": "1496.15", "total_tokens": 4423680} {"current_steps": 550, "total_steps": 23217, "loss": 1.0893, "learning_rate": 4.9930797390563834e-05, "epoch": 0.07106861351595814, "percentage": 2.37, "elapsed_time": "0:50:04", "remaining_time": "1 day, 10:23:32", "throughput": "1499.76", "total_tokens": 4505600} {"current_steps": 560, "total_steps": 23217, "loss": 0.6521, "learning_rate": 4.9928259270320295e-05, "epoch": 0.07236077012533919, "percentage": 2.41, "elapsed_time": "0:50:51", "remaining_time": "1 day, 10:17:49", "throughput": "1503.25", "total_tokens": 4587520} {"current_steps": 570, "total_steps": 23217, "loss": 0.9833, "learning_rate": 4.992567550652525e-05, "epoch": 0.07365292673472025, "percentage": 2.46, "elapsed_time": "0:51:39", "remaining_time": "1 day, 10:12:19", "throughput": "1506.62", "total_tokens": 4669440} {"current_steps": 580, "total_steps": 23217, "loss": 1.1048, "learning_rate": 4.992304610390955e-05, "epoch": 0.0749450833441013, "percentage": 2.5, "elapsed_time": "0:52:26", "remaining_time": "1 day, 10:06:58", "throughput": "1509.88", "total_tokens": 4751360} {"current_steps": 590, "total_steps": 23217, "loss": 0.8898, "learning_rate": 4.9920371067287645e-05, "epoch": 0.07623723995348236, "percentage": 2.54, "elapsed_time": "0:53:14", "remaining_time": "1 day, 10:01:44", "throughput": "1513.08", "total_tokens": 4833280} {"current_steps": 600, "total_steps": 23217, "loss": 0.9906, "learning_rate": 4.9917650401557505e-05, "epoch": 0.07752939656286342, "percentage": 2.58, "elapsed_time": "0:54:01", "remaining_time": "1 day, 9:56:38", "throughput": "1516.21", "total_tokens": 4915200} {"current_steps": 610, "total_steps": 23217, "loss": 0.9923, "learning_rate": 4.9914884111700656e-05, "epoch": 0.07882155317224447, "percentage": 2.63, "elapsed_time": "0:54:49", "remaining_time": "1 day, 9:51:40", "throughput": "1519.24", "total_tokens": 4997120} {"current_steps": 620, "total_steps": 23217, "loss": 0.8434, "learning_rate": 4.991207220278217e-05, "epoch": 0.08011370978162553, "percentage": 2.67, "elapsed_time": "0:55:36", "remaining_time": "1 day, 9:46:53", "throughput": "1522.16", "total_tokens": 5079040} {"current_steps": 630, "total_steps": 23217, "loss": 0.6813, "learning_rate": 4.990921467995064e-05, "epoch": 0.0814058663910066, "percentage": 2.71, "elapsed_time": "0:56:24", "remaining_time": "1 day, 9:42:14", "throughput": "1524.99", "total_tokens": 5160960} {"current_steps": 640, "total_steps": 23217, "loss": 0.8735, "learning_rate": 4.9906311548438184e-05, "epoch": 0.08269802300038764, "percentage": 2.76, "elapsed_time": "0:57:11", "remaining_time": "1 day, 9:37:39", "throughput": "1527.76", "total_tokens": 5242880} {"current_steps": 650, "total_steps": 23217, "loss": 1.1035, "learning_rate": 4.990336281356042e-05, "epoch": 0.0839901796097687, "percentage": 2.8, "elapsed_time": "0:57:59", "remaining_time": "1 day, 9:33:13", "throughput": "1530.45", "total_tokens": 5324800} {"current_steps": 660, "total_steps": 23217, "loss": 0.8329, "learning_rate": 4.9900368480716466e-05, "epoch": 0.08528233621914975, "percentage": 2.84, "elapsed_time": "0:58:46", "remaining_time": "1 day, 9:28:55", "throughput": "1533.04", "total_tokens": 5406720} {"current_steps": 670, "total_steps": 23217, "loss": 1.1088, "learning_rate": 4.9897328555388943e-05, "epoch": 0.08657449282853082, "percentage": 2.89, "elapsed_time": "0:59:34", "remaining_time": "1 day, 9:24:45", "throughput": "1535.55", "total_tokens": 5488640} {"current_steps": 680, "total_steps": 23217, "loss": 1.0048, "learning_rate": 4.989424304314395e-05, "epoch": 0.08786664943791188, "percentage": 2.93, "elapsed_time": "1:00:21", "remaining_time": "1 day, 9:20:38", "throughput": "1538.03", "total_tokens": 5570560} {"current_steps": 690, "total_steps": 23217, "loss": 0.9396, "learning_rate": 4.9891111949631023e-05, "epoch": 0.08915880604729293, "percentage": 2.97, "elapsed_time": "1:01:09", "remaining_time": "1 day, 9:16:38", "throughput": "1540.43", "total_tokens": 5652480} {"current_steps": 700, "total_steps": 23217, "loss": 1.1961, "learning_rate": 4.988793528058321e-05, "epoch": 0.09045096265667399, "percentage": 3.02, "elapsed_time": "1:01:56", "remaining_time": "1 day, 9:12:44", "throughput": "1542.76", "total_tokens": 5734400} {"current_steps": 710, "total_steps": 23217, "loss": 0.9563, "learning_rate": 4.988471304181697e-05, "epoch": 0.09174311926605505, "percentage": 3.06, "elapsed_time": "1:02:44", "remaining_time": "1 day, 9:08:54", "throughput": "1545.05", "total_tokens": 5816320} {"current_steps": 720, "total_steps": 23217, "loss": 0.9487, "learning_rate": 4.988144523923221e-05, "epoch": 0.0930352758754361, "percentage": 3.1, "elapsed_time": "1:03:32", "remaining_time": "1 day, 9:05:10", "throughput": "1547.26", "total_tokens": 5898240} {"current_steps": 730, "total_steps": 23217, "loss": 0.9847, "learning_rate": 4.987813187881226e-05, "epoch": 0.09432743248481716, "percentage": 3.14, "elapsed_time": "1:04:19", "remaining_time": "1 day, 9:01:32", "throughput": "1549.41", "total_tokens": 5980160} {"current_steps": 740, "total_steps": 23217, "loss": 1.3118, "learning_rate": 4.987477296662387e-05, "epoch": 0.09561958909419822, "percentage": 3.19, "elapsed_time": "1:05:07", "remaining_time": "1 day, 8:57:56", "throughput": "1551.54", "total_tokens": 6062080} {"current_steps": 750, "total_steps": 23217, "loss": 1.0996, "learning_rate": 4.987136850881721e-05, "epoch": 0.09691174570357927, "percentage": 3.23, "elapsed_time": "1:05:54", "remaining_time": "1 day, 8:54:26", "throughput": "1553.61", "total_tokens": 6144000} {"current_steps": 760, "total_steps": 23217, "loss": 0.9023, "learning_rate": 4.986791851162582e-05, "epoch": 0.09820390231296033, "percentage": 3.27, "elapsed_time": "1:06:42", "remaining_time": "1 day, 8:50:58", "throughput": "1555.64", "total_tokens": 6225920} {"current_steps": 770, "total_steps": 23217, "loss": 1.0904, "learning_rate": 4.986442298136663e-05, "epoch": 0.09949605892234138, "percentage": 3.32, "elapsed_time": "1:07:29", "remaining_time": "1 day, 8:47:35", "throughput": "1557.62", "total_tokens": 6307840} {"current_steps": 780, "total_steps": 23217, "loss": 0.9374, "learning_rate": 4.986088192443995e-05, "epoch": 0.10078821553172244, "percentage": 3.36, "elapsed_time": "1:08:17", "remaining_time": "1 day, 8:44:17", "throughput": "1559.55", "total_tokens": 6389760} {"current_steps": 790, "total_steps": 23217, "loss": 0.8173, "learning_rate": 4.985729534732944e-05, "epoch": 0.1020803721411035, "percentage": 3.4, "elapsed_time": "1:09:04", "remaining_time": "1 day, 8:41:02", "throughput": "1561.44", "total_tokens": 6471680} {"current_steps": 800, "total_steps": 23217, "loss": 0.9162, "learning_rate": 4.98536632566021e-05, "epoch": 0.10337252875048455, "percentage": 3.45, "elapsed_time": "1:09:52", "remaining_time": "1 day, 8:37:50", "throughput": "1563.29", "total_tokens": 6553600} {"current_steps": 810, "total_steps": 23217, "loss": 0.7986, "learning_rate": 4.9849985658908296e-05, "epoch": 0.10466468535986562, "percentage": 3.49, "elapsed_time": "1:10:39", "remaining_time": "1 day, 8:34:42", "throughput": "1565.09", "total_tokens": 6635520} {"current_steps": 820, "total_steps": 23217, "loss": 0.7034, "learning_rate": 4.9846262560981674e-05, "epoch": 0.10595684196924668, "percentage": 3.53, "elapsed_time": "1:11:27", "remaining_time": "1 day, 8:31:37", "throughput": "1566.86", "total_tokens": 6717440} {"current_steps": 830, "total_steps": 23217, "loss": 0.9466, "learning_rate": 4.9842493969639215e-05, "epoch": 0.10724899857862773, "percentage": 3.57, "elapsed_time": "1:12:14", "remaining_time": "1 day, 8:28:35", "throughput": "1568.60", "total_tokens": 6799360} {"current_steps": 840, "total_steps": 23217, "loss": 1.2844, "learning_rate": 4.9838679891781214e-05, "epoch": 0.10854115518800879, "percentage": 3.62, "elapsed_time": "1:13:02", "remaining_time": "1 day, 8:25:38", "throughput": "1570.28", "total_tokens": 6881280} {"current_steps": 850, "total_steps": 23217, "loss": 0.7703, "learning_rate": 4.983482033439122e-05, "epoch": 0.10983331179738984, "percentage": 3.66, "elapsed_time": "1:13:49", "remaining_time": "1 day, 8:22:43", "throughput": "1571.94", "total_tokens": 6963200} {"current_steps": 860, "total_steps": 23217, "loss": 1.2312, "learning_rate": 4.9830915304536065e-05, "epoch": 0.1111254684067709, "percentage": 3.7, "elapsed_time": "1:14:37", "remaining_time": "1 day, 8:19:51", "throughput": "1573.55", "total_tokens": 7045120} {"current_steps": 870, "total_steps": 23217, "loss": 1.3658, "learning_rate": 4.982696480936586e-05, "epoch": 0.11241762501615196, "percentage": 3.75, "elapsed_time": "1:15:24", "remaining_time": "1 day, 8:17:03", "throughput": "1575.13", "total_tokens": 7127040} {"current_steps": 880, "total_steps": 23217, "loss": 1.0453, "learning_rate": 4.9822968856113926e-05, "epoch": 0.11370978162553301, "percentage": 3.79, "elapsed_time": "1:16:12", "remaining_time": "1 day, 8:14:16", "throughput": "1576.68", "total_tokens": 7208960} {"current_steps": 890, "total_steps": 23217, "loss": 1.1852, "learning_rate": 4.9818927452096855e-05, "epoch": 0.11500193823491407, "percentage": 3.83, "elapsed_time": "1:16:59", "remaining_time": "1 day, 8:11:30", "throughput": "1578.23", "total_tokens": 7290880} {"current_steps": 900, "total_steps": 23217, "loss": 1.2232, "learning_rate": 4.981484060471444e-05, "epoch": 0.11629409484429513, "percentage": 3.88, "elapsed_time": "1:17:47", "remaining_time": "1 day, 8:08:50", "throughput": "1579.71", "total_tokens": 7372800} {"current_steps": 910, "total_steps": 23217, "loss": 1.1144, "learning_rate": 4.981070832144967e-05, "epoch": 0.11758625145367618, "percentage": 3.92, "elapsed_time": "1:18:34", "remaining_time": "1 day, 8:06:09", "throughput": "1581.20", "total_tokens": 7454720} {"current_steps": 920, "total_steps": 23217, "loss": 1.0344, "learning_rate": 4.980653060986877e-05, "epoch": 0.11887840806305724, "percentage": 3.96, "elapsed_time": "1:19:22", "remaining_time": "1 day, 8:03:31", "throughput": "1582.65", "total_tokens": 7536640} {"current_steps": 930, "total_steps": 23217, "loss": 1.1751, "learning_rate": 4.9802307477621084e-05, "epoch": 0.1201705646724383, "percentage": 4.01, "elapsed_time": "1:20:09", "remaining_time": "1 day, 8:00:57", "throughput": "1584.07", "total_tokens": 7618560} {"current_steps": 940, "total_steps": 23217, "loss": 1.1844, "learning_rate": 4.9798038932439175e-05, "epoch": 0.12146272128181936, "percentage": 4.05, "elapsed_time": "1:20:56", "remaining_time": "1 day, 7:58:25", "throughput": "1585.45", "total_tokens": 7700480} {"current_steps": 950, "total_steps": 23217, "loss": 1.0034, "learning_rate": 4.979372498213871e-05, "epoch": 0.12275487789120042, "percentage": 4.09, "elapsed_time": "1:21:44", "remaining_time": "1 day, 7:55:56", "throughput": "1586.79", "total_tokens": 7782400} {"current_steps": 960, "total_steps": 23217, "loss": 0.9102, "learning_rate": 4.978936563461854e-05, "epoch": 0.12404703450058147, "percentage": 4.13, "elapsed_time": "1:22:32", "remaining_time": "1 day, 7:53:29", "throughput": "1588.10", "total_tokens": 7864320} {"current_steps": 970, "total_steps": 23217, "loss": 0.8154, "learning_rate": 4.97849608978606e-05, "epoch": 0.12533919110996253, "percentage": 4.18, "elapsed_time": "1:23:19", "remaining_time": "1 day, 7:51:04", "throughput": "1589.40", "total_tokens": 7946240} {"current_steps": 980, "total_steps": 23217, "loss": 1.0143, "learning_rate": 4.978051077992994e-05, "epoch": 0.1266313477193436, "percentage": 4.22, "elapsed_time": "1:24:06", "remaining_time": "1 day, 7:48:39", "throughput": "1590.69", "total_tokens": 8028160} {"current_steps": 990, "total_steps": 23217, "loss": 0.7723, "learning_rate": 4.9776015288974736e-05, "epoch": 0.12792350432872465, "percentage": 4.26, "elapsed_time": "1:24:54", "remaining_time": "1 day, 7:46:18", "throughput": "1591.94", "total_tokens": 8110080} {"current_steps": 1000, "total_steps": 23217, "loss": 1.2866, "learning_rate": 4.9771474433226194e-05, "epoch": 0.1292156609381057, "percentage": 4.31, "elapsed_time": "1:25:41", "remaining_time": "1 day, 7:43:59", "throughput": "1593.17", "total_tokens": 8192000} {"current_steps": 1010, "total_steps": 23217, "loss": 1.4743, "learning_rate": 4.976688822099861e-05, "epoch": 0.13050781754748675, "percentage": 4.35, "elapsed_time": "1:26:36", "remaining_time": "1 day, 7:44:14", "throughput": "1592.24", "total_tokens": 8273920} {"current_steps": 1020, "total_steps": 23217, "loss": 0.904, "learning_rate": 4.976225666068932e-05, "epoch": 0.1317999741568678, "percentage": 4.39, "elapsed_time": "1:27:23", "remaining_time": "1 day, 7:41:58", "throughput": "1593.41", "total_tokens": 8355840} {"current_steps": 1030, "total_steps": 23217, "loss": 0.9119, "learning_rate": 4.9757579760778697e-05, "epoch": 0.13309213076624887, "percentage": 4.44, "elapsed_time": "1:28:11", "remaining_time": "1 day, 7:39:43", "throughput": "1594.58", "total_tokens": 8437760} {"current_steps": 1040, "total_steps": 23217, "loss": 1.1209, "learning_rate": 4.9752857529830125e-05, "epoch": 0.13438428737562993, "percentage": 4.48, "elapsed_time": "1:28:59", "remaining_time": "1 day, 7:37:29", "throughput": "1595.74", "total_tokens": 8519680} {"current_steps": 1050, "total_steps": 23217, "loss": 1.2202, "learning_rate": 4.9748089976489996e-05, "epoch": 0.135676443985011, "percentage": 4.52, "elapsed_time": "1:29:46", "remaining_time": "1 day, 7:35:18", "throughput": "1596.86", "total_tokens": 8601600} {"current_steps": 1060, "total_steps": 23217, "loss": 1.2102, "learning_rate": 4.9743277109487674e-05, "epoch": 0.13696860059439203, "percentage": 4.57, "elapsed_time": "1:30:34", "remaining_time": "1 day, 7:33:07", "throughput": "1597.97", "total_tokens": 8683520} {"current_steps": 1070, "total_steps": 23217, "loss": 0.9835, "learning_rate": 4.973841893763551e-05, "epoch": 0.1382607572037731, "percentage": 4.61, "elapsed_time": "1:31:21", "remaining_time": "1 day, 7:30:59", "throughput": "1599.06", "total_tokens": 8765440} {"current_steps": 1080, "total_steps": 23217, "loss": 0.9155, "learning_rate": 4.9733515469828795e-05, "epoch": 0.13955291381315416, "percentage": 4.65, "elapsed_time": "1:32:09", "remaining_time": "1 day, 7:28:51", "throughput": "1600.13", "total_tokens": 8847360} {"current_steps": 1090, "total_steps": 23217, "loss": 1.196, "learning_rate": 4.972856671504576e-05, "epoch": 0.14084507042253522, "percentage": 4.69, "elapsed_time": "1:32:56", "remaining_time": "1 day, 7:26:46", "throughput": "1601.19", "total_tokens": 8929280} {"current_steps": 1100, "total_steps": 23217, "loss": 0.8913, "learning_rate": 4.9723572682347566e-05, "epoch": 0.14213722703191628, "percentage": 4.74, "elapsed_time": "1:33:44", "remaining_time": "1 day, 7:24:41", "throughput": "1602.23", "total_tokens": 9011200} {"current_steps": 1110, "total_steps": 23217, "loss": 1.1649, "learning_rate": 4.971853338087825e-05, "epoch": 0.14342938364129731, "percentage": 4.78, "elapsed_time": "1:34:31", "remaining_time": "1 day, 7:22:38", "throughput": "1603.24", "total_tokens": 9093120} {"current_steps": 1120, "total_steps": 23217, "loss": 1.084, "learning_rate": 4.971344881986477e-05, "epoch": 0.14472154025067838, "percentage": 4.82, "elapsed_time": "1:35:19", "remaining_time": "1 day, 7:20:36", "throughput": "1604.25", "total_tokens": 9175040} {"current_steps": 1130, "total_steps": 23217, "loss": 0.9945, "learning_rate": 4.9708319008616926e-05, "epoch": 0.14601369686005944, "percentage": 4.87, "elapsed_time": "1:36:06", "remaining_time": "1 day, 7:18:35", "throughput": "1605.26", "total_tokens": 9256960} {"current_steps": 1140, "total_steps": 23217, "loss": 0.8976, "learning_rate": 4.97031439565274e-05, "epoch": 0.1473058534694405, "percentage": 4.91, "elapsed_time": "1:36:54", "remaining_time": "1 day, 7:16:36", "throughput": "1606.22", "total_tokens": 9338880} {"current_steps": 1150, "total_steps": 23217, "loss": 1.063, "learning_rate": 4.969792367307168e-05, "epoch": 0.14859801007882156, "percentage": 4.95, "elapsed_time": "1:37:41", "remaining_time": "1 day, 7:14:37", "throughput": "1607.18", "total_tokens": 9420800} {"current_steps": 1160, "total_steps": 23217, "loss": 0.8809, "learning_rate": 4.9692658167808094e-05, "epoch": 0.1498901666882026, "percentage": 5.0, "elapsed_time": "1:38:29", "remaining_time": "1 day, 7:12:41", "throughput": "1608.12", "total_tokens": 9502720} {"current_steps": 1170, "total_steps": 23217, "loss": 1.3418, "learning_rate": 4.9687347450377755e-05, "epoch": 0.15118232329758366, "percentage": 5.04, "elapsed_time": "1:39:16", "remaining_time": "1 day, 7:10:46", "throughput": "1609.04", "total_tokens": 9584640} {"current_steps": 1180, "total_steps": 23217, "loss": 0.6324, "learning_rate": 4.968199153050457e-05, "epoch": 0.15247447990696472, "percentage": 5.08, "elapsed_time": "1:40:04", "remaining_time": "1 day, 7:08:52", "throughput": "1609.95", "total_tokens": 9666560} {"current_steps": 1190, "total_steps": 23217, "loss": 0.9144, "learning_rate": 4.967659041799522e-05, "epoch": 0.15376663651634578, "percentage": 5.13, "elapsed_time": "1:40:51", "remaining_time": "1 day, 7:06:58", "throughput": "1610.86", "total_tokens": 9748480} {"current_steps": 1200, "total_steps": 23217, "loss": 0.8396, "learning_rate": 4.9671144122739106e-05, "epoch": 0.15505879312572685, "percentage": 5.17, "elapsed_time": "1:41:39", "remaining_time": "1 day, 7:05:05", "throughput": "1611.75", "total_tokens": 9830400} {"current_steps": 1210, "total_steps": 23217, "loss": 1.0608, "learning_rate": 4.966565265470838e-05, "epoch": 0.1563509497351079, "percentage": 5.21, "elapsed_time": "1:42:26", "remaining_time": "1 day, 7:03:13", "throughput": "1612.62", "total_tokens": 9912320} {"current_steps": 1220, "total_steps": 23217, "loss": 0.9964, "learning_rate": 4.9660116023957906e-05, "epoch": 0.15764310634448894, "percentage": 5.25, "elapsed_time": "1:43:14", "remaining_time": "1 day, 7:01:23", "throughput": "1613.48", "total_tokens": 9994240} {"current_steps": 1230, "total_steps": 23217, "loss": 0.8427, "learning_rate": 4.9654534240625225e-05, "epoch": 0.15893526295387, "percentage": 5.3, "elapsed_time": "1:44:01", "remaining_time": "1 day, 6:59:34", "throughput": "1614.32", "total_tokens": 10076160} {"current_steps": 1240, "total_steps": 23217, "loss": 1.2353, "learning_rate": 4.964890731493057e-05, "epoch": 0.16022741956325107, "percentage": 5.34, "elapsed_time": "1:44:49", "remaining_time": "1 day, 6:57:46", "throughput": "1615.15", "total_tokens": 10158080} {"current_steps": 1250, "total_steps": 23217, "loss": 1.0439, "learning_rate": 4.964323525717681e-05, "epoch": 0.16151957617263213, "percentage": 5.38, "elapsed_time": "1:45:36", "remaining_time": "1 day, 6:55:59", "throughput": "1615.97", "total_tokens": 10240000} {"current_steps": 1260, "total_steps": 23217, "loss": 0.914, "learning_rate": 4.9637518077749476e-05, "epoch": 0.1628117327820132, "percentage": 5.43, "elapsed_time": "1:46:24", "remaining_time": "1 day, 6:54:13", "throughput": "1616.77", "total_tokens": 10321920} {"current_steps": 1270, "total_steps": 23217, "loss": 1.0189, "learning_rate": 4.96317557871167e-05, "epoch": 0.16410388939139423, "percentage": 5.47, "elapsed_time": "1:47:11", "remaining_time": "1 day, 6:52:27", "throughput": "1617.57", "total_tokens": 10403840} {"current_steps": 1280, "total_steps": 23217, "loss": 1.0049, "learning_rate": 4.9625948395829216e-05, "epoch": 0.1653960460007753, "percentage": 5.51, "elapsed_time": "1:47:59", "remaining_time": "1 day, 6:50:43", "throughput": "1618.36", "total_tokens": 10485760} {"current_steps": 1290, "total_steps": 23217, "loss": 0.941, "learning_rate": 4.962009591452032e-05, "epoch": 0.16668820261015635, "percentage": 5.56, "elapsed_time": "1:48:46", "remaining_time": "1 day, 6:48:59", "throughput": "1619.14", "total_tokens": 10567680} {"current_steps": 1300, "total_steps": 23217, "loss": 1.1209, "learning_rate": 4.96141983539059e-05, "epoch": 0.1679803592195374, "percentage": 5.6, "elapsed_time": "1:49:34", "remaining_time": "1 day, 6:47:16", "throughput": "1619.90", "total_tokens": 10649600} {"current_steps": 1310, "total_steps": 23217, "loss": 1.0478, "learning_rate": 4.960825572478436e-05, "epoch": 0.16927251582891847, "percentage": 5.64, "elapsed_time": "1:50:21", "remaining_time": "1 day, 6:45:34", "throughput": "1620.65", "total_tokens": 10731520} {"current_steps": 1320, "total_steps": 23217, "loss": 0.9342, "learning_rate": 4.960226803803664e-05, "epoch": 0.1705646724382995, "percentage": 5.69, "elapsed_time": "1:51:09", "remaining_time": "1 day, 6:43:54", "throughput": "1621.38", "total_tokens": 10813440} {"current_steps": 1330, "total_steps": 23217, "loss": 1.0727, "learning_rate": 4.959623530462617e-05, "epoch": 0.17185682904768057, "percentage": 5.73, "elapsed_time": "1:51:56", "remaining_time": "1 day, 6:42:13", "throughput": "1622.12", "total_tokens": 10895360} {"current_steps": 1340, "total_steps": 23217, "loss": 1.0719, "learning_rate": 4.9590157535598855e-05, "epoch": 0.17314898565706163, "percentage": 5.77, "elapsed_time": "1:52:44", "remaining_time": "1 day, 6:40:33", "throughput": "1622.84", "total_tokens": 10977280} {"current_steps": 1350, "total_steps": 23217, "loss": 1.0195, "learning_rate": 4.958403474208308e-05, "epoch": 0.1744411422664427, "percentage": 5.81, "elapsed_time": "1:53:31", "remaining_time": "1 day, 6:38:54", "throughput": "1623.55", "total_tokens": 11059200} {"current_steps": 1360, "total_steps": 23217, "loss": 1.1703, "learning_rate": 4.957786693528965e-05, "epoch": 0.17573329887582376, "percentage": 5.86, "elapsed_time": "1:54:19", "remaining_time": "1 day, 6:37:16", "throughput": "1624.26", "total_tokens": 11141120} {"current_steps": 1370, "total_steps": 23217, "loss": 0.8547, "learning_rate": 4.95716541265118e-05, "epoch": 0.17702545548520482, "percentage": 5.9, "elapsed_time": "1:55:06", "remaining_time": "1 day, 6:35:39", "throughput": "1624.95", "total_tokens": 11223040} {"current_steps": 1380, "total_steps": 23217, "loss": 1.056, "learning_rate": 4.9565396327125155e-05, "epoch": 0.17831761209458585, "percentage": 5.94, "elapsed_time": "1:55:54", "remaining_time": "1 day, 6:34:03", "throughput": "1625.62", "total_tokens": 11304960} {"current_steps": 1390, "total_steps": 23217, "loss": 0.8731, "learning_rate": 4.955909354858772e-05, "epoch": 0.17960976870396692, "percentage": 5.99, "elapsed_time": "1:56:41", "remaining_time": "1 day, 6:32:27", "throughput": "1626.29", "total_tokens": 11386880} {"current_steps": 1400, "total_steps": 23217, "loss": 0.7233, "learning_rate": 4.955274580243987e-05, "epoch": 0.18090192531334798, "percentage": 6.03, "elapsed_time": "1:57:29", "remaining_time": "1 day, 6:30:53", "throughput": "1626.94", "total_tokens": 11468800} {"current_steps": 1410, "total_steps": 23217, "loss": 0.8429, "learning_rate": 4.95463531003043e-05, "epoch": 0.18219408192272904, "percentage": 6.07, "elapsed_time": "1:58:16", "remaining_time": "1 day, 6:29:18", "throughput": "1627.60", "total_tokens": 11550720} {"current_steps": 1420, "total_steps": 23217, "loss": 0.9205, "learning_rate": 4.953991545388603e-05, "epoch": 0.1834862385321101, "percentage": 6.12, "elapsed_time": "1:59:04", "remaining_time": "1 day, 6:27:44", "throughput": "1628.25", "total_tokens": 11632640} {"current_steps": 1430, "total_steps": 23217, "loss": 1.0245, "learning_rate": 4.9533432874972366e-05, "epoch": 0.18477839514149114, "percentage": 6.16, "elapsed_time": "1:59:51", "remaining_time": "1 day, 6:26:11", "throughput": "1628.89", "total_tokens": 11714560} {"current_steps": 1440, "total_steps": 23217, "loss": 1.161, "learning_rate": 4.952690537543287e-05, "epoch": 0.1860705517508722, "percentage": 6.2, "elapsed_time": "2:00:39", "remaining_time": "1 day, 6:24:37", "throughput": "1629.53", "total_tokens": 11796480} {"current_steps": 1450, "total_steps": 23217, "loss": 1.4307, "learning_rate": 4.952033296721938e-05, "epoch": 0.18736270836025326, "percentage": 6.25, "elapsed_time": "2:01:26", "remaining_time": "1 day, 6:23:05", "throughput": "1630.15", "total_tokens": 11878400} {"current_steps": 1460, "total_steps": 23217, "loss": 0.9983, "learning_rate": 4.951371566236597e-05, "epoch": 0.18865486496963432, "percentage": 6.29, "elapsed_time": "2:02:14", "remaining_time": "1 day, 6:21:34", "throughput": "1630.77", "total_tokens": 11960320} {"current_steps": 1470, "total_steps": 23217, "loss": 0.927, "learning_rate": 4.9507053472988867e-05, "epoch": 0.18994702157901538, "percentage": 6.33, "elapsed_time": "2:03:01", "remaining_time": "1 day, 6:20:03", "throughput": "1631.37", "total_tokens": 12042240} {"current_steps": 1480, "total_steps": 23217, "loss": 1.0184, "learning_rate": 4.9500346411286534e-05, "epoch": 0.19123917818839645, "percentage": 6.37, "elapsed_time": "2:03:49", "remaining_time": "1 day, 6:18:33", "throughput": "1631.96", "total_tokens": 12124160} {"current_steps": 1490, "total_steps": 23217, "loss": 0.9956, "learning_rate": 4.949359448953959e-05, "epoch": 0.19253133479777748, "percentage": 6.42, "elapsed_time": "2:04:36", "remaining_time": "1 day, 6:17:04", "throughput": "1632.55", "total_tokens": 12206080} {"current_steps": 1500, "total_steps": 23217, "loss": 0.7369, "learning_rate": 4.9486797720110746e-05, "epoch": 0.19382349140715854, "percentage": 6.46, "elapsed_time": "2:05:24", "remaining_time": "1 day, 6:15:36", "throughput": "1633.12", "total_tokens": 12288000} {"current_steps": 1510, "total_steps": 23217, "loss": 0.9916, "learning_rate": 4.947995611544489e-05, "epoch": 0.1951156480165396, "percentage": 6.5, "elapsed_time": "2:06:11", "remaining_time": "1 day, 6:14:08", "throughput": "1633.68", "total_tokens": 12369920} {"current_steps": 1520, "total_steps": 23217, "loss": 1.0502, "learning_rate": 4.947306968806896e-05, "epoch": 0.19640780462592067, "percentage": 6.55, "elapsed_time": "2:06:59", "remaining_time": "1 day, 6:12:40", "throughput": "1634.25", "total_tokens": 12451840} {"current_steps": 1530, "total_steps": 23217, "loss": 1.1209, "learning_rate": 4.946613845059199e-05, "epoch": 0.19769996123530173, "percentage": 6.59, "elapsed_time": "2:07:46", "remaining_time": "1 day, 6:11:12", "throughput": "1634.83", "total_tokens": 12533760} {"current_steps": 1540, "total_steps": 23217, "loss": 1.152, "learning_rate": 4.945916241570504e-05, "epoch": 0.19899211784468276, "percentage": 6.63, "elapsed_time": "2:08:34", "remaining_time": "1 day, 6:09:45", "throughput": "1635.37", "total_tokens": 12615680} {"current_steps": 1550, "total_steps": 23217, "loss": 1.1884, "learning_rate": 4.945214159618121e-05, "epoch": 0.20028427445406383, "percentage": 6.68, "elapsed_time": "2:09:21", "remaining_time": "1 day, 6:08:20", "throughput": "1635.91", "total_tokens": 12697600} {"current_steps": 1560, "total_steps": 23217, "loss": 1.1069, "learning_rate": 4.9445076004875596e-05, "epoch": 0.2015764310634449, "percentage": 6.72, "elapsed_time": "2:10:09", "remaining_time": "1 day, 6:06:53", "throughput": "1636.45", "total_tokens": 12779520} {"current_steps": 1570, "total_steps": 23217, "loss": 1.0457, "learning_rate": 4.9437965654725264e-05, "epoch": 0.20286858767282595, "percentage": 6.76, "elapsed_time": "2:10:56", "remaining_time": "1 day, 6:05:29", "throughput": "1636.98", "total_tokens": 12861440} {"current_steps": 1580, "total_steps": 23217, "loss": 0.8206, "learning_rate": 4.943081055874925e-05, "epoch": 0.204160744282207, "percentage": 6.81, "elapsed_time": "2:11:44", "remaining_time": "1 day, 6:04:04", "throughput": "1637.50", "total_tokens": 12943360} {"current_steps": 1590, "total_steps": 23217, "loss": 1.2474, "learning_rate": 4.9423610730048495e-05, "epoch": 0.20545290089158805, "percentage": 6.85, "elapsed_time": "2:12:31", "remaining_time": "1 day, 6:02:40", "throughput": "1638.01", "total_tokens": 13025280} {"current_steps": 1600, "total_steps": 23217, "loss": 0.9485, "learning_rate": 4.941636618180586e-05, "epoch": 0.2067450575009691, "percentage": 6.89, "elapsed_time": "2:13:19", "remaining_time": "1 day, 6:01:16", "throughput": "1638.53", "total_tokens": 13107200} {"current_steps": 1610, "total_steps": 23217, "loss": 1.0329, "learning_rate": 4.94090769272861e-05, "epoch": 0.20803721411035017, "percentage": 6.93, "elapsed_time": "2:14:06", "remaining_time": "1 day, 5:59:53", "throughput": "1639.03", "total_tokens": 13189120} {"current_steps": 1620, "total_steps": 23217, "loss": 1.1409, "learning_rate": 4.940174297983581e-05, "epoch": 0.20932937071973123, "percentage": 6.98, "elapsed_time": "2:14:54", "remaining_time": "1 day, 5:58:30", "throughput": "1639.53", "total_tokens": 13271040} {"current_steps": 1630, "total_steps": 23217, "loss": 0.6724, "learning_rate": 4.93943643528834e-05, "epoch": 0.2106215273291123, "percentage": 7.02, "elapsed_time": "2:15:41", "remaining_time": "1 day, 5:57:08", "throughput": "1640.02", "total_tokens": 13352960} {"current_steps": 1640, "total_steps": 23217, "loss": 0.9835, "learning_rate": 4.938694105993914e-05, "epoch": 0.21191368393849336, "percentage": 7.06, "elapsed_time": "2:16:29", "remaining_time": "1 day, 5:55:46", "throughput": "1640.51", "total_tokens": 13434880} {"current_steps": 1650, "total_steps": 23217, "loss": 1.2099, "learning_rate": 4.937947311459503e-05, "epoch": 0.2132058405478744, "percentage": 7.11, "elapsed_time": "2:17:16", "remaining_time": "1 day, 5:54:23", "throughput": "1641.00", "total_tokens": 13516800} {"current_steps": 1660, "total_steps": 23217, "loss": 0.9276, "learning_rate": 4.937196053052486e-05, "epoch": 0.21449799715725545, "percentage": 7.15, "elapsed_time": "2:18:04", "remaining_time": "1 day, 5:53:02", "throughput": "1641.48", "total_tokens": 13598720} {"current_steps": 1670, "total_steps": 23217, "loss": 1.4808, "learning_rate": 4.9364403321484145e-05, "epoch": 0.21579015376663652, "percentage": 7.19, "elapsed_time": "2:18:51", "remaining_time": "1 day, 5:51:42", "throughput": "1641.95", "total_tokens": 13680640} {"current_steps": 1680, "total_steps": 23217, "loss": 1.248, "learning_rate": 4.9356801501310105e-05, "epoch": 0.21708231037601758, "percentage": 7.24, "elapsed_time": "2:19:39", "remaining_time": "1 day, 5:50:21", "throughput": "1642.42", "total_tokens": 13762560} {"current_steps": 1690, "total_steps": 23217, "loss": 0.8261, "learning_rate": 4.934915508392164e-05, "epoch": 0.21837446698539864, "percentage": 7.28, "elapsed_time": "2:20:26", "remaining_time": "1 day, 5:49:01", "throughput": "1642.88", "total_tokens": 13844480} {"current_steps": 1700, "total_steps": 23217, "loss": 1.2263, "learning_rate": 4.9341464083319314e-05, "epoch": 0.21966662359477968, "percentage": 7.32, "elapsed_time": "2:21:14", "remaining_time": "1 day, 5:47:41", "throughput": "1643.34", "total_tokens": 13926400} {"current_steps": 1710, "total_steps": 23217, "loss": 0.8885, "learning_rate": 4.933372851358532e-05, "epoch": 0.22095878020416074, "percentage": 7.37, "elapsed_time": "2:22:01", "remaining_time": "1 day, 5:46:22", "throughput": "1643.79", "total_tokens": 14008320} {"current_steps": 1720, "total_steps": 23217, "loss": 1.369, "learning_rate": 4.932594838888347e-05, "epoch": 0.2222509368135418, "percentage": 7.41, "elapsed_time": "2:22:49", "remaining_time": "1 day, 5:45:03", "throughput": "1644.23", "total_tokens": 14090240} {"current_steps": 1730, "total_steps": 23217, "loss": 1.1812, "learning_rate": 4.931812372345913e-05, "epoch": 0.22354309342292286, "percentage": 7.45, "elapsed_time": "2:23:36", "remaining_time": "1 day, 5:43:44", "throughput": "1644.68", "total_tokens": 14172160} {"current_steps": 1740, "total_steps": 23217, "loss": 0.7136, "learning_rate": 4.9310254531639235e-05, "epoch": 0.22483525003230392, "percentage": 7.49, "elapsed_time": "2:24:24", "remaining_time": "1 day, 5:42:27", "throughput": "1645.10", "total_tokens": 14254080} {"current_steps": 1750, "total_steps": 23217, "loss": 1.4446, "learning_rate": 4.930234082783225e-05, "epoch": 0.22612740664168499, "percentage": 7.54, "elapsed_time": "2:25:12", "remaining_time": "1 day, 5:41:09", "throughput": "1645.53", "total_tokens": 14336000} {"current_steps": 1760, "total_steps": 23217, "loss": 0.7729, "learning_rate": 4.9294382626528144e-05, "epoch": 0.22741956325106602, "percentage": 7.58, "elapsed_time": "2:25:59", "remaining_time": "1 day, 5:39:52", "throughput": "1645.96", "total_tokens": 14417920} {"current_steps": 1770, "total_steps": 23217, "loss": 0.9155, "learning_rate": 4.928637994229834e-05, "epoch": 0.22871171986044708, "percentage": 7.62, "elapsed_time": "2:26:47", "remaining_time": "1 day, 5:38:34", "throughput": "1646.39", "total_tokens": 14499840} {"current_steps": 1780, "total_steps": 23217, "loss": 1.0874, "learning_rate": 4.9278332789795746e-05, "epoch": 0.23000387646982814, "percentage": 7.67, "elapsed_time": "2:27:34", "remaining_time": "1 day, 5:37:17", "throughput": "1646.81", "total_tokens": 14581760} {"current_steps": 1790, "total_steps": 23217, "loss": 0.7714, "learning_rate": 4.9270241183754637e-05, "epoch": 0.2312960330792092, "percentage": 7.71, "elapsed_time": "2:28:22", "remaining_time": "1 day, 5:36:01", "throughput": "1647.22", "total_tokens": 14663680} {"current_steps": 1800, "total_steps": 23217, "loss": 1.3797, "learning_rate": 4.9262105138990745e-05, "epoch": 0.23258818968859027, "percentage": 7.75, "elapsed_time": "2:29:09", "remaining_time": "1 day, 5:34:45", "throughput": "1647.63", "total_tokens": 14745600} {"current_steps": 1810, "total_steps": 23217, "loss": 1.2271, "learning_rate": 4.925392467040112e-05, "epoch": 0.2338803462979713, "percentage": 7.8, "elapsed_time": "2:29:57", "remaining_time": "1 day, 5:33:29", "throughput": "1648.02", "total_tokens": 14827520} {"current_steps": 1820, "total_steps": 23217, "loss": 0.9982, "learning_rate": 4.924569979296417e-05, "epoch": 0.23517250290735237, "percentage": 7.84, "elapsed_time": "2:30:44", "remaining_time": "1 day, 5:32:14", "throughput": "1648.43", "total_tokens": 14909440} {"current_steps": 1830, "total_steps": 23217, "loss": 0.9374, "learning_rate": 4.9237430521739626e-05, "epoch": 0.23646465951673343, "percentage": 7.88, "elapsed_time": "2:31:32", "remaining_time": "1 day, 5:30:58", "throughput": "1648.83", "total_tokens": 14991360} {"current_steps": 1840, "total_steps": 23217, "loss": 0.9464, "learning_rate": 4.9229116871868485e-05, "epoch": 0.2377568161261145, "percentage": 7.93, "elapsed_time": "2:32:19", "remaining_time": "1 day, 5:29:43", "throughput": "1649.22", "total_tokens": 15073280} {"current_steps": 1850, "total_steps": 23217, "loss": 0.8913, "learning_rate": 4.922075885857301e-05, "epoch": 0.23904897273549555, "percentage": 7.97, "elapsed_time": "2:33:07", "remaining_time": "1 day, 5:28:29", "throughput": "1649.61", "total_tokens": 15155200} {"current_steps": 1860, "total_steps": 23217, "loss": 1.3031, "learning_rate": 4.92123564971567e-05, "epoch": 0.2403411293448766, "percentage": 8.01, "elapsed_time": "2:33:54", "remaining_time": "1 day, 5:27:14", "throughput": "1650.00", "total_tokens": 15237120} {"current_steps": 1870, "total_steps": 23217, "loss": 1.0151, "learning_rate": 4.9203909803004245e-05, "epoch": 0.24163328595425765, "percentage": 8.05, "elapsed_time": "2:34:42", "remaining_time": "1 day, 5:26:00", "throughput": "1650.38", "total_tokens": 15319040} {"current_steps": 1880, "total_steps": 23217, "loss": 1.0122, "learning_rate": 4.9195418791581504e-05, "epoch": 0.2429254425636387, "percentage": 8.1, "elapsed_time": "2:35:29", "remaining_time": "1 day, 5:24:46", "throughput": "1650.75", "total_tokens": 15400960} {"current_steps": 1890, "total_steps": 23217, "loss": 1.3312, "learning_rate": 4.918688347843549e-05, "epoch": 0.24421759917301977, "percentage": 8.14, "elapsed_time": "2:36:17", "remaining_time": "1 day, 5:23:33", "throughput": "1651.12", "total_tokens": 15482880} {"current_steps": 1900, "total_steps": 23217, "loss": 1.4312, "learning_rate": 4.917830387919434e-05, "epoch": 0.24550975578240083, "percentage": 8.18, "elapsed_time": "2:37:04", "remaining_time": "1 day, 5:22:19", "throughput": "1651.50", "total_tokens": 15564800} {"current_steps": 1910, "total_steps": 23217, "loss": 0.8297, "learning_rate": 4.9169680009567254e-05, "epoch": 0.2468019123917819, "percentage": 8.23, "elapsed_time": "2:37:52", "remaining_time": "1 day, 5:21:06", "throughput": "1651.86", "total_tokens": 15646720} {"current_steps": 1920, "total_steps": 23217, "loss": 0.9553, "learning_rate": 4.916101188534452e-05, "epoch": 0.24809406900116293, "percentage": 8.27, "elapsed_time": "2:38:39", "remaining_time": "1 day, 5:19:54", "throughput": "1652.21", "total_tokens": 15728640} {"current_steps": 1930, "total_steps": 23217, "loss": 1.2107, "learning_rate": 4.9152299522397424e-05, "epoch": 0.249386225610544, "percentage": 8.31, "elapsed_time": "2:39:27", "remaining_time": "1 day, 5:18:42", "throughput": "1652.56", "total_tokens": 15810560} {"current_steps": 1940, "total_steps": 23217, "loss": 1.3879, "learning_rate": 4.91435429366783e-05, "epoch": 0.25067838221992506, "percentage": 8.36, "elapsed_time": "2:40:14", "remaining_time": "1 day, 5:17:30", "throughput": "1652.92", "total_tokens": 15892480} {"current_steps": 1950, "total_steps": 23217, "loss": 1.2823, "learning_rate": 4.9134742144220394e-05, "epoch": 0.2519705388293061, "percentage": 8.4, "elapsed_time": "2:41:02", "remaining_time": "1 day, 5:16:19", "throughput": "1653.26", "total_tokens": 15974400} {"current_steps": 1960, "total_steps": 23217, "loss": 0.9816, "learning_rate": 4.912589716113794e-05, "epoch": 0.2532626954386872, "percentage": 8.44, "elapsed_time": "2:41:49", "remaining_time": "1 day, 5:15:07", "throughput": "1653.60", "total_tokens": 16056320} {"current_steps": 1970, "total_steps": 23217, "loss": 0.8746, "learning_rate": 4.9117008003626066e-05, "epoch": 0.2545548520480682, "percentage": 8.49, "elapsed_time": "2:42:37", "remaining_time": "1 day, 5:13:55", "throughput": "1653.95", "total_tokens": 16138240} {"current_steps": 1980, "total_steps": 23217, "loss": 0.8788, "learning_rate": 4.910807468796079e-05, "epoch": 0.2558470086574493, "percentage": 8.53, "elapsed_time": "2:43:24", "remaining_time": "1 day, 5:12:44", "throughput": "1654.30", "total_tokens": 16220160} {"current_steps": 1990, "total_steps": 23217, "loss": 0.9458, "learning_rate": 4.9099097230498974e-05, "epoch": 0.25713916526683034, "percentage": 8.57, "elapsed_time": "2:44:12", "remaining_time": "1 day, 5:11:33", "throughput": "1654.63", "total_tokens": 16302080} {"current_steps": 2000, "total_steps": 23217, "loss": 0.7193, "learning_rate": 4.909007564767831e-05, "epoch": 0.2584313218762114, "percentage": 8.61, "elapsed_time": "2:44:59", "remaining_time": "1 day, 5:10:22", "throughput": "1654.97", "total_tokens": 16384000} {"current_steps": 2010, "total_steps": 23217, "loss": 1.1241, "learning_rate": 4.90810099560173e-05, "epoch": 0.25972347848559246, "percentage": 8.66, "elapsed_time": "2:45:53", "remaining_time": "1 day, 5:10:16", "throughput": "1654.30", "total_tokens": 16465920} {"current_steps": 2020, "total_steps": 23217, "loss": 1.2065, "learning_rate": 4.907190017211517e-05, "epoch": 0.2610156350949735, "percentage": 8.7, "elapsed_time": "2:46:40", "remaining_time": "1 day, 5:09:05", "throughput": "1654.63", "total_tokens": 16547840} {"current_steps": 2030, "total_steps": 23217, "loss": 1.0478, "learning_rate": 4.906274631265191e-05, "epoch": 0.2623077917043546, "percentage": 8.74, "elapsed_time": "2:47:28", "remaining_time": "1 day, 5:07:55", "throughput": "1654.96", "total_tokens": 16629760} {"current_steps": 2040, "total_steps": 23217, "loss": 1.0866, "learning_rate": 4.90535483943882e-05, "epoch": 0.2635999483137356, "percentage": 8.79, "elapsed_time": "2:48:15", "remaining_time": "1 day, 5:06:44", "throughput": "1655.29", "total_tokens": 16711680} {"current_steps": 2050, "total_steps": 23217, "loss": 0.7329, "learning_rate": 4.904430643416541e-05, "epoch": 0.26489210492311666, "percentage": 8.83, "elapsed_time": "2:49:03", "remaining_time": "1 day, 5:05:34", "throughput": "1655.61", "total_tokens": 16793600} {"current_steps": 2060, "total_steps": 23217, "loss": 0.8875, "learning_rate": 4.903502044890551e-05, "epoch": 0.26618426153249775, "percentage": 8.87, "elapsed_time": "2:49:50", "remaining_time": "1 day, 5:04:24", "throughput": "1655.94", "total_tokens": 16875520} {"current_steps": 2070, "total_steps": 23217, "loss": 1.1042, "learning_rate": 4.902569045561113e-05, "epoch": 0.2674764181418788, "percentage": 8.92, "elapsed_time": "2:50:38", "remaining_time": "1 day, 5:03:15", "throughput": "1656.25", "total_tokens": 16957440} {"current_steps": 2080, "total_steps": 23217, "loss": 1.012, "learning_rate": 4.901631647136543e-05, "epoch": 0.26876857475125987, "percentage": 8.96, "elapsed_time": "2:51:25", "remaining_time": "1 day, 5:02:05", "throughput": "1656.57", "total_tokens": 17039360} {"current_steps": 2090, "total_steps": 23217, "loss": 1.0272, "learning_rate": 4.900689851333216e-05, "epoch": 0.2700607313606409, "percentage": 9.0, "elapsed_time": "2:52:13", "remaining_time": "1 day, 5:00:57", "throughput": "1656.88", "total_tokens": 17121280} {"current_steps": 2100, "total_steps": 23217, "loss": 1.1297, "learning_rate": 4.899743659875556e-05, "epoch": 0.271352887970022, "percentage": 9.05, "elapsed_time": "2:53:01", "remaining_time": "1 day, 4:59:48", "throughput": "1657.18", "total_tokens": 17203200} {"current_steps": 2110, "total_steps": 23217, "loss": 1.3631, "learning_rate": 4.8987930744960355e-05, "epoch": 0.27264504457940303, "percentage": 9.09, "elapsed_time": "2:53:48", "remaining_time": "1 day, 4:58:40", "throughput": "1657.48", "total_tokens": 17285120} {"current_steps": 2120, "total_steps": 23217, "loss": 1.1892, "learning_rate": 4.897838096935174e-05, "epoch": 0.27393720118878406, "percentage": 9.13, "elapsed_time": "2:54:35", "remaining_time": "1 day, 4:57:30", "throughput": "1657.79", "total_tokens": 17367040} {"current_steps": 2130, "total_steps": 23217, "loss": 0.9273, "learning_rate": 4.896878728941531e-05, "epoch": 0.27522935779816515, "percentage": 9.17, "elapsed_time": "2:55:23", "remaining_time": "1 day, 4:56:22", "throughput": "1658.09", "total_tokens": 17448960} {"current_steps": 2140, "total_steps": 23217, "loss": 0.7893, "learning_rate": 4.8959149722717057e-05, "epoch": 0.2765215144075462, "percentage": 9.22, "elapsed_time": "2:56:10", "remaining_time": "1 day, 4:55:14", "throughput": "1658.40", "total_tokens": 17530880} {"current_steps": 2150, "total_steps": 23217, "loss": 1.0423, "learning_rate": 4.894946828690334e-05, "epoch": 0.2778136710169273, "percentage": 9.26, "elapsed_time": "2:56:58", "remaining_time": "1 day, 4:54:06", "throughput": "1658.69", "total_tokens": 17612800} {"current_steps": 2160, "total_steps": 23217, "loss": 1.2965, "learning_rate": 4.893974299970082e-05, "epoch": 0.2791058276263083, "percentage": 9.3, "elapsed_time": "2:57:45", "remaining_time": "1 day, 4:52:58", "throughput": "1658.98", "total_tokens": 17694720} {"current_steps": 2170, "total_steps": 23217, "loss": 0.9901, "learning_rate": 4.892997387891648e-05, "epoch": 0.28039798423568935, "percentage": 9.35, "elapsed_time": "2:58:33", "remaining_time": "1 day, 4:51:50", "throughput": "1659.28", "total_tokens": 17776640} {"current_steps": 2180, "total_steps": 23217, "loss": 1.1746, "learning_rate": 4.892016094243753e-05, "epoch": 0.28169014084507044, "percentage": 9.39, "elapsed_time": "2:59:20", "remaining_time": "1 day, 4:50:43", "throughput": "1659.56", "total_tokens": 17858560} {"current_steps": 2190, "total_steps": 23217, "loss": 0.8179, "learning_rate": 4.891030420823142e-05, "epoch": 0.28298229745445147, "percentage": 9.43, "elapsed_time": "3:00:08", "remaining_time": "1 day, 4:49:36", "throughput": "1659.85", "total_tokens": 17940480} {"current_steps": 2200, "total_steps": 23217, "loss": 0.9974, "learning_rate": 4.89004036943458e-05, "epoch": 0.28427445406383256, "percentage": 9.48, "elapsed_time": "3:00:55", "remaining_time": "1 day, 4:48:29", "throughput": "1660.14", "total_tokens": 18022400} {"current_steps": 2210, "total_steps": 23217, "loss": 1.307, "learning_rate": 4.8890459418908476e-05, "epoch": 0.2855666106732136, "percentage": 9.52, "elapsed_time": "3:01:43", "remaining_time": "1 day, 4:47:22", "throughput": "1660.41", "total_tokens": 18104320} {"current_steps": 2220, "total_steps": 23217, "loss": 0.8764, "learning_rate": 4.888047140012737e-05, "epoch": 0.28685876728259463, "percentage": 9.56, "elapsed_time": "3:02:31", "remaining_time": "1 day, 4:46:15", "throughput": "1660.69", "total_tokens": 18186240} {"current_steps": 2230, "total_steps": 23217, "loss": 0.8948, "learning_rate": 4.8870439656290525e-05, "epoch": 0.2881509238919757, "percentage": 9.61, "elapsed_time": "3:03:18", "remaining_time": "1 day, 4:45:09", "throughput": "1660.97", "total_tokens": 18268160} {"current_steps": 2240, "total_steps": 23217, "loss": 0.8611, "learning_rate": 4.8860364205766006e-05, "epoch": 0.28944308050135675, "percentage": 9.65, "elapsed_time": "3:04:06", "remaining_time": "1 day, 4:44:02", "throughput": "1661.24", "total_tokens": 18350080} {"current_steps": 2250, "total_steps": 23217, "loss": 0.9409, "learning_rate": 4.885024506700195e-05, "epoch": 0.29073523711073784, "percentage": 9.69, "elapsed_time": "3:04:53", "remaining_time": "1 day, 4:42:57", "throughput": "1661.50", "total_tokens": 18432000} {"current_steps": 2260, "total_steps": 23217, "loss": 1.1464, "learning_rate": 4.884008225852644e-05, "epoch": 0.2920273937201189, "percentage": 9.73, "elapsed_time": "3:05:41", "remaining_time": "1 day, 4:41:51", "throughput": "1661.77", "total_tokens": 18513920} {"current_steps": 2270, "total_steps": 23217, "loss": 1.3091, "learning_rate": 4.8829875798947554e-05, "epoch": 0.2933195503294999, "percentage": 9.78, "elapsed_time": "3:06:28", "remaining_time": "1 day, 4:40:45", "throughput": "1662.03", "total_tokens": 18595840} {"current_steps": 2280, "total_steps": 23217, "loss": 1.0955, "learning_rate": 4.8819625706953286e-05, "epoch": 0.294611706938881, "percentage": 9.82, "elapsed_time": "3:07:16", "remaining_time": "1 day, 4:39:39", "throughput": "1662.30", "total_tokens": 18677760} {"current_steps": 2290, "total_steps": 23217, "loss": 0.6546, "learning_rate": 4.88093320013115e-05, "epoch": 0.29590386354826204, "percentage": 9.86, "elapsed_time": "3:08:03", "remaining_time": "1 day, 4:38:33", "throughput": "1662.57", "total_tokens": 18759680} {"current_steps": 2300, "total_steps": 23217, "loss": 0.7477, "learning_rate": 4.879899470086995e-05, "epoch": 0.2971960201576431, "percentage": 9.91, "elapsed_time": "3:08:51", "remaining_time": "1 day, 4:37:28", "throughput": "1662.83", "total_tokens": 18841600} {"current_steps": 2310, "total_steps": 23217, "loss": 1.0105, "learning_rate": 4.8788613824556194e-05, "epoch": 0.29848817676702416, "percentage": 9.95, "elapsed_time": "3:09:38", "remaining_time": "1 day, 4:36:23", "throughput": "1663.09", "total_tokens": 18923520} {"current_steps": 2320, "total_steps": 23217, "loss": 1.3434, "learning_rate": 4.8778189391377574e-05, "epoch": 0.2997803333764052, "percentage": 9.99, "elapsed_time": "3:10:26", "remaining_time": "1 day, 4:35:18", "throughput": "1663.34", "total_tokens": 19005440} {"current_steps": 2330, "total_steps": 23217, "loss": 1.0991, "learning_rate": 4.876772142042117e-05, "epoch": 0.3010724899857863, "percentage": 10.04, "elapsed_time": "3:11:13", "remaining_time": "1 day, 4:34:12", "throughput": "1663.60", "total_tokens": 19087360} {"current_steps": 2340, "total_steps": 23217, "loss": 1.2049, "learning_rate": 4.875720993085384e-05, "epoch": 0.3023646465951673, "percentage": 10.08, "elapsed_time": "3:12:01", "remaining_time": "1 day, 4:33:08", "throughput": "1663.86", "total_tokens": 19169280} {"current_steps": 2350, "total_steps": 23217, "loss": 0.6964, "learning_rate": 4.874665494192206e-05, "epoch": 0.3036568032045484, "percentage": 10.12, "elapsed_time": "3:12:48", "remaining_time": "1 day, 4:32:03", "throughput": "1664.11", "total_tokens": 19251200} {"current_steps": 2360, "total_steps": 23217, "loss": 0.8926, "learning_rate": 4.8736056472951955e-05, "epoch": 0.30494895981392944, "percentage": 10.16, "elapsed_time": "3:13:35", "remaining_time": "1 day, 4:30:58", "throughput": "1664.35", "total_tokens": 19333120} {"current_steps": 2010, "total_steps": 23217, "loss": 1.1239, "learning_rate": 4.90810099560173e-05, "epoch": 0.25972347848559246, "percentage": 8.66, "elapsed_time": "0:00:53", "remaining_time": "0:09:28", "throughput": "305669.81", "total_tokens": 16465920} {"current_steps": 2020, "total_steps": 23217, "loss": 1.2067, "learning_rate": 4.907190017211517e-05, "epoch": 0.2610156350949735, "percentage": 8.7, "elapsed_time": "0:01:41", "remaining_time": "0:17:43", "throughput": "163211.79", "total_tokens": 16547840} {"current_steps": 2030, "total_steps": 23217, "loss": 1.0478, "learning_rate": 4.906274631265191e-05, "epoch": 0.2623077917043546, "percentage": 8.74, "elapsed_time": "0:02:29", "remaining_time": "0:25:57", "throughput": "111404.29", "total_tokens": 16629760} {"current_steps": 2040, "total_steps": 23217, "loss": 1.0864, "learning_rate": 4.90535483943882e-05, "epoch": 0.2635999483137356, "percentage": 8.79, "elapsed_time": "0:03:18", "remaining_time": "0:34:17", "throughput": "84301.34", "total_tokens": 16711680} {"current_steps": 2050, "total_steps": 23217, "loss": 0.7331, "learning_rate": 4.904430643416541e-05, "epoch": 0.26489210492311666, "percentage": 8.83, "elapsed_time": "0:04:07", "remaining_time": "0:42:34", "throughput": "67892.86", "total_tokens": 16793600} {"current_steps": 2060, "total_steps": 23217, "loss": 0.8874, "learning_rate": 4.903502044890551e-05, "epoch": 0.26618426153249775, "percentage": 8.87, "elapsed_time": "0:04:55", "remaining_time": "0:50:35", "throughput": "57102.50", "total_tokens": 16875520} {"current_steps": 2070, "total_steps": 23217, "loss": 1.1042, "learning_rate": 4.902569045561113e-05, "epoch": 0.2674764181418788, "percentage": 8.92, "elapsed_time": "0:05:44", "remaining_time": "0:58:44", "throughput": "49155.04", "total_tokens": 16957440} {"current_steps": 2080, "total_steps": 23217, "loss": 1.0121, "learning_rate": 4.901631647136543e-05, "epoch": 0.26876857475125987, "percentage": 8.96, "elapsed_time": "0:06:34", "remaining_time": "1:06:49", "throughput": "43189.25", "total_tokens": 17039360} {"current_steps": 2090, "total_steps": 23217, "loss": 1.027, "learning_rate": 4.900689851333216e-05, "epoch": 0.2700607313606409, "percentage": 9.0, "elapsed_time": "0:07:23", "remaining_time": "1:14:48", "throughput": "38561.93", "total_tokens": 17121280} {"current_steps": 2100, "total_steps": 23217, "loss": 1.1295, "learning_rate": 4.899743659875556e-05, "epoch": 0.271352887970022, "percentage": 9.05, "elapsed_time": "0:08:14", "remaining_time": "1:22:53", "throughput": "34785.57", "total_tokens": 17203200} {"current_steps": 2110, "total_steps": 23217, "loss": 1.3633, "learning_rate": 4.8987930744960355e-05, "epoch": 0.27264504457940303, "percentage": 9.09, "elapsed_time": "0:09:07", "remaining_time": "1:31:12", "throughput": "31594.60", "total_tokens": 17285120} {"current_steps": 2120, "total_steps": 23217, "loss": 1.1889, "learning_rate": 4.897838096935174e-05, "epoch": 0.27393720118878406, "percentage": 9.13, "elapsed_time": "0:09:55", "remaining_time": "1:38:46", "throughput": "29161.92", "total_tokens": 17367040} {"current_steps": 2130, "total_steps": 23217, "loss": 0.927, "learning_rate": 4.896878728941531e-05, "epoch": 0.27522935779816515, "percentage": 9.17, "elapsed_time": "0:10:43", "remaining_time": "1:46:14", "throughput": "27097.86", "total_tokens": 17448960} {"current_steps": 2140, "total_steps": 23217, "loss": 0.7892, "learning_rate": 4.8959149722717057e-05, "epoch": 0.2765215144075462, "percentage": 9.22, "elapsed_time": "0:11:36", "remaining_time": "1:54:15", "throughput": "25185.86", "total_tokens": 17530880} {"current_steps": 2150, "total_steps": 23217, "loss": 1.0423, "learning_rate": 4.894946828690334e-05, "epoch": 0.2778136710169273, "percentage": 9.26, "elapsed_time": "0:12:33", "remaining_time": "2:03:00", "throughput": "23383.61", "total_tokens": 17612800} {"current_steps": 2160, "total_steps": 23217, "loss": 1.2965, "learning_rate": 4.893974299970082e-05, "epoch": 0.2791058276263083, "percentage": 9.3, "elapsed_time": "0:13:30", "remaining_time": "2:11:43", "throughput": "21826.31", "total_tokens": 17694720} {"current_steps": 2170, "total_steps": 23217, "loss": 0.9905, "learning_rate": 4.892997387891648e-05, "epoch": 0.28039798423568935, "percentage": 9.35, "elapsed_time": "0:14:24", "remaining_time": "2:19:49", "throughput": "20551.78", "total_tokens": 17776640} {"current_steps": 2180, "total_steps": 23217, "loss": 1.1746, "learning_rate": 4.892016094243753e-05, "epoch": 0.28169014084507044, "percentage": 9.39, "elapsed_time": "0:15:19", "remaining_time": "2:27:53", "throughput": "19421.66", "total_tokens": 17858560} {"current_steps": 2190, "total_steps": 23217, "loss": 0.818, "learning_rate": 4.891030420823142e-05, "epoch": 0.28298229745445147, "percentage": 9.43, "elapsed_time": "0:16:11", "remaining_time": "2:35:31", "throughput": "18459.08", "total_tokens": 17940480} {"current_steps": 2200, "total_steps": 23217, "loss": 0.997, "learning_rate": 4.89004036943458e-05, "epoch": 0.28427445406383256, "percentage": 9.48, "elapsed_time": "0:17:07", "remaining_time": "2:43:32", "throughput": "17546.47", "total_tokens": 18022400} {"current_steps": 2210, "total_steps": 23217, "loss": 1.3072, "learning_rate": 4.8890459418908476e-05, "epoch": 0.2855666106732136, "percentage": 9.52, "elapsed_time": "0:18:02", "remaining_time": "2:51:25", "throughput": "16730.55", "total_tokens": 18104320} {"current_steps": 2220, "total_steps": 23217, "loss": 0.8763, "learning_rate": 4.888047140012737e-05, "epoch": 0.28685876728259463, "percentage": 9.56, "elapsed_time": "0:18:56", "remaining_time": "2:59:06", "throughput": "16005.61", "total_tokens": 18186240} {"current_steps": 2230, "total_steps": 23217, "loss": 0.8944, "learning_rate": 4.8870439656290525e-05, "epoch": 0.2881509238919757, "percentage": 9.61, "elapsed_time": "0:19:55", "remaining_time": "3:07:28", "throughput": "15284.68", "total_tokens": 18268160} {"current_steps": 2240, "total_steps": 23217, "loss": 0.8613, "learning_rate": 4.8860364205766006e-05, "epoch": 0.28944308050135675, "percentage": 9.65, "elapsed_time": "0:20:51", "remaining_time": "3:15:18", "throughput": "14664.31", "total_tokens": 18350080} {"current_steps": 2250, "total_steps": 23217, "loss": 0.9404, "learning_rate": 4.885024506700195e-05, "epoch": 0.29073523711073784, "percentage": 9.69, "elapsed_time": "0:21:42", "remaining_time": "3:22:13", "throughput": "14155.57", "total_tokens": 18432000} {"current_steps": 2260, "total_steps": 23217, "loss": 1.1465, "learning_rate": 4.884008225852644e-05, "epoch": 0.2920273937201189, "percentage": 9.73, "elapsed_time": "0:22:40", "remaining_time": "3:30:14", "throughput": "13609.96", "total_tokens": 18513920} {"current_steps": 2270, "total_steps": 23217, "loss": 1.3089, "learning_rate": 4.8829875798947554e-05, "epoch": 0.2933195503294999, "percentage": 9.78, "elapsed_time": "0:23:36", "remaining_time": "3:37:46", "throughput": "13132.33", "total_tokens": 18595840} {"current_steps": 2280, "total_steps": 23217, "loss": 1.0963, "learning_rate": 4.8819625706953286e-05, "epoch": 0.294611706938881, "percentage": 9.82, "elapsed_time": "0:24:28", "remaining_time": "3:44:46", "throughput": "12718.05", "total_tokens": 18677760} {"current_steps": 2290, "total_steps": 23217, "loss": 0.6548, "learning_rate": 4.88093320013115e-05, "epoch": 0.29590386354826204, "percentage": 9.86, "elapsed_time": "0:25:21", "remaining_time": "3:51:42", "throughput": "12330.72", "total_tokens": 18759680} {"current_steps": 2300, "total_steps": 23217, "loss": 0.7479, "learning_rate": 4.879899470086995e-05, "epoch": 0.2971960201576431, "percentage": 9.91, "elapsed_time": "0:26:13", "remaining_time": "3:58:28", "throughput": "11975.39", "total_tokens": 18841600} {"current_steps": 2310, "total_steps": 23217, "loss": 1.0112, "learning_rate": 4.8788613824556194e-05, "epoch": 0.29848817676702416, "percentage": 9.95, "elapsed_time": "0:27:04", "remaining_time": "4:05:05", "throughput": "11647.06", "total_tokens": 18923520} {"current_steps": 2320, "total_steps": 23217, "loss": 1.3439, "learning_rate": 4.8778189391377574e-05, "epoch": 0.2997803333764052, "percentage": 9.99, "elapsed_time": "0:27:58", "remaining_time": "4:12:00", "throughput": "11321.62", "total_tokens": 19005440} {"current_steps": 2330, "total_steps": 23217, "loss": 1.0994, "learning_rate": 4.876772142042117e-05, "epoch": 0.3010724899857863, "percentage": 10.04, "elapsed_time": "0:28:50", "remaining_time": "4:18:28", "throughput": "11032.98", "total_tokens": 19087360} {"current_steps": 2340, "total_steps": 23217, "loss": 1.2049, "learning_rate": 4.875720993085384e-05, "epoch": 0.3023646465951673, "percentage": 10.08, "elapsed_time": "0:29:41", "remaining_time": "4:24:50", "throughput": "10762.53", "total_tokens": 19169280} {"current_steps": 2350, "total_steps": 23217, "loss": 0.6961, "learning_rate": 4.874665494192206e-05, "epoch": 0.3036568032045484, "percentage": 10.12, "elapsed_time": "0:30:34", "remaining_time": "4:31:27", "throughput": "10495.44", "total_tokens": 19251200} {"current_steps": 2360, "total_steps": 23217, "loss": 0.8927, "learning_rate": 4.8736056472951955e-05, "epoch": 0.30494895981392944, "percentage": 10.16, "elapsed_time": "0:31:27", "remaining_time": "4:37:59", "throughput": "10243.92", "total_tokens": 19333120} {"current_steps": 2370, "total_steps": 23217, "loss": 0.9728, "learning_rate": 4.8725414543349326e-05, "epoch": 0.3062411164233105, "percentage": 10.21, "elapsed_time": "0:32:20", "remaining_time": "4:44:27", "throughput": "10005.81", "total_tokens": 19415040} {"current_steps": 2380, "total_steps": 23217, "loss": 1.3036, "learning_rate": 4.871472917259947e-05, "epoch": 0.30753327303269157, "percentage": 10.25, "elapsed_time": "0:33:19", "remaining_time": "4:51:42", "throughput": "9752.50", "total_tokens": 19496960} {"current_steps": 2390, "total_steps": 23217, "loss": 0.9335, "learning_rate": 4.870400038026728e-05, "epoch": 0.3088254296420726, "percentage": 10.29, "elapsed_time": "0:34:16", "remaining_time": "4:58:39", "throughput": "9521.34", "total_tokens": 19578880} {"current_steps": 2400, "total_steps": 23217, "loss": 1.1586, "learning_rate": 4.869322818599714e-05, "epoch": 0.3101175862514537, "percentage": 10.34, "elapsed_time": "0:35:08", "remaining_time": "5:04:46", "throughput": "9325.56", "total_tokens": 19660800} {"current_steps": 2410, "total_steps": 23217, "loss": 1.2544, "learning_rate": 4.868241260951289e-05, "epoch": 0.3114097428608347, "percentage": 10.38, "elapsed_time": "0:35:57", "remaining_time": "5:10:28", "throughput": "9150.13", "total_tokens": 19742720} {"current_steps": 2420, "total_steps": 23217, "loss": 1.1045, "learning_rate": 4.867155367061781e-05, "epoch": 0.3127018994702158, "percentage": 10.42, "elapsed_time": "0:36:51", "remaining_time": "5:16:42", "throughput": "8965.77", "total_tokens": 19824640} {"current_steps": 2430, "total_steps": 23217, "loss": 0.5473, "learning_rate": 4.8660651389194576e-05, "epoch": 0.31399405607959685, "percentage": 10.47, "elapsed_time": "0:37:41", "remaining_time": "5:22:29", "throughput": "8800.46", "total_tokens": 19906560} {"current_steps": 2440, "total_steps": 23217, "loss": 1.2962, "learning_rate": 4.8649705785205224e-05, "epoch": 0.3152862126889779, "percentage": 10.51, "elapsed_time": "0:38:30", "remaining_time": "5:27:53", "throughput": "8651.29", "total_tokens": 19988480} {"current_steps": 2450, "total_steps": 23217, "loss": 0.8808, "learning_rate": 4.8638716878691125e-05, "epoch": 0.316578369298359, "percentage": 10.55, "elapsed_time": "0:39:19", "remaining_time": "5:33:21", "throughput": "8505.72", "total_tokens": 20070400} {"current_steps": 2460, "total_steps": 23217, "loss": 1.2679, "learning_rate": 4.862768468977293e-05, "epoch": 0.31787052590774, "percentage": 10.6, "elapsed_time": "0:40:07", "remaining_time": "5:38:36", "throughput": "8369.59", "total_tokens": 20152320} {"current_steps": 2470, "total_steps": 23217, "loss": 0.9461, "learning_rate": 4.861660923865052e-05, "epoch": 0.3191626825171211, "percentage": 10.64, "elapsed_time": "0:40:56", "remaining_time": "5:43:52", "throughput": "8237.36", "total_tokens": 20234240} {"current_steps": 2480, "total_steps": 23217, "loss": 0.7236, "learning_rate": 4.860549054560301e-05, "epoch": 0.32045483912650213, "percentage": 10.68, "elapsed_time": "0:41:46", "remaining_time": "5:49:16", "throughput": "8106.09", "total_tokens": 20316160} {"current_steps": 2490, "total_steps": 23217, "loss": 1.2098, "learning_rate": 4.8594328630988696e-05, "epoch": 0.32174699573588317, "percentage": 10.72, "elapsed_time": "0:42:35", "remaining_time": "5:54:32", "throughput": "7982.03", "total_tokens": 20398080} {"current_steps": 2500, "total_steps": 23217, "loss": 1.2859, "learning_rate": 4.858312351524499e-05, "epoch": 0.32303915234526426, "percentage": 10.77, "elapsed_time": "0:43:24", "remaining_time": "5:59:38", "throughput": "7864.81", "total_tokens": 20480000} {"current_steps": 2510, "total_steps": 23217, "loss": 0.9768, "learning_rate": 4.857187521888843e-05, "epoch": 0.3243313089546453, "percentage": 10.81, "elapsed_time": "0:44:12", "remaining_time": "6:04:41", "throughput": "7752.43", "total_tokens": 20561920} {"current_steps": 2520, "total_steps": 23217, "loss": 0.8317, "learning_rate": 4.8560583762514594e-05, "epoch": 0.3256234655640264, "percentage": 10.85, "elapsed_time": "0:45:00", "remaining_time": "6:09:39", "throughput": "7644.53", "total_tokens": 20643840} {"current_steps": 2530, "total_steps": 23217, "loss": 0.6581, "learning_rate": 4.854924916679811e-05, "epoch": 0.3269156221734074, "percentage": 10.9, "elapsed_time": "0:45:49", "remaining_time": "6:14:39", "throughput": "7538.94", "total_tokens": 20725760} {"current_steps": 2540, "total_steps": 23217, "loss": 1.248, "learning_rate": 4.8537871452492565e-05, "epoch": 0.32820777878278845, "percentage": 10.94, "elapsed_time": "0:46:37", "remaining_time": "6:19:36", "throughput": "7436.80", "total_tokens": 20807680} {"current_steps": 2550, "total_steps": 23217, "loss": 0.9416, "learning_rate": 4.852645064043053e-05, "epoch": 0.32949993539216954, "percentage": 10.98, "elapsed_time": "0:47:26", "remaining_time": "6:24:31", "throughput": "7338.35", "total_tokens": 20889600} {"current_steps": 2560, "total_steps": 23217, "loss": 1.0115, "learning_rate": 4.851498675152346e-05, "epoch": 0.3307920920015506, "percentage": 11.03, "elapsed_time": "0:48:15", "remaining_time": "6:29:26", "throughput": "7242.05", "total_tokens": 20971520} {"current_steps": 2570, "total_steps": 23217, "loss": 0.8474, "learning_rate": 4.8503479806761684e-05, "epoch": 0.33208424861093166, "percentage": 11.07, "elapsed_time": "0:49:04", "remaining_time": "6:34:14", "throughput": "7150.46", "total_tokens": 21053440} {"current_steps": 2580, "total_steps": 23217, "loss": 1.0834, "learning_rate": 4.84919298272144e-05, "epoch": 0.3333764052203127, "percentage": 11.11, "elapsed_time": "0:49:53", "remaining_time": "6:39:01", "throughput": "7061.41", "total_tokens": 21135360} {"current_steps": 2590, "total_steps": 23217, "loss": 1.3049, "learning_rate": 4.848033683402956e-05, "epoch": 0.33466856182969373, "percentage": 11.16, "elapsed_time": "0:50:42", "remaining_time": "6:43:47", "throughput": "6974.62", "total_tokens": 21217280} {"current_steps": 2600, "total_steps": 23217, "loss": 1.0012, "learning_rate": 4.84687008484339e-05, "epoch": 0.3359607184390748, "percentage": 11.2, "elapsed_time": "0:51:30", "remaining_time": "6:48:27", "throughput": "6891.50", "total_tokens": 21299200} {"current_steps": 2610, "total_steps": 23217, "loss": 0.6511, "learning_rate": 4.8457021891732866e-05, "epoch": 0.33725287504845586, "percentage": 11.24, "elapsed_time": "0:52:19", "remaining_time": "6:53:06", "throughput": "6810.70", "total_tokens": 21381120} {"current_steps": 2620, "total_steps": 23217, "loss": 0.715, "learning_rate": 4.844529998531058e-05, "epoch": 0.33854503165783695, "percentage": 11.28, "elapsed_time": "0:53:07", "remaining_time": "6:57:41", "throughput": "6732.71", "total_tokens": 21463040} {"current_steps": 2630, "total_steps": 23217, "loss": 0.9274, "learning_rate": 4.843353515062982e-05, "epoch": 0.339837188267218, "percentage": 11.33, "elapsed_time": "0:53:56", "remaining_time": "7:02:14", "throughput": "6656.75", "total_tokens": 21544960} {"current_steps": 2640, "total_steps": 23217, "loss": 0.6468, "learning_rate": 4.842172740923194e-05, "epoch": 0.341129344876599, "percentage": 11.37, "elapsed_time": "0:54:44", "remaining_time": "7:06:42", "throughput": "6583.94", "total_tokens": 21626880} {"current_steps": 2650, "total_steps": 23217, "loss": 0.9614, "learning_rate": 4.840987678273688e-05, "epoch": 0.3424215014859801, "percentage": 11.41, "elapsed_time": "0:55:32", "remaining_time": "7:11:06", "throughput": "6513.68", "total_tokens": 21708800} {"current_steps": 2660, "total_steps": 23217, "loss": 0.8697, "learning_rate": 4.8397983292843095e-05, "epoch": 0.34371365809536114, "percentage": 11.46, "elapsed_time": "0:56:21", "remaining_time": "7:15:30", "throughput": "6444.59", "total_tokens": 21790720} {"current_steps": 2670, "total_steps": 23217, "loss": 0.7511, "learning_rate": 4.838604696132753e-05, "epoch": 0.34500581470474223, "percentage": 11.5, "elapsed_time": "0:57:10", "remaining_time": "7:19:59", "throughput": "6375.80", "total_tokens": 21872640} {"current_steps": 2680, "total_steps": 23217, "loss": 1.081, "learning_rate": 4.837406781004554e-05, "epoch": 0.34629797131412327, "percentage": 11.54, "elapsed_time": "0:58:07", "remaining_time": "7:25:27", "throughput": "6294.52", "total_tokens": 21954560} {"current_steps": 2690, "total_steps": 23217, "loss": 0.9772, "learning_rate": 4.836204586093092e-05, "epoch": 0.34759012792350436, "percentage": 11.59, "elapsed_time": "0:59:00", "remaining_time": "7:30:14", "throughput": "6224.72", "total_tokens": 22036480} {"current_steps": 2700, "total_steps": 23217, "loss": 0.7102, "learning_rate": 4.8349981135995826e-05, "epoch": 0.3488822845328854, "percentage": 11.63, "elapsed_time": "0:59:52", "remaining_time": "7:34:58", "throughput": "6156.97", "total_tokens": 22118400} {"current_steps": 2710, "total_steps": 23217, "loss": 0.8293, "learning_rate": 4.833787365733071e-05, "epoch": 0.3501744411422664, "percentage": 11.67, "elapsed_time": "1:00:46", "remaining_time": "7:39:50", "throughput": "6088.71", "total_tokens": 22200320} {"current_steps": 2720, "total_steps": 23217, "loss": 0.6742, "learning_rate": 4.832572344710433e-05, "epoch": 0.3514665977516475, "percentage": 11.72, "elapsed_time": "1:01:39", "remaining_time": "7:44:36", "throughput": "6023.49", "total_tokens": 22282240} {"current_steps": 2730, "total_steps": 23217, "loss": 1.1822, "learning_rate": 4.831353052756367e-05, "epoch": 0.35275875436102855, "percentage": 11.76, "elapsed_time": "1:02:27", "remaining_time": "7:48:41", "throughput": "5968.01", "total_tokens": 22364160} {"current_steps": 2740, "total_steps": 23217, "loss": 1.0566, "learning_rate": 4.830129492103392e-05, "epoch": 0.35405091097040964, "percentage": 11.8, "elapsed_time": "1:03:15", "remaining_time": "7:52:46", "throughput": "5913.49", "total_tokens": 22446080} {"current_steps": 2750, "total_steps": 23217, "loss": 0.8509, "learning_rate": 4.828901664991845e-05, "epoch": 0.3553430675797907, "percentage": 11.84, "elapsed_time": "1:04:03", "remaining_time": "7:56:45", "throughput": "5861.24", "total_tokens": 22528000} {"current_steps": 2760, "total_steps": 23217, "loss": 0.9067, "learning_rate": 4.8276695736698704e-05, "epoch": 0.3566352241891717, "percentage": 11.89, "elapsed_time": "1:04:52", "remaining_time": "8:00:47", "throughput": "5809.31", "total_tokens": 22609920} {"current_steps": 2770, "total_steps": 23217, "loss": 0.7381, "learning_rate": 4.826433220393424e-05, "epoch": 0.3579273807985528, "percentage": 11.93, "elapsed_time": "1:05:41", "remaining_time": "8:04:50", "throughput": "5757.89", "total_tokens": 22691840} {"current_steps": 2780, "total_steps": 23217, "loss": 0.9375, "learning_rate": 4.825192607426264e-05, "epoch": 0.35921953740793383, "percentage": 11.97, "elapsed_time": "1:06:30", "remaining_time": "8:08:54", "throughput": "5707.26", "total_tokens": 22773760} {"current_steps": 2790, "total_steps": 23217, "loss": 1.1993, "learning_rate": 4.823947737039948e-05, "epoch": 0.3605116940173149, "percentage": 12.02, "elapsed_time": "1:07:19", "remaining_time": "8:12:55", "throughput": "5657.99", "total_tokens": 22855680} {"current_steps": 2800, "total_steps": 23217, "loss": 0.7907, "learning_rate": 4.82269861151383e-05, "epoch": 0.36180385062669596, "percentage": 12.06, "elapsed_time": "1:08:08", "remaining_time": "8:16:54", "throughput": "5609.84", "total_tokens": 22937600} {"current_steps": 2810, "total_steps": 23217, "loss": 1.0263, "learning_rate": 4.821445233135053e-05, "epoch": 0.363096007236077, "percentage": 12.1, "elapsed_time": "1:08:58", "remaining_time": "8:20:51", "throughput": "5562.87", "total_tokens": 23019520} {"current_steps": 2820, "total_steps": 23217, "loss": 0.8387, "learning_rate": 4.8201876041985496e-05, "epoch": 0.3643881638454581, "percentage": 12.15, "elapsed_time": "1:09:47", "remaining_time": "8:24:46", "throughput": "5517.05", "total_tokens": 23101440} {"current_steps": 2830, "total_steps": 23217, "loss": 1.1519, "learning_rate": 4.8189257270070335e-05, "epoch": 0.3656803204548391, "percentage": 12.19, "elapsed_time": "1:10:36", "remaining_time": "8:28:40", "throughput": "5472.08", "total_tokens": 23183360} {"current_steps": 2840, "total_steps": 23217, "loss": 0.8801, "learning_rate": 4.817659603870995e-05, "epoch": 0.3669724770642202, "percentage": 12.23, "elapsed_time": "1:11:26", "remaining_time": "8:32:32", "throughput": "5428.12", "total_tokens": 23265280} {"current_steps": 2850, "total_steps": 23217, "loss": 0.8017, "learning_rate": 4.8163892371087045e-05, "epoch": 0.36826463367360124, "percentage": 12.28, "elapsed_time": "1:12:15", "remaining_time": "8:36:19", "throughput": "5385.70", "total_tokens": 23347200} {"current_steps": 2860, "total_steps": 23217, "loss": 0.9614, "learning_rate": 4.815114629046196e-05, "epoch": 0.3695567902829823, "percentage": 12.32, "elapsed_time": "1:13:03", "remaining_time": "8:40:00", "throughput": "5344.87", "total_tokens": 23429120} {"current_steps": 2870, "total_steps": 23217, "loss": 0.93, "learning_rate": 4.813835782017274e-05, "epoch": 0.37084894689236336, "percentage": 12.36, "elapsed_time": "1:13:51", "remaining_time": "8:43:37", "throughput": "5305.46", "total_tokens": 23511040} {"current_steps": 2880, "total_steps": 23217, "loss": 0.9083, "learning_rate": 4.812552698363502e-05, "epoch": 0.3721411035017444, "percentage": 12.4, "elapsed_time": "1:14:40", "remaining_time": "8:47:20", "throughput": "5265.49", "total_tokens": 23592960} {"current_steps": 2890, "total_steps": 23217, "loss": 0.486, "learning_rate": 4.8112653804342015e-05, "epoch": 0.3734332601111255, "percentage": 12.45, "elapsed_time": "1:15:35", "remaining_time": "8:51:38", "throughput": "5220.32", "total_tokens": 23674880} {"current_steps": 2900, "total_steps": 23217, "loss": 1.176, "learning_rate": 4.809973830586446e-05, "epoch": 0.3747254167205065, "percentage": 12.49, "elapsed_time": "1:16:24", "remaining_time": "8:55:15", "throughput": "5182.47", "total_tokens": 23756800} {"current_steps": 2910, "total_steps": 23217, "loss": 1.007, "learning_rate": 4.8086780511850606e-05, "epoch": 0.37601757332988756, "percentage": 12.53, "elapsed_time": "1:17:11", "remaining_time": "8:58:42", "throughput": "5146.70", "total_tokens": 23838720} {"current_steps": 2920, "total_steps": 23217, "loss": 1.0682, "learning_rate": 4.807378044602611e-05, "epoch": 0.37730972993926865, "percentage": 12.58, "elapsed_time": "1:17:59", "remaining_time": "9:02:10", "throughput": "5111.37", "total_tokens": 23920640} {"current_steps": 2930, "total_steps": 23217, "loss": 0.9145, "learning_rate": 4.806073813219404e-05, "epoch": 0.3786018865486497, "percentage": 12.62, "elapsed_time": "1:18:47", "remaining_time": "9:05:35", "throughput": "5076.82", "total_tokens": 24002560} {"current_steps": 2940, "total_steps": 23217, "loss": 0.6768, "learning_rate": 4.8047653594234855e-05, "epoch": 0.37989404315803077, "percentage": 12.66, "elapsed_time": "1:19:35", "remaining_time": "9:08:58", "throughput": "5043.01", "total_tokens": 24084480} {"current_steps": 2950, "total_steps": 23217, "loss": 1.3005, "learning_rate": 4.803452685610626e-05, "epoch": 0.3811861997674118, "percentage": 12.71, "elapsed_time": "1:20:23", "remaining_time": "9:12:20", "throughput": "5009.87", "total_tokens": 24166400} {"current_steps": 2960, "total_steps": 23217, "loss": 0.9298, "learning_rate": 4.802135794184329e-05, "epoch": 0.3824783563767929, "percentage": 12.75, "elapsed_time": "1:21:11", "remaining_time": "9:15:40", "throughput": "4977.31", "total_tokens": 24248320} {"current_steps": 2970, "total_steps": 23217, "loss": 0.7336, "learning_rate": 4.800814687555817e-05, "epoch": 0.38377051298617393, "percentage": 12.79, "elapsed_time": "1:22:17", "remaining_time": "9:20:59", "throughput": "4927.65", "total_tokens": 24330240} {"current_steps": 2980, "total_steps": 23217, "loss": 1.221, "learning_rate": 4.799489368144031e-05, "epoch": 0.38506266959555496, "percentage": 12.84, "elapsed_time": "1:23:11", "remaining_time": "9:24:58", "throughput": "4890.54", "total_tokens": 24412160} {"current_steps": 2990, "total_steps": 23217, "loss": 0.9109, "learning_rate": 4.798159838375626e-05, "epoch": 0.38635482620493605, "percentage": 12.88, "elapsed_time": "1:24:00", "remaining_time": "9:28:15", "throughput": "4859.81", "total_tokens": 24494080} {"current_steps": 3000, "total_steps": 23217, "loss": 0.6901, "learning_rate": 4.796826100684967e-05, "epoch": 0.3876469828143171, "percentage": 12.92, "elapsed_time": "1:24:53", "remaining_time": "9:32:04", "throughput": "4825.10", "total_tokens": 24576000} {"current_steps": 3010, "total_steps": 23217, "loss": 1.0645, "learning_rate": 4.795488157514122e-05, "epoch": 0.3889391394236982, "percentage": 12.96, "elapsed_time": "1:26:28", "remaining_time": "9:40:31", "throughput": "4752.48", "total_tokens": 24657920} {"current_steps": 3020, "total_steps": 23217, "loss": 1.0953, "learning_rate": 4.794146011312861e-05, "epoch": 0.3902312960330792, "percentage": 13.01, "elapsed_time": "1:27:34", "remaining_time": "9:45:42", "throughput": "4708.02", "total_tokens": 24739840} {"current_steps": 3030, "total_steps": 23217, "loss": 1.2322, "learning_rate": 4.7927996645386476e-05, "epoch": 0.39152345264246025, "percentage": 13.05, "elapsed_time": "1:28:36", "remaining_time": "9:50:23", "throughput": "4668.47", "total_tokens": 24821760} {"current_steps": 3040, "total_steps": 23217, "loss": 0.7708, "learning_rate": 4.791449119656638e-05, "epoch": 0.39281560925184134, "percentage": 13.09, "elapsed_time": "1:29:34", "remaining_time": "9:54:30", "throughput": "4633.84", "total_tokens": 24903680} {"current_steps": 3050, "total_steps": 23217, "loss": 0.8159, "learning_rate": 4.790094379139676e-05, "epoch": 0.39410776586122237, "percentage": 13.14, "elapsed_time": "1:30:37", "remaining_time": "9:59:12", "throughput": "4595.22", "total_tokens": 24985600} {"current_steps": 3060, "total_steps": 23217, "loss": 0.7697, "learning_rate": 4.7887354454682854e-05, "epoch": 0.39539992247060346, "percentage": 13.18, "elapsed_time": "1:31:37", "remaining_time": "10:03:35", "throughput": "4559.57", "total_tokens": 25067520} {"current_steps": 3070, "total_steps": 23217, "loss": 1.0574, "learning_rate": 4.78737232113067e-05, "epoch": 0.3966920790799845, "percentage": 13.22, "elapsed_time": "1:32:37", "remaining_time": "10:07:52", "throughput": "4525.18", "total_tokens": 25149440} {"current_steps": 3080, "total_steps": 23217, "loss": 1.0678, "learning_rate": 4.7860050086227035e-05, "epoch": 0.39798423568936553, "percentage": 13.27, "elapsed_time": "1:33:35", "remaining_time": "10:11:55", "throughput": "4493.04", "total_tokens": 25231360} {"current_steps": 3090, "total_steps": 23217, "loss": 0.9143, "learning_rate": 4.784633510447932e-05, "epoch": 0.3992763922987466, "percentage": 13.31, "elapsed_time": "1:34:33", "remaining_time": "10:15:56", "throughput": "4461.43", "total_tokens": 25313280} {"current_steps": 3100, "total_steps": 23217, "loss": 0.8812, "learning_rate": 4.7832578291175626e-05, "epoch": 0.40056854890812765, "percentage": 13.35, "elapsed_time": "1:35:27", "remaining_time": "10:19:30", "throughput": "4433.58", "total_tokens": 25395200} {"current_steps": 3110, "total_steps": 23217, "loss": 0.6671, "learning_rate": 4.781877967150463e-05, "epoch": 0.40186070551750874, "percentage": 13.4, "elapsed_time": "1:36:18", "remaining_time": "10:22:40", "throughput": "4408.85", "total_tokens": 25477120} {"current_steps": 3120, "total_steps": 23217, "loss": 1.0019, "learning_rate": 4.7804939270731564e-05, "epoch": 0.4031528621268898, "percentage": 13.44, "elapsed_time": "1:37:09", "remaining_time": "10:25:47", "throughput": "4384.69", "total_tokens": 25559040} {"current_steps": 3130, "total_steps": 23217, "loss": 0.799, "learning_rate": 4.7791057114198133e-05, "epoch": 0.4044450187362708, "percentage": 13.48, "elapsed_time": "1:37:57", "remaining_time": "10:28:39", "throughput": "4362.52", "total_tokens": 25640960} {"current_steps": 3140, "total_steps": 23217, "loss": 1.0606, "learning_rate": 4.7777133227322525e-05, "epoch": 0.4057371753456519, "percentage": 13.52, "elapsed_time": "1:38:48", "remaining_time": "10:31:46", "throughput": "4338.84", "total_tokens": 25722880} {"current_steps": 3150, "total_steps": 23217, "loss": 0.8224, "learning_rate": 4.776316763559933e-05, "epoch": 0.40702933195503294, "percentage": 13.57, "elapsed_time": "1:39:40", "remaining_time": "10:34:55", "throughput": "4315.18", "total_tokens": 25804800} {"current_steps": 3160, "total_steps": 23217, "loss": 0.8995, "learning_rate": 4.774916036459949e-05, "epoch": 0.408321488564414, "percentage": 13.61, "elapsed_time": "1:40:29", "remaining_time": "10:37:52", "throughput": "4293.07", "total_tokens": 25886720} {"current_steps": 3170, "total_steps": 23217, "loss": 1.1617, "learning_rate": 4.773511143997026e-05, "epoch": 0.40961364517379506, "percentage": 13.65, "elapsed_time": "1:41:19", "remaining_time": "10:40:47", "throughput": "4271.42", "total_tokens": 25968640} {"current_steps": 3180, "total_steps": 23217, "loss": 0.8537, "learning_rate": 4.7721020887435186e-05, "epoch": 0.4109058017831761, "percentage": 13.7, "elapsed_time": "1:42:16", "remaining_time": "10:44:26", "throughput": "4245.09", "total_tokens": 26050560} {"current_steps": 3190, "total_steps": 23217, "loss": 1.5184, "learning_rate": 4.7706888732793996e-05, "epoch": 0.4121979583925572, "percentage": 13.74, "elapsed_time": "1:43:05", "remaining_time": "10:47:12", "throughput": "4224.80", "total_tokens": 26132480} {"current_steps": 3200, "total_steps": 23217, "loss": 1.1, "learning_rate": 4.769271500192264e-05, "epoch": 0.4134901150019382, "percentage": 13.78, "elapsed_time": "1:43:55", "remaining_time": "10:50:07", "throughput": "4203.74", "total_tokens": 26214400} {"current_steps": 3210, "total_steps": 23217, "loss": 1.0147, "learning_rate": 4.767849972077315e-05, "epoch": 0.4147822716113193, "percentage": 13.83, "elapsed_time": "1:44:46", "remaining_time": "10:53:01", "throughput": "4183.02", "total_tokens": 26296320} {"current_steps": 3220, "total_steps": 23217, "loss": 1.0684, "learning_rate": 4.766424291537366e-05, "epoch": 0.41607442822070034, "percentage": 13.87, "elapsed_time": "1:45:35", "remaining_time": "10:55:47", "throughput": "4163.34", "total_tokens": 26378240} {"current_steps": 3230, "total_steps": 23217, "loss": 0.7629, "learning_rate": 4.7649944611828316e-05, "epoch": 0.41736658483008143, "percentage": 13.91, "elapsed_time": "1:46:24", "remaining_time": "10:58:27", "throughput": "4144.35", "total_tokens": 26460160} {"current_steps": 3240, "total_steps": 23217, "loss": 0.8127, "learning_rate": 4.763560483631728e-05, "epoch": 0.41865874143946247, "percentage": 13.96, "elapsed_time": "1:47:12", "remaining_time": "11:00:59", "throughput": "4126.43", "total_tokens": 26542080} {"current_steps": 3250, "total_steps": 23217, "loss": 1.0787, "learning_rate": 4.762122361509662e-05, "epoch": 0.4199508980488435, "percentage": 14.0, "elapsed_time": "1:47:59", "remaining_time": "11:03:27", "throughput": "4109.01", "total_tokens": 26624000} {"current_steps": 3260, "total_steps": 23217, "loss": 1.089, "learning_rate": 4.7606800974498287e-05, "epoch": 0.4212430546582246, "percentage": 14.04, "elapsed_time": "1:48:49", "remaining_time": "11:06:09", "throughput": "4090.32", "total_tokens": 26705920} {"current_steps": 3270, "total_steps": 23217, "loss": 0.7698, "learning_rate": 4.75923369409301e-05, "epoch": 0.4225352112676056, "percentage": 14.08, "elapsed_time": "1:49:39", "remaining_time": "11:08:52", "throughput": "4071.66", "total_tokens": 26787840} {"current_steps": 3280, "total_steps": 23217, "loss": 1.2242, "learning_rate": 4.757783154087564e-05, "epoch": 0.4238273678769867, "percentage": 14.13, "elapsed_time": "1:50:30", "remaining_time": "11:11:44", "throughput": "4052.22", "total_tokens": 26869760} {"current_steps": 3290, "total_steps": 23217, "loss": 1.2536, "learning_rate": 4.756328480089425e-05, "epoch": 0.42511952448636775, "percentage": 14.17, "elapsed_time": "1:51:19", "remaining_time": "11:14:14", "throughput": "4035.16", "total_tokens": 26951680} {"current_steps": 3300, "total_steps": 23217, "loss": 1.0486, "learning_rate": 4.7548696747620956e-05, "epoch": 0.4264116810957488, "percentage": 14.21, "elapsed_time": "1:52:07", "remaining_time": "11:16:46", "throughput": "4018.08", "total_tokens": 27033600} {"current_steps": 3310, "total_steps": 23217, "loss": 1.1756, "learning_rate": 4.753406740776643e-05, "epoch": 0.4277038377051299, "percentage": 14.26, "elapsed_time": "1:52:57", "remaining_time": "11:19:21", "throughput": "4000.76", "total_tokens": 27115520} {"current_steps": 3320, "total_steps": 23217, "loss": 1.2511, "learning_rate": 4.7519396808116933e-05, "epoch": 0.4289959943145109, "percentage": 14.3, "elapsed_time": "1:53:46", "remaining_time": "11:21:49", "throughput": "3984.31", "total_tokens": 27197440} {"current_steps": 3330, "total_steps": 23217, "loss": 0.8987, "learning_rate": 4.750468497553429e-05, "epoch": 0.430288150923892, "percentage": 14.34, "elapsed_time": "1:54:36", "remaining_time": "11:24:24", "throughput": "3967.25", "total_tokens": 27279360} {"current_steps": 3340, "total_steps": 23217, "loss": 1.0922, "learning_rate": 4.74899319369558e-05, "epoch": 0.43158030753327303, "percentage": 14.39, "elapsed_time": "1:55:24", "remaining_time": "11:26:49", "throughput": "3951.34", "total_tokens": 27361280} {"current_steps": 3350, "total_steps": 23217, "loss": 1.028, "learning_rate": 4.7475137719394234e-05, "epoch": 0.43287246414265407, "percentage": 14.43, "elapsed_time": "1:56:12", "remaining_time": "11:29:07", "throughput": "3936.13", "total_tokens": 27443200} {"current_steps": 3360, "total_steps": 23217, "loss": 0.7594, "learning_rate": 4.746030234993775e-05, "epoch": 0.43416462075203516, "percentage": 14.47, "elapsed_time": "1:56:59", "remaining_time": "11:31:23", "throughput": "3921.27", "total_tokens": 27525120} {"current_steps": 3370, "total_steps": 23217, "loss": 1.21, "learning_rate": 4.7445425855749844e-05, "epoch": 0.4354567773614162, "percentage": 14.52, "elapsed_time": "1:57:47", "remaining_time": "11:33:43", "throughput": "3906.17", "total_tokens": 27607040} {"current_steps": 3380, "total_steps": 23217, "loss": 0.8709, "learning_rate": 4.743050826406934e-05, "epoch": 0.4367489339707973, "percentage": 14.56, "elapsed_time": "1:58:35", "remaining_time": "11:36:01", "throughput": "3891.29", "total_tokens": 27688960} {"current_steps": 3390, "total_steps": 23217, "loss": 0.8737, "learning_rate": 4.741554960221027e-05, "epoch": 0.4380410905801783, "percentage": 14.6, "elapsed_time": "1:59:23", "remaining_time": "11:38:18", "throughput": "3876.58", "total_tokens": 27770880} {"current_steps": 3400, "total_steps": 23217, "loss": 1.2981, "learning_rate": 4.7400549897561914e-05, "epoch": 0.43933324718955935, "percentage": 14.64, "elapsed_time": "2:00:11", "remaining_time": "11:40:33", "throughput": "3862.20", "total_tokens": 27852800} {"current_steps": 3410, "total_steps": 23217, "loss": 0.7498, "learning_rate": 4.7385509177588664e-05, "epoch": 0.44062540379894044, "percentage": 14.69, "elapsed_time": "2:00:59", "remaining_time": "11:42:47", "throughput": "3848.00", "total_tokens": 27934720} {"current_steps": 3420, "total_steps": 23217, "loss": 1.5585, "learning_rate": 4.7370427469830016e-05, "epoch": 0.4419175604083215, "percentage": 14.73, "elapsed_time": "2:01:47", "remaining_time": "11:44:59", "throughput": "3834.01", "total_tokens": 28016640} {"current_steps": 3430, "total_steps": 23217, "loss": 1.2198, "learning_rate": 4.735530480190053e-05, "epoch": 0.44320971701770256, "percentage": 14.77, "elapsed_time": "2:02:34", "remaining_time": "11:47:09", "throughput": "3820.34", "total_tokens": 28098560} {"current_steps": 3440, "total_steps": 23217, "loss": 0.7208, "learning_rate": 4.734014120148976e-05, "epoch": 0.4445018736270836, "percentage": 14.82, "elapsed_time": "2:03:22", "remaining_time": "11:49:18", "throughput": "3806.84", "total_tokens": 28180480} {"current_steps": 3450, "total_steps": 23217, "loss": 0.8981, "learning_rate": 4.73249366963622e-05, "epoch": 0.44579403023646463, "percentage": 14.86, "elapsed_time": "2:04:10", "remaining_time": "11:51:26", "throughput": "3793.52", "total_tokens": 28262400} {"current_steps": 3460, "total_steps": 23217, "loss": 0.9347, "learning_rate": 4.730969131435724e-05, "epoch": 0.4470861868458457, "percentage": 14.9, "elapsed_time": "2:04:57", "remaining_time": "11:53:33", "throughput": "3780.34", "total_tokens": 28344320} {"current_steps": 3470, "total_steps": 23217, "loss": 1.1323, "learning_rate": 4.729440508338911e-05, "epoch": 0.44837834345522676, "percentage": 14.95, "elapsed_time": "2:05:46", "remaining_time": "11:55:42", "throughput": "3767.04", "total_tokens": 28426240} {"current_steps": 3480, "total_steps": 23217, "loss": 1.1095, "learning_rate": 4.727907803144686e-05, "epoch": 0.44967050006460785, "percentage": 14.99, "elapsed_time": "2:06:34", "remaining_time": "11:57:54", "throughput": "3753.63", "total_tokens": 28508160} {"current_steps": 3490, "total_steps": 23217, "loss": 1.2198, "learning_rate": 4.726371018659427e-05, "epoch": 0.4509626566739889, "percentage": 15.03, "elapsed_time": "2:07:23", "remaining_time": "12:00:02", "throughput": "3740.62", "total_tokens": 28590080} {"current_steps": 3500, "total_steps": 23217, "loss": 1.078, "learning_rate": 4.724830157696979e-05, "epoch": 0.45225481328336997, "percentage": 15.08, "elapsed_time": "2:08:10", "remaining_time": "12:02:06", "throughput": "3728.02", "total_tokens": 28672000} {"current_steps": 3510, "total_steps": 23217, "loss": 0.9332, "learning_rate": 4.723285223078653e-05, "epoch": 0.453546969892751, "percentage": 15.12, "elapsed_time": "2:08:59", "remaining_time": "12:04:11", "throughput": "3715.43", "total_tokens": 28753920} {"current_steps": 3520, "total_steps": 23217, "loss": 1.3173, "learning_rate": 4.721736217633219e-05, "epoch": 0.45483912650213204, "percentage": 15.16, "elapsed_time": "2:09:47", "remaining_time": "12:06:15", "throughput": "3702.94", "total_tokens": 28835840} {"current_steps": 3530, "total_steps": 23217, "loss": 0.9488, "learning_rate": 4.7201831441969016e-05, "epoch": 0.45613128311151313, "percentage": 15.2, "elapsed_time": "2:10:35", "remaining_time": "12:08:20", "throughput": "3690.45", "total_tokens": 28917760} {"current_steps": 3540, "total_steps": 23217, "loss": 0.8988, "learning_rate": 4.71862600561337e-05, "epoch": 0.45742343972089416, "percentage": 15.25, "elapsed_time": "2:11:25", "remaining_time": "12:10:30", "throughput": "3677.66", "total_tokens": 28999680} {"current_steps": 3550, "total_steps": 23217, "loss": 1.401, "learning_rate": 4.7170648047337415e-05, "epoch": 0.45871559633027525, "percentage": 15.29, "elapsed_time": "2:12:13", "remaining_time": "12:12:30", "throughput": "3665.72", "total_tokens": 29081600} {"current_steps": 3560, "total_steps": 23217, "loss": 0.768, "learning_rate": 4.7154995444165685e-05, "epoch": 0.4600077529396563, "percentage": 15.33, "elapsed_time": "2:13:01", "remaining_time": "12:14:30", "throughput": "3653.93", "total_tokens": 29163520} {"current_steps": 3570, "total_steps": 23217, "loss": 0.8524, "learning_rate": 4.713930227527836e-05, "epoch": 0.4612999095490373, "percentage": 15.38, "elapsed_time": "2:13:49", "remaining_time": "12:16:30", "throughput": "3642.16", "total_tokens": 29245440} {"current_steps": 3580, "total_steps": 23217, "loss": 0.8993, "learning_rate": 4.712356856940958e-05, "epoch": 0.4625920661584184, "percentage": 15.42, "elapsed_time": "2:14:38", "remaining_time": "12:18:29", "throughput": "3630.48", "total_tokens": 29327360} {"current_steps": 3590, "total_steps": 23217, "loss": 0.7759, "learning_rate": 4.710779435536772e-05, "epoch": 0.46388422276779945, "percentage": 15.46, "elapsed_time": "2:15:26", "remaining_time": "12:20:30", "throughput": "3618.82", "total_tokens": 29409280} {"current_steps": 3600, "total_steps": 23217, "loss": 0.7109, "learning_rate": 4.709197966203528e-05, "epoch": 0.46517637937718054, "percentage": 15.51, "elapsed_time": "2:16:15", "remaining_time": "12:22:30", "throughput": "3607.17", "total_tokens": 29491200} {"current_steps": 3610, "total_steps": 23217, "loss": 1.2732, "learning_rate": 4.707612451836892e-05, "epoch": 0.46646853598656157, "percentage": 15.55, "elapsed_time": "2:17:03", "remaining_time": "12:24:21", "throughput": "3596.39", "total_tokens": 29573120} {"current_steps": 3620, "total_steps": 23217, "loss": 1.0464, "learning_rate": 4.706022895339936e-05, "epoch": 0.4677606925959426, "percentage": 15.59, "elapsed_time": "2:17:52", "remaining_time": "12:26:25", "throughput": "3584.60", "total_tokens": 29655040} {"current_steps": 3630, "total_steps": 23217, "loss": 0.8741, "learning_rate": 4.704429299623129e-05, "epoch": 0.4690528492053237, "percentage": 15.64, "elapsed_time": "2:18:41", "remaining_time": "12:28:23", "throughput": "3573.37", "total_tokens": 29736960} {"current_steps": 3640, "total_steps": 23217, "loss": 0.9055, "learning_rate": 4.7028316676043425e-05, "epoch": 0.47034500581470473, "percentage": 15.68, "elapsed_time": "2:19:30", "remaining_time": "12:30:19", "throughput": "3562.35", "total_tokens": 29818880} {"current_steps": 3650, "total_steps": 23217, "loss": 0.9934, "learning_rate": 4.7012300022088326e-05, "epoch": 0.4716371624240858, "percentage": 15.72, "elapsed_time": "2:20:19", "remaining_time": "12:32:16", "throughput": "3551.33", "total_tokens": 29900800} {"current_steps": 3660, "total_steps": 23217, "loss": 1.0764, "learning_rate": 4.6996243063692446e-05, "epoch": 0.47292931903346686, "percentage": 15.76, "elapsed_time": "2:21:08", "remaining_time": "12:34:10", "throughput": "3540.54", "total_tokens": 29982720} {"current_steps": 3670, "total_steps": 23217, "loss": 0.5566, "learning_rate": 4.6980145830255993e-05, "epoch": 0.4742214756428479, "percentage": 15.81, "elapsed_time": "2:21:56", "remaining_time": "12:36:00", "throughput": "3530.11", "total_tokens": 30064640} {"current_steps": 3680, "total_steps": 23217, "loss": 0.9627, "learning_rate": 4.6964008351252964e-05, "epoch": 0.475513632252229, "percentage": 15.85, "elapsed_time": "2:22:44", "remaining_time": "12:37:49", "throughput": "3519.90", "total_tokens": 30146560} {"current_steps": 3690, "total_steps": 23217, "loss": 0.8859, "learning_rate": 4.694783065623102e-05, "epoch": 0.47680578886161, "percentage": 15.89, "elapsed_time": "2:23:32", "remaining_time": "12:39:37", "throughput": "3509.73", "total_tokens": 30228480} {"current_steps": 3700, "total_steps": 23217, "loss": 1.1395, "learning_rate": 4.6931612774811445e-05, "epoch": 0.4780979454709911, "percentage": 15.94, "elapsed_time": "2:24:20", "remaining_time": "12:41:22", "throughput": "3499.86", "total_tokens": 30310400} {"current_steps": 3710, "total_steps": 23217, "loss": 0.7113, "learning_rate": 4.691535473668914e-05, "epoch": 0.47939010208037214, "percentage": 15.98, "elapsed_time": "2:25:08", "remaining_time": "12:43:07", "throughput": "3490.09", "total_tokens": 30392320} {"current_steps": 3720, "total_steps": 23217, "loss": 1.049, "learning_rate": 4.68990565716325e-05, "epoch": 0.4806822586897532, "percentage": 16.02, "elapsed_time": "2:25:57", "remaining_time": "12:44:58", "throughput": "3479.85", "total_tokens": 30474240} {"current_steps": 3730, "total_steps": 23217, "loss": 1.1382, "learning_rate": 4.688271830948342e-05, "epoch": 0.48197441529913426, "percentage": 16.07, "elapsed_time": "2:26:46", "remaining_time": "12:46:46", "throughput": "3469.86", "total_tokens": 30556160} {"current_steps": 3740, "total_steps": 23217, "loss": 0.8307, "learning_rate": 4.686633998015718e-05, "epoch": 0.4832665719085153, "percentage": 16.11, "elapsed_time": "2:27:34", "remaining_time": "12:48:29", "throughput": "3460.34", "total_tokens": 30638080} {"current_steps": 3750, "total_steps": 23217, "loss": 1.0814, "learning_rate": 4.6849921613642456e-05, "epoch": 0.4845587285178964, "percentage": 16.15, "elapsed_time": "2:28:22", "remaining_time": "12:50:15", "throughput": "3450.68", "total_tokens": 30720000} {"current_steps": 3760, "total_steps": 23217, "loss": 1.0745, "learning_rate": 4.683346324000122e-05, "epoch": 0.4858508851272774, "percentage": 16.2, "elapsed_time": "2:29:10", "remaining_time": "12:51:57", "throughput": "3441.27", "total_tokens": 30801920} {"current_steps": 3770, "total_steps": 23217, "loss": 1.0342, "learning_rate": 4.6816964889368674e-05, "epoch": 0.48714304173665846, "percentage": 16.24, "elapsed_time": "2:29:58", "remaining_time": "12:53:40", "throughput": "3431.92", "total_tokens": 30883840} {"current_steps": 3780, "total_steps": 23217, "loss": 1.5249, "learning_rate": 4.680042659195325e-05, "epoch": 0.48843519834603955, "percentage": 16.28, "elapsed_time": "2:30:46", "remaining_time": "12:55:19", "throughput": "3422.80", "total_tokens": 30965760} {"current_steps": 3790, "total_steps": 23217, "loss": 0.9, "learning_rate": 4.678384837803651e-05, "epoch": 0.4897273549554206, "percentage": 16.32, "elapsed_time": "2:31:34", "remaining_time": "12:56:59", "throughput": "3413.76", "total_tokens": 31047680} {"current_steps": 3800, "total_steps": 23217, "loss": 0.835, "learning_rate": 4.67672302779731e-05, "epoch": 0.49101951156480167, "percentage": 16.37, "elapsed_time": "2:32:23", "remaining_time": "12:58:39", "throughput": "3404.64", "total_tokens": 31129600} {"current_steps": 3810, "total_steps": 23217, "loss": 1.2393, "learning_rate": 4.6750572322190716e-05, "epoch": 0.4923116681741827, "percentage": 16.41, "elapsed_time": "2:33:11", "remaining_time": "13:00:19", "throughput": "3395.65", "total_tokens": 31211520} {"current_steps": 3820, "total_steps": 23217, "loss": 0.5902, "learning_rate": 4.673387454118999e-05, "epoch": 0.4936038247835638, "percentage": 16.45, "elapsed_time": "2:34:00", "remaining_time": "13:02:00", "throughput": "3386.62", "total_tokens": 31293440} {"current_steps": 3830, "total_steps": 23217, "loss": 0.8908, "learning_rate": 4.671713696554452e-05, "epoch": 0.49489598139294483, "percentage": 16.5, "elapsed_time": "2:34:49", "remaining_time": "13:03:42", "throughput": "3377.50", "total_tokens": 31375360} {"current_steps": 3840, "total_steps": 23217, "loss": 0.9977, "learning_rate": 4.6700359625900724e-05, "epoch": 0.49618813800232586, "percentage": 16.54, "elapsed_time": "2:35:38", "remaining_time": "13:05:23", "throughput": "3368.52", "total_tokens": 31457280} {"current_steps": 3850, "total_steps": 23217, "loss": 0.8617, "learning_rate": 4.668354255297785e-05, "epoch": 0.49748029461170695, "percentage": 16.58, "elapsed_time": "2:36:27", "remaining_time": "13:07:05", "throughput": "3359.53", "total_tokens": 31539200} {"current_steps": 3860, "total_steps": 23217, "loss": 0.7011, "learning_rate": 4.666668577756793e-05, "epoch": 0.498772451221088, "percentage": 16.63, "elapsed_time": "2:37:16", "remaining_time": "13:08:40", "throughput": "3351.01", "total_tokens": 31621120} {"current_steps": 3870, "total_steps": 23217, "loss": 0.8713, "learning_rate": 4.664978933053562e-05, "epoch": 0.500064607830469, "percentage": 16.67, "elapsed_time": "2:38:05", "remaining_time": "13:10:18", "throughput": "3342.41", "total_tokens": 31703040} {"current_steps": 3880, "total_steps": 23217, "loss": 1.0985, "learning_rate": 4.6632853242818274e-05, "epoch": 0.5013567644398501, "percentage": 16.71, "elapsed_time": "2:38:53", "remaining_time": "13:11:54", "throughput": "3333.89", "total_tokens": 31784960} {"current_steps": 3890, "total_steps": 23217, "loss": 0.8102, "learning_rate": 4.66158775454258e-05, "epoch": 0.5026489210492312, "percentage": 16.75, "elapsed_time": "2:39:42", "remaining_time": "13:13:31", "throughput": "3325.40", "total_tokens": 31866880} {"current_steps": 3900, "total_steps": 23217, "loss": 1.0378, "learning_rate": 4.659886226944063e-05, "epoch": 0.5039410776586122, "percentage": 16.8, "elapsed_time": "2:40:31", "remaining_time": "13:15:06", "throughput": "3317.05", "total_tokens": 31948800} {"current_steps": 3910, "total_steps": 23217, "loss": 0.9426, "learning_rate": 4.658180744601769e-05, "epoch": 0.5052332342679933, "percentage": 16.84, "elapsed_time": "2:41:21", "remaining_time": "13:16:45", "throughput": "3308.49", "total_tokens": 32030720} {"current_steps": 3920, "total_steps": 23217, "loss": 1.1089, "learning_rate": 4.6564713106384296e-05, "epoch": 0.5065253908773744, "percentage": 16.88, "elapsed_time": "2:42:10", "remaining_time": "13:18:18", "throughput": "3300.30", "total_tokens": 32112640} {"current_steps": 3930, "total_steps": 23217, "loss": 1.0339, "learning_rate": 4.65475792818401e-05, "epoch": 0.5078175474867554, "percentage": 16.93, "elapsed_time": "2:42:59", "remaining_time": "13:19:55", "throughput": "3291.94", "total_tokens": 32194560} {"current_steps": 3940, "total_steps": 23217, "loss": 1.1407, "learning_rate": 4.653040600375709e-05, "epoch": 0.5091097040961364, "percentage": 16.97, "elapsed_time": "2:43:48", "remaining_time": "13:21:28", "throughput": "3283.91", "total_tokens": 32276480} {"current_steps": 3950, "total_steps": 23217, "loss": 1.1492, "learning_rate": 4.6513193303579476e-05, "epoch": 0.5104018607055175, "percentage": 17.01, "elapsed_time": "2:44:36", "remaining_time": "13:22:56", "throughput": "3276.21", "total_tokens": 32358400} {"current_steps": 3960, "total_steps": 23217, "loss": 0.8435, "learning_rate": 4.6495941212823644e-05, "epoch": 0.5116940173148986, "percentage": 17.06, "elapsed_time": "2:45:24", "remaining_time": "13:24:22", "throughput": "3268.65", "total_tokens": 32440320} {"current_steps": 3970, "total_steps": 23217, "loss": 0.6948, "learning_rate": 4.647864976307811e-05, "epoch": 0.5129861739242796, "percentage": 17.1, "elapsed_time": "2:46:13", "remaining_time": "13:25:52", "throughput": "3260.90", "total_tokens": 32522240} {"current_steps": 3980, "total_steps": 23217, "loss": 0.8107, "learning_rate": 4.646131898600345e-05, "epoch": 0.5142783305336607, "percentage": 17.14, "elapsed_time": "2:47:01", "remaining_time": "13:27:16", "throughput": "3253.53", "total_tokens": 32604160} {"current_steps": 3990, "total_steps": 23217, "loss": 1.0497, "learning_rate": 4.644394891333227e-05, "epoch": 0.5155704871430418, "percentage": 17.19, "elapsed_time": "2:47:49", "remaining_time": "13:28:43", "throughput": "3246.03", "total_tokens": 32686080} {"current_steps": 4000, "total_steps": 23217, "loss": 0.988, "learning_rate": 4.64265395768691e-05, "epoch": 0.5168626437524227, "percentage": 17.23, "elapsed_time": "2:48:37", "remaining_time": "13:30:07", "throughput": "3238.69", "total_tokens": 32768000} {"current_steps": 4010, "total_steps": 23217, "loss": 0.9792, "learning_rate": 4.6409091008490365e-05, "epoch": 0.5181548003618038, "percentage": 17.27, "elapsed_time": "2:49:36", "remaining_time": "13:32:22", "throughput": "3228.08", "total_tokens": 32849920} {"current_steps": 4020, "total_steps": 23217, "loss": 0.7922, "learning_rate": 4.639160324014433e-05, "epoch": 0.5194469569711849, "percentage": 17.31, "elapsed_time": "2:50:24", "remaining_time": "13:33:46", "throughput": "3220.80", "total_tokens": 32931840} {"current_steps": 4030, "total_steps": 23217, "loss": 1.2068, "learning_rate": 4.637407630385104e-05, "epoch": 0.520739113580566, "percentage": 17.36, "elapsed_time": "2:51:14", "remaining_time": "13:35:17", "throughput": "3213.19", "total_tokens": 33013760} {"current_steps": 4040, "total_steps": 23217, "loss": 0.9503, "learning_rate": 4.6356510231702254e-05, "epoch": 0.522031270189947, "percentage": 17.4, "elapsed_time": "2:52:03", "remaining_time": "13:36:43", "throughput": "3205.82", "total_tokens": 33095680} {"current_steps": 4050, "total_steps": 23217, "loss": 0.8793, "learning_rate": 4.633890505586139e-05, "epoch": 0.5233234267993281, "percentage": 17.44, "elapsed_time": "2:52:52", "remaining_time": "13:38:11", "throughput": "3198.46", "total_tokens": 33177600} {"current_steps": 4060, "total_steps": 23217, "loss": 1.0048, "learning_rate": 4.6321260808563445e-05, "epoch": 0.5246155834087092, "percentage": 17.49, "elapsed_time": "2:53:41", "remaining_time": "13:39:33", "throughput": "3191.44", "total_tokens": 33259520} {"current_steps": 4070, "total_steps": 23217, "loss": 0.8116, "learning_rate": 4.630357752211498e-05, "epoch": 0.5259077400180902, "percentage": 17.53, "elapsed_time": "2:54:29", "remaining_time": "13:40:52", "throughput": "3184.67", "total_tokens": 33341440} {"current_steps": 4080, "total_steps": 23217, "loss": 1.202, "learning_rate": 4.6285855228894025e-05, "epoch": 0.5271998966274712, "percentage": 17.57, "elapsed_time": "2:55:17", "remaining_time": "13:42:12", "throughput": "3177.81", "total_tokens": 33423360} {"current_steps": 4090, "total_steps": 23217, "loss": 1.2678, "learning_rate": 4.626809396135003e-05, "epoch": 0.5284920532368523, "percentage": 17.62, "elapsed_time": "2:56:06", "remaining_time": "13:43:32", "throughput": "3171.02", "total_tokens": 33505280} {"current_steps": 4100, "total_steps": 23217, "loss": 1.052, "learning_rate": 4.6250293752003834e-05, "epoch": 0.5297842098462333, "percentage": 17.66, "elapsed_time": "2:56:56", "remaining_time": "13:44:59", "throughput": "3163.80", "total_tokens": 33587200} {"current_steps": 4110, "total_steps": 23217, "loss": 0.9749, "learning_rate": 4.623245463344753e-05, "epoch": 0.5310763664556144, "percentage": 17.7, "elapsed_time": "2:57:45", "remaining_time": "13:46:24", "throughput": "3156.71", "total_tokens": 33669120} {"current_steps": 4120, "total_steps": 23217, "loss": 0.9361, "learning_rate": 4.6214576638344484e-05, "epoch": 0.5323685230649955, "percentage": 17.75, "elapsed_time": "2:58:34", "remaining_time": "13:47:43", "throughput": "3150.05", "total_tokens": 33751040} {"current_steps": 4130, "total_steps": 23217, "loss": 1.0865, "learning_rate": 4.619665979942924e-05, "epoch": 0.5336606796743766, "percentage": 17.79, "elapsed_time": "2:59:23", "remaining_time": "13:49:05", "throughput": "3143.24", "total_tokens": 33832960} {"current_steps": 4140, "total_steps": 23217, "loss": 0.8994, "learning_rate": 4.617870414950748e-05, "epoch": 0.5349528362837576, "percentage": 17.83, "elapsed_time": "3:00:12", "remaining_time": "13:50:21", "throughput": "3136.77", "total_tokens": 33914880} {"current_steps": 4150, "total_steps": 23217, "loss": 1.0843, "learning_rate": 4.616070972145591e-05, "epoch": 0.5362449928931387, "percentage": 17.87, "elapsed_time": "3:01:00", "remaining_time": "13:51:38", "throughput": "3130.29", "total_tokens": 33996800} {"current_steps": 4160, "total_steps": 23217, "loss": 1.1799, "learning_rate": 4.614267654822228e-05, "epoch": 0.5375371495025197, "percentage": 17.92, "elapsed_time": "3:01:49", "remaining_time": "13:52:54", "throughput": "3123.88", "total_tokens": 34078720} {"current_steps": 4170, "total_steps": 23217, "loss": 1.018, "learning_rate": 4.612460466282525e-05, "epoch": 0.5388293061119007, "percentage": 17.96, "elapsed_time": "3:02:37", "remaining_time": "13:54:10", "throughput": "3117.51", "total_tokens": 34160640} {"current_steps": 4180, "total_steps": 23217, "loss": 1.2698, "learning_rate": 4.610649409835438e-05, "epoch": 0.5401214627212818, "percentage": 18.0, "elapsed_time": "3:03:26", "remaining_time": "13:55:26", "throughput": "3111.12", "total_tokens": 34242560} {"current_steps": 4190, "total_steps": 23217, "loss": 1.3887, "learning_rate": 4.608834488797006e-05, "epoch": 0.5414136193306629, "percentage": 18.05, "elapsed_time": "3:04:15", "remaining_time": "13:56:41", "throughput": "3104.85", "total_tokens": 34324480} {"current_steps": 4200, "total_steps": 23217, "loss": 0.983, "learning_rate": 4.607015706490341e-05, "epoch": 0.542705775940044, "percentage": 18.09, "elapsed_time": "3:05:03", "remaining_time": "13:57:54", "throughput": "3098.75", "total_tokens": 34406400} {"current_steps": 4210, "total_steps": 23217, "loss": 0.8547, "learning_rate": 4.6051930662456276e-05, "epoch": 0.543997932549425, "percentage": 18.13, "elapsed_time": "3:05:52", "remaining_time": "13:59:08", "throughput": "3092.55", "total_tokens": 34488320} {"current_steps": 4220, "total_steps": 23217, "loss": 1.1971, "learning_rate": 4.603366571400114e-05, "epoch": 0.5452900891588061, "percentage": 18.18, "elapsed_time": "3:06:39", "remaining_time": "14:00:18", "throughput": "3086.64", "total_tokens": 34570240} {"current_steps": 4230, "total_steps": 23217, "loss": 0.927, "learning_rate": 4.601536225298104e-05, "epoch": 0.5465822457681871, "percentage": 18.22, "elapsed_time": "3:07:29", "remaining_time": "14:01:33", "throughput": "3080.41", "total_tokens": 34652160} {"current_steps": 4240, "total_steps": 23217, "loss": 0.8928, "learning_rate": 4.5997020312909565e-05, "epoch": 0.5478744023775681, "percentage": 18.26, "elapsed_time": "3:08:17", "remaining_time": "14:02:43", "throughput": "3074.51", "total_tokens": 34734080} {"current_steps": 4250, "total_steps": 23217, "loss": 0.9546, "learning_rate": 4.597863992737072e-05, "epoch": 0.5491665589869492, "percentage": 18.31, "elapsed_time": "3:09:06", "remaining_time": "14:03:55", "throughput": "3068.53", "total_tokens": 34816000} {"current_steps": 4260, "total_steps": 23217, "loss": 1.1029, "learning_rate": 4.5960221130018946e-05, "epoch": 0.5504587155963303, "percentage": 18.35, "elapsed_time": "3:09:54", "remaining_time": "14:05:07", "throughput": "3062.60", "total_tokens": 34897920} {"current_steps": 4270, "total_steps": 23217, "loss": 1.1309, "learning_rate": 4.594176395457897e-05, "epoch": 0.5517508722057113, "percentage": 18.39, "elapsed_time": "3:10:43", "remaining_time": "14:06:18", "throughput": "3056.65", "total_tokens": 34979840} {"current_steps": 4280, "total_steps": 23217, "loss": 0.8424, "learning_rate": 4.592326843484583e-05, "epoch": 0.5530430288150924, "percentage": 18.43, "elapsed_time": "3:11:31", "remaining_time": "14:07:24", "throughput": "3051.09", "total_tokens": 35061760} {"current_steps": 4290, "total_steps": 23217, "loss": 1.2382, "learning_rate": 4.590473460468475e-05, "epoch": 0.5543351854244735, "percentage": 18.48, "elapsed_time": "3:12:19", "remaining_time": "14:08:29", "throughput": "3045.61", "total_tokens": 35143680} {"current_steps": 4300, "total_steps": 23217, "loss": 1.0987, "learning_rate": 4.58861624980311e-05, "epoch": 0.5556273420338546, "percentage": 18.52, "elapsed_time": "3:13:12", "remaining_time": "14:09:59", "throughput": "3038.59", "total_tokens": 35225600} {"current_steps": 4310, "total_steps": 23217, "loss": 0.6929, "learning_rate": 4.586755214889035e-05, "epoch": 0.5569194986432355, "percentage": 18.56, "elapsed_time": "3:14:10", "remaining_time": "14:11:49", "throughput": "3030.48", "total_tokens": 35307520} {"current_steps": 4320, "total_steps": 23217, "loss": 0.9671, "learning_rate": 4.584890359133797e-05, "epoch": 0.5582116552526166, "percentage": 18.61, "elapsed_time": "3:15:08", "remaining_time": "14:13:37", "throughput": "3022.50", "total_tokens": 35389440} {"current_steps": 4330, "total_steps": 23217, "loss": 0.7893, "learning_rate": 4.58302168595194e-05, "epoch": 0.5595038118619977, "percentage": 18.65, "elapsed_time": "3:16:02", "remaining_time": "14:15:08", "throughput": "3015.55", "total_tokens": 35471360} {"current_steps": 4340, "total_steps": 23217, "loss": 0.8821, "learning_rate": 4.5811491987649994e-05, "epoch": 0.5607959684713787, "percentage": 18.69, "elapsed_time": "3:17:06", "remaining_time": "14:17:18", "throughput": "3006.29", "total_tokens": 35553280} {"current_steps": 4350, "total_steps": 23217, "loss": 0.8082, "learning_rate": 4.579272901001491e-05, "epoch": 0.5620881250807598, "percentage": 18.74, "elapsed_time": "3:18:05", "remaining_time": "14:19:11", "throughput": "2998.12", "total_tokens": 35635200} {"current_steps": 4360, "total_steps": 23217, "loss": 0.9638, "learning_rate": 4.57739279609691e-05, "epoch": 0.5633802816901409, "percentage": 18.78, "elapsed_time": "3:19:03", "remaining_time": "14:20:56", "throughput": "2990.48", "total_tokens": 35717120} {"current_steps": 4370, "total_steps": 23217, "loss": 1.0087, "learning_rate": 4.57550888749372e-05, "epoch": 0.5646724382995219, "percentage": 18.82, "elapsed_time": "3:20:12", "remaining_time": "14:23:26", "throughput": "2980.23", "total_tokens": 35799040} {"current_steps": 4380, "total_steps": 23217, "loss": 1.0578, "learning_rate": 4.5736211786413524e-05, "epoch": 0.5659645949089029, "percentage": 18.87, "elapsed_time": "3:21:22", "remaining_time": "14:26:03", "throughput": "2969.65", "total_tokens": 35880960} {"current_steps": 4390, "total_steps": 23217, "loss": 0.5186, "learning_rate": 4.571729672996195e-05, "epoch": 0.567256751518284, "percentage": 18.91, "elapsed_time": "3:22:23", "remaining_time": "14:27:58", "throughput": "2961.53", "total_tokens": 35962880} {"current_steps": 4400, "total_steps": 23217, "loss": 1.0137, "learning_rate": 4.5698343740215865e-05, "epoch": 0.5685489081276651, "percentage": 18.95, "elapsed_time": "3:23:31", "remaining_time": "14:30:25", "throughput": "2951.60", "total_tokens": 36044800} {"current_steps": 4410, "total_steps": 23217, "loss": 0.91, "learning_rate": 4.5679352851878135e-05, "epoch": 0.5698410647370461, "percentage": 18.99, "elapsed_time": "3:24:35", "remaining_time": "14:32:30", "throughput": "2942.98", "total_tokens": 36126720} {"current_steps": 4420, "total_steps": 23217, "loss": 0.8943, "learning_rate": 4.5660324099721005e-05, "epoch": 0.5711332213464272, "percentage": 19.04, "elapsed_time": "3:25:47", "remaining_time": "14:35:08", "throughput": "2932.58", "total_tokens": 36208640} {"current_steps": 4430, "total_steps": 23217, "loss": 0.8402, "learning_rate": 4.5641257518586044e-05, "epoch": 0.5724253779558083, "percentage": 19.08, "elapsed_time": "3:26:55", "remaining_time": "14:37:33", "throughput": "2922.95", "total_tokens": 36290560} {"current_steps": 4440, "total_steps": 23217, "loss": 0.8945, "learning_rate": 4.562215314338411e-05, "epoch": 0.5737175345651893, "percentage": 19.12, "elapsed_time": "3:28:03", "remaining_time": "14:39:52", "throughput": "2913.72", "total_tokens": 36372480} {"current_steps": 4450, "total_steps": 23217, "loss": 1.3013, "learning_rate": 4.560301100909522e-05, "epoch": 0.5750096911745703, "percentage": 19.17, "elapsed_time": "3:29:02", "remaining_time": "14:41:37", "throughput": "2906.38", "total_tokens": 36454400} {"current_steps": 4460, "total_steps": 23217, "loss": 0.8028, "learning_rate": 4.558383115076857e-05, "epoch": 0.5763018477839514, "percentage": 19.21, "elapsed_time": "3:30:23", "remaining_time": "14:44:49", "throughput": "2894.31", "total_tokens": 36536320} {"current_steps": 4470, "total_steps": 23217, "loss": 1.1116, "learning_rate": 4.556461360352241e-05, "epoch": 0.5775940043933324, "percentage": 19.25, "elapsed_time": "3:31:27", "remaining_time": "14:46:51", "throughput": "2886.15", "total_tokens": 36618240} {"current_steps": 4480, "total_steps": 23217, "loss": 1.094, "learning_rate": 4.554535840254398e-05, "epoch": 0.5788861610027135, "percentage": 19.3, "elapsed_time": "3:32:17", "remaining_time": "14:47:52", "throughput": "2881.27", "total_tokens": 36700160} {"current_steps": 4490, "total_steps": 23217, "loss": 0.9717, "learning_rate": 4.552606558308951e-05, "epoch": 0.5801783176120946, "percentage": 19.34, "elapsed_time": "3:33:07", "remaining_time": "14:48:56", "throughput": "2876.30", "total_tokens": 36782080} {"current_steps": 4500, "total_steps": 23217, "loss": 1.0816, "learning_rate": 4.550673518048405e-05, "epoch": 0.5814704742214757, "percentage": 19.38, "elapsed_time": "3:33:57", "remaining_time": "14:49:57", "throughput": "2871.50", "total_tokens": 36864000} {"current_steps": 4510, "total_steps": 23217, "loss": 0.9271, "learning_rate": 4.548736723012153e-05, "epoch": 0.5827626308308567, "percentage": 19.43, "elapsed_time": "3:34:48", "remaining_time": "14:51:01", "throughput": "2866.51", "total_tokens": 36945920} {"current_steps": 4520, "total_steps": 23217, "loss": 0.9318, "learning_rate": 4.5467961767464575e-05, "epoch": 0.5840547874402378, "percentage": 19.47, "elapsed_time": "3:35:38", "remaining_time": "14:51:58", "throughput": "2861.92", "total_tokens": 37027840} {"current_steps": 4530, "total_steps": 23217, "loss": 0.7255, "learning_rate": 4.5448518828044515e-05, "epoch": 0.5853469440496188, "percentage": 19.51, "elapsed_time": "3:36:28", "remaining_time": "14:52:59", "throughput": "2857.12", "total_tokens": 37109760} {"current_steps": 4540, "total_steps": 23217, "loss": 1.1148, "learning_rate": 4.5429038447461315e-05, "epoch": 0.5866391006589998, "percentage": 19.55, "elapsed_time": "3:37:18", "remaining_time": "14:54:00", "throughput": "2852.35", "total_tokens": 37191680} {"current_steps": 4550, "total_steps": 23217, "loss": 1.1077, "learning_rate": 4.540952066138347e-05, "epoch": 0.5879312572683809, "percentage": 19.6, "elapsed_time": "3:38:08", "remaining_time": "14:54:55", "throughput": "2847.92", "total_tokens": 37273600} {"current_steps": 4560, "total_steps": 23217, "loss": 0.923, "learning_rate": 4.538996550554798e-05, "epoch": 0.589223413877762, "percentage": 19.64, "elapsed_time": "3:38:56", "remaining_time": "14:55:45", "throughput": "2843.72", "total_tokens": 37355520} {"current_steps": 4570, "total_steps": 23217, "loss": 0.9954, "learning_rate": 4.537037301576026e-05, "epoch": 0.5905155704871431, "percentage": 19.68, "elapsed_time": "3:39:46", "remaining_time": "14:56:44", "throughput": "2839.10", "total_tokens": 37437440} {"current_steps": 4580, "total_steps": 23217, "loss": 0.9237, "learning_rate": 4.535074322789408e-05, "epoch": 0.5918077270965241, "percentage": 19.73, "elapsed_time": "3:40:36", "remaining_time": "14:57:41", "throughput": "2834.58", "total_tokens": 37519360} {"current_steps": 4590, "total_steps": 23217, "loss": 1.0009, "learning_rate": 4.5331076177891527e-05, "epoch": 0.5930998837059052, "percentage": 19.77, "elapsed_time": "3:41:27", "remaining_time": "14:58:43", "throughput": "2829.80", "total_tokens": 37601280} {"current_steps": 4600, "total_steps": 23217, "loss": 1.0067, "learning_rate": 4.531137190176289e-05, "epoch": 0.5943920403152863, "percentage": 19.81, "elapsed_time": "3:42:17", "remaining_time": "14:59:39", "throughput": "2825.34", "total_tokens": 37683200} {"current_steps": 4610, "total_steps": 23217, "loss": 0.7292, "learning_rate": 4.529163043558662e-05, "epoch": 0.5956841969246672, "percentage": 19.86, "elapsed_time": "3:43:08", "remaining_time": "15:00:38", "throughput": "2820.75", "total_tokens": 37765120} {"current_steps": 4620, "total_steps": 23217, "loss": 1.0878, "learning_rate": 4.527185181550928e-05, "epoch": 0.5969763535340483, "percentage": 19.9, "elapsed_time": "3:43:57", "remaining_time": "15:01:30", "throughput": "2816.53", "total_tokens": 37847040} {"current_steps": 4630, "total_steps": 23217, "loss": 0.741, "learning_rate": 4.525203607774544e-05, "epoch": 0.5982685101434294, "percentage": 19.94, "elapsed_time": "3:44:48", "remaining_time": "15:02:30", "throughput": "2811.87", "total_tokens": 37928960} {"current_steps": 4640, "total_steps": 23217, "loss": 0.498, "learning_rate": 4.5232183258577655e-05, "epoch": 0.5995606667528104, "percentage": 19.99, "elapsed_time": "3:45:39", "remaining_time": "15:03:27", "throughput": "2807.39", "total_tokens": 38010880} {"current_steps": 4650, "total_steps": 23217, "loss": 0.854, "learning_rate": 4.5212293394356356e-05, "epoch": 0.6008528233621915, "percentage": 20.03, "elapsed_time": "3:46:32", "remaining_time": "15:04:32", "throughput": "2802.55", "total_tokens": 38092800} {"current_steps": 4660, "total_steps": 23217, "loss": 0.8904, "learning_rate": 4.519236652149981e-05, "epoch": 0.6021449799715726, "percentage": 20.07, "elapsed_time": "3:47:23", "remaining_time": "15:05:29", "throughput": "2798.09", "total_tokens": 38174720} {"current_steps": 4670, "total_steps": 23217, "loss": 0.6613, "learning_rate": 4.517240267649405e-05, "epoch": 0.6034371365809537, "percentage": 20.11, "elapsed_time": "3:48:15", "remaining_time": "15:06:32", "throughput": "2793.34", "total_tokens": 38256640} {"current_steps": 4680, "total_steps": 23217, "loss": 0.679, "learning_rate": 4.515240189589282e-05, "epoch": 0.6047292931903346, "percentage": 20.16, "elapsed_time": "3:49:06", "remaining_time": "15:07:28", "throughput": "2788.97", "total_tokens": 38338560} {"current_steps": 4690, "total_steps": 23217, "loss": 0.7213, "learning_rate": 4.5132364216317446e-05, "epoch": 0.6060214497997157, "percentage": 20.2, "elapsed_time": "3:49:57", "remaining_time": "15:08:22", "throughput": "2784.69", "total_tokens": 38420480} {"current_steps": 4700, "total_steps": 23217, "loss": 1.0668, "learning_rate": 4.5112289674456864e-05, "epoch": 0.6073136064090968, "percentage": 20.24, "elapsed_time": "3:50:47", "remaining_time": "15:09:17", "throughput": "2780.39", "total_tokens": 38502400} {"current_steps": 4710, "total_steps": 23217, "loss": 0.6861, "learning_rate": 4.509217830706749e-05, "epoch": 0.6086057630184778, "percentage": 20.29, "elapsed_time": "3:51:37", "remaining_time": "15:10:09", "throughput": "2776.27", "total_tokens": 38584320} {"current_steps": 4720, "total_steps": 23217, "loss": 0.9106, "learning_rate": 4.5072030150973154e-05, "epoch": 0.6098979196278589, "percentage": 20.33, "elapsed_time": "3:52:28", "remaining_time": "15:11:01", "throughput": "2772.09", "total_tokens": 38666240} {"current_steps": 4730, "total_steps": 23217, "loss": 0.73, "learning_rate": 4.505184524306506e-05, "epoch": 0.61119007623724, "percentage": 20.37, "elapsed_time": "3:53:17", "remaining_time": "15:11:48", "throughput": "2768.25", "total_tokens": 38748160} {"current_steps": 4740, "total_steps": 23217, "loss": 1.3151, "learning_rate": 4.50316236203017e-05, "epoch": 0.612482232846621, "percentage": 20.42, "elapsed_time": "3:54:07", "remaining_time": "15:12:40", "throughput": "2764.11", "total_tokens": 38830080} {"current_steps": 4750, "total_steps": 23217, "loss": 1.0097, "learning_rate": 4.5011365319708796e-05, "epoch": 0.613774389456002, "percentage": 20.46, "elapsed_time": "3:54:59", "remaining_time": "15:13:35", "throughput": "2759.84", "total_tokens": 38912000} {"current_steps": 4760, "total_steps": 23217, "loss": 1.0672, "learning_rate": 4.499107037837922e-05, "epoch": 0.6150665460653831, "percentage": 20.5, "elapsed_time": "3:55:50", "remaining_time": "15:14:27", "throughput": "2755.71", "total_tokens": 38993920} {"current_steps": 4770, "total_steps": 23217, "loss": 0.8592, "learning_rate": 4.497073883347293e-05, "epoch": 0.6163587026747642, "percentage": 20.55, "elapsed_time": "3:56:40", "remaining_time": "15:15:16", "throughput": "2751.78", "total_tokens": 39075840} {"current_steps": 4780, "total_steps": 23217, "loss": 0.979, "learning_rate": 4.495037072221692e-05, "epoch": 0.6176508592841452, "percentage": 20.59, "elapsed_time": "3:57:31", "remaining_time": "15:16:08", "throughput": "2747.69", "total_tokens": 39157760} {"current_steps": 4790, "total_steps": 23217, "loss": 1.1349, "learning_rate": 4.49299660819051e-05, "epoch": 0.6189430158935263, "percentage": 20.63, "elapsed_time": "3:58:20", "remaining_time": "15:16:54", "throughput": "2743.88", "total_tokens": 39239680} {"current_steps": 4800, "total_steps": 23217, "loss": 0.8819, "learning_rate": 4.490952494989834e-05, "epoch": 0.6202351725029074, "percentage": 20.67, "elapsed_time": "3:59:12", "remaining_time": "15:17:48", "throughput": "2739.72", "total_tokens": 39321600} {"current_steps": 4810, "total_steps": 23217, "loss": 1.0527, "learning_rate": 4.4889047363624236e-05, "epoch": 0.6215273291122884, "percentage": 20.72, "elapsed_time": "4:00:03", "remaining_time": "15:18:39", "throughput": "2735.71", "total_tokens": 39403520} {"current_steps": 4820, "total_steps": 23217, "loss": 1.1608, "learning_rate": 4.486853336057719e-05, "epoch": 0.6228194857216695, "percentage": 20.76, "elapsed_time": "4:00:53", "remaining_time": "15:19:26", "throughput": "2731.90", "total_tokens": 39485440} {"current_steps": 4830, "total_steps": 23217, "loss": 0.9382, "learning_rate": 4.484798297831826e-05, "epoch": 0.6241116423310505, "percentage": 20.8, "elapsed_time": "4:01:43", "remaining_time": "15:20:12", "throughput": "2728.13", "total_tokens": 39567360} {"current_steps": 4840, "total_steps": 23217, "loss": 0.9578, "learning_rate": 4.482739625447514e-05, "epoch": 0.6254037989404316, "percentage": 20.85, "elapsed_time": "4:02:32", "remaining_time": "15:20:55", "throughput": "2724.52", "total_tokens": 39649280} {"current_steps": 4850, "total_steps": 23217, "loss": 0.5964, "learning_rate": 4.480677322674202e-05, "epoch": 0.6266959555498126, "percentage": 20.89, "elapsed_time": "4:03:22", "remaining_time": "15:21:38", "throughput": "2720.90", "total_tokens": 39731200} {"current_steps": 4860, "total_steps": 23217, "loss": 1.0508, "learning_rate": 4.4786113932879605e-05, "epoch": 0.6279881121591937, "percentage": 20.93, "elapsed_time": "4:04:12", "remaining_time": "15:22:22", "throughput": "2717.25", "total_tokens": 39813120} {"current_steps": 4870, "total_steps": 23217, "loss": 0.7638, "learning_rate": 4.476541841071498e-05, "epoch": 0.6292802687685748, "percentage": 20.98, "elapsed_time": "4:05:02", "remaining_time": "15:23:11", "throughput": "2713.41", "total_tokens": 39895040} {"current_steps": 4880, "total_steps": 23217, "loss": 0.5432, "learning_rate": 4.4744686698141564e-05, "epoch": 0.6305724253779558, "percentage": 21.02, "elapsed_time": "4:05:53", "remaining_time": "15:23:58", "throughput": "2709.62", "total_tokens": 39976960} {"current_steps": 4890, "total_steps": 23217, "loss": 1.0626, "learning_rate": 4.472391883311906e-05, "epoch": 0.6318645819873369, "percentage": 21.06, "elapsed_time": "4:06:44", "remaining_time": "15:24:44", "throughput": "2705.88", "total_tokens": 40058880} {"current_steps": 4900, "total_steps": 23217, "loss": 0.8067, "learning_rate": 4.470311485367335e-05, "epoch": 0.633156738596718, "percentage": 21.11, "elapsed_time": "4:07:32", "remaining_time": "15:25:22", "throughput": "2702.58", "total_tokens": 40140800} {"current_steps": 4910, "total_steps": 23217, "loss": 0.8431, "learning_rate": 4.468227479789644e-05, "epoch": 0.6344488952060989, "percentage": 21.15, "elapsed_time": "4:08:22", "remaining_time": "15:26:02", "throughput": "2699.12", "total_tokens": 40222720} {"current_steps": 4920, "total_steps": 23217, "loss": 0.92, "learning_rate": 4.4661398703946396e-05, "epoch": 0.63574105181548, "percentage": 21.19, "elapsed_time": "4:09:11", "remaining_time": "15:26:43", "throughput": "2695.66", "total_tokens": 40304640} {"current_steps": 4930, "total_steps": 23217, "loss": 1.0994, "learning_rate": 4.464048661004727e-05, "epoch": 0.6370332084248611, "percentage": 21.23, "elapsed_time": "4:10:02", "remaining_time": "15:27:29", "throughput": "2691.97", "total_tokens": 40386560} {"current_steps": 4940, "total_steps": 23217, "loss": 1.0147, "learning_rate": 4.461953855448903e-05, "epoch": 0.6383253650342422, "percentage": 21.28, "elapsed_time": "4:10:50", "remaining_time": "15:28:05", "throughput": "2688.77", "total_tokens": 40468480} {"current_steps": 4950, "total_steps": 23217, "loss": 1.1607, "learning_rate": 4.4598554575627495e-05, "epoch": 0.6396175216436232, "percentage": 21.32, "elapsed_time": "4:11:40", "remaining_time": "15:28:47", "throughput": "2685.29", "total_tokens": 40550400} {"current_steps": 4960, "total_steps": 23217, "loss": 1.1159, "learning_rate": 4.4577534711884244e-05, "epoch": 0.6409096782530043, "percentage": 21.36, "elapsed_time": "4:12:29", "remaining_time": "15:29:21", "throughput": "2682.15", "total_tokens": 40632320} {"current_steps": 4970, "total_steps": 23217, "loss": 1.0039, "learning_rate": 4.455647900174658e-05, "epoch": 0.6422018348623854, "percentage": 21.41, "elapsed_time": "4:13:17", "remaining_time": "15:29:58", "throughput": "2678.93", "total_tokens": 40714240} {"current_steps": 4980, "total_steps": 23217, "loss": 0.8848, "learning_rate": 4.453538748376742e-05, "epoch": 0.6434939914717663, "percentage": 21.45, "elapsed_time": "4:14:07", "remaining_time": "15:30:37", "throughput": "2675.56", "total_tokens": 40796160} {"current_steps": 4990, "total_steps": 23217, "loss": 0.624, "learning_rate": 4.451426019656526e-05, "epoch": 0.6447861480811474, "percentage": 21.49, "elapsed_time": "4:14:56", "remaining_time": "15:31:12", "throughput": "2672.42", "total_tokens": 40878080} {"current_steps": 5000, "total_steps": 23217, "loss": 1.0137, "learning_rate": 4.449309717882409e-05, "epoch": 0.6460783046905285, "percentage": 21.54, "elapsed_time": "4:15:46", "remaining_time": "15:31:52", "throughput": "2669.08", "total_tokens": 40960000} {"current_steps": 5010, "total_steps": 23217, "loss": 0.9478, "learning_rate": 4.4471898469293324e-05, "epoch": 0.6473704612999095, "percentage": 21.58, "elapsed_time": "4:16:40", "remaining_time": "15:32:48", "throughput": "2664.90", "total_tokens": 41041920} {"current_steps": 5020, "total_steps": 23217, "loss": 0.8829, "learning_rate": 4.4450664106787706e-05, "epoch": 0.6486626179092906, "percentage": 21.62, "elapsed_time": "4:17:31", "remaining_time": "15:33:30", "throughput": "2661.45", "total_tokens": 41123840} {"current_steps": 5030, "total_steps": 23217, "loss": 1.0126, "learning_rate": 4.442939413018728e-05, "epoch": 0.6499547745186717, "percentage": 21.67, "elapsed_time": "4:18:21", "remaining_time": "15:34:09", "throughput": "2658.13", "total_tokens": 41205760} {"current_steps": 5040, "total_steps": 23217, "loss": 0.8302, "learning_rate": 4.44080885784373e-05, "epoch": 0.6512469311280528, "percentage": 21.71, "elapsed_time": "4:19:10", "remaining_time": "15:34:44", "throughput": "2655.01", "total_tokens": 41287680} {"current_steps": 5050, "total_steps": 23217, "loss": 1.0349, "learning_rate": 4.4386747490548156e-05, "epoch": 0.6525390877374337, "percentage": 21.75, "elapsed_time": "4:19:59", "remaining_time": "15:35:19", "throughput": "2651.90", "total_tokens": 41369600} {"current_steps": 5060, "total_steps": 23217, "loss": 1.1468, "learning_rate": 4.43653709055953e-05, "epoch": 0.6538312443468148, "percentage": 21.79, "elapsed_time": "4:20:48", "remaining_time": "15:35:53", "throughput": "2648.87", "total_tokens": 41451520} {"current_steps": 5070, "total_steps": 23217, "loss": 1.1647, "learning_rate": 4.434395886271917e-05, "epoch": 0.6551234009561959, "percentage": 21.84, "elapsed_time": "4:21:37", "remaining_time": "15:36:25", "throughput": "2645.90", "total_tokens": 41533440} {"current_steps": 5080, "total_steps": 23217, "loss": 1.2088, "learning_rate": 4.4322511401125156e-05, "epoch": 0.6564155575655769, "percentage": 21.88, "elapsed_time": "4:22:26", "remaining_time": "15:36:58", "throughput": "2642.88", "total_tokens": 41615360} {"current_steps": 5090, "total_steps": 23217, "loss": 0.8394, "learning_rate": 4.430102856008347e-05, "epoch": 0.657707714174958, "percentage": 21.92, "elapsed_time": "4:23:14", "remaining_time": "15:37:30", "throughput": "2639.91", "total_tokens": 41697280} {"current_steps": 5100, "total_steps": 23217, "loss": 0.7364, "learning_rate": 4.427951037892911e-05, "epoch": 0.6589998707843391, "percentage": 21.97, "elapsed_time": "4:24:03", "remaining_time": "15:38:01", "throughput": "2637.03", "total_tokens": 41779200} {"current_steps": 5110, "total_steps": 23217, "loss": 0.8559, "learning_rate": 4.4257956897061805e-05, "epoch": 0.6602920273937202, "percentage": 22.01, "elapsed_time": "4:24:51", "remaining_time": "15:38:30", "throughput": "2634.18", "total_tokens": 41861120} {"current_steps": 5120, "total_steps": 23217, "loss": 0.9424, "learning_rate": 4.423636815394588e-05, "epoch": 0.6615841840031012, "percentage": 22.05, "elapsed_time": "4:25:39", "remaining_time": "15:39:00", "throughput": "2631.32", "total_tokens": 41943040} {"current_steps": 5130, "total_steps": 23217, "loss": 1.1937, "learning_rate": 4.4214744189110266e-05, "epoch": 0.6628763406124822, "percentage": 22.1, "elapsed_time": "4:26:27", "remaining_time": "15:39:29", "throughput": "2628.54", "total_tokens": 42024960} {"current_steps": 5140, "total_steps": 23217, "loss": 1.0227, "learning_rate": 4.4193085042148354e-05, "epoch": 0.6641684972218633, "percentage": 22.14, "elapsed_time": "4:27:15", "remaining_time": "15:39:56", "throughput": "2625.82", "total_tokens": 42106880} {"current_steps": 5150, "total_steps": 23217, "loss": 1.3091, "learning_rate": 4.417139075271796e-05, "epoch": 0.6654606538312443, "percentage": 22.18, "elapsed_time": "4:28:04", "remaining_time": "15:40:27", "throughput": "2622.94", "total_tokens": 42188800} {"current_steps": 5160, "total_steps": 23217, "loss": 0.6186, "learning_rate": 4.414966136054125e-05, "epoch": 0.6667528104406254, "percentage": 22.23, "elapsed_time": "4:28:53", "remaining_time": "15:40:57", "throughput": "2620.10", "total_tokens": 42270720} {"current_steps": 5170, "total_steps": 23217, "loss": 0.7974, "learning_rate": 4.412789690540466e-05, "epoch": 0.6680449670500065, "percentage": 22.27, "elapsed_time": "4:29:41", "remaining_time": "15:41:24", "throughput": "2617.35", "total_tokens": 42352640} {"current_steps": 5180, "total_steps": 23217, "loss": 0.8996, "learning_rate": 4.410609742715883e-05, "epoch": 0.6693371236593875, "percentage": 22.31, "elapsed_time": "4:30:29", "remaining_time": "15:41:53", "throughput": "2614.58", "total_tokens": 42434560} {"current_steps": 5190, "total_steps": 23217, "loss": 1.0341, "learning_rate": 4.408426296571852e-05, "epoch": 0.6706292802687686, "percentage": 22.35, "elapsed_time": "4:31:18", "remaining_time": "15:42:22", "throughput": "2611.80", "total_tokens": 42516480} {"current_steps": 5200, "total_steps": 23217, "loss": 0.9729, "learning_rate": 4.406239356106257e-05, "epoch": 0.6719214368781496, "percentage": 22.4, "elapsed_time": "4:32:06", "remaining_time": "15:42:48", "throughput": "2609.16", "total_tokens": 42598400} {"current_steps": 5210, "total_steps": 23217, "loss": 0.6879, "learning_rate": 4.404048925323375e-05, "epoch": 0.6732135934875307, "percentage": 22.44, "elapsed_time": "4:32:54", "remaining_time": "15:43:15", "throughput": "2606.44", "total_tokens": 42680320} {"current_steps": 5220, "total_steps": 23217, "loss": 1.2569, "learning_rate": 4.401855008233879e-05, "epoch": 0.6745057500969117, "percentage": 22.48, "elapsed_time": "4:33:44", "remaining_time": "15:43:46", "throughput": "2603.57", "total_tokens": 42762240} {"current_steps": 5230, "total_steps": 23217, "loss": 1.1061, "learning_rate": 4.3996576088548214e-05, "epoch": 0.6757979067062928, "percentage": 22.53, "elapsed_time": "4:34:33", "remaining_time": "15:44:16", "throughput": "2600.73", "total_tokens": 42844160} {"current_steps": 5240, "total_steps": 23217, "loss": 1.0198, "learning_rate": 4.397456731209634e-05, "epoch": 0.6770900633156739, "percentage": 22.57, "elapsed_time": "4:35:23", "remaining_time": "15:44:47", "throughput": "2597.89", "total_tokens": 42926080} {"current_steps": 5250, "total_steps": 23217, "loss": 0.7051, "learning_rate": 4.395252379328115e-05, "epoch": 0.6783822199250549, "percentage": 22.61, "elapsed_time": "4:36:12", "remaining_time": "15:45:14", "throughput": "2595.21", "total_tokens": 43008000} {"current_steps": 5260, "total_steps": 23217, "loss": 0.853, "learning_rate": 4.393044557246424e-05, "epoch": 0.679674376534436, "percentage": 22.66, "elapsed_time": "4:37:00", "remaining_time": "15:45:41", "throughput": "2592.53", "total_tokens": 43089920} {"current_steps": 5270, "total_steps": 23217, "loss": 0.9311, "learning_rate": 4.3908332690070765e-05, "epoch": 0.680966533143817, "percentage": 22.7, "elapsed_time": "4:37:49", "remaining_time": "15:46:06", "throughput": "2589.92", "total_tokens": 43171840} {"current_steps": 5280, "total_steps": 23217, "loss": 1.3277, "learning_rate": 4.388618518658932e-05, "epoch": 0.682258689753198, "percentage": 22.74, "elapsed_time": "4:38:37", "remaining_time": "15:46:32", "throughput": "2587.32", "total_tokens": 43253760} {"current_steps": 5290, "total_steps": 23217, "loss": 0.8287, "learning_rate": 4.3864003102571916e-05, "epoch": 0.6835508463625791, "percentage": 22.79, "elapsed_time": "4:39:26", "remaining_time": "15:47:00", "throughput": "2584.60", "total_tokens": 43335680} {"current_steps": 5300, "total_steps": 23217, "loss": 0.6284, "learning_rate": 4.384178647863385e-05, "epoch": 0.6848430029719602, "percentage": 22.83, "elapsed_time": "4:40:15", "remaining_time": "15:47:24", "throughput": "2582.06", "total_tokens": 43417600} {"current_steps": 5310, "total_steps": 23217, "loss": 1.1245, "learning_rate": 4.381953535545369e-05, "epoch": 0.6861351595813413, "percentage": 22.87, "elapsed_time": "4:41:03", "remaining_time": "15:47:50", "throughput": "2579.46", "total_tokens": 43499520} {"current_steps": 5320, "total_steps": 23217, "loss": 0.8103, "learning_rate": 4.3797249773773165e-05, "epoch": 0.6874273161907223, "percentage": 22.91, "elapsed_time": "4:41:52", "remaining_time": "15:48:14", "throughput": "2576.93", "total_tokens": 43581440} {"current_steps": 5330, "total_steps": 23217, "loss": 0.6222, "learning_rate": 4.3774929774397086e-05, "epoch": 0.6887194728001034, "percentage": 22.96, "elapsed_time": "4:42:40", "remaining_time": "15:48:38", "throughput": "2574.38", "total_tokens": 43663360} {"current_steps": 5340, "total_steps": 23217, "loss": 1.0592, "learning_rate": 4.375257539819328e-05, "epoch": 0.6900116294094845, "percentage": 23.0, "elapsed_time": "4:43:29", "remaining_time": "15:49:04", "throughput": "2571.78", "total_tokens": 43745280} {"current_steps": 5350, "total_steps": 23217, "loss": 1.1099, "learning_rate": 4.373018668609256e-05, "epoch": 0.6913037860188654, "percentage": 23.04, "elapsed_time": "4:44:18", "remaining_time": "15:49:30", "throughput": "2569.18", "total_tokens": 43827200} {"current_steps": 5360, "total_steps": 23217, "loss": 1.0354, "learning_rate": 4.370776367908854e-05, "epoch": 0.6925959426282465, "percentage": 23.09, "elapsed_time": "4:45:07", "remaining_time": "15:49:54", "throughput": "2566.63", "total_tokens": 43909120} {"current_steps": 5370, "total_steps": 23217, "loss": 1.2438, "learning_rate": 4.368530641823769e-05, "epoch": 0.6938880992376276, "percentage": 23.13, "elapsed_time": "4:45:56", "remaining_time": "15:50:19", "throughput": "2564.09", "total_tokens": 43991040} {"current_steps": 5380, "total_steps": 23217, "loss": 0.9602, "learning_rate": 4.3662814944659156e-05, "epoch": 0.6951802558470087, "percentage": 23.17, "elapsed_time": "4:46:44", "remaining_time": "15:50:41", "throughput": "2561.64", "total_tokens": 44072960} {"current_steps": 5390, "total_steps": 23217, "loss": 0.9233, "learning_rate": 4.364028929953476e-05, "epoch": 0.6964724124563897, "percentage": 23.22, "elapsed_time": "4:47:33", "remaining_time": "15:51:06", "throughput": "2559.11", "total_tokens": 44154880} {"current_steps": 5400, "total_steps": 23217, "loss": 1.1027, "learning_rate": 4.361772952410886e-05, "epoch": 0.6977645690657708, "percentage": 23.26, "elapsed_time": "4:48:22", "remaining_time": "15:51:27", "throughput": "2556.72", "total_tokens": 44236800} {"current_steps": 5410, "total_steps": 23217, "loss": 1.0273, "learning_rate": 4.359513565968832e-05, "epoch": 0.6990567256751519, "percentage": 23.3, "elapsed_time": "4:49:10", "remaining_time": "15:51:50", "throughput": "2554.28", "total_tokens": 44318720} {"current_steps": 5420, "total_steps": 23217, "loss": 0.8502, "learning_rate": 4.357250774764245e-05, "epoch": 0.7003488822845328, "percentage": 23.34, "elapsed_time": "4:49:59", "remaining_time": "15:52:12", "throughput": "2551.85", "total_tokens": 44400640} {"current_steps": 5430, "total_steps": 23217, "loss": 0.7773, "learning_rate": 4.354984582940285e-05, "epoch": 0.7016410388939139, "percentage": 23.39, "elapsed_time": "4:50:48", "remaining_time": "15:52:34", "throughput": "2549.43", "total_tokens": 44482560} {"current_steps": 5440, "total_steps": 23217, "loss": 0.9399, "learning_rate": 4.35271499464634e-05, "epoch": 0.702933195503295, "percentage": 23.43, "elapsed_time": "4:51:37", "remaining_time": "15:52:57", "throughput": "2546.95", "total_tokens": 44564480} {"current_steps": 5450, "total_steps": 23217, "loss": 0.9732, "learning_rate": 4.350442014038021e-05, "epoch": 0.704225352112676, "percentage": 23.47, "elapsed_time": "4:52:25", "remaining_time": "15:53:16", "throughput": "2544.67", "total_tokens": 44646400} {"current_steps": 5460, "total_steps": 23217, "loss": 0.9438, "learning_rate": 4.348165645277145e-05, "epoch": 0.7055175087220571, "percentage": 23.52, "elapsed_time": "4:53:13", "remaining_time": "15:53:37", "throughput": "2542.31", "total_tokens": 44728320} {"current_steps": 5470, "total_steps": 23217, "loss": 1.3828, "learning_rate": 4.345885892531735e-05, "epoch": 0.7068096653314382, "percentage": 23.56, "elapsed_time": "4:54:03", "remaining_time": "15:54:02", "throughput": "2539.80", "total_tokens": 44810240} {"current_steps": 5480, "total_steps": 23217, "loss": 1.1361, "learning_rate": 4.343602759976011e-05, "epoch": 0.7081018219408193, "percentage": 23.6, "elapsed_time": "4:54:51", "remaining_time": "15:54:22", "throughput": "2537.47", "total_tokens": 44892160} {"current_steps": 5490, "total_steps": 23217, "loss": 0.9972, "learning_rate": 4.34131625179038e-05, "epoch": 0.7093939785502003, "percentage": 23.65, "elapsed_time": "4:55:40", "remaining_time": "15:54:44", "throughput": "2535.04", "total_tokens": 44974080} {"current_steps": 5500, "total_steps": 23217, "loss": 1.1289, "learning_rate": 4.3390263721614286e-05, "epoch": 0.7106861351595813, "percentage": 23.69, "elapsed_time": "4:56:31", "remaining_time": "15:55:09", "throughput": "2532.51", "total_tokens": 45056000} {"current_steps": 5510, "total_steps": 23217, "loss": 0.699, "learning_rate": 4.33673312528192e-05, "epoch": 0.7119782917689624, "percentage": 23.73, "elapsed_time": "4:57:20", "remaining_time": "15:55:31", "throughput": "2530.13", "total_tokens": 45137920} {"current_steps": 5520, "total_steps": 23217, "loss": 1.1252, "learning_rate": 4.334436515350779e-05, "epoch": 0.7132704483783434, "percentage": 23.78, "elapsed_time": "4:58:08", "remaining_time": "15:55:50", "throughput": "2527.85", "total_tokens": 45219840} {"current_steps": 5530, "total_steps": 23217, "loss": 1.0118, "learning_rate": 4.332136546573092e-05, "epoch": 0.7145626049877245, "percentage": 23.82, "elapsed_time": "4:58:57", "remaining_time": "15:56:09", "throughput": "2525.60", "total_tokens": 45301760} {"current_steps": 5540, "total_steps": 23217, "loss": 0.8958, "learning_rate": 4.3298332231600925e-05, "epoch": 0.7158547615971056, "percentage": 23.86, "elapsed_time": "4:59:46", "remaining_time": "15:56:32", "throughput": "2523.16", "total_tokens": 45383680} {"current_steps": 5550, "total_steps": 23217, "loss": 0.7937, "learning_rate": 4.327526549329157e-05, "epoch": 0.7171469182064866, "percentage": 23.9, "elapsed_time": "5:00:35", "remaining_time": "15:56:51", "throughput": "2520.89", "total_tokens": 45465600} {"current_steps": 5560, "total_steps": 23217, "loss": 0.7012, "learning_rate": 4.325216529303798e-05, "epoch": 0.7184390748158677, "percentage": 23.95, "elapsed_time": "5:01:22", "remaining_time": "15:57:05", "throughput": "2518.84", "total_tokens": 45547520} {"current_steps": 5570, "total_steps": 23217, "loss": 0.7965, "learning_rate": 4.3229031673136514e-05, "epoch": 0.7197312314252488, "percentage": 23.99, "elapsed_time": "5:02:10", "remaining_time": "15:57:20", "throughput": "2516.77", "total_tokens": 45629440} {"current_steps": 5580, "total_steps": 23217, "loss": 0.9927, "learning_rate": 4.320586467594476e-05, "epoch": 0.7210233880346298, "percentage": 24.03, "elapsed_time": "5:02:58", "remaining_time": "15:57:37", "throughput": "2514.59", "total_tokens": 45711360} {"current_steps": 5590, "total_steps": 23217, "loss": 0.8541, "learning_rate": 4.3182664343881415e-05, "epoch": 0.7223155446440108, "percentage": 24.08, "elapsed_time": "5:03:46", "remaining_time": "15:57:54", "throughput": "2512.43", "total_tokens": 45793280} {"current_steps": 5600, "total_steps": 23217, "loss": 0.989, "learning_rate": 4.315943071942619e-05, "epoch": 0.7236077012533919, "percentage": 24.12, "elapsed_time": "5:04:34", "remaining_time": "15:58:09", "throughput": "2510.33", "total_tokens": 45875200} {"current_steps": 5610, "total_steps": 23217, "loss": 1.0818, "learning_rate": 4.313616384511976e-05, "epoch": 0.724899857862773, "percentage": 24.16, "elapsed_time": "5:05:23", "remaining_time": "15:58:28", "throughput": "2508.10", "total_tokens": 45957120} {"current_steps": 5620, "total_steps": 23217, "loss": 1.0183, "learning_rate": 4.3112863763563695e-05, "epoch": 0.726192014472154, "percentage": 24.21, "elapsed_time": "5:06:12", "remaining_time": "15:58:46", "throughput": "2505.88", "total_tokens": 46039040} {"current_steps": 5630, "total_steps": 23217, "loss": 1.1861, "learning_rate": 4.308953051742036e-05, "epoch": 0.7274841710815351, "percentage": 24.25, "elapsed_time": "5:07:01", "remaining_time": "15:59:05", "throughput": "2503.62", "total_tokens": 46120960} {"current_steps": 5640, "total_steps": 23217, "loss": 0.8941, "learning_rate": 4.3066164149412844e-05, "epoch": 0.7287763276909162, "percentage": 24.29, "elapsed_time": "5:07:50", "remaining_time": "15:59:24", "throughput": "2501.38", "total_tokens": 46202880} {"current_steps": 5650, "total_steps": 23217, "loss": 0.8618, "learning_rate": 4.304276470232488e-05, "epoch": 0.7300684843002972, "percentage": 24.34, "elapsed_time": "5:08:38", "remaining_time": "15:59:37", "throughput": "2499.38", "total_tokens": 46284800} {"current_steps": 5660, "total_steps": 23217, "loss": 0.8772, "learning_rate": 4.3019332219000766e-05, "epoch": 0.7313606409096782, "percentage": 24.38, "elapsed_time": "5:09:25", "remaining_time": "15:59:50", "throughput": "2497.41", "total_tokens": 46366720} {"current_steps": 5670, "total_steps": 23217, "loss": 1.0889, "learning_rate": 4.299586674234529e-05, "epoch": 0.7326527975190593, "percentage": 24.42, "elapsed_time": "5:10:13", "remaining_time": "16:00:02", "throughput": "2495.45", "total_tokens": 46448640} {"current_steps": 5680, "total_steps": 23217, "loss": 0.7212, "learning_rate": 4.2972368315323676e-05, "epoch": 0.7339449541284404, "percentage": 24.46, "elapsed_time": "5:11:00", "remaining_time": "16:00:15", "throughput": "2493.49", "total_tokens": 46530560} {"current_steps": 5690, "total_steps": 23217, "loss": 0.8605, "learning_rate": 4.294883698096143e-05, "epoch": 0.7352371107378214, "percentage": 24.51, "elapsed_time": "5:11:48", "remaining_time": "16:00:27", "throughput": "2491.54", "total_tokens": 46612480} {"current_steps": 5700, "total_steps": 23217, "loss": 0.9687, "learning_rate": 4.292527278234435e-05, "epoch": 0.7365292673472025, "percentage": 24.55, "elapsed_time": "5:12:36", "remaining_time": "16:00:40", "throughput": "2489.56", "total_tokens": 46694400} {"current_steps": 5710, "total_steps": 23217, "loss": 0.5747, "learning_rate": 4.290167576261841e-05, "epoch": 0.7378214239565836, "percentage": 24.59, "elapsed_time": "5:13:24", "remaining_time": "16:00:54", "throughput": "2487.51", "total_tokens": 46776320} {"current_steps": 5720, "total_steps": 23217, "loss": 0.7948, "learning_rate": 4.2878045964989646e-05, "epoch": 0.7391135805659645, "percentage": 24.64, "elapsed_time": "5:14:13", "remaining_time": "16:01:12", "throughput": "2485.35", "total_tokens": 46858240} {"current_steps": 5730, "total_steps": 23217, "loss": 1.0718, "learning_rate": 4.285438343272414e-05, "epoch": 0.7404057371753456, "percentage": 24.68, "elapsed_time": "5:15:02", "remaining_time": "16:01:28", "throughput": "2483.22", "total_tokens": 46940160} {"current_steps": 5740, "total_steps": 23217, "loss": 0.9519, "learning_rate": 4.283068820914791e-05, "epoch": 0.7416978937847267, "percentage": 24.72, "elapsed_time": "5:15:52", "remaining_time": "16:01:45", "throughput": "2481.06", "total_tokens": 47022080} {"current_steps": 5750, "total_steps": 23217, "loss": 1.015, "learning_rate": 4.2806960337646804e-05, "epoch": 0.7429900503941078, "percentage": 24.77, "elapsed_time": "5:16:41", "remaining_time": "16:02:01", "throughput": "2478.95", "total_tokens": 47104000} {"current_steps": 5760, "total_steps": 23217, "loss": 0.8983, "learning_rate": 4.278319986166649e-05, "epoch": 0.7442822070034888, "percentage": 24.81, "elapsed_time": "5:17:30", "remaining_time": "16:02:15", "throughput": "2476.94", "total_tokens": 47185920} {"current_steps": 5770, "total_steps": 23217, "loss": 0.8726, "learning_rate": 4.27594068247123e-05, "epoch": 0.7455743636128699, "percentage": 24.85, "elapsed_time": "5:18:19", "remaining_time": "16:02:30", "throughput": "2474.88", "total_tokens": 47267840} {"current_steps": 5780, "total_steps": 23217, "loss": 0.7588, "learning_rate": 4.27355812703492e-05, "epoch": 0.746866520222251, "percentage": 24.9, "elapsed_time": "5:19:08", "remaining_time": "16:02:46", "throughput": "2472.77", "total_tokens": 47349760} {"current_steps": 5790, "total_steps": 23217, "loss": 1.1223, "learning_rate": 4.2711723242201695e-05, "epoch": 0.748158676831632, "percentage": 24.94, "elapsed_time": "5:19:57", "remaining_time": "16:03:01", "throughput": "2470.73", "total_tokens": 47431680} {"current_steps": 5800, "total_steps": 23217, "loss": 0.7947, "learning_rate": 4.268783278395374e-05, "epoch": 0.749450833441013, "percentage": 24.98, "elapsed_time": "5:20:46", "remaining_time": "16:03:16", "throughput": "2468.66", "total_tokens": 47513600} {"current_steps": 5810, "total_steps": 23217, "loss": 0.9494, "learning_rate": 4.2663909939348684e-05, "epoch": 0.7507429900503941, "percentage": 25.02, "elapsed_time": "5:21:37", "remaining_time": "16:03:35", "throughput": "2466.45", "total_tokens": 47595520} {"current_steps": 5820, "total_steps": 23217, "loss": 0.7431, "learning_rate": 4.263995475218917e-05, "epoch": 0.7520351466597751, "percentage": 25.07, "elapsed_time": "5:22:27", "remaining_time": "16:03:52", "throughput": "2464.29", "total_tokens": 47677440} {"current_steps": 5830, "total_steps": 23217, "loss": 0.8616, "learning_rate": 4.2615967266337045e-05, "epoch": 0.7533273032691562, "percentage": 25.11, "elapsed_time": "5:23:20", "remaining_time": "16:04:20", "throughput": "2461.71", "total_tokens": 47759360} {"current_steps": 5840, "total_steps": 23217, "loss": 1.1937, "learning_rate": 4.2591947525713326e-05, "epoch": 0.7546194598785373, "percentage": 25.15, "elapsed_time": "5:24:13", "remaining_time": "16:04:44", "throughput": "2459.27", "total_tokens": 47841280} {"current_steps": 5850, "total_steps": 23217, "loss": 0.8848, "learning_rate": 4.256789557429806e-05, "epoch": 0.7559116164879184, "percentage": 25.2, "elapsed_time": "5:25:03", "remaining_time": "16:05:01", "throughput": "2457.10", "total_tokens": 47923200} {"current_steps": 5860, "total_steps": 23217, "loss": 0.9741, "learning_rate": 4.254381145613027e-05, "epoch": 0.7572037730972994, "percentage": 25.24, "elapsed_time": "5:25:54", "remaining_time": "16:05:18", "throughput": "2454.98", "total_tokens": 48005120} {"current_steps": 5870, "total_steps": 23217, "loss": 1.1395, "learning_rate": 4.251969521530791e-05, "epoch": 0.7584959297066804, "percentage": 25.28, "elapsed_time": "5:26:44", "remaining_time": "16:05:35", "throughput": "2452.84", "total_tokens": 48087040} {"current_steps": 5880, "total_steps": 23217, "loss": 1.074, "learning_rate": 4.2495546895987724e-05, "epoch": 0.7597880863160615, "percentage": 25.33, "elapsed_time": "5:27:35", "remaining_time": "16:05:53", "throughput": "2450.68", "total_tokens": 48168960} {"current_steps": 5890, "total_steps": 23217, "loss": 0.9192, "learning_rate": 4.2471366542385196e-05, "epoch": 0.7610802429254425, "percentage": 25.37, "elapsed_time": "5:28:23", "remaining_time": "16:06:04", "throughput": "2448.79", "total_tokens": 48250880} {"current_steps": 5900, "total_steps": 23217, "loss": 0.999, "learning_rate": 4.2447154198774445e-05, "epoch": 0.7623723995348236, "percentage": 25.41, "elapsed_time": "5:29:11", "remaining_time": "16:06:12", "throughput": "2447.04", "total_tokens": 48332800} {"current_steps": 5910, "total_steps": 23217, "loss": 1.0004, "learning_rate": 4.242290990948821e-05, "epoch": 0.7636645561442047, "percentage": 25.46, "elapsed_time": "5:29:59", "remaining_time": "16:06:20", "throughput": "2445.29", "total_tokens": 48414720} {"current_steps": 5920, "total_steps": 23217, "loss": 0.8302, "learning_rate": 4.2398633718917684e-05, "epoch": 0.7649567127535858, "percentage": 25.5, "elapsed_time": "5:30:46", "remaining_time": "16:06:28", "throughput": "2443.55", "total_tokens": 48496640} {"current_steps": 5930, "total_steps": 23217, "loss": 1.2325, "learning_rate": 4.237432567151248e-05, "epoch": 0.7662488693629668, "percentage": 25.54, "elapsed_time": "5:31:34", "remaining_time": "16:06:35", "throughput": "2441.82", "total_tokens": 48578560} {"current_steps": 5940, "total_steps": 23217, "loss": 0.636, "learning_rate": 4.234998581178056e-05, "epoch": 0.7675410259723479, "percentage": 25.58, "elapsed_time": "5:32:22", "remaining_time": "16:06:43", "throughput": "2440.08", "total_tokens": 48660480} {"current_steps": 5950, "total_steps": 23217, "loss": 0.633, "learning_rate": 4.2325614184288096e-05, "epoch": 0.768833182581729, "percentage": 25.63, "elapsed_time": "5:33:09", "remaining_time": "16:06:50", "throughput": "2438.37", "total_tokens": 48742400} {"current_steps": 5960, "total_steps": 23217, "loss": 0.8583, "learning_rate": 4.2301210833659464e-05, "epoch": 0.7701253391911099, "percentage": 25.67, "elapsed_time": "5:33:57", "remaining_time": "16:06:57", "throughput": "2436.66", "total_tokens": 48824320} {"current_steps": 5970, "total_steps": 23217, "loss": 0.9888, "learning_rate": 4.227677580457711e-05, "epoch": 0.771417495800491, "percentage": 25.71, "elapsed_time": "5:34:44", "remaining_time": "16:07:04", "throughput": "2434.97", "total_tokens": 48906240} {"current_steps": 5980, "total_steps": 23217, "loss": 1.0736, "learning_rate": 4.2252309141781464e-05, "epoch": 0.7727096524098721, "percentage": 25.76, "elapsed_time": "5:35:32", "remaining_time": "16:07:11", "throughput": "2433.28", "total_tokens": 48988160} {"current_steps": 5990, "total_steps": 23217, "loss": 0.995, "learning_rate": 4.222781089007092e-05, "epoch": 0.7740018090192531, "percentage": 25.8, "elapsed_time": "5:36:20", "remaining_time": "16:07:18", "throughput": "2431.53", "total_tokens": 49070080} {"current_steps": 6000, "total_steps": 23217, "loss": 0.8812, "learning_rate": 4.220328109430167e-05, "epoch": 0.7752939656286342, "percentage": 25.84, "elapsed_time": "5:37:08", "remaining_time": "16:07:25", "throughput": "2429.86", "total_tokens": 49152000} {"current_steps": 6010, "total_steps": 23217, "loss": 1.3251, "learning_rate": 4.217871979938769e-05, "epoch": 0.7765861222380153, "percentage": 25.89, "elapsed_time": "5:38:05", "remaining_time": "16:07:59", "throughput": "2427.00", "total_tokens": 49233920} {"current_steps": 6020, "total_steps": 23217, "loss": 0.9141, "learning_rate": 4.215412705030063e-05, "epoch": 0.7778782788473964, "percentage": 25.93, "elapsed_time": "5:38:53", "remaining_time": "16:08:05", "throughput": "2425.35", "total_tokens": 49315840} {"current_steps": 6010, "total_steps": 23217, "loss": 1.3075, "learning_rate": 4.217871979938769e-05, "epoch": 0.7765861222380153, "percentage": 25.89, "elapsed_time": "0:00:56", "remaining_time": "0:02:42", "throughput": "867448.22", "total_tokens": 49233920} {"current_steps": 6020, "total_steps": 23217, "loss": 0.8665, "learning_rate": 4.215412705030063e-05, "epoch": 0.7778782788473964, "percentage": 25.93, "elapsed_time": "0:01:44", "remaining_time": "0:04:58", "throughput": "472521.70", "total_tokens": 49315840} {"current_steps": 6030, "total_steps": 23217, "loss": 0.852, "learning_rate": 4.21295028920697e-05, "epoch": 0.7791704354567773, "percentage": 25.97, "elapsed_time": "0:02:31", "remaining_time": "0:07:13", "throughput": "324986.38", "total_tokens": 49397760} {"current_steps": 6040, "total_steps": 23217, "loss": 0.9422, "learning_rate": 4.210484736978166e-05, "epoch": 0.7804625920661584, "percentage": 26.02, "elapsed_time": "0:03:19", "remaining_time": "0:09:28", "throughput": "247621.66", "total_tokens": 49479680} {"current_steps": 6050, "total_steps": 23217, "loss": 0.8523, "learning_rate": 4.208016052858067e-05, "epoch": 0.7817547486755395, "percentage": 26.06, "elapsed_time": "0:04:07", "remaining_time": "0:11:42", "throughput": "200296.03", "total_tokens": 49561600} {"current_steps": 6060, "total_steps": 23217, "loss": 0.7916, "learning_rate": 4.2055442413668264e-05, "epoch": 0.7830469052849205, "percentage": 26.1, "elapsed_time": "0:04:55", "remaining_time": "0:13:55", "throughput": "168249.32", "total_tokens": 49643520} {"current_steps": 6070, "total_steps": 23217, "loss": 1.1109, "learning_rate": 4.2030693070303204e-05, "epoch": 0.7843390618943016, "percentage": 26.14, "elapsed_time": "0:05:42", "remaining_time": "0:16:08", "throughput": "145101.69", "total_tokens": 49725440} {"current_steps": 6080, "total_steps": 23217, "loss": 0.7227, "learning_rate": 4.2005912543801444e-05, "epoch": 0.7856312185036827, "percentage": 26.19, "elapsed_time": "0:06:30", "remaining_time": "0:18:20", "throughput": "127610.12", "total_tokens": 49807360} {"current_steps": 6090, "total_steps": 23217, "loss": 0.7407, "learning_rate": 4.198110087953606e-05, "epoch": 0.7869233751130637, "percentage": 26.23, "elapsed_time": "0:07:17", "remaining_time": "0:20:31", "throughput": "113923.28", "total_tokens": 49889280} {"current_steps": 6100, "total_steps": 23217, "loss": 1.4336, "learning_rate": 4.195625812293709e-05, "epoch": 0.7882155317224447, "percentage": 26.27, "elapsed_time": "0:08:05", "remaining_time": "0:22:42", "throughput": "102941.09", "total_tokens": 49971200} {"current_steps": 6110, "total_steps": 23217, "loss": 0.9719, "learning_rate": 4.193138431949155e-05, "epoch": 0.7895076883318258, "percentage": 26.32, "elapsed_time": "0:08:52", "remaining_time": "0:24:50", "throughput": "94021.78", "total_tokens": 50053120} {"current_steps": 6120, "total_steps": 23217, "loss": 1.0592, "learning_rate": 4.190647951474328e-05, "epoch": 0.7907998449412069, "percentage": 26.36, "elapsed_time": "0:09:39", "remaining_time": "0:26:58", "throughput": "86545.26", "total_tokens": 50135040} {"current_steps": 6130, "total_steps": 23217, "loss": 0.8778, "learning_rate": 4.188154375429288e-05, "epoch": 0.7920920015505879, "percentage": 26.4, "elapsed_time": "0:10:26", "remaining_time": "0:29:05", "throughput": "80190.82", "total_tokens": 50216960} {"current_steps": 6140, "total_steps": 23217, "loss": 1.329, "learning_rate": 4.1856577083797646e-05, "epoch": 0.793384158159969, "percentage": 26.45, "elapsed_time": "0:11:13", "remaining_time": "0:31:12", "throughput": "74721.93", "total_tokens": 50298880} {"current_steps": 6150, "total_steps": 23217, "loss": 1.2239, "learning_rate": 4.183157954897144e-05, "epoch": 0.7946763147693501, "percentage": 26.49, "elapsed_time": "0:12:00", "remaining_time": "0:33:18", "throughput": "69944.37", "total_tokens": 50380800} {"current_steps": 6160, "total_steps": 23217, "loss": 1.0103, "learning_rate": 4.1806551195584685e-05, "epoch": 0.7959684713787311, "percentage": 26.53, "elapsed_time": "0:12:47", "remaining_time": "0:35:24", "throughput": "65774.80", "total_tokens": 50462720} {"current_steps": 6170, "total_steps": 23217, "loss": 0.8958, "learning_rate": 4.178149206946419e-05, "epoch": 0.7972606279881121, "percentage": 26.58, "elapsed_time": "0:13:34", "remaining_time": "0:37:29", "throughput": "62082.60", "total_tokens": 50544640} {"current_steps": 6180, "total_steps": 23217, "loss": 1.0327, "learning_rate": 4.1756402216493115e-05, "epoch": 0.7985527845974932, "percentage": 26.62, "elapsed_time": "0:14:21", "remaining_time": "0:39:33", "throughput": "58793.79", "total_tokens": 50626560} {"current_steps": 6190, "total_steps": 23217, "loss": 0.9924, "learning_rate": 4.17312816826109e-05, "epoch": 0.7998449412068743, "percentage": 26.66, "elapsed_time": "0:15:08", "remaining_time": "0:41:37", "throughput": "55841.94", "total_tokens": 50708480} {"current_steps": 6200, "total_steps": 23217, "loss": 0.7853, "learning_rate": 4.1706130513813146e-05, "epoch": 0.8011370978162553, "percentage": 26.7, "elapsed_time": "0:15:54", "remaining_time": "0:43:41", "throughput": "53183.97", "total_tokens": 50790400} {"current_steps": 6210, "total_steps": 23217, "loss": 0.9263, "learning_rate": 4.1680948756151564e-05, "epoch": 0.8024292544256364, "percentage": 26.75, "elapsed_time": "0:16:41", "remaining_time": "0:45:43", "throughput": "50774.85", "total_tokens": 50872320} {"current_steps": 6220, "total_steps": 23217, "loss": 0.9224, "learning_rate": 4.165573645573384e-05, "epoch": 0.8037214110350175, "percentage": 26.79, "elapsed_time": "0:17:28", "remaining_time": "0:47:46", "throughput": "48580.28", "total_tokens": 50954240} {"current_steps": 6230, "total_steps": 23217, "loss": 1.2382, "learning_rate": 4.1630493658723606e-05, "epoch": 0.8050135676443985, "percentage": 26.83, "elapsed_time": "0:18:15", "remaining_time": "0:49:47", "throughput": "46574.43", "total_tokens": 51036160} {"current_steps": 6240, "total_steps": 23217, "loss": 1.0701, "learning_rate": 4.160522041134035e-05, "epoch": 0.8063057242537796, "percentage": 26.88, "elapsed_time": "0:19:02", "remaining_time": "0:51:48", "throughput": "44734.31", "total_tokens": 51118080} {"current_steps": 6250, "total_steps": 23217, "loss": 0.9246, "learning_rate": 4.1579916759859286e-05, "epoch": 0.8075978808631606, "percentage": 26.92, "elapsed_time": "0:19:49", "remaining_time": "0:53:49", "throughput": "43038.70", "total_tokens": 51200000} {"current_steps": 6260, "total_steps": 23217, "loss": 1.1799, "learning_rate": 4.155458275061129e-05, "epoch": 0.8088900374725416, "percentage": 26.96, "elapsed_time": "0:20:36", "remaining_time": "0:55:50", "throughput": "41464.45", "total_tokens": 51281920} {"current_steps": 6270, "total_steps": 23217, "loss": 1.2025, "learning_rate": 4.152921842998287e-05, "epoch": 0.8101821940819227, "percentage": 27.01, "elapsed_time": "0:21:23", "remaining_time": "0:57:49", "throughput": "40012.57", "total_tokens": 51363840} {"current_steps": 6280, "total_steps": 23217, "loss": 0.7594, "learning_rate": 4.150382384441598e-05, "epoch": 0.8114743506913038, "percentage": 27.05, "elapsed_time": "0:22:10", "remaining_time": "0:59:48", "throughput": "38663.30", "total_tokens": 51445760} {"current_steps": 6290, "total_steps": 23217, "loss": 0.8714, "learning_rate": 4.147839904040803e-05, "epoch": 0.8127665073006849, "percentage": 27.09, "elapsed_time": "0:22:57", "remaining_time": "1:01:47", "throughput": "37405.95", "total_tokens": 51527680} {"current_steps": 6300, "total_steps": 23217, "loss": 1.2455, "learning_rate": 4.145294406451173e-05, "epoch": 0.8140586639100659, "percentage": 27.14, "elapsed_time": "0:23:44", "remaining_time": "1:03:45", "throughput": "36230.83", "total_tokens": 51609600} {"current_steps": 6310, "total_steps": 23217, "loss": 1.1417, "learning_rate": 4.142745896333505e-05, "epoch": 0.815350820519447, "percentage": 27.18, "elapsed_time": "0:24:31", "remaining_time": "1:05:42", "throughput": "35131.20", "total_tokens": 51691520} {"current_steps": 6320, "total_steps": 23217, "loss": 1.1736, "learning_rate": 4.140194378354113e-05, "epoch": 0.816642977128828, "percentage": 27.22, "elapsed_time": "0:25:18", "remaining_time": "1:07:39", "throughput": "34099.36", "total_tokens": 51773440} {"current_steps": 6330, "total_steps": 23217, "loss": 0.8252, "learning_rate": 4.137639857184815e-05, "epoch": 0.817935133738209, "percentage": 27.26, "elapsed_time": "0:26:05", "remaining_time": "1:09:35", "throughput": "33129.67", "total_tokens": 51855360} {"current_steps": 6340, "total_steps": 23217, "loss": 1.2724, "learning_rate": 4.1350823375029326e-05, "epoch": 0.8192272903475901, "percentage": 27.31, "elapsed_time": "0:26:52", "remaining_time": "1:11:31", "throughput": "32216.50", "total_tokens": 51937280} {"current_steps": 6350, "total_steps": 23217, "loss": 0.6208, "learning_rate": 4.132521823991272e-05, "epoch": 0.8205194469569712, "percentage": 27.35, "elapsed_time": "0:27:39", "remaining_time": "1:13:26", "throughput": "31354.63", "total_tokens": 52019200} {"current_steps": 6360, "total_steps": 23217, "loss": 0.8883, "learning_rate": 4.129958321338127e-05, "epoch": 0.8218116035663522, "percentage": 27.39, "elapsed_time": "0:28:25", "remaining_time": "1:15:21", "throughput": "30540.07", "total_tokens": 52101120} {"current_steps": 6370, "total_steps": 23217, "loss": 0.7734, "learning_rate": 4.127391834237258e-05, "epoch": 0.8231037601757333, "percentage": 27.44, "elapsed_time": "0:29:12", "remaining_time": "1:17:15", "throughput": "29769.65", "total_tokens": 52183040} {"current_steps": 6380, "total_steps": 23217, "loss": 0.8842, "learning_rate": 4.124822367387897e-05, "epoch": 0.8243959167851144, "percentage": 27.48, "elapsed_time": "0:29:59", "remaining_time": "1:19:09", "throughput": "29038.97", "total_tokens": 52264960} {"current_steps": 6390, "total_steps": 23217, "loss": 0.8806, "learning_rate": 4.122249925494726e-05, "epoch": 0.8256880733944955, "percentage": 27.52, "elapsed_time": "0:30:46", "remaining_time": "1:21:03", "throughput": "28345.91", "total_tokens": 52346880} {"current_steps": 6400, "total_steps": 23217, "loss": 0.9348, "learning_rate": 4.119674513267878e-05, "epoch": 0.8269802300038764, "percentage": 27.57, "elapsed_time": "0:31:33", "remaining_time": "1:22:55", "throughput": "27686.84", "total_tokens": 52428800} {"current_steps": 6410, "total_steps": 23217, "loss": 0.7648, "learning_rate": 4.117096135422923e-05, "epoch": 0.8282723866132575, "percentage": 27.61, "elapsed_time": "0:32:20", "remaining_time": "1:24:48", "throughput": "27059.49", "total_tokens": 52510720} {"current_steps": 6420, "total_steps": 23217, "loss": 0.6926, "learning_rate": 4.114514796680862e-05, "epoch": 0.8295645432226386, "percentage": 27.65, "elapsed_time": "0:33:07", "remaining_time": "1:26:39", "throughput": "26461.98", "total_tokens": 52592640} {"current_steps": 6430, "total_steps": 23217, "loss": 1.0296, "learning_rate": 4.111930501768116e-05, "epoch": 0.8308566998320196, "percentage": 27.7, "elapsed_time": "0:33:54", "remaining_time": "1:28:31", "throughput": "25891.93", "total_tokens": 52674560} {"current_steps": 6440, "total_steps": 23217, "loss": 0.9102, "learning_rate": 4.1093432554165196e-05, "epoch": 0.8321488564414007, "percentage": 27.74, "elapsed_time": "0:34:41", "remaining_time": "1:30:22", "throughput": "25347.33", "total_tokens": 52756480} {"current_steps": 6450, "total_steps": 23217, "loss": 0.8159, "learning_rate": 4.106753062363311e-05, "epoch": 0.8334410130507818, "percentage": 27.78, "elapsed_time": "0:35:28", "remaining_time": "1:32:12", "throughput": "24827.07", "total_tokens": 52838400} {"current_steps": 6460, "total_steps": 23217, "loss": 1.1631, "learning_rate": 4.104159927351125e-05, "epoch": 0.8347331696601629, "percentage": 27.82, "elapsed_time": "0:36:15", "remaining_time": "1:34:02", "throughput": "24328.94", "total_tokens": 52920320} {"current_steps": 6470, "total_steps": 23217, "loss": 0.8534, "learning_rate": 4.1015638551279825e-05, "epoch": 0.8360253262695438, "percentage": 27.87, "elapsed_time": "0:37:02", "remaining_time": "1:35:51", "throughput": "23851.99", "total_tokens": 53002240} {"current_steps": 6480, "total_steps": 23217, "loss": 1.0583, "learning_rate": 4.098964850447281e-05, "epoch": 0.8373174828789249, "percentage": 27.91, "elapsed_time": "0:37:49", "remaining_time": "1:37:40", "throughput": "23394.54", "total_tokens": 53084160} {"current_steps": 6490, "total_steps": 23217, "loss": 0.8959, "learning_rate": 4.0963629180677896e-05, "epoch": 0.838609639488306, "percentage": 27.95, "elapsed_time": "0:38:36", "remaining_time": "1:39:29", "throughput": "22955.93", "total_tokens": 53166080} {"current_steps": 6500, "total_steps": 23217, "loss": 1.1624, "learning_rate": 4.093758062753638e-05, "epoch": 0.839901796097687, "percentage": 28.0, "elapsed_time": "0:39:23", "remaining_time": "1:41:17", "throughput": "22531.41", "total_tokens": 53248000} {"current_steps": 6510, "total_steps": 23217, "loss": 1.2004, "learning_rate": 4.0911502892743035e-05, "epoch": 0.8411939527070681, "percentage": 28.04, "elapsed_time": "0:40:14", "remaining_time": "1:43:15", "throughput": "22089.92", "total_tokens": 53329920} {"current_steps": 6520, "total_steps": 23217, "loss": 1.2094, "learning_rate": 4.088539602404613e-05, "epoch": 0.8424861093164492, "percentage": 28.08, "elapsed_time": "0:41:03", "remaining_time": "1:45:08", "throughput": "21683.67", "total_tokens": 53411840} {"current_steps": 6530, "total_steps": 23217, "loss": 1.0853, "learning_rate": 4.085926006924723e-05, "epoch": 0.8437782659258302, "percentage": 28.13, "elapsed_time": "0:41:50", "remaining_time": "1:46:56", "throughput": "21303.98", "total_tokens": 53493760} {"current_steps": 6540, "total_steps": 23217, "loss": 0.8684, "learning_rate": 4.083309507620118e-05, "epoch": 0.8450704225352113, "percentage": 28.17, "elapsed_time": "0:42:38", "remaining_time": "1:48:44", "throughput": "20938.31", "total_tokens": 53575680} {"current_steps": 6550, "total_steps": 23217, "loss": 1.1792, "learning_rate": 4.080690109281597e-05, "epoch": 0.8463625791445923, "percentage": 28.21, "elapsed_time": "0:43:27", "remaining_time": "1:50:34", "throughput": "20579.23", "total_tokens": 53657600} {"current_steps": 6560, "total_steps": 23217, "loss": 0.8527, "learning_rate": 4.078067816705272e-05, "epoch": 0.8476547357539734, "percentage": 28.26, "elapsed_time": "0:44:17", "remaining_time": "1:52:28", "throughput": "20219.21", "total_tokens": 53739520} {"current_steps": 6570, "total_steps": 23217, "loss": 0.9558, "learning_rate": 4.075442634692548e-05, "epoch": 0.8489468923633544, "percentage": 28.3, "elapsed_time": "0:45:06", "remaining_time": "1:54:17", "throughput": "19886.69", "total_tokens": 53821440} {"current_steps": 6580, "total_steps": 23217, "loss": 1.0556, "learning_rate": 4.072814568050125e-05, "epoch": 0.8502390489727355, "percentage": 28.34, "elapsed_time": "0:45:54", "remaining_time": "1:56:04", "throughput": "19567.93", "total_tokens": 53903360} {"current_steps": 6590, "total_steps": 23217, "loss": 0.9564, "learning_rate": 4.070183621589983e-05, "epoch": 0.8515312055821166, "percentage": 28.38, "elapsed_time": "0:46:42", "remaining_time": "1:57:50", "throughput": "19264.67", "total_tokens": 53985280} {"current_steps": 6600, "total_steps": 23217, "loss": 1.2202, "learning_rate": 4.067549800129375e-05, "epoch": 0.8528233621914976, "percentage": 28.43, "elapsed_time": "0:47:29", "remaining_time": "1:59:34", "throughput": "18973.70", "total_tokens": 54067200} {"current_steps": 6610, "total_steps": 23217, "loss": 0.9542, "learning_rate": 4.06491310849082e-05, "epoch": 0.8541155188008787, "percentage": 28.47, "elapsed_time": "0:48:16", "remaining_time": "2:01:17", "throughput": "18694.22", "total_tokens": 54149120} {"current_steps": 6620, "total_steps": 23217, "loss": 1.0358, "learning_rate": 4.0622735515020896e-05, "epoch": 0.8554076754102597, "percentage": 28.51, "elapsed_time": "0:49:03", "remaining_time": "2:02:59", "throughput": "18423.19", "total_tokens": 54231040} {"current_steps": 6630, "total_steps": 23217, "loss": 1.2331, "learning_rate": 4.059631133996203e-05, "epoch": 0.8566998320196407, "percentage": 28.56, "elapsed_time": "0:49:50", "remaining_time": "2:04:42", "throughput": "18160.95", "total_tokens": 54312960} {"current_steps": 6640, "total_steps": 23217, "loss": 0.9423, "learning_rate": 4.0569858608114177e-05, "epoch": 0.8579919886290218, "percentage": 28.6, "elapsed_time": "0:50:37", "remaining_time": "2:06:23", "throughput": "17907.14", "total_tokens": 54394880} {"current_steps": 6650, "total_steps": 23217, "loss": 1.1609, "learning_rate": 4.054337736791218e-05, "epoch": 0.8592841452384029, "percentage": 28.64, "elapsed_time": "0:51:24", "remaining_time": "2:08:04", "throughput": "17661.16", "total_tokens": 54476800} {"current_steps": 6660, "total_steps": 23217, "loss": 0.9658, "learning_rate": 4.05168676678431e-05, "epoch": 0.860576301847784, "percentage": 28.69, "elapsed_time": "0:52:11", "remaining_time": "2:09:45", "throughput": "17421.56", "total_tokens": 54558720} {"current_steps": 6670, "total_steps": 23217, "loss": 0.7992, "learning_rate": 4.04903295564461e-05, "epoch": 0.861868458457165, "percentage": 28.73, "elapsed_time": "0:52:59", "remaining_time": "2:11:28", "throughput": "17183.18", "total_tokens": 54640640} {"current_steps": 6680, "total_steps": 23217, "loss": 0.9918, "learning_rate": 4.046376308231237e-05, "epoch": 0.8631606150665461, "percentage": 28.77, "elapsed_time": "0:53:47", "remaining_time": "2:13:09", "throughput": "16955.46", "total_tokens": 54722560} {"current_steps": 6690, "total_steps": 23217, "loss": 0.9523, "learning_rate": 4.0437168294085013e-05, "epoch": 0.8644527716759272, "percentage": 28.82, "elapsed_time": "0:54:34", "remaining_time": "2:14:49", "throughput": "16737.08", "total_tokens": 54804480} {"current_steps": 6700, "total_steps": 23217, "loss": 1.1628, "learning_rate": 4.0410545240459005e-05, "epoch": 0.8657449282853081, "percentage": 28.86, "elapsed_time": "0:55:21", "remaining_time": "2:16:28", "throughput": "16524.81", "total_tokens": 54886400} {"current_steps": 6710, "total_steps": 23217, "loss": 1.0468, "learning_rate": 4.0383893970181054e-05, "epoch": 0.8670370848946892, "percentage": 28.9, "elapsed_time": "0:56:08", "remaining_time": "2:18:06", "throughput": "16318.21", "total_tokens": 54968320} {"current_steps": 6720, "total_steps": 23217, "loss": 1.2028, "learning_rate": 4.0357214532049535e-05, "epoch": 0.8683292415040703, "percentage": 28.94, "elapsed_time": "0:56:57", "remaining_time": "2:19:48", "throughput": "16109.63", "total_tokens": 55050240} {"current_steps": 6730, "total_steps": 23217, "loss": 0.503, "learning_rate": 4.03305069749144e-05, "epoch": 0.8696213981134514, "percentage": 28.99, "elapsed_time": "0:57:44", "remaining_time": "2:21:26", "throughput": "15914.87", "total_tokens": 55132160} {"current_steps": 6740, "total_steps": 23217, "loss": 1.0739, "learning_rate": 4.03037713476771e-05, "epoch": 0.8709135547228324, "percentage": 29.03, "elapsed_time": "0:58:31", "remaining_time": "2:23:04", "throughput": "15724.34", "total_tokens": 55214080} {"current_steps": 6750, "total_steps": 23217, "loss": 0.7428, "learning_rate": 4.027700769929046e-05, "epoch": 0.8722057113322135, "percentage": 29.07, "elapsed_time": "0:59:18", "remaining_time": "2:24:41", "throughput": "15538.38", "total_tokens": 55296000} {"current_steps": 6760, "total_steps": 23217, "loss": 1.0242, "learning_rate": 4.025021607875862e-05, "epoch": 0.8734978679415946, "percentage": 29.12, "elapsed_time": "1:00:05", "remaining_time": "2:26:17", "throughput": "15359.00", "total_tokens": 55377920} {"current_steps": 6770, "total_steps": 23217, "loss": 1.2703, "learning_rate": 4.0223396535136945e-05, "epoch": 0.8747900245509755, "percentage": 29.16, "elapsed_time": "1:00:52", "remaining_time": "2:27:53", "throughput": "15183.62", "total_tokens": 55459840} {"current_steps": 6780, "total_steps": 23217, "loss": 0.8773, "learning_rate": 4.019654911753193e-05, "epoch": 0.8760821811603566, "percentage": 29.2, "elapsed_time": "1:01:39", "remaining_time": "2:29:29", "throughput": "15012.88", "total_tokens": 55541760} {"current_steps": 6790, "total_steps": 23217, "loss": 1.094, "learning_rate": 4.016967387510108e-05, "epoch": 0.8773743377697377, "percentage": 29.25, "elapsed_time": "1:02:27", "remaining_time": "2:31:05", "throughput": "14844.34", "total_tokens": 55623680} {"current_steps": 6800, "total_steps": 23217, "loss": 0.9265, "learning_rate": 4.014277085705288e-05, "epoch": 0.8786664943791187, "percentage": 29.29, "elapsed_time": "1:03:14", "remaining_time": "2:32:40", "throughput": "14680.92", "total_tokens": 55705600} {"current_steps": 6810, "total_steps": 23217, "loss": 0.9153, "learning_rate": 4.011584011264665e-05, "epoch": 0.8799586509884998, "percentage": 29.33, "elapsed_time": "1:04:01", "remaining_time": "2:34:15", "throughput": "14522.11", "total_tokens": 55787520} {"current_steps": 6820, "total_steps": 23217, "loss": 0.7931, "learning_rate": 4.0088881691192474e-05, "epoch": 0.8812508075978809, "percentage": 29.38, "elapsed_time": "1:04:48", "remaining_time": "2:35:48", "throughput": "14367.95", "total_tokens": 55869440} {"current_steps": 6830, "total_steps": 23217, "loss": 0.9963, "learning_rate": 4.006189564205115e-05, "epoch": 0.882542964207262, "percentage": 29.42, "elapsed_time": "1:05:35", "remaining_time": "2:37:22", "throughput": "14217.40", "total_tokens": 55951360} {"current_steps": 6840, "total_steps": 23217, "loss": 0.7636, "learning_rate": 4.0034882014634015e-05, "epoch": 0.883835120816643, "percentage": 29.46, "elapsed_time": "1:06:22", "remaining_time": "2:38:55", "throughput": "14070.10", "total_tokens": 56033280} {"current_steps": 6850, "total_steps": 23217, "loss": 0.7192, "learning_rate": 4.000784085840293e-05, "epoch": 0.885127277426024, "percentage": 29.5, "elapsed_time": "1:07:09", "remaining_time": "2:40:27", "throughput": "13926.29", "total_tokens": 56115200} {"current_steps": 6860, "total_steps": 23217, "loss": 0.9082, "learning_rate": 3.9980772222870156e-05, "epoch": 0.8864194340354051, "percentage": 29.55, "elapsed_time": "1:07:56", "remaining_time": "2:41:59", "throughput": "13785.87", "total_tokens": 56197120} {"current_steps": 6870, "total_steps": 23217, "loss": 1.2218, "learning_rate": 3.995367615759825e-05, "epoch": 0.8877115906447861, "percentage": 29.59, "elapsed_time": "1:08:43", "remaining_time": "2:43:31", "throughput": "13648.89", "total_tokens": 56279040} {"current_steps": 6880, "total_steps": 23217, "loss": 1.0894, "learning_rate": 3.992655271220003e-05, "epoch": 0.8890037472541672, "percentage": 29.63, "elapsed_time": "1:09:30", "remaining_time": "2:45:02", "throughput": "13514.79", "total_tokens": 56360960} {"current_steps": 6890, "total_steps": 23217, "loss": 1.0208, "learning_rate": 3.98994019363384e-05, "epoch": 0.8902959038635483, "percentage": 29.68, "elapsed_time": "1:10:17", "remaining_time": "2:46:33", "throughput": "13383.51", "total_tokens": 56442880} {"current_steps": 6900, "total_steps": 23217, "loss": 0.7955, "learning_rate": 3.9872223879726356e-05, "epoch": 0.8915880604729293, "percentage": 29.72, "elapsed_time": "1:11:04", "remaining_time": "2:48:04", "throughput": "13255.33", "total_tokens": 56524800} {"current_steps": 6910, "total_steps": 23217, "loss": 1.262, "learning_rate": 3.98450185921268e-05, "epoch": 0.8928802170823104, "percentage": 29.76, "elapsed_time": "1:11:51", "remaining_time": "2:49:34", "throughput": "13129.87", "total_tokens": 56606720} {"current_steps": 6920, "total_steps": 23217, "loss": 1.1836, "learning_rate": 3.981778612335253e-05, "epoch": 0.8941723736916914, "percentage": 29.81, "elapsed_time": "1:12:38", "remaining_time": "2:51:03", "throughput": "13007.18", "total_tokens": 56688640} {"current_steps": 6930, "total_steps": 23217, "loss": 0.7662, "learning_rate": 3.979052652326609e-05, "epoch": 0.8954645303010725, "percentage": 29.85, "elapsed_time": "1:13:25", "remaining_time": "2:52:33", "throughput": "12887.21", "total_tokens": 56770560} {"current_steps": 6940, "total_steps": 23217, "loss": 0.7414, "learning_rate": 3.976323984177971e-05, "epoch": 0.8967566869104535, "percentage": 29.89, "elapsed_time": "1:14:12", "remaining_time": "2:54:02", "throughput": "12769.01", "total_tokens": 56852480} {"current_steps": 6950, "total_steps": 23217, "loss": 1.0458, "learning_rate": 3.97359261288552e-05, "epoch": 0.8980488435198346, "percentage": 29.93, "elapsed_time": "1:14:59", "remaining_time": "2:55:31", "throughput": "12653.83", "total_tokens": 56934400} {"current_steps": 6960, "total_steps": 23217, "loss": 1.0642, "learning_rate": 3.970858543450387e-05, "epoch": 0.8993410001292157, "percentage": 29.98, "elapsed_time": "1:15:46", "remaining_time": "2:56:59", "throughput": "12541.00", "total_tokens": 57016320} {"current_steps": 6970, "total_steps": 23217, "loss": 1.3093, "learning_rate": 3.968121780878643e-05, "epoch": 0.9006331567385967, "percentage": 30.02, "elapsed_time": "1:16:33", "remaining_time": "2:58:27", "throughput": "12430.56", "total_tokens": 57098240} {"current_steps": 6980, "total_steps": 23217, "loss": 0.6589, "learning_rate": 3.965382330181291e-05, "epoch": 0.9019253133479778, "percentage": 30.06, "elapsed_time": "1:17:20", "remaining_time": "2:59:54", "throughput": "12322.30", "total_tokens": 57180160} {"current_steps": 6990, "total_steps": 23217, "loss": 0.6929, "learning_rate": 3.962640196374254e-05, "epoch": 0.9032174699573589, "percentage": 30.11, "elapsed_time": "1:18:07", "remaining_time": "3:01:21", "throughput": "12216.35", "total_tokens": 57262080} {"current_steps": 7000, "total_steps": 23217, "loss": 1.1313, "learning_rate": 3.9598953844783705e-05, "epoch": 0.9045096265667399, "percentage": 30.15, "elapsed_time": "1:18:54", "remaining_time": "3:02:48", "throughput": "12112.46", "total_tokens": 57344000} {"current_steps": 7010, "total_steps": 23217, "loss": 0.8748, "learning_rate": 3.957147899519379e-05, "epoch": 0.9058017831761209, "percentage": 30.19, "elapsed_time": "1:19:48", "remaining_time": "3:04:31", "throughput": "11991.52", "total_tokens": 57425920} {"current_steps": 7020, "total_steps": 23217, "loss": 0.3491, "learning_rate": 3.954397746527916e-05, "epoch": 0.907093939785502, "percentage": 30.24, "elapsed_time": "1:20:35", "remaining_time": "3:05:57", "throughput": "11892.06", "total_tokens": 57507840} {"current_steps": 7030, "total_steps": 23217, "loss": 0.7414, "learning_rate": 3.951644930539502e-05, "epoch": 0.9083860963948831, "percentage": 30.28, "elapsed_time": "1:21:22", "remaining_time": "3:07:22", "throughput": "11794.55", "total_tokens": 57589760} {"current_steps": 7040, "total_steps": 23217, "loss": 0.8839, "learning_rate": 3.9488894565945305e-05, "epoch": 0.9096782530042641, "percentage": 30.32, "elapsed_time": "1:22:09", "remaining_time": "3:08:47", "throughput": "11698.78", "total_tokens": 57671680} {"current_steps": 7050, "total_steps": 23217, "loss": 0.5389, "learning_rate": 3.9461313297382666e-05, "epoch": 0.9109704096136452, "percentage": 30.37, "elapsed_time": "1:22:56", "remaining_time": "3:10:12", "throughput": "11604.74", "total_tokens": 57753600} {"current_steps": 7060, "total_steps": 23217, "loss": 1.0182, "learning_rate": 3.94337055502083e-05, "epoch": 0.9122625662230263, "percentage": 30.41, "elapsed_time": "1:23:43", "remaining_time": "3:11:36", "throughput": "11512.57", "total_tokens": 57835520} {"current_steps": 7070, "total_steps": 23217, "loss": 1.0376, "learning_rate": 3.9406071374971887e-05, "epoch": 0.9135547228324072, "percentage": 30.45, "elapsed_time": "1:24:30", "remaining_time": "3:13:00", "throughput": "11422.35", "total_tokens": 57917440} {"current_steps": 7080, "total_steps": 23217, "loss": 0.6095, "learning_rate": 3.93784108222715e-05, "epoch": 0.9148468794417883, "percentage": 30.49, "elapsed_time": "1:25:17", "remaining_time": "3:14:24", "throughput": "11333.44", "total_tokens": 57999360} {"current_steps": 7090, "total_steps": 23217, "loss": 1.0714, "learning_rate": 3.935072394275352e-05, "epoch": 0.9161390360511694, "percentage": 30.54, "elapsed_time": "1:26:04", "remaining_time": "3:15:47", "throughput": "11246.24", "total_tokens": 58081280} {"current_steps": 7100, "total_steps": 23217, "loss": 1.116, "learning_rate": 3.9323010787112505e-05, "epoch": 0.9174311926605505, "percentage": 30.58, "elapsed_time": "1:26:51", "remaining_time": "3:17:09", "throughput": "11160.75", "total_tokens": 58163200} {"current_steps": 7110, "total_steps": 23217, "loss": 1.1167, "learning_rate": 3.929527140609115e-05, "epoch": 0.9187233492699315, "percentage": 30.62, "elapsed_time": "1:27:38", "remaining_time": "3:18:32", "throughput": "11076.67", "total_tokens": 58245120} {"current_steps": 7120, "total_steps": 23217, "loss": 0.7755, "learning_rate": 3.926750585048016e-05, "epoch": 0.9200155058793126, "percentage": 30.67, "elapsed_time": "1:28:25", "remaining_time": "3:19:54", "throughput": "10994.01", "total_tokens": 58327040} {"current_steps": 7130, "total_steps": 23217, "loss": 0.7525, "learning_rate": 3.9239714171118167e-05, "epoch": 0.9213076624886937, "percentage": 30.71, "elapsed_time": "1:29:12", "remaining_time": "3:21:16", "throughput": "10912.75", "total_tokens": 58408960} {"current_steps": 7140, "total_steps": 23217, "loss": 0.9602, "learning_rate": 3.921189641889163e-05, "epoch": 0.9225998190980746, "percentage": 30.75, "elapsed_time": "1:29:59", "remaining_time": "3:22:37", "throughput": "10832.88", "total_tokens": 58490880} {"current_steps": 7150, "total_steps": 23217, "loss": 0.7652, "learning_rate": 3.918405264473476e-05, "epoch": 0.9238919757074557, "percentage": 30.8, "elapsed_time": "1:30:46", "remaining_time": "3:23:59", "throughput": "10754.09", "total_tokens": 58572800} {"current_steps": 7160, "total_steps": 23217, "loss": 0.5639, "learning_rate": 3.9156182899629404e-05, "epoch": 0.9251841323168368, "percentage": 30.84, "elapsed_time": "1:31:33", "remaining_time": "3:25:19", "throughput": "10676.95", "total_tokens": 58654720} {"current_steps": 7170, "total_steps": 23217, "loss": 0.8571, "learning_rate": 3.912828723460495e-05, "epoch": 0.9264762889262178, "percentage": 30.88, "elapsed_time": "1:32:20", "remaining_time": "3:26:40", "throughput": "10601.31", "total_tokens": 58736640} {"current_steps": 7180, "total_steps": 23217, "loss": 0.747, "learning_rate": 3.9100365700738275e-05, "epoch": 0.9277684455355989, "percentage": 30.93, "elapsed_time": "1:33:07", "remaining_time": "3:28:00", "throughput": "10526.82", "total_tokens": 58818560} {"current_steps": 7190, "total_steps": 23217, "loss": 0.8309, "learning_rate": 3.907241834915359e-05, "epoch": 0.92906060214498, "percentage": 30.97, "elapsed_time": "1:33:54", "remaining_time": "3:29:19", "throughput": "10453.69", "total_tokens": 58900480} {"current_steps": 7200, "total_steps": 23217, "loss": 0.9932, "learning_rate": 3.904444523102242e-05, "epoch": 0.9303527587543611, "percentage": 31.01, "elapsed_time": "1:34:41", "remaining_time": "3:30:38", "throughput": "10381.81", "total_tokens": 58982400} {"current_steps": 7210, "total_steps": 23217, "loss": 0.9913, "learning_rate": 3.901644639756342e-05, "epoch": 0.931644915363742, "percentage": 31.05, "elapsed_time": "1:35:28", "remaining_time": "3:31:57", "throughput": "10310.94", "total_tokens": 59064320} {"current_steps": 7220, "total_steps": 23217, "loss": 0.9762, "learning_rate": 3.898842190004235e-05, "epoch": 0.9329370719731231, "percentage": 31.1, "elapsed_time": "1:36:15", "remaining_time": "3:33:16", "throughput": "10241.20", "total_tokens": 59146240} {"current_steps": 7230, "total_steps": 23217, "loss": 0.6812, "learning_rate": 3.896037178977196e-05, "epoch": 0.9342292285825042, "percentage": 31.14, "elapsed_time": "1:37:02", "remaining_time": "3:34:34", "throughput": "10172.67", "total_tokens": 59228160} {"current_steps": 7240, "total_steps": 23217, "loss": 1.3312, "learning_rate": 3.893229611811192e-05, "epoch": 0.9355213851918852, "percentage": 31.18, "elapsed_time": "1:37:49", "remaining_time": "3:35:52", "throughput": "10105.09", "total_tokens": 59310080} {"current_steps": 7250, "total_steps": 23217, "loss": 1.0935, "learning_rate": 3.8904194936468665e-05, "epoch": 0.9368135418012663, "percentage": 31.23, "elapsed_time": "1:38:36", "remaining_time": "3:37:09", "throughput": "10038.72", "total_tokens": 59392000} {"current_steps": 7260, "total_steps": 23217, "loss": 0.7918, "learning_rate": 3.887606829629536e-05, "epoch": 0.9381056984106474, "percentage": 31.27, "elapsed_time": "1:39:23", "remaining_time": "3:38:26", "throughput": "9973.36", "total_tokens": 59473920} {"current_steps": 7270, "total_steps": 23217, "loss": 0.8013, "learning_rate": 3.884791624909178e-05, "epoch": 0.9393978550200285, "percentage": 31.31, "elapsed_time": "1:40:10", "remaining_time": "3:39:43", "throughput": "9909.09", "total_tokens": 59555840} {"current_steps": 7280, "total_steps": 23217, "loss": 1.0558, "learning_rate": 3.881973884640422e-05, "epoch": 0.9406900116294095, "percentage": 31.36, "elapsed_time": "1:40:57", "remaining_time": "3:41:00", "throughput": "9845.84", "total_tokens": 59637760} {"current_steps": 7290, "total_steps": 23217, "loss": 1.1583, "learning_rate": 3.87915361398254e-05, "epoch": 0.9419821682387906, "percentage": 31.4, "elapsed_time": "1:41:44", "remaining_time": "3:42:16", "throughput": "9783.51", "total_tokens": 59719680} {"current_steps": 7300, "total_steps": 23217, "loss": 0.4953, "learning_rate": 3.8763308180994384e-05, "epoch": 0.9432743248481716, "percentage": 31.44, "elapsed_time": "1:42:31", "remaining_time": "3:43:31", "throughput": "9722.05", "total_tokens": 59801600} {"current_steps": 7310, "total_steps": 23217, "loss": 1.1762, "learning_rate": 3.873505502159645e-05, "epoch": 0.9445664814575526, "percentage": 31.49, "elapsed_time": "1:43:18", "remaining_time": "3:44:47", "throughput": "9661.61", "total_tokens": 59883520} {"current_steps": 7320, "total_steps": 23217, "loss": 0.7593, "learning_rate": 3.8706776713363025e-05, "epoch": 0.9458586380669337, "percentage": 31.53, "elapsed_time": "1:44:05", "remaining_time": "3:46:02", "throughput": "9602.03", "total_tokens": 59965440} {"current_steps": 7330, "total_steps": 23217, "loss": 0.6101, "learning_rate": 3.86784733080716e-05, "epoch": 0.9471507946763148, "percentage": 31.57, "elapsed_time": "1:44:52", "remaining_time": "3:47:17", "throughput": "9543.38", "total_tokens": 60047360} {"current_steps": 7340, "total_steps": 23217, "loss": 1.1621, "learning_rate": 3.86501448575456e-05, "epoch": 0.9484429512856958, "percentage": 31.61, "elapsed_time": "1:45:39", "remaining_time": "3:48:31", "throughput": "9485.58", "total_tokens": 60129280} {"current_steps": 7350, "total_steps": 23217, "loss": 0.6934, "learning_rate": 3.862179141365431e-05, "epoch": 0.9497351078950769, "percentage": 31.66, "elapsed_time": "1:46:25", "remaining_time": "3:49:45", "throughput": "9428.67", "total_tokens": 60211200} {"current_steps": 7360, "total_steps": 23217, "loss": 1.064, "learning_rate": 3.859341302831279e-05, "epoch": 0.951027264504458, "percentage": 31.7, "elapsed_time": "1:47:12", "remaining_time": "3:50:59", "throughput": "9372.53", "total_tokens": 60293120} {"current_steps": 7370, "total_steps": 23217, "loss": 0.9418, "learning_rate": 3.856500975348176e-05, "epoch": 0.952319421113839, "percentage": 31.74, "elapsed_time": "1:47:59", "remaining_time": "3:52:13", "throughput": "9317.32", "total_tokens": 60375040} {"current_steps": 7380, "total_steps": 23217, "loss": 0.8951, "learning_rate": 3.8536581641167506e-05, "epoch": 0.95361157772322, "percentage": 31.79, "elapsed_time": "1:48:46", "remaining_time": "3:53:26", "throughput": "9262.85", "total_tokens": 60456960} {"current_steps": 7390, "total_steps": 23217, "loss": 0.9263, "learning_rate": 3.85081287434218e-05, "epoch": 0.9549037343326011, "percentage": 31.83, "elapsed_time": "1:49:33", "remaining_time": "3:54:39", "throughput": "9209.08", "total_tokens": 60538880} {"current_steps": 7400, "total_steps": 23217, "loss": 1.1756, "learning_rate": 3.84796511123418e-05, "epoch": 0.9561958909419822, "percentage": 31.87, "elapsed_time": "1:50:20", "remaining_time": "3:55:51", "throughput": "9156.13", "total_tokens": 60620800} {"current_steps": 7410, "total_steps": 23217, "loss": 0.9992, "learning_rate": 3.845114880006994e-05, "epoch": 0.9574880475513632, "percentage": 31.92, "elapsed_time": "1:51:07", "remaining_time": "3:57:03", "throughput": "9103.96", "total_tokens": 60702720} {"current_steps": 7420, "total_steps": 23217, "loss": 1.1923, "learning_rate": 3.842262185879384e-05, "epoch": 0.9587802041607443, "percentage": 31.96, "elapsed_time": "1:51:54", "remaining_time": "3:58:15", "throughput": "9052.45", "total_tokens": 60784640} {"current_steps": 7430, "total_steps": 23217, "loss": 0.828, "learning_rate": 3.8394070340746234e-05, "epoch": 0.9600723607701254, "percentage": 32.0, "elapsed_time": "1:52:41", "remaining_time": "3:59:27", "throughput": "9001.64", "total_tokens": 60866560} {"current_steps": 7440, "total_steps": 23217, "loss": 0.9765, "learning_rate": 3.836549429820485e-05, "epoch": 0.9613645173795063, "percentage": 32.05, "elapsed_time": "1:53:28", "remaining_time": "4:00:38", "throughput": "8951.57", "total_tokens": 60948480} {"current_steps": 7450, "total_steps": 23217, "loss": 0.9062, "learning_rate": 3.833689378349231e-05, "epoch": 0.9626566739888874, "percentage": 32.09, "elapsed_time": "1:54:15", "remaining_time": "4:01:49", "throughput": "8902.10", "total_tokens": 61030400} {"current_steps": 7460, "total_steps": 23217, "loss": 1.0222, "learning_rate": 3.830826884897606e-05, "epoch": 0.9639488305982685, "percentage": 32.13, "elapsed_time": "1:55:02", "remaining_time": "4:02:59", "throughput": "8853.43", "total_tokens": 61112320} {"current_steps": 7470, "total_steps": 23217, "loss": 1.118, "learning_rate": 3.827961954706825e-05, "epoch": 0.9652409872076496, "percentage": 32.17, "elapsed_time": "1:55:49", "remaining_time": "4:04:09", "throughput": "8805.46", "total_tokens": 61194240} {"current_steps": 7480, "total_steps": 23217, "loss": 1.078, "learning_rate": 3.825094593022563e-05, "epoch": 0.9665331438170306, "percentage": 32.22, "elapsed_time": "1:56:47", "remaining_time": "4:05:41", "throughput": "8744.94", "total_tokens": 61276160} {"current_steps": 7490, "total_steps": 23217, "loss": 0.665, "learning_rate": 3.8222248050949505e-05, "epoch": 0.9678253004264117, "percentage": 32.26, "elapsed_time": "1:57:33", "remaining_time": "4:06:51", "throughput": "8698.39", "total_tokens": 61358080} {"current_steps": 7500, "total_steps": 23217, "loss": 0.9969, "learning_rate": 3.8193525961785584e-05, "epoch": 0.9691174570357928, "percentage": 32.3, "elapsed_time": "1:58:20", "remaining_time": "4:08:00", "throughput": "8652.34", "total_tokens": 61440000} {"current_steps": 7510, "total_steps": 23217, "loss": 0.9114, "learning_rate": 3.8164779715323905e-05, "epoch": 0.9704096136451738, "percentage": 32.35, "elapsed_time": "1:59:07", "remaining_time": "4:09:09", "throughput": "8606.94", "total_tokens": 61521920} {"current_steps": 7520, "total_steps": 23217, "loss": 0.7856, "learning_rate": 3.813600936419874e-05, "epoch": 0.9717017702545548, "percentage": 32.39, "elapsed_time": "1:59:54", "remaining_time": "4:10:18", "throughput": "8562.04", "total_tokens": 61603840} {"current_steps": 7530, "total_steps": 23217, "loss": 1.0216, "learning_rate": 3.81072149610885e-05, "epoch": 0.9729939268639359, "percentage": 32.43, "elapsed_time": "2:00:41", "remaining_time": "4:11:27", "throughput": "8517.78", "total_tokens": 61685760} {"current_steps": 7540, "total_steps": 23217, "loss": 0.7388, "learning_rate": 3.807839655871563e-05, "epoch": 0.9742860834733169, "percentage": 32.48, "elapsed_time": "2:01:28", "remaining_time": "4:12:35", "throughput": "8474.10", "total_tokens": 61767680} {"current_steps": 7550, "total_steps": 23217, "loss": 0.6208, "learning_rate": 3.8049554209846514e-05, "epoch": 0.975578240082698, "percentage": 32.52, "elapsed_time": "2:02:16", "remaining_time": "4:13:43", "throughput": "8430.84", "total_tokens": 61849600} {"current_steps": 7560, "total_steps": 23217, "loss": 1.1114, "learning_rate": 3.802068796729139e-05, "epoch": 0.9768703966920791, "percentage": 32.56, "elapsed_time": "2:03:03", "remaining_time": "4:14:50", "throughput": "8388.35", "total_tokens": 61931520} {"current_steps": 7570, "total_steps": 23217, "loss": 0.9243, "learning_rate": 3.7991797883904254e-05, "epoch": 0.9781625533014602, "percentage": 32.61, "elapsed_time": "2:03:50", "remaining_time": "4:15:57", "throughput": "8346.31", "total_tokens": 62013440} {"current_steps": 7580, "total_steps": 23217, "loss": 0.8196, "learning_rate": 3.796288401258272e-05, "epoch": 0.9794547099108412, "percentage": 32.65, "elapsed_time": "2:04:37", "remaining_time": "4:17:04", "throughput": "8304.74", "total_tokens": 62095360} {"current_steps": 7590, "total_steps": 23217, "loss": 0.8933, "learning_rate": 3.7933946406268e-05, "epoch": 0.9807468665202222, "percentage": 32.69, "elapsed_time": "2:05:24", "remaining_time": "4:18:11", "throughput": "8263.77", "total_tokens": 62177280} {"current_steps": 7600, "total_steps": 23217, "loss": 0.9035, "learning_rate": 3.790498511794473e-05, "epoch": 0.9820390231296033, "percentage": 32.73, "elapsed_time": "2:06:11", "remaining_time": "4:19:17", "throughput": "8223.33", "total_tokens": 62259200} {"current_steps": 7610, "total_steps": 23217, "loss": 0.9369, "learning_rate": 3.787600020064095e-05, "epoch": 0.9833311797389843, "percentage": 32.78, "elapsed_time": "2:06:57", "remaining_time": "4:20:23", "throughput": "8183.43", "total_tokens": 62341120} {"current_steps": 7620, "total_steps": 23217, "loss": 0.7782, "learning_rate": 3.7846991707427905e-05, "epoch": 0.9846233363483654, "percentage": 32.82, "elapsed_time": "2:07:45", "remaining_time": "4:21:29", "throughput": "8143.90", "total_tokens": 62423040} {"current_steps": 7630, "total_steps": 23217, "loss": 0.8775, "learning_rate": 3.7817959691420056e-05, "epoch": 0.9859154929577465, "percentage": 32.86, "elapsed_time": "2:08:31", "remaining_time": "4:22:34", "throughput": "8104.94", "total_tokens": 62504960} {"current_steps": 7640, "total_steps": 23217, "loss": 0.7959, "learning_rate": 3.778890420577492e-05, "epoch": 0.9872076495671276, "percentage": 32.91, "elapsed_time": "2:09:18", "remaining_time": "4:23:39", "throughput": "8066.45", "total_tokens": 62586880} {"current_steps": 7650, "total_steps": 23217, "loss": 1.0962, "learning_rate": 3.775982530369298e-05, "epoch": 0.9884998061765086, "percentage": 32.95, "elapsed_time": "2:10:05", "remaining_time": "4:24:44", "throughput": "8028.46", "total_tokens": 62668800} {"current_steps": 7660, "total_steps": 23217, "loss": 1.1062, "learning_rate": 3.77307230384176e-05, "epoch": 0.9897919627858897, "percentage": 32.99, "elapsed_time": "2:10:52", "remaining_time": "4:25:48", "throughput": "7990.82", "total_tokens": 62750720} {"current_steps": 7670, "total_steps": 23217, "loss": 0.6531, "learning_rate": 3.7701597463234916e-05, "epoch": 0.9910841193952707, "percentage": 33.04, "elapsed_time": "2:11:39", "remaining_time": "4:26:52", "throughput": "7953.71", "total_tokens": 62832640} {"current_steps": 7680, "total_steps": 23217, "loss": 0.8184, "learning_rate": 3.767244863147377e-05, "epoch": 0.9923762760046517, "percentage": 33.08, "elapsed_time": "2:12:26", "remaining_time": "4:27:56", "throughput": "7917.07", "total_tokens": 62914560} {"current_steps": 7690, "total_steps": 23217, "loss": 1.1191, "learning_rate": 3.764327659650553e-05, "epoch": 0.9936684326140328, "percentage": 33.12, "elapsed_time": "2:13:13", "remaining_time": "4:29:00", "throughput": "7880.75", "total_tokens": 62996480} {"current_steps": 7700, "total_steps": 23217, "loss": 1.1411, "learning_rate": 3.7614081411744116e-05, "epoch": 0.9949605892234139, "percentage": 33.17, "elapsed_time": "2:14:00", "remaining_time": "4:30:03", "throughput": "7844.92", "total_tokens": 63078400} {"current_steps": 7710, "total_steps": 23217, "loss": 1.0581, "learning_rate": 3.75848631306458e-05, "epoch": 0.9962527458327949, "percentage": 33.21, "elapsed_time": "2:14:47", "remaining_time": "4:31:06", "throughput": "7809.46", "total_tokens": 63160320} {"current_steps": 7720, "total_steps": 23217, "loss": 0.8535, "learning_rate": 3.755562180670914e-05, "epoch": 0.997544902442176, "percentage": 33.25, "elapsed_time": "2:15:34", "remaining_time": "4:32:09", "throughput": "7774.44", "total_tokens": 63242240} {"current_steps": 7730, "total_steps": 23217, "loss": 0.7162, "learning_rate": 3.75263574934749e-05, "epoch": 0.9988370590515571, "percentage": 33.29, "elapsed_time": "2:16:21", "remaining_time": "4:33:11", "throughput": "7739.81", "total_tokens": 63324160} {"current_steps": 7740, "total_steps": 23217, "loss": 0.6882, "learning_rate": 3.7497070244525925e-05, "epoch": 1.000129215660938, "percentage": 33.34, "elapsed_time": "2:17:08", "remaining_time": "4:34:13", "throughput": "7705.59", "total_tokens": 63406080} {"current_steps": 7750, "total_steps": 23217, "loss": 1.1799, "learning_rate": 3.746776011348706e-05, "epoch": 1.0014213722703191, "percentage": 33.38, "elapsed_time": "2:17:55", "remaining_time": "4:35:15", "throughput": "7671.74", "total_tokens": 63488000} {"current_steps": 7760, "total_steps": 23217, "loss": 0.5552, "learning_rate": 3.7438427154025045e-05, "epoch": 1.0027135288797002, "percentage": 33.42, "elapsed_time": "2:18:42", "remaining_time": "4:36:17", "throughput": "7638.27", "total_tokens": 63569920} {"current_steps": 7770, "total_steps": 23217, "loss": 1.1324, "learning_rate": 3.7409071419848436e-05, "epoch": 1.0040056854890813, "percentage": 33.47, "elapsed_time": "2:19:29", "remaining_time": "4:37:18", "throughput": "7605.23", "total_tokens": 63651840} {"current_steps": 7780, "total_steps": 23217, "loss": 0.9001, "learning_rate": 3.7379692964707456e-05, "epoch": 1.0052978420984624, "percentage": 33.51, "elapsed_time": "2:20:16", "remaining_time": "4:38:19", "throughput": "7572.51", "total_tokens": 63733760} {"current_steps": 7790, "total_steps": 23217, "loss": 1.1056, "learning_rate": 3.735029184239396e-05, "epoch": 1.0065899987078435, "percentage": 33.55, "elapsed_time": "2:21:03", "remaining_time": "4:39:20", "throughput": "7540.18", "total_tokens": 63815680} {"current_steps": 7800, "total_steps": 23217, "loss": 0.9637, "learning_rate": 3.73208681067413e-05, "epoch": 1.0078821553172244, "percentage": 33.6, "elapsed_time": "2:21:50", "remaining_time": "4:40:21", "throughput": "7508.21", "total_tokens": 63897600} {"current_steps": 7810, "total_steps": 23217, "loss": 0.6649, "learning_rate": 3.7291421811624216e-05, "epoch": 1.0091743119266054, "percentage": 33.64, "elapsed_time": "2:22:37", "remaining_time": "4:41:21", "throughput": "7476.62", "total_tokens": 63979520} {"current_steps": 7820, "total_steps": 23217, "loss": 0.5021, "learning_rate": 3.726195301095877e-05, "epoch": 1.0104664685359865, "percentage": 33.68, "elapsed_time": "2:23:24", "remaining_time": "4:42:21", "throughput": "7445.29", "total_tokens": 64061440} {"current_steps": 7830, "total_steps": 23217, "loss": 0.9135, "learning_rate": 3.7232461758702244e-05, "epoch": 1.0117586251453676, "percentage": 33.73, "elapsed_time": "2:24:11", "remaining_time": "4:43:21", "throughput": "7414.20", "total_tokens": 64143360} {"current_steps": 7840, "total_steps": 23217, "loss": 0.6548, "learning_rate": 3.7202948108852984e-05, "epoch": 1.0130507817547487, "percentage": 33.77, "elapsed_time": "2:24:58", "remaining_time": "4:44:20", "throughput": "7383.59", "total_tokens": 64225280} {"current_steps": 7850, "total_steps": 23217, "loss": 0.6679, "learning_rate": 3.717341211545039e-05, "epoch": 1.0143429383641298, "percentage": 33.81, "elapsed_time": "2:25:45", "remaining_time": "4:45:19", "throughput": "7353.32", "total_tokens": 64307200} {"current_steps": 7860, "total_steps": 23217, "loss": 1.115, "learning_rate": 3.714385383257477e-05, "epoch": 1.015635094973511, "percentage": 33.85, "elapsed_time": "2:26:32", "remaining_time": "4:46:18", "throughput": "7323.31", "total_tokens": 64389120} {"current_steps": 7870, "total_steps": 23217, "loss": 0.7203, "learning_rate": 3.711427331434721e-05, "epoch": 1.0169272515828918, "percentage": 33.9, "elapsed_time": "2:27:19", "remaining_time": "4:47:17", "throughput": "7293.64", "total_tokens": 64471040} {"current_steps": 7880, "total_steps": 23217, "loss": 0.7494, "learning_rate": 3.7084670614929554e-05, "epoch": 1.0182194081922729, "percentage": 33.94, "elapsed_time": "2:28:06", "remaining_time": "4:48:15", "throughput": "7264.35", "total_tokens": 64552960} {"current_steps": 7890, "total_steps": 23217, "loss": 0.7702, "learning_rate": 3.7055045788524214e-05, "epoch": 1.019511564801654, "percentage": 33.98, "elapsed_time": "2:28:53", "remaining_time": "4:49:13", "throughput": "7235.40", "total_tokens": 64634880} {"current_steps": 7900, "total_steps": 23217, "loss": 1.0498, "learning_rate": 3.702539888937414e-05, "epoch": 1.020803721411035, "percentage": 34.03, "elapsed_time": "2:29:40", "remaining_time": "4:50:11", "throughput": "7206.68", "total_tokens": 64716800} {"current_steps": 7910, "total_steps": 23217, "loss": 0.8016, "learning_rate": 3.699572997176272e-05, "epoch": 1.0220958780204161, "percentage": 34.07, "elapsed_time": "2:30:27", "remaining_time": "4:51:08", "throughput": "7178.24", "total_tokens": 64798720} {"current_steps": 7920, "total_steps": 23217, "loss": 0.741, "learning_rate": 3.696603909001361e-05, "epoch": 1.0233880346297972, "percentage": 34.11, "elapsed_time": "2:31:14", "remaining_time": "4:52:06", "throughput": "7150.11", "total_tokens": 64880640} {"current_steps": 7930, "total_steps": 23217, "loss": 0.7687, "learning_rate": 3.69363262984907e-05, "epoch": 1.024680191239178, "percentage": 34.16, "elapsed_time": "2:32:01", "remaining_time": "4:53:02", "throughput": "7122.29", "total_tokens": 64962560} {"current_steps": 7940, "total_steps": 23217, "loss": 1.0326, "learning_rate": 3.690659165159803e-05, "epoch": 1.0259723478485592, "percentage": 34.2, "elapsed_time": "2:32:47", "remaining_time": "4:53:59", "throughput": "7094.74", "total_tokens": 65044480} {"current_steps": 7950, "total_steps": 23217, "loss": 0.961, "learning_rate": 3.6876835203779615e-05, "epoch": 1.0272645044579403, "percentage": 34.24, "elapsed_time": "2:33:34", "remaining_time": "4:54:56", "throughput": "7067.44", "total_tokens": 65126400} {"current_steps": 7960, "total_steps": 23217, "loss": 0.8982, "learning_rate": 3.68470570095194e-05, "epoch": 1.0285566610673214, "percentage": 34.29, "elapsed_time": "2:34:21", "remaining_time": "4:55:52", "throughput": "7040.43", "total_tokens": 65208320} {"current_steps": 7970, "total_steps": 23217, "loss": 0.8534, "learning_rate": 3.681725712334115e-05, "epoch": 1.0298488176767024, "percentage": 34.33, "elapsed_time": "2:35:08", "remaining_time": "4:56:48", "throughput": "7013.68", "total_tokens": 65290240} {"current_steps": 7980, "total_steps": 23217, "loss": 0.6313, "learning_rate": 3.678743559980835e-05, "epoch": 1.0311409742860835, "percentage": 34.37, "elapsed_time": "2:35:56", "remaining_time": "4:57:44", "throughput": "6987.17", "total_tokens": 65372160} {"current_steps": 7990, "total_steps": 23217, "loss": 0.9277, "learning_rate": 3.67575924935241e-05, "epoch": 1.0324331308954646, "percentage": 34.41, "elapsed_time": "2:36:43", "remaining_time": "4:58:39", "throughput": "6960.96", "total_tokens": 65454080} {"current_steps": 8000, "total_steps": 23217, "loss": 0.8789, "learning_rate": 3.672772785913102e-05, "epoch": 1.0337252875048455, "percentage": 34.46, "elapsed_time": "2:37:30", "remaining_time": "4:59:35", "throughput": "6935.03", "total_tokens": 65536000} {"current_steps": 8010, "total_steps": 23217, "loss": 0.4837, "learning_rate": 3.669784175131115e-05, "epoch": 1.0350174441142266, "percentage": 34.5, "elapsed_time": "2:38:27", "remaining_time": "5:00:49", "throughput": "6901.78", "total_tokens": 65617920} {"current_steps": 8020, "total_steps": 23217, "loss": 0.7244, "learning_rate": 3.666793422478583e-05, "epoch": 1.0363096007236077, "percentage": 34.54, "elapsed_time": "2:39:14", "remaining_time": "5:01:44", "throughput": "6876.46", "total_tokens": 65699840} {"current_steps": 8030, "total_steps": 23217, "loss": 0.63, "learning_rate": 3.663800533431564e-05, "epoch": 1.0376017573329888, "percentage": 34.59, "elapsed_time": "2:40:01", "remaining_time": "5:02:38", "throughput": "6851.32", "total_tokens": 65781760} {"current_steps": 8040, "total_steps": 23217, "loss": 1.0153, "learning_rate": 3.660805513470027e-05, "epoch": 1.0388939139423699, "percentage": 34.63, "elapsed_time": "2:40:48", "remaining_time": "5:03:33", "throughput": "6826.42", "total_tokens": 65863680} {"current_steps": 8050, "total_steps": 23217, "loss": 0.7835, "learning_rate": 3.657808368077843e-05, "epoch": 1.040186070551751, "percentage": 34.67, "elapsed_time": "2:41:35", "remaining_time": "5:04:26", "throughput": "6801.80", "total_tokens": 65945600} {"current_steps": 8060, "total_steps": 23217, "loss": 0.7988, "learning_rate": 3.654809102742773e-05, "epoch": 1.041478227161132, "percentage": 34.72, "elapsed_time": "2:42:22", "remaining_time": "5:05:20", "throughput": "6777.40", "total_tokens": 66027520} {"current_steps": 8070, "total_steps": 23217, "loss": 1.3038, "learning_rate": 3.651807722956462e-05, "epoch": 1.042770383770513, "percentage": 34.76, "elapsed_time": "2:43:09", "remaining_time": "5:06:14", "throughput": "6753.24", "total_tokens": 66109440} {"current_steps": 8080, "total_steps": 23217, "loss": 0.7774, "learning_rate": 3.648804234214425e-05, "epoch": 1.044062540379894, "percentage": 34.8, "elapsed_time": "2:43:56", "remaining_time": "5:07:07", "throughput": "6729.32", "total_tokens": 66191360} {"current_steps": 8090, "total_steps": 23217, "loss": 0.7951, "learning_rate": 3.645798642016039e-05, "epoch": 1.045354696989275, "percentage": 34.85, "elapsed_time": "2:44:43", "remaining_time": "5:08:00", "throughput": "6705.43", "total_tokens": 66273280} {"current_steps": 8100, "total_steps": 23217, "loss": 0.7105, "learning_rate": 3.642790951864532e-05, "epoch": 1.0466468535986562, "percentage": 34.89, "elapsed_time": "2:45:30", "remaining_time": "5:08:53", "throughput": "6681.96", "total_tokens": 66355200} {"current_steps": 8110, "total_steps": 23217, "loss": 0.644, "learning_rate": 3.639781169266975e-05, "epoch": 1.0479390102080373, "percentage": 34.93, "elapsed_time": "2:46:17", "remaining_time": "5:09:45", "throughput": "6658.73", "total_tokens": 66437120} {"current_steps": 8120, "total_steps": 23217, "loss": 0.7002, "learning_rate": 3.636769299734267e-05, "epoch": 1.0492311668174183, "percentage": 34.97, "elapsed_time": "2:47:04", "remaining_time": "5:10:37", "throughput": "6635.68", "total_tokens": 66519040} {"current_steps": 8130, "total_steps": 23217, "loss": 0.9435, "learning_rate": 3.63375534878113e-05, "epoch": 1.0505233234267992, "percentage": 35.02, "elapsed_time": "2:47:51", "remaining_time": "5:11:29", "throughput": "6612.88", "total_tokens": 66600960} {"current_steps": 8140, "total_steps": 23217, "loss": 0.8839, "learning_rate": 3.6307393219261e-05, "epoch": 1.0518154800361803, "percentage": 35.06, "elapsed_time": "2:48:38", "remaining_time": "5:12:21", "throughput": "6590.26", "total_tokens": 66682880} {"current_steps": 8150, "total_steps": 23217, "loss": 0.8676, "learning_rate": 3.627721224691507e-05, "epoch": 1.0531076366455614, "percentage": 35.1, "elapsed_time": "2:49:25", "remaining_time": "5:13:13", "throughput": "6567.71", "total_tokens": 66764800} {"current_steps": 8160, "total_steps": 23217, "loss": 0.6555, "learning_rate": 3.6247010626034795e-05, "epoch": 1.0543997932549425, "percentage": 35.15, "elapsed_time": "2:50:12", "remaining_time": "5:14:04", "throughput": "6545.53", "total_tokens": 66846720} {"current_steps": 8170, "total_steps": 23217, "loss": 0.8207, "learning_rate": 3.621678841191922e-05, "epoch": 1.0556919498643236, "percentage": 35.19, "elapsed_time": "2:50:59", "remaining_time": "5:14:55", "throughput": "6523.60", "total_tokens": 66928640} {"current_steps": 8180, "total_steps": 23217, "loss": 1.0707, "learning_rate": 3.618654565990511e-05, "epoch": 1.0569841064737047, "percentage": 35.23, "elapsed_time": "2:51:46", "remaining_time": "5:15:45", "throughput": "6501.87", "total_tokens": 67010560} {"current_steps": 8190, "total_steps": 23217, "loss": 0.7523, "learning_rate": 3.615628242536682e-05, "epoch": 1.0582762630830858, "percentage": 35.28, "elapsed_time": "2:52:33", "remaining_time": "5:16:36", "throughput": "6480.24", "total_tokens": 67092480} {"current_steps": 8200, "total_steps": 23217, "loss": 0.7847, "learning_rate": 3.612599876371625e-05, "epoch": 1.0595684196924666, "percentage": 35.32, "elapsed_time": "2:53:20", "remaining_time": "5:17:26", "throughput": "6458.83", "total_tokens": 67174400} {"current_steps": 8210, "total_steps": 23217, "loss": 1.0002, "learning_rate": 3.609569473040265e-05, "epoch": 1.0608605763018477, "percentage": 35.36, "elapsed_time": "2:54:07", "remaining_time": "5:18:17", "throughput": "6437.49", "total_tokens": 67256320} {"current_steps": 8220, "total_steps": 23217, "loss": 0.9216, "learning_rate": 3.6065370380912587e-05, "epoch": 1.0621527329112288, "percentage": 35.41, "elapsed_time": "2:54:54", "remaining_time": "5:19:06", "throughput": "6416.51", "total_tokens": 67338240} {"current_steps": 8230, "total_steps": 23217, "loss": 0.9941, "learning_rate": 3.603502577076986e-05, "epoch": 1.06344488952061, "percentage": 35.45, "elapsed_time": "2:55:41", "remaining_time": "5:19:56", "throughput": "6395.65", "total_tokens": 67420160} {"current_steps": 8240, "total_steps": 23217, "loss": 0.6576, "learning_rate": 3.600466095553532e-05, "epoch": 1.064737046129991, "percentage": 35.49, "elapsed_time": "2:56:28", "remaining_time": "5:20:45", "throughput": "6374.99", "total_tokens": 67502080} {"current_steps": 8250, "total_steps": 23217, "loss": 1.2263, "learning_rate": 3.5974275990806846e-05, "epoch": 1.066029202739372, "percentage": 35.53, "elapsed_time": "2:57:15", "remaining_time": "5:21:34", "throughput": "6354.49", "total_tokens": 67584000} {"current_steps": 8260, "total_steps": 23217, "loss": 0.7686, "learning_rate": 3.5943870932219184e-05, "epoch": 1.0673213593487532, "percentage": 35.58, "elapsed_time": "2:58:02", "remaining_time": "5:22:23", "throughput": "6334.20", "total_tokens": 67665920} {"current_steps": 8270, "total_steps": 23217, "loss": 0.9912, "learning_rate": 3.59134458354439e-05, "epoch": 1.068613515958134, "percentage": 35.62, "elapsed_time": "2:58:49", "remaining_time": "5:23:12", "throughput": "6314.11", "total_tokens": 67747840} {"current_steps": 8280, "total_steps": 23217, "loss": 0.7774, "learning_rate": 3.588300075618922e-05, "epoch": 1.0699056725675151, "percentage": 35.66, "elapsed_time": "2:59:36", "remaining_time": "5:24:00", "throughput": "6294.17", "total_tokens": 67829760} {"current_steps": 8290, "total_steps": 23217, "loss": 1.002, "learning_rate": 3.5852535750199977e-05, "epoch": 1.0711978291768962, "percentage": 35.71, "elapsed_time": "3:00:23", "remaining_time": "5:24:49", "throughput": "6274.40", "total_tokens": 67911680} {"current_steps": 8300, "total_steps": 23217, "loss": 0.767, "learning_rate": 3.5822050873257494e-05, "epoch": 1.0724899857862773, "percentage": 35.75, "elapsed_time": "3:01:10", "remaining_time": "5:25:36", "throughput": "6254.83", "total_tokens": 67993600} {"current_steps": 8310, "total_steps": 23217, "loss": 1.0006, "learning_rate": 3.579154618117946e-05, "epoch": 1.0737821423956584, "percentage": 35.79, "elapsed_time": "3:01:57", "remaining_time": "5:26:24", "throughput": "6235.43", "total_tokens": 68075520} {"current_steps": 8320, "total_steps": 23217, "loss": 0.4659, "learning_rate": 3.576102172981986e-05, "epoch": 1.0750742990050395, "percentage": 35.84, "elapsed_time": "3:02:44", "remaining_time": "5:27:11", "throughput": "6216.19", "total_tokens": 68157440} {"current_steps": 8330, "total_steps": 23217, "loss": 0.9332, "learning_rate": 3.5730477575068845e-05, "epoch": 1.0763664556144206, "percentage": 35.88, "elapsed_time": "3:03:31", "remaining_time": "5:27:59", "throughput": "6197.13", "total_tokens": 68239360} {"current_steps": 8340, "total_steps": 23217, "loss": 0.7617, "learning_rate": 3.5699913772852664e-05, "epoch": 1.0776586122238014, "percentage": 35.92, "elapsed_time": "3:04:18", "remaining_time": "5:28:46", "throughput": "6178.22", "total_tokens": 68321280} {"current_steps": 8350, "total_steps": 23217, "loss": 1.1367, "learning_rate": 3.566933037913351e-05, "epoch": 1.0789507688331825, "percentage": 35.97, "elapsed_time": "3:05:05", "remaining_time": "5:29:32", "throughput": "6159.47", "total_tokens": 68403200} {"current_steps": 8360, "total_steps": 23217, "loss": 0.6604, "learning_rate": 3.5638727449909473e-05, "epoch": 1.0802429254425636, "percentage": 36.01, "elapsed_time": "3:05:52", "remaining_time": "5:30:19", "throughput": "6140.87", "total_tokens": 68485120} {"current_steps": 8370, "total_steps": 23217, "loss": 1.0806, "learning_rate": 3.560810504121441e-05, "epoch": 1.0815350820519447, "percentage": 36.05, "elapsed_time": "3:06:39", "remaining_time": "5:31:05", "throughput": "6122.45", "total_tokens": 68567040} {"current_steps": 8380, "total_steps": 23217, "loss": 0.7424, "learning_rate": 3.5577463209117833e-05, "epoch": 1.0828272386613258, "percentage": 36.09, "elapsed_time": "3:07:26", "remaining_time": "5:31:51", "throughput": "6104.17", "total_tokens": 68648960} {"current_steps": 8390, "total_steps": 23217, "loss": 0.78, "learning_rate": 3.554680200972482e-05, "epoch": 1.0841193952707069, "percentage": 36.14, "elapsed_time": "3:08:13", "remaining_time": "5:32:37", "throughput": "6086.07", "total_tokens": 68730880} {"current_steps": 8400, "total_steps": 23217, "loss": 1.0331, "learning_rate": 3.551612149917593e-05, "epoch": 1.085411551880088, "percentage": 36.18, "elapsed_time": "3:09:00", "remaining_time": "5:33:23", "throughput": "6068.10", "total_tokens": 68812800} {"current_steps": 8410, "total_steps": 23217, "loss": 1.3448, "learning_rate": 3.548542173364705e-05, "epoch": 1.0867037084894688, "percentage": 36.22, "elapsed_time": "3:09:47", "remaining_time": "5:34:08", "throughput": "6050.28", "total_tokens": 68894720} {"current_steps": 8420, "total_steps": 23217, "loss": 0.9444, "learning_rate": 3.545470276934934e-05, "epoch": 1.08799586509885, "percentage": 36.27, "elapsed_time": "3:10:33", "remaining_time": "5:34:53", "throughput": "6032.60", "total_tokens": 68976640} {"current_steps": 8430, "total_steps": 23217, "loss": 0.6718, "learning_rate": 3.542396466252913e-05, "epoch": 1.089288021708231, "percentage": 36.31, "elapsed_time": "3:11:20", "remaining_time": "5:35:38", "throughput": "6015.04", "total_tokens": 69058560} {"current_steps": 8440, "total_steps": 23217, "loss": 0.8492, "learning_rate": 3.539320746946775e-05, "epoch": 1.0905801783176121, "percentage": 36.35, "elapsed_time": "3:12:07", "remaining_time": "5:36:23", "throughput": "5997.62", "total_tokens": 69140480} {"current_steps": 8450, "total_steps": 23217, "loss": 0.5818, "learning_rate": 3.5362431246481536e-05, "epoch": 1.0918723349269932, "percentage": 36.4, "elapsed_time": "3:12:55", "remaining_time": "5:37:08", "throughput": "5980.33", "total_tokens": 69222400} {"current_steps": 8460, "total_steps": 23217, "loss": 0.8846, "learning_rate": 3.533163604992163e-05, "epoch": 1.0931644915363743, "percentage": 36.44, "elapsed_time": "3:13:41", "remaining_time": "5:37:52", "throughput": "5963.21", "total_tokens": 69304320} {"current_steps": 8470, "total_steps": 23217, "loss": 0.8992, "learning_rate": 3.5300821936173926e-05, "epoch": 1.0944566481457552, "percentage": 36.48, "elapsed_time": "3:14:28", "remaining_time": "5:38:36", "throughput": "5946.21", "total_tokens": 69386240} {"current_steps": 8480, "total_steps": 23217, "loss": 0.9501, "learning_rate": 3.526998896165894e-05, "epoch": 1.0957488047551363, "percentage": 36.52, "elapsed_time": "3:15:15", "remaining_time": "5:39:20", "throughput": "5929.38", "total_tokens": 69468160} {"current_steps": 8490, "total_steps": 23217, "loss": 1.1183, "learning_rate": 3.523913718283175e-05, "epoch": 1.0970409613645173, "percentage": 36.57, "elapsed_time": "3:16:02", "remaining_time": "5:40:04", "throughput": "5912.66", "total_tokens": 69550080} {"current_steps": 8500, "total_steps": 23217, "loss": 0.9322, "learning_rate": 3.520826665618184e-05, "epoch": 1.0983331179738984, "percentage": 36.61, "elapsed_time": "3:16:49", "remaining_time": "5:40:47", "throughput": "5896.09", "total_tokens": 69632000} {"current_steps": 8510, "total_steps": 23217, "loss": 0.6564, "learning_rate": 3.5177377438233044e-05, "epoch": 1.0996252745832795, "percentage": 36.65, "elapsed_time": "3:17:36", "remaining_time": "5:41:30", "throughput": "5879.64", "total_tokens": 69713920} {"current_steps": 8520, "total_steps": 23217, "loss": 1.0945, "learning_rate": 3.514646958554339e-05, "epoch": 1.1009174311926606, "percentage": 36.7, "elapsed_time": "3:18:23", "remaining_time": "5:42:14", "throughput": "5863.32", "total_tokens": 69795840} {"current_steps": 8530, "total_steps": 23217, "loss": 0.8922, "learning_rate": 3.511554315470507e-05, "epoch": 1.1022095878020417, "percentage": 36.74, "elapsed_time": "3:19:10", "remaining_time": "5:42:56", "throughput": "5847.14", "total_tokens": 69877760} {"current_steps": 8540, "total_steps": 23217, "loss": 0.9603, "learning_rate": 3.508459820234423e-05, "epoch": 1.1035017444114226, "percentage": 36.78, "elapsed_time": "3:19:57", "remaining_time": "5:43:39", "throughput": "5831.08", "total_tokens": 69959680} {"current_steps": 8550, "total_steps": 23217, "loss": 0.8906, "learning_rate": 3.5053634785121e-05, "epoch": 1.1047939010208037, "percentage": 36.83, "elapsed_time": "3:20:44", "remaining_time": "5:44:21", "throughput": "5815.14", "total_tokens": 70041600} {"current_steps": 8560, "total_steps": 23217, "loss": 0.7746, "learning_rate": 3.5022652959729266e-05, "epoch": 1.1060860576301847, "percentage": 36.87, "elapsed_time": "3:21:31", "remaining_time": "5:45:04", "throughput": "5799.33", "total_tokens": 70123520} {"current_steps": 8570, "total_steps": 23217, "loss": 0.7997, "learning_rate": 3.499165278289663e-05, "epoch": 1.1073782142395658, "percentage": 36.91, "elapsed_time": "3:22:29", "remaining_time": "5:46:04", "throughput": "5778.57", "total_tokens": 70205440} {"current_steps": 8580, "total_steps": 23217, "loss": 0.7416, "learning_rate": 3.496063431138431e-05, "epoch": 1.108670370848947, "percentage": 36.96, "elapsed_time": "3:23:16", "remaining_time": "5:46:46", "throughput": "5763.03", "total_tokens": 70287360} {"current_steps": 8590, "total_steps": 23217, "loss": 0.7489, "learning_rate": 3.492959760198702e-05, "epoch": 1.109962527458328, "percentage": 37.0, "elapsed_time": "3:24:03", "remaining_time": "5:47:27", "throughput": "5747.65", "total_tokens": 70369280} {"current_steps": 8600, "total_steps": 23217, "loss": 0.8175, "learning_rate": 3.489854271153285e-05, "epoch": 1.111254684067709, "percentage": 37.04, "elapsed_time": "3:24:50", "remaining_time": "5:48:08", "throughput": "5732.34", "total_tokens": 70451200} {"current_steps": 8610, "total_steps": 23217, "loss": 0.6624, "learning_rate": 3.4867469696883204e-05, "epoch": 1.11254684067709, "percentage": 37.08, "elapsed_time": "3:25:37", "remaining_time": "5:48:49", "throughput": "5717.19", "total_tokens": 70533120} {"current_steps": 8620, "total_steps": 23217, "loss": 0.8943, "learning_rate": 3.483637861493264e-05, "epoch": 1.113838997286471, "percentage": 37.13, "elapsed_time": "3:26:24", "remaining_time": "5:49:31", "throughput": "5702.09", "total_tokens": 70615040} {"current_steps": 8630, "total_steps": 23217, "loss": 0.9308, "learning_rate": 3.480526952260884e-05, "epoch": 1.1151311538958522, "percentage": 37.17, "elapsed_time": "3:27:11", "remaining_time": "5:50:12", "throughput": "5687.04", "total_tokens": 70696960} {"current_steps": 8640, "total_steps": 23217, "loss": 0.6464, "learning_rate": 3.477414247687241e-05, "epoch": 1.1164233105052332, "percentage": 37.21, "elapsed_time": "3:27:58", "remaining_time": "5:50:52", "throughput": "5672.20", "total_tokens": 70778880} {"current_steps": 8650, "total_steps": 23217, "loss": 0.6793, "learning_rate": 3.4742997534716884e-05, "epoch": 1.1177154671146143, "percentage": 37.26, "elapsed_time": "3:28:45", "remaining_time": "5:51:33", "throughput": "5657.46", "total_tokens": 70860800} {"current_steps": 8660, "total_steps": 23217, "loss": 0.95, "learning_rate": 3.471183475316851e-05, "epoch": 1.1190076237239954, "percentage": 37.3, "elapsed_time": "3:29:32", "remaining_time": "5:52:13", "throughput": "5642.84", "total_tokens": 70942720} {"current_steps": 8670, "total_steps": 23217, "loss": 0.8991, "learning_rate": 3.468065418928625e-05, "epoch": 1.1202997803333763, "percentage": 37.34, "elapsed_time": "3:30:19", "remaining_time": "5:52:53", "throughput": "5628.33", "total_tokens": 71024640} {"current_steps": 8680, "total_steps": 23217, "loss": 1.0195, "learning_rate": 3.4649455900161596e-05, "epoch": 1.1215919369427574, "percentage": 37.39, "elapsed_time": "3:31:06", "remaining_time": "5:53:32", "throughput": "5613.93", "total_tokens": 71106560} {"current_steps": 8690, "total_steps": 23217, "loss": 1.0533, "learning_rate": 3.461823994291849e-05, "epoch": 1.1228840935521385, "percentage": 37.43, "elapsed_time": "3:31:53", "remaining_time": "5:54:12", "throughput": "5599.63", "total_tokens": 71188480} {"current_steps": 8700, "total_steps": 23217, "loss": 0.7323, "learning_rate": 3.458700637471325e-05, "epoch": 1.1241762501615196, "percentage": 37.47, "elapsed_time": "3:32:40", "remaining_time": "5:54:51", "throughput": "5585.45", "total_tokens": 71270400} {"current_steps": 8710, "total_steps": 23217, "loss": 0.4897, "learning_rate": 3.455575525273442e-05, "epoch": 1.1254684067709007, "percentage": 37.52, "elapsed_time": "3:33:27", "remaining_time": "5:55:30", "throughput": "5571.35", "total_tokens": 71352320} {"current_steps": 8720, "total_steps": 23217, "loss": 0.9862, "learning_rate": 3.4524486634202685e-05, "epoch": 1.1267605633802817, "percentage": 37.56, "elapsed_time": "3:34:13", "remaining_time": "5:56:09", "throughput": "5557.39", "total_tokens": 71434240} {"current_steps": 8730, "total_steps": 23217, "loss": 0.7261, "learning_rate": 3.4493200576370776e-05, "epoch": 1.1280527199896628, "percentage": 37.6, "elapsed_time": "3:35:00", "remaining_time": "5:56:48", "throughput": "5543.53", "total_tokens": 71516160} {"current_steps": 8740, "total_steps": 23217, "loss": 0.8157, "learning_rate": 3.4461897136523356e-05, "epoch": 1.1293448765990437, "percentage": 37.64, "elapsed_time": "3:35:47", "remaining_time": "5:57:26", "throughput": "5529.73", "total_tokens": 71598080} {"current_steps": 8750, "total_steps": 23217, "loss": 1.0178, "learning_rate": 3.44305763719769e-05, "epoch": 1.1306370332084248, "percentage": 37.69, "elapsed_time": "3:36:34", "remaining_time": "5:58:05", "throughput": "5516.04", "total_tokens": 71680000} {"current_steps": 8760, "total_steps": 23217, "loss": 0.9631, "learning_rate": 3.4399238340079607e-05, "epoch": 1.1319291898178059, "percentage": 37.73, "elapsed_time": "3:37:21", "remaining_time": "5:58:43", "throughput": "5502.44", "total_tokens": 71761920} {"current_steps": 8770, "total_steps": 23217, "loss": 0.7918, "learning_rate": 3.4367883098211316e-05, "epoch": 1.133221346427187, "percentage": 37.77, "elapsed_time": "3:38:08", "remaining_time": "5:59:21", "throughput": "5488.96", "total_tokens": 71843840} {"current_steps": 8780, "total_steps": 23217, "loss": 0.8197, "learning_rate": 3.4336510703783345e-05, "epoch": 1.134513503036568, "percentage": 37.82, "elapsed_time": "3:38:55", "remaining_time": "5:59:59", "throughput": "5475.56", "total_tokens": 71925760} {"current_steps": 8790, "total_steps": 23217, "loss": 0.6943, "learning_rate": 3.4305121214238446e-05, "epoch": 1.1358056596459492, "percentage": 37.86, "elapsed_time": "3:39:42", "remaining_time": "6:00:36", "throughput": "5462.28", "total_tokens": 72007680} {"current_steps": 8800, "total_steps": 23217, "loss": 0.9242, "learning_rate": 3.427371468705065e-05, "epoch": 1.1370978162553302, "percentage": 37.9, "elapsed_time": "3:40:29", "remaining_time": "6:01:14", "throughput": "5449.07", "total_tokens": 72089600} {"current_steps": 8810, "total_steps": 23217, "loss": 0.8938, "learning_rate": 3.42422911797252e-05, "epoch": 1.138389972864711, "percentage": 37.95, "elapsed_time": "3:41:16", "remaining_time": "6:01:51", "throughput": "5436.00", "total_tokens": 72171520} {"current_steps": 8820, "total_steps": 23217, "loss": 1.0008, "learning_rate": 3.4210850749798415e-05, "epoch": 1.1396821294740922, "percentage": 37.99, "elapsed_time": "3:42:03", "remaining_time": "6:02:28", "throughput": "5422.98", "total_tokens": 72253440} {"current_steps": 8830, "total_steps": 23217, "loss": 0.6786, "learning_rate": 3.417939345483762e-05, "epoch": 1.1409742860834733, "percentage": 38.03, "elapsed_time": "3:42:50", "remaining_time": "6:03:05", "throughput": "5410.03", "total_tokens": 72335360} {"current_steps": 8840, "total_steps": 23217, "loss": 0.9551, "learning_rate": 3.4147919352440995e-05, "epoch": 1.1422664426928544, "percentage": 38.08, "elapsed_time": "3:43:37", "remaining_time": "6:03:41", "throughput": "5397.18", "total_tokens": 72417280} {"current_steps": 8850, "total_steps": 23217, "loss": 0.7622, "learning_rate": 3.411642850023751e-05, "epoch": 1.1435585993022355, "percentage": 38.12, "elapsed_time": "3:44:24", "remaining_time": "6:04:18", "throughput": "5384.44", "total_tokens": 72499200} {"current_steps": 8860, "total_steps": 23217, "loss": 0.5537, "learning_rate": 3.40849209558868e-05, "epoch": 1.1448507559116166, "percentage": 38.16, "elapsed_time": "3:45:11", "remaining_time": "6:04:54", "throughput": "5371.79", "total_tokens": 72581120} {"current_steps": 8870, "total_steps": 23217, "loss": 0.6828, "learning_rate": 3.405339677707906e-05, "epoch": 1.1461429125209976, "percentage": 38.2, "elapsed_time": "3:45:58", "remaining_time": "6:05:30", "throughput": "5359.20", "total_tokens": 72663040} {"current_steps": 8880, "total_steps": 23217, "loss": 0.8754, "learning_rate": 3.402185602153495e-05, "epoch": 1.1474350691303785, "percentage": 38.25, "elapsed_time": "3:46:45", "remaining_time": "6:06:06", "throughput": "5346.73", "total_tokens": 72744960} {"current_steps": 8890, "total_steps": 23217, "loss": 1.1836, "learning_rate": 3.3990298747005485e-05, "epoch": 1.1487272257397596, "percentage": 38.29, "elapsed_time": "3:47:32", "remaining_time": "6:06:42", "throughput": "5334.31", "total_tokens": 72826880} {"current_steps": 8900, "total_steps": 23217, "loss": 0.9686, "learning_rate": 3.395872501127191e-05, "epoch": 1.1500193823491407, "percentage": 38.33, "elapsed_time": "3:48:19", "remaining_time": "6:07:17", "throughput": "5322.01", "total_tokens": 72908800} {"current_steps": 8910, "total_steps": 23217, "loss": 0.9425, "learning_rate": 3.392713487214561e-05, "epoch": 1.1513115389585218, "percentage": 38.38, "elapsed_time": "3:49:06", "remaining_time": "6:07:53", "throughput": "5309.79", "total_tokens": 72990720} {"current_steps": 8920, "total_steps": 23217, "loss": 0.6426, "learning_rate": 3.389552838746804e-05, "epoch": 1.1526036955679029, "percentage": 38.42, "elapsed_time": "3:49:53", "remaining_time": "6:08:28", "throughput": "5297.65", "total_tokens": 73072640} {"current_steps": 8930, "total_steps": 23217, "loss": 0.9311, "learning_rate": 3.386390561511055e-05, "epoch": 1.153895852177284, "percentage": 38.46, "elapsed_time": "3:50:40", "remaining_time": "6:09:03", "throughput": "5285.59", "total_tokens": 73154560} {"current_steps": 8940, "total_steps": 23217, "loss": 0.94, "learning_rate": 3.38322666129743e-05, "epoch": 1.155188008786665, "percentage": 38.51, "elapsed_time": "3:51:27", "remaining_time": "6:09:37", "throughput": "5273.61", "total_tokens": 73236480} {"current_steps": 8950, "total_steps": 23217, "loss": 0.8698, "learning_rate": 3.380061143899021e-05, "epoch": 1.156480165396046, "percentage": 38.55, "elapsed_time": "3:52:14", "remaining_time": "6:10:12", "throughput": "5261.70", "total_tokens": 73318400} {"current_steps": 8960, "total_steps": 23217, "loss": 1.0229, "learning_rate": 3.376894015111876e-05, "epoch": 1.157772322005427, "percentage": 38.59, "elapsed_time": "3:53:01", "remaining_time": "6:10:46", "throughput": "5249.89", "total_tokens": 73400320} {"current_steps": 8970, "total_steps": 23217, "loss": 0.7057, "learning_rate": 3.373725280735e-05, "epoch": 1.159064478614808, "percentage": 38.64, "elapsed_time": "3:53:48", "remaining_time": "6:11:21", "throughput": "5238.15", "total_tokens": 73482240} {"current_steps": 8980, "total_steps": 23217, "loss": 0.8812, "learning_rate": 3.3705549465703314e-05, "epoch": 1.1603566352241892, "percentage": 38.68, "elapsed_time": "3:54:35", "remaining_time": "6:11:55", "throughput": "5226.48", "total_tokens": 73564160} {"current_steps": 8990, "total_steps": 23217, "loss": 0.9767, "learning_rate": 3.3673830184227414e-05, "epoch": 1.1616487918335703, "percentage": 38.72, "elapsed_time": "3:55:23", "remaining_time": "6:12:31", "throughput": "5214.40", "total_tokens": 73646080} {"current_steps": 9000, "total_steps": 23217, "loss": 1.0073, "learning_rate": 3.3642095021000184e-05, "epoch": 1.1629409484429514, "percentage": 38.76, "elapsed_time": "3:56:20", "remaining_time": "6:13:20", "throughput": "5199.36", "total_tokens": 73728000} {"current_steps": 9010, "total_steps": 23217, "loss": 0.5677, "learning_rate": 3.36103440341286e-05, "epoch": 1.1642331050523325, "percentage": 38.81, "elapsed_time": "3:57:25", "remaining_time": "6:14:22", "throughput": "5181.18", "total_tokens": 73809920} {"current_steps": 9020, "total_steps": 23217, "loss": 0.5504, "learning_rate": 3.35785772817486e-05, "epoch": 1.1655252616617133, "percentage": 38.85, "elapsed_time": "3:58:14", "remaining_time": "6:14:59", "throughput": "5169.16", "total_tokens": 73891840} {"current_steps": 9030, "total_steps": 23217, "loss": 0.949, "learning_rate": 3.3546794822024976e-05, "epoch": 1.1668174182710944, "percentage": 38.89, "elapsed_time": "3:59:02", "remaining_time": "6:15:33", "throughput": "5157.73", "total_tokens": 73973760} {"current_steps": 9040, "total_steps": 23217, "loss": 0.9297, "learning_rate": 3.351499671315131e-05, "epoch": 1.1681095748804755, "percentage": 38.94, "elapsed_time": "3:59:50", "remaining_time": "6:16:08", "throughput": "5146.04", "total_tokens": 74055680} {"current_steps": 9050, "total_steps": 23217, "loss": 0.993, "learning_rate": 3.348318301334983e-05, "epoch": 1.1694017314898566, "percentage": 38.98, "elapsed_time": "4:00:38", "remaining_time": "6:16:42", "throughput": "5134.59", "total_tokens": 74137600} {"current_steps": 9060, "total_steps": 23217, "loss": 0.6176, "learning_rate": 3.3451353780871286e-05, "epoch": 1.1706938880992377, "percentage": 39.02, "elapsed_time": "4:01:28", "remaining_time": "6:17:19", "throughput": "5122.69", "total_tokens": 74219520} {"current_steps": 9070, "total_steps": 23217, "loss": 0.5138, "learning_rate": 3.341950907399489e-05, "epoch": 1.1719860447086188, "percentage": 39.07, "elapsed_time": "4:02:15", "remaining_time": "6:17:52", "throughput": "5111.57", "total_tokens": 74301440} {"current_steps": 9080, "total_steps": 23217, "loss": 0.7563, "learning_rate": 3.338764895102821e-05, "epoch": 1.1732782013179996, "percentage": 39.11, "elapsed_time": "4:03:03", "remaining_time": "6:18:25", "throughput": "5100.49", "total_tokens": 74383360} {"current_steps": 9090, "total_steps": 23217, "loss": 1.3017, "learning_rate": 3.335577347030697e-05, "epoch": 1.1745703579273807, "percentage": 39.15, "elapsed_time": "4:03:51", "remaining_time": "6:18:59", "throughput": "5089.40", "total_tokens": 74465280} {"current_steps": 9100, "total_steps": 23217, "loss": 1.1248, "learning_rate": 3.33238826901951e-05, "epoch": 1.1758625145367618, "percentage": 39.2, "elapsed_time": "4:04:39", "remaining_time": "6:19:31", "throughput": "5078.49", "total_tokens": 74547200} {"current_steps": 9110, "total_steps": 23217, "loss": 0.6756, "learning_rate": 3.329197666908447e-05, "epoch": 1.177154671146143, "percentage": 39.24, "elapsed_time": "4:05:26", "remaining_time": "6:20:04", "throughput": "5067.72", "total_tokens": 74629120} {"current_steps": 9120, "total_steps": 23217, "loss": 0.9454, "learning_rate": 3.32600554653949e-05, "epoch": 1.178446827755524, "percentage": 39.28, "elapsed_time": "4:06:13", "remaining_time": "6:20:36", "throughput": "5056.97", "total_tokens": 74711040} {"current_steps": 9130, "total_steps": 23217, "loss": 0.863, "learning_rate": 3.322811913757401e-05, "epoch": 1.179738984364905, "percentage": 39.32, "elapsed_time": "4:07:01", "remaining_time": "6:21:08", "throughput": "5046.26", "total_tokens": 74792960} {"current_steps": 9140, "total_steps": 23217, "loss": 0.8522, "learning_rate": 3.319616774409709e-05, "epoch": 1.181031140974286, "percentage": 39.37, "elapsed_time": "4:07:48", "remaining_time": "6:21:40", "throughput": "5035.66", "total_tokens": 74874880} {"current_steps": 9150, "total_steps": 23217, "loss": 0.8277, "learning_rate": 3.316420134346701e-05, "epoch": 1.182323297583667, "percentage": 39.41, "elapsed_time": "4:08:36", "remaining_time": "6:22:12", "throughput": "5025.07", "total_tokens": 74956800} {"current_steps": 9160, "total_steps": 23217, "loss": 0.8846, "learning_rate": 3.313221999421415e-05, "epoch": 1.1836154541930481, "percentage": 39.45, "elapsed_time": "4:09:24", "remaining_time": "6:22:44", "throughput": "5014.52", "total_tokens": 75038720} {"current_steps": 9170, "total_steps": 23217, "loss": 0.6351, "learning_rate": 3.310022375489623e-05, "epoch": 1.1849076108024292, "percentage": 39.5, "elapsed_time": "4:10:11", "remaining_time": "6:23:15", "throughput": "5004.20", "total_tokens": 75120640} {"current_steps": 9180, "total_steps": 23217, "loss": 1.023, "learning_rate": 3.306821268409827e-05, "epoch": 1.1861997674118103, "percentage": 39.54, "elapsed_time": "4:10:59", "remaining_time": "6:23:46", "throughput": "4993.84", "total_tokens": 75202560} {"current_steps": 9190, "total_steps": 23217, "loss": 1.0803, "learning_rate": 3.30361868404324e-05, "epoch": 1.1874919240211914, "percentage": 39.58, "elapsed_time": "4:11:46", "remaining_time": "6:24:17", "throughput": "4983.52", "total_tokens": 75284480} {"current_steps": 9200, "total_steps": 23217, "loss": 0.7852, "learning_rate": 3.300414628253783e-05, "epoch": 1.1887840806305725, "percentage": 39.63, "elapsed_time": "4:12:34", "remaining_time": "6:24:48", "throughput": "4973.29", "total_tokens": 75366400} {"current_steps": 9210, "total_steps": 23217, "loss": 0.8063, "learning_rate": 3.297209106908072e-05, "epoch": 1.1900762372399534, "percentage": 39.67, "elapsed_time": "4:13:21", "remaining_time": "6:25:19", "throughput": "4963.10", "total_tokens": 75448320} {"current_steps": 9220, "total_steps": 23217, "loss": 0.6504, "learning_rate": 3.294002125875402e-05, "epoch": 1.1913683938493345, "percentage": 39.71, "elapsed_time": "4:14:09", "remaining_time": "6:25:50", "throughput": "4953.01", "total_tokens": 75530240} {"current_steps": 9230, "total_steps": 23217, "loss": 0.7654, "learning_rate": 3.290793691027746e-05, "epoch": 1.1926605504587156, "percentage": 39.76, "elapsed_time": "4:14:56", "remaining_time": "6:26:20", "throughput": "4942.99", "total_tokens": 75612160} {"current_steps": 9240, "total_steps": 23217, "loss": 0.7852, "learning_rate": 3.287583808239735e-05, "epoch": 1.1939527070680966, "percentage": 39.8, "elapsed_time": "4:15:44", "remaining_time": "6:26:51", "throughput": "4932.91", "total_tokens": 75694080} {"current_steps": 9250, "total_steps": 23217, "loss": 0.5354, "learning_rate": 3.284372483388652e-05, "epoch": 1.1952448636774777, "percentage": 39.84, "elapsed_time": "4:16:32", "remaining_time": "6:27:21", "throughput": "4922.94", "total_tokens": 75776000} {"current_steps": 9260, "total_steps": 23217, "loss": 0.8227, "learning_rate": 3.2811597223544234e-05, "epoch": 1.1965370202868588, "percentage": 39.88, "elapsed_time": "4:17:27", "remaining_time": "6:28:02", "throughput": "4910.82", "total_tokens": 75857920} {"current_steps": 9270, "total_steps": 23217, "loss": 0.9902, "learning_rate": 3.277945531019601e-05, "epoch": 1.19782917689624, "percentage": 39.93, "elapsed_time": "4:18:26", "remaining_time": "6:28:50", "throughput": "4897.20", "total_tokens": 75939840} {"current_steps": 9280, "total_steps": 23217, "loss": 0.6786, "learning_rate": 3.274729915269358e-05, "epoch": 1.1991213335056208, "percentage": 39.97, "elapsed_time": "4:19:19", "remaining_time": "6:29:27", "throughput": "4885.93", "total_tokens": 76021760} {"current_steps": 9290, "total_steps": 23217, "loss": 0.7933, "learning_rate": 3.271512880991476e-05, "epoch": 1.2004134901150019, "percentage": 40.01, "elapsed_time": "4:20:07", "remaining_time": "6:29:57", "throughput": "4876.15", "total_tokens": 76103680} {"current_steps": 9300, "total_steps": 23217, "loss": 0.8867, "learning_rate": 3.268294434076332e-05, "epoch": 1.201705646724383, "percentage": 40.06, "elapsed_time": "4:20:56", "remaining_time": "6:30:28", "throughput": "4866.13", "total_tokens": 76185600} {"current_steps": 9310, "total_steps": 23217, "loss": 0.9081, "learning_rate": 3.26507458041689e-05, "epoch": 1.202997803333764, "percentage": 40.1, "elapsed_time": "4:21:49", "remaining_time": "6:31:06", "throughput": "4854.83", "total_tokens": 76267520} {"current_steps": 9320, "total_steps": 23217, "loss": 1.1582, "learning_rate": 3.261853325908691e-05, "epoch": 1.2042899599431451, "percentage": 40.14, "elapsed_time": "4:22:42", "remaining_time": "6:31:42", "throughput": "4843.84", "total_tokens": 76349440} {"current_steps": 9330, "total_steps": 23217, "loss": 1.1172, "learning_rate": 3.2586306764498395e-05, "epoch": 1.2055821165525262, "percentage": 40.19, "elapsed_time": "4:23:37", "remaining_time": "6:32:23", "throughput": "4831.93", "total_tokens": 76431360} {"current_steps": 9340, "total_steps": 23217, "loss": 0.8069, "learning_rate": 3.255406637940996e-05, "epoch": 1.2068742731619073, "percentage": 40.23, "elapsed_time": "4:24:25", "remaining_time": "6:32:52", "throughput": "4822.62", "total_tokens": 76513280} {"current_steps": 9350, "total_steps": 23217, "loss": 1.0322, "learning_rate": 3.252181216285363e-05, "epoch": 1.2081664297712882, "percentage": 40.27, "elapsed_time": "4:25:13", "remaining_time": "6:33:21", "throughput": "4813.12", "total_tokens": 76595200} {"current_steps": 9360, "total_steps": 23217, "loss": 1.1227, "learning_rate": 3.2489544173886745e-05, "epoch": 1.2094585863806693, "percentage": 40.32, "elapsed_time": "4:26:02", "remaining_time": "6:33:52", "throughput": "4803.50", "total_tokens": 76677120} {"current_steps": 9370, "total_steps": 23217, "loss": 0.9295, "learning_rate": 3.245726247159189e-05, "epoch": 1.2107507429900504, "percentage": 40.36, "elapsed_time": "4:26:50", "remaining_time": "6:34:20", "throughput": "4794.36", "total_tokens": 76759040} {"current_steps": 9380, "total_steps": 23217, "loss": 1.0272, "learning_rate": 3.242496711507673e-05, "epoch": 1.2120428995994315, "percentage": 40.4, "elapsed_time": "4:27:38", "remaining_time": "6:34:48", "throughput": "4785.12", "total_tokens": 76840960} {"current_steps": 9390, "total_steps": 23217, "loss": 0.9163, "learning_rate": 3.239265816347397e-05, "epoch": 1.2133350562088125, "percentage": 40.44, "elapsed_time": "4:28:26", "remaining_time": "6:35:17", "throughput": "4775.75", "total_tokens": 76922880} {"current_steps": 9400, "total_steps": 23217, "loss": 0.8623, "learning_rate": 3.236033567594115e-05, "epoch": 1.2146272128181936, "percentage": 40.49, "elapsed_time": "4:29:15", "remaining_time": "6:35:46", "throughput": "4766.53", "total_tokens": 77004800} {"current_steps": 9410, "total_steps": 23217, "loss": 0.9241, "learning_rate": 3.232799971166064e-05, "epoch": 1.2159193694275747, "percentage": 40.53, "elapsed_time": "4:30:10", "remaining_time": "6:36:25", "throughput": "4755.30", "total_tokens": 77086720} {"current_steps": 9420, "total_steps": 23217, "loss": 0.75, "learning_rate": 3.2295650329839474e-05, "epoch": 1.2172115260369556, "percentage": 40.57, "elapsed_time": "4:31:09", "remaining_time": "6:37:09", "throughput": "4743.09", "total_tokens": 77168640} {"current_steps": 9430, "total_steps": 23217, "loss": 0.6456, "learning_rate": 3.2263287589709255e-05, "epoch": 1.2185036826463367, "percentage": 40.62, "elapsed_time": "4:32:12", "remaining_time": "6:37:58", "throughput": "4729.99", "total_tokens": 77250560} {"current_steps": 9440, "total_steps": 23217, "loss": 0.8976, "learning_rate": 3.2230911550526035e-05, "epoch": 1.2197958392557178, "percentage": 40.66, "elapsed_time": "4:33:03", "remaining_time": "6:38:30", "throughput": "4720.13", "total_tokens": 77332480} {"current_steps": 9450, "total_steps": 23217, "loss": 0.9984, "learning_rate": 3.219852227157022e-05, "epoch": 1.2210879958650989, "percentage": 40.7, "elapsed_time": "4:33:52", "remaining_time": "6:38:59", "throughput": "4711.03", "total_tokens": 77414400} {"current_steps": 9460, "total_steps": 23217, "loss": 1.0182, "learning_rate": 3.216611981214648e-05, "epoch": 1.22238015247448, "percentage": 40.75, "elapsed_time": "4:34:41", "remaining_time": "6:39:28", "throughput": "4701.89", "total_tokens": 77496320} {"current_steps": 9470, "total_steps": 23217, "loss": 0.6102, "learning_rate": 3.2133704231583576e-05, "epoch": 1.223672309083861, "percentage": 40.79, "elapsed_time": "4:35:35", "remaining_time": "6:40:03", "throughput": "4691.57", "total_tokens": 77578240} {"current_steps": 9480, "total_steps": 23217, "loss": 0.868, "learning_rate": 3.210127558923434e-05, "epoch": 1.2249644656932421, "percentage": 40.83, "elapsed_time": "4:36:29", "remaining_time": "6:40:39", "throughput": "4681.26", "total_tokens": 77660160} {"current_steps": 9490, "total_steps": 23217, "loss": 0.9574, "learning_rate": 3.206883394447547e-05, "epoch": 1.226256622302623, "percentage": 40.88, "elapsed_time": "4:37:19", "remaining_time": "6:41:09", "throughput": "4672.04", "total_tokens": 77742080} {"current_steps": 9500, "total_steps": 23217, "loss": 0.852, "learning_rate": 3.203637935670752e-05, "epoch": 1.227548778912004, "percentage": 40.92, "elapsed_time": "4:38:11", "remaining_time": "6:41:40", "throughput": "4662.51", "total_tokens": 77824000} {"current_steps": 9510, "total_steps": 23217, "loss": 0.7199, "learning_rate": 3.200391188535472e-05, "epoch": 1.2288409355213852, "percentage": 40.96, "elapsed_time": "4:39:12", "remaining_time": "6:42:25", "throughput": "4650.39", "total_tokens": 77905920} {"current_steps": 9520, "total_steps": 23217, "loss": 0.7419, "learning_rate": 3.197143158986489e-05, "epoch": 1.2301330921307663, "percentage": 41.0, "elapsed_time": "4:40:09", "remaining_time": "6:43:05", "throughput": "4639.41", "total_tokens": 77987840} {"current_steps": 9530, "total_steps": 23217, "loss": 0.7953, "learning_rate": 3.193893852970932e-05, "epoch": 1.2314252487401474, "percentage": 41.05, "elapsed_time": "4:41:06", "remaining_time": "6:43:43", "throughput": "4628.65", "total_tokens": 78069760} {"current_steps": 9540, "total_steps": 23217, "loss": 0.8027, "learning_rate": 3.1906432764382695e-05, "epoch": 1.2327174053495285, "percentage": 41.09, "elapsed_time": "4:41:55", "remaining_time": "6:44:10", "throughput": "4620.22", "total_tokens": 78151680} {"current_steps": 9550, "total_steps": 23217, "loss": 0.7832, "learning_rate": 3.187391435340295e-05, "epoch": 1.2340095619589095, "percentage": 41.13, "elapsed_time": "4:42:42", "remaining_time": "6:44:35", "throughput": "4612.11", "total_tokens": 78233600} {"current_steps": 9560, "total_steps": 23217, "loss": 0.7582, "learning_rate": 3.184138335631118e-05, "epoch": 1.2353017185682904, "percentage": 41.18, "elapsed_time": "4:43:30", "remaining_time": "6:45:00", "throughput": "4604.04", "total_tokens": 78315520} {"current_steps": 9570, "total_steps": 23217, "loss": 1.1442, "learning_rate": 3.1808839832671523e-05, "epoch": 1.2365938751776715, "percentage": 41.22, "elapsed_time": "4:44:17", "remaining_time": "6:45:24", "throughput": "4595.95", "total_tokens": 78397440} {"current_steps": 9580, "total_steps": 23217, "loss": 0.9673, "learning_rate": 3.1776283842071045e-05, "epoch": 1.2378860317870526, "percentage": 41.26, "elapsed_time": "4:45:06", "remaining_time": "6:45:50", "throughput": "4587.81", "total_tokens": 78479360} {"current_steps": 9590, "total_steps": 23217, "loss": 0.8106, "learning_rate": 3.174371544411964e-05, "epoch": 1.2391781883964337, "percentage": 41.31, "elapsed_time": "4:45:54", "remaining_time": "6:46:15", "throughput": "4579.65", "total_tokens": 78561280} {"current_steps": 9600, "total_steps": 23217, "loss": 0.9658, "learning_rate": 3.1711134698449946e-05, "epoch": 1.2404703450058148, "percentage": 41.35, "elapsed_time": "4:46:42", "remaining_time": "6:46:40", "throughput": "4571.69", "total_tokens": 78643200} {"current_steps": 9610, "total_steps": 23217, "loss": 0.9531, "learning_rate": 3.167854166471717e-05, "epoch": 1.2417625016151959, "percentage": 41.39, "elapsed_time": "4:47:30", "remaining_time": "6:47:05", "throughput": "4563.56", "total_tokens": 78725120} {"current_steps": 9620, "total_steps": 23217, "loss": 0.8195, "learning_rate": 3.164593640259904e-05, "epoch": 1.2430546582245767, "percentage": 41.44, "elapsed_time": "4:48:19", "remaining_time": "6:47:31", "throughput": "4555.44", "total_tokens": 78807040} {"current_steps": 9630, "total_steps": 23217, "loss": 0.9972, "learning_rate": 3.161331897179568e-05, "epoch": 1.2443468148339578, "percentage": 41.48, "elapsed_time": "4:49:07", "remaining_time": "6:47:55", "throughput": "4547.57", "total_tokens": 78888960} {"current_steps": 9640, "total_steps": 23217, "loss": 0.5308, "learning_rate": 3.1580689432029484e-05, "epoch": 1.245638971443339, "percentage": 41.52, "elapsed_time": "4:49:54", "remaining_time": "6:48:19", "throughput": "4539.87", "total_tokens": 78970880} {"current_steps": 9650, "total_steps": 23217, "loss": 1.0639, "learning_rate": 3.154804784304502e-05, "epoch": 1.24693112805272, "percentage": 41.56, "elapsed_time": "4:50:42", "remaining_time": "6:48:42", "throughput": "4532.14", "total_tokens": 79052800} {"current_steps": 9660, "total_steps": 23217, "loss": 1.2022, "learning_rate": 3.151539426460892e-05, "epoch": 1.248223284662101, "percentage": 41.61, "elapsed_time": "4:51:30", "remaining_time": "6:49:06", "throughput": "4524.42", "total_tokens": 79134720} {"current_steps": 9670, "total_steps": 23217, "loss": 0.8717, "learning_rate": 3.148272875650976e-05, "epoch": 1.2495154412714822, "percentage": 41.65, "elapsed_time": "4:52:19", "remaining_time": "6:49:31", "throughput": "4516.56", "total_tokens": 79216640} {"current_steps": 9680, "total_steps": 23217, "loss": 0.9134, "learning_rate": 3.145005137855796e-05, "epoch": 1.250807597880863, "percentage": 41.69, "elapsed_time": "4:53:07", "remaining_time": "6:49:55", "throughput": "4508.82", "total_tokens": 79298560} {"current_steps": 9690, "total_steps": 23217, "loss": 0.671, "learning_rate": 3.14173621905857e-05, "epoch": 1.2520997544902444, "percentage": 41.74, "elapsed_time": "4:53:55", "remaining_time": "6:50:18", "throughput": "4501.27", "total_tokens": 79380480} {"current_steps": 9700, "total_steps": 23217, "loss": 1.0354, "learning_rate": 3.138466125244674e-05, "epoch": 1.2533919110996252, "percentage": 41.78, "elapsed_time": "4:54:44", "remaining_time": "6:50:43", "throughput": "4493.32", "total_tokens": 79462400} {"current_steps": 9710, "total_steps": 23217, "loss": 1.3345, "learning_rate": 3.13519486240164e-05, "epoch": 1.2546840677090063, "percentage": 41.82, "elapsed_time": "4:55:31", "remaining_time": "6:51:05", "throughput": "4485.95", "total_tokens": 79544320} {"current_steps": 9720, "total_steps": 23217, "loss": 0.7637, "learning_rate": 3.1319224365191366e-05, "epoch": 1.2559762243183874, "percentage": 41.87, "elapsed_time": "4:56:20", "remaining_time": "6:51:29", "throughput": "4478.31", "total_tokens": 79626240} {"current_steps": 9730, "total_steps": 23217, "loss": 0.5803, "learning_rate": 3.128648853588965e-05, "epoch": 1.2572683809277685, "percentage": 41.91, "elapsed_time": "4:57:12", "remaining_time": "6:51:57", "throughput": "4469.93", "total_tokens": 79708160} {"current_steps": 9740, "total_steps": 23217, "loss": 0.4912, "learning_rate": 3.1253741196050425e-05, "epoch": 1.2585605375371496, "percentage": 41.95, "elapsed_time": "4:58:00", "remaining_time": "6:52:20", "throughput": "4462.51", "total_tokens": 79790080} {"current_steps": 9750, "total_steps": 23217, "loss": 0.7291, "learning_rate": 3.122098240563396e-05, "epoch": 1.2598526941465304, "percentage": 42.0, "elapsed_time": "4:58:49", "remaining_time": "6:52:44", "throughput": "4454.88", "total_tokens": 79872000} {"current_steps": 9760, "total_steps": 23217, "loss": 1.0072, "learning_rate": 3.118821222462147e-05, "epoch": 1.2611448507559115, "percentage": 42.04, "elapsed_time": "4:59:38", "remaining_time": "6:53:08", "throughput": "4447.25", "total_tokens": 79953920} {"current_steps": 9770, "total_steps": 23217, "loss": 0.8663, "learning_rate": 3.1155430713015034e-05, "epoch": 1.2624370073652926, "percentage": 42.08, "elapsed_time": "5:00:26", "remaining_time": "6:53:31", "throughput": "4439.83", "total_tokens": 80035840} {"current_steps": 9780, "total_steps": 23217, "loss": 0.8375, "learning_rate": 3.1122637930837486e-05, "epoch": 1.2637291639746737, "percentage": 42.12, "elapsed_time": "5:01:16", "remaining_time": "6:53:55", "throughput": "4432.22", "total_tokens": 80117760} {"current_steps": 9790, "total_steps": 23217, "loss": 0.7423, "learning_rate": 3.10898339381323e-05, "epoch": 1.2650213205840548, "percentage": 42.17, "elapsed_time": "5:02:05", "remaining_time": "6:54:19", "throughput": "4424.66", "total_tokens": 80199680} {"current_steps": 9800, "total_steps": 23217, "loss": 1.3639, "learning_rate": 3.1057018794963454e-05, "epoch": 1.266313477193436, "percentage": 42.21, "elapsed_time": "5:02:54", "remaining_time": "6:54:42", "throughput": "4417.22", "total_tokens": 80281600} {"current_steps": 9810, "total_steps": 23217, "loss": 0.7074, "learning_rate": 3.102419256141536e-05, "epoch": 1.267605633802817, "percentage": 42.25, "elapsed_time": "5:03:43", "remaining_time": "6:55:05", "throughput": "4409.79", "total_tokens": 80363520} {"current_steps": 9820, "total_steps": 23217, "loss": 1.1645, "learning_rate": 3.0991355297592734e-05, "epoch": 1.2688977904121979, "percentage": 42.3, "elapsed_time": "5:04:31", "remaining_time": "6:55:27", "throughput": "4402.69", "total_tokens": 80445440} {"current_steps": 9830, "total_steps": 23217, "loss": 0.699, "learning_rate": 3.095850706362047e-05, "epoch": 1.270189947021579, "percentage": 42.34, "elapsed_time": "5:05:21", "remaining_time": "6:55:50", "throughput": "4395.34", "total_tokens": 80527360} {"current_steps": 9840, "total_steps": 23217, "loss": 1.1145, "learning_rate": 3.092564791964358e-05, "epoch": 1.27148210363096, "percentage": 42.38, "elapsed_time": "5:06:10", "remaining_time": "6:56:13", "throughput": "4388.02", "total_tokens": 80609280} {"current_steps": 9850, "total_steps": 23217, "loss": 0.9243, "learning_rate": 3.089277792582704e-05, "epoch": 1.2727742602403411, "percentage": 42.43, "elapsed_time": "5:06:58", "remaining_time": "6:56:34", "throughput": "4380.98", "total_tokens": 80691200} {"current_steps": 9860, "total_steps": 23217, "loss": 0.8664, "learning_rate": 3.085989714235568e-05, "epoch": 1.2740664168497222, "percentage": 42.47, "elapsed_time": "5:07:47", "remaining_time": "6:56:56", "throughput": "4373.86", "total_tokens": 80773120} {"current_steps": 9870, "total_steps": 23217, "loss": 0.8113, "learning_rate": 3.082700562943409e-05, "epoch": 1.2753585734591033, "percentage": 42.51, "elapsed_time": "5:08:36", "remaining_time": "6:57:19", "throughput": "4366.61", "total_tokens": 80855040} {"current_steps": 9880, "total_steps": 23217, "loss": 1.0342, "learning_rate": 3.079410344728652e-05, "epoch": 1.2766507300684844, "percentage": 42.56, "elapsed_time": "5:09:27", "remaining_time": "6:57:43", "throughput": "4359.13", "total_tokens": 80936960} {"current_steps": 9890, "total_steps": 23217, "loss": 0.8064, "learning_rate": 3.076119065615674e-05, "epoch": 1.2779428866778653, "percentage": 42.6, "elapsed_time": "5:10:15", "remaining_time": "6:58:04", "throughput": "4352.21", "total_tokens": 81018880} {"current_steps": 9900, "total_steps": 23217, "loss": 0.7267, "learning_rate": 3.0728267316307945e-05, "epoch": 1.2792350432872464, "percentage": 42.64, "elapsed_time": "5:11:04", "remaining_time": "6:58:26", "throughput": "4345.15", "total_tokens": 81100800} {"current_steps": 9910, "total_steps": 23217, "loss": 0.6364, "learning_rate": 3.069533348802266e-05, "epoch": 1.2805271998966274, "percentage": 42.68, "elapsed_time": "5:11:58", "remaining_time": "6:58:55", "throughput": "4336.97", "total_tokens": 81182720} {"current_steps": 9920, "total_steps": 23217, "loss": 0.7681, "learning_rate": 3.0662389231602595e-05, "epoch": 1.2818193565060085, "percentage": 42.73, "elapsed_time": "5:12:46", "remaining_time": "6:59:15", "throughput": "4330.21", "total_tokens": 81264640} {"current_steps": 9930, "total_steps": 23217, "loss": 0.6366, "learning_rate": 3.062943460736857e-05, "epoch": 1.2831115131153896, "percentage": 42.77, "elapsed_time": "5:13:34", "remaining_time": "6:59:35", "throughput": "4323.60", "total_tokens": 81346560} {"current_steps": 9940, "total_steps": 23217, "loss": 0.8101, "learning_rate": 3.059646967566038e-05, "epoch": 1.2844036697247707, "percentage": 42.81, "elapsed_time": "5:14:22", "remaining_time": "6:59:54", "throughput": "4317.00", "total_tokens": 81428480} {"current_steps": 9950, "total_steps": 23217, "loss": 0.5936, "learning_rate": 3.0563494496836686e-05, "epoch": 1.2856958263341518, "percentage": 42.86, "elapsed_time": "5:15:10", "remaining_time": "7:00:14", "throughput": "4310.43", "total_tokens": 81510400} {"current_steps": 9960, "total_steps": 23217, "loss": 0.8716, "learning_rate": 3.0530509131274935e-05, "epoch": 1.2869879829435327, "percentage": 42.9, "elapsed_time": "5:15:58", "remaining_time": "7:00:34", "throughput": "4303.69", "total_tokens": 81592320} {"current_steps": 9970, "total_steps": 23217, "loss": 0.7882, "learning_rate": 3.0497513639371195e-05, "epoch": 1.2882801395529138, "percentage": 42.94, "elapsed_time": "5:16:46", "remaining_time": "7:00:54", "throughput": "4297.11", "total_tokens": 81674240} {"current_steps": 9980, "total_steps": 23217, "loss": 0.8302, "learning_rate": 3.04645080815401e-05, "epoch": 1.2895722961622949, "percentage": 42.99, "elapsed_time": "5:17:34", "remaining_time": "7:01:13", "throughput": "4290.64", "total_tokens": 81756160} {"current_steps": 9990, "total_steps": 23217, "loss": 0.9569, "learning_rate": 3.04314925182147e-05, "epoch": 1.290864452771676, "percentage": 43.03, "elapsed_time": "5:18:23", "remaining_time": "7:01:33", "throughput": "4284.00", "total_tokens": 81838080} {"current_steps": 10000, "total_steps": 23217, "loss": 0.9173, "learning_rate": 3.0398467009846375e-05, "epoch": 1.292156609381057, "percentage": 43.07, "elapsed_time": "5:19:11", "remaining_time": "7:01:52", "throughput": "4277.50", "total_tokens": 81920000} {"current_steps": 10010, "total_steps": 23217, "loss": 0.9092, "learning_rate": 3.0365431616904714e-05, "epoch": 1.2934487659904381, "percentage": 43.11, "elapsed_time": "5:20:05", "remaining_time": "7:02:19", "throughput": "4269.61", "total_tokens": 82001920} {"current_steps": 10020, "total_steps": 23217, "loss": 0.8183, "learning_rate": 3.03323863998774e-05, "epoch": 1.2947409225998192, "percentage": 43.16, "elapsed_time": "5:20:56", "remaining_time": "7:02:41", "throughput": "4262.76", "total_tokens": 82083840} {"current_steps": 10030, "total_steps": 23217, "loss": 1.2083, "learning_rate": 3.02993314192701e-05, "epoch": 1.2960330792092, "percentage": 43.2, "elapsed_time": "5:21:44", "remaining_time": "7:03:00", "throughput": "4256.30", "total_tokens": 82165760} {"current_steps": 10040, "total_steps": 23217, "loss": 1.1272, "learning_rate": 3.0266266735606358e-05, "epoch": 1.2973252358185812, "percentage": 43.24, "elapsed_time": "5:22:33", "remaining_time": "7:03:19", "throughput": "4249.85", "total_tokens": 82247680} {"current_steps": 10050, "total_steps": 23217, "loss": 0.6936, "learning_rate": 3.0233192409427492e-05, "epoch": 1.2986173924279623, "percentage": 43.29, "elapsed_time": "5:23:20", "remaining_time": "7:03:38", "throughput": "4243.58", "total_tokens": 82329600} {"current_steps": 10060, "total_steps": 23217, "loss": 1.0776, "learning_rate": 3.0200108501292466e-05, "epoch": 1.2999095490373433, "percentage": 43.33, "elapsed_time": "5:24:08", "remaining_time": "7:03:55", "throughput": "4237.43", "total_tokens": 82411520} {"current_steps": 10070, "total_steps": 23217, "loss": 0.5866, "learning_rate": 3.0167015071777815e-05, "epoch": 1.3012017056467244, "percentage": 43.37, "elapsed_time": "5:24:57", "remaining_time": "7:04:15", "throughput": "4231.00", "total_tokens": 82493440} {"current_steps": 10080, "total_steps": 23217, "loss": 0.903, "learning_rate": 3.0133912181477475e-05, "epoch": 1.3024938622561053, "percentage": 43.42, "elapsed_time": "5:25:46", "remaining_time": "7:04:34", "throughput": "4224.63", "total_tokens": 82575360} {"current_steps": 10090, "total_steps": 23217, "loss": 1.1334, "learning_rate": 3.010079989100271e-05, "epoch": 1.3037860188654866, "percentage": 43.46, "elapsed_time": "5:26:34", "remaining_time": "7:04:52", "throughput": "4218.29", "total_tokens": 82657280} {"current_steps": 10100, "total_steps": 23217, "loss": 0.708, "learning_rate": 3.0067678260982018e-05, "epoch": 1.3050781754748675, "percentage": 43.5, "elapsed_time": "5:27:23", "remaining_time": "7:05:11", "throughput": "4212.07", "total_tokens": 82739200} {"current_steps": 10110, "total_steps": 23217, "loss": 1.094, "learning_rate": 3.003454735206097e-05, "epoch": 1.3063703320842486, "percentage": 43.55, "elapsed_time": "5:28:11", "remaining_time": "7:05:29", "throughput": "4205.87", "total_tokens": 82821120} {"current_steps": 10120, "total_steps": 23217, "loss": 0.7914, "learning_rate": 3.000140722490215e-05, "epoch": 1.3076624886936297, "percentage": 43.59, "elapsed_time": "5:29:00", "remaining_time": "7:05:47", "throughput": "4199.69", "total_tokens": 82903040} {"current_steps": 10130, "total_steps": 23217, "loss": 0.882, "learning_rate": 2.9968257940184997e-05, "epoch": 1.3089546453030108, "percentage": 43.63, "elapsed_time": "5:30:02", "remaining_time": "7:06:22", "throughput": "4190.71", "total_tokens": 82984960} {"current_steps": 10140, "total_steps": 23217, "loss": 0.7434, "learning_rate": 2.9935099558605728e-05, "epoch": 1.3102468019123918, "percentage": 43.67, "elapsed_time": "5:30:50", "remaining_time": "7:06:40", "throughput": "4184.52", "total_tokens": 83066880} {"current_steps": 10150, "total_steps": 23217, "loss": 1.0257, "learning_rate": 2.9901932140877232e-05, "epoch": 1.3115389585217727, "percentage": 43.72, "elapsed_time": "5:31:38", "remaining_time": "7:06:57", "throughput": "4178.57", "total_tokens": 83148800} {"current_steps": 10160, "total_steps": 23217, "loss": 0.6914, "learning_rate": 2.9868755747728927e-05, "epoch": 1.312831115131154, "percentage": 43.76, "elapsed_time": "5:32:28", "remaining_time": "7:07:16", "throughput": "4172.33", "total_tokens": 83230720} {"current_steps": 10170, "total_steps": 23217, "loss": 0.9318, "learning_rate": 2.9835570439906657e-05, "epoch": 1.314123271740535, "percentage": 43.8, "elapsed_time": "5:33:17", "remaining_time": "7:07:34", "throughput": "4166.17", "total_tokens": 83312640} {"current_steps": 10180, "total_steps": 23217, "loss": 0.9633, "learning_rate": 2.9802376278172612e-05, "epoch": 1.315415428349916, "percentage": 43.85, "elapsed_time": "5:34:06", "remaining_time": "7:07:52", "throughput": "4160.00", "total_tokens": 83394560} {"current_steps": 10190, "total_steps": 23217, "loss": 1.1187, "learning_rate": 2.976917332330517e-05, "epoch": 1.316707584959297, "percentage": 43.89, "elapsed_time": "5:34:56", "remaining_time": "7:08:11", "throughput": "4153.84", "total_tokens": 83476480} {"current_steps": 10200, "total_steps": 23217, "loss": 0.9031, "learning_rate": 2.973596163609883e-05, "epoch": 1.3179997415686782, "percentage": 43.93, "elapsed_time": "5:35:44", "remaining_time": "7:08:27", "throughput": "4148.01", "total_tokens": 83558400} {"current_steps": 10210, "total_steps": 23217, "loss": 0.8322, "learning_rate": 2.970274127736406e-05, "epoch": 1.3192918981780593, "percentage": 43.98, "elapsed_time": "5:36:32", "remaining_time": "7:08:44", "throughput": "4142.13", "total_tokens": 83640320} {"current_steps": 10220, "total_steps": 23217, "loss": 0.7939, "learning_rate": 2.966951230792722e-05, "epoch": 1.3205840547874401, "percentage": 44.02, "elapsed_time": "5:37:20", "remaining_time": "7:09:00", "throughput": "4136.28", "total_tokens": 83722240} {"current_steps": 10230, "total_steps": 23217, "loss": 1.0287, "learning_rate": 2.9636274788630437e-05, "epoch": 1.3218762113968214, "percentage": 44.06, "elapsed_time": "5:38:09", "remaining_time": "7:09:17", "throughput": "4130.48", "total_tokens": 83804160} {"current_steps": 10240, "total_steps": 23217, "loss": 0.8743, "learning_rate": 2.9603028780331475e-05, "epoch": 1.3231683680062023, "percentage": 44.11, "elapsed_time": "5:38:58", "remaining_time": "7:09:34", "throughput": "4124.59", "total_tokens": 83886080} {"current_steps": 10250, "total_steps": 23217, "loss": 1.089, "learning_rate": 2.9569774343903662e-05, "epoch": 1.3244605246155834, "percentage": 44.15, "elapsed_time": "5:39:46", "remaining_time": "7:09:50", "throughput": "4118.79", "total_tokens": 83968000} {"current_steps": 10260, "total_steps": 23217, "loss": 0.9047, "learning_rate": 2.9536511540235744e-05, "epoch": 1.3257526812249645, "percentage": 44.19, "elapsed_time": "5:40:35", "remaining_time": "7:10:06", "throughput": "4112.99", "total_tokens": 84049920} {"current_steps": 10270, "total_steps": 23217, "loss": 0.7258, "learning_rate": 2.9503240430231803e-05, "epoch": 1.3270448378343456, "percentage": 44.23, "elapsed_time": "5:41:24", "remaining_time": "7:10:23", "throughput": "4107.18", "total_tokens": 84131840} {"current_steps": 10280, "total_steps": 23217, "loss": 0.6985, "learning_rate": 2.9469961074811103e-05, "epoch": 1.3283369944437267, "percentage": 44.28, "elapsed_time": "5:42:12", "remaining_time": "7:10:39", "throughput": "4101.40", "total_tokens": 84213760} {"current_steps": 10290, "total_steps": 23217, "loss": 0.8227, "learning_rate": 2.9436673534908044e-05, "epoch": 1.3296291510531075, "percentage": 44.32, "elapsed_time": "5:43:01", "remaining_time": "7:10:55", "throughput": "4095.72", "total_tokens": 84295680} {"current_steps": 10300, "total_steps": 23217, "loss": 0.883, "learning_rate": 2.940337787147197e-05, "epoch": 1.3309213076624886, "percentage": 44.36, "elapsed_time": "5:43:50", "remaining_time": "7:11:12", "throughput": "4089.87", "total_tokens": 84377600} {"current_steps": 10310, "total_steps": 23217, "loss": 1.2221, "learning_rate": 2.9370074145467132e-05, "epoch": 1.3322134642718697, "percentage": 44.41, "elapsed_time": "5:44:39", "remaining_time": "7:11:28", "throughput": "4084.29", "total_tokens": 84459520} {"current_steps": 10320, "total_steps": 23217, "loss": 0.7841, "learning_rate": 2.9336762417872516e-05, "epoch": 1.3335056208812508, "percentage": 44.45, "elapsed_time": "5:45:27", "remaining_time": "7:11:42", "throughput": "4078.79", "total_tokens": 84541440} {"current_steps": 10330, "total_steps": 23217, "loss": 0.8774, "learning_rate": 2.9303442749681787e-05, "epoch": 1.3347977774906319, "percentage": 44.49, "elapsed_time": "5:46:14", "remaining_time": "7:11:57", "throughput": "4073.35", "total_tokens": 84623360} {"current_steps": 10340, "total_steps": 23217, "loss": 0.7681, "learning_rate": 2.927011520190313e-05, "epoch": 1.336089934100013, "percentage": 44.54, "elapsed_time": "5:47:02", "remaining_time": "7:12:10", "throughput": "4068.05", "total_tokens": 84705280} {"current_steps": 10350, "total_steps": 23217, "loss": 0.9598, "learning_rate": 2.9236779835559165e-05, "epoch": 1.337382090709394, "percentage": 44.58, "elapsed_time": "5:47:50", "remaining_time": "7:12:26", "throughput": "4062.49", "total_tokens": 84787200} {"current_steps": 10360, "total_steps": 23217, "loss": 0.6958, "learning_rate": 2.9203436711686817e-05, "epoch": 1.338674247318775, "percentage": 44.62, "elapsed_time": "5:48:39", "remaining_time": "7:12:41", "throughput": "4056.95", "total_tokens": 84869120} {"current_steps": 10370, "total_steps": 23217, "loss": 1.0247, "learning_rate": 2.917008589133724e-05, "epoch": 1.339966403928156, "percentage": 44.67, "elapsed_time": "5:49:29", "remaining_time": "7:12:58", "throughput": "4051.11", "total_tokens": 84951040} {"current_steps": 10380, "total_steps": 23217, "loss": 0.5671, "learning_rate": 2.913672743557565e-05, "epoch": 1.3412585605375371, "percentage": 44.71, "elapsed_time": "5:50:18", "remaining_time": "7:13:13", "throughput": "4045.58", "total_tokens": 85032960} {"current_steps": 10390, "total_steps": 23217, "loss": 0.6446, "learning_rate": 2.9103361405481272e-05, "epoch": 1.3425507171469182, "percentage": 44.75, "elapsed_time": "5:51:07", "remaining_time": "7:13:29", "throughput": "4040.02", "total_tokens": 85114880} {"current_steps": 10400, "total_steps": 23217, "loss": 1.0231, "learning_rate": 2.906998786214717e-05, "epoch": 1.3438428737562993, "percentage": 44.79, "elapsed_time": "5:51:55", "remaining_time": "7:13:43", "throughput": "4034.76", "total_tokens": 85196800} {"current_steps": 10410, "total_steps": 23217, "loss": 0.8076, "learning_rate": 2.9036606866680187e-05, "epoch": 1.3451350303656804, "percentage": 44.84, "elapsed_time": "5:52:43", "remaining_time": "7:13:56", "throughput": "4029.54", "total_tokens": 85278720} {"current_steps": 10420, "total_steps": 23217, "loss": 1.0485, "learning_rate": 2.90032184802008e-05, "epoch": 1.3464271869750615, "percentage": 44.88, "elapsed_time": "5:53:30", "remaining_time": "7:14:09", "throughput": "4024.38", "total_tokens": 85360640} {"current_steps": 10430, "total_steps": 23217, "loss": 1.0753, "learning_rate": 2.8969822763843018e-05, "epoch": 1.3477193435844423, "percentage": 44.92, "elapsed_time": "5:54:20", "remaining_time": "7:14:24", "throughput": "4018.87", "total_tokens": 85442560} {"current_steps": 10440, "total_steps": 23217, "loss": 0.9629, "learning_rate": 2.8936419778754294e-05, "epoch": 1.3490115001938234, "percentage": 44.97, "elapsed_time": "5:55:10", "remaining_time": "7:14:40", "throughput": "4013.25", "total_tokens": 85524480} {"current_steps": 10450, "total_steps": 23217, "loss": 0.7803, "learning_rate": 2.8903009586095353e-05, "epoch": 1.3503036568032045, "percentage": 45.01, "elapsed_time": "5:55:59", "remaining_time": "7:14:55", "throughput": "4007.83", "total_tokens": 85606400} {"current_steps": 10460, "total_steps": 23217, "loss": 0.9991, "learning_rate": 2.8869592247040138e-05, "epoch": 1.3515958134125856, "percentage": 45.05, "elapsed_time": "5:56:48", "remaining_time": "7:15:09", "throughput": "4002.58", "total_tokens": 85688320} {"current_steps": 10470, "total_steps": 23217, "loss": 0.7521, "learning_rate": 2.883616782277569e-05, "epoch": 1.3528879700219667, "percentage": 45.1, "elapsed_time": "5:57:39", "remaining_time": "7:15:26", "throughput": "3996.80", "total_tokens": 85770240} {"current_steps": 10480, "total_steps": 23217, "loss": 1.186, "learning_rate": 2.8802736374501994e-05, "epoch": 1.3541801266313478, "percentage": 45.14, "elapsed_time": "5:58:33", "remaining_time": "7:15:47", "throughput": "3990.57", "total_tokens": 85852160} {"current_steps": 10490, "total_steps": 23217, "loss": 1.1393, "learning_rate": 2.8769297963431908e-05, "epoch": 1.3554722832407289, "percentage": 45.18, "elapsed_time": "5:59:27", "remaining_time": "7:16:06", "throughput": "3984.41", "total_tokens": 85934080} {"current_steps": 10500, "total_steps": 23217, "loss": 0.6548, "learning_rate": 2.8735852650791035e-05, "epoch": 1.3567644398501097, "percentage": 45.23, "elapsed_time": "6:00:18", "remaining_time": "7:16:23", "throughput": "3978.78", "total_tokens": 86016000} {"current_steps": 10510, "total_steps": 23217, "loss": 0.9466, "learning_rate": 2.870240049781764e-05, "epoch": 1.3580565964594908, "percentage": 45.27, "elapsed_time": "6:01:09", "remaining_time": "7:16:38", "throughput": "3973.28", "total_tokens": 86097920} {"current_steps": 10520, "total_steps": 23217, "loss": 0.9157, "learning_rate": 2.8668941565762475e-05, "epoch": 1.359348753068872, "percentage": 45.31, "elapsed_time": "6:01:58", "remaining_time": "7:16:53", "throughput": "3968.02", "total_tokens": 86179840} {"current_steps": 10530, "total_steps": 23217, "loss": 0.8647, "learning_rate": 2.8635475915888732e-05, "epoch": 1.360640909678253, "percentage": 45.35, "elapsed_time": "6:02:46", "remaining_time": "7:17:05", "throughput": "3963.07", "total_tokens": 86261760} {"current_steps": 10540, "total_steps": 23217, "loss": 0.8976, "learning_rate": 2.8602003609471888e-05, "epoch": 1.361933066287634, "percentage": 45.4, "elapsed_time": "6:03:34", "remaining_time": "7:17:16", "throughput": "3958.15", "total_tokens": 86343680} {"current_steps": 10550, "total_steps": 23217, "loss": 1.0414, "learning_rate": 2.856852470779962e-05, "epoch": 1.3632252228970152, "percentage": 45.44, "elapsed_time": "6:04:24", "remaining_time": "7:17:31", "throughput": "3952.80", "total_tokens": 86425600} {"current_steps": 10560, "total_steps": 23217, "loss": 0.9523, "learning_rate": 2.853503927217167e-05, "epoch": 1.3645173795063963, "percentage": 45.48, "elapsed_time": "6:05:14", "remaining_time": "7:17:46", "throughput": "3947.42", "total_tokens": 86507520} {"current_steps": 10570, "total_steps": 23217, "loss": 0.7521, "learning_rate": 2.8501547363899744e-05, "epoch": 1.3658095361157772, "percentage": 45.53, "elapsed_time": "6:06:03", "remaining_time": "7:17:59", "throughput": "3942.42", "total_tokens": 86589440} {"current_steps": 10580, "total_steps": 23217, "loss": 0.9591, "learning_rate": 2.846804904430741e-05, "epoch": 1.3671016927251582, "percentage": 45.57, "elapsed_time": "6:06:53", "remaining_time": "7:18:13", "throughput": "3937.14", "total_tokens": 86671360} {"current_steps": 10590, "total_steps": 23217, "loss": 0.9854, "learning_rate": 2.8434544374729965e-05, "epoch": 1.3683938493345393, "percentage": 45.61, "elapsed_time": "6:07:44", "remaining_time": "7:18:29", "throughput": "3931.75", "total_tokens": 86753280} {"current_steps": 10600, "total_steps": 23217, "loss": 1.0439, "learning_rate": 2.8401033416514345e-05, "epoch": 1.3696860059439204, "percentage": 45.66, "elapsed_time": "6:08:34", "remaining_time": "7:18:42", "throughput": "3926.66", "total_tokens": 86835200} {"current_steps": 10610, "total_steps": 23217, "loss": 0.6884, "learning_rate": 2.8367516231018976e-05, "epoch": 1.3709781625533015, "percentage": 45.7, "elapsed_time": "6:09:22", "remaining_time": "7:18:54", "throughput": "3921.77", "total_tokens": 86917120} {"current_steps": 10620, "total_steps": 23217, "loss": 0.9114, "learning_rate": 2.8333992879613712e-05, "epoch": 1.3722703191626824, "percentage": 45.74, "elapsed_time": "6:10:16", "remaining_time": "7:19:11", "throughput": "3916.01", "total_tokens": 86999040} {"current_steps": 10630, "total_steps": 23217, "loss": 0.8389, "learning_rate": 2.830046342367969e-05, "epoch": 1.3735624757720637, "percentage": 45.79, "elapsed_time": "6:11:16", "remaining_time": "7:19:38", "throughput": "3909.03", "total_tokens": 87080960} {"current_steps": 10640, "total_steps": 23217, "loss": 0.5361, "learning_rate": 2.826692792460921e-05, "epoch": 1.3748546323814446, "percentage": 45.83, "elapsed_time": "6:12:17", "remaining_time": "7:20:04", "throughput": "3902.03", "total_tokens": 87162880} {"current_steps": 10650, "total_steps": 23217, "loss": 1.0727, "learning_rate": 2.823338644380566e-05, "epoch": 1.3761467889908257, "percentage": 45.87, "elapsed_time": "6:13:05", "remaining_time": "7:20:15", "throughput": "3897.33", "total_tokens": 87244800} {"current_steps": 10660, "total_steps": 23217, "loss": 0.5925, "learning_rate": 2.8199839042683363e-05, "epoch": 1.3774389456002067, "percentage": 45.91, "elapsed_time": "6:13:53", "remaining_time": "7:20:25", "throughput": "3892.73", "total_tokens": 87326720} {"current_steps": 10670, "total_steps": 23217, "loss": 0.9665, "learning_rate": 2.8166285782667483e-05, "epoch": 1.3787311022095878, "percentage": 45.96, "elapsed_time": "6:14:42", "remaining_time": "7:20:37", "throughput": "3887.88", "total_tokens": 87408640} {"current_steps": 10680, "total_steps": 23217, "loss": 0.9418, "learning_rate": 2.8132726725193926e-05, "epoch": 1.380023258818969, "percentage": 46.0, "elapsed_time": "6:15:30", "remaining_time": "7:20:48", "throughput": "3883.16", "total_tokens": 87490560} {"current_steps": 10690, "total_steps": 23217, "loss": 0.6926, "learning_rate": 2.8099161931709195e-05, "epoch": 1.3813154154283498, "percentage": 46.04, "elapsed_time": "6:16:18", "remaining_time": "7:20:58", "throughput": "3878.51", "total_tokens": 87572480} {"current_steps": 10700, "total_steps": 23217, "loss": 1.0825, "learning_rate": 2.806559146367031e-05, "epoch": 1.382607572037731, "percentage": 46.09, "elapsed_time": "6:17:07", "remaining_time": "7:21:10", "throughput": "3873.77", "total_tokens": 87654400} {"current_steps": 10710, "total_steps": 23217, "loss": 0.63, "learning_rate": 2.803201538254467e-05, "epoch": 1.383899728647112, "percentage": 46.13, "elapsed_time": "6:17:56", "remaining_time": "7:21:21", "throughput": "3869.04", "total_tokens": 87736320} {"current_steps": 10720, "total_steps": 23217, "loss": 0.8605, "learning_rate": 2.799843374980996e-05, "epoch": 1.385191885256493, "percentage": 46.17, "elapsed_time": "6:18:45", "remaining_time": "7:21:32", "throughput": "3864.27", "total_tokens": 87818240} {"current_steps": 10730, "total_steps": 23217, "loss": 1.0539, "learning_rate": 2.796484662695402e-05, "epoch": 1.3864840418658742, "percentage": 46.22, "elapsed_time": "6:19:35", "remaining_time": "7:21:45", "throughput": "3859.35", "total_tokens": 87900160} {"current_steps": 10740, "total_steps": 23217, "loss": 0.7748, "learning_rate": 2.7931254075474768e-05, "epoch": 1.3877761984752552, "percentage": 46.26, "elapsed_time": "6:20:27", "remaining_time": "7:21:59", "throughput": "3854.24", "total_tokens": 87982080} {"current_steps": 10750, "total_steps": 23217, "loss": 0.9568, "learning_rate": 2.789765615688003e-05, "epoch": 1.3890683550846363, "percentage": 46.3, "elapsed_time": "6:21:24", "remaining_time": "7:22:19", "throughput": "3848.24", "total_tokens": 88064000} {"current_steps": 10760, "total_steps": 23217, "loss": 1.0008, "learning_rate": 2.786405293268747e-05, "epoch": 1.3903605116940172, "percentage": 46.35, "elapsed_time": "6:22:19", "remaining_time": "7:22:37", "throughput": "3842.47", "total_tokens": 88145920} {"current_steps": 10770, "total_steps": 23217, "loss": 0.8518, "learning_rate": 2.7830444464424466e-05, "epoch": 1.3916526683033985, "percentage": 46.39, "elapsed_time": "6:23:13", "remaining_time": "7:22:53", "throughput": "3837.08", "total_tokens": 88227840} {"current_steps": 10780, "total_steps": 23217, "loss": 0.8596, "learning_rate": 2.7796830813628004e-05, "epoch": 1.3929448249127794, "percentage": 46.43, "elapsed_time": "6:24:07", "remaining_time": "7:23:09", "throughput": "3831.67", "total_tokens": 88309760} {"current_steps": 10790, "total_steps": 23217, "loss": 0.9577, "learning_rate": 2.776321204184456e-05, "epoch": 1.3942369815221605, "percentage": 46.47, "elapsed_time": "6:25:01", "remaining_time": "7:23:26", "throughput": "3826.17", "total_tokens": 88391680} {"current_steps": 10800, "total_steps": 23217, "loss": 0.9272, "learning_rate": 2.772958821062997e-05, "epoch": 1.3955291381315416, "percentage": 46.52, "elapsed_time": "6:25:55", "remaining_time": "7:23:42", "throughput": "3820.86", "total_tokens": 88473600} {"current_steps": 10810, "total_steps": 23217, "loss": 0.8736, "learning_rate": 2.7695959381549364e-05, "epoch": 1.3968212947409226, "percentage": 46.56, "elapsed_time": "6:26:47", "remaining_time": "7:23:55", "throughput": "3815.89", "total_tokens": 88555520} {"current_steps": 10820, "total_steps": 23217, "loss": 0.7469, "learning_rate": 2.7662325616176993e-05, "epoch": 1.3981134513503037, "percentage": 46.6, "elapsed_time": "6:27:40", "remaining_time": "7:24:10", "throughput": "3810.63", "total_tokens": 88637440} {"current_steps": 10830, "total_steps": 23217, "loss": 0.9801, "learning_rate": 2.7628686976096164e-05, "epoch": 1.3994056079596846, "percentage": 46.65, "elapsed_time": "6:28:31", "remaining_time": "7:24:23", "throughput": "3805.78", "total_tokens": 88719360} {"current_steps": 10840, "total_steps": 23217, "loss": 1.1059, "learning_rate": 2.7595043522899093e-05, "epoch": 1.4006977645690657, "percentage": 46.69, "elapsed_time": "6:29:20", "remaining_time": "7:24:33", "throughput": "3801.31", "total_tokens": 88801280} {"current_steps": 10850, "total_steps": 23217, "loss": 1.1236, "learning_rate": 2.756139531818684e-05, "epoch": 1.4019899211784468, "percentage": 46.73, "elapsed_time": "6:30:09", "remaining_time": "7:24:41", "throughput": "3796.96", "total_tokens": 88883200} {"current_steps": 10860, "total_steps": 23217, "loss": 0.7606, "learning_rate": 2.7527742423569124e-05, "epoch": 1.4032820777878279, "percentage": 46.78, "elapsed_time": "6:30:58", "remaining_time": "7:24:51", "throughput": "3792.47", "total_tokens": 88965120} {"current_steps": 10870, "total_steps": 23217, "loss": 0.7754, "learning_rate": 2.7494084900664273e-05, "epoch": 1.404574234397209, "percentage": 46.82, "elapsed_time": "6:31:50", "remaining_time": "7:25:05", "throughput": "3787.54", "total_tokens": 89047040} {"current_steps": 10880, "total_steps": 23217, "loss": 0.9668, "learning_rate": 2.746042281109911e-05, "epoch": 1.40586639100659, "percentage": 46.86, "elapsed_time": "6:32:50", "remaining_time": "7:25:27", "throughput": "3781.36", "total_tokens": 89128960} {"current_steps": 10890, "total_steps": 23217, "loss": 0.9552, "learning_rate": 2.7426756216508776e-05, "epoch": 1.4071585476159711, "percentage": 46.91, "elapsed_time": "6:33:50", "remaining_time": "7:25:48", "throughput": "3775.27", "total_tokens": 89210880} {"current_steps": 10900, "total_steps": 23217, "loss": 0.8455, "learning_rate": 2.7393085178536686e-05, "epoch": 1.408450704225352, "percentage": 46.95, "elapsed_time": "6:34:41", "remaining_time": "7:25:59", "throughput": "3770.63", "total_tokens": 89292800} {"current_steps": 10910, "total_steps": 23217, "loss": 0.515, "learning_rate": 2.7359409758834397e-05, "epoch": 1.409742860834733, "percentage": 46.99, "elapsed_time": "6:35:36", "remaining_time": "7:26:15", "throughput": "3765.30", "total_tokens": 89374720} {"current_steps": 10920, "total_steps": 23217, "loss": 0.5575, "learning_rate": 2.7325730019061474e-05, "epoch": 1.4110350174441142, "percentage": 47.03, "elapsed_time": "6:36:31", "remaining_time": "7:26:31", "throughput": "3760.01", "total_tokens": 89456640} {"current_steps": 10930, "total_steps": 23217, "loss": 0.7631, "learning_rate": 2.729204602088539e-05, "epoch": 1.4123271740534953, "percentage": 47.08, "elapsed_time": "6:37:23", "remaining_time": "7:26:43", "throughput": "3755.27", "total_tokens": 89538560} {"current_steps": 10940, "total_steps": 23217, "loss": 0.8117, "learning_rate": 2.7258357825981433e-05, "epoch": 1.4136193306628764, "percentage": 47.12, "elapsed_time": "6:38:13", "remaining_time": "7:26:54", "throughput": "3750.77", "total_tokens": 89620480} {"current_steps": 10950, "total_steps": 23217, "loss": 0.7802, "learning_rate": 2.7224665496032565e-05, "epoch": 1.4149114872722575, "percentage": 47.16, "elapsed_time": "6:39:03", "remaining_time": "7:27:03", "throughput": "3746.45", "total_tokens": 89702400} {"current_steps": 10960, "total_steps": 23217, "loss": 0.8345, "learning_rate": 2.7190969092729308e-05, "epoch": 1.4162036438816386, "percentage": 47.21, "elapsed_time": "6:39:53", "remaining_time": "7:27:12", "throughput": "3742.06", "total_tokens": 89784320} {"current_steps": 10970, "total_steps": 23217, "loss": 1.1491, "learning_rate": 2.7157268677769666e-05, "epoch": 1.4174958004910194, "percentage": 47.25, "elapsed_time": "6:40:45", "remaining_time": "7:27:24", "throughput": "3737.29", "total_tokens": 89866240} {"current_steps": 10980, "total_steps": 23217, "loss": 1.3288, "learning_rate": 2.712356431285896e-05, "epoch": 1.4187879571004005, "percentage": 47.29, "elapsed_time": "6:41:37", "remaining_time": "7:27:36", "throughput": "3732.68", "total_tokens": 89948160} {"current_steps": 10990, "total_steps": 23217, "loss": 0.8851, "learning_rate": 2.7089856059709774e-05, "epoch": 1.4200801137097816, "percentage": 47.34, "elapsed_time": "6:42:27", "remaining_time": "7:27:44", "throughput": "3728.40", "total_tokens": 90030080} {"current_steps": 11000, "total_steps": 23217, "loss": 0.7634, "learning_rate": 2.7056143980041787e-05, "epoch": 1.4213722703191627, "percentage": 47.38, "elapsed_time": "6:43:18", "remaining_time": "7:27:55", "throughput": "3723.87", "total_tokens": 90112000} {"current_steps": 11010, "total_steps": 23217, "loss": 0.8556, "learning_rate": 2.70224281355817e-05, "epoch": 1.4226644269285438, "percentage": 47.42, "elapsed_time": "6:44:15", "remaining_time": "7:28:12", "throughput": "3718.55", "total_tokens": 90193920} {"current_steps": 11020, "total_steps": 23217, "loss": 0.7443, "learning_rate": 2.6988708588063093e-05, "epoch": 1.4239565835379249, "percentage": 47.47, "elapsed_time": "6:45:05", "remaining_time": "7:28:21", "throughput": "3714.22", "total_tokens": 90275840} {"current_steps": 11030, "total_steps": 23217, "loss": 0.9481, "learning_rate": 2.695498539922634e-05, "epoch": 1.425248740147306, "percentage": 47.51, "elapsed_time": "6:45:53", "remaining_time": "7:28:27", "throughput": "3710.31", "total_tokens": 90357760} {"current_steps": 11040, "total_steps": 23217, "loss": 0.817, "learning_rate": 2.6921258630818475e-05, "epoch": 1.4265408967566868, "percentage": 47.55, "elapsed_time": "6:46:43", "remaining_time": "7:28:36", "throughput": "3706.05", "total_tokens": 90439680} {"current_steps": 11050, "total_steps": 23217, "loss": 0.6403, "learning_rate": 2.6887528344593087e-05, "epoch": 1.427833053366068, "percentage": 47.59, "elapsed_time": "6:47:33", "remaining_time": "7:28:45", "throughput": "3701.74", "total_tokens": 90521600} {"current_steps": 11060, "total_steps": 23217, "loss": 0.8245, "learning_rate": 2.685379460231021e-05, "epoch": 1.429125209975449, "percentage": 47.64, "elapsed_time": "6:48:22", "remaining_time": "7:28:53", "throughput": "3697.70", "total_tokens": 90603520} {"current_steps": 11070, "total_steps": 23217, "loss": 1.2493, "learning_rate": 2.6820057465736197e-05, "epoch": 1.43041736658483, "percentage": 47.68, "elapsed_time": "6:49:23", "remaining_time": "7:29:12", "throughput": "3691.93", "total_tokens": 90685440} {"current_steps": 11080, "total_steps": 23217, "loss": 0.9927, "learning_rate": 2.6786316996643623e-05, "epoch": 1.4317095231942112, "percentage": 47.72, "elapsed_time": "6:50:14", "remaining_time": "7:29:22", "throughput": "3687.53", "total_tokens": 90767360} {"current_steps": 11090, "total_steps": 23217, "loss": 0.9965, "learning_rate": 2.6752573256811165e-05, "epoch": 1.4330016798035923, "percentage": 47.77, "elapsed_time": "6:51:05", "remaining_time": "7:29:32", "throughput": "3683.24", "total_tokens": 90849280} {"current_steps": 11100, "total_steps": 23217, "loss": 0.8742, "learning_rate": 2.6718826308023487e-05, "epoch": 1.4342938364129734, "percentage": 47.81, "elapsed_time": "6:51:56", "remaining_time": "7:29:40", "throughput": "3679.02", "total_tokens": 90931200} {"current_steps": 11110, "total_steps": 23217, "loss": 0.9033, "learning_rate": 2.668507621207113e-05, "epoch": 1.4355859930223542, "percentage": 47.85, "elapsed_time": "6:52:45", "remaining_time": "7:29:47", "throughput": "3675.02", "total_tokens": 91013120} {"current_steps": 11120, "total_steps": 23217, "loss": 0.7038, "learning_rate": 2.6651323030750396e-05, "epoch": 1.4368781496317353, "percentage": 47.9, "elapsed_time": "6:53:35", "remaining_time": "7:29:55", "throughput": "3670.90", "total_tokens": 91095040} {"current_steps": 11130, "total_steps": 23217, "loss": 0.7839, "learning_rate": 2.6617566825863237e-05, "epoch": 1.4381703062411164, "percentage": 47.94, "elapsed_time": "6:54:24", "remaining_time": "7:30:02", "throughput": "3667.00", "total_tokens": 91176960} {"current_steps": 11140, "total_steps": 23217, "loss": 0.7871, "learning_rate": 2.6583807659217137e-05, "epoch": 1.4394624628504975, "percentage": 47.98, "elapsed_time": "6:55:14", "remaining_time": "7:30:09", "throughput": "3662.95", "total_tokens": 91258880} {"current_steps": 11150, "total_steps": 23217, "loss": 1.0343, "learning_rate": 2.6550045592625007e-05, "epoch": 1.4407546194598786, "percentage": 48.03, "elapsed_time": "6:56:05", "remaining_time": "7:30:18", "throughput": "3658.74", "total_tokens": 91340800} {"current_steps": 11160, "total_steps": 23217, "loss": 1.1501, "learning_rate": 2.651628068790507e-05, "epoch": 1.4420467760692595, "percentage": 48.07, "elapsed_time": "6:56:56", "remaining_time": "7:30:26", "throughput": "3654.54", "total_tokens": 91422720} {"current_steps": 11170, "total_steps": 23217, "loss": 0.8592, "learning_rate": 2.648251300688073e-05, "epoch": 1.4433389326786408, "percentage": 48.11, "elapsed_time": "6:57:46", "remaining_time": "7:30:35", "throughput": "3650.41", "total_tokens": 91504640} {"current_steps": 11180, "total_steps": 23217, "loss": 0.8201, "learning_rate": 2.6448742611380515e-05, "epoch": 1.4446310892880216, "percentage": 48.15, "elapsed_time": "6:58:38", "remaining_time": "7:30:43", "throughput": "3646.20", "total_tokens": 91586560} {"current_steps": 11190, "total_steps": 23217, "loss": 1.074, "learning_rate": 2.6414969563237874e-05, "epoch": 1.4459232458974027, "percentage": 48.2, "elapsed_time": "6:59:29", "remaining_time": "7:30:51", "throughput": "3642.10", "total_tokens": 91668480} {"current_steps": 11200, "total_steps": 23217, "loss": 0.8012, "learning_rate": 2.6381193924291143e-05, "epoch": 1.4472154025067838, "percentage": 48.24, "elapsed_time": "7:00:20", "remaining_time": "7:30:59", "throughput": "3637.97", "total_tokens": 91750400} {"current_steps": 11210, "total_steps": 23217, "loss": 1.1103, "learning_rate": 2.63474157563834e-05, "epoch": 1.448507559116165, "percentage": 48.28, "elapsed_time": "7:01:12", "remaining_time": "7:31:09", "throughput": "3633.62", "total_tokens": 91832320} {"current_steps": 11220, "total_steps": 23217, "loss": 0.6353, "learning_rate": 2.6313635121362322e-05, "epoch": 1.449799715725546, "percentage": 48.33, "elapsed_time": "7:02:02", "remaining_time": "7:31:16", "throughput": "3629.69", "total_tokens": 91914240} {"current_steps": 11230, "total_steps": 23217, "loss": 0.8131, "learning_rate": 2.6279852081080153e-05, "epoch": 1.4510918723349269, "percentage": 48.37, "elapsed_time": "7:02:52", "remaining_time": "7:31:23", "throughput": "3625.79", "total_tokens": 91996160} {"current_steps": 11240, "total_steps": 23217, "loss": 0.8539, "learning_rate": 2.6246066697393494e-05, "epoch": 1.4523840289443082, "percentage": 48.41, "elapsed_time": "7:03:45", "remaining_time": "7:31:32", "throughput": "3621.46", "total_tokens": 92078080} {"current_steps": 11250, "total_steps": 23217, "loss": 0.799, "learning_rate": 2.6212279032163283e-05, "epoch": 1.453676185553689, "percentage": 48.46, "elapsed_time": "7:04:39", "remaining_time": "7:31:43", "throughput": "3617.06", "total_tokens": 92160000} {"current_steps": 11260, "total_steps": 23217, "loss": 0.5722, "learning_rate": 2.6178489147254598e-05, "epoch": 1.4549683421630701, "percentage": 48.5, "elapsed_time": "7:05:31", "remaining_time": "7:31:52", "throughput": "3612.85", "total_tokens": 92241920} {"current_steps": 11270, "total_steps": 23217, "loss": 0.8796, "learning_rate": 2.6144697104536597e-05, "epoch": 1.4562604987724512, "percentage": 48.54, "elapsed_time": "7:06:20", "remaining_time": "7:31:57", "throughput": "3609.09", "total_tokens": 92323840} {"current_steps": 11280, "total_steps": 23217, "loss": 1.1459, "learning_rate": 2.6110902965882383e-05, "epoch": 1.4575526553818323, "percentage": 48.59, "elapsed_time": "7:07:13", "remaining_time": "7:32:06", "throughput": "3604.88", "total_tokens": 92405760} {"current_steps": 11290, "total_steps": 23217, "loss": 0.7492, "learning_rate": 2.607710679316891e-05, "epoch": 1.4588448119912134, "percentage": 48.63, "elapsed_time": "7:08:05", "remaining_time": "7:32:14", "throughput": "3600.78", "total_tokens": 92487680} {"current_steps": 11300, "total_steps": 23217, "loss": 0.9672, "learning_rate": 2.6043308648276833e-05, "epoch": 1.4601369686005943, "percentage": 48.67, "elapsed_time": "7:08:53", "remaining_time": "7:32:18", "throughput": "3597.20", "total_tokens": 92569600} {"current_steps": 11310, "total_steps": 23217, "loss": 0.606, "learning_rate": 2.6009508593090448e-05, "epoch": 1.4614291252099754, "percentage": 48.71, "elapsed_time": "7:09:42", "remaining_time": "7:32:23", "throughput": "3593.63", "total_tokens": 92651520} {"current_steps": 11320, "total_steps": 23217, "loss": 0.7642, "learning_rate": 2.5975706689497513e-05, "epoch": 1.4627212818193565, "percentage": 48.76, "elapsed_time": "7:10:31", "remaining_time": "7:32:27", "throughput": "3590.00", "total_tokens": 92733440} {"current_steps": 11330, "total_steps": 23217, "loss": 0.8852, "learning_rate": 2.59419029993892e-05, "epoch": 1.4640134384287375, "percentage": 48.8, "elapsed_time": "7:11:19", "remaining_time": "7:32:31", "throughput": "3586.51", "total_tokens": 92815360} {"current_steps": 11340, "total_steps": 23217, "loss": 1.1366, "learning_rate": 2.590809758465995e-05, "epoch": 1.4653055950381186, "percentage": 48.84, "elapsed_time": "7:12:10", "remaining_time": "7:32:38", "throughput": "3582.49", "total_tokens": 92897280} {"current_steps": 11350, "total_steps": 23217, "loss": 1.004, "learning_rate": 2.5874290507207337e-05, "epoch": 1.4665977516474997, "percentage": 48.89, "elapsed_time": "7:12:58", "remaining_time": "7:32:41", "throughput": "3579.12", "total_tokens": 92979200} {"current_steps": 11360, "total_steps": 23217, "loss": 1.1198, "learning_rate": 2.584048182893201e-05, "epoch": 1.4678899082568808, "percentage": 48.93, "elapsed_time": "7:13:45", "remaining_time": "7:32:44", "throughput": "3575.77", "total_tokens": 93061120} {"current_steps": 11370, "total_steps": 23217, "loss": 0.7811, "learning_rate": 2.580667161173753e-05, "epoch": 1.4691820648662617, "percentage": 48.97, "elapsed_time": "7:14:32", "remaining_time": "7:32:46", "throughput": "3572.43", "total_tokens": 93143040} {"current_steps": 11380, "total_steps": 23217, "loss": 1.0665, "learning_rate": 2.577285991753028e-05, "epoch": 1.4704742214756428, "percentage": 49.02, "elapsed_time": "7:15:19", "remaining_time": "7:32:48", "throughput": "3569.11", "total_tokens": 93224960} {"current_steps": 11390, "total_steps": 23217, "loss": 0.9232, "learning_rate": 2.5739046808219348e-05, "epoch": 1.4717663780850239, "percentage": 49.06, "elapsed_time": "7:16:07", "remaining_time": "7:32:51", "throughput": "3565.79", "total_tokens": 93306880} {"current_steps": 11400, "total_steps": 23217, "loss": 0.8771, "learning_rate": 2.570523234571642e-05, "epoch": 1.473058534694405, "percentage": 49.1, "elapsed_time": "7:16:54", "remaining_time": "7:32:53", "throughput": "3562.49", "total_tokens": 93388800} {"current_steps": 11410, "total_steps": 23217, "loss": 0.7952, "learning_rate": 2.5671416591935636e-05, "epoch": 1.474350691303786, "percentage": 49.15, "elapsed_time": "7:17:41", "remaining_time": "7:32:55", "throughput": "3559.20", "total_tokens": 93470720} {"current_steps": 11420, "total_steps": 23217, "loss": 0.8034, "learning_rate": 2.563759960879354e-05, "epoch": 1.4756428479131671, "percentage": 49.19, "elapsed_time": "7:18:29", "remaining_time": "7:32:57", "throughput": "3555.92", "total_tokens": 93552640} {"current_steps": 11430, "total_steps": 23217, "loss": 0.9861, "learning_rate": 2.5603781458208885e-05, "epoch": 1.4769350045225482, "percentage": 49.23, "elapsed_time": "7:19:16", "remaining_time": "7:32:59", "throughput": "3552.65", "total_tokens": 93634560} {"current_steps": 11440, "total_steps": 23217, "loss": 0.9154, "learning_rate": 2.55699622021026e-05, "epoch": 1.478227161131929, "percentage": 49.27, "elapsed_time": "7:20:03", "remaining_time": "7:33:01", "throughput": "3549.39", "total_tokens": 93716480} {"current_steps": 11450, "total_steps": 23217, "loss": 0.696, "learning_rate": 2.55361419023976e-05, "epoch": 1.4795193177413102, "percentage": 49.32, "elapsed_time": "7:20:50", "remaining_time": "7:33:03", "throughput": "3546.14", "total_tokens": 93798400} {"current_steps": 11460, "total_steps": 23217, "loss": 1.0897, "learning_rate": 2.5502320621018732e-05, "epoch": 1.4808114743506913, "percentage": 49.36, "elapsed_time": "7:21:38", "remaining_time": "7:33:04", "throughput": "3542.91", "total_tokens": 93880320} {"current_steps": 11470, "total_steps": 23217, "loss": 0.9171, "learning_rate": 2.5468498419892656e-05, "epoch": 1.4821036309600724, "percentage": 49.4, "elapsed_time": "7:22:25", "remaining_time": "7:33:06", "throughput": "3539.68", "total_tokens": 93962240} {"current_steps": 11480, "total_steps": 23217, "loss": 0.875, "learning_rate": 2.5434675360947692e-05, "epoch": 1.4833957875694535, "percentage": 49.45, "elapsed_time": "7:23:12", "remaining_time": "7:33:07", "throughput": "3536.47", "total_tokens": 94044160} {"current_steps": 11490, "total_steps": 23217, "loss": 0.7646, "learning_rate": 2.5400851506113728e-05, "epoch": 1.4846879441788345, "percentage": 49.49, "elapsed_time": "7:23:59", "remaining_time": "7:33:09", "throughput": "3533.26", "total_tokens": 94126080} {"current_steps": 11500, "total_steps": 23217, "loss": 0.9129, "learning_rate": 2.5367026917322117e-05, "epoch": 1.4859801007882156, "percentage": 49.53, "elapsed_time": "7:24:47", "remaining_time": "7:33:10", "throughput": "3530.06", "total_tokens": 94208000} {"current_steps": 11510, "total_steps": 23217, "loss": 1.2751, "learning_rate": 2.5333201656505567e-05, "epoch": 1.4872722573975965, "percentage": 49.58, "elapsed_time": "7:25:34", "remaining_time": "7:33:12", "throughput": "3526.88", "total_tokens": 94289920} {"current_steps": 11520, "total_steps": 23217, "loss": 0.8298, "learning_rate": 2.5299375785598005e-05, "epoch": 1.4885644140069776, "percentage": 49.62, "elapsed_time": "7:26:21", "remaining_time": "7:33:13", "throughput": "3523.71", "total_tokens": 94371840} {"current_steps": 11530, "total_steps": 23217, "loss": 1.0023, "learning_rate": 2.5265549366534475e-05, "epoch": 1.4898565706163587, "percentage": 49.66, "elapsed_time": "7:27:09", "remaining_time": "7:33:14", "throughput": "3520.56", "total_tokens": 94453760} {"current_steps": 11540, "total_steps": 23217, "loss": 0.8267, "learning_rate": 2.5231722461251017e-05, "epoch": 1.4911487272257398, "percentage": 49.7, "elapsed_time": "7:27:56", "remaining_time": "7:33:15", "throughput": "3517.40", "total_tokens": 94535680} {"current_steps": 11550, "total_steps": 23217, "loss": 0.6509, "learning_rate": 2.519789513168459e-05, "epoch": 1.4924408838351209, "percentage": 49.75, "elapsed_time": "7:28:43", "remaining_time": "7:33:16", "throughput": "3514.27", "total_tokens": 94617600} {"current_steps": 11560, "total_steps": 23217, "loss": 0.7988, "learning_rate": 2.5164067439772898e-05, "epoch": 1.493733040444502, "percentage": 49.79, "elapsed_time": "7:29:31", "remaining_time": "7:33:17", "throughput": "3511.15", "total_tokens": 94699520} {"current_steps": 11570, "total_steps": 23217, "loss": 0.7822, "learning_rate": 2.5130239447454328e-05, "epoch": 1.495025197053883, "percentage": 49.83, "elapsed_time": "7:30:18", "remaining_time": "7:33:18", "throughput": "3508.04", "total_tokens": 94781440} {"current_steps": 11580, "total_steps": 23217, "loss": 0.9319, "learning_rate": 2.509641121666781e-05, "epoch": 1.496317353663264, "percentage": 49.88, "elapsed_time": "7:31:05", "remaining_time": "7:33:18", "throughput": "3504.94", "total_tokens": 94863360} {"current_steps": 11590, "total_steps": 23217, "loss": 0.8723, "learning_rate": 2.5062582809352704e-05, "epoch": 1.497609510272645, "percentage": 49.92, "elapsed_time": "7:31:52", "remaining_time": "7:33:19", "throughput": "3501.86", "total_tokens": 94945280} {"current_steps": 11600, "total_steps": 23217, "loss": 1.0985, "learning_rate": 2.5028754287448695e-05, "epoch": 1.498901666882026, "percentage": 49.96, "elapsed_time": "7:32:40", "remaining_time": "7:33:19", "throughput": "3498.78", "total_tokens": 95027200} {"current_steps": 11610, "total_steps": 23217, "loss": 0.898, "learning_rate": 2.4994925712895697e-05, "epoch": 1.5001938234914072, "percentage": 50.01, "elapsed_time": "7:33:27", "remaining_time": "7:33:20", "throughput": "3495.72", "total_tokens": 95109120} {"current_steps": 11620, "total_steps": 23217, "loss": 1.2631, "learning_rate": 2.4961097147633698e-05, "epoch": 1.5014859801007883, "percentage": 50.05, "elapsed_time": "7:34:14", "remaining_time": "7:33:20", "throughput": "3492.65", "total_tokens": 95191040} {"current_steps": 11630, "total_steps": 23217, "loss": 0.9865, "learning_rate": 2.4927268653602684e-05, "epoch": 1.5027781367101691, "percentage": 50.09, "elapsed_time": "7:35:01", "remaining_time": "7:33:20", "throughput": "3489.61", "total_tokens": 95272960} {"current_steps": 11640, "total_steps": 23217, "loss": 1.063, "learning_rate": 2.489344029274249e-05, "epoch": 1.5040702933195504, "percentage": 50.14, "elapsed_time": "7:35:49", "remaining_time": "7:33:21", "throughput": "3486.57", "total_tokens": 95354880} {"current_steps": 11650, "total_steps": 23217, "loss": 0.4969, "learning_rate": 2.4859612126992737e-05, "epoch": 1.5053624499289313, "percentage": 50.18, "elapsed_time": "7:36:36", "remaining_time": "7:33:21", "throughput": "3483.55", "total_tokens": 95436800} {"current_steps": 11660, "total_steps": 23217, "loss": 0.6354, "learning_rate": 2.4825784218292664e-05, "epoch": 1.5066546065383124, "percentage": 50.22, "elapsed_time": "7:37:23", "remaining_time": "7:33:21", "throughput": "3480.53", "total_tokens": 95518720} {"current_steps": 11670, "total_steps": 23217, "loss": 0.9183, "learning_rate": 2.479195662858105e-05, "epoch": 1.5079467631476935, "percentage": 50.26, "elapsed_time": "7:38:10", "remaining_time": "7:33:21", "throughput": "3477.53", "total_tokens": 95600640} {"current_steps": 11680, "total_steps": 23217, "loss": 0.8669, "learning_rate": 2.4758129419796094e-05, "epoch": 1.5092389197570746, "percentage": 50.31, "elapsed_time": "7:38:58", "remaining_time": "7:33:21", "throughput": "3474.53", "total_tokens": 95682560} {"current_steps": 11690, "total_steps": 23217, "loss": 1.1856, "learning_rate": 2.4724302653875275e-05, "epoch": 1.5105310763664557, "percentage": 50.35, "elapsed_time": "7:39:45", "remaining_time": "7:33:20", "throughput": "3471.54", "total_tokens": 95764480} {"current_steps": 11700, "total_steps": 23217, "loss": 0.7345, "learning_rate": 2.4690476392755298e-05, "epoch": 1.5118232329758365, "percentage": 50.39, "elapsed_time": "7:40:32", "remaining_time": "7:33:20", "throughput": "3468.57", "total_tokens": 95846400} {"current_steps": 11710, "total_steps": 23217, "loss": 0.5009, "learning_rate": 2.4656650698371903e-05, "epoch": 1.5131153895852179, "percentage": 50.44, "elapsed_time": "7:41:20", "remaining_time": "7:33:20", "throughput": "3465.60", "total_tokens": 95928320} {"current_steps": 11720, "total_steps": 23217, "loss": 0.7891, "learning_rate": 2.462282563265982e-05, "epoch": 1.5144075461945987, "percentage": 50.48, "elapsed_time": "7:42:07", "remaining_time": "7:33:19", "throughput": "3462.65", "total_tokens": 96010240} {"current_steps": 11730, "total_steps": 23217, "loss": 0.6393, "learning_rate": 2.4589001257552637e-05, "epoch": 1.5156997028039798, "percentage": 50.52, "elapsed_time": "7:42:54", "remaining_time": "7:33:19", "throughput": "3459.71", "total_tokens": 96092160} {"current_steps": 11740, "total_steps": 23217, "loss": 0.8309, "learning_rate": 2.455517763498264e-05, "epoch": 1.516991859413361, "percentage": 50.57, "elapsed_time": "7:43:41", "remaining_time": "7:33:18", "throughput": "3456.78", "total_tokens": 96174080} {"current_steps": 11750, "total_steps": 23217, "loss": 0.7155, "learning_rate": 2.452135482688077e-05, "epoch": 1.518284016022742, "percentage": 50.61, "elapsed_time": "7:44:29", "remaining_time": "7:33:17", "throughput": "3453.87", "total_tokens": 96256000} {"current_steps": 11760, "total_steps": 23217, "loss": 0.8101, "learning_rate": 2.4487532895176457e-05, "epoch": 1.519576172632123, "percentage": 50.65, "elapsed_time": "7:45:16", "remaining_time": "7:33:17", "throughput": "3450.95", "total_tokens": 96337920} {"current_steps": 11770, "total_steps": 23217, "loss": 0.5187, "learning_rate": 2.4453711901797543e-05, "epoch": 1.520868329241504, "percentage": 50.7, "elapsed_time": "7:46:03", "remaining_time": "7:33:16", "throughput": "3448.04", "total_tokens": 96419840} {"current_steps": 11780, "total_steps": 23217, "loss": 1.1635, "learning_rate": 2.4419891908670127e-05, "epoch": 1.5221604858508853, "percentage": 50.74, "elapsed_time": "7:46:50", "remaining_time": "7:33:15", "throughput": "3445.16", "total_tokens": 96501760} {"current_steps": 11790, "total_steps": 23217, "loss": 0.8433, "learning_rate": 2.4386072977718503e-05, "epoch": 1.5234526424602661, "percentage": 50.78, "elapsed_time": "7:47:38", "remaining_time": "7:33:14", "throughput": "3442.27", "total_tokens": 96583680} {"current_steps": 11800, "total_steps": 23217, "loss": 0.9885, "learning_rate": 2.4352255170865025e-05, "epoch": 1.5247447990696472, "percentage": 50.82, "elapsed_time": "7:48:25", "remaining_time": "7:33:13", "throughput": "3439.39", "total_tokens": 96665600} {"current_steps": 11810, "total_steps": 23217, "loss": 1.0425, "learning_rate": 2.4318438550029946e-05, "epoch": 1.5260369556790283, "percentage": 50.87, "elapsed_time": "7:49:12", "remaining_time": "7:33:11", "throughput": "3436.53", "total_tokens": 96747520} {"current_steps": 11820, "total_steps": 23217, "loss": 0.6342, "learning_rate": 2.4284623177131395e-05, "epoch": 1.5273291122884094, "percentage": 50.91, "elapsed_time": "7:49:59", "remaining_time": "7:33:10", "throughput": "3433.68", "total_tokens": 96829440} {"current_steps": 11830, "total_steps": 23217, "loss": 1.1709, "learning_rate": 2.4250809114085183e-05, "epoch": 1.5286212688977905, "percentage": 50.95, "elapsed_time": "7:50:47", "remaining_time": "7:33:09", "throughput": "3430.84", "total_tokens": 96911360} {"current_steps": 11840, "total_steps": 23217, "loss": 1.0094, "learning_rate": 2.421699642280475e-05, "epoch": 1.5299134255071714, "percentage": 51.0, "elapsed_time": "7:51:34", "remaining_time": "7:33:07", "throughput": "3428.00", "total_tokens": 96993280} {"current_steps": 11850, "total_steps": 23217, "loss": 0.7204, "learning_rate": 2.4183185165200998e-05, "epoch": 1.5312055821165527, "percentage": 51.04, "elapsed_time": "7:52:21", "remaining_time": "7:33:06", "throughput": "3425.17", "total_tokens": 97075200} {"current_steps": 11860, "total_steps": 23217, "loss": 0.7901, "learning_rate": 2.4149375403182216e-05, "epoch": 1.5324977387259335, "percentage": 51.08, "elapsed_time": "7:53:09", "remaining_time": "7:33:04", "throughput": "3422.35", "total_tokens": 97157120} {"current_steps": 11870, "total_steps": 23217, "loss": 1.0571, "learning_rate": 2.4115567198653963e-05, "epoch": 1.5337898953353146, "percentage": 51.13, "elapsed_time": "7:53:56", "remaining_time": "7:33:03", "throughput": "3419.54", "total_tokens": 97239040} {"current_steps": 11880, "total_steps": 23217, "loss": 0.5656, "learning_rate": 2.4081760613518924e-05, "epoch": 1.5350820519446957, "percentage": 51.17, "elapsed_time": "7:54:43", "remaining_time": "7:33:01", "throughput": "3416.74", "total_tokens": 97320960} {"current_steps": 11890, "total_steps": 23217, "loss": 1.2245, "learning_rate": 2.4047955709676852e-05, "epoch": 1.5363742085540768, "percentage": 51.21, "elapsed_time": "7:55:30", "remaining_time": "7:32:59", "throughput": "3413.96", "total_tokens": 97402880} {"current_steps": 11900, "total_steps": 23217, "loss": 0.9675, "learning_rate": 2.401415254902438e-05, "epoch": 1.537666365163458, "percentage": 51.26, "elapsed_time": "7:56:18", "remaining_time": "7:32:57", "throughput": "3411.18", "total_tokens": 97484800} {"current_steps": 11910, "total_steps": 23217, "loss": 1.0065, "learning_rate": 2.3980351193455e-05, "epoch": 1.5389585217728388, "percentage": 51.3, "elapsed_time": "7:57:05", "remaining_time": "7:32:55", "throughput": "3408.42", "total_tokens": 97566720} {"current_steps": 11920, "total_steps": 23217, "loss": 0.8522, "learning_rate": 2.3946551704858838e-05, "epoch": 1.54025067838222, "percentage": 51.34, "elapsed_time": "7:57:52", "remaining_time": "7:32:53", "throughput": "3405.66", "total_tokens": 97648640} {"current_steps": 11930, "total_steps": 23217, "loss": 0.9128, "learning_rate": 2.3912754145122663e-05, "epoch": 1.541542834991601, "percentage": 51.38, "elapsed_time": "7:58:39", "remaining_time": "7:32:51", "throughput": "3402.92", "total_tokens": 97730560} {"current_steps": 11940, "total_steps": 23217, "loss": 0.8387, "learning_rate": 2.3878958576129664e-05, "epoch": 1.542834991600982, "percentage": 51.43, "elapsed_time": "7:59:26", "remaining_time": "7:32:49", "throughput": "3400.18", "total_tokens": 97812480} {"current_steps": 11950, "total_steps": 23217, "loss": 0.9149, "learning_rate": 2.3845165059759402e-05, "epoch": 1.5441271482103631, "percentage": 51.47, "elapsed_time": "8:00:14", "remaining_time": "7:32:47", "throughput": "3397.45", "total_tokens": 97894400} {"current_steps": 11960, "total_steps": 23217, "loss": 0.8989, "learning_rate": 2.3811373657887705e-05, "epoch": 1.545419304819744, "percentage": 51.51, "elapsed_time": "8:01:01", "remaining_time": "7:32:44", "throughput": "3394.73", "total_tokens": 97976320} {"current_steps": 11970, "total_steps": 23217, "loss": 0.8954, "learning_rate": 2.3777584432386474e-05, "epoch": 1.5467114614291253, "percentage": 51.56, "elapsed_time": "8:01:48", "remaining_time": "7:32:42", "throughput": "3392.02", "total_tokens": 98058240} {"current_steps": 11980, "total_steps": 23217, "loss": 0.9203, "learning_rate": 2.3743797445123688e-05, "epoch": 1.5480036180385062, "percentage": 51.6, "elapsed_time": "8:02:35", "remaining_time": "7:32:39", "throughput": "3389.31", "total_tokens": 98140160} {"current_steps": 11990, "total_steps": 23217, "loss": 1.0436, "learning_rate": 2.3710012757963175e-05, "epoch": 1.5492957746478875, "percentage": 51.64, "elapsed_time": "8:03:22", "remaining_time": "7:32:37", "throughput": "3386.62", "total_tokens": 98222080} {"current_steps": 12000, "total_steps": 23217, "loss": 1.0798, "learning_rate": 2.367623043276459e-05, "epoch": 1.5505879312572683, "percentage": 51.69, "elapsed_time": "8:04:10", "remaining_time": "7:32:34", "throughput": "3383.93", "total_tokens": 98304000} {"current_steps": 12010, "total_steps": 23217, "loss": 1.0669, "learning_rate": 2.364245053138323e-05, "epoch": 1.5518800878666494, "percentage": 51.73, "elapsed_time": "8:05:03", "remaining_time": "7:32:37", "throughput": "3380.51", "total_tokens": 98385920} {"current_steps": 12020, "total_steps": 23217, "loss": 0.8337, "learning_rate": 2.3608673115669978e-05, "epoch": 1.5531722444760305, "percentage": 51.77, "elapsed_time": "8:05:51", "remaining_time": "7:32:35", "throughput": "3377.83", "total_tokens": 98467840} {"current_steps": 12030, "total_steps": 23217, "loss": 1.2425, "learning_rate": 2.3574898247471167e-05, "epoch": 1.5544644010854114, "percentage": 51.82, "elapsed_time": "8:06:38", "remaining_time": "7:32:32", "throughput": "3375.17", "total_tokens": 98549760} {"current_steps": 12040, "total_steps": 23217, "loss": 0.9847, "learning_rate": 2.354112598862845e-05, "epoch": 1.5557565576947927, "percentage": 51.86, "elapsed_time": "8:07:25", "remaining_time": "7:32:29", "throughput": "3372.53", "total_tokens": 98631680} {"current_steps": 12050, "total_steps": 23217, "loss": 0.79, "learning_rate": 2.350735640097871e-05, "epoch": 1.5570487143041736, "percentage": 51.9, "elapsed_time": "8:08:12", "remaining_time": "7:32:26", "throughput": "3369.89", "total_tokens": 98713600} {"current_steps": 12060, "total_steps": 23217, "loss": 0.8655, "learning_rate": 2.347358954635393e-05, "epoch": 1.5583408709135549, "percentage": 51.94, "elapsed_time": "8:09:00", "remaining_time": "7:32:23", "throughput": "3367.25", "total_tokens": 98795520} {"current_steps": 12070, "total_steps": 23217, "loss": 0.7855, "learning_rate": 2.3439825486581116e-05, "epoch": 1.5596330275229358, "percentage": 51.99, "elapsed_time": "8:09:47", "remaining_time": "7:32:20", "throughput": "3364.62", "total_tokens": 98877440} {"current_steps": 12080, "total_steps": 23217, "loss": 0.911, "learning_rate": 2.3406064283482115e-05, "epoch": 1.5609251841323168, "percentage": 52.03, "elapsed_time": "8:10:34", "remaining_time": "7:32:16", "throughput": "3362.00", "total_tokens": 98959360} {"current_steps": 12090, "total_steps": 23217, "loss": 0.6987, "learning_rate": 2.337230599887358e-05, "epoch": 1.562217340741698, "percentage": 52.07, "elapsed_time": "8:11:22", "remaining_time": "7:32:13", "throughput": "3359.37", "total_tokens": 99041280} {"current_steps": 12100, "total_steps": 23217, "loss": 0.7693, "learning_rate": 2.3338550694566817e-05, "epoch": 1.5635094973510788, "percentage": 52.12, "elapsed_time": "8:12:09", "remaining_time": "7:32:10", "throughput": "3356.78", "total_tokens": 99123200} {"current_steps": 12110, "total_steps": 23217, "loss": 0.5875, "learning_rate": 2.3304798432367645e-05, "epoch": 1.5648016539604601, "percentage": 52.16, "elapsed_time": "8:12:56", "remaining_time": "7:32:06", "throughput": "3354.19", "total_tokens": 99205120} {"current_steps": 12120, "total_steps": 23217, "loss": 1.1252, "learning_rate": 2.327104927407634e-05, "epoch": 1.566093810569841, "percentage": 52.2, "elapsed_time": "8:13:43", "remaining_time": "7:32:03", "throughput": "3351.60", "total_tokens": 99287040} {"current_steps": 12130, "total_steps": 23217, "loss": 0.8912, "learning_rate": 2.3237303281487487e-05, "epoch": 1.567385967179222, "percentage": 52.25, "elapsed_time": "8:14:31", "remaining_time": "7:31:59", "throughput": "3349.02", "total_tokens": 99368960} {"current_steps": 12140, "total_steps": 23217, "loss": 0.6356, "learning_rate": 2.3203560516389882e-05, "epoch": 1.5686781237886032, "percentage": 52.29, "elapsed_time": "8:15:18", "remaining_time": "7:31:56", "throughput": "3346.44", "total_tokens": 99450880} {"current_steps": 12150, "total_steps": 23217, "loss": 1.1298, "learning_rate": 2.3169821040566387e-05, "epoch": 1.5699702803979843, "percentage": 52.33, "elapsed_time": "8:16:05", "remaining_time": "7:31:52", "throughput": "3343.88", "total_tokens": 99532800} {"current_steps": 12160, "total_steps": 23217, "loss": 1.0096, "learning_rate": 2.313608491579387e-05, "epoch": 1.5712624370073653, "percentage": 52.38, "elapsed_time": "8:16:52", "remaining_time": "7:31:48", "throughput": "3341.33", "total_tokens": 99614720} {"current_steps": 12170, "total_steps": 23217, "loss": 0.7456, "learning_rate": 2.3102352203843063e-05, "epoch": 1.5725545936167462, "percentage": 52.42, "elapsed_time": "8:17:40", "remaining_time": "7:31:44", "throughput": "3338.79", "total_tokens": 99696640} {"current_steps": 12180, "total_steps": 23217, "loss": 0.8698, "learning_rate": 2.306862296647841e-05, "epoch": 1.5738467502261275, "percentage": 52.46, "elapsed_time": "8:18:27", "remaining_time": "7:31:40", "throughput": "3336.25", "total_tokens": 99778560} {"current_steps": 12190, "total_steps": 23217, "loss": 0.6883, "learning_rate": 2.3034897265458056e-05, "epoch": 1.5751389068355084, "percentage": 52.5, "elapsed_time": "8:19:14", "remaining_time": "7:31:36", "throughput": "3333.73", "total_tokens": 99860480} {"current_steps": 12200, "total_steps": 23217, "loss": 0.8952, "learning_rate": 2.3001175162533606e-05, "epoch": 1.5764310634448895, "percentage": 52.55, "elapsed_time": "8:20:01", "remaining_time": "7:31:32", "throughput": "3331.20", "total_tokens": 99942400} {"current_steps": 12210, "total_steps": 23217, "loss": 0.7274, "learning_rate": 2.2967456719450127e-05, "epoch": 1.5777232200542706, "percentage": 52.59, "elapsed_time": "8:20:49", "remaining_time": "7:31:28", "throughput": "3328.68", "total_tokens": 100024320} {"current_steps": 12220, "total_steps": 23217, "loss": 0.8773, "learning_rate": 2.2933741997945954e-05, "epoch": 1.5790153766636517, "percentage": 52.63, "elapsed_time": "8:21:36", "remaining_time": "7:31:24", "throughput": "3326.18", "total_tokens": 100106240} {"current_steps": 12230, "total_steps": 23217, "loss": 0.9009, "learning_rate": 2.290003105975262e-05, "epoch": 1.5803075332730327, "percentage": 52.68, "elapsed_time": "8:22:23", "remaining_time": "7:31:20", "throughput": "3323.68", "total_tokens": 100188160} {"current_steps": 12240, "total_steps": 23217, "loss": 0.6566, "learning_rate": 2.2866323966594736e-05, "epoch": 1.5815996898824136, "percentage": 52.72, "elapsed_time": "8:23:10", "remaining_time": "7:31:15", "throughput": "3321.20", "total_tokens": 100270080} {"current_steps": 12250, "total_steps": 23217, "loss": 0.7216, "learning_rate": 2.283262078018985e-05, "epoch": 1.582891846491795, "percentage": 52.76, "elapsed_time": "8:23:58", "remaining_time": "7:31:11", "throughput": "3318.71", "total_tokens": 100352000} {"current_steps": 12260, "total_steps": 23217, "loss": 0.9039, "learning_rate": 2.27989215622484e-05, "epoch": 1.5841840031011758, "percentage": 52.81, "elapsed_time": "8:24:45", "remaining_time": "7:31:06", "throughput": "3316.23", "total_tokens": 100433920} {"current_steps": 12270, "total_steps": 23217, "loss": 0.9027, "learning_rate": 2.2765226374473504e-05, "epoch": 1.5854761597105569, "percentage": 52.85, "elapsed_time": "8:25:32", "remaining_time": "7:31:02", "throughput": "3313.76", "total_tokens": 100515840} {"current_steps": 12280, "total_steps": 23217, "loss": 0.7404, "learning_rate": 2.2731535278560944e-05, "epoch": 1.586768316319938, "percentage": 52.89, "elapsed_time": "8:26:20", "remaining_time": "7:30:57", "throughput": "3311.29", "total_tokens": 100597760} {"current_steps": 12290, "total_steps": 23217, "loss": 0.8567, "learning_rate": 2.269784833619898e-05, "epoch": 1.588060472929319, "percentage": 52.94, "elapsed_time": "8:27:07", "remaining_time": "7:30:52", "throughput": "3308.84", "total_tokens": 100679680} {"current_steps": 12300, "total_steps": 23217, "loss": 0.9177, "learning_rate": 2.2664165609068304e-05, "epoch": 1.5893526295387002, "percentage": 52.98, "elapsed_time": "8:27:54", "remaining_time": "7:30:48", "throughput": "3306.41", "total_tokens": 100761600} {"current_steps": 12310, "total_steps": 23217, "loss": 0.8511, "learning_rate": 2.263048715884184e-05, "epoch": 1.590644786148081, "percentage": 53.02, "elapsed_time": "8:28:41", "remaining_time": "7:30:43", "throughput": "3303.98", "total_tokens": 100843520} {"current_steps": 12320, "total_steps": 23217, "loss": 0.8876, "learning_rate": 2.2596813047184715e-05, "epoch": 1.5919369427574623, "percentage": 53.06, "elapsed_time": "8:29:29", "remaining_time": "7:30:38", "throughput": "3301.56", "total_tokens": 100925440} {"current_steps": 12330, "total_steps": 23217, "loss": 0.9139, "learning_rate": 2.2563143335754118e-05, "epoch": 1.5932290993668432, "percentage": 53.11, "elapsed_time": "8:30:16", "remaining_time": "7:30:33", "throughput": "3299.13", "total_tokens": 101007360} {"current_steps": 12340, "total_steps": 23217, "loss": 0.5727, "learning_rate": 2.252947808619914e-05, "epoch": 1.5945212559762243, "percentage": 53.15, "elapsed_time": "8:31:03", "remaining_time": "7:30:28", "throughput": "3296.71", "total_tokens": 101089280} {"current_steps": 12350, "total_steps": 23217, "loss": 0.7672, "learning_rate": 2.249581736016076e-05, "epoch": 1.5958134125856054, "percentage": 53.19, "elapsed_time": "8:31:51", "remaining_time": "7:30:23", "throughput": "3294.30", "total_tokens": 101171200} {"current_steps": 12360, "total_steps": 23217, "loss": 0.8705, "learning_rate": 2.2462161219271622e-05, "epoch": 1.5971055691949865, "percentage": 53.24, "elapsed_time": "8:32:38", "remaining_time": "7:30:18", "throughput": "3291.90", "total_tokens": 101253120} {"current_steps": 12370, "total_steps": 23217, "loss": 0.8957, "learning_rate": 2.242850972515601e-05, "epoch": 1.5983977258043676, "percentage": 53.28, "elapsed_time": "8:33:25", "remaining_time": "7:30:12", "throughput": "3289.51", "total_tokens": 101335040} {"current_steps": 12380, "total_steps": 23217, "loss": 1.0392, "learning_rate": 2.2394862939429677e-05, "epoch": 1.5996898824137484, "percentage": 53.32, "elapsed_time": "8:34:12", "remaining_time": "7:30:07", "throughput": "3287.12", "total_tokens": 101416960} {"current_steps": 12390, "total_steps": 23217, "loss": 0.7616, "learning_rate": 2.236122092369977e-05, "epoch": 1.6009820390231297, "percentage": 53.37, "elapsed_time": "8:35:00", "remaining_time": "7:30:02", "throughput": "3284.74", "total_tokens": 101498880} {"current_steps": 12400, "total_steps": 23217, "loss": 1.1416, "learning_rate": 2.2327583739564696e-05, "epoch": 1.6022741956325106, "percentage": 53.41, "elapsed_time": "8:35:47", "remaining_time": "7:29:56", "throughput": "3282.37", "total_tokens": 101580800} {"current_steps": 12410, "total_steps": 23217, "loss": 0.8276, "learning_rate": 2.229395144861402e-05, "epoch": 1.6035663522418917, "percentage": 53.45, "elapsed_time": "8:36:34", "remaining_time": "7:29:51", "throughput": "3280.00", "total_tokens": 101662720} {"current_steps": 12420, "total_steps": 23217, "loss": 1.044, "learning_rate": 2.2260324112428336e-05, "epoch": 1.6048585088512728, "percentage": 53.5, "elapsed_time": "8:37:22", "remaining_time": "7:29:45", "throughput": "3277.64", "total_tokens": 101744640} {"current_steps": 12430, "total_steps": 23217, "loss": 0.5725, "learning_rate": 2.2226701792579176e-05, "epoch": 1.6061506654606539, "percentage": 53.54, "elapsed_time": "8:38:09", "remaining_time": "7:29:39", "throughput": "3275.29", "total_tokens": 101826560} {"current_steps": 12440, "total_steps": 23217, "loss": 0.8819, "learning_rate": 2.219308455062889e-05, "epoch": 1.607442822070035, "percentage": 53.58, "elapsed_time": "8:38:56", "remaining_time": "7:29:34", "throughput": "3272.95", "total_tokens": 101908480} {"current_steps": 12450, "total_steps": 23217, "loss": 0.6064, "learning_rate": 2.2159472448130513e-05, "epoch": 1.6087349786794158, "percentage": 53.62, "elapsed_time": "8:39:43", "remaining_time": "7:29:28", "throughput": "3270.61", "total_tokens": 101990400} {"current_steps": 12460, "total_steps": 23217, "loss": 0.7968, "learning_rate": 2.212586554662769e-05, "epoch": 1.6100271352887972, "percentage": 53.67, "elapsed_time": "8:40:31", "remaining_time": "7:29:22", "throughput": "3268.28", "total_tokens": 102072320} {"current_steps": 12470, "total_steps": 23217, "loss": 0.6481, "learning_rate": 2.2092263907654544e-05, "epoch": 1.611319291898178, "percentage": 53.71, "elapsed_time": "8:41:18", "remaining_time": "7:29:16", "throughput": "3265.96", "total_tokens": 102154240} {"current_steps": 12480, "total_steps": 23217, "loss": 0.722, "learning_rate": 2.2058667592735532e-05, "epoch": 1.612611448507559, "percentage": 53.75, "elapsed_time": "8:42:05", "remaining_time": "7:29:10", "throughput": "3263.65", "total_tokens": 102236160} {"current_steps": 12490, "total_steps": 23217, "loss": 1.321, "learning_rate": 2.20250766633854e-05, "epoch": 1.6139036051169402, "percentage": 53.8, "elapsed_time": "8:42:53", "remaining_time": "7:29:04", "throughput": "3261.34", "total_tokens": 102318080} {"current_steps": 12500, "total_steps": 23217, "loss": 0.6964, "learning_rate": 2.199149118110901e-05, "epoch": 1.615195761726321, "percentage": 53.84, "elapsed_time": "8:43:40", "remaining_time": "7:28:58", "throughput": "3259.04", "total_tokens": 102400000} {"current_steps": 12510, "total_steps": 23217, "loss": 0.965, "learning_rate": 2.1957911207401267e-05, "epoch": 1.6164879183357024, "percentage": 53.88, "elapsed_time": "8:44:27", "remaining_time": "7:28:52", "throughput": "3256.74", "total_tokens": 102481920} {"current_steps": 12520, "total_steps": 23217, "loss": 0.6768, "learning_rate": 2.192433680374696e-05, "epoch": 1.6177800749450832, "percentage": 53.93, "elapsed_time": "8:45:14", "remaining_time": "7:28:46", "throughput": "3254.45", "total_tokens": 102563840} {"current_steps": 12530, "total_steps": 23217, "loss": 0.975, "learning_rate": 2.1890768031620705e-05, "epoch": 1.6190722315544646, "percentage": 53.97, "elapsed_time": "8:46:02", "remaining_time": "7:28:39", "throughput": "3252.18", "total_tokens": 102645760} {"current_steps": 12540, "total_steps": 23217, "loss": 1.0603, "learning_rate": 2.1857204952486824e-05, "epoch": 1.6203643881638454, "percentage": 54.01, "elapsed_time": "8:46:49", "remaining_time": "7:28:33", "throughput": "3249.91", "total_tokens": 102727680} {"current_steps": 12550, "total_steps": 23217, "loss": 0.737, "learning_rate": 2.182364762779916e-05, "epoch": 1.6216565447732265, "percentage": 54.06, "elapsed_time": "8:47:36", "remaining_time": "7:28:26", "throughput": "3247.64", "total_tokens": 102809600} {"current_steps": 12560, "total_steps": 23217, "loss": 0.8256, "learning_rate": 2.1790096119001077e-05, "epoch": 1.6229487013826076, "percentage": 54.1, "elapsed_time": "8:48:23", "remaining_time": "7:28:20", "throughput": "3245.38", "total_tokens": 102891520} {"current_steps": 12570, "total_steps": 23217, "loss": 1.0425, "learning_rate": 2.1756550487525247e-05, "epoch": 1.6242408579919885, "percentage": 54.14, "elapsed_time": "8:49:11", "remaining_time": "7:28:13", "throughput": "3243.13", "total_tokens": 102973440} {"current_steps": 12580, "total_steps": 23217, "loss": 0.6268, "learning_rate": 2.1723010794793612e-05, "epoch": 1.6255330146013698, "percentage": 54.18, "elapsed_time": "8:49:58", "remaining_time": "7:28:07", "throughput": "3240.89", "total_tokens": 103055360} {"current_steps": 12590, "total_steps": 23217, "loss": 0.9757, "learning_rate": 2.168947710221722e-05, "epoch": 1.6268251712107507, "percentage": 54.23, "elapsed_time": "8:50:45", "remaining_time": "7:28:00", "throughput": "3238.65", "total_tokens": 103137280} {"current_steps": 12600, "total_steps": 23217, "loss": 0.7146, "learning_rate": 2.165594947119613e-05, "epoch": 1.628117327820132, "percentage": 54.27, "elapsed_time": "8:51:33", "remaining_time": "7:27:53", "throughput": "3236.41", "total_tokens": 103219200} {"current_steps": 12610, "total_steps": 23217, "loss": 1.4099, "learning_rate": 2.1622427963119337e-05, "epoch": 1.6294094844295128, "percentage": 54.31, "elapsed_time": "8:52:20", "remaining_time": "7:27:46", "throughput": "3234.19", "total_tokens": 103301120} {"current_steps": 12620, "total_steps": 23217, "loss": 1.0245, "learning_rate": 2.1588912639364567e-05, "epoch": 1.630701641038894, "percentage": 54.36, "elapsed_time": "8:53:07", "remaining_time": "7:27:39", "throughput": "3231.97", "total_tokens": 103383040} {"current_steps": 12630, "total_steps": 23217, "loss": 1.1632, "learning_rate": 2.1555403561298287e-05, "epoch": 1.631993797648275, "percentage": 54.4, "elapsed_time": "8:53:54", "remaining_time": "7:27:32", "throughput": "3229.76", "total_tokens": 103464960} {"current_steps": 12640, "total_steps": 23217, "loss": 0.747, "learning_rate": 2.152190079027547e-05, "epoch": 1.6332859542576559, "percentage": 54.44, "elapsed_time": "8:54:42", "remaining_time": "7:27:26", "throughput": "3227.55", "total_tokens": 103546880} {"current_steps": 12650, "total_steps": 23217, "loss": 1.056, "learning_rate": 2.148840438763959e-05, "epoch": 1.6345781108670372, "percentage": 54.49, "elapsed_time": "8:55:29", "remaining_time": "7:27:18", "throughput": "3225.35", "total_tokens": 103628800} {"current_steps": 12660, "total_steps": 23217, "loss": 0.9465, "learning_rate": 2.1454914414722417e-05, "epoch": 1.635870267476418, "percentage": 54.53, "elapsed_time": "8:56:16", "remaining_time": "7:27:11", "throughput": "3223.16", "total_tokens": 103710720} {"current_steps": 12670, "total_steps": 23217, "loss": 1.1174, "learning_rate": 2.1421430932843988e-05, "epoch": 1.6371624240857992, "percentage": 54.57, "elapsed_time": "8:57:04", "remaining_time": "7:27:04", "throughput": "3220.97", "total_tokens": 103792640} {"current_steps": 12680, "total_steps": 23217, "loss": 0.6262, "learning_rate": 2.138795400331242e-05, "epoch": 1.6384545806951802, "percentage": 54.62, "elapsed_time": "8:57:51", "remaining_time": "7:26:57", "throughput": "3218.80", "total_tokens": 103874560} {"current_steps": 12690, "total_steps": 23217, "loss": 1.066, "learning_rate": 2.135448368742385e-05, "epoch": 1.6397467373045613, "percentage": 54.66, "elapsed_time": "8:58:38", "remaining_time": "7:26:49", "throughput": "3216.62", "total_tokens": 103956480} {"current_steps": 12700, "total_steps": 23217, "loss": 0.9554, "learning_rate": 2.1321020046462318e-05, "epoch": 1.6410388939139424, "percentage": 54.7, "elapsed_time": "8:59:25", "remaining_time": "7:26:42", "throughput": "3214.46", "total_tokens": 104038400} {"current_steps": 12710, "total_steps": 23217, "loss": 1.0322, "learning_rate": 2.128756314169961e-05, "epoch": 1.6423310505233233, "percentage": 54.74, "elapsed_time": "9:00:12", "remaining_time": "7:26:34", "throughput": "3212.31", "total_tokens": 104120320} {"current_steps": 12720, "total_steps": 23217, "loss": 0.6685, "learning_rate": 2.1254113034395212e-05, "epoch": 1.6436232071327046, "percentage": 54.79, "elapsed_time": "9:01:00", "remaining_time": "7:26:27", "throughput": "3210.16", "total_tokens": 104202240} {"current_steps": 12730, "total_steps": 23217, "loss": 0.7232, "learning_rate": 2.122066978579613e-05, "epoch": 1.6449153637420855, "percentage": 54.83, "elapsed_time": "9:01:47", "remaining_time": "7:26:19", "throughput": "3208.01", "total_tokens": 104284160} {"current_steps": 12740, "total_steps": 23217, "loss": 0.8379, "learning_rate": 2.1187233457136858e-05, "epoch": 1.6462075203514666, "percentage": 54.87, "elapsed_time": "9:02:34", "remaining_time": "7:26:12", "throughput": "3205.87", "total_tokens": 104366080} {"current_steps": 12750, "total_steps": 23217, "loss": 0.7044, "learning_rate": 2.1153804109639157e-05, "epoch": 1.6474996769608476, "percentage": 54.92, "elapsed_time": "9:03:21", "remaining_time": "7:26:04", "throughput": "3203.74", "total_tokens": 104448000} {"current_steps": 12760, "total_steps": 23217, "loss": 0.7293, "learning_rate": 2.1120381804512066e-05, "epoch": 1.6487918335702287, "percentage": 54.96, "elapsed_time": "9:04:09", "remaining_time": "7:25:56", "throughput": "3201.61", "total_tokens": 104529920} {"current_steps": 12770, "total_steps": 23217, "loss": 0.9354, "learning_rate": 2.1086966602951696e-05, "epoch": 1.6500839901796098, "percentage": 55.0, "elapsed_time": "9:04:56", "remaining_time": "7:25:48", "throughput": "3199.49", "total_tokens": 104611840} {"current_steps": 12780, "total_steps": 23217, "loss": 0.699, "learning_rate": 2.105355856614115e-05, "epoch": 1.6513761467889907, "percentage": 55.05, "elapsed_time": "9:05:43", "remaining_time": "7:25:40", "throughput": "3197.38", "total_tokens": 104693760} {"current_steps": 12790, "total_steps": 23217, "loss": 0.6137, "learning_rate": 2.1020157755250437e-05, "epoch": 1.652668303398372, "percentage": 55.09, "elapsed_time": "9:06:30", "remaining_time": "7:25:32", "throughput": "3195.26", "total_tokens": 104775680} {"current_steps": 12800, "total_steps": 23217, "loss": 0.8616, "learning_rate": 2.09867642314363e-05, "epoch": 1.6539604600077529, "percentage": 55.13, "elapsed_time": "9:07:18", "remaining_time": "7:25:24", "throughput": "3193.15", "total_tokens": 104857600} {"current_steps": 12810, "total_steps": 23217, "loss": 0.668, "learning_rate": 2.0953378055842183e-05, "epoch": 1.655252616617134, "percentage": 55.18, "elapsed_time": "9:08:05", "remaining_time": "7:25:16", "throughput": "3191.05", "total_tokens": 104939520} {"current_steps": 12820, "total_steps": 23217, "loss": 0.961, "learning_rate": 2.0919999289598027e-05, "epoch": 1.656544773226515, "percentage": 55.22, "elapsed_time": "9:08:52", "remaining_time": "7:25:08", "throughput": "3188.95", "total_tokens": 105021440} {"current_steps": 12830, "total_steps": 23217, "loss": 0.6605, "learning_rate": 2.088662799382024e-05, "epoch": 1.6578369298358961, "percentage": 55.26, "elapsed_time": "9:09:40", "remaining_time": "7:25:00", "throughput": "3186.87", "total_tokens": 105103360} {"current_steps": 12840, "total_steps": 23217, "loss": 1.176, "learning_rate": 2.0853264229611557e-05, "epoch": 1.6591290864452772, "percentage": 55.3, "elapsed_time": "9:10:27", "remaining_time": "7:24:51", "throughput": "3184.79", "total_tokens": 105185280} {"current_steps": 12850, "total_steps": 23217, "loss": 0.9159, "learning_rate": 2.081990805806089e-05, "epoch": 1.660421243054658, "percentage": 55.35, "elapsed_time": "9:11:14", "remaining_time": "7:24:43", "throughput": "3182.71", "total_tokens": 105267200} {"current_steps": 12860, "total_steps": 23217, "loss": 0.6293, "learning_rate": 2.078655954024327e-05, "epoch": 1.6617133996640394, "percentage": 55.39, "elapsed_time": "9:12:02", "remaining_time": "7:24:35", "throughput": "3180.63", "total_tokens": 105349120} {"current_steps": 12870, "total_steps": 23217, "loss": 0.7573, "learning_rate": 2.075321873721972e-05, "epoch": 1.6630055562734203, "percentage": 55.43, "elapsed_time": "9:12:49", "remaining_time": "7:24:26", "throughput": "3178.57", "total_tokens": 105431040} {"current_steps": 12880, "total_steps": 23217, "loss": 0.4979, "learning_rate": 2.0719885710037122e-05, "epoch": 1.6642977128828014, "percentage": 55.48, "elapsed_time": "9:13:36", "remaining_time": "7:24:18", "throughput": "3176.51", "total_tokens": 105512960} {"current_steps": 12890, "total_steps": 23217, "loss": 1.026, "learning_rate": 2.0686560519728117e-05, "epoch": 1.6655898694921825, "percentage": 55.52, "elapsed_time": "9:14:23", "remaining_time": "7:24:09", "throughput": "3174.45", "total_tokens": 105594880} {"current_steps": 12900, "total_steps": 23217, "loss": 0.5754, "learning_rate": 2.0653243227311014e-05, "epoch": 1.6668820261015636, "percentage": 55.56, "elapsed_time": "9:15:11", "remaining_time": "7:24:01", "throughput": "3172.41", "total_tokens": 105676800} {"current_steps": 12910, "total_steps": 23217, "loss": 0.8647, "learning_rate": 2.0619933893789673e-05, "epoch": 1.6681741827109446, "percentage": 55.61, "elapsed_time": "9:15:58", "remaining_time": "7:23:52", "throughput": "3170.38", "total_tokens": 105758720} {"current_steps": 12920, "total_steps": 23217, "loss": 1.2784, "learning_rate": 2.0586632580153328e-05, "epoch": 1.6694663393203255, "percentage": 55.65, "elapsed_time": "9:16:45", "remaining_time": "7:23:43", "throughput": "3168.35", "total_tokens": 105840640} {"current_steps": 12930, "total_steps": 23217, "loss": 0.8836, "learning_rate": 2.0553339347376592e-05, "epoch": 1.6707584959297068, "percentage": 55.69, "elapsed_time": "9:17:32", "remaining_time": "7:23:34", "throughput": "3166.33", "total_tokens": 105922560} {"current_steps": 12940, "total_steps": 23217, "loss": 0.909, "learning_rate": 2.0520054256419236e-05, "epoch": 1.6720506525390877, "percentage": 55.74, "elapsed_time": "9:18:20", "remaining_time": "7:23:25", "throughput": "3164.30", "total_tokens": 106004480} {"current_steps": 12950, "total_steps": 23217, "loss": 0.7516, "learning_rate": 2.0486777368226143e-05, "epoch": 1.6733428091484688, "percentage": 55.78, "elapsed_time": "9:19:07", "remaining_time": "7:23:17", "throughput": "3162.28", "total_tokens": 106086400} {"current_steps": 12960, "total_steps": 23217, "loss": 0.977, "learning_rate": 2.045350874372717e-05, "epoch": 1.6746349657578499, "percentage": 55.82, "elapsed_time": "9:19:54", "remaining_time": "7:23:07", "throughput": "3160.27", "total_tokens": 106168320} {"current_steps": 12970, "total_steps": 23217, "loss": 0.8461, "learning_rate": 2.0420248443837048e-05, "epoch": 1.675927122367231, "percentage": 55.86, "elapsed_time": "9:20:41", "remaining_time": "7:22:58", "throughput": "3158.27", "total_tokens": 106250240} {"current_steps": 12980, "total_steps": 23217, "loss": 0.7468, "learning_rate": 2.0386996529455276e-05, "epoch": 1.677219278976612, "percentage": 55.91, "elapsed_time": "9:21:29", "remaining_time": "7:22:49", "throughput": "3156.27", "total_tokens": 106332160} {"current_steps": 12990, "total_steps": 23217, "loss": 0.7406, "learning_rate": 2.0353753061465972e-05, "epoch": 1.678511435585993, "percentage": 55.95, "elapsed_time": "9:22:16", "remaining_time": "7:22:40", "throughput": "3154.27", "total_tokens": 106414080} {"current_steps": 13000, "total_steps": 23217, "loss": 0.9977, "learning_rate": 2.0320518100737817e-05, "epoch": 1.6798035921953742, "percentage": 55.99, "elapsed_time": "9:23:03", "remaining_time": "7:22:31", "throughput": "3152.29", "total_tokens": 106496000} {"current_steps": 13010, "total_steps": 23217, "loss": 0.867, "learning_rate": 2.0287291708123888e-05, "epoch": 1.681095748804755, "percentage": 56.04, "elapsed_time": "9:23:55", "remaining_time": "7:22:25", "throughput": "3149.90", "total_tokens": 106577920} {"current_steps": 13020, "total_steps": 23217, "loss": 0.86, "learning_rate": 2.0254073944461603e-05, "epoch": 1.6823879054141362, "percentage": 56.08, "elapsed_time": "9:24:42", "remaining_time": "7:22:16", "throughput": "3147.93", "total_tokens": 106659840} {"current_steps": 13030, "total_steps": 23217, "loss": 0.9676, "learning_rate": 2.0220864870572555e-05, "epoch": 1.6836800620235173, "percentage": 56.12, "elapsed_time": "9:25:29", "remaining_time": "7:22:06", "throughput": "3145.96", "total_tokens": 106741760} {"current_steps": 13040, "total_steps": 23217, "loss": 0.7239, "learning_rate": 2.0187664547262446e-05, "epoch": 1.6849722186328981, "percentage": 56.17, "elapsed_time": "9:26:17", "remaining_time": "7:21:57", "throughput": "3144.00", "total_tokens": 106823680} {"current_steps": 13050, "total_steps": 23217, "loss": 0.9287, "learning_rate": 2.0154473035320936e-05, "epoch": 1.6862643752422795, "percentage": 56.21, "elapsed_time": "9:27:04", "remaining_time": "7:21:47", "throughput": "3142.03", "total_tokens": 106905600} {"current_steps": 13060, "total_steps": 23217, "loss": 0.7107, "learning_rate": 2.0121290395521566e-05, "epoch": 1.6875565318516603, "percentage": 56.25, "elapsed_time": "9:27:51", "remaining_time": "7:21:38", "throughput": "3140.07", "total_tokens": 106987520} {"current_steps": 13070, "total_steps": 23217, "loss": 0.7824, "learning_rate": 2.008811668862164e-05, "epoch": 1.6888486884610416, "percentage": 56.29, "elapsed_time": "9:28:38", "remaining_time": "7:21:28", "throughput": "3138.12", "total_tokens": 107069440} {"current_steps": 13080, "total_steps": 23217, "loss": 0.6419, "learning_rate": 2.0054951975362067e-05, "epoch": 1.6901408450704225, "percentage": 56.34, "elapsed_time": "9:29:26", "remaining_time": "7:21:18", "throughput": "3136.18", "total_tokens": 107151360} {"current_steps": 13090, "total_steps": 23217, "loss": 0.5254, "learning_rate": 2.0021796316467346e-05, "epoch": 1.6914330016798036, "percentage": 56.38, "elapsed_time": "9:30:13", "remaining_time": "7:21:09", "throughput": "3134.24", "total_tokens": 107233280} {"current_steps": 13100, "total_steps": 23217, "loss": 0.6578, "learning_rate": 1.9988649772645346e-05, "epoch": 1.6927251582891847, "percentage": 56.42, "elapsed_time": "9:31:00", "remaining_time": "7:20:59", "throughput": "3132.32", "total_tokens": 107315200} {"current_steps": 13110, "total_steps": 23217, "loss": 0.7578, "learning_rate": 1.995551240458728e-05, "epoch": 1.6940173148985656, "percentage": 56.47, "elapsed_time": "9:31:47", "remaining_time": "7:20:49", "throughput": "3130.40", "total_tokens": 107397120} {"current_steps": 13120, "total_steps": 23217, "loss": 0.6271, "learning_rate": 1.9922384272967535e-05, "epoch": 1.6953094715079469, "percentage": 56.51, "elapsed_time": "9:32:35", "remaining_time": "7:20:39", "throughput": "3128.48", "total_tokens": 107479040} {"current_steps": 13130, "total_steps": 23217, "loss": 0.6214, "learning_rate": 1.9889265438443607e-05, "epoch": 1.6966016281173277, "percentage": 56.55, "elapsed_time": "9:33:22", "remaining_time": "7:20:29", "throughput": "3126.56", "total_tokens": 107560960} {"current_steps": 13140, "total_steps": 23217, "loss": 1.0424, "learning_rate": 1.985615596165597e-05, "epoch": 1.697893784726709, "percentage": 56.6, "elapsed_time": "9:34:09", "remaining_time": "7:20:19", "throughput": "3124.65", "total_tokens": 107642880} {"current_steps": 13150, "total_steps": 23217, "loss": 1.0063, "learning_rate": 1.982305590322793e-05, "epoch": 1.69918594133609, "percentage": 56.64, "elapsed_time": "9:34:56", "remaining_time": "7:20:09", "throughput": "3122.75", "total_tokens": 107724800} {"current_steps": 13160, "total_steps": 23217, "loss": 0.796, "learning_rate": 1.97899653237656e-05, "epoch": 1.700478097945471, "percentage": 56.68, "elapsed_time": "9:35:44", "remaining_time": "7:19:58", "throughput": "3120.84", "total_tokens": 107806720} {"current_steps": 13170, "total_steps": 23217, "loss": 0.8084, "learning_rate": 1.9756884283857685e-05, "epoch": 1.701770254554852, "percentage": 56.73, "elapsed_time": "9:36:31", "remaining_time": "7:19:48", "throughput": "3118.94", "total_tokens": 107888640} {"current_steps": 13180, "total_steps": 23217, "loss": 1.0913, "learning_rate": 1.9723812844075473e-05, "epoch": 1.703062411164233, "percentage": 56.77, "elapsed_time": "9:37:18", "remaining_time": "7:19:38", "throughput": "3117.05", "total_tokens": 107970560} {"current_steps": 13190, "total_steps": 23217, "loss": 1.1137, "learning_rate": 1.9690751064972625e-05, "epoch": 1.7043545677736143, "percentage": 56.81, "elapsed_time": "9:38:05", "remaining_time": "7:19:28", "throughput": "3115.16", "total_tokens": 108052480} {"current_steps": 13200, "total_steps": 23217, "loss": 0.9466, "learning_rate": 1.965769900708515e-05, "epoch": 1.7056467243829951, "percentage": 56.85, "elapsed_time": "9:38:53", "remaining_time": "7:19:17", "throughput": "3113.28", "total_tokens": 108134400} {"current_steps": 13210, "total_steps": 23217, "loss": 1.0154, "learning_rate": 1.9624656730931258e-05, "epoch": 1.7069388809923762, "percentage": 56.9, "elapsed_time": "9:39:40", "remaining_time": "7:19:07", "throughput": "3111.40", "total_tokens": 108216320} {"current_steps": 13220, "total_steps": 23217, "loss": 0.9086, "learning_rate": 1.959162429701121e-05, "epoch": 1.7082310376017573, "percentage": 56.94, "elapsed_time": "9:40:27", "remaining_time": "7:18:56", "throughput": "3109.53", "total_tokens": 108298240} {"current_steps": 13230, "total_steps": 23217, "loss": 0.9669, "learning_rate": 1.955860176580729e-05, "epoch": 1.7095231942111384, "percentage": 56.98, "elapsed_time": "9:41:15", "remaining_time": "7:18:46", "throughput": "3107.66", "total_tokens": 108380160} {"current_steps": 13240, "total_steps": 23217, "loss": 0.8869, "learning_rate": 1.9525589197783618e-05, "epoch": 1.7108153508205195, "percentage": 57.03, "elapsed_time": "9:42:02", "remaining_time": "7:18:35", "throughput": "3105.80", "total_tokens": 108462080} {"current_steps": 13250, "total_steps": 23217, "loss": 1.3718, "learning_rate": 1.9492586653386103e-05, "epoch": 1.7121075074299004, "percentage": 57.07, "elapsed_time": "9:42:49", "remaining_time": "7:18:25", "throughput": "3103.95", "total_tokens": 108544000} {"current_steps": 13260, "total_steps": 23217, "loss": 1.1025, "learning_rate": 1.945959419304226e-05, "epoch": 1.7133996640392817, "percentage": 57.11, "elapsed_time": "9:43:36", "remaining_time": "7:18:14", "throughput": "3102.11", "total_tokens": 108625920} {"current_steps": 13270, "total_steps": 23217, "loss": 0.7662, "learning_rate": 1.942661187716118e-05, "epoch": 1.7146918206486625, "percentage": 57.16, "elapsed_time": "9:44:24", "remaining_time": "7:18:03", "throughput": "3100.26", "total_tokens": 108707840} {"current_steps": 13280, "total_steps": 23217, "loss": 0.9356, "learning_rate": 1.9393639766133363e-05, "epoch": 1.7159839772580436, "percentage": 57.2, "elapsed_time": "9:45:11", "remaining_time": "7:17:52", "throughput": "3098.42", "total_tokens": 108789760} {"current_steps": 13290, "total_steps": 23217, "loss": 0.608, "learning_rate": 1.936067792033061e-05, "epoch": 1.7172761338674247, "percentage": 57.24, "elapsed_time": "9:45:58", "remaining_time": "7:17:41", "throughput": "3096.58", "total_tokens": 108871680} {"current_steps": 13300, "total_steps": 23217, "loss": 1.0139, "learning_rate": 1.9327726400105963e-05, "epoch": 1.7185682904768058, "percentage": 57.29, "elapsed_time": "9:46:45", "remaining_time": "7:17:30", "throughput": "3094.75", "total_tokens": 108953600} {"current_steps": 13310, "total_steps": 23217, "loss": 0.7744, "learning_rate": 1.9294785265793514e-05, "epoch": 1.719860447086187, "percentage": 57.33, "elapsed_time": "9:47:33", "remaining_time": "7:17:19", "throughput": "3092.92", "total_tokens": 109035520} {"current_steps": 13320, "total_steps": 23217, "loss": 0.7847, "learning_rate": 1.9261854577708366e-05, "epoch": 1.7211526036955678, "percentage": 57.37, "elapsed_time": "9:48:20", "remaining_time": "7:17:08", "throughput": "3091.10", "total_tokens": 109117440} {"current_steps": 13330, "total_steps": 23217, "loss": 0.9334, "learning_rate": 1.9228934396146486e-05, "epoch": 1.722444760304949, "percentage": 57.41, "elapsed_time": "9:49:07", "remaining_time": "7:16:57", "throughput": "3089.28", "total_tokens": 109199360} {"current_steps": 13340, "total_steps": 23217, "loss": 0.8011, "learning_rate": 1.9196024781384607e-05, "epoch": 1.72373691691433, "percentage": 57.46, "elapsed_time": "9:49:55", "remaining_time": "7:16:46", "throughput": "3087.47", "total_tokens": 109281280} {"current_steps": 13350, "total_steps": 23217, "loss": 0.8737, "learning_rate": 1.9163125793680125e-05, "epoch": 1.725029073523711, "percentage": 57.5, "elapsed_time": "9:50:42", "remaining_time": "7:16:35", "throughput": "3085.66", "total_tokens": 109363200} {"current_steps": 13360, "total_steps": 23217, "loss": 0.5359, "learning_rate": 1.9130237493270948e-05, "epoch": 1.7263212301330921, "percentage": 57.54, "elapsed_time": "9:51:29", "remaining_time": "7:16:24", "throughput": "3083.86", "total_tokens": 109445120} {"current_steps": 13370, "total_steps": 23217, "loss": 0.6703, "learning_rate": 1.9097359940375452e-05, "epoch": 1.7276133867424732, "percentage": 57.59, "elapsed_time": "9:52:16", "remaining_time": "7:16:12", "throughput": "3082.07", "total_tokens": 109527040} {"current_steps": 13380, "total_steps": 23217, "loss": 0.8231, "learning_rate": 1.9064493195192293e-05, "epoch": 1.7289055433518543, "percentage": 57.63, "elapsed_time": "9:53:04", "remaining_time": "7:16:01", "throughput": "3080.27", "total_tokens": 109608960} {"current_steps": 13390, "total_steps": 23217, "loss": 0.7302, "learning_rate": 1.9031637317900386e-05, "epoch": 1.7301976999612352, "percentage": 57.67, "elapsed_time": "9:53:51", "remaining_time": "7:15:50", "throughput": "3078.48", "total_tokens": 109690880} {"current_steps": 13400, "total_steps": 23217, "loss": 0.7282, "learning_rate": 1.8998792368658703e-05, "epoch": 1.7314898565706165, "percentage": 57.72, "elapsed_time": "9:54:38", "remaining_time": "7:15:38", "throughput": "3076.69", "total_tokens": 109772800} {"current_steps": 13410, "total_steps": 23217, "loss": 0.8997, "learning_rate": 1.8965958407606236e-05, "epoch": 1.7327820131799974, "percentage": 57.76, "elapsed_time": "9:55:26", "remaining_time": "7:15:27", "throughput": "3074.92", "total_tokens": 109854720} {"current_steps": 13420, "total_steps": 23217, "loss": 0.8703, "learning_rate": 1.893313549486184e-05, "epoch": 1.7340741697893785, "percentage": 57.8, "elapsed_time": "9:56:13", "remaining_time": "7:15:15", "throughput": "3073.15", "total_tokens": 109936640} {"current_steps": 13430, "total_steps": 23217, "loss": 0.5685, "learning_rate": 1.890032369052415e-05, "epoch": 1.7353663263987595, "percentage": 57.85, "elapsed_time": "9:57:00", "remaining_time": "7:15:03", "throughput": "3071.39", "total_tokens": 110018560} {"current_steps": 13440, "total_steps": 23217, "loss": 0.9621, "learning_rate": 1.8867523054671475e-05, "epoch": 1.7366584830081406, "percentage": 57.89, "elapsed_time": "9:57:47", "remaining_time": "7:14:52", "throughput": "3069.62", "total_tokens": 110100480} {"current_steps": 13450, "total_steps": 23217, "loss": 0.8279, "learning_rate": 1.8834733647361635e-05, "epoch": 1.7379506396175217, "percentage": 57.93, "elapsed_time": "9:58:35", "remaining_time": "7:14:40", "throughput": "3067.86", "total_tokens": 110182400} {"current_steps": 13460, "total_steps": 23217, "loss": 0.6358, "learning_rate": 1.880195552863194e-05, "epoch": 1.7392427962269026, "percentage": 57.97, "elapsed_time": "9:59:22", "remaining_time": "7:14:28", "throughput": "3066.11", "total_tokens": 110264320} {"current_steps": 13470, "total_steps": 23217, "loss": 0.8022, "learning_rate": 1.8769188758498973e-05, "epoch": 1.740534952836284, "percentage": 58.02, "elapsed_time": "10:00:09", "remaining_time": "7:14:16", "throughput": "3064.37", "total_tokens": 110346240} {"current_steps": 13480, "total_steps": 23217, "loss": 0.6169, "learning_rate": 1.8736433396958605e-05, "epoch": 1.7418271094456648, "percentage": 58.06, "elapsed_time": "10:00:56", "remaining_time": "7:14:04", "throughput": "3062.62", "total_tokens": 110428160} {"current_steps": 13490, "total_steps": 23217, "loss": 0.6387, "learning_rate": 1.8703689503985754e-05, "epoch": 1.7431192660550459, "percentage": 58.1, "elapsed_time": "10:01:43", "remaining_time": "7:13:52", "throughput": "3060.88", "total_tokens": 110510080} {"current_steps": 13500, "total_steps": 23217, "loss": 1.0567, "learning_rate": 1.867095713953439e-05, "epoch": 1.744411422664427, "percentage": 58.15, "elapsed_time": "10:02:31", "remaining_time": "7:13:40", "throughput": "3059.16", "total_tokens": 110592000} {"current_steps": 13510, "total_steps": 23217, "loss": 0.5526, "learning_rate": 1.8638236363537348e-05, "epoch": 1.745703579273808, "percentage": 58.19, "elapsed_time": "10:03:18", "remaining_time": "7:13:28", "throughput": "3057.42", "total_tokens": 110673920} {"current_steps": 13520, "total_steps": 23217, "loss": 0.987, "learning_rate": 1.8605527235906235e-05, "epoch": 1.7469957358831891, "percentage": 58.23, "elapsed_time": "10:04:05", "remaining_time": "7:13:16", "throughput": "3055.69", "total_tokens": 110755840} {"current_steps": 13530, "total_steps": 23217, "loss": 0.604, "learning_rate": 1.8572829816531364e-05, "epoch": 1.74828789249257, "percentage": 58.28, "elapsed_time": "10:04:53", "remaining_time": "7:13:04", "throughput": "3053.96", "total_tokens": 110837760} {"current_steps": 13540, "total_steps": 23217, "loss": 0.6048, "learning_rate": 1.854014416528157e-05, "epoch": 1.7495800491019513, "percentage": 58.32, "elapsed_time": "10:05:40", "remaining_time": "7:12:52", "throughput": "3052.24", "total_tokens": 110919680} {"current_steps": 13550, "total_steps": 23217, "loss": 0.8796, "learning_rate": 1.8507470342004182e-05, "epoch": 1.7508722057113322, "percentage": 58.36, "elapsed_time": "10:06:27", "remaining_time": "7:12:40", "throughput": "3050.53", "total_tokens": 111001600} {"current_steps": 13560, "total_steps": 23217, "loss": 0.8039, "learning_rate": 1.847480840652483e-05, "epoch": 1.7521643623207133, "percentage": 58.41, "elapsed_time": "10:07:14", "remaining_time": "7:12:27", "throughput": "3048.82", "total_tokens": 111083520} {"current_steps": 13570, "total_steps": 23217, "loss": 0.6875, "learning_rate": 1.844215841864741e-05, "epoch": 1.7534565189300944, "percentage": 58.45, "elapsed_time": "10:08:02", "remaining_time": "7:12:15", "throughput": "3047.12", "total_tokens": 111165440} {"current_steps": 13580, "total_steps": 23217, "loss": 0.9024, "learning_rate": 1.8409520438153933e-05, "epoch": 1.7547486755394752, "percentage": 58.49, "elapsed_time": "10:08:49", "remaining_time": "7:12:02", "throughput": "3045.42", "total_tokens": 111247360} {"current_steps": 13590, "total_steps": 23217, "loss": 0.6588, "learning_rate": 1.8376894524804416e-05, "epoch": 1.7560408321488565, "percentage": 58.53, "elapsed_time": "10:09:36", "remaining_time": "7:11:50", "throughput": "3043.73", "total_tokens": 111329280} {"current_steps": 13600, "total_steps": 23217, "loss": 0.9931, "learning_rate": 1.8344280738336796e-05, "epoch": 1.7573329887582374, "percentage": 58.58, "elapsed_time": "10:10:23", "remaining_time": "7:11:37", "throughput": "3042.03", "total_tokens": 111411200} {"current_steps": 13610, "total_steps": 23217, "loss": 0.9949, "learning_rate": 1.8311679138466772e-05, "epoch": 1.7586251453676187, "percentage": 58.62, "elapsed_time": "10:11:11", "remaining_time": "7:11:25", "throughput": "3040.35", "total_tokens": 111493120} {"current_steps": 13620, "total_steps": 23217, "loss": 1.0308, "learning_rate": 1.827908978488779e-05, "epoch": 1.7599173019769996, "percentage": 58.66, "elapsed_time": "10:11:58", "remaining_time": "7:11:12", "throughput": "3038.67", "total_tokens": 111575040} {"current_steps": 13630, "total_steps": 23217, "loss": 0.996, "learning_rate": 1.8246512737270798e-05, "epoch": 1.7612094585863807, "percentage": 58.71, "elapsed_time": "10:12:45", "remaining_time": "7:11:00", "throughput": "3036.99", "total_tokens": 111656960} {"current_steps": 13640, "total_steps": 23217, "loss": 1.0672, "learning_rate": 1.8213948055264278e-05, "epoch": 1.7625016151957618, "percentage": 58.75, "elapsed_time": "10:13:32", "remaining_time": "7:10:47", "throughput": "3035.32", "total_tokens": 111738880} {"current_steps": 13650, "total_steps": 23217, "loss": 0.5107, "learning_rate": 1.8181395798494048e-05, "epoch": 1.7637937718051426, "percentage": 58.79, "elapsed_time": "10:14:20", "remaining_time": "7:10:34", "throughput": "3033.65", "total_tokens": 111820800} {"current_steps": 13660, "total_steps": 23217, "loss": 1.0283, "learning_rate": 1.8148856026563148e-05, "epoch": 1.765085928414524, "percentage": 58.84, "elapsed_time": "10:15:07", "remaining_time": "7:10:21", "throughput": "3031.98", "total_tokens": 111902720} {"current_steps": 13670, "total_steps": 23217, "loss": 0.9913, "learning_rate": 1.81163287990518e-05, "epoch": 1.7663780850239048, "percentage": 58.88, "elapsed_time": "10:15:54", "remaining_time": "7:10:08", "throughput": "3030.32", "total_tokens": 111984640} {"current_steps": 13680, "total_steps": 23217, "loss": 0.5184, "learning_rate": 1.8083814175517234e-05, "epoch": 1.767670241633286, "percentage": 58.92, "elapsed_time": "10:16:42", "remaining_time": "7:09:55", "throughput": "3028.66", "total_tokens": 112066560} {"current_steps": 13690, "total_steps": 23217, "loss": 0.962, "learning_rate": 1.80513122154936e-05, "epoch": 1.768962398242667, "percentage": 58.97, "elapsed_time": "10:17:29", "remaining_time": "7:09:43", "throughput": "3027.00", "total_tokens": 112148480} {"current_steps": 13700, "total_steps": 23217, "loss": 0.6034, "learning_rate": 1.8018822978491872e-05, "epoch": 1.770254554852048, "percentage": 59.01, "elapsed_time": "10:18:16", "remaining_time": "7:09:30", "throughput": "3025.35", "total_tokens": 112230400} {"current_steps": 13710, "total_steps": 23217, "loss": 0.8974, "learning_rate": 1.798634652399972e-05, "epoch": 1.7715467114614292, "percentage": 59.05, "elapsed_time": "10:19:03", "remaining_time": "7:09:16", "throughput": "3023.70", "total_tokens": 112312320} {"current_steps": 13720, "total_steps": 23217, "loss": 1.0047, "learning_rate": 1.795388291148143e-05, "epoch": 1.77283886807081, "percentage": 59.09, "elapsed_time": "10:19:51", "remaining_time": "7:09:03", "throughput": "3022.07", "total_tokens": 112394240} {"current_steps": 13730, "total_steps": 23217, "loss": 0.608, "learning_rate": 1.7921432200377734e-05, "epoch": 1.7741310246801913, "percentage": 59.14, "elapsed_time": "10:20:38", "remaining_time": "7:08:50", "throughput": "3020.44", "total_tokens": 112476160} {"current_steps": 13740, "total_steps": 23217, "loss": 1.2077, "learning_rate": 1.7888994450105788e-05, "epoch": 1.7754231812895722, "percentage": 59.18, "elapsed_time": "10:21:25", "remaining_time": "7:08:37", "throughput": "3018.81", "total_tokens": 112558080} {"current_steps": 13750, "total_steps": 23217, "loss": 1.0667, "learning_rate": 1.785656972005897e-05, "epoch": 1.7767153378989533, "percentage": 59.22, "elapsed_time": "10:22:12", "remaining_time": "7:08:23", "throughput": "3017.19", "total_tokens": 112640000} {"current_steps": 13760, "total_steps": 23217, "loss": 0.8964, "learning_rate": 1.7824158069606867e-05, "epoch": 1.7780074945083344, "percentage": 59.27, "elapsed_time": "10:23:00", "remaining_time": "7:08:10", "throughput": "3015.56", "total_tokens": 112721920} {"current_steps": 13770, "total_steps": 23217, "loss": 0.6691, "learning_rate": 1.7791759558095077e-05, "epoch": 1.7792996511177155, "percentage": 59.31, "elapsed_time": "10:23:47", "remaining_time": "7:07:57", "throughput": "3013.94", "total_tokens": 112803840} {"current_steps": 13780, "total_steps": 23217, "loss": 0.9059, "learning_rate": 1.775937424484515e-05, "epoch": 1.7805918077270966, "percentage": 59.35, "elapsed_time": "10:24:34", "remaining_time": "7:07:43", "throughput": "3012.32", "total_tokens": 112885760} {"current_steps": 13790, "total_steps": 23217, "loss": 0.724, "learning_rate": 1.7727002189154502e-05, "epoch": 1.7818839643364774, "percentage": 59.4, "elapsed_time": "10:25:22", "remaining_time": "7:07:30", "throughput": "3010.70", "total_tokens": 112967680} {"current_steps": 13800, "total_steps": 23217, "loss": 1.064, "learning_rate": 1.7694643450296216e-05, "epoch": 1.7831761209458588, "percentage": 59.44, "elapsed_time": "10:26:09", "remaining_time": "7:07:16", "throughput": "3009.10", "total_tokens": 113049600} {"current_steps": 13810, "total_steps": 23217, "loss": 0.9433, "learning_rate": 1.7662298087519052e-05, "epoch": 1.7844682775552396, "percentage": 59.48, "elapsed_time": "10:26:56", "remaining_time": "7:07:03", "throughput": "3007.50", "total_tokens": 113131520} {"current_steps": 13820, "total_steps": 23217, "loss": 0.8747, "learning_rate": 1.762996616004723e-05, "epoch": 1.7857604341646207, "percentage": 59.53, "elapsed_time": "10:27:43", "remaining_time": "7:06:49", "throughput": "3005.91", "total_tokens": 113213440} {"current_steps": 13830, "total_steps": 23217, "loss": 0.9011, "learning_rate": 1.7597647727080408e-05, "epoch": 1.7870525907740018, "percentage": 59.57, "elapsed_time": "10:28:30", "remaining_time": "7:06:35", "throughput": "3004.31", "total_tokens": 113295360} {"current_steps": 13840, "total_steps": 23217, "loss": 0.9851, "learning_rate": 1.7565342847793502e-05, "epoch": 1.788344747383383, "percentage": 59.61, "elapsed_time": "10:29:18", "remaining_time": "7:06:22", "throughput": "3002.73", "total_tokens": 113377280} {"current_steps": 13850, "total_steps": 23217, "loss": 0.9077, "learning_rate": 1.7533051581336644e-05, "epoch": 1.789636903992764, "percentage": 59.65, "elapsed_time": "10:30:05", "remaining_time": "7:06:08", "throughput": "3001.15", "total_tokens": 113459200} {"current_steps": 13860, "total_steps": 23217, "loss": 0.9925, "learning_rate": 1.7500773986835013e-05, "epoch": 1.7909290606021449, "percentage": 59.7, "elapsed_time": "10:30:52", "remaining_time": "7:05:54", "throughput": "2999.57", "total_tokens": 113541120} {"current_steps": 13870, "total_steps": 23217, "loss": 0.7818, "learning_rate": 1.7468510123388775e-05, "epoch": 1.7922212172115262, "percentage": 59.74, "elapsed_time": "10:31:39", "remaining_time": "7:05:40", "throughput": "2997.99", "total_tokens": 113623040} {"current_steps": 13880, "total_steps": 23217, "loss": 0.9479, "learning_rate": 1.743626005007294e-05, "epoch": 1.793513373820907, "percentage": 59.78, "elapsed_time": "10:32:26", "remaining_time": "7:05:26", "throughput": "2996.42", "total_tokens": 113704960} {"current_steps": 13890, "total_steps": 23217, "loss": 0.9624, "learning_rate": 1.740402382593727e-05, "epoch": 1.7948055304302881, "percentage": 59.83, "elapsed_time": "10:33:14", "remaining_time": "7:05:12", "throughput": "2994.85", "total_tokens": 113786880} {"current_steps": 13900, "total_steps": 23217, "loss": 0.9844, "learning_rate": 1.7371801510006193e-05, "epoch": 1.7960976870396692, "percentage": 59.87, "elapsed_time": "10:34:01", "remaining_time": "7:04:58", "throughput": "2993.28", "total_tokens": 113868800} {"current_steps": 13910, "total_steps": 23217, "loss": 0.8112, "learning_rate": 1.733959316127862e-05, "epoch": 1.7973898436490503, "percentage": 59.91, "elapsed_time": "10:34:48", "remaining_time": "7:04:44", "throughput": "2991.72", "total_tokens": 113950720} {"current_steps": 13920, "total_steps": 23217, "loss": 0.9197, "learning_rate": 1.730739883872795e-05, "epoch": 1.7986820002584314, "percentage": 59.96, "elapsed_time": "10:35:35", "remaining_time": "7:04:30", "throughput": "2990.16", "total_tokens": 114032640} {"current_steps": 13930, "total_steps": 23217, "loss": 0.6208, "learning_rate": 1.7275218601301848e-05, "epoch": 1.7999741568678123, "percentage": 60.0, "elapsed_time": "10:36:23", "remaining_time": "7:04:16", "throughput": "2988.60", "total_tokens": 114114560} {"current_steps": 13940, "total_steps": 23217, "loss": 0.9374, "learning_rate": 1.7243052507922226e-05, "epoch": 1.8012663134771936, "percentage": 60.04, "elapsed_time": "10:37:10", "remaining_time": "7:04:02", "throughput": "2987.05", "total_tokens": 114196480} {"current_steps": 13950, "total_steps": 23217, "loss": 1.0343, "learning_rate": 1.7210900617485075e-05, "epoch": 1.8025584700865744, "percentage": 60.09, "elapsed_time": "10:37:57", "remaining_time": "7:03:47", "throughput": "2985.50", "total_tokens": 114278400} {"current_steps": 13960, "total_steps": 23217, "loss": 0.8684, "learning_rate": 1.7178762988860393e-05, "epoch": 1.8038506266959555, "percentage": 60.13, "elapsed_time": "10:38:45", "remaining_time": "7:03:33", "throughput": "2983.96", "total_tokens": 114360320} {"current_steps": 13970, "total_steps": 23217, "loss": 1.0918, "learning_rate": 1.7146639680892062e-05, "epoch": 1.8051427833053366, "percentage": 60.17, "elapsed_time": "10:39:32", "remaining_time": "7:03:19", "throughput": "2982.42", "total_tokens": 114442240} {"current_steps": 13980, "total_steps": 23217, "loss": 0.7429, "learning_rate": 1.711453075239773e-05, "epoch": 1.8064349399147177, "percentage": 60.21, "elapsed_time": "10:40:19", "remaining_time": "7:03:04", "throughput": "2980.89", "total_tokens": 114524160} {"current_steps": 13990, "total_steps": 23217, "loss": 0.7727, "learning_rate": 1.7082436262168745e-05, "epoch": 1.8077270965240988, "percentage": 60.26, "elapsed_time": "10:41:06", "remaining_time": "7:02:50", "throughput": "2979.36", "total_tokens": 114606080} {"current_steps": 14000, "total_steps": 23217, "loss": 1.0647, "learning_rate": 1.705035626896998e-05, "epoch": 1.8090192531334797, "percentage": 60.3, "elapsed_time": "10:41:53", "remaining_time": "7:02:35", "throughput": "2977.83", "total_tokens": 114688000} {"current_steps": 14010, "total_steps": 23217, "loss": 0.7367, "learning_rate": 1.7018290831539795e-05, "epoch": 1.810311409742861, "percentage": 60.34, "elapsed_time": "10:42:46", "remaining_time": "7:02:24", "throughput": "2975.88", "total_tokens": 114769920} {"current_steps": 14020, "total_steps": 23217, "loss": 0.9311, "learning_rate": 1.6986240008589903e-05, "epoch": 1.8116035663522418, "percentage": 60.39, "elapsed_time": "10:43:34", "remaining_time": "7:02:10", "throughput": "2974.35", "total_tokens": 114851840} {"current_steps": 14030, "total_steps": 23217, "loss": 0.9413, "learning_rate": 1.695420385880522e-05, "epoch": 1.812895722961623, "percentage": 60.43, "elapsed_time": "10:44:21", "remaining_time": "7:01:55", "throughput": "2972.83", "total_tokens": 114933760} {"current_steps": 14040, "total_steps": 23217, "loss": 0.7935, "learning_rate": 1.6922182440843843e-05, "epoch": 1.814187879571004, "percentage": 60.47, "elapsed_time": "10:45:08", "remaining_time": "7:01:41", "throughput": "2971.32", "total_tokens": 115015680} {"current_steps": 14050, "total_steps": 23217, "loss": 0.9507, "learning_rate": 1.689017581333685e-05, "epoch": 1.8154800361803851, "percentage": 60.52, "elapsed_time": "10:45:55", "remaining_time": "7:01:26", "throughput": "2969.81", "total_tokens": 115097600} {"current_steps": 14060, "total_steps": 23217, "loss": 1.1626, "learning_rate": 1.685818403488827e-05, "epoch": 1.8167721927897662, "percentage": 60.56, "elapsed_time": "10:46:43", "remaining_time": "7:01:11", "throughput": "2968.31", "total_tokens": 115179520} {"current_steps": 14070, "total_steps": 23217, "loss": 0.4731, "learning_rate": 1.6826207164074924e-05, "epoch": 1.818064349399147, "percentage": 60.6, "elapsed_time": "10:47:30", "remaining_time": "7:00:56", "throughput": "2966.80", "total_tokens": 115261440} {"current_steps": 14080, "total_steps": 23217, "loss": 0.8077, "learning_rate": 1.6794245259446347e-05, "epoch": 1.8193565060085284, "percentage": 60.65, "elapsed_time": "10:48:17", "remaining_time": "7:00:42", "throughput": "2965.30", "total_tokens": 115343360} {"current_steps": 14090, "total_steps": 23217, "loss": 0.8489, "learning_rate": 1.6762298379524684e-05, "epoch": 1.8206486626179093, "percentage": 60.69, "elapsed_time": "10:49:05", "remaining_time": "7:00:27", "throughput": "2963.80", "total_tokens": 115425280} {"current_steps": 14100, "total_steps": 23217, "loss": 0.5274, "learning_rate": 1.6730366582804535e-05, "epoch": 1.8219408192272903, "percentage": 60.73, "elapsed_time": "10:49:52", "remaining_time": "7:00:12", "throughput": "2962.30", "total_tokens": 115507200} {"current_steps": 14110, "total_steps": 23217, "loss": 0.659, "learning_rate": 1.6698449927752924e-05, "epoch": 1.8232329758366714, "percentage": 60.77, "elapsed_time": "10:50:39", "remaining_time": "6:59:57", "throughput": "2960.82", "total_tokens": 115589120} {"current_steps": 14120, "total_steps": 23217, "loss": 1.1145, "learning_rate": 1.6666548472809104e-05, "epoch": 1.8245251324460523, "percentage": 60.82, "elapsed_time": "10:51:26", "remaining_time": "6:59:42", "throughput": "2959.34", "total_tokens": 115671040} {"current_steps": 14130, "total_steps": 23217, "loss": 0.8391, "learning_rate": 1.6634662276384548e-05, "epoch": 1.8258172890554336, "percentage": 60.86, "elapsed_time": "10:52:13", "remaining_time": "6:59:27", "throughput": "2957.86", "total_tokens": 115752960} {"current_steps": 14140, "total_steps": 23217, "loss": 0.802, "learning_rate": 1.660279139686275e-05, "epoch": 1.8271094456648145, "percentage": 60.9, "elapsed_time": "10:53:01", "remaining_time": "6:59:11", "throughput": "2956.39", "total_tokens": 115834880} {"current_steps": 14150, "total_steps": 23217, "loss": 0.7398, "learning_rate": 1.657093589259917e-05, "epoch": 1.8284016022741958, "percentage": 60.95, "elapsed_time": "10:53:48", "remaining_time": "6:58:56", "throughput": "2954.91", "total_tokens": 115916800} {"current_steps": 14160, "total_steps": 23217, "loss": 0.8751, "learning_rate": 1.6539095821921136e-05, "epoch": 1.8296937588835767, "percentage": 60.99, "elapsed_time": "10:54:35", "remaining_time": "6:58:41", "throughput": "2953.45", "total_tokens": 115998720} {"current_steps": 14170, "total_steps": 23217, "loss": 0.7839, "learning_rate": 1.650727124312768e-05, "epoch": 1.8309859154929577, "percentage": 61.03, "elapsed_time": "10:55:22", "remaining_time": "6:58:26", "throughput": "2951.99", "total_tokens": 116080640} {"current_steps": 14180, "total_steps": 23217, "loss": 0.8393, "learning_rate": 1.6475462214489513e-05, "epoch": 1.8322780721023388, "percentage": 61.08, "elapsed_time": "10:56:10", "remaining_time": "6:58:10", "throughput": "2950.53", "total_tokens": 116162560} {"current_steps": 14190, "total_steps": 23217, "loss": 0.6922, "learning_rate": 1.6443668794248828e-05, "epoch": 1.8335702287117197, "percentage": 61.12, "elapsed_time": "10:56:57", "remaining_time": "6:57:55", "throughput": "2949.07", "total_tokens": 116244480} {"current_steps": 14200, "total_steps": 23217, "loss": 0.9365, "learning_rate": 1.641189104061928e-05, "epoch": 1.834862385321101, "percentage": 61.16, "elapsed_time": "10:57:44", "remaining_time": "6:57:40", "throughput": "2947.61", "total_tokens": 116326400} {"current_steps": 14210, "total_steps": 23217, "loss": 0.8715, "learning_rate": 1.63801290117858e-05, "epoch": 1.8361545419304819, "percentage": 61.21, "elapsed_time": "10:58:31", "remaining_time": "6:57:24", "throughput": "2946.16", "total_tokens": 116408320} {"current_steps": 14220, "total_steps": 23217, "loss": 0.8787, "learning_rate": 1.6348382765904567e-05, "epoch": 1.837446698539863, "percentage": 61.25, "elapsed_time": "10:59:19", "remaining_time": "6:57:09", "throughput": "2944.70", "total_tokens": 116490240} {"current_steps": 14230, "total_steps": 23217, "loss": 0.8164, "learning_rate": 1.631665236110283e-05, "epoch": 1.838738855149244, "percentage": 61.29, "elapsed_time": "11:00:06", "remaining_time": "6:56:53", "throughput": "2943.26", "total_tokens": 116572160} {"current_steps": 14240, "total_steps": 23217, "loss": 1.0631, "learning_rate": 1.6284937855478837e-05, "epoch": 1.8400310117586252, "percentage": 61.33, "elapsed_time": "11:00:53", "remaining_time": "6:56:38", "throughput": "2941.81", "total_tokens": 116654080} {"current_steps": 14250, "total_steps": 23217, "loss": 1.008, "learning_rate": 1.6253239307101748e-05, "epoch": 1.8413231683680062, "percentage": 61.38, "elapsed_time": "11:01:41", "remaining_time": "6:56:22", "throughput": "2940.37", "total_tokens": 116736000} {"current_steps": 14260, "total_steps": 23217, "loss": 1.006, "learning_rate": 1.6221556774011474e-05, "epoch": 1.8426153249773871, "percentage": 61.42, "elapsed_time": "11:02:28", "remaining_time": "6:56:06", "throughput": "2938.94", "total_tokens": 116817920} {"current_steps": 14270, "total_steps": 23217, "loss": 0.8024, "learning_rate": 1.6189890314218634e-05, "epoch": 1.8439074815867684, "percentage": 61.46, "elapsed_time": "11:03:15", "remaining_time": "6:55:51", "throughput": "2937.51", "total_tokens": 116899840} {"current_steps": 14280, "total_steps": 23217, "loss": 0.9059, "learning_rate": 1.6158239985704378e-05, "epoch": 1.8451996381961493, "percentage": 61.51, "elapsed_time": "11:04:02", "remaining_time": "6:55:35", "throughput": "2936.08", "total_tokens": 116981760} {"current_steps": 14290, "total_steps": 23217, "loss": 0.7783, "learning_rate": 1.6126605846420366e-05, "epoch": 1.8464917948055304, "percentage": 61.55, "elapsed_time": "11:04:50", "remaining_time": "6:55:19", "throughput": "2934.65", "total_tokens": 117063680} {"current_steps": 14300, "total_steps": 23217, "loss": 0.8708, "learning_rate": 1.609498795428857e-05, "epoch": 1.8477839514149115, "percentage": 61.59, "elapsed_time": "11:05:37", "remaining_time": "6:55:03", "throughput": "2933.23", "total_tokens": 117145600} {"current_steps": 14310, "total_steps": 23217, "loss": 0.4722, "learning_rate": 1.606338636720125e-05, "epoch": 1.8490761080242926, "percentage": 61.64, "elapsed_time": "11:06:24", "remaining_time": "6:54:47", "throughput": "2931.81", "total_tokens": 117227520} {"current_steps": 14320, "total_steps": 23217, "loss": 0.9373, "learning_rate": 1.6031801143020785e-05, "epoch": 1.8503682646336737, "percentage": 61.68, "elapsed_time": "11:07:11", "remaining_time": "6:54:31", "throughput": "2930.40", "total_tokens": 117309440} {"current_steps": 14330, "total_steps": 23217, "loss": 0.9453, "learning_rate": 1.6000232339579616e-05, "epoch": 1.8516604212430545, "percentage": 61.72, "elapsed_time": "11:07:59", "remaining_time": "6:54:15", "throughput": "2928.98", "total_tokens": 117391360} {"current_steps": 14340, "total_steps": 23217, "loss": 0.8859, "learning_rate": 1.5968680014680105e-05, "epoch": 1.8529525778524358, "percentage": 61.77, "elapsed_time": "11:08:46", "remaining_time": "6:53:59", "throughput": "2927.57", "total_tokens": 117473280} {"current_steps": 14350, "total_steps": 23217, "loss": 1.0594, "learning_rate": 1.5937144226094426e-05, "epoch": 1.8542447344618167, "percentage": 61.81, "elapsed_time": "11:09:33", "remaining_time": "6:53:43", "throughput": "2926.16", "total_tokens": 117555200} {"current_steps": 14360, "total_steps": 23217, "loss": 0.8882, "learning_rate": 1.590562503156452e-05, "epoch": 1.8555368910711978, "percentage": 61.85, "elapsed_time": "11:10:21", "remaining_time": "6:53:27", "throughput": "2924.76", "total_tokens": 117637120} {"current_steps": 14370, "total_steps": 23217, "loss": 0.6613, "learning_rate": 1.5874122488801888e-05, "epoch": 1.8568290476805789, "percentage": 61.89, "elapsed_time": "11:11:08", "remaining_time": "6:53:11", "throughput": "2923.37", "total_tokens": 117719040} {"current_steps": 14380, "total_steps": 23217, "loss": 0.6339, "learning_rate": 1.5842636655487585e-05, "epoch": 1.85812120428996, "percentage": 61.94, "elapsed_time": "11:11:55", "remaining_time": "6:52:55", "throughput": "2921.97", "total_tokens": 117800960} {"current_steps": 14390, "total_steps": 23217, "loss": 1.0055, "learning_rate": 1.5811167589272068e-05, "epoch": 1.859413360899341, "percentage": 61.98, "elapsed_time": "11:12:42", "remaining_time": "6:52:39", "throughput": "2920.58", "total_tokens": 117882880} {"current_steps": 14400, "total_steps": 23217, "loss": 0.7919, "learning_rate": 1.577971534777507e-05, "epoch": 1.860705517508722, "percentage": 62.02, "elapsed_time": "11:13:30", "remaining_time": "6:52:22", "throughput": "2919.19", "total_tokens": 117964800} {"current_steps": 14410, "total_steps": 23217, "loss": 0.7019, "learning_rate": 1.5748279988585528e-05, "epoch": 1.8619976741181032, "percentage": 62.07, "elapsed_time": "11:14:17", "remaining_time": "6:52:06", "throughput": "2917.81", "total_tokens": 118046720} {"current_steps": 14420, "total_steps": 23217, "loss": 0.7455, "learning_rate": 1.571686156926147e-05, "epoch": 1.863289830727484, "percentage": 62.11, "elapsed_time": "11:15:04", "remaining_time": "6:51:50", "throughput": "2916.42", "total_tokens": 118128640} {"current_steps": 14430, "total_steps": 23217, "loss": 0.68, "learning_rate": 1.5685460147329917e-05, "epoch": 1.8645819873368652, "percentage": 62.15, "elapsed_time": "11:15:51", "remaining_time": "6:51:33", "throughput": "2915.05", "total_tokens": 118210560} {"current_steps": 14440, "total_steps": 23217, "loss": 0.9481, "learning_rate": 1.5654075780286742e-05, "epoch": 1.8658741439462463, "percentage": 62.2, "elapsed_time": "11:16:39", "remaining_time": "6:51:17", "throughput": "2913.67", "total_tokens": 118292480} {"current_steps": 14450, "total_steps": 23217, "loss": 1.0229, "learning_rate": 1.562270852559661e-05, "epoch": 1.8671663005556274, "percentage": 62.24, "elapsed_time": "11:17:26", "remaining_time": "6:51:00", "throughput": "2912.30", "total_tokens": 118374400} {"current_steps": 14460, "total_steps": 23217, "loss": 1.0381, "learning_rate": 1.5591358440692865e-05, "epoch": 1.8684584571650085, "percentage": 62.28, "elapsed_time": "11:18:13", "remaining_time": "6:50:44", "throughput": "2910.93", "total_tokens": 118456320} {"current_steps": 14470, "total_steps": 23217, "loss": 0.988, "learning_rate": 1.5560025582977377e-05, "epoch": 1.8697506137743893, "percentage": 62.33, "elapsed_time": "11:19:00", "remaining_time": "6:50:27", "throughput": "2909.57", "total_tokens": 118538240} {"current_steps": 14480, "total_steps": 23217, "loss": 1.0819, "learning_rate": 1.5528710009820513e-05, "epoch": 1.8710427703837706, "percentage": 62.37, "elapsed_time": "11:19:48", "remaining_time": "6:50:10", "throughput": "2908.20", "total_tokens": 118620160} {"current_steps": 14490, "total_steps": 23217, "loss": 1.2201, "learning_rate": 1.5497411778560954e-05, "epoch": 1.8723349269931515, "percentage": 62.41, "elapsed_time": "11:20:35", "remaining_time": "6:49:54", "throughput": "2906.84", "total_tokens": 118702080} {"current_steps": 14500, "total_steps": 23217, "loss": 0.7508, "learning_rate": 1.5466130946505664e-05, "epoch": 1.8736270836025326, "percentage": 62.45, "elapsed_time": "11:21:22", "remaining_time": "6:49:37", "throughput": "2905.48", "total_tokens": 118784000} {"current_steps": 14510, "total_steps": 23217, "loss": 0.8983, "learning_rate": 1.5434867570929724e-05, "epoch": 1.8749192402119137, "percentage": 62.5, "elapsed_time": "11:22:09", "remaining_time": "6:49:20", "throughput": "2904.13", "total_tokens": 118865920} {"current_steps": 14520, "total_steps": 23217, "loss": 0.6051, "learning_rate": 1.5403621709076247e-05, "epoch": 1.8762113968212948, "percentage": 62.54, "elapsed_time": "11:22:57", "remaining_time": "6:49:03", "throughput": "2902.78", "total_tokens": 118947840} {"current_steps": 14530, "total_steps": 23217, "loss": 0.7321, "learning_rate": 1.5372393418156323e-05, "epoch": 1.8775035534306759, "percentage": 62.58, "elapsed_time": "11:23:44", "remaining_time": "6:48:47", "throughput": "2901.43", "total_tokens": 119029760} {"current_steps": 14540, "total_steps": 23217, "loss": 0.887, "learning_rate": 1.5341182755348806e-05, "epoch": 1.8787957100400567, "percentage": 62.63, "elapsed_time": "11:24:31", "remaining_time": "6:48:30", "throughput": "2900.09", "total_tokens": 119111680} {"current_steps": 14550, "total_steps": 23217, "loss": 0.7769, "learning_rate": 1.530998977780033e-05, "epoch": 1.880087866649438, "percentage": 62.67, "elapsed_time": "11:25:18", "remaining_time": "6:48:13", "throughput": "2898.75", "total_tokens": 119193600} {"current_steps": 14560, "total_steps": 23217, "loss": 0.7488, "learning_rate": 1.5278814542625107e-05, "epoch": 1.881380023258819, "percentage": 62.71, "elapsed_time": "11:26:06", "remaining_time": "6:47:56", "throughput": "2897.41", "total_tokens": 119275520} {"current_steps": 14570, "total_steps": 23217, "loss": 0.8852, "learning_rate": 1.5247657106904891e-05, "epoch": 1.8826721798682, "percentage": 62.76, "elapsed_time": "11:26:53", "remaining_time": "6:47:39", "throughput": "2896.08", "total_tokens": 119357440} {"current_steps": 14580, "total_steps": 23217, "loss": 0.8831, "learning_rate": 1.5216517527688818e-05, "epoch": 1.883964336477581, "percentage": 62.8, "elapsed_time": "11:27:40", "remaining_time": "6:47:22", "throughput": "2894.74", "total_tokens": 119439360} {"current_steps": 14590, "total_steps": 23217, "loss": 0.8191, "learning_rate": 1.5185395861993353e-05, "epoch": 1.8852564930869622, "percentage": 62.84, "elapsed_time": "11:28:28", "remaining_time": "6:47:05", "throughput": "2893.41", "total_tokens": 119521280} {"current_steps": 14600, "total_steps": 23217, "loss": 0.9853, "learning_rate": 1.515429216680216e-05, "epoch": 1.8865486496963433, "percentage": 62.88, "elapsed_time": "11:29:15", "remaining_time": "6:46:48", "throughput": "2892.09", "total_tokens": 119603200} {"current_steps": 14610, "total_steps": 23217, "loss": 0.9514, "learning_rate": 1.5123206499065967e-05, "epoch": 1.8878408063057242, "percentage": 62.93, "elapsed_time": "11:30:02", "remaining_time": "6:46:30", "throughput": "2890.77", "total_tokens": 119685120} {"current_steps": 14620, "total_steps": 23217, "loss": 1.2975, "learning_rate": 1.5092138915702545e-05, "epoch": 1.8891329629151055, "percentage": 62.97, "elapsed_time": "11:30:49", "remaining_time": "6:46:13", "throughput": "2889.45", "total_tokens": 119767040} {"current_steps": 14630, "total_steps": 23217, "loss": 0.8597, "learning_rate": 1.5061089473596501e-05, "epoch": 1.8904251195244863, "percentage": 63.01, "elapsed_time": "11:31:37", "remaining_time": "6:45:56", "throughput": "2888.13", "total_tokens": 119848960} {"current_steps": 14640, "total_steps": 23217, "loss": 0.7876, "learning_rate": 1.5030058229599275e-05, "epoch": 1.8917172761338674, "percentage": 63.06, "elapsed_time": "11:32:24", "remaining_time": "6:45:39", "throughput": "2886.82", "total_tokens": 119930880} {"current_steps": 14650, "total_steps": 23217, "loss": 0.4448, "learning_rate": 1.4999045240528935e-05, "epoch": 1.8930094327432485, "percentage": 63.1, "elapsed_time": "11:33:11", "remaining_time": "6:45:21", "throughput": "2885.51", "total_tokens": 120012800} {"current_steps": 14660, "total_steps": 23217, "loss": 0.9315, "learning_rate": 1.4968050563170177e-05, "epoch": 1.8943015893526294, "percentage": 63.14, "elapsed_time": "11:33:58", "remaining_time": "6:45:04", "throughput": "2884.20", "total_tokens": 120094720} {"current_steps": 14670, "total_steps": 23217, "loss": 1.0145, "learning_rate": 1.4937074254274117e-05, "epoch": 1.8955937459620107, "percentage": 63.19, "elapsed_time": "11:34:46", "remaining_time": "6:44:47", "throughput": "2882.89", "total_tokens": 120176640} {"current_steps": 14680, "total_steps": 23217, "loss": 0.6827, "learning_rate": 1.4906116370558276e-05, "epoch": 1.8968859025713916, "percentage": 63.23, "elapsed_time": "11:35:33", "remaining_time": "6:44:29", "throughput": "2881.59", "total_tokens": 120258560} {"current_steps": 14690, "total_steps": 23217, "loss": 0.8853, "learning_rate": 1.4875176968706434e-05, "epoch": 1.8981780591807729, "percentage": 63.27, "elapsed_time": "11:36:20", "remaining_time": "6:44:12", "throughput": "2880.28", "total_tokens": 120340480} {"current_steps": 14700, "total_steps": 23217, "loss": 0.7183, "learning_rate": 1.4844256105368504e-05, "epoch": 1.8994702157901537, "percentage": 63.32, "elapsed_time": "11:37:07", "remaining_time": "6:43:54", "throughput": "2878.99", "total_tokens": 120422400} {"current_steps": 14710, "total_steps": 23217, "loss": 0.5776, "learning_rate": 1.4813353837160488e-05, "epoch": 1.9007623723995348, "percentage": 63.36, "elapsed_time": "11:37:55", "remaining_time": "6:43:37", "throughput": "2877.70", "total_tokens": 120504320} {"current_steps": 14720, "total_steps": 23217, "loss": 1.1882, "learning_rate": 1.4782470220664313e-05, "epoch": 1.902054529008916, "percentage": 63.4, "elapsed_time": "11:38:42", "remaining_time": "6:43:19", "throughput": "2876.42", "total_tokens": 120586240} {"current_steps": 14730, "total_steps": 23217, "loss": 0.9617, "learning_rate": 1.4751605312427786e-05, "epoch": 1.9033466856182968, "percentage": 63.44, "elapsed_time": "11:39:29", "remaining_time": "6:43:01", "throughput": "2875.13", "total_tokens": 120668160} {"current_steps": 14740, "total_steps": 23217, "loss": 0.8622, "learning_rate": 1.472075916896442e-05, "epoch": 1.904638842227678, "percentage": 63.49, "elapsed_time": "11:40:16", "remaining_time": "6:42:44", "throughput": "2873.84", "total_tokens": 120750080} {"current_steps": 14750, "total_steps": 23217, "loss": 0.9725, "learning_rate": 1.4689931846753402e-05, "epoch": 1.905930998837059, "percentage": 63.53, "elapsed_time": "11:41:04", "remaining_time": "6:42:26", "throughput": "2872.56", "total_tokens": 120832000} {"current_steps": 14760, "total_steps": 23217, "loss": 1.2234, "learning_rate": 1.4659123402239454e-05, "epoch": 1.90722315544644, "percentage": 63.57, "elapsed_time": "11:41:51", "remaining_time": "6:42:08", "throughput": "2871.28", "total_tokens": 120913920} {"current_steps": 14770, "total_steps": 23217, "loss": 0.8926, "learning_rate": 1.4628333891832713e-05, "epoch": 1.9085153120558211, "percentage": 63.62, "elapsed_time": "11:42:38", "remaining_time": "6:41:50", "throughput": "2870.00", "total_tokens": 120995840} {"current_steps": 14780, "total_steps": 23217, "loss": 1.0101, "learning_rate": 1.4597563371908663e-05, "epoch": 1.9098074686652022, "percentage": 63.66, "elapsed_time": "11:43:26", "remaining_time": "6:41:32", "throughput": "2868.73", "total_tokens": 121077760} {"current_steps": 14790, "total_steps": 23217, "loss": 0.9358, "learning_rate": 1.4566811898808013e-05, "epoch": 1.9110996252745833, "percentage": 63.7, "elapsed_time": "11:44:13", "remaining_time": "6:41:14", "throughput": "2867.47", "total_tokens": 121159680} {"current_steps": 14800, "total_steps": 23217, "loss": 0.7874, "learning_rate": 1.4536079528836605e-05, "epoch": 1.9123917818839642, "percentage": 63.75, "elapsed_time": "11:45:00", "remaining_time": "6:40:56", "throughput": "2866.20", "total_tokens": 121241600} {"current_steps": 14810, "total_steps": 23217, "loss": 0.6709, "learning_rate": 1.4505366318265278e-05, "epoch": 1.9136839384933455, "percentage": 63.79, "elapsed_time": "11:45:47", "remaining_time": "6:40:38", "throughput": "2864.94", "total_tokens": 121323520} {"current_steps": 14820, "total_steps": 23217, "loss": 0.6944, "learning_rate": 1.4474672323329819e-05, "epoch": 1.9149760951027264, "percentage": 63.83, "elapsed_time": "11:46:35", "remaining_time": "6:40:21", "throughput": "2863.67", "total_tokens": 121405440} {"current_steps": 14830, "total_steps": 23217, "loss": 0.8012, "learning_rate": 1.4443997600230832e-05, "epoch": 1.9162682517121075, "percentage": 63.88, "elapsed_time": "11:47:22", "remaining_time": "6:40:02", "throughput": "2862.41", "total_tokens": 121487360} {"current_steps": 14840, "total_steps": 23217, "loss": 0.9204, "learning_rate": 1.4413342205133604e-05, "epoch": 1.9175604083214886, "percentage": 63.92, "elapsed_time": "11:48:09", "remaining_time": "6:39:44", "throughput": "2861.16", "total_tokens": 121569280} {"current_steps": 14850, "total_steps": 23217, "loss": 0.6648, "learning_rate": 1.4382706194168066e-05, "epoch": 1.9188525649308696, "percentage": 63.96, "elapsed_time": "11:48:56", "remaining_time": "6:39:26", "throughput": "2859.91", "total_tokens": 121651200} {"current_steps": 14860, "total_steps": 23217, "loss": 0.8368, "learning_rate": 1.4352089623428627e-05, "epoch": 1.9201447215402507, "percentage": 64.0, "elapsed_time": "11:49:44", "remaining_time": "6:39:08", "throughput": "2858.65", "total_tokens": 121733120} {"current_steps": 14870, "total_steps": 23217, "loss": 1.248, "learning_rate": 1.4321492548974137e-05, "epoch": 1.9214368781496316, "percentage": 64.05, "elapsed_time": "11:50:31", "remaining_time": "6:38:50", "throughput": "2857.40", "total_tokens": 121815040} {"current_steps": 14880, "total_steps": 23217, "loss": 1.0932, "learning_rate": 1.42909150268277e-05, "epoch": 1.922729034759013, "percentage": 64.09, "elapsed_time": "11:51:18", "remaining_time": "6:38:32", "throughput": "2856.16", "total_tokens": 121896960} {"current_steps": 14890, "total_steps": 23217, "loss": 0.8562, "learning_rate": 1.4260357112976664e-05, "epoch": 1.9240211913683938, "percentage": 64.13, "elapsed_time": "11:52:06", "remaining_time": "6:38:13", "throughput": "2854.91", "total_tokens": 121978880} {"current_steps": 14900, "total_steps": 23217, "loss": 0.9967, "learning_rate": 1.4229818863372463e-05, "epoch": 1.9253133479777749, "percentage": 64.18, "elapsed_time": "11:52:53", "remaining_time": "6:37:55", "throughput": "2853.67", "total_tokens": 122060800} {"current_steps": 14910, "total_steps": 23217, "loss": 1.2298, "learning_rate": 1.4199300333930515e-05, "epoch": 1.926605504587156, "percentage": 64.22, "elapsed_time": "11:53:40", "remaining_time": "6:37:37", "throughput": "2852.43", "total_tokens": 122142720} {"current_steps": 14920, "total_steps": 23217, "loss": 0.6193, "learning_rate": 1.4168801580530119e-05, "epoch": 1.927897661196537, "percentage": 64.26, "elapsed_time": "11:54:27", "remaining_time": "6:37:18", "throughput": "2851.19", "total_tokens": 122224640} {"current_steps": 14930, "total_steps": 23217, "loss": 0.9493, "learning_rate": 1.4138322659014408e-05, "epoch": 1.9291898178059181, "percentage": 64.31, "elapsed_time": "11:55:15", "remaining_time": "6:37:00", "throughput": "2849.96", "total_tokens": 122306560} {"current_steps": 14940, "total_steps": 23217, "loss": 0.8788, "learning_rate": 1.4107863625190163e-05, "epoch": 1.930481974415299, "percentage": 64.35, "elapsed_time": "11:56:02", "remaining_time": "6:36:41", "throughput": "2848.73", "total_tokens": 122388480} {"current_steps": 14950, "total_steps": 23217, "loss": 0.7922, "learning_rate": 1.4077424534827752e-05, "epoch": 1.9317741310246803, "percentage": 64.39, "elapsed_time": "11:56:49", "remaining_time": "6:36:23", "throughput": "2847.51", "total_tokens": 122470400} {"current_steps": 14960, "total_steps": 23217, "loss": 1.057, "learning_rate": 1.4047005443661048e-05, "epoch": 1.9330662876340612, "percentage": 64.44, "elapsed_time": "11:57:36", "remaining_time": "6:36:04", "throughput": "2846.29", "total_tokens": 122552320} {"current_steps": 14970, "total_steps": 23217, "loss": 0.9366, "learning_rate": 1.4016606407387312e-05, "epoch": 1.9343584442434423, "percentage": 64.48, "elapsed_time": "11:58:24", "remaining_time": "6:35:46", "throughput": "2845.07", "total_tokens": 122634240} {"current_steps": 14980, "total_steps": 23217, "loss": 0.3856, "learning_rate": 1.398622748166704e-05, "epoch": 1.9356506008528234, "percentage": 64.52, "elapsed_time": "11:59:11", "remaining_time": "6:35:27", "throughput": "2843.85", "total_tokens": 122716160} {"current_steps": 14990, "total_steps": 23217, "loss": 0.7705, "learning_rate": 1.3955868722123955e-05, "epoch": 1.9369427574622045, "percentage": 64.56, "elapsed_time": "11:59:58", "remaining_time": "6:35:08", "throughput": "2842.63", "total_tokens": 122798080} {"current_steps": 15000, "total_steps": 23217, "loss": 0.7423, "learning_rate": 1.3925530184344818e-05, "epoch": 1.9382349140715855, "percentage": 64.61, "elapsed_time": "12:00:46", "remaining_time": "6:34:50", "throughput": "2841.42", "total_tokens": 122880000} {"current_steps": 15010, "total_steps": 23217, "loss": 1.0697, "learning_rate": 1.3895211923879397e-05, "epoch": 1.9395270706809664, "percentage": 64.65, "elapsed_time": "12:01:39", "remaining_time": "6:34:34", "throughput": "2839.82", "total_tokens": 122961920} {"current_steps": 15020, "total_steps": 23217, "loss": 0.967, "learning_rate": 1.3864913996240304e-05, "epoch": 1.9408192272903477, "percentage": 64.69, "elapsed_time": "12:02:26", "remaining_time": "6:34:15", "throughput": "2838.62", "total_tokens": 123043840} {"current_steps": 15030, "total_steps": 23217, "loss": 0.8996, "learning_rate": 1.3834636456902944e-05, "epoch": 1.9421113838997286, "percentage": 64.74, "elapsed_time": "12:03:13", "remaining_time": "6:33:56", "throughput": "2837.41", "total_tokens": 123125760} {"current_steps": 15040, "total_steps": 23217, "loss": 0.5727, "learning_rate": 1.3804379361305363e-05, "epoch": 1.9434035405091097, "percentage": 64.78, "elapsed_time": "12:04:00", "remaining_time": "6:33:38", "throughput": "2836.21", "total_tokens": 123207680} {"current_steps": 15050, "total_steps": 23217, "loss": 0.9822, "learning_rate": 1.3774142764848207e-05, "epoch": 1.9446956971184908, "percentage": 64.82, "elapsed_time": "12:04:48", "remaining_time": "6:33:19", "throughput": "2835.00", "total_tokens": 123289600} {"current_steps": 15060, "total_steps": 23217, "loss": 0.7735, "learning_rate": 1.3743926722894579e-05, "epoch": 1.9459878537278719, "percentage": 64.87, "elapsed_time": "12:05:35", "remaining_time": "6:33:00", "throughput": "2833.80", "total_tokens": 123371520} {"current_steps": 15070, "total_steps": 23217, "loss": 1.0148, "learning_rate": 1.3713731290769921e-05, "epoch": 1.947280010337253, "percentage": 64.91, "elapsed_time": "12:06:23", "remaining_time": "6:32:41", "throughput": "2832.60", "total_tokens": 123453440} {"current_steps": 15080, "total_steps": 23217, "loss": 0.8874, "learning_rate": 1.3683556523761981e-05, "epoch": 1.9485721669466338, "percentage": 64.95, "elapsed_time": "12:07:10", "remaining_time": "6:32:22", "throughput": "2831.42", "total_tokens": 123535360} {"current_steps": 15090, "total_steps": 23217, "loss": 0.9097, "learning_rate": 1.365340247712064e-05, "epoch": 1.9498643235560151, "percentage": 65.0, "elapsed_time": "12:07:57", "remaining_time": "6:32:03", "throughput": "2830.23", "total_tokens": 123617280} {"current_steps": 15100, "total_steps": 23217, "loss": 0.8473, "learning_rate": 1.362326920605783e-05, "epoch": 1.951156480165396, "percentage": 65.04, "elapsed_time": "12:08:44", "remaining_time": "6:31:44", "throughput": "2829.04", "total_tokens": 123699200} {"current_steps": 15110, "total_steps": 23217, "loss": 0.7964, "learning_rate": 1.3593156765747483e-05, "epoch": 1.952448636774777, "percentage": 65.08, "elapsed_time": "12:09:32", "remaining_time": "6:31:25", "throughput": "2827.86", "total_tokens": 123781120} {"current_steps": 15120, "total_steps": 23217, "loss": 0.795, "learning_rate": 1.3563065211325349e-05, "epoch": 1.9537407933841582, "percentage": 65.12, "elapsed_time": "12:10:19", "remaining_time": "6:31:05", "throughput": "2826.68", "total_tokens": 123863040} {"current_steps": 15130, "total_steps": 23217, "loss": 0.6041, "learning_rate": 1.3532994597888971e-05, "epoch": 1.9550329499935393, "percentage": 65.17, "elapsed_time": "12:11:06", "remaining_time": "6:30:46", "throughput": "2825.50", "total_tokens": 123944960} {"current_steps": 15140, "total_steps": 23217, "loss": 0.7019, "learning_rate": 1.3502944980497514e-05, "epoch": 1.9563251066029204, "percentage": 65.21, "elapsed_time": "12:11:53", "remaining_time": "6:30:27", "throughput": "2824.32", "total_tokens": 124026880} {"current_steps": 15150, "total_steps": 23217, "loss": 1.2308, "learning_rate": 1.3472916414171738e-05, "epoch": 1.9576172632123012, "percentage": 65.25, "elapsed_time": "12:12:41", "remaining_time": "6:30:08", "throughput": "2823.15", "total_tokens": 124108800} {"current_steps": 15160, "total_steps": 23217, "loss": 0.8531, "learning_rate": 1.3442908953893816e-05, "epoch": 1.9589094198216825, "percentage": 65.3, "elapsed_time": "12:13:28", "remaining_time": "6:29:48", "throughput": "2821.97", "total_tokens": 124190720} {"current_steps": 15170, "total_steps": 23217, "loss": 0.8579, "learning_rate": 1.3412922654607318e-05, "epoch": 1.9602015764310634, "percentage": 65.34, "elapsed_time": "12:14:15", "remaining_time": "6:29:29", "throughput": "2820.80", "total_tokens": 124272640} {"current_steps": 15180, "total_steps": 23217, "loss": 0.7652, "learning_rate": 1.338295757121703e-05, "epoch": 1.9614937330404445, "percentage": 65.38, "elapsed_time": "12:15:03", "remaining_time": "6:29:10", "throughput": "2819.63", "total_tokens": 124354560} {"current_steps": 15190, "total_steps": 23217, "loss": 0.8972, "learning_rate": 1.3353013758588923e-05, "epoch": 1.9627858896498256, "percentage": 65.43, "elapsed_time": "12:15:50", "remaining_time": "6:28:50", "throughput": "2818.47", "total_tokens": 124436480} {"current_steps": 15200, "total_steps": 23217, "loss": 0.8894, "learning_rate": 1.3323091271550011e-05, "epoch": 1.9640780462592065, "percentage": 65.47, "elapsed_time": "12:16:37", "remaining_time": "6:28:31", "throughput": "2817.31", "total_tokens": 124518400} {"current_steps": 15210, "total_steps": 23217, "loss": 1.0825, "learning_rate": 1.3293190164888242e-05, "epoch": 1.9653702028685878, "percentage": 65.51, "elapsed_time": "12:17:25", "remaining_time": "6:28:11", "throughput": "2816.14", "total_tokens": 124600320} {"current_steps": 15220, "total_steps": 23217, "loss": 0.8476, "learning_rate": 1.3263310493352454e-05, "epoch": 1.9666623594779686, "percentage": 65.56, "elapsed_time": "12:18:12", "remaining_time": "6:27:52", "throughput": "2814.98", "total_tokens": 124682240} {"current_steps": 15230, "total_steps": 23217, "loss": 0.6004, "learning_rate": 1.3233452311652197e-05, "epoch": 1.96795451608735, "percentage": 65.6, "elapsed_time": "12:18:59", "remaining_time": "6:27:32", "throughput": "2813.83", "total_tokens": 124764160} {"current_steps": 15240, "total_steps": 23217, "loss": 0.4468, "learning_rate": 1.3203615674457709e-05, "epoch": 1.9692466726967308, "percentage": 65.64, "elapsed_time": "12:19:46", "remaining_time": "6:27:13", "throughput": "2812.68", "total_tokens": 124846080} {"current_steps": 15250, "total_steps": 23217, "loss": 0.704, "learning_rate": 1.3173800636399744e-05, "epoch": 1.970538829306112, "percentage": 65.68, "elapsed_time": "12:20:34", "remaining_time": "6:26:53", "throughput": "2811.53", "total_tokens": 124928000} {"current_steps": 15260, "total_steps": 23217, "loss": 0.5738, "learning_rate": 1.3144007252069552e-05, "epoch": 1.971830985915493, "percentage": 65.73, "elapsed_time": "12:21:21", "remaining_time": "6:26:33", "throughput": "2810.39", "total_tokens": 125009920} {"current_steps": 15270, "total_steps": 23217, "loss": 0.6915, "learning_rate": 1.3114235576018686e-05, "epoch": 1.9731231425248739, "percentage": 65.77, "elapsed_time": "12:22:08", "remaining_time": "6:26:14", "throughput": "2809.24", "total_tokens": 125091840} {"current_steps": 15280, "total_steps": 23217, "loss": 0.6731, "learning_rate": 1.3084485662758994e-05, "epoch": 1.9744152991342552, "percentage": 65.81, "elapsed_time": "12:22:55", "remaining_time": "6:25:54", "throughput": "2808.10", "total_tokens": 125173760} {"current_steps": 15290, "total_steps": 23217, "loss": 0.8532, "learning_rate": 1.3054757566762454e-05, "epoch": 1.975707455743636, "percentage": 65.86, "elapsed_time": "12:23:43", "remaining_time": "6:25:34", "throughput": "2806.96", "total_tokens": 125255680} {"current_steps": 15300, "total_steps": 23217, "loss": 1.3152, "learning_rate": 1.3025051342461087e-05, "epoch": 1.9769996123530171, "percentage": 65.9, "elapsed_time": "12:24:30", "remaining_time": "6:25:14", "throughput": "2805.82", "total_tokens": 125337600} {"current_steps": 15310, "total_steps": 23217, "loss": 0.6177, "learning_rate": 1.2995367044246903e-05, "epoch": 1.9782917689623982, "percentage": 65.94, "elapsed_time": "12:25:17", "remaining_time": "6:24:54", "throughput": "2804.69", "total_tokens": 125419520} {"current_steps": 15320, "total_steps": 23217, "loss": 0.7341, "learning_rate": 1.2965704726471729e-05, "epoch": 1.9795839255717793, "percentage": 65.99, "elapsed_time": "12:26:04", "remaining_time": "6:24:34", "throughput": "2803.57", "total_tokens": 125501440} {"current_steps": 15330, "total_steps": 23217, "loss": 0.7912, "learning_rate": 1.2936064443447157e-05, "epoch": 1.9808760821811604, "percentage": 66.03, "elapsed_time": "12:26:52", "remaining_time": "6:24:15", "throughput": "2802.44", "total_tokens": 125583360} {"current_steps": 15340, "total_steps": 23217, "loss": 1.0051, "learning_rate": 1.2906446249444457e-05, "epoch": 1.9821682387905413, "percentage": 66.07, "elapsed_time": "12:27:39", "remaining_time": "6:23:55", "throughput": "2801.30", "total_tokens": 125665280} {"current_steps": 15350, "total_steps": 23217, "loss": 0.4944, "learning_rate": 1.2876850198694409e-05, "epoch": 1.9834603953999226, "percentage": 66.12, "elapsed_time": "12:28:26", "remaining_time": "6:23:35", "throughput": "2800.18", "total_tokens": 125747200} {"current_steps": 15360, "total_steps": 23217, "loss": 0.7472, "learning_rate": 1.2847276345387299e-05, "epoch": 1.9847525520093035, "percentage": 66.16, "elapsed_time": "12:29:14", "remaining_time": "6:23:15", "throughput": "2799.06", "total_tokens": 125829120} {"current_steps": 15370, "total_steps": 23217, "loss": 0.6023, "learning_rate": 1.2817724743672715e-05, "epoch": 1.9860447086186845, "percentage": 66.2, "elapsed_time": "12:30:01", "remaining_time": "6:22:54", "throughput": "2797.94", "total_tokens": 125911040} {"current_steps": 15380, "total_steps": 23217, "loss": 1.1141, "learning_rate": 1.2788195447659562e-05, "epoch": 1.9873368652280656, "percentage": 66.24, "elapsed_time": "12:30:48", "remaining_time": "6:22:34", "throughput": "2796.82", "total_tokens": 125992960} {"current_steps": 15390, "total_steps": 23217, "loss": 0.9213, "learning_rate": 1.2758688511415848e-05, "epoch": 1.9886290218374467, "percentage": 66.29, "elapsed_time": "12:31:35", "remaining_time": "6:22:14", "throughput": "2795.70", "total_tokens": 126074880} {"current_steps": 15400, "total_steps": 23217, "loss": 0.7153, "learning_rate": 1.2729203988968674e-05, "epoch": 1.9899211784468278, "percentage": 66.33, "elapsed_time": "12:32:23", "remaining_time": "6:21:54", "throughput": "2794.59", "total_tokens": 126156800} {"current_steps": 15410, "total_steps": 23217, "loss": 0.5926, "learning_rate": 1.2699741934304104e-05, "epoch": 1.9912133350562087, "percentage": 66.37, "elapsed_time": "12:33:10", "remaining_time": "6:21:34", "throughput": "2793.48", "total_tokens": 126238720} {"current_steps": 15420, "total_steps": 23217, "loss": 0.9406, "learning_rate": 1.2670302401367035e-05, "epoch": 1.99250549166559, "percentage": 66.42, "elapsed_time": "12:33:57", "remaining_time": "6:21:14", "throughput": "2792.37", "total_tokens": 126320640} {"current_steps": 15430, "total_steps": 23217, "loss": 0.9174, "learning_rate": 1.2640885444061163e-05, "epoch": 1.9937976482749709, "percentage": 66.46, "elapsed_time": "12:34:44", "remaining_time": "6:20:53", "throughput": "2791.27", "total_tokens": 126402560} {"current_steps": 15440, "total_steps": 23217, "loss": 1.254, "learning_rate": 1.2611491116248802e-05, "epoch": 1.995089804884352, "percentage": 66.5, "elapsed_time": "12:35:32", "remaining_time": "6:20:33", "throughput": "2790.16", "total_tokens": 126484480} {"current_steps": 15450, "total_steps": 23217, "loss": 0.7516, "learning_rate": 1.2582119471750888e-05, "epoch": 1.996381961493733, "percentage": 66.55, "elapsed_time": "12:36:19", "remaining_time": "6:20:13", "throughput": "2789.06", "total_tokens": 126566400} {"current_steps": 15460, "total_steps": 23217, "loss": 0.9337, "learning_rate": 1.2552770564346781e-05, "epoch": 1.9976741181031141, "percentage": 66.59, "elapsed_time": "12:37:06", "remaining_time": "6:19:52", "throughput": "2787.96", "total_tokens": 126648320} {"current_steps": 15470, "total_steps": 23217, "loss": 0.9429, "learning_rate": 1.2523444447774213e-05, "epoch": 1.9989662747124952, "percentage": 66.63, "elapsed_time": "12:37:54", "remaining_time": "6:19:32", "throughput": "2786.86", "total_tokens": 126730240} {"current_steps": 15480, "total_steps": 23217, "loss": 0.9215, "learning_rate": 1.2494141175729216e-05, "epoch": 2.000258431321876, "percentage": 66.68, "elapsed_time": "12:38:41", "remaining_time": "6:19:11", "throughput": "2785.77", "total_tokens": 126812160} {"current_steps": 15490, "total_steps": 23217, "loss": 0.611, "learning_rate": 1.2464860801865954e-05, "epoch": 2.0015505879312574, "percentage": 66.72, "elapsed_time": "12:39:28", "remaining_time": "6:18:51", "throughput": "2784.67", "total_tokens": 126894080} {"current_steps": 15500, "total_steps": 23217, "loss": 1.1059, "learning_rate": 1.2435603379796704e-05, "epoch": 2.0028427445406383, "percentage": 66.76, "elapsed_time": "12:40:15", "remaining_time": "6:18:30", "throughput": "2783.59", "total_tokens": 126976000} {"current_steps": 15510, "total_steps": 23217, "loss": 0.9048, "learning_rate": 1.240636896309168e-05, "epoch": 2.0041349011500196, "percentage": 66.8, "elapsed_time": "12:41:03", "remaining_time": "6:18:10", "throughput": "2782.51", "total_tokens": 127057920} {"current_steps": 15520, "total_steps": 23217, "loss": 0.7904, "learning_rate": 1.237715760527901e-05, "epoch": 2.0054270577594004, "percentage": 66.85, "elapsed_time": "12:41:50", "remaining_time": "6:17:49", "throughput": "2781.43", "total_tokens": 127139840} {"current_steps": 15530, "total_steps": 23217, "loss": 0.7196, "learning_rate": 1.2347969359844566e-05, "epoch": 2.0067192143687813, "percentage": 66.89, "elapsed_time": "12:42:37", "remaining_time": "6:17:28", "throughput": "2780.35", "total_tokens": 127221760} {"current_steps": 15540, "total_steps": 23217, "loss": 1.102, "learning_rate": 1.2318804280231939e-05, "epoch": 2.0080113709781626, "percentage": 66.93, "elapsed_time": "12:43:24", "remaining_time": "6:17:08", "throughput": "2779.27", "total_tokens": 127303680} {"current_steps": 15550, "total_steps": 23217, "loss": 0.5505, "learning_rate": 1.2289662419842258e-05, "epoch": 2.0093035275875435, "percentage": 66.98, "elapsed_time": "12:44:12", "remaining_time": "6:16:47", "throughput": "2778.19", "total_tokens": 127385600} {"current_steps": 15560, "total_steps": 23217, "loss": 0.6824, "learning_rate": 1.2260543832034177e-05, "epoch": 2.010595684196925, "percentage": 67.02, "elapsed_time": "12:44:59", "remaining_time": "6:16:26", "throughput": "2777.12", "total_tokens": 127467520} {"current_steps": 15570, "total_steps": 23217, "loss": 0.9454, "learning_rate": 1.2231448570123732e-05, "epoch": 2.0118878408063057, "percentage": 67.06, "elapsed_time": "12:45:46", "remaining_time": "6:16:06", "throughput": "2776.04", "total_tokens": 127549440} {"current_steps": 15580, "total_steps": 23217, "loss": 0.9467, "learning_rate": 1.2202376687384223e-05, "epoch": 2.013179997415687, "percentage": 67.11, "elapsed_time": "12:46:33", "remaining_time": "6:15:45", "throughput": "2774.97", "total_tokens": 127631360} {"current_steps": 15590, "total_steps": 23217, "loss": 0.6482, "learning_rate": 1.2173328237046178e-05, "epoch": 2.014472154025068, "percentage": 67.15, "elapsed_time": "12:47:20", "remaining_time": "6:15:24", "throughput": "2773.90", "total_tokens": 127713280} {"current_steps": 15600, "total_steps": 23217, "loss": 0.547, "learning_rate": 1.2144303272297186e-05, "epoch": 2.0157643106344487, "percentage": 67.19, "elapsed_time": "12:48:08", "remaining_time": "6:15:03", "throughput": "2772.84", "total_tokens": 127795200} {"current_steps": 15610, "total_steps": 23217, "loss": 0.9459, "learning_rate": 1.2115301846281871e-05, "epoch": 2.01705646724383, "percentage": 67.24, "elapsed_time": "12:48:55", "remaining_time": "6:14:42", "throughput": "2771.77", "total_tokens": 127877120} {"current_steps": 15620, "total_steps": 23217, "loss": 0.8437, "learning_rate": 1.2086324012101716e-05, "epoch": 2.018348623853211, "percentage": 67.28, "elapsed_time": "12:49:42", "remaining_time": "6:14:21", "throughput": "2770.71", "total_tokens": 127959040} {"current_steps": 15630, "total_steps": 23217, "loss": 0.9276, "learning_rate": 1.2057369822815051e-05, "epoch": 2.019640780462592, "percentage": 67.32, "elapsed_time": "12:50:30", "remaining_time": "6:14:00", "throughput": "2769.64", "total_tokens": 128040960} {"current_steps": 15640, "total_steps": 23217, "loss": 0.8422, "learning_rate": 1.2028439331436869e-05, "epoch": 2.020932937071973, "percentage": 67.36, "elapsed_time": "12:51:17", "remaining_time": "6:13:39", "throughput": "2768.59", "total_tokens": 128122880} {"current_steps": 15650, "total_steps": 23217, "loss": 0.9474, "learning_rate": 1.1999532590938817e-05, "epoch": 2.0222250936813544, "percentage": 67.41, "elapsed_time": "12:52:04", "remaining_time": "6:13:18", "throughput": "2767.53", "total_tokens": 128204800} {"current_steps": 15660, "total_steps": 23217, "loss": 0.5438, "learning_rate": 1.1970649654249017e-05, "epoch": 2.0235172502907353, "percentage": 67.45, "elapsed_time": "12:52:51", "remaining_time": "6:12:57", "throughput": "2766.48", "total_tokens": 128286720} {"current_steps": 15670, "total_steps": 23217, "loss": 0.5885, "learning_rate": 1.1941790574252013e-05, "epoch": 2.024809406900116, "percentage": 67.49, "elapsed_time": "12:53:38", "remaining_time": "6:12:36", "throughput": "2765.43", "total_tokens": 128368640} {"current_steps": 15680, "total_steps": 23217, "loss": 0.878, "learning_rate": 1.1912955403788695e-05, "epoch": 2.0261015635094974, "percentage": 67.54, "elapsed_time": "12:54:26", "remaining_time": "6:12:15", "throughput": "2764.38", "total_tokens": 128450560} {"current_steps": 15690, "total_steps": 23217, "loss": 0.7301, "learning_rate": 1.1884144195656133e-05, "epoch": 2.0273937201188783, "percentage": 67.58, "elapsed_time": "12:55:13", "remaining_time": "6:11:53", "throughput": "2763.34", "total_tokens": 128532480} {"current_steps": 15700, "total_steps": 23217, "loss": 0.3667, "learning_rate": 1.1855357002607556e-05, "epoch": 2.0286858767282596, "percentage": 67.62, "elapsed_time": "12:56:00", "remaining_time": "6:11:32", "throughput": "2762.30", "total_tokens": 128614400} {"current_steps": 15710, "total_steps": 23217, "loss": 0.6625, "learning_rate": 1.1826593877352216e-05, "epoch": 2.0299780333376405, "percentage": 67.67, "elapsed_time": "12:56:47", "remaining_time": "6:11:11", "throughput": "2761.26", "total_tokens": 128696320} {"current_steps": 15720, "total_steps": 23217, "loss": 0.8176, "learning_rate": 1.1797854872555272e-05, "epoch": 2.031270189947022, "percentage": 67.71, "elapsed_time": "12:57:35", "remaining_time": "6:10:50", "throughput": "2760.22", "total_tokens": 128778240} {"current_steps": 15730, "total_steps": 23217, "loss": 0.8307, "learning_rate": 1.1769140040837755e-05, "epoch": 2.0325623465564027, "percentage": 67.75, "elapsed_time": "12:58:22", "remaining_time": "6:10:28", "throughput": "2759.18", "total_tokens": 128860160} {"current_steps": 15740, "total_steps": 23217, "loss": 0.4084, "learning_rate": 1.1740449434776402e-05, "epoch": 2.0338545031657835, "percentage": 67.8, "elapsed_time": "12:59:09", "remaining_time": "6:10:07", "throughput": "2758.15", "total_tokens": 128942080} {"current_steps": 15750, "total_steps": 23217, "loss": 0.664, "learning_rate": 1.171178310690362e-05, "epoch": 2.035146659775165, "percentage": 67.84, "elapsed_time": "12:59:56", "remaining_time": "6:09:46", "throughput": "2757.12", "total_tokens": 129024000} {"current_steps": 15760, "total_steps": 23217, "loss": 0.7079, "learning_rate": 1.1683141109707339e-05, "epoch": 2.0364388163845457, "percentage": 67.88, "elapsed_time": "13:00:43", "remaining_time": "6:09:24", "throughput": "2756.08", "total_tokens": 129105920} {"current_steps": 15770, "total_steps": 23217, "loss": 0.9028, "learning_rate": 1.165452349563095e-05, "epoch": 2.037730972993927, "percentage": 67.92, "elapsed_time": "13:01:31", "remaining_time": "6:09:03", "throughput": "2755.06", "total_tokens": 129187840} {"current_steps": 15780, "total_steps": 23217, "loss": 0.6014, "learning_rate": 1.1625930317073221e-05, "epoch": 2.039023129603308, "percentage": 67.97, "elapsed_time": "13:02:18", "remaining_time": "6:08:41", "throughput": "2754.03", "total_tokens": 129269760} {"current_steps": 15790, "total_steps": 23217, "loss": 0.7052, "learning_rate": 1.159736162638813e-05, "epoch": 2.0403152862126888, "percentage": 68.01, "elapsed_time": "13:03:05", "remaining_time": "6:08:20", "throughput": "2753.00", "total_tokens": 129351680} {"current_steps": 15800, "total_steps": 23217, "loss": 0.5514, "learning_rate": 1.1568817475884868e-05, "epoch": 2.04160744282207, "percentage": 68.05, "elapsed_time": "13:03:52", "remaining_time": "6:07:58", "throughput": "2751.98", "total_tokens": 129433600} {"current_steps": 15810, "total_steps": 23217, "loss": 0.9024, "learning_rate": 1.154029791782765e-05, "epoch": 2.042899599431451, "percentage": 68.1, "elapsed_time": "13:04:40", "remaining_time": "6:07:37", "throughput": "2750.96", "total_tokens": 129515520} {"current_steps": 15820, "total_steps": 23217, "loss": 0.8982, "learning_rate": 1.1511803004435704e-05, "epoch": 2.0441917560408323, "percentage": 68.14, "elapsed_time": "13:05:27", "remaining_time": "6:07:15", "throughput": "2749.94", "total_tokens": 129597440} {"current_steps": 15830, "total_steps": 23217, "loss": 0.8733, "learning_rate": 1.1483332787883096e-05, "epoch": 2.045483912650213, "percentage": 68.18, "elapsed_time": "13:06:14", "remaining_time": "6:06:53", "throughput": "2748.92", "total_tokens": 129679360} {"current_steps": 15840, "total_steps": 23217, "loss": 0.7505, "learning_rate": 1.1454887320298686e-05, "epoch": 2.0467760692595944, "percentage": 68.23, "elapsed_time": "13:07:01", "remaining_time": "6:06:32", "throughput": "2747.91", "total_tokens": 129761280} {"current_steps": 15850, "total_steps": 23217, "loss": 0.6831, "learning_rate": 1.1426466653766036e-05, "epoch": 2.0480682258689753, "percentage": 68.27, "elapsed_time": "13:07:49", "remaining_time": "6:06:10", "throughput": "2746.90", "total_tokens": 129843200} {"current_steps": 15860, "total_steps": 23217, "loss": 0.8099, "learning_rate": 1.1398070840323264e-05, "epoch": 2.049360382478356, "percentage": 68.31, "elapsed_time": "13:08:36", "remaining_time": "6:05:48", "throughput": "2745.89", "total_tokens": 129925120} {"current_steps": 15870, "total_steps": 23217, "loss": 0.7674, "learning_rate": 1.1369699931963018e-05, "epoch": 2.0506525390877375, "percentage": 68.36, "elapsed_time": "13:09:23", "remaining_time": "6:05:26", "throughput": "2744.88", "total_tokens": 130007040} {"current_steps": 15880, "total_steps": 23217, "loss": 0.9515, "learning_rate": 1.1341353980632313e-05, "epoch": 2.0519446956971183, "percentage": 68.4, "elapsed_time": "13:10:10", "remaining_time": "6:05:05", "throughput": "2743.87", "total_tokens": 130088960} {"current_steps": 15890, "total_steps": 23217, "loss": 0.9029, "learning_rate": 1.1313033038232498e-05, "epoch": 2.0532368523064997, "percentage": 68.44, "elapsed_time": "13:10:57", "remaining_time": "6:04:43", "throughput": "2742.87", "total_tokens": 130170880} {"current_steps": 15900, "total_steps": 23217, "loss": 0.7374, "learning_rate": 1.1284737156619096e-05, "epoch": 2.0545290089158805, "percentage": 68.48, "elapsed_time": "13:11:45", "remaining_time": "6:04:21", "throughput": "2741.87", "total_tokens": 130252800} {"current_steps": 15910, "total_steps": 23217, "loss": 0.7558, "learning_rate": 1.1256466387601782e-05, "epoch": 2.055821165525262, "percentage": 68.53, "elapsed_time": "13:12:32", "remaining_time": "6:03:59", "throughput": "2740.87", "total_tokens": 130334720} {"current_steps": 15920, "total_steps": 23217, "loss": 0.7905, "learning_rate": 1.1228220782944212e-05, "epoch": 2.0571133221346427, "percentage": 68.57, "elapsed_time": "13:13:19", "remaining_time": "6:03:37", "throughput": "2739.88", "total_tokens": 130416640} {"current_steps": 15930, "total_steps": 23217, "loss": 0.9914, "learning_rate": 1.1200000394363996e-05, "epoch": 2.0584054787440236, "percentage": 68.61, "elapsed_time": "13:14:06", "remaining_time": "6:03:15", "throughput": "2738.88", "total_tokens": 130498560} {"current_steps": 15940, "total_steps": 23217, "loss": 0.7977, "learning_rate": 1.1171805273532567e-05, "epoch": 2.059697635353405, "percentage": 68.66, "elapsed_time": "13:14:53", "remaining_time": "6:02:53", "throughput": "2737.89", "total_tokens": 130580480} {"current_steps": 15950, "total_steps": 23217, "loss": 0.8725, "learning_rate": 1.1143635472075074e-05, "epoch": 2.0609897919627858, "percentage": 68.7, "elapsed_time": "13:15:41", "remaining_time": "6:02:31", "throughput": "2736.90", "total_tokens": 130662400} {"current_steps": 15960, "total_steps": 23217, "loss": 1.0455, "learning_rate": 1.1115491041570337e-05, "epoch": 2.062281948572167, "percentage": 68.74, "elapsed_time": "13:16:28", "remaining_time": "6:02:09", "throughput": "2735.91", "total_tokens": 130744320} {"current_steps": 15970, "total_steps": 23217, "loss": 0.8646, "learning_rate": 1.1087372033550685e-05, "epoch": 2.063574105181548, "percentage": 68.79, "elapsed_time": "13:17:15", "remaining_time": "6:01:47", "throughput": "2734.92", "total_tokens": 130826240} {"current_steps": 15980, "total_steps": 23217, "loss": 0.9453, "learning_rate": 1.105927849950194e-05, "epoch": 2.0648662617909292, "percentage": 68.83, "elapsed_time": "13:18:02", "remaining_time": "6:01:25", "throughput": "2733.94", "total_tokens": 130908160} {"current_steps": 15990, "total_steps": 23217, "loss": 0.822, "learning_rate": 1.103121049086324e-05, "epoch": 2.06615841840031, "percentage": 68.87, "elapsed_time": "13:18:49", "remaining_time": "6:01:02", "throughput": "2732.96", "total_tokens": 130990080} {"current_steps": 16000, "total_steps": 23217, "loss": 0.8453, "learning_rate": 1.1003168059027025e-05, "epoch": 2.067450575009691, "percentage": 68.92, "elapsed_time": "13:19:36", "remaining_time": "6:00:40", "throughput": "2731.98", "total_tokens": 131072000} {"current_steps": 16010, "total_steps": 23217, "loss": 0.9873, "learning_rate": 1.0975151255338867e-05, "epoch": 2.0687427316190723, "percentage": 68.96, "elapsed_time": "13:20:29", "remaining_time": "6:00:20", "throughput": "2730.69", "total_tokens": 131153920} {"current_steps": 16020, "total_steps": 23217, "loss": 0.6615, "learning_rate": 1.094716013109745e-05, "epoch": 2.070034888228453, "percentage": 69.0, "elapsed_time": "13:21:16", "remaining_time": "5:59:58", "throughput": "2729.72", "total_tokens": 131235840} {"current_steps": 16030, "total_steps": 23217, "loss": 0.5598, "learning_rate": 1.0919194737554409e-05, "epoch": 2.0713270448378345, "percentage": 69.04, "elapsed_time": "13:22:04", "remaining_time": "5:59:36", "throughput": "2728.74", "total_tokens": 131317760} {"current_steps": 16040, "total_steps": 23217, "loss": 0.8139, "learning_rate": 1.0891255125914269e-05, "epoch": 2.0726192014472153, "percentage": 69.09, "elapsed_time": "13:22:51", "remaining_time": "5:59:13", "throughput": "2727.76", "total_tokens": 131399680} {"current_steps": 16050, "total_steps": 23217, "loss": 0.7574, "learning_rate": 1.0863341347334376e-05, "epoch": 2.0739113580565967, "percentage": 69.13, "elapsed_time": "13:23:38", "remaining_time": "5:58:51", "throughput": "2726.79", "total_tokens": 131481600} {"current_steps": 16060, "total_steps": 23217, "loss": 0.578, "learning_rate": 1.0835453452924737e-05, "epoch": 2.0752035146659775, "percentage": 69.17, "elapsed_time": "13:24:25", "remaining_time": "5:58:29", "throughput": "2725.82", "total_tokens": 131563520} {"current_steps": 16070, "total_steps": 23217, "loss": 0.6804, "learning_rate": 1.0807591493747992e-05, "epoch": 2.0764956712753584, "percentage": 69.22, "elapsed_time": "13:25:12", "remaining_time": "5:58:06", "throughput": "2724.86", "total_tokens": 131645440} {"current_steps": 16080, "total_steps": 23217, "loss": 0.5871, "learning_rate": 1.0779755520819302e-05, "epoch": 2.0777878278847397, "percentage": 69.26, "elapsed_time": "13:26:00", "remaining_time": "5:57:44", "throughput": "2723.89", "total_tokens": 131727360} {"current_steps": 16090, "total_steps": 23217, "loss": 0.8846, "learning_rate": 1.0751945585106205e-05, "epoch": 2.0790799844941206, "percentage": 69.3, "elapsed_time": "13:26:47", "remaining_time": "5:57:21", "throughput": "2722.93", "total_tokens": 131809280} {"current_steps": 16100, "total_steps": 23217, "loss": 0.9714, "learning_rate": 1.0724161737528616e-05, "epoch": 2.080372141103502, "percentage": 69.35, "elapsed_time": "13:27:34", "remaining_time": "5:56:59", "throughput": "2721.97", "total_tokens": 131891200} {"current_steps": 16110, "total_steps": 23217, "loss": 0.7469, "learning_rate": 1.0696404028958634e-05, "epoch": 2.0816642977128827, "percentage": 69.39, "elapsed_time": "13:28:21", "remaining_time": "5:56:36", "throughput": "2721.01", "total_tokens": 131973120} {"current_steps": 16120, "total_steps": 23217, "loss": 1.0468, "learning_rate": 1.0668672510220548e-05, "epoch": 2.082956454322264, "percentage": 69.43, "elapsed_time": "13:29:08", "remaining_time": "5:56:14", "throughput": "2720.05", "total_tokens": 132055040} {"current_steps": 16130, "total_steps": 23217, "loss": 0.4886, "learning_rate": 1.0640967232090643e-05, "epoch": 2.084248610931645, "percentage": 69.47, "elapsed_time": "13:29:55", "remaining_time": "5:55:51", "throughput": "2719.09", "total_tokens": 132136960} {"current_steps": 16140, "total_steps": 23217, "loss": 0.9022, "learning_rate": 1.0613288245297193e-05, "epoch": 2.085540767541026, "percentage": 69.52, "elapsed_time": "13:30:43", "remaining_time": "5:55:28", "throughput": "2718.14", "total_tokens": 132218880} {"current_steps": 16150, "total_steps": 23217, "loss": 0.9351, "learning_rate": 1.0585635600520327e-05, "epoch": 2.086832924150407, "percentage": 69.56, "elapsed_time": "13:31:30", "remaining_time": "5:55:06", "throughput": "2717.19", "total_tokens": 132300800} {"current_steps": 16160, "total_steps": 23217, "loss": 0.7735, "learning_rate": 1.0558009348391926e-05, "epoch": 2.088125080759788, "percentage": 69.6, "elapsed_time": "13:32:17", "remaining_time": "5:54:43", "throughput": "2716.24", "total_tokens": 132382720} {"current_steps": 16170, "total_steps": 23217, "loss": 0.6433, "learning_rate": 1.053040953949557e-05, "epoch": 2.0894172373691693, "percentage": 69.65, "elapsed_time": "13:33:04", "remaining_time": "5:54:20", "throughput": "2715.29", "total_tokens": 132464640} {"current_steps": 16180, "total_steps": 23217, "loss": 0.9383, "learning_rate": 1.0502836224366389e-05, "epoch": 2.09070939397855, "percentage": 69.69, "elapsed_time": "13:33:51", "remaining_time": "5:53:57", "throughput": "2714.34", "total_tokens": 132546560} {"current_steps": 16190, "total_steps": 23217, "loss": 0.8762, "learning_rate": 1.0475289453491038e-05, "epoch": 2.0920015505879315, "percentage": 69.73, "elapsed_time": "13:34:39", "remaining_time": "5:53:35", "throughput": "2713.40", "total_tokens": 132628480} {"current_steps": 16200, "total_steps": 23217, "loss": 0.7354, "learning_rate": 1.0447769277307554e-05, "epoch": 2.0932937071973123, "percentage": 69.78, "elapsed_time": "13:35:26", "remaining_time": "5:53:12", "throughput": "2712.45", "total_tokens": 132710400} {"current_steps": 16210, "total_steps": 23217, "loss": 0.6087, "learning_rate": 1.042027574620526e-05, "epoch": 2.094585863806693, "percentage": 69.82, "elapsed_time": "13:36:13", "remaining_time": "5:52:49", "throughput": "2711.51", "total_tokens": 132792320} {"current_steps": 16220, "total_steps": 23217, "loss": 0.8064, "learning_rate": 1.0392808910524735e-05, "epoch": 2.0958780204160745, "percentage": 69.86, "elapsed_time": "13:37:00", "remaining_time": "5:52:26", "throughput": "2710.57", "total_tokens": 132874240} {"current_steps": 16230, "total_steps": 23217, "loss": 0.6069, "learning_rate": 1.0365368820557633e-05, "epoch": 2.0971701770254554, "percentage": 69.91, "elapsed_time": "13:37:48", "remaining_time": "5:52:03", "throughput": "2709.63", "total_tokens": 132956160} {"current_steps": 16240, "total_steps": 23217, "loss": 0.6704, "learning_rate": 1.0337955526546678e-05, "epoch": 2.0984623336348367, "percentage": 69.95, "elapsed_time": "13:38:35", "remaining_time": "5:51:40", "throughput": "2708.69", "total_tokens": 133038080} {"current_steps": 16250, "total_steps": 23217, "loss": 0.764, "learning_rate": 1.0310569078685494e-05, "epoch": 2.0997544902442176, "percentage": 69.99, "elapsed_time": "13:39:22", "remaining_time": "5:51:17", "throughput": "2707.75", "total_tokens": 133120000} {"current_steps": 16260, "total_steps": 23217, "loss": 0.7597, "learning_rate": 1.0283209527118584e-05, "epoch": 2.1010466468535984, "percentage": 70.03, "elapsed_time": "13:40:09", "remaining_time": "5:50:54", "throughput": "2706.82", "total_tokens": 133201920} {"current_steps": 16270, "total_steps": 23217, "loss": 0.8361, "learning_rate": 1.0255876921941165e-05, "epoch": 2.1023388034629797, "percentage": 70.08, "elapsed_time": "13:40:56", "remaining_time": "5:50:31", "throughput": "2705.89", "total_tokens": 133283840} {"current_steps": 16280, "total_steps": 23217, "loss": 0.7833, "learning_rate": 1.0228571313199161e-05, "epoch": 2.1036309600723606, "percentage": 70.12, "elapsed_time": "13:41:44", "remaining_time": "5:50:08", "throughput": "2704.96", "total_tokens": 133365760} {"current_steps": 16290, "total_steps": 23217, "loss": 0.6994, "learning_rate": 1.0201292750889022e-05, "epoch": 2.104923116681742, "percentage": 70.16, "elapsed_time": "13:42:31", "remaining_time": "5:49:45", "throughput": "2704.03", "total_tokens": 133447680} {"current_steps": 16300, "total_steps": 23217, "loss": 0.549, "learning_rate": 1.0174041284957703e-05, "epoch": 2.106215273291123, "percentage": 70.21, "elapsed_time": "13:43:18", "remaining_time": "5:49:22", "throughput": "2703.10", "total_tokens": 133529600} {"current_steps": 16310, "total_steps": 23217, "loss": 0.966, "learning_rate": 1.0146816965302546e-05, "epoch": 2.107507429900504, "percentage": 70.25, "elapsed_time": "13:44:05", "remaining_time": "5:48:59", "throughput": "2702.18", "total_tokens": 133611520} {"current_steps": 16320, "total_steps": 23217, "loss": 0.8817, "learning_rate": 1.011961984177117e-05, "epoch": 2.108799586509885, "percentage": 70.29, "elapsed_time": "13:44:52", "remaining_time": "5:48:36", "throughput": "2701.26", "total_tokens": 133693440} {"current_steps": 16330, "total_steps": 23217, "loss": 0.7589, "learning_rate": 1.0092449964161416e-05, "epoch": 2.1100917431192663, "percentage": 70.34, "elapsed_time": "13:45:40", "remaining_time": "5:48:13", "throughput": "2700.34", "total_tokens": 133775360} {"current_steps": 16340, "total_steps": 23217, "loss": 0.7143, "learning_rate": 1.006530738222122e-05, "epoch": 2.111383899728647, "percentage": 70.38, "elapsed_time": "13:46:27", "remaining_time": "5:47:49", "throughput": "2699.42", "total_tokens": 133857280} {"current_steps": 16350, "total_steps": 23217, "loss": 0.9325, "learning_rate": 1.0038192145648567e-05, "epoch": 2.112676056338028, "percentage": 70.42, "elapsed_time": "13:47:14", "remaining_time": "5:47:26", "throughput": "2698.50", "total_tokens": 133939200} {"current_steps": 16360, "total_steps": 23217, "loss": 0.8195, "learning_rate": 1.001110430409134e-05, "epoch": 2.1139682129474093, "percentage": 70.47, "elapsed_time": "13:48:01", "remaining_time": "5:47:03", "throughput": "2697.59", "total_tokens": 134021120} {"current_steps": 16370, "total_steps": 23217, "loss": 0.6386, "learning_rate": 9.98404390714729e-06, "epoch": 2.11526036955679, "percentage": 70.51, "elapsed_time": "13:48:49", "remaining_time": "5:46:39", "throughput": "2696.67", "total_tokens": 134103040} {"current_steps": 16380, "total_steps": 23217, "loss": 0.8842, "learning_rate": 9.95701100436389e-06, "epoch": 2.1165525261661715, "percentage": 70.55, "elapsed_time": "13:49:36", "remaining_time": "5:46:16", "throughput": "2695.76", "total_tokens": 134184960} {"current_steps": 16390, "total_steps": 23217, "loss": 1.0033, "learning_rate": 9.930005645238302e-06, "epoch": 2.1178446827755524, "percentage": 70.59, "elapsed_time": "13:50:23", "remaining_time": "5:45:53", "throughput": "2694.85", "total_tokens": 134266880} {"current_steps": 16400, "total_steps": 23217, "loss": 0.7303, "learning_rate": 9.903027879217237e-06, "epoch": 2.1191368393849332, "percentage": 70.64, "elapsed_time": "13:51:10", "remaining_time": "5:45:29", "throughput": "2693.94", "total_tokens": 134348800} {"current_steps": 16410, "total_steps": 23217, "loss": 0.4911, "learning_rate": 9.876077755696868e-06, "epoch": 2.1204289959943146, "percentage": 70.68, "elapsed_time": "13:51:57", "remaining_time": "5:45:06", "throughput": "2693.03", "total_tokens": 134430720} {"current_steps": 16420, "total_steps": 23217, "loss": 0.8788, "learning_rate": 9.849155324022799e-06, "epoch": 2.1217211526036954, "percentage": 70.72, "elapsed_time": "13:52:45", "remaining_time": "5:44:42", "throughput": "2692.13", "total_tokens": 134512640} {"current_steps": 16430, "total_steps": 23217, "loss": 0.7269, "learning_rate": 9.82226063348988e-06, "epoch": 2.1230133092130767, "percentage": 70.77, "elapsed_time": "13:53:32", "remaining_time": "5:44:19", "throughput": "2691.22", "total_tokens": 134594560} {"current_steps": 16440, "total_steps": 23217, "loss": 0.8314, "learning_rate": 9.795393733342203e-06, "epoch": 2.1243054658224576, "percentage": 70.81, "elapsed_time": "13:54:19", "remaining_time": "5:43:55", "throughput": "2690.32", "total_tokens": 134676480} {"current_steps": 16450, "total_steps": 23217, "loss": 0.7974, "learning_rate": 9.76855467277297e-06, "epoch": 2.125597622431839, "percentage": 70.85, "elapsed_time": "13:55:06", "remaining_time": "5:43:32", "throughput": "2689.42", "total_tokens": 134758400} {"current_steps": 16460, "total_steps": 23217, "loss": 0.8748, "learning_rate": 9.741743500924388e-06, "epoch": 2.12688977904122, "percentage": 70.9, "elapsed_time": "13:55:54", "remaining_time": "5:43:08", "throughput": "2688.52", "total_tokens": 134840320} {"current_steps": 16470, "total_steps": 23217, "loss": 0.6756, "learning_rate": 9.71496026688763e-06, "epoch": 2.1281819356506007, "percentage": 70.94, "elapsed_time": "13:56:41", "remaining_time": "5:42:45", "throughput": "2687.64", "total_tokens": 134922240} {"current_steps": 16480, "total_steps": 23217, "loss": 1.01, "learning_rate": 9.688205019702684e-06, "epoch": 2.129474092259982, "percentage": 70.98, "elapsed_time": "13:57:28", "remaining_time": "5:42:21", "throughput": "2686.74", "total_tokens": 135004160} {"current_steps": 16490, "total_steps": 23217, "loss": 0.8252, "learning_rate": 9.661477808358323e-06, "epoch": 2.130766248869363, "percentage": 71.03, "elapsed_time": "13:58:15", "remaining_time": "5:41:57", "throughput": "2685.85", "total_tokens": 135086080} {"current_steps": 16500, "total_steps": 23217, "loss": 0.8617, "learning_rate": 9.634778681791962e-06, "epoch": 2.132058405478744, "percentage": 71.07, "elapsed_time": "13:59:02", "remaining_time": "5:41:34", "throughput": "2684.96", "total_tokens": 135168000} {"current_steps": 16510, "total_steps": 23217, "loss": 1.2436, "learning_rate": 9.608107688889609e-06, "epoch": 2.133350562088125, "percentage": 71.11, "elapsed_time": "13:59:49", "remaining_time": "5:41:10", "throughput": "2684.07", "total_tokens": 135249920} {"current_steps": 16520, "total_steps": 23217, "loss": 0.7527, "learning_rate": 9.581464878485764e-06, "epoch": 2.1346427186975063, "percentage": 71.15, "elapsed_time": "14:00:37", "remaining_time": "5:40:46", "throughput": "2683.18", "total_tokens": 135331840} {"current_steps": 16530, "total_steps": 23217, "loss": 0.7333, "learning_rate": 9.554850299363294e-06, "epoch": 2.135934875306887, "percentage": 71.2, "elapsed_time": "14:01:24", "remaining_time": "5:40:22", "throughput": "2682.29", "total_tokens": 135413760} {"current_steps": 16540, "total_steps": 23217, "loss": 1.0707, "learning_rate": 9.52826400025342e-06, "epoch": 2.137227031916268, "percentage": 71.24, "elapsed_time": "14:02:11", "remaining_time": "5:39:59", "throughput": "2681.40", "total_tokens": 135495680} {"current_steps": 16550, "total_steps": 23217, "loss": 0.7467, "learning_rate": 9.501706029835544e-06, "epoch": 2.1385191885256494, "percentage": 71.28, "elapsed_time": "14:02:58", "remaining_time": "5:39:35", "throughput": "2680.52", "total_tokens": 135577600} {"current_steps": 16560, "total_steps": 23217, "loss": 0.6344, "learning_rate": 9.47517643673721e-06, "epoch": 2.1398113451350302, "percentage": 71.33, "elapsed_time": "14:03:46", "remaining_time": "5:39:11", "throughput": "2679.64", "total_tokens": 135659520} {"current_steps": 16570, "total_steps": 23217, "loss": 0.844, "learning_rate": 9.448675269534015e-06, "epoch": 2.1411035017444116, "percentage": 71.37, "elapsed_time": "14:04:33", "remaining_time": "5:38:47", "throughput": "2678.76", "total_tokens": 135741440} {"current_steps": 16580, "total_steps": 23217, "loss": 0.9002, "learning_rate": 9.422202576749492e-06, "epoch": 2.1423956583537924, "percentage": 71.41, "elapsed_time": "14:05:20", "remaining_time": "5:38:23", "throughput": "2677.88", "total_tokens": 135823360} {"current_steps": 16590, "total_steps": 23217, "loss": 0.9066, "learning_rate": 9.395758406855053e-06, "epoch": 2.1436878149631737, "percentage": 71.46, "elapsed_time": "14:06:07", "remaining_time": "5:37:59", "throughput": "2677.00", "total_tokens": 135905280} {"current_steps": 16600, "total_steps": 23217, "loss": 0.8606, "learning_rate": 9.369342808269862e-06, "epoch": 2.1449799715725546, "percentage": 71.5, "elapsed_time": "14:06:54", "remaining_time": "5:37:35", "throughput": "2676.12", "total_tokens": 135987200} {"current_steps": 16610, "total_steps": 23217, "loss": 0.8238, "learning_rate": 9.342955829360806e-06, "epoch": 2.1462721281819355, "percentage": 71.54, "elapsed_time": "14:07:42", "remaining_time": "5:37:11", "throughput": "2675.25", "total_tokens": 136069120} {"current_steps": 16620, "total_steps": 23217, "loss": 0.571, "learning_rate": 9.31659751844232e-06, "epoch": 2.147564284791317, "percentage": 71.59, "elapsed_time": "14:08:29", "remaining_time": "5:36:47", "throughput": "2674.38", "total_tokens": 136151040} {"current_steps": 16630, "total_steps": 23217, "loss": 0.7521, "learning_rate": 9.290267923776397e-06, "epoch": 2.1488564414006976, "percentage": 71.63, "elapsed_time": "14:09:16", "remaining_time": "5:36:23", "throughput": "2673.51", "total_tokens": 136232960} {"current_steps": 16640, "total_steps": 23217, "loss": 0.3768, "learning_rate": 9.263967093572412e-06, "epoch": 2.150148598010079, "percentage": 71.67, "elapsed_time": "14:10:03", "remaining_time": "5:35:59", "throughput": "2672.64", "total_tokens": 136314880} {"current_steps": 16650, "total_steps": 23217, "loss": 0.727, "learning_rate": 9.237695075987106e-06, "epoch": 2.15144075461946, "percentage": 71.71, "elapsed_time": "14:10:51", "remaining_time": "5:35:35", "throughput": "2671.77", "total_tokens": 136396800} {"current_steps": 16660, "total_steps": 23217, "loss": 0.8798, "learning_rate": 9.211451919124429e-06, "epoch": 2.152732911228841, "percentage": 71.76, "elapsed_time": "14:11:38", "remaining_time": "5:35:11", "throughput": "2670.91", "total_tokens": 136478720} {"current_steps": 16670, "total_steps": 23217, "loss": 1.1385, "learning_rate": 9.185237671035512e-06, "epoch": 2.154025067838222, "percentage": 71.8, "elapsed_time": "14:12:25", "remaining_time": "5:34:46", "throughput": "2670.05", "total_tokens": 136560640} {"current_steps": 16680, "total_steps": 23217, "loss": 0.8854, "learning_rate": 9.15905237971856e-06, "epoch": 2.155317224447603, "percentage": 71.84, "elapsed_time": "14:13:12", "remaining_time": "5:34:22", "throughput": "2669.18", "total_tokens": 136642560} {"current_steps": 16690, "total_steps": 23217, "loss": 0.6467, "learning_rate": 9.132896093118726e-06, "epoch": 2.156609381056984, "percentage": 71.89, "elapsed_time": "14:13:59", "remaining_time": "5:33:58", "throughput": "2668.32", "total_tokens": 136724480} {"current_steps": 16700, "total_steps": 23217, "loss": 0.7871, "learning_rate": 9.10676885912809e-06, "epoch": 2.157901537666365, "percentage": 71.93, "elapsed_time": "14:14:47", "remaining_time": "5:33:34", "throughput": "2667.46", "total_tokens": 136806400} {"current_steps": 16710, "total_steps": 23217, "loss": 0.3123, "learning_rate": 9.080670725585511e-06, "epoch": 2.1591936942757464, "percentage": 71.97, "elapsed_time": "14:15:34", "remaining_time": "5:33:10", "throughput": "2666.60", "total_tokens": 136888320} {"current_steps": 16720, "total_steps": 23217, "loss": 0.7407, "learning_rate": 9.054601740276586e-06, "epoch": 2.1604858508851272, "percentage": 72.02, "elapsed_time": "14:16:21", "remaining_time": "5:32:45", "throughput": "2665.75", "total_tokens": 136970240} {"current_steps": 16730, "total_steps": 23217, "loss": 0.6363, "learning_rate": 9.028561950933517e-06, "epoch": 2.161778007494508, "percentage": 72.06, "elapsed_time": "14:17:08", "remaining_time": "5:32:21", "throughput": "2664.89", "total_tokens": 137052160} {"current_steps": 16740, "total_steps": 23217, "loss": 0.7121, "learning_rate": 9.002551405235082e-06, "epoch": 2.1630701641038894, "percentage": 72.1, "elapsed_time": "14:17:56", "remaining_time": "5:31:56", "throughput": "2664.04", "total_tokens": 137134080} {"current_steps": 16750, "total_steps": 23217, "loss": 0.9597, "learning_rate": 8.976570150806486e-06, "epoch": 2.1643623207132703, "percentage": 72.15, "elapsed_time": "14:18:43", "remaining_time": "5:31:32", "throughput": "2663.19", "total_tokens": 137216000} {"current_steps": 16760, "total_steps": 23217, "loss": 0.7746, "learning_rate": 8.950618235219302e-06, "epoch": 2.1656544773226516, "percentage": 72.19, "elapsed_time": "14:19:30", "remaining_time": "5:31:08", "throughput": "2662.34", "total_tokens": 137297920} {"current_steps": 16770, "total_steps": 23217, "loss": 0.4788, "learning_rate": 8.924695705991407e-06, "epoch": 2.1669466339320325, "percentage": 72.23, "elapsed_time": "14:20:17", "remaining_time": "5:30:43", "throughput": "2661.49", "total_tokens": 137379840} {"current_steps": 16780, "total_steps": 23217, "loss": 0.6243, "learning_rate": 8.898802610586843e-06, "epoch": 2.1682387905414138, "percentage": 72.27, "elapsed_time": "14:21:04", "remaining_time": "5:30:19", "throughput": "2660.65", "total_tokens": 137461760} {"current_steps": 16790, "total_steps": 23217, "loss": 0.9596, "learning_rate": 8.872938996415791e-06, "epoch": 2.1695309471507946, "percentage": 72.32, "elapsed_time": "14:21:51", "remaining_time": "5:29:54", "throughput": "2659.80", "total_tokens": 137543680} {"current_steps": 16800, "total_steps": 23217, "loss": 0.83, "learning_rate": 8.847104910834414e-06, "epoch": 2.170823103760176, "percentage": 72.36, "elapsed_time": "14:22:39", "remaining_time": "5:29:30", "throughput": "2658.96", "total_tokens": 137625600} {"current_steps": 16810, "total_steps": 23217, "loss": 0.8546, "learning_rate": 8.821300401144836e-06, "epoch": 2.172115260369557, "percentage": 72.4, "elapsed_time": "14:23:26", "remaining_time": "5:29:05", "throughput": "2658.12", "total_tokens": 137707520} {"current_steps": 16820, "total_steps": 23217, "loss": 0.7418, "learning_rate": 8.795525514595032e-06, "epoch": 2.1734074169789377, "percentage": 72.45, "elapsed_time": "14:24:13", "remaining_time": "5:28:41", "throughput": "2657.28", "total_tokens": 137789440} {"current_steps": 16830, "total_steps": 23217, "loss": 0.9961, "learning_rate": 8.769780298378705e-06, "epoch": 2.174699573588319, "percentage": 72.49, "elapsed_time": "14:25:00", "remaining_time": "5:28:16", "throughput": "2656.44", "total_tokens": 137871360} {"current_steps": 16840, "total_steps": 23217, "loss": 0.5871, "learning_rate": 8.74406479963527e-06, "epoch": 2.1759917301977, "percentage": 72.53, "elapsed_time": "14:25:48", "remaining_time": "5:27:51", "throughput": "2655.60", "total_tokens": 137953280} {"current_steps": 16850, "total_steps": 23217, "loss": 1.1771, "learning_rate": 8.718379065449694e-06, "epoch": 2.177283886807081, "percentage": 72.58, "elapsed_time": "14:26:35", "remaining_time": "5:27:27", "throughput": "2654.76", "total_tokens": 138035200} {"current_steps": 16860, "total_steps": 23217, "loss": 0.5562, "learning_rate": 8.69272314285248e-06, "epoch": 2.178576043416462, "percentage": 72.62, "elapsed_time": "14:27:22", "remaining_time": "5:27:02", "throughput": "2653.93", "total_tokens": 138117120} {"current_steps": 16870, "total_steps": 23217, "loss": 1.0242, "learning_rate": 8.667097078819511e-06, "epoch": 2.179868200025843, "percentage": 72.66, "elapsed_time": "14:28:09", "remaining_time": "5:26:37", "throughput": "2653.10", "total_tokens": 138199040} {"current_steps": 16880, "total_steps": 23217, "loss": 0.8353, "learning_rate": 8.641500920272022e-06, "epoch": 2.1811603566352242, "percentage": 72.71, "elapsed_time": "14:28:56", "remaining_time": "5:26:12", "throughput": "2652.27", "total_tokens": 138280960} {"current_steps": 16890, "total_steps": 23217, "loss": 0.7933, "learning_rate": 8.6159347140765e-06, "epoch": 2.182452513244605, "percentage": 72.75, "elapsed_time": "14:29:44", "remaining_time": "5:25:48", "throughput": "2651.44", "total_tokens": 138362880} {"current_steps": 16900, "total_steps": 23217, "loss": 0.9106, "learning_rate": 8.59039850704455e-06, "epoch": 2.1837446698539864, "percentage": 72.79, "elapsed_time": "14:30:31", "remaining_time": "5:25:23", "throughput": "2650.61", "total_tokens": 138444800} {"current_steps": 16910, "total_steps": 23217, "loss": 0.9258, "learning_rate": 8.564892345932899e-06, "epoch": 2.1850368264633673, "percentage": 72.83, "elapsed_time": "14:31:18", "remaining_time": "5:24:58", "throughput": "2649.78", "total_tokens": 138526720} {"current_steps": 16920, "total_steps": 23217, "loss": 0.6456, "learning_rate": 8.539416277443218e-06, "epoch": 2.1863289830727486, "percentage": 72.88, "elapsed_time": "14:32:05", "remaining_time": "5:24:33", "throughput": "2648.96", "total_tokens": 138608640} {"current_steps": 16930, "total_steps": 23217, "loss": 0.7899, "learning_rate": 8.513970348222095e-06, "epoch": 2.1876211396821295, "percentage": 72.92, "elapsed_time": "14:32:53", "remaining_time": "5:24:08", "throughput": "2648.13", "total_tokens": 138690560} {"current_steps": 16940, "total_steps": 23217, "loss": 1.0066, "learning_rate": 8.488554604860947e-06, "epoch": 2.1889132962915103, "percentage": 72.96, "elapsed_time": "14:33:40", "remaining_time": "5:23:43", "throughput": "2647.30", "total_tokens": 138772480} {"current_steps": 16950, "total_steps": 23217, "loss": 0.5788, "learning_rate": 8.463169093895887e-06, "epoch": 2.1902054529008916, "percentage": 73.01, "elapsed_time": "14:34:27", "remaining_time": "5:23:19", "throughput": "2646.48", "total_tokens": 138854400} {"current_steps": 16960, "total_steps": 23217, "loss": 0.6761, "learning_rate": 8.437813861807712e-06, "epoch": 2.1914976095102725, "percentage": 73.05, "elapsed_time": "14:35:14", "remaining_time": "5:22:54", "throughput": "2645.66", "total_tokens": 138936320} {"current_steps": 16970, "total_steps": 23217, "loss": 1.3443, "learning_rate": 8.412488955021744e-06, "epoch": 2.192789766119654, "percentage": 73.09, "elapsed_time": "14:36:01", "remaining_time": "5:22:29", "throughput": "2644.84", "total_tokens": 139018240} {"current_steps": 16980, "total_steps": 23217, "loss": 0.8272, "learning_rate": 8.38719441990781e-06, "epoch": 2.1940819227290347, "percentage": 73.14, "elapsed_time": "14:36:49", "remaining_time": "5:22:04", "throughput": "2644.03", "total_tokens": 139100160} {"current_steps": 16990, "total_steps": 23217, "loss": 0.6814, "learning_rate": 8.361930302780091e-06, "epoch": 2.195374079338416, "percentage": 73.18, "elapsed_time": "14:37:36", "remaining_time": "5:21:39", "throughput": "2643.21", "total_tokens": 139182080} {"current_steps": 17000, "total_steps": 23217, "loss": 0.5844, "learning_rate": 8.336696649897116e-06, "epoch": 2.196666235947797, "percentage": 73.22, "elapsed_time": "14:38:23", "remaining_time": "5:21:14", "throughput": "2642.40", "total_tokens": 139264000} {"current_steps": 17010, "total_steps": 23217, "loss": 0.6501, "learning_rate": 8.311493507461593e-06, "epoch": 2.1979583925571777, "percentage": 73.27, "elapsed_time": "14:39:14", "remaining_time": "5:20:50", "throughput": "2641.38", "total_tokens": 139345920} {"current_steps": 17020, "total_steps": 23217, "loss": 0.6703, "learning_rate": 8.286320921620394e-06, "epoch": 2.199250549166559, "percentage": 73.31, "elapsed_time": "14:40:02", "remaining_time": "5:20:25", "throughput": "2640.57", "total_tokens": 139427840} {"current_steps": 17030, "total_steps": 23217, "loss": 0.83, "learning_rate": 8.261178938464422e-06, "epoch": 2.20054270577594, "percentage": 73.35, "elapsed_time": "14:40:49", "remaining_time": "5:20:00", "throughput": "2639.76", "total_tokens": 139509760} {"current_steps": 17040, "total_steps": 23217, "loss": 0.6316, "learning_rate": 8.236067604028563e-06, "epoch": 2.2018348623853212, "percentage": 73.39, "elapsed_time": "14:41:36", "remaining_time": "5:19:35", "throughput": "2638.95", "total_tokens": 139591680} {"current_steps": 17050, "total_steps": 23217, "loss": 0.7002, "learning_rate": 8.210986964291587e-06, "epoch": 2.203127018994702, "percentage": 73.44, "elapsed_time": "14:42:23", "remaining_time": "5:19:09", "throughput": "2638.14", "total_tokens": 139673600} {"current_steps": 17060, "total_steps": 23217, "loss": 0.9392, "learning_rate": 8.185937065176033e-06, "epoch": 2.2044191756040834, "percentage": 73.48, "elapsed_time": "14:43:11", "remaining_time": "5:18:44", "throughput": "2637.34", "total_tokens": 139755520} {"current_steps": 17070, "total_steps": 23217, "loss": 0.828, "learning_rate": 8.160917952548197e-06, "epoch": 2.2057113322134643, "percentage": 73.52, "elapsed_time": "14:43:58", "remaining_time": "5:18:19", "throughput": "2636.53", "total_tokens": 139837440} {"current_steps": 17080, "total_steps": 23217, "loss": 0.9871, "learning_rate": 8.13592967221796e-06, "epoch": 2.207003488822845, "percentage": 73.57, "elapsed_time": "14:44:45", "remaining_time": "5:17:54", "throughput": "2635.73", "total_tokens": 139919360} {"current_steps": 17090, "total_steps": 23217, "loss": 1.0047, "learning_rate": 8.110972269938793e-06, "epoch": 2.2082956454322265, "percentage": 73.61, "elapsed_time": "14:45:32", "remaining_time": "5:17:28", "throughput": "2634.93", "total_tokens": 140001280} {"current_steps": 17100, "total_steps": 23217, "loss": 1.1041, "learning_rate": 8.08604579140759e-06, "epoch": 2.2095878020416073, "percentage": 73.65, "elapsed_time": "14:46:20", "remaining_time": "5:17:03", "throughput": "2634.13", "total_tokens": 140083200} {"current_steps": 17110, "total_steps": 23217, "loss": 1.116, "learning_rate": 8.06115028226466e-06, "epoch": 2.2108799586509886, "percentage": 73.7, "elapsed_time": "14:47:07", "remaining_time": "5:16:38", "throughput": "2633.33", "total_tokens": 140165120} {"current_steps": 17120, "total_steps": 23217, "loss": 0.82, "learning_rate": 8.036285788093578e-06, "epoch": 2.2121721152603695, "percentage": 73.74, "elapsed_time": "14:47:54", "remaining_time": "5:16:12", "throughput": "2632.53", "total_tokens": 140247040} {"current_steps": 17130, "total_steps": 23217, "loss": 0.6641, "learning_rate": 8.011452354421136e-06, "epoch": 2.213464271869751, "percentage": 73.78, "elapsed_time": "14:48:41", "remaining_time": "5:15:47", "throughput": "2631.74", "total_tokens": 140328960} {"current_steps": 17140, "total_steps": 23217, "loss": 0.5812, "learning_rate": 7.986650026717277e-06, "epoch": 2.2147564284791317, "percentage": 73.83, "elapsed_time": "14:49:29", "remaining_time": "5:15:22", "throughput": "2630.94", "total_tokens": 140410880} {"current_steps": 17150, "total_steps": 23217, "loss": 0.8512, "learning_rate": 7.961878850394952e-06, "epoch": 2.2160485850885125, "percentage": 73.87, "elapsed_time": "14:50:16", "remaining_time": "5:14:56", "throughput": "2630.15", "total_tokens": 140492800} {"current_steps": 17160, "total_steps": 23217, "loss": 0.7622, "learning_rate": 7.937138870810115e-06, "epoch": 2.217340741697894, "percentage": 73.91, "elapsed_time": "14:51:03", "remaining_time": "5:14:31", "throughput": "2629.36", "total_tokens": 140574720} {"current_steps": 17170, "total_steps": 23217, "loss": 0.7604, "learning_rate": 7.912430133261562e-06, "epoch": 2.2186328983072747, "percentage": 73.95, "elapsed_time": "14:51:50", "remaining_time": "5:14:05", "throughput": "2628.57", "total_tokens": 140656640} {"current_steps": 17180, "total_steps": 23217, "loss": 0.7567, "learning_rate": 7.887752682990903e-06, "epoch": 2.219925054916656, "percentage": 74.0, "elapsed_time": "14:52:37", "remaining_time": "5:13:40", "throughput": "2627.78", "total_tokens": 140738560} {"current_steps": 17190, "total_steps": 23217, "loss": 1.0241, "learning_rate": 7.863106565182474e-06, "epoch": 2.221217211526037, "percentage": 74.04, "elapsed_time": "14:53:25", "remaining_time": "5:13:14", "throughput": "2626.99", "total_tokens": 140820480} {"current_steps": 17200, "total_steps": 23217, "loss": 0.8592, "learning_rate": 7.838491824963207e-06, "epoch": 2.222509368135418, "percentage": 74.08, "elapsed_time": "14:54:12", "remaining_time": "5:12:49", "throughput": "2626.21", "total_tokens": 140902400} {"current_steps": 17210, "total_steps": 23217, "loss": 0.9155, "learning_rate": 7.81390850740262e-06, "epoch": 2.223801524744799, "percentage": 74.13, "elapsed_time": "14:54:59", "remaining_time": "5:12:23", "throughput": "2625.42", "total_tokens": 140984320} {"current_steps": 17220, "total_steps": 23217, "loss": 1.1792, "learning_rate": 7.78935665751266e-06, "epoch": 2.22509368135418, "percentage": 74.17, "elapsed_time": "14:55:46", "remaining_time": "5:11:57", "throughput": "2624.65", "total_tokens": 141066240} {"current_steps": 17230, "total_steps": 23217, "loss": 0.7382, "learning_rate": 7.764836320247686e-06, "epoch": 2.2263858379635613, "percentage": 74.21, "elapsed_time": "14:56:34", "remaining_time": "5:11:32", "throughput": "2623.86", "total_tokens": 141148160} {"current_steps": 17240, "total_steps": 23217, "loss": 0.7866, "learning_rate": 7.740347540504336e-06, "epoch": 2.227677994572942, "percentage": 74.26, "elapsed_time": "14:57:21", "remaining_time": "5:11:06", "throughput": "2623.08", "total_tokens": 141230080} {"current_steps": 17250, "total_steps": 23217, "loss": 0.5538, "learning_rate": 7.715890363121484e-06, "epoch": 2.2289701511823234, "percentage": 74.3, "elapsed_time": "14:58:08", "remaining_time": "5:10:40", "throughput": "2622.30", "total_tokens": 141312000} {"current_steps": 17260, "total_steps": 23217, "loss": 0.7333, "learning_rate": 7.691464832880135e-06, "epoch": 2.2302623077917043, "percentage": 74.34, "elapsed_time": "14:58:55", "remaining_time": "5:10:15", "throughput": "2621.52", "total_tokens": 141393920} {"current_steps": 17270, "total_steps": 23217, "loss": 0.7558, "learning_rate": 7.667070994503334e-06, "epoch": 2.2315544644010856, "percentage": 74.39, "elapsed_time": "14:59:43", "remaining_time": "5:09:49", "throughput": "2620.75", "total_tokens": 141475840} {"current_steps": 17280, "total_steps": 23217, "loss": 0.4585, "learning_rate": 7.642708892656125e-06, "epoch": 2.2328466210104665, "percentage": 74.43, "elapsed_time": "15:00:30", "remaining_time": "5:09:23", "throughput": "2619.97", "total_tokens": 141557760} {"current_steps": 17290, "total_steps": 23217, "loss": 0.602, "learning_rate": 7.618378571945417e-06, "epoch": 2.2341387776198474, "percentage": 74.47, "elapsed_time": "15:01:17", "remaining_time": "5:08:57", "throughput": "2619.20", "total_tokens": 141639680} {"current_steps": 17300, "total_steps": 23217, "loss": 0.7789, "learning_rate": 7.5940800769199345e-06, "epoch": 2.2354309342292287, "percentage": 74.51, "elapsed_time": "15:02:04", "remaining_time": "5:08:31", "throughput": "2618.43", "total_tokens": 141721600} {"current_steps": 17310, "total_steps": 23217, "loss": 0.5047, "learning_rate": 7.569813452070146e-06, "epoch": 2.2367230908386095, "percentage": 74.56, "elapsed_time": "15:02:51", "remaining_time": "5:08:06", "throughput": "2617.65", "total_tokens": 141803520} {"current_steps": 17320, "total_steps": 23217, "loss": 0.6986, "learning_rate": 7.545578741828136e-06, "epoch": 2.238015247447991, "percentage": 74.6, "elapsed_time": "15:03:39", "remaining_time": "5:07:40", "throughput": "2616.88", "total_tokens": 141885440} {"current_steps": 17330, "total_steps": 23217, "loss": 0.8236, "learning_rate": 7.521375990567589e-06, "epoch": 2.2393074040573717, "percentage": 74.64, "elapsed_time": "15:04:26", "remaining_time": "5:07:14", "throughput": "2616.12", "total_tokens": 141967360} {"current_steps": 17340, "total_steps": 23217, "loss": 0.469, "learning_rate": 7.497205242603636e-06, "epoch": 2.2405995606667526, "percentage": 74.69, "elapsed_time": "15:05:13", "remaining_time": "5:06:48", "throughput": "2615.35", "total_tokens": 142049280} {"current_steps": 17350, "total_steps": 23217, "loss": 0.7266, "learning_rate": 7.4730665421928445e-06, "epoch": 2.241891717276134, "percentage": 74.73, "elapsed_time": "15:06:01", "remaining_time": "5:06:22", "throughput": "2614.58", "total_tokens": 142131200} {"current_steps": 17360, "total_steps": 23217, "loss": 1.0225, "learning_rate": 7.4489599335330704e-06, "epoch": 2.2431838738855148, "percentage": 74.77, "elapsed_time": "15:06:48", "remaining_time": "5:05:56", "throughput": "2613.81", "total_tokens": 142213120} {"current_steps": 17370, "total_steps": 23217, "loss": 0.5151, "learning_rate": 7.424885460763442e-06, "epoch": 2.244476030494896, "percentage": 74.82, "elapsed_time": "15:07:35", "remaining_time": "5:05:30", "throughput": "2613.05", "total_tokens": 142295040} {"current_steps": 17380, "total_steps": 23217, "loss": 0.5883, "learning_rate": 7.4008431679642165e-06, "epoch": 2.245768187104277, "percentage": 74.86, "elapsed_time": "15:08:22", "remaining_time": "5:05:04", "throughput": "2612.29", "total_tokens": 142376960} {"current_steps": 17390, "total_steps": 23217, "loss": 0.6615, "learning_rate": 7.3768330991567495e-06, "epoch": 2.2470603437136583, "percentage": 74.9, "elapsed_time": "15:09:09", "remaining_time": "5:04:38", "throughput": "2611.53", "total_tokens": 142458880} {"current_steps": 17400, "total_steps": 23217, "loss": 0.7732, "learning_rate": 7.3528552983033985e-06, "epoch": 2.248352500323039, "percentage": 74.95, "elapsed_time": "15:09:57", "remaining_time": "5:04:12", "throughput": "2610.78", "total_tokens": 142540800} {"current_steps": 17410, "total_steps": 23217, "loss": 0.954, "learning_rate": 7.328909809307413e-06, "epoch": 2.2496446569324204, "percentage": 74.99, "elapsed_time": "15:10:44", "remaining_time": "5:03:46", "throughput": "2610.02", "total_tokens": 142622720} {"current_steps": 17420, "total_steps": 23217, "loss": 0.5088, "learning_rate": 7.304996676012913e-06, "epoch": 2.2509368135418013, "percentage": 75.03, "elapsed_time": "15:11:35", "remaining_time": "5:03:21", "throughput": "2609.09", "total_tokens": 142704640} {"current_steps": 17430, "total_steps": 23217, "loss": 0.812, "learning_rate": 7.281115942204739e-06, "epoch": 2.252228970151182, "percentage": 75.07, "elapsed_time": "15:12:26", "remaining_time": "5:02:56", "throughput": "2608.13", "total_tokens": 142786560} {"current_steps": 17440, "total_steps": 23217, "loss": 0.9194, "learning_rate": 7.257267651608446e-06, "epoch": 2.2535211267605635, "percentage": 75.12, "elapsed_time": "15:13:19", "remaining_time": "5:02:32", "throughput": "2607.13", "total_tokens": 142868480} {"current_steps": 17450, "total_steps": 23217, "loss": 0.6278, "learning_rate": 7.233451847890149e-06, "epoch": 2.2548132833699444, "percentage": 75.16, "elapsed_time": "15:14:09", "remaining_time": "5:02:07", "throughput": "2606.24", "total_tokens": 142950400} {"current_steps": 17460, "total_steps": 23217, "loss": 0.7189, "learning_rate": 7.209668574656514e-06, "epoch": 2.2561054399793257, "percentage": 75.2, "elapsed_time": "15:15:01", "remaining_time": "5:01:42", "throughput": "2605.27", "total_tokens": 143032320} {"current_steps": 17470, "total_steps": 23217, "loss": 0.8608, "learning_rate": 7.185917875454615e-06, "epoch": 2.2573975965887065, "percentage": 75.25, "elapsed_time": "15:15:51", "remaining_time": "5:01:17", "throughput": "2604.35", "total_tokens": 143114240} {"current_steps": 17480, "total_steps": 23217, "loss": 0.8747, "learning_rate": 7.162199793771904e-06, "epoch": 2.2586897531980874, "percentage": 75.29, "elapsed_time": "15:16:41", "remaining_time": "5:00:51", "throughput": "2603.51", "total_tokens": 143196160} {"current_steps": 17490, "total_steps": 23217, "loss": 0.8996, "learning_rate": 7.138514373036098e-06, "epoch": 2.2599819098074687, "percentage": 75.33, "elapsed_time": "15:17:29", "remaining_time": "5:00:25", "throughput": "2602.71", "total_tokens": 143278080} {"current_steps": 17500, "total_steps": 23217, "loss": 0.6536, "learning_rate": 7.11486165661511e-06, "epoch": 2.2612740664168496, "percentage": 75.38, "elapsed_time": "15:18:17", "remaining_time": "4:59:59", "throughput": "2601.93", "total_tokens": 143360000} {"current_steps": 17510, "total_steps": 23217, "loss": 0.9105, "learning_rate": 7.091241687816988e-06, "epoch": 2.262566223026231, "percentage": 75.42, "elapsed_time": "15:19:08", "remaining_time": "4:59:34", "throughput": "2601.04", "total_tokens": 143441920} {"current_steps": 17520, "total_steps": 23217, "loss": 0.7303, "learning_rate": 7.0676545098897956e-06, "epoch": 2.2638583796356118, "percentage": 75.46, "elapsed_time": "15:20:00", "remaining_time": "4:59:09", "throughput": "2600.02", "total_tokens": 143523840} {"current_steps": 17530, "total_steps": 23217, "loss": 0.6937, "learning_rate": 7.044100166021583e-06, "epoch": 2.265150536244993, "percentage": 75.51, "elapsed_time": "15:20:52", "remaining_time": "4:58:44", "throughput": "2599.10", "total_tokens": 143605760} {"current_steps": 17540, "total_steps": 23217, "loss": 0.7094, "learning_rate": 7.020578699340255e-06, "epoch": 2.266442692854374, "percentage": 75.55, "elapsed_time": "15:21:42", "remaining_time": "4:58:19", "throughput": "2598.20", "total_tokens": 143687680} {"current_steps": 17550, "total_steps": 23217, "loss": 1.0294, "learning_rate": 6.997090152913535e-06, "epoch": 2.2677348494637553, "percentage": 75.59, "elapsed_time": "15:22:34", "remaining_time": "4:57:54", "throughput": "2597.26", "total_tokens": 143769600} {"current_steps": 17560, "total_steps": 23217, "loss": 0.5169, "learning_rate": 6.97363456974888e-06, "epoch": 2.269027006073136, "percentage": 75.63, "elapsed_time": "15:23:23", "remaining_time": "4:57:28", "throughput": "2596.41", "total_tokens": 143851520} {"current_steps": 17570, "total_steps": 23217, "loss": 0.8054, "learning_rate": 6.950211992793354e-06, "epoch": 2.270319162682517, "percentage": 75.68, "elapsed_time": "15:24:14", "remaining_time": "4:57:02", "throughput": "2595.54", "total_tokens": 143933440} {"current_steps": 17580, "total_steps": 23217, "loss": 1.089, "learning_rate": 6.92682246493363e-06, "epoch": 2.2716113192918983, "percentage": 75.72, "elapsed_time": "15:25:04", "remaining_time": "4:56:37", "throughput": "2594.65", "total_tokens": 144015360} {"current_steps": 17590, "total_steps": 23217, "loss": 0.5911, "learning_rate": 6.903466028995828e-06, "epoch": 2.272903475901279, "percentage": 75.76, "elapsed_time": "15:25:53", "remaining_time": "4:56:11", "throughput": "2593.86", "total_tokens": 144097280} {"current_steps": 17600, "total_steps": 23217, "loss": 0.4274, "learning_rate": 6.880142727745517e-06, "epoch": 2.2741956325106605, "percentage": 75.81, "elapsed_time": "15:26:40", "remaining_time": "4:55:44", "throughput": "2593.12", "total_tokens": 144179200} {"current_steps": 17610, "total_steps": 23217, "loss": 0.5875, "learning_rate": 6.856852603887556e-06, "epoch": 2.2754877891200413, "percentage": 75.85, "elapsed_time": "15:27:29", "remaining_time": "4:55:18", "throughput": "2592.30", "total_tokens": 144261120} {"current_steps": 17620, "total_steps": 23217, "loss": 1.0119, "learning_rate": 6.8335957000660925e-06, "epoch": 2.276779945729422, "percentage": 75.89, "elapsed_time": "15:28:24", "remaining_time": "4:54:54", "throughput": "2591.22", "total_tokens": 144343040} {"current_steps": 17630, "total_steps": 23217, "loss": 0.8559, "learning_rate": 6.810372058864429e-06, "epoch": 2.2780721023388035, "percentage": 75.94, "elapsed_time": "15:29:17", "remaining_time": "4:54:29", "throughput": "2590.25", "total_tokens": 144424960} {"current_steps": 17640, "total_steps": 23217, "loss": 0.9657, "learning_rate": 6.787181722804959e-06, "epoch": 2.2793642589481844, "percentage": 75.98, "elapsed_time": "15:30:10", "remaining_time": "4:54:04", "throughput": "2589.24", "total_tokens": 144506880} {"current_steps": 17650, "total_steps": 23217, "loss": 0.9287, "learning_rate": 6.764024734349117e-06, "epoch": 2.2806564155575657, "percentage": 76.02, "elapsed_time": "15:30:59", "remaining_time": "4:53:38", "throughput": "2588.42", "total_tokens": 144588800} {"current_steps": 17660, "total_steps": 23217, "loss": 0.8438, "learning_rate": 6.740901135897257e-06, "epoch": 2.2819485721669466, "percentage": 76.06, "elapsed_time": "15:31:50", "remaining_time": "4:53:13", "throughput": "2587.55", "total_tokens": 144670720} {"current_steps": 17670, "total_steps": 23217, "loss": 0.8497, "learning_rate": 6.717810969788596e-06, "epoch": 2.2832407287763274, "percentage": 76.11, "elapsed_time": "15:32:39", "remaining_time": "4:52:46", "throughput": "2586.75", "total_tokens": 144752640} {"current_steps": 17680, "total_steps": 23217, "loss": 0.8295, "learning_rate": 6.694754278301154e-06, "epoch": 2.2845328853857088, "percentage": 76.15, "elapsed_time": "15:33:30", "remaining_time": "4:52:21", "throughput": "2585.83", "total_tokens": 144834560} {"current_steps": 17690, "total_steps": 23217, "loss": 0.6225, "learning_rate": 6.671731103651641e-06, "epoch": 2.2858250419950896, "percentage": 76.19, "elapsed_time": "15:34:19", "remaining_time": "4:51:55", "throughput": "2585.05", "total_tokens": 144916480} {"current_steps": 17700, "total_steps": 23217, "loss": 0.7609, "learning_rate": 6.648741487995416e-06, "epoch": 2.287117198604471, "percentage": 76.24, "elapsed_time": "15:35:09", "remaining_time": "4:51:29", "throughput": "2584.21", "total_tokens": 144998400} {"current_steps": 17710, "total_steps": 23217, "loss": 0.9989, "learning_rate": 6.625785473426369e-06, "epoch": 2.288409355213852, "percentage": 76.28, "elapsed_time": "15:35:59", "remaining_time": "4:51:02", "throughput": "2583.38", "total_tokens": 145080320} {"current_steps": 17720, "total_steps": 23217, "loss": 0.9415, "learning_rate": 6.602863101976886e-06, "epoch": 2.289701511823233, "percentage": 76.32, "elapsed_time": "15:36:47", "remaining_time": "4:50:36", "throughput": "2582.64", "total_tokens": 145162240} {"current_steps": 17730, "total_steps": 23217, "loss": 0.8093, "learning_rate": 6.57997441561774e-06, "epoch": 2.290993668432614, "percentage": 76.37, "elapsed_time": "15:37:38", "remaining_time": "4:50:10", "throughput": "2581.72", "total_tokens": 145244160} {"current_steps": 17740, "total_steps": 23217, "loss": 0.6653, "learning_rate": 6.557119456258043e-06, "epoch": 2.2922858250419953, "percentage": 76.41, "elapsed_time": "15:38:28", "remaining_time": "4:49:44", "throughput": "2580.89", "total_tokens": 145326080} {"current_steps": 17750, "total_steps": 23217, "loss": 0.4557, "learning_rate": 6.534298265745128e-06, "epoch": 2.293577981651376, "percentage": 76.45, "elapsed_time": "15:39:17", "remaining_time": "4:49:18", "throughput": "2580.08", "total_tokens": 145408000} {"current_steps": 17760, "total_steps": 23217, "loss": 0.4692, "learning_rate": 6.511510885864516e-06, "epoch": 2.294870138260757, "percentage": 76.5, "elapsed_time": "15:40:08", "remaining_time": "4:48:52", "throughput": "2579.23", "total_tokens": 145489920} {"current_steps": 17770, "total_steps": 23217, "loss": 0.6354, "learning_rate": 6.4887573583398255e-06, "epoch": 2.2961622948701383, "percentage": 76.54, "elapsed_time": "15:40:58", "remaining_time": "4:48:25", "throughput": "2578.41", "total_tokens": 145571840} {"current_steps": 17780, "total_steps": 23217, "loss": 0.4408, "learning_rate": 6.466037724832666e-06, "epoch": 2.297454451479519, "percentage": 76.58, "elapsed_time": "15:41:47", "remaining_time": "4:47:59", "throughput": "2577.62", "total_tokens": 145653760} {"current_steps": 17790, "total_steps": 23217, "loss": 0.9355, "learning_rate": 6.44335202694262e-06, "epoch": 2.2987466080889005, "percentage": 76.62, "elapsed_time": "15:42:35", "remaining_time": "4:47:32", "throughput": "2576.84", "total_tokens": 145735680} {"current_steps": 17800, "total_steps": 23217, "loss": 1.1966, "learning_rate": 6.420700306207103e-06, "epoch": 2.3000387646982814, "percentage": 76.67, "elapsed_time": "15:43:33", "remaining_time": "4:47:08", "throughput": "2575.69", "total_tokens": 145817600} {"current_steps": 17810, "total_steps": 23217, "loss": 0.3919, "learning_rate": 6.3980826041013464e-06, "epoch": 2.3013309213076623, "percentage": 76.71, "elapsed_time": "15:44:30", "remaining_time": "4:46:44", "throughput": "2574.51", "total_tokens": 145899520} {"current_steps": 17820, "total_steps": 23217, "loss": 0.9223, "learning_rate": 6.375498962038265e-06, "epoch": 2.3026230779170436, "percentage": 76.75, "elapsed_time": "15:45:18", "remaining_time": "4:46:17", "throughput": "2573.78", "total_tokens": 145981440} {"current_steps": 17830, "total_steps": 23217, "loss": 0.5995, "learning_rate": 6.35294942136844e-06, "epoch": 2.3039152345264244, "percentage": 76.8, "elapsed_time": "15:46:06", "remaining_time": "4:45:50", "throughput": "2573.05", "total_tokens": 146063360} {"current_steps": 17840, "total_steps": 23217, "loss": 0.6963, "learning_rate": 6.3304340233799805e-06, "epoch": 2.3052073911358058, "percentage": 76.84, "elapsed_time": "15:46:53", "remaining_time": "4:45:23", "throughput": "2572.35", "total_tokens": 146145280} {"current_steps": 17850, "total_steps": 23217, "loss": 0.6846, "learning_rate": 6.307952809298517e-06, "epoch": 2.3064995477451866, "percentage": 76.88, "elapsed_time": "15:47:41", "remaining_time": "4:44:56", "throughput": "2571.63", "total_tokens": 146227200} {"current_steps": 17860, "total_steps": 23217, "loss": 0.542, "learning_rate": 6.28550582028706e-06, "epoch": 2.307791704354568, "percentage": 76.93, "elapsed_time": "15:48:29", "remaining_time": "4:44:29", "throughput": "2570.93", "total_tokens": 146309120} {"current_steps": 17870, "total_steps": 23217, "loss": 0.9602, "learning_rate": 6.263093097445957e-06, "epoch": 2.309083860963949, "percentage": 76.97, "elapsed_time": "15:49:16", "remaining_time": "4:44:02", "throughput": "2570.21", "total_tokens": 146391040} {"current_steps": 17880, "total_steps": 23217, "loss": 0.8196, "learning_rate": 6.240714681812837e-06, "epoch": 2.31037601757333, "percentage": 77.01, "elapsed_time": "15:50:04", "remaining_time": "4:43:35", "throughput": "2569.51", "total_tokens": 146472960} {"current_steps": 17890, "total_steps": 23217, "loss": 0.6883, "learning_rate": 6.218370614362484e-06, "epoch": 2.311668174182711, "percentage": 77.06, "elapsed_time": "15:50:52", "remaining_time": "4:43:08", "throughput": "2568.78", "total_tokens": 146554880} {"current_steps": 17900, "total_steps": 23217, "loss": 0.5604, "learning_rate": 6.196060936006817e-06, "epoch": 2.312960330792092, "percentage": 77.1, "elapsed_time": "15:51:40", "remaining_time": "4:42:41", "throughput": "2568.05", "total_tokens": 146636800} {"current_steps": 17910, "total_steps": 23217, "loss": 1.045, "learning_rate": 6.173785687594761e-06, "epoch": 2.314252487401473, "percentage": 77.14, "elapsed_time": "15:52:28", "remaining_time": "4:42:13", "throughput": "2567.34", "total_tokens": 146718720} {"current_steps": 17920, "total_steps": 23217, "loss": 0.8279, "learning_rate": 6.1515449099122185e-06, "epoch": 2.315544644010854, "percentage": 77.18, "elapsed_time": "15:53:16", "remaining_time": "4:41:46", "throughput": "2566.62", "total_tokens": 146800640} {"current_steps": 17930, "total_steps": 23217, "loss": 1.0301, "learning_rate": 6.129338643681984e-06, "epoch": 2.3168368006202353, "percentage": 77.23, "elapsed_time": "15:54:03", "remaining_time": "4:41:19", "throughput": "2565.92", "total_tokens": 146882560} {"current_steps": 17940, "total_steps": 23217, "loss": 0.6595, "learning_rate": 6.107166929563629e-06, "epoch": 2.318128957229616, "percentage": 77.27, "elapsed_time": "15:54:51", "remaining_time": "4:40:52", "throughput": "2565.22", "total_tokens": 146964480} {"current_steps": 17950, "total_steps": 23217, "loss": 0.672, "learning_rate": 6.085029808153503e-06, "epoch": 2.319421113838997, "percentage": 77.31, "elapsed_time": "15:55:38", "remaining_time": "4:40:24", "throughput": "2564.53", "total_tokens": 147046400} {"current_steps": 17960, "total_steps": 23217, "loss": 0.7306, "learning_rate": 6.062927319984576e-06, "epoch": 2.3207132704483784, "percentage": 77.36, "elapsed_time": "15:56:26", "remaining_time": "4:39:57", "throughput": "2563.81", "total_tokens": 147128320} {"current_steps": 17970, "total_steps": 23217, "loss": 1.0703, "learning_rate": 6.040859505526439e-06, "epoch": 2.3220054270577593, "percentage": 77.4, "elapsed_time": "15:57:14", "remaining_time": "4:39:29", "throughput": "2563.12", "total_tokens": 147210240} {"current_steps": 17980, "total_steps": 23217, "loss": 0.9107, "learning_rate": 6.018826405185163e-06, "epoch": 2.3232975836671406, "percentage": 77.44, "elapsed_time": "15:58:01", "remaining_time": "4:39:02", "throughput": "2562.41", "total_tokens": 147292160} {"current_steps": 17990, "total_steps": 23217, "loss": 0.9921, "learning_rate": 5.99682805930328e-06, "epoch": 2.3245897402765214, "percentage": 77.49, "elapsed_time": "15:58:50", "remaining_time": "4:38:35", "throughput": "2561.66", "total_tokens": 147374080} {"current_steps": 18000, "total_steps": 23217, "loss": 1.121, "learning_rate": 5.974864508159692e-06, "epoch": 2.3258818968859027, "percentage": 77.53, "elapsed_time": "15:59:39", "remaining_time": "4:38:08", "throughput": "2560.92", "total_tokens": 147456000} {"current_steps": 18010, "total_steps": 23217, "loss": 0.7416, "learning_rate": 5.952935791969574e-06, "epoch": 2.3271740534952836, "percentage": 77.57, "elapsed_time": "16:00:32", "remaining_time": "4:37:42", "throughput": "2559.98", "total_tokens": 147537920} {"current_steps": 18020, "total_steps": 23217, "loss": 0.8224, "learning_rate": 5.931041950884314e-06, "epoch": 2.328466210104665, "percentage": 77.62, "elapsed_time": "16:01:20", "remaining_time": "4:37:15", "throughput": "2559.26", "total_tokens": 147619840} {"current_steps": 18030, "total_steps": 23217, "loss": 0.4575, "learning_rate": 5.9091830249914685e-06, "epoch": 2.329758366714046, "percentage": 77.66, "elapsed_time": "16:02:09", "remaining_time": "4:36:48", "throughput": "2558.50", "total_tokens": 147701760} {"current_steps": 18040, "total_steps": 23217, "loss": 0.8888, "learning_rate": 5.887359054314648e-06, "epoch": 2.3310505233234267, "percentage": 77.7, "elapsed_time": "16:02:58", "remaining_time": "4:36:20", "throughput": "2557.75", "total_tokens": 147783680} {"current_steps": 18050, "total_steps": 23217, "loss": 1.0576, "learning_rate": 5.8655700788134535e-06, "epoch": 2.332342679932808, "percentage": 77.74, "elapsed_time": "16:03:46", "remaining_time": "4:35:53", "throughput": "2557.05", "total_tokens": 147865600} {"current_steps": 18060, "total_steps": 23217, "loss": 0.967, "learning_rate": 5.843816138383429e-06, "epoch": 2.333634836542189, "percentage": 77.79, "elapsed_time": "16:04:34", "remaining_time": "4:35:26", "throughput": "2556.33", "total_tokens": 147947520} {"current_steps": 18070, "total_steps": 23217, "loss": 0.5175, "learning_rate": 5.822097272855964e-06, "epoch": 2.33492699315157, "percentage": 77.83, "elapsed_time": "16:05:23", "remaining_time": "4:34:58", "throughput": "2555.60", "total_tokens": 148029440} {"current_steps": 18080, "total_steps": 23217, "loss": 0.8177, "learning_rate": 5.800413521998208e-06, "epoch": 2.336219149760951, "percentage": 77.87, "elapsed_time": "16:06:11", "remaining_time": "4:34:31", "throughput": "2554.90", "total_tokens": 148111360} {"current_steps": 18090, "total_steps": 23217, "loss": 0.9179, "learning_rate": 5.778764925513045e-06, "epoch": 2.337511306370332, "percentage": 77.92, "elapsed_time": "16:07:00", "remaining_time": "4:34:03", "throughput": "2554.17", "total_tokens": 148193280} {"current_steps": 18100, "total_steps": 23217, "loss": 0.9355, "learning_rate": 5.7571515230389586e-06, "epoch": 2.338803462979713, "percentage": 77.96, "elapsed_time": "16:07:49", "remaining_time": "4:33:36", "throughput": "2553.42", "total_tokens": 148275200} {"current_steps": 18110, "total_steps": 23217, "loss": 0.9177, "learning_rate": 5.7355733541500285e-06, "epoch": 2.340095619589094, "percentage": 78.0, "elapsed_time": "16:08:39", "remaining_time": "4:33:09", "throughput": "2552.63", "total_tokens": 148357120} {"current_steps": 18120, "total_steps": 23217, "loss": 0.8673, "learning_rate": 5.714030458355784e-06, "epoch": 2.3413877761984754, "percentage": 78.05, "elapsed_time": "16:09:27", "remaining_time": "4:32:42", "throughput": "2551.91", "total_tokens": 148439040} {"current_steps": 18130, "total_steps": 23217, "loss": 0.8191, "learning_rate": 5.692522875101203e-06, "epoch": 2.3426799328078562, "percentage": 78.09, "elapsed_time": "16:10:15", "remaining_time": "4:32:14", "throughput": "2551.21", "total_tokens": 148520960} {"current_steps": 18140, "total_steps": 23217, "loss": 0.4773, "learning_rate": 5.67105064376659e-06, "epoch": 2.3439720894172376, "percentage": 78.13, "elapsed_time": "16:11:03", "remaining_time": "4:31:46", "throughput": "2550.51", "total_tokens": 148602880} {"current_steps": 18150, "total_steps": 23217, "loss": 0.8423, "learning_rate": 5.649613803667511e-06, "epoch": 2.3452642460266184, "percentage": 78.18, "elapsed_time": "16:11:53", "remaining_time": "4:31:19", "throughput": "2549.76", "total_tokens": 148684800} {"current_steps": 18160, "total_steps": 23217, "loss": 0.7039, "learning_rate": 5.628212394054758e-06, "epoch": 2.3465564026359993, "percentage": 78.22, "elapsed_time": "16:12:41", "remaining_time": "4:30:51", "throughput": "2549.04", "total_tokens": 148766720} {"current_steps": 18170, "total_steps": 23217, "loss": 0.4886, "learning_rate": 5.606846454114218e-06, "epoch": 2.3478485592453806, "percentage": 78.26, "elapsed_time": "16:13:30", "remaining_time": "4:30:24", "throughput": "2548.31", "total_tokens": 148848640} {"current_steps": 18180, "total_steps": 23217, "loss": 0.8072, "learning_rate": 5.5855160229668636e-06, "epoch": 2.3491407158547615, "percentage": 78.3, "elapsed_time": "16:14:18", "remaining_time": "4:29:56", "throughput": "2547.63", "total_tokens": 148930560} {"current_steps": 18190, "total_steps": 23217, "loss": 0.7343, "learning_rate": 5.564221139668621e-06, "epoch": 2.350432872464143, "percentage": 78.35, "elapsed_time": "16:15:07", "remaining_time": "4:29:29", "throughput": "2546.89", "total_tokens": 149012480} {"current_steps": 18200, "total_steps": 23217, "loss": 1.1034, "learning_rate": 5.542961843210359e-06, "epoch": 2.3517250290735237, "percentage": 78.39, "elapsed_time": "16:15:56", "remaining_time": "4:29:01", "throughput": "2546.17", "total_tokens": 149094400} {"current_steps": 18210, "total_steps": 23217, "loss": 0.7438, "learning_rate": 5.5217381725177624e-06, "epoch": 2.353017185682905, "percentage": 78.43, "elapsed_time": "16:16:44", "remaining_time": "4:28:33", "throughput": "2545.48", "total_tokens": 149176320} {"current_steps": 18220, "total_steps": 23217, "loss": 0.6506, "learning_rate": 5.50055016645129e-06, "epoch": 2.354309342292286, "percentage": 78.48, "elapsed_time": "16:17:31", "remaining_time": "4:28:05", "throughput": "2544.81", "total_tokens": 149258240} {"current_steps": 18230, "total_steps": 23217, "loss": 0.7191, "learning_rate": 5.479397863806115e-06, "epoch": 2.3556014989016667, "percentage": 78.52, "elapsed_time": "16:18:19", "remaining_time": "4:27:37", "throughput": "2544.15", "total_tokens": 149340160} {"current_steps": 18240, "total_steps": 23217, "loss": 0.8379, "learning_rate": 5.458281303312016e-06, "epoch": 2.356893655511048, "percentage": 78.56, "elapsed_time": "16:19:07", "remaining_time": "4:27:09", "throughput": "2543.48", "total_tokens": 149422080} {"current_steps": 18250, "total_steps": 23217, "loss": 0.388, "learning_rate": 5.437200523633348e-06, "epoch": 2.358185812120429, "percentage": 78.61, "elapsed_time": "16:19:54", "remaining_time": "4:26:41", "throughput": "2542.82", "total_tokens": 149504000} {"current_steps": 18260, "total_steps": 23217, "loss": 1.0104, "learning_rate": 5.41615556336893e-06, "epoch": 2.35947796872981, "percentage": 78.65, "elapsed_time": "16:20:42", "remaining_time": "4:26:13", "throughput": "2542.16", "total_tokens": 149585920} {"current_steps": 18270, "total_steps": 23217, "loss": 0.7642, "learning_rate": 5.39514646105202e-06, "epoch": 2.360770125339191, "percentage": 78.69, "elapsed_time": "16:21:29", "remaining_time": "4:25:45", "throughput": "2541.50", "total_tokens": 149667840} {"current_steps": 18280, "total_steps": 23217, "loss": 0.6885, "learning_rate": 5.374173255150194e-06, "epoch": 2.362062281948572, "percentage": 78.74, "elapsed_time": "16:22:17", "remaining_time": "4:25:17", "throughput": "2540.84", "total_tokens": 149749760} {"current_steps": 18290, "total_steps": 23217, "loss": 0.6808, "learning_rate": 5.353235984065321e-06, "epoch": 2.3633544385579532, "percentage": 78.78, "elapsed_time": "16:23:04", "remaining_time": "4:24:49", "throughput": "2540.18", "total_tokens": 149831680} {"current_steps": 18300, "total_steps": 23217, "loss": 0.7185, "learning_rate": 5.332334686133475e-06, "epoch": 2.364646595167334, "percentage": 78.82, "elapsed_time": "16:23:52", "remaining_time": "4:24:21", "throughput": "2539.52", "total_tokens": 149913600} {"current_steps": 18310, "total_steps": 23217, "loss": 0.8391, "learning_rate": 5.311469399624844e-06, "epoch": 2.3659387517767154, "percentage": 78.86, "elapsed_time": "16:24:41", "remaining_time": "4:23:53", "throughput": "2538.78", "total_tokens": 149995520} {"current_steps": 18320, "total_steps": 23217, "loss": 0.6135, "learning_rate": 5.290640162743704e-06, "epoch": 2.3672309083860963, "percentage": 78.91, "elapsed_time": "16:25:40", "remaining_time": "4:23:28", "throughput": "2537.66", "total_tokens": 150077440} {"current_steps": 18330, "total_steps": 23217, "loss": 0.9426, "learning_rate": 5.269847013628299e-06, "epoch": 2.3685230649954776, "percentage": 78.95, "elapsed_time": "16:26:35", "remaining_time": "4:23:02", "throughput": "2536.67", "total_tokens": 150159360} {"current_steps": 18340, "total_steps": 23217, "loss": 0.9153, "learning_rate": 5.24908999035082e-06, "epoch": 2.3698152216048585, "percentage": 78.99, "elapsed_time": "16:27:36", "remaining_time": "4:22:37", "throughput": "2535.45", "total_tokens": 150241280} {"current_steps": 18350, "total_steps": 23217, "loss": 0.4039, "learning_rate": 5.228369130917288e-06, "epoch": 2.37110737821424, "percentage": 79.04, "elapsed_time": "16:28:27", "remaining_time": "4:22:10", "throughput": "2534.66", "total_tokens": 150323200} {"current_steps": 18360, "total_steps": 23217, "loss": 0.573, "learning_rate": 5.207684473267527e-06, "epoch": 2.3723995348236206, "percentage": 79.08, "elapsed_time": "16:29:16", "remaining_time": "4:21:42", "throughput": "2533.93", "total_tokens": 150405120} {"current_steps": 18370, "total_steps": 23217, "loss": 1.009, "learning_rate": 5.187036055275077e-06, "epoch": 2.3736916914330015, "percentage": 79.12, "elapsed_time": "16:30:08", "remaining_time": "4:21:15", "throughput": "2533.10", "total_tokens": 150487040} {"current_steps": 18380, "total_steps": 23217, "loss": 0.6435, "learning_rate": 5.16642391474711e-06, "epoch": 2.374983848042383, "percentage": 79.17, "elapsed_time": "16:31:10", "remaining_time": "4:20:50", "throughput": "2531.84", "total_tokens": 150568960} {"current_steps": 18390, "total_steps": 23217, "loss": 0.884, "learning_rate": 5.145848089424374e-06, "epoch": 2.3762760046517637, "percentage": 79.21, "elapsed_time": "16:32:01", "remaining_time": "4:20:23", "throughput": "2531.04", "total_tokens": 150650880} {"current_steps": 18400, "total_steps": 23217, "loss": 0.7895, "learning_rate": 5.125308616981139e-06, "epoch": 2.377568161261145, "percentage": 79.25, "elapsed_time": "16:32:57", "remaining_time": "4:19:56", "throughput": "2530.04", "total_tokens": 150732800} {"current_steps": 18410, "total_steps": 23217, "loss": 0.971, "learning_rate": 5.1048055350251e-06, "epoch": 2.378860317870526, "percentage": 79.3, "elapsed_time": "16:33:46", "remaining_time": "4:19:28", "throughput": "2529.34", "total_tokens": 150814720} {"current_steps": 18420, "total_steps": 23217, "loss": 0.5018, "learning_rate": 5.0843388810973195e-06, "epoch": 2.3801524744799067, "percentage": 79.34, "elapsed_time": "16:34:33", "remaining_time": "4:19:00", "throughput": "2528.68", "total_tokens": 150896640} {"current_steps": 18430, "total_steps": 23217, "loss": 0.953, "learning_rate": 5.06390869267217e-06, "epoch": 2.381444631089288, "percentage": 79.38, "elapsed_time": "16:35:22", "remaining_time": "4:18:32", "throughput": "2528.01", "total_tokens": 150978560} {"current_steps": 18440, "total_steps": 23217, "loss": 1.2336, "learning_rate": 5.043515007157263e-06, "epoch": 2.382736787698669, "percentage": 79.42, "elapsed_time": "16:36:16", "remaining_time": "4:18:05", "throughput": "2527.09", "total_tokens": 151060480} {"current_steps": 18450, "total_steps": 23217, "loss": 0.6531, "learning_rate": 5.02315786189334e-06, "epoch": 2.3840289443080502, "percentage": 79.47, "elapsed_time": "16:37:12", "remaining_time": "4:17:39", "throughput": "2526.11", "total_tokens": 151142400} {"current_steps": 18460, "total_steps": 23217, "loss": 0.7825, "learning_rate": 5.002837294154283e-06, "epoch": 2.385321100917431, "percentage": 79.51, "elapsed_time": "16:38:05", "remaining_time": "4:17:12", "throughput": "2525.21", "total_tokens": 151224320} {"current_steps": 18470, "total_steps": 23217, "loss": 0.7779, "learning_rate": 4.982553341146956e-06, "epoch": 2.3866132575268124, "percentage": 79.55, "elapsed_time": "16:39:10", "remaining_time": "4:16:47", "throughput": "2523.87", "total_tokens": 151306240} {"current_steps": 18480, "total_steps": 23217, "loss": 0.9538, "learning_rate": 4.962306040011222e-06, "epoch": 2.3879054141361933, "percentage": 79.6, "elapsed_time": "16:40:03", "remaining_time": "4:16:20", "throughput": "2523.00", "total_tokens": 151388160} {"current_steps": 18490, "total_steps": 23217, "loss": 1.0866, "learning_rate": 4.942095427819796e-06, "epoch": 2.3891975707455746, "percentage": 79.64, "elapsed_time": "16:40:54", "remaining_time": "4:15:52", "throughput": "2522.22", "total_tokens": 151470080} {"current_steps": 18500, "total_steps": 23217, "loss": 0.8085, "learning_rate": 4.921921541578248e-06, "epoch": 2.3904897273549555, "percentage": 79.68, "elapsed_time": "16:41:48", "remaining_time": "4:15:26", "throughput": "2521.29", "total_tokens": 151552000} {"current_steps": 18510, "total_steps": 23217, "loss": 0.8541, "learning_rate": 4.901784418224892e-06, "epoch": 2.3917818839643363, "percentage": 79.73, "elapsed_time": "16:42:36", "remaining_time": "4:14:57", "throughput": "2520.65", "total_tokens": 151633920} {"current_steps": 18520, "total_steps": 23217, "loss": 0.6467, "learning_rate": 4.881684094630712e-06, "epoch": 2.3930740405737176, "percentage": 79.77, "elapsed_time": "16:43:25", "remaining_time": "4:14:29", "throughput": "2519.97", "total_tokens": 151715840} {"current_steps": 18530, "total_steps": 23217, "loss": 0.7586, "learning_rate": 4.861620607599346e-06, "epoch": 2.3943661971830985, "percentage": 79.81, "elapsed_time": "16:44:14", "remaining_time": "4:14:00", "throughput": "2519.27", "total_tokens": 151797760} {"current_steps": 18540, "total_steps": 23217, "loss": 0.853, "learning_rate": 4.841593993866949e-06, "epoch": 2.39565835379248, "percentage": 79.86, "elapsed_time": "16:45:07", "remaining_time": "4:13:33", "throughput": "2518.41", "total_tokens": 151879680} {"current_steps": 18550, "total_steps": 23217, "loss": 1.02, "learning_rate": 4.821604290102191e-06, "epoch": 2.3969505104018607, "percentage": 79.9, "elapsed_time": "16:46:11", "remaining_time": "4:13:08", "throughput": "2517.11", "total_tokens": 151961600} {"current_steps": 18560, "total_steps": 23217, "loss": 0.8047, "learning_rate": 4.801651532906135e-06, "epoch": 2.3982426670112416, "percentage": 79.94, "elapsed_time": "16:47:09", "remaining_time": "4:12:42", "throughput": "2516.06", "total_tokens": 152043520} {"current_steps": 18570, "total_steps": 23217, "loss": 0.9561, "learning_rate": 4.781735758812217e-06, "epoch": 2.399534823620623, "percentage": 79.98, "elapsed_time": "16:48:05", "remaining_time": "4:12:16", "throughput": "2515.05", "total_tokens": 152125440} {"current_steps": 18580, "total_steps": 23217, "loss": 0.6804, "learning_rate": 4.761857004286141e-06, "epoch": 2.4008269802300037, "percentage": 80.03, "elapsed_time": "16:49:02", "remaining_time": "4:11:49", "throughput": "2514.08", "total_tokens": 152207360} {"current_steps": 18590, "total_steps": 23217, "loss": 0.9148, "learning_rate": 4.742015305725828e-06, "epoch": 2.402119136839385, "percentage": 80.07, "elapsed_time": "16:50:02", "remaining_time": "4:11:23", "throughput": "2512.90", "total_tokens": 152289280} {"current_steps": 18600, "total_steps": 23217, "loss": 0.6088, "learning_rate": 4.7222106994613655e-06, "epoch": 2.403411293448766, "percentage": 80.11, "elapsed_time": "16:51:02", "remaining_time": "4:10:57", "throughput": "2511.79", "total_tokens": 152371200} {"current_steps": 18610, "total_steps": 23217, "loss": 0.7719, "learning_rate": 4.702443221754904e-06, "epoch": 2.4047034500581472, "percentage": 80.16, "elapsed_time": "16:52:03", "remaining_time": "4:10:32", "throughput": "2510.63", "total_tokens": 152453120} {"current_steps": 18620, "total_steps": 23217, "loss": 0.8772, "learning_rate": 4.6827129088006375e-06, "epoch": 2.405995606667528, "percentage": 80.2, "elapsed_time": "16:52:56", "remaining_time": "4:10:04", "throughput": "2509.75", "total_tokens": 152535040} {"current_steps": 18630, "total_steps": 23217, "loss": 0.7122, "learning_rate": 4.663019796724685e-06, "epoch": 2.4072877632769094, "percentage": 80.24, "elapsed_time": "16:53:47", "remaining_time": "4:09:36", "throughput": "2509.03", "total_tokens": 152616960} {"current_steps": 18640, "total_steps": 23217, "loss": 1.0226, "learning_rate": 4.6433639215850696e-06, "epoch": 2.4085799198862903, "percentage": 80.29, "elapsed_time": "16:54:39", "remaining_time": "4:09:08", "throughput": "2508.23", "total_tokens": 152698880} {"current_steps": 18650, "total_steps": 23217, "loss": 0.6679, "learning_rate": 4.623745319371617e-06, "epoch": 2.409872076495671, "percentage": 80.33, "elapsed_time": "16:55:28", "remaining_time": "4:08:40", "throughput": "2507.53", "total_tokens": 152780800} {"current_steps": 18660, "total_steps": 23217, "loss": 1.0588, "learning_rate": 4.604164026005925e-06, "epoch": 2.4111642331050525, "percentage": 80.37, "elapsed_time": "16:56:16", "remaining_time": "4:08:11", "throughput": "2506.92", "total_tokens": 152862720} {"current_steps": 18670, "total_steps": 23217, "loss": 0.8622, "learning_rate": 4.584620077341273e-06, "epoch": 2.4124563897144333, "percentage": 80.42, "elapsed_time": "16:57:07", "remaining_time": "4:07:43", "throughput": "2506.15", "total_tokens": 152944640} {"current_steps": 18680, "total_steps": 23217, "loss": 0.9585, "learning_rate": 4.565113509162547e-06, "epoch": 2.4137485463238146, "percentage": 80.46, "elapsed_time": "16:58:01", "remaining_time": "4:07:15", "throughput": "2505.30", "total_tokens": 153026560} {"current_steps": 18690, "total_steps": 23217, "loss": 0.5105, "learning_rate": 4.5456443571862185e-06, "epoch": 2.4150407029331955, "percentage": 80.5, "elapsed_time": "16:58:54", "remaining_time": "4:06:47", "throughput": "2504.46", "total_tokens": 153108480} {"current_steps": 18700, "total_steps": 23217, "loss": 0.7058, "learning_rate": 4.5262126570602135e-06, "epoch": 2.4163328595425764, "percentage": 80.54, "elapsed_time": "16:59:46", "remaining_time": "4:06:19", "throughput": "2503.64", "total_tokens": 153190400} {"current_steps": 18710, "total_steps": 23217, "loss": 0.7815, "learning_rate": 4.506818444363925e-06, "epoch": 2.4176250161519577, "percentage": 80.59, "elapsed_time": "17:00:40", "remaining_time": "4:05:51", "throughput": "2502.81", "total_tokens": 153272320} {"current_steps": 18720, "total_steps": 23217, "loss": 0.6579, "learning_rate": 4.487461754608066e-06, "epoch": 2.4189171727613386, "percentage": 80.63, "elapsed_time": "17:01:34", "remaining_time": "4:05:24", "throughput": "2501.93", "total_tokens": 153354240} {"current_steps": 18730, "total_steps": 23217, "loss": 0.5656, "learning_rate": 4.468142623234678e-06, "epoch": 2.42020932937072, "percentage": 80.67, "elapsed_time": "17:02:25", "remaining_time": "4:04:56", "throughput": "2501.17", "total_tokens": 153436160} {"current_steps": 18740, "total_steps": 23217, "loss": 0.9916, "learning_rate": 4.448861085617018e-06, "epoch": 2.4215014859801007, "percentage": 80.72, "elapsed_time": "17:03:18", "remaining_time": "4:04:28", "throughput": "2500.35", "total_tokens": 153518080} {"current_steps": 18750, "total_steps": 23217, "loss": 0.3525, "learning_rate": 4.429617177059508e-06, "epoch": 2.4227936425894816, "percentage": 80.76, "elapsed_time": "17:04:10", "remaining_time": "4:03:59", "throughput": "2499.57", "total_tokens": 153600000} {"current_steps": 18760, "total_steps": 23217, "loss": 0.912, "learning_rate": 4.410410932797671e-06, "epoch": 2.424085799198863, "percentage": 80.8, "elapsed_time": "17:05:06", "remaining_time": "4:03:32", "throughput": "2498.64", "total_tokens": 153681920} {"current_steps": 18770, "total_steps": 23217, "loss": 0.8084, "learning_rate": 4.391242387998079e-06, "epoch": 2.425377955808244, "percentage": 80.85, "elapsed_time": "17:05:58", "remaining_time": "4:03:04", "throughput": "2497.86", "total_tokens": 153763840} {"current_steps": 18780, "total_steps": 23217, "loss": 0.8788, "learning_rate": 4.372111577758261e-06, "epoch": 2.426670112417625, "percentage": 80.89, "elapsed_time": "17:06:54", "remaining_time": "4:02:37", "throughput": "2496.90", "total_tokens": 153845760} {"current_steps": 18790, "total_steps": 23217, "loss": 0.8239, "learning_rate": 4.353018537106657e-06, "epoch": 2.427962269027006, "percentage": 80.93, "elapsed_time": "17:07:53", "remaining_time": "4:02:10", "throughput": "2495.86", "total_tokens": 153927680} {"current_steps": 18800, "total_steps": 23217, "loss": 0.6755, "learning_rate": 4.333963301002558e-06, "epoch": 2.4292544256363873, "percentage": 80.98, "elapsed_time": "17:08:48", "remaining_time": "4:01:42", "throughput": "2494.97", "total_tokens": 154009600} {"current_steps": 18810, "total_steps": 23217, "loss": 0.8883, "learning_rate": 4.314945904336037e-06, "epoch": 2.430546582245768, "percentage": 81.02, "elapsed_time": "17:09:43", "remaining_time": "4:01:15", "throughput": "2494.06", "total_tokens": 154091520} {"current_steps": 18820, "total_steps": 23217, "loss": 0.9761, "learning_rate": 4.295966381927871e-06, "epoch": 2.4318387388551495, "percentage": 81.06, "elapsed_time": "17:10:36", "remaining_time": "4:00:47", "throughput": "2493.23", "total_tokens": 154173440} {"current_steps": 18830, "total_steps": 23217, "loss": 0.7079, "learning_rate": 4.2770247685295e-06, "epoch": 2.4331308954645303, "percentage": 81.1, "elapsed_time": "17:11:29", "remaining_time": "4:00:19", "throughput": "2492.41", "total_tokens": 154255360} {"current_steps": 18840, "total_steps": 23217, "loss": 0.8145, "learning_rate": 4.258121098822945e-06, "epoch": 2.434423052073911, "percentage": 81.15, "elapsed_time": "17:12:33", "remaining_time": "3:59:53", "throughput": "2491.18", "total_tokens": 154337280} {"current_steps": 18850, "total_steps": 23217, "loss": 0.668, "learning_rate": 4.239255407420764e-06, "epoch": 2.4357152086832925, "percentage": 81.19, "elapsed_time": "17:13:26", "remaining_time": "3:59:25", "throughput": "2490.36", "total_tokens": 154419200} {"current_steps": 18860, "total_steps": 23217, "loss": 0.635, "learning_rate": 4.220427728865956e-06, "epoch": 2.4370073652926734, "percentage": 81.23, "elapsed_time": "17:14:19", "remaining_time": "3:58:56", "throughput": "2489.56", "total_tokens": 154501120} {"current_steps": 18870, "total_steps": 23217, "loss": 0.8883, "learning_rate": 4.201638097631938e-06, "epoch": 2.4382995219020547, "percentage": 81.28, "elapsed_time": "17:15:12", "remaining_time": "3:58:28", "throughput": "2488.77", "total_tokens": 154583040} {"current_steps": 18880, "total_steps": 23217, "loss": 0.6052, "learning_rate": 4.182886548122464e-06, "epoch": 2.4395916785114355, "percentage": 81.32, "elapsed_time": "17:16:03", "remaining_time": "3:57:59", "throughput": "2488.05", "total_tokens": 154664960} {"current_steps": 18890, "total_steps": 23217, "loss": 0.5808, "learning_rate": 4.164173114671538e-06, "epoch": 2.4408838351208164, "percentage": 81.36, "elapsed_time": "17:16:53", "remaining_time": "3:57:30", "throughput": "2487.35", "total_tokens": 154746880} {"current_steps": 18900, "total_steps": 23217, "loss": 1.0335, "learning_rate": 4.145497831543402e-06, "epoch": 2.4421759917301977, "percentage": 81.41, "elapsed_time": "17:17:41", "remaining_time": "3:57:01", "throughput": "2486.77", "total_tokens": 154828800} {"current_steps": 18910, "total_steps": 23217, "loss": 0.8685, "learning_rate": 4.1268607329324195e-06, "epoch": 2.4434681483395786, "percentage": 81.45, "elapsed_time": "17:18:32", "remaining_time": "3:56:32", "throughput": "2486.04", "total_tokens": 154910720} {"current_steps": 18920, "total_steps": 23217, "loss": 0.9031, "learning_rate": 4.108261852963061e-06, "epoch": 2.44476030494896, "percentage": 81.49, "elapsed_time": "17:19:25", "remaining_time": "3:56:03", "throughput": "2485.25", "total_tokens": 154992640} {"current_steps": 18930, "total_steps": 23217, "loss": 0.6177, "learning_rate": 4.089701225689793e-06, "epoch": 2.4460524615583408, "percentage": 81.54, "elapsed_time": "17:20:17", "remaining_time": "3:55:35", "throughput": "2484.48", "total_tokens": 155074560} {"current_steps": 18940, "total_steps": 23217, "loss": 0.6072, "learning_rate": 4.071178885097074e-06, "epoch": 2.447344618167722, "percentage": 81.58, "elapsed_time": "17:21:10", "remaining_time": "3:55:06", "throughput": "2483.68", "total_tokens": 155156480} {"current_steps": 18950, "total_steps": 23217, "loss": 0.8248, "learning_rate": 4.052694865099232e-06, "epoch": 2.448636774777103, "percentage": 81.62, "elapsed_time": "17:22:00", "remaining_time": "3:54:37", "throughput": "2483.01", "total_tokens": 155238400} {"current_steps": 18960, "total_steps": 23217, "loss": 0.8951, "learning_rate": 4.034249199540432e-06, "epoch": 2.4499289313864843, "percentage": 81.66, "elapsed_time": "17:22:54", "remaining_time": "3:54:09", "throughput": "2482.18", "total_tokens": 155320320} {"current_steps": 18970, "total_steps": 23217, "loss": 0.6641, "learning_rate": 4.015841922194638e-06, "epoch": 2.451221087995865, "percentage": 81.71, "elapsed_time": "17:23:46", "remaining_time": "3:53:40", "throughput": "2481.40", "total_tokens": 155402240} {"current_steps": 18980, "total_steps": 23217, "loss": 0.3194, "learning_rate": 3.997473066765489e-06, "epoch": 2.452513244605246, "percentage": 81.75, "elapsed_time": "17:24:40", "remaining_time": "3:53:12", "throughput": "2480.59", "total_tokens": 155484160} {"current_steps": 18990, "total_steps": 23217, "loss": 0.8105, "learning_rate": 3.97914266688631e-06, "epoch": 2.4538054012146273, "percentage": 81.79, "elapsed_time": "17:25:44", "remaining_time": "3:52:46", "throughput": "2479.35", "total_tokens": 155566080} {"current_steps": 19000, "total_steps": 23217, "loss": 0.7238, "learning_rate": 3.96085075611998e-06, "epoch": 2.455097557824008, "percentage": 81.84, "elapsed_time": "17:26:32", "remaining_time": "3:52:16", "throughput": "2478.76", "total_tokens": 155648000} {"current_steps": 19010, "total_steps": 23217, "loss": 0.9272, "learning_rate": 3.942597367958928e-06, "epoch": 2.4563897144333895, "percentage": 81.88, "elapsed_time": "17:27:28", "remaining_time": "3:51:48", "throughput": "2477.85", "total_tokens": 155729920} {"current_steps": 19020, "total_steps": 23217, "loss": 0.5264, "learning_rate": 3.924382535825047e-06, "epoch": 2.4576818710427704, "percentage": 81.92, "elapsed_time": "17:28:16", "remaining_time": "3:51:18", "throughput": "2477.29", "total_tokens": 155811840} {"current_steps": 19030, "total_steps": 23217, "loss": 0.8021, "learning_rate": 3.906206293069617e-06, "epoch": 2.4589740276521512, "percentage": 81.97, "elapsed_time": "17:29:03", "remaining_time": "3:50:48", "throughput": "2476.72", "total_tokens": 155893760} {"current_steps": 19040, "total_steps": 23217, "loss": 0.9558, "learning_rate": 3.88806867297328e-06, "epoch": 2.4602661842615325, "percentage": 82.01, "elapsed_time": "17:29:50", "remaining_time": "3:50:18", "throughput": "2476.16", "total_tokens": 155975680} {"current_steps": 19050, "total_steps": 23217, "loss": 1.0861, "learning_rate": 3.869969708745946e-06, "epoch": 2.4615583408709134, "percentage": 82.05, "elapsed_time": "17:30:38", "remaining_time": "3:49:49", "throughput": "2475.60", "total_tokens": 156057600} {"current_steps": 19060, "total_steps": 23217, "loss": 0.9696, "learning_rate": 3.85190943352676e-06, "epoch": 2.4628504974802947, "percentage": 82.1, "elapsed_time": "17:31:25", "remaining_time": "3:49:19", "throughput": "2475.03", "total_tokens": 156139520} {"current_steps": 19070, "total_steps": 23217, "loss": 0.7405, "learning_rate": 3.833887880384007e-06, "epoch": 2.4641426540896756, "percentage": 82.14, "elapsed_time": "17:32:13", "remaining_time": "3:48:49", "throughput": "2474.46", "total_tokens": 156221440} {"current_steps": 19080, "total_steps": 23217, "loss": 0.6941, "learning_rate": 3.815905082315102e-06, "epoch": 2.465434810699057, "percentage": 82.18, "elapsed_time": "17:33:01", "remaining_time": "3:48:19", "throughput": "2473.89", "total_tokens": 156303360} {"current_steps": 19090, "total_steps": 23217, "loss": 0.472, "learning_rate": 3.7979610722464643e-06, "epoch": 2.4667269673084378, "percentage": 82.22, "elapsed_time": "17:33:48", "remaining_time": "3:47:49", "throughput": "2473.32", "total_tokens": 156385280} {"current_steps": 19100, "total_steps": 23217, "loss": 1.1217, "learning_rate": 3.780055883033523e-06, "epoch": 2.468019123917819, "percentage": 82.27, "elapsed_time": "17:34:36", "remaining_time": "3:47:19", "throughput": "2472.75", "total_tokens": 156467200} {"current_steps": 19110, "total_steps": 23217, "loss": 0.7157, "learning_rate": 3.762189547460615e-06, "epoch": 2.4693112805272, "percentage": 82.31, "elapsed_time": "17:35:23", "remaining_time": "3:46:49", "throughput": "2472.20", "total_tokens": 156549120} {"current_steps": 19120, "total_steps": 23217, "loss": 0.9332, "learning_rate": 3.7443620982409305e-06, "epoch": 2.470603437136581, "percentage": 82.35, "elapsed_time": "17:36:11", "remaining_time": "3:46:19", "throughput": "2471.64", "total_tokens": 156631040} {"current_steps": 19130, "total_steps": 23217, "loss": 0.5993, "learning_rate": 3.7265735680164615e-06, "epoch": 2.471895593745962, "percentage": 82.4, "elapsed_time": "17:36:58", "remaining_time": "3:45:48", "throughput": "2471.09", "total_tokens": 156712960} {"current_steps": 19140, "total_steps": 23217, "loss": 0.8641, "learning_rate": 3.7088239893579456e-06, "epoch": 2.473187750355343, "percentage": 82.44, "elapsed_time": "17:37:46", "remaining_time": "3:45:18", "throughput": "2470.53", "total_tokens": 156794880} {"current_steps": 19150, "total_steps": 23217, "loss": 0.5555, "learning_rate": 3.6911133947648002e-06, "epoch": 2.4744799069647243, "percentage": 82.48, "elapsed_time": "17:38:33", "remaining_time": "3:44:48", "throughput": "2469.96", "total_tokens": 156876800} {"current_steps": 19160, "total_steps": 23217, "loss": 0.7846, "learning_rate": 3.6734418166650436e-06, "epoch": 2.475772063574105, "percentage": 82.53, "elapsed_time": "17:39:23", "remaining_time": "3:44:19", "throughput": "2469.31", "total_tokens": 156958720} {"current_steps": 19170, "total_steps": 23217, "loss": 0.7447, "learning_rate": 3.655809287415285e-06, "epoch": 2.477064220183486, "percentage": 82.57, "elapsed_time": "17:40:17", "remaining_time": "3:43:50", "throughput": "2468.51", "total_tokens": 157040640} {"current_steps": 19180, "total_steps": 23217, "loss": 0.8456, "learning_rate": 3.638215839300624e-06, "epoch": 2.4783563767928674, "percentage": 82.61, "elapsed_time": "17:41:11", "remaining_time": "3:43:21", "throughput": "2467.71", "total_tokens": 157122560} {"current_steps": 19190, "total_steps": 23217, "loss": 0.9318, "learning_rate": 3.6206615045345837e-06, "epoch": 2.4796485334022482, "percentage": 82.65, "elapsed_time": "17:42:07", "remaining_time": "3:42:53", "throughput": "2466.82", "total_tokens": 157204480} {"current_steps": 19200, "total_steps": 23217, "loss": 1.074, "learning_rate": 3.603146315259104e-06, "epoch": 2.4809406900116295, "percentage": 82.7, "elapsed_time": "17:43:11", "remaining_time": "3:42:26", "throughput": "2465.63", "total_tokens": 157286400} {"current_steps": 19210, "total_steps": 23217, "loss": 0.6913, "learning_rate": 3.5856703035444196e-06, "epoch": 2.4822328466210104, "percentage": 82.74, "elapsed_time": "17:44:15", "remaining_time": "3:41:59", "throughput": "2464.45", "total_tokens": 157368320} {"current_steps": 19220, "total_steps": 23217, "loss": 0.7036, "learning_rate": 3.568233501389054e-06, "epoch": 2.4835250032303917, "percentage": 82.78, "elapsed_time": "17:45:14", "remaining_time": "3:41:31", "throughput": "2463.44", "total_tokens": 157450240} {"current_steps": 19230, "total_steps": 23217, "loss": 0.7991, "learning_rate": 3.5508359407197157e-06, "epoch": 2.4848171598397726, "percentage": 82.83, "elapsed_time": "17:46:14", "remaining_time": "3:41:04", "throughput": "2462.40", "total_tokens": 157532160} {"current_steps": 19240, "total_steps": 23217, "loss": 0.6216, "learning_rate": 3.5334776533912846e-06, "epoch": 2.4861093164491535, "percentage": 82.87, "elapsed_time": "17:47:21", "remaining_time": "3:40:37", "throughput": "2461.14", "total_tokens": 157614080} {"current_steps": 19250, "total_steps": 23217, "loss": 0.9294, "learning_rate": 3.516158671186723e-06, "epoch": 2.4874014730585348, "percentage": 82.91, "elapsed_time": "17:48:18", "remaining_time": "3:40:09", "throughput": "2460.20", "total_tokens": 157696000} {"current_steps": 19260, "total_steps": 23217, "loss": 0.8402, "learning_rate": 3.4988790258170146e-06, "epoch": 2.4886936296679156, "percentage": 82.96, "elapsed_time": "17:49:13", "remaining_time": "3:39:40", "throughput": "2459.39", "total_tokens": 157777920} {"current_steps": 19270, "total_steps": 23217, "loss": 0.8772, "learning_rate": 3.481638748921137e-06, "epoch": 2.489985786277297, "percentage": 83.0, "elapsed_time": "17:50:06", "remaining_time": "3:39:11", "throughput": "2458.62", "total_tokens": 157859840} {"current_steps": 19280, "total_steps": 23217, "loss": 0.5995, "learning_rate": 3.4644378720659648e-06, "epoch": 2.491277942886678, "percentage": 83.04, "elapsed_time": "17:50:59", "remaining_time": "3:38:41", "throughput": "2457.88", "total_tokens": 157941760} {"current_steps": 19290, "total_steps": 23217, "loss": 0.8775, "learning_rate": 3.4472764267462486e-06, "epoch": 2.492570099496059, "percentage": 83.09, "elapsed_time": "17:51:52", "remaining_time": "3:38:12", "throughput": "2457.14", "total_tokens": 158023680} {"current_steps": 19300, "total_steps": 23217, "loss": 0.827, "learning_rate": 3.430154444384523e-06, "epoch": 2.49386225610544, "percentage": 83.13, "elapsed_time": "17:52:44", "remaining_time": "3:37:42", "throughput": "2456.41", "total_tokens": 158105600} {"current_steps": 19310, "total_steps": 23217, "loss": 0.6568, "learning_rate": 3.4130719563310877e-06, "epoch": 2.495154412714821, "percentage": 83.17, "elapsed_time": "17:53:37", "remaining_time": "3:37:13", "throughput": "2455.65", "total_tokens": 158187520} {"current_steps": 19320, "total_steps": 23217, "loss": 0.8331, "learning_rate": 3.396028993863906e-06, "epoch": 2.496446569324202, "percentage": 83.21, "elapsed_time": "17:54:32", "remaining_time": "3:36:44", "throughput": "2454.84", "total_tokens": 158269440} {"current_steps": 19330, "total_steps": 23217, "loss": 0.6592, "learning_rate": 3.379025588188578e-06, "epoch": 2.497738725933583, "percentage": 83.26, "elapsed_time": "17:55:27", "remaining_time": "3:36:15", "throughput": "2454.01", "total_tokens": 158351360} {"current_steps": 19340, "total_steps": 23217, "loss": 0.9447, "learning_rate": 3.362061770438285e-06, "epoch": 2.4990308825429643, "percentage": 83.3, "elapsed_time": "17:56:20", "remaining_time": "3:35:46", "throughput": "2453.28", "total_tokens": 158433280} {"current_steps": 19350, "total_steps": 23217, "loss": 0.4547, "learning_rate": 3.3451375716737067e-06, "epoch": 2.500323039152345, "percentage": 83.34, "elapsed_time": "17:57:18", "remaining_time": "3:35:17", "throughput": "2452.32", "total_tokens": 158515200} {"current_steps": 19360, "total_steps": 23217, "loss": 0.8312, "learning_rate": 3.328253022883002e-06, "epoch": 2.501615195761726, "percentage": 83.39, "elapsed_time": "17:58:16", "remaining_time": "3:34:49", "throughput": "2451.39", "total_tokens": 158597120} {"current_steps": 19370, "total_steps": 23217, "loss": 0.744, "learning_rate": 3.3114081549817018e-06, "epoch": 2.5029073523711074, "percentage": 83.43, "elapsed_time": "17:59:12", "remaining_time": "3:34:20", "throughput": "2450.54", "total_tokens": 158679040} {"current_steps": 19380, "total_steps": 23217, "loss": 0.6551, "learning_rate": 3.2946029988127068e-06, "epoch": 2.5041995089804887, "percentage": 83.47, "elapsed_time": "18:00:04", "remaining_time": "3:33:50", "throughput": "2449.83", "total_tokens": 158760960} {"current_steps": 19390, "total_steps": 23217, "loss": 1.1236, "learning_rate": 3.2778375851462013e-06, "epoch": 2.5054916655898696, "percentage": 83.52, "elapsed_time": "18:00:58", "remaining_time": "3:33:21", "throughput": "2449.05", "total_tokens": 158842880} {"current_steps": 19400, "total_steps": 23217, "loss": 0.7408, "learning_rate": 3.2611119446795844e-06, "epoch": 2.5067838221992504, "percentage": 83.56, "elapsed_time": "18:01:53", "remaining_time": "3:32:51", "throughput": "2448.25", "total_tokens": 158924800} {"current_steps": 19410, "total_steps": 23217, "loss": 0.8042, "learning_rate": 3.2444261080374546e-06, "epoch": 2.5080759788086318, "percentage": 83.6, "elapsed_time": "18:02:47", "remaining_time": "3:32:22", "throughput": "2447.47", "total_tokens": 159006720} {"current_steps": 19420, "total_steps": 23217, "loss": 0.7672, "learning_rate": 3.227780105771505e-06, "epoch": 2.5093681354180126, "percentage": 83.65, "elapsed_time": "18:03:47", "remaining_time": "3:31:54", "throughput": "2446.48", "total_tokens": 159088640} {"current_steps": 19430, "total_steps": 23217, "loss": 0.9146, "learning_rate": 3.2111739683605204e-06, "epoch": 2.510660292027394, "percentage": 83.69, "elapsed_time": "18:04:39", "remaining_time": "3:31:24", "throughput": "2445.77", "total_tokens": 159170560} {"current_steps": 19440, "total_steps": 23217, "loss": 0.8129, "learning_rate": 3.194607726210261e-06, "epoch": 2.511952448636775, "percentage": 83.73, "elapsed_time": "18:05:34", "remaining_time": "3:30:55", "throughput": "2444.97", "total_tokens": 159252480} {"current_steps": 19450, "total_steps": 23217, "loss": 0.6187, "learning_rate": 3.178081409653469e-06, "epoch": 2.5132446052461557, "percentage": 83.77, "elapsed_time": "18:06:29", "remaining_time": "3:30:25", "throughput": "2444.17", "total_tokens": 159334400} {"current_steps": 19460, "total_steps": 23217, "loss": 0.7696, "learning_rate": 3.1615950489497587e-06, "epoch": 2.514536761855537, "percentage": 83.82, "elapsed_time": "18:07:30", "remaining_time": "3:29:57", "throughput": "2443.13", "total_tokens": 159416320} {"current_steps": 19470, "total_steps": 23217, "loss": 0.8106, "learning_rate": 3.1451486742856055e-06, "epoch": 2.515828918464918, "percentage": 83.86, "elapsed_time": "18:08:34", "remaining_time": "3:29:29", "throughput": "2442.02", "total_tokens": 159498240} {"current_steps": 19480, "total_steps": 23217, "loss": 0.8289, "learning_rate": 3.128742315774255e-06, "epoch": 2.517121075074299, "percentage": 83.9, "elapsed_time": "18:09:22", "remaining_time": "3:28:58", "throughput": "2441.48", "total_tokens": 159580160} {"current_steps": 19490, "total_steps": 23217, "loss": 0.4341, "learning_rate": 3.1123760034556943e-06, "epoch": 2.51841323168368, "percentage": 83.95, "elapsed_time": "18:10:10", "remaining_time": "3:28:28", "throughput": "2440.94", "total_tokens": 159662080} {"current_steps": 19500, "total_steps": 23217, "loss": 0.7386, "learning_rate": 3.0960497672965825e-06, "epoch": 2.519705388293061, "percentage": 83.99, "elapsed_time": "18:10:58", "remaining_time": "3:27:57", "throughput": "2440.40", "total_tokens": 159744000} {"current_steps": 19510, "total_steps": 23217, "loss": 0.6727, "learning_rate": 3.0797636371901863e-06, "epoch": 2.520997544902442, "percentage": 84.03, "elapsed_time": "18:11:46", "remaining_time": "3:27:26", "throughput": "2439.86", "total_tokens": 159825920} {"current_steps": 19520, "total_steps": 23217, "loss": 0.8113, "learning_rate": 3.063517642956365e-06, "epoch": 2.522289701511823, "percentage": 84.08, "elapsed_time": "18:12:34", "remaining_time": "3:26:55", "throughput": "2439.33", "total_tokens": 159907840} {"current_steps": 19530, "total_steps": 23217, "loss": 0.793, "learning_rate": 3.0473118143414634e-06, "epoch": 2.5235818581212044, "percentage": 84.12, "elapsed_time": "18:13:21", "remaining_time": "3:26:24", "throughput": "2438.80", "total_tokens": 159989760} {"current_steps": 19540, "total_steps": 23217, "loss": 0.8666, "learning_rate": 3.031146181018299e-06, "epoch": 2.5248740147305853, "percentage": 84.16, "elapsed_time": "18:14:09", "remaining_time": "3:25:53", "throughput": "2438.28", "total_tokens": 160071680} {"current_steps": 19550, "total_steps": 23217, "loss": 0.6603, "learning_rate": 3.0150207725860912e-06, "epoch": 2.526166171339966, "percentage": 84.21, "elapsed_time": "18:14:57", "remaining_time": "3:25:22", "throughput": "2437.76", "total_tokens": 160153600} {"current_steps": 19560, "total_steps": 23217, "loss": 0.6602, "learning_rate": 2.9989356185703975e-06, "epoch": 2.5274583279493474, "percentage": 84.25, "elapsed_time": "18:15:45", "remaining_time": "3:24:51", "throughput": "2437.22", "total_tokens": 160235520} {"current_steps": 19570, "total_steps": 23217, "loss": 0.4753, "learning_rate": 2.982890748423084e-06, "epoch": 2.5287504845587288, "percentage": 84.29, "elapsed_time": "18:16:33", "remaining_time": "3:24:21", "throughput": "2436.68", "total_tokens": 160317440} {"current_steps": 19580, "total_steps": 23217, "loss": 0.9147, "learning_rate": 2.9668861915222364e-06, "epoch": 2.5300426411681096, "percentage": 84.33, "elapsed_time": "18:17:21", "remaining_time": "3:23:50", "throughput": "2436.15", "total_tokens": 160399360} {"current_steps": 19590, "total_steps": 23217, "loss": 0.9882, "learning_rate": 2.950921977172155e-06, "epoch": 2.5313347977774905, "percentage": 84.38, "elapsed_time": "18:18:09", "remaining_time": "3:23:19", "throughput": "2435.61", "total_tokens": 160481280} {"current_steps": 19600, "total_steps": 23217, "loss": 0.5187, "learning_rate": 2.934998134603245e-06, "epoch": 2.532626954386872, "percentage": 84.42, "elapsed_time": "18:18:57", "remaining_time": "3:22:48", "throughput": "2435.06", "total_tokens": 160563200} {"current_steps": 19610, "total_steps": 23217, "loss": 0.7276, "learning_rate": 2.919114692972008e-06, "epoch": 2.5339191109962527, "percentage": 84.46, "elapsed_time": "18:19:45", "remaining_time": "3:22:17", "throughput": "2434.54", "total_tokens": 160645120} {"current_steps": 19620, "total_steps": 23217, "loss": 0.6929, "learning_rate": 2.9032716813609723e-06, "epoch": 2.535211267605634, "percentage": 84.51, "elapsed_time": "18:20:34", "remaining_time": "3:21:46", "throughput": "2434.00", "total_tokens": 160727040} {"current_steps": 19630, "total_steps": 23217, "loss": 0.5275, "learning_rate": 2.8874691287786275e-06, "epoch": 2.536503424215015, "percentage": 84.55, "elapsed_time": "18:21:22", "remaining_time": "3:21:15", "throughput": "2433.46", "total_tokens": 160808960} {"current_steps": 19640, "total_steps": 23217, "loss": 0.6655, "learning_rate": 2.8717070641593987e-06, "epoch": 2.5377955808243957, "percentage": 84.59, "elapsed_time": "18:22:10", "remaining_time": "3:20:44", "throughput": "2432.93", "total_tokens": 160890880} {"current_steps": 19650, "total_steps": 23217, "loss": 0.6951, "learning_rate": 2.8559855163635544e-06, "epoch": 2.539087737433777, "percentage": 84.64, "elapsed_time": "18:22:58", "remaining_time": "3:20:13", "throughput": "2432.40", "total_tokens": 160972800} {"current_steps": 19660, "total_steps": 23217, "loss": 0.6766, "learning_rate": 2.8403045141772054e-06, "epoch": 2.540379894043158, "percentage": 84.68, "elapsed_time": "18:23:46", "remaining_time": "3:19:42", "throughput": "2431.88", "total_tokens": 161054720} {"current_steps": 19670, "total_steps": 23217, "loss": 0.7144, "learning_rate": 2.824664086312204e-06, "epoch": 2.541672050652539, "percentage": 84.72, "elapsed_time": "18:24:34", "remaining_time": "3:19:11", "throughput": "2431.33", "total_tokens": 161136640} {"current_steps": 19680, "total_steps": 23217, "loss": 0.8016, "learning_rate": 2.809064261406111e-06, "epoch": 2.54296420726192, "percentage": 84.77, "elapsed_time": "18:25:23", "remaining_time": "3:18:40", "throughput": "2430.80", "total_tokens": 161218560} {"current_steps": 19690, "total_steps": 23217, "loss": 0.808, "learning_rate": 2.7935050680221565e-06, "epoch": 2.544256363871301, "percentage": 84.81, "elapsed_time": "18:26:11", "remaining_time": "3:18:08", "throughput": "2430.26", "total_tokens": 161300480} {"current_steps": 19700, "total_steps": 23217, "loss": 0.6117, "learning_rate": 2.7779865346491576e-06, "epoch": 2.5455485204806823, "percentage": 84.85, "elapsed_time": "18:26:59", "remaining_time": "3:17:37", "throughput": "2429.73", "total_tokens": 161382400} {"current_steps": 19710, "total_steps": 23217, "loss": 0.8894, "learning_rate": 2.762508689701504e-06, "epoch": 2.5468406770900636, "percentage": 84.89, "elapsed_time": "18:27:47", "remaining_time": "3:17:06", "throughput": "2429.21", "total_tokens": 161464320} {"current_steps": 19720, "total_steps": 23217, "loss": 0.9919, "learning_rate": 2.74707156151906e-06, "epoch": 2.5481328336994444, "percentage": 84.94, "elapsed_time": "18:28:36", "remaining_time": "3:16:35", "throughput": "2428.67", "total_tokens": 161546240} {"current_steps": 19730, "total_steps": 23217, "loss": 1.0815, "learning_rate": 2.7316751783671655e-06, "epoch": 2.5494249903088253, "percentage": 84.98, "elapsed_time": "18:29:24", "remaining_time": "3:16:04", "throughput": "2428.13", "total_tokens": 161628160} {"current_steps": 19740, "total_steps": 23217, "loss": 0.9753, "learning_rate": 2.716319568436529e-06, "epoch": 2.5507171469182066, "percentage": 85.02, "elapsed_time": "18:30:12", "remaining_time": "3:15:33", "throughput": "2427.61", "total_tokens": 161710080} {"current_steps": 19750, "total_steps": 23217, "loss": 1.0534, "learning_rate": 2.7010047598432205e-06, "epoch": 2.5520093035275875, "percentage": 85.07, "elapsed_time": "18:31:00", "remaining_time": "3:15:01", "throughput": "2427.09", "total_tokens": 161792000} {"current_steps": 19760, "total_steps": 23217, "loss": 0.5268, "learning_rate": 2.6857307806286037e-06, "epoch": 2.553301460136969, "percentage": 85.11, "elapsed_time": "18:31:49", "remaining_time": "3:14:30", "throughput": "2426.56", "total_tokens": 161873920} {"current_steps": 19770, "total_steps": 23217, "loss": 0.7309, "learning_rate": 2.6704976587592688e-06, "epoch": 2.5545936167463497, "percentage": 85.15, "elapsed_time": "18:32:37", "remaining_time": "3:13:59", "throughput": "2426.02", "total_tokens": 161955840} {"current_steps": 19780, "total_steps": 23217, "loss": 0.9389, "learning_rate": 2.655305422127016e-06, "epoch": 2.5558857733557305, "percentage": 85.2, "elapsed_time": "18:33:26", "remaining_time": "3:13:28", "throughput": "2425.49", "total_tokens": 162037760} {"current_steps": 19790, "total_steps": 23217, "loss": 0.6891, "learning_rate": 2.6401540985487667e-06, "epoch": 2.557177929965112, "percentage": 85.24, "elapsed_time": "18:34:14", "remaining_time": "3:12:57", "throughput": "2424.97", "total_tokens": 162119680} {"current_steps": 19800, "total_steps": 23217, "loss": 0.6537, "learning_rate": 2.6250437157665455e-06, "epoch": 2.5584700865744927, "percentage": 85.28, "elapsed_time": "18:35:03", "remaining_time": "3:12:25", "throughput": "2424.42", "total_tokens": 162201600} {"current_steps": 19810, "total_steps": 23217, "loss": 0.7283, "learning_rate": 2.6099743014474014e-06, "epoch": 2.559762243183874, "percentage": 85.33, "elapsed_time": "18:35:51", "remaining_time": "3:11:54", "throughput": "2423.89", "total_tokens": 162283520} {"current_steps": 19820, "total_steps": 23217, "loss": 0.6683, "learning_rate": 2.594945883183386e-06, "epoch": 2.561054399793255, "percentage": 85.37, "elapsed_time": "18:36:41", "remaining_time": "3:11:23", "throughput": "2423.33", "total_tokens": 162365440} {"current_steps": 19830, "total_steps": 23217, "loss": 0.855, "learning_rate": 2.5799584884914685e-06, "epoch": 2.5623465564026358, "percentage": 85.41, "elapsed_time": "18:37:30", "remaining_time": "3:10:52", "throughput": "2422.77", "total_tokens": 162447360} {"current_steps": 19840, "total_steps": 23217, "loss": 0.9368, "learning_rate": 2.5650121448135222e-06, "epoch": 2.563638713012017, "percentage": 85.45, "elapsed_time": "18:38:19", "remaining_time": "3:10:21", "throughput": "2422.21", "total_tokens": 162529280} {"current_steps": 19850, "total_steps": 23217, "loss": 0.5496, "learning_rate": 2.550106879516237e-06, "epoch": 2.5649308696213984, "percentage": 85.5, "elapsed_time": "18:39:08", "remaining_time": "3:09:49", "throughput": "2421.67", "total_tokens": 162611200} {"current_steps": 19860, "total_steps": 23217, "loss": 1.0861, "learning_rate": 2.535242719891112e-06, "epoch": 2.5662230262307792, "percentage": 85.54, "elapsed_time": "18:40:01", "remaining_time": "3:09:19", "throughput": "2420.98", "total_tokens": 162693120} {"current_steps": 19870, "total_steps": 23217, "loss": 0.4623, "learning_rate": 2.5204196931543635e-06, "epoch": 2.56751518284016, "percentage": 85.58, "elapsed_time": "18:40:57", "remaining_time": "3:08:49", "throughput": "2420.19", "total_tokens": 162775040} {"current_steps": 19880, "total_steps": 23217, "loss": 1.0828, "learning_rate": 2.505637826446891e-06, "epoch": 2.5688073394495414, "percentage": 85.63, "elapsed_time": "18:41:52", "remaining_time": "3:08:18", "throughput": "2419.43", "total_tokens": 162856960} {"current_steps": 19890, "total_steps": 23217, "loss": 0.8837, "learning_rate": 2.4908971468342535e-06, "epoch": 2.5700994960589223, "percentage": 85.67, "elapsed_time": "18:42:54", "remaining_time": "3:07:49", "throughput": "2418.39", "total_tokens": 162938880} {"current_steps": 19900, "total_steps": 23217, "loss": 0.986, "learning_rate": 2.4761976813065663e-06, "epoch": 2.5713916526683036, "percentage": 85.71, "elapsed_time": "18:43:53", "remaining_time": "3:07:20", "throughput": "2417.51", "total_tokens": 163020800} {"current_steps": 19910, "total_steps": 23217, "loss": 0.9548, "learning_rate": 2.4615394567785055e-06, "epoch": 2.5726838092776845, "percentage": 85.76, "elapsed_time": "18:44:48", "remaining_time": "3:06:49", "throughput": "2416.75", "total_tokens": 163102720} {"current_steps": 19920, "total_steps": 23217, "loss": 1.0377, "learning_rate": 2.44692250008923e-06, "epoch": 2.5739759658870653, "percentage": 85.8, "elapsed_time": "18:45:47", "remaining_time": "3:06:19", "throughput": "2415.85", "total_tokens": 163184640} {"current_steps": 19930, "total_steps": 23217, "loss": 0.8889, "learning_rate": 2.432346838002325e-06, "epoch": 2.5752681224964467, "percentage": 85.84, "elapsed_time": "18:46:41", "remaining_time": "3:05:49", "throughput": "2415.12", "total_tokens": 163266560} {"current_steps": 19940, "total_steps": 23217, "loss": 0.7366, "learning_rate": 2.417812497205782e-06, "epoch": 2.5765602791058275, "percentage": 85.89, "elapsed_time": "18:47:38", "remaining_time": "3:05:19", "throughput": "2414.32", "total_tokens": 163348480} {"current_steps": 19950, "total_steps": 23217, "loss": 0.9359, "learning_rate": 2.403319504311921e-06, "epoch": 2.577852435715209, "percentage": 85.93, "elapsed_time": "18:48:31", "remaining_time": "3:04:48", "throughput": "2413.64", "total_tokens": 163430400} {"current_steps": 19960, "total_steps": 23217, "loss": 1.1218, "learning_rate": 2.3888678858573625e-06, "epoch": 2.5791445923245897, "percentage": 85.97, "elapsed_time": "18:49:36", "remaining_time": "3:04:19", "throughput": "2412.51", "total_tokens": 163512320} {"current_steps": 19970, "total_steps": 23217, "loss": 0.8245, "learning_rate": 2.374457668302962e-06, "epoch": 2.5804367489339706, "percentage": 86.01, "elapsed_time": "18:50:33", "remaining_time": "3:03:49", "throughput": "2411.72", "total_tokens": 163594240} {"current_steps": 19980, "total_steps": 23217, "loss": 1.0923, "learning_rate": 2.360088878033778e-06, "epoch": 2.581728905543352, "percentage": 86.06, "elapsed_time": "18:51:30", "remaining_time": "3:03:19", "throughput": "2410.88", "total_tokens": 163676160} {"current_steps": 19990, "total_steps": 23217, "loss": 1.161, "learning_rate": 2.3457615413590177e-06, "epoch": 2.5830210621527327, "percentage": 86.1, "elapsed_time": "18:52:31", "remaining_time": "3:02:49", "throughput": "2409.92", "total_tokens": 163758080} {"current_steps": 20000, "total_steps": 23217, "loss": 0.9189, "learning_rate": 2.3314756845119746e-06, "epoch": 2.584313218762114, "percentage": 86.14, "elapsed_time": "18:53:28", "remaining_time": "3:02:19", "throughput": "2409.12", "total_tokens": 163840000} {"current_steps": 20010, "total_steps": 23217, "loss": 0.8559, "learning_rate": 2.317231333650005e-06, "epoch": 2.585605375371495, "percentage": 86.19, "elapsed_time": "18:54:31", "remaining_time": "3:01:49", "throughput": "2408.09", "total_tokens": 163921920} {"current_steps": 20020, "total_steps": 23217, "loss": 0.9338, "learning_rate": 2.3030285148544577e-06, "epoch": 2.5868975319808762, "percentage": 86.23, "elapsed_time": "18:55:29", "remaining_time": "3:01:19", "throughput": "2407.22", "total_tokens": 164003840} {"current_steps": 20030, "total_steps": 23217, "loss": 0.7432, "learning_rate": 2.2888672541306525e-06, "epoch": 2.588189688590257, "percentage": 86.27, "elapsed_time": "18:56:23", "remaining_time": "3:00:48", "throughput": "2406.53", "total_tokens": 164085760} {"current_steps": 20040, "total_steps": 23217, "loss": 0.7769, "learning_rate": 2.2747475774077986e-06, "epoch": 2.5894818451996384, "percentage": 86.32, "elapsed_time": "18:57:18", "remaining_time": "3:00:17", "throughput": "2405.81", "total_tokens": 164167680} {"current_steps": 20050, "total_steps": 23217, "loss": 0.8439, "learning_rate": 2.2606695105389653e-06, "epoch": 2.5907740018090193, "percentage": 86.36, "elapsed_time": "18:58:17", "remaining_time": "2:59:48", "throughput": "2404.90", "total_tokens": 164249600} {"current_steps": 20060, "total_steps": 23217, "loss": 0.772, "learning_rate": 2.2466330793010555e-06, "epoch": 2.5920661584184, "percentage": 86.4, "elapsed_time": "18:59:12", "remaining_time": "2:59:17", "throughput": "2404.18", "total_tokens": 164331520} {"current_steps": 20070, "total_steps": 23217, "loss": 0.7069, "learning_rate": 2.2326383093947135e-06, "epoch": 2.5933583150277815, "percentage": 86.45, "elapsed_time": "19:00:03", "remaining_time": "2:58:45", "throughput": "2403.57", "total_tokens": 164413440} {"current_steps": 20080, "total_steps": 23217, "loss": 0.9164, "learning_rate": 2.2186852264443196e-06, "epoch": 2.5946504716371623, "percentage": 86.49, "elapsed_time": "19:00:54", "remaining_time": "2:58:14", "throughput": "2403.00", "total_tokens": 164495360} {"current_steps": 20090, "total_steps": 23217, "loss": 0.8105, "learning_rate": 2.2047738559979104e-06, "epoch": 2.5959426282465436, "percentage": 86.53, "elapsed_time": "19:01:44", "remaining_time": "2:57:42", "throughput": "2402.44", "total_tokens": 164577280} {"current_steps": 20100, "total_steps": 23217, "loss": 1.0952, "learning_rate": 2.1909042235271597e-06, "epoch": 2.5972347848559245, "percentage": 86.57, "elapsed_time": "19:02:37", "remaining_time": "2:57:11", "throughput": "2401.78", "total_tokens": 164659200} {"current_steps": 20110, "total_steps": 23217, "loss": 0.9695, "learning_rate": 2.1770763544273098e-06, "epoch": 2.5985269414653054, "percentage": 86.62, "elapsed_time": "19:03:29", "remaining_time": "2:56:40", "throughput": "2401.14", "total_tokens": 164741120} {"current_steps": 20120, "total_steps": 23217, "loss": 0.8496, "learning_rate": 2.1632902740171378e-06, "epoch": 2.5998190980746867, "percentage": 86.66, "elapsed_time": "19:04:23", "remaining_time": "2:56:09", "throughput": "2400.46", "total_tokens": 164823040} {"current_steps": 20130, "total_steps": 23217, "loss": 0.7883, "learning_rate": 2.1495460075389133e-06, "epoch": 2.6011112546840676, "percentage": 86.7, "elapsed_time": "19:05:16", "remaining_time": "2:55:37", "throughput": "2399.78", "total_tokens": 164904960} {"current_steps": 20140, "total_steps": 23217, "loss": 0.6911, "learning_rate": 2.1358435801583283e-06, "epoch": 2.602403411293449, "percentage": 86.75, "elapsed_time": "19:06:09", "remaining_time": "2:55:06", "throughput": "2399.13", "total_tokens": 164986880} {"current_steps": 20150, "total_steps": 23217, "loss": 0.5446, "learning_rate": 2.122183016964488e-06, "epoch": 2.6036955679028297, "percentage": 86.79, "elapsed_time": "19:07:00", "remaining_time": "2:54:35", "throughput": "2398.53", "total_tokens": 165068800} {"current_steps": 20160, "total_steps": 23217, "loss": 0.7104, "learning_rate": 2.1085643429698236e-06, "epoch": 2.6049877245122106, "percentage": 86.83, "elapsed_time": "19:07:48", "remaining_time": "2:54:02", "throughput": "2398.06", "total_tokens": 165150720} {"current_steps": 20170, "total_steps": 23217, "loss": 0.9044, "learning_rate": 2.094987583110086e-06, "epoch": 2.606279881121592, "percentage": 86.88, "elapsed_time": "19:08:39", "remaining_time": "2:53:31", "throughput": "2397.48", "total_tokens": 165232640} {"current_steps": 20180, "total_steps": 23217, "loss": 0.687, "learning_rate": 2.0814527622442626e-06, "epoch": 2.6075720377309732, "percentage": 86.92, "elapsed_time": "19:09:29", "remaining_time": "2:52:59", "throughput": "2396.94", "total_tokens": 165314560} {"current_steps": 20190, "total_steps": 23217, "loss": 0.791, "learning_rate": 2.067959905154568e-06, "epoch": 2.608864194340354, "percentage": 86.96, "elapsed_time": "19:10:26", "remaining_time": "2:52:28", "throughput": "2396.14", "total_tokens": 165396480} {"current_steps": 20200, "total_steps": 23217, "loss": 0.508, "learning_rate": 2.0545090365463788e-06, "epoch": 2.610156350949735, "percentage": 87.01, "elapsed_time": "19:11:20", "remaining_time": "2:51:57", "throughput": "2395.44", "total_tokens": 165478400} {"current_steps": 20210, "total_steps": 23217, "loss": 0.9302, "learning_rate": 2.041100181048178e-06, "epoch": 2.6114485075591163, "percentage": 87.05, "elapsed_time": "19:12:18", "remaining_time": "2:51:27", "throughput": "2394.61", "total_tokens": 165560320} {"current_steps": 20220, "total_steps": 23217, "loss": 0.7966, "learning_rate": 2.0277333632115288e-06, "epoch": 2.612740664168497, "percentage": 87.09, "elapsed_time": "19:13:16", "remaining_time": "2:50:56", "throughput": "2393.78", "total_tokens": 165642240} {"current_steps": 20230, "total_steps": 23217, "loss": 1.1115, "learning_rate": 2.0144086075110367e-06, "epoch": 2.6140328207778785, "percentage": 87.13, "elapsed_time": "19:14:14", "remaining_time": "2:50:25", "throughput": "2392.99", "total_tokens": 165724160} {"current_steps": 20240, "total_steps": 23217, "loss": 0.6785, "learning_rate": 2.001125938344273e-06, "epoch": 2.6153249773872593, "percentage": 87.18, "elapsed_time": "19:15:09", "remaining_time": "2:49:54", "throughput": "2392.27", "total_tokens": 165806080} {"current_steps": 20250, "total_steps": 23217, "loss": 0.8553, "learning_rate": 1.9878853800317535e-06, "epoch": 2.61661713399664, "percentage": 87.22, "elapsed_time": "19:16:04", "remaining_time": "2:49:23", "throughput": "2391.55", "total_tokens": 165888000} {"current_steps": 20260, "total_steps": 23217, "loss": 0.7277, "learning_rate": 1.9746869568168985e-06, "epoch": 2.6179092906060215, "percentage": 87.26, "elapsed_time": "19:16:56", "remaining_time": "2:48:51", "throughput": "2390.92", "total_tokens": 165969920} {"current_steps": 20270, "total_steps": 23217, "loss": 0.823, "learning_rate": 1.9615306928659677e-06, "epoch": 2.6192014472154024, "percentage": 87.31, "elapsed_time": "19:17:44", "remaining_time": "2:48:19", "throughput": "2390.45", "total_tokens": 166051840} {"current_steps": 20280, "total_steps": 23217, "loss": 0.9189, "learning_rate": 1.948416612268034e-06, "epoch": 2.6204936038247837, "percentage": 87.35, "elapsed_time": "19:18:32", "remaining_time": "2:47:46", "throughput": "2389.99", "total_tokens": 166133760} {"current_steps": 20290, "total_steps": 23217, "loss": 0.8662, "learning_rate": 1.935344739034936e-06, "epoch": 2.6217857604341646, "percentage": 87.39, "elapsed_time": "19:19:19", "remaining_time": "2:47:14", "throughput": "2389.53", "total_tokens": 166215680} {"current_steps": 20300, "total_steps": 23217, "loss": 0.9959, "learning_rate": 1.922315097101218e-06, "epoch": 2.6230779170435454, "percentage": 87.44, "elapsed_time": "19:20:09", "remaining_time": "2:46:42", "throughput": "2389.00", "total_tokens": 166297600} {"current_steps": 20310, "total_steps": 23217, "loss": 0.4612, "learning_rate": 1.909327710324116e-06, "epoch": 2.6243700736529267, "percentage": 87.48, "elapsed_time": "19:21:00", "remaining_time": "2:46:10", "throughput": "2388.42", "total_tokens": 166379520} {"current_steps": 20320, "total_steps": 23217, "loss": 0.9159, "learning_rate": 1.8963826024834734e-06, "epoch": 2.625662230262308, "percentage": 87.52, "elapsed_time": "19:21:52", "remaining_time": "2:45:38", "throughput": "2387.84", "total_tokens": 166461440} {"current_steps": 20330, "total_steps": 23217, "loss": 0.6083, "learning_rate": 1.8834797972817508e-06, "epoch": 2.626954386871689, "percentage": 87.57, "elapsed_time": "19:22:44", "remaining_time": "2:45:07", "throughput": "2387.21", "total_tokens": 166543360} {"current_steps": 20340, "total_steps": 23217, "loss": 0.8399, "learning_rate": 1.8706193183439247e-06, "epoch": 2.62824654348107, "percentage": 87.61, "elapsed_time": "19:23:36", "remaining_time": "2:44:35", "throughput": "2386.61", "total_tokens": 166625280} {"current_steps": 20350, "total_steps": 23217, "loss": 0.4694, "learning_rate": 1.8578011892174924e-06, "epoch": 2.629538700090451, "percentage": 87.65, "elapsed_time": "19:24:29", "remaining_time": "2:44:03", "throughput": "2385.99", "total_tokens": 166707200} {"current_steps": 20360, "total_steps": 23217, "loss": 1.0965, "learning_rate": 1.845025433372402e-06, "epoch": 2.630830856699832, "percentage": 87.69, "elapsed_time": "19:25:21", "remaining_time": "2:43:31", "throughput": "2385.39", "total_tokens": 166789120} {"current_steps": 20370, "total_steps": 23217, "loss": 0.9704, "learning_rate": 1.8322920742010086e-06, "epoch": 2.6321230133092133, "percentage": 87.74, "elapsed_time": "19:26:12", "remaining_time": "2:42:59", "throughput": "2384.81", "total_tokens": 166871040} {"current_steps": 20380, "total_steps": 23217, "loss": 1.1178, "learning_rate": 1.8196011350180563e-06, "epoch": 2.633415169918594, "percentage": 87.78, "elapsed_time": "19:27:03", "remaining_time": "2:42:27", "throughput": "2384.26", "total_tokens": 166952960} {"current_steps": 20390, "total_steps": 23217, "loss": 0.6866, "learning_rate": 1.8069526390605968e-06, "epoch": 2.634707326527975, "percentage": 87.82, "elapsed_time": "19:27:51", "remaining_time": "2:41:55", "throughput": "2383.79", "total_tokens": 167034880} {"current_steps": 20400, "total_steps": 23217, "loss": 0.8549, "learning_rate": 1.7943466094879902e-06, "epoch": 2.6359994831373563, "percentage": 87.87, "elapsed_time": "19:28:41", "remaining_time": "2:41:22", "throughput": "2383.25", "total_tokens": 167116800} {"current_steps": 20410, "total_steps": 23217, "loss": 0.7212, "learning_rate": 1.7817830693818288e-06, "epoch": 2.637291639746737, "percentage": 87.91, "elapsed_time": "19:29:31", "remaining_time": "2:40:50", "throughput": "2382.72", "total_tokens": 167198720} {"current_steps": 20420, "total_steps": 23217, "loss": 0.3765, "learning_rate": 1.7692620417459004e-06, "epoch": 2.6385837963561185, "percentage": 87.95, "elapsed_time": "19:30:20", "remaining_time": "2:40:18", "throughput": "2382.22", "total_tokens": 167280640} {"current_steps": 20430, "total_steps": 23217, "loss": 0.9786, "learning_rate": 1.7567835495061718e-06, "epoch": 2.6398759529654994, "percentage": 88.0, "elapsed_time": "19:31:11", "remaining_time": "2:39:46", "throughput": "2381.67", "total_tokens": 167362560} {"current_steps": 20440, "total_steps": 23217, "loss": 0.8443, "learning_rate": 1.7443476155107052e-06, "epoch": 2.6411681095748802, "percentage": 88.04, "elapsed_time": "19:31:59", "remaining_time": "2:39:13", "throughput": "2381.19", "total_tokens": 167444480} {"current_steps": 20450, "total_steps": 23217, "loss": 0.9905, "learning_rate": 1.7319542625296613e-06, "epoch": 2.6424602661842616, "percentage": 88.08, "elapsed_time": "19:32:53", "remaining_time": "2:38:41", "throughput": "2380.52", "total_tokens": 167526400} {"current_steps": 20460, "total_steps": 23217, "loss": 0.7714, "learning_rate": 1.7196035132552135e-06, "epoch": 2.643752422793643, "percentage": 88.13, "elapsed_time": "19:33:44", "remaining_time": "2:38:09", "throughput": "2379.96", "total_tokens": 167608320} {"current_steps": 20470, "total_steps": 23217, "loss": 0.9703, "learning_rate": 1.7072953903015498e-06, "epoch": 2.6450445794030237, "percentage": 88.17, "elapsed_time": "19:34:33", "remaining_time": "2:37:37", "throughput": "2379.49", "total_tokens": 167690240} {"current_steps": 20480, "total_steps": 23217, "loss": 0.7194, "learning_rate": 1.6950299162047878e-06, "epoch": 2.6463367360124046, "percentage": 88.21, "elapsed_time": "19:35:23", "remaining_time": "2:37:04", "throughput": "2378.95", "total_tokens": 167772160} {"current_steps": 20490, "total_steps": 23217, "loss": 0.7812, "learning_rate": 1.682807113422971e-06, "epoch": 2.647628892621786, "percentage": 88.25, "elapsed_time": "19:36:15", "remaining_time": "2:36:32", "throughput": "2378.36", "total_tokens": 167854080} {"current_steps": 20500, "total_steps": 23217, "loss": 0.6726, "learning_rate": 1.6706270043360117e-06, "epoch": 2.648921049231167, "percentage": 88.3, "elapsed_time": "19:37:10", "remaining_time": "2:36:01", "throughput": "2377.67", "total_tokens": 167936000} {"current_steps": 20510, "total_steps": 23217, "loss": 0.921, "learning_rate": 1.6584896112456338e-06, "epoch": 2.650213205840548, "percentage": 88.34, "elapsed_time": "19:38:00", "remaining_time": "2:35:28", "throughput": "2377.14", "total_tokens": 168017920} {"current_steps": 20520, "total_steps": 23217, "loss": 0.8371, "learning_rate": 1.646394956375369e-06, "epoch": 2.651505362449929, "percentage": 88.38, "elapsed_time": "19:38:49", "remaining_time": "2:34:56", "throughput": "2376.67", "total_tokens": 168099840} {"current_steps": 20530, "total_steps": 23217, "loss": 0.6175, "learning_rate": 1.6343430618704775e-06, "epoch": 2.65279751905931, "percentage": 88.43, "elapsed_time": "19:39:38", "remaining_time": "2:34:23", "throughput": "2376.18", "total_tokens": 168181760} {"current_steps": 20540, "total_steps": 23217, "loss": 0.6474, "learning_rate": 1.622333949797944e-06, "epoch": 2.654089675668691, "percentage": 88.47, "elapsed_time": "19:40:25", "remaining_time": "2:33:50", "throughput": "2375.74", "total_tokens": 168263680} {"current_steps": 20550, "total_steps": 23217, "loss": 0.6756, "learning_rate": 1.6103676421463986e-06, "epoch": 2.655381832278072, "percentage": 88.51, "elapsed_time": "19:41:14", "remaining_time": "2:33:18", "throughput": "2375.27", "total_tokens": 168345600} {"current_steps": 20560, "total_steps": 23217, "loss": 0.8549, "learning_rate": 1.5984441608261152e-06, "epoch": 2.6566739888874533, "percentage": 88.56, "elapsed_time": "19:42:08", "remaining_time": "2:32:46", "throughput": "2374.60", "total_tokens": 168427520} {"current_steps": 20570, "total_steps": 23217, "loss": 0.6964, "learning_rate": 1.5865635276689412e-06, "epoch": 2.657966145496834, "percentage": 88.6, "elapsed_time": "19:42:58", "remaining_time": "2:32:13", "throughput": "2374.09", "total_tokens": 168509440} {"current_steps": 20580, "total_steps": 23217, "loss": 0.8505, "learning_rate": 1.5747257644282726e-06, "epoch": 2.659258302106215, "percentage": 88.64, "elapsed_time": "19:43:53", "remaining_time": "2:31:41", "throughput": "2373.42", "total_tokens": 168591360} {"current_steps": 20590, "total_steps": 23217, "loss": 0.4486, "learning_rate": 1.5629308927790077e-06, "epoch": 2.6605504587155964, "percentage": 88.69, "elapsed_time": "19:44:43", "remaining_time": "2:31:09", "throughput": "2372.87", "total_tokens": 168673280} {"current_steps": 20600, "total_steps": 23217, "loss": 0.7925, "learning_rate": 1.551178934317521e-06, "epoch": 2.6618426153249772, "percentage": 88.73, "elapsed_time": "19:45:33", "remaining_time": "2:30:36", "throughput": "2372.38", "total_tokens": 168755200} {"current_steps": 20610, "total_steps": 23217, "loss": 0.9941, "learning_rate": 1.5394699105616002e-06, "epoch": 2.6631347719343585, "percentage": 88.77, "elapsed_time": "19:46:21", "remaining_time": "2:30:03", "throughput": "2371.94", "total_tokens": 168837120} {"current_steps": 20620, "total_steps": 23217, "loss": 0.8127, "learning_rate": 1.5278038429504177e-06, "epoch": 2.6644269285437394, "percentage": 88.81, "elapsed_time": "19:47:11", "remaining_time": "2:29:31", "throughput": "2371.42", "total_tokens": 168919040} {"current_steps": 20630, "total_steps": 23217, "loss": 0.3516, "learning_rate": 1.516180752844515e-06, "epoch": 2.6657190851531203, "percentage": 88.86, "elapsed_time": "19:48:00", "remaining_time": "2:28:58", "throughput": "2370.92", "total_tokens": 169000960} {"current_steps": 20640, "total_steps": 23217, "loss": 0.7978, "learning_rate": 1.504600661525718e-06, "epoch": 2.6670112417625016, "percentage": 88.9, "elapsed_time": "19:48:52", "remaining_time": "2:28:26", "throughput": "2370.36", "total_tokens": 169082880} {"current_steps": 20650, "total_steps": 23217, "loss": 0.6851, "learning_rate": 1.493063590197133e-06, "epoch": 2.668303398371883, "percentage": 88.94, "elapsed_time": "19:49:41", "remaining_time": "2:27:53", "throughput": "2369.87", "total_tokens": 169164800} {"current_steps": 20660, "total_steps": 23217, "loss": 1.0456, "learning_rate": 1.4815695599830981e-06, "epoch": 2.6695955549812638, "percentage": 88.99, "elapsed_time": "19:50:32", "remaining_time": "2:27:20", "throughput": "2369.33", "total_tokens": 169246720} {"current_steps": 20670, "total_steps": 23217, "loss": 0.7482, "learning_rate": 1.4701185919291372e-06, "epoch": 2.6708877115906446, "percentage": 89.03, "elapsed_time": "19:51:22", "remaining_time": "2:26:48", "throughput": "2368.81", "total_tokens": 169328640} {"current_steps": 20680, "total_steps": 23217, "loss": 0.8197, "learning_rate": 1.4587107070019368e-06, "epoch": 2.672179868200026, "percentage": 89.07, "elapsed_time": "19:52:13", "remaining_time": "2:26:15", "throughput": "2368.27", "total_tokens": 169410560} {"current_steps": 20690, "total_steps": 23217, "loss": 0.8722, "learning_rate": 1.447345926089283e-06, "epoch": 2.673472024809407, "percentage": 89.12, "elapsed_time": "19:53:11", "remaining_time": "2:25:43", "throughput": "2367.50", "total_tokens": 169492480} {"current_steps": 20700, "total_steps": 23217, "loss": 0.9786, "learning_rate": 1.436024270000058e-06, "epoch": 2.674764181418788, "percentage": 89.16, "elapsed_time": "19:54:04", "remaining_time": "2:25:11", "throughput": "2366.89", "total_tokens": 169574400} {"current_steps": 20710, "total_steps": 23217, "loss": 0.8513, "learning_rate": 1.4247457594641662e-06, "epoch": 2.676056338028169, "percentage": 89.2, "elapsed_time": "19:54:55", "remaining_time": "2:24:38", "throughput": "2366.35", "total_tokens": 169656320} {"current_steps": 20720, "total_steps": 23217, "loss": 0.8101, "learning_rate": 1.4135104151325184e-06, "epoch": 2.67734849463755, "percentage": 89.24, "elapsed_time": "19:55:45", "remaining_time": "2:24:06", "throughput": "2365.84", "total_tokens": 169738240} {"current_steps": 20730, "total_steps": 23217, "loss": 0.5225, "learning_rate": 1.4023182575769956e-06, "epoch": 2.678640651246931, "percentage": 89.29, "elapsed_time": "19:56:36", "remaining_time": "2:23:33", "throughput": "2365.30", "total_tokens": 169820160} {"current_steps": 20740, "total_steps": 23217, "loss": 0.7088, "learning_rate": 1.391169307290391e-06, "epoch": 2.679932807856312, "percentage": 89.33, "elapsed_time": "19:57:25", "remaining_time": "2:23:00", "throughput": "2364.83", "total_tokens": 169902080} {"current_steps": 20750, "total_steps": 23217, "loss": 0.9884, "learning_rate": 1.3800635846863973e-06, "epoch": 2.6812249644656934, "percentage": 89.37, "elapsed_time": "19:58:13", "remaining_time": "2:22:27", "throughput": "2364.40", "total_tokens": 169984000} {"current_steps": 20760, "total_steps": 23217, "loss": 1.097, "learning_rate": 1.3690011100995437e-06, "epoch": 2.6825171210750742, "percentage": 89.42, "elapsed_time": "19:59:02", "remaining_time": "2:21:54", "throughput": "2363.92", "total_tokens": 170065920} {"current_steps": 20770, "total_steps": 23217, "loss": 0.7501, "learning_rate": 1.357981903785191e-06, "epoch": 2.683809277684455, "percentage": 89.46, "elapsed_time": "19:59:52", "remaining_time": "2:21:21", "throughput": "2363.41", "total_tokens": 170147840} {"current_steps": 20780, "total_steps": 23217, "loss": 0.9277, "learning_rate": 1.3470059859194583e-06, "epoch": 2.6851014342938364, "percentage": 89.5, "elapsed_time": "20:00:43", "remaining_time": "2:20:48", "throughput": "2362.88", "total_tokens": 170229760} {"current_steps": 20790, "total_steps": 23217, "loss": 0.6113, "learning_rate": 1.3360733765992116e-06, "epoch": 2.6863935909032177, "percentage": 89.55, "elapsed_time": "20:01:32", "remaining_time": "2:20:15", "throughput": "2362.41", "total_tokens": 170311680} {"current_steps": 20800, "total_steps": 23217, "loss": 0.7514, "learning_rate": 1.325184095842022e-06, "epoch": 2.6876857475125986, "percentage": 89.59, "elapsed_time": "20:02:22", "remaining_time": "2:19:43", "throughput": "2361.90", "total_tokens": 170393600} {"current_steps": 20810, "total_steps": 23217, "loss": 0.7529, "learning_rate": 1.3143381635861207e-06, "epoch": 2.6889779041219795, "percentage": 89.63, "elapsed_time": "20:03:12", "remaining_time": "2:19:10", "throughput": "2361.41", "total_tokens": 170475520} {"current_steps": 20820, "total_steps": 23217, "loss": 0.8549, "learning_rate": 1.3035355996903697e-06, "epoch": 2.6902700607313608, "percentage": 89.68, "elapsed_time": "20:04:01", "remaining_time": "2:18:37", "throughput": "2360.95", "total_tokens": 170557440} {"current_steps": 20830, "total_steps": 23217, "loss": 0.7501, "learning_rate": 1.2927764239342221e-06, "epoch": 2.6915622173407416, "percentage": 89.72, "elapsed_time": "20:04:50", "remaining_time": "2:18:04", "throughput": "2360.47", "total_tokens": 170639360} {"current_steps": 20840, "total_steps": 23217, "loss": 0.9612, "learning_rate": 1.2820606560176945e-06, "epoch": 2.692854373950123, "percentage": 89.76, "elapsed_time": "20:05:39", "remaining_time": "2:17:30", "throughput": "2360.00", "total_tokens": 170721280} {"current_steps": 20850, "total_steps": 23217, "loss": 0.8317, "learning_rate": 1.2713883155613144e-06, "epoch": 2.694146530559504, "percentage": 89.8, "elapsed_time": "20:06:29", "remaining_time": "2:16:57", "throughput": "2359.51", "total_tokens": 170803200} {"current_steps": 20860, "total_steps": 23217, "loss": 0.6523, "learning_rate": 1.2607594221060975e-06, "epoch": 2.6954386871688847, "percentage": 89.85, "elapsed_time": "20:07:19", "remaining_time": "2:16:25", "throughput": "2359.00", "total_tokens": 170885120} {"current_steps": 20870, "total_steps": 23217, "loss": 0.8824, "learning_rate": 1.2501739951135155e-06, "epoch": 2.696730843778266, "percentage": 89.89, "elapsed_time": "20:08:08", "remaining_time": "2:15:51", "throughput": "2358.55", "total_tokens": 170967040} {"current_steps": 20880, "total_steps": 23217, "loss": 0.8567, "learning_rate": 1.2396320539654366e-06, "epoch": 2.698023000387647, "percentage": 89.93, "elapsed_time": "20:08:58", "remaining_time": "2:15:18", "throughput": "2358.03", "total_tokens": 171048960} {"current_steps": 20890, "total_steps": 23217, "loss": 1.1474, "learning_rate": 1.229133617964126e-06, "epoch": 2.699315156997028, "percentage": 89.98, "elapsed_time": "20:09:50", "remaining_time": "2:14:46", "throughput": "2357.50", "total_tokens": 171130880} {"current_steps": 20900, "total_steps": 23217, "loss": 0.5778, "learning_rate": 1.2186787063321743e-06, "epoch": 2.700607313606409, "percentage": 90.02, "elapsed_time": "20:10:39", "remaining_time": "2:14:12", "throughput": "2357.01", "total_tokens": 171212800} {"current_steps": 20910, "total_steps": 23217, "loss": 0.9957, "learning_rate": 1.208267338212493e-06, "epoch": 2.70189947021579, "percentage": 90.06, "elapsed_time": "20:11:29", "remaining_time": "2:13:39", "throughput": "2356.52", "total_tokens": 171294720} {"current_steps": 20920, "total_steps": 23217, "loss": 0.8154, "learning_rate": 1.1978995326682535e-06, "epoch": 2.7031916268251712, "percentage": 90.11, "elapsed_time": "20:12:21", "remaining_time": "2:13:06", "throughput": "2355.98", "total_tokens": 171376640} {"current_steps": 20930, "total_steps": 23217, "loss": 0.3983, "learning_rate": 1.1875753086828727e-06, "epoch": 2.7044837834345525, "percentage": 90.15, "elapsed_time": "20:13:14", "remaining_time": "2:12:34", "throughput": "2355.38", "total_tokens": 171458560} {"current_steps": 20940, "total_steps": 23217, "loss": 0.8132, "learning_rate": 1.177294685159963e-06, "epoch": 2.7057759400439334, "percentage": 90.19, "elapsed_time": "20:14:16", "remaining_time": "2:12:02", "throughput": "2354.50", "total_tokens": 171540480} {"current_steps": 20950, "total_steps": 23217, "loss": 0.6962, "learning_rate": 1.167057680923317e-06, "epoch": 2.7070680966533143, "percentage": 90.24, "elapsed_time": "20:15:09", "remaining_time": "2:11:29", "throughput": "2353.91", "total_tokens": 171622400} {"current_steps": 20960, "total_steps": 23217, "loss": 0.5466, "learning_rate": 1.1568643147168434e-06, "epoch": 2.7083602532626956, "percentage": 90.28, "elapsed_time": "20:16:06", "remaining_time": "2:10:57", "throughput": "2353.20", "total_tokens": 171704320} {"current_steps": 20970, "total_steps": 23217, "loss": 0.9384, "learning_rate": 1.1467146052045603e-06, "epoch": 2.7096524098720765, "percentage": 90.32, "elapsed_time": "20:16:59", "remaining_time": "2:10:24", "throughput": "2352.60", "total_tokens": 171786240} {"current_steps": 20980, "total_steps": 23217, "loss": 0.3847, "learning_rate": 1.1366085709705515e-06, "epoch": 2.7109445664814578, "percentage": 90.36, "elapsed_time": "20:17:50", "remaining_time": "2:09:51", "throughput": "2352.09", "total_tokens": 171868160} {"current_steps": 20990, "total_steps": 23217, "loss": 0.7502, "learning_rate": 1.1265462305189268e-06, "epoch": 2.7122367230908386, "percentage": 90.41, "elapsed_time": "20:18:38", "remaining_time": "2:09:17", "throughput": "2351.65", "total_tokens": 171950080} {"current_steps": 21000, "total_steps": 23217, "loss": 0.8216, "learning_rate": 1.1165276022737926e-06, "epoch": 2.7135288797002195, "percentage": 90.45, "elapsed_time": "20:19:28", "remaining_time": "2:08:44", "throughput": "2351.18", "total_tokens": 172032000} {"current_steps": 21010, "total_steps": 23217, "loss": 0.6687, "learning_rate": 1.1065527045792251e-06, "epoch": 2.714821036309601, "percentage": 90.49, "elapsed_time": "20:20:26", "remaining_time": "2:08:12", "throughput": "2350.43", "total_tokens": 172113920} {"current_steps": 21020, "total_steps": 23217, "loss": 1.0147, "learning_rate": 1.0966215556992231e-06, "epoch": 2.7161131929189817, "percentage": 90.54, "elapsed_time": "20:21:17", "remaining_time": "2:07:38", "throughput": "2349.91", "total_tokens": 172195840} {"current_steps": 21030, "total_steps": 23217, "loss": 0.9388, "learning_rate": 1.0867341738176857e-06, "epoch": 2.717405349528363, "percentage": 90.58, "elapsed_time": "20:22:07", "remaining_time": "2:07:05", "throughput": "2349.44", "total_tokens": 172277760} {"current_steps": 21040, "total_steps": 23217, "loss": 0.9003, "learning_rate": 1.076890577038367e-06, "epoch": 2.718697506137744, "percentage": 90.62, "elapsed_time": "20:22:56", "remaining_time": "2:06:32", "throughput": "2348.96", "total_tokens": 172359680} {"current_steps": 21050, "total_steps": 23217, "loss": 0.6774, "learning_rate": 1.0670907833848664e-06, "epoch": 2.7199896627471247, "percentage": 90.67, "elapsed_time": "20:23:49", "remaining_time": "2:05:59", "throughput": "2348.40", "total_tokens": 172441600} {"current_steps": 21060, "total_steps": 23217, "loss": 0.9375, "learning_rate": 1.0573348108005614e-06, "epoch": 2.721281819356506, "percentage": 90.71, "elapsed_time": "20:24:39", "remaining_time": "2:05:25", "throughput": "2347.90", "total_tokens": 172523520} {"current_steps": 21070, "total_steps": 23217, "loss": 0.5949, "learning_rate": 1.0476226771486074e-06, "epoch": 2.722573975965887, "percentage": 90.75, "elapsed_time": "20:25:29", "remaining_time": "2:04:52", "throughput": "2347.43", "total_tokens": 172605440} {"current_steps": 21080, "total_steps": 23217, "loss": 0.5954, "learning_rate": 1.0379544002118824e-06, "epoch": 2.723866132575268, "percentage": 90.8, "elapsed_time": "20:26:18", "remaining_time": "2:04:19", "throughput": "2346.98", "total_tokens": 172687360} {"current_steps": 21090, "total_steps": 23217, "loss": 0.4849, "learning_rate": 1.0283299976929672e-06, "epoch": 2.725158289184649, "percentage": 90.84, "elapsed_time": "20:27:12", "remaining_time": "2:03:46", "throughput": "2346.36", "total_tokens": 172769280} {"current_steps": 21100, "total_steps": 23217, "loss": 0.6476, "learning_rate": 1.0187494872141102e-06, "epoch": 2.7264504457940304, "percentage": 90.88, "elapsed_time": "20:28:06", "remaining_time": "2:03:13", "throughput": "2345.77", "total_tokens": 172851200} {"current_steps": 21110, "total_steps": 23217, "loss": 1.1527, "learning_rate": 1.0092128863171846e-06, "epoch": 2.7277426024034113, "percentage": 90.92, "elapsed_time": "20:29:01", "remaining_time": "2:02:40", "throughput": "2345.13", "total_tokens": 172933120} {"current_steps": 21120, "total_steps": 23217, "loss": 0.7512, "learning_rate": 9.997202124636785e-07, "epoch": 2.7290347590127926, "percentage": 90.97, "elapsed_time": "20:29:49", "remaining_time": "2:02:06", "throughput": "2344.70", "total_tokens": 173015040} {"current_steps": 21130, "total_steps": 23217, "loss": 0.6027, "learning_rate": 9.902714830346437e-07, "epoch": 2.7303269156221734, "percentage": 91.01, "elapsed_time": "20:30:39", "remaining_time": "2:01:33", "throughput": "2344.23", "total_tokens": 173096960} {"current_steps": 21140, "total_steps": 23217, "loss": 0.5431, "learning_rate": 9.808667153306612e-07, "epoch": 2.7316190722315543, "percentage": 91.05, "elapsed_time": "20:31:29", "remaining_time": "2:00:59", "throughput": "2343.76", "total_tokens": 173178880} {"current_steps": 21150, "total_steps": 23217, "loss": 0.7888, "learning_rate": 9.715059265718335e-07, "epoch": 2.7329112288409356, "percentage": 91.1, "elapsed_time": "20:32:19", "remaining_time": "2:00:26", "throughput": "2343.27", "total_tokens": 173260800} {"current_steps": 21160, "total_steps": 23217, "loss": 0.9271, "learning_rate": 9.62189133897723e-07, "epoch": 2.7342033854503165, "percentage": 91.14, "elapsed_time": "20:33:09", "remaining_time": "1:59:52", "throughput": "2342.79", "total_tokens": 173342720} {"current_steps": 21170, "total_steps": 23217, "loss": 0.8073, "learning_rate": 9.52916354367353e-07, "epoch": 2.735495542059698, "percentage": 91.18, "elapsed_time": "20:33:59", "remaining_time": "1:59:19", "throughput": "2342.33", "total_tokens": 173424640} {"current_steps": 21180, "total_steps": 23217, "loss": 1.2963, "learning_rate": 9.436876049591398e-07, "epoch": 2.7367876986690787, "percentage": 91.23, "elapsed_time": "20:34:48", "remaining_time": "1:58:45", "throughput": "2341.87", "total_tokens": 173506560} {"current_steps": 21190, "total_steps": 23217, "loss": 0.6766, "learning_rate": 9.345029025708995e-07, "epoch": 2.7380798552784595, "percentage": 91.27, "elapsed_time": "20:35:36", "remaining_time": "1:58:11", "throughput": "2341.47", "total_tokens": 173588480} {"current_steps": 21200, "total_steps": 23217, "loss": 0.5872, "learning_rate": 9.253622640197773e-07, "epoch": 2.739372011887841, "percentage": 91.31, "elapsed_time": "20:36:25", "remaining_time": "1:57:38", "throughput": "2341.02", "total_tokens": 173670400} {"current_steps": 21210, "total_steps": 23217, "loss": 0.5351, "learning_rate": 9.162657060422574e-07, "epoch": 2.7406641684972217, "percentage": 91.36, "elapsed_time": "20:37:15", "remaining_time": "1:57:04", "throughput": "2340.56", "total_tokens": 173752320} {"current_steps": 21220, "total_steps": 23217, "loss": 0.6825, "learning_rate": 9.072132452941002e-07, "epoch": 2.741956325106603, "percentage": 91.4, "elapsed_time": "20:38:09", "remaining_time": "1:56:31", "throughput": "2339.95", "total_tokens": 173834240} {"current_steps": 21230, "total_steps": 23217, "loss": 0.84, "learning_rate": 8.982048983503271e-07, "epoch": 2.743248481715984, "percentage": 91.44, "elapsed_time": "20:39:01", "remaining_time": "1:55:57", "throughput": "2339.43", "total_tokens": 173916160} {"current_steps": 21240, "total_steps": 23217, "loss": 0.4665, "learning_rate": 8.892406817051946e-07, "epoch": 2.7445406383253648, "percentage": 91.48, "elapsed_time": "20:39:53", "remaining_time": "1:55:24", "throughput": "2338.87", "total_tokens": 173998080} {"current_steps": 21250, "total_steps": 23217, "loss": 0.8926, "learning_rate": 8.803206117721424e-07, "epoch": 2.745832794934746, "percentage": 91.53, "elapsed_time": "20:40:44", "remaining_time": "1:54:50", "throughput": "2338.40", "total_tokens": 174080000} {"current_steps": 21260, "total_steps": 23217, "loss": 0.8874, "learning_rate": 8.714447048837948e-07, "epoch": 2.7471249515441274, "percentage": 91.57, "elapsed_time": "20:41:34", "remaining_time": "1:54:17", "throughput": "2337.91", "total_tokens": 174161920} {"current_steps": 21270, "total_steps": 23217, "loss": 0.9445, "learning_rate": 8.626129772918962e-07, "epoch": 2.7484171081535083, "percentage": 91.61, "elapsed_time": "20:42:24", "remaining_time": "1:53:43", "throughput": "2337.44", "total_tokens": 174243840} {"current_steps": 21280, "total_steps": 23217, "loss": 0.7208, "learning_rate": 8.538254451673138e-07, "epoch": 2.749709264762889, "percentage": 91.66, "elapsed_time": "20:43:17", "remaining_time": "1:53:10", "throughput": "2336.89", "total_tokens": 174325760} {"current_steps": 21290, "total_steps": 23217, "loss": 0.6216, "learning_rate": 8.450821245999829e-07, "epoch": 2.7510014213722704, "percentage": 91.7, "elapsed_time": "20:44:08", "remaining_time": "1:52:36", "throughput": "2336.38", "total_tokens": 174407680} {"current_steps": 21300, "total_steps": 23217, "loss": 0.9531, "learning_rate": 8.363830315988947e-07, "epoch": 2.7522935779816513, "percentage": 91.74, "elapsed_time": "20:44:57", "remaining_time": "1:52:02", "throughput": "2335.93", "total_tokens": 174489600} {"current_steps": 21310, "total_steps": 23217, "loss": 0.7485, "learning_rate": 8.277281820920523e-07, "epoch": 2.7535857345910326, "percentage": 91.79, "elapsed_time": "20:45:50", "remaining_time": "1:51:29", "throughput": "2335.37", "total_tokens": 174571520} {"current_steps": 21320, "total_steps": 23217, "loss": 1.0028, "learning_rate": 8.191175919264604e-07, "epoch": 2.7548778912004135, "percentage": 91.83, "elapsed_time": "20:46:44", "remaining_time": "1:50:55", "throughput": "2334.80", "total_tokens": 174653440} {"current_steps": 21330, "total_steps": 23217, "loss": 0.7594, "learning_rate": 8.105512768680712e-07, "epoch": 2.7561700478097944, "percentage": 91.87, "elapsed_time": "20:47:37", "remaining_time": "1:50:22", "throughput": "2334.23", "total_tokens": 174735360} {"current_steps": 21340, "total_steps": 23217, "loss": 0.7408, "learning_rate": 8.02029252601777e-07, "epoch": 2.7574622044191757, "percentage": 91.92, "elapsed_time": "20:48:31", "remaining_time": "1:49:48", "throughput": "2333.65", "total_tokens": 174817280} {"current_steps": 21350, "total_steps": 23217, "loss": 0.845, "learning_rate": 7.935515347313793e-07, "epoch": 2.7587543610285565, "percentage": 91.96, "elapsed_time": "20:49:22", "remaining_time": "1:49:15", "throughput": "2333.15", "total_tokens": 174899200} {"current_steps": 21360, "total_steps": 23217, "loss": 0.9223, "learning_rate": 7.851181387795392e-07, "epoch": 2.760046517637938, "percentage": 92.0, "elapsed_time": "20:50:22", "remaining_time": "1:48:42", "throughput": "2332.38", "total_tokens": 174981120} {"current_steps": 21370, "total_steps": 23217, "loss": 0.5397, "learning_rate": 7.767290801877796e-07, "epoch": 2.7613386742473187, "percentage": 92.04, "elapsed_time": "20:51:50", "remaining_time": "1:48:11", "throughput": "2330.74", "total_tokens": 175063040} {"current_steps": 21380, "total_steps": 23217, "loss": 0.7537, "learning_rate": 7.683843743164359e-07, "epoch": 2.7626308308566996, "percentage": 92.09, "elapsed_time": "20:52:41", "remaining_time": "1:47:38", "throughput": "2330.24", "total_tokens": 175144960} {"current_steps": 21390, "total_steps": 23217, "loss": 0.7232, "learning_rate": 7.600840364446333e-07, "epoch": 2.763922987466081, "percentage": 92.13, "elapsed_time": "20:53:30", "remaining_time": "1:47:04", "throughput": "2329.81", "total_tokens": 175226880} {"current_steps": 21400, "total_steps": 23217, "loss": 0.683, "learning_rate": 7.518280817702616e-07, "epoch": 2.765215144075462, "percentage": 92.17, "elapsed_time": "20:54:18", "remaining_time": "1:46:29", "throughput": "2329.41", "total_tokens": 175308800} {"current_steps": 21410, "total_steps": 23217, "loss": 0.9568, "learning_rate": 7.436165254099376e-07, "epoch": 2.766507300684843, "percentage": 92.22, "elapsed_time": "20:55:06", "remaining_time": "1:45:55", "throughput": "2329.01", "total_tokens": 175390720} {"current_steps": 21420, "total_steps": 23217, "loss": 0.8146, "learning_rate": 7.354493823990006e-07, "epoch": 2.767799457294224, "percentage": 92.26, "elapsed_time": "20:55:55", "remaining_time": "1:45:21", "throughput": "2328.59", "total_tokens": 175472640} {"current_steps": 21430, "total_steps": 23217, "loss": 0.8714, "learning_rate": 7.273266676914498e-07, "epoch": 2.7690916139036053, "percentage": 92.3, "elapsed_time": "20:56:44", "remaining_time": "1:44:47", "throughput": "2328.17", "total_tokens": 175554560} {"current_steps": 21440, "total_steps": 23217, "loss": 0.621, "learning_rate": 7.19248396159955e-07, "epoch": 2.770383770512986, "percentage": 92.35, "elapsed_time": "20:57:32", "remaining_time": "1:44:13", "throughput": "2327.77", "total_tokens": 175636480} {"current_steps": 21450, "total_steps": 23217, "loss": 0.8045, "learning_rate": 7.112145825957927e-07, "epoch": 2.7716759271223674, "percentage": 92.39, "elapsed_time": "20:58:20", "remaining_time": "1:43:39", "throughput": "2327.38", "total_tokens": 175718400} {"current_steps": 21460, "total_steps": 23217, "loss": 1.0378, "learning_rate": 7.03225241708852e-07, "epoch": 2.7729680837317483, "percentage": 92.43, "elapsed_time": "20:59:08", "remaining_time": "1:43:05", "throughput": "2326.99", "total_tokens": 175800320} {"current_steps": 21470, "total_steps": 23217, "loss": 0.5995, "learning_rate": 6.952803881275894e-07, "epoch": 2.774260240341129, "percentage": 92.48, "elapsed_time": "20:59:56", "remaining_time": "1:42:31", "throughput": "2326.61", "total_tokens": 175882240} {"current_steps": 21480, "total_steps": 23217, "loss": 0.9361, "learning_rate": 6.873800363989935e-07, "epoch": 2.7755523969505105, "percentage": 92.52, "elapsed_time": "21:00:43", "remaining_time": "1:41:57", "throughput": "2326.21", "total_tokens": 175964160} {"current_steps": 21490, "total_steps": 23217, "loss": 0.7132, "learning_rate": 6.795242009885905e-07, "epoch": 2.7768445535598913, "percentage": 92.56, "elapsed_time": "21:01:32", "remaining_time": "1:41:22", "throughput": "2325.82", "total_tokens": 176046080} {"current_steps": 21500, "total_steps": 23217, "loss": 0.9569, "learning_rate": 6.717128962803798e-07, "epoch": 2.7781367101692727, "percentage": 92.6, "elapsed_time": "21:02:20", "remaining_time": "1:40:48", "throughput": "2325.42", "total_tokens": 176128000} {"current_steps": 21510, "total_steps": 23217, "loss": 0.5613, "learning_rate": 6.63946136576829e-07, "epoch": 2.7794288667786535, "percentage": 92.65, "elapsed_time": "21:03:08", "remaining_time": "1:40:14", "throughput": "2325.03", "total_tokens": 176209920} {"current_steps": 21520, "total_steps": 23217, "loss": 0.8761, "learning_rate": 6.562239360988542e-07, "epoch": 2.7807210233880344, "percentage": 92.69, "elapsed_time": "21:03:56", "remaining_time": "1:39:40", "throughput": "2324.62", "total_tokens": 176291840} {"current_steps": 21530, "total_steps": 23217, "loss": 0.5046, "learning_rate": 6.485463089857674e-07, "epoch": 2.7820131799974157, "percentage": 92.73, "elapsed_time": "21:04:45", "remaining_time": "1:39:06", "throughput": "2324.22", "total_tokens": 176373760} {"current_steps": 21540, "total_steps": 23217, "loss": 0.8931, "learning_rate": 6.409132692952874e-07, "epoch": 2.783305336606797, "percentage": 92.78, "elapsed_time": "21:05:32", "remaining_time": "1:38:31", "throughput": "2323.84", "total_tokens": 176455680} {"current_steps": 21550, "total_steps": 23217, "loss": 0.9367, "learning_rate": 6.333248310034706e-07, "epoch": 2.784597493216178, "percentage": 92.82, "elapsed_time": "21:06:20", "remaining_time": "1:37:57", "throughput": "2323.45", "total_tokens": 176537600} {"current_steps": 21560, "total_steps": 23217, "loss": 1.0246, "learning_rate": 6.257810080047249e-07, "epoch": 2.7858896498255588, "percentage": 92.86, "elapsed_time": "21:07:08", "remaining_time": "1:37:23", "throughput": "2323.07", "total_tokens": 176619520} {"current_steps": 21570, "total_steps": 23217, "loss": 0.7575, "learning_rate": 6.182818141117625e-07, "epoch": 2.78718180643494, "percentage": 92.91, "elapsed_time": "21:07:56", "remaining_time": "1:36:48", "throughput": "2322.69", "total_tokens": 176701440} {"current_steps": 21580, "total_steps": 23217, "loss": 0.8363, "learning_rate": 6.1082726305558e-07, "epoch": 2.788473963044321, "percentage": 92.95, "elapsed_time": "21:08:43", "remaining_time": "1:36:14", "throughput": "2322.31", "total_tokens": 176783360} {"current_steps": 21590, "total_steps": 23217, "loss": 0.8788, "learning_rate": 6.034173684854316e-07, "epoch": 2.7897661196537022, "percentage": 92.99, "elapsed_time": "21:09:32", "remaining_time": "1:35:40", "throughput": "2321.92", "total_tokens": 176865280} {"current_steps": 21600, "total_steps": 23217, "loss": 0.7845, "learning_rate": 5.960521439688088e-07, "epoch": 2.791058276263083, "percentage": 93.04, "elapsed_time": "21:10:23", "remaining_time": "1:35:06", "throughput": "2321.42", "total_tokens": 176947200} {"current_steps": 21610, "total_steps": 23217, "loss": 0.8485, "learning_rate": 5.88731602991413e-07, "epoch": 2.792350432872464, "percentage": 93.08, "elapsed_time": "21:11:13", "remaining_time": "1:34:31", "throughput": "2320.98", "total_tokens": 177029120} {"current_steps": 21620, "total_steps": 23217, "loss": 0.9114, "learning_rate": 5.814557589571223e-07, "epoch": 2.7936425894818453, "percentage": 93.12, "elapsed_time": "21:12:03", "remaining_time": "1:33:57", "throughput": "2320.53", "total_tokens": 177111040} {"current_steps": 21630, "total_steps": 23217, "loss": 0.6277, "learning_rate": 5.742246251879829e-07, "epoch": 2.794934746091226, "percentage": 93.16, "elapsed_time": "21:12:53", "remaining_time": "1:33:23", "throughput": "2320.08", "total_tokens": 177192960} {"current_steps": 21640, "total_steps": 23217, "loss": 0.8553, "learning_rate": 5.67038214924176e-07, "epoch": 2.7962269027006075, "percentage": 93.21, "elapsed_time": "21:13:41", "remaining_time": "1:32:49", "throughput": "2319.71", "total_tokens": 177274880} {"current_steps": 21650, "total_steps": 23217, "loss": 0.7787, "learning_rate": 5.598965413239926e-07, "epoch": 2.7975190593099883, "percentage": 93.25, "elapsed_time": "21:14:31", "remaining_time": "1:32:14", "throughput": "2319.27", "total_tokens": 177356800} {"current_steps": 21660, "total_steps": 23217, "loss": 0.5017, "learning_rate": 5.527996174638061e-07, "epoch": 2.798811215919369, "percentage": 93.29, "elapsed_time": "21:15:19", "remaining_time": "1:31:40", "throughput": "2318.87", "total_tokens": 177438720} {"current_steps": 21670, "total_steps": 23217, "loss": 1.0671, "learning_rate": 5.457474563380638e-07, "epoch": 2.8001033725287505, "percentage": 93.34, "elapsed_time": "21:16:07", "remaining_time": "1:31:06", "throughput": "2318.49", "total_tokens": 177520640} {"current_steps": 21680, "total_steps": 23217, "loss": 1.0223, "learning_rate": 5.387400708592422e-07, "epoch": 2.8013955291381314, "percentage": 93.38, "elapsed_time": "21:16:55", "remaining_time": "1:30:31", "throughput": "2318.11", "total_tokens": 177602560} {"current_steps": 21690, "total_steps": 23217, "loss": 0.7952, "learning_rate": 5.317774738578446e-07, "epoch": 2.8026876857475127, "percentage": 93.42, "elapsed_time": "21:17:46", "remaining_time": "1:29:57", "throughput": "2317.62", "total_tokens": 177684480} {"current_steps": 21700, "total_steps": 23217, "loss": 0.5789, "learning_rate": 5.248596780823567e-07, "epoch": 2.8039798423568936, "percentage": 93.47, "elapsed_time": "21:18:37", "remaining_time": "1:29:23", "throughput": "2317.16", "total_tokens": 177766400} {"current_steps": 21710, "total_steps": 23217, "loss": 0.9732, "learning_rate": 5.179866961992353e-07, "epoch": 2.8052719989662744, "percentage": 93.51, "elapsed_time": "21:19:28", "remaining_time": "1:28:48", "throughput": "2316.70", "total_tokens": 177848320} {"current_steps": 21720, "total_steps": 23217, "loss": 0.6634, "learning_rate": 5.111585407928887e-07, "epoch": 2.8065641555756558, "percentage": 93.55, "elapsed_time": "21:20:18", "remaining_time": "1:28:14", "throughput": "2316.25", "total_tokens": 177930240} {"current_steps": 21730, "total_steps": 23217, "loss": 0.6454, "learning_rate": 5.043752243656414e-07, "epoch": 2.807856312185037, "percentage": 93.6, "elapsed_time": "21:21:08", "remaining_time": "1:27:40", "throughput": "2315.80", "total_tokens": 178012160} {"current_steps": 21740, "total_steps": 23217, "loss": 0.8702, "learning_rate": 4.976367593377218e-07, "epoch": 2.809148468794418, "percentage": 93.64, "elapsed_time": "21:21:58", "remaining_time": "1:27:05", "throughput": "2315.35", "total_tokens": 178094080} {"current_steps": 21750, "total_steps": 23217, "loss": 1.0812, "learning_rate": 4.909431580472385e-07, "epoch": 2.810440625403799, "percentage": 93.68, "elapsed_time": "21:22:49", "remaining_time": "1:26:31", "throughput": "2314.88", "total_tokens": 178176000} {"current_steps": 21760, "total_steps": 23217, "loss": 0.9232, "learning_rate": 4.842944327501458e-07, "epoch": 2.81173278201318, "percentage": 93.72, "elapsed_time": "21:23:40", "remaining_time": "1:25:57", "throughput": "2314.43", "total_tokens": 178257920} {"current_steps": 21770, "total_steps": 23217, "loss": 0.7583, "learning_rate": 4.776905956202393e-07, "epoch": 2.813024938622561, "percentage": 93.77, "elapsed_time": "21:24:35", "remaining_time": "1:25:23", "throughput": "2313.84", "total_tokens": 178339840} {"current_steps": 21780, "total_steps": 23217, "loss": 0.626, "learning_rate": 4.711316587491188e-07, "epoch": 2.8143170952319423, "percentage": 93.81, "elapsed_time": "21:25:25", "remaining_time": "1:24:48", "throughput": "2313.41", "total_tokens": 178421760} {"current_steps": 21790, "total_steps": 23217, "loss": 0.7818, "learning_rate": 4.646176341461722e-07, "epoch": 2.815609251841323, "percentage": 93.85, "elapsed_time": "21:26:15", "remaining_time": "1:24:14", "throughput": "2312.97", "total_tokens": 178503680} {"current_steps": 21800, "total_steps": 23217, "loss": 0.7148, "learning_rate": 4.581485337385588e-07, "epoch": 2.816901408450704, "percentage": 93.9, "elapsed_time": "21:27:05", "remaining_time": "1:23:39", "throughput": "2312.52", "total_tokens": 178585600} {"current_steps": 21810, "total_steps": 23217, "loss": 0.8498, "learning_rate": 4.5172436937117036e-07, "epoch": 2.8181935650600853, "percentage": 93.94, "elapsed_time": "21:27:55", "remaining_time": "1:23:05", "throughput": "2312.08", "total_tokens": 178667520} {"current_steps": 21820, "total_steps": 23217, "loss": 1.0099, "learning_rate": 4.4534515280663937e-07, "epoch": 2.819485721669466, "percentage": 93.98, "elapsed_time": "21:28:45", "remaining_time": "1:22:30", "throughput": "2311.64", "total_tokens": 178749440} {"current_steps": 21830, "total_steps": 23217, "loss": 0.878, "learning_rate": 4.390108957252781e-07, "epoch": 2.8207778782788475, "percentage": 94.03, "elapsed_time": "21:29:35", "remaining_time": "1:21:56", "throughput": "2311.20", "total_tokens": 178831360} {"current_steps": 21840, "total_steps": 23217, "loss": 0.7988, "learning_rate": 4.3272160972509524e-07, "epoch": 2.8220700348882284, "percentage": 94.07, "elapsed_time": "21:30:25", "remaining_time": "1:21:21", "throughput": "2310.77", "total_tokens": 178913280} {"current_steps": 21850, "total_steps": 23217, "loss": 1.0454, "learning_rate": 4.264773063217431e-07, "epoch": 2.8233621914976093, "percentage": 94.11, "elapsed_time": "21:31:15", "remaining_time": "1:20:47", "throughput": "2310.34", "total_tokens": 178995200} {"current_steps": 21860, "total_steps": 23217, "loss": 0.9275, "learning_rate": 4.20277996948526e-07, "epoch": 2.8246543481069906, "percentage": 94.16, "elapsed_time": "21:32:06", "remaining_time": "1:20:12", "throughput": "2309.88", "total_tokens": 179077120} {"current_steps": 21870, "total_steps": 23217, "loss": 0.95, "learning_rate": 4.1412369295635023e-07, "epoch": 2.825946504716372, "percentage": 94.2, "elapsed_time": "21:32:56", "remaining_time": "1:19:38", "throughput": "2309.44", "total_tokens": 179159040} {"current_steps": 21880, "total_steps": 23217, "loss": 0.8007, "learning_rate": 4.0801440561372694e-07, "epoch": 2.8272386613257527, "percentage": 94.24, "elapsed_time": "21:33:46", "remaining_time": "1:19:03", "throughput": "2309.02", "total_tokens": 179240960} {"current_steps": 21890, "total_steps": 23217, "loss": 0.8786, "learning_rate": 4.0195014610674153e-07, "epoch": 2.8285308179351336, "percentage": 94.28, "elapsed_time": "21:34:36", "remaining_time": "1:18:28", "throughput": "2308.58", "total_tokens": 179322880} {"current_steps": 21900, "total_steps": 23217, "loss": 0.8457, "learning_rate": 3.9593092553902587e-07, "epoch": 2.829822974544515, "percentage": 94.33, "elapsed_time": "21:35:26", "remaining_time": "1:17:54", "throughput": "2308.15", "total_tokens": 179404800} {"current_steps": 21910, "total_steps": 23217, "loss": 0.7406, "learning_rate": 3.899567549317529e-07, "epoch": 2.831115131153896, "percentage": 94.37, "elapsed_time": "21:36:17", "remaining_time": "1:17:19", "throughput": "2307.70", "total_tokens": 179486720} {"current_steps": 21920, "total_steps": 23217, "loss": 0.7223, "learning_rate": 3.840276452236058e-07, "epoch": 2.832407287763277, "percentage": 94.41, "elapsed_time": "21:37:06", "remaining_time": "1:16:44", "throughput": "2307.28", "total_tokens": 179568640} {"current_steps": 21930, "total_steps": 23217, "loss": 0.8734, "learning_rate": 3.7814360727076724e-07, "epoch": 2.833699444372658, "percentage": 94.46, "elapsed_time": "21:37:56", "remaining_time": "1:16:10", "throughput": "2306.85", "total_tokens": 179650560} {"current_steps": 21940, "total_steps": 23217, "loss": 0.5382, "learning_rate": 3.723046518468859e-07, "epoch": 2.834991600982039, "percentage": 94.5, "elapsed_time": "21:38:46", "remaining_time": "1:15:35", "throughput": "2306.42", "total_tokens": 179732480} {"current_steps": 21950, "total_steps": 23217, "loss": 1.0019, "learning_rate": 3.6651078964306807e-07, "epoch": 2.83628375759142, "percentage": 94.54, "elapsed_time": "21:39:36", "remaining_time": "1:15:00", "throughput": "2306.00", "total_tokens": 179814400} {"current_steps": 21960, "total_steps": 23217, "loss": 0.7448, "learning_rate": 3.607620312678528e-07, "epoch": 2.837575914200801, "percentage": 94.59, "elapsed_time": "21:40:26", "remaining_time": "1:14:26", "throughput": "2305.57", "total_tokens": 179896320} {"current_steps": 21970, "total_steps": 23217, "loss": 0.553, "learning_rate": 3.550583872471952e-07, "epoch": 2.8388680708101823, "percentage": 94.63, "elapsed_time": "21:41:16", "remaining_time": "1:13:51", "throughput": "2305.14", "total_tokens": 179978240} {"current_steps": 21980, "total_steps": 23217, "loss": 0.9766, "learning_rate": 3.4939986802445256e-07, "epoch": 2.840160227419563, "percentage": 94.67, "elapsed_time": "21:42:07", "remaining_time": "1:13:16", "throughput": "2304.70", "total_tokens": 180060160} {"current_steps": 21990, "total_steps": 23217, "loss": 0.3731, "learning_rate": 3.437864839603455e-07, "epoch": 2.841452384028944, "percentage": 94.72, "elapsed_time": "21:42:55", "remaining_time": "1:12:42", "throughput": "2304.32", "total_tokens": 180142080} {"current_steps": 22000, "total_steps": 23217, "loss": 0.5934, "learning_rate": 3.3821824533296633e-07, "epoch": 2.8427445406383254, "percentage": 94.76, "elapsed_time": "21:43:42", "remaining_time": "1:12:07", "throughput": "2303.98", "total_tokens": 180224000} {"current_steps": 22010, "total_steps": 23217, "loss": 0.7189, "learning_rate": 3.3269516233773446e-07, "epoch": 2.8440366972477067, "percentage": 94.8, "elapsed_time": "21:44:34", "remaining_time": "1:11:32", "throughput": "2303.52", "total_tokens": 180305920} {"current_steps": 22020, "total_steps": 23217, "loss": 0.6045, "learning_rate": 3.272172450873967e-07, "epoch": 2.8453288538570876, "percentage": 94.84, "elapsed_time": "21:45:21", "remaining_time": "1:10:57", "throughput": "2303.18", "total_tokens": 180387840} {"current_steps": 22030, "total_steps": 23217, "loss": 0.4563, "learning_rate": 3.217845036119993e-07, "epoch": 2.8466210104664684, "percentage": 94.89, "elapsed_time": "21:46:08", "remaining_time": "1:10:22", "throughput": "2302.84", "total_tokens": 180469760} {"current_steps": 22040, "total_steps": 23217, "loss": 0.7337, "learning_rate": 3.163969478588713e-07, "epoch": 2.8479131670758497, "percentage": 94.93, "elapsed_time": "21:46:55", "remaining_time": "1:09:47", "throughput": "2302.50", "total_tokens": 180551680} {"current_steps": 22050, "total_steps": 23217, "loss": 0.8102, "learning_rate": 3.11054587692608e-07, "epoch": 2.8492053236852306, "percentage": 94.97, "elapsed_time": "21:47:42", "remaining_time": "1:09:12", "throughput": "2302.16", "total_tokens": 180633600} {"current_steps": 22060, "total_steps": 23217, "loss": 0.841, "learning_rate": 3.057574328950541e-07, "epoch": 2.850497480294612, "percentage": 95.02, "elapsed_time": "21:48:29", "remaining_time": "1:08:37", "throughput": "2301.83", "total_tokens": 180715520} {"current_steps": 22070, "total_steps": 23217, "loss": 0.5297, "learning_rate": 3.005054931652762e-07, "epoch": 2.851789636903993, "percentage": 95.06, "elapsed_time": "21:49:16", "remaining_time": "1:08:02", "throughput": "2301.49", "total_tokens": 180797440} {"current_steps": 22080, "total_steps": 23217, "loss": 0.7995, "learning_rate": 2.952987781195599e-07, "epoch": 2.8530817935133737, "percentage": 95.1, "elapsed_time": "21:50:03", "remaining_time": "1:07:27", "throughput": "2301.15", "total_tokens": 180879360} {"current_steps": 22090, "total_steps": 23217, "loss": 0.8583, "learning_rate": 2.901372972913791e-07, "epoch": 2.854373950122755, "percentage": 95.15, "elapsed_time": "21:50:50", "remaining_time": "1:06:52", "throughput": "2300.82", "total_tokens": 180961280} {"current_steps": 22100, "total_steps": 23217, "loss": 0.8178, "learning_rate": 2.8502106013138516e-07, "epoch": 2.855666106732136, "percentage": 95.19, "elapsed_time": "21:51:38", "remaining_time": "1:06:17", "throughput": "2300.48", "total_tokens": 181043200} {"current_steps": 22110, "total_steps": 23217, "loss": 0.7179, "learning_rate": 2.799500760073931e-07, "epoch": 2.856958263341517, "percentage": 95.23, "elapsed_time": "21:52:25", "remaining_time": "1:05:42", "throughput": "2300.14", "total_tokens": 181125120} {"current_steps": 22120, "total_steps": 23217, "loss": 0.4239, "learning_rate": 2.749243542043561e-07, "epoch": 2.858250419950898, "percentage": 95.28, "elapsed_time": "21:53:12", "remaining_time": "1:05:07", "throughput": "2299.80", "total_tokens": 181207040} {"current_steps": 22130, "total_steps": 23217, "loss": 0.88, "learning_rate": 2.699439039243523e-07, "epoch": 2.859542576560279, "percentage": 95.32, "elapsed_time": "21:54:00", "remaining_time": "1:04:32", "throughput": "2299.44", "total_tokens": 181288960} {"current_steps": 22140, "total_steps": 23217, "loss": 0.4962, "learning_rate": 2.6500873428656483e-07, "epoch": 2.86083473316966, "percentage": 95.36, "elapsed_time": "21:54:48", "remaining_time": "1:03:57", "throughput": "2299.08", "total_tokens": 181370880} {"current_steps": 22150, "total_steps": 23217, "loss": 0.7783, "learning_rate": 2.601188543272737e-07, "epoch": 2.862126889779041, "percentage": 95.4, "elapsed_time": "21:55:37", "remaining_time": "1:03:22", "throughput": "2298.70", "total_tokens": 181452800} {"current_steps": 22160, "total_steps": 23217, "loss": 1.1341, "learning_rate": 2.552742729998309e-07, "epoch": 2.8634190463884224, "percentage": 95.45, "elapsed_time": "21:56:25", "remaining_time": "1:02:47", "throughput": "2298.32", "total_tokens": 181534720} {"current_steps": 22170, "total_steps": 23217, "loss": 0.6448, "learning_rate": 2.5047499917464636e-07, "epoch": 2.8647112029978032, "percentage": 95.49, "elapsed_time": "21:57:13", "remaining_time": "1:02:12", "throughput": "2297.97", "total_tokens": 181616640} {"current_steps": 22180, "total_steps": 23217, "loss": 0.7003, "learning_rate": 2.457210416391742e-07, "epoch": 2.8660033596071846, "percentage": 95.53, "elapsed_time": "21:58:01", "remaining_time": "1:01:37", "throughput": "2297.62", "total_tokens": 181698560} {"current_steps": 22190, "total_steps": 23217, "loss": 0.9887, "learning_rate": 2.4101240909789325e-07, "epoch": 2.8672955162165654, "percentage": 95.58, "elapsed_time": "21:58:48", "remaining_time": "1:01:02", "throughput": "2297.28", "total_tokens": 181780480} {"current_steps": 22200, "total_steps": 23217, "loss": 0.6259, "learning_rate": 2.3634911017229034e-07, "epoch": 2.8685876728259467, "percentage": 95.62, "elapsed_time": "21:59:35", "remaining_time": "1:00:27", "throughput": "2296.95", "total_tokens": 181862400} {"current_steps": 22210, "total_steps": 23217, "loss": 0.9638, "learning_rate": 2.3173115340085204e-07, "epoch": 2.8698798294353276, "percentage": 95.66, "elapsed_time": "22:00:24", "remaining_time": "0:59:52", "throughput": "2296.58", "total_tokens": 181944320} {"current_steps": 22220, "total_steps": 23217, "loss": 0.9015, "learning_rate": 2.2715854723903974e-07, "epoch": 2.8711719860447085, "percentage": 95.71, "elapsed_time": "22:01:11", "remaining_time": "0:59:16", "throughput": "2296.23", "total_tokens": 182026240} {"current_steps": 22230, "total_steps": 23217, "loss": 0.7179, "learning_rate": 2.2263130005927558e-07, "epoch": 2.87246414265409, "percentage": 95.75, "elapsed_time": "22:02:00", "remaining_time": "0:58:41", "throughput": "2295.85", "total_tokens": 182108160} {"current_steps": 22240, "total_steps": 23217, "loss": 0.936, "learning_rate": 2.181494201509343e-07, "epoch": 2.8737562992634706, "percentage": 95.79, "elapsed_time": "22:02:47", "remaining_time": "0:58:06", "throughput": "2295.52", "total_tokens": 182190080} {"current_steps": 22250, "total_steps": 23217, "loss": 0.5952, "learning_rate": 2.1371291572032382e-07, "epoch": 2.875048455872852, "percentage": 95.83, "elapsed_time": "22:03:34", "remaining_time": "0:57:31", "throughput": "2295.19", "total_tokens": 182272000} {"current_steps": 22260, "total_steps": 23217, "loss": 0.7432, "learning_rate": 2.0932179489066006e-07, "epoch": 2.876340612482233, "percentage": 95.88, "elapsed_time": "22:04:21", "remaining_time": "0:56:56", "throughput": "2294.86", "total_tokens": 182353920} {"current_steps": 22270, "total_steps": 23217, "loss": 0.8684, "learning_rate": 2.0497606570207829e-07, "epoch": 2.8776327690916137, "percentage": 95.92, "elapsed_time": "22:05:09", "remaining_time": "0:56:21", "throughput": "2294.52", "total_tokens": 182435840} {"current_steps": 22280, "total_steps": 23217, "loss": 0.6558, "learning_rate": 2.0067573611158853e-07, "epoch": 2.878924925700995, "percentage": 95.96, "elapsed_time": "22:05:58", "remaining_time": "0:55:45", "throughput": "2294.14", "total_tokens": 182517760} {"current_steps": 22290, "total_steps": 23217, "loss": 0.562, "learning_rate": 1.9642081399307844e-07, "epoch": 2.880217082310376, "percentage": 96.01, "elapsed_time": "22:06:56", "remaining_time": "0:55:11", "throughput": "2293.48", "total_tokens": 182599680} {"current_steps": 22300, "total_steps": 23217, "loss": 0.7792, "learning_rate": 1.9221130713729663e-07, "epoch": 2.881509238919757, "percentage": 96.05, "elapsed_time": "22:07:50", "remaining_time": "0:54:36", "throughput": "2292.96", "total_tokens": 182681600} {"current_steps": 22310, "total_steps": 23217, "loss": 0.7825, "learning_rate": 1.8804722325183044e-07, "epoch": 2.882801395529138, "percentage": 96.09, "elapsed_time": "22:08:39", "remaining_time": "0:54:00", "throughput": "2292.59", "total_tokens": 182763520} {"current_steps": 22320, "total_steps": 23217, "loss": 0.6558, "learning_rate": 1.8392856996110875e-07, "epoch": 2.884093552138519, "percentage": 96.14, "elapsed_time": "22:09:29", "remaining_time": "0:53:25", "throughput": "2292.16", "total_tokens": 182845440} {"current_steps": 22330, "total_steps": 23217, "loss": 0.6038, "learning_rate": 1.7985535480636584e-07, "epoch": 2.8853857087479002, "percentage": 96.18, "elapsed_time": "22:10:19", "remaining_time": "0:52:50", "throughput": "2291.75", "total_tokens": 182927360} {"current_steps": 22340, "total_steps": 23217, "loss": 0.787, "learning_rate": 1.7582758524564425e-07, "epoch": 2.8866778653572815, "percentage": 96.22, "elapsed_time": "22:11:10", "remaining_time": "0:52:15", "throughput": "2291.33", "total_tokens": 183009280} {"current_steps": 22350, "total_steps": 23217, "loss": 0.56, "learning_rate": 1.7184526865377805e-07, "epoch": 2.8879700219666624, "percentage": 96.27, "elapsed_time": "22:11:59", "remaining_time": "0:51:40", "throughput": "2290.95", "total_tokens": 183091200} {"current_steps": 22360, "total_steps": 23217, "loss": 0.494, "learning_rate": 1.6790841232237064e-07, "epoch": 2.8892621785760433, "percentage": 96.31, "elapsed_time": "22:12:47", "remaining_time": "0:51:04", "throughput": "2290.59", "total_tokens": 183173120} {"current_steps": 22370, "total_steps": 23217, "loss": 1.0883, "learning_rate": 1.6401702345979485e-07, "epoch": 2.8905543351854246, "percentage": 96.35, "elapsed_time": "22:13:36", "remaining_time": "0:50:29", "throughput": "2290.23", "total_tokens": 183255040} {"current_steps": 22380, "total_steps": 23217, "loss": 0.7701, "learning_rate": 1.6017110919116786e-07, "epoch": 2.8918464917948055, "percentage": 96.39, "elapsed_time": "22:14:24", "remaining_time": "0:49:54", "throughput": "2289.87", "total_tokens": 183336960} {"current_steps": 22390, "total_steps": 23217, "loss": 0.7901, "learning_rate": 1.5637067655834282e-07, "epoch": 2.8931386484041868, "percentage": 96.44, "elapsed_time": "22:15:12", "remaining_time": "0:49:19", "throughput": "2289.50", "total_tokens": 183418880} {"current_steps": 22400, "total_steps": 23217, "loss": 0.8333, "learning_rate": 1.526157325199007e-07, "epoch": 2.8944308050135676, "percentage": 96.48, "elapsed_time": "22:16:01", "remaining_time": "0:48:43", "throughput": "2289.14", "total_tokens": 183500800} {"current_steps": 22410, "total_steps": 23217, "loss": 0.3667, "learning_rate": 1.4890628395113072e-07, "epoch": 2.8957229616229485, "percentage": 96.52, "elapsed_time": "22:16:50", "remaining_time": "0:48:08", "throughput": "2288.75", "total_tokens": 183582720} {"current_steps": 22420, "total_steps": 23217, "loss": 1.0644, "learning_rate": 1.452423376440193e-07, "epoch": 2.89701511823233, "percentage": 96.57, "elapsed_time": "22:17:42", "remaining_time": "0:47:33", "throughput": "2288.31", "total_tokens": 183664640} {"current_steps": 22430, "total_steps": 23217, "loss": 0.6229, "learning_rate": 1.4162390030723617e-07, "epoch": 2.8983072748417107, "percentage": 96.61, "elapsed_time": "22:18:32", "remaining_time": "0:46:57", "throughput": "2287.88", "total_tokens": 183746560} {"current_steps": 22440, "total_steps": 23217, "loss": 0.8879, "learning_rate": 1.380509785661288e-07, "epoch": 2.899599431451092, "percentage": 96.65, "elapsed_time": "22:19:24", "remaining_time": "0:46:22", "throughput": "2287.44", "total_tokens": 183828480} {"current_steps": 22450, "total_steps": 23217, "loss": 0.7747, "learning_rate": 1.3452357896270308e-07, "epoch": 2.900891588060473, "percentage": 96.7, "elapsed_time": "22:20:15", "remaining_time": "0:45:47", "throughput": "2287.00", "total_tokens": 183910400} {"current_steps": 22460, "total_steps": 23217, "loss": 0.7773, "learning_rate": 1.3104170795561477e-07, "epoch": 2.9021837446698537, "percentage": 96.74, "elapsed_time": "22:21:10", "remaining_time": "0:45:12", "throughput": "2286.44", "total_tokens": 183992320} {"current_steps": 22470, "total_steps": 23217, "loss": 0.7762, "learning_rate": 1.2760537192015866e-07, "epoch": 2.903475901279235, "percentage": 96.78, "elapsed_time": "22:22:01", "remaining_time": "0:44:36", "throughput": "2286.03", "total_tokens": 184074240} {"current_steps": 22480, "total_steps": 23217, "loss": 0.7858, "learning_rate": 1.242145771482489e-07, "epoch": 2.9047680578886164, "percentage": 96.83, "elapsed_time": "22:22:51", "remaining_time": "0:44:01", "throughput": "2285.61", "total_tokens": 184156160} {"current_steps": 22490, "total_steps": 23217, "loss": 0.9757, "learning_rate": 1.2086932984842758e-07, "epoch": 2.9060602144979972, "percentage": 96.87, "elapsed_time": "22:23:42", "remaining_time": "0:43:26", "throughput": "2285.18", "total_tokens": 184238080} {"current_steps": 22500, "total_steps": 23217, "loss": 0.8254, "learning_rate": 1.1756963614582006e-07, "epoch": 2.907352371107378, "percentage": 96.91, "elapsed_time": "22:24:36", "remaining_time": "0:42:50", "throughput": "2284.69", "total_tokens": 184320000} {"current_steps": 22510, "total_steps": 23217, "loss": 0.2809, "learning_rate": 1.1431550208215736e-07, "epoch": 2.9086445277167594, "percentage": 96.95, "elapsed_time": "22:25:30", "remaining_time": "0:42:15", "throughput": "2284.16", "total_tokens": 184401920} {"current_steps": 22520, "total_steps": 23217, "loss": 0.779, "learning_rate": 1.1110693361574831e-07, "epoch": 2.9099366843261403, "percentage": 97.0, "elapsed_time": "22:26:21", "remaining_time": "0:41:40", "throughput": "2283.73", "total_tokens": 184483840} {"current_steps": 22530, "total_steps": 23217, "loss": 0.9263, "learning_rate": 1.0794393662147129e-07, "epoch": 2.9112288409355216, "percentage": 97.04, "elapsed_time": "22:27:13", "remaining_time": "0:41:04", "throughput": "2283.29", "total_tokens": 184565760} {"current_steps": 22540, "total_steps": 23217, "loss": 0.6628, "learning_rate": 1.0482651689075751e-07, "epoch": 2.9125209975449025, "percentage": 97.08, "elapsed_time": "22:28:03", "remaining_time": "0:40:29", "throughput": "2282.88", "total_tokens": 184647680} {"current_steps": 22550, "total_steps": 23217, "loss": 0.7321, "learning_rate": 1.0175468013159384e-07, "epoch": 2.9138131541542833, "percentage": 97.13, "elapsed_time": "22:28:54", "remaining_time": "0:39:53", "throughput": "2282.46", "total_tokens": 184729600} {"current_steps": 22560, "total_steps": 23217, "loss": 0.8234, "learning_rate": 9.872843196850057e-08, "epoch": 2.9151053107636646, "percentage": 97.17, "elapsed_time": "22:30:03", "remaining_time": "0:39:19", "throughput": "2281.54", "total_tokens": 184811520} {"current_steps": 22570, "total_steps": 23217, "loss": 0.5345, "learning_rate": 9.574777794253143e-08, "epoch": 2.9163974673730455, "percentage": 97.21, "elapsed_time": "22:30:56", "remaining_time": "0:38:43", "throughput": "2281.05", "total_tokens": 184893440} {"current_steps": 22580, "total_steps": 23217, "loss": 0.9455, "learning_rate": 9.281272351124859e-08, "epoch": 2.917689623982427, "percentage": 97.26, "elapsed_time": "22:31:44", "remaining_time": "0:38:08", "throughput": "2280.70", "total_tokens": 184975360} {"current_steps": 22590, "total_steps": 23217, "loss": 0.3409, "learning_rate": 8.992327404872825e-08, "epoch": 2.9189817805918077, "percentage": 97.3, "elapsed_time": "22:32:33", "remaining_time": "0:37:32", "throughput": "2280.35", "total_tokens": 185057280} {"current_steps": 22600, "total_steps": 23217, "loss": 0.5035, "learning_rate": 8.707943484553838e-08, "epoch": 2.9202739372011886, "percentage": 97.34, "elapsed_time": "22:33:22", "remaining_time": "0:36:56", "throughput": "2279.98", "total_tokens": 185139200} {"current_steps": 22610, "total_steps": 23217, "loss": 0.7041, "learning_rate": 8.428121110874154e-08, "epoch": 2.92156609381057, "percentage": 97.39, "elapsed_time": "22:34:10", "remaining_time": "0:36:21", "throughput": "2279.62", "total_tokens": 185221120} {"current_steps": 22620, "total_steps": 23217, "loss": 0.8394, "learning_rate": 8.152860796187545e-08, "epoch": 2.9228582504199507, "percentage": 97.43, "elapsed_time": "22:34:59", "remaining_time": "0:35:45", "throughput": "2279.26", "total_tokens": 185303040} {"current_steps": 22630, "total_steps": 23217, "loss": 0.3898, "learning_rate": 7.882163044494462e-08, "epoch": 2.924150407029332, "percentage": 97.47, "elapsed_time": "22:35:50", "remaining_time": "0:35:10", "throughput": "2278.84", "total_tokens": 185384960} {"current_steps": 22640, "total_steps": 23217, "loss": 0.7981, "learning_rate": 7.616028351441484e-08, "epoch": 2.925442563638713, "percentage": 97.51, "elapsed_time": "22:36:41", "remaining_time": "0:34:34", "throughput": "2278.42", "total_tokens": 185466880} {"current_steps": 22650, "total_steps": 23217, "loss": 0.8605, "learning_rate": 7.354457204320486e-08, "epoch": 2.9267347202480942, "percentage": 97.56, "elapsed_time": "22:37:32", "remaining_time": "0:33:59", "throughput": "2277.99", "total_tokens": 185548800} {"current_steps": 22660, "total_steps": 23217, "loss": 0.687, "learning_rate": 7.097450082066969e-08, "epoch": 2.928026876857475, "percentage": 97.6, "elapsed_time": "22:38:24", "remaining_time": "0:33:23", "throughput": "2277.56", "total_tokens": 185630720} {"current_steps": 22670, "total_steps": 23217, "loss": 0.6511, "learning_rate": 6.845007455260343e-08, "epoch": 2.9293190334668564, "percentage": 97.64, "elapsed_time": "22:39:15", "remaining_time": "0:32:47", "throughput": "2277.14", "total_tokens": 185712640} {"current_steps": 22680, "total_steps": 23217, "loss": 0.4383, "learning_rate": 6.59712978612198e-08, "epoch": 2.9306111900762373, "percentage": 97.69, "elapsed_time": "22:40:05", "remaining_time": "0:32:12", "throughput": "2276.75", "total_tokens": 185794560} {"current_steps": 22690, "total_steps": 23217, "loss": 0.4383, "learning_rate": 6.353817528514938e-08, "epoch": 2.931903346685618, "percentage": 97.73, "elapsed_time": "22:40:54", "remaining_time": "0:31:36", "throughput": "2276.39", "total_tokens": 185876480} {"current_steps": 22700, "total_steps": 23217, "loss": 0.6782, "learning_rate": 6.11507112794285e-08, "epoch": 2.9331955032949995, "percentage": 97.77, "elapsed_time": "22:41:44", "remaining_time": "0:31:00", "throughput": "2275.99", "total_tokens": 185958400} {"current_steps": 22710, "total_steps": 23217, "loss": 0.676, "learning_rate": 5.880891021549928e-08, "epoch": 2.9344876599043803, "percentage": 97.82, "elapsed_time": "22:42:33", "remaining_time": "0:30:25", "throughput": "2275.64", "total_tokens": 186040320} {"current_steps": 22720, "total_steps": 23217, "loss": 0.7285, "learning_rate": 5.6512776381192903e-08, "epoch": 2.9357798165137616, "percentage": 97.86, "elapsed_time": "22:43:21", "remaining_time": "0:29:49", "throughput": "2275.29", "total_tokens": 186122240} {"current_steps": 22730, "total_steps": 23217, "loss": 0.6244, "learning_rate": 5.426231398071302e-08, "epoch": 2.9370719731231425, "percentage": 97.9, "elapsed_time": "22:44:10", "remaining_time": "0:29:13", "throughput": "2274.93", "total_tokens": 186204160} {"current_steps": 22740, "total_steps": 23217, "loss": 0.8171, "learning_rate": 5.205752713465794e-08, "epoch": 2.9383641297325234, "percentage": 97.95, "elapsed_time": "22:44:58", "remaining_time": "0:28:37", "throughput": "2274.60", "total_tokens": 186286080} {"current_steps": 22750, "total_steps": 23217, "loss": 0.9641, "learning_rate": 4.989841987997901e-08, "epoch": 2.9396562863419047, "percentage": 97.99, "elapsed_time": "22:45:50", "remaining_time": "0:28:02", "throughput": "2274.16", "total_tokens": 186368000} {"current_steps": 22760, "total_steps": 23217, "loss": 0.7594, "learning_rate": 4.778499616999166e-08, "epoch": 2.9409484429512855, "percentage": 98.03, "elapsed_time": "22:46:39", "remaining_time": "0:27:26", "throughput": "2273.79", "total_tokens": 186449920} {"current_steps": 22770, "total_steps": 23217, "loss": 0.9113, "learning_rate": 4.57172598743727e-08, "epoch": 2.942240599560667, "percentage": 98.07, "elapsed_time": "22:47:29", "remaining_time": "0:26:50", "throughput": "2273.40", "total_tokens": 186531840} {"current_steps": 22780, "total_steps": 23217, "loss": 0.8022, "learning_rate": 4.369521477913529e-08, "epoch": 2.9435327561700477, "percentage": 98.12, "elapsed_time": "22:48:19", "remaining_time": "0:26:14", "throughput": "2273.01", "total_tokens": 186613760} {"current_steps": 22790, "total_steps": 23217, "loss": 0.7282, "learning_rate": 4.171886458664009e-08, "epoch": 2.9448249127794286, "percentage": 98.16, "elapsed_time": "22:49:09", "remaining_time": "0:25:39", "throughput": "2272.64", "total_tokens": 186695680} {"current_steps": 22800, "total_steps": 23217, "loss": 0.6295, "learning_rate": 3.9788212915573e-08, "epoch": 2.94611706938881, "percentage": 98.2, "elapsed_time": "22:50:00", "remaining_time": "0:25:03", "throughput": "2272.23", "total_tokens": 186777600} {"current_steps": 22810, "total_steps": 23217, "loss": 0.6325, "learning_rate": 3.7903263300956285e-08, "epoch": 2.947409225998191, "percentage": 98.25, "elapsed_time": "22:50:49", "remaining_time": "0:24:27", "throughput": "2271.87", "total_tokens": 186859520} {"current_steps": 22820, "total_steps": 23217, "loss": 0.8424, "learning_rate": 3.606401919411806e-08, "epoch": 2.948701382607572, "percentage": 98.29, "elapsed_time": "22:51:37", "remaining_time": "0:23:51", "throughput": "2271.52", "total_tokens": 186941440} {"current_steps": 22830, "total_steps": 23217, "loss": 1.1133, "learning_rate": 3.427048396271171e-08, "epoch": 2.949993539216953, "percentage": 98.33, "elapsed_time": "22:52:26", "remaining_time": "0:23:15", "throughput": "2271.17", "total_tokens": 187023360} {"current_steps": 22840, "total_steps": 23217, "loss": 0.6982, "learning_rate": 3.252266089069367e-08, "epoch": 2.9512856958263343, "percentage": 98.38, "elapsed_time": "22:53:16", "remaining_time": "0:22:40", "throughput": "2270.79", "total_tokens": 187105280} {"current_steps": 22850, "total_steps": 23217, "loss": 0.9222, "learning_rate": 3.0820553178320667e-08, "epoch": 2.952577852435715, "percentage": 98.42, "elapsed_time": "22:54:06", "remaining_time": "0:22:04", "throughput": "2270.41", "total_tokens": 187187200} {"current_steps": 22860, "total_steps": 23217, "loss": 0.5809, "learning_rate": 2.9164163942146937e-08, "epoch": 2.9538700090450964, "percentage": 98.46, "elapsed_time": "22:54:56", "remaining_time": "0:21:28", "throughput": "2270.02", "total_tokens": 187269120} {"current_steps": 22870, "total_steps": 23217, "loss": 0.7016, "learning_rate": 2.7553496215015907e-08, "epoch": 2.9551621656544773, "percentage": 98.51, "elapsed_time": "22:55:45", "remaining_time": "0:20:52", "throughput": "2269.66", "total_tokens": 187351040} {"current_steps": 22880, "total_steps": 23217, "loss": 0.5702, "learning_rate": 2.5988552946051848e-08, "epoch": 2.956454322263858, "percentage": 98.55, "elapsed_time": "22:56:35", "remaining_time": "0:20:16", "throughput": "2269.29", "total_tokens": 187432960} {"current_steps": 22890, "total_steps": 23217, "loss": 0.6657, "learning_rate": 2.44693370006599e-08, "epoch": 2.9577464788732395, "percentage": 98.59, "elapsed_time": "22:57:25", "remaining_time": "0:19:40", "throughput": "2268.91", "total_tokens": 187514880} {"current_steps": 22900, "total_steps": 23217, "loss": 0.6522, "learning_rate": 2.2995851160520498e-08, "epoch": 2.9590386354826204, "percentage": 98.63, "elapsed_time": "22:58:16", "remaining_time": "0:19:04", "throughput": "2268.51", "total_tokens": 187596800} {"current_steps": 22910, "total_steps": 23217, "loss": 0.8856, "learning_rate": 2.156809812358107e-08, "epoch": 2.9603307920920017, "percentage": 98.68, "elapsed_time": "22:59:05", "remaining_time": "0:18:28", "throughput": "2268.15", "total_tokens": 187678720} {"current_steps": 22920, "total_steps": 23217, "loss": 0.718, "learning_rate": 2.0186080504050466e-08, "epoch": 2.9616229487013825, "percentage": 98.72, "elapsed_time": "22:59:54", "remaining_time": "0:17:52", "throughput": "2267.79", "total_tokens": 187760640} {"current_steps": 22930, "total_steps": 23217, "loss": 0.7686, "learning_rate": 1.8849800832401733e-08, "epoch": 2.9629151053107634, "percentage": 98.76, "elapsed_time": "23:00:50", "remaining_time": "0:17:16", "throughput": "2267.24", "total_tokens": 187842560} {"current_steps": 22940, "total_steps": 23217, "loss": 0.8922, "learning_rate": 1.75592615553527e-08, "epoch": 2.9642072619201447, "percentage": 98.81, "elapsed_time": "23:01:45", "remaining_time": "0:16:41", "throughput": "2266.73", "total_tokens": 187924480} {"current_steps": 22950, "total_steps": 23217, "loss": 0.5413, "learning_rate": 1.6314465035879855e-08, "epoch": 2.965499418529526, "percentage": 98.85, "elapsed_time": "23:02:42", "remaining_time": "0:16:05", "throughput": "2266.16", "total_tokens": 188006400} {"current_steps": 22960, "total_steps": 23217, "loss": 0.4049, "learning_rate": 1.5115413553201674e-08, "epoch": 2.966791575138907, "percentage": 98.89, "elapsed_time": "23:03:38", "remaining_time": "0:15:29", "throughput": "2265.62", "total_tokens": 188088320} {"current_steps": 22970, "total_steps": 23217, "loss": 1.021, "learning_rate": 1.3962109302773085e-08, "epoch": 2.9680837317482878, "percentage": 98.94, "elapsed_time": "23:04:32", "remaining_time": "0:14:53", "throughput": "2265.13", "total_tokens": 188170240} {"current_steps": 22980, "total_steps": 23217, "loss": 0.4626, "learning_rate": 1.2854554396291018e-08, "epoch": 2.969375888357669, "percentage": 98.98, "elapsed_time": "23:05:27", "remaining_time": "0:14:17", "throughput": "2264.63", "total_tokens": 188252160} {"current_steps": 22990, "total_steps": 23217, "loss": 0.9079, "learning_rate": 1.1792750861686074e-08, "epoch": 2.97066804496705, "percentage": 99.02, "elapsed_time": "23:06:20", "remaining_time": "0:13:41", "throughput": "2264.15", "total_tokens": 188334080} {"current_steps": 23000, "total_steps": 23217, "loss": 0.8018, "learning_rate": 1.0776700643116976e-08, "epoch": 2.9719602015764313, "percentage": 99.07, "elapsed_time": "23:07:12", "remaining_time": "0:13:05", "throughput": "2263.72", "total_tokens": 188416000} {"current_steps": 23010, "total_steps": 23217, "loss": 0.6943, "learning_rate": 9.806405600967794e-09, "epoch": 2.973252358185812, "percentage": 99.11, "elapsed_time": "23:08:09", "remaining_time": "0:12:29", "throughput": "2263.16", "total_tokens": 188497920} {"current_steps": 23020, "total_steps": 23217, "loss": 1.0121, "learning_rate": 8.881867511845166e-09, "epoch": 2.974544514795193, "percentage": 99.15, "elapsed_time": "23:09:01", "remaining_time": "0:11:53", "throughput": "2262.75", "total_tokens": 188579840} {"current_steps": 23030, "total_steps": 23217, "loss": 1.0772, "learning_rate": 8.00308806857275e-09, "epoch": 2.9758366714045743, "percentage": 99.19, "elapsed_time": "23:09:52", "remaining_time": "0:11:17", "throughput": "2262.32", "total_tokens": 188661760} {"current_steps": 23040, "total_steps": 23217, "loss": 0.7207, "learning_rate": 7.1700688801940034e-09, "epoch": 2.977128828013955, "percentage": 99.24, "elapsed_time": "23:10:44", "remaining_time": "0:10:41", "throughput": "2261.91", "total_tokens": 188743680} {"current_steps": 23050, "total_steps": 23217, "loss": 0.589, "learning_rate": 6.382811471963846e-09, "epoch": 2.9784209846233365, "percentage": 99.28, "elapsed_time": "23:11:36", "remaining_time": "0:10:04", "throughput": "2261.49", "total_tokens": 188825600} {"current_steps": 23060, "total_steps": 23217, "loss": 0.5539, "learning_rate": 5.6413172853486685e-09, "epoch": 2.9797131412327174, "percentage": 99.32, "elapsed_time": "23:12:27", "remaining_time": "0:09:28", "throughput": "2261.09", "total_tokens": 188907520} {"current_steps": 23070, "total_steps": 23217, "loss": 1.0715, "learning_rate": 4.94558767802078e-09, "epoch": 2.9810052978420982, "percentage": 99.37, "elapsed_time": "23:13:18", "remaining_time": "0:08:52", "throughput": "2260.68", "total_tokens": 188989440} {"current_steps": 23080, "total_steps": 23217, "loss": 0.9075, "learning_rate": 4.295623923858405e-09, "epoch": 2.9822974544514795, "percentage": 99.41, "elapsed_time": "23:14:08", "remaining_time": "0:08:16", "throughput": "2260.30", "total_tokens": 189071360} {"current_steps": 23090, "total_steps": 23217, "loss": 0.9787, "learning_rate": 3.6914272129429106e-09, "epoch": 2.983589611060861, "percentage": 99.45, "elapsed_time": "23:15:01", "remaining_time": "0:07:40", "throughput": "2259.86", "total_tokens": 189153280} {"current_steps": 23100, "total_steps": 23217, "loss": 0.397, "learning_rate": 3.1329986515560295e-09, "epoch": 2.9848817676702417, "percentage": 99.5, "elapsed_time": "23:15:51", "remaining_time": "0:07:04", "throughput": "2259.48", "total_tokens": 189235200} {"current_steps": 23110, "total_steps": 23217, "loss": 0.8219, "learning_rate": 2.6203392621798605e-09, "epoch": 2.9861739242796226, "percentage": 99.54, "elapsed_time": "23:16:40", "remaining_time": "0:06:28", "throughput": "2259.13", "total_tokens": 189317120} {"current_steps": 23120, "total_steps": 23217, "loss": 0.93, "learning_rate": 2.153449983491318e-09, "epoch": 2.987466080889004, "percentage": 99.58, "elapsed_time": "23:17:30", "remaining_time": "0:05:51", "throughput": "2258.76", "total_tokens": 189399040} {"current_steps": 23130, "total_steps": 23217, "loss": 1.1683, "learning_rate": 1.7323316703621305e-09, "epoch": 2.9887582374983848, "percentage": 99.63, "elapsed_time": "23:18:23", "remaining_time": "0:05:15", "throughput": "2258.31", "total_tokens": 189480960} {"current_steps": 23140, "total_steps": 23217, "loss": 0.5163, "learning_rate": 1.356985093856067e-09, "epoch": 2.990050394107766, "percentage": 99.67, "elapsed_time": "23:19:30", "remaining_time": "0:04:39", "throughput": "2257.49", "total_tokens": 189562880} {"current_steps": 23150, "total_steps": 23217, "loss": 1.0414, "learning_rate": 1.0274109412372613e-09, "epoch": 2.991342550717147, "percentage": 99.71, "elapsed_time": "23:20:59", "remaining_time": "0:04:03", "throughput": "2256.09", "total_tokens": 189644800} {"current_steps": 23160, "total_steps": 23217, "loss": 0.743, "learning_rate": 7.436098159480099e-10, "epoch": 2.992634707326528, "percentage": 99.75, "elapsed_time": "23:21:53", "remaining_time": "0:03:27", "throughput": "2255.62", "total_tokens": 189726720} {"current_steps": 23170, "total_steps": 23217, "loss": 0.941, "learning_rate": 5.055822376337505e-10, "epoch": 2.993926863935909, "percentage": 99.8, "elapsed_time": "23:22:47", "remaining_time": "0:02:50", "throughput": "2255.14", "total_tokens": 189808640} {"current_steps": 23180, "total_steps": 23217, "loss": 0.6753, "learning_rate": 3.1332864211808254e-10, "epoch": 2.99521902054529, "percentage": 99.84, "elapsed_time": "23:23:40", "remaining_time": "0:02:14", "throughput": "2254.69", "total_tokens": 189890560} {"current_steps": 23190, "total_steps": 23217, "loss": 0.8739, "learning_rate": 1.6684938141664498e-10, "epoch": 2.9965111771546713, "percentage": 99.88, "elapsed_time": "23:24:32", "remaining_time": "0:01:38", "throughput": "2254.27", "total_tokens": 189972480} {"current_steps": 23200, "total_steps": 23217, "loss": 0.851, "learning_rate": 6.614472373434044e-11, "epoch": 2.997803333764052, "percentage": 99.93, "elapsed_time": "23:25:24", "remaining_time": "0:01:01", "throughput": "2253.86", "total_tokens": 190054400} {"current_steps": 23210, "total_steps": 23217, "loss": 0.7338, "learning_rate": 1.1214853459784457e-11, "epoch": 2.999095490373433, "percentage": 99.97, "elapsed_time": "23:26:13", "remaining_time": "0:00:25", "throughput": "2253.52", "total_tokens": 190136320} {"current_steps": 23217, "total_steps": 23217, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "23:26:50", "remaining_time": "0:00:00", "throughput": "2253.20", "total_tokens": 190193664} {"current_steps": 23217, "total_steps": 23217, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:00:00", "remaining_time": "0:00:00", "throughput": "190162108626.90", "total_tokens": 190193664}