{"current_steps": 5, "total_steps": 375, "loss": 4.5494, "lr": 4.997807075247146e-05, "epoch": 0.03980099502487562, "percentage": 1.33, "elapsed_time": "0:00:19", "remaining_time": "0:23:49", "throughput": 416.59, "total_tokens": 8048} {"current_steps": 10, "total_steps": 375, "loss": 4.5269, "lr": 4.991232148123761e-05, "epoch": 0.07960199004975124, "percentage": 2.67, "elapsed_time": "0:00:37", "remaining_time": "0:22:41", "throughput": 375.28, "total_tokens": 14000} {"current_steps": 15, "total_steps": 375, "loss": 4.0421, "lr": 4.980286753286195e-05, "epoch": 0.11940298507462686, "percentage": 4.0, "elapsed_time": "0:00:55", "remaining_time": "0:22:05", "throughput": 376.49, "total_tokens": 20800} {"current_steps": 20, "total_steps": 375, "loss": 3.8231, "lr": 4.964990092676263e-05, "epoch": 0.15920398009950248, "percentage": 5.33, "elapsed_time": "0:01:14", "remaining_time": "0:21:59", "throughput": 390.13, "total_tokens": 28992} {"current_steps": 25, "total_steps": 375, "loss": 3.5978, "lr": 4.9453690018345144e-05, "epoch": 0.19900497512437812, "percentage": 6.67, "elapsed_time": "0:01:32", "remaining_time": "0:21:30", "throughput": 372.36, "total_tokens": 34336} {"current_steps": 30, "total_steps": 375, "loss": 3.5563, "lr": 4.9214579028215776e-05, "epoch": 0.23880597014925373, "percentage": 8.0, "elapsed_time": "0:01:50", "remaining_time": "0:21:06", "throughput": 358.3, "total_tokens": 39456} {"current_steps": 35, "total_steps": 375, "loss": 3.7193, "lr": 4.893298743830168e-05, "epoch": 0.27860696517412936, "percentage": 9.33, "elapsed_time": "0:02:08", "remaining_time": "0:20:44", "throughput": 353.55, "total_tokens": 45280} {"current_steps": 40, "total_steps": 375, "loss": 3.4887, "lr": 4.860940925593703e-05, "epoch": 0.31840796019900497, "percentage": 10.67, "elapsed_time": "0:02:25", "remaining_time": "0:20:21", "throughput": 350.4, "total_tokens": 51104} {"current_steps": 45, "total_steps": 375, "loss": 3.4482, "lr": 4.8244412147206284e-05, "epoch": 0.3582089552238806, "percentage": 12.0, "elapsed_time": "0:02:43", "remaining_time": "0:19:59", "throughput": 346.39, "total_tokens": 56672} {"current_steps": 50, "total_steps": 375, "loss": 3.5251, "lr": 4.783863644106502e-05, "epoch": 0.39800995024875624, "percentage": 13.33, "elapsed_time": "0:03:01", "remaining_time": "0:19:40", "throughput": 339.62, "total_tokens": 61680} {"current_steps": 55, "total_steps": 375, "loss": 3.4091, "lr": 4.7392794005985326e-05, "epoch": 0.43781094527363185, "percentage": 14.67, "elapsed_time": "0:03:20", "remaining_time": "0:19:24", "throughput": 344.36, "total_tokens": 68928} {"current_steps": 60, "total_steps": 375, "loss": 3.4556, "lr": 4.690766700109659e-05, "epoch": 0.47761194029850745, "percentage": 16.0, "elapsed_time": "0:03:38", "remaining_time": "0:19:09", "throughput": 351.95, "total_tokens": 77056} {"current_steps": 65, "total_steps": 375, "loss": 3.3753, "lr": 4.638410650401267e-05, "epoch": 0.5174129353233831, "percentage": 17.33, "elapsed_time": "0:03:57", "remaining_time": "0:18:51", "throughput": 355.56, "total_tokens": 84368} {"current_steps": 70, "total_steps": 375, "loss": 3.3786, "lr": 4.5823031017752485e-05, "epoch": 0.5572139303482587, "percentage": 18.67, "elapsed_time": "0:04:15", "remaining_time": "0:18:33", "throughput": 353.28, "total_tokens": 90272} {"current_steps": 75, "total_steps": 375, "loss": 3.4089, "lr": 4.522542485937369e-05, "epoch": 0.5970149253731343, "percentage": 20.0, "elapsed_time": "0:04:33", "remaining_time": "0:18:14", "throughput": 349.53, "total_tokens": 95600} {"current_steps": 80, "total_steps": 375, "loss": 3.4508, "lr": 4.4592336433146e-05, "epoch": 0.6368159203980099, "percentage": 21.33, "elapsed_time": "0:04:52", "remaining_time": "0:17:57", "throughput": 352.33, "total_tokens": 102928} {"current_steps": 85, "total_steps": 375, "loss": 3.333, "lr": 4.3924876391293915e-05, "epoch": 0.6766169154228856, "percentage": 22.67, "elapsed_time": "0:05:10", "remaining_time": "0:17:38", "throughput": 353.37, "total_tokens": 109584} {"current_steps": 90, "total_steps": 375, "loss": 3.3651, "lr": 4.3224215685535294e-05, "epoch": 0.7164179104477612, "percentage": 24.0, "elapsed_time": "0:05:28", "remaining_time": "0:17:20", "throughput": 357.01, "total_tokens": 117312} {"current_steps": 95, "total_steps": 375, "loss": 3.285, "lr": 4.249158351283414e-05, "epoch": 0.7562189054726368, "percentage": 25.33, "elapsed_time": "0:05:46", "remaining_time": "0:17:01", "throughput": 355.97, "total_tokens": 123312} {"current_steps": 100, "total_steps": 375, "loss": 3.3726, "lr": 4.172826515897146e-05, "epoch": 0.7960199004975125, "percentage": 26.67, "elapsed_time": "0:06:04", "remaining_time": "0:16:41", "throughput": 356.11, "total_tokens": 129664} {"current_steps": 105, "total_steps": 375, "loss": 3.349, "lr": 4.093559974371725e-05, "epoch": 0.835820895522388, "percentage": 28.0, "elapsed_time": "0:06:23", "remaining_time": "0:16:26", "throughput": 360.08, "total_tokens": 138128} {"current_steps": 110, "total_steps": 375, "loss": 3.3335, "lr": 4.011497787155938e-05, "epoch": 0.8756218905472637, "percentage": 29.33, "elapsed_time": "0:06:41", "remaining_time": "0:16:07", "throughput": 358.69, "total_tokens": 144064} {"current_steps": 115, "total_steps": 375, "loss": 3.3096, "lr": 3.92678391921108e-05, "epoch": 0.9154228855721394, "percentage": 30.67, "elapsed_time": "0:06:59", "remaining_time": "0:15:48", "throughput": 356.95, "total_tokens": 149760} {"current_steps": 120, "total_steps": 375, "loss": 3.2696, "lr": 3.8395669874474915e-05, "epoch": 0.9552238805970149, "percentage": 32.0, "elapsed_time": "0:07:17", "remaining_time": "0:15:29", "throughput": 354.39, "total_tokens": 155088} {"current_steps": 125, "total_steps": 375, "loss": 3.3071, "lr": 3.7500000000000003e-05, "epoch": 0.9950248756218906, "percentage": 33.33, "elapsed_time": "0:07:36", "remaining_time": "0:15:13", "throughput": 357.59, "total_tokens": 163328} {"current_steps": 130, "total_steps": 375, "loss": 3.8956, "lr": 3.6582400877996546e-05, "epoch": 1.0398009950248757, "percentage": 34.67, "elapsed_time": "0:07:55", "remaining_time": "0:14:55", "throughput": 355.28, "total_tokens": 168832} {"current_steps": 135, "total_steps": 375, "loss": 3.2505, "lr": 3.564448228912682e-05, "epoch": 1.0796019900497513, "percentage": 36.0, "elapsed_time": "0:08:13", "remaining_time": "0:14:36", "throughput": 353.84, "total_tokens": 174544} {"current_steps": 140, "total_steps": 375, "loss": 3.249, "lr": 3.4687889661302576e-05, "epoch": 1.1194029850746268, "percentage": 37.33, "elapsed_time": "0:08:31", "remaining_time": "0:14:19", "throughput": 355.97, "total_tokens": 182176} {"current_steps": 145, "total_steps": 375, "loss": 3.1777, "lr": 3.3714301183045385e-05, "epoch": 1.1592039800995024, "percentage": 38.67, "elapsed_time": "0:08:49", "remaining_time": "0:14:00", "throughput": 354.36, "total_tokens": 187680} {"current_steps": 150, "total_steps": 375, "loss": 3.2005, "lr": 3.272542485937369e-05, "epoch": 1.199004975124378, "percentage": 40.0, "elapsed_time": "0:09:07", "remaining_time": "0:13:41", "throughput": 354.54, "total_tokens": 194176} {"current_steps": 155, "total_steps": 375, "loss": 3.1882, "lr": 3.172299551538164e-05, "epoch": 1.2388059701492538, "percentage": 41.33, "elapsed_time": "0:09:26", "remaining_time": "0:13:23", "throughput": 356.67, "total_tokens": 201904} {"current_steps": 160, "total_steps": 375, "loss": 3.2861, "lr": 3.0708771752766394e-05, "epoch": 1.2786069651741294, "percentage": 42.67, "elapsed_time": "0:09:44", "remaining_time": "0:13:04", "throughput": 354.95, "total_tokens": 207344} {"current_steps": 165, "total_steps": 375, "loss": 3.2012, "lr": 2.9684532864643122e-05, "epoch": 1.3184079601990049, "percentage": 44.0, "elapsed_time": "0:10:02", "remaining_time": "0:12:46", "throughput": 352.93, "total_tokens": 212480} {"current_steps": 170, "total_steps": 375, "loss": 3.1424, "lr": 2.8652075714060295e-05, "epoch": 1.3582089552238805, "percentage": 45.33, "elapsed_time": "0:10:21", "remaining_time": "0:12:28", "throughput": 353.98, "total_tokens": 219840} {"current_steps": 175, "total_steps": 375, "loss": 3.1061, "lr": 2.761321158169134e-05, "epoch": 1.3980099502487562, "percentage": 46.67, "elapsed_time": "0:10:38", "remaining_time": "0:12:10", "throughput": 351.42, "total_tokens": 224544} {"current_steps": 180, "total_steps": 375, "loss": 3.1739, "lr": 2.656976298823284e-05, "epoch": 1.4378109452736318, "percentage": 48.0, "elapsed_time": "0:10:57", "remaining_time": "0:11:52", "throughput": 352.41, "total_tokens": 231760} {"current_steps": 185, "total_steps": 375, "loss": 3.1692, "lr": 2.5523560497083926e-05, "epoch": 1.4776119402985075, "percentage": 49.33, "elapsed_time": "0:11:15", "remaining_time": "0:11:34", "throughput": 353.7, "total_tokens": 239056} {"current_steps": 190, "total_steps": 375, "loss": 3.2116, "lr": 2.447643950291608e-05, "epoch": 1.517412935323383, "percentage": 50.67, "elapsed_time": "0:11:34", "remaining_time": "0:11:16", "throughput": 355.0, "total_tokens": 246576} {"current_steps": 195, "total_steps": 375, "loss": 3.3134, "lr": 2.3430237011767167e-05, "epoch": 1.5572139303482588, "percentage": 52.0, "elapsed_time": "0:11:52", "remaining_time": "0:10:57", "throughput": 355.61, "total_tokens": 253360} {"current_steps": 200, "total_steps": 375, "loss": 3.2215, "lr": 2.238678841830867e-05, "epoch": 1.5970149253731343, "percentage": 53.33, "elapsed_time": "0:12:10", "remaining_time": "0:10:39", "throughput": 356.2, "total_tokens": 260240} {"current_steps": 205, "total_steps": 375, "loss": 3.0594, "lr": 2.1347924285939714e-05, "epoch": 1.63681592039801, "percentage": 54.67, "elapsed_time": "0:12:29", "remaining_time": "0:10:21", "throughput": 354.14, "total_tokens": 265520} {"current_steps": 210, "total_steps": 375, "loss": 3.1452, "lr": 2.031546713535688e-05, "epoch": 1.6766169154228856, "percentage": 56.0, "elapsed_time": "0:12:49", "remaining_time": "0:10:04", "throughput": 356.32, "total_tokens": 274144} {"current_steps": 215, "total_steps": 375, "loss": 3.2481, "lr": 1.9291228247233605e-05, "epoch": 1.716417910447761, "percentage": 57.33, "elapsed_time": "0:13:07", "remaining_time": "0:09:46", "throughput": 356.7, "total_tokens": 281024} {"current_steps": 220, "total_steps": 375, "loss": 3.1269, "lr": 1.827700448461836e-05, "epoch": 1.756218905472637, "percentage": 58.67, "elapsed_time": "0:13:27", "remaining_time": "0:09:28", "throughput": 359.85, "total_tokens": 290608} {"current_steps": 225, "total_steps": 375, "loss": 3.1888, "lr": 1.7274575140626318e-05, "epoch": 1.7960199004975124, "percentage": 60.0, "elapsed_time": "0:13:45", "remaining_time": "0:09:10", "throughput": 360.92, "total_tokens": 298064} {"current_steps": 230, "total_steps": 375, "loss": 3.2137, "lr": 1.6285698816954624e-05, "epoch": 1.835820895522388, "percentage": 61.33, "elapsed_time": "0:14:03", "remaining_time": "0:08:52", "throughput": 359.6, "total_tokens": 303456} {"current_steps": 235, "total_steps": 375, "loss": 3.1926, "lr": 1.5312110338697426e-05, "epoch": 1.8756218905472637, "percentage": 62.67, "elapsed_time": "0:14:21", "remaining_time": "0:08:33", "throughput": 358.0, "total_tokens": 308528} {"current_steps": 240, "total_steps": 375, "loss": 3.2949, "lr": 1.4355517710873184e-05, "epoch": 1.9154228855721394, "percentage": 64.0, "elapsed_time": "0:14:39", "remaining_time": "0:08:14", "throughput": 357.75, "total_tokens": 314816} {"current_steps": 245, "total_steps": 375, "loss": 3.1559, "lr": 1.3417599122003464e-05, "epoch": 1.955223880597015, "percentage": 65.33, "elapsed_time": "0:14:57", "remaining_time": "0:07:56", "throughput": 356.64, "total_tokens": 320224} {"current_steps": 250, "total_steps": 375, "loss": 3.1411, "lr": 1.2500000000000006e-05, "epoch": 1.9950248756218905, "percentage": 66.67, "elapsed_time": "0:15:15", "remaining_time": "0:07:37", "throughput": 355.99, "total_tokens": 326032} {"current_steps": 255, "total_steps": 375, "loss": 3.5418, "lr": 1.1604330125525079e-05, "epoch": 2.0398009950248754, "percentage": 68.0, "elapsed_time": "0:15:34", "remaining_time": "0:07:19", "throughput": 354.77, "total_tokens": 331440} {"current_steps": 260, "total_steps": 375, "loss": 3.0061, "lr": 1.0732160807889211e-05, "epoch": 2.0796019900497513, "percentage": 69.33, "elapsed_time": "0:15:51", "remaining_time": "0:07:01", "throughput": 354.05, "total_tokens": 337056} {"current_steps": 265, "total_steps": 375, "loss": 3.102, "lr": 9.88502212844063e-06, "epoch": 2.1194029850746268, "percentage": 70.67, "elapsed_time": "0:16:10", "remaining_time": "0:06:42", "throughput": 352.6, "total_tokens": 342064} {"current_steps": 270, "total_steps": 375, "loss": 2.9862, "lr": 9.064400256282757e-06, "epoch": 2.1592039800995027, "percentage": 72.0, "elapsed_time": "0:16:28", "remaining_time": "0:06:24", "throughput": 351.35, "total_tokens": 347152} {"current_steps": 275, "total_steps": 375, "loss": 3.0803, "lr": 8.271734841028553e-06, "epoch": 2.199004975124378, "percentage": 73.33, "elapsed_time": "0:16:46", "remaining_time": "0:06:06", "throughput": 352.72, "total_tokens": 355152} {"current_steps": 280, "total_steps": 375, "loss": 3.1944, "lr": 7.508416487165862e-06, "epoch": 2.2388059701492535, "percentage": 74.67, "elapsed_time": "0:17:05", "remaining_time": "0:05:47", "throughput": 352.51, "total_tokens": 361328} {"current_steps": 285, "total_steps": 375, "loss": 3.1717, "lr": 6.775784314464717e-06, "epoch": 2.2786069651741294, "percentage": 76.0, "elapsed_time": "0:17:23", "remaining_time": "0:05:29", "throughput": 354.26, "total_tokens": 369648} {"current_steps": 290, "total_steps": 375, "loss": 3.2106, "lr": 6.075123608706093e-06, "epoch": 2.318407960199005, "percentage": 77.33, "elapsed_time": "0:17:42", "remaining_time": "0:05:11", "throughput": 355.43, "total_tokens": 377664} {"current_steps": 295, "total_steps": 375, "loss": 3.0577, "lr": 5.4076635668540075e-06, "epoch": 2.3582089552238807, "percentage": 78.67, "elapsed_time": "0:18:00", "remaining_time": "0:04:53", "throughput": 356.33, "total_tokens": 385184} {"current_steps": 300, "total_steps": 375, "loss": 3.1227, "lr": 4.7745751406263165e-06, "epoch": 2.398009950248756, "percentage": 80.0, "elapsed_time": "0:18:18", "remaining_time": "0:04:34", "throughput": 356.28, "total_tokens": 391536} {"current_steps": 305, "total_steps": 375, "loss": 3.1015, "lr": 4.176968982247514e-06, "epoch": 2.4378109452736316, "percentage": 81.33, "elapsed_time": "0:18:37", "remaining_time": "0:04:16", "throughput": 355.52, "total_tokens": 397408} {"current_steps": 310, "total_steps": 375, "loss": 3.0393, "lr": 3.6158934959873353e-06, "epoch": 2.4776119402985075, "percentage": 82.67, "elapsed_time": "0:18:55", "remaining_time": "0:03:58", "throughput": 355.42, "total_tokens": 403712} {"current_steps": 315, "total_steps": 375, "loss": 2.9964, "lr": 3.092332998903416e-06, "epoch": 2.517412935323383, "percentage": 84.0, "elapsed_time": "0:19:13", "remaining_time": "0:03:39", "throughput": 354.97, "total_tokens": 409632} {"current_steps": 320, "total_steps": 375, "loss": 3.1617, "lr": 2.6072059940146775e-06, "epoch": 2.557213930348259, "percentage": 85.33, "elapsed_time": "0:19:32", "remaining_time": "0:03:21", "throughput": 355.4, "total_tokens": 416704} {"current_steps": 325, "total_steps": 375, "loss": 3.0388, "lr": 2.1613635589349756e-06, "epoch": 2.5970149253731343, "percentage": 86.67, "elapsed_time": "0:19:51", "remaining_time": "0:03:03", "throughput": 356.66, "total_tokens": 425056} {"current_steps": 330, "total_steps": 375, "loss": 3.158, "lr": 1.7555878527937164e-06, "epoch": 2.6368159203980097, "percentage": 88.0, "elapsed_time": "0:20:09", "remaining_time": "0:02:44", "throughput": 356.13, "total_tokens": 430816} {"current_steps": 335, "total_steps": 375, "loss": 3.0348, "lr": 1.3905907440629752e-06, "epoch": 2.6766169154228856, "percentage": 89.33, "elapsed_time": "0:20:27", "remaining_time": "0:02:26", "throughput": 356.25, "total_tokens": 437456} {"current_steps": 340, "total_steps": 375, "loss": 3.1515, "lr": 1.067012561698319e-06, "epoch": 2.716417910447761, "percentage": 90.67, "elapsed_time": "0:20:45", "remaining_time": "0:02:08", "throughput": 355.61, "total_tokens": 442976} {"current_steps": 345, "total_steps": 375, "loss": 3.0978, "lr": 7.854209717842231e-07, "epoch": 2.756218905472637, "percentage": 92.0, "elapsed_time": "0:21:05", "remaining_time": "0:01:50", "throughput": 356.26, "total_tokens": 450688} {"current_steps": 350, "total_steps": 375, "loss": 3.051, "lr": 5.463099816548579e-07, "epoch": 2.7960199004975124, "percentage": 93.33, "elapsed_time": "0:21:22", "remaining_time": "0:01:31", "throughput": 356.49, "total_tokens": 457344} {"current_steps": 355, "total_steps": 375, "loss": 3.0632, "lr": 3.5009907323737825e-07, "epoch": 2.835820895522388, "percentage": 94.67, "elapsed_time": "0:21:40", "remaining_time": "0:01:13", "throughput": 356.36, "total_tokens": 463584} {"current_steps": 360, "total_steps": 375, "loss": 3.0875, "lr": 1.9713246713805588e-07, "epoch": 2.8756218905472637, "percentage": 96.0, "elapsed_time": "0:21:58", "remaining_time": "0:00:54", "throughput": 355.21, "total_tokens": 468400} {"current_steps": 365, "total_steps": 375, "loss": 3.1218, "lr": 8.767851876239074e-08, "epoch": 2.9154228855721396, "percentage": 97.33, "elapsed_time": "0:22:17", "remaining_time": "0:00:36", "throughput": 356.1, "total_tokens": 476128} {"current_steps": 370, "total_steps": 375, "loss": 3.0581, "lr": 2.192924752854042e-08, "epoch": 2.955223880597015, "percentage": 98.67, "elapsed_time": "0:22:36", "remaining_time": "0:00:18", "throughput": 357.04, "total_tokens": 484320} {"current_steps": 375, "total_steps": 375, "loss": 2.9967, "lr": 0.0, "epoch": 2.9950248756218905, "percentage": 100.0, "elapsed_time": "0:22:54", "remaining_time": "0:00:00", "throughput": 356.12, "total_tokens": 489472} {"current_steps": 375, "total_steps": 375, "epoch": 2.9950248756218905, "percentage": 100.0, "elapsed_time": "0:22:55", "remaining_time": "0:00:00", "throughput": 355.84, "total_tokens": 489472}