{"current_steps": 5, "total_steps": 2652, "loss": 1.564, "learning_rate": 4.999956146783009e-05, "epoch": 0.003769317753486619, "percentage": 0.19, "elapsed_time": "0:00:26", "remaining_time": "3:54:15", "throughput": 898.51, "total_tokens": 23856} {"current_steps": 10, "total_steps": 2652, "loss": 0.968, "learning_rate": 4.9998245886705174e-05, "epoch": 0.007538635506973238, "percentage": 0.38, "elapsed_time": "0:00:50", "remaining_time": "3:40:11", "throughput": 951.59, "total_tokens": 47584} {"current_steps": 15, "total_steps": 2652, "loss": 0.9879, "learning_rate": 4.999605330277923e-05, "epoch": 0.011307953260459858, "percentage": 0.57, "elapsed_time": "0:01:13", "remaining_time": "3:34:40", "throughput": 967.22, "total_tokens": 70864} {"current_steps": 20, "total_steps": 2652, "loss": 1.073, "learning_rate": 4.999298379297376e-05, "epoch": 0.015077271013946476, "percentage": 0.75, "elapsed_time": "0:01:36", "remaining_time": "3:31:51", "throughput": 975.12, "total_tokens": 94192} {"current_steps": 25, "total_steps": 2652, "loss": 0.8549, "learning_rate": 4.998903746497505e-05, "epoch": 0.018846588767433094, "percentage": 0.94, "elapsed_time": "0:02:00", "remaining_time": "3:30:30", "throughput": 977.35, "total_tokens": 117472} {"current_steps": 30, "total_steps": 2652, "loss": 0.8704, "learning_rate": 4.998421445723046e-05, "epoch": 0.022615906520919715, "percentage": 1.13, "elapsed_time": "0:02:23", "remaining_time": "3:29:13", "throughput": 979.63, "total_tokens": 140704} {"current_steps": 35, "total_steps": 2652, "loss": 0.9786, "learning_rate": 4.997851493894349e-05, "epoch": 0.026385224274406333, "percentage": 1.32, "elapsed_time": "0:02:47", "remaining_time": "3:28:11", "throughput": 979.77, "total_tokens": 163680} {"current_steps": 40, "total_steps": 2652, "loss": 0.8356, "learning_rate": 4.997193911006793e-05, "epoch": 0.03015454202789295, "percentage": 1.51, "elapsed_time": "0:03:10", "remaining_time": "3:27:22", "throughput": 981.74, "total_tokens": 187072} {"current_steps": 45, "total_steps": 2652, "loss": 0.778, "learning_rate": 4.996448720130077e-05, "epoch": 0.03392385978137957, "percentage": 1.7, "elapsed_time": "0:03:34", "remaining_time": "3:27:05", "throughput": 984.0, "total_tokens": 211040} {"current_steps": 50, "total_steps": 2652, "loss": 0.939, "learning_rate": 4.995615947407415e-05, "epoch": 0.03769317753486619, "percentage": 1.89, "elapsed_time": "0:03:57", "remaining_time": "3:26:22", "throughput": 985.8, "total_tokens": 234560} {"current_steps": 55, "total_steps": 2652, "loss": 1.0274, "learning_rate": 4.994695622054618e-05, "epoch": 0.04146249528835281, "percentage": 2.07, "elapsed_time": "0:04:21", "remaining_time": "3:25:46", "throughput": 985.28, "total_tokens": 257632} {"current_steps": 60, "total_steps": 2652, "loss": 0.8822, "learning_rate": 4.9936877763590664e-05, "epoch": 0.04523181304183943, "percentage": 2.26, "elapsed_time": "0:04:45", "remaining_time": "3:25:20", "throughput": 985.34, "total_tokens": 281024} {"current_steps": 65, "total_steps": 2652, "loss": 0.8146, "learning_rate": 4.992592445678582e-05, "epoch": 0.049001130795326045, "percentage": 2.45, "elapsed_time": "0:05:08", "remaining_time": "3:24:44", "throughput": 987.15, "total_tokens": 304688} {"current_steps": 70, "total_steps": 2652, "loss": 0.9989, "learning_rate": 4.991409668440185e-05, "epoch": 0.052770448548812667, "percentage": 2.64, "elapsed_time": "0:05:32", "remaining_time": "3:24:09", "throughput": 985.91, "total_tokens": 327424} {"current_steps": 75, "total_steps": 2652, "loss": 0.9344, "learning_rate": 4.990139486138743e-05, "epoch": 0.05653976630229928, "percentage": 2.83, "elapsed_time": "0:05:55", "remaining_time": "3:23:31", "throughput": 986.28, "total_tokens": 350528} {"current_steps": 80, "total_steps": 2652, "loss": 0.7932, "learning_rate": 4.988781943335521e-05, "epoch": 0.0603090840557859, "percentage": 3.02, "elapsed_time": "0:06:18", "remaining_time": "3:22:51", "throughput": 985.98, "total_tokens": 373280} {"current_steps": 85, "total_steps": 2652, "loss": 0.9445, "learning_rate": 4.987337087656614e-05, "epoch": 0.06407840180927252, "percentage": 3.21, "elapsed_time": "0:06:41", "remaining_time": "3:22:12", "throughput": 985.39, "total_tokens": 395856} {"current_steps": 90, "total_steps": 2652, "loss": 0.7369, "learning_rate": 4.985804969791279e-05, "epoch": 0.06784771956275915, "percentage": 3.39, "elapsed_time": "0:07:05", "remaining_time": "3:21:47", "throughput": 984.44, "total_tokens": 418704} {"current_steps": 95, "total_steps": 2652, "loss": 1.0226, "learning_rate": 4.984185643490151e-05, "epoch": 0.07161703731624576, "percentage": 3.58, "elapsed_time": "0:07:29", "remaining_time": "3:21:37", "throughput": 984.39, "total_tokens": 442432} {"current_steps": 100, "total_steps": 2652, "loss": 0.7753, "learning_rate": 4.9824791655633676e-05, "epoch": 0.07538635506973237, "percentage": 3.77, "elapsed_time": "0:07:53", "remaining_time": "3:21:13", "throughput": 985.3, "total_tokens": 466128} {"current_steps": 105, "total_steps": 2652, "loss": 0.8278, "learning_rate": 4.9806855958785625e-05, "epoch": 0.079155672823219, "percentage": 3.96, "elapsed_time": "0:08:17", "remaining_time": "3:21:06", "throughput": 984.1, "total_tokens": 489536} {"current_steps": 110, "total_steps": 2652, "loss": 0.8432, "learning_rate": 4.978804997358779e-05, "epoch": 0.08292499057670562, "percentage": 4.15, "elapsed_time": "0:08:41", "remaining_time": "3:20:42", "throughput": 984.82, "total_tokens": 513200} {"current_steps": 115, "total_steps": 2652, "loss": 0.9649, "learning_rate": 4.9768374359802525e-05, "epoch": 0.08669430833019223, "percentage": 4.34, "elapsed_time": "0:09:04", "remaining_time": "3:20:20", "throughput": 984.52, "total_tokens": 536432} {"current_steps": 120, "total_steps": 2652, "loss": 0.8249, "learning_rate": 4.9747829807701e-05, "epoch": 0.09046362608367886, "percentage": 4.52, "elapsed_time": "0:09:28", "remaining_time": "3:19:57", "throughput": 984.45, "total_tokens": 559776} {"current_steps": 125, "total_steps": 2652, "loss": 0.9157, "learning_rate": 4.972641703803896e-05, "epoch": 0.09423294383716548, "percentage": 4.71, "elapsed_time": "0:09:52", "remaining_time": "3:19:32", "throughput": 984.87, "total_tokens": 583248} {"current_steps": 130, "total_steps": 2652, "loss": 0.885, "learning_rate": 4.9704136802031485e-05, "epoch": 0.09800226159065209, "percentage": 4.9, "elapsed_time": "0:10:16", "remaining_time": "3:19:14", "throughput": 984.68, "total_tokens": 606768} {"current_steps": 135, "total_steps": 2652, "loss": 0.8736, "learning_rate": 4.96809898813266e-05, "epoch": 0.1017715793441387, "percentage": 5.09, "elapsed_time": "0:10:40", "remaining_time": "3:18:56", "throughput": 985.41, "total_tokens": 630896} {"current_steps": 140, "total_steps": 2652, "loss": 0.7312, "learning_rate": 4.965697708797784e-05, "epoch": 0.10554089709762533, "percentage": 5.28, "elapsed_time": "0:11:03", "remaining_time": "3:18:31", "throughput": 985.61, "total_tokens": 654320} {"current_steps": 145, "total_steps": 2652, "loss": 0.9478, "learning_rate": 4.963209926441581e-05, "epoch": 0.10931021485111195, "percentage": 5.47, "elapsed_time": "0:11:27", "remaining_time": "3:18:07", "throughput": 985.01, "total_tokens": 677248} {"current_steps": 150, "total_steps": 2652, "loss": 0.9174, "learning_rate": 4.9606357283418575e-05, "epoch": 0.11307953260459856, "percentage": 5.66, "elapsed_time": "0:11:51", "remaining_time": "3:17:43", "throughput": 985.11, "total_tokens": 700672} {"current_steps": 155, "total_steps": 2652, "loss": 0.8453, "learning_rate": 4.957975204808108e-05, "epoch": 0.11684885035808519, "percentage": 5.84, "elapsed_time": "0:12:15", "remaining_time": "3:17:22", "throughput": 985.49, "total_tokens": 724480} {"current_steps": 160, "total_steps": 2652, "loss": 0.701, "learning_rate": 4.955228449178345e-05, "epoch": 0.1206181681115718, "percentage": 6.03, "elapsed_time": "0:12:38", "remaining_time": "3:16:59", "throughput": 985.88, "total_tokens": 748144} {"current_steps": 165, "total_steps": 2652, "loss": 0.7981, "learning_rate": 4.952395557815826e-05, "epoch": 0.12438748586505842, "percentage": 6.22, "elapsed_time": "0:13:02", "remaining_time": "3:16:33", "throughput": 986.17, "total_tokens": 771584} {"current_steps": 170, "total_steps": 2652, "loss": 0.8824, "learning_rate": 4.949476630105669e-05, "epoch": 0.12815680361854503, "percentage": 6.41, "elapsed_time": "0:13:26", "remaining_time": "3:16:08", "throughput": 986.61, "total_tokens": 795248} {"current_steps": 175, "total_steps": 2652, "loss": 0.8368, "learning_rate": 4.9464717684513726e-05, "epoch": 0.13192612137203166, "percentage": 6.6, "elapsed_time": "0:13:49", "remaining_time": "3:15:45", "throughput": 986.12, "total_tokens": 818272} {"current_steps": 180, "total_steps": 2652, "loss": 0.951, "learning_rate": 4.943381078271214e-05, "epoch": 0.1356954391255183, "percentage": 6.79, "elapsed_time": "0:14:13", "remaining_time": "3:15:16", "throughput": 986.25, "total_tokens": 841440} {"current_steps": 185, "total_steps": 2652, "loss": 0.8697, "learning_rate": 4.9402046679945613e-05, "epoch": 0.1394647568790049, "percentage": 6.98, "elapsed_time": "0:14:36", "remaining_time": "3:14:52", "throughput": 986.11, "total_tokens": 864640} {"current_steps": 190, "total_steps": 2652, "loss": 0.7765, "learning_rate": 4.936942649058061e-05, "epoch": 0.14323407463249152, "percentage": 7.16, "elapsed_time": "0:15:00", "remaining_time": "3:14:26", "throughput": 986.31, "total_tokens": 888032} {"current_steps": 195, "total_steps": 2652, "loss": 0.778, "learning_rate": 4.933595135901732e-05, "epoch": 0.14700339238597815, "percentage": 7.35, "elapsed_time": "0:15:23", "remaining_time": "3:13:59", "throughput": 986.2, "total_tokens": 911008} {"current_steps": 200, "total_steps": 2652, "loss": 0.8926, "learning_rate": 4.930162245964952e-05, "epoch": 0.15077271013946475, "percentage": 7.54, "elapsed_time": "0:15:47", "remaining_time": "3:13:36", "throughput": 986.17, "total_tokens": 934432} {"current_steps": 205, "total_steps": 2652, "loss": 0.805, "learning_rate": 4.926644099682334e-05, "epoch": 0.15454202789295138, "percentage": 7.73, "elapsed_time": "0:16:11", "remaining_time": "3:13:20", "throughput": 985.85, "total_tokens": 958064} {"current_steps": 210, "total_steps": 2652, "loss": 0.8433, "learning_rate": 4.9230408204795034e-05, "epoch": 0.158311345646438, "percentage": 7.92, "elapsed_time": "0:16:34", "remaining_time": "3:12:48", "throughput": 986.1, "total_tokens": 980992} {"current_steps": 215, "total_steps": 2652, "loss": 0.8483, "learning_rate": 4.9193525347687696e-05, "epoch": 0.1620806633999246, "percentage": 8.11, "elapsed_time": "0:16:58", "remaining_time": "3:12:27", "throughput": 986.28, "total_tokens": 1004736} {"current_steps": 220, "total_steps": 2652, "loss": 0.9689, "learning_rate": 4.9155793719446863e-05, "epoch": 0.16584998115341124, "percentage": 8.3, "elapsed_time": "0:17:22", "remaining_time": "3:12:03", "throughput": 986.51, "total_tokens": 1028320} {"current_steps": 225, "total_steps": 2652, "loss": 0.9025, "learning_rate": 4.911721464379516e-05, "epoch": 0.16961929890689786, "percentage": 8.48, "elapsed_time": "0:17:46", "remaining_time": "3:11:41", "throughput": 986.33, "total_tokens": 1051696} {"current_steps": 230, "total_steps": 2652, "loss": 0.8423, "learning_rate": 4.907778947418585e-05, "epoch": 0.17338861666038446, "percentage": 8.67, "elapsed_time": "0:18:09", "remaining_time": "3:11:14", "throughput": 986.18, "total_tokens": 1074640} {"current_steps": 235, "total_steps": 2652, "loss": 0.968, "learning_rate": 4.9037519593755356e-05, "epoch": 0.1771579344138711, "percentage": 8.86, "elapsed_time": "0:18:33", "remaining_time": "3:10:48", "throughput": 986.51, "total_tokens": 1098096} {"current_steps": 240, "total_steps": 2652, "loss": 0.8118, "learning_rate": 4.89964064152747e-05, "epoch": 0.18092725216735772, "percentage": 9.05, "elapsed_time": "0:18:56", "remaining_time": "3:10:20", "throughput": 986.75, "total_tokens": 1121344} {"current_steps": 245, "total_steps": 2652, "loss": 0.8695, "learning_rate": 4.895445138110001e-05, "epoch": 0.18469656992084432, "percentage": 9.24, "elapsed_time": "0:19:20", "remaining_time": "3:09:57", "throughput": 986.6, "total_tokens": 1144608} {"current_steps": 250, "total_steps": 2652, "loss": 0.9135, "learning_rate": 4.891165596312186e-05, "epoch": 0.18846588767433095, "percentage": 9.43, "elapsed_time": "0:19:44", "remaining_time": "3:09:37", "throughput": 986.45, "total_tokens": 1168112} {"current_steps": 255, "total_steps": 2652, "loss": 0.798, "learning_rate": 4.886802166271364e-05, "epoch": 0.19223520542781755, "percentage": 9.62, "elapsed_time": "0:20:07", "remaining_time": "3:09:10", "throughput": 986.35, "total_tokens": 1190992} {"current_steps": 260, "total_steps": 2652, "loss": 0.8068, "learning_rate": 4.882355001067892e-05, "epoch": 0.19600452318130418, "percentage": 9.8, "elapsed_time": "0:20:31", "remaining_time": "3:08:48", "throughput": 986.58, "total_tokens": 1214832} {"current_steps": 265, "total_steps": 2652, "loss": 0.7621, "learning_rate": 4.8778242567197685e-05, "epoch": 0.1997738409347908, "percentage": 9.99, "elapsed_time": "0:20:54", "remaining_time": "3:08:23", "throughput": 986.59, "total_tokens": 1238080} {"current_steps": 270, "total_steps": 2652, "loss": 0.7604, "learning_rate": 4.873210092177167e-05, "epoch": 0.2035431586882774, "percentage": 10.18, "elapsed_time": "0:21:18", "remaining_time": "3:07:55", "throughput": 986.68, "total_tokens": 1261056} {"current_steps": 275, "total_steps": 2652, "loss": 0.9166, "learning_rate": 4.868512669316855e-05, "epoch": 0.20731247644176404, "percentage": 10.37, "elapsed_time": "0:21:41", "remaining_time": "3:07:28", "throughput": 986.66, "total_tokens": 1283968} {"current_steps": 280, "total_steps": 2652, "loss": 0.8487, "learning_rate": 4.863732152936514e-05, "epoch": 0.21108179419525067, "percentage": 10.56, "elapsed_time": "0:22:05", "remaining_time": "3:07:08", "throughput": 986.95, "total_tokens": 1308192} {"current_steps": 285, "total_steps": 2652, "loss": 0.9388, "learning_rate": 4.858868710748963e-05, "epoch": 0.21485111194873727, "percentage": 10.75, "elapsed_time": "0:22:29", "remaining_time": "3:06:45", "throughput": 987.01, "total_tokens": 1331648} {"current_steps": 290, "total_steps": 2652, "loss": 0.8762, "learning_rate": 4.85392251337627e-05, "epoch": 0.2186204297022239, "percentage": 10.94, "elapsed_time": "0:22:52", "remaining_time": "3:06:21", "throughput": 986.88, "total_tokens": 1354880} {"current_steps": 295, "total_steps": 2652, "loss": 0.8672, "learning_rate": 4.848893734343769e-05, "epoch": 0.22238974745571052, "percentage": 11.12, "elapsed_time": "0:23:16", "remaining_time": "3:06:00", "throughput": 986.59, "total_tokens": 1378064} {"current_steps": 300, "total_steps": 2652, "loss": 0.9335, "learning_rate": 4.8437825500739696e-05, "epoch": 0.22615906520919712, "percentage": 11.31, "elapsed_time": "0:23:40", "remaining_time": "3:05:37", "throughput": 986.57, "total_tokens": 1401568} {"current_steps": 305, "total_steps": 2652, "loss": 0.7408, "learning_rate": 4.838589139880371e-05, "epoch": 0.22992838296268375, "percentage": 11.5, "elapsed_time": "0:24:05", "remaining_time": "3:05:20", "throughput": 986.04, "total_tokens": 1424960} {"current_steps": 310, "total_steps": 2652, "loss": 0.7255, "learning_rate": 4.833313685961167e-05, "epoch": 0.23369770071617038, "percentage": 11.69, "elapsed_time": "0:24:28", "remaining_time": "3:04:57", "throughput": 986.13, "total_tokens": 1448560} {"current_steps": 315, "total_steps": 2652, "loss": 0.8214, "learning_rate": 4.82795637339286e-05, "epoch": 0.23746701846965698, "percentage": 11.88, "elapsed_time": "0:24:52", "remaining_time": "3:04:33", "throughput": 986.33, "total_tokens": 1472224} {"current_steps": 320, "total_steps": 2652, "loss": 0.7577, "learning_rate": 4.822517390123761e-05, "epoch": 0.2412363362231436, "percentage": 12.07, "elapsed_time": "0:25:16", "remaining_time": "3:04:08", "throughput": 986.27, "total_tokens": 1495232} {"current_steps": 325, "total_steps": 2652, "loss": 0.7087, "learning_rate": 4.8169969269674016e-05, "epoch": 0.24500565397663024, "percentage": 12.25, "elapsed_time": "0:25:39", "remaining_time": "3:03:45", "throughput": 986.21, "total_tokens": 1518608} {"current_steps": 330, "total_steps": 2652, "loss": 0.8798, "learning_rate": 4.811395177595836e-05, "epoch": 0.24877497173011684, "percentage": 12.44, "elapsed_time": "0:26:03", "remaining_time": "3:03:19", "throughput": 986.1, "total_tokens": 1541552} {"current_steps": 335, "total_steps": 2652, "loss": 0.8511, "learning_rate": 4.8057123385328495e-05, "epoch": 0.25254428948360347, "percentage": 12.63, "elapsed_time": "0:26:26", "remaining_time": "3:02:55", "throughput": 986.31, "total_tokens": 1565136} {"current_steps": 340, "total_steps": 2652, "loss": 0.8655, "learning_rate": 4.799948609147061e-05, "epoch": 0.25631360723709007, "percentage": 12.82, "elapsed_time": "0:26:50", "remaining_time": "3:02:32", "throughput": 986.35, "total_tokens": 1588624} {"current_steps": 345, "total_steps": 2652, "loss": 0.7643, "learning_rate": 4.7941041916449316e-05, "epoch": 0.2600829249905767, "percentage": 13.01, "elapsed_time": "0:27:14", "remaining_time": "3:02:09", "throughput": 986.27, "total_tokens": 1612016} {"current_steps": 350, "total_steps": 2652, "loss": 0.8325, "learning_rate": 4.788179291063667e-05, "epoch": 0.2638522427440633, "percentage": 13.2, "elapsed_time": "0:27:38", "remaining_time": "3:01:47", "throughput": 986.42, "total_tokens": 1635856} {"current_steps": 355, "total_steps": 2652, "loss": 0.6917, "learning_rate": 4.78217411526403e-05, "epoch": 0.2676215604975499, "percentage": 13.39, "elapsed_time": "0:28:01", "remaining_time": "3:01:22", "throughput": 986.45, "total_tokens": 1659168} {"current_steps": 360, "total_steps": 2652, "loss": 0.9086, "learning_rate": 4.7760888749230416e-05, "epoch": 0.2713908782510366, "percentage": 13.57, "elapsed_time": "0:28:25", "remaining_time": "3:00:58", "throughput": 986.48, "total_tokens": 1682480} {"current_steps": 365, "total_steps": 2652, "loss": 0.9648, "learning_rate": 4.769923783526593e-05, "epoch": 0.2751601960045232, "percentage": 13.76, "elapsed_time": "0:28:49", "remaining_time": "3:00:34", "throughput": 986.61, "total_tokens": 1705952} {"current_steps": 370, "total_steps": 2652, "loss": 0.8712, "learning_rate": 4.7636790573619586e-05, "epoch": 0.2789295137580098, "percentage": 13.95, "elapsed_time": "0:29:12", "remaining_time": "3:00:09", "throughput": 986.8, "total_tokens": 1729504} {"current_steps": 375, "total_steps": 2652, "loss": 0.7044, "learning_rate": 4.7573549155102014e-05, "epoch": 0.28269883151149644, "percentage": 14.14, "elapsed_time": "0:29:36", "remaining_time": "2:59:45", "throughput": 986.81, "total_tokens": 1752784} {"current_steps": 380, "total_steps": 2652, "loss": 0.92, "learning_rate": 4.7509515798384956e-05, "epoch": 0.28646814926498304, "percentage": 14.33, "elapsed_time": "0:29:59", "remaining_time": "2:59:20", "throughput": 986.72, "total_tokens": 1775840} {"current_steps": 385, "total_steps": 2652, "loss": 0.7396, "learning_rate": 4.7444692749923345e-05, "epoch": 0.29023746701846964, "percentage": 14.52, "elapsed_time": "0:30:23", "remaining_time": "2:58:56", "throughput": 986.62, "total_tokens": 1798944} {"current_steps": 390, "total_steps": 2652, "loss": 0.8619, "learning_rate": 4.7379082283876566e-05, "epoch": 0.2940067847719563, "percentage": 14.71, "elapsed_time": "0:30:46", "remaining_time": "2:58:31", "throughput": 986.54, "total_tokens": 1822016} {"current_steps": 395, "total_steps": 2652, "loss": 0.7399, "learning_rate": 4.73126867020286e-05, "epoch": 0.2977761025254429, "percentage": 14.89, "elapsed_time": "0:31:10", "remaining_time": "2:58:06", "throughput": 986.83, "total_tokens": 1845584} {"current_steps": 400, "total_steps": 2652, "loss": 0.7882, "learning_rate": 4.724550833370735e-05, "epoch": 0.3015454202789295, "percentage": 15.08, "elapsed_time": "0:31:33", "remaining_time": "2:57:41", "throughput": 986.96, "total_tokens": 1868976} {"current_steps": 405, "total_steps": 2652, "loss": 0.7579, "learning_rate": 4.717754953570286e-05, "epoch": 0.30531473803241616, "percentage": 15.27, "elapsed_time": "0:31:57", "remaining_time": "2:57:21", "throughput": 986.5, "total_tokens": 1892096} {"current_steps": 410, "total_steps": 2652, "loss": 0.8531, "learning_rate": 4.710881269218467e-05, "epoch": 0.30908405578590276, "percentage": 15.46, "elapsed_time": "0:32:21", "remaining_time": "2:56:55", "throughput": 986.52, "total_tokens": 1915136} {"current_steps": 415, "total_steps": 2652, "loss": 0.8279, "learning_rate": 4.7039300214618134e-05, "epoch": 0.31285337353938936, "percentage": 15.65, "elapsed_time": "0:32:44", "remaining_time": "2:56:31", "throughput": 986.52, "total_tokens": 1938464} {"current_steps": 420, "total_steps": 2652, "loss": 0.9496, "learning_rate": 4.696901454167988e-05, "epoch": 0.316622691292876, "percentage": 15.84, "elapsed_time": "0:33:08", "remaining_time": "2:56:08", "throughput": 986.39, "total_tokens": 1961696} {"current_steps": 425, "total_steps": 2652, "loss": 0.7804, "learning_rate": 4.68979581391722e-05, "epoch": 0.3203920090463626, "percentage": 16.03, "elapsed_time": "0:33:32", "remaining_time": "2:55:43", "throughput": 986.51, "total_tokens": 1985072} {"current_steps": 430, "total_steps": 2652, "loss": 0.8848, "learning_rate": 4.682613349993655e-05, "epoch": 0.3241613267998492, "percentage": 16.21, "elapsed_time": "0:33:55", "remaining_time": "2:55:19", "throughput": 986.38, "total_tokens": 2007936} {"current_steps": 435, "total_steps": 2652, "loss": 0.7155, "learning_rate": 4.675354314376614e-05, "epoch": 0.32793064455333587, "percentage": 16.4, "elapsed_time": "0:34:19", "remaining_time": "2:54:54", "throughput": 986.47, "total_tokens": 2031280} {"current_steps": 440, "total_steps": 2652, "loss": 0.7408, "learning_rate": 4.6680189617317474e-05, "epoch": 0.33169996230682247, "percentage": 16.59, "elapsed_time": "0:34:42", "remaining_time": "2:54:28", "throughput": 986.45, "total_tokens": 2054176} {"current_steps": 445, "total_steps": 2652, "loss": 0.6917, "learning_rate": 4.660607549402103e-05, "epoch": 0.33546928006030907, "percentage": 16.78, "elapsed_time": "0:35:05", "remaining_time": "2:54:04", "throughput": 986.46, "total_tokens": 2077392} {"current_steps": 450, "total_steps": 2652, "loss": 0.8376, "learning_rate": 4.6531203373991014e-05, "epoch": 0.33923859781379573, "percentage": 16.97, "elapsed_time": "0:35:29", "remaining_time": "2:53:40", "throughput": 986.31, "total_tokens": 2100464} {"current_steps": 455, "total_steps": 2652, "loss": 0.7672, "learning_rate": 4.645557588393407e-05, "epoch": 0.34300791556728233, "percentage": 17.16, "elapsed_time": "0:35:53", "remaining_time": "2:53:18", "throughput": 986.44, "total_tokens": 2124240} {"current_steps": 460, "total_steps": 2652, "loss": 0.7285, "learning_rate": 4.63791956770572e-05, "epoch": 0.34677723332076893, "percentage": 17.35, "elapsed_time": "0:36:17", "remaining_time": "2:52:54", "throughput": 986.38, "total_tokens": 2147584} {"current_steps": 465, "total_steps": 2652, "loss": 0.8577, "learning_rate": 4.6302065432974616e-05, "epoch": 0.3505465510742556, "percentage": 17.53, "elapsed_time": "0:36:41", "remaining_time": "2:52:31", "throughput": 986.35, "total_tokens": 2170976} {"current_steps": 470, "total_steps": 2652, "loss": 0.8195, "learning_rate": 4.6224187857613786e-05, "epoch": 0.3543158688277422, "percentage": 17.72, "elapsed_time": "0:37:04", "remaining_time": "2:52:07", "throughput": 986.31, "total_tokens": 2194128} {"current_steps": 475, "total_steps": 2652, "loss": 0.878, "learning_rate": 4.6145565683120496e-05, "epoch": 0.3580851865812288, "percentage": 17.91, "elapsed_time": "0:37:28", "remaining_time": "2:51:43", "throughput": 986.15, "total_tokens": 2217056} {"current_steps": 480, "total_steps": 2652, "loss": 0.8187, "learning_rate": 4.606620166776294e-05, "epoch": 0.36185450433471544, "percentage": 18.1, "elapsed_time": "0:37:51", "remaining_time": "2:51:20", "throughput": 986.31, "total_tokens": 2240800} {"current_steps": 485, "total_steps": 2652, "loss": 0.7713, "learning_rate": 4.598609859583506e-05, "epoch": 0.36562382208820204, "percentage": 18.29, "elapsed_time": "0:38:15", "remaining_time": "2:50:56", "throughput": 986.3, "total_tokens": 2263984} {"current_steps": 490, "total_steps": 2652, "loss": 0.8583, "learning_rate": 4.590525927755874e-05, "epoch": 0.36939313984168864, "percentage": 18.48, "elapsed_time": "0:38:39", "remaining_time": "2:50:33", "throughput": 986.43, "total_tokens": 2287776} {"current_steps": 495, "total_steps": 2652, "loss": 0.8106, "learning_rate": 4.582368654898533e-05, "epoch": 0.3731624575951753, "percentage": 18.67, "elapsed_time": "0:39:02", "remaining_time": "2:50:08", "throughput": 986.47, "total_tokens": 2311072} {"current_steps": 500, "total_steps": 2652, "loss": 0.8578, "learning_rate": 4.5741383271896094e-05, "epoch": 0.3769317753486619, "percentage": 18.85, "elapsed_time": "0:39:26", "remaining_time": "2:49:46", "throughput": 986.53, "total_tokens": 2334768} {"current_steps": 505, "total_steps": 2652, "loss": 0.7192, "learning_rate": 4.565835233370178e-05, "epoch": 0.3807010931021485, "percentage": 19.04, "elapsed_time": "0:39:51", "remaining_time": "2:49:25", "throughput": 986.25, "total_tokens": 2358272} {"current_steps": 510, "total_steps": 2652, "loss": 0.8681, "learning_rate": 4.557459664734141e-05, "epoch": 0.3844704108556351, "percentage": 19.23, "elapsed_time": "0:40:14", "remaining_time": "2:49:01", "throughput": 986.21, "total_tokens": 2381440} {"current_steps": 515, "total_steps": 2652, "loss": 0.6713, "learning_rate": 4.549011915118001e-05, "epoch": 0.38823972860912176, "percentage": 19.42, "elapsed_time": "0:40:37", "remaining_time": "2:48:35", "throughput": 986.13, "total_tokens": 2403984} {"current_steps": 520, "total_steps": 2652, "loss": 0.7997, "learning_rate": 4.540492280890555e-05, "epoch": 0.39200904636260836, "percentage": 19.61, "elapsed_time": "0:41:01", "remaining_time": "2:48:11", "throughput": 986.17, "total_tokens": 2427392} {"current_steps": 525, "total_steps": 2652, "loss": 0.8715, "learning_rate": 4.531901060942497e-05, "epoch": 0.39577836411609496, "percentage": 19.8, "elapsed_time": "0:41:24", "remaining_time": "2:47:46", "throughput": 986.16, "total_tokens": 2450384} {"current_steps": 530, "total_steps": 2652, "loss": 0.6608, "learning_rate": 4.523238556675935e-05, "epoch": 0.3995476818695816, "percentage": 19.98, "elapsed_time": "0:41:48", "remaining_time": "2:47:22", "throughput": 986.12, "total_tokens": 2473424} {"current_steps": 535, "total_steps": 2652, "loss": 0.7568, "learning_rate": 4.514505071993812e-05, "epoch": 0.4033169996230682, "percentage": 20.17, "elapsed_time": "0:42:11", "remaining_time": "2:46:59", "throughput": 986.27, "total_tokens": 2497232} {"current_steps": 540, "total_steps": 2652, "loss": 0.8325, "learning_rate": 4.505700913289246e-05, "epoch": 0.4070863173765548, "percentage": 20.36, "elapsed_time": "0:42:35", "remaining_time": "2:46:33", "throughput": 986.37, "total_tokens": 2520432} {"current_steps": 545, "total_steps": 2652, "loss": 0.8083, "learning_rate": 4.496826389434784e-05, "epoch": 0.4108556351300415, "percentage": 20.55, "elapsed_time": "0:42:58", "remaining_time": "2:46:09", "throughput": 986.4, "total_tokens": 2543616} {"current_steps": 550, "total_steps": 2652, "loss": 0.7702, "learning_rate": 4.48788181177156e-05, "epoch": 0.4146249528835281, "percentage": 20.74, "elapsed_time": "0:43:22", "remaining_time": "2:45:45", "throughput": 986.46, "total_tokens": 2566992} {"current_steps": 555, "total_steps": 2652, "loss": 0.6993, "learning_rate": 4.478867494098381e-05, "epoch": 0.4183942706370147, "percentage": 20.93, "elapsed_time": "0:43:45", "remaining_time": "2:45:20", "throughput": 986.52, "total_tokens": 2590144} {"current_steps": 560, "total_steps": 2652, "loss": 0.8109, "learning_rate": 4.469783752660709e-05, "epoch": 0.42216358839050133, "percentage": 21.12, "elapsed_time": "0:44:09", "remaining_time": "2:44:57", "throughput": 986.68, "total_tokens": 2614240} {"current_steps": 565, "total_steps": 2652, "loss": 0.7901, "learning_rate": 4.460630906139571e-05, "epoch": 0.42593290614398793, "percentage": 21.3, "elapsed_time": "0:44:33", "remaining_time": "2:44:33", "throughput": 986.75, "total_tokens": 2637696} {"current_steps": 570, "total_steps": 2652, "loss": 0.9066, "learning_rate": 4.451409275640379e-05, "epoch": 0.42970222389747453, "percentage": 21.49, "elapsed_time": "0:44:56", "remaining_time": "2:44:09", "throughput": 986.72, "total_tokens": 2660768} {"current_steps": 575, "total_steps": 2652, "loss": 0.703, "learning_rate": 4.442119184681664e-05, "epoch": 0.4334715416509612, "percentage": 21.68, "elapsed_time": "0:45:20", "remaining_time": "2:43:45", "throughput": 986.65, "total_tokens": 2683792} {"current_steps": 580, "total_steps": 2652, "loss": 0.9203, "learning_rate": 4.432760959183725e-05, "epoch": 0.4372408594044478, "percentage": 21.87, "elapsed_time": "0:45:43", "remaining_time": "2:43:22", "throughput": 986.61, "total_tokens": 2707136} {"current_steps": 585, "total_steps": 2652, "loss": 0.9314, "learning_rate": 4.423334927457198e-05, "epoch": 0.4410101771579344, "percentage": 22.06, "elapsed_time": "0:46:06", "remaining_time": "2:42:56", "throughput": 986.6, "total_tokens": 2729808} {"current_steps": 590, "total_steps": 2652, "loss": 0.7105, "learning_rate": 4.413841420191532e-05, "epoch": 0.44477949491142105, "percentage": 22.25, "elapsed_time": "0:46:30", "remaining_time": "2:42:32", "throughput": 986.52, "total_tokens": 2752992} {"current_steps": 595, "total_steps": 2652, "loss": 0.894, "learning_rate": 4.404280770443398e-05, "epoch": 0.44854881266490765, "percentage": 22.44, "elapsed_time": "0:46:54", "remaining_time": "2:42:09", "throughput": 986.55, "total_tokens": 2776480} {"current_steps": 600, "total_steps": 2652, "loss": 0.8868, "learning_rate": 4.3946533136249926e-05, "epoch": 0.45231813041839425, "percentage": 22.62, "elapsed_time": "0:47:18", "remaining_time": "2:41:46", "throughput": 986.5, "total_tokens": 2799728} {"current_steps": 605, "total_steps": 2652, "loss": 0.7679, "learning_rate": 4.384959387492277e-05, "epoch": 0.4560874481718809, "percentage": 22.81, "elapsed_time": "0:47:42", "remaining_time": "2:41:24", "throughput": 986.3, "total_tokens": 2823008} {"current_steps": 610, "total_steps": 2652, "loss": 0.7895, "learning_rate": 4.37519933213313e-05, "epoch": 0.4598567659253675, "percentage": 23.0, "elapsed_time": "0:48:05", "remaining_time": "2:41:00", "throughput": 986.2, "total_tokens": 2845984} {"current_steps": 615, "total_steps": 2652, "loss": 0.8527, "learning_rate": 4.365373489955411e-05, "epoch": 0.4636260836788541, "percentage": 23.19, "elapsed_time": "0:48:29", "remaining_time": "2:40:37", "throughput": 986.05, "total_tokens": 2869024} {"current_steps": 620, "total_steps": 2652, "loss": 0.7533, "learning_rate": 4.355482205674951e-05, "epoch": 0.46739540143234076, "percentage": 23.38, "elapsed_time": "0:48:53", "remaining_time": "2:40:12", "throughput": 986.09, "total_tokens": 2892240} {"current_steps": 625, "total_steps": 2652, "loss": 0.8048, "learning_rate": 4.3455258263034605e-05, "epoch": 0.47116471918582736, "percentage": 23.57, "elapsed_time": "0:49:16", "remaining_time": "2:39:48", "throughput": 986.24, "total_tokens": 2915792} {"current_steps": 630, "total_steps": 2652, "loss": 0.7072, "learning_rate": 4.33550470113635e-05, "epoch": 0.47493403693931396, "percentage": 23.76, "elapsed_time": "0:49:40", "remaining_time": "2:39:25", "throughput": 986.32, "total_tokens": 2939488} {"current_steps": 635, "total_steps": 2652, "loss": 0.7911, "learning_rate": 4.3254191817404804e-05, "epoch": 0.4787033546928006, "percentage": 23.94, "elapsed_time": "0:50:04", "remaining_time": "2:39:01", "throughput": 986.35, "total_tokens": 2962992} {"current_steps": 640, "total_steps": 2652, "loss": 0.8293, "learning_rate": 4.3152696219418295e-05, "epoch": 0.4824726724462872, "percentage": 24.13, "elapsed_time": "0:50:27", "remaining_time": "2:38:38", "throughput": 986.38, "total_tokens": 2986544} {"current_steps": 645, "total_steps": 2652, "loss": 0.8835, "learning_rate": 4.305056377813075e-05, "epoch": 0.4862419901997738, "percentage": 24.32, "elapsed_time": "0:50:51", "remaining_time": "2:38:14", "throughput": 986.44, "total_tokens": 3009984} {"current_steps": 650, "total_steps": 2652, "loss": 0.7262, "learning_rate": 4.294779807661105e-05, "epoch": 0.4900113079532605, "percentage": 24.51, "elapsed_time": "0:51:14", "remaining_time": "2:37:50", "throughput": 986.53, "total_tokens": 3033520} {"current_steps": 655, "total_steps": 2652, "loss": 0.8231, "learning_rate": 4.2844402720144496e-05, "epoch": 0.4937806257067471, "percentage": 24.7, "elapsed_time": "0:51:38", "remaining_time": "2:37:28", "throughput": 986.5, "total_tokens": 3057056} {"current_steps": 660, "total_steps": 2652, "loss": 0.8302, "learning_rate": 4.274038133610628e-05, "epoch": 0.4975499434602337, "percentage": 24.89, "elapsed_time": "0:52:02", "remaining_time": "2:37:04", "throughput": 986.57, "total_tokens": 3080656} {"current_steps": 665, "total_steps": 2652, "loss": 0.8095, "learning_rate": 4.263573757383427e-05, "epoch": 0.5013192612137203, "percentage": 25.08, "elapsed_time": "0:52:26", "remaining_time": "2:36:40", "throughput": 986.58, "total_tokens": 3103792} {"current_steps": 670, "total_steps": 2652, "loss": 0.8756, "learning_rate": 4.2530475104500956e-05, "epoch": 0.5050885789672069, "percentage": 25.26, "elapsed_time": "0:52:49", "remaining_time": "2:36:16", "throughput": 986.58, "total_tokens": 3126976} {"current_steps": 675, "total_steps": 2652, "loss": 0.7733, "learning_rate": 4.242459762098466e-05, "epoch": 0.5088578967206936, "percentage": 25.45, "elapsed_time": "0:53:12", "remaining_time": "2:35:51", "throughput": 986.61, "total_tokens": 3150224} {"current_steps": 680, "total_steps": 2652, "loss": 0.7715, "learning_rate": 4.231810883773999e-05, "epoch": 0.5126272144741801, "percentage": 25.64, "elapsed_time": "0:53:36", "remaining_time": "2:35:27", "throughput": 986.58, "total_tokens": 3173296} {"current_steps": 685, "total_steps": 2652, "loss": 0.6996, "learning_rate": 4.2211012490667524e-05, "epoch": 0.5163965322276668, "percentage": 25.83, "elapsed_time": "0:54:00", "remaining_time": "2:35:03", "throughput": 986.59, "total_tokens": 3196560} {"current_steps": 690, "total_steps": 2652, "loss": 0.8889, "learning_rate": 4.2103312336982734e-05, "epoch": 0.5201658499811534, "percentage": 26.02, "elapsed_time": "0:54:24", "remaining_time": "2:34:41", "throughput": 986.65, "total_tokens": 3220432} {"current_steps": 695, "total_steps": 2652, "loss": 0.8717, "learning_rate": 4.19950121550842e-05, "epoch": 0.52393516773464, "percentage": 26.21, "elapsed_time": "0:54:47", "remaining_time": "2:34:16", "throughput": 986.69, "total_tokens": 3243712} {"current_steps": 700, "total_steps": 2652, "loss": 0.6314, "learning_rate": 4.188611574442101e-05, "epoch": 0.5277044854881267, "percentage": 26.4, "elapsed_time": "0:55:10", "remaining_time": "2:33:52", "throughput": 986.71, "total_tokens": 3266976} {"current_steps": 705, "total_steps": 2652, "loss": 0.7517, "learning_rate": 4.177662692535952e-05, "epoch": 0.5314738032416133, "percentage": 26.58, "elapsed_time": "0:55:35", "remaining_time": "2:33:32", "throughput": 986.49, "total_tokens": 3290656} {"current_steps": 710, "total_steps": 2652, "loss": 0.8373, "learning_rate": 4.166654953904926e-05, "epoch": 0.5352431209950999, "percentage": 26.77, "elapsed_time": "0:55:59", "remaining_time": "2:33:08", "throughput": 986.45, "total_tokens": 3313712} {"current_steps": 715, "total_steps": 2652, "loss": 0.7025, "learning_rate": 4.155588744728826e-05, "epoch": 0.5390124387485865, "percentage": 26.96, "elapsed_time": "0:56:22", "remaining_time": "2:32:43", "throughput": 986.49, "total_tokens": 3336880} {"current_steps": 720, "total_steps": 2652, "loss": 0.6709, "learning_rate": 4.144464453238748e-05, "epoch": 0.5427817565020732, "percentage": 27.15, "elapsed_time": "0:56:46", "remaining_time": "2:32:20", "throughput": 986.52, "total_tokens": 3360416} {"current_steps": 725, "total_steps": 2652, "loss": 0.6451, "learning_rate": 4.133282469703469e-05, "epoch": 0.5465510742555597, "percentage": 27.34, "elapsed_time": "0:57:09", "remaining_time": "2:31:55", "throughput": 986.53, "total_tokens": 3383408} {"current_steps": 730, "total_steps": 2652, "loss": 0.754, "learning_rate": 4.122043186415746e-05, "epoch": 0.5503203920090464, "percentage": 27.53, "elapsed_time": "0:57:33", "remaining_time": "2:31:32", "throughput": 986.5, "total_tokens": 3406752} {"current_steps": 735, "total_steps": 2652, "loss": 0.8784, "learning_rate": 4.110746997678565e-05, "epoch": 0.554089709762533, "percentage": 27.71, "elapsed_time": "0:57:57", "remaining_time": "2:31:08", "throughput": 986.47, "total_tokens": 3429968} {"current_steps": 740, "total_steps": 2652, "loss": 0.9384, "learning_rate": 4.0993942997912984e-05, "epoch": 0.5578590275160196, "percentage": 27.9, "elapsed_time": "0:58:20", "remaining_time": "2:30:45", "throughput": 986.39, "total_tokens": 3453136} {"current_steps": 745, "total_steps": 2652, "loss": 0.7915, "learning_rate": 4.087985491035804e-05, "epoch": 0.5616283452695062, "percentage": 28.09, "elapsed_time": "0:58:44", "remaining_time": "2:30:21", "throughput": 986.39, "total_tokens": 3476384} {"current_steps": 750, "total_steps": 2652, "loss": 0.8374, "learning_rate": 4.076520971662455e-05, "epoch": 0.5653976630229929, "percentage": 28.28, "elapsed_time": "0:59:08", "remaining_time": "2:29:58", "throughput": 986.42, "total_tokens": 3500176} {"current_steps": 755, "total_steps": 2652, "loss": 0.7302, "learning_rate": 4.065001143876097e-05, "epoch": 0.5691669807764794, "percentage": 28.47, "elapsed_time": "0:59:32", "remaining_time": "2:29:35", "throughput": 986.52, "total_tokens": 3524048} {"current_steps": 760, "total_steps": 2652, "loss": 0.754, "learning_rate": 4.053426411821934e-05, "epoch": 0.5729362985299661, "percentage": 28.66, "elapsed_time": "0:59:55", "remaining_time": "2:29:11", "throughput": 986.5, "total_tokens": 3547056} {"current_steps": 765, "total_steps": 2652, "loss": 0.8208, "learning_rate": 4.0417971815713584e-05, "epoch": 0.5767056162834527, "percentage": 28.85, "elapsed_time": "1:00:19", "remaining_time": "2:28:47", "throughput": 986.52, "total_tokens": 3570608} {"current_steps": 770, "total_steps": 2652, "loss": 0.9635, "learning_rate": 4.030113861107693e-05, "epoch": 0.5804749340369393, "percentage": 29.03, "elapsed_time": "1:00:43", "remaining_time": "2:28:24", "throughput": 986.58, "total_tokens": 3594192} {"current_steps": 775, "total_steps": 2652, "loss": 0.7606, "learning_rate": 4.0183768603118886e-05, "epoch": 0.5842442517904259, "percentage": 29.22, "elapsed_time": "1:01:06", "remaining_time": "2:28:00", "throughput": 986.57, "total_tokens": 3617600} {"current_steps": 780, "total_steps": 2652, "loss": 0.7283, "learning_rate": 4.0065865909481417e-05, "epoch": 0.5880135695439126, "percentage": 29.41, "elapsed_time": "1:01:30", "remaining_time": "2:27:36", "throughput": 986.48, "total_tokens": 3640416} {"current_steps": 785, "total_steps": 2652, "loss": 0.6878, "learning_rate": 3.994743466649442e-05, "epoch": 0.5917828872973991, "percentage": 29.6, "elapsed_time": "1:01:54", "remaining_time": "2:27:13", "throughput": 986.44, "total_tokens": 3663696} {"current_steps": 790, "total_steps": 2652, "loss": 0.8009, "learning_rate": 3.982847902903071e-05, "epoch": 0.5955522050508858, "percentage": 29.79, "elapsed_time": "1:02:17", "remaining_time": "2:26:49", "throughput": 986.44, "total_tokens": 3686880} {"current_steps": 795, "total_steps": 2652, "loss": 0.794, "learning_rate": 3.9709003170360176e-05, "epoch": 0.5993215228043725, "percentage": 29.98, "elapsed_time": "1:02:41", "remaining_time": "2:26:25", "throughput": 986.45, "total_tokens": 3710224} {"current_steps": 800, "total_steps": 2652, "loss": 0.7532, "learning_rate": 3.958901128200344e-05, "epoch": 0.603090840557859, "percentage": 30.17, "elapsed_time": "1:03:04", "remaining_time": "2:26:01", "throughput": 986.49, "total_tokens": 3733536} {"current_steps": 805, "total_steps": 2652, "loss": 0.8581, "learning_rate": 3.946850757358475e-05, "epoch": 0.6068601583113457, "percentage": 30.35, "elapsed_time": "1:03:29", "remaining_time": "2:25:39", "throughput": 986.26, "total_tokens": 3756688} {"current_steps": 810, "total_steps": 2652, "loss": 0.7889, "learning_rate": 3.9347496272684325e-05, "epoch": 0.6106294760648323, "percentage": 30.54, "elapsed_time": "1:03:52", "remaining_time": "2:25:15", "throughput": 986.17, "total_tokens": 3779504} {"current_steps": 815, "total_steps": 2652, "loss": 0.7401, "learning_rate": 3.922598162469003e-05, "epoch": 0.6143987938183189, "percentage": 30.73, "elapsed_time": "1:04:16", "remaining_time": "2:24:52", "throughput": 986.06, "total_tokens": 3802544} {"current_steps": 820, "total_steps": 2652, "loss": 0.799, "learning_rate": 3.910396789264845e-05, "epoch": 0.6181681115718055, "percentage": 30.92, "elapsed_time": "1:04:39", "remaining_time": "2:24:27", "throughput": 986.09, "total_tokens": 3825680} {"current_steps": 825, "total_steps": 2652, "loss": 0.8015, "learning_rate": 3.8981459357115325e-05, "epoch": 0.6219374293252922, "percentage": 31.11, "elapsed_time": "1:05:03", "remaining_time": "2:24:04", "throughput": 986.04, "total_tokens": 3849040} {"current_steps": 830, "total_steps": 2652, "loss": 0.6905, "learning_rate": 3.885846031600536e-05, "epoch": 0.6257067470787787, "percentage": 31.3, "elapsed_time": "1:05:27", "remaining_time": "2:23:41", "throughput": 986.0, "total_tokens": 3872320} {"current_steps": 835, "total_steps": 2652, "loss": 0.845, "learning_rate": 3.8734975084441466e-05, "epoch": 0.6294760648322654, "percentage": 31.49, "elapsed_time": "1:05:51", "remaining_time": "2:23:18", "throughput": 986.0, "total_tokens": 3895920} {"current_steps": 840, "total_steps": 2652, "loss": 0.7317, "learning_rate": 3.8611007994603365e-05, "epoch": 0.633245382585752, "percentage": 31.67, "elapsed_time": "1:06:14", "remaining_time": "2:22:54", "throughput": 986.04, "total_tokens": 3919360} {"current_steps": 845, "total_steps": 2652, "loss": 0.724, "learning_rate": 3.8486563395575625e-05, "epoch": 0.6370147003392386, "percentage": 31.86, "elapsed_time": "1:06:38", "remaining_time": "2:22:30", "throughput": 986.07, "total_tokens": 3942736} {"current_steps": 850, "total_steps": 2652, "loss": 0.664, "learning_rate": 3.8361645653195026e-05, "epoch": 0.6407840180927252, "percentage": 32.05, "elapsed_time": "1:07:02", "remaining_time": "2:22:06", "throughput": 986.11, "total_tokens": 3966144} {"current_steps": 855, "total_steps": 2652, "loss": 0.5922, "learning_rate": 3.823625914989748e-05, "epoch": 0.6445533358462119, "percentage": 32.24, "elapsed_time": "1:07:25", "remaining_time": "2:21:42", "throughput": 986.23, "total_tokens": 3989472} {"current_steps": 860, "total_steps": 2652, "loss": 0.9465, "learning_rate": 3.811040828456421e-05, "epoch": 0.6483226535996984, "percentage": 32.43, "elapsed_time": "1:07:48", "remaining_time": "2:21:17", "throughput": 986.26, "total_tokens": 4012656} {"current_steps": 865, "total_steps": 2652, "loss": 0.7781, "learning_rate": 3.798409747236745e-05, "epoch": 0.6520919713531851, "percentage": 32.62, "elapsed_time": "1:08:12", "remaining_time": "2:20:53", "throughput": 986.28, "total_tokens": 4035888} {"current_steps": 870, "total_steps": 2652, "loss": 0.8309, "learning_rate": 3.7857331144615574e-05, "epoch": 0.6558612891066717, "percentage": 32.81, "elapsed_time": "1:08:36", "remaining_time": "2:20:30", "throughput": 986.27, "total_tokens": 4059504} {"current_steps": 875, "total_steps": 2652, "loss": 0.7812, "learning_rate": 3.773011374859761e-05, "epoch": 0.6596306068601583, "percentage": 32.99, "elapsed_time": "1:09:00", "remaining_time": "2:20:07", "throughput": 986.34, "total_tokens": 4083440} {"current_steps": 880, "total_steps": 2652, "loss": 0.7888, "learning_rate": 3.7602449747427204e-05, "epoch": 0.6633999246136449, "percentage": 33.18, "elapsed_time": "1:09:23", "remaining_time": "2:19:43", "throughput": 986.4, "total_tokens": 4106928} {"current_steps": 885, "total_steps": 2652, "loss": 0.7584, "learning_rate": 3.747434361988608e-05, "epoch": 0.6671692423671316, "percentage": 33.37, "elapsed_time": "1:09:46", "remaining_time": "2:19:19", "throughput": 986.5, "total_tokens": 4130336} {"current_steps": 890, "total_steps": 2652, "loss": 0.6848, "learning_rate": 3.734579986026688e-05, "epoch": 0.6709385601206181, "percentage": 33.56, "elapsed_time": "1:10:10", "remaining_time": "2:18:55", "throughput": 986.57, "total_tokens": 4153872} {"current_steps": 895, "total_steps": 2652, "loss": 0.8068, "learning_rate": 3.7216822978215514e-05, "epoch": 0.6747078778741048, "percentage": 33.75, "elapsed_time": "1:10:33", "remaining_time": "2:18:31", "throughput": 986.6, "total_tokens": 4177072} {"current_steps": 900, "total_steps": 2652, "loss": 0.8122, "learning_rate": 3.7087417498572944e-05, "epoch": 0.6784771956275915, "percentage": 33.94, "elapsed_time": "1:10:57", "remaining_time": "2:18:07", "throughput": 986.56, "total_tokens": 4200256} {"current_steps": 905, "total_steps": 2652, "loss": 0.5764, "learning_rate": 3.695758796121642e-05, "epoch": 0.682246513381078, "percentage": 34.13, "elapsed_time": "1:11:21", "remaining_time": "2:17:45", "throughput": 986.39, "total_tokens": 4223264} {"current_steps": 910, "total_steps": 2652, "loss": 0.8898, "learning_rate": 3.6827338920900254e-05, "epoch": 0.6860158311345647, "percentage": 34.31, "elapsed_time": "1:11:45", "remaining_time": "2:17:21", "throughput": 986.49, "total_tokens": 4247024} {"current_steps": 915, "total_steps": 2652, "loss": 0.7741, "learning_rate": 3.6696674947095984e-05, "epoch": 0.6897851488880513, "percentage": 34.5, "elapsed_time": "1:12:08", "remaining_time": "2:16:57", "throughput": 986.6, "total_tokens": 4270800} {"current_steps": 920, "total_steps": 2652, "loss": 0.8219, "learning_rate": 3.656560062383208e-05, "epoch": 0.6935544666415379, "percentage": 34.69, "elapsed_time": "1:12:32", "remaining_time": "2:16:34", "throughput": 986.64, "total_tokens": 4294352} {"current_steps": 925, "total_steps": 2652, "loss": 0.6813, "learning_rate": 3.6434120549533135e-05, "epoch": 0.6973237843950245, "percentage": 34.88, "elapsed_time": "1:12:56", "remaining_time": "2:16:11", "throughput": 986.65, "total_tokens": 4318208} {"current_steps": 930, "total_steps": 2652, "loss": 0.6866, "learning_rate": 3.6302239336858545e-05, "epoch": 0.7010931021485112, "percentage": 35.07, "elapsed_time": "1:13:20", "remaining_time": "2:15:47", "throughput": 986.67, "total_tokens": 4341728} {"current_steps": 935, "total_steps": 2652, "loss": 0.8628, "learning_rate": 3.6169961612540645e-05, "epoch": 0.7048624199019977, "percentage": 35.26, "elapsed_time": "1:13:44", "remaining_time": "2:15:24", "throughput": 986.66, "total_tokens": 4365392} {"current_steps": 940, "total_steps": 2652, "loss": 0.8978, "learning_rate": 3.603729201722244e-05, "epoch": 0.7086317376554844, "percentage": 35.44, "elapsed_time": "1:14:08", "remaining_time": "2:15:01", "throughput": 986.67, "total_tokens": 4389184} {"current_steps": 945, "total_steps": 2652, "loss": 0.7572, "learning_rate": 3.5904235205294776e-05, "epoch": 0.712401055408971, "percentage": 35.63, "elapsed_time": "1:14:31", "remaining_time": "2:14:37", "throughput": 986.67, "total_tokens": 4412272} {"current_steps": 950, "total_steps": 2652, "loss": 0.7205, "learning_rate": 3.5770795844733035e-05, "epoch": 0.7161703731624576, "percentage": 35.82, "elapsed_time": "1:14:54", "remaining_time": "2:14:13", "throughput": 986.67, "total_tokens": 4435072} {"current_steps": 955, "total_steps": 2652, "loss": 0.7521, "learning_rate": 3.5636978616933416e-05, "epoch": 0.7199396909159442, "percentage": 36.01, "elapsed_time": "1:15:18", "remaining_time": "2:13:49", "throughput": 986.62, "total_tokens": 4458272} {"current_steps": 960, "total_steps": 2652, "loss": 0.7205, "learning_rate": 3.550278821654866e-05, "epoch": 0.7237090086694309, "percentage": 36.2, "elapsed_time": "1:15:42", "remaining_time": "2:13:25", "throughput": 986.53, "total_tokens": 4481056} {"current_steps": 965, "total_steps": 2652, "loss": 0.6597, "learning_rate": 3.536822935132336e-05, "epoch": 0.7274783264229174, "percentage": 36.39, "elapsed_time": "1:16:06", "remaining_time": "2:13:02", "throughput": 986.45, "total_tokens": 4504288} {"current_steps": 970, "total_steps": 2652, "loss": 0.7293, "learning_rate": 3.5233306741928806e-05, "epoch": 0.7312476441764041, "percentage": 36.58, "elapsed_time": "1:16:29", "remaining_time": "2:12:38", "throughput": 986.45, "total_tokens": 4527552} {"current_steps": 975, "total_steps": 2652, "loss": 0.7055, "learning_rate": 3.509802512179737e-05, "epoch": 0.7350169619298907, "percentage": 36.76, "elapsed_time": "1:16:53", "remaining_time": "2:12:15", "throughput": 986.44, "total_tokens": 4551024} {"current_steps": 980, "total_steps": 2652, "loss": 0.763, "learning_rate": 3.496238923695646e-05, "epoch": 0.7387862796833773, "percentage": 36.95, "elapsed_time": "1:17:17", "remaining_time": "2:11:52", "throughput": 986.4, "total_tokens": 4574464} {"current_steps": 985, "total_steps": 2652, "loss": 0.6831, "learning_rate": 3.4826403845861986e-05, "epoch": 0.742555597436864, "percentage": 37.14, "elapsed_time": "1:17:40", "remaining_time": "2:11:28", "throughput": 986.42, "total_tokens": 4597600} {"current_steps": 990, "total_steps": 2652, "loss": 0.6586, "learning_rate": 3.4690073719231425e-05, "epoch": 0.7463249151903506, "percentage": 37.33, "elapsed_time": "1:18:04", "remaining_time": "2:11:04", "throughput": 986.47, "total_tokens": 4621424} {"current_steps": 995, "total_steps": 2652, "loss": 0.7481, "learning_rate": 3.455340363987648e-05, "epoch": 0.7500942329438371, "percentage": 37.52, "elapsed_time": "1:18:27", "remaining_time": "2:10:40", "throughput": 986.51, "total_tokens": 4644400} {"current_steps": 1000, "total_steps": 2652, "loss": 0.8084, "learning_rate": 3.4416398402535284e-05, "epoch": 0.7538635506973238, "percentage": 37.71, "elapsed_time": "1:18:51", "remaining_time": "2:10:16", "throughput": 986.51, "total_tokens": 4667568} {"current_steps": 1005, "total_steps": 2652, "loss": 0.8876, "learning_rate": 3.427906281370414e-05, "epoch": 0.7576328684508103, "percentage": 37.9, "elapsed_time": "1:19:15", "remaining_time": "2:09:53", "throughput": 986.32, "total_tokens": 4690624} {"current_steps": 1010, "total_steps": 2652, "loss": 0.8391, "learning_rate": 3.414140169146896e-05, "epoch": 0.761402186204297, "percentage": 38.08, "elapsed_time": "1:19:39", "remaining_time": "2:09:30", "throughput": 986.31, "total_tokens": 4714032} {"current_steps": 1015, "total_steps": 2652, "loss": 0.6847, "learning_rate": 3.400341986533618e-05, "epoch": 0.7651715039577837, "percentage": 38.27, "elapsed_time": "1:20:03", "remaining_time": "2:09:06", "throughput": 986.31, "total_tokens": 4737280} {"current_steps": 1020, "total_steps": 2652, "loss": 0.6742, "learning_rate": 3.386512217606339e-05, "epoch": 0.7689408217112702, "percentage": 38.46, "elapsed_time": "1:20:26", "remaining_time": "2:08:42", "throughput": 986.42, "total_tokens": 4760848} {"current_steps": 1025, "total_steps": 2652, "loss": 0.8607, "learning_rate": 3.3726513475489445e-05, "epoch": 0.7727101394647569, "percentage": 38.65, "elapsed_time": "1:20:49", "remaining_time": "2:08:18", "throughput": 986.4, "total_tokens": 4783888} {"current_steps": 1030, "total_steps": 2652, "loss": 0.6614, "learning_rate": 3.3587598626364294e-05, "epoch": 0.7764794572182435, "percentage": 38.84, "elapsed_time": "1:21:13", "remaining_time": "2:07:53", "throughput": 986.49, "total_tokens": 4807312} {"current_steps": 1035, "total_steps": 2652, "loss": 0.7078, "learning_rate": 3.344838250217833e-05, "epoch": 0.7802487749717301, "percentage": 39.03, "elapsed_time": "1:21:36", "remaining_time": "2:07:30", "throughput": 986.6, "total_tokens": 4831088} {"current_steps": 1040, "total_steps": 2652, "loss": 0.7944, "learning_rate": 3.330886998699149e-05, "epoch": 0.7840180927252167, "percentage": 39.22, "elapsed_time": "1:22:00", "remaining_time": "2:07:06", "throughput": 986.64, "total_tokens": 4854608} {"current_steps": 1045, "total_steps": 2652, "loss": 0.7436, "learning_rate": 3.316906597526186e-05, "epoch": 0.7877874104787034, "percentage": 39.4, "elapsed_time": "1:22:23", "remaining_time": "2:06:42", "throughput": 986.64, "total_tokens": 4877648} {"current_steps": 1050, "total_steps": 2652, "loss": 0.8234, "learning_rate": 3.302897537167397e-05, "epoch": 0.7915567282321899, "percentage": 39.59, "elapsed_time": "1:22:46", "remaining_time": "2:06:18", "throughput": 986.67, "total_tokens": 4900672} {"current_steps": 1055, "total_steps": 2652, "loss": 0.6463, "learning_rate": 3.288860309096671e-05, "epoch": 0.7953260459856766, "percentage": 39.78, "elapsed_time": "1:23:10", "remaining_time": "2:05:54", "throughput": 986.73, "total_tokens": 4924192} {"current_steps": 1060, "total_steps": 2652, "loss": 0.6872, "learning_rate": 3.2747954057760965e-05, "epoch": 0.7990953637391632, "percentage": 39.97, "elapsed_time": "1:23:33", "remaining_time": "2:05:30", "throughput": 986.8, "total_tokens": 4947600} {"current_steps": 1065, "total_steps": 2652, "loss": 0.6143, "learning_rate": 3.260703320638679e-05, "epoch": 0.8028646814926498, "percentage": 40.16, "elapsed_time": "1:23:57", "remaining_time": "2:05:06", "throughput": 986.93, "total_tokens": 4971888} {"current_steps": 1070, "total_steps": 2652, "loss": 0.8022, "learning_rate": 3.246584548071034e-05, "epoch": 0.8066339992461364, "percentage": 40.35, "elapsed_time": "1:24:21", "remaining_time": "2:04:42", "throughput": 986.93, "total_tokens": 4995056} {"current_steps": 1075, "total_steps": 2652, "loss": 0.7144, "learning_rate": 3.232439583396036e-05, "epoch": 0.8104033169996231, "percentage": 40.54, "elapsed_time": "1:24:44", "remaining_time": "2:04:18", "throughput": 986.96, "total_tokens": 5018208} {"current_steps": 1080, "total_steps": 2652, "loss": 0.757, "learning_rate": 3.2182689228554517e-05, "epoch": 0.8141726347531096, "percentage": 40.72, "elapsed_time": "1:25:08", "remaining_time": "2:03:55", "throughput": 986.98, "total_tokens": 5041584} {"current_steps": 1085, "total_steps": 2652, "loss": 0.729, "learning_rate": 3.204073063592522e-05, "epoch": 0.8179419525065963, "percentage": 40.91, "elapsed_time": "1:25:31", "remaining_time": "2:03:30", "throughput": 986.95, "total_tokens": 5064352} {"current_steps": 1090, "total_steps": 2652, "loss": 0.7441, "learning_rate": 3.189852503634523e-05, "epoch": 0.821711270260083, "percentage": 41.1, "elapsed_time": "1:25:54", "remaining_time": "2:03:07", "throughput": 986.98, "total_tokens": 5087712} {"current_steps": 1095, "total_steps": 2652, "loss": 0.8861, "learning_rate": 3.1756077418752967e-05, "epoch": 0.8254805880135695, "percentage": 41.29, "elapsed_time": "1:26:18", "remaining_time": "2:02:43", "throughput": 986.98, "total_tokens": 5111104} {"current_steps": 1100, "total_steps": 2652, "loss": 0.7098, "learning_rate": 3.1613392780577455e-05, "epoch": 0.8292499057670562, "percentage": 41.48, "elapsed_time": "1:26:41", "remaining_time": "2:02:19", "throughput": 987.09, "total_tokens": 5134720} {"current_steps": 1105, "total_steps": 2652, "loss": 0.7099, "learning_rate": 3.147047612756302e-05, "epoch": 0.8330192235205428, "percentage": 41.67, "elapsed_time": "1:27:05", "remaining_time": "2:01:56", "throughput": 986.95, "total_tokens": 5157744} {"current_steps": 1110, "total_steps": 2652, "loss": 0.7648, "learning_rate": 3.132733247359366e-05, "epoch": 0.8367885412740294, "percentage": 41.86, "elapsed_time": "1:27:29", "remaining_time": "2:01:32", "throughput": 986.92, "total_tokens": 5180976} {"current_steps": 1115, "total_steps": 2652, "loss": 0.7906, "learning_rate": 3.118396684051714e-05, "epoch": 0.840557859027516, "percentage": 42.04, "elapsed_time": "1:27:53", "remaining_time": "2:01:09", "throughput": 987.05, "total_tokens": 5204976} {"current_steps": 1120, "total_steps": 2652, "loss": 0.6022, "learning_rate": 3.104038425796884e-05, "epoch": 0.8443271767810027, "percentage": 42.23, "elapsed_time": "1:28:16", "remaining_time": "2:00:45", "throughput": 987.03, "total_tokens": 5228048} {"current_steps": 1125, "total_steps": 2652, "loss": 0.8142, "learning_rate": 3.089658976319528e-05, "epoch": 0.8480964945344892, "percentage": 42.42, "elapsed_time": "1:28:40", "remaining_time": "2:00:21", "throughput": 987.05, "total_tokens": 5251664} {"current_steps": 1130, "total_steps": 2652, "loss": 0.8263, "learning_rate": 3.0752588400877405e-05, "epoch": 0.8518658122879759, "percentage": 42.61, "elapsed_time": "1:29:04", "remaining_time": "1:59:57", "throughput": 987.07, "total_tokens": 5274976} {"current_steps": 1135, "total_steps": 2652, "loss": 0.8581, "learning_rate": 3.060838522295361e-05, "epoch": 0.8556351300414625, "percentage": 42.8, "elapsed_time": "1:29:27", "remaining_time": "1:59:34", "throughput": 987.1, "total_tokens": 5298352} {"current_steps": 1140, "total_steps": 2652, "loss": 0.7224, "learning_rate": 3.0463985288442475e-05, "epoch": 0.8594044477949491, "percentage": 42.99, "elapsed_time": "1:29:50", "remaining_time": "1:59:09", "throughput": 987.14, "total_tokens": 5321440} {"current_steps": 1145, "total_steps": 2652, "loss": 0.7379, "learning_rate": 3.031939366326535e-05, "epoch": 0.8631737655484357, "percentage": 43.17, "elapsed_time": "1:30:14", "remaining_time": "1:58:46", "throughput": 987.14, "total_tokens": 5344992} {"current_steps": 1150, "total_steps": 2652, "loss": 0.6864, "learning_rate": 3.0174615420068563e-05, "epoch": 0.8669430833019224, "percentage": 43.36, "elapsed_time": "1:30:38", "remaining_time": "1:58:22", "throughput": 987.21, "total_tokens": 5368448} {"current_steps": 1155, "total_steps": 2652, "loss": 0.6144, "learning_rate": 3.0029655638045496e-05, "epoch": 0.8707124010554089, "percentage": 43.55, "elapsed_time": "1:31:01", "remaining_time": "1:57:58", "throughput": 987.22, "total_tokens": 5391568} {"current_steps": 1160, "total_steps": 2652, "loss": 0.6818, "learning_rate": 2.9884519402758342e-05, "epoch": 0.8744817188088956, "percentage": 43.74, "elapsed_time": "1:31:25", "remaining_time": "1:57:34", "throughput": 987.22, "total_tokens": 5414992} {"current_steps": 1165, "total_steps": 2652, "loss": 0.8296, "learning_rate": 2.9739211805959783e-05, "epoch": 0.8782510365623822, "percentage": 43.93, "elapsed_time": "1:31:48", "remaining_time": "1:57:11", "throughput": 987.27, "total_tokens": 5438368} {"current_steps": 1170, "total_steps": 2652, "loss": 0.7764, "learning_rate": 2.9593737945414264e-05, "epoch": 0.8820203543158688, "percentage": 44.12, "elapsed_time": "1:32:11", "remaining_time": "1:56:46", "throughput": 987.29, "total_tokens": 5461504} {"current_steps": 1175, "total_steps": 2652, "loss": 0.7245, "learning_rate": 2.9448102924719207e-05, "epoch": 0.8857896720693554, "percentage": 44.31, "elapsed_time": "1:32:35", "remaining_time": "1:56:23", "throughput": 987.31, "total_tokens": 5484992} {"current_steps": 1180, "total_steps": 2652, "loss": 0.8319, "learning_rate": 2.9302311853125942e-05, "epoch": 0.8895589898228421, "percentage": 44.49, "elapsed_time": "1:32:58", "remaining_time": "1:55:59", "throughput": 987.37, "total_tokens": 5508480} {"current_steps": 1185, "total_steps": 2652, "loss": 0.6652, "learning_rate": 2.9156369845360467e-05, "epoch": 0.8933283075763286, "percentage": 44.68, "elapsed_time": "1:33:22", "remaining_time": "1:55:35", "throughput": 987.38, "total_tokens": 5531520} {"current_steps": 1190, "total_steps": 2652, "loss": 0.5858, "learning_rate": 2.9010282021444008e-05, "epoch": 0.8970976253298153, "percentage": 44.87, "elapsed_time": "1:33:45", "remaining_time": "1:55:11", "throughput": 987.38, "total_tokens": 5554480} {"current_steps": 1195, "total_steps": 2652, "loss": 0.6248, "learning_rate": 2.8864053506513405e-05, "epoch": 0.900866943083302, "percentage": 45.06, "elapsed_time": "1:34:08", "remaining_time": "1:54:47", "throughput": 987.43, "total_tokens": 5577888} {"current_steps": 1200, "total_steps": 2652, "loss": 0.8447, "learning_rate": 2.8717689430641292e-05, "epoch": 0.9046362608367885, "percentage": 45.25, "elapsed_time": "1:34:32", "remaining_time": "1:54:23", "throughput": 987.44, "total_tokens": 5601424} {"current_steps": 1205, "total_steps": 2652, "loss": 0.6355, "learning_rate": 2.857119492865613e-05, "epoch": 0.9084055785902752, "percentage": 45.44, "elapsed_time": "1:34:57", "remaining_time": "1:54:01", "throughput": 987.3, "total_tokens": 5624880} {"current_steps": 1210, "total_steps": 2652, "loss": 0.5075, "learning_rate": 2.842457513996207e-05, "epoch": 0.9121748963437618, "percentage": 45.63, "elapsed_time": "1:35:20", "remaining_time": "1:53:37", "throughput": 987.35, "total_tokens": 5648160} {"current_steps": 1215, "total_steps": 2652, "loss": 0.5762, "learning_rate": 2.8277835208358637e-05, "epoch": 0.9159442140972484, "percentage": 45.81, "elapsed_time": "1:35:44", "remaining_time": "1:53:13", "throughput": 987.33, "total_tokens": 5671280} {"current_steps": 1220, "total_steps": 2652, "loss": 0.666, "learning_rate": 2.813098028186028e-05, "epoch": 0.919713531850735, "percentage": 46.0, "elapsed_time": "1:36:07", "remaining_time": "1:52:49", "throughput": 987.38, "total_tokens": 5694352} {"current_steps": 1225, "total_steps": 2652, "loss": 0.6056, "learning_rate": 2.798401551251576e-05, "epoch": 0.9234828496042217, "percentage": 46.19, "elapsed_time": "1:36:30", "remaining_time": "1:52:25", "throughput": 987.35, "total_tokens": 5717536} {"current_steps": 1230, "total_steps": 2652, "loss": 0.8095, "learning_rate": 2.7836946056227426e-05, "epoch": 0.9272521673577082, "percentage": 46.38, "elapsed_time": "1:36:54", "remaining_time": "1:52:01", "throughput": 987.31, "total_tokens": 5740416} {"current_steps": 1235, "total_steps": 2652, "loss": 0.7501, "learning_rate": 2.7689777072570287e-05, "epoch": 0.9310214851111949, "percentage": 46.57, "elapsed_time": "1:37:17", "remaining_time": "1:51:38", "throughput": 987.3, "total_tokens": 5763712} {"current_steps": 1240, "total_steps": 2652, "loss": 0.5595, "learning_rate": 2.7542513724611057e-05, "epoch": 0.9347908028646815, "percentage": 46.76, "elapsed_time": "1:37:41", "remaining_time": "1:51:14", "throughput": 987.3, "total_tokens": 5787168} {"current_steps": 1245, "total_steps": 2652, "loss": 0.694, "learning_rate": 2.739516117872697e-05, "epoch": 0.9385601206181681, "percentage": 46.95, "elapsed_time": "1:38:05", "remaining_time": "1:50:51", "throughput": 987.31, "total_tokens": 5810704} {"current_steps": 1250, "total_steps": 2652, "loss": 0.8521, "learning_rate": 2.7247724604424557e-05, "epoch": 0.9423294383716547, "percentage": 47.13, "elapsed_time": "1:38:29", "remaining_time": "1:50:27", "throughput": 987.33, "total_tokens": 5834192} {"current_steps": 1255, "total_steps": 2652, "loss": 0.7794, "learning_rate": 2.71002091741583e-05, "epoch": 0.9460987561251414, "percentage": 47.32, "elapsed_time": "1:38:52", "remaining_time": "1:50:03", "throughput": 987.38, "total_tokens": 5857344} {"current_steps": 1260, "total_steps": 2652, "loss": 0.7721, "learning_rate": 2.695262006314912e-05, "epoch": 0.9498680738786279, "percentage": 47.51, "elapsed_time": "1:39:15", "remaining_time": "1:49:38", "throughput": 987.46, "total_tokens": 5880448} {"current_steps": 1265, "total_steps": 2652, "loss": 0.6403, "learning_rate": 2.680496244920287e-05, "epoch": 0.9536373916321146, "percentage": 47.7, "elapsed_time": "1:39:38", "remaining_time": "1:49:14", "throughput": 987.43, "total_tokens": 5903200} {"current_steps": 1270, "total_steps": 2652, "loss": 0.738, "learning_rate": 2.665724151252868e-05, "epoch": 0.9574067093856012, "percentage": 47.89, "elapsed_time": "1:40:02", "remaining_time": "1:48:51", "throughput": 987.38, "total_tokens": 5926272} {"current_steps": 1275, "total_steps": 2652, "loss": 0.6469, "learning_rate": 2.6509462435557152e-05, "epoch": 0.9611760271390878, "percentage": 48.08, "elapsed_time": "1:40:25", "remaining_time": "1:48:27", "throughput": 987.43, "total_tokens": 5949680} {"current_steps": 1280, "total_steps": 2652, "loss": 0.6953, "learning_rate": 2.6361630402758648e-05, "epoch": 0.9649453448925744, "percentage": 48.27, "elapsed_time": "1:40:48", "remaining_time": "1:48:03", "throughput": 987.45, "total_tokens": 5973088} {"current_steps": 1285, "total_steps": 2652, "loss": 0.6365, "learning_rate": 2.6213750600461334e-05, "epoch": 0.9687146626460611, "percentage": 48.45, "elapsed_time": "1:41:12", "remaining_time": "1:47:39", "throughput": 987.55, "total_tokens": 5996688} {"current_steps": 1290, "total_steps": 2652, "loss": 0.6691, "learning_rate": 2.6065828216669253e-05, "epoch": 0.9724839803995476, "percentage": 48.64, "elapsed_time": "1:41:35", "remaining_time": "1:47:15", "throughput": 987.55, "total_tokens": 6019744} {"current_steps": 1295, "total_steps": 2652, "loss": 0.64, "learning_rate": 2.5917868440880317e-05, "epoch": 0.9762532981530343, "percentage": 48.83, "elapsed_time": "1:41:58", "remaining_time": "1:46:51", "throughput": 987.55, "total_tokens": 6042640} {"current_steps": 1300, "total_steps": 2652, "loss": 0.6674, "learning_rate": 2.5769876463904265e-05, "epoch": 0.980022615906521, "percentage": 49.02, "elapsed_time": "1:42:22", "remaining_time": "1:46:28", "throughput": 987.58, "total_tokens": 6066112} {"current_steps": 1305, "total_steps": 2652, "loss": 0.6288, "learning_rate": 2.5621857477680506e-05, "epoch": 0.9837919336600075, "percentage": 49.21, "elapsed_time": "1:42:46", "remaining_time": "1:46:05", "throughput": 987.42, "total_tokens": 6089296} {"current_steps": 1310, "total_steps": 2652, "loss": 0.8477, "learning_rate": 2.5473816675096017e-05, "epoch": 0.9875612514134942, "percentage": 49.4, "elapsed_time": "1:43:10", "remaining_time": "1:45:41", "throughput": 987.45, "total_tokens": 6112784} {"current_steps": 1315, "total_steps": 2652, "loss": 0.7663, "learning_rate": 2.5325759249803154e-05, "epoch": 0.9913305691669808, "percentage": 49.59, "elapsed_time": "1:43:33", "remaining_time": "1:45:17", "throughput": 987.47, "total_tokens": 6136048} {"current_steps": 1320, "total_steps": 2652, "loss": 0.861, "learning_rate": 2.517769039603744e-05, "epoch": 0.9950998869204674, "percentage": 49.77, "elapsed_time": "1:43:57", "remaining_time": "1:44:54", "throughput": 987.54, "total_tokens": 6159920} {"current_steps": 1325, "total_steps": 2652, "loss": 0.8545, "learning_rate": 2.5029615308435338e-05, "epoch": 0.998869204673954, "percentage": 49.96, "elapsed_time": "1:44:21", "remaining_time": "1:44:30", "throughput": 987.53, "total_tokens": 6183024} {"current_steps": 1330, "total_steps": 2652, "loss": 0.6469, "learning_rate": 2.4881539181851986e-05, "epoch": 1.0026385224274406, "percentage": 50.15, "elapsed_time": "1:44:44", "remaining_time": "1:44:06", "throughput": 987.54, "total_tokens": 6206224} {"current_steps": 1335, "total_steps": 2652, "loss": 0.7507, "learning_rate": 2.4733467211179008e-05, "epoch": 1.0064078401809273, "percentage": 50.34, "elapsed_time": "1:45:08", "remaining_time": "1:43:43", "throughput": 987.55, "total_tokens": 6229936} {"current_steps": 1340, "total_steps": 2652, "loss": 0.7181, "learning_rate": 2.4585404591162218e-05, "epoch": 1.0101771579344139, "percentage": 50.53, "elapsed_time": "1:45:32", "remaining_time": "1:43:19", "throughput": 987.54, "total_tokens": 6253152} {"current_steps": 1345, "total_steps": 2652, "loss": 0.627, "learning_rate": 2.4437356516219358e-05, "epoch": 1.0139464756879004, "percentage": 50.72, "elapsed_time": "1:45:55", "remaining_time": "1:42:56", "throughput": 987.51, "total_tokens": 6276208} {"current_steps": 1350, "total_steps": 2652, "loss": 0.7266, "learning_rate": 2.4289328180257926e-05, "epoch": 1.0177157934413872, "percentage": 50.9, "elapsed_time": "1:46:18", "remaining_time": "1:42:31", "throughput": 987.55, "total_tokens": 6299408} {"current_steps": 1355, "total_steps": 2652, "loss": 0.5684, "learning_rate": 2.4141324776492915e-05, "epoch": 1.0214851111948737, "percentage": 51.09, "elapsed_time": "1:46:42", "remaining_time": "1:42:08", "throughput": 987.58, "total_tokens": 6323024} {"current_steps": 1360, "total_steps": 2652, "loss": 0.6196, "learning_rate": 2.399335149726463e-05, "epoch": 1.0252544289483603, "percentage": 51.28, "elapsed_time": "1:47:05", "remaining_time": "1:41:44", "throughput": 987.56, "total_tokens": 6345952} {"current_steps": 1365, "total_steps": 2652, "loss": 0.5296, "learning_rate": 2.3845413533856517e-05, "epoch": 1.029023746701847, "percentage": 51.47, "elapsed_time": "1:47:29", "remaining_time": "1:41:20", "throughput": 987.67, "total_tokens": 6369856} {"current_steps": 1370, "total_steps": 2652, "loss": 0.7537, "learning_rate": 2.3697516076313066e-05, "epoch": 1.0327930644553336, "percentage": 51.66, "elapsed_time": "1:47:52", "remaining_time": "1:40:56", "throughput": 987.7, "total_tokens": 6393136} {"current_steps": 1375, "total_steps": 2652, "loss": 0.5909, "learning_rate": 2.354966431325773e-05, "epoch": 1.0365623822088201, "percentage": 51.85, "elapsed_time": "1:48:16", "remaining_time": "1:40:33", "throughput": 987.77, "total_tokens": 6416736} {"current_steps": 1380, "total_steps": 2652, "loss": 0.7042, "learning_rate": 2.3401863431710863e-05, "epoch": 1.040331699962307, "percentage": 52.04, "elapsed_time": "1:48:39", "remaining_time": "1:40:09", "throughput": 987.77, "total_tokens": 6440048} {"current_steps": 1385, "total_steps": 2652, "loss": 0.7301, "learning_rate": 2.325411861690776e-05, "epoch": 1.0441010177157934, "percentage": 52.22, "elapsed_time": "1:49:03", "remaining_time": "1:39:45", "throughput": 987.79, "total_tokens": 6463504} {"current_steps": 1390, "total_steps": 2652, "loss": 0.7472, "learning_rate": 2.3106435052116764e-05, "epoch": 1.04787033546928, "percentage": 52.41, "elapsed_time": "1:49:26", "remaining_time": "1:39:21", "throughput": 987.84, "total_tokens": 6486608} {"current_steps": 1395, "total_steps": 2652, "loss": 0.5799, "learning_rate": 2.2958817918457412e-05, "epoch": 1.0516396532227668, "percentage": 52.6, "elapsed_time": "1:49:49", "remaining_time": "1:38:58", "throughput": 987.83, "total_tokens": 6509760} {"current_steps": 1400, "total_steps": 2652, "loss": 0.6512, "learning_rate": 2.2811272394718647e-05, "epoch": 1.0554089709762533, "percentage": 52.79, "elapsed_time": "1:50:13", "remaining_time": "1:38:34", "throughput": 987.84, "total_tokens": 6532992} {"current_steps": 1405, "total_steps": 2652, "loss": 0.748, "learning_rate": 2.2663803657177173e-05, "epoch": 1.0591782887297398, "percentage": 52.98, "elapsed_time": "1:50:37", "remaining_time": "1:38:11", "throughput": 987.78, "total_tokens": 6556384} {"current_steps": 1410, "total_steps": 2652, "loss": 0.6635, "learning_rate": 2.2516416879415824e-05, "epoch": 1.0629476064832266, "percentage": 53.17, "elapsed_time": "1:51:01", "remaining_time": "1:37:47", "throughput": 987.88, "total_tokens": 6580336} {"current_steps": 1415, "total_steps": 2652, "loss": 0.5894, "learning_rate": 2.2369117232142077e-05, "epoch": 1.0667169242367132, "percentage": 53.36, "elapsed_time": "1:51:24", "remaining_time": "1:37:23", "throughput": 987.92, "total_tokens": 6603584} {"current_steps": 1420, "total_steps": 2652, "loss": 0.5952, "learning_rate": 2.2221909883006646e-05, "epoch": 1.0704862419901997, "percentage": 53.54, "elapsed_time": "1:51:48", "remaining_time": "1:36:59", "throughput": 987.89, "total_tokens": 6626864} {"current_steps": 1425, "total_steps": 2652, "loss": 0.7849, "learning_rate": 2.20747999964222e-05, "epoch": 1.0742555597436865, "percentage": 53.73, "elapsed_time": "1:52:11", "remaining_time": "1:36:36", "throughput": 987.93, "total_tokens": 6650480} {"current_steps": 1430, "total_steps": 2652, "loss": 0.7059, "learning_rate": 2.192779273338215e-05, "epoch": 1.078024877497173, "percentage": 53.92, "elapsed_time": "1:52:35", "remaining_time": "1:36:12", "throughput": 987.95, "total_tokens": 6673808} {"current_steps": 1435, "total_steps": 2652, "loss": 0.7389, "learning_rate": 2.1780893251279626e-05, "epoch": 1.0817941952506596, "percentage": 54.11, "elapsed_time": "1:52:58", "remaining_time": "1:35:49", "throughput": 987.96, "total_tokens": 6697232} {"current_steps": 1440, "total_steps": 2652, "loss": 0.5858, "learning_rate": 2.163410670372652e-05, "epoch": 1.0855635130041463, "percentage": 54.3, "elapsed_time": "1:53:22", "remaining_time": "1:35:25", "throughput": 988.03, "total_tokens": 6721104} {"current_steps": 1445, "total_steps": 2652, "loss": 0.6743, "learning_rate": 2.148743824037269e-05, "epoch": 1.0893328307576329, "percentage": 54.49, "elapsed_time": "1:53:46", "remaining_time": "1:35:01", "throughput": 988.05, "total_tokens": 6744624} {"current_steps": 1450, "total_steps": 2652, "loss": 0.5893, "learning_rate": 2.1340893006725288e-05, "epoch": 1.0931021485111194, "percentage": 54.68, "elapsed_time": "1:54:09", "remaining_time": "1:34:38", "throughput": 988.08, "total_tokens": 6768000} {"current_steps": 1455, "total_steps": 2652, "loss": 0.653, "learning_rate": 2.1194476143968258e-05, "epoch": 1.0968714662646062, "percentage": 54.86, "elapsed_time": "1:54:33", "remaining_time": "1:34:14", "throughput": 988.1, "total_tokens": 6791296} {"current_steps": 1460, "total_steps": 2652, "loss": 0.6829, "learning_rate": 2.1048192788781977e-05, "epoch": 1.1006407840180927, "percentage": 55.05, "elapsed_time": "1:54:56", "remaining_time": "1:33:50", "throughput": 988.13, "total_tokens": 6814800} {"current_steps": 1465, "total_steps": 2652, "loss": 0.5642, "learning_rate": 2.090204807316301e-05, "epoch": 1.1044101017715793, "percentage": 55.24, "elapsed_time": "1:55:19", "remaining_time": "1:33:26", "throughput": 988.18, "total_tokens": 6838128} {"current_steps": 1470, "total_steps": 2652, "loss": 0.6401, "learning_rate": 2.0756047124244095e-05, "epoch": 1.108179419525066, "percentage": 55.43, "elapsed_time": "1:55:43", "remaining_time": "1:33:03", "throughput": 988.18, "total_tokens": 6861312} {"current_steps": 1475, "total_steps": 2652, "loss": 0.6188, "learning_rate": 2.0610195064114273e-05, "epoch": 1.1119487372785526, "percentage": 55.62, "elapsed_time": "1:56:06", "remaining_time": "1:32:39", "throughput": 988.11, "total_tokens": 6884128} {"current_steps": 1480, "total_steps": 2652, "loss": 0.5929, "learning_rate": 2.0464497009639176e-05, "epoch": 1.1157180550320391, "percentage": 55.81, "elapsed_time": "1:56:30", "remaining_time": "1:32:15", "throughput": 988.25, "total_tokens": 6908336} {"current_steps": 1485, "total_steps": 2652, "loss": 0.7596, "learning_rate": 2.0318958072281517e-05, "epoch": 1.119487372785526, "percentage": 56.0, "elapsed_time": "1:56:53", "remaining_time": "1:31:51", "throughput": 988.24, "total_tokens": 6931392} {"current_steps": 1490, "total_steps": 2652, "loss": 0.6313, "learning_rate": 2.017358335792178e-05, "epoch": 1.1232566905390124, "percentage": 56.18, "elapsed_time": "1:57:17", "remaining_time": "1:31:28", "throughput": 988.22, "total_tokens": 6954800} {"current_steps": 1495, "total_steps": 2652, "loss": 0.6371, "learning_rate": 2.0028377966679092e-05, "epoch": 1.127026008292499, "percentage": 56.37, "elapsed_time": "1:57:41", "remaining_time": "1:31:04", "throughput": 988.23, "total_tokens": 6978384} {"current_steps": 1500, "total_steps": 2652, "loss": 0.6982, "learning_rate": 1.9883346992732256e-05, "epoch": 1.1307953260459858, "percentage": 56.56, "elapsed_time": "1:58:05", "remaining_time": "1:30:41", "throughput": 988.2, "total_tokens": 7001632} {"current_steps": 1505, "total_steps": 2652, "loss": 0.7299, "learning_rate": 1.9738495524141098e-05, "epoch": 1.1345646437994723, "percentage": 56.75, "elapsed_time": "1:58:29", "remaining_time": "1:30:18", "throughput": 988.1, "total_tokens": 7024768} {"current_steps": 1510, "total_steps": 2652, "loss": 0.6548, "learning_rate": 1.9593828642667928e-05, "epoch": 1.1383339615529589, "percentage": 56.94, "elapsed_time": "1:58:52", "remaining_time": "1:29:54", "throughput": 988.17, "total_tokens": 7047936} {"current_steps": 1515, "total_steps": 2652, "loss": 0.8541, "learning_rate": 1.944935142359926e-05, "epoch": 1.1421032793064456, "percentage": 57.13, "elapsed_time": "1:59:15", "remaining_time": "1:29:30", "throughput": 988.13, "total_tokens": 7070672} {"current_steps": 1520, "total_steps": 2652, "loss": 0.6746, "learning_rate": 1.9305068935567767e-05, "epoch": 1.1458725970599322, "percentage": 57.32, "elapsed_time": "1:59:38", "remaining_time": "1:29:06", "throughput": 988.12, "total_tokens": 7093616} {"current_steps": 1525, "total_steps": 2652, "loss": 0.7696, "learning_rate": 1.9160986240374445e-05, "epoch": 1.1496419148134187, "percentage": 57.5, "elapsed_time": "2:00:02", "remaining_time": "1:28:42", "throughput": 988.11, "total_tokens": 7116560} {"current_steps": 1530, "total_steps": 2652, "loss": 0.7202, "learning_rate": 1.9017108392811065e-05, "epoch": 1.1534112325669055, "percentage": 57.69, "elapsed_time": "2:00:25", "remaining_time": "1:28:18", "throughput": 988.17, "total_tokens": 7140224} {"current_steps": 1535, "total_steps": 2652, "loss": 0.7255, "learning_rate": 1.887344044048278e-05, "epoch": 1.157180550320392, "percentage": 57.88, "elapsed_time": "2:00:49", "remaining_time": "1:27:55", "throughput": 988.19, "total_tokens": 7163696} {"current_steps": 1540, "total_steps": 2652, "loss": 0.5598, "learning_rate": 1.8729987423631128e-05, "epoch": 1.1609498680738786, "percentage": 58.07, "elapsed_time": "2:01:13", "remaining_time": "1:27:31", "throughput": 988.21, "total_tokens": 7187376} {"current_steps": 1545, "total_steps": 2652, "loss": 0.6163, "learning_rate": 1.8586754374957112e-05, "epoch": 1.1647191858273653, "percentage": 58.26, "elapsed_time": "2:01:36", "remaining_time": "1:27:07", "throughput": 988.23, "total_tokens": 7210576} {"current_steps": 1550, "total_steps": 2652, "loss": 0.6024, "learning_rate": 1.8443746319444717e-05, "epoch": 1.1684885035808519, "percentage": 58.45, "elapsed_time": "2:01:59", "remaining_time": "1:26:44", "throughput": 988.23, "total_tokens": 7233824} {"current_steps": 1555, "total_steps": 2652, "loss": 0.7974, "learning_rate": 1.830096827418456e-05, "epoch": 1.1722578213343384, "percentage": 58.63, "elapsed_time": "2:02:23", "remaining_time": "1:26:20", "throughput": 988.24, "total_tokens": 7257248} {"current_steps": 1560, "total_steps": 2652, "loss": 0.6738, "learning_rate": 1.815842524819793e-05, "epoch": 1.1760271390878252, "percentage": 58.82, "elapsed_time": "2:02:47", "remaining_time": "1:25:57", "throughput": 988.26, "total_tokens": 7281040} {"current_steps": 1565, "total_steps": 2652, "loss": 0.7753, "learning_rate": 1.8016122242261024e-05, "epoch": 1.1797964568413117, "percentage": 59.01, "elapsed_time": "2:03:11", "remaining_time": "1:25:33", "throughput": 988.23, "total_tokens": 7304592} {"current_steps": 1570, "total_steps": 2652, "loss": 0.6555, "learning_rate": 1.787406424872952e-05, "epoch": 1.1835657745947983, "percentage": 59.2, "elapsed_time": "2:03:34", "remaining_time": "1:25:10", "throughput": 988.27, "total_tokens": 7327840} {"current_steps": 1575, "total_steps": 2652, "loss": 0.5336, "learning_rate": 1.7732256251363433e-05, "epoch": 1.187335092348285, "percentage": 59.39, "elapsed_time": "2:03:58", "remaining_time": "1:24:46", "throughput": 988.29, "total_tokens": 7351024} {"current_steps": 1580, "total_steps": 2652, "loss": 0.5507, "learning_rate": 1.7590703225152266e-05, "epoch": 1.1911044101017716, "percentage": 59.58, "elapsed_time": "2:04:21", "remaining_time": "1:24:22", "throughput": 988.29, "total_tokens": 7373824} {"current_steps": 1585, "total_steps": 2652, "loss": 0.5809, "learning_rate": 1.744941013614047e-05, "epoch": 1.1948737278552581, "percentage": 59.77, "elapsed_time": "2:04:45", "remaining_time": "1:23:59", "throughput": 988.29, "total_tokens": 7397648} {"current_steps": 1590, "total_steps": 2652, "loss": 0.7303, "learning_rate": 1.7308381941253253e-05, "epoch": 1.198643045608745, "percentage": 59.95, "elapsed_time": "2:05:08", "remaining_time": "1:23:35", "throughput": 988.3, "total_tokens": 7421104} {"current_steps": 1595, "total_steps": 2652, "loss": 0.6493, "learning_rate": 1.716762358812263e-05, "epoch": 1.2024123633622315, "percentage": 60.14, "elapsed_time": "2:05:32", "remaining_time": "1:23:11", "throughput": 988.29, "total_tokens": 7444128} {"current_steps": 1600, "total_steps": 2652, "loss": 0.5308, "learning_rate": 1.7027140014913897e-05, "epoch": 1.206181681115718, "percentage": 60.33, "elapsed_time": "2:05:55", "remaining_time": "1:22:47", "throughput": 988.3, "total_tokens": 7467152} {"current_steps": 1605, "total_steps": 2652, "loss": 0.6573, "learning_rate": 1.6886936150152325e-05, "epoch": 1.2099509988692048, "percentage": 60.52, "elapsed_time": "2:06:20", "remaining_time": "1:22:24", "throughput": 988.16, "total_tokens": 7490320} {"current_steps": 1610, "total_steps": 2652, "loss": 0.6721, "learning_rate": 1.674701691255034e-05, "epoch": 1.2137203166226913, "percentage": 60.71, "elapsed_time": "2:06:43", "remaining_time": "1:22:00", "throughput": 988.15, "total_tokens": 7513312} {"current_steps": 1615, "total_steps": 2652, "loss": 0.7255, "learning_rate": 1.6607387210834887e-05, "epoch": 1.2174896343761779, "percentage": 60.9, "elapsed_time": "2:07:06", "remaining_time": "1:21:37", "throughput": 988.17, "total_tokens": 7536752} {"current_steps": 1620, "total_steps": 2652, "loss": 0.6997, "learning_rate": 1.646805194357524e-05, "epoch": 1.2212589521296646, "percentage": 61.09, "elapsed_time": "2:07:30", "remaining_time": "1:21:13", "throughput": 988.15, "total_tokens": 7559872} {"current_steps": 1625, "total_steps": 2652, "loss": 0.7311, "learning_rate": 1.6329015999011183e-05, "epoch": 1.2250282698831512, "percentage": 61.27, "elapsed_time": "2:07:54", "remaining_time": "1:20:50", "throughput": 988.14, "total_tokens": 7583456} {"current_steps": 1630, "total_steps": 2652, "loss": 0.6106, "learning_rate": 1.6190284254881466e-05, "epoch": 1.2287975876366377, "percentage": 61.46, "elapsed_time": "2:08:17", "remaining_time": "1:20:26", "throughput": 988.15, "total_tokens": 7606608} {"current_steps": 1635, "total_steps": 2652, "loss": 0.6203, "learning_rate": 1.6051861578252718e-05, "epoch": 1.2325669053901245, "percentage": 61.65, "elapsed_time": "2:08:41", "remaining_time": "1:20:02", "throughput": 988.13, "total_tokens": 7629744} {"current_steps": 1640, "total_steps": 2652, "loss": 0.611, "learning_rate": 1.5913752825348675e-05, "epoch": 1.236336223143611, "percentage": 61.84, "elapsed_time": "2:09:05", "remaining_time": "1:19:39", "throughput": 988.11, "total_tokens": 7653200} {"current_steps": 1645, "total_steps": 2652, "loss": 0.5812, "learning_rate": 1.5775962841379818e-05, "epoch": 1.2401055408970976, "percentage": 62.03, "elapsed_time": "2:09:28", "remaining_time": "1:19:15", "throughput": 988.08, "total_tokens": 7676352} {"current_steps": 1650, "total_steps": 2652, "loss": 0.7053, "learning_rate": 1.5638496460373413e-05, "epoch": 1.2438748586505843, "percentage": 62.22, "elapsed_time": "2:09:52", "remaining_time": "1:18:52", "throughput": 988.09, "total_tokens": 7699488} {"current_steps": 1655, "total_steps": 2652, "loss": 0.6876, "learning_rate": 1.5501358505003874e-05, "epoch": 1.2476441764040709, "percentage": 62.41, "elapsed_time": "2:10:15", "remaining_time": "1:18:28", "throughput": 988.09, "total_tokens": 7722720} {"current_steps": 1660, "total_steps": 2652, "loss": 0.6504, "learning_rate": 1.5364553786423623e-05, "epoch": 1.2514134941575574, "percentage": 62.59, "elapsed_time": "2:10:39", "remaining_time": "1:18:04", "throughput": 988.12, "total_tokens": 7746448} {"current_steps": 1665, "total_steps": 2652, "loss": 0.5559, "learning_rate": 1.5228087104094261e-05, "epoch": 1.2551828119110442, "percentage": 62.78, "elapsed_time": "2:11:03", "remaining_time": "1:17:41", "throughput": 988.14, "total_tokens": 7769824} {"current_steps": 1670, "total_steps": 2652, "loss": 0.6128, "learning_rate": 1.5091963245618224e-05, "epoch": 1.2589521296645307, "percentage": 62.97, "elapsed_time": "2:11:26", "remaining_time": "1:17:17", "throughput": 988.12, "total_tokens": 7793072} {"current_steps": 1675, "total_steps": 2652, "loss": 0.7294, "learning_rate": 1.495618698657078e-05, "epoch": 1.2627214474180173, "percentage": 63.16, "elapsed_time": "2:11:50", "remaining_time": "1:16:54", "throughput": 988.08, "total_tokens": 7816448} {"current_steps": 1680, "total_steps": 2652, "loss": 0.7042, "learning_rate": 1.482076309033254e-05, "epoch": 1.266490765171504, "percentage": 63.35, "elapsed_time": "2:12:14", "remaining_time": "1:16:30", "throughput": 988.11, "total_tokens": 7839712} {"current_steps": 1685, "total_steps": 2652, "loss": 0.673, "learning_rate": 1.4685696307922312e-05, "epoch": 1.2702600829249906, "percentage": 63.54, "elapsed_time": "2:12:37", "remaining_time": "1:16:06", "throughput": 988.18, "total_tokens": 7863504} {"current_steps": 1690, "total_steps": 2652, "loss": 0.6719, "learning_rate": 1.4550991377830426e-05, "epoch": 1.2740294006784771, "percentage": 63.73, "elapsed_time": "2:13:01", "remaining_time": "1:15:43", "throughput": 988.17, "total_tokens": 7886720} {"current_steps": 1695, "total_steps": 2652, "loss": 0.5221, "learning_rate": 1.4416653025852498e-05, "epoch": 1.277798718431964, "percentage": 63.91, "elapsed_time": "2:13:25", "remaining_time": "1:15:19", "throughput": 988.11, "total_tokens": 7910032} {"current_steps": 1700, "total_steps": 2652, "loss": 0.576, "learning_rate": 1.4282685964923642e-05, "epoch": 1.2815680361854505, "percentage": 64.1, "elapsed_time": "2:13:48", "remaining_time": "1:14:56", "throughput": 988.1, "total_tokens": 7933408} {"current_steps": 1705, "total_steps": 2652, "loss": 0.7068, "learning_rate": 1.4149094894953157e-05, "epoch": 1.285337353938937, "percentage": 64.29, "elapsed_time": "2:14:13", "remaining_time": "1:14:32", "throughput": 987.98, "total_tokens": 7956400} {"current_steps": 1710, "total_steps": 2652, "loss": 0.7079, "learning_rate": 1.4015884502659573e-05, "epoch": 1.2891066716924238, "percentage": 64.48, "elapsed_time": "2:14:36", "remaining_time": "1:14:09", "throughput": 987.97, "total_tokens": 7979536} {"current_steps": 1715, "total_steps": 2652, "loss": 0.6605, "learning_rate": 1.3883059461406294e-05, "epoch": 1.2928759894459103, "percentage": 64.67, "elapsed_time": "2:15:00", "remaining_time": "1:13:45", "throughput": 987.99, "total_tokens": 8002992} {"current_steps": 1720, "total_steps": 2652, "loss": 0.7572, "learning_rate": 1.3750624431037581e-05, "epoch": 1.2966453071993969, "percentage": 64.86, "elapsed_time": "2:15:23", "remaining_time": "1:13:21", "throughput": 988.05, "total_tokens": 8026448} {"current_steps": 1725, "total_steps": 2652, "loss": 0.7231, "learning_rate": 1.3618584057715144e-05, "epoch": 1.3004146249528836, "percentage": 65.05, "elapsed_time": "2:15:46", "remaining_time": "1:12:57", "throughput": 988.06, "total_tokens": 8049392} {"current_steps": 1730, "total_steps": 2652, "loss": 0.5847, "learning_rate": 1.3486942973755101e-05, "epoch": 1.3041839427063702, "percentage": 65.23, "elapsed_time": "2:16:10", "remaining_time": "1:12:34", "throughput": 988.11, "total_tokens": 8072992} {"current_steps": 1735, "total_steps": 2652, "loss": 0.4926, "learning_rate": 1.3355705797465462e-05, "epoch": 1.3079532604598567, "percentage": 65.42, "elapsed_time": "2:16:33", "remaining_time": "1:12:10", "throughput": 988.13, "total_tokens": 8096464} {"current_steps": 1740, "total_steps": 2652, "loss": 0.7734, "learning_rate": 1.3224877132984132e-05, "epoch": 1.3117225782133435, "percentage": 65.61, "elapsed_time": "2:16:56", "remaining_time": "1:11:46", "throughput": 988.22, "total_tokens": 8120048} {"current_steps": 1745, "total_steps": 2652, "loss": 0.52, "learning_rate": 1.3094461570117356e-05, "epoch": 1.31549189596683, "percentage": 65.8, "elapsed_time": "2:17:20", "remaining_time": "1:11:23", "throughput": 988.22, "total_tokens": 8143104} {"current_steps": 1750, "total_steps": 2652, "loss": 0.5911, "learning_rate": 1.296446368417871e-05, "epoch": 1.3192612137203166, "percentage": 65.99, "elapsed_time": "2:17:43", "remaining_time": "1:10:59", "throughput": 988.24, "total_tokens": 8166624} {"current_steps": 1755, "total_steps": 2652, "loss": 0.682, "learning_rate": 1.2834888035828596e-05, "epoch": 1.3230305314738033, "percentage": 66.18, "elapsed_time": "2:18:07", "remaining_time": "1:10:36", "throughput": 988.29, "total_tokens": 8190800} {"current_steps": 1760, "total_steps": 2652, "loss": 0.4787, "learning_rate": 1.2705739170914238e-05, "epoch": 1.3267998492272899, "percentage": 66.37, "elapsed_time": "2:18:31", "remaining_time": "1:10:12", "throughput": 988.27, "total_tokens": 8213840} {"current_steps": 1765, "total_steps": 2652, "loss": 0.6678, "learning_rate": 1.2577021620310192e-05, "epoch": 1.3305691669807764, "percentage": 66.55, "elapsed_time": "2:18:55", "remaining_time": "1:09:48", "throughput": 988.31, "total_tokens": 8237840} {"current_steps": 1770, "total_steps": 2652, "loss": 0.7067, "learning_rate": 1.2448739899759398e-05, "epoch": 1.3343384847342632, "percentage": 66.74, "elapsed_time": "2:19:19", "remaining_time": "1:09:25", "throughput": 988.28, "total_tokens": 8261216} {"current_steps": 1775, "total_steps": 2652, "loss": 0.619, "learning_rate": 1.232089850971477e-05, "epoch": 1.3381078024877497, "percentage": 66.93, "elapsed_time": "2:19:43", "remaining_time": "1:09:01", "throughput": 988.22, "total_tokens": 8284304} {"current_steps": 1780, "total_steps": 2652, "loss": 0.571, "learning_rate": 1.2193501935181264e-05, "epoch": 1.3418771202412363, "percentage": 67.12, "elapsed_time": "2:20:06", "remaining_time": "1:08:38", "throughput": 988.22, "total_tokens": 8307360} {"current_steps": 1785, "total_steps": 2652, "loss": 0.5191, "learning_rate": 1.2066554645558578e-05, "epoch": 1.345646437994723, "percentage": 67.31, "elapsed_time": "2:20:29", "remaining_time": "1:08:14", "throughput": 988.2, "total_tokens": 8330480} {"current_steps": 1790, "total_steps": 2652, "loss": 0.545, "learning_rate": 1.1940061094484365e-05, "epoch": 1.3494157557482096, "percentage": 67.5, "elapsed_time": "2:20:53", "remaining_time": "1:07:50", "throughput": 988.24, "total_tokens": 8354208} {"current_steps": 1795, "total_steps": 2652, "loss": 0.5501, "learning_rate": 1.181402571967793e-05, "epoch": 1.3531850735016961, "percentage": 67.68, "elapsed_time": "2:21:17", "remaining_time": "1:07:27", "throughput": 988.28, "total_tokens": 8377936} {"current_steps": 1800, "total_steps": 2652, "loss": 0.5564, "learning_rate": 1.1688452942784591e-05, "epoch": 1.356954391255183, "percentage": 67.87, "elapsed_time": "2:21:40", "remaining_time": "1:07:03", "throughput": 988.28, "total_tokens": 8401120} {"current_steps": 1805, "total_steps": 2652, "loss": 0.6894, "learning_rate": 1.156334716922052e-05, "epoch": 1.3607237090086695, "percentage": 68.06, "elapsed_time": "2:22:04", "remaining_time": "1:06:40", "throughput": 988.27, "total_tokens": 8424704} {"current_steps": 1810, "total_steps": 2652, "loss": 0.6809, "learning_rate": 1.1438712788018233e-05, "epoch": 1.364493026762156, "percentage": 68.25, "elapsed_time": "2:22:28", "remaining_time": "1:06:16", "throughput": 988.32, "total_tokens": 8448784} {"current_steps": 1815, "total_steps": 2652, "loss": 0.7183, "learning_rate": 1.1314554171672578e-05, "epoch": 1.3682623445156428, "percentage": 68.44, "elapsed_time": "2:22:51", "remaining_time": "1:05:52", "throughput": 988.34, "total_tokens": 8471888} {"current_steps": 1820, "total_steps": 2652, "loss": 0.6292, "learning_rate": 1.1190875675987356e-05, "epoch": 1.3720316622691293, "percentage": 68.63, "elapsed_time": "2:23:15", "remaining_time": "1:05:29", "throughput": 988.34, "total_tokens": 8495168} {"current_steps": 1825, "total_steps": 2652, "loss": 0.6579, "learning_rate": 1.1067681639922486e-05, "epoch": 1.3758009800226159, "percentage": 68.82, "elapsed_time": "2:23:39", "remaining_time": "1:05:05", "throughput": 988.37, "total_tokens": 8518864} {"current_steps": 1830, "total_steps": 2652, "loss": 0.6564, "learning_rate": 1.0944976385441821e-05, "epoch": 1.3795702977761026, "percentage": 69.0, "elapsed_time": "2:24:02", "remaining_time": "1:04:42", "throughput": 988.32, "total_tokens": 8541904} {"current_steps": 1835, "total_steps": 2652, "loss": 0.5748, "learning_rate": 1.0822764217361462e-05, "epoch": 1.3833396155295892, "percentage": 69.19, "elapsed_time": "2:24:26", "remaining_time": "1:04:18", "throughput": 988.32, "total_tokens": 8565152} {"current_steps": 1840, "total_steps": 2652, "loss": 0.7318, "learning_rate": 1.0701049423198794e-05, "epoch": 1.3871089332830757, "percentage": 69.38, "elapsed_time": "2:24:49", "remaining_time": "1:03:54", "throughput": 988.34, "total_tokens": 8588448} {"current_steps": 1845, "total_steps": 2652, "loss": 0.6908, "learning_rate": 1.0579836273022045e-05, "epoch": 1.3908782510365625, "percentage": 69.57, "elapsed_time": "2:25:13", "remaining_time": "1:03:31", "throughput": 988.33, "total_tokens": 8611520} {"current_steps": 1850, "total_steps": 2652, "loss": 0.6769, "learning_rate": 1.0459129019300476e-05, "epoch": 1.394647568790049, "percentage": 69.76, "elapsed_time": "2:25:36", "remaining_time": "1:03:07", "throughput": 988.32, "total_tokens": 8634672} {"current_steps": 1855, "total_steps": 2652, "loss": 0.6782, "learning_rate": 1.03389318967552e-05, "epoch": 1.3984168865435356, "percentage": 69.95, "elapsed_time": "2:26:00", "remaining_time": "1:02:43", "throughput": 988.32, "total_tokens": 8657792} {"current_steps": 1860, "total_steps": 2652, "loss": 0.6511, "learning_rate": 1.021924912221062e-05, "epoch": 1.4021862042970223, "percentage": 70.14, "elapsed_time": "2:26:23", "remaining_time": "1:02:20", "throughput": 988.31, "total_tokens": 8681120} {"current_steps": 1865, "total_steps": 2652, "loss": 0.689, "learning_rate": 1.0100084894446455e-05, "epoch": 1.4059555220505089, "percentage": 70.32, "elapsed_time": "2:26:47", "remaining_time": "1:01:56", "throughput": 988.26, "total_tokens": 8704096} {"current_steps": 1870, "total_steps": 2652, "loss": 0.4842, "learning_rate": 9.981443394050525e-06, "epoch": 1.4097248398039954, "percentage": 70.51, "elapsed_time": "2:27:10", "remaining_time": "1:01:32", "throughput": 988.25, "total_tokens": 8727168} {"current_steps": 1875, "total_steps": 2652, "loss": 0.7458, "learning_rate": 9.863328783271989e-06, "epoch": 1.4134941575574822, "percentage": 70.7, "elapsed_time": "2:27:34", "remaining_time": "1:01:09", "throughput": 988.27, "total_tokens": 8750704} {"current_steps": 1880, "total_steps": 2652, "loss": 0.5579, "learning_rate": 9.745745205875373e-06, "epoch": 1.4172634753109687, "percentage": 70.89, "elapsed_time": "2:27:57", "remaining_time": "1:00:45", "throughput": 988.26, "total_tokens": 8773680} {"current_steps": 1885, "total_steps": 2652, "loss": 0.5636, "learning_rate": 9.62869678699519e-06, "epoch": 1.4210327930644553, "percentage": 71.08, "elapsed_time": "2:28:21", "remaining_time": "1:00:22", "throughput": 988.26, "total_tokens": 8797200} {"current_steps": 1890, "total_steps": 2652, "loss": 0.5483, "learning_rate": 9.512187632991192e-06, "epoch": 1.424802110817942, "percentage": 71.27, "elapsed_time": "2:28:45", "remaining_time": "0:59:58", "throughput": 988.3, "total_tokens": 8820832} {"current_steps": 1895, "total_steps": 2652, "loss": 0.6082, "learning_rate": 9.396221831304364e-06, "epoch": 1.4285714285714286, "percentage": 71.46, "elapsed_time": "2:29:08", "remaining_time": "0:59:34", "throughput": 988.3, "total_tokens": 8844096} {"current_steps": 1900, "total_steps": 2652, "loss": 0.6085, "learning_rate": 9.28080345031347e-06, "epoch": 1.4323407463249151, "percentage": 71.64, "elapsed_time": "2:29:32", "remaining_time": "0:59:11", "throughput": 988.3, "total_tokens": 8867264} {"current_steps": 1905, "total_steps": 2652, "loss": 0.5687, "learning_rate": 9.165936539192358e-06, "epoch": 1.436110064078402, "percentage": 71.83, "elapsed_time": "2:29:56", "remaining_time": "0:58:47", "throughput": 988.27, "total_tokens": 8890896} {"current_steps": 1910, "total_steps": 2652, "loss": 0.5493, "learning_rate": 9.05162512776789e-06, "epoch": 1.4398793818318885, "percentage": 72.02, "elapsed_time": "2:30:19", "remaining_time": "0:58:24", "throughput": 988.24, "total_tokens": 8913712} {"current_steps": 1915, "total_steps": 2652, "loss": 0.6865, "learning_rate": 8.937873226378582e-06, "epoch": 1.443648699585375, "percentage": 72.21, "elapsed_time": "2:30:43", "remaining_time": "0:58:00", "throughput": 988.29, "total_tokens": 8937536} {"current_steps": 1920, "total_steps": 2652, "loss": 0.6156, "learning_rate": 8.824684825733865e-06, "epoch": 1.4474180173388618, "percentage": 72.4, "elapsed_time": "2:31:06", "remaining_time": "0:57:36", "throughput": 988.29, "total_tokens": 8960752} {"current_steps": 1925, "total_steps": 2652, "loss": 0.7309, "learning_rate": 8.712063896774145e-06, "epoch": 1.4511873350923483, "percentage": 72.59, "elapsed_time": "2:31:29", "remaining_time": "0:57:12", "throughput": 988.31, "total_tokens": 8983760} {"current_steps": 1930, "total_steps": 2652, "loss": 0.5862, "learning_rate": 8.60001439053145e-06, "epoch": 1.4549566528458349, "percentage": 72.78, "elapsed_time": "2:31:53", "remaining_time": "0:56:49", "throughput": 988.31, "total_tokens": 9006688} {"current_steps": 1935, "total_steps": 2652, "loss": 0.6271, "learning_rate": 8.488540237990828e-06, "epoch": 1.4587259705993216, "percentage": 72.96, "elapsed_time": "2:32:16", "remaining_time": "0:56:25", "throughput": 988.33, "total_tokens": 9030112} {"current_steps": 1940, "total_steps": 2652, "loss": 0.6465, "learning_rate": 8.37764534995244e-06, "epoch": 1.4624952883528082, "percentage": 73.15, "elapsed_time": "2:32:40", "remaining_time": "0:56:01", "throughput": 988.38, "total_tokens": 9054000} {"current_steps": 1945, "total_steps": 2652, "loss": 0.4938, "learning_rate": 8.267333616894363e-06, "epoch": 1.4662646061062947, "percentage": 73.34, "elapsed_time": "2:33:04", "remaining_time": "0:55:38", "throughput": 988.42, "total_tokens": 9078032} {"current_steps": 1950, "total_steps": 2652, "loss": 0.3723, "learning_rate": 8.15760890883607e-06, "epoch": 1.4700339238597815, "percentage": 73.53, "elapsed_time": "2:33:27", "remaining_time": "0:55:14", "throughput": 988.43, "total_tokens": 9101488} {"current_steps": 1955, "total_steps": 2652, "loss": 0.574, "learning_rate": 8.048475075202727e-06, "epoch": 1.473803241613268, "percentage": 73.72, "elapsed_time": "2:33:51", "remaining_time": "0:54:51", "throughput": 988.39, "total_tokens": 9124464} {"current_steps": 1960, "total_steps": 2652, "loss": 0.6388, "learning_rate": 7.939935944690077e-06, "epoch": 1.4775725593667546, "percentage": 73.91, "elapsed_time": "2:34:15", "remaining_time": "0:54:27", "throughput": 988.38, "total_tokens": 9147616} {"current_steps": 1965, "total_steps": 2652, "loss": 0.6665, "learning_rate": 7.831995325130153e-06, "epoch": 1.4813418771202413, "percentage": 74.1, "elapsed_time": "2:34:38", "remaining_time": "0:54:03", "throughput": 988.37, "total_tokens": 9170624} {"current_steps": 1970, "total_steps": 2652, "loss": 0.6963, "learning_rate": 7.724657003357696e-06, "epoch": 1.485111194873728, "percentage": 74.28, "elapsed_time": "2:35:02", "remaining_time": "0:53:40", "throughput": 988.35, "total_tokens": 9193808} {"current_steps": 1975, "total_steps": 2652, "loss": 0.626, "learning_rate": 7.617924745077259e-06, "epoch": 1.4888805126272144, "percentage": 74.47, "elapsed_time": "2:35:25", "remaining_time": "0:53:16", "throughput": 988.37, "total_tokens": 9216880} {"current_steps": 1980, "total_steps": 2652, "loss": 0.6302, "learning_rate": 7.51180229473116e-06, "epoch": 1.4926498303807012, "percentage": 74.66, "elapsed_time": "2:35:48", "remaining_time": "0:52:52", "throughput": 988.38, "total_tokens": 9240080} {"current_steps": 1985, "total_steps": 2652, "loss": 0.6275, "learning_rate": 7.406293375368067e-06, "epoch": 1.4964191481341877, "percentage": 74.85, "elapsed_time": "2:36:11", "remaining_time": "0:52:29", "throughput": 988.41, "total_tokens": 9263216} {"current_steps": 1990, "total_steps": 2652, "loss": 0.5228, "learning_rate": 7.301401688512416e-06, "epoch": 1.5001884658876743, "percentage": 75.04, "elapsed_time": "2:36:35", "remaining_time": "0:52:05", "throughput": 988.47, "total_tokens": 9287088} {"current_steps": 1995, "total_steps": 2652, "loss": 0.6225, "learning_rate": 7.197130914034522e-06, "epoch": 1.503957783641161, "percentage": 75.23, "elapsed_time": "2:36:59", "remaining_time": "0:51:41", "throughput": 988.47, "total_tokens": 9310480} {"current_steps": 2000, "total_steps": 2652, "loss": 0.5698, "learning_rate": 7.0934847100215195e-06, "epoch": 1.5077271013946476, "percentage": 75.41, "elapsed_time": "2:37:22", "remaining_time": "0:51:18", "throughput": 988.49, "total_tokens": 9333520} {"current_steps": 2005, "total_steps": 2652, "loss": 0.5032, "learning_rate": 6.9904667126489685e-06, "epoch": 1.5114964191481342, "percentage": 75.6, "elapsed_time": "2:37:46", "remaining_time": "0:50:54", "throughput": 988.41, "total_tokens": 9356928} {"current_steps": 2010, "total_steps": 2652, "loss": 0.6599, "learning_rate": 6.888080536053351e-06, "epoch": 1.515265736901621, "percentage": 75.79, "elapsed_time": "2:38:10", "remaining_time": "0:50:31", "throughput": 988.44, "total_tokens": 9380672} {"current_steps": 2015, "total_steps": 2652, "loss": 0.6288, "learning_rate": 6.786329772205247e-06, "epoch": 1.5190350546551075, "percentage": 75.98, "elapsed_time": "2:38:33", "remaining_time": "0:50:07", "throughput": 988.46, "total_tokens": 9403888} {"current_steps": 2020, "total_steps": 2652, "loss": 0.5918, "learning_rate": 6.68521799078331e-06, "epoch": 1.522804372408594, "percentage": 76.17, "elapsed_time": "2:38:57", "remaining_time": "0:49:43", "throughput": 988.48, "total_tokens": 9427312} {"current_steps": 2025, "total_steps": 2652, "loss": 0.5564, "learning_rate": 6.58474873904906e-06, "epoch": 1.5265736901620808, "percentage": 76.36, "elapsed_time": "2:39:20", "remaining_time": "0:49:20", "throughput": 988.46, "total_tokens": 9450416} {"current_steps": 2030, "total_steps": 2652, "loss": 0.6373, "learning_rate": 6.484925541722417e-06, "epoch": 1.5303430079155673, "percentage": 76.55, "elapsed_time": "2:39:44", "remaining_time": "0:48:56", "throughput": 988.49, "total_tokens": 9474080} {"current_steps": 2035, "total_steps": 2652, "loss": 0.6829, "learning_rate": 6.385751900858031e-06, "epoch": 1.5341123256690539, "percentage": 76.73, "elapsed_time": "2:40:08", "remaining_time": "0:48:33", "throughput": 988.5, "total_tokens": 9497584} {"current_steps": 2040, "total_steps": 2652, "loss": 0.5933, "learning_rate": 6.28723129572247e-06, "epoch": 1.5378816434225406, "percentage": 76.92, "elapsed_time": "2:40:31", "remaining_time": "0:48:09", "throughput": 988.49, "total_tokens": 9520832} {"current_steps": 2045, "total_steps": 2652, "loss": 0.6933, "learning_rate": 6.189367182672115e-06, "epoch": 1.5416509611760272, "percentage": 77.11, "elapsed_time": "2:40:55", "remaining_time": "0:47:45", "throughput": 988.52, "total_tokens": 9544480} {"current_steps": 2050, "total_steps": 2652, "loss": 0.5513, "learning_rate": 6.092162995031911e-06, "epoch": 1.5454202789295137, "percentage": 77.3, "elapsed_time": "2:41:19", "remaining_time": "0:47:22", "throughput": 988.52, "total_tokens": 9567888} {"current_steps": 2055, "total_steps": 2652, "loss": 0.5939, "learning_rate": 5.99562214297493e-06, "epoch": 1.5491895966830005, "percentage": 77.49, "elapsed_time": "2:41:42", "remaining_time": "0:46:58", "throughput": 988.51, "total_tokens": 9590688} {"current_steps": 2060, "total_steps": 2652, "loss": 0.6753, "learning_rate": 5.899748013402706e-06, "epoch": 1.552958914436487, "percentage": 77.68, "elapsed_time": "2:42:05", "remaining_time": "0:46:34", "throughput": 988.49, "total_tokens": 9613376} {"current_steps": 2065, "total_steps": 2652, "loss": 0.7191, "learning_rate": 5.804543969826453e-06, "epoch": 1.5567282321899736, "percentage": 77.87, "elapsed_time": "2:42:28", "remaining_time": "0:46:11", "throughput": 988.54, "total_tokens": 9636608} {"current_steps": 2070, "total_steps": 2652, "loss": 0.6538, "learning_rate": 5.710013352249038e-06, "epoch": 1.5604975499434603, "percentage": 78.05, "elapsed_time": "2:42:51", "remaining_time": "0:45:47", "throughput": 988.57, "total_tokens": 9659888} {"current_steps": 2075, "total_steps": 2652, "loss": 0.5668, "learning_rate": 5.616159477047806e-06, "epoch": 1.564266867696947, "percentage": 78.24, "elapsed_time": "2:43:15", "remaining_time": "0:45:23", "throughput": 988.61, "total_tokens": 9683520} {"current_steps": 2080, "total_steps": 2652, "loss": 0.6383, "learning_rate": 5.522985636858239e-06, "epoch": 1.5680361854504334, "percentage": 78.43, "elapsed_time": "2:43:38", "remaining_time": "0:45:00", "throughput": 988.59, "total_tokens": 9706384} {"current_steps": 2085, "total_steps": 2652, "loss": 0.7085, "learning_rate": 5.430495100458454e-06, "epoch": 1.5718055032039202, "percentage": 78.62, "elapsed_time": "2:44:02", "remaining_time": "0:44:36", "throughput": 988.58, "total_tokens": 9729760} {"current_steps": 2090, "total_steps": 2652, "loss": 0.5722, "learning_rate": 5.338691112654484e-06, "epoch": 1.5755748209574068, "percentage": 78.81, "elapsed_time": "2:44:25", "remaining_time": "0:44:12", "throughput": 988.57, "total_tokens": 9753200} {"current_steps": 2095, "total_steps": 2652, "loss": 0.549, "learning_rate": 5.247576894166495e-06, "epoch": 1.5793441387108933, "percentage": 79.0, "elapsed_time": "2:44:49", "remaining_time": "0:43:49", "throughput": 988.59, "total_tokens": 9776464} {"current_steps": 2100, "total_steps": 2652, "loss": 0.6631, "learning_rate": 5.157155641515765e-06, "epoch": 1.58311345646438, "percentage": 79.19, "elapsed_time": "2:45:12", "remaining_time": "0:43:25", "throughput": 988.62, "total_tokens": 9800160} {"current_steps": 2105, "total_steps": 2652, "loss": 0.5433, "learning_rate": 5.067430526912539e-06, "epoch": 1.5868827742178666, "percentage": 79.37, "elapsed_time": "2:45:37", "remaining_time": "0:43:02", "throughput": 988.59, "total_tokens": 9823616} {"current_steps": 2110, "total_steps": 2652, "loss": 0.6165, "learning_rate": 4.978404698144759e-06, "epoch": 1.5906520919713532, "percentage": 79.56, "elapsed_time": "2:46:00", "remaining_time": "0:42:38", "throughput": 988.63, "total_tokens": 9847264} {"current_steps": 2115, "total_steps": 2652, "loss": 0.6133, "learning_rate": 4.890081278467612e-06, "epoch": 1.59442140972484, "percentage": 79.75, "elapsed_time": "2:46:23", "remaining_time": "0:42:14", "throughput": 988.65, "total_tokens": 9870288} {"current_steps": 2120, "total_steps": 2652, "loss": 0.7198, "learning_rate": 4.80246336649397e-06, "epoch": 1.5981907274783265, "percentage": 79.94, "elapsed_time": "2:46:47", "remaining_time": "0:41:51", "throughput": 988.66, "total_tokens": 9893888} {"current_steps": 2125, "total_steps": 2652, "loss": 0.6391, "learning_rate": 4.715554036085673e-06, "epoch": 1.601960045231813, "percentage": 80.13, "elapsed_time": "2:47:11", "remaining_time": "0:41:27", "throughput": 988.69, "total_tokens": 9917680} {"current_steps": 2130, "total_steps": 2652, "loss": 0.6299, "learning_rate": 4.629356336245707e-06, "epoch": 1.6057293629852998, "percentage": 80.32, "elapsed_time": "2:47:34", "remaining_time": "0:41:04", "throughput": 988.72, "total_tokens": 9941200} {"current_steps": 2135, "total_steps": 2652, "loss": 0.5748, "learning_rate": 4.543873291011219e-06, "epoch": 1.6094986807387863, "percentage": 80.51, "elapsed_time": "2:47:58", "remaining_time": "0:40:40", "throughput": 988.71, "total_tokens": 9964368} {"current_steps": 2140, "total_steps": 2652, "loss": 0.5355, "learning_rate": 4.4591078993474395e-06, "epoch": 1.6132679984922729, "percentage": 80.69, "elapsed_time": "2:48:21", "remaining_time": "0:40:16", "throughput": 988.69, "total_tokens": 9987616} {"current_steps": 2145, "total_steps": 2652, "loss": 0.5919, "learning_rate": 4.375063135042445e-06, "epoch": 1.6170373162457596, "percentage": 80.88, "elapsed_time": "2:48:45", "remaining_time": "0:39:53", "throughput": 988.72, "total_tokens": 10010832} {"current_steps": 2150, "total_steps": 2652, "loss": 0.8046, "learning_rate": 4.291741946602873e-06, "epoch": 1.6208066339992462, "percentage": 81.07, "elapsed_time": "2:49:08", "remaining_time": "0:39:29", "throughput": 988.7, "total_tokens": 10033824} {"current_steps": 2155, "total_steps": 2652, "loss": 0.597, "learning_rate": 4.209147257150451e-06, "epoch": 1.6245759517527327, "percentage": 81.26, "elapsed_time": "2:49:31", "remaining_time": "0:39:05", "throughput": 988.72, "total_tokens": 10057184} {"current_steps": 2160, "total_steps": 2652, "loss": 0.5736, "learning_rate": 4.127281964319446e-06, "epoch": 1.6283452695062195, "percentage": 81.45, "elapsed_time": "2:49:55", "remaining_time": "0:38:42", "throughput": 988.74, "total_tokens": 10080256} {"current_steps": 2165, "total_steps": 2652, "loss": 0.596, "learning_rate": 4.04614894015502e-06, "epoch": 1.632114587259706, "percentage": 81.64, "elapsed_time": "2:50:18", "remaining_time": "0:38:18", "throughput": 988.72, "total_tokens": 10103312} {"current_steps": 2170, "total_steps": 2652, "loss": 0.6338, "learning_rate": 3.965751031012474e-06, "epoch": 1.6358839050131926, "percentage": 81.83, "elapsed_time": "2:50:42", "remaining_time": "0:37:55", "throughput": 988.72, "total_tokens": 10126768} {"current_steps": 2175, "total_steps": 2652, "loss": 0.6239, "learning_rate": 3.886091057457353e-06, "epoch": 1.6396532227666794, "percentage": 82.01, "elapsed_time": "2:51:05", "remaining_time": "0:37:31", "throughput": 988.74, "total_tokens": 10150160} {"current_steps": 2180, "total_steps": 2652, "loss": 0.7062, "learning_rate": 3.807171814166552e-06, "epoch": 1.643422540520166, "percentage": 82.2, "elapsed_time": "2:51:29", "remaining_time": "0:37:07", "throughput": 988.77, "total_tokens": 10173504} {"current_steps": 2185, "total_steps": 2652, "loss": 0.5942, "learning_rate": 3.728996069830232e-06, "epoch": 1.6471918582736524, "percentage": 82.39, "elapsed_time": "2:51:52", "remaining_time": "0:36:44", "throughput": 988.8, "total_tokens": 10197312} {"current_steps": 2190, "total_steps": 2652, "loss": 0.5095, "learning_rate": 3.6515665670546957e-06, "epoch": 1.6509611760271392, "percentage": 82.58, "elapsed_time": "2:52:16", "remaining_time": "0:36:20", "throughput": 988.83, "total_tokens": 10220656} {"current_steps": 2195, "total_steps": 2652, "loss": 0.664, "learning_rate": 3.574886022266172e-06, "epoch": 1.6547304937806258, "percentage": 82.77, "elapsed_time": "2:52:39", "remaining_time": "0:35:56", "throughput": 988.81, "total_tokens": 10243616} {"current_steps": 2200, "total_steps": 2652, "loss": 0.6661, "learning_rate": 3.4989571256155178e-06, "epoch": 1.6584998115341123, "percentage": 82.96, "elapsed_time": "2:53:02", "remaining_time": "0:35:33", "throughput": 988.8, "total_tokens": 10266256} {"current_steps": 2205, "total_steps": 2652, "loss": 0.6184, "learning_rate": 3.423782540883838e-06, "epoch": 1.662269129287599, "percentage": 83.14, "elapsed_time": "2:53:26", "remaining_time": "0:35:09", "throughput": 988.71, "total_tokens": 10289536} {"current_steps": 2210, "total_steps": 2652, "loss": 0.5606, "learning_rate": 3.3493649053890326e-06, "epoch": 1.6660384470410856, "percentage": 83.33, "elapsed_time": "2:53:50", "remaining_time": "0:34:46", "throughput": 988.7, "total_tokens": 10312624} {"current_steps": 2215, "total_steps": 2652, "loss": 0.5439, "learning_rate": 3.275706829893277e-06, "epoch": 1.6698077647945722, "percentage": 83.52, "elapsed_time": "2:54:13", "remaining_time": "0:34:22", "throughput": 988.74, "total_tokens": 10336192} {"current_steps": 2220, "total_steps": 2652, "loss": 0.5271, "learning_rate": 3.202810898511424e-06, "epoch": 1.673577082548059, "percentage": 83.71, "elapsed_time": "2:54:37", "remaining_time": "0:33:58", "throughput": 988.73, "total_tokens": 10359520} {"current_steps": 2225, "total_steps": 2652, "loss": 0.5794, "learning_rate": 3.1306796686203566e-06, "epoch": 1.6773464003015455, "percentage": 83.9, "elapsed_time": "2:55:01", "remaining_time": "0:33:35", "throughput": 988.69, "total_tokens": 10382288} {"current_steps": 2230, "total_steps": 2652, "loss": 0.6939, "learning_rate": 3.0593156707692444e-06, "epoch": 1.681115718055032, "percentage": 84.09, "elapsed_time": "2:55:24", "remaining_time": "0:33:11", "throughput": 988.71, "total_tokens": 10406032} {"current_steps": 2235, "total_steps": 2652, "loss": 0.6781, "learning_rate": 2.9887214085908e-06, "epoch": 1.6848850358085188, "percentage": 84.28, "elapsed_time": "2:55:48", "remaining_time": "0:32:48", "throughput": 988.75, "total_tokens": 10429504} {"current_steps": 2240, "total_steps": 2652, "loss": 0.6285, "learning_rate": 2.918899358713423e-06, "epoch": 1.6886543535620053, "percentage": 84.46, "elapsed_time": "2:56:11", "remaining_time": "0:32:24", "throughput": 988.75, "total_tokens": 10452848} {"current_steps": 2245, "total_steps": 2652, "loss": 0.6771, "learning_rate": 2.8498519706743166e-06, "epoch": 1.6924236713154919, "percentage": 84.65, "elapsed_time": "2:56:35", "remaining_time": "0:32:00", "throughput": 988.73, "total_tokens": 10476192} {"current_steps": 2250, "total_steps": 2652, "loss": 0.612, "learning_rate": 2.7815816668335494e-06, "epoch": 1.6961929890689786, "percentage": 84.84, "elapsed_time": "2:56:59", "remaining_time": "0:31:37", "throughput": 988.76, "total_tokens": 10499888} {"current_steps": 2255, "total_steps": 2652, "loss": 0.6568, "learning_rate": 2.714090842289088e-06, "epoch": 1.6999623068224652, "percentage": 85.03, "elapsed_time": "2:57:22", "remaining_time": "0:31:13", "throughput": 988.72, "total_tokens": 10522704} {"current_steps": 2260, "total_steps": 2652, "loss": 0.5911, "learning_rate": 2.6473818647927416e-06, "epoch": 1.7037316245759517, "percentage": 85.22, "elapsed_time": "2:57:46", "remaining_time": "0:30:50", "throughput": 988.72, "total_tokens": 10545792} {"current_steps": 2265, "total_steps": 2652, "loss": 0.6427, "learning_rate": 2.581457074667129e-06, "epoch": 1.7075009423294385, "percentage": 85.41, "elapsed_time": "2:58:09", "remaining_time": "0:30:26", "throughput": 988.74, "total_tokens": 10568880} {"current_steps": 2270, "total_steps": 2652, "loss": 0.4982, "learning_rate": 2.516318784723545e-06, "epoch": 1.711270260082925, "percentage": 85.6, "elapsed_time": "2:58:32", "remaining_time": "0:30:02", "throughput": 988.76, "total_tokens": 10592064} {"current_steps": 2275, "total_steps": 2652, "loss": 0.5204, "learning_rate": 2.451969280180849e-06, "epoch": 1.7150395778364116, "percentage": 85.78, "elapsed_time": "2:58:56", "remaining_time": "0:29:39", "throughput": 988.73, "total_tokens": 10615040} {"current_steps": 2280, "total_steps": 2652, "loss": 0.6076, "learning_rate": 2.388410818585263e-06, "epoch": 1.7188088955898984, "percentage": 85.97, "elapsed_time": "2:59:19", "remaining_time": "0:29:15", "throughput": 988.73, "total_tokens": 10638544} {"current_steps": 2285, "total_steps": 2652, "loss": 0.6799, "learning_rate": 2.325645629731196e-06, "epoch": 1.722578213343385, "percentage": 86.16, "elapsed_time": "2:59:43", "remaining_time": "0:28:51", "throughput": 988.72, "total_tokens": 10661456} {"current_steps": 2290, "total_steps": 2652, "loss": 0.6293, "learning_rate": 2.263675915583005e-06, "epoch": 1.7263475310968714, "percentage": 86.35, "elapsed_time": "3:00:06", "remaining_time": "0:28:28", "throughput": 988.71, "total_tokens": 10684704} {"current_steps": 2295, "total_steps": 2652, "loss": 0.4813, "learning_rate": 2.2025038501977486e-06, "epoch": 1.7301168488503582, "percentage": 86.54, "elapsed_time": "3:00:30", "remaining_time": "0:28:04", "throughput": 988.68, "total_tokens": 10707872} {"current_steps": 2300, "total_steps": 2652, "loss": 0.6269, "learning_rate": 2.1421315796489095e-06, "epoch": 1.7338861666038448, "percentage": 86.73, "elapsed_time": "3:00:54", "remaining_time": "0:27:41", "throughput": 988.67, "total_tokens": 10731024} {"current_steps": 2305, "total_steps": 2652, "loss": 0.6852, "learning_rate": 2.0825612219511126e-06, "epoch": 1.7376554843573313, "percentage": 86.92, "elapsed_time": "3:01:18", "remaining_time": "0:27:17", "throughput": 988.6, "total_tokens": 10754528} {"current_steps": 2310, "total_steps": 2652, "loss": 0.6111, "learning_rate": 2.023794866985823e-06, "epoch": 1.741424802110818, "percentage": 87.1, "elapsed_time": "3:01:42", "remaining_time": "0:26:54", "throughput": 988.59, "total_tokens": 10778080} {"current_steps": 2315, "total_steps": 2652, "loss": 0.6284, "learning_rate": 1.9658345764280053e-06, "epoch": 1.7451941198643046, "percentage": 87.29, "elapsed_time": "3:02:06", "remaining_time": "0:26:30", "throughput": 988.61, "total_tokens": 10801920} {"current_steps": 2320, "total_steps": 2652, "loss": 0.5381, "learning_rate": 1.9086823836738183e-06, "epoch": 1.7489634376177912, "percentage": 87.48, "elapsed_time": "3:02:30", "remaining_time": "0:26:07", "throughput": 988.62, "total_tokens": 10825968} {"current_steps": 2325, "total_steps": 2652, "loss": 0.5894, "learning_rate": 1.8523402937692723e-06, "epoch": 1.752732755371278, "percentage": 87.67, "elapsed_time": "3:02:54", "remaining_time": "0:25:43", "throughput": 988.63, "total_tokens": 10849504} {"current_steps": 2330, "total_steps": 2652, "loss": 0.5406, "learning_rate": 1.7968102833398836e-06, "epoch": 1.7565020731247643, "percentage": 87.86, "elapsed_time": "3:03:17", "remaining_time": "0:25:19", "throughput": 988.63, "total_tokens": 10872688} {"current_steps": 2335, "total_steps": 2652, "loss": 0.8542, "learning_rate": 1.7420943005213298e-06, "epoch": 1.760271390878251, "percentage": 88.05, "elapsed_time": "3:03:41", "remaining_time": "0:24:56", "throughput": 988.65, "total_tokens": 10896144} {"current_steps": 2340, "total_steps": 2652, "loss": 0.7438, "learning_rate": 1.6881942648911076e-06, "epoch": 1.7640407086317378, "percentage": 88.24, "elapsed_time": "3:04:04", "remaining_time": "0:24:32", "throughput": 988.66, "total_tokens": 10919472} {"current_steps": 2345, "total_steps": 2652, "loss": 0.5929, "learning_rate": 1.6351120674011788e-06, "epoch": 1.767810026385224, "percentage": 88.42, "elapsed_time": "3:04:28", "remaining_time": "0:24:09", "throughput": 988.66, "total_tokens": 10942976} {"current_steps": 2350, "total_steps": 2652, "loss": 0.6984, "learning_rate": 1.5828495703116424e-06, "epoch": 1.7715793441387109, "percentage": 88.61, "elapsed_time": "3:04:52", "remaining_time": "0:23:45", "throughput": 988.67, "total_tokens": 10966624} {"current_steps": 2355, "total_steps": 2652, "loss": 0.6263, "learning_rate": 1.5314086071254035e-06, "epoch": 1.7753486618921976, "percentage": 88.8, "elapsed_time": "3:05:15", "remaining_time": "0:23:21", "throughput": 988.66, "total_tokens": 10989824} {"current_steps": 2360, "total_steps": 2652, "loss": 0.646, "learning_rate": 1.4807909825238359e-06, "epoch": 1.779117979645684, "percentage": 88.99, "elapsed_time": "3:05:39", "remaining_time": "0:22:58", "throughput": 988.65, "total_tokens": 11013344} {"current_steps": 2365, "total_steps": 2652, "loss": 0.5548, "learning_rate": 1.4309984723034797e-06, "epoch": 1.7828872973991707, "percentage": 89.18, "elapsed_time": "3:06:03", "remaining_time": "0:22:34", "throughput": 988.64, "total_tokens": 11036912} {"current_steps": 2370, "total_steps": 2652, "loss": 0.8133, "learning_rate": 1.3820328233137391e-06, "epoch": 1.7866566151526575, "percentage": 89.37, "elapsed_time": "3:06:27", "remaining_time": "0:22:11", "throughput": 988.63, "total_tokens": 11060000} {"current_steps": 2375, "total_steps": 2652, "loss": 0.7866, "learning_rate": 1.3338957533956004e-06, "epoch": 1.7904259329061438, "percentage": 89.56, "elapsed_time": "3:06:51", "remaining_time": "0:21:47", "throughput": 988.63, "total_tokens": 11083632} {"current_steps": 2380, "total_steps": 2652, "loss": 0.6527, "learning_rate": 1.286588951321363e-06, "epoch": 1.7941952506596306, "percentage": 89.74, "elapsed_time": "3:07:14", "remaining_time": "0:21:23", "throughput": 988.62, "total_tokens": 11106512} {"current_steps": 2385, "total_steps": 2652, "loss": 0.6743, "learning_rate": 1.2401140767353853e-06, "epoch": 1.7979645684131174, "percentage": 89.93, "elapsed_time": "3:07:37", "remaining_time": "0:21:00", "throughput": 988.63, "total_tokens": 11129824} {"current_steps": 2390, "total_steps": 2652, "loss": 0.626, "learning_rate": 1.1944727600958827e-06, "epoch": 1.8017338861666037, "percentage": 90.12, "elapsed_time": "3:08:01", "remaining_time": "0:20:36", "throughput": 988.66, "total_tokens": 11153744} {"current_steps": 2395, "total_steps": 2652, "loss": 0.649, "learning_rate": 1.1496666026177021e-06, "epoch": 1.8055032039200904, "percentage": 90.31, "elapsed_time": "3:08:25", "remaining_time": "0:20:13", "throughput": 988.67, "total_tokens": 11177232} {"current_steps": 2400, "total_steps": 2652, "loss": 0.5395, "learning_rate": 1.1056971762161583e-06, "epoch": 1.8092725216735772, "percentage": 90.5, "elapsed_time": "3:08:48", "remaining_time": "0:19:49", "throughput": 988.67, "total_tokens": 11200320} {"current_steps": 2405, "total_steps": 2652, "loss": 0.6329, "learning_rate": 1.0625660234518913e-06, "epoch": 1.8130418394270635, "percentage": 90.69, "elapsed_time": "3:09:13", "remaining_time": "0:19:26", "throughput": 988.59, "total_tokens": 11223904} {"current_steps": 2410, "total_steps": 2652, "loss": 0.6464, "learning_rate": 1.0202746574767413e-06, "epoch": 1.8168111571805503, "percentage": 90.87, "elapsed_time": "3:09:37", "remaining_time": "0:19:02", "throughput": 988.59, "total_tokens": 11247488} {"current_steps": 2415, "total_steps": 2652, "loss": 0.6383, "learning_rate": 9.78824561980668e-07, "epoch": 1.820580474934037, "percentage": 91.06, "elapsed_time": "3:10:01", "remaining_time": "0:18:38", "throughput": 988.6, "total_tokens": 11271152} {"current_steps": 2420, "total_steps": 2652, "loss": 0.6538, "learning_rate": 9.38217191139698e-07, "epoch": 1.8243497926875234, "percentage": 91.25, "elapsed_time": "3:10:25", "remaining_time": "0:18:15", "throughput": 988.56, "total_tokens": 11294448} {"current_steps": 2425, "total_steps": 2652, "loss": 0.7752, "learning_rate": 8.98453969564908e-07, "epoch": 1.8281191104410102, "percentage": 91.44, "elapsed_time": "3:10:48", "remaining_time": "0:17:51", "throughput": 988.53, "total_tokens": 11317488} {"current_steps": 2430, "total_steps": 2652, "loss": 0.5098, "learning_rate": 8.595362922524414e-07, "epoch": 1.831888428194497, "percentage": 91.63, "elapsed_time": "3:11:12", "remaining_time": "0:17:28", "throughput": 988.56, "total_tokens": 11341088} {"current_steps": 2435, "total_steps": 2652, "loss": 0.5951, "learning_rate": 8.214655245345787e-07, "epoch": 1.8356577459479833, "percentage": 91.82, "elapsed_time": "3:11:35", "remaining_time": "0:17:04", "throughput": 988.58, "total_tokens": 11364336} {"current_steps": 2440, "total_steps": 2652, "loss": 0.6032, "learning_rate": 7.842430020318286e-07, "epoch": 1.83942706370147, "percentage": 92.01, "elapsed_time": "3:11:59", "remaining_time": "0:16:40", "throughput": 988.55, "total_tokens": 11387232} {"current_steps": 2445, "total_steps": 2652, "loss": 0.6975, "learning_rate": 7.478700306060765e-07, "epoch": 1.8431963814549568, "percentage": 92.19, "elapsed_time": "3:12:22", "remaining_time": "0:16:17", "throughput": 988.53, "total_tokens": 11410512} {"current_steps": 2450, "total_steps": 2652, "loss": 0.8238, "learning_rate": 7.123478863147764e-07, "epoch": 1.8469656992084431, "percentage": 92.38, "elapsed_time": "3:12:46", "remaining_time": "0:15:53", "throughput": 988.54, "total_tokens": 11433760} {"current_steps": 2455, "total_steps": 2652, "loss": 0.6553, "learning_rate": 6.776778153661595e-07, "epoch": 1.8507350169619299, "percentage": 92.57, "elapsed_time": "3:13:09", "remaining_time": "0:15:30", "throughput": 988.52, "total_tokens": 11456928} {"current_steps": 2460, "total_steps": 2652, "loss": 0.7553, "learning_rate": 6.438610340755463e-07, "epoch": 1.8545043347154166, "percentage": 92.76, "elapsed_time": "3:13:33", "remaining_time": "0:15:06", "throughput": 988.53, "total_tokens": 11480416} {"current_steps": 2465, "total_steps": 2652, "loss": 0.6948, "learning_rate": 6.108987288226536e-07, "epoch": 1.858273652468903, "percentage": 92.95, "elapsed_time": "3:13:56", "remaining_time": "0:14:42", "throughput": 988.53, "total_tokens": 11503472} {"current_steps": 2470, "total_steps": 2652, "loss": 0.6716, "learning_rate": 5.78792056009983e-07, "epoch": 1.8620429702223897, "percentage": 93.14, "elapsed_time": "3:14:20", "remaining_time": "0:14:19", "throughput": 988.55, "total_tokens": 11527040} {"current_steps": 2475, "total_steps": 2652, "loss": 0.6133, "learning_rate": 5.475421420222421e-07, "epoch": 1.8658122879758765, "percentage": 93.33, "elapsed_time": "3:14:44", "remaining_time": "0:13:55", "throughput": 988.58, "total_tokens": 11550592} {"current_steps": 2480, "total_steps": 2652, "loss": 0.6372, "learning_rate": 5.171500831868459e-07, "epoch": 1.8695816057293628, "percentage": 93.51, "elapsed_time": "3:15:07", "remaining_time": "0:13:31", "throughput": 988.59, "total_tokens": 11573776} {"current_steps": 2485, "total_steps": 2652, "loss": 0.6023, "learning_rate": 4.876169457354279e-07, "epoch": 1.8733509234828496, "percentage": 93.7, "elapsed_time": "3:15:30", "remaining_time": "0:13:08", "throughput": 988.59, "total_tokens": 11596800} {"current_steps": 2490, "total_steps": 2652, "loss": 0.5304, "learning_rate": 4.5894376576645915e-07, "epoch": 1.8771202412363364, "percentage": 93.89, "elapsed_time": "3:15:54", "remaining_time": "0:12:44", "throughput": 988.59, "total_tokens": 11620224} {"current_steps": 2495, "total_steps": 2652, "loss": 0.6759, "learning_rate": 4.311315492088852e-07, "epoch": 1.8808895589898227, "percentage": 94.08, "elapsed_time": "3:16:18", "remaining_time": "0:12:21", "throughput": 988.59, "total_tokens": 11643616} {"current_steps": 2500, "total_steps": 2652, "loss": 0.713, "learning_rate": 4.0418127178684095e-07, "epoch": 1.8846588767433095, "percentage": 94.27, "elapsed_time": "3:16:41", "remaining_time": "0:11:57", "throughput": 988.57, "total_tokens": 11666912} {"current_steps": 2505, "total_steps": 2652, "loss": 0.652, "learning_rate": 3.780938789854166e-07, "epoch": 1.8884281944967962, "percentage": 94.46, "elapsed_time": "3:17:06", "remaining_time": "0:11:33", "throughput": 988.5, "total_tokens": 11690224} {"current_steps": 2510, "total_steps": 2652, "loss": 0.5323, "learning_rate": 3.528702860174926e-07, "epoch": 1.8921975122502825, "percentage": 94.65, "elapsed_time": "3:17:30", "remaining_time": "0:11:10", "throughput": 988.48, "total_tokens": 11713472} {"current_steps": 2515, "total_steps": 2652, "loss": 0.5129, "learning_rate": 3.285113777916238e-07, "epoch": 1.8959668300037693, "percentage": 94.83, "elapsed_time": "3:17:53", "remaining_time": "0:10:46", "throughput": 988.51, "total_tokens": 11737344} {"current_steps": 2520, "total_steps": 2652, "loss": 0.6176, "learning_rate": 3.050180088809973e-07, "epoch": 1.899736147757256, "percentage": 95.02, "elapsed_time": "3:18:17", "remaining_time": "0:10:23", "throughput": 988.49, "total_tokens": 11760448} {"current_steps": 2525, "total_steps": 2652, "loss": 0.6782, "learning_rate": 2.8239100349346235e-07, "epoch": 1.9035054655107424, "percentage": 95.21, "elapsed_time": "3:18:41", "remaining_time": "0:09:59", "throughput": 988.45, "total_tokens": 11783360} {"current_steps": 2530, "total_steps": 2652, "loss": 0.5076, "learning_rate": 2.6063115544259497e-07, "epoch": 1.9072747832642292, "percentage": 95.4, "elapsed_time": "3:19:04", "remaining_time": "0:09:36", "throughput": 988.44, "total_tokens": 11806880} {"current_steps": 2535, "total_steps": 2652, "loss": 0.6615, "learning_rate": 2.397392281198729e-07, "epoch": 1.911044101017716, "percentage": 95.59, "elapsed_time": "3:19:28", "remaining_time": "0:09:12", "throughput": 988.43, "total_tokens": 11830384} {"current_steps": 2540, "total_steps": 2652, "loss": 0.8442, "learning_rate": 2.1971595446786675e-07, "epoch": 1.9148134187712023, "percentage": 95.78, "elapsed_time": "3:19:52", "remaining_time": "0:08:48", "throughput": 988.45, "total_tokens": 11853616} {"current_steps": 2545, "total_steps": 2652, "loss": 0.6779, "learning_rate": 2.0056203695455189e-07, "epoch": 1.918582736524689, "percentage": 95.97, "elapsed_time": "3:20:15", "remaining_time": "0:08:25", "throughput": 988.45, "total_tokens": 11877088} {"current_steps": 2550, "total_steps": 2652, "loss": 0.6313, "learning_rate": 1.8227814754865068e-07, "epoch": 1.9223520542781758, "percentage": 96.15, "elapsed_time": "3:20:39", "remaining_time": "0:08:01", "throughput": 988.48, "total_tokens": 11901008} {"current_steps": 2555, "total_steps": 2652, "loss": 0.8076, "learning_rate": 1.64864927696054e-07, "epoch": 1.9261213720316621, "percentage": 96.34, "elapsed_time": "3:21:03", "remaining_time": "0:07:37", "throughput": 988.44, "total_tokens": 11923888} {"current_steps": 2560, "total_steps": 2652, "loss": 0.7413, "learning_rate": 1.4832298829733359e-07, "epoch": 1.9298906897851489, "percentage": 96.53, "elapsed_time": "3:21:26", "remaining_time": "0:07:14", "throughput": 988.41, "total_tokens": 11946784} {"current_steps": 2565, "total_steps": 2652, "loss": 0.4589, "learning_rate": 1.3265290968629273e-07, "epoch": 1.9336600075386357, "percentage": 96.72, "elapsed_time": "3:21:50", "remaining_time": "0:06:50", "throughput": 988.43, "total_tokens": 11969968} {"current_steps": 2570, "total_steps": 2652, "loss": 0.5985, "learning_rate": 1.1785524160961847e-07, "epoch": 1.937429325292122, "percentage": 96.91, "elapsed_time": "3:22:13", "remaining_time": "0:06:27", "throughput": 988.46, "total_tokens": 11993008} {"current_steps": 2575, "total_steps": 2652, "loss": 0.6091, "learning_rate": 1.0393050320759157e-07, "epoch": 1.9411986430456087, "percentage": 97.1, "elapsed_time": "3:22:36", "remaining_time": "0:06:03", "throughput": 988.5, "total_tokens": 12016784} {"current_steps": 2580, "total_steps": 2652, "loss": 0.6144, "learning_rate": 9.087918299586773e-08, "epoch": 1.9449679607990955, "percentage": 97.29, "elapsed_time": "3:22:59", "remaining_time": "0:05:39", "throughput": 988.52, "total_tokens": 12039984} {"current_steps": 2585, "total_steps": 2652, "loss": 0.6865, "learning_rate": 7.870173884835241e-08, "epoch": 1.9487372785525818, "percentage": 97.47, "elapsed_time": "3:23:23", "remaining_time": "0:05:16", "throughput": 988.52, "total_tokens": 12063200} {"current_steps": 2590, "total_steps": 2652, "loss": 0.6852, "learning_rate": 6.73985979811248e-08, "epoch": 1.9525065963060686, "percentage": 97.66, "elapsed_time": "3:23:46", "remaining_time": "0:04:52", "throughput": 988.53, "total_tokens": 12086464} {"current_steps": 2595, "total_steps": 2652, "loss": 0.6579, "learning_rate": 5.6970156937458105e-08, "epoch": 1.9562759140595554, "percentage": 97.85, "elapsed_time": "3:24:09", "remaining_time": "0:04:29", "throughput": 988.55, "total_tokens": 12109568} {"current_steps": 2600, "total_steps": 2652, "loss": 0.7044, "learning_rate": 4.741678157389739e-08, "epoch": 1.9600452318130417, "percentage": 98.04, "elapsed_time": "3:24:33", "remaining_time": "0:04:05", "throughput": 988.57, "total_tokens": 12133104} {"current_steps": 2605, "total_steps": 2652, "loss": 0.5653, "learning_rate": 3.873880704744481e-08, "epoch": 1.9638145495665285, "percentage": 98.23, "elapsed_time": "3:24:57", "remaining_time": "0:03:41", "throughput": 988.53, "total_tokens": 12156752} {"current_steps": 2610, "total_steps": 2652, "loss": 0.6297, "learning_rate": 3.0936537803771814e-08, "epoch": 1.9675838673200152, "percentage": 98.42, "elapsed_time": "3:25:20", "remaining_time": "0:03:18", "throughput": 988.55, "total_tokens": 12179712} {"current_steps": 2615, "total_steps": 2652, "loss": 0.5759, "learning_rate": 2.4010247566569334e-08, "epoch": 1.9713531850735015, "percentage": 98.6, "elapsed_time": "3:25:44", "remaining_time": "0:02:54", "throughput": 988.57, "total_tokens": 12203056} {"current_steps": 2620, "total_steps": 2652, "loss": 0.6378, "learning_rate": 1.7960179327922156e-08, "epoch": 1.9751225028269883, "percentage": 98.79, "elapsed_time": "3:26:07", "remaining_time": "0:02:31", "throughput": 988.6, "total_tokens": 12226656} {"current_steps": 2625, "total_steps": 2652, "loss": 0.5149, "learning_rate": 1.2786545339796286e-08, "epoch": 1.978891820580475, "percentage": 98.98, "elapsed_time": "3:26:30", "remaining_time": "0:02:07", "throughput": 988.59, "total_tokens": 12249488} {"current_steps": 2630, "total_steps": 2652, "loss": 0.627, "learning_rate": 8.48952710658657e-09, "epoch": 1.9826611383339614, "percentage": 99.17, "elapsed_time": "3:26:54", "remaining_time": "0:01:43", "throughput": 988.59, "total_tokens": 12272576} {"current_steps": 2635, "total_steps": 2652, "loss": 0.6551, "learning_rate": 5.069275378746796e-09, "epoch": 1.9864304560874482, "percentage": 99.36, "elapsed_time": "3:27:17", "remaining_time": "0:01:20", "throughput": 988.58, "total_tokens": 12295632} {"current_steps": 2640, "total_steps": 2652, "loss": 0.5288, "learning_rate": 2.5259101475161305e-09, "epoch": 1.990199773840935, "percentage": 99.55, "elapsed_time": "3:27:40", "remaining_time": "0:00:56", "throughput": 988.6, "total_tokens": 12318880} {"current_steps": 2645, "total_steps": 2652, "loss": 0.6517, "learning_rate": 8.595206406891709e-10, "epoch": 1.9939690915944213, "percentage": 99.74, "elapsed_time": "3:28:04", "remaining_time": "0:00:33", "throughput": 988.6, "total_tokens": 12342048} {"current_steps": 2650, "total_steps": 2652, "loss": 0.5179, "learning_rate": 7.016531949621819e-11, "epoch": 1.997738409347908, "percentage": 99.92, "elapsed_time": "3:28:27", "remaining_time": "0:00:09", "throughput": 988.59, "total_tokens": 12365024} {"current_steps": 2652, "total_steps": 2652, "epoch": 1.9992461364493028, "percentage": 100.0, "elapsed_time": "3:28:38", "remaining_time": "0:00:00", "throughput": 988.54, "total_tokens": 12374624}