{"current_steps": 5, "total_steps": 310, "loss": 0.4352, "lr": 9.993582535855265e-06, "epoch": 0.08, "percentage": 1.61, "elapsed_time": "0:06:36", "remaining_time": "6:43:23", "throughput": 2280.65, "total_tokens": 904912} {"current_steps": 10, "total_steps": 310, "loss": 0.388, "lr": 9.974346616959476e-06, "epoch": 0.16, "percentage": 3.23, "elapsed_time": "0:13:10", "remaining_time": "6:35:22", "throughput": 2286.91, "total_tokens": 1808376} {"current_steps": 15, "total_steps": 310, "loss": 0.3875, "lr": 9.942341621640558e-06, "epoch": 0.24, "percentage": 4.84, "elapsed_time": "0:19:20", "remaining_time": "6:20:29", "throughput": 2312.8, "total_tokens": 2684696} {"current_steps": 20, "total_steps": 310, "loss": 0.3959, "lr": 9.897649706262474e-06, "epoch": 0.32, "percentage": 6.45, "elapsed_time": "0:25:50", "remaining_time": "6:14:37", "throughput": 2319.83, "total_tokens": 3596136} {"current_steps": 25, "total_steps": 310, "loss": 0.3718, "lr": 9.840385594331022e-06, "epoch": 0.4, "percentage": 8.06, "elapsed_time": "0:32:32", "remaining_time": "6:10:56", "throughput": 2330.35, "total_tokens": 4549488} {"current_steps": 30, "total_steps": 310, "loss": 0.3597, "lr": 9.770696282000245e-06, "epoch": 0.48, "percentage": 9.68, "elapsed_time": "0:39:27", "remaining_time": "6:08:17", "throughput": 2294.37, "total_tokens": 5432232} {"current_steps": 35, "total_steps": 310, "loss": 0.3683, "lr": 9.688760660735403e-06, "epoch": 0.56, "percentage": 11.29, "elapsed_time": "0:45:45", "remaining_time": "5:59:34", "throughput": 2290.47, "total_tokens": 6289320} {"current_steps": 40, "total_steps": 310, "loss": 0.3701, "lr": 9.594789058101154e-06, "epoch": 0.64, "percentage": 12.9, "elapsed_time": "0:52:17", "remaining_time": "5:52:55", "throughput": 2288.15, "total_tokens": 7178328} {"current_steps": 45, "total_steps": 310, "loss": 0.3796, "lr": 9.48902269785371e-06, "epoch": 0.72, "percentage": 14.52, "elapsed_time": "0:59:01", "remaining_time": "5:47:33", "throughput": 2280.22, "total_tokens": 8074600} {"current_steps": 50, "total_steps": 310, "loss": 0.3451, "lr": 9.371733080722911e-06, "epoch": 0.8, "percentage": 16.13, "elapsed_time": "1:05:31", "remaining_time": "5:40:44", "throughput": 2300.4, "total_tokens": 9044168} {"current_steps": 55, "total_steps": 310, "loss": 0.3526, "lr": 9.243221287473755e-06, "epoch": 0.88, "percentage": 17.74, "elapsed_time": "1:12:03", "remaining_time": "5:34:04", "throughput": 2306.03, "total_tokens": 9969944} {"current_steps": 60, "total_steps": 310, "loss": 0.3386, "lr": 9.103817206036383e-06, "epoch": 0.96, "percentage": 19.35, "elapsed_time": "1:18:52", "remaining_time": "5:28:39", "throughput": 2304.99, "total_tokens": 10909008} {"current_steps": 65, "total_steps": 310, "loss": 0.3002, "lr": 8.953878684688492e-06, "epoch": 1.032, "percentage": 20.97, "elapsed_time": "1:24:28", "remaining_time": "5:18:25", "throughput": 2301.09, "total_tokens": 11663840} {"current_steps": 70, "total_steps": 310, "loss": 0.2818, "lr": 8.793790613463956e-06, "epoch": 1.112, "percentage": 22.58, "elapsed_time": "1:31:07", "remaining_time": "5:12:26", "throughput": 2295.87, "total_tokens": 12553064} {"current_steps": 75, "total_steps": 310, "loss": 0.2778, "lr": 8.6239639361456e-06, "epoch": 1.192, "percentage": 24.19, "elapsed_time": "1:37:54", "remaining_time": "5:06:46", "throughput": 2292.82, "total_tokens": 13469144} {"current_steps": 80, "total_steps": 310, "loss": 0.2691, "lr": 8.444834595378434e-06, "epoch": 1.272, "percentage": 25.81, "elapsed_time": "1:44:42", "remaining_time": "5:01:02", "throughput": 2293.07, "total_tokens": 14406256} {"current_steps": 85, "total_steps": 310, "loss": 0.262, "lr": 8.256862413611113e-06, "epoch": 1.3519999999999999, "percentage": 27.42, "elapsed_time": "1:51:09", "remaining_time": "4:54:15", "throughput": 2294.76, "total_tokens": 15305328} {"current_steps": 90, "total_steps": 310, "loss": 0.2805, "lr": 8.060529912738316e-06, "epoch": 1.432, "percentage": 29.03, "elapsed_time": "1:57:31", "remaining_time": "4:47:16", "throughput": 2305.95, "total_tokens": 16259688} {"current_steps": 95, "total_steps": 310, "loss": 0.2775, "lr": 7.856341075473963e-06, "epoch": 1.512, "percentage": 30.65, "elapsed_time": "2:03:58", "remaining_time": "4:40:35", "throughput": 2307.76, "total_tokens": 17167192} {"current_steps": 100, "total_steps": 310, "loss": 0.2645, "lr": 7.644820051634813e-06, "epoch": 1.592, "percentage": 32.26, "elapsed_time": "2:10:49", "remaining_time": "4:34:44", "throughput": 2300.55, "total_tokens": 18059304} {"current_steps": 105, "total_steps": 310, "loss": 0.2773, "lr": 7.4265098126554065e-06, "epoch": 1.6720000000000002, "percentage": 33.87, "elapsed_time": "2:19:59", "remaining_time": "4:33:19", "throughput": 2258.82, "total_tokens": 18973864} {"current_steps": 110, "total_steps": 310, "loss": 0.2867, "lr": 7.201970757788172e-06, "epoch": 1.752, "percentage": 35.48, "elapsed_time": "2:26:26", "remaining_time": "4:26:15", "throughput": 2262.26, "total_tokens": 19877832} {"current_steps": 115, "total_steps": 310, "loss": 0.2697, "lr": 6.971779275566593e-06, "epoch": 1.8319999999999999, "percentage": 37.1, "elapsed_time": "2:32:30", "remaining_time": "4:18:36", "throughput": 2272.29, "total_tokens": 20793160} {"current_steps": 120, "total_steps": 310, "loss": 0.264, "lr": 6.736526264224101e-06, "epoch": 1.912, "percentage": 38.71, "elapsed_time": "2:38:41", "remaining_time": "4:11:15", "throughput": 2275.15, "total_tokens": 21662200} {"current_steps": 125, "total_steps": 310, "loss": 0.2734, "lr": 6.496815614866792e-06, "epoch": 1.992, "percentage": 40.32, "elapsed_time": "2:45:03", "remaining_time": "4:04:17", "throughput": 2279.9, "total_tokens": 22579968} {"current_steps": 130, "total_steps": 310, "loss": 0.2438, "lr": 6.2532626612936035e-06, "epoch": 2.064, "percentage": 41.94, "elapsed_time": "2:51:02", "remaining_time": "3:56:49", "throughput": 2281.06, "total_tokens": 23409800} {"current_steps": 135, "total_steps": 310, "loss": 0.2017, "lr": 6.006492600443301e-06, "epoch": 2.144, "percentage": 43.55, "elapsed_time": "2:57:34", "remaining_time": "3:50:11", "throughput": 2279.31, "total_tokens": 24285480} {"current_steps": 140, "total_steps": 310, "loss": 0.2014, "lr": 5.757138887522884e-06, "epoch": 2.224, "percentage": 45.16, "elapsed_time": "3:04:27", "remaining_time": "3:43:58", "throughput": 2272.95, "total_tokens": 25155560} {"current_steps": 145, "total_steps": 310, "loss": 0.193, "lr": 5.505841609937162e-06, "epoch": 2.304, "percentage": 46.77, "elapsed_time": "3:11:19", "remaining_time": "3:37:43", "throughput": 2268.81, "total_tokens": 26045360} {"current_steps": 150, "total_steps": 310, "loss": 0.204, "lr": 5.253245844193564e-06, "epoch": 2.384, "percentage": 48.39, "elapsed_time": "3:17:30", "remaining_time": "3:30:40", "throughput": 2274.44, "total_tokens": 26953512} {"current_steps": 155, "total_steps": 310, "loss": 0.2224, "lr": 5e-06, "epoch": 2.464, "percentage": 50.0, "elapsed_time": "3:23:43", "remaining_time": "3:23:43", "throughput": 2280.41, "total_tokens": 27875320} {"current_steps": 160, "total_steps": 310, "loss": 0.2122, "lr": 4.746754155806437e-06, "epoch": 2.544, "percentage": 51.61, "elapsed_time": "3:30:25", "remaining_time": "3:17:16", "throughput": 2280.0, "total_tokens": 28786896} {"current_steps": 165, "total_steps": 310, "loss": 0.1976, "lr": 4.49415839006284e-06, "epoch": 2.624, "percentage": 53.23, "elapsed_time": "3:36:42", "remaining_time": "3:10:26", "throughput": 2278.73, "total_tokens": 29630128} {"current_steps": 170, "total_steps": 310, "loss": 0.1935, "lr": 4.2428611124771184e-06, "epoch": 2.7039999999999997, "percentage": 54.84, "elapsed_time": "3:43:10", "remaining_time": "3:03:47", "throughput": 2278.02, "total_tokens": 30503816} {"current_steps": 175, "total_steps": 310, "loss": 0.2237, "lr": 3.993507399556699e-06, "epoch": 2.784, "percentage": 56.45, "elapsed_time": "3:50:02", "remaining_time": "2:57:27", "throughput": 2277.37, "total_tokens": 31433032} {"current_steps": 180, "total_steps": 310, "loss": 0.2002, "lr": 3.7467373387063973e-06, "epoch": 2.864, "percentage": 58.06, "elapsed_time": "3:56:52", "remaining_time": "2:51:04", "throughput": 2276.09, "total_tokens": 32347864} {"current_steps": 185, "total_steps": 310, "loss": 0.2138, "lr": 3.5031843851332105e-06, "epoch": 2.944, "percentage": 59.68, "elapsed_time": "4:03:27", "remaining_time": "2:44:30", "throughput": 2282.79, "total_tokens": 33346576} {"current_steps": 190, "total_steps": 310, "loss": 0.1904, "lr": 3.2634737357758994e-06, "epoch": 3.016, "percentage": 61.29, "elapsed_time": "4:08:53", "remaining_time": "2:37:11", "throughput": 2291.47, "total_tokens": 34219176} {"current_steps": 195, "total_steps": 310, "loss": 0.1643, "lr": 3.0282207244334084e-06, "epoch": 3.096, "percentage": 62.9, "elapsed_time": "4:15:38", "remaining_time": "2:30:45", "throughput": 2292.16, "total_tokens": 35158432} {"current_steps": 200, "total_steps": 310, "loss": 0.16, "lr": 2.7980292422118282e-06, "epoch": 3.176, "percentage": 64.52, "elapsed_time": "4:21:22", "remaining_time": "2:23:45", "throughput": 2299.12, "total_tokens": 36055520} {"current_steps": 205, "total_steps": 310, "loss": 0.1493, "lr": 2.573490187344596e-06, "epoch": 3.2560000000000002, "percentage": 66.13, "elapsed_time": "4:30:13", "remaining_time": "2:18:24", "throughput": 2281.09, "total_tokens": 36983672} {"current_steps": 210, "total_steps": 310, "loss": 0.1436, "lr": 2.3551799483651894e-06, "epoch": 3.336, "percentage": 67.74, "elapsed_time": "4:36:34", "remaining_time": "2:11:41", "throughput": 2280.19, "total_tokens": 37837680} {"current_steps": 215, "total_steps": 310, "loss": 0.154, "lr": 2.1436589245260375e-06, "epoch": 3.416, "percentage": 69.35, "elapsed_time": "4:43:21", "remaining_time": "2:05:12", "throughput": 2280.16, "total_tokens": 38766568} {"current_steps": 220, "total_steps": 310, "loss": 0.1658, "lr": 1.9394700872616856e-06, "epoch": 3.496, "percentage": 70.97, "elapsed_time": "4:50:05", "remaining_time": "1:58:40", "throughput": 2278.95, "total_tokens": 39667328} {"current_steps": 225, "total_steps": 310, "loss": 0.1472, "lr": 1.74313758638889e-06, "epoch": 3.576, "percentage": 72.58, "elapsed_time": "4:56:17", "remaining_time": "1:51:55", "throughput": 2280.01, "total_tokens": 40532840} {"current_steps": 230, "total_steps": 310, "loss": 0.1654, "lr": 1.555165404621567e-06, "epoch": 3.656, "percentage": 74.19, "elapsed_time": "5:03:37", "remaining_time": "1:45:36", "throughput": 2277.91, "total_tokens": 41498224} {"current_steps": 235, "total_steps": 310, "loss": 0.1583, "lr": 1.3760360638544012e-06, "epoch": 3.7359999999999998, "percentage": 75.81, "elapsed_time": "5:09:58", "remaining_time": "1:38:55", "throughput": 2282.42, "total_tokens": 42449096} {"current_steps": 240, "total_steps": 310, "loss": 0.1463, "lr": 1.2062093865360458e-06, "epoch": 3.816, "percentage": 77.42, "elapsed_time": "5:16:18", "remaining_time": "1:32:15", "throughput": 2281.13, "total_tokens": 43293600} {"current_steps": 245, "total_steps": 310, "loss": 0.1599, "lr": 1.046121315311508e-06, "epoch": 3.896, "percentage": 79.03, "elapsed_time": "5:22:36", "remaining_time": "1:25:35", "throughput": 2282.95, "total_tokens": 44190712} {"current_steps": 250, "total_steps": 310, "loss": 0.1609, "lr": 8.961827939636198e-07, "epoch": 3.976, "percentage": 80.65, "elapsed_time": "5:29:07", "remaining_time": "1:18:59", "throughput": 2283.68, "total_tokens": 45096112} {"current_steps": 255, "total_steps": 310, "loss": 0.1428, "lr": 7.567787125262449e-07, "epoch": 4.048, "percentage": 82.26, "elapsed_time": "5:34:47", "remaining_time": "1:12:12", "throughput": 2285.86, "total_tokens": 45916648} {"current_steps": 260, "total_steps": 310, "loss": 0.1216, "lr": 6.282669192770896e-07, "epoch": 4.128, "percentage": 83.87, "elapsed_time": "5:41:25", "remaining_time": "1:05:39", "throughput": 2284.68, "total_tokens": 46801776} {"current_steps": 265, "total_steps": 310, "loss": 0.1309, "lr": 5.109773021462921e-07, "epoch": 4.208, "percentage": 85.48, "elapsed_time": "5:47:55", "remaining_time": "0:59:04", "throughput": 2284.28, "total_tokens": 47685704} {"current_steps": 270, "total_steps": 310, "loss": 0.1346, "lr": 4.05210941898847e-07, "epoch": 4.288, "percentage": 87.1, "elapsed_time": "5:54:32", "remaining_time": "0:52:31", "throughput": 2283.14, "total_tokens": 48567032} {"current_steps": 275, "total_steps": 310, "loss": 0.1318, "lr": 3.112393392645985e-07, "epoch": 4.368, "percentage": 88.71, "elapsed_time": "6:01:16", "remaining_time": "0:45:58", "throughput": 2283.19, "total_tokens": 49491568} {"current_steps": 280, "total_steps": 310, "loss": 0.1355, "lr": 2.2930371799975593e-07, "epoch": 4.448, "percentage": 90.32, "elapsed_time": "6:08:25", "remaining_time": "0:39:28", "throughput": 2281.89, "total_tokens": 50442584} {"current_steps": 285, "total_steps": 310, "loss": 0.1418, "lr": 1.5961440566897913e-07, "epoch": 4.5280000000000005, "percentage": 91.94, "elapsed_time": "6:15:07", "remaining_time": "0:32:54", "throughput": 2284.27, "total_tokens": 51413272} {"current_steps": 290, "total_steps": 310, "loss": 0.1358, "lr": 1.0235029373752758e-07, "epoch": 4.608, "percentage": 93.55, "elapsed_time": "6:21:51", "remaining_time": "0:26:20", "throughput": 2281.64, "total_tokens": 52276024} {"current_steps": 295, "total_steps": 310, "loss": 0.1319, "lr": 5.7658378359443104e-08, "epoch": 4.688, "percentage": 95.16, "elapsed_time": "6:28:30", "remaining_time": "0:19:45", "throughput": 2281.27, "total_tokens": 53176640} {"current_steps": 300, "total_steps": 310, "loss": 0.1401, "lr": 2.5653383040524228e-08, "epoch": 4.768, "percentage": 96.77, "elapsed_time": "6:35:18", "remaining_time": "0:13:10", "throughput": 2282.16, "total_tokens": 54130624} {"current_steps": 305, "total_steps": 310, "loss": 0.1395, "lr": 6.417464144736208e-09, "epoch": 4.848, "percentage": 98.39, "elapsed_time": "6:44:10", "remaining_time": "0:06:37", "throughput": 2268.78, "total_tokens": 55018008} {"current_steps": 310, "total_steps": 310, "loss": 0.1385, "lr": 0.0, "epoch": 4.928, "percentage": 100.0, "elapsed_time": "6:50:51", "remaining_time": "0:00:00", "throughput": 2269.67, "total_tokens": 55950608} {"current_steps": 310, "total_steps": 310, "epoch": 4.928, "percentage": 100.0, "elapsed_time": "6:53:15", "remaining_time": "0:00:00", "throughput": 2256.44, "total_tokens": 55950608}