{"current_steps": 10, "total_steps": 5000, "loss": 1.3992, "lr": 2.4000000000000003e-07, "epoch": 0.02, "percentage": 0.2, "elapsed_time": "0:01:03", "remaining_time": "8:51:52"} {"current_steps": 20, "total_steps": 5000, "loss": 1.4497, "lr": 6.000000000000001e-07, "epoch": 0.04, "percentage": 0.4, "elapsed_time": "0:02:15", "remaining_time": "9:21:43"} {"current_steps": 30, "total_steps": 5000, "loss": 1.2599, "lr": 1.0000000000000002e-06, "epoch": 0.06, "percentage": 0.6, "elapsed_time": "0:03:26", "remaining_time": "9:30:46"} {"current_steps": 40, "total_steps": 5000, "loss": 1.4124, "lr": 1.4000000000000001e-06, "epoch": 0.08, "percentage": 0.8, "elapsed_time": "0:04:37", "remaining_time": "9:33:42"} {"current_steps": 50, "total_steps": 5000, "loss": 1.3542, "lr": 1.8000000000000001e-06, "epoch": 0.1, "percentage": 1.0, "elapsed_time": "0:05:48", "remaining_time": "9:35:37"} {"current_steps": 60, "total_steps": 5000, "loss": 1.2123, "lr": 2.2e-06, "epoch": 0.12, "percentage": 1.2, "elapsed_time": "0:07:00", "remaining_time": "9:36:27"} {"current_steps": 70, "total_steps": 5000, "loss": 1.2098, "lr": 2.6e-06, "epoch": 0.14, "percentage": 1.4, "elapsed_time": "0:08:11", "remaining_time": "9:37:19"} {"current_steps": 80, "total_steps": 5000, "loss": 1.2226, "lr": 3e-06, "epoch": 0.16, "percentage": 1.6, "elapsed_time": "0:09:24", "remaining_time": "9:38:53"} {"current_steps": 90, "total_steps": 5000, "loss": 1.0624, "lr": 3.3600000000000004e-06, "epoch": 0.18, "percentage": 1.8, "elapsed_time": "0:10:36", "remaining_time": "9:39:02"} {"current_steps": 100, "total_steps": 5000, "loss": 1.0969, "lr": 3.7600000000000004e-06, "epoch": 0.2, "percentage": 2.0, "elapsed_time": "0:11:49", "remaining_time": "9:39:23"} {"current_steps": 110, "total_steps": 5000, "loss": 1.0879, "lr": 4.16e-06, "epoch": 0.22, "percentage": 2.2, "elapsed_time": "0:13:03", "remaining_time": "9:40:32"} {"current_steps": 120, "total_steps": 5000, "loss": 1.0195, "lr": 4.56e-06, "epoch": 0.24, "percentage": 2.4, "elapsed_time": "0:14:15", "remaining_time": "9:39:40"} {"current_steps": 130, "total_steps": 5000, "loss": 0.9765, "lr": 4.960000000000001e-06, "epoch": 0.26, "percentage": 2.6, "elapsed_time": "0:15:27", "remaining_time": "9:39:11"} {"current_steps": 140, "total_steps": 5000, "loss": 1.0205, "lr": 5.36e-06, "epoch": 0.28, "percentage": 2.8, "elapsed_time": "0:16:40", "remaining_time": "9:38:36"} {"current_steps": 150, "total_steps": 5000, "loss": 0.9517, "lr": 5.76e-06, "epoch": 0.3, "percentage": 3.0, "elapsed_time": "0:17:51", "remaining_time": "9:37:25"} {"current_steps": 160, "total_steps": 5000, "loss": 0.9324, "lr": 6.16e-06, "epoch": 0.32, "percentage": 3.2, "elapsed_time": "0:19:02", "remaining_time": "9:35:59"} {"current_steps": 170, "total_steps": 5000, "loss": 0.804, "lr": 6.560000000000001e-06, "epoch": 0.34, "percentage": 3.4, "elapsed_time": "0:20:13", "remaining_time": "9:34:49"} {"current_steps": 180, "total_steps": 5000, "loss": 0.7821, "lr": 6.96e-06, "epoch": 0.36, "percentage": 3.6, "elapsed_time": "0:21:26", "remaining_time": "9:33:57"} {"current_steps": 190, "total_steps": 5000, "loss": 0.8086, "lr": 7.360000000000001e-06, "epoch": 0.38, "percentage": 3.8, "elapsed_time": "0:22:38", "remaining_time": "9:32:59"} {"current_steps": 200, "total_steps": 5000, "loss": 0.7655, "lr": 7.76e-06, "epoch": 0.4, "percentage": 4.0, "elapsed_time": "0:23:50", "remaining_time": "9:32:02"} {"current_steps": 210, "total_steps": 5000, "loss": 0.7508, "lr": 8.16e-06, "epoch": 0.42, "percentage": 4.2, "elapsed_time": "0:25:03", "remaining_time": "9:31:34"} {"current_steps": 220, "total_steps": 5000, "loss": 0.7429, "lr": 8.560000000000001e-06, "epoch": 0.44, "percentage": 4.4, "elapsed_time": "0:26:15", "remaining_time": "9:30:29"} {"current_steps": 230, "total_steps": 5000, "loss": 0.7502, "lr": 8.96e-06, "epoch": 0.46, "percentage": 4.6, "elapsed_time": "0:27:27", "remaining_time": "9:29:27"} {"current_steps": 240, "total_steps": 5000, "loss": 0.7029, "lr": 9.360000000000002e-06, "epoch": 0.48, "percentage": 4.8, "elapsed_time": "0:28:39", "remaining_time": "9:28:22"} {"current_steps": 250, "total_steps": 5000, "loss": 0.7324, "lr": 9.760000000000001e-06, "epoch": 0.5, "percentage": 5.0, "elapsed_time": "0:29:50", "remaining_time": "9:27:08"} {"current_steps": 260, "total_steps": 5000, "loss": 0.7521, "lr": 1.0160000000000001e-05, "epoch": 0.52, "percentage": 5.2, "elapsed_time": "0:31:02", "remaining_time": "9:25:48"} {"current_steps": 270, "total_steps": 5000, "loss": 0.698, "lr": 1.056e-05, "epoch": 0.54, "percentage": 5.4, "elapsed_time": "0:32:13", "remaining_time": "9:24:30"} {"current_steps": 280, "total_steps": 5000, "loss": 0.6859, "lr": 1.0960000000000002e-05, "epoch": 0.56, "percentage": 5.6, "elapsed_time": "0:33:24", "remaining_time": "9:23:15"} {"current_steps": 290, "total_steps": 5000, "loss": 0.6716, "lr": 1.136e-05, "epoch": 0.58, "percentage": 5.8, "elapsed_time": "0:34:36", "remaining_time": "9:22:04"} {"current_steps": 300, "total_steps": 5000, "loss": 0.6978, "lr": 1.1760000000000001e-05, "epoch": 0.6, "percentage": 6.0, "elapsed_time": "0:35:47", "remaining_time": "9:20:48"} {"current_steps": 310, "total_steps": 5000, "loss": 0.6584, "lr": 1.216e-05, "epoch": 0.62, "percentage": 6.2, "elapsed_time": "0:37:01", "remaining_time": "9:20:02"} {"current_steps": 320, "total_steps": 5000, "loss": 0.7188, "lr": 1.2560000000000002e-05, "epoch": 0.64, "percentage": 6.4, "elapsed_time": "0:38:12", "remaining_time": "9:18:52"} {"current_steps": 330, "total_steps": 5000, "loss": 0.6687, "lr": 1.2960000000000001e-05, "epoch": 0.66, "percentage": 6.6, "elapsed_time": "0:39:25", "remaining_time": "9:17:48"} {"current_steps": 340, "total_steps": 5000, "loss": 0.623, "lr": 1.3360000000000003e-05, "epoch": 0.68, "percentage": 6.8, "elapsed_time": "0:40:37", "remaining_time": "9:16:48"} {"current_steps": 350, "total_steps": 5000, "loss": 0.6795, "lr": 1.376e-05, "epoch": 0.7, "percentage": 7.0, "elapsed_time": "0:41:49", "remaining_time": "9:15:38"} {"current_steps": 360, "total_steps": 5000, "loss": 0.6455, "lr": 1.416e-05, "epoch": 0.72, "percentage": 7.2, "elapsed_time": "0:43:00", "remaining_time": "9:14:20"} {"current_steps": 370, "total_steps": 5000, "loss": 0.6548, "lr": 1.4560000000000001e-05, "epoch": 0.74, "percentage": 7.4, "elapsed_time": "0:44:13", "remaining_time": "9:13:18"} {"current_steps": 380, "total_steps": 5000, "loss": 0.6508, "lr": 1.496e-05, "epoch": 0.76, "percentage": 7.6, "elapsed_time": "0:45:24", "remaining_time": "9:12:03"} {"current_steps": 390, "total_steps": 5000, "loss": 0.7105, "lr": 1.5360000000000002e-05, "epoch": 0.78, "percentage": 7.8, "elapsed_time": "0:46:36", "remaining_time": "9:10:53"} {"current_steps": 400, "total_steps": 5000, "loss": 0.6738, "lr": 1.576e-05, "epoch": 0.8, "percentage": 8.0, "elapsed_time": "0:47:47", "remaining_time": "9:09:33"} {"current_steps": 410, "total_steps": 5000, "loss": 0.6741, "lr": 1.616e-05, "epoch": 0.82, "percentage": 8.2, "elapsed_time": "0:49:00", "remaining_time": "9:08:40"} {"current_steps": 420, "total_steps": 5000, "loss": 0.6385, "lr": 1.656e-05, "epoch": 0.84, "percentage": 8.4, "elapsed_time": "0:50:12", "remaining_time": "9:07:28"} {"current_steps": 430, "total_steps": 5000, "loss": 0.6304, "lr": 1.696e-05, "epoch": 0.86, "percentage": 8.6, "elapsed_time": "0:51:24", "remaining_time": "9:06:26"} {"current_steps": 440, "total_steps": 5000, "loss": 0.652, "lr": 1.736e-05, "epoch": 0.88, "percentage": 8.8, "elapsed_time": "0:52:37", "remaining_time": "9:05:18"} {"current_steps": 450, "total_steps": 5000, "loss": 0.6517, "lr": 1.7760000000000003e-05, "epoch": 0.9, "percentage": 9.0, "elapsed_time": "0:53:48", "remaining_time": "9:03:58"} {"current_steps": 460, "total_steps": 5000, "loss": 0.7044, "lr": 1.8160000000000002e-05, "epoch": 0.92, "percentage": 9.2, "elapsed_time": "0:54:59", "remaining_time": "9:02:41"} {"current_steps": 470, "total_steps": 5000, "loss": 0.6801, "lr": 1.8560000000000002e-05, "epoch": 0.94, "percentage": 9.4, "elapsed_time": "0:56:11", "remaining_time": "9:01:32"} {"current_steps": 480, "total_steps": 5000, "loss": 0.6531, "lr": 1.896e-05, "epoch": 0.96, "percentage": 9.6, "elapsed_time": "0:57:21", "remaining_time": "9:00:11"} {"current_steps": 490, "total_steps": 5000, "loss": 0.6837, "lr": 1.936e-05, "epoch": 0.98, "percentage": 9.8, "elapsed_time": "0:58:33", "remaining_time": "8:59:03"} {"current_steps": 500, "total_steps": 5000, "loss": 0.6659, "lr": 1.976e-05, "epoch": 1.0, "percentage": 10.0, "elapsed_time": "0:59:46", "remaining_time": "8:57:56"} {"current_steps": 510, "total_steps": 5000, "loss": 0.6212, "lr": 1.9999961008995607e-05, "epoch": 1.02, "percentage": 10.2, "elapsed_time": "1:00:59", "remaining_time": "8:56:59"} {"current_steps": 520, "total_steps": 5000, "loss": 0.6705, "lr": 1.99995223636881e-05, "epoch": 1.04, "percentage": 10.4, "elapsed_time": "1:02:10", "remaining_time": "8:55:42"} {"current_steps": 530, "total_steps": 5000, "loss": 0.6346, "lr": 1.9998596355767805e-05, "epoch": 1.06, "percentage": 10.6, "elapsed_time": "1:03:22", "remaining_time": "8:54:29"} {"current_steps": 540, "total_steps": 5000, "loss": 0.6698, "lr": 1.999718303036705e-05, "epoch": 1.08, "percentage": 10.8, "elapsed_time": "1:04:34", "remaining_time": "8:53:20"} {"current_steps": 550, "total_steps": 5000, "loss": 0.5925, "lr": 1.9995282456369313e-05, "epoch": 1.1, "percentage": 11.0, "elapsed_time": "1:05:46", "remaining_time": "8:52:09"} {"current_steps": 560, "total_steps": 5000, "loss": 0.6795, "lr": 1.9992894726405894e-05, "epoch": 1.12, "percentage": 11.2, "elapsed_time": "1:06:58", "remaining_time": "8:50:57"} {"current_steps": 570, "total_steps": 5000, "loss": 0.6096, "lr": 1.9990019956851384e-05, "epoch": 1.1400000000000001, "percentage": 11.4, "elapsed_time": "1:08:10", "remaining_time": "8:49:49"} {"current_steps": 580, "total_steps": 5000, "loss": 0.5971, "lr": 1.998665828781799e-05, "epoch": 1.16, "percentage": 11.6, "elapsed_time": "1:09:22", "remaining_time": "8:48:40"} {"current_steps": 590, "total_steps": 5000, "loss": 0.6055, "lr": 1.998280988314872e-05, "epoch": 1.18, "percentage": 11.8, "elapsed_time": "1:10:34", "remaining_time": "8:47:31"} {"current_steps": 600, "total_steps": 5000, "loss": 0.6304, "lr": 1.9978474930409396e-05, "epoch": 1.2, "percentage": 12.0, "elapsed_time": "1:11:46", "remaining_time": "8:46:23"} {"current_steps": 610, "total_steps": 5000, "loss": 0.6812, "lr": 1.9973653640879486e-05, "epoch": 1.22, "percentage": 12.2, "elapsed_time": "1:12:59", "remaining_time": "8:45:20"} {"current_steps": 620, "total_steps": 5000, "loss": 0.5842, "lr": 1.9968346249541848e-05, "epoch": 1.24, "percentage": 12.4, "elapsed_time": "1:14:11", "remaining_time": "8:44:09"} {"current_steps": 630, "total_steps": 5000, "loss": 0.6478, "lr": 1.996255301507125e-05, "epoch": 1.26, "percentage": 12.6, "elapsed_time": "1:15:22", "remaining_time": "8:42:53"} {"current_steps": 640, "total_steps": 5000, "loss": 0.6003, "lr": 1.995627421982176e-05, "epoch": 1.28, "percentage": 12.8, "elapsed_time": "1:16:34", "remaining_time": "8:41:42"} {"current_steps": 650, "total_steps": 5000, "loss": 0.6087, "lr": 1.9949510169813006e-05, "epoch": 1.3, "percentage": 13.0, "elapsed_time": "1:17:46", "remaining_time": "8:40:27"} {"current_steps": 660, "total_steps": 5000, "loss": 0.5905, "lr": 1.9942261194715236e-05, "epoch": 1.32, "percentage": 13.2, "elapsed_time": "1:18:57", "remaining_time": "8:39:12"} {"current_steps": 670, "total_steps": 5000, "loss": 0.593, "lr": 1.9934527647833276e-05, "epoch": 1.34, "percentage": 13.4, "elapsed_time": "1:20:10", "remaining_time": "8:38:05"} {"current_steps": 680, "total_steps": 5000, "loss": 0.6253, "lr": 1.992630990608929e-05, "epoch": 1.3599999999999999, "percentage": 13.6, "elapsed_time": "1:21:22", "remaining_time": "8:36:55"} {"current_steps": 690, "total_steps": 5000, "loss": 0.6338, "lr": 1.9917608370004417e-05, "epoch": 1.38, "percentage": 13.8, "elapsed_time": "1:22:34", "remaining_time": "8:35:47"} {"current_steps": 700, "total_steps": 5000, "loss": 0.6148, "lr": 1.9908423463679246e-05, "epoch": 1.4, "percentage": 14.0, "elapsed_time": "1:23:45", "remaining_time": "8:34:31"} {"current_steps": 710, "total_steps": 5000, "loss": 0.6271, "lr": 1.989875563477316e-05, "epoch": 1.42, "percentage": 14.2, "elapsed_time": "1:24:58", "remaining_time": "8:33:27"} {"current_steps": 720, "total_steps": 5000, "loss": 0.638, "lr": 1.9888605354482494e-05, "epoch": 1.44, "percentage": 14.4, "elapsed_time": "1:26:12", "remaining_time": "8:32:25"} {"current_steps": 730, "total_steps": 5000, "loss": 0.6304, "lr": 1.987797311751759e-05, "epoch": 1.46, "percentage": 14.6, "elapsed_time": "1:27:25", "remaining_time": "8:31:20"} {"current_steps": 740, "total_steps": 5000, "loss": 0.5877, "lr": 1.986685944207868e-05, "epoch": 1.48, "percentage": 14.8, "elapsed_time": "1:28:37", "remaining_time": "8:30:11"} {"current_steps": 750, "total_steps": 5000, "loss": 0.5747, "lr": 1.985526486983063e-05, "epoch": 1.5, "percentage": 15.0, "elapsed_time": "1:29:49", "remaining_time": "8:28:59"} {"current_steps": 760, "total_steps": 5000, "loss": 0.6514, "lr": 1.9843189965876525e-05, "epoch": 1.52, "percentage": 15.2, "elapsed_time": "1:31:01", "remaining_time": "8:27:49"} {"current_steps": 770, "total_steps": 5000, "loss": 0.5879, "lr": 1.9830635318730155e-05, "epoch": 1.54, "percentage": 15.4, "elapsed_time": "1:32:12", "remaining_time": "8:26:34"} {"current_steps": 780, "total_steps": 5000, "loss": 0.6152, "lr": 1.981760154028731e-05, "epoch": 1.56, "percentage": 15.6, "elapsed_time": "1:33:24", "remaining_time": "8:25:19"} {"current_steps": 790, "total_steps": 5000, "loss": 0.6342, "lr": 1.980408926579596e-05, "epoch": 1.58, "percentage": 15.8, "elapsed_time": "1:34:35", "remaining_time": "8:24:06"} {"current_steps": 800, "total_steps": 5000, "loss": 0.6167, "lr": 1.97900991538253e-05, "epoch": 1.6, "percentage": 16.0, "elapsed_time": "1:35:47", "remaining_time": "8:22:54"} {"current_steps": 810, "total_steps": 5000, "loss": 0.5688, "lr": 1.9775631886233655e-05, "epoch": 1.62, "percentage": 16.2, "elapsed_time": "1:37:00", "remaining_time": "8:21:48"} {"current_steps": 820, "total_steps": 5000, "loss": 0.6023, "lr": 1.9760688168135233e-05, "epoch": 1.6400000000000001, "percentage": 16.4, "elapsed_time": "1:38:11", "remaining_time": "8:20:34"} {"current_steps": 830, "total_steps": 5000, "loss": 0.5957, "lr": 1.9745268727865774e-05, "epoch": 1.6600000000000001, "percentage": 16.6, "elapsed_time": "1:39:23", "remaining_time": "8:19:19"} {"current_steps": 840, "total_steps": 5000, "loss": 0.5409, "lr": 1.972937431694704e-05, "epoch": 1.6800000000000002, "percentage": 16.8, "elapsed_time": "1:40:34", "remaining_time": "8:18:06"} {"current_steps": 850, "total_steps": 5000, "loss": 0.6286, "lr": 1.9713005710050203e-05, "epoch": 1.7, "percentage": 17.0, "elapsed_time": "1:41:46", "remaining_time": "8:16:52"} {"current_steps": 860, "total_steps": 5000, "loss": 0.5936, "lr": 1.969616370495806e-05, "epoch": 1.72, "percentage": 17.2, "elapsed_time": "1:42:57", "remaining_time": "8:15:39"} {"current_steps": 870, "total_steps": 5000, "loss": 0.6535, "lr": 1.967884912252619e-05, "epoch": 1.74, "percentage": 17.4, "elapsed_time": "1:44:09", "remaining_time": "8:14:24"} {"current_steps": 880, "total_steps": 5000, "loss": 0.5864, "lr": 1.9661062806642903e-05, "epoch": 1.76, "percentage": 17.6, "elapsed_time": "1:45:20", "remaining_time": "8:13:12"} {"current_steps": 890, "total_steps": 5000, "loss": 0.6181, "lr": 1.964280562418815e-05, "epoch": 1.78, "percentage": 17.8, "elapsed_time": "1:46:32", "remaining_time": "8:11:59"} {"current_steps": 900, "total_steps": 5000, "loss": 0.5736, "lr": 1.962407846499124e-05, "epoch": 1.8, "percentage": 18.0, "elapsed_time": "1:47:43", "remaining_time": "8:10:46"} {"current_steps": 910, "total_steps": 5000, "loss": 0.5769, "lr": 1.96048822417875e-05, "epoch": 1.8199999999999998, "percentage": 18.2, "elapsed_time": "1:48:56", "remaining_time": "8:09:40"} {"current_steps": 920, "total_steps": 5000, "loss": 0.6056, "lr": 1.958521789017376e-05, "epoch": 1.8399999999999999, "percentage": 18.4, "elapsed_time": "1:50:09", "remaining_time": "8:08:29"} {"current_steps": 930, "total_steps": 5000, "loss": 0.6632, "lr": 1.956508636856278e-05, "epoch": 1.8599999999999999, "percentage": 18.6, "elapsed_time": "1:51:20", "remaining_time": "8:07:16"} {"current_steps": 940, "total_steps": 5000, "loss": 0.5803, "lr": 1.9546569379242446e-05, "epoch": 1.88, "percentage": 18.8, "elapsed_time": "1:52:31", "remaining_time": "8:06:00"} {"current_steps": 950, "total_steps": 5000, "loss": 0.6028, "lr": 1.9525552956573244e-05, "epoch": 1.9, "percentage": 19.0, "elapsed_time": "1:53:42", "remaining_time": "8:04:44"} {"current_steps": 960, "total_steps": 5000, "loss": 0.5932, "lr": 1.9504072271891486e-05, "epoch": 1.92, "percentage": 19.2, "elapsed_time": "1:54:54", "remaining_time": "8:03:32"} {"current_steps": 970, "total_steps": 5000, "loss": 0.581, "lr": 1.9482128372135446e-05, "epoch": 1.94, "percentage": 19.4, "elapsed_time": "1:56:06", "remaining_time": "8:02:21"} {"current_steps": 980, "total_steps": 5000, "loss": 0.6207, "lr": 1.945972232681984e-05, "epoch": 1.96, "percentage": 19.6, "elapsed_time": "1:57:18", "remaining_time": "8:01:12"} {"current_steps": 990, "total_steps": 5000, "loss": 0.5576, "lr": 1.9436855227983695e-05, "epoch": 1.98, "percentage": 19.8, "elapsed_time": "1:58:30", "remaining_time": "8:00:00"} {"current_steps": 1000, "total_steps": 5000, "loss": 0.6121, "lr": 1.9413528190137158e-05, "epoch": 2.0, "percentage": 20.0, "elapsed_time": "1:59:42", "remaining_time": "7:58:48"} {"current_steps": 1010, "total_steps": 5000, "loss": 0.5909, "lr": 1.938974235020714e-05, "epoch": 2.02, "percentage": 20.2, "elapsed_time": "2:00:56", "remaining_time": "7:57:45"} {"current_steps": 1020, "total_steps": 5000, "loss": 0.5459, "lr": 1.9365498867481926e-05, "epoch": 2.04, "percentage": 20.4, "elapsed_time": "2:02:07", "remaining_time": "7:56:32"} {"current_steps": 1030, "total_steps": 5000, "loss": 0.5781, "lr": 1.9340798923554657e-05, "epoch": 2.06, "percentage": 20.6, "elapsed_time": "2:03:18", "remaining_time": "7:55:16"} {"current_steps": 1040, "total_steps": 5000, "loss": 0.5284, "lr": 1.931564372226576e-05, "epoch": 2.08, "percentage": 20.8, "elapsed_time": "2:04:30", "remaining_time": "7:54:04"} {"current_steps": 1050, "total_steps": 5000, "loss": 0.5476, "lr": 1.9290034489644247e-05, "epoch": 2.1, "percentage": 21.0, "elapsed_time": "2:05:41", "remaining_time": "7:52:50"} {"current_steps": 1060, "total_steps": 5000, "loss": 0.5386, "lr": 1.9263972473847995e-05, "epoch": 2.12, "percentage": 21.2, "elapsed_time": "2:06:52", "remaining_time": "7:51:36"} {"current_steps": 1070, "total_steps": 5000, "loss": 0.5864, "lr": 1.923745894510288e-05, "epoch": 2.14, "percentage": 21.4, "elapsed_time": "2:08:04", "remaining_time": "7:50:24"} {"current_steps": 1080, "total_steps": 5000, "loss": 0.5413, "lr": 1.9210495195640895e-05, "epoch": 2.16, "percentage": 21.6, "elapsed_time": "2:09:15", "remaining_time": "7:49:10"} {"current_steps": 1090, "total_steps": 5000, "loss": 0.5201, "lr": 1.918308253963715e-05, "epoch": 2.18, "percentage": 21.8, "elapsed_time": "2:10:28", "remaining_time": "7:48:00"} {"current_steps": 1100, "total_steps": 5000, "loss": 0.5658, "lr": 1.9155222313145817e-05, "epoch": 2.2, "percentage": 22.0, "elapsed_time": "2:11:39", "remaining_time": "7:46:47"} {"current_steps": 1110, "total_steps": 5000, "loss": 0.5578, "lr": 1.912691587403503e-05, "epoch": 2.22, "percentage": 22.2, "elapsed_time": "2:12:53", "remaining_time": "7:45:41"} {"current_steps": 1120, "total_steps": 5000, "loss": 0.4792, "lr": 1.9098164601920702e-05, "epoch": 2.24, "percentage": 22.4, "elapsed_time": "2:14:04", "remaining_time": "7:44:29"} {"current_steps": 1130, "total_steps": 5000, "loss": 0.6048, "lr": 1.906896989809927e-05, "epoch": 2.26, "percentage": 22.6, "elapsed_time": "2:15:16", "remaining_time": "7:43:16"} {"current_steps": 1140, "total_steps": 5000, "loss": 0.567, "lr": 1.903933318547942e-05, "epoch": 2.2800000000000002, "percentage": 22.8, "elapsed_time": "2:16:28", "remaining_time": "7:42:06"} {"current_steps": 1150, "total_steps": 5000, "loss": 0.5965, "lr": 1.9009255908512704e-05, "epoch": 2.3, "percentage": 23.0, "elapsed_time": "2:17:40", "remaining_time": "7:40:53"} {"current_steps": 1160, "total_steps": 5000, "loss": 0.5561, "lr": 1.897873953312317e-05, "epoch": 2.32, "percentage": 23.2, "elapsed_time": "2:18:52", "remaining_time": "7:39:43"} {"current_steps": 1170, "total_steps": 5000, "loss": 0.5529, "lr": 1.8947785546635905e-05, "epoch": 2.34, "percentage": 23.4, "elapsed_time": "2:20:04", "remaining_time": "7:38:30"} {"current_steps": 1180, "total_steps": 5000, "loss": 0.5818, "lr": 1.8916395457704536e-05, "epoch": 2.36, "percentage": 23.6, "elapsed_time": "2:21:16", "remaining_time": "7:37:19"} {"current_steps": 1190, "total_steps": 5000, "loss": 0.5558, "lr": 1.888457079623772e-05, "epoch": 2.38, "percentage": 23.8, "elapsed_time": "2:22:28", "remaining_time": "7:36:08"} {"current_steps": 1200, "total_steps": 5000, "loss": 0.5833, "lr": 1.8852313113324553e-05, "epoch": 2.4, "percentage": 24.0, "elapsed_time": "2:23:39", "remaining_time": "7:34:56"} {"current_steps": 1210, "total_steps": 5000, "loss": 0.527, "lr": 1.8819623981158996e-05, "epoch": 2.42, "percentage": 24.2, "elapsed_time": "2:24:52", "remaining_time": "7:33:47"} {"current_steps": 1220, "total_steps": 5000, "loss": 0.5605, "lr": 1.878650499296323e-05, "epoch": 2.44, "percentage": 24.4, "elapsed_time": "2:26:03", "remaining_time": "7:32:32"} {"current_steps": 1230, "total_steps": 5000, "loss": 0.5528, "lr": 1.8752957762910016e-05, "epoch": 2.46, "percentage": 24.6, "elapsed_time": "2:27:14", "remaining_time": "7:31:17"} {"current_steps": 1240, "total_steps": 5000, "loss": 0.5239, "lr": 1.871898392604402e-05, "epoch": 2.48, "percentage": 24.8, "elapsed_time": "2:28:25", "remaining_time": "7:30:03"} {"current_steps": 1250, "total_steps": 5000, "loss": 0.5825, "lr": 1.8684585138202122e-05, "epoch": 2.5, "percentage": 25.0, "elapsed_time": "2:29:36", "remaining_time": "7:28:49"} {"current_steps": 1260, "total_steps": 5000, "loss": 0.5816, "lr": 1.864976307593271e-05, "epoch": 2.52, "percentage": 25.2, "elapsed_time": "2:30:48", "remaining_time": "7:27:38"} {"current_steps": 1270, "total_steps": 5000, "loss": 0.595, "lr": 1.8614519436413968e-05, "epoch": 2.54, "percentage": 25.4, "elapsed_time": "2:32:01", "remaining_time": "7:26:28"} {"current_steps": 1280, "total_steps": 5000, "loss": 0.5828, "lr": 1.8578855937371176e-05, "epoch": 2.56, "percentage": 25.6, "elapsed_time": "2:33:12", "remaining_time": "7:25:15"} {"current_steps": 1290, "total_steps": 5000, "loss": 0.5408, "lr": 1.8542774316992953e-05, "epoch": 2.58, "percentage": 25.8, "elapsed_time": "2:34:24", "remaining_time": "7:24:04"} {"current_steps": 1300, "total_steps": 5000, "loss": 0.5683, "lr": 1.850627633384658e-05, "epoch": 2.6, "percentage": 26.0, "elapsed_time": "2:35:35", "remaining_time": "7:22:50"} {"current_steps": 1310, "total_steps": 5000, "loss": 0.5734, "lr": 1.8469363766792258e-05, "epoch": 2.62, "percentage": 26.2, "elapsed_time": "2:36:48", "remaining_time": "7:21:42"} {"current_steps": 1320, "total_steps": 5000, "loss": 0.5581, "lr": 1.8432038414896432e-05, "epoch": 2.64, "percentage": 26.4, "elapsed_time": "2:38:00", "remaining_time": "7:20:29"} {"current_steps": 1330, "total_steps": 5000, "loss": 0.5781, "lr": 1.8394302097344103e-05, "epoch": 2.66, "percentage": 26.6, "elapsed_time": "2:39:11", "remaining_time": "7:19:17"} {"current_steps": 1340, "total_steps": 5000, "loss": 0.5468, "lr": 1.8356156653350138e-05, "epoch": 2.68, "percentage": 26.8, "elapsed_time": "2:40:22", "remaining_time": "7:18:03"} {"current_steps": 1350, "total_steps": 5000, "loss": 0.543, "lr": 1.8317603942069665e-05, "epoch": 2.7, "percentage": 27.0, "elapsed_time": "2:41:34", "remaining_time": "7:16:51"} {"current_steps": 1360, "total_steps": 5000, "loss": 0.5416, "lr": 1.8278645842507448e-05, "epoch": 2.7199999999999998, "percentage": 27.2, "elapsed_time": "2:42:45", "remaining_time": "7:15:38"} {"current_steps": 1370, "total_steps": 5000, "loss": 0.5692, "lr": 1.8239284253426294e-05, "epoch": 2.74, "percentage": 27.4, "elapsed_time": "2:43:57", "remaining_time": "7:14:26"} {"current_steps": 1380, "total_steps": 5000, "loss": 0.5372, "lr": 1.8199521093254524e-05, "epoch": 2.76, "percentage": 27.6, "elapsed_time": "2:45:08", "remaining_time": "7:13:11"} {"current_steps": 1390, "total_steps": 5000, "loss": 0.5205, "lr": 1.815935829999247e-05, "epoch": 2.7800000000000002, "percentage": 27.8, "elapsed_time": "2:46:19", "remaining_time": "7:11:58"} {"current_steps": 1400, "total_steps": 5000, "loss": 0.5159, "lr": 1.811879783111801e-05, "epoch": 2.8, "percentage": 28.0, "elapsed_time": "2:47:31", "remaining_time": "7:10:45"} {"current_steps": 1410, "total_steps": 5000, "loss": 0.5405, "lr": 1.8077841663491174e-05, "epoch": 2.82, "percentage": 28.2, "elapsed_time": "2:48:44", "remaining_time": "7:09:37"} {"current_steps": 1420, "total_steps": 5000, "loss": 0.5769, "lr": 1.80364917932578e-05, "epoch": 2.84, "percentage": 28.4, "elapsed_time": "2:49:56", "remaining_time": "7:08:26"} {"current_steps": 1430, "total_steps": 5000, "loss": 0.5724, "lr": 1.799475023575222e-05, "epoch": 2.86, "percentage": 28.6, "elapsed_time": "2:51:07", "remaining_time": "7:07:12"} {"current_steps": 1440, "total_steps": 5000, "loss": 0.5603, "lr": 1.795261902539906e-05, "epoch": 2.88, "percentage": 28.8, "elapsed_time": "2:52:19", "remaining_time": "7:06:00"} {"current_steps": 1450, "total_steps": 5000, "loss": 0.5609, "lr": 1.791010021561407e-05, "epoch": 2.9, "percentage": 29.0, "elapsed_time": "2:53:30", "remaining_time": "7:04:47"} {"current_steps": 1460, "total_steps": 5000, "loss": 0.585, "lr": 1.7867195878704062e-05, "epoch": 2.92, "percentage": 29.2, "elapsed_time": "2:54:42", "remaining_time": "7:03:37"} {"current_steps": 1470, "total_steps": 5000, "loss": 0.5818, "lr": 1.7823908105765883e-05, "epoch": 2.94, "percentage": 29.4, "elapsed_time": "2:55:55", "remaining_time": "7:02:26"} {"current_steps": 1480, "total_steps": 5000, "loss": 0.5453, "lr": 1.7780239006584515e-05, "epoch": 2.96, "percentage": 29.6, "elapsed_time": "2:57:06", "remaining_time": "7:01:13"} {"current_steps": 1490, "total_steps": 5000, "loss": 0.5526, "lr": 1.773619070953025e-05, "epoch": 2.98, "percentage": 29.8, "elapsed_time": "2:58:18", "remaining_time": "7:00:01"} {"current_steps": 1500, "total_steps": 5000, "loss": 0.5664, "lr": 1.769176536145494e-05, "epoch": 3.0, "percentage": 30.0, "elapsed_time": "2:59:29", "remaining_time": "6:58:49"} {"current_steps": 1510, "total_steps": 5000, "loss": 0.4993, "lr": 1.7646965127587373e-05, "epoch": 3.02, "percentage": 30.2, "elapsed_time": "3:00:42", "remaining_time": "6:57:39"} {"current_steps": 1520, "total_steps": 5000, "loss": 0.5302, "lr": 1.760179219142774e-05, "epoch": 3.04, "percentage": 30.4, "elapsed_time": "3:01:53", "remaining_time": "6:56:26"} {"current_steps": 1530, "total_steps": 5000, "loss": 0.4995, "lr": 1.7556248754641237e-05, "epoch": 3.06, "percentage": 30.6, "elapsed_time": "3:03:04", "remaining_time": "6:55:12"} {"current_steps": 1540, "total_steps": 5000, "loss": 0.4902, "lr": 1.7510337036950703e-05, "epoch": 3.08, "percentage": 30.8, "elapsed_time": "3:04:17", "remaining_time": "6:54:02"} {"current_steps": 1550, "total_steps": 5000, "loss": 0.5571, "lr": 1.7464059276028497e-05, "epoch": 3.1, "percentage": 31.0, "elapsed_time": "3:05:27", "remaining_time": "6:52:48"} {"current_steps": 1560, "total_steps": 5000, "loss": 0.5441, "lr": 1.7417417727387392e-05, "epoch": 3.12, "percentage": 31.2, "elapsed_time": "3:06:39", "remaining_time": "6:51:36"} {"current_steps": 1570, "total_steps": 5000, "loss": 0.5498, "lr": 1.7370414664270675e-05, "epoch": 3.14, "percentage": 31.4, "elapsed_time": "3:07:52", "remaining_time": "6:50:26"} {"current_steps": 1580, "total_steps": 5000, "loss": 0.4799, "lr": 1.732305237754132e-05, "epoch": 3.16, "percentage": 31.6, "elapsed_time": "3:09:03", "remaining_time": "6:49:13"} {"current_steps": 1590, "total_steps": 5000, "loss": 0.5285, "lr": 1.727533317557037e-05, "epoch": 3.18, "percentage": 31.8, "elapsed_time": "3:10:14", "remaining_time": "6:48:00"} {"current_steps": 1600, "total_steps": 5000, "loss": 0.5328, "lr": 1.7227259384124408e-05, "epoch": 3.2, "percentage": 32.0, "elapsed_time": "3:11:26", "remaining_time": "6:46:49"} {"current_steps": 1610, "total_steps": 5000, "loss": 0.5333, "lr": 1.7178833346252208e-05, "epoch": 3.22, "percentage": 32.2, "elapsed_time": "3:12:40", "remaining_time": "6:45:41"} {"current_steps": 1620, "total_steps": 5000, "loss": 0.5163, "lr": 1.713005742217053e-05, "epoch": 3.24, "percentage": 32.4, "elapsed_time": "3:13:52", "remaining_time": "6:44:30"} {"current_steps": 1630, "total_steps": 5000, "loss": 0.5173, "lr": 1.7080933989149112e-05, "epoch": 3.26, "percentage": 32.6, "elapsed_time": "3:15:04", "remaining_time": "6:43:19"} {"current_steps": 1640, "total_steps": 5000, "loss": 0.5187, "lr": 1.7031465441394766e-05, "epoch": 3.2800000000000002, "percentage": 32.8, "elapsed_time": "3:16:15", "remaining_time": "6:42:05"} {"current_steps": 1650, "total_steps": 5000, "loss": 0.5611, "lr": 1.698165418993473e-05, "epoch": 3.3, "percentage": 33.0, "elapsed_time": "3:17:27", "remaining_time": "6:40:54"} {"current_steps": 1660, "total_steps": 5000, "loss": 0.5381, "lr": 1.6931502662499116e-05, "epoch": 3.32, "percentage": 33.2, "elapsed_time": "3:18:40", "remaining_time": "6:39:43"} {"current_steps": 1670, "total_steps": 5000, "loss": 0.5089, "lr": 1.688101330340263e-05, "epoch": 3.34, "percentage": 33.4, "elapsed_time": "3:19:52", "remaining_time": "6:38:32"} {"current_steps": 1680, "total_steps": 5000, "loss": 0.5538, "lr": 1.683018857342539e-05, "epoch": 3.36, "percentage": 33.6, "elapsed_time": "3:21:04", "remaining_time": "6:37:20"} {"current_steps": 1690, "total_steps": 5000, "loss": 0.5216, "lr": 1.6779030949693044e-05, "epoch": 3.38, "percentage": 33.8, "elapsed_time": "3:22:15", "remaining_time": "6:36:08"} {"current_steps": 1700, "total_steps": 5000, "loss": 0.5356, "lr": 1.6727542925556e-05, "epoch": 3.4, "percentage": 34.0, "elapsed_time": "3:23:27", "remaining_time": "6:34:56"} {"current_steps": 1710, "total_steps": 5000, "loss": 0.497, "lr": 1.667572701046791e-05, "epoch": 3.42, "percentage": 34.2, "elapsed_time": "3:24:40", "remaining_time": "6:33:46"} {"current_steps": 1720, "total_steps": 5000, "loss": 0.4934, "lr": 1.662358572986337e-05, "epoch": 3.44, "percentage": 34.4, "elapsed_time": "3:25:51", "remaining_time": "6:32:33"} {"current_steps": 1730, "total_steps": 5000, "loss": 0.5327, "lr": 1.6571121625034847e-05, "epoch": 3.46, "percentage": 34.6, "elapsed_time": "3:27:03", "remaining_time": "6:31:22"} {"current_steps": 1740, "total_steps": 5000, "loss": 0.4995, "lr": 1.651833725300879e-05, "epoch": 3.48, "percentage": 34.8, "elapsed_time": "3:28:14", "remaining_time": "6:30:10"} {"current_steps": 1750, "total_steps": 5000, "loss": 0.4945, "lr": 1.6465235186421024e-05, "epoch": 3.5, "percentage": 35.0, "elapsed_time": "3:29:26", "remaining_time": "6:28:57"} {"current_steps": 1760, "total_steps": 5000, "loss": 0.4969, "lr": 1.6411818013391357e-05, "epoch": 3.52, "percentage": 35.2, "elapsed_time": "3:30:38", "remaining_time": "6:27:45"} {"current_steps": 1770, "total_steps": 5000, "loss": 0.5133, "lr": 1.6358088337397444e-05, "epoch": 3.54, "percentage": 35.4, "elapsed_time": "3:31:49", "remaining_time": "6:26:32"} {"current_steps": 1780, "total_steps": 5000, "loss": 0.4598, "lr": 1.630404877714789e-05, "epoch": 3.56, "percentage": 35.6, "elapsed_time": "3:33:01", "remaining_time": "6:25:21"} {"current_steps": 1790, "total_steps": 5000, "loss": 0.5721, "lr": 1.6249701966454626e-05, "epoch": 3.58, "percentage": 35.8, "elapsed_time": "3:34:13", "remaining_time": "6:24:09"} {"current_steps": 1800, "total_steps": 5000, "loss": 0.5549, "lr": 1.619505055410453e-05, "epoch": 3.6, "percentage": 36.0, "elapsed_time": "3:35:25", "remaining_time": "6:22:58"} {"current_steps": 1810, "total_steps": 5000, "loss": 0.5192, "lr": 1.614009720373034e-05, "epoch": 3.62, "percentage": 36.2, "elapsed_time": "3:36:38", "remaining_time": "6:21:49"} {"current_steps": 1820, "total_steps": 5000, "loss": 0.4927, "lr": 1.608484459368082e-05, "epoch": 3.64, "percentage": 36.4, "elapsed_time": "3:37:50", "remaining_time": "6:20:37"} {"current_steps": 1830, "total_steps": 5000, "loss": 0.5319, "lr": 1.602929541689025e-05, "epoch": 3.66, "percentage": 36.6, "elapsed_time": "3:39:02", "remaining_time": "6:19:26"} {"current_steps": 1840, "total_steps": 5000, "loss": 0.5025, "lr": 1.5973452380747125e-05, "epoch": 3.68, "percentage": 36.8, "elapsed_time": "3:40:14", "remaining_time": "6:18:14"} {"current_steps": 1850, "total_steps": 5000, "loss": 0.497, "lr": 1.591731820696224e-05, "epoch": 3.7, "percentage": 37.0, "elapsed_time": "3:41:25", "remaining_time": "6:17:02"} {"current_steps": 1860, "total_steps": 5000, "loss": 0.556, "lr": 1.5860895631436044e-05, "epoch": 3.7199999999999998, "percentage": 37.2, "elapsed_time": "3:42:37", "remaining_time": "6:15:49"} {"current_steps": 1870, "total_steps": 5000, "loss": 0.506, "lr": 1.580418740412526e-05, "epoch": 3.74, "percentage": 37.4, "elapsed_time": "3:43:49", "remaining_time": "6:14:37"} {"current_steps": 1880, "total_steps": 5000, "loss": 0.5154, "lr": 1.5747196288908887e-05, "epoch": 3.76, "percentage": 37.6, "elapsed_time": "3:45:00", "remaining_time": "6:13:25"} {"current_steps": 1890, "total_steps": 5000, "loss": 0.5887, "lr": 1.5689925063453483e-05, "epoch": 3.7800000000000002, "percentage": 37.8, "elapsed_time": "3:46:13", "remaining_time": "6:12:14"} {"current_steps": 1900, "total_steps": 5000, "loss": 0.508, "lr": 1.563237651907777e-05, "epoch": 3.8, "percentage": 38.0, "elapsed_time": "3:47:24", "remaining_time": "6:11:02"} {"current_steps": 1910, "total_steps": 5000, "loss": 0.4954, "lr": 1.5574553460616608e-05, "epoch": 3.82, "percentage": 38.2, "elapsed_time": "3:48:38", "remaining_time": "6:09:53"} {"current_steps": 1920, "total_steps": 5000, "loss": 0.5628, "lr": 1.5516458706284306e-05, "epoch": 3.84, "percentage": 38.4, "elapsed_time": "3:49:50", "remaining_time": "6:08:42"} {"current_steps": 1930, "total_steps": 5000, "loss": 0.4494, "lr": 1.5458095087537216e-05, "epoch": 3.86, "percentage": 38.6, "elapsed_time": "3:51:02", "remaining_time": "6:07:30"} {"current_steps": 1940, "total_steps": 5000, "loss": 0.522, "lr": 1.5399465448935788e-05, "epoch": 3.88, "percentage": 38.8, "elapsed_time": "3:52:14", "remaining_time": "6:06:19"} {"current_steps": 1950, "total_steps": 5000, "loss": 0.5225, "lr": 1.5340572648005887e-05, "epoch": 3.9, "percentage": 39.0, "elapsed_time": "3:53:26", "remaining_time": "6:05:07"} {"current_steps": 1960, "total_steps": 5000, "loss": 0.5092, "lr": 1.5281419555099547e-05, "epoch": 3.92, "percentage": 39.2, "elapsed_time": "3:54:38", "remaining_time": "6:03:55"} {"current_steps": 1970, "total_steps": 5000, "loss": 0.5167, "lr": 1.5222009053255061e-05, "epoch": 3.94, "percentage": 39.4, "elapsed_time": "3:55:49", "remaining_time": "6:02:43"} {"current_steps": 1980, "total_steps": 5000, "loss": 0.5198, "lr": 1.5162344038056476e-05, "epoch": 3.96, "percentage": 39.6, "elapsed_time": "3:57:00", "remaining_time": "6:01:30"} {"current_steps": 1990, "total_steps": 5000, "loss": 0.5723, "lr": 1.510242741749246e-05, "epoch": 3.98, "percentage": 39.8, "elapsed_time": "3:58:12", "remaining_time": "6:00:18"} {"current_steps": 2000, "total_steps": 5000, "loss": 0.4707, "lr": 1.5042262111814566e-05, "epoch": 4.0, "percentage": 40.0, "elapsed_time": "3:59:23", "remaining_time": "5:59:05"} {"current_steps": 2010, "total_steps": 5000, "loss": 0.523, "lr": 1.498185105339491e-05, "epoch": 4.02, "percentage": 40.2, "elapsed_time": "4:00:37", "remaining_time": "5:57:56"} {"current_steps": 2020, "total_steps": 5000, "loss": 0.4433, "lr": 1.4921197186583256e-05, "epoch": 4.04, "percentage": 40.4, "elapsed_time": "4:01:48", "remaining_time": "5:56:44"} {"current_steps": 2030, "total_steps": 5000, "loss": 0.4861, "lr": 1.4860303467563504e-05, "epoch": 4.06, "percentage": 40.6, "elapsed_time": "4:03:01", "remaining_time": "5:55:32"} {"current_steps": 2040, "total_steps": 5000, "loss": 0.4621, "lr": 1.4799172864209607e-05, "epoch": 4.08, "percentage": 40.8, "elapsed_time": "4:04:13", "remaining_time": "5:54:21"} {"current_steps": 2050, "total_steps": 5000, "loss": 0.5454, "lr": 1.4737808355940932e-05, "epoch": 4.1, "percentage": 41.0, "elapsed_time": "4:05:25", "remaining_time": "5:53:10"} {"current_steps": 2060, "total_steps": 5000, "loss": 0.4984, "lr": 1.467621293357704e-05, "epoch": 4.12, "percentage": 41.2, "elapsed_time": "4:06:37", "remaining_time": "5:51:58"} {"current_steps": 2070, "total_steps": 5000, "loss": 0.5375, "lr": 1.4614389599191917e-05, "epoch": 4.14, "percentage": 41.4, "elapsed_time": "4:07:49", "remaining_time": "5:50:46"} {"current_steps": 2080, "total_steps": 5000, "loss": 0.5191, "lr": 1.455234136596766e-05, "epoch": 4.16, "percentage": 41.6, "elapsed_time": "4:09:01", "remaining_time": "5:49:36"} {"current_steps": 2090, "total_steps": 5000, "loss": 0.4872, "lr": 1.4490071258047625e-05, "epoch": 4.18, "percentage": 41.8, "elapsed_time": "4:10:14", "remaining_time": "5:48:25"} {"current_steps": 2100, "total_steps": 5000, "loss": 0.4883, "lr": 1.442758231038902e-05, "epoch": 4.2, "percentage": 42.0, "elapsed_time": "4:11:27", "remaining_time": "5:47:14"} {"current_steps": 2110, "total_steps": 5000, "loss": 0.4564, "lr": 1.436487756861499e-05, "epoch": 4.22, "percentage": 42.2, "elapsed_time": "4:12:40", "remaining_time": "5:46:05"} {"current_steps": 2120, "total_steps": 5000, "loss": 0.4311, "lr": 1.4301960088866187e-05, "epoch": 4.24, "percentage": 42.4, "elapsed_time": "4:13:52", "remaining_time": "5:44:52"} {"current_steps": 2130, "total_steps": 5000, "loss": 0.4663, "lr": 1.4238832937651816e-05, "epoch": 4.26, "percentage": 42.6, "elapsed_time": "4:15:02", "remaining_time": "5:43:39"} {"current_steps": 2140, "total_steps": 5000, "loss": 0.5048, "lr": 1.4175499191700169e-05, "epoch": 4.28, "percentage": 42.8, "elapsed_time": "4:16:14", "remaining_time": "5:42:27"} {"current_steps": 2150, "total_steps": 5000, "loss": 0.493, "lr": 1.4111961937808665e-05, "epoch": 4.3, "percentage": 43.0, "elapsed_time": "4:17:27", "remaining_time": "5:41:16"} {"current_steps": 2160, "total_steps": 5000, "loss": 0.4712, "lr": 1.4048224272693426e-05, "epoch": 4.32, "percentage": 43.2, "elapsed_time": "4:18:39", "remaining_time": "5:40:04"} {"current_steps": 2170, "total_steps": 5000, "loss": 0.4641, "lr": 1.3984289302838327e-05, "epoch": 4.34, "percentage": 43.4, "elapsed_time": "4:19:50", "remaining_time": "5:38:52"} {"current_steps": 2180, "total_steps": 5000, "loss": 0.4929, "lr": 1.3920160144343604e-05, "epoch": 4.36, "percentage": 43.6, "elapsed_time": "4:21:02", "remaining_time": "5:37:40"} {"current_steps": 2190, "total_steps": 5000, "loss": 0.5269, "lr": 1.3855839922773968e-05, "epoch": 4.38, "percentage": 43.8, "elapsed_time": "4:22:14", "remaining_time": "5:36:28"} {"current_steps": 2200, "total_steps": 5000, "loss": 0.4857, "lr": 1.3791331773006272e-05, "epoch": 4.4, "percentage": 44.0, "elapsed_time": "4:23:25", "remaining_time": "5:35:15"} {"current_steps": 2210, "total_steps": 5000, "loss": 0.5613, "lr": 1.3726638839076732e-05, "epoch": 4.42, "percentage": 44.2, "elapsed_time": "4:24:38", "remaining_time": "5:34:06"} {"current_steps": 2220, "total_steps": 5000, "loss": 0.4884, "lr": 1.3661764274027678e-05, "epoch": 4.44, "percentage": 44.4, "elapsed_time": "4:25:50", "remaining_time": "5:32:54"} {"current_steps": 2230, "total_steps": 5000, "loss": 0.4849, "lr": 1.3596711239753889e-05, "epoch": 4.46, "percentage": 44.6, "elapsed_time": "4:27:02", "remaining_time": "5:31:42"} {"current_steps": 2240, "total_steps": 5000, "loss": 0.4752, "lr": 1.3531482906848474e-05, "epoch": 4.48, "percentage": 44.8, "elapsed_time": "4:28:14", "remaining_time": "5:30:30"} {"current_steps": 2250, "total_steps": 5000, "loss": 0.4804, "lr": 1.3466082454448364e-05, "epoch": 4.5, "percentage": 45.0, "elapsed_time": "4:29:25", "remaining_time": "5:29:17"} {"current_steps": 2260, "total_steps": 5000, "loss": 0.4719, "lr": 1.340051307007933e-05, "epoch": 4.52, "percentage": 45.2, "elapsed_time": "4:30:37", "remaining_time": "5:28:06"} {"current_steps": 2270, "total_steps": 5000, "loss": 0.4599, "lr": 1.3334777949500673e-05, "epoch": 4.54, "percentage": 45.4, "elapsed_time": "4:31:48", "remaining_time": "5:26:53"} {"current_steps": 2280, "total_steps": 5000, "loss": 0.4712, "lr": 1.3268880296549424e-05, "epoch": 4.5600000000000005, "percentage": 45.6, "elapsed_time": "4:32:59", "remaining_time": "5:25:40"} {"current_steps": 2290, "total_steps": 5000, "loss": 0.4772, "lr": 1.3202823322984228e-05, "epoch": 4.58, "percentage": 45.8, "elapsed_time": "4:34:11", "remaining_time": "5:24:28"} {"current_steps": 2300, "total_steps": 5000, "loss": 0.453, "lr": 1.3136610248328779e-05, "epoch": 4.6, "percentage": 46.0, "elapsed_time": "4:35:22", "remaining_time": "5:23:16"} {"current_steps": 2310, "total_steps": 5000, "loss": 0.4657, "lr": 1.307024429971492e-05, "epoch": 4.62, "percentage": 46.2, "elapsed_time": "4:36:35", "remaining_time": "5:22:05"} {"current_steps": 2320, "total_steps": 5000, "loss": 0.4791, "lr": 1.3003728711725364e-05, "epoch": 4.64, "percentage": 46.4, "elapsed_time": "4:37:46", "remaining_time": "5:20:52"} {"current_steps": 2330, "total_steps": 5000, "loss": 0.5586, "lr": 1.2937066726236029e-05, "epoch": 4.66, "percentage": 46.6, "elapsed_time": "4:38:58", "remaining_time": "5:19:40"} {"current_steps": 2340, "total_steps": 5000, "loss": 0.4603, "lr": 1.2870261592258038e-05, "epoch": 4.68, "percentage": 46.8, "elapsed_time": "4:40:10", "remaining_time": "5:18:28"} {"current_steps": 2350, "total_steps": 5000, "loss": 0.4618, "lr": 1.2803316565779378e-05, "epoch": 4.7, "percentage": 47.0, "elapsed_time": "4:41:21", "remaining_time": "5:17:16"} {"current_steps": 2360, "total_steps": 5000, "loss": 0.4643, "lr": 1.2736234909606186e-05, "epoch": 4.72, "percentage": 47.2, "elapsed_time": "4:42:33", "remaining_time": "5:16:05"} {"current_steps": 2370, "total_steps": 5000, "loss": 0.5017, "lr": 1.2669019893203758e-05, "epoch": 4.74, "percentage": 47.4, "elapsed_time": "4:43:45", "remaining_time": "5:14:53"} {"current_steps": 2380, "total_steps": 5000, "loss": 0.451, "lr": 1.2601674792537157e-05, "epoch": 4.76, "percentage": 47.6, "elapsed_time": "4:44:56", "remaining_time": "5:13:40"} {"current_steps": 2390, "total_steps": 5000, "loss": 0.4763, "lr": 1.2534202889911584e-05, "epoch": 4.78, "percentage": 47.8, "elapsed_time": "4:46:09", "remaining_time": "5:12:29"} {"current_steps": 2400, "total_steps": 5000, "loss": 0.4984, "lr": 1.2466607473812386e-05, "epoch": 4.8, "percentage": 48.0, "elapsed_time": "4:47:21", "remaining_time": "5:11:18"} {"current_steps": 2410, "total_steps": 5000, "loss": 0.4594, "lr": 1.2398891838744777e-05, "epoch": 4.82, "percentage": 48.2, "elapsed_time": "4:48:34", "remaining_time": "5:10:07"} {"current_steps": 2420, "total_steps": 5000, "loss": 0.476, "lr": 1.233105928507328e-05, "epoch": 4.84, "percentage": 48.4, "elapsed_time": "4:49:46", "remaining_time": "5:08:56"} {"current_steps": 2430, "total_steps": 5000, "loss": 0.4599, "lr": 1.226311311886086e-05, "epoch": 4.86, "percentage": 48.6, "elapsed_time": "4:50:58", "remaining_time": "5:07:44"} {"current_steps": 2440, "total_steps": 5000, "loss": 0.4786, "lr": 1.2195056651707806e-05, "epoch": 4.88, "percentage": 48.8, "elapsed_time": "4:52:10", "remaining_time": "5:06:32"} {"current_steps": 2450, "total_steps": 5000, "loss": 0.539, "lr": 1.2126893200590309e-05, "epoch": 4.9, "percentage": 49.0, "elapsed_time": "4:53:22", "remaining_time": "5:05:20"} {"current_steps": 2460, "total_steps": 5000, "loss": 0.442, "lr": 1.2058626087698814e-05, "epoch": 4.92, "percentage": 49.2, "elapsed_time": "4:54:32", "remaining_time": "5:04:07"} {"current_steps": 2470, "total_steps": 5000, "loss": 0.4829, "lr": 1.1990258640276094e-05, "epoch": 4.9399999999999995, "percentage": 49.4, "elapsed_time": "4:55:44", "remaining_time": "5:02:55"} {"current_steps": 2480, "total_steps": 5000, "loss": 0.5055, "lr": 1.1921794190455082e-05, "epoch": 4.96, "percentage": 49.6, "elapsed_time": "4:56:56", "remaining_time": "5:01:44"} {"current_steps": 2490, "total_steps": 5000, "loss": 0.4857, "lr": 1.1853236075096474e-05, "epoch": 4.98, "percentage": 49.8, "elapsed_time": "4:58:08", "remaining_time": "5:00:32"} {"current_steps": 2500, "total_steps": 5000, "loss": 0.4962, "lr": 1.1784587635626095e-05, "epoch": 5.0, "percentage": 50.0, "elapsed_time": "4:59:20", "remaining_time": "4:59:20"} {"current_steps": 2510, "total_steps": 5000, "loss": 0.4185, "lr": 1.171585221787203e-05, "epoch": 5.02, "percentage": 50.2, "elapsed_time": "5:00:33", "remaining_time": "4:58:09"} {"current_steps": 2520, "total_steps": 5000, "loss": 0.4545, "lr": 1.1647033171901573e-05, "epoch": 5.04, "percentage": 50.4, "elapsed_time": "5:01:45", "remaining_time": "4:56:58"} {"current_steps": 2530, "total_steps": 5000, "loss": 0.4162, "lr": 1.157813385185794e-05, "epoch": 5.06, "percentage": 50.6, "elapsed_time": "5:02:56", "remaining_time": "4:55:45"} {"current_steps": 2540, "total_steps": 5000, "loss": 0.425, "lr": 1.1509157615796775e-05, "epoch": 5.08, "percentage": 50.8, "elapsed_time": "5:04:07", "remaining_time": "4:54:33"} {"current_steps": 2550, "total_steps": 5000, "loss": 0.4514, "lr": 1.1440107825522522e-05, "epoch": 5.1, "percentage": 51.0, "elapsed_time": "5:05:19", "remaining_time": "4:53:21"} {"current_steps": 2560, "total_steps": 5000, "loss": 0.4687, "lr": 1.1370987846424547e-05, "epoch": 5.12, "percentage": 51.2, "elapsed_time": "5:06:31", "remaining_time": "4:52:09"} {"current_steps": 2570, "total_steps": 5000, "loss": 0.4892, "lr": 1.1301801047313106e-05, "epoch": 5.14, "percentage": 51.4, "elapsed_time": "5:07:43", "remaining_time": "4:50:57"} {"current_steps": 2580, "total_steps": 5000, "loss": 0.4675, "lr": 1.1232550800255188e-05, "epoch": 5.16, "percentage": 51.6, "elapsed_time": "5:08:55", "remaining_time": "4:49:45"} {"current_steps": 2590, "total_steps": 5000, "loss": 0.4336, "lr": 1.1163240480410136e-05, "epoch": 5.18, "percentage": 51.8, "elapsed_time": "5:10:06", "remaining_time": "4:48:33"} {"current_steps": 2600, "total_steps": 5000, "loss": 0.4358, "lr": 1.1093873465865156e-05, "epoch": 5.2, "percentage": 52.0, "elapsed_time": "5:11:17", "remaining_time": "4:47:20"} {"current_steps": 2610, "total_steps": 5000, "loss": 0.4709, "lr": 1.1024453137470677e-05, "epoch": 5.22, "percentage": 52.2, "elapsed_time": "5:12:30", "remaining_time": "4:46:10"} {"current_steps": 2620, "total_steps": 5000, "loss": 0.4349, "lr": 1.0954982878675564e-05, "epoch": 5.24, "percentage": 52.4, "elapsed_time": "5:13:42", "remaining_time": "4:44:58"} {"current_steps": 2630, "total_steps": 5000, "loss": 0.4581, "lr": 1.0885466075362224e-05, "epoch": 5.26, "percentage": 52.6, "elapsed_time": "5:14:53", "remaining_time": "4:43:45"} {"current_steps": 2640, "total_steps": 5000, "loss": 0.4482, "lr": 1.0815906115681579e-05, "epoch": 5.28, "percentage": 52.8, "elapsed_time": "5:16:05", "remaining_time": "4:42:34"} {"current_steps": 2650, "total_steps": 5000, "loss": 0.4771, "lr": 1.0746306389887924e-05, "epoch": 5.3, "percentage": 53.0, "elapsed_time": "5:17:17", "remaining_time": "4:41:22"} {"current_steps": 2660, "total_steps": 5000, "loss": 0.4893, "lr": 1.067667029017371e-05, "epoch": 5.32, "percentage": 53.2, "elapsed_time": "5:18:28", "remaining_time": "4:40:09"} {"current_steps": 2670, "total_steps": 5000, "loss": 0.4823, "lr": 1.060700121050419e-05, "epoch": 5.34, "percentage": 53.4, "elapsed_time": "5:19:40", "remaining_time": "4:38:57"} {"current_steps": 2680, "total_steps": 5000, "loss": 0.45, "lr": 1.0537302546452022e-05, "epoch": 5.36, "percentage": 53.6, "elapsed_time": "5:20:52", "remaining_time": "4:37:46"} {"current_steps": 2690, "total_steps": 5000, "loss": 0.4817, "lr": 1.0467577695031763e-05, "epoch": 5.38, "percentage": 53.8, "elapsed_time": "5:22:04", "remaining_time": "4:36:34"} {"current_steps": 2700, "total_steps": 5000, "loss": 0.4472, "lr": 1.03978300545343e-05, "epoch": 5.4, "percentage": 54.0, "elapsed_time": "5:23:15", "remaining_time": "4:35:22"} {"current_steps": 2710, "total_steps": 5000, "loss": 0.4351, "lr": 1.0328063024361232e-05, "epoch": 5.42, "percentage": 54.2, "elapsed_time": "5:24:28", "remaining_time": "4:34:11"} {"current_steps": 2720, "total_steps": 5000, "loss": 0.4052, "lr": 1.0258280004859189e-05, "epoch": 5.44, "percentage": 54.4, "elapsed_time": "5:25:40", "remaining_time": "4:32:59"} {"current_steps": 2730, "total_steps": 5000, "loss": 0.51, "lr": 1.0188484397154083e-05, "epoch": 5.46, "percentage": 54.6, "elapsed_time": "5:26:52", "remaining_time": "4:31:48"} {"current_steps": 2740, "total_steps": 5000, "loss": 0.4678, "lr": 1.0118679602985373e-05, "epoch": 5.48, "percentage": 54.8, "elapsed_time": "5:28:04", "remaining_time": "4:30:35"} {"current_steps": 2750, "total_steps": 5000, "loss": 0.4802, "lr": 1.0048869024540247e-05, "epoch": 5.5, "percentage": 55.0, "elapsed_time": "5:29:15", "remaining_time": "4:29:23"} {"current_steps": 2760, "total_steps": 5000, "loss": 0.4416, "lr": 9.979056064287807e-06, "epoch": 5.52, "percentage": 55.2, "elapsed_time": "5:30:26", "remaining_time": "4:28:11"} {"current_steps": 2770, "total_steps": 5000, "loss": 0.4613, "lr": 9.909244124813246e-06, "epoch": 5.54, "percentage": 55.4, "elapsed_time": "5:31:38", "remaining_time": "4:26:59"} {"current_steps": 2780, "total_steps": 5000, "loss": 0.4163, "lr": 9.839436608652007e-06, "epoch": 5.5600000000000005, "percentage": 55.6, "elapsed_time": "5:32:50", "remaining_time": "4:25:47"} {"current_steps": 2790, "total_steps": 5000, "loss": 0.4753, "lr": 9.76963691812394e-06, "epoch": 5.58, "percentage": 55.8, "elapsed_time": "5:34:03", "remaining_time": "4:24:36"} {"current_steps": 2800, "total_steps": 5000, "loss": 0.4725, "lr": 9.699848455167489e-06, "epoch": 5.6, "percentage": 56.0, "elapsed_time": "5:35:15", "remaining_time": "4:23:24"} {"current_steps": 2810, "total_steps": 5000, "loss": 0.4521, "lr": 9.630074621173882e-06, "epoch": 5.62, "percentage": 56.2, "elapsed_time": "5:36:28", "remaining_time": "4:22:14"} {"current_steps": 2820, "total_steps": 5000, "loss": 0.3838, "lr": 9.560318816821354e-06, "epoch": 5.64, "percentage": 56.4, "elapsed_time": "5:37:39", "remaining_time": "4:21:01"} {"current_steps": 2830, "total_steps": 5000, "loss": 0.4603, "lr": 9.490584441909392e-06, "epoch": 5.66, "percentage": 56.6, "elapsed_time": "5:38:50", "remaining_time": "4:19:49"} {"current_steps": 2840, "total_steps": 5000, "loss": 0.4538, "lr": 9.420874895193056e-06, "epoch": 5.68, "percentage": 56.8, "elapsed_time": "5:40:03", "remaining_time": "4:18:37"} {"current_steps": 2850, "total_steps": 5000, "loss": 0.4527, "lr": 9.351193574217305e-06, "epoch": 5.7, "percentage": 57.0, "elapsed_time": "5:41:14", "remaining_time": "4:17:25"} {"current_steps": 2860, "total_steps": 5000, "loss": 0.4915, "lr": 9.281543875151419e-06, "epoch": 5.72, "percentage": 57.2, "elapsed_time": "5:42:27", "remaining_time": "4:16:14"} {"current_steps": 2870, "total_steps": 5000, "loss": 0.4338, "lr": 9.211929192623466e-06, "epoch": 5.74, "percentage": 57.4, "elapsed_time": "5:43:38", "remaining_time": "4:15:02"} {"current_steps": 2880, "total_steps": 5000, "loss": 0.4573, "lr": 9.142352919554862e-06, "epoch": 5.76, "percentage": 57.6, "elapsed_time": "5:44:49", "remaining_time": "4:13:49"} {"current_steps": 2890, "total_steps": 5000, "loss": 0.4494, "lr": 9.072818446995e-06, "epoch": 5.78, "percentage": 57.8, "elapsed_time": "5:46:01", "remaining_time": "4:12:38"} {"current_steps": 2900, "total_steps": 5000, "loss": 0.5061, "lr": 9.003329163955973e-06, "epoch": 5.8, "percentage": 58.0, "elapsed_time": "5:47:13", "remaining_time": "4:11:26"} {"current_steps": 2910, "total_steps": 5000, "loss": 0.4537, "lr": 8.933888457247402e-06, "epoch": 5.82, "percentage": 58.2, "elapsed_time": "5:48:27", "remaining_time": "4:10:15"} {"current_steps": 2920, "total_steps": 5000, "loss": 0.4764, "lr": 8.864499711311362e-06, "epoch": 5.84, "percentage": 58.4, "elapsed_time": "5:49:38", "remaining_time": "4:09:03"} {"current_steps": 2930, "total_steps": 5000, "loss": 0.4563, "lr": 8.79516630805745e-06, "epoch": 5.86, "percentage": 58.6, "elapsed_time": "5:50:50", "remaining_time": "4:07:51"} {"current_steps": 2940, "total_steps": 5000, "loss": 0.4887, "lr": 8.725891626697912e-06, "epoch": 5.88, "percentage": 58.8, "elapsed_time": "5:52:03", "remaining_time": "4:06:40"} {"current_steps": 2950, "total_steps": 5000, "loss": 0.446, "lr": 8.656679043582986e-06, "epoch": 5.9, "percentage": 59.0, "elapsed_time": "5:53:13", "remaining_time": "4:05:28"} {"current_steps": 2960, "total_steps": 5000, "loss": 0.4533, "lr": 8.587531932036334e-06, "epoch": 5.92, "percentage": 59.2, "elapsed_time": "5:54:26", "remaining_time": "4:04:16"} {"current_steps": 2970, "total_steps": 5000, "loss": 0.4451, "lr": 8.518453662190622e-06, "epoch": 5.9399999999999995, "percentage": 59.4, "elapsed_time": "5:55:37", "remaining_time": "4:03:04"} {"current_steps": 2980, "total_steps": 5000, "loss": 0.393, "lr": 8.449447600823262e-06, "epoch": 5.96, "percentage": 59.6, "elapsed_time": "5:56:49", "remaining_time": "4:01:52"} {"current_steps": 2990, "total_steps": 5000, "loss": 0.4406, "lr": 8.380517111192336e-06, "epoch": 5.98, "percentage": 59.8, "elapsed_time": "5:58:00", "remaining_time": "4:00:39"} {"current_steps": 3000, "total_steps": 5000, "loss": 0.474, "lr": 8.311665552872662e-06, "epoch": 6.0, "percentage": 60.0, "elapsed_time": "5:59:11", "remaining_time": "3:59:27"} {"current_steps": 3010, "total_steps": 5000, "loss": 0.3953, "lr": 8.242896281592057e-06, "epoch": 6.02, "percentage": 60.2, "elapsed_time": "6:00:25", "remaining_time": "3:58:17"} {"current_steps": 3020, "total_steps": 5000, "loss": 0.4117, "lr": 8.174212649067781e-06, "epoch": 6.04, "percentage": 60.4, "elapsed_time": "6:01:37", "remaining_time": "3:57:05"} {"current_steps": 3030, "total_steps": 5000, "loss": 0.3988, "lr": 8.10561800284319e-06, "epoch": 6.06, "percentage": 60.6, "elapsed_time": "6:02:48", "remaining_time": "3:55:52"} {"current_steps": 3040, "total_steps": 5000, "loss": 0.418, "lr": 8.037115686124564e-06, "epoch": 6.08, "percentage": 60.8, "elapsed_time": "6:04:00", "remaining_time": "3:54:41"} {"current_steps": 3050, "total_steps": 5000, "loss": 0.4084, "lr": 7.96870903761818e-06, "epoch": 6.1, "percentage": 61.0, "elapsed_time": "6:05:11", "remaining_time": "3:53:29"} {"current_steps": 3060, "total_steps": 5000, "loss": 0.3739, "lr": 7.900401391367576e-06, "epoch": 6.12, "percentage": 61.2, "elapsed_time": "6:06:22", "remaining_time": "3:52:16"} {"current_steps": 3070, "total_steps": 5000, "loss": 0.3763, "lr": 7.832196076591067e-06, "epoch": 6.14, "percentage": 61.4, "elapsed_time": "6:07:33", "remaining_time": "3:51:04"} {"current_steps": 3080, "total_steps": 5000, "loss": 0.4522, "lr": 7.76409641751947e-06, "epoch": 6.16, "percentage": 61.6, "elapsed_time": "6:08:45", "remaining_time": "3:49:52"} {"current_steps": 3090, "total_steps": 5000, "loss": 0.4661, "lr": 7.696105733234099e-06, "epoch": 6.18, "percentage": 61.8, "elapsed_time": "6:09:57", "remaining_time": "3:48:41"} {"current_steps": 3100, "total_steps": 5000, "loss": 0.4519, "lr": 7.628227337504972e-06, "epoch": 6.2, "percentage": 62.0, "elapsed_time": "6:11:09", "remaining_time": "3:47:29"} {"current_steps": 3110, "total_steps": 5000, "loss": 0.4073, "lr": 7.560464538629345e-06, "epoch": 6.22, "percentage": 62.2, "elapsed_time": "6:12:23", "remaining_time": "3:46:18"} {"current_steps": 3120, "total_steps": 5000, "loss": 0.4458, "lr": 7.492820639270435e-06, "epoch": 6.24, "percentage": 62.4, "elapsed_time": "6:13:35", "remaining_time": "3:45:06"} {"current_steps": 3130, "total_steps": 5000, "loss": 0.3703, "lr": 7.4252989362964635e-06, "epoch": 6.26, "percentage": 62.6, "elapsed_time": "6:14:47", "remaining_time": "3:43:54"} {"current_steps": 3140, "total_steps": 5000, "loss": 0.4393, "lr": 7.357902720619976e-06, "epoch": 6.28, "percentage": 62.8, "elapsed_time": "6:15:59", "remaining_time": "3:42:43"} {"current_steps": 3150, "total_steps": 5000, "loss": 0.437, "lr": 7.290635277037442e-06, "epoch": 6.3, "percentage": 63.0, "elapsed_time": "6:17:11", "remaining_time": "3:41:31"} {"current_steps": 3160, "total_steps": 5000, "loss": 0.3979, "lr": 7.22349988406916e-06, "epoch": 6.32, "percentage": 63.2, "elapsed_time": "6:18:23", "remaining_time": "3:40:19"} {"current_steps": 3170, "total_steps": 5000, "loss": 0.4078, "lr": 7.156499813799477e-06, "epoch": 6.34, "percentage": 63.4, "elapsed_time": "6:19:35", "remaining_time": "3:39:07"} {"current_steps": 3180, "total_steps": 5000, "loss": 0.4182, "lr": 7.0896383317172845e-06, "epoch": 6.36, "percentage": 63.6, "elapsed_time": "6:20:47", "remaining_time": "3:37:55"} {"current_steps": 3190, "total_steps": 5000, "loss": 0.4239, "lr": 7.022918696556896e-06, "epoch": 6.38, "percentage": 63.8, "elapsed_time": "6:21:59", "remaining_time": "3:36:44"} {"current_steps": 3200, "total_steps": 5000, "loss": 0.4369, "lr": 6.956344160139201e-06, "epoch": 6.4, "percentage": 64.0, "elapsed_time": "6:23:11", "remaining_time": "3:35:32"} {"current_steps": 3210, "total_steps": 5000, "loss": 0.4469, "lr": 6.889917967213184e-06, "epoch": 6.42, "percentage": 64.2, "elapsed_time": "6:24:25", "remaining_time": "3:34:22"} {"current_steps": 3220, "total_steps": 5000, "loss": 0.4312, "lr": 6.823643355297774e-06, "epoch": 6.44, "percentage": 64.4, "elapsed_time": "6:25:37", "remaining_time": "3:33:10"} {"current_steps": 3230, "total_steps": 5000, "loss": 0.4465, "lr": 6.757523554524056e-06, "epoch": 6.46, "percentage": 64.6, "elapsed_time": "6:26:50", "remaining_time": "3:31:59"} {"current_steps": 3240, "total_steps": 5000, "loss": 0.4201, "lr": 6.69156178747784e-06, "epoch": 6.48, "percentage": 64.8, "elapsed_time": "6:28:01", "remaining_time": "3:30:46"} {"current_steps": 3250, "total_steps": 5000, "loss": 0.3882, "lr": 6.62576126904259e-06, "epoch": 6.5, "percentage": 65.0, "elapsed_time": "6:29:12", "remaining_time": "3:29:34"} {"current_steps": 3260, "total_steps": 5000, "loss": 0.4448, "lr": 6.560125206242746e-06, "epoch": 6.52, "percentage": 65.2, "elapsed_time": "6:30:24", "remaining_time": "3:28:22"} {"current_steps": 3270, "total_steps": 5000, "loss": 0.3915, "lr": 6.494656798087412e-06, "epoch": 6.54, "percentage": 65.4, "elapsed_time": "6:31:35", "remaining_time": "3:27:10"} {"current_steps": 3280, "total_steps": 5000, "loss": 0.3769, "lr": 6.4293592354144365e-06, "epoch": 6.5600000000000005, "percentage": 65.6, "elapsed_time": "6:32:47", "remaining_time": "3:25:58"} {"current_steps": 3290, "total_steps": 5000, "loss": 0.4503, "lr": 6.364235700734903e-06, "epoch": 6.58, "percentage": 65.8, "elapsed_time": "6:33:59", "remaining_time": "3:24:46"} {"current_steps": 3300, "total_steps": 5000, "loss": 0.4398, "lr": 6.299289368078016e-06, "epoch": 6.6, "percentage": 66.0, "elapsed_time": "6:35:10", "remaining_time": "3:23:34"} {"current_steps": 3310, "total_steps": 5000, "loss": 0.4199, "lr": 6.234523402836408e-06, "epoch": 6.62, "percentage": 66.2, "elapsed_time": "6:36:23", "remaining_time": "3:22:23"} {"current_steps": 3320, "total_steps": 5000, "loss": 0.4574, "lr": 6.169940961611853e-06, "epoch": 6.64, "percentage": 66.4, "elapsed_time": "6:37:36", "remaining_time": "3:21:11"} {"current_steps": 3330, "total_steps": 5000, "loss": 0.4252, "lr": 6.1055451920614165e-06, "epoch": 6.66, "percentage": 66.6, "elapsed_time": "6:38:47", "remaining_time": "3:19:59"} {"current_steps": 3340, "total_steps": 5000, "loss": 0.4069, "lr": 6.0413392327440635e-06, "epoch": 6.68, "percentage": 66.8, "elapsed_time": "6:39:59", "remaining_time": "3:18:47"} {"current_steps": 3350, "total_steps": 5000, "loss": 0.4173, "lr": 5.977326212967671e-06, "epoch": 6.7, "percentage": 67.0, "elapsed_time": "6:41:11", "remaining_time": "3:17:36"} {"current_steps": 3360, "total_steps": 5000, "loss": 0.3737, "lr": 5.913509252636511e-06, "epoch": 6.72, "percentage": 67.2, "elapsed_time": "6:42:22", "remaining_time": "3:16:23"} {"current_steps": 3370, "total_steps": 5000, "loss": 0.437, "lr": 5.849891462099199e-06, "epoch": 6.74, "percentage": 67.4, "elapsed_time": "6:43:34", "remaining_time": "3:15:11"} {"current_steps": 3380, "total_steps": 5000, "loss": 0.4457, "lr": 5.786475941997094e-06, "epoch": 6.76, "percentage": 67.6, "elapsed_time": "6:44:46", "remaining_time": "3:14:00"} {"current_steps": 3390, "total_steps": 5000, "loss": 0.3989, "lr": 5.723265783113181e-06, "epoch": 6.78, "percentage": 67.8, "elapsed_time": "6:45:58", "remaining_time": "3:12:48"} {"current_steps": 3400, "total_steps": 5000, "loss": 0.4314, "lr": 5.660264066221426e-06, "epoch": 6.8, "percentage": 68.0, "elapsed_time": "6:47:10", "remaining_time": "3:11:36"} {"current_steps": 3410, "total_steps": 5000, "loss": 0.3989, "lr": 5.59747386193663e-06, "epoch": 6.82, "percentage": 68.2, "elapsed_time": "6:48:23", "remaining_time": "3:10:25"} {"current_steps": 3420, "total_steps": 5000, "loss": 0.3792, "lr": 5.534898230564765e-06, "epoch": 6.84, "percentage": 68.4, "elapsed_time": "6:49:34", "remaining_time": "3:09:13"} {"current_steps": 3430, "total_steps": 5000, "loss": 0.4115, "lr": 5.472540221953824e-06, "epoch": 6.86, "percentage": 68.6, "elapsed_time": "6:50:45", "remaining_time": "3:08:01"} {"current_steps": 3440, "total_steps": 5000, "loss": 0.4067, "lr": 5.41040287534517e-06, "epoch": 6.88, "percentage": 68.8, "elapsed_time": "6:51:57", "remaining_time": "3:06:49"} {"current_steps": 3450, "total_steps": 5000, "loss": 0.4424, "lr": 5.348489219225417e-06, "epoch": 6.9, "percentage": 69.0, "elapsed_time": "6:53:08", "remaining_time": "3:05:37"} {"current_steps": 3460, "total_steps": 5000, "loss": 0.4508, "lr": 5.286802271178815e-06, "epoch": 6.92, "percentage": 69.2, "elapsed_time": "6:54:21", "remaining_time": "3:04:25"} {"current_steps": 3470, "total_steps": 5000, "loss": 0.3984, "lr": 5.225345037740186e-06, "epoch": 6.9399999999999995, "percentage": 69.4, "elapsed_time": "6:55:32", "remaining_time": "3:03:13"} {"current_steps": 3480, "total_steps": 5000, "loss": 0.4499, "lr": 5.16412051424839e-06, "epoch": 6.96, "percentage": 69.6, "elapsed_time": "6:56:43", "remaining_time": "3:02:00"} {"current_steps": 3490, "total_steps": 5000, "loss": 0.4154, "lr": 5.103131684700315e-06, "epoch": 6.98, "percentage": 69.8, "elapsed_time": "6:57:54", "remaining_time": "3:00:49"} {"current_steps": 3500, "total_steps": 5000, "loss": 0.391, "lr": 5.042381521605473e-06, "epoch": 7.0, "percentage": 70.0, "elapsed_time": "6:59:06", "remaining_time": "2:59:37"} {"current_steps": 3510, "total_steps": 5000, "loss": 0.38, "lr": 4.981872985841115e-06, "epoch": 7.02, "percentage": 70.2, "elapsed_time": "7:00:19", "remaining_time": "2:58:25"} {"current_steps": 3520, "total_steps": 5000, "loss": 0.3478, "lr": 4.921609026507907e-06, "epoch": 7.04, "percentage": 70.4, "elapsed_time": "7:01:30", "remaining_time": "2:57:13"} {"current_steps": 3530, "total_steps": 5000, "loss": 0.3712, "lr": 4.861592580786205e-06, "epoch": 7.06, "percentage": 70.6, "elapsed_time": "7:02:41", "remaining_time": "2:56:01"} {"current_steps": 3540, "total_steps": 5000, "loss": 0.3801, "lr": 4.801826573792905e-06, "epoch": 7.08, "percentage": 70.8, "elapsed_time": "7:03:53", "remaining_time": "2:54:49"} {"current_steps": 3550, "total_steps": 5000, "loss": 0.3881, "lr": 4.7423139184388725e-06, "epoch": 7.1, "percentage": 71.0, "elapsed_time": "7:05:05", "remaining_time": "2:53:37"} {"current_steps": 3560, "total_steps": 5000, "loss": 0.3489, "lr": 4.6830575152869615e-06, "epoch": 7.12, "percentage": 71.2, "elapsed_time": "7:06:17", "remaining_time": "2:52:25"} {"current_steps": 3570, "total_steps": 5000, "loss": 0.4284, "lr": 4.62406025241067e-06, "epoch": 7.14, "percentage": 71.4, "elapsed_time": "7:07:28", "remaining_time": "2:51:13"} {"current_steps": 3580, "total_steps": 5000, "loss": 0.4055, "lr": 4.565325005253356e-06, "epoch": 7.16, "percentage": 71.6, "elapsed_time": "7:08:40", "remaining_time": "2:50:01"} {"current_steps": 3590, "total_steps": 5000, "loss": 0.3627, "lr": 4.506854636488103e-06, "epoch": 7.18, "percentage": 71.8, "elapsed_time": "7:09:51", "remaining_time": "2:48:49"} {"current_steps": 3600, "total_steps": 5000, "loss": 0.3866, "lr": 4.44865199587819e-06, "epoch": 7.2, "percentage": 72.0, "elapsed_time": "7:11:03", "remaining_time": "2:47:37"} {"current_steps": 3610, "total_steps": 5000, "loss": 0.3947, "lr": 4.39071992013822e-06, "epoch": 7.22, "percentage": 72.2, "elapsed_time": "7:12:17", "remaining_time": "2:46:27"} {"current_steps": 3620, "total_steps": 5000, "loss": 0.4266, "lr": 4.3330612327958265e-06, "epoch": 7.24, "percentage": 72.4, "elapsed_time": "7:13:30", "remaining_time": "2:45:15"} {"current_steps": 3630, "total_steps": 5000, "loss": 0.3495, "lr": 4.275678744054094e-06, "epoch": 7.26, "percentage": 72.6, "elapsed_time": "7:14:41", "remaining_time": "2:44:03"} {"current_steps": 3640, "total_steps": 5000, "loss": 0.4153, "lr": 4.218575250654559e-06, "epoch": 7.28, "percentage": 72.8, "elapsed_time": "7:15:54", "remaining_time": "2:42:52"} {"current_steps": 3650, "total_steps": 5000, "loss": 0.3819, "lr": 4.161753535740932e-06, "epoch": 7.3, "percentage": 73.0, "elapsed_time": "7:17:06", "remaining_time": "2:41:40"} {"current_steps": 3660, "total_steps": 5000, "loss": 0.4032, "lr": 4.105216368723437e-06, "epoch": 7.32, "percentage": 73.2, "elapsed_time": "7:18:18", "remaining_time": "2:40:28"} {"current_steps": 3670, "total_steps": 5000, "loss": 0.358, "lr": 4.048966505143831e-06, "epoch": 7.34, "percentage": 73.4, "elapsed_time": "7:19:30", "remaining_time": "2:39:16"} {"current_steps": 3680, "total_steps": 5000, "loss": 0.4101, "lr": 3.993006686541108e-06, "epoch": 7.36, "percentage": 73.6, "elapsed_time": "7:20:41", "remaining_time": "2:38:04"} {"current_steps": 3690, "total_steps": 5000, "loss": 0.3803, "lr": 3.937339640317879e-06, "epoch": 7.38, "percentage": 73.8, "elapsed_time": "7:21:54", "remaining_time": "2:36:52"} {"current_steps": 3700, "total_steps": 5000, "loss": 0.3844, "lr": 3.88196807960744e-06, "epoch": 7.4, "percentage": 74.0, "elapsed_time": "7:23:06", "remaining_time": "2:35:41"} {"current_steps": 3710, "total_steps": 5000, "loss": 0.3536, "lr": 3.826894703141552e-06, "epoch": 7.42, "percentage": 74.2, "elapsed_time": "7:24:19", "remaining_time": "2:34:29"} {"current_steps": 3720, "total_steps": 5000, "loss": 0.3957, "lr": 3.772122195118877e-06, "epoch": 7.44, "percentage": 74.4, "elapsed_time": "7:25:31", "remaining_time": "2:33:17"} {"current_steps": 3730, "total_steps": 5000, "loss": 0.4308, "lr": 3.7176532250741857e-06, "epoch": 7.46, "percentage": 74.6, "elapsed_time": "7:26:44", "remaining_time": "2:32:06"} {"current_steps": 3740, "total_steps": 5000, "loss": 0.3988, "lr": 3.663490447748236e-06, "epoch": 7.48, "percentage": 74.8, "elapsed_time": "7:27:56", "remaining_time": "2:30:54"} {"current_steps": 3750, "total_steps": 5000, "loss": 0.3983, "lr": 3.6096365029583803e-06, "epoch": 7.5, "percentage": 75.0, "elapsed_time": "7:29:08", "remaining_time": "2:29:42"} {"current_steps": 3760, "total_steps": 5000, "loss": 0.37, "lr": 3.5560940154699133e-06, "epoch": 7.52, "percentage": 75.2, "elapsed_time": "7:30:19", "remaining_time": "2:28:30"} {"current_steps": 3770, "total_steps": 5000, "loss": 0.3645, "lr": 3.502865594868136e-06, "epoch": 7.54, "percentage": 75.4, "elapsed_time": "7:31:30", "remaining_time": "2:27:18"} {"current_steps": 3780, "total_steps": 5000, "loss": 0.4179, "lr": 3.4499538354311757e-06, "epoch": 7.5600000000000005, "percentage": 75.6, "elapsed_time": "7:32:42", "remaining_time": "2:26:06"} {"current_steps": 3790, "total_steps": 5000, "loss": 0.324, "lr": 3.397361316003539e-06, "epoch": 7.58, "percentage": 75.8, "elapsed_time": "7:33:54", "remaining_time": "2:24:54"} {"current_steps": 3800, "total_steps": 5000, "loss": 0.3789, "lr": 3.3450905998704274e-06, "epoch": 7.6, "percentage": 76.0, "elapsed_time": "7:35:06", "remaining_time": "2:23:42"} {"current_steps": 3810, "total_steps": 5000, "loss": 0.3608, "lr": 3.2931442346328e-06, "epoch": 7.62, "percentage": 76.2, "elapsed_time": "7:36:19", "remaining_time": "2:22:31"} {"current_steps": 3820, "total_steps": 5000, "loss": 0.3985, "lr": 3.241524752083215e-06, "epoch": 7.64, "percentage": 76.4, "elapsed_time": "7:37:30", "remaining_time": "2:21:19"} {"current_steps": 3830, "total_steps": 5000, "loss": 0.3447, "lr": 3.190234668082427e-06, "epoch": 7.66, "percentage": 76.6, "elapsed_time": "7:38:42", "remaining_time": "2:20:07"} {"current_steps": 3840, "total_steps": 5000, "loss": 0.3426, "lr": 3.1392764824367706e-06, "epoch": 7.68, "percentage": 76.8, "elapsed_time": "7:39:53", "remaining_time": "2:18:55"} {"current_steps": 3850, "total_steps": 5000, "loss": 0.3576, "lr": 3.0886526787763237e-06, "epoch": 7.7, "percentage": 77.0, "elapsed_time": "7:41:05", "remaining_time": "2:17:43"} {"current_steps": 3860, "total_steps": 5000, "loss": 0.3928, "lr": 3.038365724433858e-06, "epoch": 7.72, "percentage": 77.2, "elapsed_time": "7:42:16", "remaining_time": "2:16:31"} {"current_steps": 3870, "total_steps": 5000, "loss": 0.3589, "lr": 2.988418070324577e-06, "epoch": 7.74, "percentage": 77.4, "elapsed_time": "7:43:28", "remaining_time": "2:15:19"} {"current_steps": 3880, "total_steps": 5000, "loss": 0.3851, "lr": 2.938812150826684e-06, "epoch": 7.76, "percentage": 77.6, "elapsed_time": "7:44:40", "remaining_time": "2:14:07"} {"current_steps": 3890, "total_steps": 5000, "loss": 0.3688, "lr": 2.8895503836627105e-06, "epoch": 7.78, "percentage": 77.8, "elapsed_time": "7:45:51", "remaining_time": "2:12:55"} {"current_steps": 3900, "total_steps": 5000, "loss": 0.3585, "lr": 2.840635169781688e-06, "epoch": 7.8, "percentage": 78.0, "elapsed_time": "7:47:03", "remaining_time": "2:11:44"} {"current_steps": 3910, "total_steps": 5000, "loss": 0.3653, "lr": 2.7920688932421337e-06, "epoch": 7.82, "percentage": 78.2, "elapsed_time": "7:48:16", "remaining_time": "2:10:32"} {"current_steps": 3920, "total_steps": 5000, "loss": 0.3512, "lr": 2.7438539210958483e-06, "epoch": 7.84, "percentage": 78.4, "elapsed_time": "7:49:28", "remaining_time": "2:09:20"} {"current_steps": 3930, "total_steps": 5000, "loss": 0.3717, "lr": 2.6959926032725537e-06, "epoch": 7.86, "percentage": 78.6, "elapsed_time": "7:50:39", "remaining_time": "2:08:08"} {"current_steps": 3940, "total_steps": 5000, "loss": 0.3806, "lr": 2.648487272465361e-06, "epoch": 7.88, "percentage": 78.8, "elapsed_time": "7:51:51", "remaining_time": "2:06:56"} {"current_steps": 3950, "total_steps": 5000, "loss": 0.3993, "lr": 2.6013402440170676e-06, "epoch": 7.9, "percentage": 79.0, "elapsed_time": "7:53:04", "remaining_time": "2:05:45"} {"current_steps": 3960, "total_steps": 5000, "loss": 0.3387, "lr": 2.5545538158073278e-06, "epoch": 7.92, "percentage": 79.2, "elapsed_time": "7:54:15", "remaining_time": "2:04:33"} {"current_steps": 3970, "total_steps": 5000, "loss": 0.37, "lr": 2.512756228659141e-06, "epoch": 7.9399999999999995, "percentage": 79.4, "elapsed_time": "7:55:26", "remaining_time": "2:03:21"} {"current_steps": 3980, "total_steps": 5000, "loss": 0.3967, "lr": 2.4666612085261344e-06, "epoch": 7.96, "percentage": 79.6, "elapsed_time": "7:56:38", "remaining_time": "2:02:09"} {"current_steps": 3990, "total_steps": 5000, "loss": 0.4029, "lr": 2.420933352697865e-06, "epoch": 7.98, "percentage": 79.8, "elapsed_time": "7:57:50", "remaining_time": "2:00:57"} {"current_steps": 4000, "total_steps": 5000, "loss": 0.3713, "lr": 2.37557488988552e-06, "epoch": 8.0, "percentage": 80.0, "elapsed_time": "7:59:01", "remaining_time": "1:59:45"} {"current_steps": 4010, "total_steps": 5000, "loss": 0.3232, "lr": 2.3305880307965834e-06, "epoch": 8.02, "percentage": 80.2, "elapsed_time": "8:00:14", "remaining_time": "1:58:33"} {"current_steps": 4020, "total_steps": 5000, "loss": 0.331, "lr": 2.2859749680270983e-06, "epoch": 8.04, "percentage": 80.4, "elapsed_time": "8:01:26", "remaining_time": "1:57:22"} {"current_steps": 4030, "total_steps": 5000, "loss": 0.3818, "lr": 2.241737875954808e-06, "epoch": 8.06, "percentage": 80.6, "elapsed_time": "8:02:38", "remaining_time": "1:56:10"} {"current_steps": 4040, "total_steps": 5000, "loss": 0.3482, "lr": 2.1978789106331666e-06, "epoch": 8.08, "percentage": 80.8, "elapsed_time": "8:03:50", "remaining_time": "1:54:58"} {"current_steps": 4050, "total_steps": 5000, "loss": 0.3195, "lr": 2.154400209686268e-06, "epoch": 8.1, "percentage": 81.0, "elapsed_time": "8:05:02", "remaining_time": "1:53:46"} {"current_steps": 4060, "total_steps": 5000, "loss": 0.3557, "lr": 2.1113038922046603e-06, "epoch": 8.12, "percentage": 81.2, "elapsed_time": "8:06:13", "remaining_time": "1:52:34"} {"current_steps": 4070, "total_steps": 5000, "loss": 0.2853, "lr": 2.0685920586420562e-06, "epoch": 8.14, "percentage": 81.4, "elapsed_time": "8:07:24", "remaining_time": "1:51:22"} {"current_steps": 4080, "total_steps": 5000, "loss": 0.316, "lr": 2.026266790712965e-06, "epoch": 8.16, "percentage": 81.6, "elapsed_time": "8:08:35", "remaining_time": "1:50:10"} {"current_steps": 4090, "total_steps": 5000, "loss": 0.3328, "lr": 1.984330151291233e-06, "epoch": 8.18, "percentage": 81.8, "elapsed_time": "8:09:47", "remaining_time": "1:48:58"} {"current_steps": 4100, "total_steps": 5000, "loss": 0.3338, "lr": 1.9427841843095063e-06, "epoch": 8.2, "percentage": 82.0, "elapsed_time": "8:10:59", "remaining_time": "1:47:46"} {"current_steps": 4110, "total_steps": 5000, "loss": 0.3226, "lr": 1.9016309146596024e-06, "epoch": 8.22, "percentage": 82.2, "elapsed_time": "8:12:12", "remaining_time": "1:46:35"} {"current_steps": 4120, "total_steps": 5000, "loss": 0.3147, "lr": 1.8608723480938207e-06, "epoch": 8.24, "percentage": 82.4, "elapsed_time": "8:13:23", "remaining_time": "1:45:23"} {"current_steps": 4130, "total_steps": 5000, "loss": 0.3549, "lr": 1.820510471127196e-06, "epoch": 8.26, "percentage": 82.6, "elapsed_time": "8:14:35", "remaining_time": "1:44:11"} {"current_steps": 4140, "total_steps": 5000, "loss": 0.3701, "lr": 1.7805472509406695e-06, "epoch": 8.28, "percentage": 82.8, "elapsed_time": "8:15:47", "remaining_time": "1:42:59"} {"current_steps": 4150, "total_steps": 5000, "loss": 0.341, "lr": 1.7409846352852144e-06, "epoch": 8.3, "percentage": 83.0, "elapsed_time": "8:16:59", "remaining_time": "1:41:47"} {"current_steps": 4160, "total_steps": 5000, "loss": 0.2754, "lr": 1.7018245523869038e-06, "epoch": 8.32, "percentage": 83.2, "elapsed_time": "8:18:11", "remaining_time": "1:40:35"} {"current_steps": 4170, "total_steps": 5000, "loss": 0.3958, "lr": 1.6630689108529286e-06, "epoch": 8.34, "percentage": 83.4, "elapsed_time": "8:19:23", "remaining_time": "1:39:23"} {"current_steps": 4180, "total_steps": 5000, "loss": 0.3512, "lr": 1.6247195995785836e-06, "epoch": 8.36, "percentage": 83.6, "elapsed_time": "8:20:35", "remaining_time": "1:38:12"} {"current_steps": 4190, "total_steps": 5000, "loss": 0.3533, "lr": 1.5867784876551973e-06, "epoch": 8.38, "percentage": 83.8, "elapsed_time": "8:21:46", "remaining_time": "1:37:00"} {"current_steps": 4200, "total_steps": 5000, "loss": 0.3746, "lr": 1.5492474242790368e-06, "epoch": 8.4, "percentage": 84.0, "elapsed_time": "8:22:59", "remaining_time": "1:35:48"} {"current_steps": 4210, "total_steps": 5000, "loss": 0.3274, "lr": 1.5121282386611823e-06, "epoch": 8.42, "percentage": 84.2, "elapsed_time": "8:24:12", "remaining_time": "1:34:36"} {"current_steps": 4220, "total_steps": 5000, "loss": 0.3055, "lr": 1.4754227399383758e-06, "epoch": 8.44, "percentage": 84.4, "elapsed_time": "8:25:23", "remaining_time": "1:33:24"} {"current_steps": 4230, "total_steps": 5000, "loss": 0.3078, "lr": 1.439132717084839e-06, "epoch": 8.46, "percentage": 84.6, "elapsed_time": "8:26:35", "remaining_time": "1:32:13"} {"current_steps": 4240, "total_steps": 5000, "loss": 0.3194, "lr": 1.40325993882509e-06, "epoch": 8.48, "percentage": 84.8, "elapsed_time": "8:27:47", "remaining_time": "1:31:01"} {"current_steps": 4250, "total_steps": 5000, "loss": 0.352, "lr": 1.3678061535477305e-06, "epoch": 8.5, "percentage": 85.0, "elapsed_time": "8:28:59", "remaining_time": "1:29:49"} {"current_steps": 4260, "total_steps": 5000, "loss": 0.3061, "lr": 1.3327730892202384e-06, "epoch": 8.52, "percentage": 85.2, "elapsed_time": "8:30:11", "remaining_time": "1:28:37"} {"current_steps": 4270, "total_steps": 5000, "loss": 0.406, "lr": 1.2981624533047432e-06, "epoch": 8.54, "percentage": 85.4, "elapsed_time": "8:31:24", "remaining_time": "1:27:25"} {"current_steps": 4280, "total_steps": 5000, "loss": 0.3335, "lr": 1.2639759326748136e-06, "epoch": 8.56, "percentage": 85.6, "elapsed_time": "8:32:35", "remaining_time": "1:26:13"} {"current_steps": 4290, "total_steps": 5000, "loss": 0.4048, "lr": 1.230215193533233e-06, "epoch": 8.58, "percentage": 85.8, "elapsed_time": "8:33:47", "remaining_time": "1:25:02"} {"current_steps": 4300, "total_steps": 5000, "loss": 0.3388, "lr": 1.196881881330798e-06, "epoch": 8.6, "percentage": 86.0, "elapsed_time": "8:34:59", "remaining_time": "1:23:50"} {"current_steps": 4310, "total_steps": 5000, "loss": 0.358, "lr": 1.1639776206861197e-06, "epoch": 8.62, "percentage": 86.2, "elapsed_time": "8:36:11", "remaining_time": "1:22:38"} {"current_steps": 4320, "total_steps": 5000, "loss": 0.3628, "lr": 1.1315040153064416e-06, "epoch": 8.64, "percentage": 86.4, "elapsed_time": "8:37:23", "remaining_time": "1:21:26"} {"current_steps": 4330, "total_steps": 5000, "loss": 0.3585, "lr": 1.0994626479094749e-06, "epoch": 8.66, "percentage": 86.6, "elapsed_time": "8:38:35", "remaining_time": "1:20:14"} {"current_steps": 4340, "total_steps": 5000, "loss": 0.3583, "lr": 1.0678550801462662e-06, "epoch": 8.68, "percentage": 86.8, "elapsed_time": "8:39:47", "remaining_time": "1:19:02"} {"current_steps": 4350, "total_steps": 5000, "loss": 0.2861, "lr": 1.0366828525250728e-06, "epoch": 8.7, "percentage": 87.0, "elapsed_time": "8:40:58", "remaining_time": "1:17:50"} {"current_steps": 4360, "total_steps": 5000, "loss": 0.3422, "lr": 1.0059474843362893e-06, "epoch": 8.72, "percentage": 87.2, "elapsed_time": "8:42:10", "remaining_time": "1:16:38"} {"current_steps": 4370, "total_steps": 5000, "loss": 0.3337, "lr": 9.756504735784067e-07, "epoch": 8.74, "percentage": 87.4, "elapsed_time": "8:43:21", "remaining_time": "1:15:26"} {"current_steps": 4380, "total_steps": 5000, "loss": 0.3163, "lr": 9.457932968849826e-07, "epoch": 8.76, "percentage": 87.6, "elapsed_time": "8:44:33", "remaining_time": "1:14:15"} {"current_steps": 4390, "total_steps": 5000, "loss": 0.3132, "lr": 9.16377409452689e-07, "epoch": 8.78, "percentage": 87.8, "elapsed_time": "8:45:45", "remaining_time": "1:13:03"} {"current_steps": 4400, "total_steps": 5000, "loss": 0.3108, "lr": 8.874042449703779e-07, "epoch": 8.8, "percentage": 88.0, "elapsed_time": "8:46:56", "remaining_time": "1:11:51"} {"current_steps": 4410, "total_steps": 5000, "loss": 0.3444, "lr": 8.58875215549212e-07, "epoch": 8.82, "percentage": 88.2, "elapsed_time": "8:48:10", "remaining_time": "1:10:39"} {"current_steps": 4420, "total_steps": 5000, "loss": 0.3582, "lr": 8.307917116538378e-07, "epoch": 8.84, "percentage": 88.4, "elapsed_time": "8:49:22", "remaining_time": "1:09:27"} {"current_steps": 4430, "total_steps": 5000, "loss": 0.3014, "lr": 8.031551020346129e-07, "epoch": 8.86, "percentage": 88.6, "elapsed_time": "8:50:33", "remaining_time": "1:08:16"} {"current_steps": 4440, "total_steps": 5000, "loss": 0.3578, "lr": 7.759667336609011e-07, "epoch": 8.88, "percentage": 88.8, "elapsed_time": "8:51:45", "remaining_time": "1:07:04"} {"current_steps": 4450, "total_steps": 5000, "loss": 0.3253, "lr": 7.492279316554207e-07, "epoch": 8.9, "percentage": 89.0, "elapsed_time": "8:52:57", "remaining_time": "1:05:52"} {"current_steps": 4460, "total_steps": 5000, "loss": 0.3839, "lr": 7.22939999229657e-07, "epoch": 8.92, "percentage": 89.2, "elapsed_time": "8:54:08", "remaining_time": "1:04:40"} {"current_steps": 4470, "total_steps": 5000, "loss": 0.268, "lr": 6.971042176203535e-07, "epoch": 8.94, "percentage": 89.4, "elapsed_time": "8:55:20", "remaining_time": "1:03:28"} {"current_steps": 4480, "total_steps": 5000, "loss": 0.332, "lr": 6.717218460270536e-07, "epoch": 8.96, "percentage": 89.6, "elapsed_time": "8:56:31", "remaining_time": "1:02:16"} {"current_steps": 4490, "total_steps": 5000, "loss": 0.361, "lr": 6.467941215507434e-07, "epoch": 8.98, "percentage": 89.8, "elapsed_time": "8:57:43", "remaining_time": "1:01:04"} {"current_steps": 4500, "total_steps": 5000, "loss": 0.3358, "lr": 6.223222591335409e-07, "epoch": 9.0, "percentage": 90.0, "elapsed_time": "8:58:54", "remaining_time": "0:59:52"} {"current_steps": 4510, "total_steps": 5000, "loss": 0.2874, "lr": 5.98307451499498e-07, "epoch": 9.02, "percentage": 90.2, "elapsed_time": "9:00:07", "remaining_time": "0:58:40"} {"current_steps": 4520, "total_steps": 5000, "loss": 0.361, "lr": 5.747508690964599e-07, "epoch": 9.04, "percentage": 90.4, "elapsed_time": "9:01:18", "remaining_time": "0:57:29"} {"current_steps": 4530, "total_steps": 5000, "loss": 0.2929, "lr": 5.516536600390188e-07, "epoch": 9.06, "percentage": 90.6, "elapsed_time": "9:02:30", "remaining_time": "0:56:17"} {"current_steps": 4540, "total_steps": 5000, "loss": 0.2854, "lr": 5.290169500525577e-07, "epoch": 9.08, "percentage": 90.8, "elapsed_time": "9:03:41", "remaining_time": "0:55:05"} {"current_steps": 4550, "total_steps": 5000, "loss": 0.3173, "lr": 5.068418424183874e-07, "epoch": 9.1, "percentage": 91.0, "elapsed_time": "9:04:52", "remaining_time": "0:53:53"} {"current_steps": 4560, "total_steps": 5000, "loss": 0.3683, "lr": 4.851294179199673e-07, "epoch": 9.12, "percentage": 91.2, "elapsed_time": "9:06:03", "remaining_time": "0:52:41"} {"current_steps": 4570, "total_steps": 5000, "loss": 0.3256, "lr": 4.638807347902408e-07, "epoch": 9.14, "percentage": 91.4, "elapsed_time": "9:07:15", "remaining_time": "0:51:29"} {"current_steps": 4580, "total_steps": 5000, "loss": 0.319, "lr": 4.4309682866004124e-07, "epoch": 9.16, "percentage": 91.6, "elapsed_time": "9:08:26", "remaining_time": "0:50:17"} {"current_steps": 4590, "total_steps": 5000, "loss": 0.3221, "lr": 4.2277871250763327e-07, "epoch": 9.18, "percentage": 91.8, "elapsed_time": "9:09:37", "remaining_time": "0:49:05"} {"current_steps": 4600, "total_steps": 5000, "loss": 0.2951, "lr": 4.0292737660933335e-07, "epoch": 9.2, "percentage": 92.0, "elapsed_time": "9:10:49", "remaining_time": "0:47:53"} {"current_steps": 4610, "total_steps": 5000, "loss": 0.3738, "lr": 3.835437884912474e-07, "epoch": 9.22, "percentage": 92.2, "elapsed_time": "9:12:03", "remaining_time": "0:46:42"} {"current_steps": 4620, "total_steps": 5000, "loss": 0.2898, "lr": 3.646288928821151e-07, "epoch": 9.24, "percentage": 92.4, "elapsed_time": "9:13:15", "remaining_time": "0:45:30"} {"current_steps": 4630, "total_steps": 5000, "loss": 0.3792, "lr": 3.4618361166726123e-07, "epoch": 9.26, "percentage": 92.6, "elapsed_time": "9:14:26", "remaining_time": "0:44:18"} {"current_steps": 4640, "total_steps": 5000, "loss": 0.3424, "lr": 3.282088438436715e-07, "epoch": 9.28, "percentage": 92.8, "elapsed_time": "9:15:38", "remaining_time": "0:43:06"} {"current_steps": 4650, "total_steps": 5000, "loss": 0.358, "lr": 3.10705465476171e-07, "epoch": 9.3, "percentage": 93.0, "elapsed_time": "9:16:51", "remaining_time": "0:41:54"} {"current_steps": 4660, "total_steps": 5000, "loss": 0.32, "lr": 2.936743296547273e-07, "epoch": 9.32, "percentage": 93.2, "elapsed_time": "9:18:03", "remaining_time": "0:40:43"} {"current_steps": 4670, "total_steps": 5000, "loss": 0.3079, "lr": 2.771162664528726e-07, "epoch": 9.34, "percentage": 93.4, "elapsed_time": "9:19:14", "remaining_time": "0:39:31"} {"current_steps": 4680, "total_steps": 5000, "loss": 0.2834, "lr": 2.6103208288724815e-07, "epoch": 9.36, "percentage": 93.6, "elapsed_time": "9:20:26", "remaining_time": "0:38:19"} {"current_steps": 4690, "total_steps": 5000, "loss": 0.354, "lr": 2.4542256287826915e-07, "epoch": 9.38, "percentage": 93.8, "elapsed_time": "9:21:39", "remaining_time": "0:37:07"} {"current_steps": 4700, "total_steps": 5000, "loss": 0.3243, "lr": 2.3028846721191878e-07, "epoch": 9.4, "percentage": 94.0, "elapsed_time": "9:22:50", "remaining_time": "0:35:55"} {"current_steps": 4710, "total_steps": 5000, "loss": 0.3121, "lr": 2.1563053350266983e-07, "epoch": 9.42, "percentage": 94.2, "elapsed_time": "9:24:04", "remaining_time": "0:34:43"} {"current_steps": 4720, "total_steps": 5000, "loss": 0.3142, "lr": 2.014494761575314e-07, "epoch": 9.44, "percentage": 94.4, "elapsed_time": "9:25:15", "remaining_time": "0:33:31"} {"current_steps": 4730, "total_steps": 5000, "loss": 0.3287, "lr": 1.877459863412323e-07, "epoch": 9.46, "percentage": 94.6, "elapsed_time": "9:26:27", "remaining_time": "0:32:20"} {"current_steps": 4740, "total_steps": 5000, "loss": 0.2989, "lr": 1.7452073194253237e-07, "epoch": 9.48, "percentage": 94.8, "elapsed_time": "9:27:38", "remaining_time": "0:31:08"} {"current_steps": 4750, "total_steps": 5000, "loss": 0.3632, "lr": 1.6177435754167413e-07, "epoch": 9.5, "percentage": 95.0, "elapsed_time": "9:28:49", "remaining_time": "0:29:56"} {"current_steps": 4760, "total_steps": 5000, "loss": 0.265, "lr": 1.4950748437896235e-07, "epoch": 9.52, "percentage": 95.2, "elapsed_time": "9:30:01", "remaining_time": "0:28:44"} {"current_steps": 4770, "total_steps": 5000, "loss": 0.283, "lr": 1.377207103244904e-07, "epoch": 9.54, "percentage": 95.4, "elapsed_time": "9:31:12", "remaining_time": "0:27:32"} {"current_steps": 4780, "total_steps": 5000, "loss": 0.2264, "lr": 1.26414609848996e-07, "epoch": 9.56, "percentage": 95.6, "elapsed_time": "9:32:23", "remaining_time": "0:26:20"} {"current_steps": 4790, "total_steps": 5000, "loss": 0.3198, "lr": 1.1558973399586671e-07, "epoch": 9.58, "percentage": 95.8, "elapsed_time": "9:33:35", "remaining_time": "0:25:08"} {"current_steps": 4800, "total_steps": 5000, "loss": 0.2258, "lr": 1.052466103542793e-07, "epoch": 9.6, "percentage": 96.0, "elapsed_time": "9:34:45", "remaining_time": "0:23:56"} {"current_steps": 4810, "total_steps": 5000, "loss": 0.3053, "lr": 9.538574303348813e-08, "epoch": 9.62, "percentage": 96.2, "elapsed_time": "9:35:59", "remaining_time": "0:22:45"} {"current_steps": 4820, "total_steps": 5000, "loss": 0.278, "lr": 8.600761263825475e-08, "epoch": 9.64, "percentage": 96.4, "elapsed_time": "9:37:10", "remaining_time": "0:21:33"} {"current_steps": 4830, "total_steps": 5000, "loss": 0.3211, "lr": 7.71126762454233e-08, "epoch": 9.66, "percentage": 96.6, "elapsed_time": "9:38:21", "remaining_time": "0:20:21"} {"current_steps": 4840, "total_steps": 5000, "loss": 0.3079, "lr": 6.870136738164612e-08, "epoch": 9.68, "percentage": 96.8, "elapsed_time": "9:39:33", "remaining_time": "0:19:09"} {"current_steps": 4850, "total_steps": 5000, "loss": 0.3717, "lr": 6.07740960022507e-08, "epoch": 9.7, "percentage": 97.0, "elapsed_time": "9:40:45", "remaining_time": "0:17:57"} {"current_steps": 4860, "total_steps": 5000, "loss": 0.3052, "lr": 5.3331248471258926e-08, "epoch": 9.72, "percentage": 97.2, "elapsed_time": "9:41:57", "remaining_time": "0:16:45"} {"current_steps": 4870, "total_steps": 5000, "loss": 0.3018, "lr": 4.6373187542561036e-08, "epoch": 9.74, "percentage": 97.4, "elapsed_time": "9:43:08", "remaining_time": "0:15:33"} {"current_steps": 4880, "total_steps": 5000, "loss": 0.2694, "lr": 3.990025234222872e-08, "epoch": 9.76, "percentage": 97.6, "elapsed_time": "9:44:19", "remaining_time": "0:14:22"} {"current_steps": 4890, "total_steps": 5000, "loss": 0.323, "lr": 3.391275835199159e-08, "epoch": 9.78, "percentage": 97.8, "elapsed_time": "9:45:31", "remaining_time": "0:13:10"} {"current_steps": 4900, "total_steps": 5000, "loss": 0.302, "lr": 2.8410997393860663e-08, "epoch": 9.8, "percentage": 98.0, "elapsed_time": "9:46:42", "remaining_time": "0:11:58"} {"current_steps": 4910, "total_steps": 5000, "loss": 0.3561, "lr": 2.339523761590301e-08, "epoch": 9.82, "percentage": 98.2, "elapsed_time": "9:47:56", "remaining_time": "0:10:46"} {"current_steps": 4920, "total_steps": 5000, "loss": 0.3486, "lr": 1.886572347917337e-08, "epoch": 9.84, "percentage": 98.4, "elapsed_time": "9:49:07", "remaining_time": "0:09:34"} {"current_steps": 4930, "total_steps": 5000, "loss": 0.3651, "lr": 1.482267574580143e-08, "epoch": 9.86, "percentage": 98.6, "elapsed_time": "9:50:19", "remaining_time": "0:08:22"} {"current_steps": 4940, "total_steps": 5000, "loss": 0.2544, "lr": 1.126629146822933e-08, "epoch": 9.88, "percentage": 98.8, "elapsed_time": "9:51:30", "remaining_time": "0:07:11"} {"current_steps": 4950, "total_steps": 5000, "loss": 0.2575, "lr": 8.196743979610455e-09, "epoch": 9.9, "percentage": 99.0, "elapsed_time": "9:52:42", "remaining_time": "0:05:59"} {"current_steps": 4960, "total_steps": 5000, "loss": 0.2833, "lr": 5.614182885357311e-09, "epoch": 9.92, "percentage": 99.2, "elapsed_time": "9:53:53", "remaining_time": "0:04:47"} {"current_steps": 4970, "total_steps": 5000, "loss": 0.3345, "lr": 3.518734055855122e-09, "epoch": 9.94, "percentage": 99.4, "elapsed_time": "9:55:05", "remaining_time": "0:03:35"} {"current_steps": 4980, "total_steps": 5000, "loss": 0.3034, "lr": 1.910499620322304e-09, "epoch": 9.96, "percentage": 99.6, "elapsed_time": "9:56:16", "remaining_time": "0:02:23"} {"current_steps": 4990, "total_steps": 5000, "loss": 0.2543, "lr": 7.895579618388827e-10, "epoch": 9.98, "percentage": 99.8, "elapsed_time": "9:57:27", "remaining_time": "0:01:11"} {"current_steps": 5000, "total_steps": 5000, "loss": 0.3149, "lr": 1.559637135173375e-10, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "9:58:39", "remaining_time": "0:00:00"} {"current_steps": 5000, "total_steps": 5000, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "9:58:40", "remaining_time": "0:00:00"}