| {"current_steps": 10, "total_steps": 8436, "loss": 2.2225, "learning_rate": 1.1848341232227489e-07, "epoch": 0.0035555555555555557, "percentage": 0.12, "elapsed_time": "0:00:45", "remaining_time": "10:41:26"} | |
| {"current_steps": 20, "total_steps": 8436, "loss": 2.0266, "learning_rate": 2.3696682464454978e-07, "epoch": 0.0071111111111111115, "percentage": 0.24, "elapsed_time": "0:01:22", "remaining_time": "9:38:45"} | |
| {"current_steps": 30, "total_steps": 8436, "loss": 1.7378, "learning_rate": 3.5545023696682467e-07, "epoch": 0.010666666666666666, "percentage": 0.36, "elapsed_time": "0:01:58", "remaining_time": "9:13:39"} | |
| {"current_steps": 40, "total_steps": 8436, "loss": 1.4898, "learning_rate": 4.7393364928909956e-07, "epoch": 0.014222222222222223, "percentage": 0.47, "elapsed_time": "0:02:32", "remaining_time": "8:53:01"} | |
| {"current_steps": 50, "total_steps": 8436, "loss": 1.1851, "learning_rate": 5.924170616113745e-07, "epoch": 0.017777777777777778, "percentage": 0.59, "elapsed_time": "0:03:08", "remaining_time": "8:48:10"} | |
| {"current_steps": 60, "total_steps": 8436, "loss": 0.988, "learning_rate": 7.109004739336493e-07, "epoch": 0.021333333333333333, "percentage": 0.71, "elapsed_time": "0:03:45", "remaining_time": "8:45:33"} | |
| {"current_steps": 70, "total_steps": 8436, "loss": 0.862, "learning_rate": 8.293838862559242e-07, "epoch": 0.024888888888888887, "percentage": 0.83, "elapsed_time": "0:04:22", "remaining_time": "8:42:25"} | |
| {"current_steps": 80, "total_steps": 8436, "loss": 0.7813, "learning_rate": 9.478672985781991e-07, "epoch": 0.028444444444444446, "percentage": 0.95, "elapsed_time": "0:04:56", "remaining_time": "8:35:38"} | |
| {"current_steps": 90, "total_steps": 8436, "loss": 0.6638, "learning_rate": 1.0663507109004742e-06, "epoch": 0.032, "percentage": 1.07, "elapsed_time": "0:05:32", "remaining_time": "8:34:06"} | |
| {"current_steps": 100, "total_steps": 8436, "loss": 0.6073, "learning_rate": 1.184834123222749e-06, "epoch": 0.035555555555555556, "percentage": 1.19, "elapsed_time": "0:06:09", "remaining_time": "8:32:46"} | |
| {"current_steps": 110, "total_steps": 8436, "loss": 0.5392, "learning_rate": 1.303317535545024e-06, "epoch": 0.03911111111111111, "percentage": 1.3, "elapsed_time": "0:06:46", "remaining_time": "8:33:02"} | |
| {"current_steps": 120, "total_steps": 8436, "loss": 0.5798, "learning_rate": 1.4218009478672987e-06, "epoch": 0.042666666666666665, "percentage": 1.42, "elapsed_time": "0:07:25", "remaining_time": "8:34:21"} | |
| {"current_steps": 130, "total_steps": 8436, "loss": 0.5119, "learning_rate": 1.5402843601895737e-06, "epoch": 0.04622222222222222, "percentage": 1.54, "elapsed_time": "0:08:03", "remaining_time": "8:35:13"} | |
| {"current_steps": 140, "total_steps": 8436, "loss": 0.4432, "learning_rate": 1.6587677725118483e-06, "epoch": 0.049777777777777775, "percentage": 1.66, "elapsed_time": "0:08:38", "remaining_time": "8:31:42"} | |
| {"current_steps": 150, "total_steps": 8436, "loss": 0.4637, "learning_rate": 1.7772511848341234e-06, "epoch": 0.05333333333333334, "percentage": 1.78, "elapsed_time": "0:09:14", "remaining_time": "8:30:34"} | |
| {"current_steps": 160, "total_steps": 8436, "loss": 0.4623, "learning_rate": 1.8957345971563982e-06, "epoch": 0.05688888888888889, "percentage": 1.9, "elapsed_time": "0:09:51", "remaining_time": "8:29:53"} | |
| {"current_steps": 170, "total_steps": 8436, "loss": 0.4909, "learning_rate": 2.0142180094786733e-06, "epoch": 0.060444444444444446, "percentage": 2.02, "elapsed_time": "0:10:26", "remaining_time": "8:27:23"} | |
| {"current_steps": 180, "total_steps": 8436, "loss": 0.4522, "learning_rate": 2.1327014218009483e-06, "epoch": 0.064, "percentage": 2.13, "elapsed_time": "0:11:02", "remaining_time": "8:26:16"} | |
| {"current_steps": 190, "total_steps": 8436, "loss": 0.4683, "learning_rate": 2.251184834123223e-06, "epoch": 0.06755555555555555, "percentage": 2.25, "elapsed_time": "0:11:38", "remaining_time": "8:25:00"} | |
| {"current_steps": 200, "total_steps": 8436, "loss": 0.4544, "learning_rate": 2.369668246445498e-06, "epoch": 0.07111111111111111, "percentage": 2.37, "elapsed_time": "0:12:15", "remaining_time": "8:25:01"} | |
| {"current_steps": 210, "total_steps": 8436, "loss": 0.452, "learning_rate": 2.4881516587677726e-06, "epoch": 0.07466666666666667, "percentage": 2.49, "elapsed_time": "0:12:49", "remaining_time": "8:22:40"} | |
| {"current_steps": 220, "total_steps": 8436, "loss": 0.4594, "learning_rate": 2.606635071090048e-06, "epoch": 0.07822222222222222, "percentage": 2.61, "elapsed_time": "0:13:27", "remaining_time": "8:22:30"} | |
| {"current_steps": 230, "total_steps": 8436, "loss": 0.4079, "learning_rate": 2.7251184834123223e-06, "epoch": 0.08177777777777778, "percentage": 2.73, "elapsed_time": "0:14:02", "remaining_time": "8:20:59"} | |
| {"current_steps": 240, "total_steps": 8436, "loss": 0.4586, "learning_rate": 2.8436018957345973e-06, "epoch": 0.08533333333333333, "percentage": 2.84, "elapsed_time": "0:14:38", "remaining_time": "8:19:46"} | |
| {"current_steps": 250, "total_steps": 8436, "loss": 0.4143, "learning_rate": 2.9620853080568724e-06, "epoch": 0.08888888888888889, "percentage": 2.96, "elapsed_time": "0:15:13", "remaining_time": "8:18:19"} | |
| {"current_steps": 260, "total_steps": 8436, "loss": 0.454, "learning_rate": 3.0805687203791474e-06, "epoch": 0.09244444444444444, "percentage": 3.08, "elapsed_time": "0:15:50", "remaining_time": "8:17:55"} | |
| {"current_steps": 270, "total_steps": 8436, "loss": 0.3998, "learning_rate": 3.1990521327014216e-06, "epoch": 0.096, "percentage": 3.2, "elapsed_time": "0:16:26", "remaining_time": "8:17:02"} | |
| {"current_steps": 280, "total_steps": 8436, "loss": 0.397, "learning_rate": 3.3175355450236967e-06, "epoch": 0.09955555555555555, "percentage": 3.32, "elapsed_time": "0:17:02", "remaining_time": "8:16:15"} | |
| {"current_steps": 290, "total_steps": 8436, "loss": 0.416, "learning_rate": 3.4360189573459717e-06, "epoch": 0.10311111111111111, "percentage": 3.44, "elapsed_time": "0:17:37", "remaining_time": "8:14:57"} | |
| {"current_steps": 300, "total_steps": 8436, "loss": 0.4521, "learning_rate": 3.5545023696682468e-06, "epoch": 0.10666666666666667, "percentage": 3.56, "elapsed_time": "0:18:13", "remaining_time": "8:14:19"} | |
| {"current_steps": 310, "total_steps": 8436, "loss": 0.4023, "learning_rate": 3.672985781990522e-06, "epoch": 0.11022222222222222, "percentage": 3.67, "elapsed_time": "0:18:49", "remaining_time": "8:13:16"} | |
| {"current_steps": 320, "total_steps": 8436, "loss": 0.4191, "learning_rate": 3.7914691943127964e-06, "epoch": 0.11377777777777778, "percentage": 3.79, "elapsed_time": "0:19:26", "remaining_time": "8:13:12"} | |
| {"current_steps": 330, "total_steps": 8436, "loss": 0.4122, "learning_rate": 3.9099526066350715e-06, "epoch": 0.11733333333333333, "percentage": 3.91, "elapsed_time": "0:20:01", "remaining_time": "8:11:59"} | |
| {"current_steps": 340, "total_steps": 8436, "loss": 0.3498, "learning_rate": 4.0284360189573465e-06, "epoch": 0.12088888888888889, "percentage": 4.03, "elapsed_time": "0:20:40", "remaining_time": "8:12:17"} | |
| {"current_steps": 350, "total_steps": 8436, "loss": 0.4094, "learning_rate": 4.146919431279622e-06, "epoch": 0.12444444444444444, "percentage": 4.15, "elapsed_time": "0:21:18", "remaining_time": "8:12:06"} | |
| {"current_steps": 360, "total_steps": 8436, "loss": 0.4298, "learning_rate": 4.265402843601897e-06, "epoch": 0.128, "percentage": 4.27, "elapsed_time": "0:21:54", "remaining_time": "8:11:19"} | |
| {"current_steps": 370, "total_steps": 8436, "loss": 0.4216, "learning_rate": 4.383886255924171e-06, "epoch": 0.13155555555555556, "percentage": 4.39, "elapsed_time": "0:22:30", "remaining_time": "8:10:40"} | |
| {"current_steps": 380, "total_steps": 8436, "loss": 0.3808, "learning_rate": 4.502369668246446e-06, "epoch": 0.1351111111111111, "percentage": 4.5, "elapsed_time": "0:23:08", "remaining_time": "8:10:28"} | |
| {"current_steps": 390, "total_steps": 8436, "loss": 0.3618, "learning_rate": 4.620853080568721e-06, "epoch": 0.13866666666666666, "percentage": 4.62, "elapsed_time": "0:23:44", "remaining_time": "8:09:43"} | |
| {"current_steps": 400, "total_steps": 8436, "loss": 0.4044, "learning_rate": 4.739336492890996e-06, "epoch": 0.14222222222222222, "percentage": 4.74, "elapsed_time": "0:24:19", "remaining_time": "8:08:35"} | |
| {"current_steps": 410, "total_steps": 8436, "loss": 0.4071, "learning_rate": 4.857819905213271e-06, "epoch": 0.14577777777777778, "percentage": 4.86, "elapsed_time": "0:24:54", "remaining_time": "8:07:37"} | |
| {"current_steps": 420, "total_steps": 8436, "loss": 0.4272, "learning_rate": 4.976303317535545e-06, "epoch": 0.14933333333333335, "percentage": 4.98, "elapsed_time": "0:25:29", "remaining_time": "8:06:34"} | |
| {"current_steps": 430, "total_steps": 8436, "loss": 0.434, "learning_rate": 5.09478672985782e-06, "epoch": 0.15288888888888888, "percentage": 5.1, "elapsed_time": "0:26:04", "remaining_time": "8:05:20"} | |
| {"current_steps": 440, "total_steps": 8436, "loss": 0.3695, "learning_rate": 5.213270142180096e-06, "epoch": 0.15644444444444444, "percentage": 5.22, "elapsed_time": "0:26:39", "remaining_time": "8:04:21"} | |
| {"current_steps": 450, "total_steps": 8436, "loss": 0.3723, "learning_rate": 5.33175355450237e-06, "epoch": 0.16, "percentage": 5.33, "elapsed_time": "0:27:12", "remaining_time": "8:02:57"} | |
| {"current_steps": 460, "total_steps": 8436, "loss": 0.4147, "learning_rate": 5.4502369668246446e-06, "epoch": 0.16355555555555557, "percentage": 5.45, "elapsed_time": "0:27:48", "remaining_time": "8:02:03"} | |
| {"current_steps": 470, "total_steps": 8436, "loss": 0.4083, "learning_rate": 5.5687203791469205e-06, "epoch": 0.1671111111111111, "percentage": 5.57, "elapsed_time": "0:28:25", "remaining_time": "8:01:47"} | |
| {"current_steps": 480, "total_steps": 8436, "loss": 0.3631, "learning_rate": 5.687203791469195e-06, "epoch": 0.17066666666666666, "percentage": 5.69, "elapsed_time": "0:29:02", "remaining_time": "8:01:14"} | |
| {"current_steps": 490, "total_steps": 8436, "loss": 0.3838, "learning_rate": 5.8056872037914706e-06, "epoch": 0.17422222222222222, "percentage": 5.81, "elapsed_time": "0:29:38", "remaining_time": "8:00:39"} | |
| {"current_steps": 500, "total_steps": 8436, "loss": 0.3703, "learning_rate": 5.924170616113745e-06, "epoch": 0.17777777777777778, "percentage": 5.93, "elapsed_time": "0:30:16", "remaining_time": "8:00:32"} | |
| {"current_steps": 500, "total_steps": 8436, "eval_loss": 0.27164188027381897, "epoch": 0.17777777777777778, "percentage": 5.93, "elapsed_time": "0:39:38", "remaining_time": "10:29:07"} | |
| {"current_steps": 510, "total_steps": 8436, "loss": 0.3936, "learning_rate": 6.042654028436019e-06, "epoch": 0.18133333333333335, "percentage": 6.05, "elapsed_time": "0:40:15", "remaining_time": "10:25:40"} | |
| {"current_steps": 520, "total_steps": 8436, "loss": 0.4097, "learning_rate": 6.161137440758295e-06, "epoch": 0.18488888888888888, "percentage": 6.16, "elapsed_time": "0:40:53", "remaining_time": "10:22:22"} | |
| {"current_steps": 530, "total_steps": 8436, "loss": 0.3487, "learning_rate": 6.279620853080569e-06, "epoch": 0.18844444444444444, "percentage": 6.28, "elapsed_time": "0:41:31", "remaining_time": "10:19:28"} | |
| {"current_steps": 540, "total_steps": 8436, "loss": 0.3795, "learning_rate": 6.398104265402843e-06, "epoch": 0.192, "percentage": 6.4, "elapsed_time": "0:42:07", "remaining_time": "10:15:57"} | |
| {"current_steps": 550, "total_steps": 8436, "loss": 0.3592, "learning_rate": 6.516587677725119e-06, "epoch": 0.19555555555555557, "percentage": 6.52, "elapsed_time": "0:42:45", "remaining_time": "10:12:59"} | |
| {"current_steps": 560, "total_steps": 8436, "loss": 0.3759, "learning_rate": 6.635071090047393e-06, "epoch": 0.1991111111111111, "percentage": 6.64, "elapsed_time": "0:43:23", "remaining_time": "10:10:18"} | |
| {"current_steps": 570, "total_steps": 8436, "loss": 0.3372, "learning_rate": 6.753554502369669e-06, "epoch": 0.20266666666666666, "percentage": 6.76, "elapsed_time": "0:43:58", "remaining_time": "10:06:56"} | |
| {"current_steps": 580, "total_steps": 8436, "loss": 0.3821, "learning_rate": 6.8720379146919435e-06, "epoch": 0.20622222222222222, "percentage": 6.88, "elapsed_time": "0:44:36", "remaining_time": "10:04:11"} | |
| {"current_steps": 590, "total_steps": 8436, "loss": 0.4033, "learning_rate": 6.990521327014218e-06, "epoch": 0.20977777777777779, "percentage": 6.99, "elapsed_time": "0:45:14", "remaining_time": "10:01:31"} | |
| {"current_steps": 600, "total_steps": 8436, "loss": 0.3498, "learning_rate": 7.1090047393364935e-06, "epoch": 0.21333333333333335, "percentage": 7.11, "elapsed_time": "0:45:50", "remaining_time": "9:58:36"} | |
| {"current_steps": 610, "total_steps": 8436, "loss": 0.3974, "learning_rate": 7.227488151658768e-06, "epoch": 0.21688888888888888, "percentage": 7.23, "elapsed_time": "0:46:26", "remaining_time": "9:55:45"} | |
| {"current_steps": 620, "total_steps": 8436, "loss": 0.3522, "learning_rate": 7.345971563981044e-06, "epoch": 0.22044444444444444, "percentage": 7.35, "elapsed_time": "0:47:02", "remaining_time": "9:53:01"} | |
| {"current_steps": 630, "total_steps": 8436, "loss": 0.3843, "learning_rate": 7.464454976303318e-06, "epoch": 0.224, "percentage": 7.47, "elapsed_time": "0:47:39", "remaining_time": "9:50:27"} | |
| {"current_steps": 640, "total_steps": 8436, "loss": 0.3852, "learning_rate": 7.582938388625593e-06, "epoch": 0.22755555555555557, "percentage": 7.59, "elapsed_time": "0:48:15", "remaining_time": "9:47:50"} | |
| {"current_steps": 650, "total_steps": 8436, "loss": 0.3753, "learning_rate": 7.701421800947868e-06, "epoch": 0.2311111111111111, "percentage": 7.71, "elapsed_time": "0:48:54", "remaining_time": "9:45:45"} | |
| {"current_steps": 660, "total_steps": 8436, "loss": 0.3622, "learning_rate": 7.819905213270143e-06, "epoch": 0.23466666666666666, "percentage": 7.82, "elapsed_time": "0:49:29", "remaining_time": "9:43:10"} | |
| {"current_steps": 670, "total_steps": 8436, "loss": 0.3776, "learning_rate": 7.938388625592418e-06, "epoch": 0.23822222222222222, "percentage": 7.94, "elapsed_time": "0:50:09", "remaining_time": "9:41:22"} | |
| {"current_steps": 680, "total_steps": 8436, "loss": 0.4131, "learning_rate": 8.056872037914693e-06, "epoch": 0.24177777777777779, "percentage": 8.06, "elapsed_time": "0:50:46", "remaining_time": "9:39:12"} | |
| {"current_steps": 690, "total_steps": 8436, "loss": 0.4041, "learning_rate": 8.175355450236966e-06, "epoch": 0.24533333333333332, "percentage": 8.18, "elapsed_time": "0:51:21", "remaining_time": "9:36:35"} | |
| {"current_steps": 700, "total_steps": 8436, "loss": 0.4342, "learning_rate": 8.293838862559243e-06, "epoch": 0.24888888888888888, "percentage": 8.3, "elapsed_time": "0:52:01", "remaining_time": "9:34:57"} | |
| {"current_steps": 710, "total_steps": 8436, "loss": 0.3753, "learning_rate": 8.412322274881517e-06, "epoch": 0.25244444444444447, "percentage": 8.42, "elapsed_time": "0:52:37", "remaining_time": "9:32:44"} | |
| {"current_steps": 720, "total_steps": 8436, "loss": 0.3499, "learning_rate": 8.530805687203793e-06, "epoch": 0.256, "percentage": 8.53, "elapsed_time": "0:53:15", "remaining_time": "9:30:41"} | |
| {"current_steps": 730, "total_steps": 8436, "loss": 0.3676, "learning_rate": 8.649289099526067e-06, "epoch": 0.25955555555555554, "percentage": 8.65, "elapsed_time": "0:53:50", "remaining_time": "9:28:19"} | |
| {"current_steps": 740, "total_steps": 8436, "loss": 0.3882, "learning_rate": 8.767772511848342e-06, "epoch": 0.26311111111111113, "percentage": 8.77, "elapsed_time": "0:54:24", "remaining_time": "9:25:53"} | |
| {"current_steps": 750, "total_steps": 8436, "loss": 0.3906, "learning_rate": 8.886255924170617e-06, "epoch": 0.26666666666666666, "percentage": 8.89, "elapsed_time": "0:55:01", "remaining_time": "9:23:57"} | |
| {"current_steps": 760, "total_steps": 8436, "loss": 0.3881, "learning_rate": 9.004739336492892e-06, "epoch": 0.2702222222222222, "percentage": 9.01, "elapsed_time": "0:55:38", "remaining_time": "9:21:55"} | |
| {"current_steps": 770, "total_steps": 8436, "loss": 0.3598, "learning_rate": 9.123222748815167e-06, "epoch": 0.2737777777777778, "percentage": 9.13, "elapsed_time": "0:56:13", "remaining_time": "9:19:49"} | |
| {"current_steps": 780, "total_steps": 8436, "loss": 0.3411, "learning_rate": 9.241706161137442e-06, "epoch": 0.2773333333333333, "percentage": 9.25, "elapsed_time": "0:56:51", "remaining_time": "9:18:08"} | |
| {"current_steps": 790, "total_steps": 8436, "loss": 0.3989, "learning_rate": 9.360189573459715e-06, "epoch": 0.2808888888888889, "percentage": 9.36, "elapsed_time": "0:57:31", "remaining_time": "9:16:43"} | |
| {"current_steps": 800, "total_steps": 8436, "loss": 0.3982, "learning_rate": 9.478672985781992e-06, "epoch": 0.28444444444444444, "percentage": 9.48, "elapsed_time": "0:58:09", "remaining_time": "9:15:11"} | |
| {"current_steps": 810, "total_steps": 8436, "loss": 0.414, "learning_rate": 9.597156398104265e-06, "epoch": 0.288, "percentage": 9.6, "elapsed_time": "0:58:44", "remaining_time": "9:13:04"} | |
| {"current_steps": 820, "total_steps": 8436, "loss": 0.3767, "learning_rate": 9.715639810426542e-06, "epoch": 0.29155555555555557, "percentage": 9.72, "elapsed_time": "0:59:22", "remaining_time": "9:11:31"} | |
| {"current_steps": 830, "total_steps": 8436, "loss": 0.3775, "learning_rate": 9.834123222748815e-06, "epoch": 0.2951111111111111, "percentage": 9.84, "elapsed_time": "0:59:58", "remaining_time": "9:09:35"} | |
| {"current_steps": 840, "total_steps": 8436, "loss": 0.3955, "learning_rate": 9.95260663507109e-06, "epoch": 0.2986666666666667, "percentage": 9.96, "elapsed_time": "1:00:34", "remaining_time": "9:07:43"} | |
| {"current_steps": 850, "total_steps": 8436, "loss": 0.3897, "learning_rate": 9.999984589042141e-06, "epoch": 0.3022222222222222, "percentage": 10.08, "elapsed_time": "1:01:10", "remaining_time": "9:05:53"} | |
| {"current_steps": 860, "total_steps": 8436, "loss": 0.3657, "learning_rate": 9.999890411310363e-06, "epoch": 0.30577777777777776, "percentage": 10.19, "elapsed_time": "1:01:46", "remaining_time": "9:04:08"} | |
| {"current_steps": 870, "total_steps": 8436, "loss": 0.3699, "learning_rate": 9.999710619100732e-06, "epoch": 0.30933333333333335, "percentage": 10.31, "elapsed_time": "1:02:21", "remaining_time": "9:02:15"} | |
| {"current_steps": 880, "total_steps": 8436, "loss": 0.3675, "learning_rate": 9.999445215491888e-06, "epoch": 0.3128888888888889, "percentage": 10.43, "elapsed_time": "1:02:57", "remaining_time": "9:00:35"} | |
| {"current_steps": 890, "total_steps": 8436, "loss": 0.3804, "learning_rate": 9.999094205028403e-06, "epoch": 0.3164444444444444, "percentage": 10.55, "elapsed_time": "1:03:34", "remaining_time": "8:58:59"} | |
| {"current_steps": 900, "total_steps": 8436, "loss": 0.3628, "learning_rate": 9.998657593720726e-06, "epoch": 0.32, "percentage": 10.67, "elapsed_time": "1:04:09", "remaining_time": "8:57:15"} | |
| {"current_steps": 910, "total_steps": 8436, "loss": 0.3832, "learning_rate": 9.998135389045071e-06, "epoch": 0.32355555555555554, "percentage": 10.79, "elapsed_time": "1:04:46", "remaining_time": "8:55:39"} | |
| {"current_steps": 920, "total_steps": 8436, "loss": 0.3931, "learning_rate": 9.997527599943288e-06, "epoch": 0.32711111111111113, "percentage": 10.91, "elapsed_time": "1:05:23", "remaining_time": "8:54:15"} | |
| {"current_steps": 930, "total_steps": 8436, "loss": 0.3587, "learning_rate": 9.996834236822718e-06, "epoch": 0.33066666666666666, "percentage": 11.02, "elapsed_time": "1:06:03", "remaining_time": "8:53:10"} | |
| {"current_steps": 940, "total_steps": 8436, "loss": 0.4065, "learning_rate": 9.996055311556002e-06, "epoch": 0.3342222222222222, "percentage": 11.14, "elapsed_time": "1:06:39", "remaining_time": "8:51:30"} | |
| {"current_steps": 950, "total_steps": 8436, "loss": 0.3861, "learning_rate": 9.99519083748089e-06, "epoch": 0.3377777777777778, "percentage": 11.26, "elapsed_time": "1:07:18", "remaining_time": "8:50:20"} | |
| {"current_steps": 960, "total_steps": 8436, "loss": 0.3794, "learning_rate": 9.994240829400006e-06, "epoch": 0.3413333333333333, "percentage": 11.38, "elapsed_time": "1:07:56", "remaining_time": "8:49:07"} | |
| {"current_steps": 970, "total_steps": 8436, "loss": 0.3675, "learning_rate": 9.993205303580596e-06, "epoch": 0.3448888888888889, "percentage": 11.5, "elapsed_time": "1:08:33", "remaining_time": "8:47:38"} | |
| {"current_steps": 980, "total_steps": 8436, "loss": 0.3725, "learning_rate": 9.992084277754246e-06, "epoch": 0.34844444444444445, "percentage": 11.62, "elapsed_time": "1:09:11", "remaining_time": "8:46:25"} | |
| {"current_steps": 990, "total_steps": 8436, "loss": 0.3526, "learning_rate": 9.990877771116588e-06, "epoch": 0.352, "percentage": 11.74, "elapsed_time": "1:09:47", "remaining_time": "8:44:58"} | |
| {"current_steps": 1000, "total_steps": 8436, "loss": 0.3451, "learning_rate": 9.989585804326963e-06, "epoch": 0.35555555555555557, "percentage": 11.85, "elapsed_time": "1:10:23", "remaining_time": "8:43:22"} | |
| {"current_steps": 1000, "total_steps": 8436, "eval_loss": 0.2586575448513031, "epoch": 0.35555555555555557, "percentage": 11.85, "elapsed_time": "1:19:44", "remaining_time": "9:53:00"} | |
| {"current_steps": 1010, "total_steps": 8436, "loss": 0.3923, "learning_rate": 9.988208399508064e-06, "epoch": 0.3591111111111111, "percentage": 11.97, "elapsed_time": "1:20:19", "remaining_time": "9:50:32"} | |
| {"current_steps": 1020, "total_steps": 8436, "loss": 0.3077, "learning_rate": 9.986745580245569e-06, "epoch": 0.3626666666666667, "percentage": 12.09, "elapsed_time": "1:20:56", "remaining_time": "9:48:32"} | |
| {"current_steps": 1030, "total_steps": 8436, "loss": 0.389, "learning_rate": 9.985197371587732e-06, "epoch": 0.3662222222222222, "percentage": 12.21, "elapsed_time": "1:21:33", "remaining_time": "9:46:23"} | |
| {"current_steps": 1040, "total_steps": 8436, "loss": 0.3424, "learning_rate": 9.983563800044942e-06, "epoch": 0.36977777777777776, "percentage": 12.33, "elapsed_time": "1:22:08", "remaining_time": "9:44:11"} | |
| {"current_steps": 1050, "total_steps": 8436, "loss": 0.3558, "learning_rate": 9.981844893589294e-06, "epoch": 0.37333333333333335, "percentage": 12.45, "elapsed_time": "1:22:46", "remaining_time": "9:42:14"} | |
| {"current_steps": 1060, "total_steps": 8436, "loss": 0.3693, "learning_rate": 9.980040681654085e-06, "epoch": 0.3768888888888889, "percentage": 12.57, "elapsed_time": "1:23:21", "remaining_time": "9:40:04"} | |
| {"current_steps": 1070, "total_steps": 8436, "loss": 0.3638, "learning_rate": 9.978151195133326e-06, "epoch": 0.3804444444444444, "percentage": 12.68, "elapsed_time": "1:23:57", "remaining_time": "9:37:56"} | |
| {"current_steps": 1080, "total_steps": 8436, "loss": 0.3484, "learning_rate": 9.976176466381205e-06, "epoch": 0.384, "percentage": 12.8, "elapsed_time": "1:24:32", "remaining_time": "9:35:50"} | |
| {"current_steps": 1090, "total_steps": 8436, "loss": 0.3967, "learning_rate": 9.974116529211539e-06, "epoch": 0.38755555555555554, "percentage": 12.92, "elapsed_time": "1:25:08", "remaining_time": "9:33:47"} | |
| {"current_steps": 1100, "total_steps": 8436, "loss": 0.3741, "learning_rate": 9.971971418897189e-06, "epoch": 0.39111111111111113, "percentage": 13.04, "elapsed_time": "1:25:42", "remaining_time": "9:31:34"} | |
| {"current_steps": 1110, "total_steps": 8436, "loss": 0.3904, "learning_rate": 9.969741172169461e-06, "epoch": 0.39466666666666667, "percentage": 13.16, "elapsed_time": "1:26:18", "remaining_time": "9:29:39"} | |
| {"current_steps": 1120, "total_steps": 8436, "loss": 0.3485, "learning_rate": 9.967425827217473e-06, "epoch": 0.3982222222222222, "percentage": 13.28, "elapsed_time": "1:26:55", "remaining_time": "9:27:45"} | |
| {"current_steps": 1130, "total_steps": 8436, "loss": 0.346, "learning_rate": 9.965025423687505e-06, "epoch": 0.4017777777777778, "percentage": 13.39, "elapsed_time": "1:27:31", "remaining_time": "9:25:55"} | |
| {"current_steps": 1140, "total_steps": 8436, "loss": 0.3635, "learning_rate": 9.962540002682314e-06, "epoch": 0.4053333333333333, "percentage": 13.51, "elapsed_time": "1:28:09", "remaining_time": "9:24:15"} | |
| {"current_steps": 1150, "total_steps": 8436, "loss": 0.3794, "learning_rate": 9.95996960676044e-06, "epoch": 0.4088888888888889, "percentage": 13.63, "elapsed_time": "1:28:46", "remaining_time": "9:22:27"} | |
| {"current_steps": 1160, "total_steps": 8436, "loss": 0.3727, "learning_rate": 9.957314279935467e-06, "epoch": 0.41244444444444445, "percentage": 13.75, "elapsed_time": "1:29:23", "remaining_time": "9:20:40"} | |
| {"current_steps": 1170, "total_steps": 8436, "loss": 0.3472, "learning_rate": 9.954574067675276e-06, "epoch": 0.416, "percentage": 13.87, "elapsed_time": "1:30:01", "remaining_time": "9:19:07"} | |
| {"current_steps": 1180, "total_steps": 8436, "loss": 0.3651, "learning_rate": 9.951749016901266e-06, "epoch": 0.41955555555555557, "percentage": 13.99, "elapsed_time": "1:30:37", "remaining_time": "9:17:18"} | |
| {"current_steps": 1190, "total_steps": 8436, "loss": 0.4007, "learning_rate": 9.948839175987543e-06, "epoch": 0.4231111111111111, "percentage": 14.11, "elapsed_time": "1:31:13", "remaining_time": "9:15:26"} | |
| {"current_steps": 1200, "total_steps": 8436, "loss": 0.3662, "learning_rate": 9.945844594760104e-06, "epoch": 0.4266666666666667, "percentage": 14.22, "elapsed_time": "1:31:49", "remaining_time": "9:13:44"} | |
| {"current_steps": 1210, "total_steps": 8436, "loss": 0.3266, "learning_rate": 9.94276532449597e-06, "epoch": 0.43022222222222223, "percentage": 14.34, "elapsed_time": "1:32:25", "remaining_time": "9:11:54"} | |
| {"current_steps": 1220, "total_steps": 8436, "loss": 0.367, "learning_rate": 9.939601417922326e-06, "epoch": 0.43377777777777776, "percentage": 14.46, "elapsed_time": "1:32:59", "remaining_time": "9:10:00"} | |
| {"current_steps": 1230, "total_steps": 8436, "loss": 0.3479, "learning_rate": 9.936352929215598e-06, "epoch": 0.43733333333333335, "percentage": 14.58, "elapsed_time": "1:33:36", "remaining_time": "9:08:24"} | |
| {"current_steps": 1240, "total_steps": 8436, "loss": 0.3991, "learning_rate": 9.933019914000537e-06, "epoch": 0.4408888888888889, "percentage": 14.7, "elapsed_time": "1:34:13", "remaining_time": "9:06:46"} | |
| {"current_steps": 1250, "total_steps": 8436, "loss": 0.387, "learning_rate": 9.929602429349267e-06, "epoch": 0.4444444444444444, "percentage": 14.82, "elapsed_time": "1:34:48", "remaining_time": "9:05:03"} | |
| {"current_steps": 1260, "total_steps": 8436, "loss": 0.3623, "learning_rate": 9.926100533780304e-06, "epoch": 0.448, "percentage": 14.94, "elapsed_time": "1:35:22", "remaining_time": "9:03:13"} | |
| {"current_steps": 1270, "total_steps": 8436, "loss": 0.3758, "learning_rate": 9.922514287257553e-06, "epoch": 0.45155555555555554, "percentage": 15.05, "elapsed_time": "1:36:01", "remaining_time": "9:01:50"} | |
| {"current_steps": 1280, "total_steps": 8436, "loss": 0.3355, "learning_rate": 9.918843751189285e-06, "epoch": 0.45511111111111113, "percentage": 15.17, "elapsed_time": "1:36:36", "remaining_time": "9:00:04"} | |
| {"current_steps": 1290, "total_steps": 8436, "loss": 0.3698, "learning_rate": 9.915088988427085e-06, "epoch": 0.45866666666666667, "percentage": 15.29, "elapsed_time": "1:37:10", "remaining_time": "8:58:18"} | |
| {"current_steps": 1300, "total_steps": 8436, "loss": 0.4047, "learning_rate": 9.911250063264768e-06, "epoch": 0.4622222222222222, "percentage": 15.41, "elapsed_time": "1:37:48", "remaining_time": "8:56:50"} | |
| {"current_steps": 1310, "total_steps": 8436, "loss": 0.3692, "learning_rate": 9.907327041437295e-06, "epoch": 0.4657777777777778, "percentage": 15.53, "elapsed_time": "1:38:23", "remaining_time": "8:55:11"} | |
| {"current_steps": 1320, "total_steps": 8436, "loss": 0.36, "learning_rate": 9.903319990119629e-06, "epoch": 0.4693333333333333, "percentage": 15.65, "elapsed_time": "1:38:59", "remaining_time": "8:53:40"} | |
| {"current_steps": 1330, "total_steps": 8436, "loss": 0.3741, "learning_rate": 9.899228977925594e-06, "epoch": 0.4728888888888889, "percentage": 15.77, "elapsed_time": "1:39:34", "remaining_time": "8:51:59"} | |
| {"current_steps": 1340, "total_steps": 8436, "loss": 0.3407, "learning_rate": 9.895054074906703e-06, "epoch": 0.47644444444444445, "percentage": 15.88, "elapsed_time": "1:40:09", "remaining_time": "8:50:24"} | |
| {"current_steps": 1350, "total_steps": 8436, "loss": 0.3737, "learning_rate": 9.890795352550949e-06, "epoch": 0.48, "percentage": 16.0, "elapsed_time": "1:40:46", "remaining_time": "8:48:59"} | |
| {"current_steps": 1360, "total_steps": 8436, "loss": 0.3706, "learning_rate": 9.886452883781588e-06, "epoch": 0.48355555555555557, "percentage": 16.12, "elapsed_time": "1:41:22", "remaining_time": "8:47:24"} | |
| {"current_steps": 1370, "total_steps": 8436, "loss": 0.3593, "learning_rate": 9.882026742955892e-06, "epoch": 0.4871111111111111, "percentage": 16.24, "elapsed_time": "1:41:56", "remaining_time": "8:45:45"} | |
| {"current_steps": 1380, "total_steps": 8436, "loss": 0.388, "learning_rate": 9.877517005863865e-06, "epoch": 0.49066666666666664, "percentage": 16.36, "elapsed_time": "1:42:32", "remaining_time": "8:44:16"} | |
| {"current_steps": 1390, "total_steps": 8436, "loss": 0.3825, "learning_rate": 9.872923749726959e-06, "epoch": 0.49422222222222223, "percentage": 16.48, "elapsed_time": "1:43:09", "remaining_time": "8:42:57"} | |
| {"current_steps": 1400, "total_steps": 8436, "loss": 0.3406, "learning_rate": 9.868247053196744e-06, "epoch": 0.49777777777777776, "percentage": 16.6, "elapsed_time": "1:43:44", "remaining_time": "8:41:22"} | |
| {"current_steps": 1410, "total_steps": 8436, "loss": 0.3718, "learning_rate": 9.86348699635356e-06, "epoch": 0.5013333333333333, "percentage": 16.71, "elapsed_time": "1:44:19", "remaining_time": "8:39:48"} | |
| {"current_steps": 1420, "total_steps": 8436, "loss": 0.3728, "learning_rate": 9.85864366070515e-06, "epoch": 0.5048888888888889, "percentage": 16.83, "elapsed_time": "1:44:57", "remaining_time": "8:38:35"} | |
| {"current_steps": 1430, "total_steps": 8436, "loss": 0.3371, "learning_rate": 9.853717129185262e-06, "epoch": 0.5084444444444445, "percentage": 16.95, "elapsed_time": "1:45:33", "remaining_time": "8:37:11"} | |
| {"current_steps": 1440, "total_steps": 8436, "loss": 0.3468, "learning_rate": 9.848707486152231e-06, "epoch": 0.512, "percentage": 17.07, "elapsed_time": "1:46:08", "remaining_time": "8:35:39"} | |
| {"current_steps": 1450, "total_steps": 8436, "loss": 0.3456, "learning_rate": 9.843614817387531e-06, "epoch": 0.5155555555555555, "percentage": 17.19, "elapsed_time": "1:46:43", "remaining_time": "8:34:12"} | |
| {"current_steps": 1460, "total_steps": 8436, "loss": 0.3244, "learning_rate": 9.838439210094309e-06, "epoch": 0.5191111111111111, "percentage": 17.31, "elapsed_time": "1:47:23", "remaining_time": "8:33:08"} | |
| {"current_steps": 1470, "total_steps": 8436, "loss": 0.3391, "learning_rate": 9.833180752895887e-06, "epoch": 0.5226666666666666, "percentage": 17.43, "elapsed_time": "1:48:04", "remaining_time": "8:32:08"} | |
| {"current_steps": 1480, "total_steps": 8436, "loss": 0.3922, "learning_rate": 9.827839535834258e-06, "epoch": 0.5262222222222223, "percentage": 17.54, "elapsed_time": "1:48:39", "remaining_time": "8:30:43"} | |
| {"current_steps": 1490, "total_steps": 8436, "loss": 0.304, "learning_rate": 9.822415650368525e-06, "epoch": 0.5297777777777778, "percentage": 17.66, "elapsed_time": "1:49:17", "remaining_time": "8:29:27"} | |
| {"current_steps": 1500, "total_steps": 8436, "loss": 0.3531, "learning_rate": 9.816909189373347e-06, "epoch": 0.5333333333333333, "percentage": 17.78, "elapsed_time": "1:49:51", "remaining_time": "8:27:59"} | |
| {"current_steps": 1500, "total_steps": 8436, "eval_loss": 0.24488620460033417, "epoch": 0.5333333333333333, "percentage": 17.78, "elapsed_time": "1:59:13", "remaining_time": "9:11:18"} | |
| {"current_steps": 1510, "total_steps": 8436, "loss": 0.3771, "learning_rate": 9.81132024713735e-06, "epoch": 0.5368888888888889, "percentage": 17.9, "elapsed_time": "1:59:50", "remaining_time": "9:09:43"} | |
| {"current_steps": 1520, "total_steps": 8436, "loss": 0.3848, "learning_rate": 9.805648919361505e-06, "epoch": 0.5404444444444444, "percentage": 18.02, "elapsed_time": "2:00:26", "remaining_time": "9:08:00"} | |
| {"current_steps": 1530, "total_steps": 8436, "loss": 0.3694, "learning_rate": 9.799895303157492e-06, "epoch": 0.544, "percentage": 18.14, "elapsed_time": "2:01:02", "remaining_time": "9:06:22"} | |
| {"current_steps": 1540, "total_steps": 8436, "loss": 0.3553, "learning_rate": 9.794059497046043e-06, "epoch": 0.5475555555555556, "percentage": 18.26, "elapsed_time": "2:01:39", "remaining_time": "9:04:47"} | |
| {"current_steps": 1550, "total_steps": 8436, "loss": 0.3357, "learning_rate": 9.788141600955244e-06, "epoch": 0.5511111111111111, "percentage": 18.37, "elapsed_time": "2:02:14", "remaining_time": "9:03:05"} | |
| {"current_steps": 1560, "total_steps": 8436, "loss": 0.3448, "learning_rate": 9.782141716218832e-06, "epoch": 0.5546666666666666, "percentage": 18.49, "elapsed_time": "2:02:50", "remaining_time": "9:01:24"} | |
| {"current_steps": 1570, "total_steps": 8436, "loss": 0.3336, "learning_rate": 9.77605994557446e-06, "epoch": 0.5582222222222222, "percentage": 18.61, "elapsed_time": "2:03:27", "remaining_time": "8:59:56"} | |
| {"current_steps": 1580, "total_steps": 8436, "loss": 0.336, "learning_rate": 9.769896393161937e-06, "epoch": 0.5617777777777778, "percentage": 18.73, "elapsed_time": "2:04:03", "remaining_time": "8:58:18"} | |
| {"current_steps": 1590, "total_steps": 8436, "loss": 0.3505, "learning_rate": 9.763651164521436e-06, "epoch": 0.5653333333333334, "percentage": 18.85, "elapsed_time": "2:04:40", "remaining_time": "8:56:50"} | |
| {"current_steps": 1600, "total_steps": 8436, "loss": 0.3816, "learning_rate": 9.7573243665917e-06, "epoch": 0.5688888888888889, "percentage": 18.97, "elapsed_time": "2:05:16", "remaining_time": "8:55:12"} | |
| {"current_steps": 1610, "total_steps": 8436, "loss": 0.358, "learning_rate": 9.750916107708205e-06, "epoch": 0.5724444444444444, "percentage": 19.08, "elapsed_time": "2:05:53", "remaining_time": "8:53:44"} | |
| {"current_steps": 1620, "total_steps": 8436, "loss": 0.363, "learning_rate": 9.744426497601305e-06, "epoch": 0.576, "percentage": 19.2, "elapsed_time": "2:06:28", "remaining_time": "8:52:09"} | |
| {"current_steps": 1630, "total_steps": 8436, "loss": 0.3544, "learning_rate": 9.737855647394346e-06, "epoch": 0.5795555555555556, "percentage": 19.32, "elapsed_time": "2:07:06", "remaining_time": "8:50:44"} | |
| {"current_steps": 1640, "total_steps": 8436, "loss": 0.375, "learning_rate": 9.73120366960178e-06, "epoch": 0.5831111111111111, "percentage": 19.44, "elapsed_time": "2:07:43", "remaining_time": "8:49:15"} | |
| {"current_steps": 1650, "total_steps": 8436, "loss": 0.3649, "learning_rate": 9.724470678127226e-06, "epoch": 0.5866666666666667, "percentage": 19.56, "elapsed_time": "2:08:23", "remaining_time": "8:48:02"} | |
| {"current_steps": 1660, "total_steps": 8436, "loss": 0.3716, "learning_rate": 9.717656788261519e-06, "epoch": 0.5902222222222222, "percentage": 19.68, "elapsed_time": "2:09:00", "remaining_time": "8:46:35"} | |
| {"current_steps": 1670, "total_steps": 8436, "loss": 0.352, "learning_rate": 9.71076211668074e-06, "epoch": 0.5937777777777777, "percentage": 19.8, "elapsed_time": "2:09:35", "remaining_time": "8:45:03"} | |
| {"current_steps": 1680, "total_steps": 8436, "loss": 0.3555, "learning_rate": 9.703786781444218e-06, "epoch": 0.5973333333333334, "percentage": 19.91, "elapsed_time": "2:10:12", "remaining_time": "8:43:37"} | |
| {"current_steps": 1690, "total_steps": 8436, "loss": 0.3348, "learning_rate": 9.69673090199251e-06, "epoch": 0.6008888888888889, "percentage": 20.03, "elapsed_time": "2:10:47", "remaining_time": "8:42:06"} | |
| {"current_steps": 1700, "total_steps": 8436, "loss": 0.3499, "learning_rate": 9.689594599145348e-06, "epoch": 0.6044444444444445, "percentage": 20.15, "elapsed_time": "2:11:26", "remaining_time": "8:40:47"} | |
| {"current_steps": 1710, "total_steps": 8436, "loss": 0.3389, "learning_rate": 9.682377995099581e-06, "epoch": 0.608, "percentage": 20.27, "elapsed_time": "2:12:02", "remaining_time": "8:39:20"} | |
| {"current_steps": 1720, "total_steps": 8436, "loss": 0.3412, "learning_rate": 9.675081213427076e-06, "epoch": 0.6115555555555555, "percentage": 20.39, "elapsed_time": "2:12:40", "remaining_time": "8:38:03"} | |
| {"current_steps": 1730, "total_steps": 8436, "loss": 0.3363, "learning_rate": 9.667704379072597e-06, "epoch": 0.6151111111111112, "percentage": 20.51, "elapsed_time": "2:13:19", "remaining_time": "8:36:50"} | |
| {"current_steps": 1740, "total_steps": 8436, "loss": 0.3328, "learning_rate": 9.660247618351683e-06, "epoch": 0.6186666666666667, "percentage": 20.63, "elapsed_time": "2:13:55", "remaining_time": "8:35:22"} | |
| {"current_steps": 1750, "total_steps": 8436, "loss": 0.3509, "learning_rate": 9.652711058948463e-06, "epoch": 0.6222222222222222, "percentage": 20.74, "elapsed_time": "2:14:30", "remaining_time": "8:33:54"} | |
| {"current_steps": 1760, "total_steps": 8436, "loss": 0.3471, "learning_rate": 9.645094829913487e-06, "epoch": 0.6257777777777778, "percentage": 20.86, "elapsed_time": "2:15:06", "remaining_time": "8:32:29"} | |
| {"current_steps": 1770, "total_steps": 8436, "loss": 0.3246, "learning_rate": 9.637399061661507e-06, "epoch": 0.6293333333333333, "percentage": 20.98, "elapsed_time": "2:15:42", "remaining_time": "8:31:05"} | |
| {"current_steps": 1780, "total_steps": 8436, "loss": 0.3399, "learning_rate": 9.62962388596925e-06, "epoch": 0.6328888888888888, "percentage": 21.1, "elapsed_time": "2:16:18", "remaining_time": "8:29:42"} | |
| {"current_steps": 1790, "total_steps": 8436, "loss": 0.3478, "learning_rate": 9.621769435973152e-06, "epoch": 0.6364444444444445, "percentage": 21.22, "elapsed_time": "2:16:52", "remaining_time": "8:28:12"} | |
| {"current_steps": 1800, "total_steps": 8436, "loss": 0.3251, "learning_rate": 9.61383584616709e-06, "epoch": 0.64, "percentage": 21.34, "elapsed_time": "2:17:27", "remaining_time": "8:26:45"} | |
| {"current_steps": 1810, "total_steps": 8436, "loss": 0.3553, "learning_rate": 9.60582325240007e-06, "epoch": 0.6435555555555555, "percentage": 21.46, "elapsed_time": "2:18:03", "remaining_time": "8:25:25"} | |
| {"current_steps": 1820, "total_steps": 8436, "loss": 0.3594, "learning_rate": 9.597731791873907e-06, "epoch": 0.6471111111111111, "percentage": 21.57, "elapsed_time": "2:18:40", "remaining_time": "8:24:06"} | |
| {"current_steps": 1830, "total_steps": 8436, "loss": 0.3549, "learning_rate": 9.58956160314087e-06, "epoch": 0.6506666666666666, "percentage": 21.69, "elapsed_time": "2:19:16", "remaining_time": "8:22:44"} | |
| {"current_steps": 1840, "total_steps": 8436, "loss": 0.3813, "learning_rate": 9.581312826101315e-06, "epoch": 0.6542222222222223, "percentage": 21.81, "elapsed_time": "2:19:54", "remaining_time": "8:21:31"} | |
| {"current_steps": 1850, "total_steps": 8436, "loss": 0.3518, "learning_rate": 9.572985602001283e-06, "epoch": 0.6577777777777778, "percentage": 21.93, "elapsed_time": "2:20:29", "remaining_time": "8:20:09"} | |
| {"current_steps": 1860, "total_steps": 8436, "loss": 0.3303, "learning_rate": 9.56458007343009e-06, "epoch": 0.6613333333333333, "percentage": 22.05, "elapsed_time": "2:21:05", "remaining_time": "8:18:51"} | |
| {"current_steps": 1870, "total_steps": 8436, "loss": 0.3403, "learning_rate": 9.556096384317878e-06, "epoch": 0.6648888888888889, "percentage": 22.17, "elapsed_time": "2:21:42", "remaining_time": "8:17:35"} | |
| {"current_steps": 1880, "total_steps": 8436, "loss": 0.3717, "learning_rate": 9.547534679933155e-06, "epoch": 0.6684444444444444, "percentage": 22.29, "elapsed_time": "2:22:21", "remaining_time": "8:16:26"} | |
| {"current_steps": 1890, "total_steps": 8436, "loss": 0.3468, "learning_rate": 9.538895106880302e-06, "epoch": 0.672, "percentage": 22.4, "elapsed_time": "2:23:00", "remaining_time": "8:15:18"} | |
| {"current_steps": 1900, "total_steps": 8436, "loss": 0.3495, "learning_rate": 9.53017781309707e-06, "epoch": 0.6755555555555556, "percentage": 22.52, "elapsed_time": "2:23:37", "remaining_time": "8:14:03"} | |
| {"current_steps": 1910, "total_steps": 8436, "loss": 0.3631, "learning_rate": 9.521382947852042e-06, "epoch": 0.6791111111111111, "percentage": 22.64, "elapsed_time": "2:24:15", "remaining_time": "8:12:53"} | |
| {"current_steps": 1920, "total_steps": 8436, "loss": 0.366, "learning_rate": 9.512510661742078e-06, "epoch": 0.6826666666666666, "percentage": 22.76, "elapsed_time": "2:24:50", "remaining_time": "8:11:33"} | |
| {"current_steps": 1930, "total_steps": 8436, "loss": 0.3165, "learning_rate": 9.503561106689736e-06, "epoch": 0.6862222222222222, "percentage": 22.88, "elapsed_time": "2:25:27", "remaining_time": "8:10:21"} | |
| {"current_steps": 1940, "total_steps": 8436, "loss": 0.3199, "learning_rate": 9.494534435940668e-06, "epoch": 0.6897777777777778, "percentage": 23.0, "elapsed_time": "2:26:05", "remaining_time": "8:09:12"} | |
| {"current_steps": 1950, "total_steps": 8436, "loss": 0.3244, "learning_rate": 9.485430804061009e-06, "epoch": 0.6933333333333334, "percentage": 23.12, "elapsed_time": "2:26:42", "remaining_time": "8:07:58"} | |
| {"current_steps": 1960, "total_steps": 8436, "loss": 0.3557, "learning_rate": 9.476250366934708e-06, "epoch": 0.6968888888888889, "percentage": 23.23, "elapsed_time": "2:27:17", "remaining_time": "8:06:41"} | |
| {"current_steps": 1970, "total_steps": 8436, "loss": 0.3367, "learning_rate": 9.466993281760879e-06, "epoch": 0.7004444444444444, "percentage": 23.35, "elapsed_time": "2:27:53", "remaining_time": "8:05:26"} | |
| {"current_steps": 1980, "total_steps": 8436, "loss": 0.335, "learning_rate": 9.457659707051099e-06, "epoch": 0.704, "percentage": 23.47, "elapsed_time": "2:28:32", "remaining_time": "8:04:18"} | |
| {"current_steps": 1990, "total_steps": 8436, "loss": 0.3286, "learning_rate": 9.448249802626696e-06, "epoch": 0.7075555555555556, "percentage": 23.59, "elapsed_time": "2:29:07", "remaining_time": "8:03:02"} | |
| {"current_steps": 2000, "total_steps": 8436, "loss": 0.3544, "learning_rate": 9.43876372961601e-06, "epoch": 0.7111111111111111, "percentage": 23.71, "elapsed_time": "2:29:42", "remaining_time": "8:01:44"} | |
| {"current_steps": 2000, "total_steps": 8436, "eval_loss": 0.23682241141796112, "epoch": 0.7111111111111111, "percentage": 23.71, "elapsed_time": "2:39:03", "remaining_time": "8:31:49"} | |
| {"current_steps": 2010, "total_steps": 8436, "loss": 0.3218, "learning_rate": 9.429201650451642e-06, "epoch": 0.7146666666666667, "percentage": 23.83, "elapsed_time": "2:40:03", "remaining_time": "8:31:43"} | |
| {"current_steps": 2020, "total_steps": 8436, "loss": 0.3417, "learning_rate": 9.419563728867663e-06, "epoch": 0.7182222222222222, "percentage": 23.94, "elapsed_time": "2:40:40", "remaining_time": "8:30:19"} | |
| {"current_steps": 2030, "total_steps": 8436, "loss": 0.3104, "learning_rate": 9.409850129896812e-06, "epoch": 0.7217777777777777, "percentage": 24.06, "elapsed_time": "2:41:17", "remaining_time": "8:28:57"} | |
| {"current_steps": 2040, "total_steps": 8436, "loss": 0.3371, "learning_rate": 9.40006101986768e-06, "epoch": 0.7253333333333334, "percentage": 24.18, "elapsed_time": "2:41:53", "remaining_time": "8:27:34"} | |
| {"current_steps": 2050, "total_steps": 8436, "loss": 0.3324, "learning_rate": 9.390196566401844e-06, "epoch": 0.7288888888888889, "percentage": 24.3, "elapsed_time": "2:42:29", "remaining_time": "8:26:09"} | |
| {"current_steps": 2060, "total_steps": 8436, "loss": 0.3384, "learning_rate": 9.38025693841102e-06, "epoch": 0.7324444444444445, "percentage": 24.42, "elapsed_time": "2:43:02", "remaining_time": "8:24:39"} | |
| {"current_steps": 2070, "total_steps": 8436, "loss": 0.3339, "learning_rate": 9.370242306094141e-06, "epoch": 0.736, "percentage": 24.54, "elapsed_time": "2:43:38", "remaining_time": "8:23:15"} | |
| {"current_steps": 2080, "total_steps": 8436, "loss": 0.3449, "learning_rate": 9.360152840934477e-06, "epoch": 0.7395555555555555, "percentage": 24.66, "elapsed_time": "2:44:14", "remaining_time": "8:21:53"} | |
| {"current_steps": 2090, "total_steps": 8436, "loss": 0.3444, "learning_rate": 9.349988715696671e-06, "epoch": 0.7431111111111111, "percentage": 24.77, "elapsed_time": "2:44:51", "remaining_time": "8:20:34"} | |
| {"current_steps": 2100, "total_steps": 8436, "loss": 0.3496, "learning_rate": 9.33975010442379e-06, "epoch": 0.7466666666666667, "percentage": 24.89, "elapsed_time": "2:45:28", "remaining_time": "8:19:16"} | |
| {"current_steps": 2110, "total_steps": 8436, "loss": 0.3202, "learning_rate": 9.329437182434351e-06, "epoch": 0.7502222222222222, "percentage": 25.01, "elapsed_time": "2:46:04", "remaining_time": "8:17:53"} | |
| {"current_steps": 2120, "total_steps": 8436, "loss": 0.3545, "learning_rate": 9.31905012631931e-06, "epoch": 0.7537777777777778, "percentage": 25.13, "elapsed_time": "2:46:45", "remaining_time": "8:16:48"} | |
| {"current_steps": 2130, "total_steps": 8436, "loss": 0.3457, "learning_rate": 9.30858911393904e-06, "epoch": 0.7573333333333333, "percentage": 25.25, "elapsed_time": "2:47:20", "remaining_time": "8:15:25"} | |
| {"current_steps": 2140, "total_steps": 8436, "loss": 0.3125, "learning_rate": 9.298054324420294e-06, "epoch": 0.7608888888888888, "percentage": 25.37, "elapsed_time": "2:47:58", "remaining_time": "8:14:10"} | |
| {"current_steps": 2150, "total_steps": 8436, "loss": 0.3596, "learning_rate": 9.287445938153121e-06, "epoch": 0.7644444444444445, "percentage": 25.49, "elapsed_time": "2:48:33", "remaining_time": "8:12:49"} | |
| {"current_steps": 2160, "total_steps": 8436, "loss": 0.3352, "learning_rate": 9.276764136787798e-06, "epoch": 0.768, "percentage": 25.6, "elapsed_time": "2:49:08", "remaining_time": "8:11:27"} | |
| {"current_steps": 2170, "total_steps": 8436, "loss": 0.3504, "learning_rate": 9.266009103231702e-06, "epoch": 0.7715555555555556, "percentage": 25.72, "elapsed_time": "2:49:45", "remaining_time": "8:10:10"} | |
| {"current_steps": 2180, "total_steps": 8436, "loss": 0.3289, "learning_rate": 9.255181021646182e-06, "epoch": 0.7751111111111111, "percentage": 25.84, "elapsed_time": "2:50:19", "remaining_time": "8:08:47"} | |
| {"current_steps": 2190, "total_steps": 8436, "loss": 0.3542, "learning_rate": 9.244280077443417e-06, "epoch": 0.7786666666666666, "percentage": 25.96, "elapsed_time": "2:50:56", "remaining_time": "8:07:31"} | |
| {"current_steps": 2200, "total_steps": 8436, "loss": 0.3516, "learning_rate": 9.233306457283223e-06, "epoch": 0.7822222222222223, "percentage": 26.08, "elapsed_time": "2:51:31", "remaining_time": "8:06:11"} | |
| {"current_steps": 2210, "total_steps": 8436, "loss": 0.3489, "learning_rate": 9.222260349069874e-06, "epoch": 0.7857777777777778, "percentage": 26.2, "elapsed_time": "2:52:08", "remaining_time": "8:04:56"} | |
| {"current_steps": 2220, "total_steps": 8436, "loss": 0.3581, "learning_rate": 9.211141941948872e-06, "epoch": 0.7893333333333333, "percentage": 26.32, "elapsed_time": "2:52:44", "remaining_time": "8:03:40"} | |
| {"current_steps": 2230, "total_steps": 8436, "loss": 0.3415, "learning_rate": 9.199951426303711e-06, "epoch": 0.7928888888888889, "percentage": 26.43, "elapsed_time": "2:53:21", "remaining_time": "8:02:26"} | |
| {"current_steps": 2240, "total_steps": 8436, "loss": 0.3355, "learning_rate": 9.188688993752626e-06, "epoch": 0.7964444444444444, "percentage": 26.55, "elapsed_time": "2:53:58", "remaining_time": "8:01:13"} | |
| {"current_steps": 2250, "total_steps": 8436, "loss": 0.3394, "learning_rate": 9.177354837145298e-06, "epoch": 0.8, "percentage": 26.67, "elapsed_time": "2:54:33", "remaining_time": "7:59:56"} | |
| {"current_steps": 2260, "total_steps": 8436, "loss": 0.3545, "learning_rate": 9.165949150559561e-06, "epoch": 0.8035555555555556, "percentage": 26.79, "elapsed_time": "2:55:08", "remaining_time": "7:58:37"} | |
| {"current_steps": 2270, "total_steps": 8436, "loss": 0.363, "learning_rate": 9.154472129298075e-06, "epoch": 0.8071111111111111, "percentage": 26.91, "elapsed_time": "2:55:46", "remaining_time": "7:57:27"} | |
| {"current_steps": 2280, "total_steps": 8436, "loss": 0.3395, "learning_rate": 9.142923969884984e-06, "epoch": 0.8106666666666666, "percentage": 27.03, "elapsed_time": "2:56:22", "remaining_time": "7:56:11"} | |
| {"current_steps": 2290, "total_steps": 8436, "loss": 0.3486, "learning_rate": 9.131304870062554e-06, "epoch": 0.8142222222222222, "percentage": 27.15, "elapsed_time": "2:57:01", "remaining_time": "7:55:05"} | |
| {"current_steps": 2300, "total_steps": 8436, "loss": 0.3509, "learning_rate": 9.119615028787771e-06, "epoch": 0.8177777777777778, "percentage": 27.26, "elapsed_time": "2:57:37", "remaining_time": "7:53:52"} | |
| {"current_steps": 2310, "total_steps": 8436, "loss": 0.325, "learning_rate": 9.107854646228961e-06, "epoch": 0.8213333333333334, "percentage": 27.38, "elapsed_time": "2:58:12", "remaining_time": "7:52:36"} | |
| {"current_steps": 2320, "total_steps": 8436, "loss": 0.3149, "learning_rate": 9.096023923762333e-06, "epoch": 0.8248888888888889, "percentage": 27.5, "elapsed_time": "2:58:52", "remaining_time": "7:51:32"} | |
| {"current_steps": 2330, "total_steps": 8436, "loss": 0.348, "learning_rate": 9.08412306396856e-06, "epoch": 0.8284444444444444, "percentage": 27.62, "elapsed_time": "2:59:29", "remaining_time": "7:50:23"} | |
| {"current_steps": 2340, "total_steps": 8436, "loss": 0.3096, "learning_rate": 9.072152270629281e-06, "epoch": 0.832, "percentage": 27.74, "elapsed_time": "3:00:05", "remaining_time": "7:49:09"} | |
| {"current_steps": 2350, "total_steps": 8436, "loss": 0.3609, "learning_rate": 9.060111748723639e-06, "epoch": 0.8355555555555556, "percentage": 27.86, "elapsed_time": "3:00:40", "remaining_time": "7:47:54"} | |
| {"current_steps": 2360, "total_steps": 8436, "loss": 0.3307, "learning_rate": 9.048001704424747e-06, "epoch": 0.8391111111111111, "percentage": 27.98, "elapsed_time": "3:01:14", "remaining_time": "7:46:37"} | |
| {"current_steps": 2370, "total_steps": 8436, "loss": 0.3327, "learning_rate": 9.035822345096177e-06, "epoch": 0.8426666666666667, "percentage": 28.09, "elapsed_time": "3:01:51", "remaining_time": "7:45:26"} | |
| {"current_steps": 2380, "total_steps": 8436, "loss": 0.3312, "learning_rate": 9.023573879288394e-06, "epoch": 0.8462222222222222, "percentage": 28.21, "elapsed_time": "3:02:28", "remaining_time": "7:44:19"} | |
| {"current_steps": 2390, "total_steps": 8436, "loss": 0.3298, "learning_rate": 9.0112565167352e-06, "epoch": 0.8497777777777777, "percentage": 28.33, "elapsed_time": "3:03:03", "remaining_time": "7:43:05"} | |
| {"current_steps": 2400, "total_steps": 8436, "loss": 0.3404, "learning_rate": 8.99887046835013e-06, "epoch": 0.8533333333333334, "percentage": 28.45, "elapsed_time": "3:03:37", "remaining_time": "7:41:50"} | |
| {"current_steps": 2410, "total_steps": 8436, "loss": 0.3351, "learning_rate": 8.986415946222843e-06, "epoch": 0.8568888888888889, "percentage": 28.57, "elapsed_time": "3:04:14", "remaining_time": "7:40:39"} | |
| {"current_steps": 2420, "total_steps": 8436, "loss": 0.3257, "learning_rate": 8.973893163615498e-06, "epoch": 0.8604444444444445, "percentage": 28.69, "elapsed_time": "3:04:50", "remaining_time": "7:39:29"} | |
| {"current_steps": 2430, "total_steps": 8436, "loss": 0.3199, "learning_rate": 8.96130233495909e-06, "epoch": 0.864, "percentage": 28.81, "elapsed_time": "3:05:28", "remaining_time": "7:38:25"} | |
| {"current_steps": 2440, "total_steps": 8436, "loss": 0.3442, "learning_rate": 8.948643675849793e-06, "epoch": 0.8675555555555555, "percentage": 28.92, "elapsed_time": "3:06:02", "remaining_time": "7:37:11"} | |
| {"current_steps": 2450, "total_steps": 8436, "loss": 0.2947, "learning_rate": 8.935917403045251e-06, "epoch": 0.8711111111111111, "percentage": 29.04, "elapsed_time": "3:06:38", "remaining_time": "7:36:01"} | |
| {"current_steps": 2460, "total_steps": 8436, "loss": 0.3577, "learning_rate": 8.923123734460885e-06, "epoch": 0.8746666666666667, "percentage": 29.16, "elapsed_time": "3:07:14", "remaining_time": "7:34:51"} | |
| {"current_steps": 2470, "total_steps": 8436, "loss": 0.3326, "learning_rate": 8.910262889166144e-06, "epoch": 0.8782222222222222, "percentage": 29.28, "elapsed_time": "3:07:56", "remaining_time": "7:33:57"} | |
| {"current_steps": 2480, "total_steps": 8436, "loss": 0.3212, "learning_rate": 8.897335087380769e-06, "epoch": 0.8817777777777778, "percentage": 29.4, "elapsed_time": "3:08:32", "remaining_time": "7:32:47"} | |
| {"current_steps": 2490, "total_steps": 8436, "loss": 0.3143, "learning_rate": 8.884340550471008e-06, "epoch": 0.8853333333333333, "percentage": 29.52, "elapsed_time": "3:09:07", "remaining_time": "7:31:37"} | |
| {"current_steps": 2500, "total_steps": 8436, "loss": 0.3747, "learning_rate": 8.87127950094584e-06, "epoch": 0.8888888888888888, "percentage": 29.63, "elapsed_time": "3:09:41", "remaining_time": "7:30:24"} | |
| {"current_steps": 2500, "total_steps": 8436, "eval_loss": 0.23135392367839813, "epoch": 0.8888888888888888, "percentage": 29.63, "elapsed_time": "3:19:03", "remaining_time": "7:52:39"} | |
| {"current_steps": 2510, "total_steps": 8436, "loss": 0.3251, "learning_rate": 8.85815216245315e-06, "epoch": 0.8924444444444445, "percentage": 29.75, "elapsed_time": "3:19:40", "remaining_time": "7:51:26"} | |
| {"current_steps": 2520, "total_steps": 8436, "loss": 0.3242, "learning_rate": 8.844958759775917e-06, "epoch": 0.896, "percentage": 29.87, "elapsed_time": "3:20:19", "remaining_time": "7:50:16"} | |
| {"current_steps": 2530, "total_steps": 8436, "loss": 0.3069, "learning_rate": 8.83169951882834e-06, "epoch": 0.8995555555555556, "percentage": 29.99, "elapsed_time": "3:20:55", "remaining_time": "7:49:01"} | |
| {"current_steps": 2540, "total_steps": 8436, "loss": 0.3303, "learning_rate": 8.818374666652001e-06, "epoch": 0.9031111111111111, "percentage": 30.11, "elapsed_time": "3:21:30", "remaining_time": "7:47:44"} | |
| {"current_steps": 2550, "total_steps": 8436, "loss": 0.3558, "learning_rate": 8.804984431411951e-06, "epoch": 0.9066666666666666, "percentage": 30.23, "elapsed_time": "3:22:06", "remaining_time": "7:46:30"} | |
| {"current_steps": 2560, "total_steps": 8436, "loss": 0.3947, "learning_rate": 8.791529042392813e-06, "epoch": 0.9102222222222223, "percentage": 30.35, "elapsed_time": "3:22:43", "remaining_time": "7:45:19"} | |
| {"current_steps": 2570, "total_steps": 8436, "loss": 0.3362, "learning_rate": 8.77800872999486e-06, "epoch": 0.9137777777777778, "percentage": 30.46, "elapsed_time": "3:23:19", "remaining_time": "7:44:06"} | |
| {"current_steps": 2580, "total_steps": 8436, "loss": 0.3298, "learning_rate": 8.764423725730062e-06, "epoch": 0.9173333333333333, "percentage": 30.58, "elapsed_time": "3:23:56", "remaining_time": "7:42:53"} | |
| {"current_steps": 2590, "total_steps": 8436, "loss": 0.3218, "learning_rate": 8.750774262218129e-06, "epoch": 0.9208888888888889, "percentage": 30.7, "elapsed_time": "3:24:31", "remaining_time": "7:41:38"} | |
| {"current_steps": 2600, "total_steps": 8436, "loss": 0.3325, "learning_rate": 8.737060573182518e-06, "epoch": 0.9244444444444444, "percentage": 30.82, "elapsed_time": "3:25:07", "remaining_time": "7:40:25"} | |
| {"current_steps": 2610, "total_steps": 8436, "loss": 0.3496, "learning_rate": 8.723282893446447e-06, "epoch": 0.928, "percentage": 30.94, "elapsed_time": "3:25:46", "remaining_time": "7:39:18"} | |
| {"current_steps": 2620, "total_steps": 8436, "loss": 0.3197, "learning_rate": 8.709441458928853e-06, "epoch": 0.9315555555555556, "percentage": 31.06, "elapsed_time": "3:26:22", "remaining_time": "7:38:06"} | |
| {"current_steps": 2630, "total_steps": 8436, "loss": 0.3349, "learning_rate": 8.695536506640369e-06, "epoch": 0.9351111111111111, "percentage": 31.18, "elapsed_time": "3:26:57", "remaining_time": "7:36:53"} | |
| {"current_steps": 2640, "total_steps": 8436, "loss": 0.3357, "learning_rate": 8.681568274679264e-06, "epoch": 0.9386666666666666, "percentage": 31.29, "elapsed_time": "3:27:33", "remaining_time": "7:35:40"} | |
| {"current_steps": 2650, "total_steps": 8436, "loss": 0.3023, "learning_rate": 8.66753700222735e-06, "epoch": 0.9422222222222222, "percentage": 31.41, "elapsed_time": "3:28:09", "remaining_time": "7:34:29"} | |
| {"current_steps": 2660, "total_steps": 8436, "loss": 0.3482, "learning_rate": 8.653442929545914e-06, "epoch": 0.9457777777777778, "percentage": 31.53, "elapsed_time": "3:28:45", "remaining_time": "7:33:18"} | |
| {"current_steps": 2670, "total_steps": 8436, "loss": 0.3111, "learning_rate": 8.639286297971575e-06, "epoch": 0.9493333333333334, "percentage": 31.65, "elapsed_time": "3:29:22", "remaining_time": "7:32:08"} | |
| {"current_steps": 2680, "total_steps": 8436, "loss": 0.3333, "learning_rate": 8.625067349912171e-06, "epoch": 0.9528888888888889, "percentage": 31.77, "elapsed_time": "3:29:57", "remaining_time": "7:30:57"} | |
| {"current_steps": 2690, "total_steps": 8436, "loss": 0.3012, "learning_rate": 8.610786328842602e-06, "epoch": 0.9564444444444444, "percentage": 31.89, "elapsed_time": "3:30:33", "remaining_time": "7:29:45"} | |
| {"current_steps": 2700, "total_steps": 8436, "loss": 0.3158, "learning_rate": 8.59644347930066e-06, "epoch": 0.96, "percentage": 32.01, "elapsed_time": "3:31:08", "remaining_time": "7:28:32"} | |
| {"current_steps": 2710, "total_steps": 8436, "loss": 0.3045, "learning_rate": 8.582039046882842e-06, "epoch": 0.9635555555555556, "percentage": 32.12, "elapsed_time": "3:31:43", "remaining_time": "7:27:20"} | |
| {"current_steps": 2720, "total_steps": 8436, "loss": 0.3379, "learning_rate": 8.567573278240147e-06, "epoch": 0.9671111111111111, "percentage": 32.24, "elapsed_time": "3:32:18", "remaining_time": "7:26:09"} | |
| {"current_steps": 2730, "total_steps": 8436, "loss": 0.3376, "learning_rate": 8.55304642107385e-06, "epoch": 0.9706666666666667, "percentage": 32.36, "elapsed_time": "3:32:56", "remaining_time": "7:25:05"} | |
| {"current_steps": 2740, "total_steps": 8436, "loss": 0.3395, "learning_rate": 8.538458724131258e-06, "epoch": 0.9742222222222222, "percentage": 32.48, "elapsed_time": "3:33:32", "remaining_time": "7:23:55"} | |
| {"current_steps": 2750, "total_steps": 8436, "loss": 0.3105, "learning_rate": 8.523810437201463e-06, "epoch": 0.9777777777777777, "percentage": 32.6, "elapsed_time": "3:34:08", "remaining_time": "7:22:46"} | |
| {"current_steps": 2760, "total_steps": 8436, "loss": 0.314, "learning_rate": 8.509101811111045e-06, "epoch": 0.9813333333333333, "percentage": 32.72, "elapsed_time": "3:34:46", "remaining_time": "7:21:40"} | |
| {"current_steps": 2770, "total_steps": 8436, "loss": 0.3183, "learning_rate": 8.494333097719795e-06, "epoch": 0.9848888888888889, "percentage": 32.84, "elapsed_time": "3:35:25", "remaining_time": "7:20:38"} | |
| {"current_steps": 2780, "total_steps": 8436, "loss": 0.3459, "learning_rate": 8.479504549916393e-06, "epoch": 0.9884444444444445, "percentage": 32.95, "elapsed_time": "3:36:02", "remaining_time": "7:19:31"} | |
| {"current_steps": 2790, "total_steps": 8436, "loss": 0.3655, "learning_rate": 8.464616421614077e-06, "epoch": 0.992, "percentage": 33.07, "elapsed_time": "3:36:39", "remaining_time": "7:18:26"} | |
| {"current_steps": 2800, "total_steps": 8436, "loss": 0.3145, "learning_rate": 8.449668967746303e-06, "epoch": 0.9955555555555555, "percentage": 33.19, "elapsed_time": "3:37:15", "remaining_time": "7:17:17"} | |
| {"current_steps": 2810, "total_steps": 8436, "loss": 0.3152, "learning_rate": 8.434662444262374e-06, "epoch": 0.9991111111111111, "percentage": 33.31, "elapsed_time": "3:37:51", "remaining_time": "7:16:10"} | |
| {"current_steps": 2820, "total_steps": 8436, "loss": 0.256, "learning_rate": 8.419597108123054e-06, "epoch": 1.0026666666666666, "percentage": 33.43, "elapsed_time": "3:38:26", "remaining_time": "7:15:01"} | |
| {"current_steps": 2830, "total_steps": 8436, "loss": 0.2304, "learning_rate": 8.404473217296174e-06, "epoch": 1.0062222222222221, "percentage": 33.55, "elapsed_time": "3:39:03", "remaining_time": "7:13:56"} | |
| {"current_steps": 2840, "total_steps": 8436, "loss": 0.2451, "learning_rate": 8.389291030752215e-06, "epoch": 1.0097777777777779, "percentage": 33.67, "elapsed_time": "3:39:41", "remaining_time": "7:12:53"} | |
| {"current_steps": 2850, "total_steps": 8436, "loss": 0.2463, "learning_rate": 8.37405080845987e-06, "epoch": 1.0133333333333334, "percentage": 33.78, "elapsed_time": "3:40:20", "remaining_time": "7:11:51"} | |
| {"current_steps": 2860, "total_steps": 8436, "loss": 0.2439, "learning_rate": 8.358752811381592e-06, "epoch": 1.016888888888889, "percentage": 33.9, "elapsed_time": "3:40:56", "remaining_time": "7:10:45"} | |
| {"current_steps": 2870, "total_steps": 8436, "loss": 0.2301, "learning_rate": 8.343397301469127e-06, "epoch": 1.0204444444444445, "percentage": 34.02, "elapsed_time": "3:41:31", "remaining_time": "7:09:37"} | |
| {"current_steps": 2880, "total_steps": 8436, "loss": 0.26, "learning_rate": 8.327984541659035e-06, "epoch": 1.024, "percentage": 34.14, "elapsed_time": "3:42:09", "remaining_time": "7:08:34"} | |
| {"current_steps": 2890, "total_steps": 8436, "loss": 0.2537, "learning_rate": 8.312514795868177e-06, "epoch": 1.0275555555555556, "percentage": 34.26, "elapsed_time": "3:42:45", "remaining_time": "7:07:28"} | |
| {"current_steps": 2900, "total_steps": 8436, "loss": 0.2474, "learning_rate": 8.296988328989195e-06, "epoch": 1.031111111111111, "percentage": 34.38, "elapsed_time": "3:43:21", "remaining_time": "7:06:22"} | |
| {"current_steps": 2910, "total_steps": 8436, "loss": 0.2259, "learning_rate": 8.281405406885992e-06, "epoch": 1.0346666666666666, "percentage": 34.5, "elapsed_time": "3:43:57", "remaining_time": "7:05:16"} | |
| {"current_steps": 2920, "total_steps": 8436, "loss": 0.2206, "learning_rate": 8.265766296389164e-06, "epoch": 1.0382222222222222, "percentage": 34.61, "elapsed_time": "3:44:31", "remaining_time": "7:04:08"} | |
| {"current_steps": 2930, "total_steps": 8436, "loss": 0.2498, "learning_rate": 8.250071265291432e-06, "epoch": 1.0417777777777777, "percentage": 34.73, "elapsed_time": "3:45:07", "remaining_time": "7:03:02"} | |
| {"current_steps": 2940, "total_steps": 8436, "loss": 0.2316, "learning_rate": 8.23432058234307e-06, "epoch": 1.0453333333333332, "percentage": 34.85, "elapsed_time": "3:45:42", "remaining_time": "7:01:55"} | |
| {"current_steps": 2950, "total_steps": 8436, "loss": 0.2421, "learning_rate": 8.218514517247287e-06, "epoch": 1.048888888888889, "percentage": 34.97, "elapsed_time": "3:46:20", "remaining_time": "7:00:54"} | |
| {"current_steps": 2960, "total_steps": 8436, "loss": 0.2547, "learning_rate": 8.202653340655614e-06, "epoch": 1.0524444444444445, "percentage": 35.09, "elapsed_time": "3:46:55", "remaining_time": "6:59:48"} | |
| {"current_steps": 2970, "total_steps": 8436, "loss": 0.2609, "learning_rate": 8.18673732416328e-06, "epoch": 1.056, "percentage": 35.21, "elapsed_time": "3:47:32", "remaining_time": "6:58:46"} | |
| {"current_steps": 2980, "total_steps": 8436, "loss": 0.2369, "learning_rate": 8.170766740304541e-06, "epoch": 1.0595555555555556, "percentage": 35.32, "elapsed_time": "3:48:06", "remaining_time": "6:57:38"} | |
| {"current_steps": 2990, "total_steps": 8436, "loss": 0.2519, "learning_rate": 8.154741862548035e-06, "epoch": 1.0631111111111111, "percentage": 35.44, "elapsed_time": "3:48:40", "remaining_time": "6:56:31"} | |
| {"current_steps": 3000, "total_steps": 8436, "loss": 0.2248, "learning_rate": 8.13866296529208e-06, "epoch": 1.0666666666666667, "percentage": 35.56, "elapsed_time": "3:49:16", "remaining_time": "6:55:27"} | |
| {"current_steps": 3000, "total_steps": 8436, "eval_loss": 0.23144060373306274, "epoch": 1.0666666666666667, "percentage": 35.56, "elapsed_time": "3:58:38", "remaining_time": "7:12:25"} | |
| {"current_steps": 3010, "total_steps": 8436, "loss": 0.2494, "learning_rate": 8.122530323859992e-06, "epoch": 1.0702222222222222, "percentage": 35.68, "elapsed_time": "3:59:12", "remaining_time": "7:11:13"} | |
| {"current_steps": 3020, "total_steps": 8436, "loss": 0.2168, "learning_rate": 8.106344214495359e-06, "epoch": 1.0737777777777777, "percentage": 35.8, "elapsed_time": "3:59:47", "remaining_time": "7:10:02"} | |
| {"current_steps": 3030, "total_steps": 8436, "loss": 0.2544, "learning_rate": 8.090104914357316e-06, "epoch": 1.0773333333333333, "percentage": 35.92, "elapsed_time": "4:00:23", "remaining_time": "7:08:53"} | |
| {"current_steps": 3040, "total_steps": 8436, "loss": 0.2362, "learning_rate": 8.073812701515799e-06, "epoch": 1.0808888888888888, "percentage": 36.04, "elapsed_time": "4:00:59", "remaining_time": "7:07:46"} | |
| {"current_steps": 3050, "total_steps": 8436, "loss": 0.238, "learning_rate": 8.057467854946783e-06, "epoch": 1.0844444444444445, "percentage": 36.15, "elapsed_time": "4:01:37", "remaining_time": "7:06:41"} | |
| {"current_steps": 3060, "total_steps": 8436, "loss": 0.2329, "learning_rate": 8.041070654527498e-06, "epoch": 1.088, "percentage": 36.27, "elapsed_time": "4:02:14", "remaining_time": "7:05:34"} | |
| {"current_steps": 3070, "total_steps": 8436, "loss": 0.2525, "learning_rate": 8.024621381031654e-06, "epoch": 1.0915555555555556, "percentage": 36.39, "elapsed_time": "4:02:49", "remaining_time": "7:04:25"} | |
| {"current_steps": 3080, "total_steps": 8436, "loss": 0.2378, "learning_rate": 8.008120316124612e-06, "epoch": 1.0951111111111111, "percentage": 36.51, "elapsed_time": "4:03:27", "remaining_time": "7:03:22"} | |
| {"current_steps": 3090, "total_steps": 8436, "loss": 0.2469, "learning_rate": 7.991567742358582e-06, "epoch": 1.0986666666666667, "percentage": 36.63, "elapsed_time": "4:04:06", "remaining_time": "7:02:20"} | |
| {"current_steps": 3100, "total_steps": 8436, "loss": 0.2721, "learning_rate": 7.974963943167761e-06, "epoch": 1.1022222222222222, "percentage": 36.75, "elapsed_time": "4:04:41", "remaining_time": "7:01:11"} | |
| {"current_steps": 3110, "total_steps": 8436, "loss": 0.2457, "learning_rate": 7.958309202863506e-06, "epoch": 1.1057777777777777, "percentage": 36.87, "elapsed_time": "4:05:18", "remaining_time": "7:00:05"} | |
| {"current_steps": 3120, "total_steps": 8436, "loss": 0.2274, "learning_rate": 7.941603806629444e-06, "epoch": 1.1093333333333333, "percentage": 36.98, "elapsed_time": "4:05:52", "remaining_time": "6:58:56"} | |
| {"current_steps": 3130, "total_steps": 8436, "loss": 0.2595, "learning_rate": 7.9248480405166e-06, "epoch": 1.1128888888888888, "percentage": 37.1, "elapsed_time": "4:06:27", "remaining_time": "6:57:47"} | |
| {"current_steps": 3140, "total_steps": 8436, "loss": 0.2374, "learning_rate": 7.908042191438497e-06, "epoch": 1.1164444444444444, "percentage": 37.22, "elapsed_time": "4:07:05", "remaining_time": "6:56:45"} | |
| {"current_steps": 3150, "total_steps": 8436, "loss": 0.2128, "learning_rate": 7.891186547166238e-06, "epoch": 1.12, "percentage": 37.34, "elapsed_time": "4:07:40", "remaining_time": "6:55:37"} | |
| {"current_steps": 3160, "total_steps": 8436, "loss": 0.2263, "learning_rate": 7.874281396323589e-06, "epoch": 1.1235555555555556, "percentage": 37.46, "elapsed_time": "4:08:16", "remaining_time": "6:54:31"} | |
| {"current_steps": 3170, "total_steps": 8436, "loss": 0.2392, "learning_rate": 7.857327028382025e-06, "epoch": 1.1271111111111112, "percentage": 37.58, "elapsed_time": "4:08:50", "remaining_time": "6:53:22"} | |
| {"current_steps": 3180, "total_steps": 8436, "loss": 0.2342, "learning_rate": 7.84032373365578e-06, "epoch": 1.1306666666666667, "percentage": 37.7, "elapsed_time": "4:09:26", "remaining_time": "6:52:16"} | |
| {"current_steps": 3190, "total_steps": 8436, "loss": 0.2271, "learning_rate": 7.823271803296876e-06, "epoch": 1.1342222222222222, "percentage": 37.81, "elapsed_time": "4:10:03", "remaining_time": "6:51:13"} | |
| {"current_steps": 3200, "total_steps": 8436, "loss": 0.2376, "learning_rate": 7.80617152929014e-06, "epoch": 1.1377777777777778, "percentage": 37.93, "elapsed_time": "4:10:37", "remaining_time": "6:50:05"} | |
| {"current_steps": 3210, "total_steps": 8436, "loss": 0.2516, "learning_rate": 7.789023204448189e-06, "epoch": 1.1413333333333333, "percentage": 38.05, "elapsed_time": "4:11:14", "remaining_time": "6:49:02"} | |
| {"current_steps": 3220, "total_steps": 8436, "loss": 0.2265, "learning_rate": 7.771827122406437e-06, "epoch": 1.1448888888888888, "percentage": 38.17, "elapsed_time": "4:11:49", "remaining_time": "6:47:56"} | |
| {"current_steps": 3230, "total_steps": 8436, "loss": 0.2554, "learning_rate": 7.754583577618057e-06, "epoch": 1.1484444444444444, "percentage": 38.29, "elapsed_time": "4:12:25", "remaining_time": "6:46:51"} | |
| {"current_steps": 3240, "total_steps": 8436, "loss": 0.2408, "learning_rate": 7.737292865348933e-06, "epoch": 1.152, "percentage": 38.41, "elapsed_time": "4:13:03", "remaining_time": "6:45:49"} | |
| {"current_steps": 3250, "total_steps": 8436, "loss": 0.2287, "learning_rate": 7.719955281672618e-06, "epoch": 1.1555555555555554, "percentage": 38.53, "elapsed_time": "4:13:40", "remaining_time": "6:44:47"} | |
| {"current_steps": 3260, "total_steps": 8436, "loss": 0.237, "learning_rate": 7.702571123465252e-06, "epoch": 1.1591111111111112, "percentage": 38.64, "elapsed_time": "4:14:14", "remaining_time": "6:43:40"} | |
| {"current_steps": 3270, "total_steps": 8436, "loss": 0.2393, "learning_rate": 7.685140688400484e-06, "epoch": 1.1626666666666667, "percentage": 38.76, "elapsed_time": "4:14:53", "remaining_time": "6:42:41"} | |
| {"current_steps": 3280, "total_steps": 8436, "loss": 0.2158, "learning_rate": 7.66766427494438e-06, "epoch": 1.1662222222222223, "percentage": 38.88, "elapsed_time": "4:15:31", "remaining_time": "6:41:39"} | |
| {"current_steps": 3290, "total_steps": 8436, "loss": 0.201, "learning_rate": 7.650142182350294e-06, "epoch": 1.1697777777777778, "percentage": 39.0, "elapsed_time": "4:16:08", "remaining_time": "6:40:38"} | |
| {"current_steps": 3300, "total_steps": 8436, "loss": 0.2627, "learning_rate": 7.632574710653773e-06, "epoch": 1.1733333333333333, "percentage": 39.12, "elapsed_time": "4:16:43", "remaining_time": "6:39:34"} | |
| {"current_steps": 3310, "total_steps": 8436, "loss": 0.221, "learning_rate": 7.614962160667384e-06, "epoch": 1.1768888888888889, "percentage": 39.24, "elapsed_time": "4:17:24", "remaining_time": "6:38:37"} | |
| {"current_steps": 3320, "total_steps": 8436, "loss": 0.2419, "learning_rate": 7.597304833975596e-06, "epoch": 1.1804444444444444, "percentage": 39.36, "elapsed_time": "4:17:58", "remaining_time": "6:37:32"} | |
| {"current_steps": 3330, "total_steps": 8436, "loss": 0.2572, "learning_rate": 7.579603032929597e-06, "epoch": 1.184, "percentage": 39.47, "elapsed_time": "4:18:37", "remaining_time": "6:36:33"} | |
| {"current_steps": 3340, "total_steps": 8436, "loss": 0.2462, "learning_rate": 7.56185706064212e-06, "epoch": 1.1875555555555555, "percentage": 39.59, "elapsed_time": "4:19:15", "remaining_time": "6:35:33"} | |
| {"current_steps": 3350, "total_steps": 8436, "loss": 0.2312, "learning_rate": 7.544067220982254e-06, "epoch": 1.1911111111111112, "percentage": 39.71, "elapsed_time": "4:19:53", "remaining_time": "6:34:34"} | |
| {"current_steps": 3360, "total_steps": 8436, "loss": 0.2067, "learning_rate": 7.526233818570245e-06, "epoch": 1.1946666666666665, "percentage": 39.83, "elapsed_time": "4:20:28", "remaining_time": "6:33:30"} | |
| {"current_steps": 3370, "total_steps": 8436, "loss": 0.2448, "learning_rate": 7.508357158772273e-06, "epoch": 1.1982222222222223, "percentage": 39.95, "elapsed_time": "4:21:04", "remaining_time": "6:32:27"} | |
| {"current_steps": 3380, "total_steps": 8436, "loss": 0.2194, "learning_rate": 7.490437547695224e-06, "epoch": 1.2017777777777778, "percentage": 40.07, "elapsed_time": "4:21:39", "remaining_time": "6:31:24"} | |
| {"current_steps": 3390, "total_steps": 8436, "loss": 0.2501, "learning_rate": 7.472475292181454e-06, "epoch": 1.2053333333333334, "percentage": 40.18, "elapsed_time": "4:22:16", "remaining_time": "6:30:23"} | |
| {"current_steps": 3400, "total_steps": 8436, "loss": 0.2515, "learning_rate": 7.45447069980353e-06, "epoch": 1.208888888888889, "percentage": 40.3, "elapsed_time": "4:22:51", "remaining_time": "6:29:20"} | |
| {"current_steps": 3410, "total_steps": 8436, "loss": 0.2461, "learning_rate": 7.4364240788589625e-06, "epoch": 1.2124444444444444, "percentage": 40.42, "elapsed_time": "4:23:26", "remaining_time": "6:28:17"} | |
| {"current_steps": 3420, "total_steps": 8436, "loss": 0.2241, "learning_rate": 7.418335738364931e-06, "epoch": 1.216, "percentage": 40.54, "elapsed_time": "4:24:01", "remaining_time": "6:27:14"} | |
| {"current_steps": 3430, "total_steps": 8436, "loss": 0.2298, "learning_rate": 7.400205988052991e-06, "epoch": 1.2195555555555555, "percentage": 40.66, "elapsed_time": "4:24:36", "remaining_time": "6:26:11"} | |
| {"current_steps": 3440, "total_steps": 8436, "loss": 0.2516, "learning_rate": 7.382035138363764e-06, "epoch": 1.223111111111111, "percentage": 40.78, "elapsed_time": "4:25:10", "remaining_time": "6:25:07"} | |
| {"current_steps": 3450, "total_steps": 8436, "loss": 0.2422, "learning_rate": 7.363823500441636e-06, "epoch": 1.2266666666666666, "percentage": 40.9, "elapsed_time": "4:25:49", "remaining_time": "6:24:09"} | |
| {"current_steps": 3460, "total_steps": 8436, "loss": 0.2368, "learning_rate": 7.345571386129413e-06, "epoch": 1.2302222222222223, "percentage": 41.01, "elapsed_time": "4:26:24", "remaining_time": "6:23:07"} | |
| {"current_steps": 3470, "total_steps": 8436, "loss": 0.2488, "learning_rate": 7.327279107962995e-06, "epoch": 1.2337777777777779, "percentage": 41.13, "elapsed_time": "4:26:59", "remaining_time": "6:22:05"} | |
| {"current_steps": 3480, "total_steps": 8436, "loss": 0.2277, "learning_rate": 7.308946979166012e-06, "epoch": 1.2373333333333334, "percentage": 41.25, "elapsed_time": "4:27:37", "remaining_time": "6:21:07"} | |
| {"current_steps": 3490, "total_steps": 8436, "loss": 0.2329, "learning_rate": 7.290575313644476e-06, "epoch": 1.240888888888889, "percentage": 41.37, "elapsed_time": "4:28:13", "remaining_time": "6:20:07"} | |
| {"current_steps": 3500, "total_steps": 8436, "loss": 0.2575, "learning_rate": 7.272164425981387e-06, "epoch": 1.2444444444444445, "percentage": 41.49, "elapsed_time": "4:28:53", "remaining_time": "6:19:12"} | |
| {"current_steps": 3500, "total_steps": 8436, "eval_loss": 0.22694812715053558, "epoch": 1.2444444444444445, "percentage": 41.49, "elapsed_time": "4:38:17", "remaining_time": "6:32:27"} | |
| {"current_steps": 3510, "total_steps": 8436, "loss": 0.2492, "learning_rate": 7.253714631431366e-06, "epoch": 1.248, "percentage": 41.61, "elapsed_time": "4:38:52", "remaining_time": "6:31:23"} | |
| {"current_steps": 3520, "total_steps": 8436, "loss": 0.2259, "learning_rate": 7.235226245915239e-06, "epoch": 1.2515555555555555, "percentage": 41.73, "elapsed_time": "4:39:30", "remaining_time": "6:30:21"} | |
| {"current_steps": 3530, "total_steps": 8436, "loss": 0.2487, "learning_rate": 7.216699586014642e-06, "epoch": 1.255111111111111, "percentage": 41.84, "elapsed_time": "4:40:05", "remaining_time": "6:29:16"} | |
| {"current_steps": 3540, "total_steps": 8436, "loss": 0.2341, "learning_rate": 7.198134968966588e-06, "epoch": 1.2586666666666666, "percentage": 41.96, "elapsed_time": "4:40:39", "remaining_time": "6:28:10"} | |
| {"current_steps": 3550, "total_steps": 8436, "loss": 0.2625, "learning_rate": 7.179532712658047e-06, "epoch": 1.2622222222222224, "percentage": 42.08, "elapsed_time": "4:41:16", "remaining_time": "6:27:08"} | |
| {"current_steps": 3560, "total_steps": 8436, "loss": 0.2602, "learning_rate": 7.160893135620488e-06, "epoch": 1.2657777777777777, "percentage": 42.2, "elapsed_time": "4:41:52", "remaining_time": "6:26:04"} | |
| {"current_steps": 3570, "total_steps": 8436, "loss": 0.2221, "learning_rate": 7.142216557024443e-06, "epoch": 1.2693333333333334, "percentage": 42.32, "elapsed_time": "4:42:32", "remaining_time": "6:25:06"} | |
| {"current_steps": 3580, "total_steps": 8436, "loss": 0.247, "learning_rate": 7.123503296674021e-06, "epoch": 1.272888888888889, "percentage": 42.44, "elapsed_time": "4:43:07", "remaining_time": "6:24:02"} | |
| {"current_steps": 3590, "total_steps": 8436, "loss": 0.2405, "learning_rate": 7.104753675001453e-06, "epoch": 1.2764444444444445, "percentage": 42.56, "elapsed_time": "4:43:42", "remaining_time": "6:22:58"} | |
| {"current_steps": 3600, "total_steps": 8436, "loss": 0.2452, "learning_rate": 7.085968013061585e-06, "epoch": 1.28, "percentage": 42.67, "elapsed_time": "4:44:17", "remaining_time": "6:21:54"} | |
| {"current_steps": 3610, "total_steps": 8436, "loss": 0.2813, "learning_rate": 7.067146632526398e-06, "epoch": 1.2835555555555556, "percentage": 42.79, "elapsed_time": "4:44:55", "remaining_time": "6:20:53"} | |
| {"current_steps": 3620, "total_steps": 8436, "loss": 0.2272, "learning_rate": 7.048289855679487e-06, "epoch": 1.287111111111111, "percentage": 42.91, "elapsed_time": "4:45:32", "remaining_time": "6:19:52"} | |
| {"current_steps": 3630, "total_steps": 8436, "loss": 0.2588, "learning_rate": 7.029398005410551e-06, "epoch": 1.2906666666666666, "percentage": 43.03, "elapsed_time": "4:46:06", "remaining_time": "6:18:47"} | |
| {"current_steps": 3640, "total_steps": 8436, "loss": 0.2403, "learning_rate": 7.01047140520986e-06, "epoch": 1.2942222222222222, "percentage": 43.15, "elapsed_time": "4:46:44", "remaining_time": "6:17:47"} | |
| {"current_steps": 3650, "total_steps": 8436, "loss": 0.2477, "learning_rate": 6.9915103791627146e-06, "epoch": 1.2977777777777777, "percentage": 43.27, "elapsed_time": "4:47:22", "remaining_time": "6:16:48"} | |
| {"current_steps": 3660, "total_steps": 8436, "loss": 0.2279, "learning_rate": 6.972515251943901e-06, "epoch": 1.3013333333333335, "percentage": 43.39, "elapsed_time": "4:47:58", "remaining_time": "6:15:47"} | |
| {"current_steps": 3670, "total_steps": 8436, "loss": 0.2414, "learning_rate": 6.953486348812127e-06, "epoch": 1.3048888888888888, "percentage": 43.5, "elapsed_time": "4:48:36", "remaining_time": "6:14:47"} | |
| {"current_steps": 3680, "total_steps": 8436, "loss": 0.248, "learning_rate": 6.934423995604455e-06, "epoch": 1.3084444444444445, "percentage": 43.62, "elapsed_time": "4:49:13", "remaining_time": "6:13:47"} | |
| {"current_steps": 3690, "total_steps": 8436, "loss": 0.2459, "learning_rate": 6.915328518730724e-06, "epoch": 1.312, "percentage": 43.74, "elapsed_time": "4:49:54", "remaining_time": "6:12:52"} | |
| {"current_steps": 3700, "total_steps": 8436, "loss": 0.2546, "learning_rate": 6.896200245167956e-06, "epoch": 1.3155555555555556, "percentage": 43.86, "elapsed_time": "4:50:33", "remaining_time": "6:11:54"} | |
| {"current_steps": 3710, "total_steps": 8436, "loss": 0.2006, "learning_rate": 6.877039502454758e-06, "epoch": 1.3191111111111111, "percentage": 43.98, "elapsed_time": "4:51:09", "remaining_time": "6:10:53"} | |
| {"current_steps": 3720, "total_steps": 8436, "loss": 0.2213, "learning_rate": 6.857846618685724e-06, "epoch": 1.3226666666666667, "percentage": 44.1, "elapsed_time": "4:51:45", "remaining_time": "6:09:52"} | |
| {"current_steps": 3730, "total_steps": 8436, "loss": 0.2315, "learning_rate": 6.8386219225057945e-06, "epoch": 1.3262222222222222, "percentage": 44.22, "elapsed_time": "4:52:21", "remaining_time": "6:08:51"} | |
| {"current_steps": 3740, "total_steps": 8436, "loss": 0.2235, "learning_rate": 6.819365743104655e-06, "epoch": 1.3297777777777777, "percentage": 44.33, "elapsed_time": "4:52:59", "remaining_time": "6:07:52"} | |
| {"current_steps": 3750, "total_steps": 8436, "loss": 0.2348, "learning_rate": 6.8000784102110795e-06, "epoch": 1.3333333333333333, "percentage": 44.45, "elapsed_time": "4:53:35", "remaining_time": "6:06:51"} | |
| {"current_steps": 3760, "total_steps": 8436, "loss": 0.2433, "learning_rate": 6.780760254087293e-06, "epoch": 1.3368888888888888, "percentage": 44.57, "elapsed_time": "4:54:14", "remaining_time": "6:05:54"} | |
| {"current_steps": 3770, "total_steps": 8436, "loss": 0.2511, "learning_rate": 6.7614116055233146e-06, "epoch": 1.3404444444444445, "percentage": 44.69, "elapsed_time": "4:54:50", "remaining_time": "6:04:55"} | |
| {"current_steps": 3780, "total_steps": 8436, "loss": 0.2218, "learning_rate": 6.742032795831298e-06, "epoch": 1.3439999999999999, "percentage": 44.81, "elapsed_time": "4:55:26", "remaining_time": "6:03:54"} | |
| {"current_steps": 3790, "total_steps": 8436, "loss": 0.2607, "learning_rate": 6.722624156839847e-06, "epoch": 1.3475555555555556, "percentage": 44.93, "elapsed_time": "4:56:04", "remaining_time": "6:02:56"} | |
| {"current_steps": 3800, "total_steps": 8436, "loss": 0.2434, "learning_rate": 6.703186020888347e-06, "epoch": 1.3511111111111112, "percentage": 45.05, "elapsed_time": "4:56:43", "remaining_time": "6:02:00"} | |
| {"current_steps": 3810, "total_steps": 8436, "loss": 0.2494, "learning_rate": 6.683718720821264e-06, "epoch": 1.3546666666666667, "percentage": 45.16, "elapsed_time": "4:57:20", "remaining_time": "6:01:00"} | |
| {"current_steps": 3820, "total_steps": 8436, "loss": 0.2215, "learning_rate": 6.664222589982451e-06, "epoch": 1.3582222222222222, "percentage": 45.28, "elapsed_time": "4:57:55", "remaining_time": "6:00:00"} | |
| {"current_steps": 3830, "total_steps": 8436, "loss": 0.2346, "learning_rate": 6.644697962209434e-06, "epoch": 1.3617777777777778, "percentage": 45.4, "elapsed_time": "4:58:31", "remaining_time": "5:59:00"} | |
| {"current_steps": 3840, "total_steps": 8436, "loss": 0.2122, "learning_rate": 6.6251451718277095e-06, "epoch": 1.3653333333333333, "percentage": 45.52, "elapsed_time": "4:59:06", "remaining_time": "5:57:59"} | |
| {"current_steps": 3850, "total_steps": 8436, "loss": 0.2289, "learning_rate": 6.605564553644998e-06, "epoch": 1.3688888888888888, "percentage": 45.64, "elapsed_time": "4:59:41", "remaining_time": "5:56:59"} | |
| {"current_steps": 3860, "total_steps": 8436, "loss": 0.2304, "learning_rate": 6.585956442945531e-06, "epoch": 1.3724444444444446, "percentage": 45.76, "elapsed_time": "5:00:17", "remaining_time": "5:55:59"} | |
| {"current_steps": 3870, "total_steps": 8436, "loss": 0.2524, "learning_rate": 6.566321175484298e-06, "epoch": 1.376, "percentage": 45.87, "elapsed_time": "5:00:52", "remaining_time": "5:54:59"} | |
| {"current_steps": 3880, "total_steps": 8436, "loss": 0.2344, "learning_rate": 6.546659087481304e-06, "epoch": 1.3795555555555556, "percentage": 45.99, "elapsed_time": "5:01:29", "remaining_time": "5:54:01"} | |
| {"current_steps": 3890, "total_steps": 8436, "loss": 0.2278, "learning_rate": 6.526970515615807e-06, "epoch": 1.3831111111111112, "percentage": 46.11, "elapsed_time": "5:02:05", "remaining_time": "5:53:01"} | |
| {"current_steps": 3900, "total_steps": 8436, "loss": 0.2299, "learning_rate": 6.507255797020555e-06, "epoch": 1.3866666666666667, "percentage": 46.23, "elapsed_time": "5:02:40", "remaining_time": "5:52:01"} | |
| {"current_steps": 3910, "total_steps": 8436, "loss": 0.2518, "learning_rate": 6.487515269276015e-06, "epoch": 1.3902222222222222, "percentage": 46.35, "elapsed_time": "5:03:15", "remaining_time": "5:51:02"} | |
| {"current_steps": 3920, "total_steps": 8436, "loss": 0.2196, "learning_rate": 6.467749270404593e-06, "epoch": 1.3937777777777778, "percentage": 46.47, "elapsed_time": "5:03:52", "remaining_time": "5:50:04"} | |
| {"current_steps": 3930, "total_steps": 8436, "loss": 0.2527, "learning_rate": 6.4479581388648404e-06, "epoch": 1.3973333333333333, "percentage": 46.59, "elapsed_time": "5:04:29", "remaining_time": "5:49:07"} | |
| {"current_steps": 3940, "total_steps": 8436, "loss": 0.2663, "learning_rate": 6.428142213545662e-06, "epoch": 1.4008888888888889, "percentage": 46.7, "elapsed_time": "5:05:09", "remaining_time": "5:48:12"} | |
| {"current_steps": 3950, "total_steps": 8436, "loss": 0.2141, "learning_rate": 6.408301833760517e-06, "epoch": 1.4044444444444444, "percentage": 46.82, "elapsed_time": "5:05:45", "remaining_time": "5:47:15"} | |
| {"current_steps": 3960, "total_steps": 8436, "loss": 0.2419, "learning_rate": 6.388437339241601e-06, "epoch": 1.408, "percentage": 46.94, "elapsed_time": "5:06:21", "remaining_time": "5:46:17"} | |
| {"current_steps": 3970, "total_steps": 8436, "loss": 0.2205, "learning_rate": 6.368549070134036e-06, "epoch": 1.4115555555555557, "percentage": 47.06, "elapsed_time": "5:06:56", "remaining_time": "5:45:17"} | |
| {"current_steps": 3980, "total_steps": 8436, "loss": 0.2403, "learning_rate": 6.348637366990038e-06, "epoch": 1.415111111111111, "percentage": 47.18, "elapsed_time": "5:07:33", "remaining_time": "5:44:20"} | |
| {"current_steps": 3990, "total_steps": 8436, "loss": 0.243, "learning_rate": 6.328702570763098e-06, "epoch": 1.4186666666666667, "percentage": 47.3, "elapsed_time": "5:08:09", "remaining_time": "5:43:22"} | |
| {"current_steps": 4000, "total_steps": 8436, "loss": 0.2376, "learning_rate": 6.308745022802128e-06, "epoch": 1.4222222222222223, "percentage": 47.42, "elapsed_time": "5:08:46", "remaining_time": "5:42:25"} | |
| {"current_steps": 4000, "total_steps": 8436, "eval_loss": 0.22332721948623657, "epoch": 1.4222222222222223, "percentage": 47.42, "elapsed_time": "5:18:08", "remaining_time": "5:52:49"} | |
| {"current_steps": 4010, "total_steps": 8436, "loss": 0.2119, "learning_rate": 6.288765064845629e-06, "epoch": 1.4257777777777778, "percentage": 47.53, "elapsed_time": "5:19:04", "remaining_time": "5:52:10"} | |
| {"current_steps": 4020, "total_steps": 8436, "loss": 0.2372, "learning_rate": 6.268763039015833e-06, "epoch": 1.4293333333333333, "percentage": 47.65, "elapsed_time": "5:19:39", "remaining_time": "5:51:09"} | |
| {"current_steps": 4030, "total_steps": 8436, "loss": 0.2378, "learning_rate": 6.248739287812846e-06, "epoch": 1.4328888888888889, "percentage": 47.77, "elapsed_time": "5:20:15", "remaining_time": "5:50:08"} | |
| {"current_steps": 4040, "total_steps": 8436, "loss": 0.236, "learning_rate": 6.228694154108783e-06, "epoch": 1.4364444444444444, "percentage": 47.89, "elapsed_time": "5:20:51", "remaining_time": "5:49:07"} | |
| {"current_steps": 4050, "total_steps": 8436, "loss": 0.2165, "learning_rate": 6.208627981141902e-06, "epoch": 1.44, "percentage": 48.01, "elapsed_time": "5:21:27", "remaining_time": "5:48:07"} | |
| {"current_steps": 4060, "total_steps": 8436, "loss": 0.2405, "learning_rate": 6.188541112510713e-06, "epoch": 1.4435555555555555, "percentage": 48.13, "elapsed_time": "5:22:04", "remaining_time": "5:47:08"} | |
| {"current_steps": 4070, "total_steps": 8436, "loss": 0.2288, "learning_rate": 6.168433892168113e-06, "epoch": 1.447111111111111, "percentage": 48.25, "elapsed_time": "5:22:41", "remaining_time": "5:46:09"} | |
| {"current_steps": 4080, "total_steps": 8436, "loss": 0.235, "learning_rate": 6.148306664415476e-06, "epoch": 1.4506666666666668, "percentage": 48.36, "elapsed_time": "5:23:17", "remaining_time": "5:45:10"} | |
| {"current_steps": 4090, "total_steps": 8436, "loss": 0.2143, "learning_rate": 6.128159773896783e-06, "epoch": 1.4542222222222223, "percentage": 48.48, "elapsed_time": "5:23:52", "remaining_time": "5:44:09"} | |
| {"current_steps": 4100, "total_steps": 8436, "loss": 0.239, "learning_rate": 6.107993565592693e-06, "epoch": 1.4577777777777778, "percentage": 48.6, "elapsed_time": "5:24:30", "remaining_time": "5:43:11"} | |
| {"current_steps": 4110, "total_steps": 8436, "loss": 0.2185, "learning_rate": 6.087808384814652e-06, "epoch": 1.4613333333333334, "percentage": 48.72, "elapsed_time": "5:25:06", "remaining_time": "5:42:11"} | |
| {"current_steps": 4120, "total_steps": 8436, "loss": 0.238, "learning_rate": 6.067604577198981e-06, "epoch": 1.464888888888889, "percentage": 48.84, "elapsed_time": "5:25:44", "remaining_time": "5:41:14"} | |
| {"current_steps": 4130, "total_steps": 8436, "loss": 0.2238, "learning_rate": 6.04738248870095e-06, "epoch": 1.4684444444444444, "percentage": 48.96, "elapsed_time": "5:26:22", "remaining_time": "5:40:16"} | |
| {"current_steps": 4140, "total_steps": 8436, "loss": 0.2453, "learning_rate": 6.027142465588855e-06, "epoch": 1.472, "percentage": 49.08, "elapsed_time": "5:26:59", "remaining_time": "5:39:18"} | |
| {"current_steps": 4150, "total_steps": 8436, "loss": 0.2375, "learning_rate": 6.006884854438099e-06, "epoch": 1.4755555555555555, "percentage": 49.19, "elapsed_time": "5:27:34", "remaining_time": "5:38:18"} | |
| {"current_steps": 4160, "total_steps": 8436, "loss": 0.2331, "learning_rate": 5.9866100021252415e-06, "epoch": 1.479111111111111, "percentage": 49.31, "elapsed_time": "5:28:10", "remaining_time": "5:37:20"} | |
| {"current_steps": 4170, "total_steps": 8436, "loss": 0.2131, "learning_rate": 5.966318255822072e-06, "epoch": 1.4826666666666668, "percentage": 49.43, "elapsed_time": "5:28:50", "remaining_time": "5:36:24"} | |
| {"current_steps": 4180, "total_steps": 8436, "loss": 0.243, "learning_rate": 5.946009962989659e-06, "epoch": 1.4862222222222221, "percentage": 49.55, "elapsed_time": "5:29:27", "remaining_time": "5:35:26"} | |
| {"current_steps": 4190, "total_steps": 8436, "loss": 0.2344, "learning_rate": 5.9256854713724e-06, "epoch": 1.4897777777777779, "percentage": 49.67, "elapsed_time": "5:30:05", "remaining_time": "5:34:30"} | |
| {"current_steps": 4200, "total_steps": 8436, "loss": 0.2372, "learning_rate": 5.905345128992072e-06, "epoch": 1.4933333333333334, "percentage": 49.79, "elapsed_time": "5:30:40", "remaining_time": "5:33:30"} | |
| {"current_steps": 4210, "total_steps": 8436, "loss": 0.2137, "learning_rate": 5.884989284141866e-06, "epoch": 1.496888888888889, "percentage": 49.91, "elapsed_time": "5:31:15", "remaining_time": "5:32:31"} | |
| {"current_steps": 4220, "total_steps": 8436, "loss": 0.2264, "learning_rate": 5.86461828538043e-06, "epoch": 1.5004444444444445, "percentage": 50.02, "elapsed_time": "5:31:53", "remaining_time": "5:31:34"} | |
| {"current_steps": 4230, "total_steps": 8436, "loss": 0.2167, "learning_rate": 5.84423248152589e-06, "epoch": 1.504, "percentage": 50.14, "elapsed_time": "5:32:28", "remaining_time": "5:30:35"} | |
| {"current_steps": 4240, "total_steps": 8436, "loss": 0.2223, "learning_rate": 5.82383222164989e-06, "epoch": 1.5075555555555555, "percentage": 50.26, "elapsed_time": "5:33:03", "remaining_time": "5:29:36"} | |
| {"current_steps": 4250, "total_steps": 8436, "loss": 0.2361, "learning_rate": 5.803417855071603e-06, "epoch": 1.511111111111111, "percentage": 50.38, "elapsed_time": "5:33:39", "remaining_time": "5:28:38"} | |
| {"current_steps": 4260, "total_steps": 8436, "loss": 0.2665, "learning_rate": 5.782989731351762e-06, "epoch": 1.5146666666666668, "percentage": 50.5, "elapsed_time": "5:34:17", "remaining_time": "5:27:41"} | |
| {"current_steps": 4270, "total_steps": 8436, "loss": 0.212, "learning_rate": 5.762548200286659e-06, "epoch": 1.5182222222222221, "percentage": 50.62, "elapsed_time": "5:34:52", "remaining_time": "5:26:43"} | |
| {"current_steps": 4280, "total_steps": 8436, "loss": 0.2142, "learning_rate": 5.742093611902168e-06, "epoch": 1.521777777777778, "percentage": 50.73, "elapsed_time": "5:35:30", "remaining_time": "5:25:47"} | |
| {"current_steps": 4290, "total_steps": 8436, "loss": 0.2302, "learning_rate": 5.721626316447748e-06, "epoch": 1.5253333333333332, "percentage": 50.85, "elapsed_time": "5:36:07", "remaining_time": "5:24:50"} | |
| {"current_steps": 4300, "total_steps": 8436, "loss": 0.2209, "learning_rate": 5.7011466643904434e-06, "epoch": 1.528888888888889, "percentage": 50.97, "elapsed_time": "5:36:46", "remaining_time": "5:23:55"} | |
| {"current_steps": 4310, "total_steps": 8436, "loss": 0.2398, "learning_rate": 5.680655006408882e-06, "epoch": 1.5324444444444445, "percentage": 51.09, "elapsed_time": "5:37:26", "remaining_time": "5:23:02"} | |
| {"current_steps": 4320, "total_steps": 8436, "loss": 0.2335, "learning_rate": 5.660151693387273e-06, "epoch": 1.536, "percentage": 51.21, "elapsed_time": "5:38:00", "remaining_time": "5:22:02"} | |
| {"current_steps": 4330, "total_steps": 8436, "loss": 0.2207, "learning_rate": 5.639637076409404e-06, "epoch": 1.5395555555555556, "percentage": 51.33, "elapsed_time": "5:38:38", "remaining_time": "5:21:07"} | |
| {"current_steps": 4340, "total_steps": 8436, "loss": 0.2411, "learning_rate": 5.6191115067526135e-06, "epoch": 1.543111111111111, "percentage": 51.45, "elapsed_time": "5:39:16", "remaining_time": "5:20:11"} | |
| {"current_steps": 4350, "total_steps": 8436, "loss": 0.2161, "learning_rate": 5.598575335881792e-06, "epoch": 1.5466666666666666, "percentage": 51.56, "elapsed_time": "5:39:51", "remaining_time": "5:19:14"} | |
| {"current_steps": 4360, "total_steps": 8436, "loss": 0.2104, "learning_rate": 5.578028915443356e-06, "epoch": 1.5502222222222222, "percentage": 51.68, "elapsed_time": "5:40:25", "remaining_time": "5:18:15"} | |
| {"current_steps": 4370, "total_steps": 8436, "loss": 0.2333, "learning_rate": 5.55747259725923e-06, "epoch": 1.553777777777778, "percentage": 51.8, "elapsed_time": "5:41:02", "remaining_time": "5:17:19"} | |
| {"current_steps": 4380, "total_steps": 8436, "loss": 0.2447, "learning_rate": 5.536906733320816e-06, "epoch": 1.5573333333333332, "percentage": 51.92, "elapsed_time": "5:41:41", "remaining_time": "5:16:24"} | |
| {"current_steps": 4390, "total_steps": 8436, "loss": 0.2445, "learning_rate": 5.516331675782973e-06, "epoch": 1.560888888888889, "percentage": 52.04, "elapsed_time": "5:42:18", "remaining_time": "5:15:29"} | |
| {"current_steps": 4400, "total_steps": 8436, "loss": 0.2382, "learning_rate": 5.495747776957987e-06, "epoch": 1.5644444444444443, "percentage": 52.16, "elapsed_time": "5:42:55", "remaining_time": "5:14:33"} | |
| {"current_steps": 4410, "total_steps": 8436, "loss": 0.2162, "learning_rate": 5.475155389309531e-06, "epoch": 1.568, "percentage": 52.28, "elapsed_time": "5:43:30", "remaining_time": "5:13:35"} | |
| {"current_steps": 4420, "total_steps": 8436, "loss": 0.2351, "learning_rate": 5.4545548654466366e-06, "epoch": 1.5715555555555556, "percentage": 52.39, "elapsed_time": "5:44:04", "remaining_time": "5:12:37"} | |
| {"current_steps": 4430, "total_steps": 8436, "loss": 0.2259, "learning_rate": 5.433946558117654e-06, "epoch": 1.5751111111111111, "percentage": 52.51, "elapsed_time": "5:44:40", "remaining_time": "5:11:40"} | |
| {"current_steps": 4440, "total_steps": 8436, "loss": 0.2269, "learning_rate": 5.413330820204214e-06, "epoch": 1.5786666666666667, "percentage": 52.63, "elapsed_time": "5:45:16", "remaining_time": "5:10:45"} | |
| {"current_steps": 4450, "total_steps": 8436, "loss": 0.233, "learning_rate": 5.392708004715178e-06, "epoch": 1.5822222222222222, "percentage": 52.75, "elapsed_time": "5:45:54", "remaining_time": "5:09:50"} | |
| {"current_steps": 4460, "total_steps": 8436, "loss": 0.2428, "learning_rate": 5.372078464780603e-06, "epoch": 1.5857777777777777, "percentage": 52.87, "elapsed_time": "5:46:31", "remaining_time": "5:08:54"} | |
| {"current_steps": 4470, "total_steps": 8436, "loss": 0.2095, "learning_rate": 5.351442553645691e-06, "epoch": 1.5893333333333333, "percentage": 52.99, "elapsed_time": "5:47:06", "remaining_time": "5:07:58"} | |
| {"current_steps": 4480, "total_steps": 8436, "loss": 0.2375, "learning_rate": 5.330800624664736e-06, "epoch": 1.592888888888889, "percentage": 53.11, "elapsed_time": "5:47:42", "remaining_time": "5:07:01"} | |
| {"current_steps": 4490, "total_steps": 8436, "loss": 0.2365, "learning_rate": 5.310153031295079e-06, "epoch": 1.5964444444444443, "percentage": 53.22, "elapsed_time": "5:48:17", "remaining_time": "5:06:05"} | |
| {"current_steps": 4500, "total_steps": 8436, "loss": 0.2521, "learning_rate": 5.289500127091056e-06, "epoch": 1.6, "percentage": 53.34, "elapsed_time": "5:48:55", "remaining_time": "5:05:11"} | |
| {"current_steps": 4500, "total_steps": 8436, "eval_loss": 0.22019484639167786, "epoch": 1.6, "percentage": 53.34, "elapsed_time": "5:58:17", "remaining_time": "5:13:23"} | |
| {"current_steps": 4510, "total_steps": 8436, "loss": 0.2445, "learning_rate": 5.26884226569794e-06, "epoch": 1.6035555555555554, "percentage": 53.46, "elapsed_time": "5:58:55", "remaining_time": "5:12:27"} | |
| {"current_steps": 4520, "total_steps": 8436, "loss": 0.2586, "learning_rate": 5.248179800845884e-06, "epoch": 1.6071111111111112, "percentage": 53.58, "elapsed_time": "5:59:34", "remaining_time": "5:11:31"} | |
| {"current_steps": 4530, "total_steps": 8436, "loss": 0.2342, "learning_rate": 5.227513086343875e-06, "epoch": 1.6106666666666667, "percentage": 53.7, "elapsed_time": "6:00:09", "remaining_time": "5:10:32"} | |
| {"current_steps": 4540, "total_steps": 8436, "loss": 0.2149, "learning_rate": 5.20684247607366e-06, "epoch": 1.6142222222222222, "percentage": 53.82, "elapsed_time": "6:00:45", "remaining_time": "5:09:35"} | |
| {"current_steps": 4550, "total_steps": 8436, "loss": 0.2361, "learning_rate": 5.186168323983702e-06, "epoch": 1.6177777777777778, "percentage": 53.94, "elapsed_time": "6:01:21", "remaining_time": "5:08:37"} | |
| {"current_steps": 4560, "total_steps": 8436, "loss": 0.2422, "learning_rate": 5.1654909840831e-06, "epoch": 1.6213333333333333, "percentage": 54.05, "elapsed_time": "6:01:57", "remaining_time": "5:07:39"} | |
| {"current_steps": 4570, "total_steps": 8436, "loss": 0.2702, "learning_rate": 5.144810810435553e-06, "epoch": 1.624888888888889, "percentage": 54.17, "elapsed_time": "6:02:32", "remaining_time": "5:06:41"} | |
| {"current_steps": 4580, "total_steps": 8436, "loss": 0.211, "learning_rate": 5.124128157153273e-06, "epoch": 1.6284444444444444, "percentage": 54.29, "elapsed_time": "6:03:08", "remaining_time": "5:05:44"} | |
| {"current_steps": 4590, "total_steps": 8436, "loss": 0.213, "learning_rate": 5.103443378390935e-06, "epoch": 1.6320000000000001, "percentage": 54.41, "elapsed_time": "6:03:42", "remaining_time": "5:04:45"} | |
| {"current_steps": 4600, "total_steps": 8436, "loss": 0.2348, "learning_rate": 5.08275682833961e-06, "epoch": 1.6355555555555554, "percentage": 54.53, "elapsed_time": "6:04:16", "remaining_time": "5:03:46"} | |
| {"current_steps": 4610, "total_steps": 8436, "loss": 0.2323, "learning_rate": 5.062068861220697e-06, "epoch": 1.6391111111111112, "percentage": 54.65, "elapsed_time": "6:04:53", "remaining_time": "5:02:50"} | |
| {"current_steps": 4620, "total_steps": 8436, "loss": 0.2274, "learning_rate": 5.041379831279859e-06, "epoch": 1.6426666666666667, "percentage": 54.77, "elapsed_time": "6:05:29", "remaining_time": "5:01:53"} | |
| {"current_steps": 4630, "total_steps": 8436, "loss": 0.2382, "learning_rate": 5.020690092780961e-06, "epoch": 1.6462222222222223, "percentage": 54.88, "elapsed_time": "6:06:09", "remaining_time": "5:00:59"} | |
| {"current_steps": 4640, "total_steps": 8436, "loss": 0.2263, "learning_rate": 5e-06, "epoch": 1.6497777777777778, "percentage": 55.0, "elapsed_time": "6:06:44", "remaining_time": "5:00:02"} | |
| {"current_steps": 4650, "total_steps": 8436, "loss": 0.2225, "learning_rate": 4.9793099072190406e-06, "epoch": 1.6533333333333333, "percentage": 55.12, "elapsed_time": "6:07:20", "remaining_time": "4:59:05"} | |
| {"current_steps": 4660, "total_steps": 8436, "loss": 0.2225, "learning_rate": 4.958620168720144e-06, "epoch": 1.6568888888888889, "percentage": 55.24, "elapsed_time": "6:07:56", "remaining_time": "4:58:08"} | |
| {"current_steps": 4670, "total_steps": 8436, "loss": 0.2438, "learning_rate": 4.937931138779305e-06, "epoch": 1.6604444444444444, "percentage": 55.36, "elapsed_time": "6:08:31", "remaining_time": "4:57:11"} | |
| {"current_steps": 4680, "total_steps": 8436, "loss": 0.2127, "learning_rate": 4.917243171660391e-06, "epoch": 1.6640000000000001, "percentage": 55.48, "elapsed_time": "6:09:09", "remaining_time": "4:56:16"} | |
| {"current_steps": 4690, "total_steps": 8436, "loss": 0.223, "learning_rate": 4.896556621609066e-06, "epoch": 1.6675555555555555, "percentage": 55.6, "elapsed_time": "6:09:45", "remaining_time": "4:55:20"} | |
| {"current_steps": 4700, "total_steps": 8436, "loss": 0.2332, "learning_rate": 4.8758718428467275e-06, "epoch": 1.6711111111111112, "percentage": 55.71, "elapsed_time": "6:10:24", "remaining_time": "4:54:25"} | |
| {"current_steps": 4710, "total_steps": 8436, "loss": 0.2381, "learning_rate": 4.8551891895644485e-06, "epoch": 1.6746666666666665, "percentage": 55.83, "elapsed_time": "6:11:02", "remaining_time": "4:53:31"} | |
| {"current_steps": 4720, "total_steps": 8436, "loss": 0.2182, "learning_rate": 4.8345090159169015e-06, "epoch": 1.6782222222222223, "percentage": 55.95, "elapsed_time": "6:11:37", "remaining_time": "4:52:34"} | |
| {"current_steps": 4730, "total_steps": 8436, "loss": 0.2323, "learning_rate": 4.813831676016301e-06, "epoch": 1.6817777777777778, "percentage": 56.07, "elapsed_time": "6:12:12", "remaining_time": "4:51:37"} | |
| {"current_steps": 4740, "total_steps": 8436, "loss": 0.2236, "learning_rate": 4.793157523926343e-06, "epoch": 1.6853333333333333, "percentage": 56.19, "elapsed_time": "6:12:48", "remaining_time": "4:50:42"} | |
| {"current_steps": 4750, "total_steps": 8436, "loss": 0.216, "learning_rate": 4.772486913656126e-06, "epoch": 1.6888888888888889, "percentage": 56.31, "elapsed_time": "6:13:24", "remaining_time": "4:49:45"} | |
| {"current_steps": 4760, "total_steps": 8436, "loss": 0.2104, "learning_rate": 4.751820199154116e-06, "epoch": 1.6924444444444444, "percentage": 56.42, "elapsed_time": "6:14:00", "remaining_time": "4:48:50"} | |
| {"current_steps": 4770, "total_steps": 8436, "loss": 0.2255, "learning_rate": 4.731157734302063e-06, "epoch": 1.696, "percentage": 56.54, "elapsed_time": "6:14:41", "remaining_time": "4:47:58"} | |
| {"current_steps": 4780, "total_steps": 8436, "loss": 0.2216, "learning_rate": 4.7104998729089456e-06, "epoch": 1.6995555555555555, "percentage": 56.66, "elapsed_time": "6:15:18", "remaining_time": "4:47:03"} | |
| {"current_steps": 4790, "total_steps": 8436, "loss": 0.2316, "learning_rate": 4.689846968704921e-06, "epoch": 1.7031111111111112, "percentage": 56.78, "elapsed_time": "6:15:57", "remaining_time": "4:46:10"} | |
| {"current_steps": 4800, "total_steps": 8436, "loss": 0.2211, "learning_rate": 4.669199375335267e-06, "epoch": 1.7066666666666666, "percentage": 56.9, "elapsed_time": "6:16:35", "remaining_time": "4:45:15"} | |
| {"current_steps": 4810, "total_steps": 8436, "loss": 0.2279, "learning_rate": 4.64855744635431e-06, "epoch": 1.7102222222222223, "percentage": 57.02, "elapsed_time": "6:17:11", "remaining_time": "4:44:20"} | |
| {"current_steps": 4820, "total_steps": 8436, "loss": 0.2076, "learning_rate": 4.627921535219398e-06, "epoch": 1.7137777777777776, "percentage": 57.14, "elapsed_time": "6:17:46", "remaining_time": "4:43:24"} | |
| {"current_steps": 4830, "total_steps": 8436, "loss": 0.2272, "learning_rate": 4.607291995284824e-06, "epoch": 1.7173333333333334, "percentage": 57.25, "elapsed_time": "6:18:23", "remaining_time": "4:42:29"} | |
| {"current_steps": 4840, "total_steps": 8436, "loss": 0.2269, "learning_rate": 4.586669179795789e-06, "epoch": 1.720888888888889, "percentage": 57.37, "elapsed_time": "6:19:00", "remaining_time": "4:41:35"} | |
| {"current_steps": 4850, "total_steps": 8436, "loss": 0.2187, "learning_rate": 4.566053441882346e-06, "epoch": 1.7244444444444444, "percentage": 57.49, "elapsed_time": "6:19:37", "remaining_time": "4:40:41"} | |
| {"current_steps": 4860, "total_steps": 8436, "loss": 0.2179, "learning_rate": 4.545445134553365e-06, "epoch": 1.728, "percentage": 57.61, "elapsed_time": "6:20:14", "remaining_time": "4:39:47"} | |
| {"current_steps": 4870, "total_steps": 8436, "loss": 0.2262, "learning_rate": 4.52484461069047e-06, "epoch": 1.7315555555555555, "percentage": 57.73, "elapsed_time": "6:20:49", "remaining_time": "4:38:51"} | |
| {"current_steps": 4880, "total_steps": 8436, "loss": 0.2363, "learning_rate": 4.504252223042015e-06, "epoch": 1.7351111111111113, "percentage": 57.85, "elapsed_time": "6:21:27", "remaining_time": "4:37:57"} | |
| {"current_steps": 4890, "total_steps": 8436, "loss": 0.2297, "learning_rate": 4.4836683242170274e-06, "epoch": 1.7386666666666666, "percentage": 57.97, "elapsed_time": "6:22:05", "remaining_time": "4:37:04"} | |
| {"current_steps": 4900, "total_steps": 8436, "loss": 0.2223, "learning_rate": 4.463093266679185e-06, "epoch": 1.7422222222222223, "percentage": 58.08, "elapsed_time": "6:22:39", "remaining_time": "4:36:08"} | |
| {"current_steps": 4910, "total_steps": 8436, "loss": 0.2177, "learning_rate": 4.442527402740773e-06, "epoch": 1.7457777777777777, "percentage": 58.2, "elapsed_time": "6:23:19", "remaining_time": "4:35:16"} | |
| {"current_steps": 4920, "total_steps": 8436, "loss": 0.2266, "learning_rate": 4.4219710845566445e-06, "epoch": 1.7493333333333334, "percentage": 58.32, "elapsed_time": "6:23:58", "remaining_time": "4:34:23"} | |
| {"current_steps": 4930, "total_steps": 8436, "loss": 0.2385, "learning_rate": 4.401424664118209e-06, "epoch": 1.752888888888889, "percentage": 58.44, "elapsed_time": "6:24:32", "remaining_time": "4:33:28"} | |
| {"current_steps": 4940, "total_steps": 8436, "loss": 0.2209, "learning_rate": 4.380888493247389e-06, "epoch": 1.7564444444444445, "percentage": 58.56, "elapsed_time": "6:25:09", "remaining_time": "4:32:34"} | |
| {"current_steps": 4950, "total_steps": 8436, "loss": 0.2273, "learning_rate": 4.360362923590599e-06, "epoch": 1.76, "percentage": 58.68, "elapsed_time": "6:25:44", "remaining_time": "4:31:39"} | |
| {"current_steps": 4960, "total_steps": 8436, "loss": 0.2263, "learning_rate": 4.339848306612726e-06, "epoch": 1.7635555555555555, "percentage": 58.8, "elapsed_time": "6:26:18", "remaining_time": "4:30:43"} | |
| {"current_steps": 4970, "total_steps": 8436, "loss": 0.2317, "learning_rate": 4.319344993591122e-06, "epoch": 1.767111111111111, "percentage": 58.91, "elapsed_time": "6:26:57", "remaining_time": "4:29:51"} | |
| {"current_steps": 4980, "total_steps": 8436, "loss": 0.2352, "learning_rate": 4.298853335609558e-06, "epoch": 1.7706666666666666, "percentage": 59.03, "elapsed_time": "6:27:32", "remaining_time": "4:28:56"} | |
| {"current_steps": 4990, "total_steps": 8436, "loss": 0.2451, "learning_rate": 4.278373683552252e-06, "epoch": 1.7742222222222224, "percentage": 59.15, "elapsed_time": "6:28:06", "remaining_time": "4:28:01"} | |
| {"current_steps": 5000, "total_steps": 8436, "loss": 0.2119, "learning_rate": 4.257906388097833e-06, "epoch": 1.7777777777777777, "percentage": 59.27, "elapsed_time": "6:28:44", "remaining_time": "4:27:08"} | |
| {"current_steps": 5000, "total_steps": 8436, "eval_loss": 0.2164340764284134, "epoch": 1.7777777777777777, "percentage": 59.27, "elapsed_time": "6:38:04", "remaining_time": "4:33:33"} | |
| {"current_steps": 5010, "total_steps": 8436, "loss": 0.2311, "learning_rate": 4.237451799713343e-06, "epoch": 1.7813333333333334, "percentage": 59.39, "elapsed_time": "6:38:41", "remaining_time": "4:32:38"} | |
| {"current_steps": 5020, "total_steps": 8436, "loss": 0.2308, "learning_rate": 4.2170102686482386e-06, "epoch": 1.7848888888888887, "percentage": 59.51, "elapsed_time": "6:39:16", "remaining_time": "4:31:41"} | |
| {"current_steps": 5030, "total_steps": 8436, "loss": 0.2343, "learning_rate": 4.196582144928398e-06, "epoch": 1.7884444444444445, "percentage": 59.63, "elapsed_time": "6:39:52", "remaining_time": "4:30:46"} | |
| {"current_steps": 5040, "total_steps": 8436, "loss": 0.2471, "learning_rate": 4.176167778350111e-06, "epoch": 1.792, "percentage": 59.74, "elapsed_time": "6:40:31", "remaining_time": "4:29:52"} | |
| {"current_steps": 5050, "total_steps": 8436, "loss": 0.2334, "learning_rate": 4.155767518474112e-06, "epoch": 1.7955555555555556, "percentage": 59.86, "elapsed_time": "6:41:06", "remaining_time": "4:28:56"} | |
| {"current_steps": 5060, "total_steps": 8436, "loss": 0.2352, "learning_rate": 4.135381714619572e-06, "epoch": 1.799111111111111, "percentage": 59.98, "elapsed_time": "6:41:44", "remaining_time": "4:28:02"} | |
| {"current_steps": 5070, "total_steps": 8436, "loss": 0.2295, "learning_rate": 4.115010715858135e-06, "epoch": 1.8026666666666666, "percentage": 60.1, "elapsed_time": "6:42:22", "remaining_time": "4:27:08"} | |
| {"current_steps": 5080, "total_steps": 8436, "loss": 0.2227, "learning_rate": 4.09465487100793e-06, "epoch": 1.8062222222222222, "percentage": 60.22, "elapsed_time": "6:42:57", "remaining_time": "4:26:12"} | |
| {"current_steps": 5090, "total_steps": 8436, "loss": 0.2355, "learning_rate": 4.074314528627602e-06, "epoch": 1.8097777777777777, "percentage": 60.34, "elapsed_time": "6:43:33", "remaining_time": "4:25:16"} | |
| {"current_steps": 5100, "total_steps": 8436, "loss": 0.2323, "learning_rate": 4.053990037010342e-06, "epoch": 1.8133333333333335, "percentage": 60.46, "elapsed_time": "6:44:11", "remaining_time": "4:24:23"} | |
| {"current_steps": 5110, "total_steps": 8436, "loss": 0.2069, "learning_rate": 4.033681744177929e-06, "epoch": 1.8168888888888888, "percentage": 60.57, "elapsed_time": "6:44:45", "remaining_time": "4:23:26"} | |
| {"current_steps": 5120, "total_steps": 8436, "loss": 0.2076, "learning_rate": 4.013389997874759e-06, "epoch": 1.8204444444444445, "percentage": 60.69, "elapsed_time": "6:45:20", "remaining_time": "4:22:31"} | |
| {"current_steps": 5130, "total_steps": 8436, "loss": 0.2425, "learning_rate": 3.993115145561902e-06, "epoch": 1.8239999999999998, "percentage": 60.81, "elapsed_time": "6:45:56", "remaining_time": "4:21:36"} | |
| {"current_steps": 5140, "total_steps": 8436, "loss": 0.234, "learning_rate": 3.9728575344111456e-06, "epoch": 1.8275555555555556, "percentage": 60.93, "elapsed_time": "6:46:32", "remaining_time": "4:20:41"} | |
| {"current_steps": 5150, "total_steps": 8436, "loss": 0.1987, "learning_rate": 3.9526175112990515e-06, "epoch": 1.8311111111111111, "percentage": 61.05, "elapsed_time": "6:47:08", "remaining_time": "4:19:46"} | |
| {"current_steps": 5160, "total_steps": 8436, "loss": 0.2137, "learning_rate": 3.93239542280102e-06, "epoch": 1.8346666666666667, "percentage": 61.17, "elapsed_time": "6:47:44", "remaining_time": "4:18:51"} | |
| {"current_steps": 5170, "total_steps": 8436, "loss": 0.2235, "learning_rate": 3.912191615185349e-06, "epoch": 1.8382222222222222, "percentage": 61.28, "elapsed_time": "6:48:17", "remaining_time": "4:17:55"} | |
| {"current_steps": 5180, "total_steps": 8436, "loss": 0.2218, "learning_rate": 3.892006434407309e-06, "epoch": 1.8417777777777777, "percentage": 61.4, "elapsed_time": "6:48:52", "remaining_time": "4:17:00"} | |
| {"current_steps": 5190, "total_steps": 8436, "loss": 0.2287, "learning_rate": 3.871840226103219e-06, "epoch": 1.8453333333333335, "percentage": 61.52, "elapsed_time": "6:49:26", "remaining_time": "4:16:04"} | |
| {"current_steps": 5200, "total_steps": 8436, "loss": 0.2228, "learning_rate": 3.851693335584525e-06, "epoch": 1.8488888888888888, "percentage": 61.64, "elapsed_time": "6:50:00", "remaining_time": "4:15:09"} | |
| {"current_steps": 5210, "total_steps": 8436, "loss": 0.2331, "learning_rate": 3.831566107831889e-06, "epoch": 1.8524444444444446, "percentage": 61.76, "elapsed_time": "6:50:37", "remaining_time": "4:14:15"} | |
| {"current_steps": 5220, "total_steps": 8436, "loss": 0.2137, "learning_rate": 3.8114588874892893e-06, "epoch": 1.8559999999999999, "percentage": 61.88, "elapsed_time": "6:51:11", "remaining_time": "4:13:19"} | |
| {"current_steps": 5230, "total_steps": 8436, "loss": 0.2135, "learning_rate": 3.791372018858099e-06, "epoch": 1.8595555555555556, "percentage": 62.0, "elapsed_time": "6:51:48", "remaining_time": "4:12:26"} | |
| {"current_steps": 5240, "total_steps": 8436, "loss": 0.2217, "learning_rate": 3.7713058458912164e-06, "epoch": 1.8631111111111112, "percentage": 62.11, "elapsed_time": "6:52:24", "remaining_time": "4:11:32"} | |
| {"current_steps": 5250, "total_steps": 8436, "loss": 0.2539, "learning_rate": 3.751260712187156e-06, "epoch": 1.8666666666666667, "percentage": 62.23, "elapsed_time": "6:53:01", "remaining_time": "4:10:39"} | |
| {"current_steps": 5260, "total_steps": 8436, "loss": 0.2179, "learning_rate": 3.731236960984169e-06, "epoch": 1.8702222222222222, "percentage": 62.35, "elapsed_time": "6:53:39", "remaining_time": "4:09:46"} | |
| {"current_steps": 5270, "total_steps": 8436, "loss": 0.2183, "learning_rate": 3.711234935154372e-06, "epoch": 1.8737777777777778, "percentage": 62.47, "elapsed_time": "6:54:14", "remaining_time": "4:08:51"} | |
| {"current_steps": 5280, "total_steps": 8436, "loss": 0.2354, "learning_rate": 3.6912549771978747e-06, "epoch": 1.8773333333333333, "percentage": 62.59, "elapsed_time": "6:54:51", "remaining_time": "4:07:58"} | |
| {"current_steps": 5290, "total_steps": 8436, "loss": 0.2268, "learning_rate": 3.6712974292369035e-06, "epoch": 1.8808888888888888, "percentage": 62.71, "elapsed_time": "6:55:27", "remaining_time": "4:07:04"} | |
| {"current_steps": 5300, "total_steps": 8436, "loss": 0.204, "learning_rate": 3.651362633009962e-06, "epoch": 1.8844444444444446, "percentage": 62.83, "elapsed_time": "6:56:03", "remaining_time": "4:06:10"} | |
| {"current_steps": 5310, "total_steps": 8436, "loss": 0.208, "learning_rate": 3.6314509298659663e-06, "epoch": 1.888, "percentage": 62.94, "elapsed_time": "6:56:37", "remaining_time": "4:05:16"} | |
| {"current_steps": 5320, "total_steps": 8436, "loss": 0.2372, "learning_rate": 3.6115626607584e-06, "epoch": 1.8915555555555557, "percentage": 63.06, "elapsed_time": "6:57:14", "remaining_time": "4:04:22"} | |
| {"current_steps": 5330, "total_steps": 8436, "loss": 0.2257, "learning_rate": 3.5916981662394856e-06, "epoch": 1.895111111111111, "percentage": 63.18, "elapsed_time": "6:57:50", "remaining_time": "4:03:29"} | |
| {"current_steps": 5340, "total_steps": 8436, "loss": 0.2103, "learning_rate": 3.5718577864543396e-06, "epoch": 1.8986666666666667, "percentage": 63.3, "elapsed_time": "6:58:27", "remaining_time": "4:02:36"} | |
| {"current_steps": 5350, "total_steps": 8436, "loss": 0.211, "learning_rate": 3.552041861135161e-06, "epoch": 1.9022222222222223, "percentage": 63.42, "elapsed_time": "6:59:03", "remaining_time": "4:01:43"} | |
| {"current_steps": 5360, "total_steps": 8436, "loss": 0.2164, "learning_rate": 3.532250729595408e-06, "epoch": 1.9057777777777778, "percentage": 63.54, "elapsed_time": "6:59:41", "remaining_time": "4:00:51"} | |
| {"current_steps": 5370, "total_steps": 8436, "loss": 0.2265, "learning_rate": 3.5124847307239863e-06, "epoch": 1.9093333333333333, "percentage": 63.66, "elapsed_time": "7:00:18", "remaining_time": "3:59:58"} | |
| {"current_steps": 5380, "total_steps": 8436, "loss": 0.2316, "learning_rate": 3.4927442029794467e-06, "epoch": 1.9128888888888889, "percentage": 63.77, "elapsed_time": "7:00:57", "remaining_time": "3:59:06"} | |
| {"current_steps": 5390, "total_steps": 8436, "loss": 0.219, "learning_rate": 3.473029484384196e-06, "epoch": 1.9164444444444444, "percentage": 63.89, "elapsed_time": "7:01:34", "remaining_time": "3:58:14"} | |
| {"current_steps": 5400, "total_steps": 8436, "loss": 0.2252, "learning_rate": 3.4533409125186974e-06, "epoch": 1.92, "percentage": 64.01, "elapsed_time": "7:02:11", "remaining_time": "3:57:21"} | |
| {"current_steps": 5410, "total_steps": 8436, "loss": 0.2222, "learning_rate": 3.4336788245157026e-06, "epoch": 1.9235555555555557, "percentage": 64.13, "elapsed_time": "7:02:48", "remaining_time": "3:56:29"} | |
| {"current_steps": 5420, "total_steps": 8436, "loss": 0.2345, "learning_rate": 3.4140435570544708e-06, "epoch": 1.927111111111111, "percentage": 64.25, "elapsed_time": "7:03:25", "remaining_time": "3:55:36"} | |
| {"current_steps": 5430, "total_steps": 8436, "loss": 0.214, "learning_rate": 3.3944354463550035e-06, "epoch": 1.9306666666666668, "percentage": 64.37, "elapsed_time": "7:04:02", "remaining_time": "3:54:44"} | |
| {"current_steps": 5440, "total_steps": 8436, "loss": 0.234, "learning_rate": 3.374854828172292e-06, "epoch": 1.934222222222222, "percentage": 64.49, "elapsed_time": "7:04:43", "remaining_time": "3:53:54"} | |
| {"current_steps": 5450, "total_steps": 8436, "loss": 0.2242, "learning_rate": 3.3553020377905663e-06, "epoch": 1.9377777777777778, "percentage": 64.6, "elapsed_time": "7:05:20", "remaining_time": "3:53:02"} | |
| {"current_steps": 5460, "total_steps": 8436, "loss": 0.2245, "learning_rate": 3.3357774100175513e-06, "epoch": 1.9413333333333334, "percentage": 64.72, "elapsed_time": "7:05:59", "remaining_time": "3:52:11"} | |
| {"current_steps": 5470, "total_steps": 8436, "loss": 0.2114, "learning_rate": 3.316281279178737e-06, "epoch": 1.944888888888889, "percentage": 64.84, "elapsed_time": "7:06:33", "remaining_time": "3:51:17"} | |
| {"current_steps": 5480, "total_steps": 8436, "loss": 0.2182, "learning_rate": 3.296813979111655e-06, "epoch": 1.9484444444444444, "percentage": 64.96, "elapsed_time": "7:07:10", "remaining_time": "3:50:25"} | |
| {"current_steps": 5490, "total_steps": 8436, "loss": 0.2234, "learning_rate": 3.2773758431601543e-06, "epoch": 1.952, "percentage": 65.08, "elapsed_time": "7:07:49", "remaining_time": "3:49:34"} | |
| {"current_steps": 5500, "total_steps": 8436, "loss": 0.238, "learning_rate": 3.257967204168705e-06, "epoch": 1.9555555555555557, "percentage": 65.2, "elapsed_time": "7:08:24", "remaining_time": "3:48:41"} | |
| {"current_steps": 5500, "total_steps": 8436, "eval_loss": 0.21176277101039886, "epoch": 1.9555555555555557, "percentage": 65.2, "elapsed_time": "7:17:45", "remaining_time": "3:53:41"} | |
| {"current_steps": 5510, "total_steps": 8436, "loss": 0.1932, "learning_rate": 3.2385883944766867e-06, "epoch": 1.959111111111111, "percentage": 65.32, "elapsed_time": "7:18:19", "remaining_time": "3:52:45"} | |
| {"current_steps": 5520, "total_steps": 8436, "loss": 0.2194, "learning_rate": 3.2192397459127077e-06, "epoch": 1.9626666666666668, "percentage": 65.43, "elapsed_time": "7:18:54", "remaining_time": "3:51:51"} | |
| {"current_steps": 5530, "total_steps": 8436, "loss": 0.2092, "learning_rate": 3.199921589788923e-06, "epoch": 1.966222222222222, "percentage": 65.55, "elapsed_time": "7:19:30", "remaining_time": "3:50:57"} | |
| {"current_steps": 5540, "total_steps": 8436, "loss": 0.2328, "learning_rate": 3.180634256895345e-06, "epoch": 1.9697777777777778, "percentage": 65.67, "elapsed_time": "7:20:05", "remaining_time": "3:50:03"} | |
| {"current_steps": 5550, "total_steps": 8436, "loss": 0.234, "learning_rate": 3.161378077494205e-06, "epoch": 1.9733333333333334, "percentage": 65.79, "elapsed_time": "7:20:42", "remaining_time": "3:49:09"} | |
| {"current_steps": 5560, "total_steps": 8436, "loss": 0.2285, "learning_rate": 3.142153381314278e-06, "epoch": 1.976888888888889, "percentage": 65.91, "elapsed_time": "7:21:20", "remaining_time": "3:48:17"} | |
| {"current_steps": 5570, "total_steps": 8436, "loss": 0.2347, "learning_rate": 3.122960497545242e-06, "epoch": 1.9804444444444445, "percentage": 66.03, "elapsed_time": "7:21:56", "remaining_time": "3:47:24"} | |
| {"current_steps": 5580, "total_steps": 8436, "loss": 0.2017, "learning_rate": 3.103799754832045e-06, "epoch": 1.984, "percentage": 66.15, "elapsed_time": "7:22:32", "remaining_time": "3:46:30"} | |
| {"current_steps": 5590, "total_steps": 8436, "loss": 0.2282, "learning_rate": 3.0846714812692774e-06, "epoch": 1.9875555555555555, "percentage": 66.26, "elapsed_time": "7:23:09", "remaining_time": "3:45:37"} | |
| {"current_steps": 5600, "total_steps": 8436, "loss": 0.2193, "learning_rate": 3.065576004395546e-06, "epoch": 1.991111111111111, "percentage": 66.38, "elapsed_time": "7:23:45", "remaining_time": "3:44:44"} | |
| {"current_steps": 5610, "total_steps": 8436, "loss": 0.205, "learning_rate": 3.046513651187874e-06, "epoch": 1.9946666666666668, "percentage": 66.5, "elapsed_time": "7:24:24", "remaining_time": "3:43:52"} | |
| {"current_steps": 5620, "total_steps": 8436, "loss": 0.2052, "learning_rate": 3.027484748056101e-06, "epoch": 1.9982222222222221, "percentage": 66.62, "elapsed_time": "7:24:59", "remaining_time": "3:42:58"} | |
| {"current_steps": 5630, "total_steps": 8436, "loss": 0.1793, "learning_rate": 3.008489620837287e-06, "epoch": 2.001777777777778, "percentage": 66.74, "elapsed_time": "7:25:37", "remaining_time": "3:42:05"} | |
| {"current_steps": 5640, "total_steps": 8436, "loss": 0.133, "learning_rate": 2.989528594790142e-06, "epoch": 2.005333333333333, "percentage": 66.86, "elapsed_time": "7:26:14", "remaining_time": "3:41:13"} | |
| {"current_steps": 5650, "total_steps": 8436, "loss": 0.1364, "learning_rate": 2.97060199458945e-06, "epoch": 2.008888888888889, "percentage": 66.97, "elapsed_time": "7:26:49", "remaining_time": "3:40:19"} | |
| {"current_steps": 5660, "total_steps": 8436, "loss": 0.138, "learning_rate": 2.9517101443205143e-06, "epoch": 2.0124444444444443, "percentage": 67.09, "elapsed_time": "7:27:25", "remaining_time": "3:39:26"} | |
| {"current_steps": 5670, "total_steps": 8436, "loss": 0.1372, "learning_rate": 2.9328533674736043e-06, "epoch": 2.016, "percentage": 67.21, "elapsed_time": "7:28:02", "remaining_time": "3:38:33"} | |
| {"current_steps": 5680, "total_steps": 8436, "loss": 0.1376, "learning_rate": 2.914031986938417e-06, "epoch": 2.0195555555555558, "percentage": 67.33, "elapsed_time": "7:28:38", "remaining_time": "3:37:41"} | |
| {"current_steps": 5690, "total_steps": 8436, "loss": 0.132, "learning_rate": 2.895246324998549e-06, "epoch": 2.023111111111111, "percentage": 67.45, "elapsed_time": "7:29:15", "remaining_time": "3:36:48"} | |
| {"current_steps": 5700, "total_steps": 8436, "loss": 0.1332, "learning_rate": 2.8764967033259793e-06, "epoch": 2.026666666666667, "percentage": 67.57, "elapsed_time": "7:29:54", "remaining_time": "3:35:57"} | |
| {"current_steps": 5710, "total_steps": 8436, "loss": 0.137, "learning_rate": 2.8577834429755586e-06, "epoch": 2.030222222222222, "percentage": 67.69, "elapsed_time": "7:30:31", "remaining_time": "3:35:04"} | |
| {"current_steps": 5720, "total_steps": 8436, "loss": 0.1311, "learning_rate": 2.839106864379512e-06, "epoch": 2.033777777777778, "percentage": 67.8, "elapsed_time": "7:31:05", "remaining_time": "3:34:11"} | |
| {"current_steps": 5730, "total_steps": 8436, "loss": 0.1359, "learning_rate": 2.8204672873419565e-06, "epoch": 2.037333333333333, "percentage": 67.92, "elapsed_time": "7:31:40", "remaining_time": "3:33:18"} | |
| {"current_steps": 5740, "total_steps": 8436, "loss": 0.1524, "learning_rate": 2.8018650310334118e-06, "epoch": 2.040888888888889, "percentage": 68.04, "elapsed_time": "7:32:18", "remaining_time": "3:32:26"} | |
| {"current_steps": 5750, "total_steps": 8436, "loss": 0.1216, "learning_rate": 2.783300413985359e-06, "epoch": 2.0444444444444443, "percentage": 68.16, "elapsed_time": "7:32:54", "remaining_time": "3:31:33"} | |
| {"current_steps": 5760, "total_steps": 8436, "loss": 0.1393, "learning_rate": 2.764773754084763e-06, "epoch": 2.048, "percentage": 68.28, "elapsed_time": "7:33:30", "remaining_time": "3:30:41"} | |
| {"current_steps": 5770, "total_steps": 8436, "loss": 0.1429, "learning_rate": 2.7462853685686362e-06, "epoch": 2.0515555555555554, "percentage": 68.4, "elapsed_time": "7:34:05", "remaining_time": "3:29:48"} | |
| {"current_steps": 5780, "total_steps": 8436, "loss": 0.1336, "learning_rate": 2.7278355740186123e-06, "epoch": 2.055111111111111, "percentage": 68.52, "elapsed_time": "7:34:39", "remaining_time": "3:28:55"} | |
| {"current_steps": 5790, "total_steps": 8436, "loss": 0.1359, "learning_rate": 2.7094246863555262e-06, "epoch": 2.058666666666667, "percentage": 68.63, "elapsed_time": "7:35:15", "remaining_time": "3:28:03"} | |
| {"current_steps": 5800, "total_steps": 8436, "loss": 0.1388, "learning_rate": 2.691053020833988e-06, "epoch": 2.062222222222222, "percentage": 68.75, "elapsed_time": "7:35:52", "remaining_time": "3:27:11"} | |
| {"current_steps": 5810, "total_steps": 8436, "loss": 0.1355, "learning_rate": 2.6727208920370063e-06, "epoch": 2.065777777777778, "percentage": 68.87, "elapsed_time": "7:36:30", "remaining_time": "3:26:19"} | |
| {"current_steps": 5820, "total_steps": 8436, "loss": 0.1328, "learning_rate": 2.6544286138705867e-06, "epoch": 2.0693333333333332, "percentage": 68.99, "elapsed_time": "7:37:06", "remaining_time": "3:25:27"} | |
| {"current_steps": 5830, "total_steps": 8436, "loss": 0.1354, "learning_rate": 2.636176499558364e-06, "epoch": 2.072888888888889, "percentage": 69.11, "elapsed_time": "7:37:44", "remaining_time": "3:24:36"} | |
| {"current_steps": 5840, "total_steps": 8436, "loss": 0.1493, "learning_rate": 2.6179648616362374e-06, "epoch": 2.0764444444444443, "percentage": 69.23, "elapsed_time": "7:38:20", "remaining_time": "3:23:44"} | |
| {"current_steps": 5850, "total_steps": 8436, "loss": 0.1579, "learning_rate": 2.599794011947012e-06, "epoch": 2.08, "percentage": 69.35, "elapsed_time": "7:38:55", "remaining_time": "3:22:51"} | |
| {"current_steps": 5860, "total_steps": 8436, "loss": 0.1446, "learning_rate": 2.581664261635069e-06, "epoch": 2.0835555555555554, "percentage": 69.46, "elapsed_time": "7:39:30", "remaining_time": "3:21:59"} | |
| {"current_steps": 5870, "total_steps": 8436, "loss": 0.1406, "learning_rate": 2.5635759211410396e-06, "epoch": 2.087111111111111, "percentage": 69.58, "elapsed_time": "7:40:08", "remaining_time": "3:21:08"} | |
| {"current_steps": 5880, "total_steps": 8436, "loss": 0.1244, "learning_rate": 2.545529300196472e-06, "epoch": 2.0906666666666665, "percentage": 69.7, "elapsed_time": "7:40:43", "remaining_time": "3:20:16"} | |
| {"current_steps": 5890, "total_steps": 8436, "loss": 0.1289, "learning_rate": 2.527524707818547e-06, "epoch": 2.094222222222222, "percentage": 69.82, "elapsed_time": "7:41:21", "remaining_time": "3:19:25"} | |
| {"current_steps": 5900, "total_steps": 8436, "loss": 0.1151, "learning_rate": 2.5095624523047775e-06, "epoch": 2.097777777777778, "percentage": 69.94, "elapsed_time": "7:41:56", "remaining_time": "3:18:33"} | |
| {"current_steps": 5910, "total_steps": 8436, "loss": 0.1386, "learning_rate": 2.491642841227729e-06, "epoch": 2.1013333333333333, "percentage": 70.06, "elapsed_time": "7:42:33", "remaining_time": "3:17:42"} | |
| {"current_steps": 5920, "total_steps": 8436, "loss": 0.1152, "learning_rate": 2.4737661814297557e-06, "epoch": 2.104888888888889, "percentage": 70.18, "elapsed_time": "7:43:08", "remaining_time": "3:16:49"} | |
| {"current_steps": 5930, "total_steps": 8436, "loss": 0.1267, "learning_rate": 2.455932779017747e-06, "epoch": 2.1084444444444443, "percentage": 70.29, "elapsed_time": "7:43:44", "remaining_time": "3:15:58"} | |
| {"current_steps": 5940, "total_steps": 8436, "loss": 0.1468, "learning_rate": 2.438142939357882e-06, "epoch": 2.112, "percentage": 70.41, "elapsed_time": "7:44:20", "remaining_time": "3:15:06"} | |
| {"current_steps": 5950, "total_steps": 8436, "loss": 0.1426, "learning_rate": 2.4203969670704065e-06, "epoch": 2.1155555555555554, "percentage": 70.53, "elapsed_time": "7:44:57", "remaining_time": "3:14:16"} | |
| {"current_steps": 5960, "total_steps": 8436, "loss": 0.1519, "learning_rate": 2.4026951660244063e-06, "epoch": 2.119111111111111, "percentage": 70.65, "elapsed_time": "7:45:36", "remaining_time": "3:13:25"} | |
| {"current_steps": 5970, "total_steps": 8436, "loss": 0.1449, "learning_rate": 2.385037839332616e-06, "epoch": 2.1226666666666665, "percentage": 70.77, "elapsed_time": "7:46:14", "remaining_time": "3:12:35"} | |
| {"current_steps": 5980, "total_steps": 8436, "loss": 0.1508, "learning_rate": 2.3674252893462304e-06, "epoch": 2.1262222222222222, "percentage": 70.89, "elapsed_time": "7:46:50", "remaining_time": "3:11:44"} | |
| {"current_steps": 5990, "total_steps": 8436, "loss": 0.1336, "learning_rate": 2.3498578176497055e-06, "epoch": 2.129777777777778, "percentage": 71.01, "elapsed_time": "7:47:29", "remaining_time": "3:10:54"} | |
| {"current_steps": 6000, "total_steps": 8436, "loss": 0.1289, "learning_rate": 2.3323357250556213e-06, "epoch": 2.1333333333333333, "percentage": 71.12, "elapsed_time": "7:48:07", "remaining_time": "3:10:03"} | |
| {"current_steps": 6000, "total_steps": 8436, "eval_loss": 0.24109843373298645, "epoch": 2.1333333333333333, "percentage": 71.12, "elapsed_time": "7:57:28", "remaining_time": "3:13:51"} | |
| {"current_steps": 6010, "total_steps": 8436, "loss": 0.1232, "learning_rate": 2.3148593115995155e-06, "epoch": 2.136888888888889, "percentage": 71.24, "elapsed_time": "7:58:24", "remaining_time": "3:13:06"} | |
| {"current_steps": 6020, "total_steps": 8436, "loss": 0.1406, "learning_rate": 2.2974288765347484e-06, "epoch": 2.1404444444444444, "percentage": 71.36, "elapsed_time": "7:59:01", "remaining_time": "3:12:14"} | |
| {"current_steps": 6030, "total_steps": 8436, "loss": 0.1366, "learning_rate": 2.280044718327383e-06, "epoch": 2.144, "percentage": 71.48, "elapsed_time": "7:59:41", "remaining_time": "3:11:24"} | |
| {"current_steps": 6040, "total_steps": 8436, "loss": 0.1347, "learning_rate": 2.262707134651069e-06, "epoch": 2.1475555555555554, "percentage": 71.6, "elapsed_time": "8:00:17", "remaining_time": "3:10:31"} | |
| {"current_steps": 6050, "total_steps": 8436, "loss": 0.1435, "learning_rate": 2.2454164223819443e-06, "epoch": 2.151111111111111, "percentage": 71.72, "elapsed_time": "8:00:52", "remaining_time": "3:09:38"} | |
| {"current_steps": 6060, "total_steps": 8436, "loss": 0.1248, "learning_rate": 2.228172877593563e-06, "epoch": 2.1546666666666665, "percentage": 71.83, "elapsed_time": "8:01:27", "remaining_time": "3:08:46"} | |
| {"current_steps": 6070, "total_steps": 8436, "loss": 0.129, "learning_rate": 2.2109767955518135e-06, "epoch": 2.1582222222222223, "percentage": 71.95, "elapsed_time": "8:02:06", "remaining_time": "3:07:55"} | |
| {"current_steps": 6080, "total_steps": 8436, "loss": 0.1259, "learning_rate": 2.193828470709863e-06, "epoch": 2.1617777777777776, "percentage": 72.07, "elapsed_time": "8:02:42", "remaining_time": "3:07:02"} | |
| {"current_steps": 6090, "total_steps": 8436, "loss": 0.1308, "learning_rate": 2.176728196703122e-06, "epoch": 2.1653333333333333, "percentage": 72.19, "elapsed_time": "8:03:18", "remaining_time": "3:06:10"} | |
| {"current_steps": 6100, "total_steps": 8436, "loss": 0.1496, "learning_rate": 2.159676266344222e-06, "epoch": 2.168888888888889, "percentage": 72.31, "elapsed_time": "8:03:55", "remaining_time": "3:05:18"} | |
| {"current_steps": 6110, "total_steps": 8436, "loss": 0.1359, "learning_rate": 2.142672971617978e-06, "epoch": 2.1724444444444444, "percentage": 72.43, "elapsed_time": "8:04:32", "remaining_time": "3:04:27"} | |
| {"current_steps": 6120, "total_steps": 8436, "loss": 0.1412, "learning_rate": 2.125718603676413e-06, "epoch": 2.176, "percentage": 72.55, "elapsed_time": "8:05:09", "remaining_time": "3:03:35"} | |
| {"current_steps": 6130, "total_steps": 8436, "loss": 0.1357, "learning_rate": 2.1088134528337635e-06, "epoch": 2.1795555555555555, "percentage": 72.66, "elapsed_time": "8:05:44", "remaining_time": "3:02:43"} | |
| {"current_steps": 6140, "total_steps": 8436, "loss": 0.1388, "learning_rate": 2.091957808561505e-06, "epoch": 2.1831111111111112, "percentage": 72.78, "elapsed_time": "8:06:20", "remaining_time": "3:01:51"} | |
| {"current_steps": 6150, "total_steps": 8436, "loss": 0.1359, "learning_rate": 2.0751519594834025e-06, "epoch": 2.1866666666666665, "percentage": 72.9, "elapsed_time": "8:06:59", "remaining_time": "3:01:00"} | |
| {"current_steps": 6160, "total_steps": 8436, "loss": 0.1364, "learning_rate": 2.058396193370556e-06, "epoch": 2.1902222222222223, "percentage": 73.02, "elapsed_time": "8:07:34", "remaining_time": "3:00:08"} | |
| {"current_steps": 6170, "total_steps": 8436, "loss": 0.1286, "learning_rate": 2.0416907971364937e-06, "epoch": 2.1937777777777776, "percentage": 73.14, "elapsed_time": "8:08:08", "remaining_time": "2:59:16"} | |
| {"current_steps": 6180, "total_steps": 8436, "loss": 0.132, "learning_rate": 2.0250360568322395e-06, "epoch": 2.1973333333333334, "percentage": 73.26, "elapsed_time": "8:08:45", "remaining_time": "2:58:25"} | |
| {"current_steps": 6190, "total_steps": 8436, "loss": 0.1311, "learning_rate": 2.0084322576414205e-06, "epoch": 2.2008888888888887, "percentage": 73.38, "elapsed_time": "8:09:19", "remaining_time": "2:57:32"} | |
| {"current_steps": 6200, "total_steps": 8436, "loss": 0.1412, "learning_rate": 1.991879683875386e-06, "epoch": 2.2044444444444444, "percentage": 73.49, "elapsed_time": "8:09:58", "remaining_time": "2:56:42"} | |
| {"current_steps": 6210, "total_steps": 8436, "loss": 0.1358, "learning_rate": 1.975378618968348e-06, "epoch": 2.208, "percentage": 73.61, "elapsed_time": "8:10:34", "remaining_time": "2:55:50"} | |
| {"current_steps": 6220, "total_steps": 8436, "loss": 0.1272, "learning_rate": 1.958929345472503e-06, "epoch": 2.2115555555555555, "percentage": 73.73, "elapsed_time": "8:11:11", "remaining_time": "2:54:59"} | |
| {"current_steps": 6230, "total_steps": 8436, "loss": 0.1335, "learning_rate": 1.942532145053219e-06, "epoch": 2.2151111111111113, "percentage": 73.85, "elapsed_time": "8:11:46", "remaining_time": "2:54:08"} | |
| {"current_steps": 6240, "total_steps": 8436, "loss": 0.13, "learning_rate": 1.926187298484201e-06, "epoch": 2.2186666666666666, "percentage": 73.97, "elapsed_time": "8:12:21", "remaining_time": "2:53:16"} | |
| {"current_steps": 6250, "total_steps": 8436, "loss": 0.1197, "learning_rate": 1.9098950856426845e-06, "epoch": 2.2222222222222223, "percentage": 74.09, "elapsed_time": "8:12:58", "remaining_time": "2:52:25"} | |
| {"current_steps": 6260, "total_steps": 8436, "loss": 0.136, "learning_rate": 1.893655785504644e-06, "epoch": 2.2257777777777776, "percentage": 74.21, "elapsed_time": "8:13:32", "remaining_time": "2:51:33"} | |
| {"current_steps": 6270, "total_steps": 8436, "loss": 0.1351, "learning_rate": 1.8774696761400107e-06, "epoch": 2.2293333333333334, "percentage": 74.32, "elapsed_time": "8:14:11", "remaining_time": "2:50:43"} | |
| {"current_steps": 6280, "total_steps": 8436, "loss": 0.1316, "learning_rate": 1.8613370347079207e-06, "epoch": 2.2328888888888887, "percentage": 74.44, "elapsed_time": "8:14:47", "remaining_time": "2:49:52"} | |
| {"current_steps": 6290, "total_steps": 8436, "loss": 0.1343, "learning_rate": 1.845258137451968e-06, "epoch": 2.2364444444444445, "percentage": 74.56, "elapsed_time": "8:15:23", "remaining_time": "2:49:00"} | |
| {"current_steps": 6300, "total_steps": 8436, "loss": 0.1252, "learning_rate": 1.8292332596954605e-06, "epoch": 2.24, "percentage": 74.68, "elapsed_time": "8:15:57", "remaining_time": "2:48:09"} | |
| {"current_steps": 6310, "total_steps": 8436, "loss": 0.1373, "learning_rate": 1.8132626758367217e-06, "epoch": 2.2435555555555555, "percentage": 74.8, "elapsed_time": "8:16:35", "remaining_time": "2:47:18"} | |
| {"current_steps": 6320, "total_steps": 8436, "loss": 0.1238, "learning_rate": 1.7973466593443861e-06, "epoch": 2.2471111111111113, "percentage": 74.92, "elapsed_time": "8:17:10", "remaining_time": "2:46:27"} | |
| {"current_steps": 6330, "total_steps": 8436, "loss": 0.1331, "learning_rate": 1.7814854827527144e-06, "epoch": 2.2506666666666666, "percentage": 75.04, "elapsed_time": "8:17:44", "remaining_time": "2:45:35"} | |
| {"current_steps": 6340, "total_steps": 8436, "loss": 0.1392, "learning_rate": 1.7656794176569302e-06, "epoch": 2.2542222222222223, "percentage": 75.15, "elapsed_time": "8:18:22", "remaining_time": "2:44:45"} | |
| {"current_steps": 6350, "total_steps": 8436, "loss": 0.1482, "learning_rate": 1.749928734708568e-06, "epoch": 2.2577777777777777, "percentage": 75.27, "elapsed_time": "8:18:56", "remaining_time": "2:43:54"} | |
| {"current_steps": 6360, "total_steps": 8436, "loss": 0.1318, "learning_rate": 1.734233703610838e-06, "epoch": 2.2613333333333334, "percentage": 75.39, "elapsed_time": "8:19:34", "remaining_time": "2:43:04"} | |
| {"current_steps": 6370, "total_steps": 8436, "loss": 0.1389, "learning_rate": 1.7185945931140086e-06, "epoch": 2.2648888888888887, "percentage": 75.51, "elapsed_time": "8:20:10", "remaining_time": "2:42:13"} | |
| {"current_steps": 6380, "total_steps": 8436, "loss": 0.1402, "learning_rate": 1.7030116710108068e-06, "epoch": 2.2684444444444445, "percentage": 75.63, "elapsed_time": "8:20:46", "remaining_time": "2:41:22"} | |
| {"current_steps": 6390, "total_steps": 8436, "loss": 0.1383, "learning_rate": 1.6874852041318246e-06, "epoch": 2.2720000000000002, "percentage": 75.75, "elapsed_time": "8:21:23", "remaining_time": "2:40:32"} | |
| {"current_steps": 6400, "total_steps": 8436, "loss": 0.1297, "learning_rate": 1.6720154583409642e-06, "epoch": 2.2755555555555556, "percentage": 75.87, "elapsed_time": "8:21:58", "remaining_time": "2:39:41"} | |
| {"current_steps": 6410, "total_steps": 8436, "loss": 0.1265, "learning_rate": 1.6566026985308737e-06, "epoch": 2.279111111111111, "percentage": 75.98, "elapsed_time": "8:22:35", "remaining_time": "2:38:51"} | |
| {"current_steps": 6420, "total_steps": 8436, "loss": 0.1433, "learning_rate": 1.6412471886184106e-06, "epoch": 2.2826666666666666, "percentage": 76.1, "elapsed_time": "8:23:12", "remaining_time": "2:38:00"} | |
| {"current_steps": 6430, "total_steps": 8436, "loss": 0.1295, "learning_rate": 1.6259491915401322e-06, "epoch": 2.2862222222222224, "percentage": 76.22, "elapsed_time": "8:23:50", "remaining_time": "2:37:11"} | |
| {"current_steps": 6440, "total_steps": 8436, "loss": 0.1506, "learning_rate": 1.6107089692477856e-06, "epoch": 2.2897777777777777, "percentage": 76.34, "elapsed_time": "8:24:26", "remaining_time": "2:36:20"} | |
| {"current_steps": 6450, "total_steps": 8436, "loss": 0.1309, "learning_rate": 1.5955267827038267e-06, "epoch": 2.2933333333333334, "percentage": 76.46, "elapsed_time": "8:25:02", "remaining_time": "2:35:30"} | |
| {"current_steps": 6460, "total_steps": 8436, "loss": 0.1245, "learning_rate": 1.5804028918769488e-06, "epoch": 2.2968888888888888, "percentage": 76.58, "elapsed_time": "8:25:41", "remaining_time": "2:34:40"} | |
| {"current_steps": 6470, "total_steps": 8436, "loss": 0.1419, "learning_rate": 1.5653375557376266e-06, "epoch": 2.3004444444444445, "percentage": 76.7, "elapsed_time": "8:26:16", "remaining_time": "2:33:50"} | |
| {"current_steps": 6480, "total_steps": 8436, "loss": 0.1357, "learning_rate": 1.5503310322536962e-06, "epoch": 2.304, "percentage": 76.81, "elapsed_time": "8:26:52", "remaining_time": "2:33:00"} | |
| {"current_steps": 6490, "total_steps": 8436, "loss": 0.1344, "learning_rate": 1.5353835783859244e-06, "epoch": 2.3075555555555556, "percentage": 76.93, "elapsed_time": "8:27:32", "remaining_time": "2:32:10"} | |
| {"current_steps": 6500, "total_steps": 8436, "loss": 0.1336, "learning_rate": 1.5204954500836095e-06, "epoch": 2.311111111111111, "percentage": 77.05, "elapsed_time": "8:28:08", "remaining_time": "2:31:20"} | |
| {"current_steps": 6500, "total_steps": 8436, "eval_loss": 0.2400493621826172, "epoch": 2.311111111111111, "percentage": 77.05, "elapsed_time": "8:37:31", "remaining_time": "2:34:08"} | |
| {"current_steps": 6510, "total_steps": 8436, "loss": 0.1578, "learning_rate": 1.5056669022802051e-06, "epoch": 2.3146666666666667, "percentage": 77.17, "elapsed_time": "8:38:07", "remaining_time": "2:33:17"} | |
| {"current_steps": 6520, "total_steps": 8436, "loss": 0.1236, "learning_rate": 1.4908981888889562e-06, "epoch": 2.3182222222222224, "percentage": 77.29, "elapsed_time": "8:38:46", "remaining_time": "2:32:27"} | |
| {"current_steps": 6530, "total_steps": 8436, "loss": 0.1437, "learning_rate": 1.4761895627985384e-06, "epoch": 2.3217777777777777, "percentage": 77.41, "elapsed_time": "8:39:25", "remaining_time": "2:31:36"} | |
| {"current_steps": 6540, "total_steps": 8436, "loss": 0.1244, "learning_rate": 1.461541275868742e-06, "epoch": 2.3253333333333335, "percentage": 77.52, "elapsed_time": "8:40:01", "remaining_time": "2:30:45"} | |
| {"current_steps": 6550, "total_steps": 8436, "loss": 0.138, "learning_rate": 1.4469535789261518e-06, "epoch": 2.328888888888889, "percentage": 77.64, "elapsed_time": "8:40:37", "remaining_time": "2:29:54"} | |
| {"current_steps": 6560, "total_steps": 8436, "loss": 0.1311, "learning_rate": 1.4324267217598543e-06, "epoch": 2.3324444444444445, "percentage": 77.76, "elapsed_time": "8:41:13", "remaining_time": "2:29:03"} | |
| {"current_steps": 6570, "total_steps": 8436, "loss": 0.1476, "learning_rate": 1.41796095311716e-06, "epoch": 2.336, "percentage": 77.88, "elapsed_time": "8:41:48", "remaining_time": "2:28:12"} | |
| {"current_steps": 6580, "total_steps": 8436, "loss": 0.1313, "learning_rate": 1.4035565206993407e-06, "epoch": 2.3395555555555556, "percentage": 78.0, "elapsed_time": "8:42:23", "remaining_time": "2:27:20"} | |
| {"current_steps": 6590, "total_steps": 8436, "loss": 0.1481, "learning_rate": 1.3892136711573983e-06, "epoch": 2.343111111111111, "percentage": 78.12, "elapsed_time": "8:42:59", "remaining_time": "2:26:30"} | |
| {"current_steps": 6600, "total_steps": 8436, "loss": 0.1329, "learning_rate": 1.3749326500878308e-06, "epoch": 2.3466666666666667, "percentage": 78.24, "elapsed_time": "8:43:37", "remaining_time": "2:25:39"} | |
| {"current_steps": 6610, "total_steps": 8436, "loss": 0.1296, "learning_rate": 1.3607137020284267e-06, "epoch": 2.3502222222222224, "percentage": 78.35, "elapsed_time": "8:44:12", "remaining_time": "2:24:48"} | |
| {"current_steps": 6620, "total_steps": 8436, "loss": 0.1323, "learning_rate": 1.3465570704540877e-06, "epoch": 2.3537777777777777, "percentage": 78.47, "elapsed_time": "8:44:50", "remaining_time": "2:23:58"} | |
| {"current_steps": 6630, "total_steps": 8436, "loss": 0.1353, "learning_rate": 1.33246299777265e-06, "epoch": 2.3573333333333335, "percentage": 78.59, "elapsed_time": "8:45:27", "remaining_time": "2:23:07"} | |
| {"current_steps": 6640, "total_steps": 8436, "loss": 0.1198, "learning_rate": 1.3184317253207379e-06, "epoch": 2.360888888888889, "percentage": 78.71, "elapsed_time": "8:46:02", "remaining_time": "2:22:17"} | |
| {"current_steps": 6650, "total_steps": 8436, "loss": 0.1398, "learning_rate": 1.3044634933596311e-06, "epoch": 2.3644444444444446, "percentage": 78.83, "elapsed_time": "8:46:37", "remaining_time": "2:21:26"} | |
| {"current_steps": 6660, "total_steps": 8436, "loss": 0.123, "learning_rate": 1.290558541071148e-06, "epoch": 2.368, "percentage": 78.95, "elapsed_time": "8:47:14", "remaining_time": "2:20:35"} | |
| {"current_steps": 6670, "total_steps": 8436, "loss": 0.1221, "learning_rate": 1.2767171065535538e-06, "epoch": 2.3715555555555556, "percentage": 79.07, "elapsed_time": "8:47:48", "remaining_time": "2:19:44"} | |
| {"current_steps": 6680, "total_steps": 8436, "loss": 0.1398, "learning_rate": 1.2629394268174811e-06, "epoch": 2.375111111111111, "percentage": 79.18, "elapsed_time": "8:48:24", "remaining_time": "2:18:54"} | |
| {"current_steps": 6690, "total_steps": 8436, "loss": 0.122, "learning_rate": 1.2492257377818734e-06, "epoch": 2.3786666666666667, "percentage": 79.3, "elapsed_time": "8:49:02", "remaining_time": "2:18:04"} | |
| {"current_steps": 6700, "total_steps": 8436, "loss": 0.1366, "learning_rate": 1.235576274269938e-06, "epoch": 2.3822222222222225, "percentage": 79.42, "elapsed_time": "8:49:39", "remaining_time": "2:17:14"} | |
| {"current_steps": 6710, "total_steps": 8436, "loss": 0.1304, "learning_rate": 1.2219912700051417e-06, "epoch": 2.3857777777777778, "percentage": 79.54, "elapsed_time": "8:50:14", "remaining_time": "2:16:23"} | |
| {"current_steps": 6720, "total_steps": 8436, "loss": 0.1339, "learning_rate": 1.2084709576071885e-06, "epoch": 2.389333333333333, "percentage": 79.66, "elapsed_time": "8:50:53", "remaining_time": "2:15:33"} | |
| {"current_steps": 6730, "total_steps": 8436, "loss": 0.138, "learning_rate": 1.1950155685880504e-06, "epoch": 2.392888888888889, "percentage": 79.78, "elapsed_time": "8:51:30", "remaining_time": "2:14:44"} | |
| {"current_steps": 6740, "total_steps": 8436, "loss": 0.1402, "learning_rate": 1.1816253333479994e-06, "epoch": 2.3964444444444446, "percentage": 79.9, "elapsed_time": "8:52:07", "remaining_time": "2:13:53"} | |
| {"current_steps": 6750, "total_steps": 8436, "loss": 0.1219, "learning_rate": 1.1683004811716597e-06, "epoch": 2.4, "percentage": 80.01, "elapsed_time": "8:52:44", "remaining_time": "2:13:04"} | |
| {"current_steps": 6760, "total_steps": 8436, "loss": 0.1472, "learning_rate": 1.1550412402240852e-06, "epoch": 2.4035555555555557, "percentage": 80.13, "elapsed_time": "8:53:19", "remaining_time": "2:12:13"} | |
| {"current_steps": 6770, "total_steps": 8436, "loss": 0.14, "learning_rate": 1.1418478375468496e-06, "epoch": 2.407111111111111, "percentage": 80.25, "elapsed_time": "8:53:55", "remaining_time": "2:11:23"} | |
| {"current_steps": 6780, "total_steps": 8436, "loss": 0.1382, "learning_rate": 1.1287204990541612e-06, "epoch": 2.4106666666666667, "percentage": 80.37, "elapsed_time": "8:54:30", "remaining_time": "2:10:33"} | |
| {"current_steps": 6790, "total_steps": 8436, "loss": 0.1508, "learning_rate": 1.1156594495289923e-06, "epoch": 2.414222222222222, "percentage": 80.49, "elapsed_time": "8:55:06", "remaining_time": "2:09:43"} | |
| {"current_steps": 6800, "total_steps": 8436, "loss": 0.1244, "learning_rate": 1.1026649126192334e-06, "epoch": 2.417777777777778, "percentage": 80.61, "elapsed_time": "8:55:46", "remaining_time": "2:08:54"} | |
| {"current_steps": 6810, "total_steps": 8436, "loss": 0.1262, "learning_rate": 1.0897371108338572e-06, "epoch": 2.421333333333333, "percentage": 80.73, "elapsed_time": "8:56:20", "remaining_time": "2:08:03"} | |
| {"current_steps": 6820, "total_steps": 8436, "loss": 0.1397, "learning_rate": 1.076876265539115e-06, "epoch": 2.424888888888889, "percentage": 80.84, "elapsed_time": "8:56:59", "remaining_time": "2:07:14"} | |
| {"current_steps": 6830, "total_steps": 8436, "loss": 0.1298, "learning_rate": 1.0640825969547498e-06, "epoch": 2.4284444444444446, "percentage": 80.96, "elapsed_time": "8:57:37", "remaining_time": "2:06:24"} | |
| {"current_steps": 6840, "total_steps": 8436, "loss": 0.1334, "learning_rate": 1.051356324150209e-06, "epoch": 2.432, "percentage": 81.08, "elapsed_time": "8:58:16", "remaining_time": "2:05:35"} | |
| {"current_steps": 6850, "total_steps": 8436, "loss": 0.1342, "learning_rate": 1.0386976650409102e-06, "epoch": 2.4355555555555557, "percentage": 81.2, "elapsed_time": "8:58:53", "remaining_time": "2:04:46"} | |
| {"current_steps": 6860, "total_steps": 8436, "loss": 0.1297, "learning_rate": 1.0261068363845034e-06, "epoch": 2.439111111111111, "percentage": 81.32, "elapsed_time": "8:59:28", "remaining_time": "2:03:56"} | |
| {"current_steps": 6870, "total_steps": 8436, "loss": 0.1355, "learning_rate": 1.0135840537771574e-06, "epoch": 2.4426666666666668, "percentage": 81.44, "elapsed_time": "9:00:03", "remaining_time": "2:03:06"} | |
| {"current_steps": 6880, "total_steps": 8436, "loss": 0.1255, "learning_rate": 1.001129531649872e-06, "epoch": 2.446222222222222, "percentage": 81.56, "elapsed_time": "9:00:41", "remaining_time": "2:02:17"} | |
| {"current_steps": 6890, "total_steps": 8436, "loss": 0.1355, "learning_rate": 9.887434832647997e-07, "epoch": 2.449777777777778, "percentage": 81.67, "elapsed_time": "9:01:15", "remaining_time": "2:01:27"} | |
| {"current_steps": 6900, "total_steps": 8436, "loss": 0.1437, "learning_rate": 9.764261207116061e-07, "epoch": 2.453333333333333, "percentage": 81.79, "elapsed_time": "9:01:50", "remaining_time": "2:00:37"} | |
| {"current_steps": 6910, "total_steps": 8436, "loss": 0.1274, "learning_rate": 9.641776549038257e-07, "epoch": 2.456888888888889, "percentage": 81.91, "elapsed_time": "9:02:24", "remaining_time": "1:59:47"} | |
| {"current_steps": 6920, "total_steps": 8436, "loss": 0.1321, "learning_rate": 9.519982955752549e-07, "epoch": 2.4604444444444447, "percentage": 82.03, "elapsed_time": "9:02:58", "remaining_time": "1:58:57"} | |
| {"current_steps": 6930, "total_steps": 8436, "loss": 0.1299, "learning_rate": 9.398882512763618e-07, "epoch": 2.464, "percentage": 82.15, "elapsed_time": "9:03:35", "remaining_time": "1:58:07"} | |
| {"current_steps": 6940, "total_steps": 8436, "loss": 0.1454, "learning_rate": 9.278477293707189e-07, "epoch": 2.4675555555555557, "percentage": 82.27, "elapsed_time": "9:04:10", "remaining_time": "1:57:18"} | |
| {"current_steps": 6950, "total_steps": 8436, "loss": 0.1301, "learning_rate": 9.158769360314412e-07, "epoch": 2.471111111111111, "percentage": 82.39, "elapsed_time": "9:04:46", "remaining_time": "1:56:28"} | |
| {"current_steps": 6960, "total_steps": 8436, "loss": 0.1329, "learning_rate": 9.039760762376665e-07, "epoch": 2.474666666666667, "percentage": 82.5, "elapsed_time": "9:05:21", "remaining_time": "1:55:39"} | |
| {"current_steps": 6970, "total_steps": 8436, "loss": 0.1301, "learning_rate": 8.921453537710406e-07, "epoch": 2.478222222222222, "percentage": 82.62, "elapsed_time": "9:05:59", "remaining_time": "1:54:50"} | |
| {"current_steps": 6980, "total_steps": 8436, "loss": 0.1366, "learning_rate": 8.803849712122292e-07, "epoch": 2.481777777777778, "percentage": 82.74, "elapsed_time": "9:06:33", "remaining_time": "1:54:00"} | |
| {"current_steps": 6990, "total_steps": 8436, "loss": 0.1248, "learning_rate": 8.686951299374474e-07, "epoch": 2.485333333333333, "percentage": 82.86, "elapsed_time": "9:07:13", "remaining_time": "1:53:12"} | |
| {"current_steps": 7000, "total_steps": 8436, "loss": 0.1397, "learning_rate": 8.570760301150166e-07, "epoch": 2.488888888888889, "percentage": 82.98, "elapsed_time": "9:07:50", "remaining_time": "1:52:23"} | |
| {"current_steps": 7000, "total_steps": 8436, "eval_loss": 0.239632710814476, "epoch": 2.488888888888889, "percentage": 82.98, "elapsed_time": "9:17:13", "remaining_time": "1:54:18"} | |
| {"current_steps": 7010, "total_steps": 8436, "loss": 0.133, "learning_rate": 8.455278707019255e-07, "epoch": 2.4924444444444447, "percentage": 83.1, "elapsed_time": "9:17:50", "remaining_time": "1:53:28"} | |
| {"current_steps": 7020, "total_steps": 8436, "loss": 0.128, "learning_rate": 8.340508494404415e-07, "epoch": 2.496, "percentage": 83.21, "elapsed_time": "9:18:29", "remaining_time": "1:52:39"} | |
| {"current_steps": 7030, "total_steps": 8436, "loss": 0.1304, "learning_rate": 8.226451628547039e-07, "epoch": 2.4995555555555553, "percentage": 83.33, "elapsed_time": "9:19:08", "remaining_time": "1:51:49"} | |
| {"current_steps": 7040, "total_steps": 8436, "loss": 0.1337, "learning_rate": 8.113110062473756e-07, "epoch": 2.503111111111111, "percentage": 83.45, "elapsed_time": "9:19:44", "remaining_time": "1:50:59"} | |
| {"current_steps": 7050, "total_steps": 8436, "loss": 0.1365, "learning_rate": 8.000485736962899e-07, "epoch": 2.506666666666667, "percentage": 83.57, "elapsed_time": "9:20:22", "remaining_time": "1:50:09"} | |
| {"current_steps": 7060, "total_steps": 8436, "loss": 0.1157, "learning_rate": 7.888580580511307e-07, "epoch": 2.510222222222222, "percentage": 83.69, "elapsed_time": "9:20:58", "remaining_time": "1:49:20"} | |
| {"current_steps": 7070, "total_steps": 8436, "loss": 0.1258, "learning_rate": 7.777396509301278e-07, "epoch": 2.513777777777778, "percentage": 83.81, "elapsed_time": "9:21:35", "remaining_time": "1:48:30"} | |
| {"current_steps": 7080, "total_steps": 8436, "loss": 0.1261, "learning_rate": 7.666935427167777e-07, "epoch": 2.517333333333333, "percentage": 83.93, "elapsed_time": "9:22:09", "remaining_time": "1:47:40"} | |
| {"current_steps": 7090, "total_steps": 8436, "loss": 0.1353, "learning_rate": 7.557199225565848e-07, "epoch": 2.520888888888889, "percentage": 84.04, "elapsed_time": "9:22:47", "remaining_time": "1:46:50"} | |
| {"current_steps": 7100, "total_steps": 8436, "loss": 0.1223, "learning_rate": 7.448189783538184e-07, "epoch": 2.5244444444444447, "percentage": 84.16, "elapsed_time": "9:23:25", "remaining_time": "1:46:01"} | |
| {"current_steps": 7110, "total_steps": 8436, "loss": 0.1227, "learning_rate": 7.339908967683007e-07, "epoch": 2.528, "percentage": 84.28, "elapsed_time": "9:23:59", "remaining_time": "1:45:10"} | |
| {"current_steps": 7120, "total_steps": 8436, "loss": 0.1365, "learning_rate": 7.232358632122022e-07, "epoch": 2.5315555555555553, "percentage": 84.4, "elapsed_time": "9:24:36", "remaining_time": "1:44:21"} | |
| {"current_steps": 7130, "total_steps": 8436, "loss": 0.1435, "learning_rate": 7.125540618468784e-07, "epoch": 2.535111111111111, "percentage": 84.52, "elapsed_time": "9:25:14", "remaining_time": "1:43:32"} | |
| {"current_steps": 7140, "total_steps": 8436, "loss": 0.1333, "learning_rate": 7.019456755797083e-07, "epoch": 2.538666666666667, "percentage": 84.64, "elapsed_time": "9:25:52", "remaining_time": "1:42:42"} | |
| {"current_steps": 7150, "total_steps": 8436, "loss": 0.1372, "learning_rate": 6.914108860609608e-07, "epoch": 2.542222222222222, "percentage": 84.76, "elapsed_time": "9:26:27", "remaining_time": "1:41:52"} | |
| {"current_steps": 7160, "total_steps": 8436, "loss": 0.135, "learning_rate": 6.809498736806919e-07, "epoch": 2.545777777777778, "percentage": 84.87, "elapsed_time": "9:27:05", "remaining_time": "1:41:03"} | |
| {"current_steps": 7170, "total_steps": 8436, "loss": 0.1304, "learning_rate": 6.705628175656498e-07, "epoch": 2.5493333333333332, "percentage": 84.99, "elapsed_time": "9:27:40", "remaining_time": "1:40:14"} | |
| {"current_steps": 7180, "total_steps": 8436, "loss": 0.1361, "learning_rate": 6.602498955762105e-07, "epoch": 2.552888888888889, "percentage": 85.11, "elapsed_time": "9:28:16", "remaining_time": "1:39:24"} | |
| {"current_steps": 7190, "total_steps": 8436, "loss": 0.1235, "learning_rate": 6.500112843033313e-07, "epoch": 2.5564444444444443, "percentage": 85.23, "elapsed_time": "9:28:53", "remaining_time": "1:38:35"} | |
| {"current_steps": 7200, "total_steps": 8436, "loss": 0.1268, "learning_rate": 6.39847159065523e-07, "epoch": 2.56, "percentage": 85.35, "elapsed_time": "9:29:28", "remaining_time": "1:37:45"} | |
| {"current_steps": 7210, "total_steps": 8436, "loss": 0.1338, "learning_rate": 6.297576939058586e-07, "epoch": 2.5635555555555554, "percentage": 85.47, "elapsed_time": "9:30:05", "remaining_time": "1:36:56"} | |
| {"current_steps": 7220, "total_steps": 8436, "loss": 0.1304, "learning_rate": 6.197430615889838e-07, "epoch": 2.567111111111111, "percentage": 85.59, "elapsed_time": "9:30:43", "remaining_time": "1:36:07"} | |
| {"current_steps": 7230, "total_steps": 8436, "loss": 0.1255, "learning_rate": 6.098034335981573e-07, "epoch": 2.570666666666667, "percentage": 85.7, "elapsed_time": "9:31:22", "remaining_time": "1:35:18"} | |
| {"current_steps": 7240, "total_steps": 8436, "loss": 0.128, "learning_rate": 5.999389801323219e-07, "epoch": 2.574222222222222, "percentage": 85.82, "elapsed_time": "9:31:59", "remaining_time": "1:34:29"} | |
| {"current_steps": 7250, "total_steps": 8436, "loss": 0.131, "learning_rate": 5.901498701031894e-07, "epoch": 2.5777777777777775, "percentage": 85.94, "elapsed_time": "9:32:34", "remaining_time": "1:33:39"} | |
| {"current_steps": 7260, "total_steps": 8436, "loss": 0.1273, "learning_rate": 5.804362711323391e-07, "epoch": 2.5813333333333333, "percentage": 86.06, "elapsed_time": "9:33:10", "remaining_time": "1:32:50"} | |
| {"current_steps": 7270, "total_steps": 8436, "loss": 0.122, "learning_rate": 5.707983495483593e-07, "epoch": 2.584888888888889, "percentage": 86.18, "elapsed_time": "9:33:46", "remaining_time": "1:32:01"} | |
| {"current_steps": 7280, "total_steps": 8436, "loss": 0.1308, "learning_rate": 5.612362703839907e-07, "epoch": 2.5884444444444443, "percentage": 86.3, "elapsed_time": "9:34:21", "remaining_time": "1:31:12"} | |
| {"current_steps": 7290, "total_steps": 8436, "loss": 0.1239, "learning_rate": 5.517501973733059e-07, "epoch": 2.592, "percentage": 86.42, "elapsed_time": "9:34:57", "remaining_time": "1:30:23"} | |
| {"current_steps": 7300, "total_steps": 8436, "loss": 0.1242, "learning_rate": 5.423402929489019e-07, "epoch": 2.5955555555555554, "percentage": 86.53, "elapsed_time": "9:35:31", "remaining_time": "1:29:33"} | |
| {"current_steps": 7310, "total_steps": 8436, "loss": 0.1258, "learning_rate": 5.330067182391219e-07, "epoch": 2.599111111111111, "percentage": 86.65, "elapsed_time": "9:36:08", "remaining_time": "1:28:44"} | |
| {"current_steps": 7320, "total_steps": 8436, "loss": 0.1318, "learning_rate": 5.237496330652925e-07, "epoch": 2.602666666666667, "percentage": 86.77, "elapsed_time": "9:36:42", "remaining_time": "1:27:55"} | |
| {"current_steps": 7330, "total_steps": 8436, "loss": 0.1292, "learning_rate": 5.145691959389932e-07, "epoch": 2.606222222222222, "percentage": 86.89, "elapsed_time": "9:37:19", "remaining_time": "1:27:06"} | |
| {"current_steps": 7340, "total_steps": 8436, "loss": 0.1446, "learning_rate": 5.054655640593325e-07, "epoch": 2.6097777777777775, "percentage": 87.01, "elapsed_time": "9:37:56", "remaining_time": "1:26:17"} | |
| {"current_steps": 7350, "total_steps": 8436, "loss": 0.1418, "learning_rate": 4.964388933102666e-07, "epoch": 2.6133333333333333, "percentage": 87.13, "elapsed_time": "9:38:33", "remaining_time": "1:25:29"} | |
| {"current_steps": 7360, "total_steps": 8436, "loss": 0.1269, "learning_rate": 4.874893382579232e-07, "epoch": 2.616888888888889, "percentage": 87.25, "elapsed_time": "9:39:08", "remaining_time": "1:24:40"} | |
| {"current_steps": 7370, "total_steps": 8436, "loss": 0.1223, "learning_rate": 4.786170521479588e-07, "epoch": 2.6204444444444444, "percentage": 87.36, "elapsed_time": "9:39:43", "remaining_time": "1:23:51"} | |
| {"current_steps": 7380, "total_steps": 8436, "loss": 0.1443, "learning_rate": 4.698221869029307e-07, "epoch": 2.624, "percentage": 87.48, "elapsed_time": "9:40:17", "remaining_time": "1:23:02"} | |
| {"current_steps": 7390, "total_steps": 8436, "loss": 0.1429, "learning_rate": 4.6110489311969876e-07, "epoch": 2.6275555555555554, "percentage": 87.6, "elapsed_time": "9:40:52", "remaining_time": "1:22:13"} | |
| {"current_steps": 7400, "total_steps": 8436, "loss": 0.1264, "learning_rate": 4.524653200668461e-07, "epoch": 2.631111111111111, "percentage": 87.72, "elapsed_time": "9:41:28", "remaining_time": "1:21:24"} | |
| {"current_steps": 7410, "total_steps": 8436, "loss": 0.1213, "learning_rate": 4.439036156821225e-07, "epoch": 2.634666666666667, "percentage": 87.84, "elapsed_time": "9:42:06", "remaining_time": "1:20:35"} | |
| {"current_steps": 7420, "total_steps": 8436, "loss": 0.1182, "learning_rate": 4.3541992656991163e-07, "epoch": 2.6382222222222222, "percentage": 87.96, "elapsed_time": "9:42:44", "remaining_time": "1:19:47"} | |
| {"current_steps": 7430, "total_steps": 8436, "loss": 0.1453, "learning_rate": 4.2701439799871847e-07, "epoch": 2.6417777777777776, "percentage": 88.07, "elapsed_time": "9:43:20", "remaining_time": "1:18:59"} | |
| {"current_steps": 7440, "total_steps": 8436, "loss": 0.1284, "learning_rate": 4.1868717389868694e-07, "epoch": 2.6453333333333333, "percentage": 88.19, "elapsed_time": "9:43:56", "remaining_time": "1:18:10"} | |
| {"current_steps": 7450, "total_steps": 8436, "loss": 0.1289, "learning_rate": 4.1043839685913135e-07, "epoch": 2.648888888888889, "percentage": 88.31, "elapsed_time": "9:44:33", "remaining_time": "1:17:21"} | |
| {"current_steps": 7460, "total_steps": 8436, "loss": 0.122, "learning_rate": 4.022682081260942e-07, "epoch": 2.6524444444444444, "percentage": 88.43, "elapsed_time": "9:45:10", "remaining_time": "1:16:33"} | |
| {"current_steps": 7470, "total_steps": 8436, "loss": 0.1292, "learning_rate": 3.941767475999297e-07, "epoch": 2.656, "percentage": 88.55, "elapsed_time": "9:45:49", "remaining_time": "1:15:45"} | |
| {"current_steps": 7480, "total_steps": 8436, "loss": 0.1281, "learning_rate": 3.8616415383291083e-07, "epoch": 2.6595555555555555, "percentage": 88.67, "elapsed_time": "9:46:25", "remaining_time": "1:14:56"} | |
| {"current_steps": 7490, "total_steps": 8436, "loss": 0.1205, "learning_rate": 3.7823056402684856e-07, "epoch": 2.663111111111111, "percentage": 88.79, "elapsed_time": "9:46:59", "remaining_time": "1:14:08"} | |
| {"current_steps": 7500, "total_steps": 8436, "loss": 0.1405, "learning_rate": 3.70376114030751e-07, "epoch": 2.6666666666666665, "percentage": 88.9, "elapsed_time": "9:47:34", "remaining_time": "1:13:19"} | |
| {"current_steps": 7500, "total_steps": 8436, "eval_loss": 0.2399507761001587, "epoch": 2.6666666666666665, "percentage": 88.9, "elapsed_time": "9:56:56", "remaining_time": "1:14:29"} | |
| {"current_steps": 7510, "total_steps": 8436, "loss": 0.1424, "learning_rate": 3.626009383384926e-07, "epoch": 2.6702222222222223, "percentage": 89.02, "elapsed_time": "9:57:34", "remaining_time": "1:13:40"} | |
| {"current_steps": 7520, "total_steps": 8436, "loss": 0.1242, "learning_rate": 3.549051700865136e-07, "epoch": 2.6737777777777776, "percentage": 89.14, "elapsed_time": "9:58:11", "remaining_time": "1:12:51"} | |
| {"current_steps": 7530, "total_steps": 8436, "loss": 0.125, "learning_rate": 3.47288941051539e-07, "epoch": 2.6773333333333333, "percentage": 89.26, "elapsed_time": "9:58:48", "remaining_time": "1:12:02"} | |
| {"current_steps": 7540, "total_steps": 8436, "loss": 0.1253, "learning_rate": 3.3975238164831893e-07, "epoch": 2.680888888888889, "percentage": 89.38, "elapsed_time": "9:59:25", "remaining_time": "1:11:13"} | |
| {"current_steps": 7550, "total_steps": 8436, "loss": 0.1322, "learning_rate": 3.322956209274031e-07, "epoch": 2.6844444444444444, "percentage": 89.5, "elapsed_time": "10:00:03", "remaining_time": "1:10:25"} | |
| {"current_steps": 7560, "total_steps": 8436, "loss": 0.1355, "learning_rate": 3.2491878657292643e-07, "epoch": 2.6879999999999997, "percentage": 89.62, "elapsed_time": "10:00:37", "remaining_time": "1:09:35"} | |
| {"current_steps": 7570, "total_steps": 8436, "loss": 0.1179, "learning_rate": 3.176220049004197e-07, "epoch": 2.6915555555555555, "percentage": 89.73, "elapsed_time": "10:01:14", "remaining_time": "1:08:46"} | |
| {"current_steps": 7580, "total_steps": 8436, "loss": 0.1338, "learning_rate": 3.104054008546525e-07, "epoch": 2.6951111111111112, "percentage": 89.85, "elapsed_time": "10:01:49", "remaining_time": "1:07:57"} | |
| {"current_steps": 7590, "total_steps": 8436, "loss": 0.131, "learning_rate": 3.032690980074915e-07, "epoch": 2.6986666666666665, "percentage": 89.97, "elapsed_time": "10:02:24", "remaining_time": "1:07:08"} | |
| {"current_steps": 7600, "total_steps": 8436, "loss": 0.1223, "learning_rate": 2.962132185557826e-07, "epoch": 2.7022222222222223, "percentage": 90.09, "elapsed_time": "10:03:00", "remaining_time": "1:06:19"} | |
| {"current_steps": 7610, "total_steps": 8436, "loss": 0.1282, "learning_rate": 2.892378833192611e-07, "epoch": 2.7057777777777776, "percentage": 90.21, "elapsed_time": "10:03:39", "remaining_time": "1:05:31"} | |
| {"current_steps": 7620, "total_steps": 8436, "loss": 0.1321, "learning_rate": 2.823432117384822e-07, "epoch": 2.7093333333333334, "percentage": 90.33, "elapsed_time": "10:04:14", "remaining_time": "1:04:42"} | |
| {"current_steps": 7630, "total_steps": 8436, "loss": 0.1266, "learning_rate": 2.755293218727739e-07, "epoch": 2.712888888888889, "percentage": 90.45, "elapsed_time": "10:04:50", "remaining_time": "1:03:53"} | |
| {"current_steps": 7640, "total_steps": 8436, "loss": 0.1356, "learning_rate": 2.6879633039821994e-07, "epoch": 2.7164444444444444, "percentage": 90.56, "elapsed_time": "10:05:26", "remaining_time": "1:03:04"} | |
| {"current_steps": 7650, "total_steps": 8436, "loss": 0.1262, "learning_rate": 2.62144352605655e-07, "epoch": 2.7199999999999998, "percentage": 90.68, "elapsed_time": "10:06:01", "remaining_time": "1:02:15"} | |
| {"current_steps": 7660, "total_steps": 8436, "loss": 0.1315, "learning_rate": 2.555735023986966e-07, "epoch": 2.7235555555555555, "percentage": 90.8, "elapsed_time": "10:06:38", "remaining_time": "1:01:27"} | |
| {"current_steps": 7670, "total_steps": 8436, "loss": 0.1179, "learning_rate": 2.4908389229179484e-07, "epoch": 2.7271111111111113, "percentage": 90.92, "elapsed_time": "10:07:15", "remaining_time": "1:00:38"} | |
| {"current_steps": 7680, "total_steps": 8436, "loss": 0.1122, "learning_rate": 2.4267563340830026e-07, "epoch": 2.7306666666666666, "percentage": 91.04, "elapsed_time": "10:07:52", "remaining_time": "0:59:50"} | |
| {"current_steps": 7690, "total_steps": 8436, "loss": 0.1372, "learning_rate": 2.363488354785648e-07, "epoch": 2.7342222222222223, "percentage": 91.16, "elapsed_time": "10:08:27", "remaining_time": "0:59:01"} | |
| {"current_steps": 7700, "total_steps": 8436, "loss": 0.1303, "learning_rate": 2.301036068380641e-07, "epoch": 2.7377777777777776, "percentage": 91.28, "elapsed_time": "10:09:05", "remaining_time": "0:58:13"} | |
| {"current_steps": 7710, "total_steps": 8436, "loss": 0.121, "learning_rate": 2.239400544255399e-07, "epoch": 2.7413333333333334, "percentage": 91.39, "elapsed_time": "10:09:40", "remaining_time": "0:57:24"} | |
| {"current_steps": 7720, "total_steps": 8436, "loss": 0.1249, "learning_rate": 2.178582837811688e-07, "epoch": 2.744888888888889, "percentage": 91.51, "elapsed_time": "10:10:17", "remaining_time": "0:56:36"} | |
| {"current_steps": 7730, "total_steps": 8436, "loss": 0.133, "learning_rate": 2.1185839904475869e-07, "epoch": 2.7484444444444445, "percentage": 91.63, "elapsed_time": "10:10:51", "remaining_time": "0:55:47"} | |
| {"current_steps": 7740, "total_steps": 8436, "loss": 0.1304, "learning_rate": 2.0594050295395852e-07, "epoch": 2.752, "percentage": 91.75, "elapsed_time": "10:11:24", "remaining_time": "0:54:58"} | |
| {"current_steps": 7750, "total_steps": 8436, "loss": 0.1385, "learning_rate": 2.0010469684250856e-07, "epoch": 2.7555555555555555, "percentage": 91.87, "elapsed_time": "10:11:59", "remaining_time": "0:54:10"} | |
| {"current_steps": 7760, "total_steps": 8436, "loss": 0.1365, "learning_rate": 1.9435108063849684e-07, "epoch": 2.7591111111111113, "percentage": 91.99, "elapsed_time": "10:12:36", "remaining_time": "0:53:21"} | |
| {"current_steps": 7770, "total_steps": 8436, "loss": 0.1278, "learning_rate": 1.8867975286265106e-07, "epoch": 2.7626666666666666, "percentage": 92.11, "elapsed_time": "10:13:11", "remaining_time": "0:52:33"} | |
| {"current_steps": 7780, "total_steps": 8436, "loss": 0.1169, "learning_rate": 1.830908106266538e-07, "epoch": 2.7662222222222224, "percentage": 92.22, "elapsed_time": "10:13:46", "remaining_time": "0:51:45"} | |
| {"current_steps": 7790, "total_steps": 8436, "loss": 0.143, "learning_rate": 1.7758434963147665e-07, "epoch": 2.7697777777777777, "percentage": 92.34, "elapsed_time": "10:14:22", "remaining_time": "0:50:56"} | |
| {"current_steps": 7800, "total_steps": 8436, "loss": 0.1335, "learning_rate": 1.7216046416574316e-07, "epoch": 2.7733333333333334, "percentage": 92.46, "elapsed_time": "10:14:57", "remaining_time": "0:50:08"} | |
| {"current_steps": 7810, "total_steps": 8436, "loss": 0.1338, "learning_rate": 1.66819247104113e-07, "epoch": 2.7768888888888887, "percentage": 92.58, "elapsed_time": "10:15:32", "remaining_time": "0:49:20"} | |
| {"current_steps": 7820, "total_steps": 8436, "loss": 0.1203, "learning_rate": 1.6156078990569313e-07, "epoch": 2.7804444444444445, "percentage": 92.7, "elapsed_time": "10:16:09", "remaining_time": "0:48:32"} | |
| {"current_steps": 7830, "total_steps": 8436, "loss": 0.1216, "learning_rate": 1.563851826124696e-07, "epoch": 2.784, "percentage": 92.82, "elapsed_time": "10:16:45", "remaining_time": "0:47:44"} | |
| {"current_steps": 7840, "total_steps": 8436, "loss": 0.1181, "learning_rate": 1.5129251384776998e-07, "epoch": 2.7875555555555556, "percentage": 92.94, "elapsed_time": "10:17:19", "remaining_time": "0:46:55"} | |
| {"current_steps": 7850, "total_steps": 8436, "loss": 0.139, "learning_rate": 1.462828708147379e-07, "epoch": 2.7911111111111113, "percentage": 93.05, "elapsed_time": "10:17:57", "remaining_time": "0:46:07"} | |
| {"current_steps": 7860, "total_steps": 8436, "loss": 0.1373, "learning_rate": 1.4135633929485026e-07, "epoch": 2.7946666666666666, "percentage": 93.17, "elapsed_time": "10:18:32", "remaining_time": "0:45:19"} | |
| {"current_steps": 7870, "total_steps": 8436, "loss": 0.1294, "learning_rate": 1.3651300364644126e-07, "epoch": 2.7982222222222224, "percentage": 93.29, "elapsed_time": "10:19:08", "remaining_time": "0:44:31"} | |
| {"current_steps": 7880, "total_steps": 8436, "loss": 0.1158, "learning_rate": 1.317529468032569e-07, "epoch": 2.8017777777777777, "percentage": 93.41, "elapsed_time": "10:19:47", "remaining_time": "0:43:43"} | |
| {"current_steps": 7890, "total_steps": 8436, "loss": 0.124, "learning_rate": 1.2707625027304104e-07, "epoch": 2.8053333333333335, "percentage": 93.53, "elapsed_time": "10:20:24", "remaining_time": "0:42:56"} | |
| {"current_steps": 7900, "total_steps": 8436, "loss": 0.1332, "learning_rate": 1.2248299413613607e-07, "epoch": 2.8088888888888888, "percentage": 93.65, "elapsed_time": "10:21:01", "remaining_time": "0:42:08"} | |
| {"current_steps": 7910, "total_steps": 8436, "loss": 0.1214, "learning_rate": 1.1797325704411e-07, "epoch": 2.8124444444444445, "percentage": 93.76, "elapsed_time": "10:21:35", "remaining_time": "0:41:20"} | |
| {"current_steps": 7920, "total_steps": 8436, "loss": 0.133, "learning_rate": 1.1354711621841208e-07, "epoch": 2.816, "percentage": 93.88, "elapsed_time": "10:22:13", "remaining_time": "0:40:32"} | |
| {"current_steps": 7930, "total_steps": 8436, "loss": 0.1205, "learning_rate": 1.0920464744905157e-07, "epoch": 2.8195555555555556, "percentage": 94.0, "elapsed_time": "10:22:49", "remaining_time": "0:39:44"} | |
| {"current_steps": 7940, "total_steps": 8436, "loss": 0.1469, "learning_rate": 1.0494592509329716e-07, "epoch": 2.8231111111111113, "percentage": 94.12, "elapsed_time": "10:23:25", "remaining_time": "0:38:56"} | |
| {"current_steps": 7950, "total_steps": 8436, "loss": 0.1269, "learning_rate": 1.007710220744057e-07, "epoch": 2.8266666666666667, "percentage": 94.24, "elapsed_time": "10:24:05", "remaining_time": "0:38:09"} | |
| {"current_steps": 7960, "total_steps": 8436, "loss": 0.1322, "learning_rate": 9.668000988037163e-08, "epoch": 2.830222222222222, "percentage": 94.36, "elapsed_time": "10:24:43", "remaining_time": "0:37:21"} | |
| {"current_steps": 7970, "total_steps": 8436, "loss": 0.1354, "learning_rate": 9.267295856270509e-08, "epoch": 2.8337777777777777, "percentage": 94.48, "elapsed_time": "10:25:18", "remaining_time": "0:36:33"} | |
| {"current_steps": 7980, "total_steps": 8436, "loss": 0.1319, "learning_rate": 8.874993673523236e-08, "epoch": 2.8373333333333335, "percentage": 94.59, "elapsed_time": "10:25:55", "remaining_time": "0:35:46"} | |
| {"current_steps": 7990, "total_steps": 8436, "loss": 0.1274, "learning_rate": 8.491101157291737e-08, "epoch": 2.840888888888889, "percentage": 94.71, "elapsed_time": "10:26:30", "remaining_time": "0:34:58"} | |
| {"current_steps": 8000, "total_steps": 8436, "loss": 0.1318, "learning_rate": 8.115624881071594e-08, "epoch": 2.8444444444444446, "percentage": 94.83, "elapsed_time": "10:27:05", "remaining_time": "0:34:10"} | |
| {"current_steps": 8000, "total_steps": 8436, "eval_loss": 0.23905394971370697, "epoch": 2.8444444444444446, "percentage": 94.83, "elapsed_time": "10:36:25", "remaining_time": "0:34:41"} | |
| {"current_steps": 8010, "total_steps": 8436, "loss": 0.1199, "learning_rate": 7.748571274244776e-08, "epoch": 2.848, "percentage": 94.95, "elapsed_time": "10:37:20", "remaining_time": "0:33:53"} | |
| {"current_steps": 8020, "total_steps": 8436, "loss": 0.1494, "learning_rate": 7.389946621969679e-08, "epoch": 2.8515555555555556, "percentage": 95.07, "elapsed_time": "10:37:58", "remaining_time": "0:33:05"} | |
| {"current_steps": 8030, "total_steps": 8436, "loss": 0.1354, "learning_rate": 7.039757065073316e-08, "epoch": 2.8551111111111114, "percentage": 95.19, "elapsed_time": "10:38:34", "remaining_time": "0:32:17"} | |
| {"current_steps": 8040, "total_steps": 8436, "loss": 0.1246, "learning_rate": 6.698008599946404e-08, "epoch": 2.8586666666666667, "percentage": 95.31, "elapsed_time": "10:39:11", "remaining_time": "0:31:28"} | |
| {"current_steps": 8050, "total_steps": 8436, "loss": 0.1266, "learning_rate": 6.364707078440335e-08, "epoch": 2.862222222222222, "percentage": 95.42, "elapsed_time": "10:39:49", "remaining_time": "0:30:40"} | |
| {"current_steps": 8060, "total_steps": 8436, "loss": 0.134, "learning_rate": 6.039858207767479e-08, "epoch": 2.8657777777777778, "percentage": 95.54, "elapsed_time": "10:40:26", "remaining_time": "0:29:52"} | |
| {"current_steps": 8070, "total_steps": 8436, "loss": 0.1326, "learning_rate": 5.723467550403039e-08, "epoch": 2.8693333333333335, "percentage": 95.66, "elapsed_time": "10:41:01", "remaining_time": "0:29:04"} | |
| {"current_steps": 8080, "total_steps": 8436, "loss": 0.1488, "learning_rate": 5.4155405239897926e-08, "epoch": 2.872888888888889, "percentage": 95.78, "elapsed_time": "10:41:38", "remaining_time": "0:28:16"} | |
| {"current_steps": 8090, "total_steps": 8436, "loss": 0.1232, "learning_rate": 5.1160824012458367e-08, "epoch": 2.8764444444444446, "percentage": 95.9, "elapsed_time": "10:42:13", "remaining_time": "0:27:28"} | |
| {"current_steps": 8100, "total_steps": 8436, "loss": 0.1264, "learning_rate": 4.825098309873544e-08, "epoch": 2.88, "percentage": 96.02, "elapsed_time": "10:42:50", "remaining_time": "0:26:39"} | |
| {"current_steps": 8110, "total_steps": 8436, "loss": 0.1328, "learning_rate": 4.542593232472414e-08, "epoch": 2.8835555555555556, "percentage": 96.14, "elapsed_time": "10:43:25", "remaining_time": "0:25:51"} | |
| {"current_steps": 8120, "total_steps": 8436, "loss": 0.1264, "learning_rate": 4.268572006453364e-08, "epoch": 2.887111111111111, "percentage": 96.25, "elapsed_time": "10:44:01", "remaining_time": "0:25:03"} | |
| {"current_steps": 8130, "total_steps": 8436, "loss": 0.1308, "learning_rate": 4.003039323956126e-08, "epoch": 2.8906666666666667, "percentage": 96.37, "elapsed_time": "10:44:37", "remaining_time": "0:24:15"} | |
| {"current_steps": 8140, "total_steps": 8436, "loss": 0.1101, "learning_rate": 3.7459997317687014e-08, "epoch": 2.894222222222222, "percentage": 96.49, "elapsed_time": "10:45:12", "remaining_time": "0:23:27"} | |
| {"current_steps": 8150, "total_steps": 8436, "loss": 0.1249, "learning_rate": 3.4974576312497564e-08, "epoch": 2.897777777777778, "percentage": 96.61, "elapsed_time": "10:45:48", "remaining_time": "0:22:39"} | |
| {"current_steps": 8160, "total_steps": 8436, "loss": 0.1193, "learning_rate": 3.25741727825285e-08, "epoch": 2.9013333333333335, "percentage": 96.73, "elapsed_time": "10:46:22", "remaining_time": "0:21:51"} | |
| {"current_steps": 8170, "total_steps": 8436, "loss": 0.1199, "learning_rate": 3.025882783054046e-08, "epoch": 2.904888888888889, "percentage": 96.85, "elapsed_time": "10:46:59", "remaining_time": "0:21:03"} | |
| {"current_steps": 8180, "total_steps": 8436, "loss": 0.1365, "learning_rate": 2.8028581102811924e-08, "epoch": 2.9084444444444446, "percentage": 96.97, "elapsed_time": "10:47:35", "remaining_time": "0:20:16"} | |
| {"current_steps": 8190, "total_steps": 8436, "loss": 0.1323, "learning_rate": 2.588347078846254e-08, "epoch": 2.912, "percentage": 97.08, "elapsed_time": "10:48:09", "remaining_time": "0:19:28"} | |
| {"current_steps": 8200, "total_steps": 8436, "loss": 0.1244, "learning_rate": 2.382353361879586e-08, "epoch": 2.9155555555555557, "percentage": 97.2, "elapsed_time": "10:48:45", "remaining_time": "0:18:40"} | |
| {"current_steps": 8210, "total_steps": 8436, "loss": 0.1241, "learning_rate": 2.18488048666754e-08, "epoch": 2.919111111111111, "percentage": 97.32, "elapsed_time": "10:49:24", "remaining_time": "0:17:52"} | |
| {"current_steps": 8220, "total_steps": 8436, "loss": 0.132, "learning_rate": 1.995931834591569e-08, "epoch": 2.9226666666666667, "percentage": 97.44, "elapsed_time": "10:50:03", "remaining_time": "0:17:04"} | |
| {"current_steps": 8230, "total_steps": 8436, "loss": 0.1359, "learning_rate": 1.8155106410706613e-08, "epoch": 2.926222222222222, "percentage": 97.56, "elapsed_time": "10:50:41", "remaining_time": "0:16:17"} | |
| {"current_steps": 8240, "total_steps": 8436, "loss": 0.1477, "learning_rate": 1.6436199955057742e-08, "epoch": 2.929777777777778, "percentage": 97.68, "elapsed_time": "10:51:18", "remaining_time": "0:15:29"} | |
| {"current_steps": 8250, "total_steps": 8436, "loss": 0.1482, "learning_rate": 1.480262841226987e-08, "epoch": 2.9333333333333336, "percentage": 97.8, "elapsed_time": "10:51:57", "remaining_time": "0:14:41"} | |
| {"current_steps": 8260, "total_steps": 8436, "loss": 0.1369, "learning_rate": 1.3254419754430981e-08, "epoch": 2.936888888888889, "percentage": 97.91, "elapsed_time": "10:52:33", "remaining_time": "0:13:54"} | |
| {"current_steps": 8270, "total_steps": 8436, "loss": 0.1265, "learning_rate": 1.1791600491937172e-08, "epoch": 2.940444444444444, "percentage": 98.03, "elapsed_time": "10:53:11", "remaining_time": "0:13:06"} | |
| {"current_steps": 8280, "total_steps": 8436, "loss": 0.1233, "learning_rate": 1.041419567303914e-08, "epoch": 2.944, "percentage": 98.15, "elapsed_time": "10:53:45", "remaining_time": "0:12:19"} | |
| {"current_steps": 8290, "total_steps": 8436, "loss": 0.1308, "learning_rate": 9.12222888341252e-09, "epoch": 2.9475555555555557, "percentage": 98.27, "elapsed_time": "10:54:24", "remaining_time": "0:11:31"} | |
| {"current_steps": 8300, "total_steps": 8436, "loss": 0.141, "learning_rate": 7.915722245754876e-09, "epoch": 2.951111111111111, "percentage": 98.39, "elapsed_time": "10:55:03", "remaining_time": "0:10:44"} | |
| {"current_steps": 8310, "total_steps": 8436, "loss": 0.1493, "learning_rate": 6.7946964194059994e-09, "epoch": 2.9546666666666668, "percentage": 98.51, "elapsed_time": "10:55:39", "remaining_time": "0:09:56"} | |
| {"current_steps": 8320, "total_steps": 8436, "loss": 0.1284, "learning_rate": 5.759170599994868e-09, "epoch": 2.958222222222222, "percentage": 98.62, "elapsed_time": "10:56:15", "remaining_time": "0:09:08"} | |
| {"current_steps": 8330, "total_steps": 8436, "loss": 0.1231, "learning_rate": 4.809162519110455e-09, "epoch": 2.961777777777778, "percentage": 98.74, "elapsed_time": "10:56:52", "remaining_time": "0:08:21"} | |
| {"current_steps": 8340, "total_steps": 8436, "loss": 0.1466, "learning_rate": 3.944688443998646e-09, "epoch": 2.9653333333333336, "percentage": 98.86, "elapsed_time": "10:57:27", "remaining_time": "0:07:34"} | |
| {"current_steps": 8350, "total_steps": 8436, "loss": 0.126, "learning_rate": 3.16576317728301e-09, "epoch": 2.968888888888889, "percentage": 98.98, "elapsed_time": "10:58:01", "remaining_time": "0:06:46"} | |
| {"current_steps": 8360, "total_steps": 8436, "loss": 0.1361, "learning_rate": 2.4724000567116768e-09, "epoch": 2.9724444444444442, "percentage": 99.1, "elapsed_time": "10:58:36", "remaining_time": "0:05:59"} | |
| {"current_steps": 8370, "total_steps": 8436, "loss": 0.1258, "learning_rate": 1.86461095492918e-09, "epoch": 2.976, "percentage": 99.22, "elapsed_time": "10:59:13", "remaining_time": "0:05:11"} | |
| {"current_steps": 8380, "total_steps": 8436, "loss": 0.1311, "learning_rate": 1.3424062792738445e-09, "epoch": 2.9795555555555557, "percentage": 99.34, "elapsed_time": "10:59:49", "remaining_time": "0:04:24"} | |
| {"current_steps": 8390, "total_steps": 8436, "loss": 0.1236, "learning_rate": 9.057949715968183e-10, "epoch": 2.983111111111111, "percentage": 99.45, "elapsed_time": "11:00:27", "remaining_time": "0:03:37"} | |
| {"current_steps": 8400, "total_steps": 8436, "loss": 0.1171, "learning_rate": 5.547845081121939e-10, "epoch": 2.986666666666667, "percentage": 99.57, "elapsed_time": "11:01:04", "remaining_time": "0:02:49"} | |
| {"current_steps": 8410, "total_steps": 8436, "loss": 0.1309, "learning_rate": 2.89380899267111e-10, "epoch": 2.990222222222222, "percentage": 99.69, "elapsed_time": "11:01:45", "remaining_time": "0:02:02"} | |
| {"current_steps": 8420, "total_steps": 8436, "loss": 0.1314, "learning_rate": 1.0958868963906188e-10, "epoch": 2.993777777777778, "percentage": 99.81, "elapsed_time": "11:02:22", "remaining_time": "0:01:15"} | |
| {"current_steps": 8430, "total_steps": 8436, "loss": 0.1267, "learning_rate": 1.541095785984048e-11, "epoch": 2.997333333333333, "percentage": 99.93, "elapsed_time": "11:03:01", "remaining_time": "0:00:28"} | |
| {"current_steps": 8436, "total_steps": 8436, "epoch": 2.9994666666666667, "percentage": 100.0, "elapsed_time": "11:03:43", "remaining_time": "0:00:00"} | |