sedrickkeh's picture
Training in progress, epoch 2
a9a93fd verified
{"current_steps": 10, "total_steps": 672, "loss": 0.7473, "lr": 5e-06, "epoch": 0.044617958728388175, "percentage": 1.49, "elapsed_time": "0:08:56", "remaining_time": "9:52:22"}
{"current_steps": 20, "total_steps": 672, "loss": 0.6749, "lr": 5e-06, "epoch": 0.08923591745677635, "percentage": 2.98, "elapsed_time": "0:17:49", "remaining_time": "9:40:58"}
{"current_steps": 30, "total_steps": 672, "loss": 0.6518, "lr": 5e-06, "epoch": 0.13385387618516453, "percentage": 4.46, "elapsed_time": "0:26:41", "remaining_time": "9:31:06"}
{"current_steps": 40, "total_steps": 672, "loss": 0.6309, "lr": 5e-06, "epoch": 0.1784718349135527, "percentage": 5.95, "elapsed_time": "0:35:35", "remaining_time": "9:22:15"}
{"current_steps": 50, "total_steps": 672, "loss": 0.6242, "lr": 5e-06, "epoch": 0.22308979364194087, "percentage": 7.44, "elapsed_time": "0:44:28", "remaining_time": "9:13:11"}
{"current_steps": 60, "total_steps": 672, "loss": 0.6177, "lr": 5e-06, "epoch": 0.26770775237032907, "percentage": 8.93, "elapsed_time": "0:53:19", "remaining_time": "9:03:57"}
{"current_steps": 70, "total_steps": 672, "loss": 0.607, "lr": 5e-06, "epoch": 0.3123257110987172, "percentage": 10.42, "elapsed_time": "1:02:11", "remaining_time": "8:54:55"}
{"current_steps": 80, "total_steps": 672, "loss": 0.608, "lr": 5e-06, "epoch": 0.3569436698271054, "percentage": 11.9, "elapsed_time": "1:11:04", "remaining_time": "8:45:53"}
{"current_steps": 90, "total_steps": 672, "loss": 0.5995, "lr": 5e-06, "epoch": 0.4015616285554936, "percentage": 13.39, "elapsed_time": "1:19:55", "remaining_time": "8:36:50"}
{"current_steps": 100, "total_steps": 672, "loss": 0.6024, "lr": 5e-06, "epoch": 0.44617958728388174, "percentage": 14.88, "elapsed_time": "1:28:47", "remaining_time": "8:27:54"}
{"current_steps": 110, "total_steps": 672, "loss": 0.584, "lr": 5e-06, "epoch": 0.49079754601226994, "percentage": 16.37, "elapsed_time": "1:37:39", "remaining_time": "8:18:54"}
{"current_steps": 120, "total_steps": 672, "loss": 0.5869, "lr": 5e-06, "epoch": 0.5354155047406581, "percentage": 17.86, "elapsed_time": "1:46:31", "remaining_time": "8:10:01"}
{"current_steps": 130, "total_steps": 672, "loss": 0.5869, "lr": 5e-06, "epoch": 0.5800334634690463, "percentage": 19.35, "elapsed_time": "1:55:24", "remaining_time": "8:01:09"}
{"current_steps": 140, "total_steps": 672, "loss": 0.5874, "lr": 5e-06, "epoch": 0.6246514221974344, "percentage": 20.83, "elapsed_time": "2:04:17", "remaining_time": "7:52:16"}
{"current_steps": 150, "total_steps": 672, "loss": 0.5779, "lr": 5e-06, "epoch": 0.6692693809258227, "percentage": 22.32, "elapsed_time": "2:13:09", "remaining_time": "7:43:24"}
{"current_steps": 160, "total_steps": 672, "loss": 0.5841, "lr": 5e-06, "epoch": 0.7138873396542108, "percentage": 23.81, "elapsed_time": "2:22:03", "remaining_time": "7:34:33"}
{"current_steps": 170, "total_steps": 672, "loss": 0.5779, "lr": 5e-06, "epoch": 0.758505298382599, "percentage": 25.3, "elapsed_time": "2:30:56", "remaining_time": "7:25:44"}
{"current_steps": 180, "total_steps": 672, "loss": 0.574, "lr": 5e-06, "epoch": 0.8031232571109872, "percentage": 26.79, "elapsed_time": "2:39:48", "remaining_time": "7:16:49"}
{"current_steps": 190, "total_steps": 672, "loss": 0.5733, "lr": 5e-06, "epoch": 0.8477412158393753, "percentage": 28.27, "elapsed_time": "2:48:42", "remaining_time": "7:07:59"}
{"current_steps": 200, "total_steps": 672, "loss": 0.572, "lr": 5e-06, "epoch": 0.8923591745677635, "percentage": 29.76, "elapsed_time": "2:57:35", "remaining_time": "6:59:06"}
{"current_steps": 210, "total_steps": 672, "loss": 0.5717, "lr": 5e-06, "epoch": 0.9369771332961517, "percentage": 31.25, "elapsed_time": "3:06:27", "remaining_time": "6:50:13"}
{"current_steps": 220, "total_steps": 672, "loss": 0.5714, "lr": 5e-06, "epoch": 0.9815950920245399, "percentage": 32.74, "elapsed_time": "3:15:20", "remaining_time": "6:41:21"}
{"current_steps": 224, "total_steps": 672, "eval_loss": 0.5709418058395386, "epoch": 0.9994422755158952, "percentage": 33.33, "elapsed_time": "3:22:42", "remaining_time": "6:45:24"}
{"current_steps": 230, "total_steps": 672, "loss": 0.6088, "lr": 5e-06, "epoch": 1.0262130507529281, "percentage": 34.23, "elapsed_time": "3:28:54", "remaining_time": "6:41:28"}
{"current_steps": 240, "total_steps": 672, "loss": 0.5447, "lr": 5e-06, "epoch": 1.0708310094813163, "percentage": 35.71, "elapsed_time": "3:37:47", "remaining_time": "6:32:00"}
{"current_steps": 250, "total_steps": 672, "loss": 0.5438, "lr": 5e-06, "epoch": 1.1154489682097044, "percentage": 37.2, "elapsed_time": "3:46:40", "remaining_time": "6:22:37"}
{"current_steps": 260, "total_steps": 672, "loss": 0.5458, "lr": 5e-06, "epoch": 1.1600669269380925, "percentage": 38.69, "elapsed_time": "3:55:34", "remaining_time": "6:13:17"}
{"current_steps": 270, "total_steps": 672, "loss": 0.5483, "lr": 5e-06, "epoch": 1.2046848856664807, "percentage": 40.18, "elapsed_time": "4:04:26", "remaining_time": "6:03:57"}
{"current_steps": 280, "total_steps": 672, "loss": 0.5442, "lr": 5e-06, "epoch": 1.2493028443948688, "percentage": 41.67, "elapsed_time": "4:13:19", "remaining_time": "5:54:39"}
{"current_steps": 290, "total_steps": 672, "loss": 0.5474, "lr": 5e-06, "epoch": 1.2939208031232572, "percentage": 43.15, "elapsed_time": "4:22:14", "remaining_time": "5:45:25"}
{"current_steps": 300, "total_steps": 672, "loss": 0.5327, "lr": 5e-06, "epoch": 1.3385387618516453, "percentage": 44.64, "elapsed_time": "4:31:07", "remaining_time": "5:36:11"}
{"current_steps": 310, "total_steps": 672, "loss": 0.5388, "lr": 5e-06, "epoch": 1.3831567205800335, "percentage": 46.13, "elapsed_time": "4:40:00", "remaining_time": "5:26:58"}
{"current_steps": 320, "total_steps": 672, "loss": 0.5392, "lr": 5e-06, "epoch": 1.4277746793084216, "percentage": 47.62, "elapsed_time": "4:48:54", "remaining_time": "5:17:47"}
{"current_steps": 330, "total_steps": 672, "loss": 0.5353, "lr": 5e-06, "epoch": 1.4723926380368098, "percentage": 49.11, "elapsed_time": "4:57:48", "remaining_time": "5:08:38"}
{"current_steps": 340, "total_steps": 672, "loss": 0.5388, "lr": 5e-06, "epoch": 1.5170105967651981, "percentage": 50.6, "elapsed_time": "5:06:41", "remaining_time": "4:59:28"}
{"current_steps": 350, "total_steps": 672, "loss": 0.5321, "lr": 5e-06, "epoch": 1.561628555493586, "percentage": 52.08, "elapsed_time": "5:15:34", "remaining_time": "4:50:19"}
{"current_steps": 360, "total_steps": 672, "loss": 0.5355, "lr": 5e-06, "epoch": 1.6062465142219744, "percentage": 53.57, "elapsed_time": "5:24:27", "remaining_time": "4:41:12"}
{"current_steps": 370, "total_steps": 672, "loss": 0.5327, "lr": 5e-06, "epoch": 1.6508644729503625, "percentage": 55.06, "elapsed_time": "5:33:22", "remaining_time": "4:32:06"}
{"current_steps": 380, "total_steps": 672, "loss": 0.5405, "lr": 5e-06, "epoch": 1.6954824316787507, "percentage": 56.55, "elapsed_time": "5:42:16", "remaining_time": "4:23:00"}
{"current_steps": 390, "total_steps": 672, "loss": 0.5337, "lr": 5e-06, "epoch": 1.7401003904071388, "percentage": 58.04, "elapsed_time": "5:51:11", "remaining_time": "4:13:56"}
{"current_steps": 400, "total_steps": 672, "loss": 0.5325, "lr": 5e-06, "epoch": 1.784718349135527, "percentage": 59.52, "elapsed_time": "6:00:04", "remaining_time": "4:04:51"}
{"current_steps": 410, "total_steps": 672, "loss": 0.5315, "lr": 5e-06, "epoch": 1.8293363078639153, "percentage": 61.01, "elapsed_time": "6:08:59", "remaining_time": "3:55:47"}
{"current_steps": 420, "total_steps": 672, "loss": 0.5281, "lr": 5e-06, "epoch": 1.8739542665923032, "percentage": 62.5, "elapsed_time": "6:17:54", "remaining_time": "3:46:44"}
{"current_steps": 430, "total_steps": 672, "loss": 0.5316, "lr": 5e-06, "epoch": 1.9185722253206916, "percentage": 63.99, "elapsed_time": "6:26:50", "remaining_time": "3:37:42"}
{"current_steps": 440, "total_steps": 672, "loss": 0.5317, "lr": 5e-06, "epoch": 1.9631901840490797, "percentage": 65.48, "elapsed_time": "6:35:44", "remaining_time": "3:28:39"}
{"current_steps": 448, "total_steps": 672, "eval_loss": 0.5504088997840881, "epoch": 1.9988845510317903, "percentage": 66.67, "elapsed_time": "6:46:48", "remaining_time": "3:23:24"}
{"current_steps": 450, "total_steps": 672, "loss": 0.5741, "lr": 5e-06, "epoch": 2.007808142777468, "percentage": 66.96, "elapsed_time": "6:49:27", "remaining_time": "3:22:00"}
{"current_steps": 460, "total_steps": 672, "loss": 0.5027, "lr": 5e-06, "epoch": 2.0524261015058562, "percentage": 68.45, "elapsed_time": "6:58:22", "remaining_time": "3:12:48"}
{"current_steps": 470, "total_steps": 672, "loss": 0.5015, "lr": 5e-06, "epoch": 2.097044060234244, "percentage": 69.94, "elapsed_time": "7:07:16", "remaining_time": "3:03:38"}
{"current_steps": 480, "total_steps": 672, "loss": 0.4997, "lr": 5e-06, "epoch": 2.1416620189626325, "percentage": 71.43, "elapsed_time": "7:16:09", "remaining_time": "2:54:27"}
{"current_steps": 490, "total_steps": 672, "loss": 0.5066, "lr": 5e-06, "epoch": 2.1862799776910204, "percentage": 72.92, "elapsed_time": "7:25:02", "remaining_time": "2:45:18"}
{"current_steps": 500, "total_steps": 672, "loss": 0.5, "lr": 5e-06, "epoch": 2.230897936419409, "percentage": 74.4, "elapsed_time": "7:33:57", "remaining_time": "2:36:09"}
{"current_steps": 510, "total_steps": 672, "loss": 0.5048, "lr": 5e-06, "epoch": 2.275515895147797, "percentage": 75.89, "elapsed_time": "7:42:53", "remaining_time": "2:27:02"}
{"current_steps": 520, "total_steps": 672, "loss": 0.4972, "lr": 5e-06, "epoch": 2.320133853876185, "percentage": 77.38, "elapsed_time": "7:51:48", "remaining_time": "2:17:54"}
{"current_steps": 530, "total_steps": 672, "loss": 0.512, "lr": 5e-06, "epoch": 2.3647518126045735, "percentage": 78.87, "elapsed_time": "8:00:42", "remaining_time": "2:08:47"}
{"current_steps": 540, "total_steps": 672, "loss": 0.5102, "lr": 5e-06, "epoch": 2.4093697713329614, "percentage": 80.36, "elapsed_time": "8:09:36", "remaining_time": "1:59:40"}
{"current_steps": 550, "total_steps": 672, "loss": 0.5103, "lr": 5e-06, "epoch": 2.4539877300613497, "percentage": 81.85, "elapsed_time": "8:18:29", "remaining_time": "1:50:34"}
{"current_steps": 560, "total_steps": 672, "loss": 0.496, "lr": 5e-06, "epoch": 2.4986056887897377, "percentage": 83.33, "elapsed_time": "8:27:24", "remaining_time": "1:41:28"}
{"current_steps": 570, "total_steps": 672, "loss": 0.5098, "lr": 5e-06, "epoch": 2.543223647518126, "percentage": 84.82, "elapsed_time": "8:36:17", "remaining_time": "1:32:23"}
{"current_steps": 580, "total_steps": 672, "loss": 0.4983, "lr": 5e-06, "epoch": 2.5878416062465144, "percentage": 86.31, "elapsed_time": "8:45:11", "remaining_time": "1:23:18"}
{"current_steps": 590, "total_steps": 672, "loss": 0.5024, "lr": 5e-06, "epoch": 2.6324595649749023, "percentage": 87.8, "elapsed_time": "8:54:06", "remaining_time": "1:14:13"}
{"current_steps": 600, "total_steps": 672, "loss": 0.5018, "lr": 5e-06, "epoch": 2.6770775237032907, "percentage": 89.29, "elapsed_time": "9:03:01", "remaining_time": "1:05:09"}
{"current_steps": 610, "total_steps": 672, "loss": 0.4986, "lr": 5e-06, "epoch": 2.721695482431679, "percentage": 90.77, "elapsed_time": "9:11:57", "remaining_time": "0:56:06"}
{"current_steps": 620, "total_steps": 672, "loss": 0.5044, "lr": 5e-06, "epoch": 2.766313441160067, "percentage": 92.26, "elapsed_time": "9:20:52", "remaining_time": "0:47:02"}
{"current_steps": 630, "total_steps": 672, "loss": 0.4959, "lr": 5e-06, "epoch": 2.810931399888455, "percentage": 93.75, "elapsed_time": "9:29:47", "remaining_time": "0:37:59"}
{"current_steps": 640, "total_steps": 672, "loss": 0.5051, "lr": 5e-06, "epoch": 2.8555493586168432, "percentage": 95.24, "elapsed_time": "9:38:42", "remaining_time": "0:28:56"}
{"current_steps": 650, "total_steps": 672, "loss": 0.4967, "lr": 5e-06, "epoch": 2.9001673173452316, "percentage": 96.73, "elapsed_time": "9:47:37", "remaining_time": "0:19:53"}
{"current_steps": 660, "total_steps": 672, "loss": 0.4981, "lr": 5e-06, "epoch": 2.9447852760736195, "percentage": 98.21, "elapsed_time": "9:56:32", "remaining_time": "0:10:50"}
{"current_steps": 670, "total_steps": 672, "loss": 0.4944, "lr": 5e-06, "epoch": 2.989403234802008, "percentage": 99.7, "elapsed_time": "10:05:29", "remaining_time": "0:01:48"}
{"current_steps": 672, "total_steps": 672, "eval_loss": 0.5417667031288147, "epoch": 2.9983268265476855, "percentage": 100.0, "elapsed_time": "10:12:06", "remaining_time": "0:00:00"}
{"current_steps": 672, "total_steps": 672, "epoch": 2.9983268265476855, "percentage": 100.0, "elapsed_time": "10:13:21", "remaining_time": "0:00:00"}