sedrickkeh's picture
Training in progress, epoch 2
5af5347 verified
{"current_steps": 1, "total_steps": 93, "loss": 1.274, "lr": 1.0000000000000002e-06, "epoch": 0.032, "percentage": 1.08, "elapsed_time": "0:01:04", "remaining_time": "1:38:31"}
{"current_steps": 2, "total_steps": 93, "loss": 1.2584, "lr": 2.0000000000000003e-06, "epoch": 0.064, "percentage": 2.15, "elapsed_time": "0:01:58", "remaining_time": "1:29:56"}
{"current_steps": 3, "total_steps": 93, "loss": 1.2997, "lr": 3e-06, "epoch": 0.096, "percentage": 3.23, "elapsed_time": "0:02:53", "remaining_time": "1:26:45"}
{"current_steps": 4, "total_steps": 93, "loss": 1.2787, "lr": 4.000000000000001e-06, "epoch": 0.128, "percentage": 4.3, "elapsed_time": "0:03:54", "remaining_time": "1:27:06"}
{"current_steps": 5, "total_steps": 93, "loss": 1.1893, "lr": 5e-06, "epoch": 0.16, "percentage": 5.38, "elapsed_time": "0:04:49", "remaining_time": "1:25:00"}
{"current_steps": 6, "total_steps": 93, "loss": 1.1767, "lr": 6e-06, "epoch": 0.192, "percentage": 6.45, "elapsed_time": "0:05:35", "remaining_time": "1:21:05"}
{"current_steps": 7, "total_steps": 93, "loss": 1.1806, "lr": 7e-06, "epoch": 0.224, "percentage": 7.53, "elapsed_time": "0:06:38", "remaining_time": "1:21:38"}
{"current_steps": 8, "total_steps": 93, "loss": 1.158, "lr": 8.000000000000001e-06, "epoch": 0.256, "percentage": 8.6, "elapsed_time": "0:07:36", "remaining_time": "1:20:49"}
{"current_steps": 9, "total_steps": 93, "loss": 1.1352, "lr": 9e-06, "epoch": 0.288, "percentage": 9.68, "elapsed_time": "0:08:37", "remaining_time": "1:20:30"}
{"current_steps": 10, "total_steps": 93, "loss": 1.1387, "lr": 1e-05, "epoch": 0.32, "percentage": 10.75, "elapsed_time": "0:09:41", "remaining_time": "1:20:23"}
{"current_steps": 11, "total_steps": 93, "loss": 1.1677, "lr": 9.996418774081658e-06, "epoch": 0.352, "percentage": 11.83, "elapsed_time": "0:10:34", "remaining_time": "1:18:51"}
{"current_steps": 12, "total_steps": 93, "loss": 1.1415, "lr": 9.985680226398261e-06, "epoch": 0.384, "percentage": 12.9, "elapsed_time": "0:11:25", "remaining_time": "1:17:08"}
{"current_steps": 13, "total_steps": 93, "loss": 1.0675, "lr": 9.967799739815925e-06, "epoch": 0.416, "percentage": 13.98, "elapsed_time": "0:12:20", "remaining_time": "1:15:54"}
{"current_steps": 14, "total_steps": 93, "loss": 1.0578, "lr": 9.942802927959444e-06, "epoch": 0.448, "percentage": 15.05, "elapsed_time": "0:13:10", "remaining_time": "1:14:20"}
{"current_steps": 15, "total_steps": 93, "loss": 1.0096, "lr": 9.910725598521014e-06, "epoch": 0.48, "percentage": 16.13, "elapsed_time": "0:14:11", "remaining_time": "1:13:47"}
{"current_steps": 16, "total_steps": 93, "loss": 1.0094, "lr": 9.871613701966067e-06, "epoch": 0.512, "percentage": 17.2, "elapsed_time": "0:15:15", "remaining_time": "1:13:26"}
{"current_steps": 17, "total_steps": 93, "loss": 1.0001, "lr": 9.825523265709667e-06, "epoch": 0.544, "percentage": 18.28, "elapsed_time": "0:16:06", "remaining_time": "1:12:01"}
{"current_steps": 18, "total_steps": 93, "loss": 0.9683, "lr": 9.772520313857777e-06, "epoch": 0.576, "percentage": 19.35, "elapsed_time": "0:17:03", "remaining_time": "1:11:05"}
{"current_steps": 19, "total_steps": 93, "loss": 0.983, "lr": 9.712680772628365e-06, "epoch": 0.608, "percentage": 20.43, "elapsed_time": "0:18:00", "remaining_time": "1:10:10"}
{"current_steps": 20, "total_steps": 93, "loss": 0.97, "lr": 9.646090361587828e-06, "epoch": 0.64, "percentage": 21.51, "elapsed_time": "0:18:51", "remaining_time": "1:08:51"}
{"current_steps": 21, "total_steps": 93, "loss": 0.9922, "lr": 9.572844470858537e-06, "epoch": 0.672, "percentage": 22.58, "elapsed_time": "0:19:49", "remaining_time": "1:07:59"}
{"current_steps": 22, "total_steps": 93, "loss": 0.9464, "lr": 9.493048024473413e-06, "epoch": 0.704, "percentage": 23.66, "elapsed_time": "0:20:42", "remaining_time": "1:06:49"}
{"current_steps": 23, "total_steps": 93, "loss": 0.982, "lr": 9.406815330073244e-06, "epoch": 0.736, "percentage": 24.73, "elapsed_time": "0:21:25", "remaining_time": "1:05:12"}
{"current_steps": 24, "total_steps": 93, "loss": 0.9922, "lr": 9.314269915162115e-06, "epoch": 0.768, "percentage": 25.81, "elapsed_time": "0:22:25", "remaining_time": "1:04:27"}
{"current_steps": 25, "total_steps": 93, "loss": 0.9401, "lr": 9.215544350155423e-06, "epoch": 0.8, "percentage": 26.88, "elapsed_time": "0:23:19", "remaining_time": "1:03:25"}
{"current_steps": 26, "total_steps": 93, "loss": 0.9571, "lr": 9.110780058474052e-06, "epoch": 0.832, "percentage": 27.96, "elapsed_time": "0:24:13", "remaining_time": "1:02:25"}
{"current_steps": 27, "total_steps": 93, "loss": 0.9731, "lr": 9.000127113956673e-06, "epoch": 0.864, "percentage": 29.03, "elapsed_time": "0:25:09", "remaining_time": "1:01:29"}
{"current_steps": 28, "total_steps": 93, "loss": 0.9277, "lr": 8.883744025880429e-06, "epoch": 0.896, "percentage": 30.11, "elapsed_time": "0:25:54", "remaining_time": "1:00:07"}
{"current_steps": 29, "total_steps": 93, "loss": 0.9404, "lr": 8.761797511897907e-06, "epoch": 0.928, "percentage": 31.18, "elapsed_time": "0:26:53", "remaining_time": "0:59:21"}
{"current_steps": 30, "total_steps": 93, "loss": 0.9388, "lr": 8.634462259215719e-06, "epoch": 0.96, "percentage": 32.26, "elapsed_time": "0:27:48", "remaining_time": "0:58:22"}
{"current_steps": 31, "total_steps": 93, "loss": 0.9318, "lr": 8.501920674356755e-06, "epoch": 0.992, "percentage": 33.33, "elapsed_time": "0:28:36", "remaining_time": "0:57:13"}
{"current_steps": 32, "total_steps": 93, "loss": 1.7235, "lr": 8.364362621864595e-06, "epoch": 1.024, "percentage": 34.41, "elapsed_time": "0:30:30", "remaining_time": "0:58:09"}
{"current_steps": 33, "total_steps": 93, "loss": 0.8678, "lr": 8.221985152324385e-06, "epoch": 1.056, "percentage": 35.48, "elapsed_time": "0:31:18", "remaining_time": "0:56:55"}
{"current_steps": 34, "total_steps": 93, "loss": 0.8889, "lr": 8.07499222008977e-06, "epoch": 1.088, "percentage": 36.56, "elapsed_time": "0:32:10", "remaining_time": "0:55:49"}
{"current_steps": 35, "total_steps": 93, "loss": 0.9157, "lr": 7.923594391120237e-06, "epoch": 1.12, "percentage": 37.63, "elapsed_time": "0:33:02", "remaining_time": "0:54:44"}
{"current_steps": 36, "total_steps": 93, "loss": 0.9081, "lr": 7.768008541347423e-06, "epoch": 1.152, "percentage": 38.71, "elapsed_time": "0:33:54", "remaining_time": "0:53:41"}
{"current_steps": 37, "total_steps": 93, "loss": 0.8875, "lr": 7.608457546002423e-06, "epoch": 1.184, "percentage": 39.78, "elapsed_time": "0:34:48", "remaining_time": "0:52:40"}
{"current_steps": 38, "total_steps": 93, "loss": 0.8787, "lr": 7.445169960349167e-06, "epoch": 1.216, "percentage": 40.86, "elapsed_time": "0:35:40", "remaining_time": "0:51:37"}
{"current_steps": 39, "total_steps": 93, "loss": 0.9457, "lr": 7.278379692281209e-06, "epoch": 1.248, "percentage": 41.94, "elapsed_time": "0:36:31", "remaining_time": "0:50:34"}
{"current_steps": 40, "total_steps": 93, "loss": 0.8881, "lr": 7.10832566725092e-06, "epoch": 1.28, "percentage": 43.01, "elapsed_time": "0:37:28", "remaining_time": "0:49:39"}
{"current_steps": 41, "total_steps": 93, "loss": 0.8929, "lr": 6.9352514860110876e-06, "epoch": 1.312, "percentage": 44.09, "elapsed_time": "0:38:19", "remaining_time": "0:48:36"}
{"current_steps": 42, "total_steps": 93, "loss": 0.7808, "lr": 6.759405075659165e-06, "epoch": 1.3439999999999999, "percentage": 45.16, "elapsed_time": "0:38:57", "remaining_time": "0:47:18"}
{"current_steps": 43, "total_steps": 93, "loss": 0.8973, "lr": 6.58103833448412e-06, "epoch": 1.376, "percentage": 46.24, "elapsed_time": "0:39:52", "remaining_time": "0:46:21"}
{"current_steps": 44, "total_steps": 93, "loss": 0.9228, "lr": 6.4004067711245366e-06, "epoch": 1.408, "percentage": 47.31, "elapsed_time": "0:40:56", "remaining_time": "0:45:35"}
{"current_steps": 45, "total_steps": 93, "loss": 0.857, "lr": 6.2177691385549595e-06, "epoch": 1.44, "percentage": 48.39, "elapsed_time": "0:41:47", "remaining_time": "0:44:34"}
{"current_steps": 46, "total_steps": 93, "loss": 0.843, "lr": 6.033387063424765e-06, "epoch": 1.472, "percentage": 49.46, "elapsed_time": "0:42:36", "remaining_time": "0:43:32"}
{"current_steps": 47, "total_steps": 93, "loss": 1.0347, "lr": 5.8475246712804845e-06, "epoch": 1.504, "percentage": 50.54, "elapsed_time": "0:43:40", "remaining_time": "0:42:44"}
{"current_steps": 48, "total_steps": 93, "loss": 0.817, "lr": 5.660448208208513e-06, "epoch": 1.536, "percentage": 51.61, "elapsed_time": "0:44:23", "remaining_time": "0:41:37"}
{"current_steps": 49, "total_steps": 93, "loss": 0.8407, "lr": 5.472425659440157e-06, "epoch": 1.568, "percentage": 52.69, "elapsed_time": "0:45:17", "remaining_time": "0:40:39"}
{"current_steps": 50, "total_steps": 93, "loss": 0.8921, "lr": 5.2837263654653715e-06, "epoch": 1.6, "percentage": 53.76, "elapsed_time": "0:46:03", "remaining_time": "0:39:36"}
{"current_steps": 51, "total_steps": 93, "loss": 0.9579, "lr": 5.094620636205096e-06, "epoch": 1.6320000000000001, "percentage": 54.84, "elapsed_time": "0:46:57", "remaining_time": "0:38:40"}
{"current_steps": 52, "total_steps": 93, "loss": 0.7933, "lr": 4.905379363794907e-06, "epoch": 1.6640000000000001, "percentage": 55.91, "elapsed_time": "0:47:46", "remaining_time": "0:37:40"}
{"current_steps": 53, "total_steps": 93, "loss": 0.97, "lr": 4.71627363453463e-06, "epoch": 1.696, "percentage": 56.99, "elapsed_time": "0:48:52", "remaining_time": "0:36:53"}
{"current_steps": 54, "total_steps": 93, "loss": 0.8357, "lr": 4.527574340559844e-06, "epoch": 1.728, "percentage": 58.06, "elapsed_time": "0:49:51", "remaining_time": "0:36:00"}
{"current_steps": 55, "total_steps": 93, "loss": 0.828, "lr": 4.33955179179149e-06, "epoch": 1.76, "percentage": 59.14, "elapsed_time": "0:50:43", "remaining_time": "0:35:02"}
{"current_steps": 56, "total_steps": 93, "loss": 0.8928, "lr": 4.152475328719517e-06, "epoch": 1.792, "percentage": 60.22, "elapsed_time": "0:51:36", "remaining_time": "0:34:05"}
{"current_steps": 57, "total_steps": 93, "loss": 0.9052, "lr": 3.966612936575235e-06, "epoch": 1.8239999999999998, "percentage": 61.29, "elapsed_time": "0:52:29", "remaining_time": "0:33:08"}
{"current_steps": 58, "total_steps": 93, "loss": 0.9586, "lr": 3.782230861445041e-06, "epoch": 1.8559999999999999, "percentage": 62.37, "elapsed_time": "0:53:28", "remaining_time": "0:32:16"}
{"current_steps": 59, "total_steps": 93, "loss": 0.8434, "lr": 3.5995932288754655e-06, "epoch": 1.888, "percentage": 63.44, "elapsed_time": "0:54:28", "remaining_time": "0:31:23"}
{"current_steps": 60, "total_steps": 93, "loss": 0.8777, "lr": 3.4189616655158803e-06, "epoch": 1.92, "percentage": 64.52, "elapsed_time": "0:55:26", "remaining_time": "0:30:29"}
{"current_steps": 61, "total_steps": 93, "loss": 0.8699, "lr": 3.240594924340835e-06, "epoch": 1.952, "percentage": 65.59, "elapsed_time": "0:56:22", "remaining_time": "0:29:34"}
{"current_steps": 62, "total_steps": 93, "loss": 0.8321, "lr": 3.0647485139889145e-06, "epoch": 1.984, "percentage": 66.67, "elapsed_time": "0:57:15", "remaining_time": "0:28:37"}
{"current_steps": 63, "total_steps": 93, "loss": 1.5436, "lr": 2.89167433274908e-06, "epoch": 2.016, "percentage": 67.74, "elapsed_time": "0:59:20", "remaining_time": "0:28:15"}
{"current_steps": 64, "total_steps": 93, "loss": 0.8582, "lr": 2.721620307718793e-06, "epoch": 2.048, "percentage": 68.82, "elapsed_time": "1:00:15", "remaining_time": "0:27:18"}
{"current_steps": 65, "total_steps": 93, "loss": 0.8665, "lr": 2.554830039650834e-06, "epoch": 2.08, "percentage": 69.89, "elapsed_time": "1:01:14", "remaining_time": "0:26:22"}
{"current_steps": 66, "total_steps": 93, "loss": 0.8705, "lr": 2.391542453997578e-06, "epoch": 2.112, "percentage": 70.97, "elapsed_time": "1:02:06", "remaining_time": "0:25:24"}
{"current_steps": 67, "total_steps": 93, "loss": 0.7992, "lr": 2.2319914586525776e-06, "epoch": 2.144, "percentage": 72.04, "elapsed_time": "1:02:56", "remaining_time": "0:24:25"}
{"current_steps": 68, "total_steps": 93, "loss": 0.8735, "lr": 2.0764056088797646e-06, "epoch": 2.176, "percentage": 73.12, "elapsed_time": "1:03:54", "remaining_time": "0:23:29"}
{"current_steps": 69, "total_steps": 93, "loss": 0.8379, "lr": 1.9250077799102323e-06, "epoch": 2.208, "percentage": 74.19, "elapsed_time": "1:04:40", "remaining_time": "0:22:29"}
{"current_steps": 70, "total_steps": 93, "loss": 0.8338, "lr": 1.7780148476756148e-06, "epoch": 2.24, "percentage": 75.27, "elapsed_time": "1:05:35", "remaining_time": "0:21:33"}
{"current_steps": 71, "total_steps": 93, "loss": 0.7843, "lr": 1.6356373781354058e-06, "epoch": 2.2720000000000002, "percentage": 76.34, "elapsed_time": "1:06:36", "remaining_time": "0:20:38"}
{"current_steps": 72, "total_steps": 93, "loss": 0.8256, "lr": 1.4980793256432474e-06, "epoch": 2.304, "percentage": 77.42, "elapsed_time": "1:07:28", "remaining_time": "0:19:40"}
{"current_steps": 73, "total_steps": 93, "loss": 0.8289, "lr": 1.3655377407842813e-06, "epoch": 2.336, "percentage": 78.49, "elapsed_time": "1:08:17", "remaining_time": "0:18:42"}
{"current_steps": 74, "total_steps": 93, "loss": 0.8025, "lr": 1.2382024881020937e-06, "epoch": 2.368, "percentage": 79.57, "elapsed_time": "1:09:09", "remaining_time": "0:17:45"}
{"current_steps": 75, "total_steps": 93, "loss": 0.9191, "lr": 1.1162559741195733e-06, "epoch": 2.4, "percentage": 80.65, "elapsed_time": "1:10:06", "remaining_time": "0:16:49"}
{"current_steps": 76, "total_steps": 93, "loss": 0.8216, "lr": 9.998728860433277e-07, "epoch": 2.432, "percentage": 81.72, "elapsed_time": "1:10:59", "remaining_time": "0:15:52"}
{"current_steps": 77, "total_steps": 93, "loss": 0.8265, "lr": 8.892199415259501e-07, "epoch": 2.464, "percentage": 82.8, "elapsed_time": "1:11:59", "remaining_time": "0:14:57"}
{"current_steps": 78, "total_steps": 93, "loss": 0.8353, "lr": 7.844556498445788e-07, "epoch": 2.496, "percentage": 83.87, "elapsed_time": "1:12:49", "remaining_time": "0:14:00"}
{"current_steps": 79, "total_steps": 93, "loss": 0.8233, "lr": 6.857300848378857e-07, "epoch": 2.528, "percentage": 84.95, "elapsed_time": "1:13:41", "remaining_time": "0:13:03"}
{"current_steps": 80, "total_steps": 93, "loss": 0.918, "lr": 5.931846699267558e-07, "epoch": 2.56, "percentage": 86.02, "elapsed_time": "1:14:33", "remaining_time": "0:12:06"}
{"current_steps": 81, "total_steps": 93, "loss": 0.7847, "lr": 5.0695197552659e-07, "epoch": 2.592, "percentage": 87.1, "elapsed_time": "1:15:23", "remaining_time": "0:11:10"}
{"current_steps": 82, "total_steps": 93, "loss": 0.8077, "lr": 4.271555291414636e-07, "epoch": 2.624, "percentage": 88.17, "elapsed_time": "1:16:19", "remaining_time": "0:10:14"}
{"current_steps": 83, "total_steps": 93, "loss": 0.8602, "lr": 3.539096384121743e-07, "epoch": 2.656, "percentage": 89.25, "elapsed_time": "1:17:10", "remaining_time": "0:09:17"}
{"current_steps": 84, "total_steps": 93, "loss": 0.846, "lr": 2.873192273716369e-07, "epoch": 2.6879999999999997, "percentage": 90.32, "elapsed_time": "1:18:09", "remaining_time": "0:08:22"}
{"current_steps": 85, "total_steps": 93, "loss": 0.808, "lr": 2.274796861422246e-07, "epoch": 2.7199999999999998, "percentage": 91.4, "elapsed_time": "1:19:10", "remaining_time": "0:07:27"}
{"current_steps": 86, "total_steps": 93, "loss": 0.8078, "lr": 1.7447673429033361e-07, "epoch": 2.752, "percentage": 92.47, "elapsed_time": "1:20:09", "remaining_time": "0:06:31"}
{"current_steps": 87, "total_steps": 93, "loss": 0.8601, "lr": 1.2838629803393343e-07, "epoch": 2.784, "percentage": 93.55, "elapsed_time": "1:21:01", "remaining_time": "0:05:35"}
{"current_steps": 88, "total_steps": 93, "loss": 0.8478, "lr": 8.927440147898703e-08, "epoch": 2.816, "percentage": 94.62, "elapsed_time": "1:21:45", "remaining_time": "0:04:38"}
{"current_steps": 89, "total_steps": 93, "loss": 0.9191, "lr": 5.7197072040557356e-08, "epoch": 2.848, "percentage": 95.7, "elapsed_time": "1:22:47", "remaining_time": "0:03:43"}
{"current_steps": 90, "total_steps": 93, "loss": 0.7321, "lr": 3.220026018407541e-08, "epoch": 2.88, "percentage": 96.77, "elapsed_time": "1:23:34", "remaining_time": "0:02:47"}
{"current_steps": 91, "total_steps": 93, "loss": 0.8163, "lr": 1.431977360173975e-08, "epoch": 2.912, "percentage": 97.85, "elapsed_time": "1:24:30", "remaining_time": "0:01:51"}
{"current_steps": 92, "total_steps": 93, "loss": 0.8683, "lr": 3.5812259183426457e-09, "epoch": 2.944, "percentage": 98.92, "elapsed_time": "1:25:28", "remaining_time": "0:00:55"}
{"current_steps": 93, "total_steps": 93, "loss": 0.8822, "lr": 0.0, "epoch": 2.976, "percentage": 100.0, "elapsed_time": "1:26:27", "remaining_time": "0:00:00"}
{"current_steps": 93, "total_steps": 93, "epoch": 2.976, "percentage": 100.0, "elapsed_time": "1:28:37", "remaining_time": "0:00:00"}