PumeTu's picture
Add files using upload-large-folder tool
da844e0 verified
{"current_steps": 1, "total_steps": 261, "loss": 1.0671, "lr": 0.0, "epoch": 0.011494252873563218, "percentage": 0.38, "elapsed_time": "0:03:19", "remaining_time": "14:25:14"}
{"current_steps": 2, "total_steps": 261, "loss": 1.0786, "lr": 7.4074074074074075e-06, "epoch": 0.022988505747126436, "percentage": 0.77, "elapsed_time": "0:06:36", "remaining_time": "14:16:07"}
{"current_steps": 3, "total_steps": 261, "loss": 1.074, "lr": 1.4814814814814815e-05, "epoch": 0.034482758620689655, "percentage": 1.15, "elapsed_time": "0:09:52", "remaining_time": "14:09:45"}
{"current_steps": 4, "total_steps": 261, "loss": 1.0617, "lr": 2.2222222222222223e-05, "epoch": 0.04597701149425287, "percentage": 1.53, "elapsed_time": "0:13:06", "remaining_time": "14:01:48"}
{"current_steps": 5, "total_steps": 261, "loss": 1.0856, "lr": 2.962962962962963e-05, "epoch": 0.05747126436781609, "percentage": 1.92, "elapsed_time": "0:16:18", "remaining_time": "13:55:13"}
{"current_steps": 6, "total_steps": 261, "loss": 1.0464, "lr": 3.7037037037037037e-05, "epoch": 0.06896551724137931, "percentage": 2.3, "elapsed_time": "0:19:33", "remaining_time": "13:50:54"}
{"current_steps": 7, "total_steps": 261, "loss": 1.0201, "lr": 4.4444444444444447e-05, "epoch": 0.08045977011494253, "percentage": 2.68, "elapsed_time": "0:22:48", "remaining_time": "13:47:35"}
{"current_steps": 8, "total_steps": 261, "loss": 0.983, "lr": 5.185185185185185e-05, "epoch": 0.09195402298850575, "percentage": 3.07, "elapsed_time": "0:26:02", "remaining_time": "13:43:46"}
{"current_steps": 9, "total_steps": 261, "loss": 0.9627, "lr": 5.925925925925926e-05, "epoch": 0.10344827586206896, "percentage": 3.45, "elapsed_time": "0:29:16", "remaining_time": "13:39:43"}
{"current_steps": 10, "total_steps": 261, "loss": 0.9351, "lr": 6.666666666666667e-05, "epoch": 0.11494252873563218, "percentage": 3.83, "elapsed_time": "0:32:35", "remaining_time": "13:37:53"}
{"current_steps": 10, "total_steps": 261, "eval_loss": 0.9996559023857117, "epoch": 0.11494252873563218, "percentage": 3.83, "elapsed_time": "0:42:12", "remaining_time": "17:39:26"}
{"current_steps": 11, "total_steps": 261, "loss": 0.9269, "lr": 7.407407407407407e-05, "epoch": 0.12643678160919541, "percentage": 4.21, "elapsed_time": "0:45:29", "remaining_time": "17:13:46"}
{"current_steps": 12, "total_steps": 261, "loss": 0.8617, "lr": 8.148148148148148e-05, "epoch": 0.13793103448275862, "percentage": 4.6, "elapsed_time": "0:48:42", "remaining_time": "16:50:36"}
{"current_steps": 13, "total_steps": 261, "loss": 0.8568, "lr": 8.888888888888889e-05, "epoch": 0.14942528735632185, "percentage": 4.98, "elapsed_time": "0:51:54", "remaining_time": "16:30:19"}
{"current_steps": 14, "total_steps": 261, "loss": 0.8651, "lr": 9.62962962962963e-05, "epoch": 0.16091954022988506, "percentage": 5.36, "elapsed_time": "0:55:14", "remaining_time": "16:14:34"}
{"current_steps": 15, "total_steps": 261, "loss": 0.8281, "lr": 0.0001037037037037037, "epoch": 0.1724137931034483, "percentage": 5.75, "elapsed_time": "0:58:30", "remaining_time": "15:59:29"}
{"current_steps": 16, "total_steps": 261, "loss": 0.8296, "lr": 0.00011111111111111112, "epoch": 0.1839080459770115, "percentage": 6.13, "elapsed_time": "1:01:43", "remaining_time": "15:45:12"}
{"current_steps": 17, "total_steps": 261, "loss": 0.8494, "lr": 0.00011851851851851852, "epoch": 0.19540229885057472, "percentage": 6.51, "elapsed_time": "1:04:55", "remaining_time": "15:31:58"}
{"current_steps": 18, "total_steps": 261, "loss": 0.8236, "lr": 0.00012592592592592592, "epoch": 0.20689655172413793, "percentage": 6.9, "elapsed_time": "1:08:12", "remaining_time": "15:20:48"}
{"current_steps": 19, "total_steps": 261, "loss": 0.821, "lr": 0.00013333333333333334, "epoch": 0.21839080459770116, "percentage": 7.28, "elapsed_time": "1:11:27", "remaining_time": "15:10:12"}
{"current_steps": 20, "total_steps": 261, "loss": 0.8087, "lr": 0.00014074074074074076, "epoch": 0.22988505747126436, "percentage": 7.66, "elapsed_time": "1:14:43", "remaining_time": "15:00:21"}
{"current_steps": 20, "total_steps": 261, "eval_loss": 0.8203959465026855, "epoch": 0.22988505747126436, "percentage": 7.66, "elapsed_time": "1:24:16", "remaining_time": "16:55:28"}
{"current_steps": 21, "total_steps": 261, "loss": 0.8005, "lr": 0.00014814814814814815, "epoch": 0.2413793103448276, "percentage": 8.05, "elapsed_time": "1:27:31", "remaining_time": "16:40:17"}
{"current_steps": 22, "total_steps": 261, "loss": 0.8099, "lr": 0.00015555555555555556, "epoch": 0.25287356321839083, "percentage": 8.43, "elapsed_time": "1:30:47", "remaining_time": "16:26:18"}
{"current_steps": 23, "total_steps": 261, "loss": 0.8084, "lr": 0.00016296296296296295, "epoch": 0.26436781609195403, "percentage": 8.81, "elapsed_time": "1:34:00", "remaining_time": "16:12:48"}
{"current_steps": 24, "total_steps": 261, "loss": 0.7786, "lr": 0.00017037037037037037, "epoch": 0.27586206896551724, "percentage": 9.2, "elapsed_time": "1:37:14", "remaining_time": "16:00:14"}
{"current_steps": 25, "total_steps": 261, "loss": 0.794, "lr": 0.00017777777777777779, "epoch": 0.28735632183908044, "percentage": 9.58, "elapsed_time": "1:40:28", "remaining_time": "15:48:29"}
{"current_steps": 26, "total_steps": 261, "loss": 0.7793, "lr": 0.0001851851851851852, "epoch": 0.2988505747126437, "percentage": 9.96, "elapsed_time": "1:43:43", "remaining_time": "15:37:27"}
{"current_steps": 27, "total_steps": 261, "loss": 0.7779, "lr": 0.0001925925925925926, "epoch": 0.3103448275862069, "percentage": 10.34, "elapsed_time": "1:46:55", "remaining_time": "15:26:39"}
{"current_steps": 28, "total_steps": 261, "loss": 0.7871, "lr": 0.0002, "epoch": 0.3218390804597701, "percentage": 10.73, "elapsed_time": "1:50:08", "remaining_time": "15:16:32"}
{"current_steps": 29, "total_steps": 261, "loss": 0.7645, "lr": 0.00019999098778567212, "epoch": 0.3333333333333333, "percentage": 11.11, "elapsed_time": "1:53:21", "remaining_time": "15:06:49"}
{"current_steps": 30, "total_steps": 261, "loss": 0.7724, "lr": 0.00019996395276708856, "epoch": 0.3448275862068966, "percentage": 11.49, "elapsed_time": "1:56:34", "remaining_time": "14:57:38"}
{"current_steps": 30, "total_steps": 261, "eval_loss": 0.7786664366722107, "epoch": 0.3448275862068966, "percentage": 11.49, "elapsed_time": "2:06:14", "remaining_time": "16:12:02"}
{"current_steps": 31, "total_steps": 261, "loss": 0.7634, "lr": 0.00019991889981715698, "epoch": 0.3563218390804598, "percentage": 11.88, "elapsed_time": "2:09:29", "remaining_time": "16:00:45"}
{"current_steps": 32, "total_steps": 261, "loss": 0.7539, "lr": 0.00019985583705641418, "epoch": 0.367816091954023, "percentage": 12.26, "elapsed_time": "2:12:43", "remaining_time": "15:49:49"}
{"current_steps": 33, "total_steps": 261, "loss": 0.7649, "lr": 0.00019977477585156252, "epoch": 0.3793103448275862, "percentage": 12.64, "elapsed_time": "2:15:56", "remaining_time": "15:39:12"}
{"current_steps": 34, "total_steps": 261, "loss": 0.7698, "lr": 0.00019967573081342103, "epoch": 0.39080459770114945, "percentage": 13.03, "elapsed_time": "2:19:10", "remaining_time": "15:29:11"}
{"current_steps": 35, "total_steps": 261, "loss": 0.7316, "lr": 0.0001995587197942919, "epoch": 0.40229885057471265, "percentage": 13.41, "elapsed_time": "2:22:24", "remaining_time": "15:19:35"}
{"current_steps": 36, "total_steps": 261, "loss": 0.7694, "lr": 0.0001994237638847428, "epoch": 0.41379310344827586, "percentage": 13.79, "elapsed_time": "2:25:37", "remaining_time": "15:10:08"}
{"current_steps": 37, "total_steps": 261, "loss": 0.7664, "lr": 0.0001992708874098054, "epoch": 0.42528735632183906, "percentage": 14.18, "elapsed_time": "2:28:53", "remaining_time": "15:01:25"}
{"current_steps": 38, "total_steps": 261, "loss": 0.7676, "lr": 0.00019910011792459087, "epoch": 0.4367816091954023, "percentage": 14.56, "elapsed_time": "2:32:09", "remaining_time": "14:52:53"}
{"current_steps": 39, "total_steps": 261, "loss": 0.7492, "lr": 0.00019891148620932318, "epoch": 0.4482758620689655, "percentage": 14.94, "elapsed_time": "2:35:21", "remaining_time": "14:44:23"}
{"current_steps": 40, "total_steps": 261, "loss": 0.7386, "lr": 0.00019870502626379127, "epoch": 0.45977011494252873, "percentage": 15.33, "elapsed_time": "2:38:38", "remaining_time": "14:36:28"}
{"current_steps": 40, "total_steps": 261, "eval_loss": 0.7544006705284119, "epoch": 0.45977011494252873, "percentage": 15.33, "elapsed_time": "2:48:12", "remaining_time": "15:29:18"}
{"current_steps": 41, "total_steps": 261, "loss": 0.7328, "lr": 0.00019848077530122083, "epoch": 0.47126436781609193, "percentage": 15.71, "elapsed_time": "2:51:28", "remaining_time": "15:20:05"}
{"current_steps": 42, "total_steps": 261, "loss": 0.7705, "lr": 0.00019823877374156647, "epoch": 0.4827586206896552, "percentage": 16.09, "elapsed_time": "2:54:41", "remaining_time": "15:10:56"}
{"current_steps": 43, "total_steps": 261, "loss": 0.7501, "lr": 0.00019797906520422677, "epoch": 0.4942528735632184, "percentage": 16.48, "elapsed_time": "2:57:54", "remaining_time": "15:01:56"}
{"current_steps": 44, "total_steps": 261, "loss": 0.7401, "lr": 0.00019770169650018172, "epoch": 0.5057471264367817, "percentage": 16.86, "elapsed_time": "3:01:07", "remaining_time": "14:53:18"}
{"current_steps": 45, "total_steps": 261, "loss": 0.7582, "lr": 0.00019740671762355548, "epoch": 0.5172413793103449, "percentage": 17.24, "elapsed_time": "3:04:21", "remaining_time": "14:44:55"}
{"current_steps": 46, "total_steps": 261, "loss": 0.7223, "lr": 0.0001970941817426052, "epoch": 0.5287356321839081, "percentage": 17.62, "elapsed_time": "3:07:35", "remaining_time": "14:36:48"}
{"current_steps": 47, "total_steps": 261, "loss": 0.7318, "lr": 0.00019676414519013781, "epoch": 0.5402298850574713, "percentage": 18.01, "elapsed_time": "3:10:49", "remaining_time": "14:28:53"}
{"current_steps": 48, "total_steps": 261, "loss": 0.7317, "lr": 0.00019641666745335624, "epoch": 0.5517241379310345, "percentage": 18.39, "elapsed_time": "3:14:03", "remaining_time": "14:21:07"}
{"current_steps": 49, "total_steps": 261, "loss": 0.746, "lr": 0.00019605181116313724, "epoch": 0.5632183908045977, "percentage": 18.77, "elapsed_time": "3:17:21", "remaining_time": "14:13:51"}
{"current_steps": 50, "total_steps": 261, "loss": 0.7351, "lr": 0.00019566964208274254, "epoch": 0.5747126436781609, "percentage": 19.16, "elapsed_time": "3:20:38", "remaining_time": "14:06:41"}
{"current_steps": 50, "total_steps": 261, "eval_loss": 0.7382059097290039, "epoch": 0.5747126436781609, "percentage": 19.16, "elapsed_time": "3:30:15", "remaining_time": "14:47:18"}
{"current_steps": 51, "total_steps": 261, "loss": 0.7231, "lr": 0.00019527022909596536, "epoch": 0.5862068965517241, "percentage": 19.54, "elapsed_time": "3:33:53", "remaining_time": "14:40:44"}
{"current_steps": 52, "total_steps": 261, "loss": 0.734, "lr": 0.00019485364419471454, "epoch": 0.5977011494252874, "percentage": 19.92, "elapsed_time": "3:37:09", "remaining_time": "14:32:47"}
{"current_steps": 53, "total_steps": 261, "loss": 0.7154, "lr": 0.00019441996246603846, "epoch": 0.6091954022988506, "percentage": 20.31, "elapsed_time": "3:40:23", "remaining_time": "14:24:57"}
{"current_steps": 54, "total_steps": 261, "loss": 0.7042, "lr": 0.00019396926207859084, "epoch": 0.6206896551724138, "percentage": 20.69, "elapsed_time": "3:43:38", "remaining_time": "14:17:18"}
{"current_steps": 55, "total_steps": 261, "loss": 0.7405, "lr": 0.0001935016242685415, "epoch": 0.632183908045977, "percentage": 21.07, "elapsed_time": "3:46:52", "remaining_time": "14:09:43"}
{"current_steps": 56, "total_steps": 261, "loss": 0.7413, "lr": 0.00019301713332493386, "epoch": 0.6436781609195402, "percentage": 21.46, "elapsed_time": "3:50:08", "remaining_time": "14:02:30"}
{"current_steps": 57, "total_steps": 261, "loss": 0.7237, "lr": 0.00019251587657449236, "epoch": 0.6551724137931034, "percentage": 21.84, "elapsed_time": "3:53:22", "remaining_time": "13:55:14"}
{"current_steps": 58, "total_steps": 261, "loss": 0.7189, "lr": 0.00019199794436588243, "epoch": 0.6666666666666666, "percentage": 22.22, "elapsed_time": "3:56:38", "remaining_time": "13:48:13"}
{"current_steps": 59, "total_steps": 261, "loss": 0.7346, "lr": 0.00019146343005342547, "epoch": 0.6781609195402298, "percentage": 22.61, "elapsed_time": "3:59:51", "remaining_time": "13:41:11"}
{"current_steps": 60, "total_steps": 261, "loss": 0.7431, "lr": 0.0001909124299802724, "epoch": 0.6896551724137931, "percentage": 22.99, "elapsed_time": "4:03:06", "remaining_time": "13:34:23"}
{"current_steps": 60, "total_steps": 261, "eval_loss": 0.7254042029380798, "epoch": 0.6896551724137931, "percentage": 22.99, "elapsed_time": "4:12:45", "remaining_time": "14:06:43"}
{"current_steps": 61, "total_steps": 261, "loss": 0.7269, "lr": 0.00019034504346103823, "epoch": 0.7011494252873564, "percentage": 23.37, "elapsed_time": "4:16:00", "remaining_time": "13:59:22"}
{"current_steps": 62, "total_steps": 261, "loss": 0.7408, "lr": 0.0001897613727639014, "epoch": 0.7126436781609196, "percentage": 23.75, "elapsed_time": "4:19:13", "remaining_time": "13:52:01"}
{"current_steps": 63, "total_steps": 261, "loss": 0.7216, "lr": 0.0001891615230921703, "epoch": 0.7241379310344828, "percentage": 24.14, "elapsed_time": "4:22:29", "remaining_time": "13:44:58"}
{"current_steps": 64, "total_steps": 261, "loss": 0.7356, "lr": 0.000188545602565321, "epoch": 0.735632183908046, "percentage": 24.52, "elapsed_time": "4:25:45", "remaining_time": "13:38:01"}
{"current_steps": 65, "total_steps": 261, "loss": 0.7292, "lr": 0.00018791372219950948, "epoch": 0.7471264367816092, "percentage": 24.9, "elapsed_time": "4:29:00", "remaining_time": "13:31:08"}
{"current_steps": 66, "total_steps": 261, "loss": 0.7161, "lr": 0.00018726599588756145, "epoch": 0.7586206896551724, "percentage": 25.29, "elapsed_time": "4:32:14", "remaining_time": "13:24:20"}
{"current_steps": 67, "total_steps": 261, "loss": 0.7261, "lr": 0.00018660254037844388, "epoch": 0.7701149425287356, "percentage": 25.67, "elapsed_time": "4:35:33", "remaining_time": "13:17:52"}
{"current_steps": 68, "total_steps": 261, "loss": 0.7267, "lr": 0.0001859234752562217, "epoch": 0.7816091954022989, "percentage": 26.05, "elapsed_time": "4:38:49", "remaining_time": "13:11:21"}
{"current_steps": 69, "total_steps": 261, "loss": 0.7193, "lr": 0.00018522892291850335, "epoch": 0.7931034482758621, "percentage": 26.44, "elapsed_time": "4:42:05", "remaining_time": "13:04:57"}
{"current_steps": 70, "total_steps": 261, "loss": 0.7183, "lr": 0.0001845190085543795, "epoch": 0.8045977011494253, "percentage": 26.82, "elapsed_time": "4:45:22", "remaining_time": "12:58:40"}
{"current_steps": 70, "total_steps": 261, "eval_loss": 0.7151289582252502, "epoch": 0.8045977011494253, "percentage": 26.82, "elapsed_time": "4:54:56", "remaining_time": "13:24:47"}
{"current_steps": 71, "total_steps": 261, "loss": 0.7031, "lr": 0.00018379386012185814, "epoch": 0.8160919540229885, "percentage": 27.2, "elapsed_time": "4:58:12", "remaining_time": "13:18:01"}
{"current_steps": 72, "total_steps": 261, "loss": 0.7205, "lr": 0.00018305360832480117, "epoch": 0.8275862068965517, "percentage": 27.59, "elapsed_time": "5:01:28", "remaining_time": "13:11:21"}
{"current_steps": 73, "total_steps": 261, "loss": 0.7307, "lr": 0.00018229838658936564, "epoch": 0.8390804597701149, "percentage": 27.97, "elapsed_time": "5:04:41", "remaining_time": "13:04:40"}
{"current_steps": 74, "total_steps": 261, "loss": 0.7103, "lr": 0.00018152833103995443, "epoch": 0.8505747126436781, "percentage": 28.35, "elapsed_time": "5:07:55", "remaining_time": "12:58:08"}
{"current_steps": 75, "total_steps": 261, "loss": 0.7115, "lr": 0.0001807435804746807, "epoch": 0.8620689655172413, "percentage": 28.74, "elapsed_time": "5:11:10", "remaining_time": "12:51:42"}
{"current_steps": 76, "total_steps": 261, "loss": 0.6942, "lr": 0.00017994427634035015, "epoch": 0.8735632183908046, "percentage": 29.12, "elapsed_time": "5:14:24", "remaining_time": "12:45:20"}
{"current_steps": 77, "total_steps": 261, "loss": 0.6856, "lr": 0.0001791305627069662, "epoch": 0.8850574712643678, "percentage": 29.5, "elapsed_time": "5:17:38", "remaining_time": "12:39:03"}
{"current_steps": 78, "total_steps": 261, "loss": 0.7409, "lr": 0.00017830258624176225, "epoch": 0.896551724137931, "percentage": 29.89, "elapsed_time": "5:20:55", "remaining_time": "12:32:56"}
{"current_steps": 79, "total_steps": 261, "loss": 0.7354, "lr": 0.00017746049618276545, "epoch": 0.9080459770114943, "percentage": 30.27, "elapsed_time": "5:24:10", "remaining_time": "12:26:50"}
{"current_steps": 80, "total_steps": 261, "loss": 0.711, "lr": 0.0001766044443118978, "epoch": 0.9195402298850575, "percentage": 30.65, "elapsed_time": "5:27:25", "remaining_time": "12:20:47"}
{"current_steps": 80, "total_steps": 261, "eval_loss": 0.706480085849762, "epoch": 0.9195402298850575, "percentage": 30.65, "elapsed_time": "5:37:03", "remaining_time": "12:42:36"}
{"current_steps": 81, "total_steps": 261, "loss": 0.7161, "lr": 0.00017573458492761801, "epoch": 0.9310344827586207, "percentage": 31.03, "elapsed_time": "5:40:18", "remaining_time": "12:36:14"}
{"current_steps": 82, "total_steps": 261, "loss": 0.7062, "lr": 0.00017485107481711012, "epoch": 0.9425287356321839, "percentage": 31.42, "elapsed_time": "5:43:34", "remaining_time": "12:30:00"}
{"current_steps": 83, "total_steps": 261, "loss": 0.7136, "lr": 0.00017395407322802372, "epoch": 0.9540229885057471, "percentage": 31.8, "elapsed_time": "5:46:51", "remaining_time": "12:23:50"}
{"current_steps": 84, "total_steps": 261, "loss": 0.675, "lr": 0.00017304374183977033, "epoch": 0.9655172413793104, "percentage": 32.18, "elapsed_time": "5:50:09", "remaining_time": "12:17:49"}
{"current_steps": 85, "total_steps": 261, "loss": 0.7069, "lr": 0.00017212024473438147, "epoch": 0.9770114942528736, "percentage": 32.57, "elapsed_time": "5:53:21", "remaining_time": "12:11:40"}
{"current_steps": 86, "total_steps": 261, "loss": 0.7224, "lr": 0.00017118374836693406, "epoch": 0.9885057471264368, "percentage": 32.95, "elapsed_time": "5:56:33", "remaining_time": "12:05:34"}
{"current_steps": 87, "total_steps": 261, "loss": 0.7199, "lr": 0.00017023442153554777, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "5:59:49", "remaining_time": "11:59:38"}
{"current_steps": 88, "total_steps": 261, "loss": 0.6927, "lr": 0.00016927243535095997, "epoch": 1.0114942528735633, "percentage": 33.72, "elapsed_time": "6:03:04", "remaining_time": "11:53:45"}
{"current_steps": 89, "total_steps": 261, "loss": 0.6876, "lr": 0.00016829796320568416, "epoch": 1.0229885057471264, "percentage": 34.1, "elapsed_time": "6:06:19", "remaining_time": "11:47:56"}
{"current_steps": 90, "total_steps": 261, "loss": 0.6909, "lr": 0.00016731118074275704, "epoch": 1.0344827586206897, "percentage": 34.48, "elapsed_time": "6:09:35", "remaining_time": "11:42:13"}
{"current_steps": 90, "total_steps": 261, "eval_loss": 0.6995226740837097, "epoch": 1.0344827586206897, "percentage": 34.48, "elapsed_time": "6:19:08", "remaining_time": "12:00:21"}
{"current_steps": 91, "total_steps": 261, "loss": 0.6968, "lr": 0.00016631226582407952, "epoch": 1.0459770114942528, "percentage": 34.87, "elapsed_time": "6:22:22", "remaining_time": "11:54:19"}
{"current_steps": 92, "total_steps": 261, "loss": 0.6863, "lr": 0.0001653013984983585, "epoch": 1.0574712643678161, "percentage": 35.25, "elapsed_time": "6:25:37", "remaining_time": "11:48:22"}
{"current_steps": 93, "total_steps": 261, "loss": 0.7024, "lr": 0.00016427876096865394, "epoch": 1.0689655172413792, "percentage": 35.63, "elapsed_time": "6:28:51", "remaining_time": "11:42:27"}
{"current_steps": 94, "total_steps": 261, "loss": 0.6943, "lr": 0.00016324453755953773, "epoch": 1.0804597701149425, "percentage": 36.02, "elapsed_time": "6:32:05", "remaining_time": "11:36:35"}
{"current_steps": 95, "total_steps": 261, "loss": 0.669, "lr": 0.0001621989146838704, "epoch": 1.0919540229885056, "percentage": 36.4, "elapsed_time": "6:35:19", "remaining_time": "11:30:47"}
{"current_steps": 96, "total_steps": 261, "loss": 0.687, "lr": 0.00016114208080920123, "epoch": 1.103448275862069, "percentage": 36.78, "elapsed_time": "6:38:34", "remaining_time": "11:25:03"}
{"current_steps": 97, "total_steps": 261, "loss": 0.6912, "lr": 0.0001600742264237979, "epoch": 1.1149425287356323, "percentage": 37.16, "elapsed_time": "6:41:47", "remaining_time": "11:19:19"}
{"current_steps": 98, "total_steps": 261, "loss": 0.6944, "lr": 0.00015899554400231232, "epoch": 1.1264367816091954, "percentage": 37.55, "elapsed_time": "6:45:02", "remaining_time": "11:13:41"}
{"current_steps": 99, "total_steps": 261, "loss": 0.6569, "lr": 0.0001579062279710879, "epoch": 1.1379310344827587, "percentage": 37.93, "elapsed_time": "6:48:19", "remaining_time": "11:08:10"}
{"current_steps": 100, "total_steps": 261, "loss": 0.6893, "lr": 0.00015680647467311557, "epoch": 1.1494252873563218, "percentage": 38.31, "elapsed_time": "6:51:33", "remaining_time": "11:02:36"}
{"current_steps": 100, "total_steps": 261, "eval_loss": 0.6938582062721252, "epoch": 1.1494252873563218, "percentage": 38.31, "elapsed_time": "7:01:06", "remaining_time": "11:17:59"}
{"current_steps": 101, "total_steps": 261, "loss": 0.6919, "lr": 0.00015569648233264394, "epoch": 1.160919540229885, "percentage": 38.7, "elapsed_time": "7:04:45", "remaining_time": "11:12:52"}
{"current_steps": 102, "total_steps": 261, "loss": 0.6851, "lr": 0.00015457645101945046, "epoch": 1.1724137931034484, "percentage": 39.08, "elapsed_time": "7:07:57", "remaining_time": "11:07:07"}
{"current_steps": 103, "total_steps": 261, "loss": 0.6826, "lr": 0.0001534465826127801, "epoch": 1.1839080459770115, "percentage": 39.46, "elapsed_time": "7:11:18", "remaining_time": "11:01:36"}
{"current_steps": 104, "total_steps": 261, "loss": 0.6548, "lr": 0.00015230708076495775, "epoch": 1.1954022988505748, "percentage": 39.85, "elapsed_time": "7:14:31", "remaining_time": "10:55:57"}
{"current_steps": 105, "total_steps": 261, "loss": 0.6736, "lr": 0.00015115815086468102, "epoch": 1.206896551724138, "percentage": 40.23, "elapsed_time": "7:17:44", "remaining_time": "10:50:20"}
{"current_steps": 106, "total_steps": 261, "loss": 0.6823, "lr": 0.00015000000000000001, "epoch": 1.2183908045977012, "percentage": 40.61, "elapsed_time": "7:20:59", "remaining_time": "10:44:50"}
{"current_steps": 107, "total_steps": 261, "loss": 0.6698, "lr": 0.00014883283692099112, "epoch": 1.2298850574712643, "percentage": 41.0, "elapsed_time": "7:24:16", "remaining_time": "10:39:25"}
{"current_steps": 108, "total_steps": 261, "loss": 0.7054, "lr": 0.0001476568720021308, "epoch": 1.2413793103448276, "percentage": 41.38, "elapsed_time": "7:27:29", "remaining_time": "10:33:57"}
{"current_steps": 109, "total_steps": 261, "loss": 0.6761, "lr": 0.00014647231720437686, "epoch": 1.2528735632183907, "percentage": 41.76, "elapsed_time": "7:30:43", "remaining_time": "10:28:32"}
{"current_steps": 110, "total_steps": 261, "loss": 0.6796, "lr": 0.00014527938603696376, "epoch": 1.264367816091954, "percentage": 42.15, "elapsed_time": "7:34:02", "remaining_time": "10:23:16"}
{"current_steps": 110, "total_steps": 261, "eval_loss": 0.6874342560768127, "epoch": 1.264367816091954, "percentage": 42.15, "elapsed_time": "7:43:41", "remaining_time": "10:36:31"}
{"current_steps": 111, "total_steps": 261, "loss": 0.671, "lr": 0.00014407829351891857, "epoch": 1.2758620689655173, "percentage": 42.53, "elapsed_time": "7:46:58", "remaining_time": "10:31:03"}
{"current_steps": 112, "total_steps": 261, "loss": 0.6834, "lr": 0.00014286925614030542, "epoch": 1.2873563218390804, "percentage": 42.91, "elapsed_time": "7:50:12", "remaining_time": "10:25:33"}
{"current_steps": 113, "total_steps": 261, "loss": 0.6676, "lr": 0.00014165249182320402, "epoch": 1.2988505747126438, "percentage": 43.3, "elapsed_time": "7:53:29", "remaining_time": "10:20:09"}
{"current_steps": 114, "total_steps": 261, "loss": 0.6605, "lr": 0.0001404282198824305, "epoch": 1.3103448275862069, "percentage": 43.68, "elapsed_time": "7:56:44", "remaining_time": "10:14:45"}
{"current_steps": 115, "total_steps": 261, "loss": 0.6805, "lr": 0.00013919666098600753, "epoch": 1.3218390804597702, "percentage": 44.06, "elapsed_time": "7:59:59", "remaining_time": "10:09:22"}
{"current_steps": 116, "total_steps": 261, "loss": 0.6844, "lr": 0.00013795803711538966, "epoch": 1.3333333333333333, "percentage": 44.44, "elapsed_time": "8:03:11", "remaining_time": "10:03:59"}
{"current_steps": 117, "total_steps": 261, "loss": 0.6736, "lr": 0.00013671257152545277, "epoch": 1.3448275862068966, "percentage": 44.83, "elapsed_time": "8:06:24", "remaining_time": "9:58:38"}
{"current_steps": 118, "total_steps": 261, "loss": 0.6715, "lr": 0.00013546048870425356, "epoch": 1.3563218390804597, "percentage": 45.21, "elapsed_time": "8:09:38", "remaining_time": "9:53:22"}
{"current_steps": 119, "total_steps": 261, "loss": 0.6501, "lr": 0.00013420201433256689, "epoch": 1.367816091954023, "percentage": 45.59, "elapsed_time": "8:12:54", "remaining_time": "9:48:10"}
{"current_steps": 120, "total_steps": 261, "loss": 0.65, "lr": 0.00013293737524320797, "epoch": 1.3793103448275863, "percentage": 45.98, "elapsed_time": "8:16:12", "remaining_time": "9:43:02"}
{"current_steps": 120, "total_steps": 261, "eval_loss": 0.681229293346405, "epoch": 1.3793103448275863, "percentage": 45.98, "elapsed_time": "8:25:46", "remaining_time": "9:54:16"}
{"current_steps": 121, "total_steps": 261, "loss": 0.6613, "lr": 0.00013166679938014726, "epoch": 1.3908045977011494, "percentage": 46.36, "elapsed_time": "8:29:04", "remaining_time": "9:49:00"}
{"current_steps": 122, "total_steps": 261, "loss": 0.6707, "lr": 0.0001303905157574247, "epoch": 1.4022988505747127, "percentage": 46.74, "elapsed_time": "8:32:20", "remaining_time": "9:43:44"}
{"current_steps": 123, "total_steps": 261, "loss": 0.6616, "lr": 0.00012910875441787128, "epoch": 1.4137931034482758, "percentage": 47.13, "elapsed_time": "8:35:36", "remaining_time": "9:38:29"}
{"current_steps": 124, "total_steps": 261, "loss": 0.6846, "lr": 0.0001278217463916453, "epoch": 1.4252873563218391, "percentage": 47.51, "elapsed_time": "8:38:50", "remaining_time": "9:33:14"}
{"current_steps": 125, "total_steps": 261, "loss": 0.6949, "lr": 0.0001265297236545901, "epoch": 1.4367816091954024, "percentage": 47.89, "elapsed_time": "8:42:06", "remaining_time": "9:28:02"}
{"current_steps": 126, "total_steps": 261, "loss": 0.6587, "lr": 0.00012523291908642217, "epoch": 1.4482758620689655, "percentage": 48.28, "elapsed_time": "8:45:20", "remaining_time": "9:22:51"}
{"current_steps": 127, "total_steps": 261, "loss": 0.6564, "lr": 0.0001239315664287558, "epoch": 1.4597701149425286, "percentage": 48.66, "elapsed_time": "8:48:33", "remaining_time": "9:17:41"}
{"current_steps": 128, "total_steps": 261, "loss": 0.6588, "lr": 0.00012262590024297225, "epoch": 1.471264367816092, "percentage": 49.04, "elapsed_time": "8:51:48", "remaining_time": "9:12:34"}
{"current_steps": 129, "total_steps": 261, "loss": 0.6799, "lr": 0.0001213161558679416, "epoch": 1.4827586206896552, "percentage": 49.43, "elapsed_time": "8:55:02", "remaining_time": "9:07:29"}
{"current_steps": 130, "total_steps": 261, "loss": 0.6615, "lr": 0.00012000256937760445, "epoch": 1.4942528735632183, "percentage": 49.81, "elapsed_time": "8:58:17", "remaining_time": "9:02:26"}
{"current_steps": 130, "total_steps": 261, "eval_loss": 0.6774752140045166, "epoch": 1.4942528735632183, "percentage": 49.81, "elapsed_time": "9:07:52", "remaining_time": "9:12:05"}
{"current_steps": 131, "total_steps": 261, "loss": 0.6726, "lr": 0.00011868537753842051, "epoch": 1.5057471264367817, "percentage": 50.19, "elapsed_time": "9:11:06", "remaining_time": "9:06:54"}
{"current_steps": 132, "total_steps": 261, "loss": 0.6517, "lr": 0.00011736481776669306, "epoch": 1.5172413793103448, "percentage": 50.57, "elapsed_time": "9:14:20", "remaining_time": "9:01:44"}
{"current_steps": 133, "total_steps": 261, "loss": 0.6418, "lr": 0.00011604112808577603, "epoch": 1.528735632183908, "percentage": 50.96, "elapsed_time": "9:17:36", "remaining_time": "8:56:38"}
{"current_steps": 134, "total_steps": 261, "loss": 0.6773, "lr": 0.00011471454708317162, "epoch": 1.5402298850574714, "percentage": 51.34, "elapsed_time": "9:20:52", "remaining_time": "8:51:34"}
{"current_steps": 135, "total_steps": 261, "loss": 0.6815, "lr": 0.00011338531386752618, "epoch": 1.5517241379310345, "percentage": 51.72, "elapsed_time": "9:24:07", "remaining_time": "8:46:31"}
{"current_steps": 136, "total_steps": 261, "loss": 0.6762, "lr": 0.0001120536680255323, "epoch": 1.5632183908045976, "percentage": 52.11, "elapsed_time": "9:27:22", "remaining_time": "8:41:28"}
{"current_steps": 137, "total_steps": 261, "loss": 0.6568, "lr": 0.00011071984957874479, "epoch": 1.5747126436781609, "percentage": 52.49, "elapsed_time": "9:30:34", "remaining_time": "8:36:26"}
{"current_steps": 138, "total_steps": 261, "loss": 0.6382, "lr": 0.00010938409894031794, "epoch": 1.5862068965517242, "percentage": 52.87, "elapsed_time": "9:33:45", "remaining_time": "8:31:23"}
{"current_steps": 139, "total_steps": 261, "loss": 0.6805, "lr": 0.00010804665687167262, "epoch": 1.5977011494252875, "percentage": 53.26, "elapsed_time": "9:36:58", "remaining_time": "8:26:24"}
{"current_steps": 140, "total_steps": 261, "loss": 0.6555, "lr": 0.00010670776443910024, "epoch": 1.6091954022988506, "percentage": 53.64, "elapsed_time": "9:40:14", "remaining_time": "8:21:29"}
{"current_steps": 140, "total_steps": 261, "eval_loss": 0.6739147305488586, "epoch": 1.6091954022988506, "percentage": 53.64, "elapsed_time": "9:49:42", "remaining_time": "8:29:41"}
{"current_steps": 141, "total_steps": 261, "loss": 0.6679, "lr": 0.00010536766297031215, "epoch": 1.6206896551724137, "percentage": 54.02, "elapsed_time": "9:52:58", "remaining_time": "8:24:39"}
{"current_steps": 142, "total_steps": 261, "loss": 0.6664, "lr": 0.00010402659401094152, "epoch": 1.632183908045977, "percentage": 54.41, "elapsed_time": "9:56:10", "remaining_time": "8:19:36"}
{"current_steps": 143, "total_steps": 261, "loss": 0.636, "lr": 0.00010268479928100614, "epoch": 1.6436781609195403, "percentage": 54.79, "elapsed_time": "9:59:21", "remaining_time": "8:14:34"}
{"current_steps": 144, "total_steps": 261, "loss": 0.6727, "lr": 0.00010134252063133975, "epoch": 1.6551724137931034, "percentage": 55.17, "elapsed_time": "10:02:35", "remaining_time": "8:09:35"}
{"current_steps": 145, "total_steps": 261, "loss": 0.6674, "lr": 0.0001, "epoch": 1.6666666666666665, "percentage": 55.56, "elapsed_time": "10:05:49", "remaining_time": "8:04:39"}
{"current_steps": 146, "total_steps": 261, "loss": 0.6816, "lr": 9.865747936866027e-05, "epoch": 1.6781609195402298, "percentage": 55.94, "elapsed_time": "10:09:02", "remaining_time": "7:59:43"}
{"current_steps": 147, "total_steps": 261, "loss": 0.6658, "lr": 9.73152007189939e-05, "epoch": 1.6896551724137931, "percentage": 56.32, "elapsed_time": "10:12:18", "remaining_time": "7:54:51"}
{"current_steps": 148, "total_steps": 261, "loss": 0.6753, "lr": 9.597340598905852e-05, "epoch": 1.7011494252873565, "percentage": 56.7, "elapsed_time": "10:15:29", "remaining_time": "7:49:55"}
{"current_steps": 149, "total_steps": 261, "loss": 0.6806, "lr": 9.463233702968783e-05, "epoch": 1.7126436781609196, "percentage": 57.09, "elapsed_time": "10:18:46", "remaining_time": "7:45:06"}
{"current_steps": 150, "total_steps": 261, "loss": 0.6522, "lr": 9.329223556089975e-05, "epoch": 1.7241379310344827, "percentage": 57.47, "elapsed_time": "10:21:56", "remaining_time": "7:40:14"}
{"current_steps": 150, "total_steps": 261, "eval_loss": 0.6713330745697021, "epoch": 1.7241379310344827, "percentage": 57.47, "elapsed_time": "10:31:24", "remaining_time": "7:47:14"}
{"current_steps": 151, "total_steps": 261, "loss": 0.6606, "lr": 9.195334312832742e-05, "epoch": 1.735632183908046, "percentage": 57.85, "elapsed_time": "10:35:00", "remaining_time": "7:42:35"}
{"current_steps": 152, "total_steps": 261, "loss": 0.6671, "lr": 9.061590105968208e-05, "epoch": 1.7471264367816093, "percentage": 58.24, "elapsed_time": "10:38:17", "remaining_time": "7:37:43"}
{"current_steps": 153, "total_steps": 261, "loss": 0.6459, "lr": 8.928015042125523e-05, "epoch": 1.7586206896551724, "percentage": 58.62, "elapsed_time": "10:41:30", "remaining_time": "7:32:50"}
{"current_steps": 154, "total_steps": 261, "loss": 0.6684, "lr": 8.79463319744677e-05, "epoch": 1.7701149425287355, "percentage": 59.0, "elapsed_time": "10:44:45", "remaining_time": "7:27:59"}
{"current_steps": 155, "total_steps": 261, "loss": 0.6593, "lr": 8.661468613247387e-05, "epoch": 1.7816091954022988, "percentage": 59.39, "elapsed_time": "10:47:58", "remaining_time": "7:23:07"}
{"current_steps": 156, "total_steps": 261, "loss": 0.6674, "lr": 8.528545291682838e-05, "epoch": 1.793103448275862, "percentage": 59.77, "elapsed_time": "10:51:10", "remaining_time": "7:18:17"}
{"current_steps": 157, "total_steps": 261, "loss": 0.6555, "lr": 8.395887191422397e-05, "epoch": 1.8045977011494254, "percentage": 60.15, "elapsed_time": "10:54:28", "remaining_time": "7:13:32"}
{"current_steps": 158, "total_steps": 261, "loss": 0.6591, "lr": 8.263518223330697e-05, "epoch": 1.8160919540229885, "percentage": 60.54, "elapsed_time": "10:57:42", "remaining_time": "7:08:45"}
{"current_steps": 159, "total_steps": 261, "loss": 0.6464, "lr": 8.131462246157953e-05, "epoch": 1.8275862068965516, "percentage": 60.92, "elapsed_time": "11:00:57", "remaining_time": "7:04:00"}
{"current_steps": 160, "total_steps": 261, "loss": 0.6545, "lr": 7.999743062239557e-05, "epoch": 1.839080459770115, "percentage": 61.3, "elapsed_time": "11:04:12", "remaining_time": "6:59:16"}
{"current_steps": 160, "total_steps": 261, "eval_loss": 0.6687291264533997, "epoch": 1.839080459770115, "percentage": 61.3, "elapsed_time": "11:13:44", "remaining_time": "7:05:18"}
{"current_steps": 161, "total_steps": 261, "loss": 0.6612, "lr": 7.868384413205842e-05, "epoch": 1.8505747126436782, "percentage": 61.69, "elapsed_time": "11:16:58", "remaining_time": "7:00:28"}
{"current_steps": 162, "total_steps": 261, "loss": 0.6566, "lr": 7.73740997570278e-05, "epoch": 1.8620689655172413, "percentage": 62.07, "elapsed_time": "11:20:13", "remaining_time": "6:55:41"}
{"current_steps": 163, "total_steps": 261, "loss": 0.6498, "lr": 7.606843357124426e-05, "epoch": 1.8735632183908046, "percentage": 62.45, "elapsed_time": "11:23:28", "remaining_time": "6:50:55"}
{"current_steps": 164, "total_steps": 261, "loss": 0.6582, "lr": 7.476708091357782e-05, "epoch": 1.8850574712643677, "percentage": 62.84, "elapsed_time": "11:26:42", "remaining_time": "6:46:09"}
{"current_steps": 165, "total_steps": 261, "loss": 0.6421, "lr": 7.347027634540993e-05, "epoch": 1.896551724137931, "percentage": 63.22, "elapsed_time": "11:29:58", "remaining_time": "6:41:26"}
{"current_steps": 166, "total_steps": 261, "loss": 0.6553, "lr": 7.217825360835473e-05, "epoch": 1.9080459770114944, "percentage": 63.6, "elapsed_time": "11:33:12", "remaining_time": "6:36:43"}
{"current_steps": 167, "total_steps": 261, "loss": 0.6587, "lr": 7.089124558212871e-05, "epoch": 1.9195402298850575, "percentage": 63.98, "elapsed_time": "11:36:27", "remaining_time": "6:32:00"}
{"current_steps": 168, "total_steps": 261, "loss": 0.6646, "lr": 6.960948424257532e-05, "epoch": 1.9310344827586206, "percentage": 64.37, "elapsed_time": "11:39:43", "remaining_time": "6:27:21"}
{"current_steps": 169, "total_steps": 261, "loss": 0.6669, "lr": 6.833320061985277e-05, "epoch": 1.9425287356321839, "percentage": 64.75, "elapsed_time": "11:42:56", "remaining_time": "6:22:39"}
{"current_steps": 170, "total_steps": 261, "loss": 0.648, "lr": 6.706262475679205e-05, "epoch": 1.9540229885057472, "percentage": 65.13, "elapsed_time": "11:46:09", "remaining_time": "6:18:00"}
{"current_steps": 170, "total_steps": 261, "eval_loss": 0.6668276786804199, "epoch": 1.9540229885057472, "percentage": 65.13, "elapsed_time": "11:55:43", "remaining_time": "6:23:07"}
{"current_steps": 171, "total_steps": 261, "loss": 0.6329, "lr": 6.579798566743314e-05, "epoch": 1.9655172413793105, "percentage": 65.52, "elapsed_time": "11:58:57", "remaining_time": "6:18:23"}
{"current_steps": 172, "total_steps": 261, "loss": 0.6645, "lr": 6.453951129574644e-05, "epoch": 1.9770114942528736, "percentage": 65.9, "elapsed_time": "12:02:10", "remaining_time": "6:13:40"}
{"current_steps": 173, "total_steps": 261, "loss": 0.6529, "lr": 6.328742847454724e-05, "epoch": 1.9885057471264367, "percentage": 66.28, "elapsed_time": "12:05:23", "remaining_time": "6:08:59"}
{"current_steps": 174, "total_steps": 261, "loss": 0.6619, "lr": 6.204196288461037e-05, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "12:08:35", "remaining_time": "6:04:17"}
{"current_steps": 175, "total_steps": 261, "loss": 0.6569, "lr": 6.080333901399251e-05, "epoch": 2.0114942528735633, "percentage": 67.05, "elapsed_time": "12:11:50", "remaining_time": "5:59:38"}
{"current_steps": 176, "total_steps": 261, "loss": 0.6406, "lr": 5.957178011756952e-05, "epoch": 2.0229885057471266, "percentage": 67.43, "elapsed_time": "12:15:05", "remaining_time": "5:55:00"}
{"current_steps": 177, "total_steps": 261, "loss": 0.6171, "lr": 5.834750817679606e-05, "epoch": 2.0344827586206895, "percentage": 67.82, "elapsed_time": "12:18:19", "remaining_time": "5:50:23"}
{"current_steps": 178, "total_steps": 261, "loss": 0.6391, "lr": 5.713074385969457e-05, "epoch": 2.045977011494253, "percentage": 68.2, "elapsed_time": "12:21:34", "remaining_time": "5:45:47"}
{"current_steps": 179, "total_steps": 261, "loss": 0.6474, "lr": 5.59217064810814e-05, "epoch": 2.057471264367816, "percentage": 68.58, "elapsed_time": "12:24:46", "remaining_time": "5:41:10"}
{"current_steps": 180, "total_steps": 261, "loss": 0.6285, "lr": 5.472061396303629e-05, "epoch": 2.0689655172413794, "percentage": 68.97, "elapsed_time": "12:28:01", "remaining_time": "5:36:36"}
{"current_steps": 180, "total_steps": 261, "eval_loss": 0.6662968993186951, "epoch": 2.0689655172413794, "percentage": 68.97, "elapsed_time": "12:37:32", "remaining_time": "5:40:53"}
{"current_steps": 181, "total_steps": 261, "loss": 0.6484, "lr": 5.3527682795623146e-05, "epoch": 2.0804597701149423, "percentage": 69.35, "elapsed_time": "12:40:46", "remaining_time": "5:36:15"}
{"current_steps": 182, "total_steps": 261, "loss": 0.6571, "lr": 5.234312799786921e-05, "epoch": 2.0919540229885056, "percentage": 69.73, "elapsed_time": "12:43:58", "remaining_time": "5:31:37"}
{"current_steps": 183, "total_steps": 261, "loss": 0.6489, "lr": 5.116716307900893e-05, "epoch": 2.103448275862069, "percentage": 70.11, "elapsed_time": "12:47:11", "remaining_time": "5:27:00"}
{"current_steps": 184, "total_steps": 261, "loss": 0.651, "lr": 5.000000000000002e-05, "epoch": 2.1149425287356323, "percentage": 70.5, "elapsed_time": "12:50:24", "remaining_time": "5:22:23"}
{"current_steps": 185, "total_steps": 261, "loss": 0.6395, "lr": 4.884184913531902e-05, "epoch": 2.1264367816091956, "percentage": 70.88, "elapsed_time": "12:53:39", "remaining_time": "5:17:49"}
{"current_steps": 186, "total_steps": 261, "loss": 0.6348, "lr": 4.7692919235042255e-05, "epoch": 2.1379310344827585, "percentage": 71.26, "elapsed_time": "12:56:50", "remaining_time": "5:13:14"}
{"current_steps": 187, "total_steps": 261, "loss": 0.6213, "lr": 4.6553417387219886e-05, "epoch": 2.1494252873563218, "percentage": 71.65, "elapsed_time": "13:00:04", "remaining_time": "5:08:41"}
{"current_steps": 188, "total_steps": 261, "loss": 0.6391, "lr": 4.542354898054953e-05, "epoch": 2.160919540229885, "percentage": 72.03, "elapsed_time": "13:03:17", "remaining_time": "5:04:09"}
{"current_steps": 189, "total_steps": 261, "loss": 0.6576, "lr": 4.430351766735609e-05, "epoch": 2.1724137931034484, "percentage": 72.41, "elapsed_time": "13:06:27", "remaining_time": "4:59:36"}
{"current_steps": 190, "total_steps": 261, "loss": 0.6652, "lr": 4.3193525326884435e-05, "epoch": 2.1839080459770113, "percentage": 72.8, "elapsed_time": "13:09:36", "remaining_time": "4:55:03"}
{"current_steps": 190, "total_steps": 261, "eval_loss": 0.6655236482620239, "epoch": 2.1839080459770113, "percentage": 72.8, "elapsed_time": "13:19:12", "remaining_time": "4:58:39"}
{"current_steps": 191, "total_steps": 261, "loss": 0.6373, "lr": 4.209377202891212e-05, "epoch": 2.1954022988505746, "percentage": 73.18, "elapsed_time": "13:22:26", "remaining_time": "4:54:05"}
{"current_steps": 192, "total_steps": 261, "loss": 0.6414, "lr": 4.100445599768774e-05, "epoch": 2.206896551724138, "percentage": 73.56, "elapsed_time": "13:25:38", "remaining_time": "4:49:31"}
{"current_steps": 193, "total_steps": 261, "loss": 0.6596, "lr": 3.99257735762021e-05, "epoch": 2.218390804597701, "percentage": 73.95, "elapsed_time": "13:28:48", "remaining_time": "4:44:58"}
{"current_steps": 194, "total_steps": 261, "loss": 0.6049, "lr": 3.885791919079878e-05, "epoch": 2.2298850574712645, "percentage": 74.33, "elapsed_time": "13:32:01", "remaining_time": "4:40:26"}
{"current_steps": 195, "total_steps": 261, "loss": 0.6302, "lr": 3.7801085316129615e-05, "epoch": 2.2413793103448274, "percentage": 74.71, "elapsed_time": "13:35:12", "remaining_time": "4:35:54"}
{"current_steps": 196, "total_steps": 261, "loss": 0.653, "lr": 3.675546244046228e-05, "epoch": 2.2528735632183907, "percentage": 75.1, "elapsed_time": "13:38:23", "remaining_time": "4:31:24"}
{"current_steps": 197, "total_steps": 261, "loss": 0.6467, "lr": 3.5721239031346066e-05, "epoch": 2.264367816091954, "percentage": 75.48, "elapsed_time": "13:41:35", "remaining_time": "4:26:54"}
{"current_steps": 198, "total_steps": 261, "loss": 0.6383, "lr": 3.469860150164152e-05, "epoch": 2.2758620689655173, "percentage": 75.86, "elapsed_time": "13:44:45", "remaining_time": "4:22:25"}
{"current_steps": 199, "total_steps": 261, "loss": 0.629, "lr": 3.36877341759205e-05, "epoch": 2.2873563218390807, "percentage": 76.25, "elapsed_time": "13:47:57", "remaining_time": "4:17:57"}
{"current_steps": 200, "total_steps": 261, "loss": 0.6307, "lr": 3.268881925724297e-05, "epoch": 2.2988505747126435, "percentage": 76.63, "elapsed_time": "13:51:08", "remaining_time": "4:13:29"}
{"current_steps": 200, "total_steps": 261, "eval_loss": 0.6646614074707031, "epoch": 2.2988505747126435, "percentage": 76.63, "elapsed_time": "14:00:42", "remaining_time": "4:16:24"}
{"current_steps": 201, "total_steps": 261, "loss": 0.6327, "lr": 3.170203679431584e-05, "epoch": 2.310344827586207, "percentage": 77.01, "elapsed_time": "14:04:18", "remaining_time": "4:12:01"}
{"current_steps": 202, "total_steps": 261, "loss": 0.6359, "lr": 3.072756464904006e-05, "epoch": 2.32183908045977, "percentage": 77.39, "elapsed_time": "14:07:31", "remaining_time": "4:07:32"}
{"current_steps": 203, "total_steps": 261, "loss": 0.6485, "lr": 2.976557846445225e-05, "epoch": 2.3333333333333335, "percentage": 77.78, "elapsed_time": "14:10:42", "remaining_time": "4:03:03"}
{"current_steps": 204, "total_steps": 261, "loss": 0.6402, "lr": 2.881625163306596e-05, "epoch": 2.344827586206897, "percentage": 78.16, "elapsed_time": "14:13:53", "remaining_time": "3:58:35"}
{"current_steps": 205, "total_steps": 261, "loss": 0.6327, "lr": 2.7879755265618555e-05, "epoch": 2.3563218390804597, "percentage": 78.54, "elapsed_time": "14:17:04", "remaining_time": "3:54:07"}
{"current_steps": 206, "total_steps": 261, "loss": 0.622, "lr": 2.6956258160229695e-05, "epoch": 2.367816091954023, "percentage": 78.93, "elapsed_time": "14:20:16", "remaining_time": "3:49:41"}
{"current_steps": 207, "total_steps": 261, "loss": 0.6387, "lr": 2.6045926771976303e-05, "epoch": 2.3793103448275863, "percentage": 79.31, "elapsed_time": "14:23:27", "remaining_time": "3:45:14"}
{"current_steps": 208, "total_steps": 261, "loss": 0.6238, "lr": 2.514892518288988e-05, "epoch": 2.3908045977011496, "percentage": 79.69, "elapsed_time": "14:26:41", "remaining_time": "3:40:50"}
{"current_steps": 209, "total_steps": 261, "loss": 0.6294, "lr": 2.4265415072382016e-05, "epoch": 2.4022988505747125, "percentage": 80.08, "elapsed_time": "14:29:51", "remaining_time": "3:36:25"}
{"current_steps": 210, "total_steps": 261, "loss": 0.6383, "lr": 2.339555568810221e-05, "epoch": 2.413793103448276, "percentage": 80.46, "elapsed_time": "14:33:01", "remaining_time": "3:32:01"}
{"current_steps": 210, "total_steps": 261, "eval_loss": 0.664122462272644, "epoch": 2.413793103448276, "percentage": 80.46, "elapsed_time": "14:42:33", "remaining_time": "3:34:20"}
{"current_steps": 211, "total_steps": 261, "loss": 0.651, "lr": 2.2539503817234553e-05, "epoch": 2.425287356321839, "percentage": 80.84, "elapsed_time": "14:45:46", "remaining_time": "3:29:54"}
{"current_steps": 212, "total_steps": 261, "loss": 0.634, "lr": 2.1697413758237784e-05, "epoch": 2.4367816091954024, "percentage": 81.23, "elapsed_time": "14:48:58", "remaining_time": "3:25:28"}
{"current_steps": 213, "total_steps": 261, "loss": 0.626, "lr": 2.0869437293033835e-05, "epoch": 2.4482758620689653, "percentage": 81.61, "elapsed_time": "14:52:10", "remaining_time": "3:21:03"}
{"current_steps": 214, "total_steps": 261, "loss": 0.6321, "lr": 2.0055723659649904e-05, "epoch": 2.4597701149425286, "percentage": 81.99, "elapsed_time": "14:55:20", "remaining_time": "3:16:38"}
{"current_steps": 215, "total_steps": 261, "loss": 0.644, "lr": 1.9256419525319313e-05, "epoch": 2.471264367816092, "percentage": 82.38, "elapsed_time": "14:58:31", "remaining_time": "3:12:14"}
{"current_steps": 216, "total_steps": 261, "loss": 0.6242, "lr": 1.8471668960045574e-05, "epoch": 2.4827586206896552, "percentage": 82.76, "elapsed_time": "15:01:42", "remaining_time": "3:07:51"}
{"current_steps": 217, "total_steps": 261, "loss": 0.6525, "lr": 1.7701613410634365e-05, "epoch": 2.4942528735632186, "percentage": 83.14, "elapsed_time": "15:04:56", "remaining_time": "3:03:29"}
{"current_steps": 218, "total_steps": 261, "loss": 0.6026, "lr": 1.6946391675198836e-05, "epoch": 2.5057471264367814, "percentage": 83.52, "elapsed_time": "15:08:06", "remaining_time": "2:59:07"}
{"current_steps": 219, "total_steps": 261, "loss": 0.6285, "lr": 1.620613987814189e-05, "epoch": 2.5172413793103448, "percentage": 83.91, "elapsed_time": "15:11:19", "remaining_time": "2:54:46"}
{"current_steps": 220, "total_steps": 261, "loss": 0.6394, "lr": 1.5480991445620542e-05, "epoch": 2.528735632183908, "percentage": 84.29, "elapsed_time": "15:14:29", "remaining_time": "2:50:25"}
{"current_steps": 220, "total_steps": 261, "eval_loss": 0.6636479496955872, "epoch": 2.528735632183908, "percentage": 84.29, "elapsed_time": "15:24:02", "remaining_time": "2:52:12"}
{"current_steps": 221, "total_steps": 261, "loss": 0.6399, "lr": 1.4771077081496654e-05, "epoch": 2.5402298850574714, "percentage": 84.67, "elapsed_time": "15:27:14", "remaining_time": "2:47:49"}
{"current_steps": 222, "total_steps": 261, "loss": 0.6201, "lr": 1.4076524743778319e-05, "epoch": 2.5517241379310347, "percentage": 85.06, "elapsed_time": "15:30:24", "remaining_time": "2:43:26"}
{"current_steps": 223, "total_steps": 261, "loss": 0.618, "lr": 1.339745962155613e-05, "epoch": 2.5632183908045976, "percentage": 85.44, "elapsed_time": "15:33:37", "remaining_time": "2:39:05"}
{"current_steps": 224, "total_steps": 261, "loss": 0.6531, "lr": 1.2734004112438568e-05, "epoch": 2.574712643678161, "percentage": 85.82, "elapsed_time": "15:36:48", "remaining_time": "2:34:44"}
{"current_steps": 225, "total_steps": 261, "loss": 0.6364, "lr": 1.2086277800490554e-05, "epoch": 2.586206896551724, "percentage": 86.21, "elapsed_time": "15:39:58", "remaining_time": "2:30:23"}
{"current_steps": 226, "total_steps": 261, "loss": 0.6222, "lr": 1.1454397434679021e-05, "epoch": 2.5977011494252875, "percentage": 86.59, "elapsed_time": "15:43:14", "remaining_time": "2:26:04"}
{"current_steps": 227, "total_steps": 261, "loss": 0.6453, "lr": 1.083847690782972e-05, "epoch": 2.609195402298851, "percentage": 86.97, "elapsed_time": "15:46:28", "remaining_time": "2:21:45"}
{"current_steps": 228, "total_steps": 261, "loss": 0.6613, "lr": 1.0238627236098619e-05, "epoch": 2.6206896551724137, "percentage": 87.36, "elapsed_time": "15:49:40", "remaining_time": "2:17:27"}
{"current_steps": 229, "total_steps": 261, "loss": 0.6172, "lr": 9.65495653896179e-06, "epoch": 2.632183908045977, "percentage": 87.74, "elapsed_time": "15:52:54", "remaining_time": "2:13:09"}
{"current_steps": 230, "total_steps": 261, "loss": 0.632, "lr": 9.08757001972762e-06, "epoch": 2.6436781609195403, "percentage": 88.12, "elapsed_time": "15:56:04", "remaining_time": "2:08:51"}
{"current_steps": 230, "total_steps": 261, "eval_loss": 0.6632330417633057, "epoch": 2.6436781609195403, "percentage": 88.12, "elapsed_time": "16:05:34", "remaining_time": "2:10:08"}
{"current_steps": 231, "total_steps": 261, "loss": 0.6496, "lr": 8.536569946574546e-06, "epoch": 2.655172413793103, "percentage": 88.51, "elapsed_time": "16:08:46", "remaining_time": "2:05:48"}
{"current_steps": 232, "total_steps": 261, "loss": 0.6426, "lr": 8.002055634117578e-06, "epoch": 2.6666666666666665, "percentage": 88.89, "elapsed_time": "16:11:54", "remaining_time": "2:01:29"}
{"current_steps": 233, "total_steps": 261, "loss": 0.6352, "lr": 7.4841234255076495e-06, "epoch": 2.67816091954023, "percentage": 89.27, "elapsed_time": "16:15:07", "remaining_time": "1:57:10"}
{"current_steps": 234, "total_steps": 261, "loss": 0.6339, "lr": 6.9828666750661795e-06, "epoch": 2.689655172413793, "percentage": 89.66, "elapsed_time": "16:18:19", "remaining_time": "1:52:52"}
{"current_steps": 235, "total_steps": 261, "loss": 0.6415, "lr": 6.498375731458528e-06, "epoch": 2.7011494252873565, "percentage": 90.04, "elapsed_time": "16:21:30", "remaining_time": "1:48:35"}
{"current_steps": 236, "total_steps": 261, "loss": 0.6339, "lr": 6.030737921409169e-06, "epoch": 2.7126436781609193, "percentage": 90.42, "elapsed_time": "16:24:39", "remaining_time": "1:44:18"}
{"current_steps": 237, "total_steps": 261, "loss": 0.6152, "lr": 5.580037533961546e-06, "epoch": 2.7241379310344827, "percentage": 90.8, "elapsed_time": "16:27:50", "remaining_time": "1:40:02"}
{"current_steps": 238, "total_steps": 261, "loss": 0.6227, "lr": 5.146355805285452e-06, "epoch": 2.735632183908046, "percentage": 91.19, "elapsed_time": "16:31:00", "remaining_time": "1:35:46"}
{"current_steps": 239, "total_steps": 261, "loss": 0.6368, "lr": 4.729770904034647e-06, "epoch": 2.7471264367816093, "percentage": 91.57, "elapsed_time": "16:34:11", "remaining_time": "1:31:30"}
{"current_steps": 240, "total_steps": 261, "loss": 0.6416, "lr": 4.3303579172574885e-06, "epoch": 2.7586206896551726, "percentage": 91.95, "elapsed_time": "16:37:21", "remaining_time": "1:27:16"}
{"current_steps": 240, "total_steps": 261, "eval_loss": 0.6631439328193665, "epoch": 2.7586206896551726, "percentage": 91.95, "elapsed_time": "16:46:53", "remaining_time": "1:28:06"}
{"current_steps": 241, "total_steps": 261, "loss": 0.6332, "lr": 3.948188836862776e-06, "epoch": 2.7701149425287355, "percentage": 92.34, "elapsed_time": "16:50:06", "remaining_time": "1:23:49"}
{"current_steps": 242, "total_steps": 261, "loss": 0.6429, "lr": 3.5833325466437694e-06, "epoch": 2.781609195402299, "percentage": 92.72, "elapsed_time": "16:53:14", "remaining_time": "1:19:33"}
{"current_steps": 243, "total_steps": 261, "loss": 0.6149, "lr": 3.2358548098621932e-06, "epoch": 2.793103448275862, "percentage": 93.1, "elapsed_time": "16:56:24", "remaining_time": "1:15:17"}
{"current_steps": 244, "total_steps": 261, "loss": 0.6468, "lr": 2.905818257394799e-06, "epoch": 2.8045977011494254, "percentage": 93.49, "elapsed_time": "16:59:35", "remaining_time": "1:11:02"}
{"current_steps": 245, "total_steps": 261, "loss": 0.6319, "lr": 2.5932823764445392e-06, "epoch": 2.8160919540229887, "percentage": 93.87, "elapsed_time": "17:02:44", "remaining_time": "1:06:47"}
{"current_steps": 246, "total_steps": 261, "loss": 0.6093, "lr": 2.2983034998182997e-06, "epoch": 2.8275862068965516, "percentage": 94.25, "elapsed_time": "17:05:53", "remaining_time": "1:02:33"}
{"current_steps": 247, "total_steps": 261, "loss": 0.6433, "lr": 2.0209347957732328e-06, "epoch": 2.839080459770115, "percentage": 94.64, "elapsed_time": "17:09:03", "remaining_time": "0:58:19"}
{"current_steps": 248, "total_steps": 261, "loss": 0.6335, "lr": 1.7612262584335237e-06, "epoch": 2.8505747126436782, "percentage": 95.02, "elapsed_time": "17:12:14", "remaining_time": "0:54:06"}
{"current_steps": 249, "total_steps": 261, "loss": 0.6285, "lr": 1.5192246987791981e-06, "epoch": 2.862068965517241, "percentage": 95.4, "elapsed_time": "17:15:23", "remaining_time": "0:49:53"}
{"current_steps": 250, "total_steps": 261, "loss": 0.6228, "lr": 1.2949737362087156e-06, "epoch": 2.873563218390805, "percentage": 95.79, "elapsed_time": "17:18:32", "remaining_time": "0:45:41"}
{"current_steps": 250, "total_steps": 261, "eval_loss": 0.6631085276603699, "epoch": 2.873563218390805, "percentage": 95.79, "elapsed_time": "17:28:00", "remaining_time": "0:46:06"}
{"current_steps": 251, "total_steps": 261, "loss": 0.6338, "lr": 1.0885137906768372e-06, "epoch": 2.8850574712643677, "percentage": 96.17, "elapsed_time": "17:31:31", "remaining_time": "0:41:53"}
{"current_steps": 252, "total_steps": 261, "loss": 0.6277, "lr": 8.998820754091531e-07, "epoch": 2.896551724137931, "percentage": 96.55, "elapsed_time": "17:34:41", "remaining_time": "0:37:40"}
{"current_steps": 253, "total_steps": 261, "loss": 0.6186, "lr": 7.291125901946027e-07, "epoch": 2.9080459770114944, "percentage": 96.93, "elapsed_time": "17:37:48", "remaining_time": "0:33:26"}
{"current_steps": 254, "total_steps": 261, "loss": 0.6428, "lr": 5.762361152572115e-07, "epoch": 2.9195402298850572, "percentage": 97.32, "elapsed_time": "17:40:59", "remaining_time": "0:29:14"}
{"current_steps": 255, "total_steps": 261, "loss": 0.6311, "lr": 4.412802057081278e-07, "epoch": 2.9310344827586206, "percentage": 97.7, "elapsed_time": "17:44:08", "remaining_time": "0:25:02"}
{"current_steps": 256, "total_steps": 261, "loss": 0.6268, "lr": 3.2426918657900704e-07, "epoch": 2.942528735632184, "percentage": 98.08, "elapsed_time": "17:47:18", "remaining_time": "0:20:50"}
{"current_steps": 257, "total_steps": 261, "loss": 0.6289, "lr": 2.2522414843748618e-07, "epoch": 2.954022988505747, "percentage": 98.47, "elapsed_time": "17:50:28", "remaining_time": "0:16:39"}
{"current_steps": 258, "total_steps": 261, "loss": 0.6176, "lr": 1.4416294358582384e-07, "epoch": 2.9655172413793105, "percentage": 98.85, "elapsed_time": "17:53:37", "remaining_time": "0:12:29"}
{"current_steps": 259, "total_steps": 261, "loss": 0.6537, "lr": 8.110018284304133e-08, "epoch": 2.9770114942528734, "percentage": 99.23, "elapsed_time": "17:56:48", "remaining_time": "0:08:18"}
{"current_steps": 260, "total_steps": 261, "loss": 0.6316, "lr": 3.60472329114625e-08, "epoch": 2.9885057471264367, "percentage": 99.62, "elapsed_time": "17:59:57", "remaining_time": "0:04:09"}
{"current_steps": 260, "total_steps": 261, "eval_loss": 0.6630376577377319, "epoch": 2.9885057471264367, "percentage": 99.62, "elapsed_time": "18:09:22", "remaining_time": "0:04:11"}
{"current_steps": 261, "total_steps": 261, "loss": 0.6399, "lr": 9.012214327897006e-09, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "18:12:33", "remaining_time": "0:00:00"}
{"current_steps": 261, "total_steps": 261, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "18:12:54", "remaining_time": "0:00:00"}