distill_r1_code_evol_instruct / trainer_log.jsonl
sedrickkeh's picture
Training in progress, epoch 2
a1bff54 verified
{"current_steps": 1, "total_steps": 78, "loss": 1.2115, "lr": 1.25e-06, "epoch": 0.038338658146964855, "percentage": 1.28, "elapsed_time": "0:01:06", "remaining_time": "1:25:07"}
{"current_steps": 2, "total_steps": 78, "loss": 1.2297, "lr": 2.5e-06, "epoch": 0.07667731629392971, "percentage": 2.56, "elapsed_time": "0:02:02", "remaining_time": "1:17:38"}
{"current_steps": 3, "total_steps": 78, "loss": 1.2244, "lr": 3.7500000000000005e-06, "epoch": 0.11501597444089456, "percentage": 3.85, "elapsed_time": "0:03:03", "remaining_time": "1:16:31"}
{"current_steps": 4, "total_steps": 78, "loss": 1.2321, "lr": 5e-06, "epoch": 0.15335463258785942, "percentage": 5.13, "elapsed_time": "0:04:06", "remaining_time": "1:15:53"}
{"current_steps": 5, "total_steps": 78, "loss": 1.1354, "lr": 6.25e-06, "epoch": 0.19169329073482427, "percentage": 6.41, "elapsed_time": "0:05:01", "remaining_time": "1:13:23"}
{"current_steps": 6, "total_steps": 78, "loss": 1.1373, "lr": 7.500000000000001e-06, "epoch": 0.23003194888178913, "percentage": 7.69, "elapsed_time": "0:05:53", "remaining_time": "1:10:41"}
{"current_steps": 7, "total_steps": 78, "loss": 1.1164, "lr": 8.750000000000001e-06, "epoch": 0.268370607028754, "percentage": 8.97, "elapsed_time": "0:06:35", "remaining_time": "1:06:52"}
{"current_steps": 8, "total_steps": 78, "loss": 1.1487, "lr": 1e-05, "epoch": 0.30670926517571884, "percentage": 10.26, "elapsed_time": "0:07:23", "remaining_time": "1:04:43"}
{"current_steps": 9, "total_steps": 78, "loss": 1.1092, "lr": 9.994965332706574e-06, "epoch": 0.3450479233226837, "percentage": 11.54, "elapsed_time": "0:08:19", "remaining_time": "1:03:50"}
{"current_steps": 10, "total_steps": 78, "loss": 1.0593, "lr": 9.979871469976197e-06, "epoch": 0.38338658146964855, "percentage": 12.82, "elapsed_time": "0:09:08", "remaining_time": "1:02:07"}
{"current_steps": 11, "total_steps": 78, "loss": 1.0775, "lr": 9.954748808839675e-06, "epoch": 0.4217252396166134, "percentage": 14.1, "elapsed_time": "0:10:00", "remaining_time": "1:00:59"}
{"current_steps": 12, "total_steps": 78, "loss": 1.0507, "lr": 9.91964794299315e-06, "epoch": 0.46006389776357826, "percentage": 15.38, "elapsed_time": "0:10:51", "remaining_time": "0:59:41"}
{"current_steps": 13, "total_steps": 78, "loss": 1.0538, "lr": 9.874639560909118e-06, "epoch": 0.4984025559105431, "percentage": 16.67, "elapsed_time": "0:11:39", "remaining_time": "0:58:19"}
{"current_steps": 14, "total_steps": 78, "loss": 1.0135, "lr": 9.819814303479268e-06, "epoch": 0.536741214057508, "percentage": 17.95, "elapsed_time": "0:12:38", "remaining_time": "0:57:48"}
{"current_steps": 15, "total_steps": 78, "loss": 0.9451, "lr": 9.755282581475769e-06, "epoch": 0.5750798722044729, "percentage": 19.23, "elapsed_time": "0:13:24", "remaining_time": "0:56:17"}
{"current_steps": 16, "total_steps": 78, "loss": 0.9612, "lr": 9.681174353198687e-06, "epoch": 0.6134185303514377, "percentage": 20.51, "elapsed_time": "0:14:16", "remaining_time": "0:55:17"}
{"current_steps": 17, "total_steps": 78, "loss": 0.933, "lr": 9.597638862757255e-06, "epoch": 0.6517571884984026, "percentage": 21.79, "elapsed_time": "0:15:02", "remaining_time": "0:53:58"}
{"current_steps": 18, "total_steps": 78, "loss": 0.952, "lr": 9.504844339512096e-06, "epoch": 0.6900958466453674, "percentage": 23.08, "elapsed_time": "0:15:52", "remaining_time": "0:52:54"}
{"current_steps": 19, "total_steps": 78, "loss": 0.9445, "lr": 9.40297765928369e-06, "epoch": 0.7284345047923323, "percentage": 24.36, "elapsed_time": "0:16:40", "remaining_time": "0:51:48"}
{"current_steps": 20, "total_steps": 78, "loss": 0.9118, "lr": 9.292243968009332e-06, "epoch": 0.7667731629392971, "percentage": 25.64, "elapsed_time": "0:17:29", "remaining_time": "0:50:44"}
{"current_steps": 21, "total_steps": 78, "loss": 0.9449, "lr": 9.172866268606514e-06, "epoch": 0.805111821086262, "percentage": 26.92, "elapsed_time": "0:18:23", "remaining_time": "0:49:55"}
{"current_steps": 22, "total_steps": 78, "loss": 0.9324, "lr": 9.045084971874738e-06, "epoch": 0.8434504792332268, "percentage": 28.21, "elapsed_time": "0:19:17", "remaining_time": "0:49:07"}
{"current_steps": 23, "total_steps": 78, "loss": 0.9171, "lr": 8.90915741234015e-06, "epoch": 0.8817891373801917, "percentage": 29.49, "elapsed_time": "0:20:11", "remaining_time": "0:48:16"}
{"current_steps": 24, "total_steps": 78, "loss": 0.8944, "lr": 8.765357330018056e-06, "epoch": 0.9201277955271565, "percentage": 30.77, "elapsed_time": "0:20:57", "remaining_time": "0:47:09"}
{"current_steps": 25, "total_steps": 78, "loss": 0.9277, "lr": 8.613974319136959e-06, "epoch": 0.9584664536741214, "percentage": 32.05, "elapsed_time": "0:21:51", "remaining_time": "0:46:21"}
{"current_steps": 26, "total_steps": 78, "loss": 0.8892, "lr": 8.455313244934324e-06, "epoch": 0.9968051118210862, "percentage": 33.33, "elapsed_time": "0:22:37", "remaining_time": "0:45:14"}
{"current_steps": 27, "total_steps": 78, "loss": 1.6425, "lr": 8.289693629698564e-06, "epoch": 1.035143769968051, "percentage": 34.62, "elapsed_time": "0:24:21", "remaining_time": "0:46:01"}
{"current_steps": 28, "total_steps": 78, "loss": 0.8882, "lr": 8.117449009293668e-06, "epoch": 1.073482428115016, "percentage": 35.9, "elapsed_time": "0:25:16", "remaining_time": "0:45:07"}
{"current_steps": 29, "total_steps": 78, "loss": 0.8174, "lr": 7.938926261462366e-06, "epoch": 1.1118210862619808, "percentage": 37.18, "elapsed_time": "0:26:03", "remaining_time": "0:44:01"}
{"current_steps": 30, "total_steps": 78, "loss": 0.8943, "lr": 7.754484907260513e-06, "epoch": 1.1501597444089458, "percentage": 38.46, "elapsed_time": "0:27:06", "remaining_time": "0:43:21"}
{"current_steps": 31, "total_steps": 78, "loss": 0.9146, "lr": 7.564496387029532e-06, "epoch": 1.1884984025559104, "percentage": 39.74, "elapsed_time": "0:28:06", "remaining_time": "0:42:36"}
{"current_steps": 32, "total_steps": 78, "loss": 0.8061, "lr": 7.369343312364994e-06, "epoch": 1.2268370607028753, "percentage": 41.03, "elapsed_time": "0:28:46", "remaining_time": "0:41:22"}
{"current_steps": 33, "total_steps": 78, "loss": 0.9283, "lr": 7.169418695587791e-06, "epoch": 1.2651757188498403, "percentage": 42.31, "elapsed_time": "0:29:34", "remaining_time": "0:40:19"}
{"current_steps": 34, "total_steps": 78, "loss": 0.8699, "lr": 6.965125158269619e-06, "epoch": 1.3035143769968052, "percentage": 43.59, "elapsed_time": "0:30:20", "remaining_time": "0:39:15"}
{"current_steps": 35, "total_steps": 78, "loss": 0.8696, "lr": 6.7568741204067145e-06, "epoch": 1.34185303514377, "percentage": 44.87, "elapsed_time": "0:31:21", "remaining_time": "0:38:31"}
{"current_steps": 36, "total_steps": 78, "loss": 0.883, "lr": 6.545084971874738e-06, "epoch": 1.3801916932907348, "percentage": 46.15, "elapsed_time": "0:32:13", "remaining_time": "0:37:36"}
{"current_steps": 37, "total_steps": 78, "loss": 0.844, "lr": 6.330184227833376e-06, "epoch": 1.4185303514376997, "percentage": 47.44, "elapsed_time": "0:33:10", "remaining_time": "0:36:45"}
{"current_steps": 38, "total_steps": 78, "loss": 0.9176, "lr": 6.112604669781572e-06, "epoch": 1.4568690095846646, "percentage": 48.72, "elapsed_time": "0:34:01", "remaining_time": "0:35:48"}
{"current_steps": 39, "total_steps": 78, "loss": 0.8606, "lr": 5.892784473993184e-06, "epoch": 1.4952076677316293, "percentage": 50.0, "elapsed_time": "0:34:56", "remaining_time": "0:34:56"}
{"current_steps": 40, "total_steps": 78, "loss": 0.8542, "lr": 5.671166329088278e-06, "epoch": 1.5335463258785942, "percentage": 51.28, "elapsed_time": "0:35:43", "remaining_time": "0:33:55"}
{"current_steps": 41, "total_steps": 78, "loss": 0.8272, "lr": 5.448196544517168e-06, "epoch": 1.571884984025559, "percentage": 52.56, "elapsed_time": "0:36:38", "remaining_time": "0:33:03"}
{"current_steps": 42, "total_steps": 78, "loss": 0.8341, "lr": 5.224324151752575e-06, "epoch": 1.610223642172524, "percentage": 53.85, "elapsed_time": "0:37:33", "remaining_time": "0:32:11"}
{"current_steps": 43, "total_steps": 78, "loss": 0.8258, "lr": 5e-06, "epoch": 1.648562300319489, "percentage": 55.13, "elapsed_time": "0:38:14", "remaining_time": "0:31:07"}
{"current_steps": 44, "total_steps": 78, "loss": 0.8092, "lr": 4.775675848247427e-06, "epoch": 1.6869009584664538, "percentage": 56.41, "elapsed_time": "0:39:03", "remaining_time": "0:30:11"}
{"current_steps": 45, "total_steps": 78, "loss": 0.8257, "lr": 4.551803455482833e-06, "epoch": 1.7252396166134185, "percentage": 57.69, "elapsed_time": "0:39:50", "remaining_time": "0:29:13"}
{"current_steps": 46, "total_steps": 78, "loss": 0.9231, "lr": 4.3288336709117246e-06, "epoch": 1.7635782747603834, "percentage": 58.97, "elapsed_time": "0:40:54", "remaining_time": "0:28:27"}
{"current_steps": 47, "total_steps": 78, "loss": 0.8637, "lr": 4.107215526006818e-06, "epoch": 1.8019169329073481, "percentage": 60.26, "elapsed_time": "0:42:01", "remaining_time": "0:27:43"}
{"current_steps": 48, "total_steps": 78, "loss": 0.8697, "lr": 3.887395330218429e-06, "epoch": 1.840255591054313, "percentage": 61.54, "elapsed_time": "0:42:55", "remaining_time": "0:26:49"}
{"current_steps": 49, "total_steps": 78, "loss": 0.8528, "lr": 3.669815772166625e-06, "epoch": 1.878594249201278, "percentage": 62.82, "elapsed_time": "0:43:48", "remaining_time": "0:25:55"}
{"current_steps": 50, "total_steps": 78, "loss": 0.8719, "lr": 3.4549150281252635e-06, "epoch": 1.9169329073482428, "percentage": 64.1, "elapsed_time": "0:44:38", "remaining_time": "0:25:00"}
{"current_steps": 51, "total_steps": 78, "loss": 0.8398, "lr": 3.2431258795932863e-06, "epoch": 1.9552715654952078, "percentage": 65.38, "elapsed_time": "0:45:28", "remaining_time": "0:24:04"}
{"current_steps": 52, "total_steps": 78, "loss": 0.8779, "lr": 3.0348748417303826e-06, "epoch": 1.9936102236421727, "percentage": 66.67, "elapsed_time": "0:46:15", "remaining_time": "0:23:07"}
{"current_steps": 53, "total_steps": 78, "loss": 1.4471, "lr": 2.83058130441221e-06, "epoch": 2.0319488817891376, "percentage": 67.95, "elapsed_time": "0:48:18", "remaining_time": "0:22:47"}
{"current_steps": 54, "total_steps": 78, "loss": 0.8478, "lr": 2.6306566876350072e-06, "epoch": 2.070287539936102, "percentage": 69.23, "elapsed_time": "0:49:15", "remaining_time": "0:21:53"}
{"current_steps": 55, "total_steps": 78, "loss": 0.6975, "lr": 2.43550361297047e-06, "epoch": 2.108626198083067, "percentage": 70.51, "elapsed_time": "0:50:05", "remaining_time": "0:20:56"}
{"current_steps": 56, "total_steps": 78, "loss": 0.8813, "lr": 2.245515092739488e-06, "epoch": 2.146964856230032, "percentage": 71.79, "elapsed_time": "0:50:54", "remaining_time": "0:19:59"}
{"current_steps": 57, "total_steps": 78, "loss": 0.7837, "lr": 2.061073738537635e-06, "epoch": 2.1853035143769968, "percentage": 73.08, "elapsed_time": "0:51:43", "remaining_time": "0:19:03"}
{"current_steps": 58, "total_steps": 78, "loss": 0.813, "lr": 1.8825509907063328e-06, "epoch": 2.2236421725239617, "percentage": 74.36, "elapsed_time": "0:52:28", "remaining_time": "0:18:05"}
{"current_steps": 59, "total_steps": 78, "loss": 0.8443, "lr": 1.7103063703014372e-06, "epoch": 2.2619808306709266, "percentage": 75.64, "elapsed_time": "0:53:27", "remaining_time": "0:17:13"}
{"current_steps": 60, "total_steps": 78, "loss": 0.8034, "lr": 1.544686755065677e-06, "epoch": 2.3003194888178915, "percentage": 76.92, "elapsed_time": "0:54:22", "remaining_time": "0:16:18"}
{"current_steps": 61, "total_steps": 78, "loss": 0.8218, "lr": 1.3860256808630429e-06, "epoch": 2.3386581469648564, "percentage": 78.21, "elapsed_time": "0:55:07", "remaining_time": "0:15:21"}
{"current_steps": 62, "total_steps": 78, "loss": 0.8328, "lr": 1.234642669981946e-06, "epoch": 2.376996805111821, "percentage": 79.49, "elapsed_time": "0:55:52", "remaining_time": "0:14:25"}
{"current_steps": 63, "total_steps": 78, "loss": 0.8163, "lr": 1.0908425876598512e-06, "epoch": 2.415335463258786, "percentage": 80.77, "elapsed_time": "0:56:38", "remaining_time": "0:13:29"}
{"current_steps": 64, "total_steps": 78, "loss": 0.8503, "lr": 9.549150281252633e-07, "epoch": 2.4536741214057507, "percentage": 82.05, "elapsed_time": "0:57:32", "remaining_time": "0:12:35"}
{"current_steps": 65, "total_steps": 78, "loss": 0.8144, "lr": 8.271337313934869e-07, "epoch": 2.4920127795527156, "percentage": 83.33, "elapsed_time": "0:58:25", "remaining_time": "0:11:41"}
{"current_steps": 66, "total_steps": 78, "loss": 0.8012, "lr": 7.077560319906696e-07, "epoch": 2.5303514376996805, "percentage": 84.62, "elapsed_time": "0:59:18", "remaining_time": "0:10:47"}
{"current_steps": 67, "total_steps": 78, "loss": 0.8369, "lr": 5.9702234071631e-07, "epoch": 2.5686900958466454, "percentage": 85.9, "elapsed_time": "1:00:09", "remaining_time": "0:09:52"}
{"current_steps": 68, "total_steps": 78, "loss": 0.8044, "lr": 4.951556604879049e-07, "epoch": 2.6070287539936103, "percentage": 87.18, "elapsed_time": "1:01:06", "remaining_time": "0:08:59"}
{"current_steps": 69, "total_steps": 78, "loss": 0.8484, "lr": 4.0236113724274716e-07, "epoch": 2.6453674121405752, "percentage": 88.46, "elapsed_time": "1:01:57", "remaining_time": "0:08:04"}
{"current_steps": 70, "total_steps": 78, "loss": 0.8267, "lr": 3.18825646801314e-07, "epoch": 2.68370607028754, "percentage": 89.74, "elapsed_time": "1:02:52", "remaining_time": "0:07:11"}
{"current_steps": 71, "total_steps": 78, "loss": 0.7495, "lr": 2.447174185242324e-07, "epoch": 2.722044728434505, "percentage": 91.03, "elapsed_time": "1:03:38", "remaining_time": "0:06:16"}
{"current_steps": 72, "total_steps": 78, "loss": 0.8841, "lr": 1.801856965207338e-07, "epoch": 2.7603833865814695, "percentage": 92.31, "elapsed_time": "1:04:37", "remaining_time": "0:05:23"}
{"current_steps": 73, "total_steps": 78, "loss": 0.7166, "lr": 1.253604390908819e-07, "epoch": 2.7987220447284344, "percentage": 93.59, "elapsed_time": "1:05:19", "remaining_time": "0:04:28"}
{"current_steps": 74, "total_steps": 78, "loss": 0.8212, "lr": 8.035205700685167e-08, "epoch": 2.8370607028753994, "percentage": 94.87, "elapsed_time": "1:06:17", "remaining_time": "0:03:35"}
{"current_steps": 75, "total_steps": 78, "loss": 0.8516, "lr": 4.52511911603265e-08, "epoch": 2.8753993610223643, "percentage": 96.15, "elapsed_time": "1:07:10", "remaining_time": "0:02:41"}
{"current_steps": 76, "total_steps": 78, "loss": 0.7457, "lr": 2.012853002380466e-08, "epoch": 2.913738019169329, "percentage": 97.44, "elapsed_time": "1:07:58", "remaining_time": "0:01:47"}
{"current_steps": 77, "total_steps": 78, "loss": 0.8133, "lr": 5.034667293427053e-09, "epoch": 2.952076677316294, "percentage": 98.72, "elapsed_time": "1:08:44", "remaining_time": "0:00:53"}
{"current_steps": 78, "total_steps": 78, "loss": 0.7707, "lr": 0.0, "epoch": 2.9904153354632586, "percentage": 100.0, "elapsed_time": "1:09:36", "remaining_time": "0:00:00"}
{"current_steps": 78, "total_steps": 78, "epoch": 2.9904153354632586, "percentage": 100.0, "elapsed_time": "1:11:54", "remaining_time": "0:00:00"}