|
{"current_steps": 1, "total_steps": 34, "loss": 1.4719, "lr": 4.989335440737586e-05, "epoch": 0.02877697841726619, "percentage": 2.94, "elapsed_time": "0:02:58", "remaining_time": "1:38:02", "throughput": 11764.63, "total_tokens": 2097152} |
|
{"current_steps": 2, "total_steps": 34, "loss": 1.4237, "lr": 4.957432749209755e-05, "epoch": 0.05755395683453238, "percentage": 5.88, "elapsed_time": "0:05:48", "remaining_time": "1:32:57", "throughput": 12031.95, "total_tokens": 4194304} |
|
{"current_steps": 3, "total_steps": 34, "loss": 1.3171, "lr": 4.9045641079320484e-05, "epoch": 0.08633093525179857, "percentage": 8.82, "elapsed_time": "0:08:38", "remaining_time": "1:29:22", "throughput": 12123.74, "total_tokens": 6291456} |
|
{"current_steps": 4, "total_steps": 34, "loss": 1.262, "lr": 4.8311805735108894e-05, "epoch": 0.11510791366906475, "percentage": 11.76, "elapsed_time": "0:11:29", "remaining_time": "1:26:09", "throughput": 12169.2, "total_tokens": 8388608} |
|
{"current_steps": 5, "total_steps": 34, "loss": 1.2216, "lr": 4.7379082283876566e-05, "epoch": 0.14388489208633093, "percentage": 14.71, "elapsed_time": "0:14:19", "remaining_time": "1:23:03", "throughput": 12203.19, "total_tokens": 10485760} |
|
{"current_steps": 6, "total_steps": 34, "loss": 1.1564, "lr": 4.625542839324036e-05, "epoch": 0.17266187050359713, "percentage": 17.65, "elapsed_time": "0:17:09", "remaining_time": "1:20:05", "throughput": 12218.23, "total_tokens": 12582912} |
|
{"current_steps": 7, "total_steps": 34, "loss": 1.1289, "lr": 4.4950430682006e-05, "epoch": 0.2014388489208633, "percentage": 20.59, "elapsed_time": "0:20:00", "remaining_time": "1:17:09", "throughput": 12231.27, "total_tokens": 14680064} |
|
{"current_steps": 8, "total_steps": 34, "loss": 1.0862, "lr": 4.347522293051648e-05, "epoch": 0.2302158273381295, "percentage": 23.53, "elapsed_time": "0:22:50", "remaining_time": "1:14:14", "throughput": 12241.38, "total_tokens": 16777216} |
|
{"current_steps": 9, "total_steps": 34, "loss": 1.0842, "lr": 4.184239109116393e-05, "epoch": 0.2589928057553957, "percentage": 26.47, "elapsed_time": "0:25:40", "remaining_time": "1:11:19", "throughput": 12249.91, "total_tokens": 18874368} |
|
{"current_steps": 10, "total_steps": 34, "loss": 1.0345, "lr": 4.0065865909481417e-05, "epoch": 0.28776978417266186, "percentage": 29.41, "elapsed_time": "0:28:31", "remaining_time": "1:08:26", "throughput": 12256.81, "total_tokens": 20971520} |
|
{"current_steps": 11, "total_steps": 34, "loss": 1.0473, "lr": 3.81608040719339e-05, "epoch": 0.31654676258992803, "percentage": 32.35, "elapsed_time": "0:31:21", "remaining_time": "1:05:33", "throughput": 12261.69, "total_tokens": 23068672} |
|
{"current_steps": 12, "total_steps": 34, "loss": 1.0355, "lr": 3.6143458894413465e-05, "epoch": 0.34532374100719426, "percentage": 35.29, "elapsed_time": "0:34:11", "remaining_time": "1:02:41", "throughput": 12266.49, "total_tokens": 25165824} |
|
{"current_steps": 13, "total_steps": 34, "loss": 1.0341, "lr": 3.403104165467883e-05, "epoch": 0.37410071942446044, "percentage": 38.24, "elapsed_time": "0:37:01", "remaining_time": "0:59:49", "throughput": 12270.2, "total_tokens": 27262976} |
|
{"current_steps": 14, "total_steps": 34, "loss": 0.9967, "lr": 3.1841574751802076e-05, "epoch": 0.4028776978417266, "percentage": 41.18, "elapsed_time": "0:39:52", "remaining_time": "0:56:57", "throughput": 12272.56, "total_tokens": 29360128} |
|
{"current_steps": 15, "total_steps": 34, "loss": 0.9901, "lr": 2.9593737945414264e-05, "epoch": 0.4316546762589928, "percentage": 44.12, "elapsed_time": "0:42:42", "remaining_time": "0:54:06", "throughput": 12275.23, "total_tokens": 31457280} |
|
{"current_steps": 16, "total_steps": 34, "loss": 0.9894, "lr": 2.7306708986582553e-05, "epoch": 0.460431654676259, "percentage": 47.06, "elapsed_time": "0:45:33", "remaining_time": "0:51:14", "throughput": 12277.3, "total_tokens": 33554432} |
|
{"current_steps": 17, "total_steps": 34, "loss": 0.9596, "lr": 2.5e-05, "epoch": 0.4892086330935252, "percentage": 50.0, "elapsed_time": "0:48:23", "remaining_time": "0:48:23", "throughput": 12279.41, "total_tokens": 35651584} |
|
{"current_steps": 18, "total_steps": 34, "loss": 0.9862, "lr": 2.2693291013417453e-05, "epoch": 0.5179856115107914, "percentage": 52.94, "elapsed_time": "0:51:13", "remaining_time": "0:45:32", "throughput": 12280.58, "total_tokens": 37748736} |
|
{"current_steps": 19, "total_steps": 34, "loss": 0.9911, "lr": 2.0406262054585738e-05, "epoch": 0.5467625899280576, "percentage": 55.88, "elapsed_time": "0:54:04", "remaining_time": "0:42:41", "throughput": 12282.58, "total_tokens": 39845888} |
|
{"current_steps": 20, "total_steps": 34, "loss": 0.95, "lr": 1.815842524819793e-05, "epoch": 0.5755395683453237, "percentage": 58.82, "elapsed_time": "0:56:54", "remaining_time": "0:39:49", "throughput": 12284.7, "total_tokens": 41943040} |
|
{"current_steps": 21, "total_steps": 34, "loss": 0.9235, "lr": 1.5968958345321178e-05, "epoch": 0.60431654676259, "percentage": 61.76, "elapsed_time": "0:59:44", "remaining_time": "0:36:59", "throughput": 12286.03, "total_tokens": 44040192} |
|
{"current_steps": 22, "total_steps": 34, "loss": 0.952, "lr": 1.3856541105586545e-05, "epoch": 0.6330935251798561, "percentage": 64.71, "elapsed_time": "1:02:34", "remaining_time": "0:34:08", "throughput": 12286.99, "total_tokens": 46137344} |
|
{"current_steps": 23, "total_steps": 34, "loss": 0.9199, "lr": 1.1839195928066102e-05, "epoch": 0.6618705035971223, "percentage": 67.65, "elapsed_time": "1:05:22", "remaining_time": "0:31:15", "throughput": 12297.96, "total_tokens": 48234496} |
|
{"current_steps": 24, "total_steps": 34, "loss": 0.9399, "lr": 9.934134090518593e-06, "epoch": 0.6906474820143885, "percentage": 70.59, "elapsed_time": "1:08:09", "remaining_time": "0:28:24", "throughput": 12307.13, "total_tokens": 50331648} |
|
{"current_steps": 25, "total_steps": 34, "loss": 0.9307, "lr": 8.15760890883607e-06, "epoch": 0.7194244604316546, "percentage": 73.53, "elapsed_time": "1:10:56", "remaining_time": "0:25:32", "throughput": 12316.17, "total_tokens": 52428800} |
|
{"current_steps": 26, "total_steps": 34, "loss": 0.9579, "lr": 6.524777069483526e-06, "epoch": 0.7482014388489209, "percentage": 76.47, "elapsed_time": "1:13:44", "remaining_time": "0:22:41", "throughput": 12324.45, "total_tokens": 54525952} |
|
{"current_steps": 27, "total_steps": 34, "loss": 0.9388, "lr": 5.049569317994013e-06, "epoch": 0.7769784172661871, "percentage": 79.41, "elapsed_time": "1:16:31", "remaining_time": "0:19:50", "throughput": 12332.52, "total_tokens": 56623104} |
|
{"current_steps": 28, "total_steps": 34, "loss": 0.9241, "lr": 3.7445716067596503e-06, "epoch": 0.8057553956834532, "percentage": 82.35, "elapsed_time": "1:19:18", "remaining_time": "0:16:59", "throughput": 12339.87, "total_tokens": 58720256} |
|
{"current_steps": 29, "total_steps": 34, "loss": 0.9275, "lr": 2.6209177161234445e-06, "epoch": 0.8345323741007195, "percentage": 85.29, "elapsed_time": "1:22:05", "remaining_time": "0:14:09", "throughput": 12347.61, "total_tokens": 60817408} |
|
{"current_steps": 30, "total_steps": 34, "loss": 0.9295, "lr": 1.6881942648911076e-06, "epoch": 0.8633093525179856, "percentage": 88.24, "elapsed_time": "1:24:52", "remaining_time": "0:11:19", "throughput": 12353.74, "total_tokens": 62914560} |
|
{"current_steps": 31, "total_steps": 34, "loss": 0.9255, "lr": 9.54358920679524e-07, "epoch": 0.8920863309352518, "percentage": 91.18, "elapsed_time": "1:27:39", "remaining_time": "0:08:29", "throughput": 12359.89, "total_tokens": 65011712} |
|
{"current_steps": 32, "total_steps": 34, "loss": 0.9277, "lr": 4.256725079024554e-07, "epoch": 0.920863309352518, "percentage": 94.12, "elapsed_time": "1:30:27", "remaining_time": "0:05:39", "throughput": 12365.08, "total_tokens": 67108864} |
|
{"current_steps": 33, "total_steps": 34, "loss": 0.9263, "lr": 1.0664559262413831e-07, "epoch": 0.9496402877697842, "percentage": 97.06, "elapsed_time": "1:33:14", "remaining_time": "0:02:49", "throughput": 12371.42, "total_tokens": 69206016} |
|
{"current_steps": 34, "total_steps": 34, "loss": 0.9213, "lr": 0.0, "epoch": 0.9784172661870504, "percentage": 100.0, "elapsed_time": "1:36:00", "remaining_time": "0:00:00", "throughput": 12377.65, "total_tokens": 71303168} |
|
{"current_steps": 34, "total_steps": 34, "epoch": 0.9784172661870504, "percentage": 100.0, "elapsed_time": "1:36:24", "remaining_time": "0:00:00", "throughput": 12325.82, "total_tokens": 71303168} |
|
|