seed_math_open2math / trainer_log.jsonl
sedrickkeh's picture
Training in progress, epoch 2
28f00b4 verified
{"current_steps": 10, "total_steps": 96, "loss": 0.6144, "lr": 5e-06, "epoch": 0.3065134099616858, "percentage": 10.42, "elapsed_time": "0:09:45", "remaining_time": "1:23:51"}
{"current_steps": 20, "total_steps": 96, "loss": 0.5117, "lr": 5e-06, "epoch": 0.6130268199233716, "percentage": 20.83, "elapsed_time": "0:19:24", "remaining_time": "1:13:46"}
{"current_steps": 30, "total_steps": 96, "loss": 0.4837, "lr": 5e-06, "epoch": 0.9195402298850575, "percentage": 31.25, "elapsed_time": "0:29:04", "remaining_time": "1:03:57"}
{"current_steps": 32, "total_steps": 96, "eval_loss": 0.45525598526000977, "epoch": 0.9808429118773946, "percentage": 33.33, "elapsed_time": "0:31:50", "remaining_time": "1:03:41"}
{"current_steps": 40, "total_steps": 96, "loss": 0.4907, "lr": 5e-06, "epoch": 1.2375478927203065, "percentage": 41.67, "elapsed_time": "0:40:30", "remaining_time": "0:56:42"}
{"current_steps": 50, "total_steps": 96, "loss": 0.4442, "lr": 5e-06, "epoch": 1.5440613026819925, "percentage": 52.08, "elapsed_time": "0:50:12", "remaining_time": "0:46:11"}
{"current_steps": 60, "total_steps": 96, "loss": 0.4322, "lr": 5e-06, "epoch": 1.8505747126436782, "percentage": 62.5, "elapsed_time": "0:59:53", "remaining_time": "0:35:55"}
{"current_steps": 64, "total_steps": 96, "eval_loss": 0.4297981858253479, "epoch": 1.9731800766283525, "percentage": 66.67, "elapsed_time": "1:04:49", "remaining_time": "0:32:24"}
{"current_steps": 70, "total_steps": 96, "loss": 0.4571, "lr": 5e-06, "epoch": 2.1685823754789273, "percentage": 72.92, "elapsed_time": "1:11:22", "remaining_time": "0:26:30"}
{"current_steps": 80, "total_steps": 96, "loss": 0.4056, "lr": 5e-06, "epoch": 2.475095785440613, "percentage": 83.33, "elapsed_time": "1:21:02", "remaining_time": "0:16:12"}
{"current_steps": 90, "total_steps": 96, "loss": 0.4044, "lr": 5e-06, "epoch": 2.781609195402299, "percentage": 93.75, "elapsed_time": "1:30:41", "remaining_time": "0:06:02"}
{"current_steps": 96, "total_steps": 96, "eval_loss": 0.4229108989238739, "epoch": 2.9655172413793105, "percentage": 100.0, "elapsed_time": "1:38:17", "remaining_time": "0:00:00"}
{"current_steps": 96, "total_steps": 96, "epoch": 2.9655172413793105, "percentage": 100.0, "elapsed_time": "1:39:33", "remaining_time": "0:00:00"}