llama3-1_8b_McEval-Instruct / trainer_log.jsonl
gsmyrnis's picture
Training in progress, epoch 1
33e1da8 verified
{"current_steps": 10, "total_steps": 120, "loss": 0.6045, "lr": 5e-06, "epoch": 0.25, "percentage": 8.33, "elapsed_time": "0:01:00", "remaining_time": "0:11:01"}
{"current_steps": 20, "total_steps": 120, "loss": 0.5281, "lr": 5e-06, "epoch": 0.5, "percentage": 16.67, "elapsed_time": "0:01:59", "remaining_time": "0:09:55"}
{"current_steps": 30, "total_steps": 120, "loss": 0.5047, "lr": 5e-06, "epoch": 0.75, "percentage": 25.0, "elapsed_time": "0:02:58", "remaining_time": "0:08:54"}
{"current_steps": 40, "total_steps": 120, "loss": 0.4873, "lr": 5e-06, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:03:57", "remaining_time": "0:07:54"}
{"current_steps": 40, "total_steps": 120, "eval_loss": 0.4834265112876892, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:04:01", "remaining_time": "0:08:03"}
{"current_steps": 50, "total_steps": 120, "loss": 0.4595, "lr": 5e-06, "epoch": 1.25, "percentage": 41.67, "elapsed_time": "0:06:28", "remaining_time": "0:09:04"}
{"current_steps": 60, "total_steps": 120, "loss": 0.4446, "lr": 5e-06, "epoch": 1.5, "percentage": 50.0, "elapsed_time": "0:07:28", "remaining_time": "0:07:28"}
{"current_steps": 70, "total_steps": 120, "loss": 0.4398, "lr": 5e-06, "epoch": 1.75, "percentage": 58.33, "elapsed_time": "0:08:28", "remaining_time": "0:06:03"}
{"current_steps": 80, "total_steps": 120, "loss": 0.433, "lr": 5e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:09:28", "remaining_time": "0:04:44"}
{"current_steps": 80, "total_steps": 120, "eval_loss": 0.45972347259521484, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:09:33", "remaining_time": "0:04:46"}
{"current_steps": 90, "total_steps": 120, "loss": 0.3955, "lr": 5e-06, "epoch": 2.25, "percentage": 75.0, "elapsed_time": "0:12:00", "remaining_time": "0:04:00"}
{"current_steps": 100, "total_steps": 120, "loss": 0.3947, "lr": 5e-06, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "0:13:00", "remaining_time": "0:02:36"}
{"current_steps": 110, "total_steps": 120, "loss": 0.3906, "lr": 5e-06, "epoch": 2.75, "percentage": 91.67, "elapsed_time": "0:14:00", "remaining_time": "0:01:16"}
{"current_steps": 120, "total_steps": 120, "loss": 0.3885, "lr": 5e-06, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:14:59", "remaining_time": "0:00:00"}
{"current_steps": 120, "total_steps": 120, "eval_loss": 0.4611949920654297, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:16:30", "remaining_time": "0:00:00"}
{"current_steps": 120, "total_steps": 120, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:18:04", "remaining_time": "0:00:00"}