llama-3-86-lora-pretrain_v2 / trainer_log.jsonl
ytcheng's picture
Training in progress, step 500
b94a7c5 verified
{"current_steps": 10, "total_steps": 1596, "loss": 3.1063, "learning_rate": 2.0000000000000003e-06, "epoch": 0.018774935461159353, "percentage": 0.63, "elapsed_time": "0:00:59", "remaining_time": "2:36:11"}
{"current_steps": 20, "total_steps": 1596, "loss": 3.0935, "learning_rate": 4.000000000000001e-06, "epoch": 0.03754987092231871, "percentage": 1.25, "elapsed_time": "0:01:59", "remaining_time": "2:37:09"}
{"current_steps": 30, "total_steps": 1596, "loss": 3.0475, "learning_rate": 6e-06, "epoch": 0.05632480638347806, "percentage": 1.88, "elapsed_time": "0:03:00", "remaining_time": "2:37:21"}
{"current_steps": 40, "total_steps": 1596, "loss": 3.0609, "learning_rate": 8.000000000000001e-06, "epoch": 0.07509974184463741, "percentage": 2.51, "elapsed_time": "0:04:02", "remaining_time": "2:37:02"}
{"current_steps": 50, "total_steps": 1596, "loss": 3.026, "learning_rate": 1e-05, "epoch": 0.09387467730579677, "percentage": 3.13, "elapsed_time": "0:05:03", "remaining_time": "2:36:28"}
{"current_steps": 60, "total_steps": 1596, "loss": 3.0134, "learning_rate": 1.2e-05, "epoch": 0.11264961276695612, "percentage": 3.76, "elapsed_time": "0:06:04", "remaining_time": "2:35:41"}
{"current_steps": 70, "total_steps": 1596, "loss": 2.9549, "learning_rate": 1.4000000000000001e-05, "epoch": 0.13142454822811547, "percentage": 4.39, "elapsed_time": "0:07:06", "remaining_time": "2:34:50"}
{"current_steps": 80, "total_steps": 1596, "loss": 2.9301, "learning_rate": 1.6000000000000003e-05, "epoch": 0.15019948368927483, "percentage": 5.01, "elapsed_time": "0:08:07", "remaining_time": "2:33:55"}
{"current_steps": 90, "total_steps": 1596, "loss": 2.9109, "learning_rate": 1.8e-05, "epoch": 0.16897441915043418, "percentage": 5.64, "elapsed_time": "0:09:08", "remaining_time": "2:32:59"}
{"current_steps": 100, "total_steps": 1596, "loss": 2.8142, "learning_rate": 2e-05, "epoch": 0.18774935461159353, "percentage": 6.27, "elapsed_time": "0:10:09", "remaining_time": "2:32:02"}
{"current_steps": 100, "total_steps": 1596, "eval_loss": 2.856565237045288, "epoch": 0.18774935461159353, "percentage": 6.27, "elapsed_time": "0:12:05", "remaining_time": "3:00:51"}