qwen3-8B-sft-mix-v20250921_05 / trainer_log.jsonl
rulins's picture
Upload folder using huggingface_hub
0ca93ec verified
{"current_steps": 5, "total_steps": 315, "loss": 1.5771, "lr": 5e-06, "epoch": 0.08, "percentage": 1.59, "elapsed_time": "0:08:56", "remaining_time": "9:14:35"}
{"current_steps": 10, "total_steps": 315, "loss": 1.3507, "lr": 1.125e-05, "epoch": 0.16, "percentage": 3.17, "elapsed_time": "0:16:49", "remaining_time": "8:33:00"}
{"current_steps": 15, "total_steps": 315, "loss": 1.1892, "lr": 1.7500000000000002e-05, "epoch": 0.24, "percentage": 4.76, "elapsed_time": "0:24:52", "remaining_time": "8:17:29"}
{"current_steps": 20, "total_steps": 315, "loss": 1.0968, "lr": 2.375e-05, "epoch": 0.32, "percentage": 6.35, "elapsed_time": "0:32:55", "remaining_time": "8:05:39"}
{"current_steps": 25, "total_steps": 315, "loss": 1.0402, "lr": 3.0000000000000004e-05, "epoch": 0.4, "percentage": 7.94, "elapsed_time": "0:40:58", "remaining_time": "7:55:13"}
{"current_steps": 30, "total_steps": 315, "loss": 1.009, "lr": 3.625e-05, "epoch": 0.48, "percentage": 9.52, "elapsed_time": "0:48:39", "remaining_time": "7:42:16"}
{"current_steps": 35, "total_steps": 315, "loss": 0.9836, "lr": 3.9995070884147604e-05, "epoch": 0.56, "percentage": 11.11, "elapsed_time": "0:56:16", "remaining_time": "7:30:15"}
{"current_steps": 40, "total_steps": 315, "loss": 0.9736, "lr": 3.9939646229673775e-05, "epoch": 0.64, "percentage": 12.7, "elapsed_time": "1:04:25", "remaining_time": "7:22:57"}
{"current_steps": 45, "total_steps": 315, "loss": 0.9654, "lr": 3.98228068051382e-05, "epoch": 0.72, "percentage": 14.29, "elapsed_time": "1:12:29", "remaining_time": "7:14:59"}
{"current_steps": 50, "total_steps": 315, "loss": 0.9757, "lr": 3.964491247983392e-05, "epoch": 0.8, "percentage": 15.87, "elapsed_time": "1:20:07", "remaining_time": "7:04:37"}
{"current_steps": 55, "total_steps": 315, "loss": 0.9615, "lr": 3.940651117416824e-05, "epoch": 0.88, "percentage": 17.46, "elapsed_time": "1:28:04", "remaining_time": "6:56:20"}
{"current_steps": 60, "total_steps": 315, "loss": 0.9429, "lr": 3.9108337172049794e-05, "epoch": 0.96, "percentage": 19.05, "elapsed_time": "1:35:53", "remaining_time": "6:47:32"}
{"current_steps": 65, "total_steps": 315, "loss": 0.8927, "lr": 3.875130885926973e-05, "epoch": 1.032, "percentage": 20.63, "elapsed_time": "1:43:56", "remaining_time": "6:39:46"}
{"current_steps": 70, "total_steps": 315, "loss": 0.8357, "lr": 3.83365258948432e-05, "epoch": 1.112, "percentage": 22.22, "elapsed_time": "1:51:59", "remaining_time": "6:31:58"}
{"current_steps": 75, "total_steps": 315, "loss": 0.8072, "lr": 3.786526582402313e-05, "epoch": 1.192, "percentage": 23.81, "elapsed_time": "1:59:37", "remaining_time": "6:22:47"}
{"current_steps": 80, "total_steps": 315, "loss": 0.8157, "lr": 3.733898014341858e-05, "epoch": 1.272, "percentage": 25.4, "elapsed_time": "2:07:10", "remaining_time": "6:13:34"}
{"current_steps": 85, "total_steps": 315, "loss": 0.8038, "lr": 3.6759289830337246e-05, "epoch": 1.3519999999999999, "percentage": 26.98, "elapsed_time": "2:15:02", "remaining_time": "6:05:23"}
{"current_steps": 90, "total_steps": 315, "loss": 0.7911, "lr": 3.612798035012161e-05, "epoch": 1.432, "percentage": 28.57, "elapsed_time": "2:22:38", "remaining_time": "5:56:37"}