qwen-7b-lora-math / trainer_log.jsonl
Wuhuwill's picture
Upload LoRA weights and configs
fc4562b verified
{"current_steps": 100, "total_steps": 1686, "loss": 1.36, "lr": 2.958579881656805e-05, "epoch": 0.17777777777777778, "percentage": 5.93, "elapsed_time": "0:10:46", "remaining_time": "2:50:49"}
{"current_steps": 200, "total_steps": 1686, "loss": 1.0892, "lr": 4.9948499337185685e-05, "epoch": 0.35555555555555557, "percentage": 11.86, "elapsed_time": "0:21:32", "remaining_time": "2:40:00"}
{"current_steps": 300, "total_steps": 1686, "loss": 1.0346, "lr": 4.9085642733870516e-05, "epoch": 0.5333333333333333, "percentage": 17.79, "elapsed_time": "0:32:18", "remaining_time": "2:29:14"}
{"current_steps": 400, "total_steps": 1686, "loss": 1.0148, "lr": 4.7193504727388485e-05, "epoch": 0.7111111111111111, "percentage": 23.72, "elapsed_time": "0:43:05", "remaining_time": "2:18:32"}
{"current_steps": 500, "total_steps": 1686, "loss": 1.0175, "lr": 4.435294437904082e-05, "epoch": 0.8888888888888888, "percentage": 29.66, "elapsed_time": "0:53:52", "remaining_time": "2:07:46"}
{"current_steps": 563, "total_steps": 1686, "eval_loss": 0.9917173981666565, "epoch": 1.0, "percentage": 33.39, "elapsed_time": "1:02:35", "remaining_time": "2:04:51"}
{"current_steps": 600, "total_steps": 1686, "loss": 0.9865, "lr": 4.068535084889406e-05, "epoch": 1.0657777777777777, "percentage": 35.59, "elapsed_time": "1:06:35", "remaining_time": "2:00:32"}
{"current_steps": 700, "total_steps": 1686, "loss": 0.955, "lr": 3.634745592345962e-05, "epoch": 1.2435555555555555, "percentage": 41.52, "elapsed_time": "1:17:21", "remaining_time": "1:48:58"}
{"current_steps": 800, "total_steps": 1686, "loss": 0.9512, "lr": 3.1524636203435906e-05, "epoch": 1.4213333333333333, "percentage": 47.45, "elapsed_time": "1:28:07", "remaining_time": "1:37:36"}
{"current_steps": 900, "total_steps": 1686, "loss": 0.9495, "lr": 2.642299117736456e-05, "epoch": 1.5991111111111111, "percentage": 53.38, "elapsed_time": "1:38:54", "remaining_time": "1:26:22"}
{"current_steps": 1000, "total_steps": 1686, "loss": 0.949, "lr": 2.1260535718625273e-05, "epoch": 1.7768888888888887, "percentage": 59.31, "elapsed_time": "1:49:41", "remaining_time": "1:15:14"}
{"current_steps": 1100, "total_steps": 1686, "loss": 0.9563, "lr": 1.625788338763118e-05, "epoch": 1.9546666666666668, "percentage": 65.24, "elapsed_time": "2:00:27", "remaining_time": "1:04:10"}
{"current_steps": 1126, "total_steps": 1686, "eval_loss": 0.9714913368225098, "epoch": 2.0, "percentage": 66.79, "elapsed_time": "2:05:11", "remaining_time": "1:02:15"}
{"current_steps": 1200, "total_steps": 1686, "loss": 0.9097, "lr": 1.1628818681133966e-05, "epoch": 2.1315555555555554, "percentage": 71.17, "elapsed_time": "2:13:10", "remaining_time": "0:53:56"}
{"current_steps": 1300, "total_steps": 1686, "loss": 0.8999, "lr": 7.571161116308206e-06, "epoch": 2.3093333333333335, "percentage": 77.11, "elapsed_time": "2:23:56", "remaining_time": "0:42:44"}
{"current_steps": 1400, "total_steps": 1686, "loss": 0.8997, "lr": 4.258311565949436e-06, "epoch": 2.487111111111111, "percentage": 83.04, "elapsed_time": "2:34:42", "remaining_time": "0:31:36"}
{"current_steps": 1500, "total_steps": 1686, "loss": 0.9011, "lr": 1.8318421056443574e-06, "epoch": 2.664888888888889, "percentage": 88.97, "elapsed_time": "2:45:28", "remaining_time": "0:20:31"}
{"current_steps": 1600, "total_steps": 1686, "loss": 0.9017, "lr": 3.954460400907217e-07, "epoch": 2.8426666666666667, "percentage": 94.9, "elapsed_time": "2:56:14", "remaining_time": "0:09:28"}
{"current_steps": 1686, "total_steps": 1686, "eval_loss": 0.9726876020431519, "epoch": 2.9955555555555557, "percentage": 100.0, "elapsed_time": "3:07:29", "remaining_time": "0:00:00"}
{"current_steps": 1686, "total_steps": 1686, "epoch": 2.9955555555555557, "percentage": 100.0, "elapsed_time": "3:07:30", "remaining_time": "0:00:00"}