sft-parse_cot / trainer_log.jsonl
YahanYu's picture
Upload folder using huggingface_hub
adfd899 verified
{"current_steps": 10, "total_steps": 450, "loss": 1.2921, "lr": 2.0000000000000003e-06, "epoch": 0.06666666666666667, "percentage": 2.22, "elapsed_time": "0:01:13", "remaining_time": "0:53:38"}
{"current_steps": 20, "total_steps": 450, "loss": 0.6134, "lr": 4.222222222222223e-06, "epoch": 0.13333333333333333, "percentage": 4.44, "elapsed_time": "0:02:17", "remaining_time": "0:49:06"}
{"current_steps": 30, "total_steps": 450, "loss": 0.3546, "lr": 6.444444444444445e-06, "epoch": 0.2, "percentage": 6.67, "elapsed_time": "0:03:23", "remaining_time": "0:47:31"}
{"current_steps": 40, "total_steps": 450, "loss": 0.3599, "lr": 8.666666666666668e-06, "epoch": 0.26666666666666666, "percentage": 8.89, "elapsed_time": "0:04:31", "remaining_time": "0:46:20"}
{"current_steps": 50, "total_steps": 450, "loss": 0.2814, "lr": 9.997593339404757e-06, "epoch": 0.3333333333333333, "percentage": 11.11, "elapsed_time": "0:05:34", "remaining_time": "0:44:35"}
{"current_steps": 60, "total_steps": 450, "loss": 0.2467, "lr": 9.970545007734807e-06, "epoch": 0.4, "percentage": 13.33, "elapsed_time": "0:06:37", "remaining_time": "0:43:02"}
{"current_steps": 70, "total_steps": 450, "loss": 0.2778, "lr": 9.913603233532067e-06, "epoch": 0.4666666666666667, "percentage": 15.56, "elapsed_time": "0:07:43", "remaining_time": "0:41:55"}
{"current_steps": 80, "total_steps": 450, "loss": 0.2439, "lr": 9.827110471326612e-06, "epoch": 0.5333333333333333, "percentage": 17.78, "elapsed_time": "0:08:46", "remaining_time": "0:40:33"}
{"current_steps": 90, "total_steps": 450, "loss": 0.2588, "lr": 9.711586898767462e-06, "epoch": 0.6, "percentage": 20.0, "elapsed_time": "0:09:48", "remaining_time": "0:39:14"}
{"current_steps": 100, "total_steps": 450, "loss": 0.2113, "lr": 9.567727288213005e-06, "epoch": 0.6666666666666666, "percentage": 22.22, "elapsed_time": "0:10:52", "remaining_time": "0:38:04"}
{"current_steps": 110, "total_steps": 450, "loss": 0.2687, "lr": 9.396396828288272e-06, "epoch": 0.7333333333333333, "percentage": 24.44, "elapsed_time": "0:11:55", "remaining_time": "0:36:51"}
{"current_steps": 120, "total_steps": 450, "loss": 0.2585, "lr": 9.19862592053875e-06, "epoch": 0.8, "percentage": 26.67, "elapsed_time": "0:13:02", "remaining_time": "0:35:51"}
{"current_steps": 130, "total_steps": 450, "loss": 0.2307, "lr": 8.97560398247424e-06, "epoch": 0.8666666666666667, "percentage": 28.89, "elapsed_time": "0:14:05", "remaining_time": "0:34:40"}
{"current_steps": 140, "total_steps": 450, "loss": 0.2262, "lr": 8.728672294272009e-06, "epoch": 0.9333333333333333, "percentage": 31.11, "elapsed_time": "0:15:08", "remaining_time": "0:33:32"}
{"current_steps": 150, "total_steps": 450, "loss": 0.2261, "lr": 8.45931593215998e-06, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:16:10", "remaining_time": "0:32:21"}
{"current_steps": 160, "total_steps": 450, "loss": 0.1765, "lr": 8.16915483699355e-06, "epoch": 1.0666666666666667, "percentage": 35.56, "elapsed_time": "0:17:14", "remaining_time": "0:31:15"}
{"current_steps": 170, "total_steps": 450, "loss": 0.1954, "lr": 7.859934071740693e-06, "epoch": 1.1333333333333333, "percentage": 37.78, "elapsed_time": "0:18:21", "remaining_time": "0:30:13"}
{"current_steps": 180, "total_steps": 450, "loss": 0.1524, "lr": 7.533513326467911e-06, "epoch": 1.2, "percentage": 40.0, "elapsed_time": "0:19:23", "remaining_time": "0:29:05"}
{"current_steps": 190, "total_steps": 450, "loss": 0.1914, "lr": 7.191855733945388e-06, "epoch": 1.2666666666666666, "percentage": 42.22, "elapsed_time": "0:20:32", "remaining_time": "0:28:07"}
{"current_steps": 200, "total_steps": 450, "loss": 0.1729, "lr": 6.837016063135491e-06, "epoch": 1.3333333333333333, "percentage": 44.44, "elapsed_time": "0:21:36", "remaining_time": "0:27:00"}
{"current_steps": 210, "total_steps": 450, "loss": 0.1771, "lr": 6.4711283615704755e-06, "epoch": 1.4, "percentage": 46.67, "elapsed_time": "0:22:38", "remaining_time": "0:25:52"}
{"current_steps": 220, "total_steps": 450, "loss": 0.1853, "lr": 6.0963931209395165e-06, "epoch": 1.4666666666666668, "percentage": 48.89, "elapsed_time": "0:23:40", "remaining_time": "0:24:45"}
{"current_steps": 230, "total_steps": 450, "loss": 0.1767, "lr": 5.715064043072771e-06, "epoch": 1.5333333333333332, "percentage": 51.11, "elapsed_time": "0:24:43", "remaining_time": "0:23:38"}
{"current_steps": 240, "total_steps": 450, "loss": 0.1463, "lr": 5.329434485913393e-06, "epoch": 1.6, "percentage": 53.33, "elapsed_time": "0:25:46", "remaining_time": "0:22:32"}
{"current_steps": 250, "total_steps": 450, "loss": 0.1258, "lr": 4.941823670993016e-06, "epoch": 1.6666666666666665, "percentage": 55.56, "elapsed_time": "0:26:49", "remaining_time": "0:21:27"}
{"current_steps": 260, "total_steps": 450, "loss": 0.1468, "lr": 4.5545627353605705e-06, "epoch": 1.7333333333333334, "percentage": 57.78, "elapsed_time": "0:27:51", "remaining_time": "0:20:21"}
{"current_steps": 270, "total_steps": 450, "loss": 0.1604, "lr": 4.1699807118497815e-06, "epoch": 1.8, "percentage": 60.0, "elapsed_time": "0:28:55", "remaining_time": "0:19:16"}
{"current_steps": 280, "total_steps": 450, "loss": 0.1535, "lr": 3.790390522001662e-06, "epoch": 1.8666666666666667, "percentage": 62.22, "elapsed_time": "0:30:00", "remaining_time": "0:18:12"}
{"current_steps": 290, "total_steps": 450, "loss": 0.1403, "lr": 3.418075065882217e-06, "epoch": 1.9333333333333333, "percentage": 64.44, "elapsed_time": "0:31:02", "remaining_time": "0:17:07"}
{"current_steps": 300, "total_steps": 450, "loss": 0.1425, "lr": 3.0552734924528304e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:32:04", "remaining_time": "0:16:02"}
{"current_steps": 310, "total_steps": 450, "loss": 0.0884, "lr": 2.7041677330649408e-06, "epoch": 2.066666666666667, "percentage": 68.89, "elapsed_time": "0:33:07", "remaining_time": "0:14:57"}
{"current_steps": 320, "total_steps": 450, "loss": 0.076, "lr": 2.3668693790681634e-06, "epoch": 2.1333333333333333, "percentage": 71.11, "elapsed_time": "0:34:10", "remaining_time": "0:13:52"}
{"current_steps": 330, "total_steps": 450, "loss": 0.0727, "lr": 2.0454069824514445e-06, "epoch": 2.2, "percentage": 73.33, "elapsed_time": "0:35:14", "remaining_time": "0:12:48"}
{"current_steps": 340, "total_steps": 450, "loss": 0.0663, "lr": 1.7417138558927244e-06, "epoch": 2.2666666666666666, "percentage": 75.56, "elapsed_time": "0:36:17", "remaining_time": "0:11:44"}
{"current_steps": 350, "total_steps": 450, "loss": 0.0729, "lr": 1.4576164455890014e-06, "epoch": 2.3333333333333335, "percentage": 77.78, "elapsed_time": "0:37:20", "remaining_time": "0:10:40"}
{"current_steps": 360, "total_steps": 450, "loss": 0.0767, "lr": 1.1948233467939978e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "0:38:22", "remaining_time": "0:09:35"}
{"current_steps": 370, "total_steps": 450, "loss": 0.0578, "lr": 9.549150281252633e-07, "epoch": 2.466666666666667, "percentage": 82.22, "elapsed_time": "0:39:24", "remaining_time": "0:08:31"}
{"current_steps": 380, "total_steps": 450, "loss": 0.0667, "lr": 7.393343264399439e-07, "epoch": 2.533333333333333, "percentage": 84.44, "elapsed_time": "0:40:26", "remaining_time": "0:07:27"}
{"current_steps": 390, "total_steps": 450, "loss": 0.0655, "lr": 5.493777694441521e-07, "epoch": 2.6, "percentage": 86.67, "elapsed_time": "0:41:29", "remaining_time": "0:06:23"}
{"current_steps": 400, "total_steps": 450, "loss": 0.0685, "lr": 3.8618777822278854e-07, "epoch": 2.6666666666666665, "percentage": 88.89, "elapsed_time": "0:42:35", "remaining_time": "0:05:19"}
{"current_steps": 410, "total_steps": 450, "loss": 0.0843, "lr": 2.5074579658471266e-07, "epoch": 2.7333333333333334, "percentage": 91.11, "elapsed_time": "0:43:39", "remaining_time": "0:04:15"}
{"current_steps": 420, "total_steps": 450, "loss": 0.0662, "lr": 1.438663885441982e-07, "epoch": 2.8, "percentage": 93.33, "elapsed_time": "0:44:43", "remaining_time": "0:03:11"}
{"current_steps": 430, "total_steps": 450, "loss": 0.0714, "lr": 6.61923394371039e-08, "epoch": 2.8666666666666667, "percentage": 95.56, "elapsed_time": "0:45:46", "remaining_time": "0:02:07"}
{"current_steps": 440, "total_steps": 450, "loss": 0.0702, "lr": 1.8190790134231528e-08, "epoch": 2.9333333333333336, "percentage": 97.78, "elapsed_time": "0:46:48", "remaining_time": "0:01:03"}
{"current_steps": 450, "total_steps": 450, "loss": 0.0722, "lr": 1.504276011621286e-10, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:47:51", "remaining_time": "0:00:00"}
{"current_steps": 450, "total_steps": 450, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:52:09", "remaining_time": "0:00:00"}