full-train-openai / trainer_log.jsonl
anthonymeo's picture
Upload folder using huggingface_hub
b005065 verified
raw
history blame contribute delete
No virus
10.7 kB
{"current_steps": 10, "total_steps": 486, "loss": 1.0772, "learning_rate": 2.0408163265306125e-06, "epoch": 0.06172839506172839, "percentage": 2.06, "elapsed_time": "0:01:08", "remaining_time": "0:54:44"}
{"current_steps": 20, "total_steps": 486, "loss": 0.5972, "learning_rate": 4.081632653061225e-06, "epoch": 0.12345679012345678, "percentage": 4.12, "elapsed_time": "0:02:12", "remaining_time": "0:51:37"}
{"current_steps": 30, "total_steps": 486, "loss": 0.3747, "learning_rate": 6.122448979591837e-06, "epoch": 0.18518518518518517, "percentage": 6.17, "elapsed_time": "0:03:16", "remaining_time": "0:49:50"}
{"current_steps": 40, "total_steps": 486, "loss": 0.3125, "learning_rate": 8.16326530612245e-06, "epoch": 0.24691358024691357, "percentage": 8.23, "elapsed_time": "0:04:17", "remaining_time": "0:47:51"}
{"current_steps": 50, "total_steps": 486, "loss": 0.3415, "learning_rate": 9.999870796282452e-06, "epoch": 0.30864197530864196, "percentage": 10.29, "elapsed_time": "0:05:22", "remaining_time": "0:46:56"}
{"current_steps": 60, "total_steps": 486, "loss": 0.3261, "learning_rate": 9.984374428250894e-06, "epoch": 0.37037037037037035, "percentage": 12.35, "elapsed_time": "0:06:29", "remaining_time": "0:46:08"}
{"current_steps": 70, "total_steps": 486, "loss": 0.2905, "learning_rate": 9.943129053516176e-06, "epoch": 0.43209876543209874, "percentage": 14.4, "elapsed_time": "0:07:29", "remaining_time": "0:44:33"}
{"current_steps": 80, "total_steps": 486, "loss": 0.3551, "learning_rate": 9.876347743436758e-06, "epoch": 0.49382716049382713, "percentage": 16.46, "elapsed_time": "0:08:35", "remaining_time": "0:43:36"}
{"current_steps": 90, "total_steps": 486, "loss": 0.3212, "learning_rate": 9.78437548662167e-06, "epoch": 0.5555555555555556, "percentage": 18.52, "elapsed_time": "0:09:41", "remaining_time": "0:42:36"}
{"current_steps": 100, "total_steps": 486, "loss": 0.3022, "learning_rate": 9.66768740673815e-06, "epoch": 0.6172839506172839, "percentage": 20.58, "elapsed_time": "0:10:43", "remaining_time": "0:41:25"}
{"current_steps": 100, "total_steps": 486, "eval_loss": 0.28118011355400085, "epoch": 0.6172839506172839, "percentage": 20.58, "elapsed_time": "0:11:17", "remaining_time": "0:43:35"}
{"current_steps": 110, "total_steps": 486, "loss": 0.3117, "learning_rate": 9.52688630804867e-06, "epoch": 0.6790123456790124, "percentage": 22.63, "elapsed_time": "0:12:38", "remaining_time": "0:43:14"}
{"current_steps": 120, "total_steps": 486, "loss": 0.3195, "learning_rate": 9.362699561356957e-06, "epoch": 0.7407407407407407, "percentage": 24.69, "elapsed_time": "0:13:43", "remaining_time": "0:41:52"}
{"current_steps": 130, "total_steps": 486, "loss": 0.333, "learning_rate": 9.175975346450063e-06, "epoch": 0.8024691358024691, "percentage": 26.75, "elapsed_time": "0:14:42", "remaining_time": "0:40:16"}
{"current_steps": 140, "total_steps": 486, "loss": 0.2938, "learning_rate": 8.9676782704478e-06, "epoch": 0.8641975308641975, "percentage": 28.81, "elapsed_time": "0:15:44", "remaining_time": "0:38:55"}
{"current_steps": 150, "total_steps": 486, "loss": 0.2986, "learning_rate": 8.738884384694905e-06, "epoch": 0.9259259259259259, "percentage": 30.86, "elapsed_time": "0:16:48", "remaining_time": "0:37:38"}
{"current_steps": 160, "total_steps": 486, "loss": 0.2574, "learning_rate": 8.490775625938452e-06, "epoch": 0.9876543209876543, "percentage": 32.92, "elapsed_time": "0:17:51", "remaining_time": "0:36:24"}
{"current_steps": 170, "total_steps": 486, "loss": 0.1849, "learning_rate": 8.224633710506997e-06, "epoch": 1.0493827160493827, "percentage": 34.98, "elapsed_time": "0:18:50", "remaining_time": "0:35:02"}
{"current_steps": 180, "total_steps": 486, "loss": 0.2084, "learning_rate": 7.941833513033873e-06, "epoch": 1.1111111111111112, "percentage": 37.04, "elapsed_time": "0:19:52", "remaining_time": "0:33:46"}
{"current_steps": 190, "total_steps": 486, "loss": 0.239, "learning_rate": 7.643835963929747e-06, "epoch": 1.1728395061728394, "percentage": 39.09, "elapsed_time": "0:20:59", "remaining_time": "0:32:41"}
{"current_steps": 200, "total_steps": 486, "loss": 0.2176, "learning_rate": 7.332180502295729e-06, "epoch": 1.2345679012345678, "percentage": 41.15, "elapsed_time": "0:22:02", "remaining_time": "0:31:30"}
{"current_steps": 200, "total_steps": 486, "eval_loss": 0.28219473361968994, "epoch": 1.2345679012345678, "percentage": 41.15, "elapsed_time": "0:22:35", "remaining_time": "0:32:18"}
{"current_steps": 210, "total_steps": 486, "loss": 0.2283, "learning_rate": 7.008477123264849e-06, "epoch": 1.2962962962962963, "percentage": 43.21, "elapsed_time": "0:23:59", "remaining_time": "0:31:31"}
{"current_steps": 220, "total_steps": 486, "loss": 0.1902, "learning_rate": 6.674398060854931e-06, "epoch": 1.3580246913580247, "percentage": 45.27, "elapsed_time": "0:24:56", "remaining_time": "0:30:09"}
{"current_steps": 230, "total_steps": 486, "loss": 0.2333, "learning_rate": 6.331669149298781e-06, "epoch": 1.4197530864197532, "percentage": 47.33, "elapsed_time": "0:26:03", "remaining_time": "0:29:00"}
{"current_steps": 240, "total_steps": 486, "loss": 0.2069, "learning_rate": 5.982060907478568e-06, "epoch": 1.4814814814814814, "percentage": 49.38, "elapsed_time": "0:27:10", "remaining_time": "0:27:51"}
{"current_steps": 250, "total_steps": 486, "loss": 0.2263, "learning_rate": 5.627379392521758e-06, "epoch": 1.5432098765432098, "percentage": 51.44, "elapsed_time": "0:28:13", "remaining_time": "0:26:38"}
{"current_steps": 260, "total_steps": 486, "loss": 0.2573, "learning_rate": 5.2694568698084085e-06, "epoch": 1.6049382716049383, "percentage": 53.5, "elapsed_time": "0:29:16", "remaining_time": "0:25:26"}
{"current_steps": 270, "total_steps": 486, "loss": 0.2173, "learning_rate": 4.910142347588041e-06, "epoch": 1.6666666666666665, "percentage": 55.56, "elapsed_time": "0:30:23", "remaining_time": "0:24:18"}
{"current_steps": 280, "total_steps": 486, "loss": 0.1861, "learning_rate": 4.551292025103789e-06, "epoch": 1.7283950617283952, "percentage": 57.61, "elapsed_time": "0:31:27", "remaining_time": "0:23:08"}
{"current_steps": 290, "total_steps": 486, "loss": 0.2185, "learning_rate": 4.1947597035682355e-06, "epoch": 1.7901234567901234, "percentage": 59.67, "elapsed_time": "0:32:31", "remaining_time": "0:21:58"}
{"current_steps": 300, "total_steps": 486, "loss": 0.2157, "learning_rate": 3.842387209527374e-06, "epoch": 1.8518518518518519, "percentage": 61.73, "elapsed_time": "0:33:36", "remaining_time": "0:20:50"}
{"current_steps": 300, "total_steps": 486, "eval_loss": 0.27247950434684753, "epoch": 1.8518518518518519, "percentage": 61.73, "elapsed_time": "0:34:09", "remaining_time": "0:21:10"}
{"current_steps": 310, "total_steps": 486, "loss": 0.1885, "learning_rate": 3.4959948800850253e-06, "epoch": 1.9135802469135803, "percentage": 63.79, "elapsed_time": "0:35:32", "remaining_time": "0:20:10"}
{"current_steps": 320, "total_steps": 486, "loss": 0.2, "learning_rate": 3.1573721591405405e-06, "epoch": 1.9753086419753085, "percentage": 65.84, "elapsed_time": "0:36:38", "remaining_time": "0:19:00"}
{"current_steps": 330, "total_steps": 486, "loss": 0.1642, "learning_rate": 2.8282683532191333e-06, "epoch": 2.037037037037037, "percentage": 67.9, "elapsed_time": "0:37:38", "remaining_time": "0:17:47"}
{"current_steps": 340, "total_steps": 486, "loss": 0.1336, "learning_rate": 2.5103835946496846e-06, "epoch": 2.0987654320987654, "percentage": 69.96, "elapsed_time": "0:38:34", "remaining_time": "0:16:33"}
{"current_steps": 350, "total_steps": 486, "loss": 0.103, "learning_rate": 2.205360058773764e-06, "epoch": 2.1604938271604937, "percentage": 72.02, "elapsed_time": "0:39:36", "remaining_time": "0:15:23"}
{"current_steps": 360, "total_steps": 486, "loss": 0.1322, "learning_rate": 1.914773480557304e-06, "epoch": 2.2222222222222223, "percentage": 74.07, "elapsed_time": "0:40:41", "remaining_time": "0:14:14"}
{"current_steps": 370, "total_steps": 486, "loss": 0.1179, "learning_rate": 1.6401250144296239e-06, "epoch": 2.2839506172839505, "percentage": 76.13, "elapsed_time": "0:41:49", "remaining_time": "0:13:06"}
{"current_steps": 380, "total_steps": 486, "loss": 0.1292, "learning_rate": 1.382833479401438e-06, "epoch": 2.3456790123456788, "percentage": 78.19, "elapsed_time": "0:43:01", "remaining_time": "0:12:00"}
{"current_steps": 390, "total_steps": 486, "loss": 0.1332, "learning_rate": 1.1442280295231656e-06, "epoch": 2.4074074074074074, "percentage": 80.25, "elapsed_time": "0:44:00", "remaining_time": "0:10:49"}
{"current_steps": 400, "total_steps": 486, "loss": 0.126, "learning_rate": 9.255412875475256e-07, "epoch": 2.4691358024691357, "percentage": 82.3, "elapsed_time": "0:45:01", "remaining_time": "0:09:40"}
{"current_steps": 400, "total_steps": 486, "eval_loss": 0.30315688252449036, "epoch": 2.4691358024691357, "percentage": 82.3, "elapsed_time": "0:45:35", "remaining_time": "0:09:48"}
{"current_steps": 410, "total_steps": 486, "loss": 0.1301, "learning_rate": 7.279029772675572e-07, "epoch": 2.5308641975308643, "percentage": 84.36, "elapsed_time": "0:47:00", "remaining_time": "0:08:42"}
{"current_steps": 420, "total_steps": 486, "loss": 0.1266, "learning_rate": 5.523340874250704e-07, "epoch": 2.5925925925925926, "percentage": 86.42, "elapsed_time": "0:48:05", "remaining_time": "0:07:33"}
{"current_steps": 430, "total_steps": 486, "loss": 0.1176, "learning_rate": 3.997415973384311e-07, "epoch": 2.6543209876543212, "percentage": 88.48, "elapsed_time": "0:49:05", "remaining_time": "0:06:23"}
{"current_steps": 440, "total_steps": 486, "loss": 0.1289, "learning_rate": 2.7091379149682683e-07, "epoch": 2.7160493827160495, "percentage": 90.53, "elapsed_time": "0:50:07", "remaining_time": "0:05:14"}
{"current_steps": 450, "total_steps": 486, "loss": 0.1032, "learning_rate": 1.6651618732554774e-07, "epoch": 2.7777777777777777, "percentage": 92.59, "elapsed_time": "0:51:10", "remaining_time": "0:04:05"}
{"current_steps": 460, "total_steps": 486, "loss": 0.118, "learning_rate": 8.708809715922973e-08, "epoch": 2.8395061728395063, "percentage": 94.65, "elapsed_time": "0:52:19", "remaining_time": "0:02:57"}
{"current_steps": 470, "total_steps": 486, "loss": 0.1521, "learning_rate": 3.303984218372136e-08, "epoch": 2.9012345679012346, "percentage": 96.71, "elapsed_time": "0:53:22", "remaining_time": "0:01:49"}
{"current_steps": 480, "total_steps": 486, "loss": 0.1211, "learning_rate": 4.650632739194305e-09, "epoch": 2.962962962962963, "percentage": 98.77, "elapsed_time": "0:54:21", "remaining_time": "0:00:40"}
{"current_steps": 486, "total_steps": 486, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:55:26", "remaining_time": "0:00:00"}