OfficerChul's picture
Upload folder using huggingface_hub
ac6d119 verified
{"current_steps": 10, "total_steps": 450, "loss": 2.2662, "lr": 4.000000000000001e-06, "epoch": 0.11196641007697691, "percentage": 2.22, "elapsed_time": "0:08:59", "remaining_time": "6:35:21"}
{"current_steps": 20, "total_steps": 450, "loss": 0.4943, "lr": 8.444444444444446e-06, "epoch": 0.22393282015395383, "percentage": 4.44, "elapsed_time": "0:17:54", "remaining_time": "6:25:01"}
{"current_steps": 30, "total_steps": 450, "loss": 0.3753, "lr": 1.288888888888889e-05, "epoch": 0.3358992302309307, "percentage": 6.67, "elapsed_time": "0:26:52", "remaining_time": "6:16:20"}
{"current_steps": 40, "total_steps": 450, "loss": 0.3318, "lr": 1.7333333333333336e-05, "epoch": 0.44786564030790765, "percentage": 8.89, "elapsed_time": "0:35:51", "remaining_time": "6:07:35"}
{"current_steps": 50, "total_steps": 450, "loss": 0.3098, "lr": 1.9995186678809513e-05, "epoch": 0.5598320503848845, "percentage": 11.11, "elapsed_time": "0:44:51", "remaining_time": "5:58:54"}
{"current_steps": 60, "total_steps": 450, "loss": 0.3035, "lr": 1.9941090015469614e-05, "epoch": 0.6717984604618614, "percentage": 13.33, "elapsed_time": "0:53:51", "remaining_time": "5:50:06"}
{"current_steps": 70, "total_steps": 450, "loss": 0.2911, "lr": 1.9827206467064133e-05, "epoch": 0.7837648705388384, "percentage": 15.56, "elapsed_time": "1:02:53", "remaining_time": "5:41:22"}
{"current_steps": 80, "total_steps": 450, "loss": 0.2698, "lr": 1.9654220942653223e-05, "epoch": 0.8957312806158153, "percentage": 17.78, "elapsed_time": "1:11:54", "remaining_time": "5:32:35"}
{"current_steps": 90, "total_steps": 450, "loss": 0.2482, "lr": 1.9423173797534924e-05, "epoch": 1.0, "percentage": 20.0, "elapsed_time": "1:20:18", "remaining_time": "5:21:14"}
{"current_steps": 100, "total_steps": 450, "loss": 0.2389, "lr": 1.913545457642601e-05, "epoch": 1.1119664100769768, "percentage": 22.22, "elapsed_time": "1:29:21", "remaining_time": "5:12:43"}
{"current_steps": 100, "total_steps": 450, "eval_loss": 0.2237260341644287, "epoch": 1.1119664100769768, "percentage": 22.22, "elapsed_time": "1:34:06", "remaining_time": "5:29:23"}
{"current_steps": 110, "total_steps": 450, "loss": 0.2251, "lr": 1.8792793656576544e-05, "epoch": 1.2239328201539539, "percentage": 24.44, "elapsed_time": "1:44:36", "remaining_time": "5:23:20"}
{"current_steps": 120, "total_steps": 450, "loss": 0.2189, "lr": 1.83972518410775e-05, "epoch": 1.3358992302309307, "percentage": 26.67, "elapsed_time": "1:53:40", "remaining_time": "5:12:37"}
{"current_steps": 130, "total_steps": 450, "loss": 0.2067, "lr": 1.795120796494848e-05, "epoch": 1.4478656403079078, "percentage": 28.89, "elapsed_time": "2:02:45", "remaining_time": "5:02:10"}
{"current_steps": 140, "total_steps": 450, "loss": 0.1981, "lr": 1.7457344588544018e-05, "epoch": 1.5598320503848844, "percentage": 31.11, "elapsed_time": "2:11:50", "remaining_time": "4:51:55"}
{"current_steps": 150, "total_steps": 450, "loss": 0.191, "lr": 1.691863186431996e-05, "epoch": 1.6717984604618614, "percentage": 33.33, "elapsed_time": "2:20:53", "remaining_time": "4:41:47"}
{"current_steps": 160, "total_steps": 450, "loss": 0.1914, "lr": 1.63383096739871e-05, "epoch": 1.7837648705388385, "percentage": 35.56, "elapsed_time": "2:29:58", "remaining_time": "4:31:49"}
{"current_steps": 170, "total_steps": 450, "loss": 0.1903, "lr": 1.5719868143481385e-05, "epoch": 1.8957312806158153, "percentage": 37.78, "elapsed_time": "2:39:03", "remaining_time": "4:21:59"}
{"current_steps": 180, "total_steps": 450, "loss": 0.1863, "lr": 1.5067026652935823e-05, "epoch": 2.0, "percentage": 40.0, "elapsed_time": "2:47:31", "remaining_time": "4:11:17"}
{"current_steps": 190, "total_steps": 450, "loss": 0.157, "lr": 1.4383711467890776e-05, "epoch": 2.111966410076977, "percentage": 42.22, "elapsed_time": "2:56:38", "remaining_time": "4:01:42"}
{"current_steps": 200, "total_steps": 450, "loss": 0.153, "lr": 1.3674032126270982e-05, "epoch": 2.2239328201539537, "percentage": 44.44, "elapsed_time": "3:05:44", "remaining_time": "3:52:10"}
{"current_steps": 200, "total_steps": 450, "eval_loss": 0.16935566067695618, "epoch": 2.2239328201539537, "percentage": 44.44, "elapsed_time": "3:10:32", "remaining_time": "3:58:10"}
{"current_steps": 210, "total_steps": 450, "loss": 0.1498, "lr": 1.2942256723140951e-05, "epoch": 2.3358992302309307, "percentage": 46.67, "elapsed_time": "3:21:08", "remaining_time": "3:49:52"}
{"current_steps": 220, "total_steps": 450, "loss": 0.153, "lr": 1.2192786241879033e-05, "epoch": 2.4478656403079078, "percentage": 48.89, "elapsed_time": "3:30:14", "remaining_time": "3:39:48"}
{"current_steps": 230, "total_steps": 450, "loss": 0.1444, "lr": 1.1430128086145542e-05, "epoch": 2.5598320503848844, "percentage": 51.11, "elapsed_time": "3:39:23", "remaining_time": "3:29:51"}
{"current_steps": 240, "total_steps": 450, "loss": 0.1372, "lr": 1.0658868971826785e-05, "epoch": 2.6717984604618614, "percentage": 53.33, "elapsed_time": "3:48:32", "remaining_time": "3:19:58"}
{"current_steps": 250, "total_steps": 450, "loss": 0.1441, "lr": 9.883647341986032e-06, "epoch": 2.7837648705388385, "percentage": 55.56, "elapsed_time": "3:57:40", "remaining_time": "3:10:08"}
{"current_steps": 260, "total_steps": 450, "loss": 0.1387, "lr": 9.109125470721141e-06, "epoch": 2.8957312806158155, "percentage": 57.78, "elapsed_time": "4:06:48", "remaining_time": "3:00:21"}
{"current_steps": 270, "total_steps": 450, "loss": 0.1345, "lr": 8.339961423699563e-06, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "4:15:20", "remaining_time": "2:50:13"}
{"current_steps": 280, "total_steps": 450, "loss": 0.097, "lr": 7.580781044003324e-06, "epoch": 3.111966410076977, "percentage": 62.22, "elapsed_time": "4:24:33", "remaining_time": "2:40:37"}
{"current_steps": 290, "total_steps": 450, "loss": 0.088, "lr": 6.836150131764434e-06, "epoch": 3.2239328201539537, "percentage": 64.44, "elapsed_time": "4:33:43", "remaining_time": "2:31:01"}
{"current_steps": 300, "total_steps": 450, "loss": 0.0898, "lr": 6.110546984905661e-06, "epoch": 3.3358992302309307, "percentage": 66.67, "elapsed_time": "4:42:52", "remaining_time": "2:21:26"}
{"current_steps": 300, "total_steps": 450, "eval_loss": 0.14970648288726807, "epoch": 3.3358992302309307, "percentage": 66.67, "elapsed_time": "4:47:44", "remaining_time": "2:23:52"}
{"current_steps": 310, "total_steps": 450, "loss": 0.0921, "lr": 5.4083354661298816e-06, "epoch": 3.4478656403079078, "percentage": 68.89, "elapsed_time": "4:58:26", "remaining_time": "2:14:46"}
{"current_steps": 320, "total_steps": 450, "loss": 0.0875, "lr": 4.733738758136327e-06, "epoch": 3.5598320503848844, "percentage": 71.11, "elapsed_time": "5:07:36", "remaining_time": "2:04:58"}
{"current_steps": 330, "total_steps": 450, "loss": 0.0887, "lr": 4.090813964902889e-06, "epoch": 3.6717984604618614, "percentage": 73.33, "elapsed_time": "5:16:49", "remaining_time": "1:55:12"}
{"current_steps": 340, "total_steps": 450, "loss": 0.0858, "lr": 3.483427711785449e-06, "epoch": 3.7837648705388385, "percentage": 75.56, "elapsed_time": "5:26:02", "remaining_time": "1:45:29"}
{"current_steps": 350, "total_steps": 450, "loss": 0.0852, "lr": 2.9152328911780027e-06, "epoch": 3.8957312806158155, "percentage": 77.78, "elapsed_time": "5:35:13", "remaining_time": "1:35:46"}
{"current_steps": 360, "total_steps": 450, "loss": 0.0829, "lr": 2.3896466935879957e-06, "epoch": 4.0, "percentage": 80.0, "elapsed_time": "5:43:46", "remaining_time": "1:25:56"}
{"current_steps": 370, "total_steps": 450, "loss": 0.0471, "lr": 1.9098300562505266e-06, "epoch": 4.111966410076977, "percentage": 82.22, "elapsed_time": "5:53:00", "remaining_time": "1:16:19"}
{"current_steps": 380, "total_steps": 450, "loss": 0.0424, "lr": 1.4786686528798878e-06, "epoch": 4.223932820153954, "percentage": 84.44, "elapsed_time": "6:02:14", "remaining_time": "1:06:43"}
{"current_steps": 390, "total_steps": 450, "loss": 0.0444, "lr": 1.0987555388883042e-06, "epoch": 4.335899230230931, "percentage": 86.67, "elapsed_time": "6:11:25", "remaining_time": "0:57:08"}
{"current_steps": 400, "total_steps": 450, "loss": 0.0425, "lr": 7.723755564455771e-07, "epoch": 4.447865640307907, "percentage": 88.89, "elapsed_time": "6:20:39", "remaining_time": "0:47:34"}
{"current_steps": 400, "total_steps": 450, "eval_loss": 0.16047585010528564, "epoch": 4.447865640307907, "percentage": 88.89, "elapsed_time": "6:25:29", "remaining_time": "0:48:11"}
{"current_steps": 410, "total_steps": 450, "loss": 0.0447, "lr": 5.014915931694253e-07, "epoch": 4.559832050384885, "percentage": 91.11, "elapsed_time": "6:36:13", "remaining_time": "0:38:39"}
{"current_steps": 420, "total_steps": 450, "loss": 0.0428, "lr": 2.877327770883964e-07, "epoch": 4.671798460461861, "percentage": 93.33, "elapsed_time": "6:45:23", "remaining_time": "0:28:57"}
{"current_steps": 430, "total_steps": 450, "loss": 0.0402, "lr": 1.323846788742078e-07, "epoch": 4.783764870538838, "percentage": 95.56, "elapsed_time": "6:54:34", "remaining_time": "0:19:16"}
{"current_steps": 440, "total_steps": 450, "loss": 0.0424, "lr": 3.6381580268463056e-08, "epoch": 4.8957312806158155, "percentage": 97.78, "elapsed_time": "7:03:43", "remaining_time": "0:09:37"}
{"current_steps": 450, "total_steps": 450, "loss": 0.0407, "lr": 3.008552023242572e-10, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "7:12:19", "remaining_time": "0:00:00"}
{"current_steps": 450, "total_steps": 450, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "7:13:48", "remaining_time": "0:00:00"}