Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3154eb3b3d19d9bb62568b8cd4d9c0414156d33d331afd8b663819b7e812a1c1
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8421d261ca4e3211025e9ebe0ea9321ee3208413b3bdc1039253d12be6b01947
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66f88371331c7ae4de63e3ccf23f1013ba8fab55df8010d2bf0fa0d038c2314e
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:113b91bc01a9471bdf479068fd8968294aecea8ad86445e1cf860975005fc90d
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -64,3 +64,36 @@
|
|
64 |
{"current_steps": 64, "total_steps": 224, "loss": 0.4782, "lr": 1.8016043638794975e-05, "epoch": 1.9518987341772152, "percentage": 28.57, "elapsed_time": "2:37:22", "remaining_time": "6:33:27"}
|
65 |
{"current_steps": 65, "total_steps": 224, "loss": 0.4688, "lr": 1.7921624734111292e-05, "epoch": 1.9822784810126581, "percentage": 29.02, "elapsed_time": "2:39:52", "remaining_time": "6:31:05"}
|
66 |
{"current_steps": 66, "total_steps": 224, "loss": 0.4474, "lr": 1.7825270686467567e-05, "epoch": 2.020253164556962, "percentage": 29.46, "elapsed_time": "2:43:07", "remaining_time": "6:30:30"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
64 |
{"current_steps": 64, "total_steps": 224, "loss": 0.4782, "lr": 1.8016043638794975e-05, "epoch": 1.9518987341772152, "percentage": 28.57, "elapsed_time": "2:37:22", "remaining_time": "6:33:27"}
|
65 |
{"current_steps": 65, "total_steps": 224, "loss": 0.4688, "lr": 1.7921624734111292e-05, "epoch": 1.9822784810126581, "percentage": 29.02, "elapsed_time": "2:39:52", "remaining_time": "6:31:05"}
|
66 |
{"current_steps": 66, "total_steps": 224, "loss": 0.4474, "lr": 1.7825270686467567e-05, "epoch": 2.020253164556962, "percentage": 29.46, "elapsed_time": "2:43:07", "remaining_time": "6:30:30"}
|
67 |
+
{"current_steps": 67, "total_steps": 224, "loss": 0.4178, "lr": 1.7727005033820117e-05, "epoch": 2.050632911392405, "percentage": 29.91, "elapsed_time": "2:45:28", "remaining_time": "6:27:45"}
|
68 |
+
{"current_steps": 68, "total_steps": 224, "loss": 0.4287, "lr": 1.762685178110382e-05, "epoch": 2.081012658227848, "percentage": 30.36, "elapsed_time": "2:47:51", "remaining_time": "6:25:04"}
|
69 |
+
{"current_steps": 69, "total_steps": 224, "loss": 0.3979, "lr": 1.752483539436807e-05, "epoch": 2.1113924050632913, "percentage": 30.8, "elapsed_time": "2:50:15", "remaining_time": "6:22:27"}
|
70 |
+
{"current_steps": 70, "total_steps": 224, "loss": 0.4105, "lr": 1.7420980794800013e-05, "epoch": 2.141772151898734, "percentage": 31.25, "elapsed_time": "2:52:42", "remaining_time": "6:19:57"}
|
71 |
+
{"current_steps": 71, "total_steps": 224, "loss": 0.4061, "lr": 1.731531335263669e-05, "epoch": 2.1721518987341772, "percentage": 31.7, "elapsed_time": "2:55:02", "remaining_time": "6:17:12"}
|
72 |
+
{"current_steps": 72, "total_steps": 224, "loss": 0.4174, "lr": 1.720785888096743e-05, "epoch": 2.2025316455696204, "percentage": 32.14, "elapsed_time": "2:57:30", "remaining_time": "6:14:44"}
|
73 |
+
{"current_steps": 73, "total_steps": 224, "loss": 0.4163, "lr": 1.7098643629428035e-05, "epoch": 2.232911392405063, "percentage": 32.59, "elapsed_time": "3:00:08", "remaining_time": "6:12:38"}
|
74 |
+
{"current_steps": 74, "total_steps": 224, "loss": 0.3913, "lr": 1.698769427778842e-05, "epoch": 2.2632911392405064, "percentage": 33.04, "elapsed_time": "3:02:34", "remaining_time": "6:10:04"}
|
75 |
+
{"current_steps": 75, "total_steps": 224, "loss": 0.4204, "lr": 1.687503792943506e-05, "epoch": 2.293670886075949, "percentage": 33.48, "elapsed_time": "3:05:06", "remaining_time": "6:07:44"}
|
76 |
+
{"current_steps": 76, "total_steps": 224, "loss": 0.3909, "lr": 1.6760702104750046e-05, "epoch": 2.3240506329113924, "percentage": 33.93, "elapsed_time": "3:07:21", "remaining_time": "6:04:50"}
|
77 |
+
{"current_steps": 77, "total_steps": 224, "loss": 0.4006, "lr": 1.664471473438822e-05, "epoch": 2.3544303797468356, "percentage": 34.38, "elapsed_time": "3:09:52", "remaining_time": "6:02:29"}
|
78 |
+
{"current_steps": 78, "total_steps": 224, "loss": 0.4245, "lr": 1.6527104152454096e-05, "epoch": 2.3848101265822783, "percentage": 34.82, "elapsed_time": "3:12:34", "remaining_time": "6:00:27"}
|
79 |
+
{"current_steps": 79, "total_steps": 224, "loss": 0.4257, "lr": 1.6407899089580263e-05, "epoch": 2.4151898734177215, "percentage": 35.27, "elapsed_time": "3:14:54", "remaining_time": "5:57:44"}
|
80 |
+
{"current_steps": 80, "total_steps": 224, "loss": 0.4176, "lr": 1.628712866590885e-05, "epoch": 2.4455696202531647, "percentage": 35.71, "elapsed_time": "3:17:29", "remaining_time": "5:55:28"}
|
81 |
+
{"current_steps": 81, "total_steps": 224, "loss": 0.4061, "lr": 1.6164822383977912e-05, "epoch": 2.4759493670886075, "percentage": 36.16, "elapsed_time": "3:19:55", "remaining_time": "5:52:57"}
|
82 |
+
{"current_steps": 82, "total_steps": 224, "loss": 0.4037, "lr": 1.604101012151436e-05, "epoch": 2.5063291139240507, "percentage": 36.61, "elapsed_time": "3:22:17", "remaining_time": "5:50:17"}
|
83 |
+
{"current_steps": 83, "total_steps": 224, "loss": 0.4074, "lr": 1.5915722124135227e-05, "epoch": 2.536708860759494, "percentage": 37.05, "elapsed_time": "3:24:38", "remaining_time": "5:47:37"}
|
84 |
+
{"current_steps": 84, "total_steps": 224, "loss": 0.4198, "lr": 1.5788988997959115e-05, "epoch": 2.5670886075949366, "percentage": 37.5, "elapsed_time": "3:27:12", "remaining_time": "5:45:20"}
|
85 |
+
{"current_steps": 85, "total_steps": 224, "loss": 0.4224, "lr": 1.5660841702129533e-05, "epoch": 2.59746835443038, "percentage": 37.95, "elapsed_time": "3:29:40", "remaining_time": "5:42:52"}
|
86 |
+
{"current_steps": 86, "total_steps": 224, "loss": 0.3984, "lr": 1.5531311541251995e-05, "epoch": 2.6278481012658226, "percentage": 38.39, "elapsed_time": "3:32:11", "remaining_time": "5:40:29"}
|
87 |
+
{"current_steps": 87, "total_steps": 224, "loss": 0.3933, "lr": 1.540043015774676e-05, "epoch": 2.6582278481012658, "percentage": 38.84, "elapsed_time": "3:34:48", "remaining_time": "5:38:16"}
|
88 |
+
{"current_steps": 88, "total_steps": 224, "loss": 0.4038, "lr": 1.5268229524119007e-05, "epoch": 2.688607594936709, "percentage": 39.29, "elapsed_time": "3:37:13", "remaining_time": "5:35:42"}
|
89 |
+
{"current_steps": 89, "total_steps": 224, "loss": 0.4069, "lr": 1.513474193514842e-05, "epoch": 2.7189873417721517, "percentage": 39.73, "elapsed_time": "3:39:42", "remaining_time": "5:33:16"}
|
90 |
+
{"current_steps": 90, "total_steps": 224, "loss": 0.3885, "lr": 1.5000000000000002e-05, "epoch": 2.749367088607595, "percentage": 40.18, "elapsed_time": "3:42:07", "remaining_time": "5:30:43"}
|
91 |
+
{"current_steps": 91, "total_steps": 224, "loss": 0.4182, "lr": 1.4864036634258112e-05, "epoch": 2.779746835443038, "percentage": 40.62, "elapsed_time": "3:44:37", "remaining_time": "5:28:18"}
|
92 |
+
{"current_steps": 92, "total_steps": 224, "loss": 0.4062, "lr": 1.4726885051885654e-05, "epoch": 2.810126582278481, "percentage": 41.07, "elapsed_time": "3:46:51", "remaining_time": "5:25:29"}
|
93 |
+
{"current_steps": 93, "total_steps": 224, "loss": 0.41, "lr": 1.4588578757110359e-05, "epoch": 2.840506329113924, "percentage": 41.52, "elapsed_time": "3:49:18", "remaining_time": "5:22:59"}
|
94 |
+
{"current_steps": 94, "total_steps": 224, "loss": 0.4064, "lr": 1.4449151536240167e-05, "epoch": 2.8708860759493673, "percentage": 41.96, "elapsed_time": "3:51:47", "remaining_time": "5:20:33"}
|
95 |
+
{"current_steps": 95, "total_steps": 224, "loss": 0.3911, "lr": 1.4308637449409705e-05, "epoch": 2.90126582278481, "percentage": 42.41, "elapsed_time": "3:54:12", "remaining_time": "5:18:02"}
|
96 |
+
{"current_steps": 96, "total_steps": 224, "loss": 0.4108, "lr": 1.4167070822259868e-05, "epoch": 2.9316455696202532, "percentage": 42.86, "elapsed_time": "3:56:46", "remaining_time": "5:15:41"}
|
97 |
+
{"current_steps": 97, "total_steps": 224, "loss": 0.4131, "lr": 1.402448623755254e-05, "epoch": 2.962025316455696, "percentage": 43.3, "elapsed_time": "3:59:19", "remaining_time": "5:13:20"}
|
98 |
+
{"current_steps": 98, "total_steps": 224, "loss": 0.4051, "lr": 1.3880918526722497e-05, "epoch": 2.992405063291139, "percentage": 43.75, "elapsed_time": "4:01:54", "remaining_time": "5:11:01"}
|
99 |
+
{"current_steps": 99, "total_steps": 224, "loss": 0.3711, "lr": 1.3736402761368597e-05, "epoch": 3.030379746835443, "percentage": 44.2, "elapsed_time": "4:05:11", "remaining_time": "5:09:35"}
|