Training in progress, epoch 7
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bfff6006913dcd8633086e0ed140900b9d9db950821138f81392f53786b3a6e
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:474b5a30cb743f0eae0b508d85dbe4cbf433d867e6e9d8f3c4f373b23de59973
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7400a178ea7d3ae67de68267e370b7429ed6e97dace4dc70ba2c753f03eed08a
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1e6c28b74202f6c4fc88f49fe2279b1e65b469a46d6f1ec6e2fb5a8cb27fffb
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -199,3 +199,34 @@
|
|
199 |
{"current_steps": 199, "total_steps": 231, "loss": 0.2609, "lr": 1.156314638334277e-06, "epoch": 6.03030303030303, "percentage": 86.15, "elapsed_time": "2:04:15", "remaining_time": "0:19:58"}
|
200 |
{"current_steps": 200, "total_steps": 231, "loss": 0.2696, "lr": 1.086492267732462e-06, "epoch": 6.0606060606060606, "percentage": 86.58, "elapsed_time": "2:04:46", "remaining_time": "0:19:20"}
|
201 |
{"current_steps": 201, "total_steps": 231, "loss": 0.26, "lr": 1.01872294636304e-06, "epoch": 6.090909090909091, "percentage": 87.01, "elapsed_time": "2:05:20", "remaining_time": "0:18:42"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
199 |
{"current_steps": 199, "total_steps": 231, "loss": 0.2609, "lr": 1.156314638334277e-06, "epoch": 6.03030303030303, "percentage": 86.15, "elapsed_time": "2:04:15", "remaining_time": "0:19:58"}
|
200 |
{"current_steps": 200, "total_steps": 231, "loss": 0.2696, "lr": 1.086492267732462e-06, "epoch": 6.0606060606060606, "percentage": 86.58, "elapsed_time": "2:04:46", "remaining_time": "0:19:20"}
|
201 |
{"current_steps": 201, "total_steps": 231, "loss": 0.26, "lr": 1.01872294636304e-06, "epoch": 6.090909090909091, "percentage": 87.01, "elapsed_time": "2:05:20", "remaining_time": "0:18:42"}
|
202 |
+
{"current_steps": 202, "total_steps": 231, "loss": 0.2666, "lr": 9.530222835413739e-07, "epoch": 6.121212121212121, "percentage": 87.45, "elapsed_time": "2:05:54", "remaining_time": "0:18:04"}
|
203 |
+
{"current_steps": 203, "total_steps": 231, "loss": 0.2667, "lr": 8.894054121084839e-07, "epoch": 6.151515151515151, "percentage": 87.88, "elapsed_time": "2:06:26", "remaining_time": "0:17:26"}
|
204 |
+
{"current_steps": 204, "total_steps": 231, "loss": 0.2599, "lr": 8.278869849454718e-07, "epoch": 6.181818181818182, "percentage": 88.31, "elapsed_time": "2:06:58", "remaining_time": "0:16:48"}
|
205 |
+
{"current_steps": 205, "total_steps": 231, "loss": 0.2711, "lr": 7.684811715985429e-07, "epoch": 6.212121212121212, "percentage": 88.74, "elapsed_time": "2:07:31", "remaining_time": "0:16:10"}
|
206 |
+
{"current_steps": 206, "total_steps": 231, "loss": 0.2664, "lr": 7.1120165501533e-07, "epoch": 6.242424242424242, "percentage": 89.18, "elapsed_time": "2:08:05", "remaining_time": "0:15:32"}
|
207 |
+
{"current_steps": 207, "total_steps": 231, "loss": 0.264, "lr": 6.560616283932897e-07, "epoch": 6.2727272727272725, "percentage": 89.61, "elapsed_time": "2:08:38", "remaining_time": "0:14:54"}
|
208 |
+
{"current_steps": 208, "total_steps": 231, "loss": 0.2642, "lr": 6.030737921409169e-07, "epoch": 6.303030303030303, "percentage": 90.04, "elapsed_time": "2:09:12", "remaining_time": "0:14:17"}
|
209 |
+
{"current_steps": 209, "total_steps": 231, "loss": 0.2721, "lr": 5.522503509524591e-07, "epoch": 6.333333333333333, "percentage": 90.48, "elapsed_time": "2:09:46", "remaining_time": "0:13:39"}
|
210 |
+
{"current_steps": 210, "total_steps": 231, "loss": 0.2639, "lr": 5.036030109968082e-07, "epoch": 6.363636363636363, "percentage": 90.91, "elapsed_time": "2:10:17", "remaining_time": "0:13:01"}
|
211 |
+
{"current_steps": 211, "total_steps": 231, "loss": 0.2586, "lr": 4.5714297722121105e-07, "epoch": 6.393939393939394, "percentage": 91.34, "elapsed_time": "2:10:52", "remaining_time": "0:12:24"}
|
212 |
+
{"current_steps": 212, "total_steps": 231, "loss": 0.2681, "lr": 4.128809507704445e-07, "epoch": 6.424242424242424, "percentage": 91.77, "elapsed_time": "2:11:25", "remaining_time": "0:11:46"}
|
213 |
+
{"current_steps": 213, "total_steps": 231, "loss": 0.2626, "lr": 3.708271265220087e-07, "epoch": 6.454545454545454, "percentage": 92.21, "elapsed_time": "2:11:59", "remaining_time": "0:11:09"}
|
214 |
+
{"current_steps": 214, "total_steps": 231, "loss": 0.2622, "lr": 3.309911907379393e-07, "epoch": 6.484848484848484, "percentage": 92.64, "elapsed_time": "2:12:34", "remaining_time": "0:10:31"}
|
215 |
+
{"current_steps": 215, "total_steps": 231, "loss": 0.2522, "lr": 2.9338231883378365e-07, "epoch": 6.515151515151516, "percentage": 93.07, "elapsed_time": "2:13:09", "remaining_time": "0:09:54"}
|
216 |
+
{"current_steps": 216, "total_steps": 231, "loss": 0.2706, "lr": 2.5800917326521013e-07, "epoch": 6.545454545454545, "percentage": 93.51, "elapsed_time": "2:13:43", "remaining_time": "0:09:17"}
|
217 |
+
{"current_steps": 217, "total_steps": 231, "loss": 0.2459, "lr": 2.248799015327907e-07, "epoch": 6.575757575757576, "percentage": 93.94, "elapsed_time": "2:14:15", "remaining_time": "0:08:39"}
|
218 |
+
{"current_steps": 218, "total_steps": 231, "loss": 0.2536, "lr": 1.9400213430538773e-07, "epoch": 6.606060606060606, "percentage": 94.37, "elapsed_time": "2:14:46", "remaining_time": "0:08:02"}
|
219 |
+
{"current_steps": 219, "total_steps": 231, "loss": 0.2689, "lr": 1.6538298366257975e-07, "epoch": 6.636363636363637, "percentage": 94.81, "elapsed_time": "2:15:19", "remaining_time": "0:07:24"}
|
220 |
+
{"current_steps": 220, "total_steps": 231, "loss": 0.2725, "lr": 1.3902904145653094e-07, "epoch": 6.666666666666667, "percentage": 95.24, "elapsed_time": "2:15:51", "remaining_time": "0:06:47"}
|
221 |
+
{"current_steps": 221, "total_steps": 231, "loss": 0.2591, "lr": 1.1494637779369766e-07, "epoch": 6.696969696969697, "percentage": 95.67, "elapsed_time": "2:16:22", "remaining_time": "0:06:10"}
|
222 |
+
{"current_steps": 222, "total_steps": 231, "loss": 0.263, "lr": 9.314053963669245e-08, "epoch": 6.7272727272727275, "percentage": 96.1, "elapsed_time": "2:16:56", "remaining_time": "0:05:33"}
|
223 |
+
{"current_steps": 223, "total_steps": 231, "loss": 0.2642, "lr": 7.361654952665608e-08, "epoch": 6.757575757575758, "percentage": 96.54, "elapsed_time": "2:17:29", "remaining_time": "0:04:55"}
|
224 |
+
{"current_steps": 224, "total_steps": 231, "loss": 0.2749, "lr": 5.637890442641403e-08, "epoch": 6.787878787878788, "percentage": 96.97, "elapsed_time": "2:18:03", "remaining_time": "0:04:18"}
|
225 |
+
{"current_steps": 225, "total_steps": 231, "loss": 0.2596, "lr": 4.143157468468717e-08, "epoch": 6.818181818181818, "percentage": 97.4, "elapsed_time": "2:18:36", "remaining_time": "0:03:41"}
|
226 |
+
{"current_steps": 226, "total_steps": 231, "loss": 0.2657, "lr": 2.8778003121607834e-08, "epoch": 6.848484848484849, "percentage": 97.84, "elapsed_time": "2:19:10", "remaining_time": "0:03:04"}
|
227 |
+
{"current_steps": 227, "total_steps": 231, "loss": 0.2626, "lr": 1.8421104235727406e-08, "epoch": 6.878787878787879, "percentage": 98.27, "elapsed_time": "2:19:42", "remaining_time": "0:02:27"}
|
228 |
+
{"current_steps": 228, "total_steps": 231, "loss": 0.2768, "lr": 1.0363263532724433e-08, "epoch": 6.909090909090909, "percentage": 98.7, "elapsed_time": "2:20:16", "remaining_time": "0:01:50"}
|
229 |
+
{"current_steps": 229, "total_steps": 231, "loss": 0.26, "lr": 4.606336975948589e-09, "epoch": 6.9393939393939394, "percentage": 99.13, "elapsed_time": "2:20:48", "remaining_time": "0:01:13"}
|
230 |
+
{"current_steps": 230, "total_steps": 231, "loss": 0.2758, "lr": 1.1516505589381777e-09, "epoch": 6.96969696969697, "percentage": 99.57, "elapsed_time": "2:21:20", "remaining_time": "0:00:36"}
|
231 |
+
{"current_steps": 231, "total_steps": 231, "loss": 0.2744, "lr": 0.0, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "2:21:55", "remaining_time": "0:00:00"}
|
232 |
+
{"current_steps": 231, "total_steps": 231, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "2:25:11", "remaining_time": "0:00:00"}
|