Training in progress, step 246
Browse files
model-00001-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4986211280
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bdecb91c7c72093883c18ea8b0f700105bdca3189d36630b31da397e0c86ecc
|
3 |
size 4986211280
|
model-00002-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847344
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93bb3b3fdba3cc610e8d88bf5a3148eb57db1c13eedf95326014933e4bdce950
|
3 |
size 4954847344
|
model-00003-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e89222b71fe5c407f27b069718e773801f4d29775d647cdf9d119ba589deb4e
|
3 |
size 4954847392
|
model-00004-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21afd318523103f6c7041d68fa82643ce547947e8e58696aa6b6c6e19b841300
|
3 |
size 4954847392
|
model-00005-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86d076a9e29a56fcc7b097aa94cf32c7871025606917998b921522e2cfa68408
|
3 |
size 4954847392
|
model-00006-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4734533160
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a09cbff743c92d95cd3ce0b2f293a569ba045436edc6911cba2b0428ab3b31cb
|
3 |
size 4734533160
|
trainer_log.jsonl
CHANGED
@@ -200,3 +200,48 @@
|
|
200 |
{"current_steps": 200, "total_steps": 246, "loss": 0.2589, "lr": 1.075066023055527e-06, "epoch": 2.4341708542713567, "percentage": 81.3, "elapsed_time": "7:49:53", "remaining_time": "1:48:04"}
|
201 |
{"current_steps": 201, "total_steps": 246, "loss": 0.2608, "lr": 1.0314311283031531e-06, "epoch": 2.4462311557788947, "percentage": 81.71, "elapsed_time": "7:56:03", "remaining_time": "1:46:34"}
|
202 |
{"current_steps": 202, "total_steps": 246, "loss": 0.2862, "lr": 9.885981734215094e-07, "epoch": 2.4582914572864323, "percentage": 82.11, "elapsed_time": "7:58:25", "remaining_time": "1:44:12"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
200 |
{"current_steps": 200, "total_steps": 246, "loss": 0.2589, "lr": 1.075066023055527e-06, "epoch": 2.4341708542713567, "percentage": 81.3, "elapsed_time": "7:49:53", "remaining_time": "1:48:04"}
|
201 |
{"current_steps": 201, "total_steps": 246, "loss": 0.2608, "lr": 1.0314311283031531e-06, "epoch": 2.4462311557788947, "percentage": 81.71, "elapsed_time": "7:56:03", "remaining_time": "1:46:34"}
|
202 |
{"current_steps": 202, "total_steps": 246, "loss": 0.2862, "lr": 9.885981734215094e-07, "epoch": 2.4582914572864323, "percentage": 82.11, "elapsed_time": "7:58:25", "remaining_time": "1:44:12"}
|
203 |
+
{"current_steps": 203, "total_steps": 246, "loss": 0.2493, "lr": 9.465758137862264e-07, "epoch": 2.47035175879397, "percentage": 82.52, "elapsed_time": "8:00:43", "remaining_time": "1:41:49"}
|
204 |
+
{"current_steps": 204, "total_steps": 246, "loss": 0.2684, "lr": 9.053725409736752e-07, "epoch": 2.4824120603015074, "percentage": 82.93, "elapsed_time": "8:03:04", "remaining_time": "1:39:27"}
|
205 |
+
{"current_steps": 205, "total_steps": 246, "loss": 0.3274, "lr": 8.649966810450472e-07, "epoch": 2.4944723618090454, "percentage": 83.33, "elapsed_time": "8:05:16", "remaining_time": "1:37:03"}
|
206 |
+
{"current_steps": 206, "total_steps": 246, "loss": 0.2405, "lr": 8.254563928638892e-07, "epoch": 2.506532663316583, "percentage": 83.74, "elapsed_time": "8:07:41", "remaining_time": "1:34:41"}
|
207 |
+
{"current_steps": 207, "total_steps": 246, "loss": 0.2868, "lr": 7.86759666447412e-07, "epoch": 2.5185929648241205, "percentage": 84.15, "elapsed_time": "8:09:53", "remaining_time": "1:32:17"}
|
208 |
+
{"current_steps": 208, "total_steps": 246, "loss": 0.2584, "lr": 7.489143213519301e-07, "epoch": 2.530653266331658, "percentage": 84.55, "elapsed_time": "8:12:10", "remaining_time": "1:29:54"}
|
209 |
+
{"current_steps": 209, "total_steps": 246, "loss": 0.2817, "lr": 7.119280050927407e-07, "epoch": 2.542713567839196, "percentage": 84.96, "elapsed_time": "8:14:28", "remaining_time": "1:27:32"}
|
210 |
+
{"current_steps": 210, "total_steps": 246, "loss": 0.2781, "lr": 6.758081915987669e-07, "epoch": 2.5547738693467337, "percentage": 85.37, "elapsed_time": "8:17:15", "remaining_time": "1:25:14"}
|
211 |
+
{"current_steps": 211, "total_steps": 246, "loss": 0.2747, "lr": 6.405621797022848e-07, "epoch": 2.5668341708542712, "percentage": 85.77, "elapsed_time": "8:19:43", "remaining_time": "1:22:53"}
|
212 |
+
{"current_steps": 212, "total_steps": 246, "loss": 0.2506, "lr": 6.061970916640236e-07, "epoch": 2.5788944723618092, "percentage": 86.18, "elapsed_time": "8:22:09", "remaining_time": "1:20:32"}
|
213 |
+
{"current_steps": 213, "total_steps": 246, "loss": 0.2466, "lr": 5.727198717339511e-07, "epoch": 2.590954773869347, "percentage": 86.59, "elapsed_time": "8:24:37", "remaining_time": "1:18:10"}
|
214 |
+
{"current_steps": 214, "total_steps": 246, "loss": 0.2891, "lr": 5.401372847480285e-07, "epoch": 2.6030150753768844, "percentage": 86.99, "elapsed_time": "8:27:06", "remaining_time": "1:15:49"}
|
215 |
+
{"current_steps": 215, "total_steps": 246, "loss": 0.2778, "lr": 5.084559147612244e-07, "epoch": 2.6150753768844224, "percentage": 87.4, "elapsed_time": "8:29:15", "remaining_time": "1:13:25"}
|
216 |
+
{"current_steps": 216, "total_steps": 246, "loss": 0.271, "lr": 4.776821637170525e-07, "epoch": 2.62713567839196, "percentage": 87.8, "elapsed_time": "8:31:30", "remaining_time": "1:11:02"}
|
217 |
+
{"current_steps": 217, "total_steps": 246, "loss": 0.2594, "lr": 4.4782225015391754e-07, "epoch": 2.6391959798994975, "percentage": 88.21, "elapsed_time": "8:33:46", "remaining_time": "1:08:39"}
|
218 |
+
{"current_steps": 218, "total_steps": 246, "loss": 0.2789, "lr": 4.1888220794851386e-07, "epoch": 2.651256281407035, "percentage": 88.62, "elapsed_time": "8:35:59", "remaining_time": "1:06:16"}
|
219 |
+
{"current_steps": 219, "total_steps": 246, "loss": 0.2507, "lr": 3.908678850965425e-07, "epoch": 2.6633165829145726, "percentage": 89.02, "elapsed_time": "8:38:19", "remaining_time": "1:03:54"}
|
220 |
+
{"current_steps": 220, "total_steps": 246, "loss": 0.2765, "lr": 3.6378494253099307e-07, "epoch": 2.6753768844221106, "percentage": 89.43, "elapsed_time": "8:40:32", "remaining_time": "1:01:31"}
|
221 |
+
{"current_steps": 221, "total_steps": 246, "loss": 0.2909, "lr": 3.3763885297822153e-07, "epoch": 2.687437185929648, "percentage": 89.84, "elapsed_time": "8:42:39", "remaining_time": "0:59:07"}
|
222 |
+
{"current_steps": 222, "total_steps": 246, "loss": 0.2519, "lr": 3.1243489985206097e-07, "epoch": 2.6994974874371858, "percentage": 90.24, "elapsed_time": "8:44:54", "remaining_time": "0:56:44"}
|
223 |
+
{"current_steps": 223, "total_steps": 246, "loss": 0.2676, "lr": 2.8817817618618846e-07, "epoch": 2.7115577889447238, "percentage": 90.65, "elapsed_time": "8:47:11", "remaining_time": "0:54:22"}
|
224 |
+
{"current_steps": 224, "total_steps": 246, "loss": 0.2562, "lr": 2.648735836049615e-07, "epoch": 2.7236180904522613, "percentage": 91.06, "elapsed_time": "8:49:46", "remaining_time": "0:52:01"}
|
225 |
+
{"current_steps": 225, "total_steps": 246, "loss": 0.2797, "lr": 2.4252583133292927e-07, "epoch": 2.735678391959799, "percentage": 91.46, "elapsed_time": "8:52:06", "remaining_time": "0:49:39"}
|
226 |
+
{"current_steps": 226, "total_steps": 246, "loss": 0.2605, "lr": 2.2113943524323167e-07, "epoch": 2.747738693467337, "percentage": 91.87, "elapsed_time": "8:54:30", "remaining_time": "0:47:18"}
|
227 |
+
{"current_steps": 227, "total_steps": 246, "loss": 0.2635, "lr": 2.007187169450603e-07, "epoch": 2.7597989949748745, "percentage": 92.28, "elapsed_time": "8:56:55", "remaining_time": "0:44:56"}
|
228 |
+
{"current_steps": 228, "total_steps": 246, "loss": 0.2416, "lr": 1.8126780291038037e-07, "epoch": 2.771859296482412, "percentage": 92.68, "elapsed_time": "8:59:17", "remaining_time": "0:42:34"}
|
229 |
+
{"current_steps": 229, "total_steps": 246, "loss": 0.2616, "lr": 1.6279062364008446e-07, "epoch": 2.7839195979899496, "percentage": 93.09, "elapsed_time": "9:01:28", "remaining_time": "0:40:11"}
|
230 |
+
{"current_steps": 230, "total_steps": 246, "loss": 0.2287, "lr": 1.4529091286973994e-07, "epoch": 2.7959798994974876, "percentage": 93.5, "elapsed_time": "9:03:42", "remaining_time": "0:37:49"}
|
231 |
+
{"current_steps": 231, "total_steps": 246, "loss": 0.2622, "lr": 1.2877220681510927e-07, "epoch": 2.808040201005025, "percentage": 93.9, "elapsed_time": "9:05:54", "remaining_time": "0:35:26"}
|
232 |
+
{"current_steps": 232, "total_steps": 246, "loss": 0.2804, "lr": 1.1323784345757205e-07, "epoch": 2.8201005025125627, "percentage": 94.31, "elapsed_time": "9:08:09", "remaining_time": "0:33:04"}
|
233 |
+
{"current_steps": 233, "total_steps": 246, "loss": 0.2608, "lr": 9.869096186961025e-08, "epoch": 2.8321608040201003, "percentage": 94.72, "elapsed_time": "9:10:31", "remaining_time": "0:30:42"}
|
234 |
+
{"current_steps": 234, "total_steps": 246, "loss": 0.2967, "lr": 8.513450158049109e-08, "epoch": 2.8442211055276383, "percentage": 95.12, "elapsed_time": "9:12:54", "remaining_time": "0:28:21"}
|
235 |
+
{"current_steps": 235, "total_steps": 246, "loss": 0.324, "lr": 7.257120198226219e-08, "epoch": 2.856281407035176, "percentage": 95.53, "elapsed_time": "9:15:27", "remaining_time": "0:26:00"}
|
236 |
+
{"current_steps": 236, "total_steps": 246, "loss": 0.2671, "lr": 6.100360177619946e-08, "epoch": 2.8683417085427134, "percentage": 95.93, "elapsed_time": "9:17:41", "remaining_time": "0:23:37"}
|
237 |
+
{"current_steps": 237, "total_steps": 246, "loss": 0.2611, "lr": 5.0434038459801213e-08, "epoch": 2.8804020100502514, "percentage": 96.34, "elapsed_time": "9:19:54", "remaining_time": "0:21:15"}
|
238 |
+
{"current_steps": 238, "total_steps": 246, "loss": 0.2658, "lr": 4.086464785444777e-08, "epoch": 2.892462311557789, "percentage": 96.75, "elapsed_time": "9:22:16", "remaining_time": "0:18:54"}
|
239 |
+
{"current_steps": 239, "total_steps": 246, "loss": 0.2621, "lr": 3.229736367380498e-08, "epoch": 2.9045226130653266, "percentage": 97.15, "elapsed_time": "9:24:46", "remaining_time": "0:16:32"}
|
240 |
+
{"current_steps": 240, "total_steps": 246, "loss": 0.2597, "lr": 2.4733917133077378e-08, "epoch": 2.9165829145728646, "percentage": 97.56, "elapsed_time": "9:27:15", "remaining_time": "0:14:10"}
|
241 |
+
{"current_steps": 241, "total_steps": 246, "loss": 0.254, "lr": 1.8175836599173545e-08, "epoch": 2.928643216080402, "percentage": 97.97, "elapsed_time": "9:29:41", "remaining_time": "0:11:49"}
|
242 |
+
{"current_steps": 242, "total_steps": 246, "loss": 0.2697, "lr": 1.2624447281867625e-08, "epoch": 2.9407035175879397, "percentage": 98.37, "elapsed_time": "9:32:11", "remaining_time": "0:09:27"}
|
243 |
+
{"current_steps": 243, "total_steps": 246, "loss": 0.2788, "lr": 8.080870966008513e-09, "epoch": 2.9527638190954772, "percentage": 98.78, "elapsed_time": "9:34:42", "remaining_time": "0:07:05"}
|
244 |
+
{"current_steps": 244, "total_steps": 246, "loss": 0.2511, "lr": 4.546025784837316e-09, "epoch": 2.964824120603015, "percentage": 99.19, "elapsed_time": "9:36:51", "remaining_time": "0:04:43"}
|
245 |
+
{"current_steps": 245, "total_steps": 246, "loss": 0.2715, "lr": 2.0206260344590724e-09, "epoch": 2.976884422110553, "percentage": 99.59, "elapsed_time": "9:39:06", "remaining_time": "0:02:21"}
|
246 |
+
{"current_steps": 246, "total_steps": 246, "loss": 0.2695, "lr": 5.051820295032262e-10, "epoch": 2.9889447236180904, "percentage": 100.0, "elapsed_time": "9:41:19", "remaining_time": "0:00:00"}
|
247 |
+
{"current_steps": 246, "total_steps": 246, "epoch": 2.9889447236180904, "percentage": 100.0, "elapsed_time": "9:46:56", "remaining_time": "0:00:00"}
|