ryanmarten committed on
Commit
d696e69
·
verified ·
1 Parent(s): 107ada6

Training in progress, epoch 11

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69028dc3c7aedb7203d724227a2eee8c692fa235afe747923d44985189048797
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:739d3c21348213c90d0e8ecbc4332878e85e05197e8da4c99ce81f52cb4c2071
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7979a4e28a15be080868927d7d0e87806939bf95f9999b21c795abe1efcdf4a
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb531d36b1f617e593533f001d82f80374e85a44643b1f10f685191b3492dbfc
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ddc8468977bb0f8a0129dc1ef877a1384ef3a960bf53f70589944a4307065f54
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e18749951c323edc6307d8cb3c1784ff8b17b503724755d868012396f0146b2
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9454e29c9189d00de6f5ebc60b9d4a35e62015b7c74555c92f08f39213862250
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b25da2f92770d00a1a948724753e88ad269157f4d6ecb40ceaf2ad856a21566
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -105,3 +105,13 @@
105
  {"current_steps": 105, "total_steps": 117, "loss": 0.2629, "lr": 3.18825646801314e-07, "epoch": 11.050632911392405, "percentage": 89.74, "elapsed_time": "1:39:11", "remaining_time": "0:11:20"}
106
  {"current_steps": 106, "total_steps": 117, "loss": 0.2212, "lr": 2.6836308100417874e-07, "epoch": 11.151898734177216, "percentage": 90.6, "elapsed_time": "1:40:00", "remaining_time": "0:10:22"}
107
  {"current_steps": 107, "total_steps": 117, "loss": 0.2229, "lr": 2.2213597106929608e-07, "epoch": 11.253164556962025, "percentage": 91.45, "elapsed_time": "1:40:55", "remaining_time": "0:09:25"}
 
 
 
 
 
 
 
 
 
 
 
105
  {"current_steps": 105, "total_steps": 117, "loss": 0.2629, "lr": 3.18825646801314e-07, "epoch": 11.050632911392405, "percentage": 89.74, "elapsed_time": "1:39:11", "remaining_time": "0:11:20"}
106
  {"current_steps": 106, "total_steps": 117, "loss": 0.2212, "lr": 2.6836308100417874e-07, "epoch": 11.151898734177216, "percentage": 90.6, "elapsed_time": "1:40:00", "remaining_time": "0:10:22"}
107
  {"current_steps": 107, "total_steps": 117, "loss": 0.2229, "lr": 2.2213597106929608e-07, "epoch": 11.253164556962025, "percentage": 91.45, "elapsed_time": "1:40:55", "remaining_time": "0:09:25"}
108
+ {"current_steps": 108, "total_steps": 117, "loss": 0.255, "lr": 1.801856965207338e-07, "epoch": 11.354430379746836, "percentage": 92.31, "elapsed_time": "1:41:47", "remaining_time": "0:08:28"}
109
+ {"current_steps": 109, "total_steps": 117, "loss": 0.2295, "lr": 1.4254980853566248e-07, "epoch": 11.455696202531646, "percentage": 93.16, "elapsed_time": "1:42:34", "remaining_time": "0:07:31"}
110
+ {"current_steps": 110, "total_steps": 117, "loss": 0.2328, "lr": 1.0926199633097156e-07, "epoch": 11.556962025316455, "percentage": 94.02, "elapsed_time": "1:43:16", "remaining_time": "0:06:34"}
111
+ {"current_steps": 111, "total_steps": 117, "loss": 0.2236, "lr": 8.035205700685167e-08, "epoch": 11.658227848101266, "percentage": 94.87, "elapsed_time": "1:44:10", "remaining_time": "0:05:37"}
112
+ {"current_steps": 112, "total_steps": 117, "loss": 0.2559, "lr": 5.584586887435739e-08, "epoch": 11.759493670886076, "percentage": 95.73, "elapsed_time": "1:45:03", "remaining_time": "0:04:41"}
113
+ {"current_steps": 113, "total_steps": 117, "loss": 0.2409, "lr": 3.576536829081323e-08, "epoch": 11.860759493670885, "percentage": 96.58, "elapsed_time": "1:45:57", "remaining_time": "0:03:45"}
114
+ {"current_steps": 114, "total_steps": 117, "loss": 0.2435, "lr": 2.012853002380466e-08, "epoch": 11.962025316455696, "percentage": 97.44, "elapsed_time": "1:46:50", "remaining_time": "0:02:48"}
115
+ {"current_steps": 115, "total_steps": 117, "loss": 0.2131, "lr": 8.949351161324227e-09, "epoch": 12.10126582278481, "percentage": 98.29, "elapsed_time": "1:48:49", "remaining_time": "0:01:53"}
116
+ {"current_steps": 116, "total_steps": 117, "loss": 0.2441, "lr": 2.237838582483387e-09, "epoch": 12.20253164556962, "percentage": 99.15, "elapsed_time": "1:49:40", "remaining_time": "0:00:56"}
117
+ {"current_steps": 117, "total_steps": 117, "loss": 0.2293, "lr": 0.0, "epoch": 12.30379746835443, "percentage": 100.0, "elapsed_time": "1:50:29", "remaining_time": "0:00:00"}