yuzhounie commited on
Commit
a9900e7
·
verified ·
1 Parent(s): df2fe51

Training in progress, step 20

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fc19435d964ece00dc5ecddecc6e9659ddeb5d628400682a47b36750f1c82a3
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ebea22ec9da3338da121f04cf932e6c0c24c689408609a61b15386e8725a8c5
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d81da1fa8c36103e482a541ff95c4e867538c24e46bba3e99a34a3dfdf58ea61
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39c8862e00f8a4cb27f3d78a118576b57853595398adc69ab4730c25258c530c
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b4a494933112df9c624f87d536954a3280178756e5122dcbf85e65796277728
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:232026012fce69db864c46c3d0d5ce03f3bef49826b5c2d04faca4a782046b7f
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8e23c7a39bc2fabfa11b06e0899ff21ded71385791371dd14ced0766c8d96d6
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7c62f24c56cef516d3ec6ea23d1670387ebd41d79e355b9679607e49abfd3cb
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -1,8 +1,20 @@
1
- {"current_steps": 1, "total_steps": 3, "loss": 0.7883, "lr": 0.0, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:00:29", "remaining_time": "0:00:58"}
2
- {"current_steps": 2, "total_steps": 3, "loss": 0.7883, "lr": 1e-05, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:00:55", "remaining_time": "0:00:27"}
3
- {"current_steps": 3, "total_steps": 3, "loss": 0.4374, "lr": 5e-06, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:01:22", "remaining_time": "0:00:00"}
4
- {"current_steps": 3, "total_steps": 3, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:02:23", "remaining_time": "0:00:00"}
5
- {"current_steps": 4, "total_steps": 6, "loss": 0.4374, "lr": 0.0, "epoch": 4.0, "percentage": 66.67, "elapsed_time": "0:00:29", "remaining_time": "0:00:14"}
6
- {"current_steps": 5, "total_steps": 6, "loss": 0.4374, "lr": 3.4549150281252635e-06, "epoch": 5.0, "percentage": 83.33, "elapsed_time": "0:00:56", "remaining_time": "0:00:11"}
7
- {"current_steps": 6, "total_steps": 6, "loss": 0.3766, "lr": 9.549150281252633e-07, "epoch": 6.0, "percentage": 100.0, "elapsed_time": "0:01:20", "remaining_time": "0:00:00"}
8
- {"current_steps": 6, "total_steps": 6, "epoch": 6.0, "percentage": 100.0, "elapsed_time": "0:02:45", "remaining_time": "0:00:00"}
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"current_steps": 1, "total_steps": 66, "loss": 0.4801, "lr": 0.0, "epoch": 0.08695652173913043, "percentage": 1.52, "elapsed_time": "0:02:44", "remaining_time": "2:58:05"}
2
+ {"current_steps": 2, "total_steps": 66, "loss": 0.4322, "lr": 1.4285714285714286e-06, "epoch": 0.17391304347826086, "percentage": 3.03, "elapsed_time": "0:07:04", "remaining_time": "3:46:33"}
3
+ {"current_steps": 3, "total_steps": 66, "loss": 0.4776, "lr": 2.8571428571428573e-06, "epoch": 0.2608695652173913, "percentage": 4.55, "elapsed_time": "0:10:54", "remaining_time": "3:49:11"}
4
+ {"current_steps": 4, "total_steps": 66, "loss": 0.3783, "lr": 4.2857142857142855e-06, "epoch": 0.34782608695652173, "percentage": 6.06, "elapsed_time": "0:14:55", "remaining_time": "3:51:27"}
5
+ {"current_steps": 5, "total_steps": 66, "loss": 0.3406, "lr": 5.7142857142857145e-06, "epoch": 0.43478260869565216, "percentage": 7.58, "elapsed_time": "0:18:09", "remaining_time": "3:41:37"}
6
+ {"current_steps": 6, "total_steps": 66, "loss": 0.351, "lr": 7.1428571428571436e-06, "epoch": 0.5217391304347826, "percentage": 9.09, "elapsed_time": "0:21:32", "remaining_time": "3:35:26"}
7
+ {"current_steps": 7, "total_steps": 66, "loss": 0.2918, "lr": 8.571428571428571e-06, "epoch": 0.6086956521739131, "percentage": 10.61, "elapsed_time": "0:25:17", "remaining_time": "3:33:09"}
8
+ {"current_steps": 8, "total_steps": 66, "loss": 0.2901, "lr": 1e-05, "epoch": 0.6956521739130435, "percentage": 12.12, "elapsed_time": "0:29:20", "remaining_time": "3:32:45"}
9
+ {"current_steps": 9, "total_steps": 66, "loss": 0.2935, "lr": 9.99291347838381e-06, "epoch": 0.782608695652174, "percentage": 13.64, "elapsed_time": "0:32:26", "remaining_time": "3:25:26"}
10
+ {"current_steps": 10, "total_steps": 66, "loss": 0.3237, "lr": 9.971674001050687e-06, "epoch": 0.8695652173913043, "percentage": 15.15, "elapsed_time": "0:34:19", "remaining_time": "3:12:12"}
11
+ {"current_steps": 11, "total_steps": 66, "loss": 0.2695, "lr": 9.936341773606723e-06, "epoch": 0.9565217391304348, "percentage": 16.67, "elapsed_time": "0:37:14", "remaining_time": "3:06:11"}
12
+ {"current_steps": 12, "total_steps": 66, "loss": 0.3371, "lr": 9.887016949089334e-06, "epoch": 1.0, "percentage": 18.18, "elapsed_time": "0:38:23", "remaining_time": "2:52:44"}
13
+ {"current_steps": 13, "total_steps": 66, "loss": 0.2463, "lr": 9.823839344072582e-06, "epoch": 1.0869565217391304, "percentage": 19.7, "elapsed_time": "0:42:43", "remaining_time": "2:54:09"}
14
+ {"current_steps": 14, "total_steps": 66, "loss": 0.228, "lr": 9.746988042341907e-06, "epoch": 1.1739130434782608, "percentage": 21.21, "elapsed_time": "0:44:40", "remaining_time": "2:45:54"}
15
+ {"current_steps": 15, "total_steps": 66, "loss": 0.2262, "lr": 9.656680887261693e-06, "epoch": 1.2608695652173914, "percentage": 22.73, "elapsed_time": "0:47:49", "remaining_time": "2:42:37"}
16
+ {"current_steps": 16, "total_steps": 66, "loss": 0.2012, "lr": 9.553173864274567e-06, "epoch": 1.3478260869565217, "percentage": 24.24, "elapsed_time": "0:50:38", "remaining_time": "2:38:16"}
17
+ {"current_steps": 17, "total_steps": 66, "loss": 0.2351, "lr": 9.436760375282858e-06, "epoch": 1.434782608695652, "percentage": 25.76, "elapsed_time": "0:55:21", "remaining_time": "2:39:35"}
18
+ {"current_steps": 18, "total_steps": 66, "loss": 0.2577, "lr": 9.307770406969032e-06, "epoch": 1.5217391304347827, "percentage": 27.27, "elapsed_time": "0:58:36", "remaining_time": "2:36:17"}
19
+ {"current_steps": 19, "total_steps": 66, "loss": 0.1864, "lr": 9.166569595412576e-06, "epoch": 1.608695652173913, "percentage": 28.79, "elapsed_time": "1:02:42", "remaining_time": "2:35:07"}
20
+ {"current_steps": 20, "total_steps": 66, "loss": 0.258, "lr": 9.013558189654819e-06, "epoch": 1.6956521739130435, "percentage": 30.3, "elapsed_time": "1:06:27", "remaining_time": "2:32:51"}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20b8c9e2a763a087603937d1ab764f1900fe3afa1cd3155f36f65d2dd76037bb
3
  size 7608
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11cfe797e23011f7391f073c189e3e9806843d7a34eb701ca049ae309739cbab
3
  size 7608