yuzhounie commited on
Commit
142a8c3
·
verified ·
1 Parent(s): b7e8289

Training in progress, step 60

Browse files
model-00001-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44b36e093493b896f84d994d06831b2641901118c6e3e765051530e4018dea22
3
  size 4891730992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2016cc0a9be46df8bef7859060b6cf9789105332044ae327f7a175e05e255d96
3
  size 4891730992
model-00002-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3b409c4fcd5470666d27013b3b24595e4ab5b05ea2c910409b99149e02dae47
3
  size 4876059352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:474c07d635e55f330cfe53a2ece25b42fe82cd661e574d68666a1e435b662678
3
  size 4876059352
model-00003-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55f059e0a1e015a9f54caf070837d34ceb8474dd1dbce6e8408eb25f853b059e
3
  size 4876059384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:703d5933df268906f34495f5cbcbdf1307d010970e542195d33f8c32b212113d
3
  size 4876059384
model-00004-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4607a948a525c8a91f484e1ccd0e6d63d46b76f46c3969780f5d107be599ad51
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fb01c095811714480715cfb91012c242a7c0ff6519f0215549928a87f00339c
3
  size 4876059416
model-00005-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9684d5afd063010280fed57f354f9b0b1349db77f7ecca49a1c376c0feacc34
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2eff2ead8c5903eeceb1c24f5f97cba7298b67982676559b676871ea25e249fe
3
  size 4876059416
model-00006-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ee316660adaa711420814a4efdfe7f3f43436f4873e32ea7d871f2b70c0f606
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffb2f5063c25982cf50656591c75b43b6cf76c8d62ecaac67f1f23e2ee97d53d
3
  size 4876059416
model-00007-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:436d63b09bc582d99493c1859941adfa21e4dd75b5045dce7bc92eeb1afa5da1
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e35399d0d40f1b66f1212139f66767afc390cd705f79e1d36fc59de7211ced05
3
  size 4876059416
model-00008-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:783e4aab8cebccbbea32683a7decc8213bfae3a1411ffb3e9ad23b0d920caa38
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e34dd0ab728f1ab7c740e8692b07a6756681a264a8528863da928ec61258aec8
3
  size 4876059416
model-00009-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a43b0c96a9cc067e58033218a6daebf3afc827b8ddfd37c3229db76c54774c5a
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e87adce5c0015da7d74bb223aefe577aa73fd5f4a16c9a150b027eaf5c4ec65
3
  size 4876059416
model-00010-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a1330ad54e14159fd2b3a532027ff98772332c0d3135a7098cfb0bc3da45d53
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:009cf3582020a7555d670a41498ef2a31b9b78a71dae180761fbe34928ca8499
3
  size 4876059416
model-00011-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:215cf2f44190b0f5cc034630f9b89ed4ae7c39745994ce7337800a0b0d8c7d74
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2025415b892c7195f7de49f3b2532769ee40a72f19ae1b001fbc09fcac47e3d7
3
  size 4876059416
model-00012-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37273c150922b0e4b354be81cb12081c21cb546b47dcffd96c82c4a65d31b9af
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c0c19b8d3a9d1dee0567f4a5d60583488f63e015f1d91d16ccaadb3c2f97e0c
3
  size 4876059416
model-00013-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:657c73bbbe43d8965895213495fe1fbe8075d0634ea51edb39911cfa867e6dca
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:095e7a735491a81438a949fdf0c7d517e62d850743c621c3d1311cbb8dbdce93
3
  size 4876059416
model-00014-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b73772bac89ec879f41f35a78958c6b80c5d182a591994ffaad43913c6ab399b
3
  size 2123397800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c7b33307a4400e19bf21bf3b78c94432eb5cdfaf0c278c24c96c4d65ce16d4e
3
  size 2123397800
trainer_log.jsonl CHANGED
@@ -49,3 +49,23 @@
49
  {"current_steps": 38, "total_steps": 63, "loss": 0.1421, "lr": 4.162468883476319e-06, "epoch": 1.7559055118110236, "percentage": 60.32, "elapsed_time": "7:32:44", "remaining_time": "4:57:51"}
50
  {"current_steps": 39, "total_steps": 63, "loss": 0.1543, "lr": 3.887395330218429e-06, "epoch": 1.8031496062992125, "percentage": 61.9, "elapsed_time": "7:49:25", "remaining_time": "4:48:52"}
51
  {"current_steps": 40, "total_steps": 63, "loss": 0.1796, "lr": 3.6158224428757538e-06, "epoch": 1.8503937007874016, "percentage": 63.49, "elapsed_time": "7:59:50", "remaining_time": "4:35:54"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
49
  {"current_steps": 38, "total_steps": 63, "loss": 0.1421, "lr": 4.162468883476319e-06, "epoch": 1.7559055118110236, "percentage": 60.32, "elapsed_time": "7:32:44", "remaining_time": "4:57:51"}
50
  {"current_steps": 39, "total_steps": 63, "loss": 0.1543, "lr": 3.887395330218429e-06, "epoch": 1.8031496062992125, "percentage": 61.9, "elapsed_time": "7:49:25", "remaining_time": "4:48:52"}
51
  {"current_steps": 40, "total_steps": 63, "loss": 0.1796, "lr": 3.6158224428757538e-06, "epoch": 1.8503937007874016, "percentage": 63.49, "elapsed_time": "7:59:50", "remaining_time": "4:35:54"}
52
+ {"current_steps": 41, "total_steps": 63, "loss": 0.1771, "lr": 3.3486046902241663e-06, "epoch": 1.8976377952755905, "percentage": 65.08, "elapsed_time": "8:16:31", "remaining_time": "4:26:25"}
53
+ {"current_steps": 42, "total_steps": 63, "loss": 0.163, "lr": 3.0865828381745515e-06, "epoch": 1.9448818897637796, "percentage": 66.67, "elapsed_time": "8:26:02", "remaining_time": "4:13:01"}
54
+ {"current_steps": 43, "total_steps": 63, "loss": 0.1518, "lr": 2.83058130441221e-06, "epoch": 1.9921259842519685, "percentage": 68.25, "elapsed_time": "8:37:10", "remaining_time": "4:00:33"}
55
+ {"current_steps": 44, "total_steps": 63, "loss": 0.1685, "lr": 2.5814055644738013e-06, "epoch": 2.0, "percentage": 69.84, "elapsed_time": "8:38:30", "remaining_time": "3:43:54"}
56
+ {"current_steps": 45, "total_steps": 63, "loss": 0.135, "lr": 2.339839617423318e-06, "epoch": 2.047244094488189, "percentage": 71.43, "elapsed_time": "8:54:43", "remaining_time": "3:33:53"}
57
+ {"current_steps": 46, "total_steps": 63, "loss": 0.1472, "lr": 2.1066435191009717e-06, "epoch": 2.094488188976378, "percentage": 73.02, "elapsed_time": "9:06:16", "remaining_time": "3:21:52"}
58
+ {"current_steps": 47, "total_steps": 63, "loss": 0.1161, "lr": 1.8825509907063328e-06, "epoch": 2.141732283464567, "percentage": 74.6, "elapsed_time": "9:19:29", "remaining_time": "3:10:27"}
59
+ {"current_steps": 48, "total_steps": 63, "loss": 0.0941, "lr": 1.6682671102399806e-06, "epoch": 2.188976377952756, "percentage": 76.19, "elapsed_time": "9:27:49", "remaining_time": "2:57:26"}
60
+ {"current_steps": 49, "total_steps": 63, "loss": 0.1614, "lr": 1.4644660940672628e-06, "epoch": 2.236220472440945, "percentage": 77.78, "elapsed_time": "9:39:32", "remaining_time": "2:45:35"}
61
+ {"current_steps": 50, "total_steps": 63, "loss": 0.1533, "lr": 1.2717891755841722e-06, "epoch": 2.283464566929134, "percentage": 79.37, "elapsed_time": "9:48:50", "remaining_time": "2:33:05"}
62
+ {"current_steps": 51, "total_steps": 63, "loss": 0.1051, "lr": 1.0908425876598512e-06, "epoch": 2.3307086614173227, "percentage": 80.95, "elapsed_time": "10:04:28", "remaining_time": "2:22:13"}
63
+ {"current_steps": 52, "total_steps": 63, "loss": 0.0923, "lr": 9.221956552036992e-07, "epoch": 2.377952755905512, "percentage": 82.54, "elapsed_time": "10:13:47", "remaining_time": "2:09:50"}
64
+ {"current_steps": 53, "total_steps": 63, "loss": 0.0977, "lr": 7.663790038585794e-07, "epoch": 2.425196850393701, "percentage": 84.13, "elapsed_time": "10:27:30", "remaining_time": "1:58:23"}
65
+ {"current_steps": 54, "total_steps": 63, "loss": 0.1154, "lr": 6.238828904562316e-07, "epoch": 2.47244094488189, "percentage": 85.71, "elapsed_time": "10:35:38", "remaining_time": "1:45:56"}
66
+ {"current_steps": 55, "total_steps": 63, "loss": 0.1237, "lr": 4.951556604879049e-07, "epoch": 2.5196850393700787, "percentage": 87.3, "elapsed_time": "10:46:50", "remaining_time": "1:34:05"}
67
+ {"current_steps": 56, "total_steps": 63, "loss": 0.1042, "lr": 3.8060233744356634e-07, "epoch": 2.5669291338582676, "percentage": 88.89, "elapsed_time": "10:57:44", "remaining_time": "1:22:13"}
68
+ {"current_steps": 57, "total_steps": 63, "loss": 0.1259, "lr": 2.8058334845816214e-07, "epoch": 2.6141732283464565, "percentage": 90.48, "elapsed_time": "11:05:21", "remaining_time": "1:10:02"}
69
+ {"current_steps": 58, "total_steps": 63, "loss": 0.1105, "lr": 1.9541339027450256e-07, "epoch": 2.661417322834646, "percentage": 92.06, "elapsed_time": "11:17:59", "remaining_time": "0:58:26"}
70
+ {"current_steps": 59, "total_steps": 63, "loss": 0.1063, "lr": 1.253604390908819e-07, "epoch": 2.7086614173228347, "percentage": 93.65, "elapsed_time": "11:27:42", "remaining_time": "0:46:37"}
71
+ {"current_steps": 60, "total_steps": 63, "loss": 0.1343, "lr": 7.064490740882057e-08, "epoch": 2.7559055118110236, "percentage": 95.24, "elapsed_time": "11:40:49", "remaining_time": "0:35:02"}