masatochi committed on
Commit
6f66d38
·
verified ·
1 Parent(s): 9f1b2d4

Training in progress, step 985, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9945e31b638334bf494fdbd6bddbd7efb17b80e2cb934406af8bd6e740a52c13
3
  size 48679352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6e5b896f8b2107fa474ed7dd4a3e70346065a15ff641a52c3f4f047b8b292b2
3
  size 48679352
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2faad1ff615b4367ac8f493089d35aa61ad18cd058aa6a59301eee8776decdbe
3
  size 25152884
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1eb16b5bd5f94102e9811db74952e3afddfa0eb03f909b03ec81c889aa909ad
3
  size 25152884
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a563e473225d388aa85a62aecbc6bdee80f72d3795da30b7a19c51113a1af02
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b712e2c7731e2e06b7c359163b91d5551189c894148dc86f6f8fd62dfef29d2
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0cdd00c1b48b23a3fb0db3f88bb5f4c0c6d9b16cd39a52129b3151d7da108592
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:708b500eeebd05993112b6d6ad4170e8b50c4b3fed50daf1ac656195272b9044
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.7086044830079538,
5
  "eval_steps": 692,
6
- "global_step": 980,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -6883,6 +6883,41 @@
6883
  "learning_rate": 1.9188404864839465e-05,
6884
  "loss": 1.1212,
6885
  "step": 980
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6886
  }
6887
  ],
6888
  "logging_steps": 1,
@@ -6902,7 +6937,7 @@
6902
  "attributes": {}
6903
  }
6904
  },
6905
- "total_flos": 2.1817874712625152e+18,
6906
  "train_batch_size": 4,
6907
  "trial_name": null,
6908
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.7122198120028923,
5
  "eval_steps": 692,
6
+ "global_step": 985,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
6883
  "learning_rate": 1.9188404864839465e-05,
6884
  "loss": 1.1212,
6885
  "step": 980
6886
+ },
6887
+ {
6888
+ "epoch": 0.7093275488069414,
6889
+ "grad_norm": 0.453218013048172,
6890
+ "learning_rate": 1.9186584719112724e-05,
6891
+ "loss": 0.9847,
6892
+ "step": 981
6893
+ },
6894
+ {
6895
+ "epoch": 0.7100506146059291,
6896
+ "grad_norm": 0.43997496366500854,
6897
+ "learning_rate": 1.9184762621195897e-05,
6898
+ "loss": 0.9984,
6899
+ "step": 982
6900
+ },
6901
+ {
6902
+ "epoch": 0.7107736804049168,
6903
+ "grad_norm": 0.5103498101234436,
6904
+ "learning_rate": 1.91829385714762e-05,
6905
+ "loss": 1.0727,
6906
+ "step": 983
6907
+ },
6908
+ {
6909
+ "epoch": 0.7114967462039046,
6910
+ "grad_norm": 0.5352555513381958,
6911
+ "learning_rate": 1.918111257034124e-05,
6912
+ "loss": 1.02,
6913
+ "step": 984
6914
+ },
6915
+ {
6916
+ "epoch": 0.7122198120028923,
6917
+ "grad_norm": 0.40594494342803955,
6918
+ "learning_rate": 1.917928461817906e-05,
6919
+ "loss": 1.0947,
6920
+ "step": 985
6921
  }
6922
  ],
6923
  "logging_steps": 1,
 
6937
  "attributes": {}
6938
  }
6939
  },
6940
+ "total_flos": 2.1929190399934464e+18,
6941
  "train_batch_size": 4,
6942
  "trial_name": null,
6943
  "trial_params": null