yunyus committed on
Commit
ef67f3c
·
verified ·
1 Parent(s): ef0eb44

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1282c2da93a10f875761d10363fbb5ab67026b95c76e9f3a5e2276759968fdab
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a99f8e2f451020963cc862630e225027c3a59459785f9d414c18cf527bf0df0c
3
  size 437958648
run-0/checkpoint-78/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:983079b3c184b69976e3e922ab414401c8dd25219df83429805a59bd095053dd
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e73a6a94dabb0efcd0fee951b4bb269e4bcbfd86b038cdb1f05f69be224987f
3
  size 437958648
run-0/checkpoint-78/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d628c74667cf811dff5a038d36527982b4b400445b151449a6ee357bf4659fe
3
  size 876038394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0b9e49c0f111404bf3bb75f8aa46ebfe532888c0089618f9fee7181e88ff866
3
  size 876038394
run-0/checkpoint-78/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d5ea817570194d8e0e85204e3f66b3bc8aa9d4419d9d0feda444e6993af6a1e
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca3cccd11b77d5d203a4466ecd61d7de95628051c1e10e12242d864bf481cb9f
3
  size 1064
run-0/checkpoint-78/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a0f87a8069f7eac17becb3abe4f91c5f6d7edf26c85de5367deed4737c39966
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60d0f60e33d97e1e0e5b10975bfd55ba2fc1145f2d1c8aa831504b116b1fc39f
3
  size 5432
run-1/checkpoint-39/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aab3944602ff17de830dca74c2c3bdcf3ca2357a2c3946ff27d56be6f4489301
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d59550c1dea5879e3a1aec7065f8590e7113f652b84472de96c6c9c1e27d705
3
  size 437958648
run-1/checkpoint-39/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4fac6b678ea4e78123eebb2a57863cdcb7d5a6c102493d6beaba5f58b16a9ac7
3
  size 876038394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e45c157362ad69595478c4daeb665be40748e26b910672812955c6656252fe88
3
  size 876038394
run-1/checkpoint-39/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e728d62168539e162cfd12980713e2c0a527faec5a51cc3eef8e80293c895d1
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1357d27d6dcc07f61181342425227d9ce57d5241166fc1b33bb5b5fbf50cf5e6
3
  size 1064
run-1/checkpoint-39/trainer_state.json CHANGED
@@ -12,10 +12,10 @@
12
  {
13
  "epoch": 1.0,
14
  "eval_accuracy": 0.4729241877256318,
15
- "eval_loss": 0.7139573693275452,
16
- "eval_runtime": 1.9882,
17
- "eval_samples_per_second": 139.325,
18
- "eval_steps_per_second": 4.527,
19
  "step": 39
20
  }
21
  ],
@@ -40,8 +40,8 @@
40
  "train_batch_size": 64,
41
  "trial_name": null,
42
  "trial_params": {
43
- "dropout_rate": 0.32964696479911365,
44
- "learning_rate": 2.707454604407671e-06,
45
  "max_seq_length": 256,
46
  "num_train_epochs": 2,
47
  "per_device_train_batch_size": 64
 
12
  {
13
  "epoch": 1.0,
14
  "eval_accuracy": 0.4729241877256318,
15
+ "eval_loss": 0.7221417427062988,
16
+ "eval_runtime": 2.0129,
17
+ "eval_samples_per_second": 137.615,
18
+ "eval_steps_per_second": 2.484,
19
  "step": 39
20
  }
21
  ],
 
40
  "train_batch_size": 64,
41
  "trial_name": null,
42
  "trial_params": {
43
+ "dropout_rate": 0.1016397017464123,
44
+ "learning_rate": 1.2050894848379789e-06,
45
  "max_seq_length": 256,
46
  "num_train_epochs": 2,
47
  "per_device_train_batch_size": 64
run-1/checkpoint-39/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f20413c6f4f1baa91041a9640292f4bb307c9f460181077fcc3c0a98556ef3cb
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b58a714467b799b6a0ccb9002f056087cc69c203d1b9db91e56a40aedfe1659
3
  size 5432
run-1/checkpoint-78/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54d7b95993061f4281902d35e5f3f462aad9fc8d79bebc829b5984d7b9f88290
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3934f42aedd032f285b4f5eb2d0bb0a9fb0739bfcdaf37c0d888b00008339c9b
3
  size 437958648
run-1/checkpoint-78/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7388507902d618d4a5636970d22e834775a6fc97b9789f3763f810c1ba3ce5a0
3
  size 876038394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:650808565c7da7432db3554c69ce9024029ee48e9fcbfcba3fd875017715c8a6
3
  size 876038394
run-1/checkpoint-78/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:755c3933ed6cf784e3b07188774fc84009f398046b2422fd5db2b326826542cd
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf714d04f8d03c499d62b8995b10cdcefa51102cbc9dc743e413e17551e3d5da
3
  size 1064
run-1/checkpoint-78/trainer_state.json CHANGED
@@ -12,19 +12,19 @@
12
  {
13
  "epoch": 1.0,
14
  "eval_accuracy": 0.4729241877256318,
15
- "eval_loss": 0.7139573693275452,
16
- "eval_runtime": 1.9882,
17
- "eval_samples_per_second": 139.325,
18
- "eval_steps_per_second": 4.527,
19
  "step": 39
20
  },
21
  {
22
  "epoch": 2.0,
23
- "eval_accuracy": 0.4657039711191336,
24
- "eval_loss": 0.7088006138801575,
25
- "eval_runtime": 1.922,
26
- "eval_samples_per_second": 144.117,
27
- "eval_steps_per_second": 4.683,
28
  "step": 78
29
  }
30
  ],
@@ -49,8 +49,8 @@
49
  "train_batch_size": 64,
50
  "trial_name": null,
51
  "trial_params": {
52
- "dropout_rate": 0.32964696479911365,
53
- "learning_rate": 2.707454604407671e-06,
54
  "max_seq_length": 256,
55
  "num_train_epochs": 2,
56
  "per_device_train_batch_size": 64
 
12
  {
13
  "epoch": 1.0,
14
  "eval_accuracy": 0.4729241877256318,
15
+ "eval_loss": 0.7221417427062988,
16
+ "eval_runtime": 2.0129,
17
+ "eval_samples_per_second": 137.615,
18
+ "eval_steps_per_second": 2.484,
19
  "step": 39
20
  },
21
  {
22
  "epoch": 2.0,
23
+ "eval_accuracy": 0.4729241877256318,
24
+ "eval_loss": 0.7191658020019531,
25
+ "eval_runtime": 2.189,
26
+ "eval_samples_per_second": 126.544,
27
+ "eval_steps_per_second": 2.284,
28
  "step": 78
29
  }
30
  ],
 
49
  "train_batch_size": 64,
50
  "trial_name": null,
51
  "trial_params": {
52
+ "dropout_rate": 0.1016397017464123,
53
+ "learning_rate": 1.2050894848379789e-06,
54
  "max_seq_length": 256,
55
  "num_train_epochs": 2,
56
  "per_device_train_batch_size": 64
run-1/checkpoint-78/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f20413c6f4f1baa91041a9640292f4bb307c9f460181077fcc3c0a98556ef3cb
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b58a714467b799b6a0ccb9002f056087cc69c203d1b9db91e56a40aedfe1659
3
  size 5432
run-2/checkpoint-39/config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "BertForSequenceClassification"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "classifier_dropout": null,
7
+ "gradient_checkpointing": false,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 768,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 3072,
13
+ "layer_norm_eps": 1e-12,
14
+ "max_position_embeddings": 512,
15
+ "model_type": "bert",
16
+ "num_attention_heads": 12,
17
+ "num_hidden_layers": 12,
18
+ "pad_token_id": 0,
19
+ "position_embedding_type": "absolute",
20
+ "problem_type": "single_label_classification",
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.50.3",
23
+ "type_vocab_size": 2,
24
+ "use_cache": true,
25
+ "vocab_size": 30522
26
+ }
run-2/checkpoint-39/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a99f8e2f451020963cc862630e225027c3a59459785f9d414c18cf527bf0df0c
3
+ size 437958648
run-2/checkpoint-39/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7aa3db6cca0c2b46f6bb3cdc4192524791925aae96afeefadc5fc800c61f8590
3
+ size 876038394
run-2/checkpoint-39/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb9d75225831e9955fede3b2d004809f8a35dbd2208354c70b53a96923288fdc
3
+ size 14244
run-2/checkpoint-39/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51d0b00f673d1afb7ad79ca355e4162ad1ab39a84b5123bbca794c2d33f68972
3
+ size 1064
run-2/checkpoint-39/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
run-2/checkpoint-39/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
run-2/checkpoint-39/tokenizer_config.json ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": false,
45
+ "cls_token": "[CLS]",
46
+ "do_lower_case": true,
47
+ "extra_special_tokens": {},
48
+ "mask_token": "[MASK]",
49
+ "model_max_length": 512,
50
+ "pad_token": "[PAD]",
51
+ "sep_token": "[SEP]",
52
+ "strip_accents": null,
53
+ "tokenize_chinese_chars": true,
54
+ "tokenizer_class": "BertTokenizer",
55
+ "unk_token": "[UNK]"
56
+ }
run-2/checkpoint-39/trainer_state.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": 39,
3
+ "best_metric": 0.4693140794223827,
4
+ "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_1/run-2/checkpoint-39",
5
+ "epoch": 1.0,
6
+ "eval_steps": 500,
7
+ "global_step": 39,
8
+ "is_hyper_param_search": true,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 1.0,
14
+ "eval_accuracy": 0.4693140794223827,
15
+ "eval_loss": 0.7152564525604248,
16
+ "eval_runtime": 2.0411,
17
+ "eval_samples_per_second": 135.708,
18
+ "eval_steps_per_second": 2.45,
19
+ "step": 39
20
+ }
21
+ ],
22
+ "logging_steps": 500,
23
+ "max_steps": 39,
24
+ "num_input_tokens_seen": 0,
25
+ "num_train_epochs": 1,
26
+ "save_steps": 500,
27
+ "stateful_callbacks": {
28
+ "TrainerControl": {
29
+ "args": {
30
+ "should_epoch_stop": false,
31
+ "should_evaluate": false,
32
+ "should_log": false,
33
+ "should_save": true,
34
+ "should_training_stop": true
35
+ },
36
+ "attributes": {}
37
+ }
38
+ },
39
+ "total_flos": 0,
40
+ "train_batch_size": 64,
41
+ "trial_name": null,
42
+ "trial_params": {
43
+ "dropout_rate": 0.3750648367717625,
44
+ "learning_rate": 3.89885805363765e-06,
45
+ "max_seq_length": 256,
46
+ "num_train_epochs": 1,
47
+ "per_device_train_batch_size": 64
48
+ }
49
+ }
run-2/checkpoint-39/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9262f528bfa4fcd0f8292f8cee23dda4c29b4b3acbfaca897c50fe6856e9e89
3
+ size 5432
run-2/checkpoint-39/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:60d0f60e33d97e1e0e5b10975bfd55ba2fc1145f2d1c8aa831504b116b1fc39f
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9262f528bfa4fcd0f8292f8cee23dda4c29b4b3acbfaca897c50fe6856e9e89
3
  size 5432