OckerGui committed on
Commit
1a2b7bc
·
1 Parent(s): b9fe364

Model save

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.25,
3
- "eval_accuracy": 0.1956521739130435,
4
- "eval_loss": 1.5383708477020264,
5
- "eval_runtime": 100.417,
6
- "eval_samples_per_second": 0.916,
7
- "eval_steps_per_second": 0.229
8
  }
 
1
  {
2
+ "epoch": 3.23,
3
+ "eval_accuracy": 0.36507936507936506,
4
+ "eval_loss": 1.390939474105835,
5
+ "eval_runtime": 50.4581,
6
+ "eval_samples_per_second": 1.249,
7
+ "eval_steps_per_second": 0.317
8
  }
runs/Jul25_23-36-15_33b58b9b2125/events.out.tfevents.1690329587.33b58b9b2125.471.2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93f3a7d6ed3575787bf64547ac610a623209ab706ec58bf0fcc494cad8f0fe45
3
- size 405
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61b0e5deb564424fdb232e0ee799d98376651bff2dc33365d626a0b2c4911ec3
3
+ size 722
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.25,
3
- "eval_accuracy": 0.1956521739130435,
4
- "eval_loss": 1.5383708477020264,
5
- "eval_runtime": 100.417,
6
- "eval_samples_per_second": 0.916,
7
- "eval_steps_per_second": 0.229
8
  }
 
1
  {
2
+ "epoch": 3.23,
3
+ "eval_accuracy": 0.36507936507936506,
4
+ "eval_loss": 1.390939474105835,
5
+ "eval_runtime": 50.4581,
6
+ "eval_samples_per_second": 1.249,
7
+ "eval_steps_per_second": 0.317
8
  }
trainer_state.json CHANGED
@@ -1,127 +1,151 @@
1
  {
2
- "best_metric": 0.4166666666666667,
3
- "best_model_checkpoint": "videomae-base-finetuned-ASBD_ESBD/checkpoint-42",
4
- "epoch": 3.25,
5
- "global_step": 84,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.12,
12
- "learning_rate": 4.933333333333334e-05,
13
- "loss": 1.5615,
14
  "step": 10
15
  },
16
  {
17
- "epoch": 0.24,
18
- "learning_rate": 4.266666666666667e-05,
19
- "loss": 1.4616,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.25,
24
- "eval_accuracy": 0.2569444444444444,
25
- "eval_loss": 1.3287016153335571,
26
- "eval_runtime": 164.0785,
27
- "eval_samples_per_second": 0.878,
28
- "eval_steps_per_second": 0.219,
29
- "step": 21
30
- },
31
- {
32
- "epoch": 1.11,
33
- "learning_rate": 3.6e-05,
34
- "loss": 1.3015,
35
  "step": 30
36
  },
37
  {
38
- "epoch": 1.23,
39
- "learning_rate": 2.9333333333333336e-05,
40
- "loss": 1.215,
41
- "step": 40
 
 
 
42
  },
43
  {
44
- "epoch": 1.25,
45
- "eval_accuracy": 0.4166666666666667,
46
- "eval_loss": 1.2314302921295166,
47
- "eval_runtime": 134.8195,
48
- "eval_samples_per_second": 1.068,
49
- "eval_steps_per_second": 0.267,
50
- "step": 42
51
  },
52
  {
53
- "epoch": 2.1,
54
- "learning_rate": 2.2666666666666668e-05,
55
- "loss": 1.2456,
56
  "step": 50
57
  },
58
  {
59
- "epoch": 2.21,
60
- "learning_rate": 1.6000000000000003e-05,
61
- "loss": 1.1371,
62
  "step": 60
63
  },
64
  {
65
- "epoch": 2.25,
66
- "eval_accuracy": 0.3541666666666667,
67
- "eval_loss": 1.2707536220550537,
68
- "eval_runtime": 134.9477,
69
- "eval_samples_per_second": 1.067,
70
- "eval_steps_per_second": 0.267,
71
- "step": 63
72
  },
73
  {
74
- "epoch": 3.08,
75
- "learning_rate": 9.333333333333334e-06,
76
- "loss": 1.1823,
77
  "step": 70
78
  },
79
  {
80
- "epoch": 3.2,
81
- "learning_rate": 2.666666666666667e-06,
82
- "loss": 1.043,
83
  "step": 80
84
  },
85
  {
86
- "epoch": 3.25,
87
- "eval_accuracy": 0.3680555555555556,
88
- "eval_loss": 1.2449548244476318,
89
- "eval_runtime": 140.7456,
90
- "eval_samples_per_second": 1.023,
91
- "eval_steps_per_second": 0.256,
92
- "step": 84
93
  },
94
  {
95
- "epoch": 3.25,
96
- "step": 84,
97
- "total_flos": 4.186851697156424e+17,
98
- "train_loss": 1.2573059399922688,
99
- "train_runtime": 1343.3508,
100
- "train_samples_per_second": 0.25,
101
- "train_steps_per_second": 0.063
102
  },
103
  {
104
- "epoch": 3.25,
105
- "eval_accuracy": 0.1956521739130435,
106
- "eval_loss": 1.5383708477020264,
107
- "eval_runtime": 120.4967,
108
- "eval_samples_per_second": 0.764,
109
- "eval_steps_per_second": 0.191,
110
- "step": 84
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
111
  },
112
  {
113
- "epoch": 3.25,
114
- "eval_accuracy": 0.1956521739130435,
115
- "eval_loss": 1.5383708477020264,
116
- "eval_runtime": 100.417,
117
- "eval_samples_per_second": 0.916,
118
- "eval_steps_per_second": 0.229,
119
- "step": 84
120
  }
121
  ],
122
- "max_steps": 84,
123
  "num_train_epochs": 9223372036854775807,
124
- "total_flos": 4.186851697156424e+17,
125
  "trial_name": null,
126
  "trial_params": null
127
  }
 
1
  {
2
+ "best_metric": 0.34328358208955223,
3
+ "best_model_checkpoint": "videomae-base-finetuned-ASBD_ESBD/checkpoint-62",
4
+ "epoch": 3.225,
5
+ "global_step": 120,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.08,
12
+ "learning_rate": 4.166666666666667e-05,
13
+ "loss": 1.4881,
14
  "step": 10
15
  },
16
  {
17
+ "epoch": 0.17,
18
+ "learning_rate": 4.62962962962963e-05,
19
+ "loss": 1.3349,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.25,
24
+ "learning_rate": 4.166666666666667e-05,
25
+ "loss": 1.377,
 
 
 
 
 
 
 
 
 
26
  "step": 30
27
  },
28
  {
29
+ "epoch": 0.26,
30
+ "eval_accuracy": 0.19402985074626866,
31
+ "eval_loss": 1.4631586074829102,
32
+ "eval_runtime": 90.4696,
33
+ "eval_samples_per_second": 0.741,
34
+ "eval_steps_per_second": 0.188,
35
+ "step": 31
36
  },
37
  {
38
+ "epoch": 1.07,
39
+ "learning_rate": 3.7037037037037037e-05,
40
+ "loss": 1.3908,
41
+ "step": 40
 
 
 
42
  },
43
  {
44
+ "epoch": 1.16,
45
+ "learning_rate": 3.240740740740741e-05,
46
+ "loss": 1.2884,
47
  "step": 50
48
  },
49
  {
50
+ "epoch": 1.24,
51
+ "learning_rate": 2.777777777777778e-05,
52
+ "loss": 1.2476,
53
  "step": 60
54
  },
55
  {
56
+ "epoch": 1.26,
57
+ "eval_accuracy": 0.34328358208955223,
58
+ "eval_loss": 1.310468316078186,
59
+ "eval_runtime": 85.9108,
60
+ "eval_samples_per_second": 0.78,
61
+ "eval_steps_per_second": 0.198,
62
+ "step": 62
63
  },
64
  {
65
+ "epoch": 2.07,
66
+ "learning_rate": 2.314814814814815e-05,
67
+ "loss": 1.0522,
68
  "step": 70
69
  },
70
  {
71
+ "epoch": 2.15,
72
+ "learning_rate": 1.8518518518518518e-05,
73
+ "loss": 1.2907,
74
  "step": 80
75
  },
76
  {
77
+ "epoch": 2.23,
78
+ "learning_rate": 1.388888888888889e-05,
79
+ "loss": 1.2034,
80
+ "step": 90
 
 
 
81
  },
82
  {
83
+ "epoch": 2.26,
84
+ "eval_accuracy": 0.2835820895522388,
85
+ "eval_loss": 1.3650459051132202,
86
+ "eval_runtime": 87.6565,
87
+ "eval_samples_per_second": 0.764,
88
+ "eval_steps_per_second": 0.194,
89
+ "step": 93
90
  },
91
  {
92
+ "epoch": 3.06,
93
+ "learning_rate": 9.259259259259259e-06,
94
+ "loss": 1.199,
95
+ "step": 100
96
+ },
97
+ {
98
+ "epoch": 3.14,
99
+ "learning_rate": 4.6296296296296296e-06,
100
+ "loss": 1.0395,
101
+ "step": 110
102
+ },
103
+ {
104
+ "epoch": 3.23,
105
+ "learning_rate": 0.0,
106
+ "loss": 0.9454,
107
+ "step": 120
108
+ },
109
+ {
110
+ "epoch": 3.23,
111
+ "eval_accuracy": 0.3283582089552239,
112
+ "eval_loss": 1.347509741783142,
113
+ "eval_runtime": 86.3368,
114
+ "eval_samples_per_second": 0.776,
115
+ "eval_steps_per_second": 0.197,
116
+ "step": 120
117
+ },
118
+ {
119
+ "epoch": 3.23,
120
+ "step": 120,
121
+ "total_flos": 5.869068896906772e+17,
122
+ "train_loss": 1.238083585103353,
123
+ "train_runtime": 1251.5665,
124
+ "train_samples_per_second": 0.384,
125
+ "train_steps_per_second": 0.096
126
+ },
127
+ {
128
+ "epoch": 3.23,
129
+ "eval_accuracy": 0.36507936507936506,
130
+ "eval_loss": 1.390939474105835,
131
+ "eval_runtime": 57.4152,
132
+ "eval_samples_per_second": 1.097,
133
+ "eval_steps_per_second": 0.279,
134
+ "step": 120
135
  },
136
  {
137
+ "epoch": 3.23,
138
+ "eval_accuracy": 0.36507936507936506,
139
+ "eval_loss": 1.390939474105835,
140
+ "eval_runtime": 50.4581,
141
+ "eval_samples_per_second": 1.249,
142
+ "eval_steps_per_second": 0.317,
143
+ "step": 120
144
  }
145
  ],
146
+ "max_steps": 120,
147
  "num_train_epochs": 9223372036854775807,
148
+ "total_flos": 5.869068896906772e+17,
149
  "trial_name": null,
150
  "trial_params": null
151
  }