khleeloo commited on
Commit
fbadca0
1 Parent(s): b64bac5

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,16 +1,16 @@
1
  {
2
  "epoch": 4.0,
3
- "eval_accuracy": 0.794973544973545,
4
- "eval_f1": 0.7911822260194087,
5
- "eval_loss": 0.8158386945724487,
6
- "eval_precision": 0.7898693796510783,
7
- "eval_recall": 0.794973544973545,
8
- "eval_runtime": 8.8626,
9
- "eval_samples_per_second": 170.604,
10
- "eval_steps_per_second": 10.719,
11
- "total_flos": 4.65670232933972e+18,
12
- "train_loss": 0.2716429328141264,
13
- "train_runtime": 832.7663,
14
- "train_samples_per_second": 48.105,
15
- "train_steps_per_second": 3.007
16
  }
 
1
  {
2
  "epoch": 4.0,
3
+ "eval_accuracy": 0.7817460317460317,
4
+ "eval_f1": 0.7722244420145986,
5
+ "eval_loss": 0.8502413630485535,
6
+ "eval_precision": 0.7756312792366583,
7
+ "eval_recall": 0.7817460317460317,
8
+ "eval_runtime": 10.0761,
9
+ "eval_samples_per_second": 150.058,
10
+ "eval_steps_per_second": 18.757,
11
+ "total_flos": 3.104468219559813e+18,
12
+ "train_loss": 0.0725347773061683,
13
+ "train_runtime": 849.1916,
14
+ "train_samples_per_second": 47.174,
15
+ "train_steps_per_second": 2.949
16
  }
eval_results.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
- "epoch": 6.0,
3
- "eval_accuracy": 0.794973544973545,
4
- "eval_f1": 0.7911822260194087,
5
- "eval_loss": 0.8158386945724487,
6
- "eval_precision": 0.7898693796510783,
7
- "eval_recall": 0.794973544973545,
8
- "eval_runtime": 8.8626,
9
- "eval_samples_per_second": 170.604,
10
- "eval_steps_per_second": 10.719
11
  }
 
1
  {
2
+ "epoch": 4.0,
3
+ "eval_accuracy": 0.7817460317460317,
4
+ "eval_f1": 0.7722244420145986,
5
+ "eval_loss": 0.8502413630485535,
6
+ "eval_precision": 0.7756312792366583,
7
+ "eval_recall": 0.7817460317460317,
8
+ "eval_runtime": 10.0761,
9
+ "eval_samples_per_second": 150.058,
10
+ "eval_steps_per_second": 18.757
11
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:19b65157a312222f7d90a2baab38d283d36066ea201f5d41216c9e1c16bf7e11
3
  size 343284077
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:395c6a4d60ddec8cc483a862b93b051769a3190c99b76fb9739e6c5d32e6955d
3
  size 343284077
runs/Oct27_21-22-14_EE4E077/events.out.tfevents.1698413879.EE4E077.103115.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beabc4f6f14a0cd7ef3beefd317bba1f6146e2ad660f7c8a8e2f404faa9bf4d2
3
+ size 560
runs/Oct27_22-15-51_EE4E077/1698416154.775236/events.out.tfevents.1698416154.EE4E077.103115.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:339b203dbaf2081c885219d6e4a9d823431b0f8e2b4070eb9fba16b8c4653a9b
3
+ size 5919
runs/Oct27_22-15-51_EE4E077/events.out.tfevents.1698416154.EE4E077.103115.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07476ca587eceeb26e2fe72fb228d090cb8b331fd72311fca7a43997ff57f831
3
+ size 6598
train_results.json CHANGED
@@ -1,7 +1,8 @@
1
  {
2
  "epoch": 4.0,
3
- "train_loss": 0.2716429328141264,
4
- "train_runtime": 832.7663,
5
- "train_samples_per_second": 48.105,
6
- "train_steps_per_second": 3.007
 
7
  }
 
1
  {
2
  "epoch": 4.0,
3
+ "total_flos": 3.104468219559813e+18,
4
+ "train_loss": 0.0725347773061683,
5
+ "train_runtime": 849.1916,
6
+ "train_samples_per_second": 47.174,
7
+ "train_steps_per_second": 2.949
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.8860103626943006,
3
- "best_model_checkpoint": "./vit-focal-skin/checkpoint-1252",
4
  "epoch": 4.0,
5
  "global_step": 2504,
6
  "is_hyper_param_search": false,
@@ -10,209 +10,209 @@
10
  {
11
  "epoch": 0.16,
12
  "learning_rate": 0.00019201277955271565,
13
- "loss": 0.7905,
14
  "step": 100
15
  },
16
  {
17
  "epoch": 0.32,
18
  "learning_rate": 0.00018402555910543132,
19
- "loss": 0.6162,
20
  "step": 200
21
  },
22
  {
23
  "epoch": 0.48,
24
  "learning_rate": 0.000176038338658147,
25
- "loss": 0.5709,
26
  "step": 300
27
  },
28
  {
29
  "epoch": 0.64,
30
  "learning_rate": 0.00016805111821086263,
31
- "loss": 0.5101,
32
  "step": 400
33
  },
34
  {
35
  "epoch": 0.8,
36
  "learning_rate": 0.0001600638977635783,
37
- "loss": 0.4966,
38
  "step": 500
39
  },
40
  {
41
  "epoch": 0.96,
42
  "learning_rate": 0.00015207667731629394,
43
- "loss": 0.4563,
44
  "step": 600
45
  },
46
  {
47
  "epoch": 1.0,
48
- "eval_accuracy": 0.8341968911917098,
49
- "eval_f1": 0.8331282144797781,
50
- "eval_loss": 0.40268635749816895,
51
- "eval_precision": 0.8791963514680484,
52
- "eval_recall": 0.8341968911917098,
53
- "eval_runtime": 1.5386,
54
- "eval_samples_per_second": 125.44,
55
- "eval_steps_per_second": 16.249,
56
  "step": 626
57
  },
58
  {
59
  "epoch": 1.12,
60
  "learning_rate": 0.00014408945686900958,
61
- "loss": 0.385,
62
  "step": 700
63
  },
64
  {
65
  "epoch": 1.28,
66
  "learning_rate": 0.00013610223642172525,
67
- "loss": 0.3621,
68
  "step": 800
69
  },
70
  {
71
  "epoch": 1.44,
72
- "learning_rate": 0.00012811501597444092,
73
- "loss": 0.3624,
74
  "step": 900
75
  },
76
  {
77
  "epoch": 1.6,
78
- "learning_rate": 0.00012012779552715656,
79
- "loss": 0.3403,
80
  "step": 1000
81
  },
82
  {
83
  "epoch": 1.76,
84
- "learning_rate": 0.00011214057507987221,
85
- "loss": 0.3293,
86
  "step": 1100
87
  },
88
  {
89
  "epoch": 1.92,
90
- "learning_rate": 0.00010415335463258787,
91
- "loss": 0.2954,
92
  "step": 1200
93
  },
94
  {
95
  "epoch": 2.0,
96
- "eval_accuracy": 0.8860103626943006,
97
- "eval_f1": 0.8891954516071332,
98
- "eval_loss": 0.3063604235649109,
99
- "eval_precision": 0.8988400162775354,
100
- "eval_recall": 0.8860103626943006,
101
- "eval_runtime": 1.5206,
102
- "eval_samples_per_second": 126.921,
103
- "eval_steps_per_second": 16.441,
104
  "step": 1252
105
  },
106
  {
107
  "epoch": 2.08,
108
- "learning_rate": 9.616613418530351e-05,
109
- "loss": 0.2258,
110
  "step": 1300
111
  },
112
  {
113
  "epoch": 2.24,
114
- "learning_rate": 8.817891373801918e-05,
115
- "loss": 0.1583,
116
  "step": 1400
117
  },
118
  {
119
  "epoch": 2.4,
120
- "learning_rate": 8.019169329073483e-05,
121
- "loss": 0.1589,
122
  "step": 1500
123
  },
124
  {
125
  "epoch": 2.56,
126
- "learning_rate": 7.220447284345049e-05,
127
- "loss": 0.1271,
128
  "step": 1600
129
  },
130
  {
131
  "epoch": 2.72,
132
- "learning_rate": 6.421725239616614e-05,
133
- "loss": 0.1746,
134
  "step": 1700
135
  },
136
  {
137
  "epoch": 2.88,
138
- "learning_rate": 5.623003194888179e-05,
139
- "loss": 0.1118,
140
  "step": 1800
141
  },
142
  {
143
  "epoch": 3.0,
144
  "eval_accuracy": 0.8704663212435233,
145
- "eval_f1": 0.8663258953141536,
146
- "eval_loss": 0.30049628019332886,
147
- "eval_precision": 0.8698602729520133,
148
  "eval_recall": 0.8704663212435233,
149
- "eval_runtime": 1.4368,
150
- "eval_samples_per_second": 134.33,
151
- "eval_steps_per_second": 17.4,
152
  "step": 1878
153
  },
154
  {
155
  "epoch": 3.04,
156
- "learning_rate": 4.824281150159744e-05,
157
- "loss": 0.1193,
158
  "step": 1900
159
  },
160
  {
161
  "epoch": 3.19,
162
- "learning_rate": 4.0255591054313104e-05,
163
- "loss": 0.0409,
164
  "step": 2000
165
  },
166
  {
167
  "epoch": 3.35,
168
- "learning_rate": 3.226837060702875e-05,
169
- "loss": 0.0327,
170
  "step": 2100
171
  },
172
  {
173
  "epoch": 3.51,
174
- "learning_rate": 2.428115015974441e-05,
175
- "loss": 0.0357,
176
  "step": 2200
177
  },
178
  {
179
  "epoch": 3.67,
180
- "learning_rate": 1.6293929712460065e-05,
181
- "loss": 0.0386,
182
  "step": 2300
183
  },
184
  {
185
  "epoch": 3.83,
186
- "learning_rate": 8.306709265175718e-06,
187
- "loss": 0.0303,
188
  "step": 2400
189
  },
190
  {
191
  "epoch": 3.99,
192
- "learning_rate": 3.194888178913738e-07,
193
- "loss": 0.0317,
194
  "step": 2500
195
  },
196
  {
197
  "epoch": 4.0,
198
- "eval_accuracy": 0.8549222797927462,
199
- "eval_f1": 0.8560478324319817,
200
- "eval_loss": 0.3552953004837036,
201
- "eval_precision": 0.8595484172497833,
202
- "eval_recall": 0.8549222797927462,
203
- "eval_runtime": 1.5113,
204
- "eval_samples_per_second": 127.703,
205
- "eval_steps_per_second": 16.542,
206
  "step": 2504
207
  },
208
  {
209
  "epoch": 4.0,
210
  "step": 2504,
211
  "total_flos": 3.104468219559813e+18,
212
- "train_loss": 0.2716429328141264,
213
- "train_runtime": 832.7663,
214
- "train_samples_per_second": 48.105,
215
- "train_steps_per_second": 3.007
216
  }
217
  ],
218
  "max_steps": 2504,
 
1
  {
2
+ "best_metric": 0.8704663212435233,
3
+ "best_model_checkpoint": "./vit-focal-skin/checkpoint-1878",
4
  "epoch": 4.0,
5
  "global_step": 2504,
6
  "is_hyper_param_search": false,
 
10
  {
11
  "epoch": 0.16,
12
  "learning_rate": 0.00019201277955271565,
13
+ "loss": 0.1663,
14
  "step": 100
15
  },
16
  {
17
  "epoch": 0.32,
18
  "learning_rate": 0.00018402555910543132,
19
+ "loss": 0.1962,
20
  "step": 200
21
  },
22
  {
23
  "epoch": 0.48,
24
  "learning_rate": 0.000176038338658147,
25
+ "loss": 0.1853,
26
  "step": 300
27
  },
28
  {
29
  "epoch": 0.64,
30
  "learning_rate": 0.00016805111821086263,
31
+ "loss": 0.1706,
32
  "step": 400
33
  },
34
  {
35
  "epoch": 0.8,
36
  "learning_rate": 0.0001600638977635783,
37
+ "loss": 0.1593,
38
  "step": 500
39
  },
40
  {
41
  "epoch": 0.96,
42
  "learning_rate": 0.00015207667731629394,
43
+ "loss": 0.1702,
44
  "step": 600
45
  },
46
  {
47
  "epoch": 1.0,
48
+ "eval_accuracy": 0.8393782383419689,
49
+ "eval_f1": 0.8380951982999452,
50
+ "eval_loss": 0.39222732186317444,
51
+ "eval_precision": 0.857762154943502,
52
+ "eval_recall": 0.8393782383419689,
53
+ "eval_runtime": 1.5181,
54
+ "eval_samples_per_second": 127.129,
55
+ "eval_steps_per_second": 16.467,
56
  "step": 626
57
  },
58
  {
59
  "epoch": 1.12,
60
  "learning_rate": 0.00014408945686900958,
61
+ "loss": 0.1036,
62
  "step": 700
63
  },
64
  {
65
  "epoch": 1.28,
66
  "learning_rate": 0.00013610223642172525,
67
+ "loss": 0.0941,
68
  "step": 800
69
  },
70
  {
71
  "epoch": 1.44,
72
+ "learning_rate": 0.00012819488817891373,
73
+ "loss": 0.1029,
74
  "step": 900
75
  },
76
  {
77
  "epoch": 1.6,
78
+ "learning_rate": 0.0001202076677316294,
79
+ "loss": 0.095,
80
  "step": 1000
81
  },
82
  {
83
  "epoch": 1.76,
84
+ "learning_rate": 0.00011222044728434504,
85
+ "loss": 0.0911,
86
  "step": 1100
87
  },
88
  {
89
  "epoch": 1.92,
90
+ "learning_rate": 0.00010423322683706072,
91
+ "loss": 0.0647,
92
  "step": 1200
93
  },
94
  {
95
  "epoch": 2.0,
96
+ "eval_accuracy": 0.8238341968911918,
97
+ "eval_f1": 0.8247834676883651,
98
+ "eval_loss": 0.561523973941803,
99
+ "eval_precision": 0.8404391615022521,
100
+ "eval_recall": 0.8238341968911918,
101
+ "eval_runtime": 1.446,
102
+ "eval_samples_per_second": 133.47,
103
+ "eval_steps_per_second": 17.289,
104
  "step": 1252
105
  },
106
  {
107
  "epoch": 2.08,
108
+ "learning_rate": 9.624600638977636e-05,
109
+ "loss": 0.052,
110
  "step": 1300
111
  },
112
  {
113
  "epoch": 2.24,
114
+ "learning_rate": 8.825878594249202e-05,
115
+ "loss": 0.0298,
116
  "step": 1400
117
  },
118
  {
119
  "epoch": 2.4,
120
+ "learning_rate": 8.027156549520767e-05,
121
+ "loss": 0.0243,
122
  "step": 1500
123
  },
124
  {
125
  "epoch": 2.56,
126
+ "learning_rate": 7.228434504792333e-05,
127
+ "loss": 0.0332,
128
  "step": 1600
129
  },
130
  {
131
  "epoch": 2.72,
132
+ "learning_rate": 6.429712460063898e-05,
133
+ "loss": 0.0267,
134
  "step": 1700
135
  },
136
  {
137
  "epoch": 2.88,
138
+ "learning_rate": 5.630990415335463e-05,
139
+ "loss": 0.0111,
140
  "step": 1800
141
  },
142
  {
143
  "epoch": 3.0,
144
  "eval_accuracy": 0.8704663212435233,
145
+ "eval_f1": 0.868408303886561,
146
+ "eval_loss": 0.4315575659275055,
147
+ "eval_precision": 0.8670271155479244,
148
  "eval_recall": 0.8704663212435233,
149
+ "eval_runtime": 1.4834,
150
+ "eval_samples_per_second": 130.104,
151
+ "eval_steps_per_second": 16.853,
152
  "step": 1878
153
  },
154
  {
155
  "epoch": 3.04,
156
+ "learning_rate": 4.832268370607029e-05,
157
+ "loss": 0.0175,
158
  "step": 1900
159
  },
160
  {
161
  "epoch": 3.19,
162
+ "learning_rate": 4.0335463258785946e-05,
163
+ "loss": 0.0083,
164
  "step": 2000
165
  },
166
  {
167
  "epoch": 3.35,
168
+ "learning_rate": 3.23482428115016e-05,
169
+ "loss": 0.0038,
170
  "step": 2100
171
  },
172
  {
173
  "epoch": 3.51,
174
+ "learning_rate": 2.4361022364217255e-05,
175
+ "loss": 0.0009,
176
  "step": 2200
177
  },
178
  {
179
  "epoch": 3.67,
180
+ "learning_rate": 1.6373801916932906e-05,
181
+ "loss": 0.0034,
182
  "step": 2300
183
  },
184
  {
185
  "epoch": 3.83,
186
+ "learning_rate": 8.386581469648563e-06,
187
+ "loss": 0.0025,
188
  "step": 2400
189
  },
190
  {
191
  "epoch": 3.99,
192
+ "learning_rate": 3.9936102236421723e-07,
193
+ "loss": 0.0034,
194
  "step": 2500
195
  },
196
  {
197
  "epoch": 4.0,
198
+ "eval_accuracy": 0.8601036269430051,
199
+ "eval_f1": 0.8616514102008719,
200
+ "eval_loss": 0.4513249099254608,
201
+ "eval_precision": 0.8650015326151586,
202
+ "eval_recall": 0.8601036269430051,
203
+ "eval_runtime": 1.498,
204
+ "eval_samples_per_second": 128.838,
205
+ "eval_steps_per_second": 16.689,
206
  "step": 2504
207
  },
208
  {
209
  "epoch": 4.0,
210
  "step": 2504,
211
  "total_flos": 3.104468219559813e+18,
212
+ "train_loss": 0.0725347773061683,
213
+ "train_runtime": 849.1916,
214
+ "train_samples_per_second": 47.174,
215
+ "train_steps_per_second": 2.949
216
  }
217
  ],
218
  "max_steps": 2504,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dae95784d5a6901f55f2c792e11ade68b7f5871a7f402bd5113f06400a3ea472
3
  size 3899
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f657e798e7f77936234299466c6296e6c9fba3c3d1d364c041c99c8e3780c6a
3
  size 3899