djbp committed on
Commit
611a9b2
·
verified ·
1 Parent(s): 931d63d

End of training

Browse files
README.md CHANGED
@@ -23,7 +23,7 @@ model-index:
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
- value: 0.8705334023821854
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -33,9 +33,9 @@ should probably proofread and complete it, then remove this comment. -->
33
 
34
  This model is a fine-tuned version of [microsoft/swin-base-patch4-window7-224-in22k](https://huggingface.co/microsoft/swin-base-patch4-window7-224-in22k) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
- - Loss: 0.3173
37
- - Accuracy: 0.8705
38
- - Auc: 0.9550
39
 
40
  ## Model description
41
 
 
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
+ value: 0.8720870015535992
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
33
 
34
  This model is a fine-tuned version of [microsoft/swin-base-patch4-window7-224-in22k](https://huggingface.co/microsoft/swin-base-patch4-window7-224-in22k) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
+ - Loss: 0.3245
37
+ - Accuracy: 0.8721
38
+ - Auc: 0.9534
39
 
40
  ## Model description
41
 
all_results.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "epoch": 6.885245901639344,
3
- "eval_accuracy": 0.8824443293630243,
4
- "eval_auc": 0.957557852599524,
5
- "eval_loss": 0.30561181902885437,
6
- "eval_runtime": 203.3286,
7
- "eval_samples_per_second": 9.497,
8
  "eval_steps_per_second": 0.079,
9
  "total_flos": 4.1785312376666235e+18,
10
- "train_loss": 0.38780884515671504,
11
- "train_runtime": 6680.4521,
12
- "train_samples_per_second": 8.107,
13
- "train_steps_per_second": 0.016
14
  }
 
1
  {
2
  "epoch": 6.885245901639344,
3
+ "eval_accuracy": 0.8720870015535992,
4
+ "eval_auc": 0.9534343762433686,
5
+ "eval_loss": 0.3244781792163849,
6
+ "eval_runtime": 202.4915,
7
+ "eval_samples_per_second": 9.536,
8
  "eval_steps_per_second": 0.079,
9
  "total_flos": 4.1785312376666235e+18,
10
+ "train_loss": 0.3947783969697498,
11
+ "train_runtime": 11418.3292,
12
+ "train_samples_per_second": 4.743,
13
+ "train_steps_per_second": 0.009
14
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 6.885245901639344,
3
- "eval_accuracy": 0.8824443293630243,
4
- "eval_auc": 0.957557852599524,
5
- "eval_loss": 0.30561181902885437,
6
- "eval_runtime": 203.3286,
7
- "eval_samples_per_second": 9.497,
8
  "eval_steps_per_second": 0.079
9
  }
 
1
  {
2
  "epoch": 6.885245901639344,
3
+ "eval_accuracy": 0.8720870015535992,
4
+ "eval_auc": 0.9534343762433686,
5
+ "eval_loss": 0.3244781792163849,
6
+ "eval_runtime": 202.4915,
7
+ "eval_samples_per_second": 9.536,
8
  "eval_steps_per_second": 0.079
9
  }
runs/Aug30_06-47-56_data-science-wbi/events.out.tfevents.1725012113.data-science-wbi ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddb579b7d0e441055662d315ee540d1acd11d18b5a632a7e14b0abd344fc41f2
3
+ size 87
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 6.885245901639344,
3
  "total_flos": 4.1785312376666235e+18,
4
- "train_loss": 0.38780884515671504,
5
- "train_runtime": 6680.4521,
6
- "train_samples_per_second": 8.107,
7
- "train_steps_per_second": 0.016
8
  }
 
1
  {
2
  "epoch": 6.885245901639344,
3
  "total_flos": 4.1785312376666235e+18,
4
+ "train_loss": 0.3947783969697498,
5
+ "train_runtime": 11418.3292,
6
+ "train_samples_per_second": 4.743,
7
+ "train_steps_per_second": 0.009
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.8824443293630243,
3
- "best_model_checkpoint": "swin-base-patch4-window7-224-in22k-MM_Classification_base_V10/checkpoint-105",
4
  "epoch": 6.885245901639344,
5
  "eval_steps": 500,
6
  "global_step": 105,
@@ -10,141 +10,211 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.6557377049180327,
13
- "grad_norm": 5.335843086242676,
14
  "learning_rate": 4.545454545454546e-05,
15
- "loss": 0.8134,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.9836065573770492,
20
- "eval_accuracy": 0.8430864836872087,
21
- "eval_auc": 0.9250639596370771,
22
- "eval_loss": 0.419461190700531,
23
- "eval_runtime": 205.2459,
24
- "eval_samples_per_second": 9.408,
 
 
 
 
 
 
 
 
 
 
25
  "eval_steps_per_second": 0.078,
26
  "step": 15
27
  },
28
  {
29
  "epoch": 1.3114754098360657,
30
- "grad_norm": 2.8889973163604736,
31
  "learning_rate": 4.5212765957446815e-05,
32
- "loss": 0.5101,
33
  "step": 20
34
  },
35
  {
36
  "epoch": 1.9672131147540983,
37
- "grad_norm": 1.6868778467178345,
38
  "learning_rate": 3.9893617021276594e-05,
39
- "loss": 0.3996,
40
  "step": 30
41
  },
42
  {
43
  "epoch": 1.9672131147540983,
44
- "eval_accuracy": 0.8570688762299327,
45
- "eval_auc": 0.9437553079992403,
46
- "eval_loss": 0.3682312071323395,
47
- "eval_runtime": 204.3267,
48
- "eval_samples_per_second": 9.451,
 
 
 
 
 
 
 
 
 
 
49
  "eval_steps_per_second": 0.078,
50
  "step": 30
51
  },
52
  {
53
  "epoch": 2.6229508196721314,
54
- "grad_norm": 1.9163786172866821,
55
  "learning_rate": 3.4574468085106386e-05,
56
- "loss": 0.3693,
57
  "step": 40
58
  },
59
  {
60
  "epoch": 2.9508196721311473,
61
- "eval_accuracy": 0.877783531848783,
62
- "eval_auc": 0.9529726135197429,
63
- "eval_loss": 0.324381947517395,
64
- "eval_runtime": 203.8679,
65
- "eval_samples_per_second": 9.472,
66
- "eval_steps_per_second": 0.078,
 
 
 
 
 
 
 
 
 
 
67
  "step": 45
68
  },
69
  {
70
  "epoch": 3.278688524590164,
71
- "grad_norm": 2.268683433532715,
72
  "learning_rate": 2.925531914893617e-05,
73
- "loss": 0.3326,
74
  "step": 50
75
  },
76
  {
77
  "epoch": 3.9344262295081966,
78
- "grad_norm": 2.837725877761841,
79
  "learning_rate": 2.393617021276596e-05,
80
- "loss": 0.3147,
81
  "step": 60
82
  },
83
  {
84
  "epoch": 4.0,
85
- "eval_accuracy": 0.8793371310201968,
86
- "eval_auc": 0.9557452970649672,
87
- "eval_loss": 0.31093424558639526,
88
- "eval_runtime": 204.9066,
89
- "eval_samples_per_second": 9.424,
 
 
 
 
 
 
 
 
 
 
90
  "eval_steps_per_second": 0.078,
91
  "step": 61
92
  },
93
  {
94
  "epoch": 4.590163934426229,
95
- "grad_norm": 1.7413060665130615,
96
  "learning_rate": 1.8617021276595745e-05,
97
- "loss": 0.3166,
98
  "step": 70
99
  },
100
  {
101
  "epoch": 4.983606557377049,
102
- "eval_accuracy": 0.8803728638011393,
103
- "eval_auc": 0.9561359266346766,
104
- "eval_loss": 0.3134761154651642,
105
- "eval_runtime": 204.4948,
106
- "eval_samples_per_second": 9.443,
107
- "eval_steps_per_second": 0.078,
 
 
 
 
 
 
 
 
 
 
108
  "step": 76
109
  },
110
  {
111
  "epoch": 5.245901639344262,
112
- "grad_norm": 1.7945168018341064,
113
  "learning_rate": 1.3297872340425532e-05,
114
- "loss": 0.2921,
115
  "step": 80
116
  },
117
  {
118
  "epoch": 5.901639344262295,
119
- "grad_norm": 1.865674376487732,
120
  "learning_rate": 7.97872340425532e-06,
121
- "loss": 0.2918,
122
  "step": 90
123
  },
124
  {
125
  "epoch": 5.967213114754099,
126
- "eval_accuracy": 0.8746763335059554,
127
- "eval_auc": 0.9568584001596542,
128
- "eval_loss": 0.3116800785064697,
129
- "eval_runtime": 205.4646,
130
- "eval_samples_per_second": 9.398,
 
 
 
 
 
 
 
 
 
 
131
  "eval_steps_per_second": 0.078,
132
  "step": 91
133
  },
134
  {
135
  "epoch": 6.557377049180328,
136
- "grad_norm": 4.410208225250244,
137
  "learning_rate": 2.6595744680851065e-06,
138
- "loss": 0.2849,
139
  "step": 100
140
  },
141
  {
142
  "epoch": 6.885245901639344,
143
- "eval_accuracy": 0.8824443293630243,
144
- "eval_auc": 0.957557852599524,
145
- "eval_loss": 0.30561181902885437,
146
- "eval_runtime": 203.0816,
147
- "eval_samples_per_second": 9.508,
 
 
 
 
 
 
 
 
 
 
148
  "eval_steps_per_second": 0.079,
149
  "step": 105
150
  },
@@ -152,10 +222,10 @@
152
  "epoch": 6.885245901639344,
153
  "step": 105,
154
  "total_flos": 4.1785312376666235e+18,
155
- "train_loss": 0.38780884515671504,
156
- "train_runtime": 6680.4521,
157
- "train_samples_per_second": 8.107,
158
- "train_steps_per_second": 0.016
159
  }
160
  ],
161
  "logging_steps": 10,
 
1
  {
2
+ "best_metric": 0.8720870015535992,
3
+ "best_model_checkpoint": "swin-base-patch4-window7-224-in22k-MM_Classification_base_V10/checkpoint-61",
4
  "epoch": 6.885245901639344,
5
  "eval_steps": 500,
6
  "global_step": 105,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.6557377049180327,
13
+ "grad_norm": 3.5814733505249023,
14
  "learning_rate": 4.545454545454546e-05,
15
+ "loss": 0.8498,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.9836065573770492,
20
+ "step": 15,
21
+ "train_accuracy": 0.8171125759338245,
22
+ "train_auc": 0.8967571163903928,
23
+ "train_loss": 0.47165462374687195,
24
+ "train_runtime": 694.4657,
25
+ "train_samples_per_second": 11.141,
26
+ "train_steps_per_second": 0.088
27
+ },
28
+ {
29
+ "epoch": 0.9836065573770492,
30
+ "eval_accuracy": 0.8327291558777835,
31
+ "eval_auc": 0.9183935491091096,
32
+ "eval_loss": 0.4327956438064575,
33
+ "eval_runtime": 205.3728,
34
+ "eval_samples_per_second": 9.402,
35
  "eval_steps_per_second": 0.078,
36
  "step": 15
37
  },
38
  {
39
  "epoch": 1.3114754098360657,
40
+ "grad_norm": 2.3799431324005127,
41
  "learning_rate": 4.5212765957446815e-05,
42
+ "loss": 0.5123,
43
  "step": 20
44
  },
45
  {
46
  "epoch": 1.9672131147540983,
47
+ "grad_norm": 2.067809581756592,
48
  "learning_rate": 3.9893617021276594e-05,
49
+ "loss": 0.4085,
50
  "step": 30
51
  },
52
  {
53
  "epoch": 1.9672131147540983,
54
+ "step": 30,
55
+ "train_accuracy": 0.8517513248028952,
56
+ "train_auc": 0.9387841345112529,
57
+ "train_loss": 0.36320993304252625,
58
+ "train_runtime": 684.0745,
59
+ "train_samples_per_second": 11.31,
60
+ "train_steps_per_second": 0.089
61
+ },
62
+ {
63
+ "epoch": 1.9672131147540983,
64
+ "eval_accuracy": 0.8518902123252201,
65
+ "eval_auc": 0.9423845489697825,
66
+ "eval_loss": 0.37112149596214294,
67
+ "eval_runtime": 205.1458,
68
+ "eval_samples_per_second": 9.413,
69
  "eval_steps_per_second": 0.078,
70
  "step": 30
71
  },
72
  {
73
  "epoch": 2.6229508196721314,
74
+ "grad_norm": 2.11800479888916,
75
  "learning_rate": 3.4574468085106386e-05,
76
+ "loss": 0.3717,
77
  "step": 40
78
  },
79
  {
80
  "epoch": 2.9508196721311473,
81
+ "step": 45,
82
+ "train_accuracy": 0.864029985782603,
83
+ "train_auc": 0.9527023779434378,
84
+ "train_loss": 0.3227292597293854,
85
+ "train_runtime": 681.4027,
86
+ "train_samples_per_second": 11.355,
87
+ "train_steps_per_second": 0.09
88
+ },
89
+ {
90
+ "epoch": 2.9508196721311473,
91
+ "eval_accuracy": 0.8653547384774728,
92
+ "eval_auc": 0.9487342167219569,
93
+ "eval_loss": 0.3345213234424591,
94
+ "eval_runtime": 203.71,
95
+ "eval_samples_per_second": 9.479,
96
+ "eval_steps_per_second": 0.079,
97
  "step": 45
98
  },
99
  {
100
  "epoch": 3.278688524590164,
101
+ "grad_norm": 4.481107711791992,
102
  "learning_rate": 2.925531914893617e-05,
103
+ "loss": 0.3301,
104
  "step": 50
105
  },
106
  {
107
  "epoch": 3.9344262295081966,
108
+ "grad_norm": 2.703953981399536,
109
  "learning_rate": 2.393617021276596e-05,
110
+ "loss": 0.3196,
111
  "step": 60
112
  },
113
  {
114
  "epoch": 4.0,
115
+ "step": 61,
116
+ "train_accuracy": 0.8733359183145922,
117
+ "train_auc": 0.9563002964315263,
118
+ "train_loss": 0.30748647451400757,
119
+ "train_runtime": 678.9663,
120
+ "train_samples_per_second": 11.395,
121
+ "train_steps_per_second": 0.09
122
+ },
123
+ {
124
+ "epoch": 4.0,
125
+ "eval_accuracy": 0.8720870015535992,
126
+ "eval_auc": 0.9534343762433686,
127
+ "eval_loss": 0.3244781792163849,
128
+ "eval_runtime": 204.3133,
129
+ "eval_samples_per_second": 9.451,
130
  "eval_steps_per_second": 0.078,
131
  "step": 61
132
  },
133
  {
134
  "epoch": 4.590163934426229,
135
+ "grad_norm": 1.967414379119873,
136
  "learning_rate": 1.8617021276595745e-05,
137
+ "loss": 0.3279,
138
  "step": 70
139
  },
140
  {
141
  "epoch": 4.983606557377049,
142
+ "step": 76,
143
+ "train_accuracy": 0.8813493602171384,
144
+ "train_auc": 0.9603495718478623,
145
+ "train_loss": 0.2974039912223816,
146
+ "train_runtime": 680.7385,
147
+ "train_samples_per_second": 11.366,
148
+ "train_steps_per_second": 0.09
149
+ },
150
+ {
151
+ "epoch": 4.983606557377049,
152
+ "eval_accuracy": 0.8694976696012429,
153
+ "eval_auc": 0.953884522107936,
154
+ "eval_loss": 0.3240814805030823,
155
+ "eval_runtime": 203.7726,
156
+ "eval_samples_per_second": 9.476,
157
+ "eval_steps_per_second": 0.079,
158
  "step": 76
159
  },
160
  {
161
  "epoch": 5.245901639344262,
162
+ "grad_norm": 1.8759346008300781,
163
  "learning_rate": 1.3297872340425532e-05,
164
+ "loss": 0.3042,
165
  "step": 80
166
  },
167
  {
168
  "epoch": 5.901639344262295,
169
+ "grad_norm": 2.394904136657715,
170
  "learning_rate": 7.97872340425532e-06,
171
+ "loss": 0.2926,
172
  "step": 90
173
  },
174
  {
175
  "epoch": 5.967213114754099,
176
+ "step": 91,
177
+ "train_accuracy": 0.8858730774201887,
178
+ "train_auc": 0.9646418504220758,
179
+ "train_loss": 0.28083333373069763,
180
+ "train_runtime": 681.28,
181
+ "train_samples_per_second": 11.357,
182
+ "train_steps_per_second": 0.09
183
+ },
184
+ {
185
+ "epoch": 5.967213114754099,
186
+ "eval_accuracy": 0.8674262040393579,
187
+ "eval_auc": 0.9548863198183253,
188
+ "eval_loss": 0.3211652338504791,
189
+ "eval_runtime": 205.0822,
190
+ "eval_samples_per_second": 9.416,
191
  "eval_steps_per_second": 0.078,
192
  "step": 91
193
  },
194
  {
195
  "epoch": 6.557377049180328,
196
+ "grad_norm": 1.7362953424453735,
197
  "learning_rate": 2.6595744680851065e-06,
198
+ "loss": 0.2821,
199
  "step": 100
200
  },
201
  {
202
  "epoch": 6.885245901639344,
203
+ "step": 105,
204
+ "train_accuracy": 0.8937572702597906,
205
+ "train_auc": 0.9682688664846578,
206
+ "train_loss": 0.26618629693984985,
207
+ "train_runtime": 676.8276,
208
+ "train_samples_per_second": 11.431,
209
+ "train_steps_per_second": 0.09
210
+ },
211
+ {
212
+ "epoch": 6.885245901639344,
213
+ "eval_accuracy": 0.8705334023821854,
214
+ "eval_auc": 0.9549996078144867,
215
+ "eval_loss": 0.31725937128067017,
216
+ "eval_runtime": 203.7289,
217
+ "eval_samples_per_second": 9.478,
218
  "eval_steps_per_second": 0.079,
219
  "step": 105
220
  },
 
222
  "epoch": 6.885245901639344,
223
  "step": 105,
224
  "total_flos": 4.1785312376666235e+18,
225
+ "train_loss": 0.3947783969697498,
226
+ "train_runtime": 11418.3292,
227
+ "train_samples_per_second": 4.743,
228
+ "train_steps_per_second": 0.009
229
  }
230
  ],
231
  "logging_steps": 10,