ruanwz committed on
Commit
87393e5
·
verified ·
1 Parent(s): 0768607

Upload folder using huggingface_hub

Browse files
README.md ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ---
3
+ tags:
4
+ - autotrain
5
+ - image-classification
6
+ widget:
7
+ - src: https://huggingface.co/datasets/mishig/sample_images/resolve/main/tiger.jpg
8
+ example_title: Tiger
9
+ - src: https://huggingface.co/datasets/mishig/sample_images/resolve/main/teapot.jpg
10
+ example_title: Teapot
11
+ - src: https://huggingface.co/datasets/mishig/sample_images/resolve/main/palace.jpg
12
+ example_title: Palace
13
+ datasets:
14
+ - autotrain-prj-image-classification-for-slides/autotrain-data
15
+ ---
16
+
17
+ # Model Trained Using AutoTrain
18
+
19
+ - Problem type: Image Classification
20
+
21
+ ## Validation Metrics
22
+ loss: 0.26321205496788025
23
+
24
+ f1: 0.8333333333333334
25
+
26
+ precision: 0.8333333333333334
27
+
28
+ recall: 0.8333333333333334
29
+
30
+ auc: 0.9351851851851851
31
+
32
+ accuracy: 0.9166666666666666
checkpoint-48/config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "google/vit-large-patch32-384",
3
+ "_num_labels": 2,
4
+ "architectures": [
5
+ "ViTForImageClassification"
6
+ ],
7
+ "attention_probs_dropout_prob": 0.0,
8
+ "encoder_stride": 16,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.0,
11
+ "hidden_size": 1024,
12
+ "id2label": {
13
+ "0": "keep",
14
+ "1": "remove"
15
+ },
16
+ "image_size": 384,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 4096,
19
+ "label2id": {
20
+ "keep": 0,
21
+ "remove": 1
22
+ },
23
+ "layer_norm_eps": 1e-12,
24
+ "model_type": "vit",
25
+ "num_attention_heads": 16,
26
+ "num_channels": 3,
27
+ "num_hidden_layers": 24,
28
+ "patch_size": 32,
29
+ "problem_type": "single_label_classification",
30
+ "qkv_bias": true,
31
+ "torch_dtype": "float32",
32
+ "transformers_version": "4.37.0"
33
+ }
checkpoint-48/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c3b60842e17608320309b5392cd38c8c37f9d8afa113d9dd4875a5c7f5fcd33
3
+ size 1222485480
checkpoint-48/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84f053b2ba01710e9285586ec8ec5071ddc3ba9aec10f16d3bc867fead328120
3
+ size 2445205930
checkpoint-48/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1809cdcfb16eae6c01916ed89ce23de5a4f8f09ceb97e0a3361bdc427871070c
3
+ size 14244
checkpoint-48/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:659241ea1929c9e2b8e4e41f29443b14abe8f49515ab83d74a4d728c6427b5e9
3
+ size 1064
checkpoint-48/trainer_state.json ADDED
@@ -0,0 +1,361 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.26321205496788025,
3
+ "best_model_checkpoint": "autotrain-prj-image-classification-for-slides/checkpoint-48",
4
+ "epoch": 4.0,
5
+ "eval_steps": 500,
6
+ "global_step": 48,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.08,
13
+ "learning_rate": 4.166666666666667e-06,
14
+ "loss": 0.8158,
15
+ "step": 1
16
+ },
17
+ {
18
+ "epoch": 0.17,
19
+ "learning_rate": 4.166666666666667e-06,
20
+ "loss": 0.7927,
21
+ "step": 2
22
+ },
23
+ {
24
+ "epoch": 0.25,
25
+ "learning_rate": 8.333333333333334e-06,
26
+ "loss": 0.8798,
27
+ "step": 3
28
+ },
29
+ {
30
+ "epoch": 0.33,
31
+ "learning_rate": 1.25e-05,
32
+ "loss": 0.8946,
33
+ "step": 4
34
+ },
35
+ {
36
+ "epoch": 0.42,
37
+ "learning_rate": 1.6666666666666667e-05,
38
+ "loss": 0.735,
39
+ "step": 5
40
+ },
41
+ {
42
+ "epoch": 0.5,
43
+ "learning_rate": 2.0833333333333336e-05,
44
+ "loss": 0.5985,
45
+ "step": 6
46
+ },
47
+ {
48
+ "epoch": 0.58,
49
+ "learning_rate": 2.5e-05,
50
+ "loss": 0.5549,
51
+ "step": 7
52
+ },
53
+ {
54
+ "epoch": 0.67,
55
+ "learning_rate": 2.916666666666667e-05,
56
+ "loss": 0.3827,
57
+ "step": 8
58
+ },
59
+ {
60
+ "epoch": 0.75,
61
+ "learning_rate": 3.3333333333333335e-05,
62
+ "loss": 0.5742,
63
+ "step": 9
64
+ },
65
+ {
66
+ "epoch": 0.83,
67
+ "learning_rate": 3.7500000000000003e-05,
68
+ "loss": 0.3724,
69
+ "step": 10
70
+ },
71
+ {
72
+ "epoch": 0.92,
73
+ "learning_rate": 4.166666666666667e-05,
74
+ "loss": 0.4903,
75
+ "step": 11
76
+ },
77
+ {
78
+ "epoch": 1.0,
79
+ "learning_rate": 4.5833333333333334e-05,
80
+ "loss": 0.9232,
81
+ "step": 12
82
+ },
83
+ {
84
+ "epoch": 1.0,
85
+ "eval_accuracy": 0.75,
86
+ "eval_auc": 0.6296296296296297,
87
+ "eval_f1": 0.0,
88
+ "eval_loss": 0.5604451298713684,
89
+ "eval_precision": 0.0,
90
+ "eval_recall": 0.0,
91
+ "eval_runtime": 0.9668,
92
+ "eval_samples_per_second": 24.824,
93
+ "eval_steps_per_second": 2.069,
94
+ "step": 12
95
+ },
96
+ {
97
+ "epoch": 1.08,
98
+ "learning_rate": 5e-05,
99
+ "loss": 0.2256,
100
+ "step": 13
101
+ },
102
+ {
103
+ "epoch": 1.17,
104
+ "learning_rate": 4.9537037037037035e-05,
105
+ "loss": 0.238,
106
+ "step": 14
107
+ },
108
+ {
109
+ "epoch": 1.25,
110
+ "learning_rate": 4.9074074074074075e-05,
111
+ "loss": 1.0486,
112
+ "step": 15
113
+ },
114
+ {
115
+ "epoch": 1.33,
116
+ "learning_rate": 4.8611111111111115e-05,
117
+ "loss": 0.2961,
118
+ "step": 16
119
+ },
120
+ {
121
+ "epoch": 1.42,
122
+ "learning_rate": 4.814814814814815e-05,
123
+ "loss": 0.5506,
124
+ "step": 17
125
+ },
126
+ {
127
+ "epoch": 1.5,
128
+ "learning_rate": 4.814814814814815e-05,
129
+ "loss": 0.2733,
130
+ "step": 18
131
+ },
132
+ {
133
+ "epoch": 1.58,
134
+ "learning_rate": 4.768518518518519e-05,
135
+ "loss": 0.2415,
136
+ "step": 19
137
+ },
138
+ {
139
+ "epoch": 1.67,
140
+ "learning_rate": 4.722222222222222e-05,
141
+ "loss": 0.1263,
142
+ "step": 20
143
+ },
144
+ {
145
+ "epoch": 1.75,
146
+ "learning_rate": 4.675925925925926e-05,
147
+ "loss": 0.1261,
148
+ "step": 21
149
+ },
150
+ {
151
+ "epoch": 1.83,
152
+ "learning_rate": 4.62962962962963e-05,
153
+ "loss": 0.2731,
154
+ "step": 22
155
+ },
156
+ {
157
+ "epoch": 1.92,
158
+ "learning_rate": 4.5833333333333334e-05,
159
+ "loss": 0.1118,
160
+ "step": 23
161
+ },
162
+ {
163
+ "epoch": 2.0,
164
+ "learning_rate": 4.5370370370370374e-05,
165
+ "loss": 0.6111,
166
+ "step": 24
167
+ },
168
+ {
169
+ "epoch": 2.0,
170
+ "eval_accuracy": 0.8333333333333334,
171
+ "eval_auc": 0.8333333333333334,
172
+ "eval_f1": 0.6,
173
+ "eval_loss": 0.3809445798397064,
174
+ "eval_precision": 0.75,
175
+ "eval_recall": 0.5,
176
+ "eval_runtime": 1.1816,
177
+ "eval_samples_per_second": 20.311,
178
+ "eval_steps_per_second": 1.693,
179
+ "step": 24
180
+ },
181
+ {
182
+ "epoch": 2.08,
183
+ "learning_rate": 4.490740740740741e-05,
184
+ "loss": 0.293,
185
+ "step": 25
186
+ },
187
+ {
188
+ "epoch": 2.17,
189
+ "learning_rate": 4.4444444444444447e-05,
190
+ "loss": 0.0621,
191
+ "step": 26
192
+ },
193
+ {
194
+ "epoch": 2.25,
195
+ "learning_rate": 4.3981481481481486e-05,
196
+ "loss": 0.0873,
197
+ "step": 27
198
+ },
199
+ {
200
+ "epoch": 2.33,
201
+ "learning_rate": 4.351851851851852e-05,
202
+ "loss": 0.0653,
203
+ "step": 28
204
+ },
205
+ {
206
+ "epoch": 2.42,
207
+ "learning_rate": 4.305555555555556e-05,
208
+ "loss": 0.1292,
209
+ "step": 29
210
+ },
211
+ {
212
+ "epoch": 2.5,
213
+ "learning_rate": 4.259259259259259e-05,
214
+ "loss": 0.1142,
215
+ "step": 30
216
+ },
217
+ {
218
+ "epoch": 2.58,
219
+ "learning_rate": 4.212962962962963e-05,
220
+ "loss": 0.0272,
221
+ "step": 31
222
+ },
223
+ {
224
+ "epoch": 2.67,
225
+ "learning_rate": 4.166666666666667e-05,
226
+ "loss": 0.0551,
227
+ "step": 32
228
+ },
229
+ {
230
+ "epoch": 2.75,
231
+ "learning_rate": 4.1203703703703705e-05,
232
+ "loss": 0.1881,
233
+ "step": 33
234
+ },
235
+ {
236
+ "epoch": 2.83,
237
+ "learning_rate": 4.074074074074074e-05,
238
+ "loss": 0.047,
239
+ "step": 34
240
+ },
241
+ {
242
+ "epoch": 2.92,
243
+ "learning_rate": 4.027777777777778e-05,
244
+ "loss": 0.3178,
245
+ "step": 35
246
+ },
247
+ {
248
+ "epoch": 3.0,
249
+ "learning_rate": 3.981481481481482e-05,
250
+ "loss": 0.4922,
251
+ "step": 36
252
+ },
253
+ {
254
+ "epoch": 3.0,
255
+ "eval_accuracy": 0.875,
256
+ "eval_auc": 0.8148148148148148,
257
+ "eval_f1": 0.6666666666666666,
258
+ "eval_loss": 0.4897962510585785,
259
+ "eval_precision": 1.0,
260
+ "eval_recall": 0.5,
261
+ "eval_runtime": 0.91,
262
+ "eval_samples_per_second": 26.373,
263
+ "eval_steps_per_second": 2.198,
264
+ "step": 36
265
+ },
266
+ {
267
+ "epoch": 3.08,
268
+ "learning_rate": 3.935185185185186e-05,
269
+ "loss": 0.0111,
270
+ "step": 37
271
+ },
272
+ {
273
+ "epoch": 3.17,
274
+ "learning_rate": 3.888888888888889e-05,
275
+ "loss": 0.0638,
276
+ "step": 38
277
+ },
278
+ {
279
+ "epoch": 3.25,
280
+ "learning_rate": 3.8425925925925924e-05,
281
+ "loss": 0.0097,
282
+ "step": 39
283
+ },
284
+ {
285
+ "epoch": 3.33,
286
+ "learning_rate": 3.7962962962962964e-05,
287
+ "loss": 0.0402,
288
+ "step": 40
289
+ },
290
+ {
291
+ "epoch": 3.42,
292
+ "learning_rate": 3.7500000000000003e-05,
293
+ "loss": 0.0386,
294
+ "step": 41
295
+ },
296
+ {
297
+ "epoch": 3.5,
298
+ "learning_rate": 3.7037037037037037e-05,
299
+ "loss": 0.1937,
300
+ "step": 42
301
+ },
302
+ {
303
+ "epoch": 3.58,
304
+ "learning_rate": 3.6574074074074076e-05,
305
+ "loss": 0.5758,
306
+ "step": 43
307
+ },
308
+ {
309
+ "epoch": 3.67,
310
+ "learning_rate": 3.611111111111111e-05,
311
+ "loss": 0.1015,
312
+ "step": 44
313
+ },
314
+ {
315
+ "epoch": 3.75,
316
+ "learning_rate": 3.564814814814815e-05,
317
+ "loss": 0.0208,
318
+ "step": 45
319
+ },
320
+ {
321
+ "epoch": 3.83,
322
+ "learning_rate": 3.518518518518519e-05,
323
+ "loss": 0.0489,
324
+ "step": 46
325
+ },
326
+ {
327
+ "epoch": 3.92,
328
+ "learning_rate": 3.472222222222222e-05,
329
+ "loss": 0.0167,
330
+ "step": 47
331
+ },
332
+ {
333
+ "epoch": 4.0,
334
+ "learning_rate": 3.425925925925926e-05,
335
+ "loss": 0.0876,
336
+ "step": 48
337
+ },
338
+ {
339
+ "epoch": 4.0,
340
+ "eval_accuracy": 0.9166666666666666,
341
+ "eval_auc": 0.9351851851851851,
342
+ "eval_f1": 0.8333333333333334,
343
+ "eval_loss": 0.26321205496788025,
344
+ "eval_precision": 0.8333333333333334,
345
+ "eval_recall": 0.8333333333333334,
346
+ "eval_runtime": 0.8986,
347
+ "eval_samples_per_second": 26.708,
348
+ "eval_steps_per_second": 2.226,
349
+ "step": 48
350
+ }
351
+ ],
352
+ "logging_steps": 1,
353
+ "max_steps": 120,
354
+ "num_input_tokens_seen": 0,
355
+ "num_train_epochs": 10,
356
+ "save_steps": 500,
357
+ "total_flos": 3.1148228745363456e+17,
358
+ "train_batch_size": 8,
359
+ "trial_name": null,
360
+ "trial_params": null
361
+ }
checkpoint-48/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d203f70c7b9b0f68fb3aa9f53da11c0446da8cd795bd0cc70900a4e2aa046a77
3
+ size 4728
config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "google/vit-large-patch32-384",
3
+ "_num_labels": 2,
4
+ "architectures": [
5
+ "ViTForImageClassification"
6
+ ],
7
+ "attention_probs_dropout_prob": 0.0,
8
+ "encoder_stride": 16,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.0,
11
+ "hidden_size": 1024,
12
+ "id2label": {
13
+ "0": "keep",
14
+ "1": "remove"
15
+ },
16
+ "image_size": 384,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 4096,
19
+ "label2id": {
20
+ "keep": 0,
21
+ "remove": 1
22
+ },
23
+ "layer_norm_eps": 1e-12,
24
+ "model_type": "vit",
25
+ "num_attention_heads": 16,
26
+ "num_channels": 3,
27
+ "num_hidden_layers": 24,
28
+ "patch_size": 32,
29
+ "problem_type": "single_label_classification",
30
+ "qkv_bias": true,
31
+ "torch_dtype": "float32",
32
+ "transformers_version": "4.37.0"
33
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c3b60842e17608320309b5392cd38c8c37f9d8afa113d9dd4875a5c7f5fcd33
3
+ size 1222485480
preprocessor_config.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "do_rescale": true,
4
+ "do_resize": true,
5
+ "image_mean": [
6
+ 0.5,
7
+ 0.5,
8
+ 0.5
9
+ ],
10
+ "image_processor_type": "ViTImageProcessor",
11
+ "image_std": [
12
+ 0.5,
13
+ 0.5,
14
+ 0.5
15
+ ],
16
+ "resample": 2,
17
+ "rescale_factor": 0.00392156862745098,
18
+ "size": {
19
+ "height": 384,
20
+ "width": 384
21
+ }
22
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d203f70c7b9b0f68fb3aa9f53da11c0446da8cd795bd0cc70900a4e2aa046a77
3
+ size 4728
training_params.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "data_path": "autotrain-prj-image-classification-for-slides/autotrain-data",
3
+ "model": "google/vit-large-patch32-384",
4
+ "username": "ruanwz",
5
+ "lr": 5e-05,
6
+ "epochs": 10,
7
+ "batch_size": 8,
8
+ "warmup_ratio": 0.1,
9
+ "gradient_accumulation": 1,
10
+ "optimizer": "adamw_torch",
11
+ "scheduler": "linear",
12
+ "weight_decay": 0.0,
13
+ "max_grad_norm": 1.0,
14
+ "seed": 42,
15
+ "train_split": "train",
16
+ "valid_split": "validation",
17
+ "logging_steps": -1,
18
+ "project_name": "autotrain-prj-image-classification-for-slides",
19
+ "auto_find_batch_size": false,
20
+ "mixed_precision": "fp16",
21
+ "save_total_limit": 1,
22
+ "save_strategy": "epoch",
23
+ "push_to_hub": true,
24
+ "repo_id": "ruanwz/autotrain-prj-image-classification-for-slides",
25
+ "evaluation_strategy": "epoch",
26
+ "image_column": "autotrain_image",
27
+ "target_column": "autotrain_label",
28
+ "log": "none"
29
+ }