paul committed on
Commit
d4f634b
1 Parent(s): aeb8f3b

Training in progress, epoch 0

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,124 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "microsoft/cvt-13-384-22k",
3
+ "architectures": [
4
+ "CvtForImageClassification"
5
+ ],
6
+ "attention_drop_rate": [
7
+ 0.0,
8
+ 0.0,
9
+ 0.0
10
+ ],
11
+ "cls_token": [
12
+ false,
13
+ false,
14
+ true
15
+ ],
16
+ "depth": [
17
+ 1,
18
+ 2,
19
+ 10
20
+ ],
21
+ "drop_path_rate": [
22
+ 0.0,
23
+ 0.0,
24
+ 0.1
25
+ ],
26
+ "drop_rate": [
27
+ 0.0,
28
+ 0.0,
29
+ 0.0
30
+ ],
31
+ "embed_dim": [
32
+ 64,
33
+ 192,
34
+ 384
35
+ ],
36
+ "id2label": {
37
+ "0": "Bollywood memes",
38
+ "1": "Industrialist",
39
+ "2": "Political memes",
40
+ "3": "Singer memes",
41
+ "4": "Sports memes"
42
+ },
43
+ "image_size": 384,
44
+ "initializer_range": 0.02,
45
+ "kernel_qkv": [
46
+ 3,
47
+ 3,
48
+ 3
49
+ ],
50
+ "label2id": {
51
+ "Bollywood memes": "0",
52
+ "Industrialist": "1",
53
+ "Political memes": "2",
54
+ "Singer memes": "3",
55
+ "Sports memes": "4"
56
+ },
57
+ "layer_norm_eps": 1e-12,
58
+ "mlp_ratio": [
59
+ 4.0,
60
+ 4.0,
61
+ 4.0
62
+ ],
63
+ "model_type": "cvt",
64
+ "num_channels": 3,
65
+ "num_heads": [
66
+ 1,
67
+ 3,
68
+ 6
69
+ ],
70
+ "num_stages": 3,
71
+ "padding_kv": [
72
+ 1,
73
+ 1,
74
+ 1
75
+ ],
76
+ "padding_q": [
77
+ 1,
78
+ 1,
79
+ 1
80
+ ],
81
+ "patch_padding": [
82
+ 2,
83
+ 1,
84
+ 1
85
+ ],
86
+ "patch_sizes": [
87
+ 7,
88
+ 3,
89
+ 3
90
+ ],
91
+ "patch_stride": [
92
+ 4,
93
+ 2,
94
+ 2
95
+ ],
96
+ "pos_embed": [
97
+ false,
98
+ false,
99
+ false
100
+ ],
101
+ "problem_type": "single_label_classification",
102
+ "qkv_bias": [
103
+ true,
104
+ true,
105
+ true
106
+ ],
107
+ "qkv_projection_method": [
108
+ "dw_bn",
109
+ "dw_bn",
110
+ "dw_bn"
111
+ ],
112
+ "stride_kv": [
113
+ 2,
114
+ 2,
115
+ 2
116
+ ],
117
+ "stride_q": [
118
+ 1,
119
+ 1,
120
+ 1
121
+ ],
122
+ "torch_dtype": "float32",
123
+ "transformers_version": "4.24.0.dev0"
124
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_pct": 0.875,
3
+ "do_normalize": true,
4
+ "do_resize": true,
5
+ "feature_extractor_type": "ConvNextFeatureExtractor",
6
+ "image_mean": [
7
+ 0.485,
8
+ 0.456,
9
+ 0.406
10
+ ],
11
+ "image_std": [
12
+ 0.229,
13
+ 0.224,
14
+ 0.225
15
+ ],
16
+ "resample": 3,
17
+ "size": 224
18
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88a10859272fab31a8e07b7304da986c70c83d4150619b71497fb43ce2d06213
3
+ size 78734635
runs/Oct21_23-36-54_teesta/1666375635.7998886/events.out.tfevents.1666375635.teesta.547.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f96631bf0243e0d6138b2f0bf59ef7369dc6e117a3dc89b69bcd4b9c12dca56
3
+ size 5520
runs/Oct21_23-36-54_teesta/events.out.tfevents.1666375635.teesta.547.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4dcc89e8c82523f0eb81804cedd59da28fa57ed64720d7bc84922d7b6b86f584
3
+ size 5415
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16f80140675a7f02de656de130ef75a7922ba0e51b2945362d6d0e2d9159fa3e
3
+ size 3439