Upload CustomViltForVQA
Browse files- config.json +216 -216
- model.safetensors +1 -1
config.json
CHANGED
@@ -8,227 +8,227 @@
|
|
8 |
"hidden_dropout_prob": 0.0,
|
9 |
"hidden_size": 768,
|
10 |
"id2label": {
|
11 |
-
"0": "
|
12 |
-
"1": "
|
13 |
-
"2": "
|
14 |
-
"3": "
|
15 |
-
"4": "
|
16 |
-
"5": "
|
17 |
-
"6": "
|
18 |
-
"7": "
|
19 |
-
"8": "
|
20 |
-
"9": "
|
21 |
-
"10": "
|
22 |
-
"11": "
|
23 |
-
"12": "
|
24 |
-
"13": "
|
25 |
-
"14": "
|
26 |
-
"15": "
|
27 |
-
"16": "
|
28 |
-
"17": "
|
29 |
-
"18": "
|
30 |
-
"19": "
|
31 |
-
"20": "
|
32 |
-
"21": "
|
33 |
-
"22": "
|
34 |
-
"23": "
|
35 |
-
"24": "
|
36 |
-
"25": "
|
37 |
-
"26": "
|
38 |
-
"27": "
|
39 |
-
"28": "
|
40 |
-
"29": "
|
41 |
-
"30": "
|
42 |
-
"31": "
|
43 |
-
"32": "
|
44 |
-
"33": "
|
45 |
-
"34": "
|
46 |
-
"35": "
|
47 |
-
"36": "
|
48 |
-
"37": "
|
49 |
-
"38": "
|
50 |
-
"39": "
|
51 |
-
"40": "
|
52 |
-
"41": "
|
53 |
-
"42": "
|
54 |
-
"43": "
|
55 |
-
"44": "
|
56 |
-
"45": "
|
57 |
-
"46": "
|
58 |
-
"47": "
|
59 |
-
"48": "
|
60 |
-
"49": "
|
61 |
-
"50": "
|
62 |
-
"51": "
|
63 |
-
"52": "
|
64 |
-
"53": "
|
65 |
-
"54": "
|
66 |
-
"55": "
|
67 |
-
"56": "
|
68 |
-
"57": "
|
69 |
-
"58": "
|
70 |
-
"59": "
|
71 |
-
"60": "
|
72 |
-
"61": "
|
73 |
-
"62": "
|
74 |
-
"63": "
|
75 |
-
"64": "
|
76 |
-
"65": "
|
77 |
-
"66": "
|
78 |
-
"67": "
|
79 |
-
"68": "
|
80 |
-
"69": "
|
81 |
-
"70": "
|
82 |
-
"71": "
|
83 |
-
"72": "
|
84 |
-
"73": "
|
85 |
-
"74": "
|
86 |
-
"75": "
|
87 |
-
"76": "
|
88 |
-
"77": "
|
89 |
-
"78": "
|
90 |
-
"79": "
|
91 |
-
"80": "
|
92 |
-
"81": "
|
93 |
-
"82": "
|
94 |
-
"83": "
|
95 |
-
"84": "
|
96 |
-
"85": "
|
97 |
-
"86": "
|
98 |
-
"87": "
|
99 |
-
"88": "
|
100 |
-
"89": "
|
101 |
-
"90": "
|
102 |
-
"91": "
|
103 |
-
"92": "
|
104 |
-
"93": "
|
105 |
-
"94": "
|
106 |
-
"95": "
|
107 |
-
"96": "
|
108 |
-
"97": "
|
109 |
-
"98": "
|
110 |
-
"99": "
|
111 |
-
"100": "
|
112 |
-
"101": "
|
113 |
-
"102": "
|
114 |
-
"103": "
|
115 |
-
"104": "
|
116 |
-
"105": "
|
117 |
-
"106": "
|
118 |
-
"107": "
|
119 |
},
|
120 |
"image_size": 384,
|
121 |
"initializer_range": 0.02,
|
122 |
"intermediate_size": 3072,
|
123 |
"label2id": {
|
124 |
-
"0":
|
125 |
-
"1":
|
126 |
-
"2":
|
127 |
-
"3":
|
128 |
-
"4":
|
129 |
-
"5":
|
130 |
-
"6":
|
131 |
-
"7":
|
132 |
-
"8":
|
133 |
-
"9":
|
134 |
-
"Above":
|
135 |
-
"Behind":
|
136 |
-
"Below":
|
137 |
-
"Black":
|
138 |
-
"Blue":
|
139 |
-
"Brown":
|
140 |
-
"Front":
|
141 |
-
"Green":
|
142 |
-
"Grey":
|
143 |
-
"Left":
|
144 |
-
"No":
|
145 |
-
"Orange":
|
146 |
-
"Pink":
|
147 |
-
"Purple":
|
148 |
-
"Red":
|
149 |
-
"Right":
|
150 |
-
"White":
|
151 |
-
"Yellow":
|
152 |
-
"Yes":
|
153 |
-
"above":
|
154 |
-
"airplane":
|
155 |
-
"apple":
|
156 |
-
"banana":
|
157 |
-
"baseball bat":
|
158 |
-
"baseball glove":
|
159 |
-
"bear":
|
160 |
-
"bed":
|
161 |
-
"bench":
|
162 |
-
"bicycle":
|
163 |
-
"bird":
|
164 |
-
"boat":
|
165 |
-
"book":
|
166 |
-
"bottle":
|
167 |
-
"bowl":
|
168 |
-
"broccoli":
|
169 |
-
"bus":
|
170 |
-
"cake":
|
171 |
-
"car":
|
172 |
-
"carrot":
|
173 |
-
"cat":
|
174 |
-
"cell phone":
|
175 |
-
"chair":
|
176 |
-
"clock":
|
177 |
-
"couch":
|
178 |
-
"cow":
|
179 |
-
"cup":
|
180 |
-
"dining table":
|
181 |
-
"dog":
|
182 |
-
"donut":
|
183 |
-
"elephant":
|
184 |
-
"fire hydrant":
|
185 |
-
"fork":
|
186 |
-
"frisbee":
|
187 |
-
"giraffe":
|
188 |
-
"handbag":
|
189 |
-
"horse":
|
190 |
-
"hot dog":
|
191 |
-
"keyboard":
|
192 |
-
"kite":
|
193 |
-
"knife":
|
194 |
-
"laptop":
|
195 |
-
"left":
|
196 |
-
"motorcycle":
|
197 |
-
"mouse":
|
198 |
-
"orange":
|
199 |
-
"oven":
|
200 |
-
"parking meter":
|
201 |
-
"person":
|
202 |
-
"pizza":
|
203 |
-
"potted plant":
|
204 |
-
"refrigerator":
|
205 |
-
"remote":
|
206 |
-
"right":
|
207 |
-
"sandwich":
|
208 |
-
"scissors":
|
209 |
-
"sheep":
|
210 |
-
"sink":
|
211 |
-
"skateboard":
|
212 |
-
"skis":
|
213 |
-
"snowboard":
|
214 |
-
"spoon":
|
215 |
-
"sports ball":
|
216 |
-
"stop sign":
|
217 |
-
"suitcase":
|
218 |
-
"surfboard":
|
219 |
-
"teddy bear":
|
220 |
-
"tennis racket":
|
221 |
-
"tie":
|
222 |
-
"toilet":
|
223 |
-
"toothbrush":
|
224 |
-
"traffic light":
|
225 |
-
"train":
|
226 |
-
"truck":
|
227 |
-
"tv":
|
228 |
-
"umbrella":
|
229 |
-
"vase":
|
230 |
-
"wine glass":
|
231 |
-
"zebra":
|
232 |
},
|
233 |
"layer_norm_eps": 1e-12,
|
234 |
"max_image_length": -1,
|
|
|
8 |
"hidden_dropout_prob": 0.0,
|
9 |
"hidden_size": 768,
|
10 |
"id2label": {
|
11 |
+
"0": "5",
|
12 |
+
"1": "zebra",
|
13 |
+
"2": "couch",
|
14 |
+
"3": "sink",
|
15 |
+
"4": "apple",
|
16 |
+
"5": "umbrella",
|
17 |
+
"6": "bus",
|
18 |
+
"7": "dog",
|
19 |
+
"8": "boat",
|
20 |
+
"9": "Grey",
|
21 |
+
"10": "suitcase",
|
22 |
+
"11": "2",
|
23 |
+
"12": "bottle",
|
24 |
+
"13": "spoon",
|
25 |
+
"14": "3",
|
26 |
+
"15": "toilet",
|
27 |
+
"16": "8",
|
28 |
+
"17": "7",
|
29 |
+
"18": "knife",
|
30 |
+
"19": "Pink",
|
31 |
+
"20": "skis",
|
32 |
+
"21": "4",
|
33 |
+
"22": "toothbrush",
|
34 |
+
"23": "surfboard",
|
35 |
+
"24": "Behind",
|
36 |
+
"25": "person",
|
37 |
+
"26": "orange",
|
38 |
+
"27": "chair",
|
39 |
+
"28": "handbag",
|
40 |
+
"29": "cow",
|
41 |
+
"30": "1",
|
42 |
+
"31": "fire hydrant",
|
43 |
+
"32": "oven",
|
44 |
+
"33": "tennis racket",
|
45 |
+
"34": "Yellow",
|
46 |
+
"35": "remote",
|
47 |
+
"36": "9",
|
48 |
+
"37": "No",
|
49 |
+
"38": "0",
|
50 |
+
"39": "carrot",
|
51 |
+
"40": "Above",
|
52 |
+
"41": "sports ball",
|
53 |
+
"42": "Purple",
|
54 |
+
"43": "snowboard",
|
55 |
+
"44": "parking meter",
|
56 |
+
"45": "mouse",
|
57 |
+
"46": "White",
|
58 |
+
"47": "clock",
|
59 |
+
"48": "dining table",
|
60 |
+
"49": "wine glass",
|
61 |
+
"50": "car",
|
62 |
+
"51": "teddy bear",
|
63 |
+
"52": "bicycle",
|
64 |
+
"53": "scissors",
|
65 |
+
"54": "keyboard",
|
66 |
+
"55": "Green",
|
67 |
+
"56": "Below",
|
68 |
+
"57": "Left",
|
69 |
+
"58": "book",
|
70 |
+
"59": "Front",
|
71 |
+
"60": "fork",
|
72 |
+
"61": "broccoli",
|
73 |
+
"62": "giraffe",
|
74 |
+
"63": "baseball glove",
|
75 |
+
"64": "Red",
|
76 |
+
"65": "Orange",
|
77 |
+
"66": "Black",
|
78 |
+
"67": "frisbee",
|
79 |
+
"68": "potted plant",
|
80 |
+
"69": "sandwich",
|
81 |
+
"70": "cup",
|
82 |
+
"71": "right",
|
83 |
+
"72": "cake",
|
84 |
+
"73": "Yes",
|
85 |
+
"74": "Right",
|
86 |
+
"75": "bed",
|
87 |
+
"76": "cell phone",
|
88 |
+
"77": "skateboard",
|
89 |
+
"78": "bowl",
|
90 |
+
"79": "truck",
|
91 |
+
"80": "donut",
|
92 |
+
"81": "above",
|
93 |
+
"82": "Brown",
|
94 |
+
"83": "kite",
|
95 |
+
"84": "cat",
|
96 |
+
"85": "traffic light",
|
97 |
+
"86": "pizza",
|
98 |
+
"87": "sheep",
|
99 |
+
"88": "elephant",
|
100 |
+
"89": "laptop",
|
101 |
+
"90": "refrigerator",
|
102 |
+
"91": "6",
|
103 |
+
"92": "banana",
|
104 |
+
"93": "Blue",
|
105 |
+
"94": "hot dog",
|
106 |
+
"95": "bear",
|
107 |
+
"96": "bird",
|
108 |
+
"97": "motorcycle",
|
109 |
+
"98": "horse",
|
110 |
+
"99": "tv",
|
111 |
+
"100": "tie",
|
112 |
+
"101": "left",
|
113 |
+
"102": "vase",
|
114 |
+
"103": "train",
|
115 |
+
"104": "baseball bat",
|
116 |
+
"105": "stop sign",
|
117 |
+
"106": "airplane",
|
118 |
+
"107": "bench"
|
119 |
},
|
120 |
"image_size": 384,
|
121 |
"initializer_range": 0.02,
|
122 |
"intermediate_size": 3072,
|
123 |
"label2id": {
|
124 |
+
"0": 38,
|
125 |
+
"1": 30,
|
126 |
+
"2": 11,
|
127 |
+
"3": 14,
|
128 |
+
"4": 21,
|
129 |
+
"5": 0,
|
130 |
+
"6": 91,
|
131 |
+
"7": 17,
|
132 |
+
"8": 16,
|
133 |
+
"9": 36,
|
134 |
+
"Above": 40,
|
135 |
+
"Behind": 24,
|
136 |
+
"Below": 56,
|
137 |
+
"Black": 66,
|
138 |
+
"Blue": 93,
|
139 |
+
"Brown": 82,
|
140 |
+
"Front": 59,
|
141 |
+
"Green": 55,
|
142 |
+
"Grey": 9,
|
143 |
+
"Left": 57,
|
144 |
+
"No": 37,
|
145 |
+
"Orange": 65,
|
146 |
+
"Pink": 19,
|
147 |
+
"Purple": 42,
|
148 |
+
"Red": 64,
|
149 |
+
"Right": 74,
|
150 |
+
"White": 46,
|
151 |
+
"Yellow": 34,
|
152 |
+
"Yes": 73,
|
153 |
+
"above": 81,
|
154 |
+
"airplane": 106,
|
155 |
+
"apple": 4,
|
156 |
+
"banana": 92,
|
157 |
+
"baseball bat": 104,
|
158 |
+
"baseball glove": 63,
|
159 |
+
"bear": 95,
|
160 |
+
"bed": 75,
|
161 |
+
"bench": 107,
|
162 |
+
"bicycle": 52,
|
163 |
+
"bird": 96,
|
164 |
+
"boat": 8,
|
165 |
+
"book": 58,
|
166 |
+
"bottle": 12,
|
167 |
+
"bowl": 78,
|
168 |
+
"broccoli": 61,
|
169 |
+
"bus": 6,
|
170 |
+
"cake": 72,
|
171 |
+
"car": 50,
|
172 |
+
"carrot": 39,
|
173 |
+
"cat": 84,
|
174 |
+
"cell phone": 76,
|
175 |
+
"chair": 27,
|
176 |
+
"clock": 47,
|
177 |
+
"couch": 2,
|
178 |
+
"cow": 29,
|
179 |
+
"cup": 70,
|
180 |
+
"dining table": 48,
|
181 |
+
"dog": 7,
|
182 |
+
"donut": 80,
|
183 |
+
"elephant": 88,
|
184 |
+
"fire hydrant": 31,
|
185 |
+
"fork": 60,
|
186 |
+
"frisbee": 67,
|
187 |
+
"giraffe": 62,
|
188 |
+
"handbag": 28,
|
189 |
+
"horse": 98,
|
190 |
+
"hot dog": 94,
|
191 |
+
"keyboard": 54,
|
192 |
+
"kite": 83,
|
193 |
+
"knife": 18,
|
194 |
+
"laptop": 89,
|
195 |
+
"left": 101,
|
196 |
+
"motorcycle": 97,
|
197 |
+
"mouse": 45,
|
198 |
+
"orange": 26,
|
199 |
+
"oven": 32,
|
200 |
+
"parking meter": 44,
|
201 |
+
"person": 25,
|
202 |
+
"pizza": 86,
|
203 |
+
"potted plant": 68,
|
204 |
+
"refrigerator": 90,
|
205 |
+
"remote": 35,
|
206 |
+
"right": 71,
|
207 |
+
"sandwich": 69,
|
208 |
+
"scissors": 53,
|
209 |
+
"sheep": 87,
|
210 |
+
"sink": 3,
|
211 |
+
"skateboard": 77,
|
212 |
+
"skis": 20,
|
213 |
+
"snowboard": 43,
|
214 |
+
"spoon": 13,
|
215 |
+
"sports ball": 41,
|
216 |
+
"stop sign": 105,
|
217 |
+
"suitcase": 10,
|
218 |
+
"surfboard": 23,
|
219 |
+
"teddy bear": 51,
|
220 |
+
"tennis racket": 33,
|
221 |
+
"tie": 100,
|
222 |
+
"toilet": 15,
|
223 |
+
"toothbrush": 22,
|
224 |
+
"traffic light": 85,
|
225 |
+
"train": 103,
|
226 |
+
"truck": 79,
|
227 |
+
"tv": 99,
|
228 |
+
"umbrella": 5,
|
229 |
+
"vase": 102,
|
230 |
+
"wine glass": 49,
|
231 |
+
"zebra": 1
|
232 |
},
|
233 |
"layer_norm_eps": 1e-12,
|
234 |
"max_image_length": -1,
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 446736704
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c1fef7cdefb7b719d44d7f77a38afcc57b092e5a2a0e6ac7da5c8eebbbd43a4
|
3 |
size 446736704
|