Adding ONNX file of this model
Browse files
Beep boop, I am the [ONNX export bot 🤖🏎️](https://huggingface.co/spaces/onnx/export). On behalf of [dongruliu](https://huggingface.co/dongruliu), I would like to add the model converted to ONNX to this repository.
What is ONNX? It stands for "Open Neural Network Exchange", and is the most commonly used open standard for machine learning interoperability. You can find out more at [onnx.ai](https://onnx.ai/)!
The exported ONNX model can then be consumed by various backends such as TensorRT or TVM, or simply be used in a few lines with 🤗 Optimum through ONNX Runtime; check out how [here](https://huggingface.co/docs/optimum/main/en/onnxruntime/usage_guides/models)!
- onnx/config.json +221 -0
- onnx/model.onnx +3 -0
- onnx/preprocessor_config.json +24 -0
onnx/config.json
ADDED
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "facebook/detr-resnet-101",
|
3 |
+
"activation_dropout": 0.0,
|
4 |
+
"activation_function": "relu",
|
5 |
+
"architectures": [
|
6 |
+
"DetrForObjectDetection"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"auxiliary_loss": false,
|
10 |
+
"backbone": "resnet101",
|
11 |
+
"backbone_config": null,
|
12 |
+
"bbox_cost": 5,
|
13 |
+
"bbox_loss_coefficient": 5,
|
14 |
+
"class_cost": 1,
|
15 |
+
"classifier_dropout": 0.0,
|
16 |
+
"d_model": 256,
|
17 |
+
"decoder_attention_heads": 8,
|
18 |
+
"decoder_ffn_dim": 2048,
|
19 |
+
"decoder_layerdrop": 0.0,
|
20 |
+
"decoder_layers": 6,
|
21 |
+
"dice_loss_coefficient": 1,
|
22 |
+
"dilation": false,
|
23 |
+
"dropout": 0.1,
|
24 |
+
"encoder_attention_heads": 8,
|
25 |
+
"encoder_ffn_dim": 2048,
|
26 |
+
"encoder_layerdrop": 0.0,
|
27 |
+
"encoder_layers": 6,
|
28 |
+
"eos_coefficient": 0.1,
|
29 |
+
"giou_cost": 2,
|
30 |
+
"giou_loss_coefficient": 2,
|
31 |
+
"id2label": {
|
32 |
+
"0": "N/A",
|
33 |
+
"1": "person",
|
34 |
+
"2": "bicycle",
|
35 |
+
"3": "car",
|
36 |
+
"4": "motorcycle",
|
37 |
+
"5": "airplane",
|
38 |
+
"6": "bus",
|
39 |
+
"7": "train",
|
40 |
+
"8": "truck",
|
41 |
+
"9": "boat",
|
42 |
+
"10": "traffic light",
|
43 |
+
"11": "fire hydrant",
|
44 |
+
"12": "N/A",
|
45 |
+
"13": "stop sign",
|
46 |
+
"14": "parking meter",
|
47 |
+
"15": "bench",
|
48 |
+
"16": "bird",
|
49 |
+
"17": "cat",
|
50 |
+
"18": "dog",
|
51 |
+
"19": "horse",
|
52 |
+
"20": "sheep",
|
53 |
+
"21": "cow",
|
54 |
+
"22": "elephant",
|
55 |
+
"23": "bear",
|
56 |
+
"24": "zebra",
|
57 |
+
"25": "giraffe",
|
58 |
+
"26": "N/A",
|
59 |
+
"27": "backpack",
|
60 |
+
"28": "umbrella",
|
61 |
+
"29": "N/A",
|
62 |
+
"30": "N/A",
|
63 |
+
"31": "handbag",
|
64 |
+
"32": "tie",
|
65 |
+
"33": "suitcase",
|
66 |
+
"34": "frisbee",
|
67 |
+
"35": "skis",
|
68 |
+
"36": "snowboard",
|
69 |
+
"37": "sports ball",
|
70 |
+
"38": "kite",
|
71 |
+
"39": "baseball bat",
|
72 |
+
"40": "baseball glove",
|
73 |
+
"41": "skateboard",
|
74 |
+
"42": "surfboard",
|
75 |
+
"43": "tennis racket",
|
76 |
+
"44": "bottle",
|
77 |
+
"45": "N/A",
|
78 |
+
"46": "wine glass",
|
79 |
+
"47": "cup",
|
80 |
+
"48": "fork",
|
81 |
+
"49": "knife",
|
82 |
+
"50": "spoon",
|
83 |
+
"51": "bowl",
|
84 |
+
"52": "banana",
|
85 |
+
"53": "apple",
|
86 |
+
"54": "sandwich",
|
87 |
+
"55": "orange",
|
88 |
+
"56": "broccoli",
|
89 |
+
"57": "carrot",
|
90 |
+
"58": "hot dog",
|
91 |
+
"59": "pizza",
|
92 |
+
"60": "donut",
|
93 |
+
"61": "cake",
|
94 |
+
"62": "chair",
|
95 |
+
"63": "couch",
|
96 |
+
"64": "potted plant",
|
97 |
+
"65": "bed",
|
98 |
+
"66": "N/A",
|
99 |
+
"67": "dining table",
|
100 |
+
"68": "N/A",
|
101 |
+
"69": "N/A",
|
102 |
+
"70": "toilet",
|
103 |
+
"71": "N/A",
|
104 |
+
"72": "tv",
|
105 |
+
"73": "laptop",
|
106 |
+
"74": "mouse",
|
107 |
+
"75": "remote",
|
108 |
+
"76": "keyboard",
|
109 |
+
"77": "cell phone",
|
110 |
+
"78": "microwave",
|
111 |
+
"79": "oven",
|
112 |
+
"80": "toaster",
|
113 |
+
"81": "sink",
|
114 |
+
"82": "refrigerator",
|
115 |
+
"83": "N/A",
|
116 |
+
"84": "book",
|
117 |
+
"85": "clock",
|
118 |
+
"86": "vase",
|
119 |
+
"87": "scissors",
|
120 |
+
"88": "teddy bear",
|
121 |
+
"89": "hair drier",
|
122 |
+
"90": "toothbrush"
|
123 |
+
},
|
124 |
+
"init_std": 0.02,
|
125 |
+
"init_xavier_std": 1.0,
|
126 |
+
"is_encoder_decoder": true,
|
127 |
+
"label2id": {
|
128 |
+
"N/A": 83,
|
129 |
+
"airplane": 5,
|
130 |
+
"apple": 53,
|
131 |
+
"backpack": 27,
|
132 |
+
"banana": 52,
|
133 |
+
"baseball bat": 39,
|
134 |
+
"baseball glove": 40,
|
135 |
+
"bear": 23,
|
136 |
+
"bed": 65,
|
137 |
+
"bench": 15,
|
138 |
+
"bicycle": 2,
|
139 |
+
"bird": 16,
|
140 |
+
"boat": 9,
|
141 |
+
"book": 84,
|
142 |
+
"bottle": 44,
|
143 |
+
"bowl": 51,
|
144 |
+
"broccoli": 56,
|
145 |
+
"bus": 6,
|
146 |
+
"cake": 61,
|
147 |
+
"car": 3,
|
148 |
+
"carrot": 57,
|
149 |
+
"cat": 17,
|
150 |
+
"cell phone": 77,
|
151 |
+
"chair": 62,
|
152 |
+
"clock": 85,
|
153 |
+
"couch": 63,
|
154 |
+
"cow": 21,
|
155 |
+
"cup": 47,
|
156 |
+
"dining table": 67,
|
157 |
+
"dog": 18,
|
158 |
+
"donut": 60,
|
159 |
+
"elephant": 22,
|
160 |
+
"fire hydrant": 11,
|
161 |
+
"fork": 48,
|
162 |
+
"frisbee": 34,
|
163 |
+
"giraffe": 25,
|
164 |
+
"hair drier": 89,
|
165 |
+
"handbag": 31,
|
166 |
+
"horse": 19,
|
167 |
+
"hot dog": 58,
|
168 |
+
"keyboard": 76,
|
169 |
+
"kite": 38,
|
170 |
+
"knife": 49,
|
171 |
+
"laptop": 73,
|
172 |
+
"microwave": 78,
|
173 |
+
"motorcycle": 4,
|
174 |
+
"mouse": 74,
|
175 |
+
"orange": 55,
|
176 |
+
"oven": 79,
|
177 |
+
"parking meter": 14,
|
178 |
+
"person": 1,
|
179 |
+
"pizza": 59,
|
180 |
+
"potted plant": 64,
|
181 |
+
"refrigerator": 82,
|
182 |
+
"remote": 75,
|
183 |
+
"sandwich": 54,
|
184 |
+
"scissors": 87,
|
185 |
+
"sheep": 20,
|
186 |
+
"sink": 81,
|
187 |
+
"skateboard": 41,
|
188 |
+
"skis": 35,
|
189 |
+
"snowboard": 36,
|
190 |
+
"spoon": 50,
|
191 |
+
"sports ball": 37,
|
192 |
+
"stop sign": 13,
|
193 |
+
"suitcase": 33,
|
194 |
+
"surfboard": 42,
|
195 |
+
"teddy bear": 88,
|
196 |
+
"tennis racket": 43,
|
197 |
+
"tie": 32,
|
198 |
+
"toaster": 80,
|
199 |
+
"toilet": 70,
|
200 |
+
"toothbrush": 90,
|
201 |
+
"traffic light": 10,
|
202 |
+
"train": 7,
|
203 |
+
"truck": 8,
|
204 |
+
"tv": 72,
|
205 |
+
"umbrella": 28,
|
206 |
+
"vase": 86,
|
207 |
+
"wine glass": 46,
|
208 |
+
"zebra": 24
|
209 |
+
},
|
210 |
+
"mask_loss_coefficient": 1,
|
211 |
+
"max_position_embeddings": 1024,
|
212 |
+
"model_type": "detr",
|
213 |
+
"num_channels": 3,
|
214 |
+
"num_hidden_layers": 6,
|
215 |
+
"num_queries": 100,
|
216 |
+
"position_embedding_type": "sine",
|
217 |
+
"scale_embedding": false,
|
218 |
+
"transformers_version": "4.37.2",
|
219 |
+
"use_pretrained_backbone": true,
|
220 |
+
"use_timm_backbone": true
|
221 |
+
}
|
onnx/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46c6e9309f1a952036aa23549b81ca726bacddf924a053d4091c7eed191d40a0
|
3 |
+
size 242841563
|
onnx/preprocessor_config.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"do_normalize": true,
|
3 |
+
"do_pad": true,
|
4 |
+
"do_rescale": true,
|
5 |
+
"do_resize": true,
|
6 |
+
"format": "coco_detection",
|
7 |
+
"image_mean": [
|
8 |
+
0.485,
|
9 |
+
0.456,
|
10 |
+
0.406
|
11 |
+
],
|
12 |
+
"image_processor_type": "DetrFeatureExtractor",
|
13 |
+
"image_std": [
|
14 |
+
0.229,
|
15 |
+
0.224,
|
16 |
+
0.225
|
17 |
+
],
|
18 |
+
"resample": 2,
|
19 |
+
"rescale_factor": 0.00392156862745098,
|
20 |
+
"size": {
|
21 |
+
"longest_edge": 1333,
|
22 |
+
"shortest_edge": 800
|
23 |
+
}
|
24 |
+
}
|