sayakpaul
/

mit-b0-finetuned-sidewalk-semantic

+---
+license: apache-2.0
+tags:
+- generated_from_keras_callback
+model-index:
+- name: mit-b0-finetuned-sidewalk-semantic
+  results: []
+---
+<!-- This model card has been generated automatically according to the information Keras had access to. You should
+probably proofread and complete it, then remove this comment. -->
+# mit-b0-finetuned-sidewalk-semantic
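+This model is a fine-tuned version of [nvidia/mit-b0](https://huggingface.co/nvidia/mit-b0). The training dataset was not recorded in the metadata available to Keras; the model name and the 35-class label set in `config.json` suggest a sidewalk semantic-segmentation dataset (to be confirmed by the author).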
+It achieves the following results after the final training epoch (epochs are zero-indexed; the validation loss is computed on the evaluation set):
+- Train Loss: 0.2125
+- Validation Loss: 0.5151
+- Epoch: 49
+## Model description
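+A SegFormer semantic-segmentation model (`SegformerForSemanticSegmentation`) initialized from the `nvidia/mit-b0` checkpoint, predicting 35 classes (ids 0–34; see `id2label` in `config.json`). More information needed.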
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- optimizer: {'name': 'Adam', 'learning_rate': 6e-05, 'decay': 0.0, 'beta_1': 0.9, 'beta_2': 0.999, 'epsilon': 1e-07, 'amsgrad': False}
+- training_precision: float32
+### Training results
+| Train Loss | Validation Loss | Epoch |
+|:----------:|:---------------:|:-----:|
+| 2.0785     | 1.1753          | 0     |
+| 1.1312     | 0.8807          | 1     |
+| 0.9315     | 0.7585          | 2     |
+| 0.7952     | 0.7261          | 3     |
+| 0.7273     | 0.6701          | 4     |
+| 0.6603     | 0.6396          | 5     |
+| 0.6198     | 0.6238          | 6     |
+| 0.5958     | 0.5925          | 7     |
+| 0.5378     | 0.5714          | 8     |
+| 0.5236     | 0.5786          | 9     |
+| 0.4960     | 0.5588          | 10    |
+| 0.4633     | 0.5624          | 11    |
+| 0.4562     | 0.5450          | 12    |
+| 0.4167     | 0.5438          | 13    |
+| 0.4100     | 0.5248          | 14    |
+| 0.3947     | 0.5354          | 15    |
+| 0.3867     | 0.5069          | 16    |
+| 0.3803     | 0.5285          | 17    |
+| 0.3696     | 0.5318          | 18    |
+| 0.3386     | 0.5162          | 19    |
+| 0.3349     | 0.5312          | 20    |
+| 0.3233     | 0.5304          | 21    |
+| 0.3328     | 0.5178          | 22    |
+| 0.3140     | 0.5131          | 23    |
+| 0.3081     | 0.5049          | 24    |
+| 0.3046     | 0.5011          | 25    |
+| 0.3209     | 0.5197          | 26    |
+| 0.2966     | 0.5151          | 27    |
+| 0.2829     | 0.5166          | 28    |
+| 0.2968     | 0.5210          | 29    |
+| 0.2818     | 0.5300          | 30    |
+| 0.2739     | 0.5221          | 31    |
+| 0.2602     | 0.5340          | 32    |
+| 0.2570     | 0.5124          | 33    |
+| 0.2557     | 0.5234          | 34    |
+| 0.2593     | 0.5098          | 35    |
+| 0.2582     | 0.5329          | 36    |
+| 0.2439     | 0.5373          | 37    |
+| 0.2413     | 0.5141          | 38    |
+| 0.2423     | 0.5210          | 39    |
+| 0.2340     | 0.5043          | 40    |
+| 0.2244     | 0.5300          | 41    |
+| 0.2246     | 0.4978          | 42    |
+| 0.2270     | 0.5385          | 43    |
+| 0.2254     | 0.5125          | 44    |
+| 0.2176     | 0.5510          | 45    |
+| 0.2194     | 0.5384          | 46    |
+| 0.2136     | 0.5186          | 47    |
+| 0.2121     | 0.5356          | 48    |
+| 0.2125     | 0.5151          | 49    |
+### Framework versions
+- Transformers 4.21.0.dev0
+- TensorFlow 2.8.0
+- Datasets 2.3.2
+- Tokenizers 0.12.1

config.json ADDED Viewed

	@@ -0,0 +1,144 @@

+{
+  "_name_or_path": "nvidia/mit-b0",
+  "architectures": [
+    "SegformerForSemanticSegmentation"
+  ],
+  "attention_probs_dropout_prob": 0.0,
+  "classifier_dropout_prob": 0.1,
+  "decoder_hidden_size": 256,
+  "depths": [
+    2,
+    2,
+    2,
+    2
+  ],
+  "downsampling_rates": [
+    1,
+    4,
+    8,
+    16
+  ],
+  "drop_path_rate": 0.1,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_sizes": [
+    32,
+    64,
+    160,
+    256
+  ],
+  "id2label": {
+    "0": "unlabeled",
+    "1": "flat-road",
+    "2": "flat-sidewalk",
+    "3": "flat-crosswalk",
+    "4": "flat-cyclinglane",
+    "5": "flat-parkingdriveway",
+    "6": "flat-railtrack",
+    "7": "flat-curb",
+    "8": "human-person",
+    "9": "human-rider",
+    "10": "vehicle-car",
+    "11": "vehicle-truck",
+    "12": "vehicle-bus",
+    "13": "vehicle-tramtrain",
+    "14": "vehicle-motorcycle",
+    "15": "vehicle-bicycle",
+    "16": "vehicle-caravan",
+    "17": "vehicle-cartrailer",
+    "18": "construction-building",
+    "19": "construction-door",
+    "20": "construction-wall",
+    "21": "construction-fenceguardrail",
+    "22": "construction-bridge",
+    "23": "construction-tunnel",
+    "24": "construction-stairs",
+    "25": "object-pole",
+    "26": "object-trafficsign",
+    "27": "object-trafficlight",
+    "28": "nature-vegetation",
+    "29": "nature-terrain",
+    "30": "sky",
+    "31": "void-ground",
+    "32": "void-dynamic",
+    "33": "void-static",
+    "34": "void-unclear"
+  },
+  "image_size": 224,
+  "initializer_range": 0.02,
+  "label2id": {
+    "construction-bridge": 22,
+    "construction-building": 18,
+    "construction-door": 19,
+    "construction-fenceguardrail": 21,
+    "construction-stairs": 24,
+    "construction-tunnel": 23,
+    "construction-wall": 20,
+    "flat-crosswalk": 3,
+    "flat-curb": 7,
+    "flat-cyclinglane": 4,
+    "flat-parkingdriveway": 5,
+    "flat-railtrack": 6,
+    "flat-road": 1,
+    "flat-sidewalk": 2,
+    "human-person": 8,
+    "human-rider": 9,
+    "nature-terrain": 29,
+    "nature-vegetation": 28,
+    "object-pole": 25,
+    "object-trafficlight": 27,
+    "object-trafficsign": 26,
+    "sky": 30,
+    "unlabeled": 0,
+    "vehicle-bicycle": 15,
+    "vehicle-bus": 12,
+    "vehicle-car": 10,
+    "vehicle-caravan": 16,
+    "vehicle-cartrailer": 17,
+    "vehicle-motorcycle": 14,
+    "vehicle-tramtrain": 13,
+    "vehicle-truck": 11,
+    "void-dynamic": 32,
+    "void-ground": 31,
+    "void-static": 33,
+    "void-unclear": 34
+  },
+  "layer_norm_eps": 1e-06,
+  "mlp_ratios": [
+    4,
+    4,
+    4,
+    4
+  ],
+  "model_type": "segformer",
+  "num_attention_heads": [
+    1,
+    2,
+    5,
+    8
+  ],
+  "num_channels": 3,
+  "num_encoder_blocks": 4,
+  "patch_sizes": [
+    7,
+    3,
+    3,
+    3
+  ],
+  "reshape_last_stage": true,
+  "semantic_loss_ignore_index": 255,
+  "sr_ratios": [
+    8,
+    4,
+    2,
+    1
+  ],
+  "strides": [
+    4,
+    2,
+    2,
+    2
+  ],
+  "torch_dtype": "float32",
+  "transformers_version": "4.21.0.dev0"
+}

tf_model.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fba28ceaa44bba99481b676c803adfd9ed7e20f186595b34bd9b551f5f3a288a
+size 15167588