raygx committed
Commit bb3892b
1 Parent(s): 8b49607

Upload TFDistilBertForSequenceClassification

Files changed (3):
  1. README.md +3 -3
  2. config.json +16 -17
  3. tf_model.h5 +2 -2
README.md CHANGED
@@ -1,6 +1,6 @@
  ---
- license: cc-by-nc-sa-4.0
- base_model: NepBERTa/NepBERTa
+ license: apache-2.0
+ base_model: Sakonii/distilbert-base-nepali
  tags:
  - generated_from_keras_callback
  model-index:
@@ -13,7 +13,7 @@ probably proofread and complete it, then remove this comment. -->

  # sakoni-distilBERT-NepSA

- This model is a fine-tuned version of [NepBERTa/NepBERTa](https://huggingface.co/NepBERTa/NepBERTa) on an unknown dataset.
+ This model is a fine-tuned version of [Sakonii/distilbert-base-nepali](https://huggingface.co/Sakonii/distilbert-base-nepali) on an unknown dataset.
  It achieves the following results on the evaluation set:


config.json CHANGED
@@ -1,35 +1,34 @@
  {
- "_name_or_path": "NepBERTa/NepBERTa",
+ "_name_or_path": "Sakonii/distilbert-base-nepali",
+ "activation": "gelu",
  "architectures": [
- "BertForSequenceClassification"
+ "DistilBertForSequenceClassification"
  ],
- "attention_probs_dropout_prob": 0.1,
- "classifier_dropout": null,
- "hidden_act": "gelu",
- "hidden_dropout_prob": 0.1,
- "hidden_size": 768,
+ "attention_dropout": 0.1,
+ "dim": 768,
+ "dropout": 0.1,
+ "hidden_dim": 3072,
  "id2label": {
  "0": "NEUTRAL",
  "1": "POSITIVE",
  "2": "NEGATIVE"
  },
  "initializer_range": 0.02,
- "intermediate_size": 3072,
  "label2id": {
  "NEGATIVE": 2,
  "NEUTRAL": 0,
  "POSITIVE": 1
  },
- "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
- "model_type": "bert",
- "num_attention_heads": 12,
- "num_hidden_layers": 12,
- "output_hidden_state": true,
+ "model_type": "distilbert",
+ "n_heads": 12,
+ "n_layers": 6,
  "pad_token_id": 0,
- "position_embedding_type": "absolute",
+ "qa_dropout": 0.1,
+ "seq_classif_dropout": 0.2,
+ "sinusoidal_pos_embds": false,
+ "tie_weights_": true,
+ "torch_dtype": "float32",
  "transformers_version": "4.32.1",
- "type_vocab_size": 2,
- "use_cache": true,
- "vocab_size": 30523
+ "vocab_size": 24581
  }
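With this change the checkpoint is described as a 6-layer DistilBERT sequence classifier with the three sentiment labels above. A minimal loading sketch, not part of the commit itself, assuming the repo id is raygx/sakoni-distilBERT-NepSA and that a compatible tokenizer was uploaded alongside the TF weights (adjust the id if the model lives elsewhere):

    # Hedged sketch: repo id and example sentence are assumptions, not from the commit.
    import tensorflow as tf
    from transformers import AutoTokenizer, TFAutoModelForSequenceClassification

    repo_id = "raygx/sakoni-distilBERT-NepSA"  # hypothetical repo id

    tokenizer = AutoTokenizer.from_pretrained(repo_id)
    model = TFAutoModelForSequenceClassification.from_pretrained(repo_id)

    # Tokenize a Nepali sentence and pick the highest-scoring label.
    inputs = tokenizer("यो फिल्म एकदम राम्रो छ", return_tensors="tf")
    logits = model(**inputs).logits               # shape (1, 3)
    pred_id = int(tf.argmax(logits, axis=-1)[0])
    print(model.config.id2label[pred_id])         # NEUTRAL / POSITIVE / NEGATIVE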
tf_model.h5 CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:e93e8210b6a6863e802f5558d3a9b6e68bb3e85ae1fce6c4d2ad0936a73e0c57
- size 532002416
+ oid sha256:736e4cdb0b50770b958a86c2f5cbb81e645320a556fe4dcac1fb7d513740413a
+ size 325224960