SharonTudi committed on
Commit
11efdd1
·
verified ·
1 Parent(s): 19ca71f

End of training

Browse files
README.md CHANGED
@@ -1,6 +1,6 @@
1
  ---
2
  license: apache-2.0
3
- base_model: distilbert-base-cased
4
  tags:
5
  - generated_from_trainer
6
  metrics:
@@ -18,9 +18,9 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  # DIALOGUE_second_model
20
 
21
- This model is a fine-tuned version of [distilbert-base-cased](https://huggingface.co/distilbert-base-cased) on the None dataset.
22
  It achieves the following results on the evaluation set:
23
- - Loss: 0.3499
24
  - Precision: 0.9762
25
  - Recall: 0.9737
26
  - F1: 0.9736
@@ -55,20 +55,20 @@ The following hyperparameters were used during training:
55
 
56
  | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Accuracy |
57
  |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
58
- | 1.3735 | 0.31 | 15 | 1.3341 | 0.2562 | 0.4868 | 0.3323 | 0.4868 |
59
- | 1.2891 | 0.62 | 30 | 1.1793 | 0.8546 | 0.7368 | 0.6683 | 0.7368 |
60
- | 1.1 | 0.94 | 45 | 0.9372 | 0.9421 | 0.9342 | 0.9339 | 0.9342 |
61
- | 0.884 | 1.25 | 60 | 0.7268 | 0.9524 | 0.9474 | 0.9472 | 0.9474 |
62
- | 0.7087 | 1.56 | 75 | 0.5780 | 0.9762 | 0.9737 | 0.9736 | 0.9737 |
63
- | 0.6158 | 1.88 | 90 | 0.4773 | 0.9327 | 0.9211 | 0.9204 | 0.9211 |
64
- | 0.5052 | 2.19 | 105 | 0.4043 | 0.9762 | 0.9737 | 0.9736 | 0.9737 |
65
- | 0.4321 | 2.5 | 120 | 0.3652 | 0.9762 | 0.9737 | 0.9736 | 0.9737 |
66
- | 0.4412 | 2.81 | 135 | 0.3499 | 0.9762 | 0.9737 | 0.9736 | 0.9737 |
67
 
68
 
69
  ### Framework versions
70
 
71
- - Transformers 4.36.2
72
  - Pytorch 2.1.0+cu121
73
  - Datasets 2.16.1
74
  - Tokenizers 0.15.0
 
1
  ---
2
  license: apache-2.0
3
+ base_model: bert-base-cased
4
  tags:
5
  - generated_from_trainer
6
  metrics:
 
18
 
19
  # DIALOGUE_second_model
20
 
21
+ This model is a fine-tuned version of [bert-base-cased](https://huggingface.co/bert-base-cased) on an unknown dataset.
22
  It achieves the following results on the evaluation set:
23
+ - Loss: 0.3364
24
  - Precision: 0.9762
25
  - Recall: 0.9737
26
  - F1: 0.9736
 
55
 
56
  | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Accuracy |
57
  |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
58
+ | 1.3667 | 0.31 | 15 | 1.2505 | 0.2468 | 0.4868 | 0.3263 | 0.4868 |
59
+ | 1.1649 | 0.62 | 30 | 1.0587 | 0.8659 | 0.7105 | 0.6935 | 0.7105 |
60
+ | 1.0288 | 0.94 | 45 | 0.8905 | 0.9479 | 0.9342 | 0.9331 | 0.9342 |
61
+ | 0.8541 | 1.25 | 60 | 0.7069 | 0.9762 | 0.9737 | 0.9736 | 0.9737 |
62
+ | 0.6833 | 1.56 | 75 | 0.5616 | 0.9762 | 0.9737 | 0.9736 | 0.9737 |
63
+ | 0.6072 | 1.88 | 90 | 0.4586 | 0.9762 | 0.9737 | 0.9736 | 0.9737 |
64
+ | 0.4665 | 2.19 | 105 | 0.3944 | 0.9762 | 0.9737 | 0.9736 | 0.9737 |
65
+ | 0.4274 | 2.5 | 120 | 0.3563 | 0.9762 | 0.9737 | 0.9736 | 0.9737 |
66
+ | 0.4116 | 2.81 | 135 | 0.3364 | 0.9762 | 0.9737 | 0.9736 | 0.9737 |
67
 
68
 
69
  ### Framework versions
70
 
71
+ - Transformers 4.37.0
72
  - Pytorch 2.1.0+cu121
73
  - Datasets 2.16.1
74
  - Tokenizers 0.15.0
config.json CHANGED
@@ -1,13 +1,14 @@
1
  {
2
- "_name_or_path": "distilbert-base-cased",
3
- "activation": "gelu",
4
  "architectures": [
5
- "DistilBertForSequenceClassification"
6
  ],
7
- "attention_dropout": 0.1,
8
- "dim": 768,
9
- "dropout": 0.1,
10
- "hidden_dim": 3072,
 
 
11
  "id2label": {
12
  "0": "Hospital-Inform",
13
  "1": "Hospital-Request",
@@ -15,24 +16,24 @@
15
  "3": "general-thank"
16
  },
17
  "initializer_range": 0.02,
 
18
  "label2id": {
19
  "LABEL_0": 0,
20
  "LABEL_1": 1,
21
  "LABEL_2": 2,
22
  "LABEL_3": 3
23
  },
 
24
  "max_position_embeddings": 512,
25
- "model_type": "distilbert",
26
- "n_heads": 12,
27
- "n_layers": 6,
28
- "output_past": true,
29
  "pad_token_id": 0,
 
30
  "problem_type": "single_label_classification",
31
- "qa_dropout": 0.1,
32
- "seq_classif_dropout": 0.2,
33
- "sinusoidal_pos_embds": false,
34
- "tie_weights_": true,
35
  "torch_dtype": "float32",
36
- "transformers_version": "4.36.2",
 
 
37
  "vocab_size": 28996
38
  }
 
1
  {
2
+ "_name_or_path": "bert-base-cased",
 
3
  "architectures": [
4
+ "BertForSequenceClassification"
5
  ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "gradient_checkpointing": false,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 768,
12
  "id2label": {
13
  "0": "Hospital-Inform",
14
  "1": "Hospital-Request",
 
16
  "3": "general-thank"
17
  },
18
  "initializer_range": 0.02,
19
+ "intermediate_size": 3072,
20
  "label2id": {
21
  "LABEL_0": 0,
22
  "LABEL_1": 1,
23
  "LABEL_2": 2,
24
  "LABEL_3": 3
25
  },
26
+ "layer_norm_eps": 1e-12,
27
  "max_position_embeddings": 512,
28
+ "model_type": "bert",
29
+ "num_attention_heads": 12,
30
+ "num_hidden_layers": 12,
 
31
  "pad_token_id": 0,
32
+ "position_embedding_type": "absolute",
33
  "problem_type": "single_label_classification",
 
 
 
 
34
  "torch_dtype": "float32",
35
+ "transformers_version": "4.37.0",
36
+ "type_vocab_size": 2,
37
+ "use_cache": true,
38
  "vocab_size": 28996
39
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b804e2243b4315b37da4d96fb3ee9fe45c4445c1d3abb76a5685cbfee97c019
3
- size 263150840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4f2d81d6dfc25bb604e7bcd79acfaaf4d0aa9ca6609bad023110eaf142970c0
3
+ size 433276920
runs/Jan23_14-28-05_b3ba10920348/events.out.tfevents.1706020108.b3ba10920348.178.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc73325b6b00bb5ebdc1b100b13de86ada85903007a41214e5f812512e6f9278
3
+ size 10490
tokenizer_config.json CHANGED
@@ -52,6 +52,6 @@
52
  "sep_token": "[SEP]",
53
  "strip_accents": null,
54
  "tokenize_chinese_chars": true,
55
- "tokenizer_class": "DistilBertTokenizer",
56
  "unk_token": "[UNK]"
57
  }
 
52
  "sep_token": "[SEP]",
53
  "strip_accents": null,
54
  "tokenize_chinese_chars": true,
55
+ "tokenizer_class": "BertTokenizer",
56
  "unk_token": "[UNK]"
57
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:684b5c2816d28e5ce76d89aaf4cae488ad92b4164297b5eeaedc967d202fde47
3
- size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e857c7c1121cf0c85367fdeef55d7d66fc8e32b927d83827544ee483bf7c529
3
+ size 4664