SimoneJLaudani committed on
Commit
ca39b4f
·
verified ·
1 Parent(s): 8d190e4

End of training

Browse files
README.md CHANGED
@@ -1,13 +1,8 @@
1
  ---
2
  license: apache-2.0
3
- base_model: distilbert/distilbert-base-uncased
4
  tags:
5
  - generated_from_trainer
6
- metrics:
7
- - precision
8
- - recall
9
- - f1
10
- - accuracy
11
  model-index:
12
  - name: test_trainer3b
13
  results: []
@@ -18,13 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  # test_trainer3b
20
 
21
- This model is a fine-tuned version of [distilbert/distilbert-base-uncased](https://huggingface.co/distilbert/distilbert-base-uncased) on the None dataset.
22
- It achieves the following results on the evaluation set:
23
- - Loss: 1.4268
24
- - Precision: 1.0
25
- - Recall: 1.0
26
- - F1: 1.0
27
- - Accuracy: 1.0
28
 
29
  ## Model description
30
 
@@ -49,15 +38,10 @@ The following hyperparameters were used during training:
49
  - seed: 42
50
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
51
  - lr_scheduler_type: linear
52
- - num_epochs: 8
53
 
54
  ### Training results
55
 
56
- | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Accuracy |
57
- |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
58
- | 1.9001 | 2.5 | 10 | 1.8054 | 0.5581 | 0.4762 | 0.3941 | 0.4762 |
59
- | 1.7074 | 5.0 | 20 | 1.5607 | 0.9429 | 0.9048 | 0.8929 | 0.9048 |
60
- | 1.5246 | 7.5 | 30 | 1.4268 | 1.0 | 1.0 | 1.0 | 1.0 |
61
 
62
 
63
  ### Framework versions
 
1
  ---
2
  license: apache-2.0
3
+ base_model: distilbert-base-cased
4
  tags:
5
  - generated_from_trainer
 
 
 
 
 
6
  model-index:
7
  - name: test_trainer3b
8
  results: []
 
13
 
14
  # test_trainer3b
15
 
16
+ This model is a fine-tuned version of [distilbert-base-cased](https://huggingface.co/distilbert-base-cased) on the None dataset.
 
 
 
 
 
 
17
 
18
  ## Model description
19
 
 
38
  - seed: 42
39
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
40
  - lr_scheduler_type: linear
41
+ - num_epochs: 2
42
 
43
  ### Training results
44
 
 
 
 
 
 
45
 
46
 
47
  ### Framework versions
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "distilbert/distilbert-base-uncased",
3
  "activation": "gelu",
4
  "architectures": [
5
  "DistilBertForSequenceClassification"
@@ -31,6 +31,7 @@
31
  "model_type": "distilbert",
32
  "n_heads": 12,
33
  "n_layers": 6,
 
34
  "pad_token_id": 0,
35
  "problem_type": "single_label_classification",
36
  "qa_dropout": 0.1,
@@ -39,5 +40,5 @@
39
  "tie_weights_": true,
40
  "torch_dtype": "float32",
41
  "transformers_version": "4.38.2",
42
- "vocab_size": 30522
43
  }
 
1
  {
2
+ "_name_or_path": "distilbert-base-cased",
3
  "activation": "gelu",
4
  "architectures": [
5
  "DistilBertForSequenceClassification"
 
31
  "model_type": "distilbert",
32
  "n_heads": 12,
33
  "n_layers": 6,
34
+ "output_past": true,
35
  "pad_token_id": 0,
36
  "problem_type": "single_label_classification",
37
  "qa_dropout": 0.1,
 
40
  "tie_weights_": true,
41
  "torch_dtype": "float32",
42
  "transformers_version": "4.38.2",
43
+ "vocab_size": 28996
44
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c742c4ad2978bb415fdcc9a3a86a05ed60270c4e4cfdb0607c101cf43d61f6d
3
- size 267847948
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4fdded6c5d6aa7c563a2620d8a64102c4dde3f7c68f2fb549016b26d2a0798f
3
+ size 263160068
runs/Mar11_13-20-28_fd75b22569e8/events.out.tfevents.1710163233.fd75b22569e8.296.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c45c411f10afb155e320a6cad369659c676a1a81bfc774535dd34b5d824ac5b
3
+ size 5112
tokenizer_config.json CHANGED
@@ -44,9 +44,9 @@
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
46
  "do_basic_tokenize": true,
47
- "do_lower_case": true,
48
  "mask_token": "[MASK]",
49
- "model_max_length": 1000000000000000019884624838656,
50
  "never_split": null,
51
  "pad_token": "[PAD]",
52
  "sep_token": "[SEP]",
 
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
46
  "do_basic_tokenize": true,
47
+ "do_lower_case": false,
48
  "mask_token": "[MASK]",
49
+ "model_max_length": 512,
50
  "never_split": null,
51
  "pad_token": "[PAD]",
52
  "sep_token": "[SEP]",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dab36f7ba75fc136a8ab8e0dc8a78ec969fc38f94b57cedefe091ba249512db5
3
  size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16f998a920691bc222fcdd063382e246edab121c6b7bdf921b0743740559d9e1
3
  size 4856
vocab.txt CHANGED
The diff for this file is too large to render. See raw diff