Shresthadev403 committed on
Commit
0f79f7e
·
1 Parent(s): 286cca8

End of training

Browse files
README.md CHANGED
@@ -1,6 +1,4 @@
1
  ---
2
- license: apache-2.0
3
- base_model: bert-base-uncased
4
  tags:
5
  - generated_from_trainer
6
  model-index:
@@ -13,14 +11,14 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # ner-bert-ingredients
15
 
16
- This model is a fine-tuned version of [bert-base-uncased](https://huggingface.co/bert-base-uncased) on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
- - eval_loss: 1.5282
19
- - eval_runtime: 84.2371
20
- - eval_samples_per_second: 59.356
21
- - eval_steps_per_second: 0.938
22
- - epoch: 6.06
23
- - step: 4500
24
 
25
  ## Model description
26
 
 
1
  ---
 
 
2
  tags:
3
  - generated_from_trainer
4
  model-index:
 
11
 
12
  # ner-bert-ingredients
13
 
14
+ This model was trained from scratch on an unknown dataset.
15
  It achieves the following results on the evaluation set:
16
+ - eval_loss: 2.3785
17
+ - eval_runtime: 84.0031
18
+ - eval_samples_per_second: 59.522
19
+ - eval_steps_per_second: 0.94
20
+ - epoch: 7.08
21
+ - step: 5250
22
 
23
  ## Model description
24
 
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "bert-base-uncased",
3
  "architectures": [
4
  "BertForTokenClassification"
5
  ],
 
1
  {
2
+ "_name_or_path": "/kaggle/working/ner-bert-ingredients",
3
  "architectures": [
4
  "BertForTokenClassification"
5
  ],
logs/events.out.tfevents.1704638284.80d534b5f596.26.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4aaf750cd2f6e4f5bd5705b609fdc3eb01bb4b1c3a25298f3fea438f5bdabdb
3
+ size 1717324
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae13ecd9fc839ef94736671faab0dcc0acd342d63ac53d36f3f434917fb712b3
3
  size 535667604
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50065a45f9f3efe6cb5d824760c2d913022aca1532af3c49e580ae48d003cc04
3
  size 535667604
special_tokens_map.json CHANGED
@@ -1,7 +1,37 @@
1
  {
2
- "cls_token": "[CLS]",
3
- "mask_token": "[MASK]",
4
- "pad_token": "[PAD]",
5
- "sep_token": "[SEP]",
6
- "unk_token": "[UNK]"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  }
 
1
  {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
  }
tokenizer_config.json CHANGED
@@ -45,11 +45,18 @@
45
  "cls_token": "[CLS]",
46
  "do_lower_case": true,
47
  "mask_token": "[MASK]",
 
48
  "model_max_length": 512,
 
49
  "pad_token": "[PAD]",
 
 
50
  "sep_token": "[SEP]",
 
51
  "strip_accents": null,
52
  "tokenize_chinese_chars": true,
53
  "tokenizer_class": "BertTokenizer",
 
 
54
  "unk_token": "[UNK]"
55
  }
 
45
  "cls_token": "[CLS]",
46
  "do_lower_case": true,
47
  "mask_token": "[MASK]",
48
+ "max_length": 512,
49
  "model_max_length": 512,
50
+ "pad_to_multiple_of": null,
51
  "pad_token": "[PAD]",
52
+ "pad_token_type_id": 0,
53
+ "padding_side": "right",
54
  "sep_token": "[SEP]",
55
+ "stride": 0,
56
  "strip_accents": null,
57
  "tokenize_chinese_chars": true,
58
  "tokenizer_class": "BertTokenizer",
59
+ "truncation_side": "right",
60
+ "truncation_strategy": "longest_first",
61
  "unk_token": "[UNK]"
62
  }
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 1.6346299648284912,
3
  "best_model_checkpoint": "ner-bert-ingredients/checkpoint-3750",
4
- "epoch": 6.062647356012126,
5
  "eval_steps": 750,
6
- "global_step": 4500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -91,6 +91,20 @@
91
  "eval_samples_per_second": 59.356,
92
  "eval_steps_per_second": 0.938,
93
  "step": 4500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
94
  }
95
  ],
96
  "logging_steps": 750,
@@ -98,7 +112,7 @@
98
  "num_input_tokens_seen": 0,
99
  "num_train_epochs": 100,
100
  "save_steps": 750,
101
- "total_flos": 1.9475913345048576e+17,
102
  "train_batch_size": 16,
103
  "trial_name": null,
104
  "trial_params": null
 
1
  {
2
  "best_metric": 1.6346299648284912,
3
  "best_model_checkpoint": "ner-bert-ingredients/checkpoint-3750",
4
+ "epoch": 7.07510946446615,
5
  "eval_steps": 750,
6
+ "global_step": 5250,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
91
  "eval_samples_per_second": 59.356,
92
  "eval_steps_per_second": 0.938,
93
  "step": 4500
94
+ },
95
+ {
96
+ "epoch": 7.08,
97
+ "learning_rate": 4.949460916442048e-05,
98
+ "loss": 3.7548,
99
+ "step": 5250
100
+ },
101
+ {
102
+ "epoch": 7.08,
103
+ "eval_loss": 2.378469228744507,
104
+ "eval_runtime": 84.0031,
105
+ "eval_samples_per_second": 59.522,
106
+ "eval_steps_per_second": 0.94,
107
+ "step": 5250
108
  }
109
  ],
110
  "logging_steps": 750,
 
112
  "num_input_tokens_seen": 0,
113
  "num_train_epochs": 100,
114
  "save_steps": 750,
115
+ "total_flos": 2.2721898902556672e+17,
116
  "train_batch_size": 16,
117
  "trial_name": null,
118
  "trial_params": null