mp-02 committed on
Commit
38572e2
1 Parent(s): 1cd02cf

End of training

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
all_results.json CHANGED
@@ -1,4 +1,14 @@
1
  {
 
 
 
 
 
 
 
 
 
 
2
  "predict_accuracy": 0.8218373936014088,
3
  "predict_f1": 0.9038133181559477,
4
  "predict_loss": 0.6888472437858582,
@@ -6,5 +16,10 @@
6
  "predict_recall": 0.9126436781609195,
7
  "predict_runtime": 2.0596,
8
  "predict_samples_per_second": 8.74,
9
- "predict_steps_per_second": 0.971
 
 
 
 
 
10
  }
 
1
  {
2
+ "epoch": 13.16,
3
+ "eval_accuracy": 0.8535829122645843,
4
+ "eval_f1": 0.9075504610017443,
5
+ "eval_loss": 0.8330431580543518,
6
+ "eval_precision": 0.9046199701937406,
7
+ "eval_recall": 0.9105,
8
+ "eval_runtime": 2.2353,
9
+ "eval_samples": 54,
10
+ "eval_samples_per_second": 24.158,
11
+ "eval_steps_per_second": 1.789,
12
  "predict_accuracy": 0.8218373936014088,
13
  "predict_f1": 0.9038133181559477,
14
  "predict_loss": 0.6888472437858582,
 
16
  "predict_recall": 0.9126436781609195,
17
  "predict_runtime": 2.0596,
18
  "predict_samples_per_second": 8.74,
19
+ "predict_steps_per_second": 0.971,
20
+ "train_loss": 0.256378173828125,
21
+ "train_runtime": 215.2806,
22
+ "train_samples": 150,
23
+ "train_samples_per_second": 9.29,
24
+ "train_steps_per_second": 2.323
25
  }
config.json CHANGED
@@ -7,52 +7,57 @@
7
  "bos_token_id": 0,
8
  "classifier_dropout": null,
9
  "coordinate_size": 128,
 
 
 
10
  "eos_token_id": 2,
 
11
  "has_relative_attention_bias": true,
12
  "has_spatial_attention_bias": true,
13
  "hidden_act": "gelu",
14
  "hidden_dropout_prob": 0.1,
15
  "hidden_size": 768,
16
  "id2label": {
17
- "0": "O",
18
- "1": "B-HEADER",
19
- "2": "I-HEADER",
20
- "3": "B-QUESTION",
21
- "4": "I-QUESTION",
22
- "5": "B-ANSWER",
23
- "6": "I-ANSWER"
24
  },
25
  "initializer_range": 0.02,
26
  "input_size": 224,
27
  "intermediate_size": 3072,
28
  "label2id": {
29
- "B-ANSWER": 5,
30
- "B-HEADER": 1,
31
- "B-QUESTION": 3,
32
- "I-ANSWER": 6,
33
- "I-HEADER": 2,
34
- "I-QUESTION": 4,
35
- "O": 0
36
  },
37
  "layer_norm_eps": 1e-05,
38
  "max_2d_position_embeddings": 1024,
39
  "max_position_embeddings": 514,
40
  "max_rel_2d_pos": 256,
41
  "max_rel_pos": 128,
 
42
  "model_type": "layoutlmv3",
43
  "num_attention_heads": 12,
44
- "num_channels": 3,
45
  "num_hidden_layers": 12,
46
  "pad_token_id": 1,
47
- "patch_size": 16,
48
  "rel_2d_pos_bins": 64,
49
  "rel_pos_bins": 32,
50
  "second_input_size": 112,
51
  "shape_size": 128,
52
- "text_embed": true,
53
  "torch_dtype": "float32",
54
- "transformers_version": "4.44.0",
55
  "type_vocab_size": 1,
 
56
  "visual_embed": true,
57
- "vocab_size": 50265
 
58
  }
 
7
  "bos_token_id": 0,
8
  "classifier_dropout": null,
9
  "coordinate_size": 128,
10
+ "device": "cuda",
11
+ "discrete_vae_type": "dall-e",
12
+ "discrete_vae_weight_path": "",
13
  "eos_token_id": 2,
14
+ "finetuning_task": "ner",
15
  "has_relative_attention_bias": true,
16
  "has_spatial_attention_bias": true,
17
  "hidden_act": "gelu",
18
  "hidden_dropout_prob": 0.1,
19
  "hidden_size": 768,
20
  "id2label": {
21
+ "0": "LABEL_0",
22
+ "1": "LABEL_1",
23
+ "2": "LABEL_2",
24
+ "3": "LABEL_3",
25
+ "4": "LABEL_4",
26
+ "5": "LABEL_5",
27
+ "6": "LABEL_6"
28
  },
29
  "initializer_range": 0.02,
30
  "input_size": 224,
31
  "intermediate_size": 3072,
32
  "label2id": {
33
+ "LABEL_0": 0,
34
+ "LABEL_1": 1,
35
+ "LABEL_2": 2,
36
+ "LABEL_3": 3,
37
+ "LABEL_4": 4,
38
+ "LABEL_5": 5,
39
+ "LABEL_6": 6
40
  },
41
  "layer_norm_eps": 1e-05,
42
  "max_2d_position_embeddings": 1024,
43
  "max_position_embeddings": 514,
44
  "max_rel_2d_pos": 256,
45
  "max_rel_pos": 128,
46
+ "mim": false,
47
  "model_type": "layoutlmv3",
48
  "num_attention_heads": 12,
 
49
  "num_hidden_layers": 12,
50
  "pad_token_id": 1,
51
+ "position_embedding_type": "absolute",
52
  "rel_2d_pos_bins": 64,
53
  "rel_pos_bins": 32,
54
  "second_input_size": 112,
55
  "shape_size": 128,
 
56
  "torch_dtype": "float32",
57
+ "transformers_version": "4.12.5",
58
  "type_vocab_size": 1,
59
+ "use_cache": true,
60
  "visual_embed": true,
61
+ "vocab_size": 50265,
62
+ "wpa_task": false
63
  }
eval_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 13.16,
3
+ "eval_accuracy": 0.8535829122645843,
4
+ "eval_f1": 0.9075504610017443,
5
+ "eval_loss": 0.8330431580543518,
6
+ "eval_precision": 0.9046199701937406,
7
+ "eval_recall": 0.9105,
8
+ "eval_runtime": 2.2353,
9
+ "eval_samples": 54,
10
+ "eval_samples_per_second": 24.158,
11
+ "eval_steps_per_second": 1.789
12
+ }
merges.txt CHANGED
@@ -1,4 +1,4 @@
1
- #version: 0.2
2
  Ġ t
3
  Ġ a
4
  h e
 
1
+ #version: 0.2 - Trained by `huggingface/tokenizers`
2
  Ġ t
3
  Ġ a
4
  h e
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a199f09773c9ccd3c9ed282276252abdd4fb21595348d9a4616fad33649056d
3
+ size 501420883
runs/Aug24_17-06-00_bernini/1724512220.8391128/events.out.tfevents.1724512220.bernini.30511.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3da857c91ba0f95212eb2f5941c0edb09aec289239a86860b62ca0a310bbb4f4
3
+ size 4689
runs/Aug24_17-06-00_bernini/events.out.tfevents.1724512220.bernini.30511.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db850f850e6bdc9006830635a2ec09bf1e84faec1d01a1f92c9621ebfef20b35
3
+ size 9322
runs/Aug24_17-06-00_bernini/events.out.tfevents.1724512439.bernini.30511.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89c5ce7ee0f3e9eb76983011c3502f891d63bfb39cf7822811bf69dd7e3195fd
3
+ size 512
special_tokens_map.json CHANGED
@@ -1,51 +1 @@
1
- {
2
- "bos_token": {
3
- "content": "<s>",
4
- "lstrip": false,
5
- "normalized": true,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "cls_token": {
10
- "content": "<s>",
11
- "lstrip": false,
12
- "normalized": true,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "eos_token": {
17
- "content": "</s>",
18
- "lstrip": false,
19
- "normalized": true,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
- "mask_token": {
24
- "content": "<mask>",
25
- "lstrip": true,
26
- "normalized": true,
27
- "rstrip": false,
28
- "single_word": false
29
- },
30
- "pad_token": {
31
- "content": "<pad>",
32
- "lstrip": false,
33
- "normalized": true,
34
- "rstrip": false,
35
- "single_word": false
36
- },
37
- "sep_token": {
38
- "content": "</s>",
39
- "lstrip": false,
40
- "normalized": true,
41
- "rstrip": false,
42
- "single_word": false
43
- },
44
- "unk_token": {
45
- "content": "<unk>",
46
- "lstrip": false,
47
- "normalized": true,
48
- "rstrip": false,
49
- "single_word": false
50
- }
51
- }
 
1
+ {"bos_token": {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "eos_token": {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "unk_token": {"content": "<unk>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "sep_token": {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "pad_token": {"content": "<pad>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "cls_token": {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true}}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,80 +1 @@
1
- {
2
- "add_prefix_space": true,
3
- "added_tokens_decoder": {
4
- "0": {
5
- "content": "<s>",
6
- "lstrip": false,
7
- "normalized": true,
8
- "rstrip": false,
9
- "single_word": false,
10
- "special": true
11
- },
12
- "1": {
13
- "content": "<pad>",
14
- "lstrip": false,
15
- "normalized": true,
16
- "rstrip": false,
17
- "single_word": false,
18
- "special": true
19
- },
20
- "2": {
21
- "content": "</s>",
22
- "lstrip": false,
23
- "normalized": true,
24
- "rstrip": false,
25
- "single_word": false,
26
- "special": true
27
- },
28
- "3": {
29
- "content": "<unk>",
30
- "lstrip": false,
31
- "normalized": true,
32
- "rstrip": false,
33
- "single_word": false,
34
- "special": true
35
- },
36
- "50264": {
37
- "content": "<mask>",
38
- "lstrip": true,
39
- "normalized": true,
40
- "rstrip": false,
41
- "single_word": false,
42
- "special": true
43
- }
44
- },
45
- "apply_ocr": false,
46
- "bos_token": "<s>",
47
- "clean_up_tokenization_spaces": true,
48
- "cls_token": "<s>",
49
- "cls_token_box": [
50
- 0,
51
- 0,
52
- 0,
53
- 0
54
- ],
55
- "eos_token": "</s>",
56
- "errors": "replace",
57
- "mask_token": "<mask>",
58
- "model_max_length": 512,
59
- "only_label_first_subword": true,
60
- "pad_token": "<pad>",
61
- "pad_token_box": [
62
- 0,
63
- 0,
64
- 0,
65
- 0
66
- ],
67
- "pad_token_label": -100,
68
- "processor_class": "LayoutLMv3Processor",
69
- "sep_token": "</s>",
70
- "sep_token_box": [
71
- 0,
72
- 0,
73
- 0,
74
- 0
75
- ],
76
- "tokenizer_class": "LayoutLMv3Tokenizer",
77
- "trim_offsets": true,
78
- "unk_token": "<unk>",
79
- "use_fast": true
80
- }
 
1
+ {"unk_token": {"content": "<unk>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "bos_token": {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "eos_token": {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "add_prefix_space": true, "errors": "replace", "sep_token": {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "cls_token": {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "pad_token": {"content": "<pad>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "microsoft/layoutlmv3-base", "tokenizer_class": "LayoutLMv3Tokenizer"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 13.16,
3
+ "train_loss": 0.256378173828125,
4
+ "train_runtime": 215.2806,
5
+ "train_samples": 150,
6
+ "train_samples_per_second": 9.29,
7
+ "train_steps_per_second": 2.323
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,151 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 13.157894736842104,
5
+ "global_step": 500,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.32,
12
+ "eval_accuracy": 0.8087965089572806,
13
+ "eval_f1": 0.8503675598766895,
14
+ "eval_loss": 0.616326630115509,
15
+ "eval_precision": 0.8087505638249888,
16
+ "eval_recall": 0.8965,
17
+ "eval_runtime": 2.4397,
18
+ "eval_samples_per_second": 22.134,
19
+ "eval_steps_per_second": 1.64,
20
+ "step": 50
21
+ },
22
+ {
23
+ "epoch": 2.63,
24
+ "eval_accuracy": 0.8133899862195683,
25
+ "eval_f1": 0.8346153846153846,
26
+ "eval_loss": 0.541599690914154,
27
+ "eval_precision": 0.8037037037037037,
28
+ "eval_recall": 0.868,
29
+ "eval_runtime": 2.2528,
30
+ "eval_samples_per_second": 23.97,
31
+ "eval_steps_per_second": 1.776,
32
+ "step": 100
33
+ },
34
+ {
35
+ "epoch": 3.95,
36
+ "eval_accuracy": 0.8385392742305926,
37
+ "eval_f1": 0.8659844054580897,
38
+ "eval_loss": 0.5571682453155518,
39
+ "eval_precision": 0.8445817490494296,
40
+ "eval_recall": 0.8885,
41
+ "eval_runtime": 2.2592,
42
+ "eval_samples_per_second": 23.902,
43
+ "eval_steps_per_second": 1.771,
44
+ "step": 150
45
+ },
46
+ {
47
+ "epoch": 5.26,
48
+ "eval_accuracy": 0.8123564538355535,
49
+ "eval_f1": 0.850608998260005,
50
+ "eval_loss": 0.7317042350769043,
51
+ "eval_precision": 0.8457736035590707,
52
+ "eval_recall": 0.8555,
53
+ "eval_runtime": 2.2554,
54
+ "eval_samples_per_second": 23.943,
55
+ "eval_steps_per_second": 1.774,
56
+ "step": 200
57
+ },
58
+ {
59
+ "epoch": 6.58,
60
+ "eval_accuracy": 0.8385392742305926,
61
+ "eval_f1": 0.8906055320209318,
62
+ "eval_loss": 0.7219748497009277,
63
+ "eval_precision": 0.8877297565822156,
64
+ "eval_recall": 0.8935,
65
+ "eval_runtime": 2.2283,
66
+ "eval_samples_per_second": 24.234,
67
+ "eval_steps_per_second": 1.795,
68
+ "step": 250
69
+ },
70
+ {
71
+ "epoch": 7.89,
72
+ "eval_accuracy": 0.8435920992191088,
73
+ "eval_f1": 0.8914595126753629,
74
+ "eval_loss": 0.8069794774055481,
75
+ "eval_precision": 0.8778477944740669,
76
+ "eval_recall": 0.9055,
77
+ "eval_runtime": 2.2476,
78
+ "eval_samples_per_second": 24.025,
79
+ "eval_steps_per_second": 1.78,
80
+ "step": 300
81
+ },
82
+ {
83
+ "epoch": 9.21,
84
+ "eval_accuracy": 0.8477262287551677,
85
+ "eval_f1": 0.9048562933597621,
86
+ "eval_loss": 0.7895194888114929,
87
+ "eval_precision": 0.8968565815324165,
88
+ "eval_recall": 0.913,
89
+ "eval_runtime": 2.3704,
90
+ "eval_samples_per_second": 22.781,
91
+ "eval_steps_per_second": 1.687,
92
+ "step": 350
93
+ },
94
+ {
95
+ "epoch": 10.53,
96
+ "eval_accuracy": 0.8411805236564079,
97
+ "eval_f1": 0.8912280701754386,
98
+ "eval_loss": 0.8168221712112427,
99
+ "eval_precision": 0.893467336683417,
100
+ "eval_recall": 0.889,
101
+ "eval_runtime": 2.4315,
102
+ "eval_samples_per_second": 22.208,
103
+ "eval_steps_per_second": 1.645,
104
+ "step": 400
105
+ },
106
+ {
107
+ "epoch": 11.84,
108
+ "eval_accuracy": 0.8520900321543409,
109
+ "eval_f1": 0.9061264822134387,
110
+ "eval_loss": 0.8232607841491699,
111
+ "eval_precision": 0.8955078125,
112
+ "eval_recall": 0.917,
113
+ "eval_runtime": 2.2665,
114
+ "eval_samples_per_second": 23.825,
115
+ "eval_steps_per_second": 1.765,
116
+ "step": 450
117
+ },
118
+ {
119
+ "epoch": 13.16,
120
+ "learning_rate": 0.0,
121
+ "loss": 0.2564,
122
+ "step": 500
123
+ },
124
+ {
125
+ "epoch": 13.16,
126
+ "eval_accuracy": 0.8535829122645843,
127
+ "eval_f1": 0.9075504610017443,
128
+ "eval_loss": 0.8330431580543518,
129
+ "eval_precision": 0.9046199701937406,
130
+ "eval_recall": 0.9105,
131
+ "eval_runtime": 2.224,
132
+ "eval_samples_per_second": 24.281,
133
+ "eval_steps_per_second": 1.799,
134
+ "step": 500
135
+ },
136
+ {
137
+ "epoch": 13.16,
138
+ "step": 500,
139
+ "total_flos": 520356947539968.0,
140
+ "train_loss": 0.256378173828125,
141
+ "train_runtime": 215.2806,
142
+ "train_samples_per_second": 9.29,
143
+ "train_steps_per_second": 2.323
144
+ }
145
+ ],
146
+ "max_steps": 500,
147
+ "num_train_epochs": 14,
148
+ "total_flos": 520356947539968.0,
149
+ "trial_name": null,
150
+ "trial_params": null
151
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:79a00e9e2eb4d526ef08352565518f227fb0a5281651fc78cd4ba3cb25fb2f28
3
- size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ff27db448ecc4f0766af29a31b5c5ce5b719f6114c6d3e3be5126e0327583fa
3
+ size 2991