lucianoacsilva commited on
Commit
ca7b8f6
·
1 Parent(s): 3c075b0

feature: Faz upload de arquivos do modelo

Browse files
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[BOS]": 29794
3
+ }
all_results.json ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "EOP_f1": 0.7691492742875305,
3
+ "EOP_number": 4774,
4
+ "EOP_precision": 0.7781350482315113,
5
+ "EOP_recall": 0.7603686635944701,
6
+ "accuracy": 0.9456432259834859,
7
+ "epoch": 5.0,
8
+ "eval_EOP_f1": 0.7546452702702704,
9
+ "eval_EOP_number": 2446,
10
+ "eval_EOP_precision": 0.780349344978166,
11
+ "eval_EOP_recall": 0.7305805396565822,
12
+ "eval_da_EOP_f1": 0.7679782903663502,
13
+ "eval_da_EOP_number": 2704,
14
+ "eval_da_EOP_precision": 0.8069246435845214,
15
+ "eval_da_EOP_recall": 0.7326183431952663,
16
+ "eval_da_overall_accuracy": 0.9443618109138235,
17
+ "eval_da_overall_f1": 0.7679782903663502,
18
+ "eval_da_overall_precision": 0.8069246435845214,
19
+ "eval_da_overall_recall": 0.7326183431952663,
20
+ "eval_loss": NaN,
21
+ "eval_overall_accuracy": 0.9436660687448489,
22
+ "eval_overall_f1": 0.7546452702702704,
23
+ "eval_overall_precision": 0.780349344978166,
24
+ "eval_overall_recall": 0.7305805396565822,
25
+ "eval_runtime": 115.155,
26
+ "eval_samples": 1523,
27
+ "eval_samples_per_second": 13.226,
28
+ "eval_steps_per_second": 3.309,
29
+ "overall_accuracy": 0.9456432259834859,
30
+ "overall_f1": 0.7691492742875305,
31
+ "overall_precision": 0.7781350482315113,
32
+ "overall_recall": 0.7603686635944701,
33
+ "predict_EOP_f1": 0.7691492742875305,
34
+ "predict_EOP_number": 4774,
35
+ "predict_EOP_precision": 0.7781350482315113,
36
+ "predict_EOP_recall": 0.7603686635944701,
37
+ "predict_da_EOP_f1": 0.7890958478851378,
38
+ "predict_da_EOP_number": 5339,
39
+ "predict_da_EOP_precision": 0.8184745421614007,
40
+ "predict_da_EOP_recall": 0.7617531372916276,
41
+ "predict_da_overall_accuracy": 0.9483659509785294,
42
+ "predict_da_overall_f1": 0.7890958478851378,
43
+ "predict_da_overall_precision": 0.8184745421614007,
44
+ "predict_da_overall_recall": 0.7617531372916276,
45
+ "predict_examples": 718,
46
+ "predict_loss": NaN,
47
+ "predict_overall_accuracy": 0.9456432259834859,
48
+ "predict_overall_f1": 0.7691492742875305,
49
+ "predict_overall_precision": 0.7781350482315113,
50
+ "predict_overall_recall": 0.7603686635944701,
51
+ "predict_runtime": 220.4272,
52
+ "predict_samples_per_second": 13.238,
53
+ "predict_steps_per_second": 3.312,
54
+ "threshold_0.5_example_level_1-pk": 0.8284,
55
+ "threshold_0.5_example_level_1-wd": 0.8055,
56
+ "threshold_0.5_example_level_f1": 0.7691,
57
+ "threshold_0.5_example_level_pk": 0.17159999999999997,
58
+ "threshold_0.5_example_level_precision": 0.7781,
59
+ "threshold_0.5_example_level_recall": 0.7604,
60
+ "threshold_0.5_example_level_wd": 0.1945,
61
+ "train_loss": 0.545391144610428,
62
+ "train_runtime": 12631.9735,
63
+ "train_samples": 10739,
64
+ "train_samples_per_second": 4.251,
65
+ "train_steps_per_second": 1.063
66
+ }
config.json ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "neuralmind/bert-base-portuguese-cased",
3
+ "architectures": [
4
+ "BertWithDAForSentenceLabelingTopicSegmentation"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "cache_dir": null,
8
+ "cl_anchor_level": "eop_list",
9
+ "cl_loss_weight": 0.5,
10
+ "cl_negative_k": 3,
11
+ "cl_positive_k": 1,
12
+ "cl_temp": 0.1,
13
+ "classifier_dropout": null,
14
+ "config_name": null,
15
+ "directionality": "bidi",
16
+ "do_cssl": true,
17
+ "do_da_ts": true,
18
+ "do_tssp": true,
19
+ "finetuning_task": "topic_segment",
20
+ "focal_loss_gamma": 0.0,
21
+ "hidden_act": "gelu",
22
+ "hidden_dropout_prob": 0.1,
23
+ "hidden_size": 768,
24
+ "id2label": {
25
+ "0": "B-EOP",
26
+ "1": "O"
27
+ },
28
+ "ignore_mismatched_sizes": false,
29
+ "initializer_range": 0.02,
30
+ "intermediate_size": 3072,
31
+ "label2id": {
32
+ "B-EOP": 0,
33
+ "O": 1
34
+ },
35
+ "layer_norm_eps": 1e-12,
36
+ "max_position_embeddings": 512,
37
+ "model_name_or_path": "neuralmind/bert-base-portuguese-cased",
38
+ "model_revision": "main",
39
+ "model_type": "bert",
40
+ "num_attention_heads": 12,
41
+ "num_gpu": 1,
42
+ "num_hidden_layers": 12,
43
+ "num_topic_labels": 0,
44
+ "num_tssp_labels": 3,
45
+ "output_past": true,
46
+ "pad_token_id": 0,
47
+ "pooler_fc_size": 768,
48
+ "pooler_num_attention_heads": 12,
49
+ "pooler_num_fc_layers": 3,
50
+ "pooler_size_per_head": 128,
51
+ "pooler_type": "first_token_transform",
52
+ "position_embedding_type": "absolute",
53
+ "sentence_pooler_type": null,
54
+ "tokenizer_name": null,
55
+ "torch_dtype": "float32",
56
+ "transformers_version": "4.26.0",
57
+ "ts_loss_weight": 1.0,
58
+ "ts_score_predictor": "lt",
59
+ "ts_score_predictor_cos_temp": 1,
60
+ "tssp_ablation": "none",
61
+ "tssp_loss_weight": 1.0,
62
+ "type_vocab_size": 2,
63
+ "use_auth_token": false,
64
+ "use_cache": true,
65
+ "vocab_size": 29795,
66
+ "weight_label_zero": 0.5
67
+ }
eval_results.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "eval_EOP_f1": 0.7546452702702704,
4
+ "eval_EOP_number": 2446,
5
+ "eval_EOP_precision": 0.780349344978166,
6
+ "eval_EOP_recall": 0.7305805396565822,
7
+ "eval_da_EOP_f1": 0.7679782903663502,
8
+ "eval_da_EOP_number": 2704,
9
+ "eval_da_EOP_precision": 0.8069246435845214,
10
+ "eval_da_EOP_recall": 0.7326183431952663,
11
+ "eval_da_overall_accuracy": 0.9443618109138235,
12
+ "eval_da_overall_f1": 0.7679782903663502,
13
+ "eval_da_overall_precision": 0.8069246435845214,
14
+ "eval_da_overall_recall": 0.7326183431952663,
15
+ "eval_loss": NaN,
16
+ "eval_overall_accuracy": 0.9436660687448489,
17
+ "eval_overall_f1": 0.7546452702702704,
18
+ "eval_overall_precision": 0.780349344978166,
19
+ "eval_overall_recall": 0.7305805396565822,
20
+ "eval_runtime": 115.155,
21
+ "eval_samples": 1523,
22
+ "eval_samples_per_second": 13.226,
23
+ "eval_steps_per_second": 3.309
24
+ }
example_level_predict_wiki_section_disease_max_seq512_ts_score_lt_results.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "EOP_f1": 0.7691492742875305,
3
+ "EOP_number": 4774,
4
+ "EOP_precision": 0.7781350482315113,
5
+ "EOP_recall": 0.7603686635944701,
6
+ "accuracy": 0.9456432259834859,
7
+ "overall_accuracy": 0.9456432259834859,
8
+ "overall_f1": 0.7691492742875305,
9
+ "overall_precision": 0.7781350482315113,
10
+ "overall_recall": 0.7603686635944701,
11
+ "predict_examples": 718,
12
+ "threshold_0.5_example_level_1-pk": 0.8284,
13
+ "threshold_0.5_example_level_1-wd": 0.8055,
14
+ "threshold_0.5_example_level_f1": 0.7691,
15
+ "threshold_0.5_example_level_pk": 0.17159999999999997,
16
+ "threshold_0.5_example_level_precision": 0.7781,
17
+ "threshold_0.5_example_level_recall": 0.7604,
18
+ "threshold_0.5_example_level_wd": 0.1945
19
+ }
example_level_predict_wiki_section_disease_max_seq512_ts_score_lt_results_str_metric.txt ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ p / r / f / pk / wd
2
+ threshold_0.5_example_level_metric
3
+ 77.81 / 76.04 / 76.91 / 17.16 / 19.45
4
+
predict_wiki_section_disease_max_seq512_ts_score_lt_results.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "predict_EOP_f1": 0.7691492742875305,
3
+ "predict_EOP_number": 4774,
4
+ "predict_EOP_precision": 0.7781350482315113,
5
+ "predict_EOP_recall": 0.7603686635944701,
6
+ "predict_da_EOP_f1": 0.7890958478851378,
7
+ "predict_da_EOP_number": 5339,
8
+ "predict_da_EOP_precision": 0.8184745421614007,
9
+ "predict_da_EOP_recall": 0.7617531372916276,
10
+ "predict_da_overall_accuracy": 0.9483659509785294,
11
+ "predict_da_overall_f1": 0.7890958478851378,
12
+ "predict_da_overall_precision": 0.8184745421614007,
13
+ "predict_da_overall_recall": 0.7617531372916276,
14
+ "predict_loss": NaN,
15
+ "predict_overall_accuracy": 0.9456432259834859,
16
+ "predict_overall_f1": 0.7691492742875305,
17
+ "predict_overall_precision": 0.7781350482315113,
18
+ "predict_overall_recall": 0.7603686635944701,
19
+ "predict_runtime": 220.4272,
20
+ "predict_samples_per_second": 13.238,
21
+ "predict_steps_per_second": 3.312
22
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:567df42ee1adc5e4ede487db9d98b4c4f359c7e6e8506667892385c303303ff6
3
+ size 435782697
run.log ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[BOS]",
3
+ "cls_token": "[CLS]",
4
+ "mask_token": "[MASK]",
5
+ "pad_token": "[PAD]",
6
+ "sep_token": "[SEP]",
7
+ "unk_token": "[UNK]"
8
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "do_basic_tokenize": true,
4
+ "do_lower_case": false,
5
+ "mask_token": "[MASK]",
6
+ "model_max_length": 1000000000000000019884624838656,
7
+ "name_or_path": "neuralmind/bert-base-portuguese-cased",
8
+ "never_split": null,
9
+ "pad_token": "[PAD]",
10
+ "sep_token": "[SEP]",
11
+ "special_tokens_map_file": "/home/ext_maiara_frodrigues2000_gmail_/.cache/huggingface/hub/models--neuralmind--bert-base-portuguese-cased/snapshots/94d69c95f98f7d5b2a8700c420230ae10def0baa/special_tokens_map.json",
12
+ "strip_accents": null,
13
+ "tokenize_chinese_chars": true,
14
+ "tokenizer_class": "BertTokenizer",
15
+ "unk_token": "[UNK]"
16
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "train_loss": 0.545391144610428,
4
+ "train_runtime": 12631.9735,
5
+ "train_samples": 10739,
6
+ "train_samples_per_second": 4.251,
7
+ "train_steps_per_second": 1.063
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,175 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.7546452702702704,
3
+ "best_model_checkpoint": "./output/neuralmind/bert-base-portuguese-cased-finetune-wiki_section_disease/seed42-seq512-lr5e-05-epoch5-bs4-ts1.0-tssp1.0-cl0.5-2024-05-03_16:56:29/checkpoint-13420",
4
+ "epoch": 5.0,
5
+ "global_step": 13425,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.0,
12
+ "learning_rate": 4.000372439478585e-05,
13
+ "loss": 0.9152,
14
+ "step": 2684
15
+ },
16
+ {
17
+ "epoch": 1.0,
18
+ "eval_EOP_f1": 0.7217790669567319,
19
+ "eval_EOP_number": 2446,
20
+ "eval_EOP_precision": 0.882909520993495,
21
+ "eval_EOP_recall": 0.6103843008994276,
22
+ "eval_da_EOP_f1": 0.7340590979782271,
23
+ "eval_da_EOP_number": 2704,
24
+ "eval_da_EOP_precision": 0.9193099610461881,
25
+ "eval_da_EOP_recall": 0.6109467455621301,
26
+ "eval_da_overall_accuracy": 0.9443618109138235,
27
+ "eval_da_overall_f1": 0.7340590979782271,
28
+ "eval_da_overall_precision": 0.9193099610461881,
29
+ "eval_da_overall_recall": 0.6109467455621301,
30
+ "eval_loss": NaN,
31
+ "eval_overall_accuracy": 0.9441993503660251,
32
+ "eval_overall_f1": 0.7217790669567319,
33
+ "eval_overall_precision": 0.882909520993495,
34
+ "eval_overall_recall": 0.6103843008994276,
35
+ "eval_runtime": 115.3406,
36
+ "eval_samples_per_second": 13.204,
37
+ "eval_steps_per_second": 3.303,
38
+ "step": 2684
39
+ },
40
+ {
41
+ "epoch": 2.0,
42
+ "learning_rate": 3.0007448789571697e-05,
43
+ "loss": 0.6588,
44
+ "step": 5368
45
+ },
46
+ {
47
+ "epoch": 2.0,
48
+ "eval_EOP_f1": 0.7412026726057906,
49
+ "eval_EOP_number": 2446,
50
+ "eval_EOP_precision": 0.8140900195694716,
51
+ "eval_EOP_recall": 0.6802943581357318,
52
+ "eval_da_EOP_f1": 0.7685429790692948,
53
+ "eval_da_EOP_number": 2704,
54
+ "eval_da_EOP_precision": 0.8529544429409112,
55
+ "eval_da_EOP_recall": 0.6993343195266272,
56
+ "eval_da_overall_accuracy": 0.94705772985033,
57
+ "eval_da_overall_f1": 0.7685429790692948,
58
+ "eval_da_overall_precision": 0.8529544429409112,
59
+ "eval_da_overall_recall": 0.6993343195266272,
60
+ "eval_loss": NaN,
61
+ "eval_overall_accuracy": 0.9436660687448489,
62
+ "eval_overall_f1": 0.7412026726057906,
63
+ "eval_overall_precision": 0.8140900195694716,
64
+ "eval_overall_recall": 0.6802943581357318,
65
+ "eval_runtime": 115.0795,
66
+ "eval_samples_per_second": 13.234,
67
+ "eval_steps_per_second": 3.311,
68
+ "step": 5368
69
+ },
70
+ {
71
+ "epoch": 3.0,
72
+ "learning_rate": 2.0011173184357543e-05,
73
+ "loss": 0.4949,
74
+ "step": 8052
75
+ },
76
+ {
77
+ "epoch": 3.0,
78
+ "eval_EOP_f1": 0.7511530858774434,
79
+ "eval_EOP_number": 2446,
80
+ "eval_EOP_precision": 0.8115804461319411,
81
+ "eval_EOP_recall": 0.6991005723630417,
82
+ "eval_da_EOP_f1": 0.7725617159044921,
83
+ "eval_da_EOP_number": 2704,
84
+ "eval_da_EOP_precision": 0.8529937444146559,
85
+ "eval_da_EOP_recall": 0.705991124260355,
86
+ "eval_da_overall_accuracy": 0.9477549502649437,
87
+ "eval_da_overall_f1": 0.7725617159044921,
88
+ "eval_da_overall_precision": 0.8529937444146559,
89
+ "eval_da_overall_recall": 0.705991124260355,
90
+ "eval_loss": NaN,
91
+ "eval_overall_accuracy": 0.9450719930188588,
92
+ "eval_overall_f1": 0.7511530858774434,
93
+ "eval_overall_precision": 0.8115804461319411,
94
+ "eval_overall_recall": 0.6991005723630417,
95
+ "eval_runtime": 114.897,
96
+ "eval_samples_per_second": 13.255,
97
+ "eval_steps_per_second": 3.316,
98
+ "step": 8052
99
+ },
100
+ {
101
+ "epoch": 4.0,
102
+ "learning_rate": 1.001489757914339e-05,
103
+ "loss": 0.3741,
104
+ "step": 10736
105
+ },
106
+ {
107
+ "epoch": 4.0,
108
+ "eval_EOP_f1": 0.752757949383517,
109
+ "eval_EOP_number": 2446,
110
+ "eval_EOP_precision": 0.799265043638034,
111
+ "eval_EOP_recall": 0.7113654946852003,
112
+ "eval_da_EOP_f1": 0.7717067355454003,
113
+ "eval_da_EOP_number": 2704,
114
+ "eval_da_EOP_precision": 0.8338342636324603,
115
+ "eval_da_EOP_recall": 0.7181952662721893,
116
+ "eval_da_overall_accuracy": 0.9465929162405875,
117
+ "eval_da_overall_f1": 0.7717067355454003,
118
+ "eval_da_overall_precision": 0.8338342636324603,
119
+ "eval_da_overall_recall": 0.7181952662721893,
120
+ "eval_loss": NaN,
121
+ "eval_overall_accuracy": 0.9445871915450623,
122
+ "eval_overall_f1": 0.752757949383517,
123
+ "eval_overall_precision": 0.799265043638034,
124
+ "eval_overall_recall": 0.7113654946852003,
125
+ "eval_runtime": 114.8732,
126
+ "eval_samples_per_second": 13.258,
127
+ "eval_steps_per_second": 3.317,
128
+ "step": 10736
129
+ },
130
+ {
131
+ "epoch": 5.0,
132
+ "learning_rate": 1.86219739292365e-08,
133
+ "loss": 0.2844,
134
+ "step": 13420
135
+ },
136
+ {
137
+ "epoch": 5.0,
138
+ "eval_EOP_f1": 0.7546452702702704,
139
+ "eval_EOP_number": 2446,
140
+ "eval_EOP_precision": 0.780349344978166,
141
+ "eval_EOP_recall": 0.7305805396565822,
142
+ "eval_da_EOP_f1": 0.7679782903663502,
143
+ "eval_da_EOP_number": 2704,
144
+ "eval_da_EOP_precision": 0.8069246435845214,
145
+ "eval_da_EOP_recall": 0.7326183431952663,
146
+ "eval_da_overall_accuracy": 0.9443618109138235,
147
+ "eval_da_overall_f1": 0.7679782903663502,
148
+ "eval_da_overall_precision": 0.8069246435845214,
149
+ "eval_da_overall_recall": 0.7326183431952663,
150
+ "eval_loss": NaN,
151
+ "eval_overall_accuracy": 0.9436660687448489,
152
+ "eval_overall_f1": 0.7546452702702704,
153
+ "eval_overall_precision": 0.780349344978166,
154
+ "eval_overall_recall": 0.7305805396565822,
155
+ "eval_runtime": 114.7975,
156
+ "eval_samples_per_second": 13.267,
157
+ "eval_steps_per_second": 3.319,
158
+ "step": 13420
159
+ },
160
+ {
161
+ "epoch": 5.0,
162
+ "step": 13425,
163
+ "total_flos": 2.825625731920896e+16,
164
+ "train_loss": 0.545391144610428,
165
+ "train_runtime": 12631.9735,
166
+ "train_samples_per_second": 4.251,
167
+ "train_steps_per_second": 1.063
168
+ }
169
+ ],
170
+ "max_steps": 13425,
171
+ "num_train_epochs": 5,
172
+ "total_flos": 2.825625731920896e+16,
173
+ "trial_name": null,
174
+ "trial_params": null
175
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3194332b372ea2b036e0fccb377db061e11a589363b40609c5b08e15e729e4f7
3
+ size 3759
vocab.txt ADDED
The diff for this file is too large to render. See raw diff