ArneBinder commited on
Commit
85d9e20
1 Parent(s): 7b3df05

update model

Browse files

https://wandb.ai/arne/dataset-sciarg-task-ner_re-v0.3-training/runs/prik91di

conda-environment.yaml CHANGED
@@ -36,6 +36,7 @@ dependencies:
36
  - attrs==23.1.0
37
  - auto-gptq==0.4.2
38
  - autopage==0.5.1
 
39
  - black==23.7.0
40
  - blis==0.7.10
41
  - catalogue==2.0.9
@@ -56,6 +57,7 @@ dependencies:
56
  - dill==0.3.7
57
  - distlib==0.3.7
58
  - docker-pycreds==0.4.0
 
59
  - en-core-web-trf==3.6.1
60
  - exceptiongroup==1.1.3
61
  - fastjsonschema==2.18.0
@@ -66,7 +68,7 @@ dependencies:
66
  - gitdb==4.0.10
67
  - gitpython==3.1.34
68
  - greenlet==2.0.2
69
- - huggingface-hub==0.19.4
70
  - humanfriendly==10.0
71
  - hydra-colorlog==1.2.0
72
  - hydra-core==1.3.2
@@ -102,16 +104,28 @@ dependencies:
102
  - nodeenv==1.8.0
103
  - numpy==1.25.2
104
  - nvidia-cublas-cu11==11.10.3.66
 
105
  - nvidia-cuda-cupti-cu11==11.7.101
 
106
  - nvidia-cuda-nvrtc-cu11==11.7.99
 
107
  - nvidia-cuda-runtime-cu11==11.7.99
 
108
  - nvidia-cudnn-cu11==8.5.0.96
 
109
  - nvidia-cufft-cu11==10.9.0.58
 
110
  - nvidia-curand-cu11==10.2.10.91
 
111
  - nvidia-cusolver-cu11==11.4.0.1
 
112
  - nvidia-cusparse-cu11==11.7.4.91
 
113
  - nvidia-nccl-cu11==2.14.3
 
 
114
  - nvidia-nvtx-cu11==11.7.91
 
115
  - omegaconf==2.3.0
116
  - optimum==1.12.0
117
  - optuna==2.10.1
@@ -123,9 +137,8 @@ dependencies:
123
  - pathy==0.10.2
124
  - pbr==5.11.1
125
  - peft==0.5.0
126
- - pie-datasets==0.8.1
127
- - pie-models==0.3.0
128
- - pie-modules==0.10.6
129
  - platformdirs==3.10.0
130
  - plotext==5.2.8
131
  - pluggy==1.3.0
@@ -148,7 +161,7 @@ dependencies:
148
  - python-dateutil==2.8.2
149
  - python-dotenv==1.0.0
150
  - pytorch-crf==0.7.2
151
- - pytorch-ie==0.29.8
152
  - pytorch-lightning==2.1.2
153
  - pytz==2023.3.post1
154
  - pyyaml==6.0.1
@@ -158,7 +171,7 @@ dependencies:
158
  - rich==13.5.2
159
  - rouge==1.0.1
160
  - rpds-py==0.10.2
161
- - safetensors==0.3.3
162
  - scipy==1.11.2
163
  - sentencepiece==0.1.99
164
  - sentry-sdk==1.30.0
@@ -176,16 +189,16 @@ dependencies:
176
  - sympy==1.12
177
  - tabulate==0.9.0
178
  - thinc==8.1.12
179
- - tokenizers==0.15.0
180
  - tomli==2.0.1
181
- - torch==2.0.0
182
  - torchmetrics==1.1.1
183
  - tqdm==4.66.1
184
  - traitlets==5.9.0
185
- - transformers==4.36.0
186
- - triton==2.0.0
187
  - typer==0.9.0
188
- - typing-extensions==4.7.1
189
  - tzdata==2023.3
190
  - urllib3==2.0.4
191
  - urwid==2.1.2
 
36
  - attrs==23.1.0
37
  - auto-gptq==0.4.2
38
  - autopage==0.5.1
39
+ - beartype==0.17.2
40
  - black==23.7.0
41
  - blis==0.7.10
42
  - catalogue==2.0.9
 
57
  - dill==0.3.7
58
  - distlib==0.3.7
59
  - docker-pycreds==0.4.0
60
+ - ema-pytorch==0.4.2
61
  - en-core-web-trf==3.6.1
62
  - exceptiongroup==1.1.3
63
  - fastjsonschema==2.18.0
 
68
  - gitdb==4.0.10
69
  - gitpython==3.1.34
70
  - greenlet==2.0.2
71
+ - huggingface-hub==0.23.2
72
  - humanfriendly==10.0
73
  - hydra-colorlog==1.2.0
74
  - hydra-core==1.3.2
 
104
  - nodeenv==1.8.0
105
  - numpy==1.25.2
106
  - nvidia-cublas-cu11==11.10.3.66
107
+ - nvidia-cublas-cu12==12.1.3.1
108
  - nvidia-cuda-cupti-cu11==11.7.101
109
+ - nvidia-cuda-cupti-cu12==12.1.105
110
  - nvidia-cuda-nvrtc-cu11==11.7.99
111
+ - nvidia-cuda-nvrtc-cu12==12.1.105
112
  - nvidia-cuda-runtime-cu11==11.7.99
113
+ - nvidia-cuda-runtime-cu12==12.1.105
114
  - nvidia-cudnn-cu11==8.5.0.96
115
+ - nvidia-cudnn-cu12==8.9.2.26
116
  - nvidia-cufft-cu11==10.9.0.58
117
+ - nvidia-cufft-cu12==11.0.2.54
118
  - nvidia-curand-cu11==10.2.10.91
119
+ - nvidia-curand-cu12==10.3.2.106
120
  - nvidia-cusolver-cu11==11.4.0.1
121
+ - nvidia-cusolver-cu12==11.4.5.107
122
  - nvidia-cusparse-cu11==11.7.4.91
123
+ - nvidia-cusparse-cu12==12.1.0.106
124
  - nvidia-nccl-cu11==2.14.3
125
+ - nvidia-nccl-cu12==2.20.5
126
+ - nvidia-nvjitlink-cu12==12.5.40
127
  - nvidia-nvtx-cu11==11.7.91
128
+ - nvidia-nvtx-cu12==12.1.105
129
  - omegaconf==2.3.0
130
  - optimum==1.12.0
131
  - optuna==2.10.1
 
137
  - pathy==0.10.2
138
  - pbr==5.11.1
139
  - peft==0.5.0
140
+ - pie-datasets==0.10.0
141
+ - pie-modules==0.11.4
 
142
  - platformdirs==3.10.0
143
  - plotext==5.2.8
144
  - pluggy==1.3.0
 
161
  - python-dateutil==2.8.2
162
  - python-dotenv==1.0.0
163
  - pytorch-crf==0.7.2
164
+ - pytorch-ie==0.31.0
165
  - pytorch-lightning==2.1.2
166
  - pytz==2023.3.post1
167
  - pyyaml==6.0.1
 
171
  - rich==13.5.2
172
  - rouge==1.0.1
173
  - rpds-py==0.10.2
174
+ - safetensors==0.4.3
175
  - scipy==1.11.2
176
  - sentencepiece==0.1.99
177
  - sentry-sdk==1.30.0
 
189
  - sympy==1.12
190
  - tabulate==0.9.0
191
  - thinc==8.1.12
192
+ - tokenizers==0.15.2
193
  - tomli==2.0.1
194
+ - torch==2.3.0
195
  - torchmetrics==1.1.1
196
  - tqdm==4.66.1
197
  - traitlets==5.9.0
198
+ - transformers==4.39.3
199
+ - triton==2.3.0
200
  - typer==0.9.0
201
+ - typing-extensions==4.12.0
202
  - tzdata==2023.3
203
  - urllib3==2.0.4
204
  - urwid==2.1.2
config.json CHANGED
@@ -5,6 +5,7 @@
5
  "pretrained_model_name_or_path": "facebook/bart-base",
6
  "use_encoder_mlp": true,
7
  "use_constraints_encoder_mlp": true,
 
8
  "decoder_position_id_pattern": [
9
  0,
10
  0,
@@ -14,6 +15,13 @@
14
  1,
15
  1
16
  ],
 
 
 
 
 
 
 
17
  "encoder_layer_norm_decay": 0.005,
18
  "lr": 6e-05,
19
  "num_beams": 4,
@@ -25,49 +33,49 @@
25
  "target_token_ids": [
26
  0,
27
  2,
28
- 50267,
29
- 50265,
30
- 50268,
31
- 50270,
32
  50271,
33
- 50269,
34
  50272,
35
- 50266
 
 
 
 
36
  ],
37
  "embedding_weight_mapping": {
38
- "50267": [
39
  4146
40
  ],
41
- "50265": [
42
  3618,
43
  1215,
44
  31628
45
  ],
46
- "50268": [
47
  414
48
  ],
49
- "50270": [
50
  308,
51
  1215,
52
  31628
53
  ],
54
- "50271": [
55
  37820
56
  ],
57
- "50269": [
58
  1667,
59
  1215,
60
  1116,
61
  1215,
62
  41690
63
  ],
64
- "50272": [
65
  9031,
66
  38600,
67
  1215,
68
  41690
69
  ],
70
- "50266": [
71
  4548
72
  ]
73
  }
@@ -90,7 +98,6 @@
90
  "tokenizer_name_or_path": "facebook/bart-base",
91
  "document_type": "pytorch_ie.documents.TextDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions",
92
  "tokenized_document_type": "pie_modules.documents.TokenDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions",
93
- "span_layer_name": "labeled_spans",
94
  "relation_layer_name": "binary_relations",
95
  "none_label": "none",
96
  "loop_dummy_relation_name": "loop",
 
5
  "pretrained_model_name_or_path": "facebook/bart-base",
6
  "use_encoder_mlp": true,
7
  "use_constraints_encoder_mlp": true,
8
+ "decoder_position_id_mode": "pattern",
9
  "decoder_position_id_pattern": [
10
  0,
11
  0,
 
15
  1,
16
  1
17
  ],
18
+ "decoder_position_id_mapping": {
19
+ "default": 2,
20
+ "vocab": 3,
21
+ "bos": 0,
22
+ "eos": 1,
23
+ "pad": 1
24
+ },
25
  "encoder_layer_norm_decay": 0.005,
26
  "lr": 6e-05,
27
  "num_beams": 4,
 
33
  "target_token_ids": [
34
  0,
35
  2,
 
 
 
 
36
  50271,
37
+ 50266,
38
  50272,
39
+ 50269,
40
+ 50268,
41
+ 50267,
42
+ 50265,
43
+ 50270
44
  ],
45
  "embedding_weight_mapping": {
46
+ "50271": [
47
  4146
48
  ],
49
+ "50266": [
50
  3618,
51
  1215,
52
  31628
53
  ],
54
+ "50272": [
55
  414
56
  ],
57
+ "50269": [
58
  308,
59
  1215,
60
  31628
61
  ],
62
+ "50268": [
63
  37820
64
  ],
65
+ "50267": [
66
  1667,
67
  1215,
68
  1116,
69
  1215,
70
  41690
71
  ],
72
+ "50265": [
73
  9031,
74
  38600,
75
  1215,
76
  41690
77
  ],
78
+ "50270": [
79
  4548
80
  ]
81
  }
 
98
  "tokenizer_name_or_path": "facebook/bart-base",
99
  "document_type": "pytorch_ie.documents.TextDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions",
100
  "tokenized_document_type": "pie_modules.documents.TokenDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions",
 
101
  "relation_layer_name": "binary_relations",
102
  "none_label": "none",
103
  "loop_dummy_relation_name": "loop",
output.log ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ba1c6af701ccda91275955a32da3eb8b9968017e0ecf2b701d9571ea7e7f2ce
3
- size 567262209
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03c4ad1f1ed0f5cad71e7ebbe689f626ad3fd933f93d90caf8857d7588244338
3
+ size 567262654
requirements.txt ADDED
@@ -0,0 +1,190 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ absl-py==1.4.0
2
+ accelerate==0.22.0
3
+ aiohttp==3.8.5
4
+ aiosignal==1.3.1
5
+ alembic==1.12.0
6
+ annotated-types==0.5.0
7
+ antlr4-python3-runtime==4.9.3
8
+ appdirs==1.4.4
9
+ asciidag==0.2.0
10
+ async-timeout==4.0.3
11
+ attrs==23.1.0
12
+ auto-gptq==0.4.2
13
+ autopage==0.5.1
14
+ beartype==0.17.2
15
+ black==23.7.0
16
+ blis==0.7.10
17
+ catalogue==2.0.9
18
+ certifi==2023.7.22
19
+ cfgv==3.4.0
20
+ charset-normalizer==3.2.0
21
+ click==8.1.7
22
+ cliff==4.3.0
23
+ cmaes==0.10.0
24
+ cmake==3.27.4.1
25
+ cmd2==2.4.3
26
+ coloredlogs==15.0.1
27
+ colorlog==6.7.0
28
+ confection==0.1.1
29
+ coverage==7.3.0
30
+ cymem==2.0.7
31
+ datasets==2.14.4
32
+ dill==0.3.7
33
+ distlib==0.3.7
34
+ docker-pycreds==0.4.0
35
+ ema-pytorch==0.4.2
36
+ en-core-web-trf==3.6.1
37
+ exceptiongroup==1.1.3
38
+ fastjsonschema==2.18.0
39
+ filelock==3.12.3
40
+ flake8==6.1.0
41
+ frozenlist==1.4.0
42
+ fsspec==2023.6.0
43
+ gitdb==4.0.10
44
+ gitpython==3.1.34
45
+ greenlet==2.0.2
46
+ huggingface-hub==0.23.2
47
+ humanfriendly==10.0
48
+ hydra-colorlog==1.2.0
49
+ hydra-core==1.3.2
50
+ hydra-optuna-sweeper==1.2.0
51
+ identify==2.5.27
52
+ idna==3.4
53
+ importlib-metadata==6.8.0
54
+ iniconfig==2.0.0
55
+ isort==5.12.0
56
+ jedi==0.19.0
57
+ jinja2==3.1.2
58
+ joblib==1.3.2
59
+ jsonschema-specifications==2023.7.1
60
+ jsonschema==4.19.0
61
+ jupyter-core==5.3.1
62
+ langcodes==3.3.0
63
+ lightning-utilities==0.9.0
64
+ lit==16.0.6
65
+ mako==1.2.4
66
+ markdown-it-py==3.0.0
67
+ markupsafe==2.1.3
68
+ mccabe==0.7.0
69
+ mdurl==0.1.2
70
+ mpmath==1.3.0
71
+ multidict==6.0.4
72
+ multiprocess==0.70.15
73
+ murmurhash==1.0.9
74
+ mypy-extensions==1.0.0
75
+ nbformat==5.9.2
76
+ nbstripout==0.6.1
77
+ networkx==3.1
78
+ nltk==3.8.1
79
+ nodeenv==1.8.0
80
+ numpy==1.25.2
81
+ nvidia-cublas-cu11==11.10.3.66
82
+ nvidia-cublas-cu12==12.1.3.1
83
+ nvidia-cuda-cupti-cu11==11.7.101
84
+ nvidia-cuda-cupti-cu12==12.1.105
85
+ nvidia-cuda-nvrtc-cu11==11.7.99
86
+ nvidia-cuda-nvrtc-cu12==12.1.105
87
+ nvidia-cuda-runtime-cu11==11.7.99
88
+ nvidia-cuda-runtime-cu12==12.1.105
89
+ nvidia-cudnn-cu11==8.5.0.96
90
+ nvidia-cudnn-cu12==8.9.2.26
91
+ nvidia-cufft-cu11==10.9.0.58
92
+ nvidia-cufft-cu12==11.0.2.54
93
+ nvidia-curand-cu11==10.2.10.91
94
+ nvidia-curand-cu12==10.3.2.106
95
+ nvidia-cusolver-cu11==11.4.0.1
96
+ nvidia-cusolver-cu12==11.4.5.107
97
+ nvidia-cusparse-cu11==11.7.4.91
98
+ nvidia-cusparse-cu12==12.1.0.106
99
+ nvidia-nccl-cu11==2.14.3
100
+ nvidia-nccl-cu12==2.20.5
101
+ nvidia-nvjitlink-cu12==12.5.40
102
+ nvidia-nvtx-cu11==11.7.91
103
+ nvidia-nvtx-cu12==12.1.105
104
+ omegaconf==2.3.0
105
+ optimum==1.12.0
106
+ optuna==2.10.1
107
+ packaging==23.1
108
+ pandas==2.1.0
109
+ parso==0.8.3
110
+ pathspec==0.11.2
111
+ pathtools==0.1.2
112
+ pathy==0.10.2
113
+ pbr==5.11.1
114
+ peft==0.5.0
115
+ pie-datasets==0.10.0
116
+ pie-modules==0.11.4
117
+ pip==23.2.1
118
+ platformdirs==3.10.0
119
+ plotext==5.2.8
120
+ pluggy==1.3.0
121
+ pre-commit==3.4.0
122
+ preshed==3.0.8
123
+ prettytable==3.8.0
124
+ protobuf==4.24.2
125
+ psutil==5.9.5
126
+ pudb==2022.1.3
127
+ pyarrow==13.0.0
128
+ pycodestyle==2.11.0
129
+ pydantic-core==2.6.3
130
+ pydantic==2.3.0
131
+ pyflakes==3.1.0
132
+ pygments==2.16.1
133
+ pyperclip==1.8.2
134
+ pyrootutils==1.0.4
135
+ pytest-cov==4.1.0
136
+ pytest==7.4.1
137
+ python-dateutil==2.8.2
138
+ python-dotenv==1.0.0
139
+ pytorch-crf==0.7.2
140
+ pytorch-ie==0.31.0
141
+ pytorch-lightning==2.1.2
142
+ pytz==2023.3.post1
143
+ pyyaml==6.0.1
144
+ referencing==0.30.2
145
+ regex==2023.8.8
146
+ requests==2.31.0
147
+ rich==13.5.2
148
+ rouge==1.0.1
149
+ rpds-py==0.10.2
150
+ safetensors==0.4.3
151
+ scipy==1.11.2
152
+ sentencepiece==0.1.99
153
+ sentry-sdk==1.30.0
154
+ setproctitle==1.3.2
155
+ setuptools==68.0.0
156
+ sh==2.0.6
157
+ six==1.16.0
158
+ smart-open==6.3.0
159
+ smmap==5.0.0
160
+ spacy-alignments==0.9.0
161
+ spacy-legacy==3.0.12
162
+ spacy-loggers==1.0.4
163
+ sqlalchemy==2.0.20
164
+ srsly==2.4.7
165
+ stevedore==5.1.0
166
+ sympy==1.12
167
+ tabulate==0.9.0
168
+ thinc==8.1.12
169
+ tokenizers==0.15.2
170
+ tomli==2.0.1
171
+ torch==2.3.0
172
+ torchmetrics==1.1.1
173
+ tqdm==4.66.1
174
+ traitlets==5.9.0
175
+ transformers==4.39.3
176
+ triton==2.3.0
177
+ typer==0.9.0
178
+ typing-extensions==4.12.0
179
+ tzdata==2023.3
180
+ urllib3==2.0.4
181
+ urwid-readline==0.13
182
+ urwid==2.1.2
183
+ virtualenv==20.24.4
184
+ wandb==0.15.9
185
+ wasabi==1.1.2
186
+ wcwidth==0.2.6
187
+ wheel==0.38.4
188
+ xxhash==3.3.0
189
+ yarl==1.9.2
190
+ zipp==3.16.2
taskmodule_config.json CHANGED
@@ -3,7 +3,6 @@
3
  "tokenizer_name_or_path": "facebook/bart-base",
4
  "document_type": "pytorch_ie.documents.TextDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions",
5
  "tokenized_document_type": "pie_modules.documents.TokenDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions",
6
- "span_layer_name": "labeled_spans",
7
  "relation_layer_name": "binary_relations",
8
  "none_label": "none",
9
  "loop_dummy_relation_name": "loop",
 
3
  "tokenizer_name_or_path": "facebook/bart-base",
4
  "document_type": "pytorch_ie.documents.TextDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions",
5
  "tokenized_document_type": "pie_modules.documents.TokenDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions",
 
6
  "relation_layer_name": "binary_relations",
7
  "none_label": "none",
8
  "loop_dummy_relation_name": "loop",
wandb-metadata.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "os": "Linux-5.15.0-86-generic-x86_64-with-glibc2.35",
3
  "python": "3.9.17",
4
- "heartbeatAt": "2024-03-01T17:25:43.088987",
5
- "startedAt": "2024-03-01T17:25:42.069556",
6
  "docker": null,
7
  "cuda": null,
8
  "args": [
@@ -23,7 +23,7 @@
23
  "codePath": "src/train.py",
24
  "git": {
25
  "remote": "[email protected]:ArneBinder/pie-document-level.git",
26
- "commit": "6deb3a264efba32f48f10addd87ccea04d4f8b5e"
27
  },
28
  "email": "[email protected]",
29
  "root": "/home/arne/projects/pie-document-level",
@@ -33,7 +33,7 @@
33
  "cpu_count": 6,
34
  "cpu_count_logical": 12,
35
  "cpu_freq": {
36
- "current": 2199.99725,
37
  "min": 2200.0,
38
  "max": 3600.0
39
  },
@@ -84,7 +84,7 @@
84
  "max": 3600.0
85
  },
86
  {
87
- "current": 2200.0,
88
  "min": 2200.0,
89
  "max": 3600.0
90
  },
@@ -94,14 +94,14 @@
94
  "max": 3600.0
95
  },
96
  {
97
- "current": 2199.967,
98
  "min": 2200.0,
99
  "max": 3600.0
100
  }
101
  ],
102
  "disk": {
103
  "total": 878.620922088623,
104
- "used": 658.1419486999512
105
  },
106
  "gpu": "NVIDIA GeForce RTX 2080 Ti",
107
  "gpu_count": 1,
 
1
  {
2
  "os": "Linux-5.15.0-86-generic-x86_64-with-glibc2.35",
3
  "python": "3.9.17",
4
+ "heartbeatAt": "2024-05-28T21:33:56.005050",
5
+ "startedAt": "2024-05-28T21:33:54.883067",
6
  "docker": null,
7
  "cuda": null,
8
  "args": [
 
23
  "codePath": "src/train.py",
24
  "git": {
25
  "remote": "[email protected]:ArneBinder/pie-document-level.git",
26
+ "commit": "98092aa0b288a843bfaa5e07ff06cfe3cd882b32"
27
  },
28
  "email": "[email protected]",
29
  "root": "/home/arne/projects/pie-document-level",
 
33
  "cpu_count": 6,
34
  "cpu_count_logical": 12,
35
  "cpu_freq": {
36
+ "current": 2304.1169999999997,
37
  "min": 2200.0,
38
  "max": 3600.0
39
  },
 
84
  "max": 3600.0
85
  },
86
  {
87
+ "current": 2049.404,
88
  "min": 2200.0,
89
  "max": 3600.0
90
  },
 
94
  "max": 3600.0
95
  },
96
  {
97
+ "current": 3600.0,
98
  "min": 2200.0,
99
  "max": 3600.0
100
  }
101
  ],
102
  "disk": {
103
  "total": 878.620922088623,
104
+ "used": 661.2135887145996
105
  },
106
  "gpu": "NVIDIA GeForce RTX 2080 Ti",
107
  "gpu_count": 1,
wandb-summary.json CHANGED
@@ -1 +1 @@
1
- {"loss/train_step": 0.01761285401880741, "epoch": 150, "trainer/global_step": 39450, "_timestamp": 1709331727.5671468, "_runtime": 17785.49159884453, "_step": 1090, "loss/val": 2.5551652908325195, "metric/exact_encoding_matches/val": 0.3253012001514435, "metric/decoding_errors/all/val": 0.0, "metric/labeled_spans/micro/f1/val": 0.4795539081096649, "metric/labeled_spans/micro/recall/val": 0.4955185651779175, "metric/labeled_spans/micro/precision/val": 0.4645858407020569, "metric/labeled_spans/background_claim/f1/val": 0.5347467660903931, "metric/labeled_spans/background_claim/recall/val": 0.5159090757369995, "metric/labeled_spans/background_claim/precision/val": 0.5550122261047363, "metric/labeled_spans/data/f1/val": 0.5673912763595581, "metric/labeled_spans/data/recall/val": 0.5661605000495911, "metric/labeled_spans/data/precision/val": 0.5686274766921997, "metric/labeled_spans/own_claim/f1/val": 0.3920493423938751, "metric/labeled_spans/own_claim/recall/val": 0.4326777756214142, "metric/labeled_spans/own_claim/precision/val": 0.3583959937095642, "metric/labeled_spans/macro/f1/val": 0.49806246161460876, "metric/labeled_spans/macro/recall/val": 0.5049158334732056, "metric/labeled_spans/macro/precision/val": 0.49401187896728516, "metric/binary_relations/micro/f1/val": 0.2759901285171509, "metric/binary_relations/micro/recall/val": 0.2657926082611084, "metric/binary_relations/micro/precision/val": 0.28700128197669983, "metric/binary_relations/parts_of_same/f1/val": 0.2459016591310501, "metric/binary_relations/parts_of_same/recall/val": 0.23999999463558197, "metric/binary_relations/parts_of_same/precision/val": 0.2521008551120758, "metric/binary_relations/supports/f1/val": 0.2857142686843872, "metric/binary_relations/supports/recall/val": 0.27953410148620605, "metric/binary_relations/supports/precision/val": 0.29217392206192017, "metric/binary_relations/contradicts/f1/val": 0.26455026865005493, "metric/binary_relations/contradicts/recall/val": 0.23364485800266266, "metric/binary_relations/contradicts/precision/val": 0.3048780560493469, "metric/binary_relations/macro/f1/val": 0.19904154539108276, "metric/binary_relations/macro/recall/val": 0.18829473853111267, "metric/binary_relations/macro/precision/val": 0.21228821575641632, "metric/binary_relations/semantically_same/f1/val": 0.0, "metric/binary_relations/semantically_same/recall/val": 0.0, "metric/binary_relations/semantically_same/precision/val": 0.0, "loss/train_epoch": 0.06590206921100616, "metric/exact_encoding_matches/train": 0.9276190400123596, "metric/decoding_errors/label/train": 0.0002683123166207224, "metric/decoding_errors/index/train": 0.0, "metric/decoding_errors/len/train": 0.0001341561583103612, "metric/decoding_errors/order/train": 0.003353904001414776, "metric/decoding_errors/correct/train": 0.9962436556816101, "metric/decoding_errors/all/train": 0.0037563724908977747, "metric/labeled_spans/background_claim/f1/train": 0.9950291514396667, "metric/labeled_spans/background_claim/recall/train": 0.9943844676017761, "metric/labeled_spans/background_claim/precision/train": 0.995674729347229, "metric/labeled_spans/data/f1/train": 0.9951720833778381, "metric/labeled_spans/data/recall/train": 0.994088351726532, "metric/labeled_spans/data/precision/train": 0.9962581992149353, "metric/labeled_spans/own_claim/f1/train": 0.997970700263977, "metric/labeled_spans/own_claim/recall/train": 0.9975208640098572, "metric/labeled_spans/own_claim/precision/train": 0.9984209537506104, "metric/labeled_spans/micro/f1/train": 0.9963851571083069, "metric/labeled_spans/micro/recall/train": 0.995685338973999, "metric/labeled_spans/micro/precision/train": 0.9970859885215759, "metric/labeled_spans/macro/f1/train": 0.9960572719573975, "metric/labeled_spans/macro/recall/train": 0.9953312277793884, "metric/labeled_spans/macro/precision/train": 0.9967846274375916, "metric/binary_relations/supports/f1/train": 0.9916067123413086, "metric/binary_relations/supports/recall/train": 0.9889978766441345, "metric/binary_relations/supports/precision/train": 0.9942293763160706, "metric/binary_relations/micro/f1/train": 0.9924262166023254, "metric/binary_relations/micro/recall/train": 0.9898684620857239, "metric/binary_relations/micro/precision/train": 0.9949973225593567, "metric/binary_relations/parts_of_same/f1/train": 0.9962507486343384, "metric/binary_relations/parts_of_same/recall/train": 0.9935897588729858, "metric/binary_relations/parts_of_same/precision/train": 0.9989258646965027, "metric/binary_relations/contradicts/f1/train": 0.9927158951759338, "metric/binary_relations/contradicts/recall/train": 0.9916840195655823, "metric/binary_relations/contradicts/precision/train": 0.9937499761581421, "metric/binary_relations/semantically_same/f1/train": 0.9818181991577148, "metric/binary_relations/semantically_same/recall/train": 0.9642857313156128, "metric/binary_relations/semantically_same/precision/train": 1.0, "metric/binary_relations/macro/f1/train": 0.9905978441238403, "metric/binary_relations/macro/recall/train": 0.9846393465995789, "metric/binary_relations/macro/precision/train": 0.9967262744903564, "metric/decoding_errors/correct/val": 1.0, "metric/decoding_errors/index/val": 0.0, "metric/decoding_errors/len/val": 0.0, "loss/test": 2.615832805633545, "metric/exact_encoding_matches/test": 0.3636363744735718, "metric/decoding_errors/correct/test": 1.0, "metric/decoding_errors/all/test": 0.0, "metric/labeled_spans/micro/f1/test": 0.4372429847717285, "metric/labeled_spans/micro/recall/test": 0.4461228549480438, "metric/labeled_spans/micro/precision/test": 0.4287096858024597, "metric/labeled_spans/own_claim/f1/test": 0.3857002258300781, "metric/labeled_spans/own_claim/recall/test": 0.4384787380695343, "metric/labeled_spans/own_claim/precision/test": 0.3442623019218445, "metric/labeled_spans/background_claim/f1/test": 0.4095562994480133, "metric/labeled_spans/background_claim/recall/test": 0.34433284401893616, "metric/labeled_spans/background_claim/precision/test": 0.5052631497383118, "metric/labeled_spans/data/f1/test": 0.5392895340919495, "metric/labeled_spans/data/recall/test": 0.5324123501777649, "metric/labeled_spans/data/precision/test": 0.5463467836380005, "metric/labeled_spans/macro/f1/test": 0.4448487162590027, "metric/labeled_spans/macro/recall/test": 0.4384079873561859, "metric/labeled_spans/macro/precision/test": 0.46529075503349304, "metric/binary_relations/micro/f1/test": 0.21993334591388702, "metric/binary_relations/micro/recall/test": 0.20381808280944824, "metric/binary_relations/micro/precision/test": 0.2388157844543457, "metric/binary_relations/parts_of_same/f1/test": 0.19502867758274078, "metric/binary_relations/parts_of_same/recall/test": 0.1764705926179886, "metric/binary_relations/parts_of_same/precision/test": 0.21794871985912323, "metric/binary_relations/supports/f1/test": 0.22637012600898743, "metric/binary_relations/supports/recall/test": 0.21079881489276886, "metric/binary_relations/supports/precision/test": 0.24442538619041443, "metric/binary_relations/contradicts/f1/test": 0.2039215862751007, "metric/binary_relations/contradicts/recall/test": 0.18978102505207062, "metric/binary_relations/contradicts/precision/test": 0.22033898532390594, "metric/binary_relations/semantically_same/f1/test": 0.4000000059604645, "metric/binary_relations/semantically_same/recall/test": 0.3333333432674408, "metric/binary_relations/semantically_same/precision/test": 0.5, "metric/binary_relations/macro/f1/test": 0.25633010268211365, "metric/binary_relations/macro/recall/test": 0.2275959551334381, "metric/binary_relations/macro/precision/test": 0.2956782579421997, "_wandb": {"runtime": 17784}}
 
1
+ {"loss/train_step": 0.028341908007860184, "epoch": 150, "trainer/global_step": 40200, "_timestamp": 1716949379.1344945, "_runtime": 17344.248886585236, "_step": 1105, "loss/val": 2.3559770584106445, "metric/exact_encoding_matches/val": 0.3611111044883728, "metric/decoding_errors/all/val": 0.0, "metric/labeled_spans/micro/f1/val": 0.4843537509441376, "metric/labeled_spans/micro/recall/val": 0.49273356795310974, "metric/labeled_spans/micro/precision/val": 0.4762541949748993, "metric/labeled_spans/data/f1/val": 0.536285400390625, "metric/labeled_spans/data/recall/val": 0.4988558292388916, "metric/labeled_spans/data/precision/val": 0.5797872543334961, "metric/labeled_spans/background_claim/f1/val": 0.5077399015426636, "metric/labeled_spans/background_claim/recall/val": 0.5173501372337341, "metric/labeled_spans/background_claim/precision/val": 0.4984802305698395, "metric/labeled_spans/own_claim/f1/val": 0.4456448256969452, "metric/labeled_spans/own_claim/recall/val": 0.47756874561309814, "metric/labeled_spans/own_claim/precision/val": 0.4177215099334717, "metric/labeled_spans/macro/f1/val": 0.49655672907829285, "metric/labeled_spans/macro/recall/val": 0.49792489409446716, "metric/labeled_spans/macro/precision/val": 0.4986630082130432, "metric/binary_relations/micro/f1/val": 0.23862887918949127, "metric/binary_relations/micro/recall/val": 0.22100122272968292, "metric/binary_relations/micro/precision/val": 0.25931233167648315, "metric/binary_relations/supports/f1/val": 0.2470904141664505, "metric/binary_relations/supports/recall/val": 0.22847682237625122, "metric/binary_relations/supports/precision/val": 0.26900583505630493, "metric/binary_relations/contradicts/f1/val": 0.20481927692890167, "metric/binary_relations/contradicts/recall/val": 0.18681319057941437, "metric/binary_relations/contradicts/precision/val": 0.2266666740179062, "metric/binary_relations/parts_of_same/f1/val": 0.22608695924282074, "metric/binary_relations/parts_of_same/recall/val": 0.21666666865348816, "metric/binary_relations/parts_of_same/precision/val": 0.23636363446712494, "metric/binary_relations/macro/f1/val": 0.16949915885925293, "metric/binary_relations/macro/recall/val": 0.15798917412757874, "metric/binary_relations/macro/precision/val": 0.1830090433359146, "metric/decoding_errors/correct/val": 1.0, "metric/decoding_errors/index/val": 0.0, "metric/decoding_errors/len/val": 0.0, "metric/binary_relations/semantically_same/f1/val": 0.0, "metric/binary_relations/semantically_same/recall/val": 0.0, "metric/binary_relations/semantically_same/precision/val": 0.0, "loss/train_epoch": 0.05872185528278351, "metric/exact_encoding_matches/train": 0.8992537260055542, "metric/decoding_errors/label/train": 0.0005325522506609559, "metric/decoding_errors/len/train": 0.00013313806266523898, "metric/decoding_errors/order/train": 0.004526694305241108, "metric/decoding_errors/index/train": 0.00026627612533047795, "metric/decoding_errors/all/train": 0.005458660423755646, "metric/labeled_spans/background_claim/f1/train": 0.9948760271072388, "metric/labeled_spans/background_claim/recall/train": 0.9954881072044373, "metric/labeled_spans/background_claim/precision/train": 0.9942646622657776, "metric/labeled_spans/data/f1/train": 0.9939675331115723, "metric/labeled_spans/data/recall/train": 0.9922791719436646, "metric/labeled_spans/data/precision/train": 0.9956616163253784, "metric/labeled_spans/own_claim/f1/train": 0.9964792132377625, "metric/labeled_spans/own_claim/recall/train": 0.9954617619514465, "metric/labeled_spans/own_claim/precision/train": 0.9974988698959351, "metric/labeled_spans/micro/f1/train": 0.9952850937843323, "metric/labeled_spans/micro/recall/train": 0.9944460988044739, "metric/labeled_spans/micro/precision/train": 0.9961255788803101, "metric/labeled_spans/macro/f1/train": 0.9951075911521912, "metric/labeled_spans/macro/recall/train": 0.9944097399711609, "metric/labeled_spans/macro/precision/train": 0.995808482170105, "metric/binary_relations/supports/f1/train": 0.9914755821228027, "metric/binary_relations/supports/recall/train": 0.9882718920707703, "metric/binary_relations/supports/precision/train": 0.9947000741958618, "metric/binary_relations/contradicts/f1/train": 0.9827761054039001, "metric/binary_relations/contradicts/recall/train": 0.9758551120758057, "metric/binary_relations/contradicts/precision/train": 0.9897959232330322, "metric/binary_relations/parts_of_same/f1/train": 0.9888119101524353, "metric/binary_relations/parts_of_same/recall/train": 0.9861848950386047, "metric/binary_relations/parts_of_same/precision/train": 0.9914529919624329, "metric/binary_relations/micro/f1/train": 0.990313708782196, "metric/binary_relations/micro/recall/train": 0.986893355846405, "metric/binary_relations/micro/precision/train": 0.9937577843666077, "metric/binary_relations/semantically_same/f1/train": 1.0, "metric/binary_relations/semantically_same/recall/train": 1.0, "metric/binary_relations/semantically_same/precision/train": 1.0, "metric/binary_relations/macro/f1/train": 0.9907659292221069, "metric/binary_relations/macro/recall/train": 0.9875779747962952, "metric/binary_relations/macro/precision/train": 0.9939872026443481, "metric/decoding_errors/correct/train": 0.994541347026825, "loss/test": 3.026346206665039, "metric/exact_encoding_matches/test": 0.34545454382896423, "metric/decoding_errors/correct/test": 0.7914345264434814, "metric/decoding_errors/index/test": 0.00034818940912373364, "metric/decoding_errors/len/test": 0.20821726322174072, "metric/decoding_errors/all/test": 0.20856545865535736, "metric/labeled_spans/micro/f1/test": 0.42222580313682556, "metric/labeled_spans/micro/recall/test": 0.4387378394603729, "metric/labeled_spans/micro/precision/test": 0.40691158175468445, "metric/labeled_spans/data/f1/test": 0.5156335234642029, "metric/labeled_spans/data/recall/test": 0.4994686543941498, "metric/labeled_spans/data/precision/test": 0.5328798294067383, "metric/labeled_spans/background_claim/f1/test": 0.42137405276298523, "metric/labeled_spans/background_claim/recall/test": 0.3959827721118927, "metric/labeled_spans/background_claim/precision/test": 0.4502446949481964, "metric/labeled_spans/own_claim/f1/test": 0.36690646409988403, "metric/labeled_spans/own_claim/recall/test": 0.41834452748298645, "metric/labeled_spans/own_claim/precision/test": 0.32673266530036926, "metric/labeled_spans/macro/f1/test": 0.43463802337646484, "metric/labeled_spans/macro/recall/test": 0.43793198466300964, "metric/labeled_spans/macro/precision/test": 0.4366190433502197, "metric/binary_relations/micro/f1/test": 0.21676044166088104, "metric/binary_relations/micro/recall/test": 0.20550252497196198, "metric/binary_relations/micro/precision/test": 0.22932331264019012, "metric/binary_relations/supports/f1/test": 0.22440946102142334, "metric/binary_relations/supports/recall/test": 0.21079881489276886, "metric/binary_relations/supports/precision/test": 0.23989899456501007, "metric/binary_relations/contradicts/f1/test": 0.22545455396175385, "metric/binary_relations/contradicts/recall/test": 0.22627736628055573, "metric/binary_relations/contradicts/precision/test": 0.2246376872062683, "metric/binary_relations/parts_of_same/f1/test": 0.17359857261180878, "metric/binary_relations/parts_of_same/recall/test": 0.1660899668931961, "metric/binary_relations/parts_of_same/precision/test": 0.1818181872367859, "metric/binary_relations/semantically_same/f1/test": 0.444444477558136, "metric/binary_relations/semantically_same/recall/test": 0.6666666865348816, "metric/binary_relations/semantically_same/precision/test": 0.3333333432674408, "metric/binary_relations/macro/f1/test": 0.2669767737388611, "metric/binary_relations/macro/recall/test": 0.31745821237564087, "metric/binary_relations/macro/precision/test": 0.24492204189300537, "_wandb": {"runtime": 17343}}