ArneBinder's picture
add train config and metadata
df85382 verified
raw
history blame
18.7 kB
wandb_version: 1
_wandb:
desc: null
value:
python_version: 3.9.17
cli_version: 0.15.9
framework: huggingface
huggingface_version: 4.36.0
is_jupyter_run: false
is_kaggle_kernel: false
start_time: 1709313942.075548
t:
1:
- 1
- 9
- 11
- 49
- 50
- 51
- 55
- 71
- 103
2:
- 1
- 9
- 11
- 49
- 50
- 51
- 55
- 71
- 103
3:
- 2
- 7
- 15
- 23
4: 3.9.17
5: 0.15.9
6: 4.36.0
8:
- 5
m:
- 1: trainer/global_step
6:
- 3
- 1: loss/train_step
5: 1
6:
- 1
- 1: epoch
5: 1
6:
- 1
- 1: loss/val
5: 1
6:
- 1
- 1: metric/exact_encoding_matches/val
5: 1
6:
- 1
- 1: metric/decoding_errors/all/val
5: 1
6:
- 1
- 1: metric/labeled_spans/micro/f1/val
5: 1
6:
- 1
- 1: metric/labeled_spans/micro/recall/val
5: 1
6:
- 1
- 1: metric/labeled_spans/micro/precision/val
5: 1
6:
- 1
- 1: metric/labeled_spans/background_claim/f1/val
5: 1
6:
- 1
- 1: metric/labeled_spans/background_claim/recall/val
5: 1
6:
- 1
- 1: metric/labeled_spans/background_claim/precision/val
5: 1
6:
- 1
- 1: metric/labeled_spans/data/f1/val
5: 1
6:
- 1
- 1: metric/labeled_spans/data/recall/val
5: 1
6:
- 1
- 1: metric/labeled_spans/data/precision/val
5: 1
6:
- 1
- 1: metric/labeled_spans/own_claim/f1/val
5: 1
6:
- 1
- 1: metric/labeled_spans/own_claim/recall/val
5: 1
6:
- 1
- 1: metric/labeled_spans/own_claim/precision/val
5: 1
6:
- 1
- 1: metric/labeled_spans/macro/f1/val
5: 1
6:
- 1
- 1: metric/labeled_spans/macro/recall/val
5: 1
6:
- 1
- 1: metric/labeled_spans/macro/precision/val
5: 1
6:
- 1
- 1: metric/binary_relations/micro/f1/val
5: 1
6:
- 1
- 1: metric/binary_relations/micro/recall/val
5: 1
6:
- 1
- 1: metric/binary_relations/micro/precision/val
5: 1
6:
- 1
- 1: metric/binary_relations/parts_of_same/f1/val
5: 1
6:
- 1
- 1: metric/binary_relations/parts_of_same/recall/val
5: 1
6:
- 1
- 1: metric/binary_relations/parts_of_same/precision/val
5: 1
6:
- 1
- 1: metric/binary_relations/supports/f1/val
5: 1
6:
- 1
- 1: metric/binary_relations/supports/recall/val
5: 1
6:
- 1
- 1: metric/binary_relations/supports/precision/val
5: 1
6:
- 1
- 1: metric/binary_relations/contradicts/f1/val
5: 1
6:
- 1
- 1: metric/binary_relations/contradicts/recall/val
5: 1
6:
- 1
- 1: metric/binary_relations/contradicts/precision/val
5: 1
6:
- 1
- 1: metric/binary_relations/macro/f1/val
5: 1
6:
- 1
- 1: metric/binary_relations/macro/recall/val
5: 1
6:
- 1
- 1: metric/binary_relations/macro/precision/val
5: 1
6:
- 1
- 1: metric/binary_relations/semantically_same/f1/val
5: 1
6:
- 1
- 1: metric/binary_relations/semantically_same/recall/val
5: 1
6:
- 1
- 1: metric/binary_relations/semantically_same/precision/val
5: 1
6:
- 1
- 1: loss/train_epoch
5: 1
6:
- 1
- 1: metric/exact_encoding_matches/train
5: 1
6:
- 1
- 1: metric/decoding_errors/label/train
5: 1
6:
- 1
- 1: metric/decoding_errors/index/train
5: 1
6:
- 1
- 1: metric/decoding_errors/len/train
5: 1
6:
- 1
- 1: metric/decoding_errors/order/train
5: 1
6:
- 1
- 1: metric/decoding_errors/correct/train
5: 1
6:
- 1
- 1: metric/decoding_errors/all/train
5: 1
6:
- 1
- 1: metric/labeled_spans/background_claim/f1/train
5: 1
6:
- 1
- 1: metric/labeled_spans/background_claim/recall/train
5: 1
6:
- 1
- 1: metric/labeled_spans/background_claim/precision/train
5: 1
6:
- 1
- 1: metric/labeled_spans/data/f1/train
5: 1
6:
- 1
- 1: metric/labeled_spans/data/recall/train
5: 1
6:
- 1
- 1: metric/labeled_spans/data/precision/train
5: 1
6:
- 1
- 1: metric/labeled_spans/own_claim/f1/train
5: 1
6:
- 1
- 1: metric/labeled_spans/own_claim/recall/train
5: 1
6:
- 1
- 1: metric/labeled_spans/own_claim/precision/train
5: 1
6:
- 1
- 1: metric/labeled_spans/micro/f1/train
5: 1
6:
- 1
- 1: metric/labeled_spans/micro/recall/train
5: 1
6:
- 1
- 1: metric/labeled_spans/micro/precision/train
5: 1
6:
- 1
- 1: metric/labeled_spans/macro/f1/train
5: 1
6:
- 1
- 1: metric/labeled_spans/macro/recall/train
5: 1
6:
- 1
- 1: metric/labeled_spans/macro/precision/train
5: 1
6:
- 1
- 1: metric/binary_relations/supports/f1/train
5: 1
6:
- 1
- 1: metric/binary_relations/supports/recall/train
5: 1
6:
- 1
- 1: metric/binary_relations/supports/precision/train
5: 1
6:
- 1
- 1: metric/binary_relations/micro/f1/train
5: 1
6:
- 1
- 1: metric/binary_relations/micro/recall/train
5: 1
6:
- 1
- 1: metric/binary_relations/micro/precision/train
5: 1
6:
- 1
- 1: metric/binary_relations/parts_of_same/f1/train
5: 1
6:
- 1
- 1: metric/binary_relations/parts_of_same/recall/train
5: 1
6:
- 1
- 1: metric/binary_relations/parts_of_same/precision/train
5: 1
6:
- 1
- 1: metric/binary_relations/contradicts/f1/train
5: 1
6:
- 1
- 1: metric/binary_relations/contradicts/recall/train
5: 1
6:
- 1
- 1: metric/binary_relations/contradicts/precision/train
5: 1
6:
- 1
- 1: metric/binary_relations/semantically_same/f1/train
5: 1
6:
- 1
- 1: metric/binary_relations/semantically_same/recall/train
5: 1
6:
- 1
- 1: metric/binary_relations/semantically_same/precision/train
5: 1
6:
- 1
- 1: metric/binary_relations/macro/f1/train
5: 1
6:
- 1
- 1: metric/binary_relations/macro/recall/train
5: 1
6:
- 1
- 1: metric/binary_relations/macro/precision/train
5: 1
6:
- 1
- 1: metric/decoding_errors/correct/val
5: 1
6:
- 1
- 1: metric/decoding_errors/index/val
5: 1
6:
- 1
- 1: metric/decoding_errors/len/val
5: 1
6:
- 1
- 1: loss/test
5: 1
6:
- 1
- 1: metric/exact_encoding_matches/test
5: 1
6:
- 1
- 1: metric/decoding_errors/correct/test
5: 1
6:
- 1
- 1: metric/decoding_errors/all/test
5: 1
6:
- 1
- 1: metric/labeled_spans/micro/f1/test
5: 1
6:
- 1
- 1: metric/labeled_spans/micro/recall/test
5: 1
6:
- 1
- 1: metric/labeled_spans/micro/precision/test
5: 1
6:
- 1
- 1: metric/labeled_spans/own_claim/f1/test
5: 1
6:
- 1
- 1: metric/labeled_spans/own_claim/recall/test
5: 1
6:
- 1
- 1: metric/labeled_spans/own_claim/precision/test
5: 1
6:
- 1
- 1: metric/labeled_spans/background_claim/f1/test
5: 1
6:
- 1
- 1: metric/labeled_spans/background_claim/recall/test
5: 1
6:
- 1
- 1: metric/labeled_spans/background_claim/precision/test
5: 1
6:
- 1
- 1: metric/labeled_spans/data/f1/test
5: 1
6:
- 1
- 1: metric/labeled_spans/data/recall/test
5: 1
6:
- 1
- 1: metric/labeled_spans/data/precision/test
5: 1
6:
- 1
- 1: metric/labeled_spans/macro/f1/test
5: 1
6:
- 1
- 1: metric/labeled_spans/macro/recall/test
5: 1
6:
- 1
- 1: metric/labeled_spans/macro/precision/test
5: 1
6:
- 1
- 1: metric/binary_relations/micro/f1/test
5: 1
6:
- 1
- 1: metric/binary_relations/micro/recall/test
5: 1
6:
- 1
- 1: metric/binary_relations/micro/precision/test
5: 1
6:
- 1
- 1: metric/binary_relations/parts_of_same/f1/test
5: 1
6:
- 1
- 1: metric/binary_relations/parts_of_same/recall/test
5: 1
6:
- 1
- 1: metric/binary_relations/parts_of_same/precision/test
5: 1
6:
- 1
- 1: metric/binary_relations/supports/f1/test
5: 1
6:
- 1
- 1: metric/binary_relations/supports/recall/test
5: 1
6:
- 1
- 1: metric/binary_relations/supports/precision/test
5: 1
6:
- 1
- 1: metric/binary_relations/contradicts/f1/test
5: 1
6:
- 1
- 1: metric/binary_relations/contradicts/recall/test
5: 1
6:
- 1
- 1: metric/binary_relations/contradicts/precision/test
5: 1
6:
- 1
- 1: metric/binary_relations/semantically_same/f1/test
5: 1
6:
- 1
- 1: metric/binary_relations/semantically_same/recall/test
5: 1
6:
- 1
- 1: metric/binary_relations/semantically_same/precision/test
5: 1
6:
- 1
- 1: metric/binary_relations/macro/f1/test
5: 1
6:
- 1
- 1: metric/binary_relations/macro/recall/test
5: 1
6:
- 1
- 1: metric/binary_relations/macro/precision/test
5: 1
6:
- 1
_num_params/total:
desc: null
value: 141788928
_num_params/trainable:
desc: null
value: 141788928
_num_params/non_trainable:
desc: null
value: 0
_config:
desc: null
value:
pipeline_type: training
name: dataset-sciarg/task-ner_re/v0.3
tags:
- task=ner_re
- model=pointer_network
train: true
validate: true
test: true
monitor_metric: metric/binary_relations/micro/f1/val
monitor_mode: max
seed: 1
ckpt_path: null
push_to_hub: false
model_save_dir: /home/arne/projects/pie-document-level/models/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-32
dataset:
_target_: src.utils.execute_pipeline
input:
_target_: pie_datasets.DatasetDict.load_dataset
path: pie/sciarg
revision: 982d5682ba414ee13cf92cb93ec18fc8e78e2b81
select_n:
_processor_: pie_datasets.DatasetDict.select
split: train
stop: null
select_n_test:
_processor_: pie_datasets.DatasetDict.select
split: test
stop: null
select_n_validation:
_processor_: pie_datasets.DatasetDict.select
split: validation
stop: null
create_test_split:
_processor_: pie_datasets.DatasetDict.move_to_new_split
source_split: train
target_split: test
ids:
- A32
- A33
- A34
- A35
- A36
- A37
- A38
- A39
- A40
create_validation_split:
_processor_: pie_datasets.DatasetDict.add_test_split
test_size: 0.1
seed: 1
source_split: train
target_split: validation
datamodule:
_target_: src.datamodules.PieDataModule
batch_size: 2
num_workers: 0
pin_memory: false
show_progress_for_encode: true
train_split: train
val_split: validation
test_split: test
taskmodule:
_target_: pie_modules.taskmodules.PointerNetworkTaskModuleForEnd2EndRE
tokenizer_init_kwargs:
add_prefix_space: true
tokenizer_name_or_path: facebook/bart-base
tokenizer_kwargs:
truncation: true
return_overflowing_tokens: true
stride: 128
strict_span_conversion: false
create_constraints: true
constrained_generation: true
partition_layer_name: labeled_partitions
model:
_target_: pie_modules.models.SimpleGenerativeModel
base_model_type: pie_modules.models.base_models.BartAsPointerNetwork
base_model_config:
pretrained_model_name_or_path: facebook/bart-base
use_encoder_mlp: true
use_constraints_encoder_mlp: true
decoder_position_id_pattern:
- 0
- 0
- 1
- 0
- 0
- 1
- 1
encoder_layer_norm_decay: 0.005
lr: 6.0e-05
num_beams: 4
max_length: 768
decoder_layer_norm_decay: 0.05
metric_stages:
- val
- test
- train
metric_call_predict:
- val
- test
warmup_proportion: 0.01
callbacks:
model_checkpoint:
_target_: pytorch_lightning.callbacks.ModelCheckpoint
dirpath: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0/checkpoints
filename: epoch_{epoch:03d}
monitor: metric/binary_relations/micro/f1/val
verbose: false
save_last: true
save_top_k: 1
mode: max
auto_insert_metric_name: false
save_weights_only: false
every_n_train_steps: null
train_time_interval: null
every_n_epochs: null
save_on_train_epoch_end: null
early_stopping:
_target_: pytorch_lightning.callbacks.EarlyStopping
monitor: metric/binary_relations/micro/f1/val
min_delta: 0.0
patience: 100
verbose: false
mode: max
strict: true
check_finite: true
stopping_threshold: null
divergence_threshold: null
check_on_train_epoch_end: null
model_summary:
_target_: pytorch_lightning.callbacks.RichModelSummary
max_depth: -1
rich_progress_bar:
_target_: pytorch_lightning.callbacks.RichProgressBar
logger:
wandb:
_target_: pytorch_lightning.loggers.wandb.WandbLogger
save_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0
offline: false
id: null
anonymous: null
project: dataset-sciarg-task-ner_re-v0.3-training
log_model: false
prefix: ''
group: ''
tags:
- task=ner_re
- model=pointer_network
job_type: ''
trainer:
_target_: pytorch_lightning.Trainer
default_root_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0
min_epochs: 150
max_epochs: 150
accelerator: gpu
devices: 1
check_val_every_n_epoch: 1
deterministic: false
gradient_clip_val: 5
gradient_clip_algorithm: value
paths:
root_dir: /home/arne/projects/pie-document-level
data_dir: /home/arne/projects/pie-document-level/data/
log_dir: /home/arne/projects/pie-document-level/logs/
output_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0
save_dir: /home/arne/projects/pie-document-level
work_dir: /home/arne/projects/pie-document-level
extras:
ignore_warnings: false
enforce_tags: true
print_config: true
base_model: facebook/bart-base
base_model_type:
desc: null
value: pie_modules.models.base_models.BartAsPointerNetwork
base_model_config:
desc: null
value:
pretrained_model_name_or_path: facebook/bart-base
use_encoder_mlp: true
use_constraints_encoder_mlp: true
decoder_position_id_pattern:
- 0
- 0
- 1
- 0
- 0
- 1
- 1
encoder_layer_norm_decay: 0.005
lr: 6.0e-05
num_beams: 4
max_length: 768
decoder_layer_norm_decay: 0.05
bos_token_id: 0
eos_token_id: 1
pad_token_id: 1
target_token_ids:
- 0
- 2
- 50267
- 50265
- 50268
- 50270
- 50271
- 50269
- 50272
- 50266
embedding_weight_mapping:
'50267':
- 4146
'50265':
- 3618
- 1215
- 31628
'50268':
- 414
'50270':
- 308
- 1215
- 31628
'50271':
- 37820
'50269':
- 1667
- 1215
- 1116
- 1215
- 41690
'50272':
- 9031
- 38600
- 1215
- 41690
'50266':
- 4548
override_generation_kwargs:
desc: null
value: null
warmup_proportion:
desc: null
value: 0.01
learning_rate:
desc: null
value: null
optimizer_type:
desc: null
value: null
metric_stages:
desc: null
value:
- val
- test
- train
metric_call_predict:
desc: null
value:
- val
- test
taskmodule_config:
desc: null
value:
taskmodule_type: PointerNetworkTaskModuleForEnd2EndRE
tokenizer_name_or_path: facebook/bart-base
document_type: pytorch_ie.documents.TextDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions
tokenized_document_type: pie_modules.documents.TokenDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions
span_layer_name: labeled_spans
relation_layer_name: binary_relations
none_label: none
loop_dummy_relation_name: loop
constrained_generation: true
label_tokens: null
label_representations: null
labels_per_layer:
labeled_spans:
- background_claim
- data
- own_claim
binary_relations:
- contradicts
- parts_of_same
- semantically_same
- supports
exclude_labels_per_layer: null
create_constraints: true
tokenizer_init_kwargs:
add_prefix_space: true
tokenizer_kwargs:
truncation: true
return_overflowing_tokens: true
stride: 128
strict_span_conversion: false
partition_layer_name: labeled_partitions
annotation_field_mapping: null
log_first_n_examples: null
_best_checkpoint:
desc: null
value: epoch_145.ckpt
_checkpoint_dir:
desc: null
value: /mnt/data/experiments/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0/checkpoints