# sam-pointer-bart-base-v0.3 / config.yaml

# add train config and metadata

# df85382 verified 6 months ago

# 18.7 kB

	# Version marker at the top of the W&B config dump
	# (presumably the config-file format version — TODO confirm).
	wandb_version: 1

	# W&B bookkeeping for the run: interpreter/library versions, start time,
	# and two numeric-keyed tables (`t`, `m`).
	# Nesting restored from a flattened dump; values are unchanged.
	# NOTE(review): the numeric keys under `t` and `m` are W&B-internal field
	# ids; their meaning is not visible in this file.
	_wandb:
	  desc: null
	  value:
	    python_version: 3.9.17
	    cli_version: 0.15.9
	    framework: huggingface
	    huggingface_version: 4.36.0
	    is_jupyter_run: false
	    is_kaggle_kernel: false
	    start_time: 1709313942.075548
	    # Entries 4, 5 and 6 below repeat python_version, cli_version and
	    # huggingface_version from above.
	    t:
	      1:
	      - 1
	      - 9
	      - 11
	      - 49
	      - 50
	      - 51
	      - 55
	      - 71
	      - 103
	      2:
	      - 1
	      - 9
	      - 11
	      - 49
	      - 50
	      - 51
	      - 55
	      - 71
	      - 103
	      3:
	      - 2
	      - 7
	      - 15
	      - 23
	      4: 3.9.17
	      5: 0.15.9
	      6: 4.36.0
	      8:
	      - 5
	    # One entry per logged metric name (key `1`); every entry except
	    # trainer/global_step also carries `5: 1`.
	    m:
	    - 1: trainer/global_step
	      6:
	      - 3
	    - 1: loss/train_step
	      5: 1
	      6:
	      - 1
	    - 1: epoch
	      5: 1
	      6:
	      - 1
	    - 1: loss/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/exact_encoding_matches/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/decoding_errors/all/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/micro/f1/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/micro/recall/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/micro/precision/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/background_claim/f1/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/background_claim/recall/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/background_claim/precision/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/data/f1/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/data/recall/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/data/precision/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/own_claim/f1/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/own_claim/recall/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/own_claim/precision/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/macro/f1/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/macro/recall/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/macro/precision/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/micro/f1/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/micro/recall/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/micro/precision/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/parts_of_same/f1/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/parts_of_same/recall/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/parts_of_same/precision/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/supports/f1/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/supports/recall/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/supports/precision/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/contradicts/f1/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/contradicts/recall/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/contradicts/precision/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/macro/f1/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/macro/recall/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/macro/precision/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/semantically_same/f1/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/semantically_same/recall/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/semantically_same/precision/val
	      5: 1
	      6:
	      - 1
	    - 1: loss/train_epoch
	      5: 1
	      6:
	      - 1
	    - 1: metric/exact_encoding_matches/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/decoding_errors/label/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/decoding_errors/index/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/decoding_errors/len/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/decoding_errors/order/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/decoding_errors/correct/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/decoding_errors/all/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/background_claim/f1/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/background_claim/recall/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/background_claim/precision/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/data/f1/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/data/recall/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/data/precision/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/own_claim/f1/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/own_claim/recall/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/own_claim/precision/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/micro/f1/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/micro/recall/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/micro/precision/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/macro/f1/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/macro/recall/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/macro/precision/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/supports/f1/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/supports/recall/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/supports/precision/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/micro/f1/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/micro/recall/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/micro/precision/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/parts_of_same/f1/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/parts_of_same/recall/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/parts_of_same/precision/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/contradicts/f1/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/contradicts/recall/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/contradicts/precision/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/semantically_same/f1/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/semantically_same/recall/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/semantically_same/precision/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/macro/f1/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/macro/recall/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/macro/precision/train
	      5: 1
	      6:
	      - 1
	    - 1: metric/decoding_errors/correct/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/decoding_errors/index/val
	      5: 1
	      6:
	      - 1
	    - 1: metric/decoding_errors/len/val
	      5: 1
	      6:
	      - 1
	    - 1: loss/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/exact_encoding_matches/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/decoding_errors/correct/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/decoding_errors/all/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/micro/f1/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/micro/recall/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/micro/precision/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/own_claim/f1/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/own_claim/recall/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/own_claim/precision/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/background_claim/f1/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/background_claim/recall/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/background_claim/precision/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/data/f1/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/data/recall/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/data/precision/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/macro/f1/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/macro/recall/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/labeled_spans/macro/precision/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/micro/f1/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/micro/recall/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/micro/precision/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/parts_of_same/f1/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/parts_of_same/recall/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/parts_of_same/precision/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/supports/f1/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/supports/recall/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/supports/precision/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/contradicts/f1/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/contradicts/recall/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/contradicts/precision/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/semantically_same/f1/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/semantically_same/recall/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/semantically_same/precision/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/macro/f1/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/macro/recall/test
	      5: 1
	      6:
	      - 1
	    - 1: metric/binary_relations/macro/precision/test
	      5: 1
	      6:
	      - 1
	# Total parameter count recorded for the model
	# (equals the trainable count recorded under _num_params/trainable).
	_num_params/total:
	  desc: null
	  value: 141788928
	# Trainable parameter count recorded for the model.
	_num_params/trainable:
	  desc: null
	  value: 141788928
	# Non-trainable (frozen) parameter count; 0 means nothing was frozen.
	_num_params/non_trainable:
	  desc: null
	  value: 0
	# Full training-pipeline configuration logged with the run: dataset
	# pipeline, datamodule, taskmodule, model, callbacks, logger, trainer, paths.
	# Nesting restored from a flattened dump; values are unchanged.
	# NOTE(review): the original indentation was lost, so nesting is inferred
	# from the `_target_`/`_processor_` markers and from the parallel top-level
	# hyperparameter entries in this file. Ambiguous spots are marked below.
	_config:
	  desc: null
	  value:
	    pipeline_type: training
	    name: dataset-sciarg/task-ner_re/v0.3
	    tags:
	    - task=ner_re
	    - model=pointer_network
	    train: true
	    validate: true
	    test: true
	    # Same metric/mode that the checkpoint and early-stopping callbacks
	    # below monitor.
	    monitor_metric: metric/binary_relations/micro/f1/val
	    monitor_mode: max
	    seed: 1
	    ckpt_path: null
	    push_to_hub: false
	    model_save_dir: /home/arne/projects/pie-document-level/models/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-32
	    # NOTE(review): the processing steps are placed as siblings of `input`
	    # — presumably what src.utils.execute_pipeline expects; confirm.
	    dataset:
	      _target_: src.utils.execute_pipeline
	      input:
	        _target_: pie_datasets.DatasetDict.load_dataset
	        path: pie/sciarg
	        # Dataset revision pinned by commit hash.
	        revision: 982d5682ba414ee13cf92cb93ec18fc8e78e2b81
	      select_n:
	        _processor_: pie_datasets.DatasetDict.select
	        split: train
	        stop: null
	      select_n_test:
	        _processor_: pie_datasets.DatasetDict.select
	        split: test
	        stop: null
	      select_n_validation:
	        _processor_: pie_datasets.DatasetDict.select
	        split: validation
	        stop: null
	      # Moves the listed document ids from train into a new test split.
	      create_test_split:
	        _processor_: pie_datasets.DatasetDict.move_to_new_split
	        source_split: train
	        target_split: test
	        ids:
	        - A32
	        - A33
	        - A34
	        - A35
	        - A36
	        - A37
	        - A38
	        - A39
	        - A40
	      # Splits 10% of train (test_size 0.1, seed 1) off into validation.
	      create_validation_split:
	        _processor_: pie_datasets.DatasetDict.add_test_split
	        test_size: 0.1
	        seed: 1
	        source_split: train
	        target_split: validation
	    datamodule:
	      _target_: src.datamodules.PieDataModule
	      batch_size: 2
	      num_workers: 0
	      pin_memory: false
	      show_progress_for_encode: true
	      train_split: train
	      val_split: validation
	      test_split: test
	    taskmodule:
	      _target_: pie_modules.taskmodules.PointerNetworkTaskModuleForEnd2EndRE
	      tokenizer_init_kwargs:
	        add_prefix_space: true
	      tokenizer_name_or_path: facebook/bart-base
	      tokenizer_kwargs:
	        truncation: true
	        return_overflowing_tokens: true
	        stride: 128
	        # NOTE(review): assumed to be part of tokenizer_kwargs because it
	        # directly follows `stride` both here and in taskmodule_config;
	        # confirm.
	        strict_span_conversion: false
	      create_constraints: true
	      constrained_generation: true
	      partition_layer_name: labeled_partitions
	    model:
	      _target_: pie_modules.models.SimpleGenerativeModel
	      base_model_type: pie_modules.models.base_models.BartAsPointerNetwork
	      # Keys up to decoder_layer_norm_decay match the leading keys of the
	      # top-level base_model_config entry in this file.
	      base_model_config:
	        pretrained_model_name_or_path: facebook/bart-base
	        use_encoder_mlp: true
	        use_constraints_encoder_mlp: true
	        decoder_position_id_pattern:
	        - 0
	        - 0
	        - 1
	        - 0
	        - 0
	        - 1
	        - 1
	        encoder_layer_norm_decay: 0.005
	        lr: 6.0e-05
	        num_beams: 4
	        max_length: 768
	        decoder_layer_norm_decay: 0.05
	      metric_stages:
	      - val
	      - test
	      - train
	      metric_call_predict:
	      - val
	      - test
	      warmup_proportion: 0.01
	    callbacks:
	      model_checkpoint:
	        _target_: pytorch_lightning.callbacks.ModelCheckpoint
	        dirpath: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0/checkpoints
	        filename: epoch_{epoch:03d}
	        monitor: metric/binary_relations/micro/f1/val
	        verbose: false
	        save_last: true
	        save_top_k: 1
	        mode: max
	        auto_insert_metric_name: false
	        save_weights_only: false
	        every_n_train_steps: null
	        train_time_interval: null
	        every_n_epochs: null
	        save_on_train_epoch_end: null
	      early_stopping:
	        _target_: pytorch_lightning.callbacks.EarlyStopping
	        monitor: metric/binary_relations/micro/f1/val
	        min_delta: 0.0
	        patience: 100
	        verbose: false
	        mode: max
	        strict: true
	        check_finite: true
	        stopping_threshold: null
	        divergence_threshold: null
	        check_on_train_epoch_end: null
	      model_summary:
	        _target_: pytorch_lightning.callbacks.RichModelSummary
	        max_depth: -1
	      rich_progress_bar:
	        _target_: pytorch_lightning.callbacks.RichProgressBar
	    logger:
	      wandb:
	        _target_: pytorch_lightning.loggers.wandb.WandbLogger
	        save_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0
	        offline: false
	        id: null
	        anonymous: null
	        project: dataset-sciarg-task-ner_re-v0.3-training
	        log_model: false
	        prefix: ''
	        group: ''
	        tags:
	        - task=ner_re
	        - model=pointer_network
	        job_type: ''
	    trainer:
	      _target_: pytorch_lightning.Trainer
	      default_root_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0
	      # NOTE(review): min_epochs == max_epochs fixes the run at 150 epochs;
	      # early_stopping (patience 100) presumably cannot end it sooner —
	      # confirm against Lightning's min_epochs semantics.
	      min_epochs: 150
	      max_epochs: 150
	      accelerator: gpu
	      devices: 1
	      check_val_every_n_epoch: 1
	      deterministic: false
	      gradient_clip_val: 5
	      gradient_clip_algorithm: value
	    paths:
	      root_dir: /home/arne/projects/pie-document-level
	      data_dir: /home/arne/projects/pie-document-level/data/
	      log_dir: /home/arne/projects/pie-document-level/logs/
	      output_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0
	      save_dir: /home/arne/projects/pie-document-level
	      work_dir: /home/arne/projects/pie-document-level
	    extras:
	      ignore_warnings: false
	      enforce_tags: true
	      print_config: true
	    # NOTE(review): placed at the top level of `value` rather than under
	    # `extras` — presumably a shared experiment variable; confirm.
	    base_model: facebook/bart-base
	# Dotted import path of the base model class
	# (same value as model.base_model_type inside _config).
	base_model_type:
	  desc: null
	  value: pie_modules.models.base_models.BartAsPointerNetwork
	# Resolved base-model configuration: the settings listed under
	# model.base_model_config in _config, plus special-token ids and
	# target-token tables.
	# Nesting restored from a flattened dump; values are unchanged.
	base_model_config:
	  desc: null
	  value:
	    pretrained_model_name_or_path: facebook/bart-base
	    use_encoder_mlp: true
	    use_constraints_encoder_mlp: true
	    decoder_position_id_pattern:
	    - 0
	    - 0
	    - 1
	    - 0
	    - 0
	    - 1
	    - 1
	    encoder_layer_norm_decay: 0.005
	    lr: 6.0e-05
	    num_beams: 4
	    max_length: 768
	    decoder_layer_norm_decay: 0.05
	    bos_token_id: 0
	    # eos_token_id and pad_token_id are both recorded as 1.
	    eos_token_id: 1
	    pad_token_id: 1
	    target_token_ids:
	    - 0
	    - 2
	    - 50267
	    - 50265
	    - 50268
	    - 50270
	    - 50271
	    - 50269
	    - 50272
	    - 50266
	    # Maps each id >= 50265 from target_token_ids to a list of other
	    # token ids.
	    # NOTE(review): presumably the source tokens whose embeddings
	    # initialise each added label token — confirm against
	    # BartAsPointerNetwork.
	    embedding_weight_mapping:
	      '50267':
	      - 4146
	      '50265':
	      - 3618
	      - 1215
	      - 31628
	      '50268':
	      - 414
	      '50270':
	      - 308
	      - 1215
	      - 31628
	      '50271':
	      - 37820
	      '50269':
	      - 1667
	      - 1215
	      - 1116
	      - 1215
	      - 41690
	      '50272':
	      - 9031
	      - 38600
	      - 1215
	      - 41690
	      '50266':
	      - 4548
	# Generation-argument overrides; null means none were recorded.
	override_generation_kwargs:
	  desc: null
	  value: null
	# Warm-up proportion (same value as model.warmup_proportion in _config).
	warmup_proportion:
	  desc: null
	  value: 0.01
	# Recorded as null; the only learning rate in this file is `lr: 6.0e-05`
	# inside base_model_config.
	learning_rate:
	  desc: null
	  value: null
	# Recorded as null.
	# NOTE(review): presumably the model then uses its built-in optimizer
	# setup — confirm.
	optimizer_type:
	  desc: null
	  value: null
	# Stages listed for metrics (same list as model.metric_stages in _config).
	metric_stages:
	  desc: null
	  value:
	  - val
	  - test
	  - train
	# Subset of stages (val, test; not train) listed under metric_call_predict.
	# NOTE(review): presumably the stages whose metrics use generated
	# predictions — confirm against SimpleGenerativeModel.
	metric_call_predict:
	  desc: null
	  value:
	  - val
	  - test
	# Resolved taskmodule configuration: document types, annotation layer
	# names, the label inventory per layer, and tokenizer settings.
	# Nesting restored from a flattened dump; values are unchanged.
	taskmodule_config:
	  desc: null
	  value:
	    taskmodule_type: PointerNetworkTaskModuleForEnd2EndRE
	    tokenizer_name_or_path: facebook/bart-base
	    document_type: pytorch_ie.documents.TextDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions
	    tokenized_document_type: pie_modules.documents.TokenDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions
	    span_layer_name: labeled_spans
	    relation_layer_name: binary_relations
	    # Plain scalar `none` is the string "none", not YAML null.
	    none_label: none
	    loop_dummy_relation_name: loop
	    constrained_generation: true
	    label_tokens: null
	    label_representations: null
	    # Label sets keyed by the span and relation layer names given above.
	    labels_per_layer:
	      labeled_spans:
	      - background_claim
	      - data
	      - own_claim
	      binary_relations:
	      - contradicts
	      - parts_of_same
	      - semantically_same
	      - supports
	    exclude_labels_per_layer: null
	    create_constraints: true
	    tokenizer_init_kwargs:
	      add_prefix_space: true
	    tokenizer_kwargs:
	      truncation: true
	      return_overflowing_tokens: true
	      stride: 128
	      # NOTE(review): assumed to be part of tokenizer_kwargs because it
	      # directly follows `stride` both here and in _config; confirm.
	      strict_span_conversion: false
	    partition_layer_name: labeled_partitions
	    annotation_field_mapping: null
	    log_first_n_examples: null
	# File name of the best checkpoint; it follows the
	# `epoch_{epoch:03d}` filename pattern set for model_checkpoint in _config.
	_best_checkpoint:
	  desc: null
	  value: epoch_145.ckpt
	# Directory holding the checkpoints.
	# NOTE(review): the root is /mnt/data/experiments/..., while the paths in
	# _config use /home/arne/projects/... — presumably the same location via a
	# mount or symlink; confirm.
	_checkpoint_dir:
	  desc: null
	  value: /mnt/data/experiments/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0/checkpoints