dfki-mlst-deberta-v3 / config.json
tanikina's picture
upload fine-tuned DeBERTa-v3 model (DialAM shared task)
1f2275b verified
raw
history blame
2.49 kB
{
"model_type": "SequenceClassificationModelWithPooler",
"model_name_or_path": "microsoft/deberta-v3-large",
"num_classes": 26,
"tokenizer_vocab_size": 128013,
"classifier_dropout": 0.1,
"learning_rate": 1e-05,
"task_learning_rate": 0.0001,
"warmup_proportion": 0.1,
"multi_label": false,
"multi_label_threshold": 0.5,
"pooler": null,
"freeze_base_model": false,
"taskmodule_config": {
"taskmodule_type": "RETextClassificationWithIndicesTaskModule",
"tokenizer_name_or_path": "microsoft/deberta-v3-large",
"relation_annotation": "nary_relations",
"add_candidate_relations": false,
"add_reversed_relations": false,
"partition_annotation": null,
"none_label": "no_relation",
"padding": true,
"truncation": true,
"max_length": null,
"pad_to_multiple_of": null,
"multi_label": false,
"labels": [
"s_nodes:Default Conflict",
"s_nodes:Default Inference",
"s_nodes:Default Inference-rev",
"s_nodes:Default Rephrase",
"s_nodes:NONE",
"ya_i2l_nodes:Agreeing",
"ya_i2l_nodes:Arguing",
"ya_i2l_nodes:Asserting",
"ya_i2l_nodes:Assertive Questioning",
"ya_i2l_nodes:Challenging",
"ya_i2l_nodes:Default Illocuting",
"ya_i2l_nodes:NONE",
"ya_i2l_nodes:Pure Questioning",
"ya_i2l_nodes:Restating",
"ya_i2l_nodes:Rhetorical Questioning",
"ya_s2ta_nodes:Agreeing",
"ya_s2ta_nodes:Arguing",
"ya_s2ta_nodes:Asserting",
"ya_s2ta_nodes:Challenging",
"ya_s2ta_nodes:Default Illocuting",
"ya_s2ta_nodes:Disagreeing",
"ya_s2ta_nodes:NONE",
"ya_s2ta_nodes:Pure Questioning",
"ya_s2ta_nodes:Restating",
"ya_s2ta_nodes:Rhetorical Questioning"
],
"add_type_to_marker": false,
"argument_role_to_marker": {
"s_nodes:source": "S:S",
"s_nodes:target": "S:T",
"ya_i2l_nodes:source": "YA-I2L:S",
"ya_i2l_nodes:target": "YA-I2L:T",
"ya_s2ta_nodes:source": "YA-S2TA:S",
"ya_s2ta_nodes:target": "YA-S2TA:T"
},
"single_argument_pair": true,
"append_markers": false,
"entity_labels": [
"L"
],
"reversed_relation_label_suffix": "_reversed",
"symmetric_relations": null,
"reverse_symmetric_relations": true,
"max_argument_distance": null,
"max_argument_distance_type": "inner",
"max_window": 512,
"log_first_n_examples": 0,
"add_argument_indices_to_input": false,
"collect_statistics": true
}
}