deberta-v3-base-1107 / config.json
xoyeop's picture
Training in progress, epoch 1
8483030
{
"_name_or_path": "microsoft/deberta-v3-base",
"architectures": [
"DebertaV2ForSequenceClassification"
],
"attention_probs_dropout_prob": 0.1,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "org:founded_by",
"1": "no_relation",
"10": "per:religion",
"11": "per:age",
"12": "per:date_of_death",
"13": "org:website",
"14": "per:stateorprovinces_of_residence",
"15": "org:top_members/employees",
"16": "org:number_of_employees/members",
"17": "org:members",
"18": "org:country_of_branch",
"19": "per:spouse",
"2": "per:identity",
"20": "org:stateorprovince_of_branch",
"21": "org:political/religious_affiliation",
"22": "org:member_of",
"23": "per:siblings",
"24": "per:stateorprovince_of_birth",
"25": "org:dissolved",
"26": "per:other_family",
"27": "org:shareholders",
"28": "per:parents",
"29": "per:charges",
"3": "org:alternate_names",
"30": "per:schools_attended",
"31": "per:cause_of_death",
"32": "per:city_of_death",
"33": "per:stateorprovince_of_death",
"34": "org:founded",
"35": "per:country_of_death",
"36": "per:country_of_birth",
"37": "per:date_of_birth",
"38": "per:cities_of_residence",
"39": "per:city_of_birth",
"4": "per:children",
"5": "per:origin",
"6": "per:countries_of_residence",
"7": "per:employee_of",
"8": "per:title",
"9": "org:city_of_branch"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"no_relation": 1,
"org:alternate_names": 3,
"org:city_of_branch": 9,
"org:country_of_branch": 18,
"org:dissolved": 25,
"org:founded": 34,
"org:founded_by": 0,
"org:member_of": 22,
"org:members": 17,
"org:number_of_employees/members": 16,
"org:political/religious_affiliation": 21,
"org:shareholders": 27,
"org:stateorprovince_of_branch": 20,
"org:top_members/employees": 15,
"org:website": 13,
"per:age": 11,
"per:cause_of_death": 31,
"per:charges": 29,
"per:children": 4,
"per:cities_of_residence": 38,
"per:city_of_birth": 39,
"per:city_of_death": 32,
"per:countries_of_residence": 6,
"per:country_of_birth": 36,
"per:country_of_death": 35,
"per:date_of_birth": 37,
"per:date_of_death": 12,
"per:employee_of": 7,
"per:identity": 2,
"per:origin": 5,
"per:other_family": 26,
"per:parents": 28,
"per:religion": 10,
"per:schools_attended": 30,
"per:siblings": 23,
"per:spouse": 19,
"per:stateorprovince_of_birth": 24,
"per:stateorprovince_of_death": 33,
"per:stateorprovinces_of_residence": 14,
"per:title": 8
},
"layer_norm_eps": 1e-07,
"max_position_embeddings": 512,
"max_relative_positions": -1,
"model_type": "deberta-v2",
"norm_rel_ebd": "layer_norm",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"pad_token_id": 0,
"pooler_dropout": 0,
"pooler_hidden_act": "gelu",
"pooler_hidden_size": 768,
"pos_att_type": [
"p2c",
"c2p"
],
"position_biased_input": false,
"position_buckets": 256,
"relative_attention": true,
"share_att_key": true,
"torch_dtype": "float32",
"transformers_version": "4.35.0",
"type_vocab_size": 0,
"vocab_size": 128100
}