nzm97's picture
Initial model push after training
7277c15 verified
{
"_name_or_path": "allenai/scibert_scivocab_uncased",
"architectures": [
"BertForSequenceClassification"
],
"attention_probs_dropout_prob": 0.1,
"classifier_dropout": null,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "1.G",
"1": "1.MD",
"2": "1.NBT",
"3": "1.OA",
"4": "2.G",
"5": "2.MD",
"6": "2.NBT",
"7": "2.OA",
"8": "3.G",
"9": "3.MD",
"10": "3.NBT",
"11": "3.NF",
"12": "3.OA",
"13": "4.G",
"14": "4.MD",
"15": "4.NBT",
"16": "4.NF",
"17": "4.OA",
"18": "5.G",
"19": "5.MD",
"20": "5.NBT",
"21": "5.NF",
"22": "5.OA",
"23": "6.EE",
"24": "6.G",
"25": "6.NS",
"26": "6.RP",
"27": "6.SP",
"28": "7.EE",
"29": "7.G",
"30": "7.NS",
"31": "7.RP",
"32": "7.SP",
"33": "8.EE",
"34": "8.F",
"35": "8.G",
"36": "8.NS",
"37": "8.SP",
"38": "K.CC",
"39": "K.G",
"40": "K.MD",
"41": "K.NBT",
"42": "K.OA"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"1.G": 0,
"1.MD": 1,
"1.NBT": 2,
"1.OA": 3,
"2.G": 4,
"2.MD": 5,
"2.NBT": 6,
"2.OA": 7,
"3.G": 8,
"3.MD": 9,
"3.NBT": 10,
"3.NF": 11,
"3.OA": 12,
"4.G": 13,
"4.MD": 14,
"4.NBT": 15,
"4.NF": 16,
"4.OA": 17,
"5.G": 18,
"5.MD": 19,
"5.NBT": 20,
"5.NF": 21,
"5.OA": 22,
"6.EE": 23,
"6.G": 24,
"6.NS": 25,
"6.RP": 26,
"6.SP": 27,
"7.EE": 28,
"7.G": 29,
"7.NS": 30,
"7.RP": 31,
"7.SP": 32,
"8.EE": 33,
"8.F": 34,
"8.G": 35,
"8.NS": 36,
"8.SP": 37,
"K.CC": 38,
"K.G": 39,
"K.MD": 40,
"K.NBT": 41,
"K.OA": 42
},
"layer_norm_eps": 1e-12,
"max_position_embeddings": 512,
"model_type": "bert",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"pad_token_id": 0,
"position_embedding_type": "absolute",
"problem_type": "single_label_classification",
"torch_dtype": "float32",
"transformers_version": "4.46.3",
"type_vocab_size": 2,
"use_cache": true,
"vocab_size": 31090
}