End of training

Browse files

Files changed (8) hide show

.gitignore +2 -0
config.json +29 -0
generation_config.json +5 -0
log.json +282 -0
model.safetensors +3 -0
special_tokens_map.json +4 -0
tokenizer.json +0 -0
tokenizer_config.json +49 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ step_*
2	+ epoch_*

config.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+  "_name_or_path": "huawei-noah/TinyBERT_General_4L_312D",
+  "architectures": [
+    "BertForMaskedLM"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "cell": {},
+  "classifier_dropout": null,
+  "emb_size": 312,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 312,
+  "initializer_range": 0.02,
+  "intermediate_size": 1200,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 4,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "pre_trained": "",
+  "structure": [],
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,5 @@

+{
+  "_from_model_config": true,
+  "pad_token_id": 0,
+  "transformers_version": "4.44.2"
+}

log.json ADDED Viewed

	@@ -0,0 +1,282 @@

+{
+    "eval_perpl": [
+        31449.7657081341,
+        6135.761638226119,
+        2275.301693637439,
+        2100.5636547496974,
+        1763.9246096238794,
+        912.4593282895613,
+        673.2478721800974,
+        426.95282488572326,
+        292.066480449549,
+        229.60749931792827,
+        178.48175607976276,
+        151.7738098243359,
+        132.68325221447097,
+        131.60733192012995,
+        121.35699482687662,
+        113.03692537619067,
+        314.2693244669915,
+        319.62471471397265,
+        357.5297510309972,
+        373.37600350886794,
+        427.6761706922814,
+        418.7241591849811,
+        88.4342864632641,
+        81.68638521632647,
+        71.71099212003867,
+        69.46567916489799,
+        84.99562405056126,
+        97.03116680777474,
+        99.61508321269098,
+        99.53868474540631,
+        96.69570308133885,
+        97.3618052463106,
+        97.37972722605315,
+        95.8043254339647,
+        94.59195856098238,
+        100.33980437996713,
+        95.41348395061875,
+        94.98106528056366,
+        91.7840253560043,
+        92.34501897421714,
+        90.46576611879469,
+        91.17134170708903,
+        89.93299763326101,
+        87.14281899601743,
+        88.47460898187907,
+        88.24948549868428,
+        84.98678917210486,
+        87.07220763140273,
+        63.93756172611777,
+        60.228661637513234,
+        59.19890548462696,
+        57.310445090319284,
+        55.892054997349064,
+        58.32000354396741,
+        56.82671999573329,
+        59.14614220744896,
+        59.17415449564529,
+        59.723865239121785,
+        56.183552716071574,
+        42.941688373342394,
+        43.17332328067362,
+        42.02991489794291,
+        41.175966066255576,
+        42.14810471722296,
+        41.02890386392398,
+        40.96517442480964,
+        39.17880381005861,
+        39.25041154205274
+    ],
+    "eval_loss": [
+        10.356146812438965,
+        8.72188949584961,
+        7.729867935180664,
+        7.649960994720459,
+        7.475296497344971,
+        6.81614351272583,
+        6.512113571166992,
+        6.056673526763916,
+        5.676981449127197,
+        5.436371326446533,
+        5.184486389160156,
+        5.022391319274902,
+        4.887964725494385,
+        4.879822731018066,
+        4.798736572265625,
+        4.727714538574219,
+        5.750250339508057,
+        5.767147541046143,
+        5.879218578338623,
+        5.922585964202881,
+        6.058366298675537,
+        6.037212371826172,
+        4.482259750366211,
+        4.402887344360352,
+        4.27264404296875,
+        4.240832805633545,
+        4.442599773406982,
+        4.5750322341918945,
+        4.601313591003418,
+        4.600546360015869,
+        4.571568965911865,
+        4.578433990478516,
+        4.578618049621582,
+        4.562307834625244,
+        4.549572467803955,
+        4.608562469482422,
+        4.558219909667969,
+        4.553677558898926,
+        4.51943826675415,
+        4.525531768798828,
+        4.504971504211426,
+        4.512740612030029,
+        4.499064922332764,
+        4.467548370361328,
+        4.482715606689453,
+        4.480167865753174,
+        4.442495822906494,
+        4.466737747192383,
+        4.157907009124756,
+        4.098148345947266,
+        4.080903053283691,
+        4.048482894897461,
+        4.0234222412109375,
+        4.065945148468018,
+        4.040006637573242,
+        4.080011367797852,
+        4.080484867095947,
+        4.089731693267822,
+        4.028624057769775,
+        3.759843111038208,
+        3.7652227878570557,
+        3.7383816242218018,
+        3.7178547382354736,
+        3.74118971824646,
+        3.7142767906188965,
+        3.7127223014831543,
+        3.66813588142395,
+        3.669961929321289
+    ],
+    "train_loss": [
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null,
+        null
+    ],
+    "completed_steps": [
+        0,
+        100,
+        200,
+        300,
+        400,
+        500,
+        600,
+        700,
+        800,
+        900,
+        1000,
+        1100,
+        1200,
+        1300,
+        1400,
+        1500,
+        1600,
+        1700,
+        1800,
+        1900,
+        2000,
+        2100,
+        2200,
+        2300,
+        2400,
+        2500,
+        2600,
+        2700,
+        2800,
+        2900,
+        3000,
+        3100,
+        3200,
+        3300,
+        3400,
+        3500,
+        3600,
+        3700,
+        3800,
+        3900,
+        4000,
+        4100,
+        4200,
+        4300,
+        4400,
+        4500,
+        4600,
+        4700,
+        4800,
+        4900,
+        5000,
+        5100,
+        5200,
+        5300,
+        5400,
+        5500,
+        5600,
+        5700,
+        5800,
+        5900,
+        6000,
+        6100,
+        6200,
+        6300,
+        6400,
+        6500,
+        6600,
+        6700
+    ]
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4647aea8665a92bfe22555c96b68c47c0b94aba8dcb84ddabc2ccb81709ee3fa
+size 57534056

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,49 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "4": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "mask_token": "[MASK]",
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "[PAD]",
+  "tokenizer_class": "PreTrainedTokenizerFast"
+}