End of training

Browse files

Files changed (5)

.DS_Store +0 -0
README.md +11 -20
config.json +16 -14
pytorch_model.bin +2 -2
training_args.bin +1 -1

.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

README.md CHANGED Viewed

@@ -1,6 +1,6 @@
 ---
 license: apache-2.0
-base_model: distilbert-base-uncased
 tags:
 - generated_from_trainer
 metrics:
@@ -15,10 +15,10 @@ should probably proofread and complete it, then remove this comment. -->
 # office-character
-This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on the None dataset.
 It achieves the following results on the evaluation set:
-- Loss: 2.5873
-- Accuracy: 0.1544
 ## Model description
@@ -43,27 +43,18 @@ The following hyperparameters were used during training:
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
-- num_epochs: 2.5
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:--------:|
-| 2.6964        | 0.16  | 60   | 2.6756          | 0.0834   |
-| 2.6947        | 0.31  | 120  | 2.6670          | 0.0947   |
-| 2.6716        | 0.47  | 180  | 2.6428          | 0.1139   |
-| 2.6315        | 0.63  | 240  | 2.6252          | 0.1268   |
-| 2.6113        | 0.79  | 300  | 2.6205          | 0.1310   |
-| 2.5936        | 0.94  | 360  | 2.6137          | 0.1293   |
-| 2.5298        | 1.1   | 420  | 2.6065          | 0.1381   |
-| 2.4691        | 1.26  | 480  | 2.6097          | 0.1452   |
-| 2.4645        | 1.42  | 540  | 2.6015          | 0.1519   |
-| 2.4404        | 1.57  | 600  | 2.5912          | 0.1414   |
-| 2.4435        | 1.73  | 660  | 2.5890          | 0.1464   |
-| 2.4425        | 1.89  | 720  | 2.5928          | 0.1514   |
-| 2.4038        | 2.05  | 780  | 2.5880          | 0.1481   |
-| 2.2601        | 2.2   | 840  | 2.5941          | 0.1423   |
-| 2.2858        | 2.36  | 900  | 2.5873          | 0.1544   |
 ### Framework versions

 ---
 license: apache-2.0
+base_model: bert-base-uncased
 tags:
 - generated_from_trainer
 metrics:
 # office-character
+This model is a fine-tuned version of [bert-base-uncased](https://huggingface.co/bert-base-uncased) on an unspecified dataset.
 It achieves the following results on the evaluation set:
+- Loss: 2.6075
+- Accuracy: 0.1381
 ## Model description
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
+- num_epochs: 1.0
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:--------:|
+| 2.7041        | 0.16  | 60   | 2.6752          | 0.0864   |
+| 2.6928        | 0.31  | 120  | 2.6589          | 0.1118   |
+| 2.6579        | 0.47  | 180  | 2.6806          | 0.0989   |
+| 2.645         | 0.63  | 240  | 2.6248          | 0.1260   |
+| 2.6157        | 0.79  | 300  | 2.6219          | 0.1272   |
+| 2.6076        | 0.94  | 360  | 2.6075          | 0.1381   |
 ### Framework versions

config.json CHANGED Viewed

@@ -1,13 +1,14 @@
 {
-  "_name_or_path": "distilbert-base-uncased",
-  "activation": "gelu",
   "architectures": [
-    "DistilBertForSequenceClassification"
   ],
-  "attention_dropout": 0.1,
-  "dim": 768,
-  "dropout": 0.1,
-  "hidden_dim": 3072,
   "id2label": {
     "0": "Andy",
     "1": "Angela",
@@ -26,6 +27,7 @@
     "14": "Toby"
   },
   "initializer_range": 0.02,
   "label2id": {
     "Andy": 0,
     "Angela": 1,
@@ -43,17 +45,17 @@
     "Ryan": 13,
     "Toby": 14
   },
   "max_position_embeddings": 512,
-  "model_type": "distilbert",
-  "n_heads": 12,
-  "n_layers": 6,
   "pad_token_id": 0,
   "problem_type": "single_label_classification",
-  "qa_dropout": 0.1,
-  "seq_classif_dropout": 0.2,
-  "sinusoidal_pos_embds": false,
-  "tie_weights_": true,
   "torch_dtype": "float32",
   "transformers_version": "4.32.1",
   "vocab_size": 30522
 }

 {
+  "_name_or_path": "bert-base-uncased",
   "architectures": [
+    "BertForSequenceClassification"
   ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
   "id2label": {
     "0": "Andy",
     "1": "Angela",
     "14": "Toby"
   },
   "initializer_range": 0.02,
+  "intermediate_size": 3072,
   "label2id": {
     "Andy": 0,
     "Angela": 1,
     "Ryan": 13,
     "Toby": 14
   },
+  "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
   "pad_token_id": 0,
+  "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "torch_dtype": "float32",
   "transformers_version": "4.32.1",
+  "type_vocab_size": 2,
+  "use_cache": true,
   "vocab_size": 30522
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4f6e7388bce18b2b605553aea45357ee7a822d9f49d16d49e39eb9bbaa29bade
-size 267894125

 version https://git-lfs.github.com/spec/v1
+oid sha256:a684c06ce3d6f306726bd49fc83c37e924bfc58fa168409e39a80f71a31bbf03
+size 438040689

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a6485da611124e3d8ce3a90f9e543316e68cc53c2a3f561390488a73fcbbd490
 size 4027

 version https://git-lfs.github.com/spec/v1
+oid sha256:4f75199ada056e7250135951a860537241a5618166c68d833060a1c1cf7d7686
 size 4027