Upload model with metrics - 2024-12-12 01:56

Browse files

Files changed (11) hide show

README.md +24 -7
checkpoint-35/model.safetensors +1 -1
checkpoint-35/trainer_state.json +19 -19
checkpoint-35/training_args.bin +3 -0
checkpoint-64/model.safetensors +1 -1
checkpoint-64/trainer_state.json +19 -19
checkpoint-64/training_args.bin +3 -0
metrics.json +19 -20
model.safetensors +1 -1
trainer_state.json +23 -23
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -30,6 +30,30 @@ This model is trained for document classification using vision transformers (DiT
 * Learning Rate Schedule: cosine_with_restarts
 * Warmup Ratio: 0.1
 ## Usage
 ```python
@@ -48,10 +72,3 @@ inputs = processor(image, return_tensors="pt")
 outputs = model(**inputs)
 predicted_label = outputs.logits.argmax(-1).item()
 ```
-## Model Performance
-The model was evaluated on a held-out test set. The metrics above show the model's performance on both training and evaluation data. Key metrics to note:
-- Accuracy: Overall classification accuracy
-- F1 Score: Weighted average F1-score across all classes
-- Precision and Recall: Weighted averages across all classes

 * Learning Rate Schedule: cosine_with_restarts
 * Warmup Ratio: 0.1
+## Training and Evaluation Metrics
+### Training Metrics
+* Loss: 5.2299
+* Grad Norm: 5.5809
+* Learning Rate: 0.0010
+* Epoch: 0.5426
+* Step: 35.0000
+### Evaluation Metrics
+* Loss: 5.0066
+* Accuracy: 0.1351
+* Weighted F1: 0.0662
+* Micro F1: 0.1351
+* Macro F1: 0.0380
+* Weighted Recall: 0.1351
+* Micro Recall: 0.1351
+* Macro Recall: 0.0646
+* Weighted Precision: 0.0548
+* Micro Precision: 0.1351
+* Macro Precision: 0.0333
+* Runtime: 8.2574
+* Samples Per Second: 441.1820
+* Steps Per Second: 3.5120
 ## Usage
 ```python
 outputs = model(**inputs)
 predicted_label = outputs.logits.argmax(-1).item()
 ```

checkpoint-35/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:40862837ac36823a66434d0e8fb1b8dcebd62b09379dec3f443c3d4180c26d6f
 size 1213526036

 version https://git-lfs.github.com/spec/v1
+oid sha256:e72a88f97c761c0a531cb086303001d50691997a2b12f53e5ba97ac052c09560
 size 1213526036

checkpoint-35/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.13203403788086743,
   "best_model_checkpoint": "ds3-img-classification/checkpoint-35",
   "epoch": 0.5426356589147286,
   "eval_steps": 35,
@@ -10,34 +10,34 @@
   "log_history": [
     {
       "epoch": 0.015503875968992248,
-      "grad_norm": 13.281591415405273,
       "learning_rate": 0.0002857142857142857,
-      "loss": 5.8916,
       "step": 1
     },
     {
       "epoch": 0.5426356589147286,
-      "grad_norm": 4.951363563537598,
       "learning_rate": 0.0010275543423681622,
-      "loss": 5.1595,
       "step": 35
     },
     {
       "epoch": 0.5426356589147286,
-      "eval_accuracy": 0.13203403788086743,
-      "eval_loss": 5.00415563583374,
-      "eval_macro_f1": 0.03707599079404095,
-      "eval_macro_precision": 0.05261629127568818,
-      "eval_macro_recall": 0.06397651980374536,
-      "eval_micro_f1": 0.13203403788086743,
-      "eval_micro_precision": 0.13203403788086743,
-      "eval_micro_recall": 0.13203403788086743,
-      "eval_runtime": 8.4066,
-      "eval_samples_per_second": 433.352,
-      "eval_steps_per_second": 3.45,
-      "eval_weighted_f1": 0.054356566877609806,
-      "eval_weighted_precision": 0.06787536777484662,
-      "eval_weighted_recall": 0.13203403788086743,
       "step": 35
     }
   ],

 {
+  "best_metric": 0.1350535273126544,
   "best_model_checkpoint": "ds3-img-classification/checkpoint-35",
   "epoch": 0.5426356589147286,
   "eval_steps": 35,
   "log_history": [
     {
       "epoch": 0.015503875968992248,
+      "grad_norm": 16.251585006713867,
       "learning_rate": 0.0002857142857142857,
+      "loss": 6.0665,
       "step": 1
     },
     {
       "epoch": 0.5426356589147286,
+      "grad_norm": 5.580934524536133,
       "learning_rate": 0.0010275543423681622,
+      "loss": 5.2299,
       "step": 35
     },
     {
       "epoch": 0.5426356589147286,
+      "eval_accuracy": 0.1350535273126544,
+      "eval_loss": 5.006561279296875,
+      "eval_macro_f1": 0.038001266460012215,
+      "eval_macro_precision": 0.033336047367919855,
+      "eval_macro_recall": 0.06460349403258135,
+      "eval_micro_f1": 0.1350535273126544,
+      "eval_micro_precision": 0.1350535273126544,
+      "eval_micro_recall": 0.1350535273126544,
+      "eval_runtime": 8.2574,
+      "eval_samples_per_second": 441.182,
+      "eval_steps_per_second": 3.512,
+      "eval_weighted_f1": 0.0662231556079451,
+      "eval_weighted_precision": 0.054814565244902975,
+      "eval_weighted_recall": 0.1350535273126544,
       "step": 35
     }
   ],

checkpoint-35/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c6cc8ffd94025c9e00fadf213825a92f261358a56e78b613f233178b10436ef6
+size 5368

checkpoint-64/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7e71729c412a7000ba3fbaf09cdfcefe3e297c814b16c8153fc6dcab8efa3a04
 size 1213526036

 version https://git-lfs.github.com/spec/v1
+oid sha256:df2901e8559ae0de2bd216d039cc92f33736cca45db6be8c08de0bbfb4fdb663
 size 1213526036

checkpoint-64/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.13203403788086743,
   "best_model_checkpoint": "ds3-img-classification/checkpoint-35",
   "epoch": 0.9922480620155039,
   "eval_steps": 35,
@@ -10,34 +10,34 @@
   "log_history": [
     {
       "epoch": 0.015503875968992248,
-      "grad_norm": 13.281591415405273,
       "learning_rate": 0.0002857142857142857,
-      "loss": 5.8916,
       "step": 1
     },
     {
       "epoch": 0.5426356589147286,
-      "grad_norm": 4.951363563537598,
       "learning_rate": 0.0010275543423681622,
-      "loss": 5.1595,
       "step": 35
     },
     {
       "epoch": 0.5426356589147286,
-      "eval_accuracy": 0.13203403788086743,
-      "eval_loss": 5.00415563583374,
-      "eval_macro_f1": 0.03707599079404095,
-      "eval_macro_precision": 0.05261629127568818,
-      "eval_macro_recall": 0.06397651980374536,
-      "eval_micro_f1": 0.13203403788086743,
-      "eval_micro_precision": 0.13203403788086743,
-      "eval_micro_recall": 0.13203403788086743,
-      "eval_runtime": 8.4066,
-      "eval_samples_per_second": 433.352,
-      "eval_steps_per_second": 3.45,
-      "eval_weighted_f1": 0.054356566877609806,
-      "eval_weighted_precision": 0.06787536777484662,
-      "eval_weighted_recall": 0.13203403788086743,
       "step": 35
     }
   ],

 {
+  "best_metric": 0.1350535273126544,
   "best_model_checkpoint": "ds3-img-classification/checkpoint-35",
   "epoch": 0.9922480620155039,
   "eval_steps": 35,
   "log_history": [
     {
       "epoch": 0.015503875968992248,
+      "grad_norm": 16.251585006713867,
       "learning_rate": 0.0002857142857142857,
+      "loss": 6.0665,
       "step": 1
     },
     {
       "epoch": 0.5426356589147286,
+      "grad_norm": 5.580934524536133,
       "learning_rate": 0.0010275543423681622,
+      "loss": 5.2299,
       "step": 35
     },
     {
       "epoch": 0.5426356589147286,
+      "eval_accuracy": 0.1350535273126544,
+      "eval_loss": 5.006561279296875,
+      "eval_macro_f1": 0.038001266460012215,
+      "eval_macro_precision": 0.033336047367919855,
+      "eval_macro_recall": 0.06460349403258135,
+      "eval_micro_f1": 0.1350535273126544,
+      "eval_micro_precision": 0.1350535273126544,
+      "eval_micro_recall": 0.1350535273126544,
+      "eval_runtime": 8.2574,
+      "eval_samples_per_second": 441.182,
+      "eval_steps_per_second": 3.512,
+      "eval_weighted_f1": 0.0662231556079451,
+      "eval_weighted_precision": 0.054814565244902975,
+      "eval_weighted_recall": 0.1350535273126544,
       "step": 35
     }
   ],

checkpoint-64/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c6cc8ffd94025c9e00fadf213825a92f261358a56e78b613f233178b10436ef6
+size 5368

metrics.json CHANGED Viewed

@@ -1,26 +1,25 @@
 {
   "train": {
-    "train_runtime": 163.8077,
-    "train_samples_per_second": 200.149,
-    "train_steps_per_second": 0.391,
-    "total_flos": 8.978215898519175e+18,
-    "train_loss": 4.830539099872112,
-    "epoch": 0.9922480620155039
   },
   "eval": {
-    "eval_loss": 5.00415563583374,
-    "eval_accuracy": 0.13203403788086743,
-    "eval_weighted_f1": 0.054356566877609806,
-    "eval_micro_f1": 0.13203403788086743,
-    "eval_macro_f1": 0.03707599079404095,
-    "eval_weighted_recall": 0.13203403788086743,
-    "eval_micro_recall": 0.13203403788086743,
-    "eval_macro_recall": 0.06397651980374536,
-    "eval_weighted_precision": 0.06787536777484662,
-    "eval_micro_precision": 0.13203403788086743,
-    "eval_macro_precision": 0.05261629127568818,
-    "eval_runtime": 8.4066,
-    "eval_samples_per_second": 433.352,
-    "eval_steps_per_second": 3.45
   }
 }

 {
   "train": {
+    "loss": 5.2299,
+    "grad_norm": 5.580934524536133,
+    "learning_rate": 0.0010275543423681622,
+    "epoch": 0.5426356589147286,
+    "step": 35.0
   },
   "eval": {
+    "eval_loss": 5.006561279296875,
+    "eval_accuracy": 0.1350535273126544,
+    "eval_weighted_f1": 0.0662231556079451,
+    "eval_micro_f1": 0.1350535273126544,
+    "eval_macro_f1": 0.038001266460012215,
+    "eval_weighted_recall": 0.1350535273126544,
+    "eval_micro_recall": 0.1350535273126544,
+    "eval_macro_recall": 0.06460349403258135,
+    "eval_weighted_precision": 0.054814565244902975,
+    "eval_micro_precision": 0.1350535273126544,
+    "eval_macro_precision": 0.033336047367919855,
+    "eval_runtime": 8.2574,
+    "eval_samples_per_second": 441.182,
+    "eval_steps_per_second": 3.512
   }
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:40862837ac36823a66434d0e8fb1b8dcebd62b09379dec3f443c3d4180c26d6f
 size 1213526036

 version https://git-lfs.github.com/spec/v1
+oid sha256:e72a88f97c761c0a531cb086303001d50691997a2b12f53e5ba97ac052c09560
 size 1213526036

trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.13203403788086743,
   "best_model_checkpoint": "ds3-img-classification/checkpoint-35",
   "epoch": 0.9922480620155039,
   "eval_steps": 35,
@@ -10,44 +10,44 @@
   "log_history": [
     {
       "epoch": 0.015503875968992248,
-      "grad_norm": 13.281591415405273,
       "learning_rate": 0.0002857142857142857,
-      "loss": 5.8916,
       "step": 1
     },
     {
       "epoch": 0.5426356589147286,
-      "grad_norm": 4.951363563537598,
       "learning_rate": 0.0010275543423681622,
-      "loss": 5.1595,
       "step": 35
     },
     {
       "epoch": 0.5426356589147286,
-      "eval_accuracy": 0.13203403788086743,
-      "eval_loss": 5.00415563583374,
-      "eval_macro_f1": 0.03707599079404095,
-      "eval_macro_precision": 0.05261629127568818,
-      "eval_macro_recall": 0.06397651980374536,
-      "eval_micro_f1": 0.13203403788086743,
-      "eval_micro_precision": 0.13203403788086743,
-      "eval_micro_recall": 0.13203403788086743,
-      "eval_runtime": 8.4066,
-      "eval_samples_per_second": 433.352,
-      "eval_steps_per_second": 3.45,
-      "eval_weighted_f1": 0.054356566877609806,
-      "eval_weighted_precision": 0.06787536777484662,
-      "eval_weighted_recall": 0.13203403788086743,
       "step": 35
     },
     {
       "epoch": 0.9922480620155039,
       "step": 64,
       "total_flos": 8.978215898519175e+18,
-      "train_loss": 4.830539099872112,
-      "train_runtime": 163.8077,
-      "train_samples_per_second": 200.149,
-      "train_steps_per_second": 0.391
     }
   ],
   "logging_steps": 35,

 {
+  "best_metric": 0.1350535273126544,
   "best_model_checkpoint": "ds3-img-classification/checkpoint-35",
   "epoch": 0.9922480620155039,
   "eval_steps": 35,
   "log_history": [
     {
       "epoch": 0.015503875968992248,
+      "grad_norm": 16.251585006713867,
       "learning_rate": 0.0002857142857142857,
+      "loss": 6.0665,
       "step": 1
     },
     {
       "epoch": 0.5426356589147286,
+      "grad_norm": 5.580934524536133,
       "learning_rate": 0.0010275543423681622,
+      "loss": 5.2299,
       "step": 35
     },
     {
       "epoch": 0.5426356589147286,
+      "eval_accuracy": 0.1350535273126544,
+      "eval_loss": 5.006561279296875,
+      "eval_macro_f1": 0.038001266460012215,
+      "eval_macro_precision": 0.033336047367919855,
+      "eval_macro_recall": 0.06460349403258135,
+      "eval_micro_f1": 0.1350535273126544,
+      "eval_micro_precision": 0.1350535273126544,
+      "eval_micro_recall": 0.1350535273126544,
+      "eval_runtime": 8.2574,
+      "eval_samples_per_second": 441.182,
+      "eval_steps_per_second": 3.512,
+      "eval_weighted_f1": 0.0662231556079451,
+      "eval_weighted_precision": 0.054814565244902975,
+      "eval_weighted_recall": 0.1350535273126544,
       "step": 35
     },
     {
       "epoch": 0.9922480620155039,
       "step": 64,
       "total_flos": 8.978215898519175e+18,
+      "train_loss": 4.950647212564945,
+      "train_runtime": 163.8995,
+      "train_samples_per_second": 200.037,
+      "train_steps_per_second": 0.39
     }
   ],
   "logging_steps": 35,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f20e468d961bf3f2e3584ef964e567145fd00284f9814774d5cd6ba9208eb7fe
 size 5368

 version https://git-lfs.github.com/spec/v1
+oid sha256:c6cc8ffd94025c9e00fadf213825a92f261358a56e78b613f233178b10436ef6
 size 5368