End of training

Browse files

Files changed (6) hide show

README.md +4 -4
all_results.json +15 -0
eval_results.json +9 -0
runs/Dec26_11-34-23_2969512e7c3f/events.out.tfevents.1735215754.2969512e7c3f.118.1 +3 -0
train_results.json +9 -0
trainer_state.json +74 -0

README.md CHANGED Viewed

@@ -5,7 +5,7 @@ base_model: openai/whisper-small
 tags:
 - generated_from_trainer
 datasets:
-- common_voice_17_0
 metrics:
 - wer
 model-index:
@@ -15,8 +15,8 @@ model-index:
       name: Automatic Speech Recognition
       type: automatic-speech-recognition
     dataset:
-      name: common_voice_17_0
-      type: common_voice_17_0
       config: ar
       split: None
       args: ar
@@ -31,7 +31,7 @@ should probably proofread and complete it, then remove this comment. -->
 # whisper-small-ar2
-This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the common_voice_17_0 dataset.
 It achieves the following results on the evaluation set:
 - Loss: 1.2796
 - Wer: 0.7637

 tags:
 - generated_from_trainer
 datasets:
+- mozilla-foundation/common_voice_17_0
 metrics:
 - wer
 model-index:
       name: Automatic Speech Recognition
       type: automatic-speech-recognition
     dataset:
+      name: mozilla-foundation/common_voice_17_0 ar
+      type: mozilla-foundation/common_voice_17_0
       config: ar
       split: None
       args: ar
 # whisper-small-ar2
+This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the mozilla-foundation/common_voice_17_0 ar dataset.
 It achieves the following results on the evaluation set:
 - Loss: 1.2796
 - Wer: 0.7637

all_results.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+    "epoch": 41.666666666666664,
+    "eval_loss": 1.2795981168746948,
+    "eval_runtime": 20.697,
+    "eval_samples": 85,
+    "eval_samples_per_second": 4.107,
+    "eval_steps_per_second": 0.145,
+    "eval_wer": 0.763668430335097,
+    "total_flos": 4.617366645252293e+18,
+    "train_loss": 0.16236594557762146,
+    "train_runtime": 2555.1718,
+    "train_samples": 360,
+    "train_samples_per_second": 6.262,
+    "train_steps_per_second": 0.196
+}

eval_results.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "epoch": 41.666666666666664,
+    "eval_loss": 1.2795981168746948,
+    "eval_runtime": 20.697,
+    "eval_samples": 85,
+    "eval_samples_per_second": 4.107,
+    "eval_steps_per_second": 0.145,
+    "eval_wer": 0.763668430335097
+}

runs/Dec26_11-34-23_2969512e7c3f/events.out.tfevents.1735215754.2969512e7c3f.118.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4c3f2ed977aa0efad3f444d21a9e3dae57133c92c3acafdb8718f0d847d35a15
+size 406

train_results.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "epoch": 41.666666666666664,
+    "total_flos": 4.617366645252293e+18,
+    "train_loss": 0.16236594557762146,
+    "train_runtime": 2555.1718,
+    "train_samples": 360,
+    "train_samples_per_second": 6.262,
+    "train_steps_per_second": 0.196
+}

trainer_state.json ADDED Viewed

	@@ -0,0 +1,74 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 41.666666666666664,
+  "eval_steps": 250,
+  "global_step": 500,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 20.833333333333332,
+      "grad_norm": 0.165288046002388,
+      "learning_rate": 4.92e-06,
+      "loss": 0.3226,
+      "step": 250
+    },
+    {
+      "epoch": 20.833333333333332,
+      "eval_loss": 1.0812960863113403,
+      "eval_runtime": 20.5975,
+      "eval_samples_per_second": 4.127,
+      "eval_steps_per_second": 0.146,
+      "eval_wer": 0.7583774250440917,
+      "step": 250
+    },
+    {
+      "epoch": 41.666666666666664,
+      "grad_norm": 0.01815676875412464,
+      "learning_rate": 9.920000000000002e-06,
+      "loss": 0.0021,
+      "step": 500
+    },
+    {
+      "epoch": 41.666666666666664,
+      "eval_loss": 1.2795981168746948,
+      "eval_runtime": 20.8995,
+      "eval_samples_per_second": 4.067,
+      "eval_steps_per_second": 0.144,
+      "eval_wer": 0.763668430335097,
+      "step": 500
+    },
+    {
+      "epoch": 41.666666666666664,
+      "step": 500,
+      "total_flos": 4.617366645252293e+18,
+      "train_loss": 0.16236594557762146,
+      "train_runtime": 2555.1718,
+      "train_samples_per_second": 6.262,
+      "train_steps_per_second": 0.196
+    }
+  ],
+  "logging_steps": 250,
+  "max_steps": 500,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 42,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 4.617366645252293e+18,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}