Training in progress, step 50

Files changed (6) hide show

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "openai/whisper-medium",
   "activation_dropout": 0.0,
   "activation_function": "gelu",
   "apply_spec_augment": false,
@@ -13,17 +13,17 @@
   ],
   "bos_token_id": 50257,
   "classifier_proj_size": 256,
-  "d_model": 1024,
-  "decoder_attention_heads": 16,
-  "decoder_ffn_dim": 4096,
   "decoder_layerdrop": 0.0,
-  "decoder_layers": 24,
   "decoder_start_token_id": 50258,
   "dropout": 0.0,
-  "encoder_attention_heads": 16,
-  "encoder_ffn_dim": 4096,
   "encoder_layerdrop": 0.0,
-  "encoder_layers": 24,
   "eos_token_id": 50257,
   "forced_decoder_ids": null,
   "init_std": 0.02,
@@ -39,7 +39,7 @@
   "max_target_positions": 448,
   "median_filter_width": 7,
   "model_type": "whisper",
-  "num_hidden_layers": 24,
   "num_mel_bins": 80,
   "pad_token_id": 50257,
   "scale_embedding": false,

 {
+  "_name_or_path": "openai/whisper-large",
   "activation_dropout": 0.0,
   "activation_function": "gelu",
   "apply_spec_augment": false,
   ],
   "bos_token_id": 50257,
   "classifier_proj_size": 256,
+  "d_model": 1280,
+  "decoder_attention_heads": 20,
+  "decoder_ffn_dim": 5120,
   "decoder_layerdrop": 0.0,
+  "decoder_layers": 32,
   "decoder_start_token_id": 50258,
   "dropout": 0.0,
+  "encoder_attention_heads": 20,
+  "encoder_ffn_dim": 5120,
   "encoder_layerdrop": 0.0,
+  "encoder_layers": 32,
   "eos_token_id": 50257,
   "forced_decoder_ids": null,
   "init_std": 0.02,
   "max_target_positions": 448,
   "median_filter_width": 7,
   "model_type": "whisper",
+  "num_hidden_layers": 32,
   "num_mel_bins": 80,
   "pad_token_id": 50257,
   "scale_embedding": false,

generation_config.json CHANGED Viewed

@@ -1,28 +1,40 @@
 {
   "alignment_heads": [
     [
-      13,
-      15
     ],
     [
-      15,
       4
     ],
     [
-      15,
-      15
     ],
     [
-      16,
-      1
     ],
     [
-      20,
-      0
     ],
     [
       23,
-      4
     ]
   ],
   "begin_suppress_tokens": [

 {
   "alignment_heads": [
     [
+      9,
+      19
+    ],
+    [
+      11,
+      2
     ],
     [
+      11,
       4
     ],
     [
+      11,
+      17
+    ],
+    [
+      22,
+      7
     ],
     [
+      22,
+      11
     ],
     [
+      22,
+      17
     ],
     [
       23,
+      2
+    ],
+    [
+      23,
+      15
     ]
   ],
   "begin_suppress_tokens": [

pytorch_model-00001-of-00002.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:195cc9a1f74856942ecb795c98d5d8ce94442b83b6a4f4d1568e05520468acc8
+size 4992943617

pytorch_model-00002-of-00002.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:159a6999a5ee6ffb36cd7020202c663d7dfcf1b76a8db3ee4fb7f49e92014d94
+size 1180727888

pytorch_model.bin.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6352b9db6d94b3c51b5c2c20b5248447d31f935aae7b9684807aa1a2b5a20c8d
 size 4664

 version https://git-lfs.github.com/spec/v1
+oid sha256:a4a2990d4d130b42cf8fbfa7ba8f574eb43332601e76d83396fa2a0897d71d41
 size 4664