CKSINGH commited on
Commit
0fc3d9a
1 Parent(s): 00022aa

Training in progress, step 100

Browse files
added_tokens.json CHANGED
@@ -1518,7 +1518,6 @@
1518
  "<|da|>": 50285,
1519
  "<|de|>": 50261,
1520
  "<|el|>": 50281,
1521
- "<|endoftext|>": 50257,
1522
  "<|en|>": 50259,
1523
  "<|es|>": 50262,
1524
  "<|et|>": 50307,
 
1518
  "<|da|>": 50285,
1519
  "<|de|>": 50261,
1520
  "<|el|>": 50281,
 
1521
  "<|en|>": 50259,
1522
  "<|es|>": 50262,
1523
  "<|et|>": 50307,
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "openai/whisper-small",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
@@ -13,17 +13,17 @@
13
  ],
14
  "bos_token_id": 50257,
15
  "classifier_proj_size": 256,
16
- "d_model": 768,
17
- "decoder_attention_heads": 12,
18
- "decoder_ffn_dim": 3072,
19
  "decoder_layerdrop": 0.0,
20
- "decoder_layers": 12,
21
  "decoder_start_token_id": 50258,
22
  "dropout": 0.0,
23
- "encoder_attention_heads": 12,
24
- "encoder_ffn_dim": 3072,
25
  "encoder_layerdrop": 0.0,
26
- "encoder_layers": 12,
27
  "eos_token_id": 50257,
28
  "forced_decoder_ids": null,
29
  "init_std": 0.02,
@@ -39,13 +39,13 @@
39
  "max_target_positions": 448,
40
  "median_filter_width": 7,
41
  "model_type": "whisper",
42
- "num_hidden_layers": 12,
43
  "num_mel_bins": 80,
44
  "pad_token_id": 50257,
45
  "scale_embedding": false,
46
  "suppress_tokens": [],
47
  "torch_dtype": "float32",
48
- "transformers_version": "4.34.0.dev0",
49
  "use_cache": true,
50
  "use_weighted_layer_sum": false,
51
  "vocab_size": 51865
 
1
  {
2
+ "_name_or_path": "openai/whisper-medium",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
 
13
  ],
14
  "bos_token_id": 50257,
15
  "classifier_proj_size": 256,
16
+ "d_model": 1024,
17
+ "decoder_attention_heads": 16,
18
+ "decoder_ffn_dim": 4096,
19
  "decoder_layerdrop": 0.0,
20
+ "decoder_layers": 24,
21
  "decoder_start_token_id": 50258,
22
  "dropout": 0.0,
23
+ "encoder_attention_heads": 16,
24
+ "encoder_ffn_dim": 4096,
25
  "encoder_layerdrop": 0.0,
26
+ "encoder_layers": 24,
27
  "eos_token_id": 50257,
28
  "forced_decoder_ids": null,
29
  "init_std": 0.02,
 
39
  "max_target_positions": 448,
40
  "median_filter_width": 7,
41
  "model_type": "whisper",
42
+ "num_hidden_layers": 24,
43
  "num_mel_bins": 80,
44
  "pad_token_id": 50257,
45
  "scale_embedding": false,
46
  "suppress_tokens": [],
47
  "torch_dtype": "float32",
48
+ "transformers_version": "4.35.0.dev0",
49
  "use_cache": true,
50
  "use_weighted_layer_sum": false,
51
  "vocab_size": 51865
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95d0d400b5f18896ab9ec5b6986c6801fafcbc26e4b4b927b838bfdc519fc199
3
+ size 3055544304
runs/Nov01_19-59-36_6dd5567327ab/events.out.tfevents.1698868783.6dd5567327ab.808.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0b53e336af676714c8fb9af37755ae590bd8f625417c38c2be4f3bdd1ee9de2
3
+ size 6029
special_tokens_map.json CHANGED
@@ -108,8 +108,32 @@
108
  "<|nocaptions|>",
109
  "<|notimestamps|>"
110
  ],
111
- "bos_token": "<|endoftext|>",
112
- "eos_token": "<|endoftext|>",
113
- "pad_token": "<|endoftext|>",
114
- "unk_token": "<|endoftext|>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
115
  }
 
108
  "<|nocaptions|>",
109
  "<|notimestamps|>"
110
  ],
111
+ "bos_token": {
112
+ "content": "<|endoftext|>",
113
+ "lstrip": false,
114
+ "normalized": true,
115
+ "rstrip": false,
116
+ "single_word": false
117
+ },
118
+ "eos_token": {
119
+ "content": "<|endoftext|>",
120
+ "lstrip": false,
121
+ "normalized": true,
122
+ "rstrip": false,
123
+ "single_word": false
124
+ },
125
+ "pad_token": {
126
+ "content": "<|endoftext|>",
127
+ "lstrip": false,
128
+ "normalized": false,
129
+ "rstrip": false,
130
+ "single_word": false
131
+ },
132
+ "unk_token": {
133
+ "content": "<|endoftext|>",
134
+ "lstrip": false,
135
+ "normalized": true,
136
+ "rstrip": false,
137
+ "single_word": false
138
+ }
139
  }
tokenizer_config.json CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7af51742e9f54fe59d9a9d5eb2ca40b6a7ca9a40d168f37a94cf3d4aa382fb51
3
- size 4219
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:853f436e2901d5c14a622f9a7697dc1e09b58c26b7f5c995cb0445300729876b
3
+ size 4728