didiudom94 committed on
Commit
fc85f00
·
verified ·
1 Parent(s): 297fc66

Training in progress, step 500

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "openai/whisper-small",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
@@ -10,17 +10,17 @@
10
  "begin_suppress_tokens": null,
11
  "bos_token_id": 50257,
12
  "classifier_proj_size": 256,
13
- "d_model": 768,
14
- "decoder_attention_heads": 12,
15
- "decoder_ffn_dim": 3072,
16
  "decoder_layerdrop": 0.0,
17
- "decoder_layers": 12,
18
  "decoder_start_token_id": 50258,
19
  "dropout": 0.0,
20
- "encoder_attention_heads": 12,
21
- "encoder_ffn_dim": 3072,
22
  "encoder_layerdrop": 0.0,
23
- "encoder_layers": 12,
24
  "eos_token_id": 50257,
25
  "forced_decoder_ids": null,
26
  "init_std": 0.02,
@@ -36,12 +36,12 @@
36
  "max_target_positions": 448,
37
  "median_filter_width": 7,
38
  "model_type": "whisper",
39
- "num_hidden_layers": 12,
40
  "num_mel_bins": 80,
41
  "pad_token_id": 50257,
42
  "scale_embedding": false,
43
  "torch_dtype": "float32",
44
- "transformers_version": "4.47.1",
45
  "use_cache": false,
46
  "use_weighted_layer_sum": false,
47
  "vocab_size": 51865
 
1
  {
2
+ "_name_or_path": "openai/whisper-medium",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
 
10
  "begin_suppress_tokens": null,
11
  "bos_token_id": 50257,
12
  "classifier_proj_size": 256,
13
+ "d_model": 1024,
14
+ "decoder_attention_heads": 16,
15
+ "decoder_ffn_dim": 4096,
16
  "decoder_layerdrop": 0.0,
17
+ "decoder_layers": 24,
18
  "decoder_start_token_id": 50258,
19
  "dropout": 0.0,
20
+ "encoder_attention_heads": 16,
21
+ "encoder_ffn_dim": 4096,
22
  "encoder_layerdrop": 0.0,
23
+ "encoder_layers": 24,
24
  "eos_token_id": 50257,
25
  "forced_decoder_ids": null,
26
  "init_std": 0.02,
 
36
  "max_target_positions": 448,
37
  "median_filter_width": 7,
38
  "model_type": "whisper",
39
+ "num_hidden_layers": 24,
40
  "num_mel_bins": 80,
41
  "pad_token_id": 50257,
42
  "scale_embedding": false,
43
  "torch_dtype": "float32",
44
+ "transformers_version": "4.45.2",
45
  "use_cache": false,
46
  "use_weighted_layer_sum": false,
47
  "vocab_size": 51865
generation_config.json CHANGED
@@ -1,44 +1,28 @@
1
  {
2
  "alignment_heads": [
3
  [
4
- 5,
5
- 3
6
  ],
7
  [
8
- 5,
9
- 9
10
- ],
11
- [
12
- 8,
13
- 0
14
- ],
15
- [
16
- 8,
17
  4
18
  ],
19
  [
20
- 8,
21
- 7
22
  ],
23
  [
24
- 8,
25
- 8
26
  ],
27
  [
28
- 9,
29
  0
30
  ],
31
  [
32
- 9,
33
- 7
34
- ],
35
- [
36
- 9,
37
- 9
38
- ],
39
- [
40
- 10,
41
- 5
42
  ]
43
  ],
44
  "begin_suppress_tokens": [
@@ -167,10 +151,9 @@
167
  "prev_sot_token_id": 50361,
168
  "return_timestamps": false,
169
  "suppress_tokens": [],
170
- "task": "translate",
171
  "task_to_id": {
172
  "transcribe": 50359,
173
  "translate": 50358
174
  },
175
- "transformers_version": "4.47.1"
176
  }
 
1
  {
2
  "alignment_heads": [
3
  [
4
+ 13,
5
+ 15
6
  ],
7
  [
8
+ 15,
 
 
 
 
 
 
 
 
9
  4
10
  ],
11
  [
12
+ 15,
13
+ 15
14
  ],
15
  [
16
+ 16,
17
+ 1
18
  ],
19
  [
20
+ 20,
21
  0
22
  ],
23
  [
24
+ 23,
25
+ 4
 
 
 
 
 
 
 
 
26
  ]
27
  ],
28
  "begin_suppress_tokens": [
 
151
  "prev_sot_token_id": 50361,
152
  "return_timestamps": false,
153
  "suppress_tokens": [],
 
154
  "task_to_id": {
155
  "transcribe": 50359,
156
  "translate": 50358
157
  },
158
+ "transformers_version": "4.45.2"
159
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bdefad703740be8e8fc727ef0190c02293f995d5409e2629a0fa7025711f8887
3
- size 966995080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d466755a1a30d434549d67e057edcbcbd5f1a7102acec7cb0879edeeba5d44b0
3
+ size 3055544304
runs/Jan08_19-13-32_c402324bf046/events.out.tfevents.1736363666.c402324bf046.1243.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59839f30bface808efd878b93243c1dddf0ddcb5e271a7c00e19043df938c489
3
+ size 10311
tokenizer_config.json CHANGED
@@ -12980,7 +12980,6 @@
12980
  "clean_up_tokenization_spaces": true,
12981
  "eos_token": "<|endoftext|>",
12982
  "errors": "replace",
12983
- "extra_special_tokens": {},
12984
  "model_max_length": 1024,
12985
  "pad_token": "<|endoftext|>",
12986
  "processor_class": "WhisperProcessor",
 
12980
  "clean_up_tokenization_spaces": true,
12981
  "eos_token": "<|endoftext|>",
12982
  "errors": "replace",
 
12983
  "model_max_length": 1024,
12984
  "pad_token": "<|endoftext|>",
12985
  "processor_class": "WhisperProcessor",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:372e07cee47c45bcdd99e97e1b2703a6f6de7c5aa4679f0b1cdbb5af398ea79c
3
- size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8ec4a8c94855f951db9e8fdbf01881b00e1cd380781a427edc3562bec4a1238
3
+ size 5368