bigmorning committed on
Commit
868ff31
1 Parent(s): b83c87f

Upload TFWhisperForConditionalGeneration

Browse files
Files changed (3) hide show
  1. README.md +71 -0
  2. config.json +92 -0
  3. tf_model.h5 +3 -0
README.md ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - generated_from_keras_callback
5
+ model-index:
6
+ - name: whisper_werbest
7
+ results: []
8
+ ---
9
+
10
+ <!-- This model card has been generated automatically according to the information Keras had access to. You should
11
+ probably proofread and complete it, then remove this comment. -->
12
+
13
+ # whisper_werbest
14
+
15
+ This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on an unknown dataset.
16
+ It achieves the following results on the training and evaluation sets at the final epoch:
17
+ - Train Loss: 0.3071
18
+ - Train Accuracy: 0.0324
19
+ - Train Wermet: 1.7931
20
+ - Validation Loss: 0.5766
21
+ - Validation Accuracy: 0.0312
22
+ - Validation Wermet: 1.5663
23
+ - Epoch: 14
24
+
25
+ ## Model description
26
+
27
+ More information needed
28
+
29
+ ## Intended uses & limitations
30
+
31
+ More information needed
32
+
33
+ ## Training and evaluation data
34
+
35
+ More information needed
36
+
37
+ ## Training procedure
38
+
39
+ ### Training hyperparameters
40
+
41
+ The following hyperparameters were used during training:
42
+ - optimizer: {'name': 'AdamWeightDecay', 'learning_rate': 1e-05, 'decay': 0.0, 'beta_1': 0.9, 'beta_2': 0.999, 'epsilon': 1e-07, 'amsgrad': False, 'weight_decay_rate': 0.01}
43
+ - training_precision: float32
44
+
45
+ ### Training results
46
+
47
+ | Train Loss | Train Accuracy | Train Wermet | Validation Loss | Validation Accuracy | Validation Wermet | Epoch |
48
+ |:----------:|:--------------:|:------------:|:---------------:|:-------------------:|:-----------------:|:-----:|
49
+ | 5.0795 | 0.0116 | 43.8776 | 4.4395 | 0.0122 | 35.4119 | 0 |
50
+ | 4.3059 | 0.0131 | 29.7976 | 4.0311 | 0.0143 | 26.0070 | 1 |
51
+ | 3.8871 | 0.0148 | 19.3999 | 3.6500 | 0.0158 | 19.2186 | 2 |
52
+ | 3.0943 | 0.0184 | 18.3704 | 2.3327 | 0.0226 | 22.5034 | 3 |
53
+ | 1.8954 | 0.0240 | 16.2471 | 1.4889 | 0.0266 | 14.2782 | 4 |
54
+ | 1.2781 | 0.0269 | 8.4169 | 1.1273 | 0.0283 | 7.4581 | 5 |
55
+ | 0.9797 | 0.0283 | 4.8739 | 0.9481 | 0.0292 | 3.9451 | 6 |
56
+ | 0.8006 | 0.0293 | 2.7433 | 0.8371 | 0.0297 | 2.3065 | 7 |
57
+ | 0.6764 | 0.0299 | 2.1646 | 0.7554 | 0.0301 | 1.3005 | 8 |
58
+ | 0.5820 | 0.0305 | 1.5323 | 0.6980 | 0.0305 | 1.1238 | 9 |
59
+ | 0.5078 | 0.0310 | 1.4328 | 0.6617 | 0.0306 | 1.2793 | 10 |
60
+ | 0.4455 | 0.0314 | 1.4891 | 0.6252 | 0.0309 | 1.6833 | 11 |
61
+ | 0.3927 | 0.0317 | 1.6700 | 0.6123 | 0.0310 | 2.1091 | 12 |
62
+ | 0.3473 | 0.0321 | 1.6245 | 0.5851 | 0.0311 | 1.4109 | 13 |
63
+ | 0.3071 | 0.0324 | 1.7931 | 0.5766 | 0.0312 | 1.5663 | 14 |
64
+
65
+
66
+ ### Framework versions
67
+
68
+ - Transformers 4.25.0.dev0
69
+ - TensorFlow 2.9.2
70
+ - Datasets 2.6.1
71
+ - Tokenizers 0.13.2
config.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "openai/whisper-tiny",
3
+ "activation_dropout": 0.0,
4
+ "activation_function": "gelu",
5
+ "architectures": [
6
+ "WhisperForConditionalGeneration"
7
+ ],
8
+ "attention_dropout": 0.0,
9
+ "begin_suppress_tokens": [
10
+ 220,
11
+ 50257
12
+ ],
13
+ "bos_token_id": 50257,
14
+ "d_model": 384,
15
+ "decoder_attention_heads": 6,
16
+ "decoder_ffn_dim": 1536,
17
+ "decoder_layerdrop": 0.0,
18
+ "decoder_layers": 4,
19
+ "decoder_start_token_id": 50258,
20
+ "dropout": 0.0,
21
+ "encoder_attention_heads": 6,
22
+ "encoder_ffn_dim": 1536,
23
+ "encoder_layerdrop": 0.0,
24
+ "encoder_layers": 4,
25
+ "eos_token_id": 50257,
26
+ "forced_decoder_ids": [
27
+ [
28
+ 1,
29
+ 50289
30
+ ],
31
+ [
32
+ 2,
33
+ 50359
34
+ ],
35
+ [
36
+ 3,
37
+ 50363
38
+ ]
39
+ ],
40
+ "init_std": 0.02,
41
+ "is_encoder_decoder": true,
42
+ "max_length": 448,
43
+ "max_source_positions": 1500,
44
+ "max_target_positions": 448,
45
+ "model_type": "whisper",
46
+ "num_hidden_layers": 4,
47
+ "num_mel_bins": 80,
48
+ "pad_token_id": 50257,
49
+ "scale_embedding": false,
50
+ "suppress_tokens": [
51
+ 0,
52
+ 1,
53
+ 2,
54
+ 3,
55
+ 4,
56
+ 10968,
57
+ 10969,
58
+ 10970,
59
+ 10971,
60
+ 10972,
61
+ 10973,
62
+ 10974,
63
+ 10975,
64
+ 10976,
65
+ 10977,
66
+ 10978,
67
+ 10979,
68
+ 10980,
69
+ 10981,
70
+ 10982,
71
+ 10983,
72
+ 10984,
73
+ 10985,
74
+ 10986,
75
+ 10987,
76
+ 10988,
77
+ 10989,
78
+ 10990,
79
+ 10991,
80
+ 10992,
81
+ 10993,
82
+ 10994,
83
+ 10995,
84
+ 10996,
85
+ 10997,
86
+ 50256
87
+ ],
88
+ "torch_dtype": "float32",
89
+ "transformers_version": "4.25.0.dev0",
90
+ "use_cache": true,
91
+ "vocab_size": 51865
92
+ }
tf_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f15a211305c75fd1a6445b17f681006fbdad2ba01f294f7d4f34ba52f248fc7b
3
+ size 151253984