diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..906dac99cb514c79383c3ad20d4b1f946e5dd321 --- /dev/null +++ b/README.md @@ -0,0 +1,63 @@ +--- +tags: +- generated_from_trainer +metrics: +- wer +model-index: +- name: whisper-tiny-hi2_test + results: [] +--- + + + +# whisper-tiny-hi2_test + +This model was trained from scratch on the None dataset. +It achieves the following results on the evaluation set: +- Loss: 0.6505 +- Wer: 69.9890 + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 1e-05 +- train_batch_size: 32 +- eval_batch_size: 1 +- seed: 42 +- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08 +- lr_scheduler_type: linear +- training_steps: 200 +- mixed_precision_training: Native AMP + +### Training results + +| Training Loss | Epoch | Step | Validation Loss | Wer | +|:-------------:|:-----:|:----:|:---------------:|:-------:| +| 1.2169 | 1.25 | 40 | 1.0360 | 91.6081 | +| 0.7302 | 2.5 | 80 | 0.7369 | 79.8035 | +| 0.5917 | 3.75 | 120 | 0.6505 | 69.9890 | +| 0.5156 | 5.0 | 160 | 0.6157 | 70.4293 | +| 0.481 | 6.25 | 200 | 0.6051 | 70.0398 | + + +### Framework versions + +- Transformers 4.41.1 +- Pytorch 2.3.1+cu121 +- Datasets 2.19.1 +- Tokenizers 0.19.1 diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1fd81577f3d2ead4fc609557a3a9fa1d7916ef63 --- /dev/null +++ b/config.json @@ -0,0 +1,52 @@ +{ + "_name_or_path": "openai/whisper-tiny", + "activation_dropout": 0.0, + "activation_function": "gelu", + "apply_spec_augment": false, + "architectures": [ + "WhisperForConditionalGeneration" + ], + "attention_dropout": 0.0, + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "classifier_proj_size": 256, + "d_model": 384, + "decoder_attention_heads": 6, + "decoder_ffn_dim": 1536, + "decoder_layerdrop": 0.0, + "decoder_layers": 4, + "decoder_start_token_id": 50258, + "dropout": 0.0, + "encoder_attention_heads": 6, + "encoder_ffn_dim": 1536, + "encoder_layerdrop": 0.0, + "encoder_layers": 4, + "eos_token_id": 50257, + "forced_decoder_ids": null, + "init_std": 0.02, + "is_encoder_decoder": true, + "mask_feature_length": 10, + "mask_feature_min_masks": 0, + "mask_feature_prob": 0.0, + "mask_time_length": 10, + "mask_time_min_masks": 2, + "mask_time_prob": 0.05, + "max_length": 448, + "max_source_positions": 1500, + "max_target_positions": 448, + "median_filter_width": 7, + "model_type": "whisper", + "num_hidden_layers": 4, + "num_mel_bins": 80, + "pad_token_id": 50257, + "scale_embedding": false, + "suppress_tokens": [], + "torch_dtype": "float32", + "transformers_version": "4.41.1", + "use_cache": true, + "use_weighted_layer_sum": false, + "vocab_size": 51865 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d286bdf1e0677a78ae4dc92903472de5fe668ef --- /dev/null +++ b/generation_config.json @@ -0,0 +1,248 @@ +{ + "alignment_heads": [ + [ + 2, + 2 + ], + [ + 3, + 0 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ], + [ + 3, + 4 + ], + [ + 3, + 5 + ] + ], + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "decoder_start_token_id": 50258, + "eos_token_id": 50257, + "forced_decoder_ids": [ + [ + 1, + null + ], + [ + 2, + 50359 + ] + ], + "is_multilingual": true, + "lang_to_id": { + "<|af|>": 50327, + "<|am|>": 50334, + "<|ar|>": 50272, + "<|as|>": 50350, + "<|az|>": 50304, + "<|ba|>": 50355, + "<|be|>": 50330, + "<|bg|>": 50292, + "<|bn|>": 50302, + "<|bo|>": 50347, + "<|br|>": 50309, + "<|bs|>": 50315, + "<|ca|>": 50270, + "<|cs|>": 50283, + "<|cy|>": 50297, + "<|da|>": 50285, + "<|de|>": 50261, + "<|el|>": 50281, + "<|en|>": 50259, + "<|es|>": 50262, + "<|et|>": 50307, + "<|eu|>": 50310, + "<|fa|>": 50300, + "<|fi|>": 50277, + "<|fo|>": 50338, + "<|fr|>": 50265, + "<|gl|>": 50319, + "<|gu|>": 50333, + "<|haw|>": 50352, + "<|ha|>": 50354, + "<|he|>": 50279, + "<|hi|>": 50276, + "<|hr|>": 50291, + "<|ht|>": 50339, + "<|hu|>": 50286, + "<|hy|>": 50312, + "<|id|>": 50275, + "<|is|>": 50311, + "<|it|>": 50274, + "<|ja|>": 50266, + "<|jw|>": 50356, + "<|ka|>": 50329, + "<|kk|>": 50316, + "<|km|>": 50323, + "<|kn|>": 50306, + "<|ko|>": 50264, + "<|la|>": 50294, + "<|lb|>": 50345, + "<|ln|>": 50353, + "<|lo|>": 50336, + "<|lt|>": 50293, + "<|lv|>": 50301, + "<|mg|>": 50349, + "<|mi|>": 50295, + "<|mk|>": 50308, + "<|ml|>": 50296, + "<|mn|>": 50314, + "<|mr|>": 50320, + "<|ms|>": 50282, + "<|mt|>": 50343, + "<|my|>": 50346, + "<|ne|>": 50313, + "<|nl|>": 50271, + "<|nn|>": 50342, + "<|no|>": 50288, + "<|oc|>": 50328, + "<|pa|>": 50321, + "<|pl|>": 50269, + "<|ps|>": 50340, + "<|pt|>": 50267, + "<|ro|>": 50284, + "<|ru|>": 50263, + "<|sa|>": 50344, + "<|sd|>": 50332, + "<|si|>": 50322, + "<|sk|>": 50298, + "<|sl|>": 50305, + "<|sn|>": 50324, + "<|so|>": 50326, + "<|sq|>": 50317, + "<|sr|>": 50303, + "<|su|>": 50357, + "<|sv|>": 50273, + "<|sw|>": 50318, + "<|ta|>": 50287, + "<|te|>": 50299, + "<|tg|>": 50331, + "<|th|>": 50289, + "<|tk|>": 50341, + "<|tl|>": 50348, + "<|tr|>": 50268, + "<|tt|>": 50351, + "<|uk|>": 50280, + "<|ur|>": 50290, + "<|uz|>": 50337, + "<|vi|>": 50278, + "<|yi|>": 50335, + "<|yo|>": 50325, + "<|zh|>": 50260 + }, + "max_initial_timestamp_index": 50, + "max_length": 448, + "no_timestamps_token_id": 50363, + "pad_token_id": 50257, + "prev_sot_token_id": 50361, + "return_timestamps": false, + "suppress_tokens": [ + 1, + 2, + 7, + 8, + 9, + 10, + 14, + 25, + 26, + 27, + 28, + 29, + 31, + 58, + 59, + 60, + 61, + 62, + 63, + 90, + 91, + 92, + 93, + 359, + 503, + 522, + 542, + 873, + 893, + 902, + 918, + 922, + 931, + 1350, + 1853, + 1982, + 2460, + 2627, + 3246, + 3253, + 3268, + 3536, + 3846, + 3961, + 4183, + 4667, + 6585, + 6647, + 7273, + 9061, + 9383, + 10428, + 10929, + 11938, + 12033, + 12331, + 12562, + 13793, + 14157, + 14635, + 15265, + 15618, + 16553, + 16604, + 18362, + 18956, + 20075, + 21675, + 22520, + 26130, + 26161, + 26435, + 28279, + 29464, + 31650, + 32302, + 32470, + 36865, + 42863, + 47425, + 49870, + 50254, + 50258, + 50358, + 50359, + 50360, + 50361, + 50362 + ], + "task_to_id": { + "transcribe": 50359, + "translate": 50358 + }, + "transformers_version": "4.41.1" +} diff --git a/model.safetensors b/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0bc8697c8e8add0d2b41608e619039eacd5da941 --- /dev/null +++ b/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d190ef9c83448c09f88c0d4fc1c930eed6a8903a60639390d6b1ba2a9601942 +size 151061672 diff --git a/preprocessor_config.json b/preprocessor_config.json new file mode 100644 index 0000000000000000000000000000000000000000..91876762a536a746d268353c5cba57286e76b058 --- /dev/null +++ b/preprocessor_config.json @@ -0,0 +1,14 @@ +{ + "chunk_length": 30, + "feature_extractor_type": "WhisperFeatureExtractor", + "feature_size": 80, + "hop_length": 160, + "n_fft": 400, + "n_samples": 480000, + "nb_max_frames": 3000, + "padding_side": "right", + "padding_value": 0.0, + "processor_class": "WhisperProcessor", + "return_attention_mask": false, + "sampling_rate": 16000 +} diff --git a/runs/Jun19_20-28-38_bharatsahaiyak-test/events.out.tfevents.1718828918.bharatsahaiyak-test.421665.1 b/runs/Jun19_20-28-38_bharatsahaiyak-test/events.out.tfevents.1718828918.bharatsahaiyak-test.421665.1 new file mode 100644 index 0000000000000000000000000000000000000000..e6e84335c9a84c2ad8c124882c6d74a92abc03cd --- /dev/null +++ b/runs/Jun19_20-28-38_bharatsahaiyak-test/events.out.tfevents.1718828918.bharatsahaiyak-test.421665.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:510cd619e1c6debdc2e3ec4cfbe77fda3f0ce35d267c20bf1f2b4d15cd7c1d18 +size 5660 diff --git a/runs/Jun19_20-31-09_bharatsahaiyak-test/events.out.tfevents.1718829070.bharatsahaiyak-test.422770.0 b/runs/Jun19_20-31-09_bharatsahaiyak-test/events.out.tfevents.1718829070.bharatsahaiyak-test.422770.0 new file mode 100644 index 0000000000000000000000000000000000000000..aa7acbe18e19a2f838ad238e9449fb9c1b866921 --- /dev/null +++ b/runs/Jun19_20-31-09_bharatsahaiyak-test/events.out.tfevents.1718829070.bharatsahaiyak-test.422770.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b52aa63e09164dfe4fa7d470a9fc7a5109ebabf94b247ac53600532d4e8940f4 +size 7003 diff --git a/runs/Jun19_21-03-46_bharatsahaiyak-test/events.out.tfevents.1718831027.bharatsahaiyak-test.422770.1 b/runs/Jun19_21-03-46_bharatsahaiyak-test/events.out.tfevents.1718831027.bharatsahaiyak-test.422770.1 new file mode 100644 index 0000000000000000000000000000000000000000..a9f554dfe41960bc7a61a3481dbfe73713bffb0e --- /dev/null +++ b/runs/Jun19_21-03-46_bharatsahaiyak-test/events.out.tfevents.1718831027.bharatsahaiyak-test.422770.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f04b2cf982a47b2cafe36be02f0c833cd85f281766e17ed44ef993ea66aed9c5 +size 5656 diff --git a/runs/Jun19_21-12-37_bharatsahaiyak-test/events.out.tfevents.1718831558.bharatsahaiyak-test.422770.2 b/runs/Jun19_21-12-37_bharatsahaiyak-test/events.out.tfevents.1718831558.bharatsahaiyak-test.422770.2 new file mode 100644 index 0000000000000000000000000000000000000000..2ca41bf64584e8d3e840d6f171f87b55148df215 --- /dev/null +++ b/runs/Jun19_21-12-37_bharatsahaiyak-test/events.out.tfevents.1718831558.bharatsahaiyak-test.422770.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22ea635942e2833956fe030d25656abec1c28d64b475185a0040644a0450bf39 +size 7005 diff --git a/runs/Jun19_21-32-10_bharatsahaiyak-test/events.out.tfevents.1718832731.bharatsahaiyak-test.422770.3 b/runs/Jun19_21-32-10_bharatsahaiyak-test/events.out.tfevents.1718832731.bharatsahaiyak-test.422770.3 new file mode 100644 index 0000000000000000000000000000000000000000..7308280b062ef21a33ed6fb5528a5760b8a712ff --- /dev/null +++ b/runs/Jun19_21-32-10_bharatsahaiyak-test/events.out.tfevents.1718832731.bharatsahaiyak-test.422770.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d22a8f787959993dfa3fc1ac86d0b7b2fe85b423f594c5781e5312c1dd14d9a +size 9669 diff --git a/runs/Jun19_22-32-24_bharatsahaiyak-test/events.out.tfevents.1718836344.bharatsahaiyak-test.422770.4 b/runs/Jun19_22-32-24_bharatsahaiyak-test/events.out.tfevents.1718836344.bharatsahaiyak-test.422770.4 new file mode 100644 index 0000000000000000000000000000000000000000..ed5dda06c7a3e0b3107dfdf43854bfd7c5ba47be --- /dev/null +++ b/runs/Jun19_22-32-24_bharatsahaiyak-test/events.out.tfevents.1718836344.bharatsahaiyak-test.422770.4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc76fe49e19efc5f5fcccfee242a3e9fce8e65d7c571886d70a39454db49488d +size 6044 diff --git a/runs/Jun20_05-30-45_bharatsahaiyak-test/events.out.tfevents.1718861446.bharatsahaiyak-test.471347.0 b/runs/Jun20_05-30-45_bharatsahaiyak-test/events.out.tfevents.1718861446.bharatsahaiyak-test.471347.0 new file mode 100644 index 0000000000000000000000000000000000000000..f0dc7f5ccc12250a237e562ceea83cb74135ce15 --- /dev/null +++ b/runs/Jun20_05-30-45_bharatsahaiyak-test/events.out.tfevents.1718861446.bharatsahaiyak-test.471347.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d442eb775d65605a5cabaa49c274315d892f3b8c368a8503a14fbadbaff5981 +size 5657 diff --git a/runs/Jun20_05-34-22_bharatsahaiyak-test/events.out.tfevents.1718861663.bharatsahaiyak-test.474181.0 b/runs/Jun20_05-34-22_bharatsahaiyak-test/events.out.tfevents.1718861663.bharatsahaiyak-test.474181.0 new file mode 100644 index 0000000000000000000000000000000000000000..6bb5863593f5b7799e85f79fed197c4d7bec2509 --- /dev/null +++ b/runs/Jun20_05-34-22_bharatsahaiyak-test/events.out.tfevents.1718861663.bharatsahaiyak-test.474181.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7cd143c23d4b672024605f3d389594054ab531878716d504eace6c370ff1611 +size 7316 diff --git a/runs/Jun20_06-21-19_bharatsahaiyak-test/events.out.tfevents.1718864480.bharatsahaiyak-test.505065.0 b/runs/Jun20_06-21-19_bharatsahaiyak-test/events.out.tfevents.1718864480.bharatsahaiyak-test.505065.0 new file mode 100644 index 0000000000000000000000000000000000000000..c8d6e9ad9287326b95e2b9b315a21ad1b3b38384 --- /dev/null +++ b/runs/Jun20_06-21-19_bharatsahaiyak-test/events.out.tfevents.1718864480.bharatsahaiyak-test.505065.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c70425037cb1abacb669a47c355fd90bc51ef0645990611c2049c753bc1e160 +size 6383 diff --git a/runs/Jun20_06-40-00_bharatsahaiyak-test/events.out.tfevents.1718865601.bharatsahaiyak-test.505065.1 b/runs/Jun20_06-40-00_bharatsahaiyak-test/events.out.tfevents.1718865601.bharatsahaiyak-test.505065.1 new file mode 100644 index 0000000000000000000000000000000000000000..c53ed8552021379cecb5cf80ea87f9d976bd8420 --- /dev/null +++ b/runs/Jun20_06-40-00_bharatsahaiyak-test/events.out.tfevents.1718865601.bharatsahaiyak-test.505065.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:394e617e5ea8c4e041ff5135453bb7da82866f0c8d8878d0427393541faf96a6 +size 9669 diff --git a/runs/Jun20_07-41-26_bharatsahaiyak-test/events.out.tfevents.1718869287.bharatsahaiyak-test.505065.2 b/runs/Jun20_07-41-26_bharatsahaiyak-test/events.out.tfevents.1718869287.bharatsahaiyak-test.505065.2 new file mode 100644 index 0000000000000000000000000000000000000000..abe9a198604e1c4d37982a6bddccc75439b1ce20 --- /dev/null +++ b/runs/Jun20_07-41-26_bharatsahaiyak-test/events.out.tfevents.1718869287.bharatsahaiyak-test.505065.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2cf272083b8469c853e9a6c0a41ad5158ed6496bc17d433226be899ab555562 +size 6044 diff --git a/runs/Jun20_07-41-26_bharatsahaiyak-test/events.out.tfevents.1718869846.bharatsahaiyak-test.505065.3 b/runs/Jun20_07-41-26_bharatsahaiyak-test/events.out.tfevents.1718869846.bharatsahaiyak-test.505065.3 new file mode 100644 index 0000000000000000000000000000000000000000..7391394a819b092a130dc609964a66a574d48618 --- /dev/null +++ b/runs/Jun20_07-41-26_bharatsahaiyak-test/events.out.tfevents.1718869846.bharatsahaiyak-test.505065.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af5e74380fe61b2074b17ac1ccc46acd88711215ffa6bd282b205a25eafb11f +size 406 diff --git a/runs/Jun20_07-51-18_bharatsahaiyak-test/events.out.tfevents.1718869879.bharatsahaiyak-test.505065.4 b/runs/Jun20_07-51-18_bharatsahaiyak-test/events.out.tfevents.1718869879.bharatsahaiyak-test.505065.4 new file mode 100644 index 0000000000000000000000000000000000000000..8d9da00c1d94d189db48ff098bb33349d792028e --- /dev/null +++ b/runs/Jun20_07-51-18_bharatsahaiyak-test/events.out.tfevents.1718869879.bharatsahaiyak-test.505065.4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083dfc981299d8b0d10cbe7517551650074654d0598e5a7b1cbfd95b62950ced +size 6044 diff --git a/runs/Jun20_07-51-18_bharatsahaiyak-test/events.out.tfevents.1718870430.bharatsahaiyak-test.505065.5 b/runs/Jun20_07-51-18_bharatsahaiyak-test/events.out.tfevents.1718870430.bharatsahaiyak-test.505065.5 new file mode 100644 index 0000000000000000000000000000000000000000..08cec8fbe6825c7e3dcf4483f5256219ce5c9a8c --- /dev/null +++ b/runs/Jun20_07-51-18_bharatsahaiyak-test/events.out.tfevents.1718870430.bharatsahaiyak-test.505065.5 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f06dbd7e8c0b79bf7693d2402923be0924fc3b1e03021ca10a5119255c0f9f4 +size 406 diff --git a/runs/Jun20_08-01-03_bharatsahaiyak-test/events.out.tfevents.1718870463.bharatsahaiyak-test.505065.6 b/runs/Jun20_08-01-03_bharatsahaiyak-test/events.out.tfevents.1718870463.bharatsahaiyak-test.505065.6 new file mode 100644 index 0000000000000000000000000000000000000000..ddf2ee4aa29dea95b97447964b0e2f475d661230 --- /dev/null +++ b/runs/Jun20_08-01-03_bharatsahaiyak-test/events.out.tfevents.1718870463.bharatsahaiyak-test.505065.6 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c0563652c8c970190e82ce248d84da5affa390018b88c9a8b0b75adaabbc49e +size 6044 diff --git a/runs/Jun20_08-01-03_bharatsahaiyak-test/events.out.tfevents.1718871013.bharatsahaiyak-test.505065.7 b/runs/Jun20_08-01-03_bharatsahaiyak-test/events.out.tfevents.1718871013.bharatsahaiyak-test.505065.7 new file mode 100644 index 0000000000000000000000000000000000000000..a7e078aca52ae63675c64fd55d6428de3e79ea7b --- /dev/null +++ b/runs/Jun20_08-01-03_bharatsahaiyak-test/events.out.tfevents.1718871013.bharatsahaiyak-test.505065.7 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872f0fc2abb888580bcbfc5bfd3c16edbb7b84458786e74c647c4cbb744913c5 +size 406 diff --git a/runs/Jun20_08-10-47_bharatsahaiyak-test/events.out.tfevents.1718871048.bharatsahaiyak-test.505065.8 b/runs/Jun20_08-10-47_bharatsahaiyak-test/events.out.tfevents.1718871048.bharatsahaiyak-test.505065.8 new file mode 100644 index 0000000000000000000000000000000000000000..052a2503d3ac918b33136cf503ad5740aee10071 --- /dev/null +++ b/runs/Jun20_08-10-47_bharatsahaiyak-test/events.out.tfevents.1718871048.bharatsahaiyak-test.505065.8 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e27dfd90e68d0373c568fd2fd895429b849cc31d965e7151bcee5bc63c5888bd +size 6044 diff --git a/runs/Jun20_08-10-47_bharatsahaiyak-test/events.out.tfevents.1718871600.bharatsahaiyak-test.505065.9 b/runs/Jun20_08-10-47_bharatsahaiyak-test/events.out.tfevents.1718871600.bharatsahaiyak-test.505065.9 new file mode 100644 index 0000000000000000000000000000000000000000..a984a8db835d3854930b992403d3650f05ea5510 --- /dev/null +++ b/runs/Jun20_08-10-47_bharatsahaiyak-test/events.out.tfevents.1718871600.bharatsahaiyak-test.505065.9 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ef2dbbbd65409ef53bc3863b7da72a6e4bca31d35fdc2ae52310b889c23e4ef +size 406 diff --git a/runs/Jun20_08-20-34_bharatsahaiyak-test/events.out.tfevents.1718871634.bharatsahaiyak-test.505065.10 b/runs/Jun20_08-20-34_bharatsahaiyak-test/events.out.tfevents.1718871634.bharatsahaiyak-test.505065.10 new file mode 100644 index 0000000000000000000000000000000000000000..945e7fa78376adb60d7b75954df0eb02bdca6840 --- /dev/null +++ b/runs/Jun20_08-20-34_bharatsahaiyak-test/events.out.tfevents.1718871634.bharatsahaiyak-test.505065.10 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32fa872d31dd1b73f80739537ec98f31798720bf73992336f4298524773661b6 +size 6044 diff --git a/runs/Jun20_08-20-34_bharatsahaiyak-test/events.out.tfevents.1718872186.bharatsahaiyak-test.505065.11 b/runs/Jun20_08-20-34_bharatsahaiyak-test/events.out.tfevents.1718872186.bharatsahaiyak-test.505065.11 new file mode 100644 index 0000000000000000000000000000000000000000..4bdda989ae7f2d8b85688f26b211b99aa6284bf8 --- /dev/null +++ b/runs/Jun20_08-20-34_bharatsahaiyak-test/events.out.tfevents.1718872186.bharatsahaiyak-test.505065.11 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b04a758e8279dc07c154e4e35552c1d31f2e17fad24e20445612f079969b970 +size 406 diff --git a/runs/Jun20_08-30-19_bharatsahaiyak-test/events.out.tfevents.1718872220.bharatsahaiyak-test.505065.12 b/runs/Jun20_08-30-19_bharatsahaiyak-test/events.out.tfevents.1718872220.bharatsahaiyak-test.505065.12 new file mode 100644 index 0000000000000000000000000000000000000000..b69b83fe4746ae3cd5465b0f7b4b2b83c90cca47 --- /dev/null +++ b/runs/Jun20_08-30-19_bharatsahaiyak-test/events.out.tfevents.1718872220.bharatsahaiyak-test.505065.12 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36de5cbe836b3aa9a3020223a41b2e1b7f68f06f2409002fd638f68f2e7cb892 +size 6044 diff --git a/runs/Jun20_14-52-54_bharatsahaiyak-test/events.out.tfevents.1718895174.bharatsahaiyak-test.584004.0 b/runs/Jun20_14-52-54_bharatsahaiyak-test/events.out.tfevents.1718895174.bharatsahaiyak-test.584004.0 new file mode 100644 index 0000000000000000000000000000000000000000..0e9e52fbd4d7e60b602b49d776e2432b459b874f --- /dev/null +++ b/runs/Jun20_14-52-54_bharatsahaiyak-test/events.out.tfevents.1718895174.bharatsahaiyak-test.584004.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb04e0955c5f60c5533bfc3ab486c4cd2d1985b39d4576d5fe32cf53e6127618 +size 9666 diff --git a/runs/Jun20_15-53-41_bharatsahaiyak-test/events.out.tfevents.1718898822.bharatsahaiyak-test.584004.1 b/runs/Jun20_15-53-41_bharatsahaiyak-test/events.out.tfevents.1718898822.bharatsahaiyak-test.584004.1 new file mode 100644 index 0000000000000000000000000000000000000000..18c4309829f1dc066baf1ee929c90b1d6ea67814 --- /dev/null +++ b/runs/Jun20_15-53-41_bharatsahaiyak-test/events.out.tfevents.1718898822.bharatsahaiyak-test.584004.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0c3bea61afd7059e4bfbdc33b93fec1962be1a41673fd5707f3c3893899f6a4 +size 6041 diff --git a/runs/Jun20_15-53-41_bharatsahaiyak-test/events.out.tfevents.1718899378.bharatsahaiyak-test.584004.2 b/runs/Jun20_15-53-41_bharatsahaiyak-test/events.out.tfevents.1718899378.bharatsahaiyak-test.584004.2 new file mode 100644 index 0000000000000000000000000000000000000000..44d5982f4d833c25fd76af1df0b6ca7a38ecdd69 --- /dev/null +++ b/runs/Jun20_15-53-41_bharatsahaiyak-test/events.out.tfevents.1718899378.bharatsahaiyak-test.584004.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66096c03089eb5b6b771e373cfb9672913aa337d5d14d2236b9451e46a12ec5a +size 406 diff --git a/runs/Jun20_16-03-30_bharatsahaiyak-test/events.out.tfevents.1718899410.bharatsahaiyak-test.584004.3 b/runs/Jun20_16-03-30_bharatsahaiyak-test/events.out.tfevents.1718899410.bharatsahaiyak-test.584004.3 new file mode 100644 index 0000000000000000000000000000000000000000..102e8b5915e0d1517f8fa7df7c5412719aec79d9 --- /dev/null +++ b/runs/Jun20_16-03-30_bharatsahaiyak-test/events.out.tfevents.1718899410.bharatsahaiyak-test.584004.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d736509209f05e11f32fb53771eb5ae9685748b90d5a424b9dee1eb4bb8a12e8 +size 6041 diff --git a/runs/Jun20_16-03-30_bharatsahaiyak-test/events.out.tfevents.1718899966.bharatsahaiyak-test.584004.4 b/runs/Jun20_16-03-30_bharatsahaiyak-test/events.out.tfevents.1718899966.bharatsahaiyak-test.584004.4 new file mode 100644 index 0000000000000000000000000000000000000000..e4060ed80e93b78b65a20cbf19ee800b980364ba --- /dev/null +++ b/runs/Jun20_16-03-30_bharatsahaiyak-test/events.out.tfevents.1718899966.bharatsahaiyak-test.584004.4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6215965a67ec2a2a36bb46a58de7e0014aa9eef5c41a43aa4e8ad00b4a258ee4 +size 406 diff --git a/runs/Jun20_16-13-18_bharatsahaiyak-test/events.out.tfevents.1718899999.bharatsahaiyak-test.584004.5 b/runs/Jun20_16-13-18_bharatsahaiyak-test/events.out.tfevents.1718899999.bharatsahaiyak-test.584004.5 new file mode 100644 index 0000000000000000000000000000000000000000..8f1a8154e35b08f09dfc7bfd3e4ab488cb7b205a --- /dev/null +++ b/runs/Jun20_16-13-18_bharatsahaiyak-test/events.out.tfevents.1718899999.bharatsahaiyak-test.584004.5 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4d29399ca5e7f3f069e1775ebfab9b350737f4b1590cc98adb53dbe5cc57a7c +size 6041 diff --git a/runs/Jun20_16-13-18_bharatsahaiyak-test/events.out.tfevents.1718900554.bharatsahaiyak-test.584004.6 b/runs/Jun20_16-13-18_bharatsahaiyak-test/events.out.tfevents.1718900554.bharatsahaiyak-test.584004.6 new file mode 100644 index 0000000000000000000000000000000000000000..34add29de79ecc623980eeae616836d12bb768ea --- /dev/null +++ b/runs/Jun20_16-13-18_bharatsahaiyak-test/events.out.tfevents.1718900554.bharatsahaiyak-test.584004.6 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cce34150423b17f1193e5ac1d524306785ba726b230eab83dd387222ceeedede +size 406 diff --git a/runs/Jun20_16-23-08_bharatsahaiyak-test/events.out.tfevents.1718900588.bharatsahaiyak-test.584004.7 b/runs/Jun20_16-23-08_bharatsahaiyak-test/events.out.tfevents.1718900588.bharatsahaiyak-test.584004.7 new file mode 100644 index 0000000000000000000000000000000000000000..6c53e35d40f7ebde27a7887d23cfb21b7dfff8b0 --- /dev/null +++ b/runs/Jun20_16-23-08_bharatsahaiyak-test/events.out.tfevents.1718900588.bharatsahaiyak-test.584004.7 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:305c86f410f4372eadea70a12ca3fe7d401f5b673089185c08454f1b56789531 +size 6041 diff --git a/runs/Jun20_16-23-08_bharatsahaiyak-test/events.out.tfevents.1718901143.bharatsahaiyak-test.584004.8 b/runs/Jun20_16-23-08_bharatsahaiyak-test/events.out.tfevents.1718901143.bharatsahaiyak-test.584004.8 new file mode 100644 index 0000000000000000000000000000000000000000..3f357d6da2644bae036c2eabe253dc1204f3c826 --- /dev/null +++ b/runs/Jun20_16-23-08_bharatsahaiyak-test/events.out.tfevents.1718901143.bharatsahaiyak-test.584004.8 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0f842b9b276a5f59e3faa05114ea25e0c94b271a5b56b122ef9b64b201086cc +size 406 diff --git a/runs/Jun20_16-32-55_bharatsahaiyak-test/events.out.tfevents.1718901175.bharatsahaiyak-test.584004.9 b/runs/Jun20_16-32-55_bharatsahaiyak-test/events.out.tfevents.1718901175.bharatsahaiyak-test.584004.9 new file mode 100644 index 0000000000000000000000000000000000000000..e313b56bd2cc98d1d80d91e9db41e645471803f8 --- /dev/null +++ b/runs/Jun20_16-32-55_bharatsahaiyak-test/events.out.tfevents.1718901175.bharatsahaiyak-test.584004.9 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df447129bd81e3df977ba18126deff6e8d1b367a1929a3b49f62432b58146ad0 +size 6041 diff --git a/runs/Jun20_16-32-55_bharatsahaiyak-test/events.out.tfevents.1718901729.bharatsahaiyak-test.584004.10 b/runs/Jun20_16-32-55_bharatsahaiyak-test/events.out.tfevents.1718901729.bharatsahaiyak-test.584004.10 new file mode 100644 index 0000000000000000000000000000000000000000..b89e8881218fbc4964e0b0ef7fc5834d24c0aaa8 --- /dev/null +++ b/runs/Jun20_16-32-55_bharatsahaiyak-test/events.out.tfevents.1718901729.bharatsahaiyak-test.584004.10 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728230a75f3a023d5e7f45f5b7dfb0f4e13d18059e1efb879468a2e72d3bdc91 +size 406 diff --git a/runs/Jun20_16-42-42_bharatsahaiyak-test/events.out.tfevents.1718901763.bharatsahaiyak-test.584004.11 b/runs/Jun20_16-42-42_bharatsahaiyak-test/events.out.tfevents.1718901763.bharatsahaiyak-test.584004.11 new file mode 100644 index 0000000000000000000000000000000000000000..b3ee46a284f0b1d44823131cb59df9e73559a214 --- /dev/null +++ b/runs/Jun20_16-42-42_bharatsahaiyak-test/events.out.tfevents.1718901763.bharatsahaiyak-test.584004.11 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88263d8bf4f4560ea0333fbea3a644df31d21fd132431c2525af07a6a3b278c4 +size 6041 diff --git a/runs/Jun20_16-42-42_bharatsahaiyak-test/events.out.tfevents.1718902317.bharatsahaiyak-test.584004.12 b/runs/Jun20_16-42-42_bharatsahaiyak-test/events.out.tfevents.1718902317.bharatsahaiyak-test.584004.12 new file mode 100644 index 0000000000000000000000000000000000000000..4c84f1b53f62a2819588ab56118b2be93f8b15b1 --- /dev/null +++ b/runs/Jun20_16-42-42_bharatsahaiyak-test/events.out.tfevents.1718902317.bharatsahaiyak-test.584004.12 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12f1431903f73cb0ebc4f17b8fece3056f11fb2eeec7e7621f4a8a4db5c7e762 +size 406 diff --git a/runs/Jun20_16-52-29_bharatsahaiyak-test/events.out.tfevents.1718902350.bharatsahaiyak-test.584004.13 b/runs/Jun20_16-52-29_bharatsahaiyak-test/events.out.tfevents.1718902350.bharatsahaiyak-test.584004.13 new file mode 100644 index 0000000000000000000000000000000000000000..b9cd2b3e9cedb596a0c003301bc3ee1f36361777 --- /dev/null +++ b/runs/Jun20_16-52-29_bharatsahaiyak-test/events.out.tfevents.1718902350.bharatsahaiyak-test.584004.13 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c6ba615fc6006ea943feb79f6fbc5d14b10b8015c40ee810677aaab2942c3f +size 6041 diff --git a/runs/Jun20_16-52-29_bharatsahaiyak-test/events.out.tfevents.1718902903.bharatsahaiyak-test.584004.14 b/runs/Jun20_16-52-29_bharatsahaiyak-test/events.out.tfevents.1718902903.bharatsahaiyak-test.584004.14 new file mode 100644 index 0000000000000000000000000000000000000000..b7d393285d35f3aa5c023da9bdb13fd74672c38b --- /dev/null +++ b/runs/Jun20_16-52-29_bharatsahaiyak-test/events.out.tfevents.1718902903.bharatsahaiyak-test.584004.14 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13aa284f4c6b605fd298844950c4e9c8f4bfb84e227ac700cbce65b7209d3d91 +size 406 diff --git a/runs/Jun20_17-02-22_bharatsahaiyak-test/events.out.tfevents.1718902942.bharatsahaiyak-test.584004.15 b/runs/Jun20_17-02-22_bharatsahaiyak-test/events.out.tfevents.1718902942.bharatsahaiyak-test.584004.15 new file mode 100644 index 0000000000000000000000000000000000000000..e361712ddc753c12f3b354b9370f34c44e4533f7 --- /dev/null +++ b/runs/Jun20_17-02-22_bharatsahaiyak-test/events.out.tfevents.1718902942.bharatsahaiyak-test.584004.15 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8872bca6899d33d468cdf88461293d21683dc5c3a883495506d2dea2a1fe6875 +size 6041 diff --git a/runs/Jun20_17-02-22_bharatsahaiyak-test/events.out.tfevents.1718903497.bharatsahaiyak-test.584004.16 b/runs/Jun20_17-02-22_bharatsahaiyak-test/events.out.tfevents.1718903497.bharatsahaiyak-test.584004.16 new file mode 100644 index 0000000000000000000000000000000000000000..f6a7c043541170878e7150726949a110be56f65e --- /dev/null +++ b/runs/Jun20_17-02-22_bharatsahaiyak-test/events.out.tfevents.1718903497.bharatsahaiyak-test.584004.16 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80d6d442ac3252d42d19909bd07cf84663f8728c90281ee59d7697970a29e6a1 +size 406 diff --git a/runs/Jun20_17-12-17_bharatsahaiyak-test/events.out.tfevents.1718903538.bharatsahaiyak-test.584004.17 b/runs/Jun20_17-12-17_bharatsahaiyak-test/events.out.tfevents.1718903538.bharatsahaiyak-test.584004.17 new file mode 100644 index 0000000000000000000000000000000000000000..854ea4ad696cec2abec3a6d5e03d4c5b96493cbf --- /dev/null +++ b/runs/Jun20_17-12-17_bharatsahaiyak-test/events.out.tfevents.1718903538.bharatsahaiyak-test.584004.17 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc21cff19d8da62d157be35e39c6e543d5e06b24e395581958ad47a1b58a4f8f +size 6041 diff --git a/runs/Jun25_19-32-54_bharatsahaiyak-test/events.out.tfevents.1719343975.bharatsahaiyak-test.945044.0 b/runs/Jun25_19-32-54_bharatsahaiyak-test/events.out.tfevents.1719343975.bharatsahaiyak-test.945044.0 new file mode 100644 index 0000000000000000000000000000000000000000..1747c90a36cf384369d169249df14add2d8c8c0e --- /dev/null +++ b/runs/Jun25_19-32-54_bharatsahaiyak-test/events.out.tfevents.1719343975.bharatsahaiyak-test.945044.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee19fbbf775497fc0678744e77aee77baf82246b93eaf448a5f7b26f14254e43 +size 6383 diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..8bd81ca077d83038930c0af28a08a0f8f1541d0e --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb6a9965906076c7dada293c67702be2256eee05b35a9c0969b175f38ca2222b +size 5240 diff --git a/whisper-tiny-hi-checkpoint-1/config.json b/whisper-tiny-hi-checkpoint-1/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1fd81577f3d2ead4fc609557a3a9fa1d7916ef63 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-1/config.json @@ -0,0 +1,52 @@ +{ + "_name_or_path": "openai/whisper-tiny", + "activation_dropout": 0.0, + "activation_function": "gelu", + "apply_spec_augment": false, + "architectures": [ + "WhisperForConditionalGeneration" + ], + "attention_dropout": 0.0, + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "classifier_proj_size": 256, + "d_model": 384, + "decoder_attention_heads": 6, + "decoder_ffn_dim": 1536, + "decoder_layerdrop": 0.0, + "decoder_layers": 4, + "decoder_start_token_id": 50258, + "dropout": 0.0, + "encoder_attention_heads": 6, + "encoder_ffn_dim": 1536, + "encoder_layerdrop": 0.0, + "encoder_layers": 4, + "eos_token_id": 50257, + "forced_decoder_ids": null, + "init_std": 0.02, + "is_encoder_decoder": true, + "mask_feature_length": 10, + "mask_feature_min_masks": 0, + "mask_feature_prob": 0.0, + "mask_time_length": 10, + "mask_time_min_masks": 2, + "mask_time_prob": 0.05, + "max_length": 448, + "max_source_positions": 1500, + "max_target_positions": 448, + "median_filter_width": 7, + "model_type": "whisper", + "num_hidden_layers": 4, + "num_mel_bins": 80, + "pad_token_id": 50257, + "scale_embedding": false, + "suppress_tokens": [], + "torch_dtype": "float32", + "transformers_version": "4.41.1", + "use_cache": true, + "use_weighted_layer_sum": false, + "vocab_size": 51865 +} diff --git a/whisper-tiny-hi-checkpoint-1/generation_config.json b/whisper-tiny-hi-checkpoint-1/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d286bdf1e0677a78ae4dc92903472de5fe668ef --- /dev/null +++ b/whisper-tiny-hi-checkpoint-1/generation_config.json @@ -0,0 +1,248 @@ +{ + "alignment_heads": [ + [ + 2, + 2 + ], + [ + 3, + 0 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ], + [ + 3, + 4 + ], + [ + 3, + 5 + ] + ], + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "decoder_start_token_id": 50258, + "eos_token_id": 50257, + "forced_decoder_ids": [ + [ + 1, + null + ], + [ + 2, + 50359 + ] + ], + "is_multilingual": true, + "lang_to_id": { + "<|af|>": 50327, + "<|am|>": 50334, + "<|ar|>": 50272, + "<|as|>": 50350, + "<|az|>": 50304, + "<|ba|>": 50355, + "<|be|>": 50330, + "<|bg|>": 50292, + "<|bn|>": 50302, + "<|bo|>": 50347, + "<|br|>": 50309, + "<|bs|>": 50315, + "<|ca|>": 50270, + "<|cs|>": 50283, + "<|cy|>": 50297, + "<|da|>": 50285, + "<|de|>": 50261, + "<|el|>": 50281, + "<|en|>": 50259, + "<|es|>": 50262, + "<|et|>": 50307, + "<|eu|>": 50310, + "<|fa|>": 50300, + "<|fi|>": 50277, + "<|fo|>": 50338, + "<|fr|>": 50265, + "<|gl|>": 50319, + "<|gu|>": 50333, + "<|haw|>": 50352, + "<|ha|>": 50354, + "<|he|>": 50279, + "<|hi|>": 50276, + "<|hr|>": 50291, + "<|ht|>": 50339, + "<|hu|>": 50286, + "<|hy|>": 50312, + "<|id|>": 50275, + "<|is|>": 50311, + "<|it|>": 50274, + "<|ja|>": 50266, + "<|jw|>": 50356, + "<|ka|>": 50329, + "<|kk|>": 50316, + "<|km|>": 50323, + "<|kn|>": 50306, + "<|ko|>": 50264, + "<|la|>": 50294, + "<|lb|>": 50345, + "<|ln|>": 50353, + "<|lo|>": 50336, + "<|lt|>": 50293, + "<|lv|>": 50301, + "<|mg|>": 50349, + "<|mi|>": 50295, + "<|mk|>": 50308, + "<|ml|>": 50296, + "<|mn|>": 50314, + "<|mr|>": 50320, + "<|ms|>": 50282, + "<|mt|>": 50343, + "<|my|>": 50346, + "<|ne|>": 50313, + "<|nl|>": 50271, + "<|nn|>": 50342, + "<|no|>": 50288, + "<|oc|>": 50328, + "<|pa|>": 50321, + "<|pl|>": 50269, + "<|ps|>": 50340, + "<|pt|>": 50267, + "<|ro|>": 50284, + "<|ru|>": 50263, + "<|sa|>": 50344, + "<|sd|>": 50332, + "<|si|>": 50322, + "<|sk|>": 50298, + "<|sl|>": 50305, + "<|sn|>": 50324, + "<|so|>": 50326, + "<|sq|>": 50317, + "<|sr|>": 50303, + "<|su|>": 50357, + "<|sv|>": 50273, + "<|sw|>": 50318, + "<|ta|>": 50287, + "<|te|>": 50299, + "<|tg|>": 50331, + "<|th|>": 50289, + "<|tk|>": 50341, + "<|tl|>": 50348, + "<|tr|>": 50268, + "<|tt|>": 50351, + "<|uk|>": 50280, + "<|ur|>": 50290, + "<|uz|>": 50337, + "<|vi|>": 50278, + "<|yi|>": 50335, + "<|yo|>": 50325, + "<|zh|>": 50260 + }, + "max_initial_timestamp_index": 50, + "max_length": 448, + "no_timestamps_token_id": 50363, + "pad_token_id": 50257, + "prev_sot_token_id": 50361, + "return_timestamps": false, + "suppress_tokens": [ + 1, + 2, + 7, + 8, + 9, + 10, + 14, + 25, + 26, + 27, + 28, + 29, + 31, + 58, + 59, + 60, + 61, + 62, + 63, + 90, + 91, + 92, + 93, + 359, + 503, + 522, + 542, + 873, + 893, + 902, + 918, + 922, + 931, + 1350, + 1853, + 1982, + 2460, + 2627, + 3246, + 3253, + 3268, + 3536, + 3846, + 3961, + 4183, + 4667, + 6585, + 6647, + 7273, + 9061, + 9383, + 10428, + 10929, + 11938, + 12033, + 12331, + 12562, + 13793, + 14157, + 14635, + 15265, + 15618, + 16553, + 16604, + 18362, + 18956, + 20075, + 21675, + 22520, + 26130, + 26161, + 26435, + 28279, + 29464, + 31650, + 32302, + 32470, + 36865, + 42863, + 47425, + 49870, + 50254, + 50258, + 50358, + 50359, + 50360, + 50361, + 50362 + ], + "task_to_id": { + "transcribe": 50359, + "translate": 50358 + }, + "transformers_version": "4.41.1" +} diff --git a/whisper-tiny-hi-checkpoint-1/model.safetensors b/whisper-tiny-hi-checkpoint-1/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9aa0b456f8cd8c36c001d1d45bbe4fde21f76cff --- /dev/null +++ b/whisper-tiny-hi-checkpoint-1/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59c8982089b3ffb0f35b2a8b93a329827d3603f741f4d47ddb7a17dc5a7e5e2 +size 151061672 diff --git a/whisper-tiny-hi-checkpoint-1/preprocessor_config.json b/whisper-tiny-hi-checkpoint-1/preprocessor_config.json new file mode 100644 index 0000000000000000000000000000000000000000..91876762a536a746d268353c5cba57286e76b058 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-1/preprocessor_config.json @@ -0,0 +1,14 @@ +{ + "chunk_length": 30, + "feature_extractor_type": "WhisperFeatureExtractor", + "feature_size": 80, + "hop_length": 160, + "n_fft": 400, + "n_samples": 480000, + "nb_max_frames": 3000, + "padding_side": "right", + "padding_value": 0.0, + "processor_class": "WhisperProcessor", + "return_attention_mask": false, + "sampling_rate": 16000 +} diff --git a/whisper-tiny-hi-checkpoint-1/trainer_state.json b/whisper-tiny-hi-checkpoint-1/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..7fe5041a6036ad610cb196d381364365bf5b99ff --- /dev/null +++ b/whisper-tiny-hi-checkpoint-1/trainer_state.json @@ -0,0 +1,157 @@ +{ + "best_metric": 69.98899144720129, + "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-120", + "epoch": 6.25, + "eval_steps": 40, + "global_step": 200, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.625, + "grad_norm": 10.95101547241211, + "learning_rate": 9.200000000000002e-06, + "loss": 2.3747, + "step": 20 + }, + { + "epoch": 1.25, + "grad_norm": 7.747081279754639, + "learning_rate": 8.2e-06, + "loss": 1.2169, + "step": 40 + }, + { + "epoch": 1.25, + "eval_loss": 1.0360029935836792, + "eval_runtime": 574.5339, + "eval_samples_per_second": 1.741, + "eval_steps_per_second": 1.741, + "eval_wer": 91.60809552036582, + "step": 40 + }, + { + "epoch": 1.875, + "grad_norm": 7.32460355758667, + "learning_rate": 7.2000000000000005e-06, + "loss": 0.9058, + "step": 60 + }, + { + "epoch": 2.5, + "grad_norm": 6.835532188415527, + "learning_rate": 6.200000000000001e-06, + "loss": 0.7302, + "step": 80 + }, + { + "epoch": 2.5, + "eval_loss": 0.7368654608726501, + "eval_runtime": 549.562, + "eval_samples_per_second": 1.82, + "eval_steps_per_second": 1.82, + "eval_wer": 79.80353967313066, + "step": 80 + }, + { + "epoch": 3.125, + "grad_norm": 6.408384323120117, + "learning_rate": 5.2e-06, + "loss": 0.6453, + "step": 100 + }, + { + "epoch": 3.75, + "grad_norm": 5.809150695800781, + "learning_rate": 4.2000000000000004e-06, + "loss": 0.5917, + "step": 120 + }, + { + "epoch": 3.75, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.8688, + "eval_samples_per_second": 1.822, + "eval_steps_per_second": 1.822, + "eval_wer": 69.98899144720129, + "step": 120 + }, + { + "epoch": 4.375, + "grad_norm": 5.724637508392334, + "learning_rate": 3.2000000000000003e-06, + "loss": 0.5356, + "step": 140 + }, + { + "epoch": 5.0, + "grad_norm": 10.124310493469238, + "learning_rate": 2.2e-06, + "loss": 0.5156, + "step": 160 + }, + { + "epoch": 5.0, + "eval_loss": 0.6157090663909912, + "eval_runtime": 549.7895, + "eval_samples_per_second": 1.819, + "eval_steps_per_second": 1.819, + "eval_wer": 70.4293335591498, + "step": 160 + }, + { + "epoch": 5.625, + "grad_norm": 4.947811126708984, + "learning_rate": 1.2000000000000002e-06, + "loss": 0.4986, + "step": 180 + }, + { + "epoch": 6.25, + "grad_norm": 4.541861057281494, + "learning_rate": 2.0000000000000002e-07, + "loss": 0.481, + "step": 200 + }, + { + "epoch": 6.25, + "eval_loss": 0.6050636768341064, + "eval_runtime": 552.964, + "eval_samples_per_second": 1.808, + "eval_steps_per_second": 1.808, + "eval_wer": 70.03980015242611, + "step": 200 + }, + { + "epoch": 6.25, + "step": 200, + "total_flos": 1.5401574531072e+17, + "train_loss": 0.8495243072509766, + "train_runtime": 3592.94, + "train_samples_per_second": 1.781, + "train_steps_per_second": 0.056 + } + ], + "logging_steps": 20, + "max_steps": 200, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 40, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.5401574531072e+17, + "train_batch_size": 32, + "trial_name": null, + "trial_params": null +} diff --git a/whisper-tiny-hi-checkpoint-1/training_args.bin b/whisper-tiny-hi-checkpoint-1/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..d4e924f371dff0e59e030904c79600ce608fe0cb --- /dev/null +++ b/whisper-tiny-hi-checkpoint-1/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c982fa9327e2e49f4765e9f4a5be54ca2c672121610ce55b8168505a2beb3b7 +size 5240 diff --git a/whisper-tiny-hi-checkpoint-2/config.json b/whisper-tiny-hi-checkpoint-2/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0b6f3b7ccfc50d2fda0d26c7eda2380d84d6bc4e --- /dev/null +++ b/whisper-tiny-hi-checkpoint-2/config.json @@ -0,0 +1,52 @@ +{ + "_name_or_path": "./whisper-tiny-hi2_test/whisper-tiny-hi-checkpoint-1", + "activation_dropout": 0.0, + "activation_function": "gelu", + "apply_spec_augment": false, + "architectures": [ + "WhisperForConditionalGeneration" + ], + "attention_dropout": 0.0, + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "classifier_proj_size": 256, + "d_model": 384, + "decoder_attention_heads": 6, + "decoder_ffn_dim": 1536, + "decoder_layerdrop": 0.0, + "decoder_layers": 4, + "decoder_start_token_id": 50258, + "dropout": 0.0, + "encoder_attention_heads": 6, + "encoder_ffn_dim": 1536, + "encoder_layerdrop": 0.0, + "encoder_layers": 4, + "eos_token_id": 50257, + "forced_decoder_ids": null, + "init_std": 0.02, + "is_encoder_decoder": true, + "mask_feature_length": 10, + "mask_feature_min_masks": 0, + "mask_feature_prob": 0.0, + "mask_time_length": 10, + "mask_time_min_masks": 2, + "mask_time_prob": 0.05, + "max_length": 448, + "max_source_positions": 1500, + "max_target_positions": 448, + "median_filter_width": 7, + "model_type": "whisper", + "num_hidden_layers": 4, + "num_mel_bins": 80, + "pad_token_id": 50257, + "scale_embedding": false, + "suppress_tokens": [], + "torch_dtype": "float32", + "transformers_version": "4.41.1", + "use_cache": true, + "use_weighted_layer_sum": false, + "vocab_size": 51865 +} diff --git a/whisper-tiny-hi-checkpoint-2/generation_config.json b/whisper-tiny-hi-checkpoint-2/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d286bdf1e0677a78ae4dc92903472de5fe668ef --- /dev/null +++ b/whisper-tiny-hi-checkpoint-2/generation_config.json @@ -0,0 +1,248 @@ +{ + "alignment_heads": [ + [ + 2, + 2 + ], + [ + 3, + 0 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ], + [ + 3, + 4 + ], + [ + 3, + 5 + ] + ], + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "decoder_start_token_id": 50258, + "eos_token_id": 50257, + "forced_decoder_ids": [ + [ + 1, + null + ], + [ + 2, + 50359 + ] + ], + "is_multilingual": true, + "lang_to_id": { + "<|af|>": 50327, + "<|am|>": 50334, + "<|ar|>": 50272, + "<|as|>": 50350, + "<|az|>": 50304, + "<|ba|>": 50355, + "<|be|>": 50330, + "<|bg|>": 50292, + "<|bn|>": 50302, + "<|bo|>": 50347, + "<|br|>": 50309, + "<|bs|>": 50315, + "<|ca|>": 50270, + "<|cs|>": 50283, + "<|cy|>": 50297, + "<|da|>": 50285, + "<|de|>": 50261, + "<|el|>": 50281, + "<|en|>": 50259, + "<|es|>": 50262, + "<|et|>": 50307, + "<|eu|>": 50310, + "<|fa|>": 50300, + "<|fi|>": 50277, + "<|fo|>": 50338, + "<|fr|>": 50265, + "<|gl|>": 50319, + "<|gu|>": 50333, + "<|haw|>": 50352, + "<|ha|>": 50354, + "<|he|>": 50279, + "<|hi|>": 50276, + "<|hr|>": 50291, + "<|ht|>": 50339, + "<|hu|>": 50286, + "<|hy|>": 50312, + "<|id|>": 50275, + "<|is|>": 50311, + "<|it|>": 50274, + "<|ja|>": 50266, + "<|jw|>": 50356, + "<|ka|>": 50329, + "<|kk|>": 50316, + "<|km|>": 50323, + "<|kn|>": 50306, + "<|ko|>": 50264, + "<|la|>": 50294, + "<|lb|>": 50345, + "<|ln|>": 50353, + "<|lo|>": 50336, + "<|lt|>": 50293, + "<|lv|>": 50301, + "<|mg|>": 50349, + "<|mi|>": 50295, + "<|mk|>": 50308, + "<|ml|>": 50296, + "<|mn|>": 50314, + "<|mr|>": 50320, + "<|ms|>": 50282, + "<|mt|>": 50343, + "<|my|>": 50346, + "<|ne|>": 50313, + "<|nl|>": 50271, + "<|nn|>": 50342, + "<|no|>": 50288, + "<|oc|>": 50328, + "<|pa|>": 50321, + "<|pl|>": 50269, + "<|ps|>": 50340, + "<|pt|>": 50267, + "<|ro|>": 50284, + "<|ru|>": 50263, + "<|sa|>": 50344, + "<|sd|>": 50332, + "<|si|>": 50322, + "<|sk|>": 50298, + "<|sl|>": 50305, + "<|sn|>": 50324, + "<|so|>": 50326, + "<|sq|>": 50317, + "<|sr|>": 50303, + "<|su|>": 50357, + "<|sv|>": 50273, + "<|sw|>": 50318, + "<|ta|>": 50287, + "<|te|>": 50299, + "<|tg|>": 50331, + "<|th|>": 50289, + "<|tk|>": 50341, + "<|tl|>": 50348, + "<|tr|>": 50268, + "<|tt|>": 50351, + "<|uk|>": 50280, + "<|ur|>": 50290, + "<|uz|>": 50337, + "<|vi|>": 50278, + "<|yi|>": 50335, + "<|yo|>": 50325, + "<|zh|>": 50260 + }, + "max_initial_timestamp_index": 50, + "max_length": 448, + "no_timestamps_token_id": 50363, + "pad_token_id": 50257, + "prev_sot_token_id": 50361, + "return_timestamps": false, + "suppress_tokens": [ + 1, + 2, + 7, + 8, + 9, + 10, + 14, + 25, + 26, + 27, + 28, + 29, + 31, + 58, + 59, + 60, + 61, + 62, + 63, + 90, + 91, + 92, + 93, + 359, + 503, + 522, + 542, + 873, + 893, + 902, + 918, + 922, + 931, + 1350, + 1853, + 1982, + 2460, + 2627, + 3246, + 3253, + 3268, + 3536, + 3846, + 3961, + 4183, + 4667, + 6585, + 6647, + 7273, + 9061, + 9383, + 10428, + 10929, + 11938, + 12033, + 12331, + 12562, + 13793, + 14157, + 14635, + 15265, + 15618, + 16553, + 16604, + 18362, + 18956, + 20075, + 21675, + 22520, + 26130, + 26161, + 26435, + 28279, + 29464, + 31650, + 32302, + 32470, + 36865, + 42863, + 47425, + 49870, + 50254, + 50258, + 50358, + 50359, + 50360, + 50361, + 50362 + ], + "task_to_id": { + "transcribe": 50359, + "translate": 50358 + }, + "transformers_version": "4.41.1" +} diff --git a/whisper-tiny-hi-checkpoint-2/model.safetensors b/whisper-tiny-hi-checkpoint-2/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9aa0b456f8cd8c36c001d1d45bbe4fde21f76cff --- /dev/null +++ b/whisper-tiny-hi-checkpoint-2/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59c8982089b3ffb0f35b2a8b93a329827d3603f741f4d47ddb7a17dc5a7e5e2 +size 151061672 diff --git a/whisper-tiny-hi-checkpoint-2/preprocessor_config.json b/whisper-tiny-hi-checkpoint-2/preprocessor_config.json new file mode 100644 index 0000000000000000000000000000000000000000..91876762a536a746d268353c5cba57286e76b058 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-2/preprocessor_config.json @@ -0,0 +1,14 @@ +{ + "chunk_length": 30, + "feature_extractor_type": "WhisperFeatureExtractor", + "feature_size": 80, + "hop_length": 160, + "n_fft": 400, + "n_samples": 480000, + "nb_max_frames": 3000, + "padding_side": "right", + "padding_value": 0.0, + "processor_class": "WhisperProcessor", + "return_attention_mask": false, + "sampling_rate": 16000 +} diff --git a/whisper-tiny-hi-checkpoint-2/trainer_state.json b/whisper-tiny-hi-checkpoint-2/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..d6f2c356d2cc73904e38090dd414b0c88f54d72e --- /dev/null +++ b/whisper-tiny-hi-checkpoint-2/trainer_state.json @@ -0,0 +1,175 @@ +{ + "best_metric": 69.98899144720129, + "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-120", + "epoch": 6.28125, + "eval_steps": 40, + "global_step": 201, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.625, + "grad_norm": 10.95101547241211, + "learning_rate": 9.200000000000002e-06, + "loss": 2.3747, + "step": 20 + }, + { + "epoch": 1.25, + "grad_norm": 7.747081279754639, + "learning_rate": 8.2e-06, + "loss": 1.2169, + "step": 40 + }, + { + "epoch": 1.25, + "eval_loss": 1.0360029935836792, + "eval_runtime": 574.5339, + "eval_samples_per_second": 1.741, + "eval_steps_per_second": 1.741, + "eval_wer": 91.60809552036582, + "step": 40 + }, + { + "epoch": 1.875, + "grad_norm": 7.32460355758667, + "learning_rate": 7.2000000000000005e-06, + "loss": 0.9058, + "step": 60 + }, + { + "epoch": 2.5, + "grad_norm": 6.835532188415527, + "learning_rate": 6.200000000000001e-06, + "loss": 0.7302, + "step": 80 + }, + { + "epoch": 2.5, + "eval_loss": 0.7368654608726501, + "eval_runtime": 549.562, + "eval_samples_per_second": 1.82, + "eval_steps_per_second": 1.82, + "eval_wer": 79.80353967313066, + "step": 80 + }, + { + "epoch": 3.125, + "grad_norm": 6.408384323120117, + "learning_rate": 5.2e-06, + "loss": 0.6453, + "step": 100 + }, + { + "epoch": 3.75, + "grad_norm": 5.809150695800781, + "learning_rate": 4.2000000000000004e-06, + "loss": 0.5917, + "step": 120 + }, + { + "epoch": 3.75, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.8688, + "eval_samples_per_second": 1.822, + "eval_steps_per_second": 1.822, + "eval_wer": 69.98899144720129, + "step": 120 + }, + { + "epoch": 4.375, + "grad_norm": 5.724637508392334, + "learning_rate": 3.2000000000000003e-06, + "loss": 0.5356, + "step": 140 + }, + { + "epoch": 5.0, + "grad_norm": 10.124310493469238, + "learning_rate": 2.2e-06, + "loss": 0.5156, + "step": 160 + }, + { + "epoch": 5.0, + "eval_loss": 0.6157090663909912, + "eval_runtime": 549.7895, + "eval_samples_per_second": 1.819, + "eval_steps_per_second": 1.819, + "eval_wer": 70.4293335591498, + "step": 160 + }, + { + "epoch": 5.625, + "grad_norm": 4.947811126708984, + "learning_rate": 1.2000000000000002e-06, + "loss": 0.4986, + "step": 180 + }, + { + "epoch": 6.25, + "grad_norm": 4.541861057281494, + "learning_rate": 2.0000000000000002e-07, + "loss": 0.481, + "step": 200 + }, + { + "epoch": 6.25, + "eval_loss": 0.6050636768341064, + "eval_runtime": 552.964, + "eval_samples_per_second": 1.808, + "eval_steps_per_second": 1.808, + "eval_wer": 70.03980015242611, + "step": 200 + }, + { + "epoch": 6.25, + "step": 200, + "total_flos": 1.5401574531072e+17, + "train_loss": 0.8495243072509766, + "train_runtime": 3592.94, + "train_samples_per_second": 1.781, + "train_steps_per_second": 0.056 + }, + { + "epoch": 6.28125, + "step": 201, + "total_flos": 1.5480354963456e+17, + "train_loss": 0.003230639654605543, + "train_runtime": 7.5043, + "train_samples_per_second": 852.844, + "train_steps_per_second": 26.651 + }, + { + "epoch": 6.28125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.5863, + "eval_samples_per_second": 1.823, + "eval_steps_per_second": 1.823, + "eval_wer": 69.98899144720129, + "step": 201 + } + ], + "logging_steps": 20, + "max_steps": 200, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 40, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.5480354963456e+17, + "train_batch_size": 32, + "trial_name": null, + "trial_params": null +} diff --git a/whisper-tiny-hi-checkpoint-2/training_args.bin b/whisper-tiny-hi-checkpoint-2/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..79dccad896a492cac0a90d8135cb645365a40b54 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-2/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57320ccedcf473157fcb44c0152851471c74170811def3aa0279b4a3552d63db +size 5240 diff --git a/whisper-tiny-hi-checkpoint-3/config.json b/whisper-tiny-hi-checkpoint-3/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f19c04d2d9ca39cff0a0934b2819b1dda73f15d3 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-3/config.json @@ -0,0 +1,52 @@ +{ + "_name_or_path": "./whisper-tiny-hi2_test/whisper-tiny-hi-checkpoint-2", + "activation_dropout": 0.0, + "activation_function": "gelu", + "apply_spec_augment": false, + "architectures": [ + "WhisperForConditionalGeneration" + ], + "attention_dropout": 0.0, + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "classifier_proj_size": 256, + "d_model": 384, + "decoder_attention_heads": 6, + "decoder_ffn_dim": 1536, + "decoder_layerdrop": 0.0, + "decoder_layers": 4, + "decoder_start_token_id": 50258, + "dropout": 0.0, + "encoder_attention_heads": 6, + "encoder_ffn_dim": 1536, + "encoder_layerdrop": 0.0, + "encoder_layers": 4, + "eos_token_id": 50257, + "forced_decoder_ids": null, + "init_std": 0.02, + "is_encoder_decoder": true, + "mask_feature_length": 10, + "mask_feature_min_masks": 0, + "mask_feature_prob": 0.0, + "mask_time_length": 10, + "mask_time_min_masks": 2, + "mask_time_prob": 0.05, + "max_length": 448, + "max_source_positions": 1500, + "max_target_positions": 448, + "median_filter_width": 7, + "model_type": "whisper", + "num_hidden_layers": 4, + "num_mel_bins": 80, + "pad_token_id": 50257, + "scale_embedding": false, + "suppress_tokens": [], + "torch_dtype": "float32", + "transformers_version": "4.41.1", + "use_cache": true, + "use_weighted_layer_sum": false, + "vocab_size": 51865 +} diff --git a/whisper-tiny-hi-checkpoint-3/generation_config.json b/whisper-tiny-hi-checkpoint-3/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d286bdf1e0677a78ae4dc92903472de5fe668ef --- /dev/null +++ b/whisper-tiny-hi-checkpoint-3/generation_config.json @@ -0,0 +1,248 @@ +{ + "alignment_heads": [ + [ + 2, + 2 + ], + [ + 3, + 0 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ], + [ + 3, + 4 + ], + [ + 3, + 5 + ] + ], + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "decoder_start_token_id": 50258, + "eos_token_id": 50257, + "forced_decoder_ids": [ + [ + 1, + null + ], + [ + 2, + 50359 + ] + ], + "is_multilingual": true, + "lang_to_id": { + "<|af|>": 50327, + "<|am|>": 50334, + "<|ar|>": 50272, + "<|as|>": 50350, + "<|az|>": 50304, + "<|ba|>": 50355, + "<|be|>": 50330, + "<|bg|>": 50292, + "<|bn|>": 50302, + "<|bo|>": 50347, + "<|br|>": 50309, + "<|bs|>": 50315, + "<|ca|>": 50270, + "<|cs|>": 50283, + "<|cy|>": 50297, + "<|da|>": 50285, + "<|de|>": 50261, + "<|el|>": 50281, + "<|en|>": 50259, + "<|es|>": 50262, + "<|et|>": 50307, + "<|eu|>": 50310, + "<|fa|>": 50300, + "<|fi|>": 50277, + "<|fo|>": 50338, + "<|fr|>": 50265, + "<|gl|>": 50319, + "<|gu|>": 50333, + "<|haw|>": 50352, + "<|ha|>": 50354, + "<|he|>": 50279, + "<|hi|>": 50276, + "<|hr|>": 50291, + "<|ht|>": 50339, + "<|hu|>": 50286, + "<|hy|>": 50312, + "<|id|>": 50275, + "<|is|>": 50311, + "<|it|>": 50274, + "<|ja|>": 50266, + "<|jw|>": 50356, + "<|ka|>": 50329, + "<|kk|>": 50316, + "<|km|>": 50323, + "<|kn|>": 50306, + "<|ko|>": 50264, + "<|la|>": 50294, + "<|lb|>": 50345, + "<|ln|>": 50353, + "<|lo|>": 50336, + "<|lt|>": 50293, + "<|lv|>": 50301, + "<|mg|>": 50349, + "<|mi|>": 50295, + "<|mk|>": 50308, + "<|ml|>": 50296, + "<|mn|>": 50314, + "<|mr|>": 50320, + "<|ms|>": 50282, + "<|mt|>": 50343, + "<|my|>": 50346, + "<|ne|>": 50313, + "<|nl|>": 50271, + "<|nn|>": 50342, + "<|no|>": 50288, + "<|oc|>": 50328, + "<|pa|>": 50321, + "<|pl|>": 50269, + "<|ps|>": 50340, + "<|pt|>": 50267, + "<|ro|>": 50284, + "<|ru|>": 50263, + "<|sa|>": 50344, + "<|sd|>": 50332, + "<|si|>": 50322, + "<|sk|>": 50298, + "<|sl|>": 50305, + "<|sn|>": 50324, + "<|so|>": 50326, + "<|sq|>": 50317, + "<|sr|>": 50303, + "<|su|>": 50357, + "<|sv|>": 50273, + "<|sw|>": 50318, + "<|ta|>": 50287, + "<|te|>": 50299, + "<|tg|>": 50331, + "<|th|>": 50289, + "<|tk|>": 50341, + "<|tl|>": 50348, + "<|tr|>": 50268, + "<|tt|>": 50351, + "<|uk|>": 50280, + "<|ur|>": 50290, + "<|uz|>": 50337, + "<|vi|>": 50278, + "<|yi|>": 50335, + "<|yo|>": 50325, + "<|zh|>": 50260 + }, + "max_initial_timestamp_index": 50, + "max_length": 448, + "no_timestamps_token_id": 50363, + "pad_token_id": 50257, + "prev_sot_token_id": 50361, + "return_timestamps": false, + "suppress_tokens": [ + 1, + 2, + 7, + 8, + 9, + 10, + 14, + 25, + 26, + 27, + 28, + 29, + 31, + 58, + 59, + 60, + 61, + 62, + 63, + 90, + 91, + 92, + 93, + 359, + 503, + 522, + 542, + 873, + 893, + 902, + 918, + 922, + 931, + 1350, + 1853, + 1982, + 2460, + 2627, + 3246, + 3253, + 3268, + 3536, + 3846, + 3961, + 4183, + 4667, + 6585, + 6647, + 7273, + 9061, + 9383, + 10428, + 10929, + 11938, + 12033, + 12331, + 12562, + 13793, + 14157, + 14635, + 15265, + 15618, + 16553, + 16604, + 18362, + 18956, + 20075, + 21675, + 22520, + 26130, + 26161, + 26435, + 28279, + 29464, + 31650, + 32302, + 32470, + 36865, + 42863, + 47425, + 49870, + 50254, + 50258, + 50358, + 50359, + 50360, + 50361, + 50362 + ], + "task_to_id": { + "transcribe": 50359, + "translate": 50358 + }, + "transformers_version": "4.41.1" +} diff --git a/whisper-tiny-hi-checkpoint-3/model.safetensors b/whisper-tiny-hi-checkpoint-3/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9aa0b456f8cd8c36c001d1d45bbe4fde21f76cff --- /dev/null +++ b/whisper-tiny-hi-checkpoint-3/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59c8982089b3ffb0f35b2a8b93a329827d3603f741f4d47ddb7a17dc5a7e5e2 +size 151061672 diff --git a/whisper-tiny-hi-checkpoint-3/preprocessor_config.json b/whisper-tiny-hi-checkpoint-3/preprocessor_config.json new file mode 100644 index 0000000000000000000000000000000000000000..91876762a536a746d268353c5cba57286e76b058 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-3/preprocessor_config.json @@ -0,0 +1,14 @@ +{ + "chunk_length": 30, + "feature_extractor_type": "WhisperFeatureExtractor", + "feature_size": 80, + "hop_length": 160, + "n_fft": 400, + "n_samples": 480000, + "nb_max_frames": 3000, + "padding_side": "right", + "padding_value": 0.0, + "processor_class": "WhisperProcessor", + "return_attention_mask": false, + "sampling_rate": 16000 +} diff --git a/whisper-tiny-hi-checkpoint-3/trainer_state.json b/whisper-tiny-hi-checkpoint-3/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..2767db7d4500c25893550df3b22ebba11ed4593c --- /dev/null +++ b/whisper-tiny-hi-checkpoint-3/trainer_state.json @@ -0,0 +1,193 @@ +{ + "best_metric": 69.98899144720129, + "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-120", + "epoch": 6.3125, + "eval_steps": 40, + "global_step": 202, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.625, + "grad_norm": 10.95101547241211, + "learning_rate": 9.200000000000002e-06, + "loss": 2.3747, + "step": 20 + }, + { + "epoch": 1.25, + "grad_norm": 7.747081279754639, + "learning_rate": 8.2e-06, + "loss": 1.2169, + "step": 40 + }, + { + "epoch": 1.25, + "eval_loss": 1.0360029935836792, + "eval_runtime": 574.5339, + "eval_samples_per_second": 1.741, + "eval_steps_per_second": 1.741, + "eval_wer": 91.60809552036582, + "step": 40 + }, + { + "epoch": 1.875, + "grad_norm": 7.32460355758667, + "learning_rate": 7.2000000000000005e-06, + "loss": 0.9058, + "step": 60 + }, + { + "epoch": 2.5, + "grad_norm": 6.835532188415527, + "learning_rate": 6.200000000000001e-06, + "loss": 0.7302, + "step": 80 + }, + { + "epoch": 2.5, + "eval_loss": 0.7368654608726501, + "eval_runtime": 549.562, + "eval_samples_per_second": 1.82, + "eval_steps_per_second": 1.82, + "eval_wer": 79.80353967313066, + "step": 80 + }, + { + "epoch": 3.125, + "grad_norm": 6.408384323120117, + "learning_rate": 5.2e-06, + "loss": 0.6453, + "step": 100 + }, + { + "epoch": 3.75, + "grad_norm": 5.809150695800781, + "learning_rate": 4.2000000000000004e-06, + "loss": 0.5917, + "step": 120 + }, + { + "epoch": 3.75, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.8688, + "eval_samples_per_second": 1.822, + "eval_steps_per_second": 1.822, + "eval_wer": 69.98899144720129, + "step": 120 + }, + { + "epoch": 4.375, + "grad_norm": 5.724637508392334, + "learning_rate": 3.2000000000000003e-06, + "loss": 0.5356, + "step": 140 + }, + { + "epoch": 5.0, + "grad_norm": 10.124310493469238, + "learning_rate": 2.2e-06, + "loss": 0.5156, + "step": 160 + }, + { + "epoch": 5.0, + "eval_loss": 0.6157090663909912, + "eval_runtime": 549.7895, + "eval_samples_per_second": 1.819, + "eval_steps_per_second": 1.819, + "eval_wer": 70.4293335591498, + "step": 160 + }, + { + "epoch": 5.625, + "grad_norm": 4.947811126708984, + "learning_rate": 1.2000000000000002e-06, + "loss": 0.4986, + "step": 180 + }, + { + "epoch": 6.25, + "grad_norm": 4.541861057281494, + "learning_rate": 2.0000000000000002e-07, + "loss": 0.481, + "step": 200 + }, + { + "epoch": 6.25, + "eval_loss": 0.6050636768341064, + "eval_runtime": 552.964, + "eval_samples_per_second": 1.808, + "eval_steps_per_second": 1.808, + "eval_wer": 70.03980015242611, + "step": 200 + }, + { + "epoch": 6.25, + "step": 200, + "total_flos": 1.5401574531072e+17, + "train_loss": 0.8495243072509766, + "train_runtime": 3592.94, + "train_samples_per_second": 1.781, + "train_steps_per_second": 0.056 + }, + { + "epoch": 6.28125, + "step": 201, + "total_flos": 1.5480354963456e+17, + "train_loss": 0.003230639654605543, + "train_runtime": 7.5043, + "train_samples_per_second": 852.844, + "train_steps_per_second": 26.651 + }, + { + "epoch": 6.28125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.5863, + "eval_samples_per_second": 1.823, + "eval_steps_per_second": 1.823, + "eval_wer": 69.98899144720129, + "step": 201 + }, + { + "epoch": 6.3125, + "step": 202, + "total_flos": 1.555913539584e+17, + "train_loss": 0.0035205459830784562, + "train_runtime": 7.6486, + "train_samples_per_second": 836.753, + "train_steps_per_second": 26.149 + }, + { + "epoch": 6.3125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.2984, + "eval_samples_per_second": 1.824, + "eval_steps_per_second": 1.824, + "eval_wer": 69.98899144720129, + "step": 202 + } + ], + "logging_steps": 20, + "max_steps": 200, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 40, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.555913539584e+17, + "train_batch_size": 32, + "trial_name": null, + "trial_params": null +} diff --git a/whisper-tiny-hi-checkpoint-3/training_args.bin b/whisper-tiny-hi-checkpoint-3/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..c79dca10b379641400bb3b61b6e8ce70b7bf6ca6 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-3/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf420e0b38b82d46a55cd7ad07aeb13abc779974b6f703a2306e4deb9f513f5b +size 5240 diff --git a/whisper-tiny-hi-checkpoint-4/config.json b/whisper-tiny-hi-checkpoint-4/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9ef91e69ab8ff496e65da2f791380cd26a1cf2e2 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-4/config.json @@ -0,0 +1,52 @@ +{ + "_name_or_path": "./whisper-tiny-hi2_test/whisper-tiny-hi-checkpoint-3", + "activation_dropout": 0.0, + "activation_function": "gelu", + "apply_spec_augment": false, + "architectures": [ + "WhisperForConditionalGeneration" + ], + "attention_dropout": 0.0, + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "classifier_proj_size": 256, + "d_model": 384, + "decoder_attention_heads": 6, + "decoder_ffn_dim": 1536, + "decoder_layerdrop": 0.0, + "decoder_layers": 4, + "decoder_start_token_id": 50258, + "dropout": 0.0, + "encoder_attention_heads": 6, + "encoder_ffn_dim": 1536, + "encoder_layerdrop": 0.0, + "encoder_layers": 4, + "eos_token_id": 50257, + "forced_decoder_ids": null, + "init_std": 0.02, + "is_encoder_decoder": true, + "mask_feature_length": 10, + "mask_feature_min_masks": 0, + "mask_feature_prob": 0.0, + "mask_time_length": 10, + "mask_time_min_masks": 2, + "mask_time_prob": 0.05, + "max_length": 448, + "max_source_positions": 1500, + "max_target_positions": 448, + "median_filter_width": 7, + "model_type": "whisper", + "num_hidden_layers": 4, + "num_mel_bins": 80, + "pad_token_id": 50257, + "scale_embedding": false, + "suppress_tokens": [], + "torch_dtype": "float32", + "transformers_version": "4.41.1", + "use_cache": true, + "use_weighted_layer_sum": false, + "vocab_size": 51865 +} diff --git a/whisper-tiny-hi-checkpoint-4/generation_config.json b/whisper-tiny-hi-checkpoint-4/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d286bdf1e0677a78ae4dc92903472de5fe668ef --- /dev/null +++ b/whisper-tiny-hi-checkpoint-4/generation_config.json @@ -0,0 +1,248 @@ +{ + "alignment_heads": [ + [ + 2, + 2 + ], + [ + 3, + 0 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ], + [ + 3, + 4 + ], + [ + 3, + 5 + ] + ], + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "decoder_start_token_id": 50258, + "eos_token_id": 50257, + "forced_decoder_ids": [ + [ + 1, + null + ], + [ + 2, + 50359 + ] + ], + "is_multilingual": true, + "lang_to_id": { + "<|af|>": 50327, + "<|am|>": 50334, + "<|ar|>": 50272, + "<|as|>": 50350, + "<|az|>": 50304, + "<|ba|>": 50355, + "<|be|>": 50330, + "<|bg|>": 50292, + "<|bn|>": 50302, + "<|bo|>": 50347, + "<|br|>": 50309, + "<|bs|>": 50315, + "<|ca|>": 50270, + "<|cs|>": 50283, + "<|cy|>": 50297, + "<|da|>": 50285, + "<|de|>": 50261, + "<|el|>": 50281, + "<|en|>": 50259, + "<|es|>": 50262, + "<|et|>": 50307, + "<|eu|>": 50310, + "<|fa|>": 50300, + "<|fi|>": 50277, + "<|fo|>": 50338, + "<|fr|>": 50265, + "<|gl|>": 50319, + "<|gu|>": 50333, + "<|haw|>": 50352, + "<|ha|>": 50354, + "<|he|>": 50279, + "<|hi|>": 50276, + "<|hr|>": 50291, + "<|ht|>": 50339, + "<|hu|>": 50286, + "<|hy|>": 50312, + "<|id|>": 50275, + "<|is|>": 50311, + "<|it|>": 50274, + "<|ja|>": 50266, + "<|jw|>": 50356, + "<|ka|>": 50329, + "<|kk|>": 50316, + "<|km|>": 50323, + "<|kn|>": 50306, + "<|ko|>": 50264, + "<|la|>": 50294, + "<|lb|>": 50345, + "<|ln|>": 50353, + "<|lo|>": 50336, + "<|lt|>": 50293, + "<|lv|>": 50301, + "<|mg|>": 50349, + "<|mi|>": 50295, + "<|mk|>": 50308, + "<|ml|>": 50296, + "<|mn|>": 50314, + "<|mr|>": 50320, + "<|ms|>": 50282, + "<|mt|>": 50343, + "<|my|>": 50346, + "<|ne|>": 50313, + "<|nl|>": 50271, + "<|nn|>": 50342, + "<|no|>": 50288, + "<|oc|>": 50328, + "<|pa|>": 50321, + "<|pl|>": 50269, + "<|ps|>": 50340, + "<|pt|>": 50267, + "<|ro|>": 50284, + "<|ru|>": 50263, + "<|sa|>": 50344, + "<|sd|>": 50332, + "<|si|>": 50322, + "<|sk|>": 50298, + "<|sl|>": 50305, + "<|sn|>": 50324, + "<|so|>": 50326, + "<|sq|>": 50317, + "<|sr|>": 50303, + "<|su|>": 50357, + "<|sv|>": 50273, + "<|sw|>": 50318, + "<|ta|>": 50287, + "<|te|>": 50299, + "<|tg|>": 50331, + "<|th|>": 50289, + "<|tk|>": 50341, + "<|tl|>": 50348, + "<|tr|>": 50268, + "<|tt|>": 50351, + "<|uk|>": 50280, + "<|ur|>": 50290, + "<|uz|>": 50337, + "<|vi|>": 50278, + "<|yi|>": 50335, + "<|yo|>": 50325, + "<|zh|>": 50260 + }, + "max_initial_timestamp_index": 50, + "max_length": 448, + "no_timestamps_token_id": 50363, + "pad_token_id": 50257, + "prev_sot_token_id": 50361, + "return_timestamps": false, + "suppress_tokens": [ + 1, + 2, + 7, + 8, + 9, + 10, + 14, + 25, + 26, + 27, + 28, + 29, + 31, + 58, + 59, + 60, + 61, + 62, + 63, + 90, + 91, + 92, + 93, + 359, + 503, + 522, + 542, + 873, + 893, + 902, + 918, + 922, + 931, + 1350, + 1853, + 1982, + 2460, + 2627, + 3246, + 3253, + 3268, + 3536, + 3846, + 3961, + 4183, + 4667, + 6585, + 6647, + 7273, + 9061, + 9383, + 10428, + 10929, + 11938, + 12033, + 12331, + 12562, + 13793, + 14157, + 14635, + 15265, + 15618, + 16553, + 16604, + 18362, + 18956, + 20075, + 21675, + 22520, + 26130, + 26161, + 26435, + 28279, + 29464, + 31650, + 32302, + 32470, + 36865, + 42863, + 47425, + 49870, + 50254, + 50258, + 50358, + 50359, + 50360, + 50361, + 50362 + ], + "task_to_id": { + "transcribe": 50359, + "translate": 50358 + }, + "transformers_version": "4.41.1" +} diff --git a/whisper-tiny-hi-checkpoint-4/model.safetensors b/whisper-tiny-hi-checkpoint-4/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9aa0b456f8cd8c36c001d1d45bbe4fde21f76cff --- /dev/null +++ b/whisper-tiny-hi-checkpoint-4/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59c8982089b3ffb0f35b2a8b93a329827d3603f741f4d47ddb7a17dc5a7e5e2 +size 151061672 diff --git a/whisper-tiny-hi-checkpoint-4/preprocessor_config.json b/whisper-tiny-hi-checkpoint-4/preprocessor_config.json new file mode 100644 index 0000000000000000000000000000000000000000..91876762a536a746d268353c5cba57286e76b058 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-4/preprocessor_config.json @@ -0,0 +1,14 @@ +{ + "chunk_length": 30, + "feature_extractor_type": "WhisperFeatureExtractor", + "feature_size": 80, + "hop_length": 160, + "n_fft": 400, + "n_samples": 480000, + "nb_max_frames": 3000, + "padding_side": "right", + "padding_value": 0.0, + "processor_class": "WhisperProcessor", + "return_attention_mask": false, + "sampling_rate": 16000 +} diff --git a/whisper-tiny-hi-checkpoint-4/trainer_state.json b/whisper-tiny-hi-checkpoint-4/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..884b086e71e08bdd8eea3fea58003924428ec4f6 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-4/trainer_state.json @@ -0,0 +1,211 @@ +{ + "best_metric": 69.98899144720129, + "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-120", + "epoch": 6.34375, + "eval_steps": 40, + "global_step": 203, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.625, + "grad_norm": 10.95101547241211, + "learning_rate": 9.200000000000002e-06, + "loss": 2.3747, + "step": 20 + }, + { + "epoch": 1.25, + "grad_norm": 7.747081279754639, + "learning_rate": 8.2e-06, + "loss": 1.2169, + "step": 40 + }, + { + "epoch": 1.25, + "eval_loss": 1.0360029935836792, + "eval_runtime": 574.5339, + "eval_samples_per_second": 1.741, + "eval_steps_per_second": 1.741, + "eval_wer": 91.60809552036582, + "step": 40 + }, + { + "epoch": 1.875, + "grad_norm": 7.32460355758667, + "learning_rate": 7.2000000000000005e-06, + "loss": 0.9058, + "step": 60 + }, + { + "epoch": 2.5, + "grad_norm": 6.835532188415527, + "learning_rate": 6.200000000000001e-06, + "loss": 0.7302, + "step": 80 + }, + { + "epoch": 2.5, + "eval_loss": 0.7368654608726501, + "eval_runtime": 549.562, + "eval_samples_per_second": 1.82, + "eval_steps_per_second": 1.82, + "eval_wer": 79.80353967313066, + "step": 80 + }, + { + "epoch": 3.125, + "grad_norm": 6.408384323120117, + "learning_rate": 5.2e-06, + "loss": 0.6453, + "step": 100 + }, + { + "epoch": 3.75, + "grad_norm": 5.809150695800781, + "learning_rate": 4.2000000000000004e-06, + "loss": 0.5917, + "step": 120 + }, + { + "epoch": 3.75, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.8688, + "eval_samples_per_second": 1.822, + "eval_steps_per_second": 1.822, + "eval_wer": 69.98899144720129, + "step": 120 + }, + { + "epoch": 4.375, + "grad_norm": 5.724637508392334, + "learning_rate": 3.2000000000000003e-06, + "loss": 0.5356, + "step": 140 + }, + { + "epoch": 5.0, + "grad_norm": 10.124310493469238, + "learning_rate": 2.2e-06, + "loss": 0.5156, + "step": 160 + }, + { + "epoch": 5.0, + "eval_loss": 0.6157090663909912, + "eval_runtime": 549.7895, + "eval_samples_per_second": 1.819, + "eval_steps_per_second": 1.819, + "eval_wer": 70.4293335591498, + "step": 160 + }, + { + "epoch": 5.625, + "grad_norm": 4.947811126708984, + "learning_rate": 1.2000000000000002e-06, + "loss": 0.4986, + "step": 180 + }, + { + "epoch": 6.25, + "grad_norm": 4.541861057281494, + "learning_rate": 2.0000000000000002e-07, + "loss": 0.481, + "step": 200 + }, + { + "epoch": 6.25, + "eval_loss": 0.6050636768341064, + "eval_runtime": 552.964, + "eval_samples_per_second": 1.808, + "eval_steps_per_second": 1.808, + "eval_wer": 70.03980015242611, + "step": 200 + }, + { + "epoch": 6.25, + "step": 200, + "total_flos": 1.5401574531072e+17, + "train_loss": 0.8495243072509766, + "train_runtime": 3592.94, + "train_samples_per_second": 1.781, + "train_steps_per_second": 0.056 + }, + { + "epoch": 6.28125, + "step": 201, + "total_flos": 1.5480354963456e+17, + "train_loss": 0.003230639654605543, + "train_runtime": 7.5043, + "train_samples_per_second": 852.844, + "train_steps_per_second": 26.651 + }, + { + "epoch": 6.28125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.5863, + "eval_samples_per_second": 1.823, + "eval_steps_per_second": 1.823, + "eval_wer": 69.98899144720129, + "step": 201 + }, + { + "epoch": 6.3125, + "step": 202, + "total_flos": 1.555913539584e+17, + "train_loss": 0.0035205459830784562, + "train_runtime": 7.6486, + "train_samples_per_second": 836.753, + "train_steps_per_second": 26.149 + }, + { + "epoch": 6.3125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.2984, + "eval_samples_per_second": 1.824, + "eval_steps_per_second": 1.824, + "eval_wer": 69.98899144720129, + "step": 202 + }, + { + "epoch": 6.34375, + "step": 203, + "total_flos": 1.5637915828224e+17, + "train_loss": 0.002875891812329222, + "train_runtime": 7.5227, + "train_samples_per_second": 850.756, + "train_steps_per_second": 26.586 + }, + { + "epoch": 6.34375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 547.5722, + "eval_samples_per_second": 1.826, + "eval_steps_per_second": 1.826, + "eval_wer": 69.98899144720129, + "step": 203 + } + ], + "logging_steps": 20, + "max_steps": 200, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 40, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.5637915828224e+17, + "train_batch_size": 32, + "trial_name": null, + "trial_params": null +} diff --git a/whisper-tiny-hi-checkpoint-4/training_args.bin b/whisper-tiny-hi-checkpoint-4/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e19ef782e7aa3518e0efc787f2c5da6532709095 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-4/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fde3b061801e57ac6347876e7eec0136a5fe65654b71efe0a4f717dc40704c04 +size 5240 diff --git a/whisper-tiny-hi-checkpoint-5/config.json b/whisper-tiny-hi-checkpoint-5/config.json new file mode 100644 index 0000000000000000000000000000000000000000..01d7571d8c324f142b561ae5830277f03ae7bdf9 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-5/config.json @@ -0,0 +1,52 @@ +{ + "_name_or_path": "./whisper-tiny-hi2_test/whisper-tiny-hi-checkpoint-4", + "activation_dropout": 0.0, + "activation_function": "gelu", + "apply_spec_augment": false, + "architectures": [ + "WhisperForConditionalGeneration" + ], + "attention_dropout": 0.0, + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "classifier_proj_size": 256, + "d_model": 384, + "decoder_attention_heads": 6, + "decoder_ffn_dim": 1536, + "decoder_layerdrop": 0.0, + "decoder_layers": 4, + "decoder_start_token_id": 50258, + "dropout": 0.0, + "encoder_attention_heads": 6, + "encoder_ffn_dim": 1536, + "encoder_layerdrop": 0.0, + "encoder_layers": 4, + "eos_token_id": 50257, + "forced_decoder_ids": null, + "init_std": 0.02, + "is_encoder_decoder": true, + "mask_feature_length": 10, + "mask_feature_min_masks": 0, + "mask_feature_prob": 0.0, + "mask_time_length": 10, + "mask_time_min_masks": 2, + "mask_time_prob": 0.05, + "max_length": 448, + "max_source_positions": 1500, + "max_target_positions": 448, + "median_filter_width": 7, + "model_type": "whisper", + "num_hidden_layers": 4, + "num_mel_bins": 80, + "pad_token_id": 50257, + "scale_embedding": false, + "suppress_tokens": [], + "torch_dtype": "float32", + "transformers_version": "4.41.1", + "use_cache": true, + "use_weighted_layer_sum": false, + "vocab_size": 51865 +} diff --git a/whisper-tiny-hi-checkpoint-5/generation_config.json b/whisper-tiny-hi-checkpoint-5/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d286bdf1e0677a78ae4dc92903472de5fe668ef --- /dev/null +++ b/whisper-tiny-hi-checkpoint-5/generation_config.json @@ -0,0 +1,248 @@ +{ + "alignment_heads": [ + [ + 2, + 2 + ], + [ + 3, + 0 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ], + [ + 3, + 4 + ], + [ + 3, + 5 + ] + ], + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "decoder_start_token_id": 50258, + "eos_token_id": 50257, + "forced_decoder_ids": [ + [ + 1, + null + ], + [ + 2, + 50359 + ] + ], + "is_multilingual": true, + "lang_to_id": { + "<|af|>": 50327, + "<|am|>": 50334, + "<|ar|>": 50272, + "<|as|>": 50350, + "<|az|>": 50304, + "<|ba|>": 50355, + "<|be|>": 50330, + "<|bg|>": 50292, + "<|bn|>": 50302, + "<|bo|>": 50347, + "<|br|>": 50309, + "<|bs|>": 50315, + "<|ca|>": 50270, + "<|cs|>": 50283, + "<|cy|>": 50297, + "<|da|>": 50285, + "<|de|>": 50261, + "<|el|>": 50281, + "<|en|>": 50259, + "<|es|>": 50262, + "<|et|>": 50307, + "<|eu|>": 50310, + "<|fa|>": 50300, + "<|fi|>": 50277, + "<|fo|>": 50338, + "<|fr|>": 50265, + "<|gl|>": 50319, + "<|gu|>": 50333, + "<|haw|>": 50352, + "<|ha|>": 50354, + "<|he|>": 50279, + "<|hi|>": 50276, + "<|hr|>": 50291, + "<|ht|>": 50339, + "<|hu|>": 50286, + "<|hy|>": 50312, + "<|id|>": 50275, + "<|is|>": 50311, + "<|it|>": 50274, + "<|ja|>": 50266, + "<|jw|>": 50356, + "<|ka|>": 50329, + "<|kk|>": 50316, + "<|km|>": 50323, + "<|kn|>": 50306, + "<|ko|>": 50264, + "<|la|>": 50294, + "<|lb|>": 50345, + "<|ln|>": 50353, + "<|lo|>": 50336, + "<|lt|>": 50293, + "<|lv|>": 50301, + "<|mg|>": 50349, + "<|mi|>": 50295, + "<|mk|>": 50308, + "<|ml|>": 50296, + "<|mn|>": 50314, + "<|mr|>": 50320, + "<|ms|>": 50282, + "<|mt|>": 50343, + "<|my|>": 50346, + "<|ne|>": 50313, + "<|nl|>": 50271, + "<|nn|>": 50342, + "<|no|>": 50288, + "<|oc|>": 50328, + "<|pa|>": 50321, + "<|pl|>": 50269, + "<|ps|>": 50340, + "<|pt|>": 50267, + "<|ro|>": 50284, + "<|ru|>": 50263, + "<|sa|>": 50344, + "<|sd|>": 50332, + "<|si|>": 50322, + "<|sk|>": 50298, + "<|sl|>": 50305, + "<|sn|>": 50324, + "<|so|>": 50326, + "<|sq|>": 50317, + "<|sr|>": 50303, + "<|su|>": 50357, + "<|sv|>": 50273, + "<|sw|>": 50318, + "<|ta|>": 50287, + "<|te|>": 50299, + "<|tg|>": 50331, + "<|th|>": 50289, + "<|tk|>": 50341, + "<|tl|>": 50348, + "<|tr|>": 50268, + "<|tt|>": 50351, + "<|uk|>": 50280, + "<|ur|>": 50290, + "<|uz|>": 50337, + "<|vi|>": 50278, + "<|yi|>": 50335, + "<|yo|>": 50325, + "<|zh|>": 50260 + }, + "max_initial_timestamp_index": 50, + "max_length": 448, + "no_timestamps_token_id": 50363, + "pad_token_id": 50257, + "prev_sot_token_id": 50361, + "return_timestamps": false, + "suppress_tokens": [ + 1, + 2, + 7, + 8, + 9, + 10, + 14, + 25, + 26, + 27, + 28, + 29, + 31, + 58, + 59, + 60, + 61, + 62, + 63, + 90, + 91, + 92, + 93, + 359, + 503, + 522, + 542, + 873, + 893, + 902, + 918, + 922, + 931, + 1350, + 1853, + 1982, + 2460, + 2627, + 3246, + 3253, + 3268, + 3536, + 3846, + 3961, + 4183, + 4667, + 6585, + 6647, + 7273, + 9061, + 9383, + 10428, + 10929, + 11938, + 12033, + 12331, + 12562, + 13793, + 14157, + 14635, + 15265, + 15618, + 16553, + 16604, + 18362, + 18956, + 20075, + 21675, + 22520, + 26130, + 26161, + 26435, + 28279, + 29464, + 31650, + 32302, + 32470, + 36865, + 42863, + 47425, + 49870, + 50254, + 50258, + 50358, + 50359, + 50360, + 50361, + 50362 + ], + "task_to_id": { + "transcribe": 50359, + "translate": 50358 + }, + "transformers_version": "4.41.1" +} diff --git a/whisper-tiny-hi-checkpoint-5/model.safetensors b/whisper-tiny-hi-checkpoint-5/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9aa0b456f8cd8c36c001d1d45bbe4fde21f76cff --- /dev/null +++ b/whisper-tiny-hi-checkpoint-5/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59c8982089b3ffb0f35b2a8b93a329827d3603f741f4d47ddb7a17dc5a7e5e2 +size 151061672 diff --git a/whisper-tiny-hi-checkpoint-5/preprocessor_config.json b/whisper-tiny-hi-checkpoint-5/preprocessor_config.json new file mode 100644 index 0000000000000000000000000000000000000000..91876762a536a746d268353c5cba57286e76b058 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-5/preprocessor_config.json @@ -0,0 +1,14 @@ +{ + "chunk_length": 30, + "feature_extractor_type": "WhisperFeatureExtractor", + "feature_size": 80, + "hop_length": 160, + "n_fft": 400, + "n_samples": 480000, + "nb_max_frames": 3000, + "padding_side": "right", + "padding_value": 0.0, + "processor_class": "WhisperProcessor", + "return_attention_mask": false, + "sampling_rate": 16000 +} diff --git a/whisper-tiny-hi-checkpoint-5/trainer_state.json b/whisper-tiny-hi-checkpoint-5/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..c184ceb4f6ec5dbf42dc54bff4a4a6c1701b7612 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-5/trainer_state.json @@ -0,0 +1,229 @@ +{ + "best_metric": 69.98899144720129, + "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-120", + "epoch": 6.375, + "eval_steps": 40, + "global_step": 204, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.625, + "grad_norm": 10.95101547241211, + "learning_rate": 9.200000000000002e-06, + "loss": 2.3747, + "step": 20 + }, + { + "epoch": 1.25, + "grad_norm": 7.747081279754639, + "learning_rate": 8.2e-06, + "loss": 1.2169, + "step": 40 + }, + { + "epoch": 1.25, + "eval_loss": 1.0360029935836792, + "eval_runtime": 574.5339, + "eval_samples_per_second": 1.741, + "eval_steps_per_second": 1.741, + "eval_wer": 91.60809552036582, + "step": 40 + }, + { + "epoch": 1.875, + "grad_norm": 7.32460355758667, + "learning_rate": 7.2000000000000005e-06, + "loss": 0.9058, + "step": 60 + }, + { + "epoch": 2.5, + "grad_norm": 6.835532188415527, + "learning_rate": 6.200000000000001e-06, + "loss": 0.7302, + "step": 80 + }, + { + "epoch": 2.5, + "eval_loss": 0.7368654608726501, + "eval_runtime": 549.562, + "eval_samples_per_second": 1.82, + "eval_steps_per_second": 1.82, + "eval_wer": 79.80353967313066, + "step": 80 + }, + { + "epoch": 3.125, + "grad_norm": 6.408384323120117, + "learning_rate": 5.2e-06, + "loss": 0.6453, + "step": 100 + }, + { + "epoch": 3.75, + "grad_norm": 5.809150695800781, + "learning_rate": 4.2000000000000004e-06, + "loss": 0.5917, + "step": 120 + }, + { + "epoch": 3.75, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.8688, + "eval_samples_per_second": 1.822, + "eval_steps_per_second": 1.822, + "eval_wer": 69.98899144720129, + "step": 120 + }, + { + "epoch": 4.375, + "grad_norm": 5.724637508392334, + "learning_rate": 3.2000000000000003e-06, + "loss": 0.5356, + "step": 140 + }, + { + "epoch": 5.0, + "grad_norm": 10.124310493469238, + "learning_rate": 2.2e-06, + "loss": 0.5156, + "step": 160 + }, + { + "epoch": 5.0, + "eval_loss": 0.6157090663909912, + "eval_runtime": 549.7895, + "eval_samples_per_second": 1.819, + "eval_steps_per_second": 1.819, + "eval_wer": 70.4293335591498, + "step": 160 + }, + { + "epoch": 5.625, + "grad_norm": 4.947811126708984, + "learning_rate": 1.2000000000000002e-06, + "loss": 0.4986, + "step": 180 + }, + { + "epoch": 6.25, + "grad_norm": 4.541861057281494, + "learning_rate": 2.0000000000000002e-07, + "loss": 0.481, + "step": 200 + }, + { + "epoch": 6.25, + "eval_loss": 0.6050636768341064, + "eval_runtime": 552.964, + "eval_samples_per_second": 1.808, + "eval_steps_per_second": 1.808, + "eval_wer": 70.03980015242611, + "step": 200 + }, + { + "epoch": 6.25, + "step": 200, + "total_flos": 1.5401574531072e+17, + "train_loss": 0.8495243072509766, + "train_runtime": 3592.94, + "train_samples_per_second": 1.781, + "train_steps_per_second": 0.056 + }, + { + "epoch": 6.28125, + "step": 201, + "total_flos": 1.5480354963456e+17, + "train_loss": 0.003230639654605543, + "train_runtime": 7.5043, + "train_samples_per_second": 852.844, + "train_steps_per_second": 26.651 + }, + { + "epoch": 6.28125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.5863, + "eval_samples_per_second": 1.823, + "eval_steps_per_second": 1.823, + "eval_wer": 69.98899144720129, + "step": 201 + }, + { + "epoch": 6.3125, + "step": 202, + "total_flos": 1.555913539584e+17, + "train_loss": 0.0035205459830784562, + "train_runtime": 7.6486, + "train_samples_per_second": 836.753, + "train_steps_per_second": 26.149 + }, + { + "epoch": 6.3125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.2984, + "eval_samples_per_second": 1.824, + "eval_steps_per_second": 1.824, + "eval_wer": 69.98899144720129, + "step": 202 + }, + { + "epoch": 6.34375, + "step": 203, + "total_flos": 1.5637915828224e+17, + "train_loss": 0.002875891812329222, + "train_runtime": 7.5227, + "train_samples_per_second": 850.756, + "train_steps_per_second": 26.586 + }, + { + "epoch": 6.34375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 547.5722, + "eval_samples_per_second": 1.826, + "eval_steps_per_second": 1.826, + "eval_wer": 69.98899144720129, + "step": 203 + }, + { + "epoch": 6.375, + "step": 204, + "total_flos": 1.5716696260608e+17, + "train_loss": 0.003042735305486941, + "train_runtime": 7.3464, + "train_samples_per_second": 871.18, + "train_steps_per_second": 27.224 + }, + { + "epoch": 6.375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 547.015, + "eval_samples_per_second": 1.828, + "eval_steps_per_second": 1.828, + "eval_wer": 69.98899144720129, + "step": 204 + } + ], + "logging_steps": 20, + "max_steps": 200, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 40, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.5716696260608e+17, + "train_batch_size": 32, + "trial_name": null, + "trial_params": null +} diff --git a/whisper-tiny-hi-checkpoint-5/training_args.bin b/whisper-tiny-hi-checkpoint-5/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b558c878b292ae7a28401ea13fe7d6d415f2ff74 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-5/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa5e527ce8bfb8fc127d02e63369a0c87d27cf046d5c9db273f93e3ab605fc0c +size 5240 diff --git a/whisper-tiny-hi-checkpoint-6/config.json b/whisper-tiny-hi-checkpoint-6/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9a1d4d121c9f711018edbb00f0a24212b89a3467 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-6/config.json @@ -0,0 +1,52 @@ +{ + "_name_or_path": "./whisper-tiny-hi2_test/whisper-tiny-hi-checkpoint-5", + "activation_dropout": 0.0, + "activation_function": "gelu", + "apply_spec_augment": false, + "architectures": [ + "WhisperForConditionalGeneration" + ], + "attention_dropout": 0.0, + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "classifier_proj_size": 256, + "d_model": 384, + "decoder_attention_heads": 6, + "decoder_ffn_dim": 1536, + "decoder_layerdrop": 0.0, + "decoder_layers": 4, + "decoder_start_token_id": 50258, + "dropout": 0.0, + "encoder_attention_heads": 6, + "encoder_ffn_dim": 1536, + "encoder_layerdrop": 0.0, + "encoder_layers": 4, + "eos_token_id": 50257, + "forced_decoder_ids": null, + "init_std": 0.02, + "is_encoder_decoder": true, + "mask_feature_length": 10, + "mask_feature_min_masks": 0, + "mask_feature_prob": 0.0, + "mask_time_length": 10, + "mask_time_min_masks": 2, + "mask_time_prob": 0.05, + "max_length": 448, + "max_source_positions": 1500, + "max_target_positions": 448, + "median_filter_width": 7, + "model_type": "whisper", + "num_hidden_layers": 4, + "num_mel_bins": 80, + "pad_token_id": 50257, + "scale_embedding": false, + "suppress_tokens": [], + "torch_dtype": "float32", + "transformers_version": "4.41.1", + "use_cache": true, + "use_weighted_layer_sum": false, + "vocab_size": 51865 +} diff --git a/whisper-tiny-hi-checkpoint-6/generation_config.json b/whisper-tiny-hi-checkpoint-6/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d286bdf1e0677a78ae4dc92903472de5fe668ef --- /dev/null +++ b/whisper-tiny-hi-checkpoint-6/generation_config.json @@ -0,0 +1,248 @@ +{ + "alignment_heads": [ + [ + 2, + 2 + ], + [ + 3, + 0 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ], + [ + 3, + 4 + ], + [ + 3, + 5 + ] + ], + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "decoder_start_token_id": 50258, + "eos_token_id": 50257, + "forced_decoder_ids": [ + [ + 1, + null + ], + [ + 2, + 50359 + ] + ], + "is_multilingual": true, + "lang_to_id": { + "<|af|>": 50327, + "<|am|>": 50334, + "<|ar|>": 50272, + "<|as|>": 50350, + "<|az|>": 50304, + "<|ba|>": 50355, + "<|be|>": 50330, + "<|bg|>": 50292, + "<|bn|>": 50302, + "<|bo|>": 50347, + "<|br|>": 50309, + "<|bs|>": 50315, + "<|ca|>": 50270, + "<|cs|>": 50283, + "<|cy|>": 50297, + "<|da|>": 50285, + "<|de|>": 50261, + "<|el|>": 50281, + "<|en|>": 50259, + "<|es|>": 50262, + "<|et|>": 50307, + "<|eu|>": 50310, + "<|fa|>": 50300, + "<|fi|>": 50277, + "<|fo|>": 50338, + "<|fr|>": 50265, + "<|gl|>": 50319, + "<|gu|>": 50333, + "<|haw|>": 50352, + "<|ha|>": 50354, + "<|he|>": 50279, + "<|hi|>": 50276, + "<|hr|>": 50291, + "<|ht|>": 50339, + "<|hu|>": 50286, + "<|hy|>": 50312, + "<|id|>": 50275, + "<|is|>": 50311, + "<|it|>": 50274, + "<|ja|>": 50266, + "<|jw|>": 50356, + "<|ka|>": 50329, + "<|kk|>": 50316, + "<|km|>": 50323, + "<|kn|>": 50306, + "<|ko|>": 50264, + "<|la|>": 50294, + "<|lb|>": 50345, + "<|ln|>": 50353, + "<|lo|>": 50336, + "<|lt|>": 50293, + "<|lv|>": 50301, + "<|mg|>": 50349, + "<|mi|>": 50295, + "<|mk|>": 50308, + "<|ml|>": 50296, + "<|mn|>": 50314, + "<|mr|>": 50320, + "<|ms|>": 50282, + "<|mt|>": 50343, + "<|my|>": 50346, + "<|ne|>": 50313, + "<|nl|>": 50271, + "<|nn|>": 50342, + "<|no|>": 50288, + "<|oc|>": 50328, + "<|pa|>": 50321, + "<|pl|>": 50269, + "<|ps|>": 50340, + "<|pt|>": 50267, + "<|ro|>": 50284, + "<|ru|>": 50263, + "<|sa|>": 50344, + "<|sd|>": 50332, + "<|si|>": 50322, + "<|sk|>": 50298, + "<|sl|>": 50305, + "<|sn|>": 50324, + "<|so|>": 50326, + "<|sq|>": 50317, + "<|sr|>": 50303, + "<|su|>": 50357, + "<|sv|>": 50273, + "<|sw|>": 50318, + "<|ta|>": 50287, + "<|te|>": 50299, + "<|tg|>": 50331, + "<|th|>": 50289, + "<|tk|>": 50341, + "<|tl|>": 50348, + "<|tr|>": 50268, + "<|tt|>": 50351, + "<|uk|>": 50280, + "<|ur|>": 50290, + "<|uz|>": 50337, + "<|vi|>": 50278, + "<|yi|>": 50335, + "<|yo|>": 50325, + "<|zh|>": 50260 + }, + "max_initial_timestamp_index": 50, + "max_length": 448, + "no_timestamps_token_id": 50363, + "pad_token_id": 50257, + "prev_sot_token_id": 50361, + "return_timestamps": false, + "suppress_tokens": [ + 1, + 2, + 7, + 8, + 9, + 10, + 14, + 25, + 26, + 27, + 28, + 29, + 31, + 58, + 59, + 60, + 61, + 62, + 63, + 90, + 91, + 92, + 93, + 359, + 503, + 522, + 542, + 873, + 893, + 902, + 918, + 922, + 931, + 1350, + 1853, + 1982, + 2460, + 2627, + 3246, + 3253, + 3268, + 3536, + 3846, + 3961, + 4183, + 4667, + 6585, + 6647, + 7273, + 9061, + 9383, + 10428, + 10929, + 11938, + 12033, + 12331, + 12562, + 13793, + 14157, + 14635, + 15265, + 15618, + 16553, + 16604, + 18362, + 18956, + 20075, + 21675, + 22520, + 26130, + 26161, + 26435, + 28279, + 29464, + 31650, + 32302, + 32470, + 36865, + 42863, + 47425, + 49870, + 50254, + 50258, + 50358, + 50359, + 50360, + 50361, + 50362 + ], + "task_to_id": { + "transcribe": 50359, + "translate": 50358 + }, + "transformers_version": "4.41.1" +} diff --git a/whisper-tiny-hi-checkpoint-6/model.safetensors b/whisper-tiny-hi-checkpoint-6/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9aa0b456f8cd8c36c001d1d45bbe4fde21f76cff --- /dev/null +++ b/whisper-tiny-hi-checkpoint-6/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59c8982089b3ffb0f35b2a8b93a329827d3603f741f4d47ddb7a17dc5a7e5e2 +size 151061672 diff --git a/whisper-tiny-hi-checkpoint-6/preprocessor_config.json b/whisper-tiny-hi-checkpoint-6/preprocessor_config.json new file mode 100644 index 0000000000000000000000000000000000000000..91876762a536a746d268353c5cba57286e76b058 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-6/preprocessor_config.json @@ -0,0 +1,14 @@ +{ + "chunk_length": 30, + "feature_extractor_type": "WhisperFeatureExtractor", + "feature_size": 80, + "hop_length": 160, + "n_fft": 400, + "n_samples": 480000, + "nb_max_frames": 3000, + "padding_side": "right", + "padding_value": 0.0, + "processor_class": "WhisperProcessor", + "return_attention_mask": false, + "sampling_rate": 16000 +} diff --git a/whisper-tiny-hi-checkpoint-6/trainer_state.json b/whisper-tiny-hi-checkpoint-6/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..bf7db2d2182797333bd04906ca9d7d00235d5729 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-6/trainer_state.json @@ -0,0 +1,247 @@ +{ + "best_metric": 69.98899144720129, + "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-120", + "epoch": 6.40625, + "eval_steps": 40, + "global_step": 205, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.625, + "grad_norm": 10.95101547241211, + "learning_rate": 9.200000000000002e-06, + "loss": 2.3747, + "step": 20 + }, + { + "epoch": 1.25, + "grad_norm": 7.747081279754639, + "learning_rate": 8.2e-06, + "loss": 1.2169, + "step": 40 + }, + { + "epoch": 1.25, + "eval_loss": 1.0360029935836792, + "eval_runtime": 574.5339, + "eval_samples_per_second": 1.741, + "eval_steps_per_second": 1.741, + "eval_wer": 91.60809552036582, + "step": 40 + }, + { + "epoch": 1.875, + "grad_norm": 7.32460355758667, + "learning_rate": 7.2000000000000005e-06, + "loss": 0.9058, + "step": 60 + }, + { + "epoch": 2.5, + "grad_norm": 6.835532188415527, + "learning_rate": 6.200000000000001e-06, + "loss": 0.7302, + "step": 80 + }, + { + "epoch": 2.5, + "eval_loss": 0.7368654608726501, + "eval_runtime": 549.562, + "eval_samples_per_second": 1.82, + "eval_steps_per_second": 1.82, + "eval_wer": 79.80353967313066, + "step": 80 + }, + { + "epoch": 3.125, + "grad_norm": 6.408384323120117, + "learning_rate": 5.2e-06, + "loss": 0.6453, + "step": 100 + }, + { + "epoch": 3.75, + "grad_norm": 5.809150695800781, + "learning_rate": 4.2000000000000004e-06, + "loss": 0.5917, + "step": 120 + }, + { + "epoch": 3.75, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.8688, + "eval_samples_per_second": 1.822, + "eval_steps_per_second": 1.822, + "eval_wer": 69.98899144720129, + "step": 120 + }, + { + "epoch": 4.375, + "grad_norm": 5.724637508392334, + "learning_rate": 3.2000000000000003e-06, + "loss": 0.5356, + "step": 140 + }, + { + "epoch": 5.0, + "grad_norm": 10.124310493469238, + "learning_rate": 2.2e-06, + "loss": 0.5156, + "step": 160 + }, + { + "epoch": 5.0, + "eval_loss": 0.6157090663909912, + "eval_runtime": 549.7895, + "eval_samples_per_second": 1.819, + "eval_steps_per_second": 1.819, + "eval_wer": 70.4293335591498, + "step": 160 + }, + { + "epoch": 5.625, + "grad_norm": 4.947811126708984, + "learning_rate": 1.2000000000000002e-06, + "loss": 0.4986, + "step": 180 + }, + { + "epoch": 6.25, + "grad_norm": 4.541861057281494, + "learning_rate": 2.0000000000000002e-07, + "loss": 0.481, + "step": 200 + }, + { + "epoch": 6.25, + "eval_loss": 0.6050636768341064, + "eval_runtime": 552.964, + "eval_samples_per_second": 1.808, + "eval_steps_per_second": 1.808, + "eval_wer": 70.03980015242611, + "step": 200 + }, + { + "epoch": 6.25, + "step": 200, + "total_flos": 1.5401574531072e+17, + "train_loss": 0.8495243072509766, + "train_runtime": 3592.94, + "train_samples_per_second": 1.781, + "train_steps_per_second": 0.056 + }, + { + "epoch": 6.28125, + "step": 201, + "total_flos": 1.5480354963456e+17, + "train_loss": 0.003230639654605543, + "train_runtime": 7.5043, + "train_samples_per_second": 852.844, + "train_steps_per_second": 26.651 + }, + { + "epoch": 6.28125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.5863, + "eval_samples_per_second": 1.823, + "eval_steps_per_second": 1.823, + "eval_wer": 69.98899144720129, + "step": 201 + }, + { + "epoch": 6.3125, + "step": 202, + "total_flos": 1.555913539584e+17, + "train_loss": 0.0035205459830784562, + "train_runtime": 7.6486, + "train_samples_per_second": 836.753, + "train_steps_per_second": 26.149 + }, + { + "epoch": 6.3125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.2984, + "eval_samples_per_second": 1.824, + "eval_steps_per_second": 1.824, + "eval_wer": 69.98899144720129, + "step": 202 + }, + { + "epoch": 6.34375, + "step": 203, + "total_flos": 1.5637915828224e+17, + "train_loss": 0.002875891812329222, + "train_runtime": 7.5227, + "train_samples_per_second": 850.756, + "train_steps_per_second": 26.586 + }, + { + "epoch": 6.34375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 547.5722, + "eval_samples_per_second": 1.826, + "eval_steps_per_second": 1.826, + "eval_wer": 69.98899144720129, + "step": 203 + }, + { + "epoch": 6.375, + "step": 204, + "total_flos": 1.5716696260608e+17, + "train_loss": 0.003042735305486941, + "train_runtime": 7.3464, + "train_samples_per_second": 871.18, + "train_steps_per_second": 27.224 + }, + { + "epoch": 6.375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 547.015, + "eval_samples_per_second": 1.828, + "eval_steps_per_second": 1.828, + "eval_wer": 69.98899144720129, + "step": 204 + }, + { + "epoch": 6.40625, + "step": 205, + "total_flos": 1.5795476692992e+17, + "train_loss": 0.0033008325390699433, + "train_runtime": 7.3265, + "train_samples_per_second": 873.547, + "train_steps_per_second": 27.298 + }, + { + "epoch": 6.40625, + "eval_loss": 0.6504533886909485, + "eval_runtime": 545.7731, + "eval_samples_per_second": 1.832, + "eval_steps_per_second": 1.832, + "eval_wer": 69.98899144720129, + "step": 205 + } + ], + "logging_steps": 20, + "max_steps": 200, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 40, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.5795476692992e+17, + "train_batch_size": 32, + "trial_name": null, + "trial_params": null +} diff --git a/whisper-tiny-hi-checkpoint-6/training_args.bin b/whisper-tiny-hi-checkpoint-6/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..7a964e0d5fd756a2d157082dfe6ad51a0b5ab178 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-6/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:319a37cc1be11f31107d50f5d1c738bcbdf762b1adfd84cac855fe8bbf608c5e +size 5240 diff --git a/whisper-tiny-hi-checkpoint-7/config.json b/whisper-tiny-hi-checkpoint-7/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9f677d2a2860675d39685a33dd833ee2e98c269d --- /dev/null +++ b/whisper-tiny-hi-checkpoint-7/config.json @@ -0,0 +1,52 @@ +{ + "_name_or_path": "./whisper-tiny-hi2_test/whisper-tiny-hi-checkpoint-6", + "activation_dropout": 0.0, + "activation_function": "gelu", + "apply_spec_augment": false, + "architectures": [ + "WhisperForConditionalGeneration" + ], + "attention_dropout": 0.0, + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "classifier_proj_size": 256, + "d_model": 384, + "decoder_attention_heads": 6, + "decoder_ffn_dim": 1536, + "decoder_layerdrop": 0.0, + "decoder_layers": 4, + "decoder_start_token_id": 50258, + "dropout": 0.0, + "encoder_attention_heads": 6, + "encoder_ffn_dim": 1536, + "encoder_layerdrop": 0.0, + "encoder_layers": 4, + "eos_token_id": 50257, + "forced_decoder_ids": null, + "init_std": 0.02, + "is_encoder_decoder": true, + "mask_feature_length": 10, + "mask_feature_min_masks": 0, + "mask_feature_prob": 0.0, + "mask_time_length": 10, + "mask_time_min_masks": 2, + "mask_time_prob": 0.05, + "max_length": 448, + "max_source_positions": 1500, + "max_target_positions": 448, + "median_filter_width": 7, + "model_type": "whisper", + "num_hidden_layers": 4, + "num_mel_bins": 80, + "pad_token_id": 50257, + "scale_embedding": false, + "suppress_tokens": [], + "torch_dtype": "float32", + "transformers_version": "4.41.1", + "use_cache": true, + "use_weighted_layer_sum": false, + "vocab_size": 51865 +} diff --git a/whisper-tiny-hi-checkpoint-7/generation_config.json b/whisper-tiny-hi-checkpoint-7/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d286bdf1e0677a78ae4dc92903472de5fe668ef --- /dev/null +++ b/whisper-tiny-hi-checkpoint-7/generation_config.json @@ -0,0 +1,248 @@ +{ + "alignment_heads": [ + [ + 2, + 2 + ], + [ + 3, + 0 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ], + [ + 3, + 4 + ], + [ + 3, + 5 + ] + ], + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "decoder_start_token_id": 50258, + "eos_token_id": 50257, + "forced_decoder_ids": [ + [ + 1, + null + ], + [ + 2, + 50359 + ] + ], + "is_multilingual": true, + "lang_to_id": { + "<|af|>": 50327, + "<|am|>": 50334, + "<|ar|>": 50272, + "<|as|>": 50350, + "<|az|>": 50304, + "<|ba|>": 50355, + "<|be|>": 50330, + "<|bg|>": 50292, + "<|bn|>": 50302, + "<|bo|>": 50347, + "<|br|>": 50309, + "<|bs|>": 50315, + "<|ca|>": 50270, + "<|cs|>": 50283, + "<|cy|>": 50297, + "<|da|>": 50285, + "<|de|>": 50261, + "<|el|>": 50281, + "<|en|>": 50259, + "<|es|>": 50262, + "<|et|>": 50307, + "<|eu|>": 50310, + "<|fa|>": 50300, + "<|fi|>": 50277, + "<|fo|>": 50338, + "<|fr|>": 50265, + "<|gl|>": 50319, + "<|gu|>": 50333, + "<|haw|>": 50352, + "<|ha|>": 50354, + "<|he|>": 50279, + "<|hi|>": 50276, + "<|hr|>": 50291, + "<|ht|>": 50339, + "<|hu|>": 50286, + "<|hy|>": 50312, + "<|id|>": 50275, + "<|is|>": 50311, + "<|it|>": 50274, + "<|ja|>": 50266, + "<|jw|>": 50356, + "<|ka|>": 50329, + "<|kk|>": 50316, + "<|km|>": 50323, + "<|kn|>": 50306, + "<|ko|>": 50264, + "<|la|>": 50294, + "<|lb|>": 50345, + "<|ln|>": 50353, + "<|lo|>": 50336, + "<|lt|>": 50293, + "<|lv|>": 50301, + "<|mg|>": 50349, + "<|mi|>": 50295, + "<|mk|>": 50308, + "<|ml|>": 50296, + "<|mn|>": 50314, + "<|mr|>": 50320, + "<|ms|>": 50282, + "<|mt|>": 50343, + "<|my|>": 50346, + "<|ne|>": 50313, + "<|nl|>": 50271, + "<|nn|>": 50342, + "<|no|>": 50288, + "<|oc|>": 50328, + "<|pa|>": 50321, + "<|pl|>": 50269, + "<|ps|>": 50340, + "<|pt|>": 50267, + "<|ro|>": 50284, + "<|ru|>": 50263, + "<|sa|>": 50344, + "<|sd|>": 50332, + "<|si|>": 50322, + "<|sk|>": 50298, + "<|sl|>": 50305, + "<|sn|>": 50324, + "<|so|>": 50326, + "<|sq|>": 50317, + "<|sr|>": 50303, + "<|su|>": 50357, + "<|sv|>": 50273, + "<|sw|>": 50318, + "<|ta|>": 50287, + "<|te|>": 50299, + "<|tg|>": 50331, + "<|th|>": 50289, + "<|tk|>": 50341, + "<|tl|>": 50348, + "<|tr|>": 50268, + "<|tt|>": 50351, + "<|uk|>": 50280, + "<|ur|>": 50290, + "<|uz|>": 50337, + "<|vi|>": 50278, + "<|yi|>": 50335, + "<|yo|>": 50325, + "<|zh|>": 50260 + }, + "max_initial_timestamp_index": 50, + "max_length": 448, + "no_timestamps_token_id": 50363, + "pad_token_id": 50257, + "prev_sot_token_id": 50361, + "return_timestamps": false, + "suppress_tokens": [ + 1, + 2, + 7, + 8, + 9, + 10, + 14, + 25, + 26, + 27, + 28, + 29, + 31, + 58, + 59, + 60, + 61, + 62, + 63, + 90, + 91, + 92, + 93, + 359, + 503, + 522, + 542, + 873, + 893, + 902, + 918, + 922, + 931, + 1350, + 1853, + 1982, + 2460, + 2627, + 3246, + 3253, + 3268, + 3536, + 3846, + 3961, + 4183, + 4667, + 6585, + 6647, + 7273, + 9061, + 9383, + 10428, + 10929, + 11938, + 12033, + 12331, + 12562, + 13793, + 14157, + 14635, + 15265, + 15618, + 16553, + 16604, + 18362, + 18956, + 20075, + 21675, + 22520, + 26130, + 26161, + 26435, + 28279, + 29464, + 31650, + 32302, + 32470, + 36865, + 42863, + 47425, + 49870, + 50254, + 50258, + 50358, + 50359, + 50360, + 50361, + 50362 + ], + "task_to_id": { + "transcribe": 50359, + "translate": 50358 + }, + "transformers_version": "4.41.1" +} diff --git a/whisper-tiny-hi-checkpoint-7/model.safetensors b/whisper-tiny-hi-checkpoint-7/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9aa0b456f8cd8c36c001d1d45bbe4fde21f76cff --- /dev/null +++ b/whisper-tiny-hi-checkpoint-7/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59c8982089b3ffb0f35b2a8b93a329827d3603f741f4d47ddb7a17dc5a7e5e2 +size 151061672 diff --git a/whisper-tiny-hi-checkpoint-7/preprocessor_config.json b/whisper-tiny-hi-checkpoint-7/preprocessor_config.json new file mode 100644 index 0000000000000000000000000000000000000000..91876762a536a746d268353c5cba57286e76b058 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-7/preprocessor_config.json @@ -0,0 +1,14 @@ +{ + "chunk_length": 30, + "feature_extractor_type": "WhisperFeatureExtractor", + "feature_size": 80, + "hop_length": 160, + "n_fft": 400, + "n_samples": 480000, + "nb_max_frames": 3000, + "padding_side": "right", + "padding_value": 0.0, + "processor_class": "WhisperProcessor", + "return_attention_mask": false, + "sampling_rate": 16000 +} diff --git a/whisper-tiny-hi-checkpoint-7/trainer_state.json b/whisper-tiny-hi-checkpoint-7/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..64f89c3ca22a66bda9b995ef6e8324eb47e5a12a --- /dev/null +++ b/whisper-tiny-hi-checkpoint-7/trainer_state.json @@ -0,0 +1,265 @@ +{ + "best_metric": 69.98899144720129, + "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-120", + "epoch": 6.4375, + "eval_steps": 40, + "global_step": 206, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.625, + "grad_norm": 10.95101547241211, + "learning_rate": 9.200000000000002e-06, + "loss": 2.3747, + "step": 20 + }, + { + "epoch": 1.25, + "grad_norm": 7.747081279754639, + "learning_rate": 8.2e-06, + "loss": 1.2169, + "step": 40 + }, + { + "epoch": 1.25, + "eval_loss": 1.0360029935836792, + "eval_runtime": 574.5339, + "eval_samples_per_second": 1.741, + "eval_steps_per_second": 1.741, + "eval_wer": 91.60809552036582, + "step": 40 + }, + { + "epoch": 1.875, + "grad_norm": 7.32460355758667, + "learning_rate": 7.2000000000000005e-06, + "loss": 0.9058, + "step": 60 + }, + { + "epoch": 2.5, + "grad_norm": 6.835532188415527, + "learning_rate": 6.200000000000001e-06, + "loss": 0.7302, + "step": 80 + }, + { + "epoch": 2.5, + "eval_loss": 0.7368654608726501, + "eval_runtime": 549.562, + "eval_samples_per_second": 1.82, + "eval_steps_per_second": 1.82, + "eval_wer": 79.80353967313066, + "step": 80 + }, + { + "epoch": 3.125, + "grad_norm": 6.408384323120117, + "learning_rate": 5.2e-06, + "loss": 0.6453, + "step": 100 + }, + { + "epoch": 3.75, + "grad_norm": 5.809150695800781, + "learning_rate": 4.2000000000000004e-06, + "loss": 0.5917, + "step": 120 + }, + { + "epoch": 3.75, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.8688, + "eval_samples_per_second": 1.822, + "eval_steps_per_second": 1.822, + "eval_wer": 69.98899144720129, + "step": 120 + }, + { + "epoch": 4.375, + "grad_norm": 5.724637508392334, + "learning_rate": 3.2000000000000003e-06, + "loss": 0.5356, + "step": 140 + }, + { + "epoch": 5.0, + "grad_norm": 10.124310493469238, + "learning_rate": 2.2e-06, + "loss": 0.5156, + "step": 160 + }, + { + "epoch": 5.0, + "eval_loss": 0.6157090663909912, + "eval_runtime": 549.7895, + "eval_samples_per_second": 1.819, + "eval_steps_per_second": 1.819, + "eval_wer": 70.4293335591498, + "step": 160 + }, + { + "epoch": 5.625, + "grad_norm": 4.947811126708984, + "learning_rate": 1.2000000000000002e-06, + "loss": 0.4986, + "step": 180 + }, + { + "epoch": 6.25, + "grad_norm": 4.541861057281494, + "learning_rate": 2.0000000000000002e-07, + "loss": 0.481, + "step": 200 + }, + { + "epoch": 6.25, + "eval_loss": 0.6050636768341064, + "eval_runtime": 552.964, + "eval_samples_per_second": 1.808, + "eval_steps_per_second": 1.808, + "eval_wer": 70.03980015242611, + "step": 200 + }, + { + "epoch": 6.25, + "step": 200, + "total_flos": 1.5401574531072e+17, + "train_loss": 0.8495243072509766, + "train_runtime": 3592.94, + "train_samples_per_second": 1.781, + "train_steps_per_second": 0.056 + }, + { + "epoch": 6.28125, + "step": 201, + "total_flos": 1.5480354963456e+17, + "train_loss": 0.003230639654605543, + "train_runtime": 7.5043, + "train_samples_per_second": 852.844, + "train_steps_per_second": 26.651 + }, + { + "epoch": 6.28125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.5863, + "eval_samples_per_second": 1.823, + "eval_steps_per_second": 1.823, + "eval_wer": 69.98899144720129, + "step": 201 + }, + { + "epoch": 6.3125, + "step": 202, + "total_flos": 1.555913539584e+17, + "train_loss": 0.0035205459830784562, + "train_runtime": 7.6486, + "train_samples_per_second": 836.753, + "train_steps_per_second": 26.149 + }, + { + "epoch": 6.3125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.2984, + "eval_samples_per_second": 1.824, + "eval_steps_per_second": 1.824, + "eval_wer": 69.98899144720129, + "step": 202 + }, + { + "epoch": 6.34375, + "step": 203, + "total_flos": 1.5637915828224e+17, + "train_loss": 0.002875891812329222, + "train_runtime": 7.5227, + "train_samples_per_second": 850.756, + "train_steps_per_second": 26.586 + }, + { + "epoch": 6.34375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 547.5722, + "eval_samples_per_second": 1.826, + "eval_steps_per_second": 1.826, + "eval_wer": 69.98899144720129, + "step": 203 + }, + { + "epoch": 6.375, + "step": 204, + "total_flos": 1.5716696260608e+17, + "train_loss": 0.003042735305486941, + "train_runtime": 7.3464, + "train_samples_per_second": 871.18, + "train_steps_per_second": 27.224 + }, + { + "epoch": 6.375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 547.015, + "eval_samples_per_second": 1.828, + "eval_steps_per_second": 1.828, + "eval_wer": 69.98899144720129, + "step": 204 + }, + { + "epoch": 6.40625, + "step": 205, + "total_flos": 1.5795476692992e+17, + "train_loss": 0.0033008325390699433, + "train_runtime": 7.3265, + "train_samples_per_second": 873.547, + "train_steps_per_second": 27.298 + }, + { + "epoch": 6.40625, + "eval_loss": 0.6504533886909485, + "eval_runtime": 545.7731, + "eval_samples_per_second": 1.832, + "eval_steps_per_second": 1.832, + "eval_wer": 69.98899144720129, + "step": 205 + }, + { + "epoch": 6.4375, + "step": 206, + "total_flos": 1.5874257125376e+17, + "train_loss": 0.0030977731769524734, + "train_runtime": 7.5608, + "train_samples_per_second": 846.467, + "train_steps_per_second": 26.452 + }, + { + "epoch": 6.4375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 546.3323, + "eval_samples_per_second": 1.83, + "eval_steps_per_second": 1.83, + "eval_wer": 69.98899144720129, + "step": 206 + } + ], + "logging_steps": 20, + "max_steps": 200, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 40, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.5874257125376e+17, + "train_batch_size": 32, + "trial_name": null, + "trial_params": null +} diff --git a/whisper-tiny-hi-checkpoint-7/training_args.bin b/whisper-tiny-hi-checkpoint-7/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..d5f8edc7271c4b4da8bc38a47a84c354f92afe9a --- /dev/null +++ b/whisper-tiny-hi-checkpoint-7/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2fc511e8a8df6e4a22a9d587085443d2b3f42c9d8e0dedb27674021fb85a1f5 +size 5240 diff --git a/whisper-tiny-hi-checkpoint-8/config.json b/whisper-tiny-hi-checkpoint-8/config.json new file mode 100644 index 0000000000000000000000000000000000000000..719a2825b76ea63956b3ce0bc68078b782fce788 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-8/config.json @@ -0,0 +1,52 @@ +{ + "_name_or_path": "./whisper-tiny-hi2_test/whisper-tiny-hi-checkpoint-7", + "activation_dropout": 0.0, + "activation_function": "gelu", + "apply_spec_augment": false, + "architectures": [ + "WhisperForConditionalGeneration" + ], + "attention_dropout": 0.0, + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "classifier_proj_size": 256, + "d_model": 384, + "decoder_attention_heads": 6, + "decoder_ffn_dim": 1536, + "decoder_layerdrop": 0.0, + "decoder_layers": 4, + "decoder_start_token_id": 50258, + "dropout": 0.0, + "encoder_attention_heads": 6, + "encoder_ffn_dim": 1536, + "encoder_layerdrop": 0.0, + "encoder_layers": 4, + "eos_token_id": 50257, + "forced_decoder_ids": null, + "init_std": 0.02, + "is_encoder_decoder": true, + "mask_feature_length": 10, + "mask_feature_min_masks": 0, + "mask_feature_prob": 0.0, + "mask_time_length": 10, + "mask_time_min_masks": 2, + "mask_time_prob": 0.05, + "max_length": 448, + "max_source_positions": 1500, + "max_target_positions": 448, + "median_filter_width": 7, + "model_type": "whisper", + "num_hidden_layers": 4, + "num_mel_bins": 80, + "pad_token_id": 50257, + "scale_embedding": false, + "suppress_tokens": [], + "torch_dtype": "float32", + "transformers_version": "4.41.1", + "use_cache": true, + "use_weighted_layer_sum": false, + "vocab_size": 51865 +} diff --git a/whisper-tiny-hi-checkpoint-8/generation_config.json b/whisper-tiny-hi-checkpoint-8/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d286bdf1e0677a78ae4dc92903472de5fe668ef --- /dev/null +++ b/whisper-tiny-hi-checkpoint-8/generation_config.json @@ -0,0 +1,248 @@ +{ + "alignment_heads": [ + [ + 2, + 2 + ], + [ + 3, + 0 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ], + [ + 3, + 4 + ], + [ + 3, + 5 + ] + ], + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "decoder_start_token_id": 50258, + "eos_token_id": 50257, + "forced_decoder_ids": [ + [ + 1, + null + ], + [ + 2, + 50359 + ] + ], + "is_multilingual": true, + "lang_to_id": { + "<|af|>": 50327, + "<|am|>": 50334, + "<|ar|>": 50272, + "<|as|>": 50350, + "<|az|>": 50304, + "<|ba|>": 50355, + "<|be|>": 50330, + "<|bg|>": 50292, + "<|bn|>": 50302, + "<|bo|>": 50347, + "<|br|>": 50309, + "<|bs|>": 50315, + "<|ca|>": 50270, + "<|cs|>": 50283, + "<|cy|>": 50297, + "<|da|>": 50285, + "<|de|>": 50261, + "<|el|>": 50281, + "<|en|>": 50259, + "<|es|>": 50262, + "<|et|>": 50307, + "<|eu|>": 50310, + "<|fa|>": 50300, + "<|fi|>": 50277, + "<|fo|>": 50338, + "<|fr|>": 50265, + "<|gl|>": 50319, + "<|gu|>": 50333, + "<|haw|>": 50352, + "<|ha|>": 50354, + "<|he|>": 50279, + "<|hi|>": 50276, + "<|hr|>": 50291, + "<|ht|>": 50339, + "<|hu|>": 50286, + "<|hy|>": 50312, + "<|id|>": 50275, + "<|is|>": 50311, + "<|it|>": 50274, + "<|ja|>": 50266, + "<|jw|>": 50356, + "<|ka|>": 50329, + "<|kk|>": 50316, + "<|km|>": 50323, + "<|kn|>": 50306, + "<|ko|>": 50264, + "<|la|>": 50294, + "<|lb|>": 50345, + "<|ln|>": 50353, + "<|lo|>": 50336, + "<|lt|>": 50293, + "<|lv|>": 50301, + "<|mg|>": 50349, + "<|mi|>": 50295, + "<|mk|>": 50308, + "<|ml|>": 50296, + "<|mn|>": 50314, + "<|mr|>": 50320, + "<|ms|>": 50282, + "<|mt|>": 50343, + "<|my|>": 50346, + "<|ne|>": 50313, + "<|nl|>": 50271, + "<|nn|>": 50342, + "<|no|>": 50288, + "<|oc|>": 50328, + "<|pa|>": 50321, + "<|pl|>": 50269, + "<|ps|>": 50340, + "<|pt|>": 50267, + "<|ro|>": 50284, + "<|ru|>": 50263, + "<|sa|>": 50344, + "<|sd|>": 50332, + "<|si|>": 50322, + "<|sk|>": 50298, + "<|sl|>": 50305, + "<|sn|>": 50324, + "<|so|>": 50326, + "<|sq|>": 50317, + "<|sr|>": 50303, + "<|su|>": 50357, + "<|sv|>": 50273, + "<|sw|>": 50318, + "<|ta|>": 50287, + "<|te|>": 50299, + "<|tg|>": 50331, + "<|th|>": 50289, + "<|tk|>": 50341, + "<|tl|>": 50348, + "<|tr|>": 50268, + "<|tt|>": 50351, + "<|uk|>": 50280, + "<|ur|>": 50290, + "<|uz|>": 50337, + "<|vi|>": 50278, + "<|yi|>": 50335, + "<|yo|>": 50325, + "<|zh|>": 50260 + }, + "max_initial_timestamp_index": 50, + "max_length": 448, + "no_timestamps_token_id": 50363, + "pad_token_id": 50257, + "prev_sot_token_id": 50361, + "return_timestamps": false, + "suppress_tokens": [ + 1, + 2, + 7, + 8, + 9, + 10, + 14, + 25, + 26, + 27, + 28, + 29, + 31, + 58, + 59, + 60, + 61, + 62, + 63, + 90, + 91, + 92, + 93, + 359, + 503, + 522, + 542, + 873, + 893, + 902, + 918, + 922, + 931, + 1350, + 1853, + 1982, + 2460, + 2627, + 3246, + 3253, + 3268, + 3536, + 3846, + 3961, + 4183, + 4667, + 6585, + 6647, + 7273, + 9061, + 9383, + 10428, + 10929, + 11938, + 12033, + 12331, + 12562, + 13793, + 14157, + 14635, + 15265, + 15618, + 16553, + 16604, + 18362, + 18956, + 20075, + 21675, + 22520, + 26130, + 26161, + 26435, + 28279, + 29464, + 31650, + 32302, + 32470, + 36865, + 42863, + 47425, + 49870, + 50254, + 50258, + 50358, + 50359, + 50360, + 50361, + 50362 + ], + "task_to_id": { + "transcribe": 50359, + "translate": 50358 + }, + "transformers_version": "4.41.1" +} diff --git a/whisper-tiny-hi-checkpoint-8/model.safetensors b/whisper-tiny-hi-checkpoint-8/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9aa0b456f8cd8c36c001d1d45bbe4fde21f76cff --- /dev/null +++ b/whisper-tiny-hi-checkpoint-8/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59c8982089b3ffb0f35b2a8b93a329827d3603f741f4d47ddb7a17dc5a7e5e2 +size 151061672 diff --git a/whisper-tiny-hi-checkpoint-8/preprocessor_config.json b/whisper-tiny-hi-checkpoint-8/preprocessor_config.json new file mode 100644 index 0000000000000000000000000000000000000000..91876762a536a746d268353c5cba57286e76b058 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-8/preprocessor_config.json @@ -0,0 +1,14 @@ +{ + "chunk_length": 30, + "feature_extractor_type": "WhisperFeatureExtractor", + "feature_size": 80, + "hop_length": 160, + "n_fft": 400, + "n_samples": 480000, + "nb_max_frames": 3000, + "padding_side": "right", + "padding_value": 0.0, + "processor_class": "WhisperProcessor", + "return_attention_mask": false, + "sampling_rate": 16000 +} diff --git a/whisper-tiny-hi-checkpoint-8/trainer_state.json b/whisper-tiny-hi-checkpoint-8/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..d24401fe30577fb48edb59b0274106270f9e6dec --- /dev/null +++ b/whisper-tiny-hi-checkpoint-8/trainer_state.json @@ -0,0 +1,283 @@ +{ + "best_metric": 69.98899144720129, + "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-120", + "epoch": 6.46875, + "eval_steps": 40, + "global_step": 207, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.625, + "grad_norm": 10.95101547241211, + "learning_rate": 9.200000000000002e-06, + "loss": 2.3747, + "step": 20 + }, + { + "epoch": 1.25, + "grad_norm": 7.747081279754639, + "learning_rate": 8.2e-06, + "loss": 1.2169, + "step": 40 + }, + { + "epoch": 1.25, + "eval_loss": 1.0360029935836792, + "eval_runtime": 574.5339, + "eval_samples_per_second": 1.741, + "eval_steps_per_second": 1.741, + "eval_wer": 91.60809552036582, + "step": 40 + }, + { + "epoch": 1.875, + "grad_norm": 7.32460355758667, + "learning_rate": 7.2000000000000005e-06, + "loss": 0.9058, + "step": 60 + }, + { + "epoch": 2.5, + "grad_norm": 6.835532188415527, + "learning_rate": 6.200000000000001e-06, + "loss": 0.7302, + "step": 80 + }, + { + "epoch": 2.5, + "eval_loss": 0.7368654608726501, + "eval_runtime": 549.562, + "eval_samples_per_second": 1.82, + "eval_steps_per_second": 1.82, + "eval_wer": 79.80353967313066, + "step": 80 + }, + { + "epoch": 3.125, + "grad_norm": 6.408384323120117, + "learning_rate": 5.2e-06, + "loss": 0.6453, + "step": 100 + }, + { + "epoch": 3.75, + "grad_norm": 5.809150695800781, + "learning_rate": 4.2000000000000004e-06, + "loss": 0.5917, + "step": 120 + }, + { + "epoch": 3.75, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.8688, + "eval_samples_per_second": 1.822, + "eval_steps_per_second": 1.822, + "eval_wer": 69.98899144720129, + "step": 120 + }, + { + "epoch": 4.375, + "grad_norm": 5.724637508392334, + "learning_rate": 3.2000000000000003e-06, + "loss": 0.5356, + "step": 140 + }, + { + "epoch": 5.0, + "grad_norm": 10.124310493469238, + "learning_rate": 2.2e-06, + "loss": 0.5156, + "step": 160 + }, + { + "epoch": 5.0, + "eval_loss": 0.6157090663909912, + "eval_runtime": 549.7895, + "eval_samples_per_second": 1.819, + "eval_steps_per_second": 1.819, + "eval_wer": 70.4293335591498, + "step": 160 + }, + { + "epoch": 5.625, + "grad_norm": 4.947811126708984, + "learning_rate": 1.2000000000000002e-06, + "loss": 0.4986, + "step": 180 + }, + { + "epoch": 6.25, + "grad_norm": 4.541861057281494, + "learning_rate": 2.0000000000000002e-07, + "loss": 0.481, + "step": 200 + }, + { + "epoch": 6.25, + "eval_loss": 0.6050636768341064, + "eval_runtime": 552.964, + "eval_samples_per_second": 1.808, + "eval_steps_per_second": 1.808, + "eval_wer": 70.03980015242611, + "step": 200 + }, + { + "epoch": 6.25, + "step": 200, + "total_flos": 1.5401574531072e+17, + "train_loss": 0.8495243072509766, + "train_runtime": 3592.94, + "train_samples_per_second": 1.781, + "train_steps_per_second": 0.056 + }, + { + "epoch": 6.28125, + "step": 201, + "total_flos": 1.5480354963456e+17, + "train_loss": 0.003230639654605543, + "train_runtime": 7.5043, + "train_samples_per_second": 852.844, + "train_steps_per_second": 26.651 + }, + { + "epoch": 6.28125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.5863, + "eval_samples_per_second": 1.823, + "eval_steps_per_second": 1.823, + "eval_wer": 69.98899144720129, + "step": 201 + }, + { + "epoch": 6.3125, + "step": 202, + "total_flos": 1.555913539584e+17, + "train_loss": 0.0035205459830784562, + "train_runtime": 7.6486, + "train_samples_per_second": 836.753, + "train_steps_per_second": 26.149 + }, + { + "epoch": 6.3125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.2984, + "eval_samples_per_second": 1.824, + "eval_steps_per_second": 1.824, + "eval_wer": 69.98899144720129, + "step": 202 + }, + { + "epoch": 6.34375, + "step": 203, + "total_flos": 1.5637915828224e+17, + "train_loss": 0.002875891812329222, + "train_runtime": 7.5227, + "train_samples_per_second": 850.756, + "train_steps_per_second": 26.586 + }, + { + "epoch": 6.34375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 547.5722, + "eval_samples_per_second": 1.826, + "eval_steps_per_second": 1.826, + "eval_wer": 69.98899144720129, + "step": 203 + }, + { + "epoch": 6.375, + "step": 204, + "total_flos": 1.5716696260608e+17, + "train_loss": 0.003042735305486941, + "train_runtime": 7.3464, + "train_samples_per_second": 871.18, + "train_steps_per_second": 27.224 + }, + { + "epoch": 6.375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 547.015, + "eval_samples_per_second": 1.828, + "eval_steps_per_second": 1.828, + "eval_wer": 69.98899144720129, + "step": 204 + }, + { + "epoch": 6.40625, + "step": 205, + "total_flos": 1.5795476692992e+17, + "train_loss": 0.0033008325390699433, + "train_runtime": 7.3265, + "train_samples_per_second": 873.547, + "train_steps_per_second": 27.298 + }, + { + "epoch": 6.40625, + "eval_loss": 0.6504533886909485, + "eval_runtime": 545.7731, + "eval_samples_per_second": 1.832, + "eval_steps_per_second": 1.832, + "eval_wer": 69.98899144720129, + "step": 205 + }, + { + "epoch": 6.4375, + "step": 206, + "total_flos": 1.5874257125376e+17, + "train_loss": 0.0030977731769524734, + "train_runtime": 7.5608, + "train_samples_per_second": 846.467, + "train_steps_per_second": 26.452 + }, + { + "epoch": 6.4375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 546.3323, + "eval_samples_per_second": 1.83, + "eval_steps_per_second": 1.83, + "eval_wer": 69.98899144720129, + "step": 206 + }, + { + "epoch": 6.46875, + "step": 207, + "total_flos": 1.595303755776e+17, + "train_loss": 0.0028965755361289795, + "train_runtime": 7.5526, + "train_samples_per_second": 847.394, + "train_steps_per_second": 26.481 + }, + { + "epoch": 6.46875, + "eval_loss": 0.6504533886909485, + "eval_runtime": 546.1485, + "eval_samples_per_second": 1.831, + "eval_steps_per_second": 1.831, + "eval_wer": 69.98899144720129, + "step": 207 + } + ], + "logging_steps": 20, + "max_steps": 200, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 40, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.595303755776e+17, + "train_batch_size": 32, + "trial_name": null, + "trial_params": null +} diff --git a/whisper-tiny-hi-checkpoint-8/training_args.bin b/whisper-tiny-hi-checkpoint-8/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2308fe2a4639389510814af6cadd7505219645a6 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-8/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:767a339ae784e4e2055db7eadefcdc190b9171a0a90225fa68122ab68b97bf5b +size 5240 diff --git a/whisper-tiny-hi-checkpoint-9/config.json b/whisper-tiny-hi-checkpoint-9/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1c588432553e8fcb65845fb79262f2bef36bb72a --- /dev/null +++ b/whisper-tiny-hi-checkpoint-9/config.json @@ -0,0 +1,52 @@ +{ + "_name_or_path": "./whisper-tiny-hi2_test/whisper-tiny-hi-checkpoint-8", + "activation_dropout": 0.0, + "activation_function": "gelu", + "apply_spec_augment": false, + "architectures": [ + "WhisperForConditionalGeneration" + ], + "attention_dropout": 0.0, + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "classifier_proj_size": 256, + "d_model": 384, + "decoder_attention_heads": 6, + "decoder_ffn_dim": 1536, + "decoder_layerdrop": 0.0, + "decoder_layers": 4, + "decoder_start_token_id": 50258, + "dropout": 0.0, + "encoder_attention_heads": 6, + "encoder_ffn_dim": 1536, + "encoder_layerdrop": 0.0, + "encoder_layers": 4, + "eos_token_id": 50257, + "forced_decoder_ids": null, + "init_std": 0.02, + "is_encoder_decoder": true, + "mask_feature_length": 10, + "mask_feature_min_masks": 0, + "mask_feature_prob": 0.0, + "mask_time_length": 10, + "mask_time_min_masks": 2, + "mask_time_prob": 0.05, + "max_length": 448, + "max_source_positions": 1500, + "max_target_positions": 448, + "median_filter_width": 7, + "model_type": "whisper", + "num_hidden_layers": 4, + "num_mel_bins": 80, + "pad_token_id": 50257, + "scale_embedding": false, + "suppress_tokens": [], + "torch_dtype": "float32", + "transformers_version": "4.41.1", + "use_cache": true, + "use_weighted_layer_sum": false, + "vocab_size": 51865 +} diff --git a/whisper-tiny-hi-checkpoint-9/generation_config.json b/whisper-tiny-hi-checkpoint-9/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d286bdf1e0677a78ae4dc92903472de5fe668ef --- /dev/null +++ b/whisper-tiny-hi-checkpoint-9/generation_config.json @@ -0,0 +1,248 @@ +{ + "alignment_heads": [ + [ + 2, + 2 + ], + [ + 3, + 0 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ], + [ + 3, + 4 + ], + [ + 3, + 5 + ] + ], + "begin_suppress_tokens": [ + 220, + 50257 + ], + "bos_token_id": 50257, + "decoder_start_token_id": 50258, + "eos_token_id": 50257, + "forced_decoder_ids": [ + [ + 1, + null + ], + [ + 2, + 50359 + ] + ], + "is_multilingual": true, + "lang_to_id": { + "<|af|>": 50327, + "<|am|>": 50334, + "<|ar|>": 50272, + "<|as|>": 50350, + "<|az|>": 50304, + "<|ba|>": 50355, + "<|be|>": 50330, + "<|bg|>": 50292, + "<|bn|>": 50302, + "<|bo|>": 50347, + "<|br|>": 50309, + "<|bs|>": 50315, + "<|ca|>": 50270, + "<|cs|>": 50283, + "<|cy|>": 50297, + "<|da|>": 50285, + "<|de|>": 50261, + "<|el|>": 50281, + "<|en|>": 50259, + "<|es|>": 50262, + "<|et|>": 50307, + "<|eu|>": 50310, + "<|fa|>": 50300, + "<|fi|>": 50277, + "<|fo|>": 50338, + "<|fr|>": 50265, + "<|gl|>": 50319, + "<|gu|>": 50333, + "<|haw|>": 50352, + "<|ha|>": 50354, + "<|he|>": 50279, + "<|hi|>": 50276, + "<|hr|>": 50291, + "<|ht|>": 50339, + "<|hu|>": 50286, + "<|hy|>": 50312, + "<|id|>": 50275, + "<|is|>": 50311, + "<|it|>": 50274, + "<|ja|>": 50266, + "<|jw|>": 50356, + "<|ka|>": 50329, + "<|kk|>": 50316, + "<|km|>": 50323, + "<|kn|>": 50306, + "<|ko|>": 50264, + "<|la|>": 50294, + "<|lb|>": 50345, + "<|ln|>": 50353, + "<|lo|>": 50336, + "<|lt|>": 50293, + "<|lv|>": 50301, + "<|mg|>": 50349, + "<|mi|>": 50295, + "<|mk|>": 50308, + "<|ml|>": 50296, + "<|mn|>": 50314, + "<|mr|>": 50320, + "<|ms|>": 50282, + "<|mt|>": 50343, + "<|my|>": 50346, + "<|ne|>": 50313, + "<|nl|>": 50271, + "<|nn|>": 50342, + "<|no|>": 50288, + "<|oc|>": 50328, + "<|pa|>": 50321, + "<|pl|>": 50269, + "<|ps|>": 50340, + "<|pt|>": 50267, + "<|ro|>": 50284, + "<|ru|>": 50263, + "<|sa|>": 50344, + "<|sd|>": 50332, + "<|si|>": 50322, + "<|sk|>": 50298, + "<|sl|>": 50305, + "<|sn|>": 50324, + "<|so|>": 50326, + "<|sq|>": 50317, + "<|sr|>": 50303, + "<|su|>": 50357, + "<|sv|>": 50273, + "<|sw|>": 50318, + "<|ta|>": 50287, + "<|te|>": 50299, + "<|tg|>": 50331, + "<|th|>": 50289, + "<|tk|>": 50341, + "<|tl|>": 50348, + "<|tr|>": 50268, + "<|tt|>": 50351, + "<|uk|>": 50280, + "<|ur|>": 50290, + "<|uz|>": 50337, + "<|vi|>": 50278, + "<|yi|>": 50335, + "<|yo|>": 50325, + "<|zh|>": 50260 + }, + "max_initial_timestamp_index": 50, + "max_length": 448, + "no_timestamps_token_id": 50363, + "pad_token_id": 50257, + "prev_sot_token_id": 50361, + "return_timestamps": false, + "suppress_tokens": [ + 1, + 2, + 7, + 8, + 9, + 10, + 14, + 25, + 26, + 27, + 28, + 29, + 31, + 58, + 59, + 60, + 61, + 62, + 63, + 90, + 91, + 92, + 93, + 359, + 503, + 522, + 542, + 873, + 893, + 902, + 918, + 922, + 931, + 1350, + 1853, + 1982, + 2460, + 2627, + 3246, + 3253, + 3268, + 3536, + 3846, + 3961, + 4183, + 4667, + 6585, + 6647, + 7273, + 9061, + 9383, + 10428, + 10929, + 11938, + 12033, + 12331, + 12562, + 13793, + 14157, + 14635, + 15265, + 15618, + 16553, + 16604, + 18362, + 18956, + 20075, + 21675, + 22520, + 26130, + 26161, + 26435, + 28279, + 29464, + 31650, + 32302, + 32470, + 36865, + 42863, + 47425, + 49870, + 50254, + 50258, + 50358, + 50359, + 50360, + 50361, + 50362 + ], + "task_to_id": { + "transcribe": 50359, + "translate": 50358 + }, + "transformers_version": "4.41.1" +} diff --git a/whisper-tiny-hi-checkpoint-9/model.safetensors b/whisper-tiny-hi-checkpoint-9/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9aa0b456f8cd8c36c001d1d45bbe4fde21f76cff --- /dev/null +++ b/whisper-tiny-hi-checkpoint-9/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59c8982089b3ffb0f35b2a8b93a329827d3603f741f4d47ddb7a17dc5a7e5e2 +size 151061672 diff --git a/whisper-tiny-hi-checkpoint-9/preprocessor_config.json b/whisper-tiny-hi-checkpoint-9/preprocessor_config.json new file mode 100644 index 0000000000000000000000000000000000000000..91876762a536a746d268353c5cba57286e76b058 --- /dev/null +++ b/whisper-tiny-hi-checkpoint-9/preprocessor_config.json @@ -0,0 +1,14 @@ +{ + "chunk_length": 30, + "feature_extractor_type": "WhisperFeatureExtractor", + "feature_size": 80, + "hop_length": 160, + "n_fft": 400, + "n_samples": 480000, + "nb_max_frames": 3000, + "padding_side": "right", + "padding_value": 0.0, + "processor_class": "WhisperProcessor", + "return_attention_mask": false, + "sampling_rate": 16000 +} diff --git a/whisper-tiny-hi-checkpoint-9/trainer_state.json b/whisper-tiny-hi-checkpoint-9/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..f6357d1b3eacc6ae69c3804d71e189145349a66e --- /dev/null +++ b/whisper-tiny-hi-checkpoint-9/trainer_state.json @@ -0,0 +1,301 @@ +{ + "best_metric": 69.98899144720129, + "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-120", + "epoch": 6.5, + "eval_steps": 40, + "global_step": 208, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.625, + "grad_norm": 10.95101547241211, + "learning_rate": 9.200000000000002e-06, + "loss": 2.3747, + "step": 20 + }, + { + "epoch": 1.25, + "grad_norm": 7.747081279754639, + "learning_rate": 8.2e-06, + "loss": 1.2169, + "step": 40 + }, + { + "epoch": 1.25, + "eval_loss": 1.0360029935836792, + "eval_runtime": 574.5339, + "eval_samples_per_second": 1.741, + "eval_steps_per_second": 1.741, + "eval_wer": 91.60809552036582, + "step": 40 + }, + { + "epoch": 1.875, + "grad_norm": 7.32460355758667, + "learning_rate": 7.2000000000000005e-06, + "loss": 0.9058, + "step": 60 + }, + { + "epoch": 2.5, + "grad_norm": 6.835532188415527, + "learning_rate": 6.200000000000001e-06, + "loss": 0.7302, + "step": 80 + }, + { + "epoch": 2.5, + "eval_loss": 0.7368654608726501, + "eval_runtime": 549.562, + "eval_samples_per_second": 1.82, + "eval_steps_per_second": 1.82, + "eval_wer": 79.80353967313066, + "step": 80 + }, + { + "epoch": 3.125, + "grad_norm": 6.408384323120117, + "learning_rate": 5.2e-06, + "loss": 0.6453, + "step": 100 + }, + { + "epoch": 3.75, + "grad_norm": 5.809150695800781, + "learning_rate": 4.2000000000000004e-06, + "loss": 0.5917, + "step": 120 + }, + { + "epoch": 3.75, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.8688, + "eval_samples_per_second": 1.822, + "eval_steps_per_second": 1.822, + "eval_wer": 69.98899144720129, + "step": 120 + }, + { + "epoch": 4.375, + "grad_norm": 5.724637508392334, + "learning_rate": 3.2000000000000003e-06, + "loss": 0.5356, + "step": 140 + }, + { + "epoch": 5.0, + "grad_norm": 10.124310493469238, + "learning_rate": 2.2e-06, + "loss": 0.5156, + "step": 160 + }, + { + "epoch": 5.0, + "eval_loss": 0.6157090663909912, + "eval_runtime": 549.7895, + "eval_samples_per_second": 1.819, + "eval_steps_per_second": 1.819, + "eval_wer": 70.4293335591498, + "step": 160 + }, + { + "epoch": 5.625, + "grad_norm": 4.947811126708984, + "learning_rate": 1.2000000000000002e-06, + "loss": 0.4986, + "step": 180 + }, + { + "epoch": 6.25, + "grad_norm": 4.541861057281494, + "learning_rate": 2.0000000000000002e-07, + "loss": 0.481, + "step": 200 + }, + { + "epoch": 6.25, + "eval_loss": 0.6050636768341064, + "eval_runtime": 552.964, + "eval_samples_per_second": 1.808, + "eval_steps_per_second": 1.808, + "eval_wer": 70.03980015242611, + "step": 200 + }, + { + "epoch": 6.25, + "step": 200, + "total_flos": 1.5401574531072e+17, + "train_loss": 0.8495243072509766, + "train_runtime": 3592.94, + "train_samples_per_second": 1.781, + "train_steps_per_second": 0.056 + }, + { + "epoch": 6.28125, + "step": 201, + "total_flos": 1.5480354963456e+17, + "train_loss": 0.003230639654605543, + "train_runtime": 7.5043, + "train_samples_per_second": 852.844, + "train_steps_per_second": 26.651 + }, + { + "epoch": 6.28125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.5863, + "eval_samples_per_second": 1.823, + "eval_steps_per_second": 1.823, + "eval_wer": 69.98899144720129, + "step": 201 + }, + { + "epoch": 6.3125, + "step": 202, + "total_flos": 1.555913539584e+17, + "train_loss": 0.0035205459830784562, + "train_runtime": 7.6486, + "train_samples_per_second": 836.753, + "train_steps_per_second": 26.149 + }, + { + "epoch": 6.3125, + "eval_loss": 0.6504533886909485, + "eval_runtime": 548.2984, + "eval_samples_per_second": 1.824, + "eval_steps_per_second": 1.824, + "eval_wer": 69.98899144720129, + "step": 202 + }, + { + "epoch": 6.34375, + "step": 203, + "total_flos": 1.5637915828224e+17, + "train_loss": 0.002875891812329222, + "train_runtime": 7.5227, + "train_samples_per_second": 850.756, + "train_steps_per_second": 26.586 + }, + { + "epoch": 6.34375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 547.5722, + "eval_samples_per_second": 1.826, + "eval_steps_per_second": 1.826, + "eval_wer": 69.98899144720129, + "step": 203 + }, + { + "epoch": 6.375, + "step": 204, + "total_flos": 1.5716696260608e+17, + "train_loss": 0.003042735305486941, + "train_runtime": 7.3464, + "train_samples_per_second": 871.18, + "train_steps_per_second": 27.224 + }, + { + "epoch": 6.375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 547.015, + "eval_samples_per_second": 1.828, + "eval_steps_per_second": 1.828, + "eval_wer": 69.98899144720129, + "step": 204 + }, + { + "epoch": 6.40625, + "step": 205, + "total_flos": 1.5795476692992e+17, + "train_loss": 0.0033008325390699433, + "train_runtime": 7.3265, + "train_samples_per_second": 873.547, + "train_steps_per_second": 27.298 + }, + { + "epoch": 6.40625, + "eval_loss": 0.6504533886909485, + "eval_runtime": 545.7731, + "eval_samples_per_second": 1.832, + "eval_steps_per_second": 1.832, + "eval_wer": 69.98899144720129, + "step": 205 + }, + { + "epoch": 6.4375, + "step": 206, + "total_flos": 1.5874257125376e+17, + "train_loss": 0.0030977731769524734, + "train_runtime": 7.5608, + "train_samples_per_second": 846.467, + "train_steps_per_second": 26.452 + }, + { + "epoch": 6.4375, + "eval_loss": 0.6504533886909485, + "eval_runtime": 546.3323, + "eval_samples_per_second": 1.83, + "eval_steps_per_second": 1.83, + "eval_wer": 69.98899144720129, + "step": 206 + }, + { + "epoch": 6.46875, + "step": 207, + "total_flos": 1.595303755776e+17, + "train_loss": 0.0028965755361289795, + "train_runtime": 7.5526, + "train_samples_per_second": 847.394, + "train_steps_per_second": 26.481 + }, + { + "epoch": 6.46875, + "eval_loss": 0.6504533886909485, + "eval_runtime": 546.1485, + "eval_samples_per_second": 1.831, + "eval_steps_per_second": 1.831, + "eval_wer": 69.98899144720129, + "step": 207 + }, + { + "epoch": 6.5, + "step": 208, + "total_flos": 1.6031817990144e+17, + "train_loss": 0.003312833607196808, + "train_runtime": 7.6251, + "train_samples_per_second": 839.332, + "train_steps_per_second": 26.229 + }, + { + "epoch": 6.5, + "eval_loss": 0.6504533886909485, + "eval_runtime": 547.4069, + "eval_samples_per_second": 1.827, + "eval_steps_per_second": 1.827, + "eval_wer": 69.98899144720129, + "step": 208 + } + ], + "logging_steps": 20, + "max_steps": 200, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 40, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.6031817990144e+17, + "train_batch_size": 32, + "trial_name": null, + "trial_params": null +} diff --git a/whisper-tiny-hi-checkpoint-9/training_args.bin b/whisper-tiny-hi-checkpoint-9/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..7365ec059443c66ca4f62795b6a0365b0ec6082a --- /dev/null +++ b/whisper-tiny-hi-checkpoint-9/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:491ea0b3fac64ea37df87b10285499fb08a8bcc03ba05abb9770d611ee81c6e0 +size 5240