kiranpantha committed on
Commit
b87dc76
·
verified ·
1 Parent(s): 52c6888

Training in progress, step 4800

Browse files
Files changed (16) hide show
  1. .ipynb_checkpoints/config-checkpoint.json +47 -0
  2. config.json +1 -1
  3. model-00001-of-00002.safetensors +1 -1
  4. model-00002-of-00002.safetensors +1 -1
  5. runs/Jan05_18-37-57_idc-training-gpu-compute-27/events.out.tfevents.1736102278.idc-training-gpu-compute-27.4006726.0 +3 -0
  6. runs/Jan05_18-42-55_idc-training-gpu-compute-27/events.out.tfevents.1736102576.idc-training-gpu-compute-27.4075677.0 +3 -0
  7. runs/Jan05_20-34-24_idc-training-gpu-compute-27/events.out.tfevents.1736109277.idc-training-gpu-compute-27.4165010.0 +3 -0
  8. runs/Jan06_04-10-26_idc-training-gpu-compute-28/events.out.tfevents.1736136648.idc-training-gpu-compute-28.2174673.0 +3 -0
  9. runs/Jan06_04-35-33_idc-training-gpu-compute-28/events.out.tfevents.1736138146.idc-training-gpu-compute-28.2176479.0 +3 -0
  10. runs/Jan06_06-10-27_idc-training-gpu-compute-27/events.out.tfevents.1736143848.idc-training-gpu-compute-27.27115.0 +3 -0
  11. runs/Jan06_07-06-16_idc-training-gpu-compute-27/events.out.tfevents.1736147188.idc-training-gpu-compute-27.32049.0 +3 -0
  12. runs/Jan06_08-17-44_idc-training-gpu-compute-28/events.out.tfevents.1736151485.idc-training-gpu-compute-28.2249042.0 +3 -0
  13. runs/Jan06_10-13-29_idc-training-gpu-compute-28/events.out.tfevents.1736158423.idc-training-gpu-compute-28.2258229.0 +3 -0
  14. runs/Jan06_12-03-06_idc-training-gpu-compute-28/events.out.tfevents.1736164999.idc-training-gpu-compute-28.2266171.0 +3 -0
  15. runs/Jan06_12-17-40_idc-training-gpu-compute-30/events.out.tfevents.1736165882.idc-training-gpu-compute-30.3877298.0 +3 -0
  16. training_args.bin +2 -2
.ipynb_checkpoints/config-checkpoint.json ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "openai/whisper-large-v3",
3
+ "activation_dropout": 0.0,
4
+ "activation_function": "gelu",
5
+ "apply_spec_augment": false,
6
+ "architectures": [
7
+ "WhisperForConditionalGeneration"
8
+ ],
9
+ "attention_dropout": 0.0,
10
+ "begin_suppress_tokens": null,
11
+ "bos_token_id": 50257,
12
+ "classifier_proj_size": 256,
13
+ "d_model": 1280,
14
+ "decoder_attention_heads": 20,
15
+ "decoder_ffn_dim": 5120,
16
+ "decoder_layerdrop": 0.0,
17
+ "decoder_layers": 32,
18
+ "decoder_start_token_id": 50258,
19
+ "dropout": 0.0,
20
+ "encoder_attention_heads": 20,
21
+ "encoder_ffn_dim": 5120,
22
+ "encoder_layerdrop": 0.0,
23
+ "encoder_layers": 32,
24
+ "eos_token_id": 50257,
25
+ "init_std": 0.02,
26
+ "is_encoder_decoder": true,
27
+ "mask_feature_length": 10,
28
+ "mask_feature_min_masks": 0,
29
+ "mask_feature_prob": 0.0,
30
+ "mask_time_length": 10,
31
+ "mask_time_min_masks": 2,
32
+ "mask_time_prob": 0.05,
33
+ "max_length": null,
34
+ "max_source_positions": 1500,
35
+ "max_target_positions": 448,
36
+ "median_filter_width": 7,
37
+ "model_type": "whisper",
38
+ "num_hidden_layers": 32,
39
+ "num_mel_bins": 128,
40
+ "pad_token_id": 50256,
41
+ "scale_embedding": false,
42
+ "torch_dtype": "float32",
43
+ "transformers_version": "4.47.1",
44
+ "use_cache": true,
45
+ "use_weighted_layer_sum": false,
46
+ "vocab_size": 51866
47
+ }
config.json CHANGED
@@ -40,7 +40,7 @@
40
  "pad_token_id": 50256,
41
  "scale_embedding": false,
42
  "torch_dtype": "float32",
43
- "transformers_version": "4.46.3",
44
  "use_cache": true,
45
  "use_weighted_layer_sum": false,
46
  "vocab_size": 51866
 
40
  "pad_token_id": 50256,
41
  "scale_embedding": false,
42
  "torch_dtype": "float32",
43
+ "transformers_version": "4.47.1",
44
  "use_cache": true,
45
  "use_weighted_layer_sum": false,
46
  "vocab_size": 51866
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8cb4e3fe5f9c3908229be09f5cfb5d8c9140346bf5bffae7c0bf490c0659beff
3
  size 4993448880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f883dcabd631321110701e05f61994998c3ca7ce015c9161ac9fe7d7e036b91
3
  size 4993448880
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8054c2eb8b5999c0177a927da3e4bf7dbbbe35c218ffffe64c6f4fb29effe984
3
  size 1180663192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89b5bb57ec7c4e57d7cb9a440a3c2c772ddaafa7122c5869415540e3c1516703
3
  size 1180663192
runs/Jan05_18-37-57_idc-training-gpu-compute-27/events.out.tfevents.1736102278.idc-training-gpu-compute-27.4006726.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80ad6e2478fe8c36f8799a4751ddd865475e61c7a49ad09d615ef79aa10b4ae9
3
+ size 6295
runs/Jan05_18-42-55_idc-training-gpu-compute-27/events.out.tfevents.1736102576.idc-training-gpu-compute-27.4075677.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15d35cf1659910e59319f5b7a386cbc6359d1621c150d87c6d9f06e2f5f45e58
3
+ size 14185
runs/Jan05_20-34-24_idc-training-gpu-compute-27/events.out.tfevents.1736109277.idc-training-gpu-compute-27.4165010.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8788d388e51074beba43cb67173e43bcba4235fa4a0f762e5babae4ad8f800e5
3
+ size 15625
runs/Jan06_04-10-26_idc-training-gpu-compute-28/events.out.tfevents.1736136648.idc-training-gpu-compute-28.2174673.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c20cde4274cc712a0b9e8ff31d00941f7946e02cf5e9a607533db4a46e26960e
3
+ size 8411
runs/Jan06_04-35-33_idc-training-gpu-compute-28/events.out.tfevents.1736138146.idc-training-gpu-compute-28.2176479.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01e8a12996e6035aa2a3629cca52109c94deb2a5a6181670285039fc6bb8773c
3
+ size 14205
runs/Jan06_06-10-27_idc-training-gpu-compute-27/events.out.tfevents.1736143848.idc-training-gpu-compute-27.27115.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be54f7a78eaabead1d09c5a674b197b7debf722401c7445bea97d09585f308c0
3
+ size 11308
runs/Jan06_07-06-16_idc-training-gpu-compute-27/events.out.tfevents.1736147188.idc-training-gpu-compute-27.32049.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:667029c44c1396cfecea4340646a1656de03332eae3c63da0d71d7634189e643
3
+ size 11308
runs/Jan06_08-17-44_idc-training-gpu-compute-28/events.out.tfevents.1736151485.idc-training-gpu-compute-28.2249042.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c1cf93e893da833eafb66a4825150b695923a91c522df3c6e7e1f8a8c383ce1
3
+ size 14570
runs/Jan06_10-13-29_idc-training-gpu-compute-28/events.out.tfevents.1736158423.idc-training-gpu-compute-28.2258229.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b01c79545728b1abf5895e4907f6bc5bf06ae14c3bfc8d5cbce5a8db6085b15
3
+ size 14781
runs/Jan06_12-03-06_idc-training-gpu-compute-28/events.out.tfevents.1736164999.idc-training-gpu-compute-28.2266171.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4301aee596aa56008d92cf18ef59b43d583a1d4c5d1a5adbbb3a0677c9c4b4b7
3
+ size 7127
runs/Jan06_12-17-40_idc-training-gpu-compute-30/events.out.tfevents.1736165882.idc-training-gpu-compute-30.3877298.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f10c5fbb332d271e10e95e2cb5ff0ed53d31a3e97f77bec0fbb5797c23b98d3b
3
+ size 8758
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:515a18595fdc557be78d20d2f8ac86d6061cf4b21e093106aa9a633b4c3c554d
3
- size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9adbcf5dceccf6b81598143cd6ade0047a7188e8591077ef64309bc65d3cc94
3
+ size 5496