KevinKibe commited on
Commit
b416dbc
1 Parent(s): 18b3d8e

Training in progress, step 10, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -23,8 +23,8 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "q_proj",
27
- "v_proj"
28
  ],
29
  "task_type": null,
30
  "use_dora": false,
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
+ "v_proj",
27
+ "q_proj"
28
  ],
29
  "task_type": null,
30
  "use_dora": false,
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d88d32075310057b782ee49feb21ea7135a3773bbafa6698fb3a52694c71da4
3
  size 14176064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fcc8161bffaa776c36d0bf716f4d9f51343742505a8ec6e761925c605d343e9
3
  size 14176064
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f4af295acab05c9b709544b2d95aebf7cbe98d7c71d1ef6587176e2441646f6
3
- size 4832890
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2faaedeca429e56c53308b4544dd0629e2b969cef4e149360e7d203cbebd9bf7
3
+ size 4832762
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:03cd9de6ee2a65932ad2fb6094dfd18e75c7e402f88bba702657f50ca5a09f4c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fd34c05f32915cfddb244845f306181a1764de738fcce7d4ddb675210c64c1c
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30ee3ca470c4d31872c3879402fa37a65e88eac48e4a7fb0671df0eafcffb412
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4dcd0406e202df2a3c65a5d416d9b75e9f9f16a0af78526a7608fc8a266c503
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,99 +1,35 @@
1
  {
2
- "best_metric": 78.03590285110876,
3
- "best_model_checkpoint": "../openai/whisper-small-finetuned/checkpoint-500",
4
- "epoch": 31.008,
5
- "eval_steps": 100,
6
- "global_step": 500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 6.008,
13
- "grad_norm": 1.1062548160552979,
14
  "learning_rate": 0.0001,
15
- "loss": 2.2203,
16
- "step": 100
17
  },
18
  {
19
- "epoch": 6.008,
20
- "eval_loss": 2.724890947341919,
21
- "eval_runtime": 331.0923,
22
- "eval_samples_per_second": 0.302,
23
- "eval_steps_per_second": 0.012,
24
- "eval_wer": 96.09292502639916,
25
- "step": 100
26
- },
27
- {
28
- "epoch": 12.016,
29
- "grad_norm": 3.7120275497436523,
30
- "learning_rate": 0.0001,
31
- "loss": 1.4989,
32
- "step": 200
33
- },
34
- {
35
- "epoch": 12.016,
36
- "eval_loss": 2.2445077896118164,
37
- "eval_runtime": 331.3447,
38
- "eval_samples_per_second": 0.302,
39
- "eval_steps_per_second": 0.012,
40
- "eval_wer": 92.08025343189018,
41
- "step": 200
42
- },
43
- {
44
- "epoch": 18.024,
45
- "grad_norm": 2.7632181644439697,
46
- "learning_rate": 0.0001,
47
- "loss": 0.9049,
48
- "step": 300
49
- },
50
- {
51
- "epoch": 18.024,
52
- "eval_loss": 2.2876439094543457,
53
- "eval_runtime": 338.7944,
54
- "eval_samples_per_second": 0.295,
55
- "eval_steps_per_second": 0.012,
56
- "eval_wer": 84.58289334741288,
57
- "step": 300
58
- },
59
- {
60
- "epoch": 24.032,
61
- "grad_norm": 3.781102180480957,
62
- "learning_rate": 0.0001,
63
- "loss": 0.6953,
64
- "step": 400
65
- },
66
- {
67
- "epoch": 24.032,
68
- "eval_loss": 2.42946720123291,
69
- "eval_runtime": 336.5888,
70
- "eval_samples_per_second": 0.297,
71
- "eval_steps_per_second": 0.012,
72
- "eval_wer": 87.11721224920802,
73
- "step": 400
74
- },
75
- {
76
- "epoch": 31.008,
77
- "grad_norm": 1.3651665449142456,
78
- "learning_rate": 0.0001,
79
- "loss": 0.5138,
80
- "step": 500
81
- },
82
- {
83
- "epoch": 31.008,
84
- "eval_loss": 2.5180132389068604,
85
- "eval_runtime": 333.0055,
86
- "eval_samples_per_second": 0.3,
87
- "eval_steps_per_second": 0.012,
88
- "eval_wer": 78.03590285110876,
89
- "step": 500
90
  }
91
  ],
92
- "logging_steps": 100,
93
- "max_steps": 500,
94
  "num_input_tokens_seen": 0,
95
  "num_train_epochs": 9223372036854775807,
96
- "save_steps": 100,
97
  "stateful_callbacks": {
98
  "TrainerControl": {
99
  "args": {
@@ -101,12 +37,12 @@
101
  "should_evaluate": false,
102
  "should_log": false,
103
  "should_save": true,
104
- "should_training_stop": true
105
  },
106
  "attributes": {}
107
  }
108
  },
109
- "total_flos": 4.58965416443904e+18,
110
  "train_batch_size": 32,
111
  "trial_name": null,
112
  "trial_params": null
 
1
  {
2
+ "best_metric": 86.20689655172413,
3
+ "best_model_checkpoint": "../openai/whisper-small-finetuned/checkpoint-10",
4
+ "epoch": 9.05,
5
+ "eval_steps": 10,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 9.05,
13
+ "grad_norm": 3.4064078330993652,
14
  "learning_rate": 0.0001,
15
+ "loss": 3.95,
16
+ "step": 10
17
  },
18
  {
19
+ "epoch": 9.05,
20
+ "eval_loss": 4.568088531494141,
21
+ "eval_runtime": 19.5829,
22
+ "eval_samples_per_second": 0.511,
23
+ "eval_steps_per_second": 0.051,
24
+ "eval_wer": 86.20689655172413,
25
+ "step": 10
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  }
27
  ],
28
+ "logging_steps": 10,
29
+ "max_steps": 20,
30
  "num_input_tokens_seen": 0,
31
  "num_train_epochs": 9223372036854775807,
32
+ "save_steps": 10,
33
  "stateful_callbacks": {
34
  "TrainerControl": {
35
  "args": {
 
37
  "should_evaluate": false,
38
  "should_log": false,
39
  "should_save": true,
40
+ "should_training_stop": false
41
  },
42
  "attributes": {}
43
  }
44
  },
45
+ "total_flos": 5.8736295936e+16,
46
  "train_batch_size": 32,
47
  "trial_name": null,
48
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d78f1c80a7f597bc652f6906f996f83ceebff67856d88e00606bfa4ac987241
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a8867a5cd2e51decccd6a3078781ed396b55c1f60f54d4610df595db10f9abe
3
  size 5368