ashanhr committed on
Commit
2d4ca83
·
verified ·
1 Parent(s): 7c76c47

Training in progress, step 200, checkpoint

Browse files
last-checkpoint/config.json CHANGED
@@ -43,7 +43,7 @@
43
  2
44
  ],
45
  "ctc_loss_reduction": "mean",
46
- "ctc_zero_infinity": false,
47
  "diversity_loss_weight": 0.1,
48
  "do_stable_layer_norm": true,
49
  "eos_token_id": 2,
@@ -64,7 +64,7 @@
64
  "mask_feature_length": 10,
65
  "mask_feature_min_masks": 0,
66
  "mask_feature_prob": 0.0,
67
- "mask_time_length": 5,
68
  "mask_time_min_masks": 2,
69
  "mask_time_prob": 0.05,
70
  "model_type": "wav2vec2",
 
43
  2
44
  ],
45
  "ctc_loss_reduction": "mean",
46
+ "ctc_zero_infinity": true,
47
  "diversity_loss_weight": 0.1,
48
  "do_stable_layer_norm": true,
49
  "eos_token_id": 2,
 
64
  "mask_feature_length": 10,
65
  "mask_feature_min_masks": 0,
66
  "mask_feature_prob": 0.0,
67
+ "mask_time_length": 10,
68
  "mask_time_min_masks": 2,
69
  "mask_time_prob": 0.05,
70
  "model_type": "wav2vec2",
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9943c125d533def374c92e62764fa9d5f751012948f78a46b38bc79cfac2a0cf
3
  size 1261926380
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:361df9cebcb1a2ffc9266959f7e68c97ed1b31f111697b77cb4c6fcb7aa4bb6e
3
  size 1261926380
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:abff52a4cb221cb6fdea55294c6a7f2291f55946f6c1a5de2d334f55f16ba256
3
  size 2490397494
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14379549cbbd615e1afc0f55a72aeefce9e30a8d572d6881616daf914ac9f050
3
  size 2490397494
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15e9e40d7a10723b41ae89b32ea99392d168dfcbf7c21d9d393f955eea5a17df
3
  size 14308
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae6d077d17ee0eb0d05a121413a9e8770985be4c4d32267b724795c0599d8873
3
  size 14308
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c5771c0459252628d921b8efec8b44d18d11d0dd4c0120b974418319c20ad04e
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fc54d329cf6de9dd761f8fb381d9d1d1cba79225575c60b10e5e232eb19099e
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,36 +1,52 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.33783783783783783,
5
  "eval_steps": 100,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.34,
13
- "grad_norm": NaN,
14
- "learning_rate": 0.0001729,
15
- "loss": 6.329,
16
  "step": 100
17
  },
18
  {
19
- "epoch": 0.34,
20
- "eval_loss": Infinity,
21
- "eval_runtime": 77.9869,
22
- "eval_samples_per_second": 15.015,
23
- "eval_steps_per_second": 1.885,
24
  "eval_wer": 1.0,
25
  "step": 100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  }
27
  ],
28
  "logging_steps": 100,
29
- "max_steps": 8880,
30
  "num_input_tokens_seen": 0,
31
  "num_train_epochs": 30,
32
  "save_steps": 100,
33
- "total_flos": 1.2267819282523704e+17,
34
  "train_batch_size": 8,
35
  "trial_name": null,
36
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.966183574879227,
5
  "eval_steps": 100,
6
+ "global_step": 200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.48,
13
+ "grad_norm": 0.33149510622024536,
14
+ "learning_rate": 0.00018810000000000002,
15
+ "loss": 3.162,
16
  "step": 100
17
  },
18
  {
19
+ "epoch": 0.48,
20
+ "eval_loss": 2.6494271755218506,
21
+ "eval_runtime": 61.8673,
22
+ "eval_samples_per_second": 13.125,
23
+ "eval_steps_per_second": 1.649,
24
  "eval_wer": 1.0,
25
  "step": 100
26
+ },
27
+ {
28
+ "epoch": 0.97,
29
+ "grad_norm": NaN,
30
+ "learning_rate": 0.00037620000000000004,
31
+ "loss": 2.8381,
32
+ "step": 200
33
+ },
34
+ {
35
+ "epoch": 0.97,
36
+ "eval_loss": 2.6534550189971924,
37
+ "eval_runtime": 62.5126,
38
+ "eval_samples_per_second": 12.989,
39
+ "eval_steps_per_second": 1.632,
40
+ "eval_wer": 1.0,
41
+ "step": 200
42
  }
43
  ],
44
  "logging_steps": 100,
45
+ "max_steps": 6210,
46
  "num_input_tokens_seen": 0,
47
  "num_train_epochs": 30,
48
  "save_steps": 100,
49
+ "total_flos": 4.310189589213924e+17,
50
  "train_batch_size": 8,
51
  "trial_name": null,
52
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2de0a87eb18a49a9f916c4d5d69b8a801be8a6fb5c6c876aa08d56068e5e5288
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:662cb01d4e6609aa62cde1fb3cfa65348fbcf48196567d53cb73aabfde47c1ae
3
  size 4920