MorenoLaQuatra committed on
Commit
f85a01d
·
1 Parent(s): ddd36e6

Added model, config and complete checkpoint

Browse files
Files changed (3) hide show
  1. bestrq.pth +3 -0
  2. config.yaml +72 -0
  3. model.safetensors +3 -0
bestrq.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea1f988f120bd2a423fd910e4c7af64137ecefe3f90044daad3a6995a6f5360d
3
+ size 972101321
config.yaml ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ augmentation:
2
+ augment_pitch_shift: false
3
+ augment_time_stretch: false
4
+ noise_injection: false
5
+ data:
6
+ audio_normalization_type: standard
7
+ eval_dataset_path: /mnt/disk4/datasets/librispeech/valid.tsv
8
+ feature_type: mel
9
+ hop_length: 160
10
+ max_length: 12.5
11
+ n_fft: 400
12
+ n_mels: 80
13
+ n_mfcc: 13
14
+ normalize_audio: false
15
+ normalize_features: true
16
+ pad_to_max_length: true
17
+ sample_rate: 16000
18
+ train_dataset_path: /mnt/disk4/datasets/librispeech/train.tsv
19
+ truncate_to_max_length: true
20
+ win_length: 400
21
+ evaluation:
22
+ early_stopping: false
23
+ eval_interval: 1
24
+ metric: validation_accuracy
25
+ metric_lower_is_better: false
26
+ patience: 10
27
+ inference:
28
+ batch_size: 1
29
+ checkpoint_path: /mnt/disk3/bestrq_ckpts/bestrq-mel-pt-subsampled/12L-ls960-V8K-P16-M.05NM8-MEL/
30
+ logging:
31
+ checkpoint_interval: 1
32
+ log_dir: /mnt/disk3/bestrq_ckpts/logs-mel-pt-subsampled/12L-ls960-V8K-P16-M.05NM8-MEL/
33
+ log_interval: 4
34
+ save_dir: /mnt/disk3/bestrq_ckpts/bestrq-mel-pt-subsampled/12L-ls960-V8K-P16-M.05NM8-MEL/
35
+ masking:
36
+ bert_style_masking: false
37
+ mask_len: 8
38
+ mask_prob: 0.05
39
+ mask_type: random
40
+ model:
41
+ conformer_depth: 12
42
+ conformer_dim: 768
43
+ dim_head: 96
44
+ dropout: 0.1
45
+ ff_mult: 4
46
+ heads: 8
47
+ input_dim: 80
48
+ kernel_size: 31
49
+ proj_dim: 16
50
+ quantizer_simvq_mode: false
51
+ subsampled_dim: 768
52
+ use_subsampling: true
53
+ vocab_size: 8192
54
+ training:
55
+ accelerate_config: configs/accelerate_2GPU_config.yaml
56
+ batch_size: 128
57
+ comet_experiment_name: 12L-ls960-V8K-P16-M.05NM8-MEL
58
+ comet_project_name: bestrq-pt-1124
59
+ gradient_accumulation_steps: 32
60
+ gradient_clipping: 5.0
61
+ learning_rate: 0.001
62
+ lr_scheduler: warmup_linear
63
+ max_checkpoints: 5
64
+ mixed_precision: false
65
+ multi_gpu: true
66
+ num_epochs: 500
67
+ num_workers: 16
68
+ optimizer: adamw
69
+ use_comet: true
70
+ use_cuda: true
71
+ warmup_ratio: 0.05
72
+ weight_decay: 0.05
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a63db95cfe51798e9931c1acf91143088c75b48f06165cd8e6d3b80e881ddb89
3
+ size 389050296