MorenoLaQuatra
committed on
Commit
·
f85a01d
1
Parent(s):
ddd36e6
Added model, config and complete checkpoint
Browse files
- bestrq.pth +3 -0
- config.yaml +72 -0
- model.safetensors +3 -0
bestrq.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea1f988f120bd2a423fd910e4c7af64137ecefe3f90044daad3a6995a6f5360d
|
3 |
+
size 972101321
|
config.yaml
ADDED
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
augmentation:
|
2 |
+
augment_pitch_shift: false
|
3 |
+
augment_time_stretch: false
|
4 |
+
noise_injection: false
|
5 |
+
data:
|
6 |
+
audio_normalization_type: standard
|
7 |
+
eval_dataset_path: /mnt/disk4/datasets/librispeech/valid.tsv
|
8 |
+
feature_type: mel
|
9 |
+
hop_length: 160
|
10 |
+
max_length: 12.5
|
11 |
+
n_fft: 400
|
12 |
+
n_mels: 80
|
13 |
+
n_mfcc: 13
|
14 |
+
normalize_audio: false
|
15 |
+
normalize_features: true
|
16 |
+
pad_to_max_length: true
|
17 |
+
sample_rate: 16000
|
18 |
+
train_dataset_path: /mnt/disk4/datasets/librispeech/train.tsv
|
19 |
+
truncate_to_max_length: true
|
20 |
+
win_length: 400
|
21 |
+
evaluation:
|
22 |
+
early_stopping: false
|
23 |
+
eval_interval: 1
|
24 |
+
metric: validation_accuracy
|
25 |
+
metric_lower_is_better: false
|
26 |
+
patience: 10
|
27 |
+
inference:
|
28 |
+
batch_size: 1
|
29 |
+
checkpoint_path: /mnt/disk3/bestrq_ckpts/bestrq-mel-pt-subsampled/12L-ls960-V8K-P16-M.05NM8-MEL/
|
30 |
+
logging:
|
31 |
+
checkpoint_interval: 1
|
32 |
+
log_dir: /mnt/disk3/bestrq_ckpts/logs-mel-pt-subsampled/12L-ls960-V8K-P16-M.05NM8-MEL/
|
33 |
+
log_interval: 4
|
34 |
+
save_dir: /mnt/disk3/bestrq_ckpts/bestrq-mel-pt-subsampled/12L-ls960-V8K-P16-M.05NM8-MEL/
|
35 |
+
masking:
|
36 |
+
bert_style_masking: false
|
37 |
+
mask_len: 8
|
38 |
+
mask_prob: 0.05
|
39 |
+
mask_type: random
|
40 |
+
model:
|
41 |
+
conformer_depth: 12
|
42 |
+
conformer_dim: 768
|
43 |
+
dim_head: 96
|
44 |
+
dropout: 0.1
|
45 |
+
ff_mult: 4
|
46 |
+
heads: 8
|
47 |
+
input_dim: 80
|
48 |
+
kernel_size: 31
|
49 |
+
proj_dim: 16
|
50 |
+
quantizer_simvq_mode: false
|
51 |
+
subsampled_dim: 768
|
52 |
+
use_subsampling: true
|
53 |
+
vocab_size: 8192
|
54 |
+
training:
|
55 |
+
accelerate_config: configs/accelerate_2GPU_config.yaml
|
56 |
+
batch_size: 128
|
57 |
+
comet_experiment_name: 12L-ls960-V8K-P16-M.05NM8-MEL
|
58 |
+
comet_project_name: bestrq-pt-1124
|
59 |
+
gradient_accumulation_steps: 32
|
60 |
+
gradient_clipping: 5.0
|
61 |
+
learning_rate: 0.001
|
62 |
+
lr_scheduler: warmup_linear
|
63 |
+
max_checkpoints: 5
|
64 |
+
mixed_precision: false
|
65 |
+
multi_gpu: true
|
66 |
+
num_epochs: 500
|
67 |
+
num_workers: 16
|
68 |
+
optimizer: adamw
|
69 |
+
use_comet: true
|
70 |
+
use_cuda: true
|
71 |
+
warmup_ratio: 0.05
|
72 |
+
weight_decay: 0.05
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a63db95cfe51798e9931c1acf91143088c75b48f06165cd8e6d3b80e881ddb89
|
3 |
+
size 389050296
|