ecker committed on
Commit
64c1edc
·
1 Parent(s): fffdea4

Upload config.ar_nar_double.yaml

Browse files
Files changed (1) hide show
  1. config.ar_nar_double.yaml +105 -0
config.ar_nar_double.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dataset:
2
+ training: [
3
+ ]
4
+ validation: [
5
+ ]
6
+ noise: [
7
+ ]
8
+
9
+ speaker_name_getter: "lambda p: f'{p.parts[-3]}_{p.parts[-2]}'"
10
+
11
+ use_hdf5: True
12
+ use_metadata: True
13
+ hdf5_flag: r
14
+ validate: True
15
+
16
+ workers: 4
17
+ cache: True
18
+
19
+ phones_range: [4, 256]
20
+ duration_range: [1.0, 16.0]
21
+
22
+ random_utterance: 1.0
23
+ max_prompts: 3
24
+ prompt_duration: 3.0
25
+
26
+ sample_type: speaker
27
+
28
+ tasks_list: ["tts"] # , "ns", "sr", "tse", "cse", "nse", "tts"]
29
+
30
+ models:
31
+ _prom_levels: 4
32
+ _max_levels: 8
33
+
34
+ _models:
35
+ - name: "ar+nar"
36
+ size: "double"
37
+ resp_levels: 4
38
+ prom_levels: 4
39
+ tasks: 8
40
+ arch_type: "retnet"
41
+ training: True
42
+
43
+ hyperparameters:
44
+ batch_size: 8
45
+ gradient_accumulation_steps: 1
46
+ gradient_clipping: 100
47
+
48
+ optimizer: AdamW
49
+ learning_rate: 1.0e-5
50
+
51
+ scheduler_type: ""
52
+
53
+ evaluation:
54
+ batch_size: 16
55
+ frequency: 500
56
+ size: 16
57
+
58
+ steps: 300
59
+ ar_temperature: 0.95
60
+ nar_temperature: 0.25
61
+ load_disabled_engines: True
62
+
63
+ trainer:
64
+ iterations: 1_000_000
65
+
66
+ save_tag: step
67
+ save_on_oom: True
68
+ save_on_quit: True
69
+ save_frequency: 500
70
+ export_on_save: True
71
+
72
+ keep_last_checkpoints: 4
73
+
74
+ aggressive_optimizations: False
75
+ load_disabled_engines: False
76
+
77
+ load_state_dict: True
78
+
79
+ gc_mode: None # "global_step"
80
+
81
+ weight_dtype: float32
82
+ amp: False
83
+
84
+ backend: local
85
+ deepspeed:
86
+ zero_optimization_level: 0
87
+ use_compression_training: True
88
+
89
+ inference:
90
+ weight_dtype: float32
91
+ amp: False
92
+
93
+ use_vocos: True
94
+ normalize: False
95
+
96
+ recurrent_chunk_size: 0
97
+ recurrent_forward: False
98
+
99
+ bitsandbytes:
100
+ enabled: False
101
+ injects: True
102
+ linear: True
103
+ embedding: True
104
+
105
+ device: cpu