Higobeatz committed on
Commit
03e4733
·
verified ·
1 Parent(s): e27f927

Delete dreamvoice/src/configs/.ipynb_checkpoints

Browse files
dreamvoice/src/configs/.ipynb_checkpoints/diffvc_base-checkpoint.yaml DELETED
@@ -1,47 +0,0 @@
1
- version: 1.0
2
-
3
- system: "base"
4
-
5
- model:
6
- cls_embedding:
7
- speaker_dim: 256
8
- feature_dim: 512
9
- content_dim: 768
10
- content_hidden: 256
11
- use_pitch: false
12
-
13
- unet:
14
- sample_size: [128, 256]
15
- in_channels: 257
16
- out_channels: 1
17
- layers_per_block: 2
18
- block_out_channels: [128, 256, 256, 512]
19
- down_block_types:
20
- [
21
- "DownBlock2D",
22
- "DownBlock2D",
23
- "AttnDownBlock2D",
24
- "AttnDownBlock2D",
25
- ]
26
- up_block_types:
27
- [
28
- "AttnUpBlock2D",
29
- "AttnUpBlock2D",
30
- "UpBlock2D",
31
- "UpBlock2D"
32
- ]
33
- attention_head_dim: 32
34
- class_embed_type: 'identity'
35
-
36
- scheduler:
37
- num_train_steps: 1000
38
- beta_schedule: 'linear'
39
- beta_start: 0.0001
40
- beta_end: 0.02
41
- num_infer_steps: 50
42
- rescale_betas_zero_snr: true
43
- timestep_spacing: "trailing"
44
- clip_sample: false
45
- prediction_type: 'v_prediction'
46
- scale: 2.75
47
- shift: 5.80
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
dreamvoice/src/configs/.ipynb_checkpoints/diffvc_base_pitch-checkpoint.yaml DELETED
@@ -1,34 +0,0 @@
1
- version: 1.0
2
-
3
- system: "base"
4
-
5
- diffwrap:
6
- cls_embedding:
7
- speaker_dim: 256
8
- feature_dim: 512
9
- content_dim: 768
10
- content_hidden: 256
11
- use_pitch: true
12
- pitch_dim: 1
13
- pitch_hidden: 128
14
-
15
- unet:
16
- sample_size: [128, 256]
17
- in_channels: 385
18
- out_channels: 1
19
- layers_per_block: 2
20
- block_out_channels: [256, 256, 512]
21
- down_block_types:
22
- [
23
- "DownBlock2D",
24
- "AttnDownBlock2D",
25
- "AttnDownBlock2D",
26
- ]
27
- up_block_types:
28
- [
29
- "AttnUpBlock2D",
30
- "AttnUpBlock2D",
31
- "UpBlock2D"
32
- ]
33
- attention_head_dim: 32
34
- class_embed_type: 'identity'
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
dreamvoice/src/configs/.ipynb_checkpoints/diffvc_cross-checkpoint.yaml DELETED
@@ -1,45 +0,0 @@
1
- version: 1.0
2
-
3
- system: "cross"
4
-
5
- model:
6
- cls_embedding:
7
- content_dim: 768
8
- content_hidden: 256
9
- use_pitch: false
10
-
11
- unet:
12
- sample_size: [128, 256]
13
- in_channels: 257
14
- out_channels: 1
15
- layers_per_block: 2
16
- block_out_channels: [128, 256, 256, 512]
17
- down_block_types:
18
- [
19
- "DownBlock2D",
20
- "DownBlock2D",
21
- "CrossAttnDownBlock2D",
22
- "CrossAttnDownBlock2D",
23
- ]
24
- up_block_types:
25
- [
26
- "CrossAttnUpBlock2D",
27
- "CrossAttnUpBlock2D",
28
- "UpBlock2D",
29
- "UpBlock2D",
30
- ]
31
- attention_head_dim: 32
32
- cross_attention_dim: 768
33
-
34
- scheduler:
35
- num_train_steps: 1000
36
- beta_schedule: 'linear'
37
- beta_start: 0.0001
38
- beta_end: 0.02
39
- num_infer_steps: 50
40
- rescale_betas_zero_snr: true
41
- timestep_spacing: "trailing"
42
- clip_sample: false
43
- prediction_type: 'v_prediction'
44
- scale: 2.75
45
- shift: 5.80
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
dreamvoice/src/configs/.ipynb_checkpoints/diffvc_cross_pitch-checkpoint.yaml DELETED
@@ -1,33 +0,0 @@
1
- version: 1.0
2
-
3
- system: "cross"
4
-
5
- diffwrap:
6
- cls_embedding:
7
- content_dim: 768
8
- content_hidden: 256
9
- use_pitch: true
10
- pitch_dim: 1
11
- pitch_hidden: 128
12
-
13
- unet:
14
- sample_size: [100, 256]
15
- in_channels: 385
16
- out_channels: 1
17
- layers_per_block: 2
18
- block_out_channels: [128, 256, 512]
19
- down_block_types:
20
- [
21
- "DownBlock2D",
22
- "CrossAttnDownBlock2D",
23
- "CrossAttnDownBlock2D",
24
- ]
25
- up_block_types:
26
- [
27
- "CrossAttnUpBlock2D",
28
- "CrossAttnUpBlock2D",
29
- "UpBlock2D",
30
- ]
31
- attention_head_dim: 32
32
- cross_attention_dim: 768
33
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
dreamvoice/src/configs/.ipynb_checkpoints/plugin_cross-checkpoint.yaml DELETED
@@ -1,39 +0,0 @@
1
- version: 1.0
2
-
3
- system: "cross"
4
-
5
- model:
6
- cls_embedding:
7
- content_dim: 768
8
- content_hidden: 256
9
-
10
- unet:
11
- sample_size: [1, 1]
12
- in_channels: 256
13
- out_channels: 256
14
- layers_per_block: 2
15
- block_out_channels: [256]
16
- down_block_types:
17
- [
18
- "CrossAttnDownBlock2D",
19
- ]
20
- up_block_types:
21
- [
22
- "CrossAttnUpBlock2D",
23
- ]
24
- attention_head_dim: 32
25
- cross_attention_dim: 768
26
-
27
- scheduler:
28
- num_train_steps: 1000
29
- beta_schedule: 'linear'
30
- beta_start: 0.0001
31
- beta_end: 0.02
32
- num_infer_steps: 50
33
- rescale_betas_zero_snr: true
34
- timestep_spacing: "trailing"
35
- clip_sample: false
36
- prediction_type: 'v_prediction'
37
- scale: 0.05
38
- shift: -0.035
39
-