HoneyTian committed on
Commit
deadd6d
·
1 Parent(s): f2818f3
examples/nx_clean_unet/yaml/config.yaml CHANGED
@@ -16,6 +16,9 @@ tsfm_hidden_size: 512
16
  tsfm_attention_heads: 8
17
  tsfm_num_blocks: 6
18
  tsfm_dropout_rate: 0.1
 
 
 
19
 
20
  discriminator_dim: 32
21
  discriminator_in_channel: 2
 
16
  tsfm_attention_heads: 8
17
  tsfm_num_blocks: 6
18
  tsfm_dropout_rate: 0.1
19
+ tsfm_max_length: 1024
20
+ tsfm_chunk_size: 1
21
+ tsfm_num_left_chunks: 128
22
 
23
  discriminator_dim: 32
24
  discriminator_in_channel: 2
toolbox/torchaudio/models/nx_clean_unet/configuration_nx_clean_unet.py CHANGED
@@ -24,6 +24,9 @@ class NXCleanUNetConfig(PretrainedConfig):
24
  tsfm_attention_heads: int = 4,
25
  tsfm_num_blocks: int = 6,
26
  tsfm_dropout_rate: float = 0.1,
 
 
 
27
 
28
  discriminator_dim: int = 32,
29
  discriminator_in_channel: int = 2,
@@ -56,6 +59,9 @@ class NXCleanUNetConfig(PretrainedConfig):
56
  self.tsfm_attention_heads = tsfm_attention_heads
57
  self.tsfm_num_blocks = tsfm_num_blocks
58
  self.tsfm_dropout_rate = tsfm_dropout_rate
 
 
 
59
 
60
  self.discriminator_dim = discriminator_dim
61
  self.discriminator_in_channel = discriminator_in_channel
 
24
  tsfm_attention_heads: int = 4,
25
  tsfm_num_blocks: int = 6,
26
  tsfm_dropout_rate: float = 0.1,
27
+ tsfm_max_length: int = 1024,
28
+ tsfm_chunk_size: int = 1,
29
+ tsfm_num_left_chunks: int = 128,
30
 
31
  discriminator_dim: int = 32,
32
  discriminator_in_channel: int = 2,
 
59
  self.tsfm_attention_heads = tsfm_attention_heads
60
  self.tsfm_num_blocks = tsfm_num_blocks
61
  self.tsfm_dropout_rate = tsfm_dropout_rate
62
+ self.tsfm_max_length = tsfm_max_length
63
+ self.tsfm_chunk_size = tsfm_chunk_size
64
+ self.tsfm_num_left_chunks = tsfm_num_left_chunks
65
 
66
  self.discriminator_dim = discriminator_dim
67
  self.discriminator_in_channel = discriminator_in_channel
toolbox/torchaudio/models/nx_clean_unet/transformer/transformer.py CHANGED
@@ -410,7 +410,7 @@ class TransformerEncoder(nn.Module):
410
  attention_heads: int = 4,
411
  num_blocks: int = 6,
412
  dropout_rate: float = 0.1,
413
- max_length: int = 512,
414
  chunk_size: int = 1,
415
  num_left_chunks: int = 128,
416
  ):
 
410
  attention_heads: int = 4,
411
  num_blocks: int = 6,
412
  dropout_rate: float = 0.1,
413
+ max_length: int = 1024,
414
  chunk_size: int = 1,
415
  num_left_chunks: int = 128,
416
  ):
toolbox/torchaudio/models/nx_clean_unet/yaml/config.yaml CHANGED
@@ -12,10 +12,13 @@ down_sampling_hidden_channels: 64
12
  down_sampling_kernel_size: 4
13
  down_sampling_stride: 2
14
 
15
- tsfm_hidden_size: 256
16
  tsfm_attention_heads: 4
17
  tsfm_num_blocks: 6
18
  tsfm_dropout_rate: 0.1
 
 
 
19
 
20
  discriminator_dim: 32
21
  discriminator_in_channel: 2
 
12
  down_sampling_kernel_size: 4
13
  down_sampling_stride: 2
14
 
15
+ tsfm_hidden_size: 512
16
  tsfm_attention_heads: 4
17
  tsfm_num_blocks: 6
18
  tsfm_dropout_rate: 0.1
19
+ tsfm_max_length: 1024
20
+ tsfm_chunk_size: 1
21
+ tsfm_num_left_chunks: 128
22
 
23
  discriminator_dim: 32
24
  discriminator_in_channel: 2