ArthurZ HF staff committed on
Commit
8ba3e2b
1 Parent(s): 7c53501
Files changed (2) hide show
  1. config.json +258 -0
  2. pytorch_model.bin +3 -0
config.json ADDED
@@ -0,0 +1,258 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_function": "gelu_new",
3
+ "alignment_head": [
4
+ 2,
5
+ null,
6
+ null
7
+ ],
8
+ "alignment_layer": [
9
+ 68,
10
+ null,
11
+ null
12
+ ],
13
+ "architectures": [
14
+ "JukeboxModel"
15
+ ],
16
+ "attn_dropout": 0.0,
17
+ "attn_init_scale": 1.0,
18
+ "attn_order": [
19
+ 12,
20
+ 2,
21
+ 2
22
+ ],
23
+ "blocks": 128,
24
+ "bos_token_id": 50256,
25
+ "c_res": 1,
26
+ "cond_c_res": [
27
+ 0,
28
+ 1,
29
+ 1
30
+ ],
31
+ "cond_depth": [
32
+ 3,
33
+ 16,
34
+ 16
35
+ ],
36
+ "cond_dilation_cycle": [
37
+ null,
38
+ 8,
39
+ 8
40
+ ],
41
+ "cond_dilation_growth_rate": [
42
+ 1,
43
+ 3,
44
+ 3
45
+ ],
46
+ "cond_m_conv": 1,
47
+ "cond_res_scale": false,
48
+ "cond_width": [
49
+ 128,
50
+ 128,
51
+ 64
52
+ ],
53
+ "cond_zero_out": false,
54
+ "copy_input": false,
55
+ "depth": [
56
+ 2,
57
+ 2,
58
+ 2
59
+ ],
60
+ "downs_t": [
61
+ 3,
62
+ 2,
63
+ 2
64
+ ],
65
+ "emb_dropout": 0.1,
66
+ "eos_token_id": 50256,
67
+ "fp16_params": true,
68
+ "hop_length": 256,
69
+ "init_scale": [
70
+ 0.7,
71
+ 1,
72
+ 1
73
+ ],
74
+ "initializer_range": 0.02,
75
+ "l_bins": 128,
76
+ "labels": true,
77
+ "layer_norm_epsilon": 1e-05,
78
+ "m_attn": 0.25,
79
+ "max_bow_genre_size": 1,
80
+ "max_duration": 600.0,
81
+ "merged_decoder": [
82
+ true,
83
+ false,
84
+ false
85
+ ],
86
+ "min_duration": 1,
87
+ "mlp_init_scale": 0.02,
88
+ "model_type": "jukebox",
89
+ "multispec_loss_hop_length": [
90
+ 240,
91
+ 120,
92
+ 50
93
+ ],
94
+ "multispec_loss_n_fft": [
95
+ 2048,
96
+ 1024,
97
+ 512
98
+ ],
99
+ "multispec_loss_window_size": [
100
+ 1200,
101
+ 600,
102
+ 240
103
+ ],
104
+ "multispectral": 1.0,
105
+ "n_ctx": 256,
106
+ "n_embd": 768,
107
+ "n_head": 12,
108
+ "n_heads": [
109
+ 2,
110
+ 1,
111
+ 1
112
+ ],
113
+ "n_inner": null,
114
+ "n_layer": 12,
115
+ "n_positions": 1024,
116
+ "n_tokens": [
117
+ 512,
118
+ 512,
119
+ 512
120
+ ],
121
+ "n_vocab": 79,
122
+ "name": "AudioSamples",
123
+ "nb_priors": 3,
124
+ "pos_init": false,
125
+ "prime_attn_dropout": 0.0,
126
+ "prime_attn_order": [
127
+ 2,
128
+ 0,
129
+ 0
130
+ ],
131
+ "prime_blocks": 32,
132
+ "prime_c_res": 1,
133
+ "prime_cond_c_res": [
134
+ 0,
135
+ 1,
136
+ 1
137
+ ],
138
+ "prime_depth": [
139
+ 18,
140
+ 3,
141
+ 3
142
+ ],
143
+ "prime_emb_dropout": 0.0,
144
+ "prime_heads": 4,
145
+ "prime_init_scale": [
146
+ 0.1,
147
+ 0.4,
148
+ 0.4
149
+ ],
150
+ "prime_loss_fraction": [
151
+ 0.4,
152
+ 0.0,
153
+ 0.0
154
+ ],
155
+ "prime_m_attn": 0.25,
156
+ "prime_m_mlp": 1.0,
157
+ "prime_pos_init": false,
158
+ "prime_res_scale": false,
159
+ "prime_resid_dropout": 0.0,
160
+ "prime_spread": null,
161
+ "prime_width": [
162
+ 128,
163
+ 128,
164
+ 128
165
+ ],
166
+ "prime_zero_out": false,
167
+ "priors_width": [
168
+ 128,
169
+ 64,
170
+ 32
171
+ ],
172
+ "reorder_and_upcast_attn": false,
173
+ "res_scale": false,
174
+ "resid_dropout": 0.0,
175
+ "sample_hop_length": 30000,
176
+ "sample_length": 44032,
177
+ "sample_length_in_seconds": 1,
178
+ "scale_attn_by_inverse_layer_idx": false,
179
+ "scale_attn_weights": true,
180
+ "single_enc_dec": [
181
+ true,
182
+ false,
183
+ false
184
+ ],
185
+ "spectral": 0.0,
186
+ "spread": null,
187
+ "sr": 44100,
188
+ "strides_t": [
189
+ 2,
190
+ 2,
191
+ 2
192
+ ],
193
+ "summary_activation": null,
194
+ "summary_first_dropout": 0.1,
195
+ "summary_proj_to_labels": true,
196
+ "summary_type": "cls_index",
197
+ "summary_use_proj": true,
198
+ "t_bins": 64,
199
+ "torch_dtype": "float32",
200
+ "transformers_version": "4.19.0.dev0",
201
+ "use_cache": true,
202
+ "use_nonrelative_specloss": true,
203
+ "use_tokens": [
204
+ true,
205
+ false,
206
+ false
207
+ ],
208
+ "vocab_size": 50257,
209
+ "vq_vae_codebook_dimension": 128,
210
+ "vq_vae_commit": 0.02,
211
+ "vq_vae_conv_block_depth": 4,
212
+ "vq_vae_conv_block_width": 64,
213
+ "vq_vae_depth": 4,
214
+ "vq_vae_dilation_cycle": 1,
215
+ "vq_vae_dilation_growth_rate": 3,
216
+ "vq_vae_downs_t": [
217
+ 3,
218
+ 2,
219
+ 2
220
+ ],
221
+ "vq_vae_emmbedding_width": 128,
222
+ "vq_vae_levels": 3,
223
+ "vq_vae_lmu": 0.99,
224
+ "vq_vae_m_conv": 1,
225
+ "vq_vae_multipliers": [
226
+ 2,
227
+ 1,
228
+ 1
229
+ ],
230
+ "vq_vae_reverse_decoder_dilation": 1,
231
+ "vq_vae_strides_t": [
232
+ 2,
233
+ 2,
234
+ 2
235
+ ],
236
+ "vq_vae_width": 64,
237
+ "vqvae_z_shapes": [
238
+ [
239
+ 344
240
+ ],
241
+ [
242
+ 1376
243
+ ],
244
+ [
245
+ 5504
246
+ ]
247
+ ],
248
+ "width": [
249
+ 128,
250
+ 64,
251
+ 32
252
+ ],
253
+ "y_bins": [
254
+ 120,
255
+ 4111
256
+ ],
257
+ "zero_out": false
258
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9568880db535057b63ba7278f2a2749a5030f1dc402487d6655dde9bcc0226e0
3
+ size 40460179