# Configuration for the system named below: sampler settings under `ddim`
# and network hyper-parameters under `diffwrap`.
# NOTE(review): the nesting here was rebuilt from key order (each bare
# `key:` is treated as the parent of the keys that follow it) — confirm
# against the code that loads this file.

# Unquoted, so this parses as the float 1.0; quote it if the consumer
# expects a version string.
version: 1.0

system: "udit_rotary_v_b_1000"

ddim:
  v_prediction: true
  # These key names match constructor arguments of Hugging Face diffusers'
  # DDIMScheduler — presumably forwarded to it as keyword arguments; verify
  # against the loader.
  diffusers:
    num_train_timesteps: 1000
    beta_schedule: 'scaled_linear'
    beta_start: 0.00085
    beta_end: 0.012
    # Consistent with `v_prediction: true` above.
    prediction_type: 'v_prediction'
    rescale_betas_zero_snr: true
    timestep_spacing: 'trailing'
    clip_sample: false

diffwrap:
  # Presumably constructor arguments for the UDiT network — TODO confirm.
  UDiT:
    input_dim: 256
    output_dim: 128
    # The quoted value is the string 'none', not a YAML null.
    pos_method: 'none'
    pos_length: 500
    timbre_dim: 512
    hidden_size: 768
    depth: 12
    num_heads: 12