# Experiment configuration for the system named below.
# NOTE(review): the nesting in this file was reconstructed from a flattened
# copy; confirm it against the code that loads this config.

# NOTE(review): unquoted, so this loads as the float 1.0. Quote it only if
# the consumer expects a string.
version: 1.0

system: "udit_rotary_v_b_1000"

# Noise-scheduler settings.
ddim:
  v_prediction: true
  # NOTE(review): assumed to be nested under `ddim`; the key names look like
  # keyword arguments for a diffusers scheduler -- verify against the loader.
  diffusers:
    num_train_timesteps: 1000
    beta_schedule: 'scaled_linear'
    beta_start: 0.00085
    beta_end: 0.012
    # Keep in agreement with `ddim.v_prediction` above.
    prediction_type: 'v_prediction'
    rescale_betas_zero_snr: true
    timestep_spacing: 'trailing'
    clip_sample: false

# Model settings, keyed by model name.
diffwrap:
  UDiT:
    input_dim: 256
    output_dim: 128
    # The quoted string 'none', not a YAML null.
    pos_method: 'none'
    pos_length: 500
    timbre_dim: 512
    hidden_size: 768
    depth: 12
    num_heads: 12