---
# Configuration with seven top-level sections: unets, imagen, trainer,
# dataset, dataloader, wandb and checkpoint.
#
# NOTE(review): the nesting below was restored from key order (a key with
# no scalar value opens a section). Confirm it against the code that loads
# this file.
# NOTE(review): key names look like imagen-pytorch Unet / ElucidatedImagen /
# trainer keyword arguments -- presumably forwarded as kwargs; verify.

# One entry per U-Net; only `unet1` is defined here.
unets:
  unet1:
    dim: 64
    num_resnet_blocks: 2
    # Three entries, same length as `layer_cross_attns` below.
    dim_mults:
      - 1
      - 2
      - 4
    max_text_len: 1
    # Scalar here, while `layer_cross_attns` is a per-entry list.
    layer_attns: false
    layer_cross_attns:
      - false
      - false
      - true
    cond_images_channels: 3
    attend_at_middle: false

imagen:
  elucidated: true
  condition_on_text: true
  # Single-element lists: one value, matching the single U-Net above.
  image_sizes:
    - 112
  text_embed_dim: 1
  num_sample_steps: 64
  temporal_downsample_factor:
    - 1
  lowres_sample_noise_level: 0.2
  # NOTE(review): the remaining keys are presumably only read when
  # `elucidated` is true -- confirm against the consumer.
  sigma_min: 0.002
  sigma_max: 80
  sigma_data: 0.25
  rho: 7
  P_mean: -1.2
  P_std: 1.2
  S_churn: 160
  S_tmin: 0.05
  S_tmax: 50
  S_noise: 1.003

trainer:
  split_batches: false
  lr: 0.0005
  # Three names, in order: images, text_embeds, cond_images.
  dl_tuple_output_keywords_names:
    - images
    - text_embeds
    - cond_images

dataset:
  # Set to the filesystem root; presumably a placeholder to be replaced
  # with the real dataset location -- TODO confirm.
  data_path: /
  deactivate_cache: false
  fps: 8
  duration: 2.0
  grayscale: false

dataloader:
  batch_size: 8
  num_workers: 8

wandb:
  # Explicit empty strings (not null).
  project: ""
  entity: ""

checkpoint:
  # Same root-path value as `dataset.data_path`; presumably a placeholder.
  path: /
  # Separate from `dataloader.batch_size` (8).
  batch_size: 4
  cond_scale: 5.0
  save_every_x_it: 5000