# File size: 1,304 Bytes
# 9d095b0
# U-Net definitions. unet1 and unet2 carry the same settings here, except
# that unet2 additionally sets memory_efficient.
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped — confirm against the consumer's schema.
unets:
  unet1:
    dim: 64
    num_resnet_blocks: 2
    dim_mults:
      - 1
      - 2
      - 4
    max_text_len: 1
    layer_attns: false
    # One entry per dim_mults entry (three each) — presumably per stage;
    # TODO confirm.
    layer_cross_attns:
      - false
      - false
      - true
    cond_images_channels: 3
  unet2:
    dim: 64
    num_resnet_blocks: 2
    dim_mults:
      - 1
      - 2
      - 4
    max_text_len: 1
    layer_attns: false
    layer_cross_attns:
      - false
      - false
      - true
    memory_efficient: true
    cond_images_channels: 3
# Imagen settings.
# The list-valued keys below (image_sizes, num_sample_steps,
# random_crop_sizes, temporal_downsample_factor, S_churn) each hold two
# entries — presumably one per U-Net; TODO confirm against the consumer.
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped.
imagen:
  elucidated: true
  condition_on_text: true
  image_sizes:
    - 56
    - 112
  text_embed_dim: 1
  num_sample_steps:
    - 32
    - 64
  # First entry is an explicit null.
  random_crop_sizes:
    - null
    - 56
  temporal_downsample_factor:
    - 4
    - 1
  sigma_min: 0.002
  sigma_max: 80
  sigma_data: 0.25
  rho: 7
  P_mean: -1.2
  P_std: 1.2
  S_churn:
    - 80
    - 160
  S_tmin: 0.05
  S_tmax: 50
  S_noise: 1.003
  resize_mode: trilinear
# Trainer settings.
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped — confirm against the consumer's schema.
trainer:
  split_batches: false
  lr: 0.0005
  # Names for the elements of each dataloader tuple — presumably matched by
  # position; TODO confirm the order the dataset yields them in.
  dl_tuple_output_keywords_names:
    - images
    - text_embeds
    - cond_images
# Dataset settings.
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped — confirm against the consumer's schema.
dataset:
  # Placeholder path; replace with the local dataset location.
  data_path: /path/to/EchoNet-Dynamic
  deactivate_cache: false
  fps: 32
  # Presumably seconds per clip — TODO confirm the unit.
  duration: 2.0
  grayscale: false
# Dataloader settings. Keeping batch_size nested here stops it from
# colliding with the separate batch_size under `checkpoint`.
dataloader:
  batch_size: 8
  num_workers: 8
# Weights & Biases logging settings.
wandb:
  project: EchoDiffusion
  # Optional: uncomment and set to your own login.
  # entity: your-login
# Checkpoint settings.
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped — confirm against the consumer's schema.
checkpoint:
  # Placeholder path; replace with the directory to write checkpoints to.
  path: /path/to/checkpoints
  # Separate from dataloader.batch_size; keeping it nested here avoids a
  # duplicate top-level key.
  batch_size: 4
  cond_scale: 5.0
  # Save interval — presumably in training iterations; TODO confirm.
  save_every_x_it: 5000
|