---
# Training configuration.
#
# NOTE(review): this file had been collapsed onto a single line, which is not
# loadable YAML. The block structure below was reconstructed from key order;
# in particular the extent of the two nested mappings (`train_data` and
# `noise_scheduler_kwargs`) is an assumption -- confirm against the code that
# consumes this config.

use_ema: true
output_dir: results/train
# Machine-specific absolute path; adjust for the local environment.
pretrained_model_path: /mnt/vepfs/zhaomin/projects/LargeData/checkpoints/stable-video-diffusion-img2vid/

train_data:
  # Machine-specific absolute paths; adjust for the local environment.
  file_path: /mnt/vepfs/zhaomin/projects/scence_fusion/improved-svd/finalre/webvid.csv
  video_folder: /mnt/vepfs/bigdata/video_datasets/webvid/2M_train
  # Quoted on purpose: a comma-separated plain scalar loads as the string
  # '320,512', not as a two-element list. Presumably the consumer splits it
  # itself -- TODO confirm before converting to [320, 512].
  sample_size: '320,512'
  fps: 3
  sample_n_frames: 16

# Machine-specific absolute path; adjust for the local environment.
validation_folder: /mnt/vepfs/zhaomin/projects/scence_fusion/improved-svd/SVD_diffusers/demo
motion_bucket_id: 20.0
cfg_random_null_ratio: 0.1
# Empty string, not null.
resume_path: ''
ema_decay: 0.9999

noise_scheduler_kwargs:
  P_mean: -1.2
  P_std: 1.2
  sigma_data: 1
  beta_m: 15
  a: 5

max_train_steps: 100000
validation_steps: 10

learning_rate: 3.0e-05
scale_lr: false
lr_scheduler: constant
train_batch_size: 1

adam_beta1: 0.9
adam_beta2: 0.999
adam_weight_decay: 0.01
adam_epsilon: 1.0e-08

gradient_accumulation_steps: 1
gradient_checkpointing: true
checkpointing_steps: 10000
mixed_precision_training: true

global_seed: 23
max_grad_norm: 1.0