# PSHuman / configs /inference-768-6view.yaml
# fffiloni's picture
# Update configs/inference-768-6view.yaml
# f4557da verified
# Base model selection and global view settings.
# Presumably a Hugging Face Hub repo id; `revision: null` pins no specific revision.
pretrained_model_name_or_path: 'stabilityai/stable-diffusion-2-1-unclip'
revision: null
# Top-level view count; other entries in this file read it via ${num_views}.
# NOTE(review): this is 7 while `num_view` under `recon_opt` is 6 — presumably
# intentional (different stages); confirm with the consumer.
num_views: 7
with_smpl: false
# Validation dataset settings.
# The child keys must be indented under `validation_dataset`; at column 0 the
# mapping is empty (null) and `num_views` collides with the top-level key.
# NOTE(review): the extent of this mapping (through `smpl_folder`) is inferred
# from the key names; confirm against the loader's schema.
validation_dataset:
  prompt_embeds_path: mvdiffusion/data/fixed_prompt_embeds_7view
  root_dir: 'examples/shhq'
  # Interpolated from the top-level `num_views` key.
  num_views: ${num_views}
  bg_color: 'white'
  # Two-element list; the key name suggests [width, height] — TODO confirm order.
  img_wh: [768, 768]
  num_validation_samples: 1000
  crop_size: 740
  margin_size: 50
  smpl_folder: 'smpl_image_pymaf'
# Output and run-level settings (top-level keys).
save_dir: 'mv_results'
# Values listed by the original author: 'concat', 'rgba', 'rgb'.
save_mode: 'rgba'
seed: 42
validation_batch_size: 1
dataloader_num_workers: 1
# NOTE(review): -1 presumably means "not launched in distributed mode"; confirm.
local_rank: -1
# Pipeline construction and validation-time sampling settings.
# The children of `pipe_kwargs` and `pipe_validation_kwargs` must be indented;
# at column 0 both mappings are empty (null) and `num_views` duplicates the
# top-level key.
# NOTE(review): which keys belong to each mapping is inferred from the key
# names (`validation_*` scalars kept at top level); confirm against the loader.
pipe_kwargs:
  # Interpolated from the top-level `num_views` key.
  num_views: ${num_views}

validation_guidance_scales: 3.0

pipe_validation_kwargs:
  num_inference_steps: 40
  eta: 1.0

# Interpolated from the top-level `num_views` key.
validation_grid_nrow: ${num_views}
# Keyword arguments for building the UNet.
# The child keys must be indented under `unet_from_pretrained_kwargs`; at
# column 0 the mapping is empty (null) and `num_views` duplicates the
# top-level key.
# NOTE(review): the extent of this mapping (through `mvcd_attention`) is
# inferred from the key names; confirm against the loader's schema.
unet_from_pretrained_kwargs:
  unclip: true
  sdxl: false
  # Interpolated from the top-level `num_views` key.
  num_views: ${num_views}
  # NOTE(review): 96 = 768 / 8, presumably the latent size for the 768px
  # `img_wh` used by the validation dataset; confirm.
  sample_size: 96
  # NOTE(review): original author's marker was just "modify"; intent is not
  # evident from this file.
  zero_init_conv_in: false

  # 2 for elevation and 6 for focal_length
  projection_camera_embeddings_input_dim: 2
  zero_init_camera_projection: false
  num_regress_blocks: 3

  # Attention layout switches.
  cd_attention_last: false
  cd_attention_mid: false
  multiview_attention: true
  sparse_mv_attention: true
  selfattn_block: self_rowwise
  mvcd_attention: true
# Reconstruction options.
# The child keys must be indented under `recon_opt`; at column 0 the mapping
# is empty (null) and every option becomes an unrelated top-level key.
# NOTE(review): the extent of this mapping (through `replace_hand`) is
# inferred from the key names; confirm against the loader's schema.
recon_opt:
  res_path: out
  save_glb: true
  # camera setting
  # NOTE(review): `num_view` (singular) is 6 here, distinct from the top-level
  # `num_views: 7`; presumably intentional — confirm.
  num_view: 6
  scale: 4
  mode: ortho
  resolution: 1024
  cam_path: 'mvdiffusion/data/six_human_pose'
  # optimization
  iters: 700
  clr_iters: 200
  debug: false
  snapshot_step: 50
  # Written with an explicit decimal point so YAML 1.1 loaders (e.g. PyYAML)
  # resolve it as a float rather than the string '2e-3'; the value is unchanged.
  lr_clr: 2.0e-3
  gpu_id: 0

  replace_hand: false
# Top-level boolean flag. The name suggests it turns on xFormers
# memory-efficient attention; the code that reads it is not visible here.
enable_xformers_memory_efficient_attention: true