---
# Multi-view diffusion inference + reconstruction configuration.
#
# `${num_views}` entries are interpolations that reference the top-level
# `num_views` key, so the view count is set in exactly one place.
# NOTE(review): the `${...}` syntax is OmegaConf-style; presumably this file
# is loaded with OmegaConf - confirm.
# NOTE(review): section nesting was reconstructed from a flattened copy of
# this file; confirm the section boundaries against the consuming code.

pretrained_model_name_or_path: 'stabilityai/stable-diffusion-2-1-unclip'
revision: null

# Single source of truth for the number of views; referenced below.
num_views: 7
with_smpl: false

validation_dataset:
  prompt_embeds_path: mvdiffusion/data/fixed_prompt_embeds_7view
  root_dir: 'examples/shhq'
  num_views: ${num_views}
  bg_color: 'white'
  img_wh: [768, 768]
  num_validation_samples: 1000
  crop_size: 740
  margin_size: 50
  smpl_folder: 'smpl_image_pymaf'

save_dir: 'mv_results'
save_mode: 'rgba'  # 'concat', 'rgba', 'rgb'
seed: 42
validation_batch_size: 1
dataloader_num_workers: 1
local_rank: -1

pipe_kwargs:
  num_views: ${num_views}

validation_guidance_scales: 3.0
pipe_validation_kwargs:
  num_inference_steps: 40
  eta: 1.0

validation_grid_nrow: ${num_views}

unet_from_pretrained_kwargs:
  unclip: true
  sdxl: false
  num_views: ${num_views}
  sample_size: 96
  zero_init_conv_in: false  # modify

  projection_camera_embeddings_input_dim: 2  # 2 for elevation and 6 for focal_length
  zero_init_camera_projection: false
  num_regress_blocks: 3

  cd_attention_last: false
  cd_attention_mid: false
  multiview_attention: true
  sparse_mv_attention: true
  selfattn_block: self_rowwise
  mvcd_attention: true

recon_opt:
  res_path: out
  save_glb: true
  # camera setting
  # NOTE(review): this key is `num_view` (singular) and holds a different
  # value than the top-level `num_views`; presumably intentional, since
  # `cam_path` below names a six-pose set - confirm.
  num_view: 6
  scale: 4
  mode: ortho
  resolution: 1024
  cam_path: 'mvdiffusion/data/six_human_pose'
  # optimization
  iters: 700
  clr_iters: 200
  debug: false
  snapshot_step: 50
  # Written with an explicit decimal point: a bare `2e-3` is read as a string
  # by YAML 1.1 loaders (e.g. stock PyYAML); `2.0e-3` is a float everywhere.
  lr_clr: 2.0e-3
  gpu_id: 0
  # NOTE(review): assumed to belong to recon_opt - confirm.
  replace_hand: false

# NOTE(review): assumed to be a top-level option - confirm.
enable_xformers_memory_efficient_attention: true