---
# ---------------------------------------------------------------------------
# Manual settings
# ---------------------------------------------------------------------------
max_frames: 32
# Alternative resolution: [768, 1216]
resolution: [512, 768]
round: 1
# Suggested range: 25-50
ddim_timesteps: 30
# Alternative seed: 7
seed: 11

# Each entry: [frame_interval, reference image, driving pose sequence]
test_list_path:
  - - 2
    - 'data/images/WOMEN-Blouses_Shirts-id_00004955-01_4_full.jpg'
    - 'data/saved_pose/WOMEN-Blouses_Shirts-id_00004955-01_4_full'
  - - 2
    - 'data/images/musk.jpg'
    - 'data/saved_pose/musk'
  - - 2
    - 'data/images/WOMEN-Blouses_Shirts-id_00005125-03_4_full.jpg'
    - 'data/saved_pose/WOMEN-Blouses_Shirts-id_00005125-03_4_full'
  - - 2
    - 'data/images/IMG_20240514_104337.jpg'
    - 'data/saved_pose/IMG_20240514_104337'

partial_keys:
  # Reference image as the first frame of the generated video (optional)
  - ['image', 'local_image', 'dwpose']
  - ['image', 'randomref', 'dwpose']

# ---------------------------------------------------------------------------
# Default settings
# ---------------------------------------------------------------------------
TASK_TYPE: inference_unianimate_entrance
guide_scale: 2.5
vit_resolution: [224, 224]
use_fp16: true
batch_size: 1
latent_random_ref: true
chunk_size: 2
decoder_bs: 2
scale: 8
use_fps_condition: false
test_model: 'checkpoints/unianimate_16f_32f_non_ema_223000.pth'

embedder:
  type: 'FrozenOpenCLIPTextVisualEmbedder'
  layer: 'penultimate'
  pretrained: 'checkpoints/open_clip_pytorch_model.bin'

auto_encoder:
  type: 'AutoencoderKL'
  ddconfig:
    double_z: true
    z_channels: 4
    resolution: 256
    in_channels: 3
    out_ch: 3
    ch: 128
    ch_mult: [1, 2, 4, 4]
    num_res_blocks: 2
    attn_resolutions: []
    dropout: 0.0
    video_kernel_size: [3, 1, 1]
  embed_dim: 4
  pretrained: 'checkpoints/v2-1_512-ema-pruned.ckpt'

UNet:
  type: 'UNetSD_UniAnimate'
  # NOTE(review): a plain `None` is loaded by YAML as the string "None", not
  # as null. Left unchanged to preserve behavior; confirm what the consumer
  # expects before switching to `null`.
  config: None
  in_dim: 4
  dim: 320
  y_dim: 1024
  context_dim: 1024
  out_dim: 4
  dim_mult: [1, 2, 4, 4]
  num_heads: 8
  head_dim: 64
  num_res_blocks: 2
  dropout: 0.1
  temporal_attention: true
  num_tokens: 4
  temporal_attn_times: 1
  use_checkpoint: true
  use_fps_condition: false
  use_sim_mask: false

video_compositions:
  - 'image'
  - 'local_image'
  - 'dwpose'
  - 'randomref'
  - 'randomref_pose'

Diffusion:
  type: 'DiffusionDDIM'
  schedule: 'linear_sd'
  schedule_param:
    num_timesteps: 1000
    init_beta: 0.00085
    last_beta: 0.0120
    zero_terminal_snr: true
  mean_type: 'v'
  loss_type: 'mse'
  # Alternative: 'fixed_large'
  var_type: 'fixed_small'
  rescale_timesteps: false
  noise_strength: 0.1

use_DiffusionDPM: false
CPU_CLIP_VAE: true
# Alternative: 999
noise_prior_value: 949