export WANDB_BASE_URL="https://api.wandb.ai" export WANDB_MODE=online torchrun --nnodes 1 --nproc_per_node 4 \ fastvideo/distill.py \ --seed 42 \ --pretrained_model_name_or_path data/mochi \ --model_type "mochi" \ --cache_dir data/.cache \ --data_json_path data/Merge-30k-Data/video2caption.json \ --validation_prompt_dir data/Image-Vid-Finetune-Mochi/validation \ --gradient_checkpointing \ --train_batch_size=1 \ --num_latent_t 28 \ --sp_size 4 \ --train_sp_batch_size 2 \ --dataloader_num_workers 4 \ --gradient_accumulation_steps=1 \ --max_train_steps=4000 \ --learning_rate=1e-6 \ --mixed_precision=bf16 \ --checkpointing_steps=64 \ --validation_steps 1 \ --validation_sampling_steps 8 \ --checkpoints_total_limit 3 \ --allow_tf32 \ --ema_start_step 0 \ --cfg 0.0 \ --log_validation \ --output_dir="data/outputs/lq_euler_50_thres0.1_lrg_0.75_phase1_lr1e-6_repro" \ --tracker_project_name PCM \ --num_frames 163 \ --scheduler_type pcm_linear_quadratic \ --validation_guidance_scale 0.5,1.5,2.5 \ --num_euler_timesteps 50 \ --linear_quadratic_threshold 0.1 \ --linear_range 0.75 \ --multi_phased_distill_schedule 4000-1