#!/usr/bin/env bash
#
# Launches infer.py once with the "fluxaudio_fm" variant and a fixed text
# prompt. Run it from the directory that contains infer.py: the script path,
# the checkpoint path and the output path below are all relative.

# Restrict CUDA to the device with index 1.
export CUDA_VISIBLE_DEVICES=1

# Path handed to --output.
output_path=./exps/fluxaudio/output_25nfe

# Text handed to --prompt (kept verbatim, including the typographic apostrophe).
prompt="A basketball bounces rhythmically on a court, shoes squeak against the floor, and a referee’s whistle cuts through the air"

# Variant name handed to --variant; kept in one variable so the name is only
# spelled out once.
model=fluxaudio_fm

# Checkpoint file handed to --model_path.
ckpt_path=weights/fluxaudio_fm.pth

# NOTE(review): --num_steps 25 appears to correspond to the "25nfe" suffix of
# output_path -- keep the two in sync if either is changed (confirm).
# Every expansion is quoted so paths or prompts containing whitespace reach
# infer.py as single arguments.
python infer.py \
  --variant "$model" \
  --prompt "$prompt" \
  --model_path "$ckpt_path" \
  --output "$output_path" \
  --num_steps 25 \
  --cfg_strength 4.5 \
  --encoder_name t5_clap \
  --duration 10 \
  --use_rope \
  --text_c_dim 512