File size: 530 Bytes
3a1da90
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
# Launch infer.py once for a single text prompt using the fluxaudio_fm variant.

# Restrict CUDA to device index 1; exported so the python child process sees it.
export CUDA_VISIBLE_DEVICES=1

# Value handed to --output. The "25nfe" suffix matches --num_steps 25 below;
# presumably both should be changed together -- TODO confirm.
output_path=./exps/fluxaudio/output_25nfe

# Text prompt passed verbatim to --prompt. The apostrophe in "referee’s" is a
# typographic (non-ASCII) character, which is harmless inside double quotes.
prompt="A basketball bounces rhythmically on a court, shoes squeak against the floor, and a referee’s whistle cuts through the air"

# Single source of truth for the variant name passed to --variant.
model=fluxaudio_fm
# Checkpoint file passed to --model_path.
ckpt_path=weights/fluxaudio_fm.pth

# Every expansion is double-quoted so a value containing spaces or glob
# characters still reaches infer.py as exactly one argument.
python infer.py \
    --variant "$model" \
    --prompt "$prompt" \
    --model_path "$ckpt_path" \
    --output "$output_path" \
    --num_steps 25 \
    --cfg_strength 4.5 \
    --encoder_name t5_clap \
    --duration 10 \
    --use_rope \
    --text_c_dim 512