File size: 673 Bytes
b140fcf |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 |
# Launches inference.py with the settings below. Each value is forwarded
# as the command-line flag of the same name.
MODEL_NAME="auffusion/auffusion"
# NOTE: despite the "_dir" suffix, the value configured here is a JSON file path.
test_data_dir="./data/test_audiocaps.raw.json"
output_dir="./output/auffusion"
audio_column="spec_path"
caption_column="text"
num_inference_steps=100
guidance_scale=7.5

# Build the argument list in the positional parameters instead of one flat
# string that is later expanded unquoted. Every flag stays exactly one word
# even if a value is changed to contain spaces or glob characters, and no
# nested quoting is needed for literal values such as fp16.
# `set --` is plain POSIX sh; bash-only arrays are avoided because no shebang
# is visible, so the script may be run with `sh`.
# Arguments passed to this script itself are replaced here and not forwarded.
set -- \
  --pretrained_model_name_or_path="$MODEL_NAME" \
  --test_data_dir="$test_data_dir" \
  --output_dir="$output_dir" \
  --audio_column="$audio_column" \
  --caption_column="$caption_column" \
  --sample_rate=16000 \
  --duration=10 \
  --num_inference_steps="$num_inference_steps" \
  --guidance_scale="$guidance_scale" \
  --mixed_precision=fp16 \
  --enable_xformers_memory_efficient_attention

python inference.py "$@"
|