File size: 673 Bytes
b140fcf
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25

# Launches inference.py with a fixed set of options for the
# "auffusion/auffusion" model identifier.
#
# Usage: bash <this-script> [extra inference.py options...]
#   Any arguments given to this script are appended verbatim after the
#   built-in options below.
#
# Requires bash: the command line is assembled in an array.

# Fail on references to unset variables so that a misspelled setting name
# aborts the run instead of silently expanding to an empty option value.
set -u

# --- Settings ---------------------------------------------------------------
MODEL_NAME="auffusion/auffusion"
test_data_dir="./data/test_audiocaps.raw.json"
output_dir="./output/auffusion"
audio_column="spec_path"
caption_column="text"
num_inference_steps=100
guidance_scale=7.5

# --- Command line -----------------------------------------------------------
# One array element per option: each value reaches inference.py as exactly one
# argument, even if it contains spaces or glob characters. A flat string
# expanded unquoted would be re-split and glob-expanded by the shell.
inference_args=(
  "--pretrained_model_name_or_path=${MODEL_NAME}"
  "--test_data_dir=${test_data_dir}"
  "--output_dir=${output_dir}"
  "--audio_column=${audio_column}"
  "--caption_column=${caption_column}"
  "--sample_rate=16000"
  "--duration=10"
  "--num_inference_steps=${num_inference_steps}"
  "--guidance_scale=${guidance_scale}"
  "--mixed_precision=fp16"
  "--enable_xformers_memory_efficient_attention"
)

# Last command of the script, so its exit status becomes the script's status.
# "$@" forwards any extra options supplied by the caller (none by default).
python inference.py "${inference_args[@]}" "$@"