# llama-omni / cog.yaml
# marcosremar2's picture
# ereerre
# c57019c
# Cog configuration: `build` describes the container image (GPU support,
# Python version, pip/apt packages, extra build commands); `predict` names
# the predictor entry point as "<file>:<class>".
build:
  gpu: true
  # Quoted so YAML keeps the string "3.10" rather than parsing the float 3.1.
  python_version: "3.10"
  python_packages:
    - "torch==2.0.1"
    - "numpy==1.24.0"
    - "transformers==4.34.0"
    - "accelerate==0.21.0"
    - "gradio==3.50.2"
    - "fastapi==0.104.0"
    - "uvicorn==0.23.2"
    - "pydantic==2.3.0"
    - "openai-whisper==20231117"
    - "tqdm==4.66.1"
    - "requests==2.31.0"
  system_packages:
    - "wget"
    - "ffmpeg"
    - "libsndfile1"
    - "build-essential"
    - "git"
  # Shell commands executed in order while the image is built.
  # NOTE(review): the relative paths used below (vocoder/,
  # models/speech_encoder) resolve against the build-time working directory;
  # confirm that this is the directory predict.py loads them from.
  run:
    # NOTE(review): installs fairseq from the repository's default branch with
    # no pinned revision; consider pinning a commit for reproducible builds.
    - "pip install -e git+https://github.com/pytorch/fairseq.git#egg=fairseq"
    # Best-effort flash-attn install: skipped on Apple Silicon (arm64/aarch64
    # + Darwin); otherwise pip's result is only reported, and the step itself
    # always exits 0 so a failed install does not abort the build.
    # The snippet is wrapped in shell double quotes, so it must contain only
    # single quotes (and no `$` or backticks) or the shell would cut the
    # argument short. The folded scalar (>-) joins these lines with single
    # spaces, so the shell still receives one single-line command.
    - >-
      python -c "import platform, subprocess;
      arch = platform.machine();
      is_arm64 = arch in ('arm64', 'aarch64');
      is_darwin = platform.system() == 'Darwin';
      not_compatible = is_arm64 and is_darwin;
      exit_code = 0 if not_compatible
      else subprocess.call(['pip', 'install', 'flash-attn==2.3.0']);
      status = 'skipped on Apple Silicon' if not_compatible
      else 'completed' if exit_code == 0 else 'failed but continuing';
      print('flash-attn installation ' + status)"
    # Fetch the code-HiFiGAN vocoder checkpoint and its config into vocoder/.
    - "mkdir -p vocoder"
    - "wget https://dl.fbaipublicfiles.com/fairseq/speech_to_speech/vocoder/code_hifigan/mhubert_vp_en_es_fr_it3_400k_layer11_km1000_lj/g_00500000 -P vocoder/"
    - "wget https://dl.fbaipublicfiles.com/fairseq/speech_to_speech/vocoder/code_hifigan/mhubert_vp_en_es_fr_it3_400k_layer11_km1000_lj/config.json -P vocoder/"
    # Only creates the directory; nothing is downloaded into it here.
    - "mkdir -p models/speech_encoder"
predict: "predict.py:Predictor"