# Image for a FastAPI app served by uvicorn on port 7860.
# Layers are ordered least -> most frequently changing: OS packages, Python
# dependencies, model weights, then application source.

# Pin the Debian release so the apt package set below resolves the same way
# on every rebuild instead of following whatever the floating tag points at.
FROM python:3.9-bookworm

WORKDIR /app

# Install system dependencies. update + install + list cleanup stay in one
# layer so a stale package index is never cached and the lists never ship.
RUN apt-get update && apt-get install -y --no-install-recommends \
        build-essential \
        curl \
        git \
        software-properties-common \
    && rm -rf /var/lib/apt/lists/*

# Create an unprivileged user (UID 1000) and hand it the app directory so the
# service does not run as root and can still write inside /app.
RUN useradd --create-home --uid 1000 user \
    && chown user:user /app

# Copy requirements first so the dependency layer is reused until
# requirements.txt itself changes.
COPY requirements.txt .

# Install Python packages system-wide (still root here) so console scripts
# such as uvicorn land on the default PATH.
RUN pip install --no-cache-dir -r requirements.txt

# Everything below runs as the unprivileged user, so the model cache written
# during the build is owned by the same user that serves requests.
USER user
ENV HOME=/home/user

# Pre-download the model so it is cached in the image rather than fetched on
# first start.
# NOTE(review): model_id points at a GGUF repository; from_pretrained may need
# an explicit gguf_file=... argument to resolve it — confirm this step succeeds.
# NOTE(review): device_map='auto' presumably requires `accelerate` to be listed
# in requirements.txt — verify.
RUN python -c "from transformers import AutoTokenizer, AutoModelForCausalLM; \
model_id='mradermacher/Huihui-gemma-3n-E4B-it-abliterated-GGUF'; \
tokenizer = AutoTokenizer.from_pretrained(model_id); \
model = AutoModelForCausalLM.from_pretrained(model_id, device_map='auto')"

# Copy the rest of the application, owned by the runtime user.
COPY --chown=user:user . .

# Runtime configuration. PYTHONUNBUFFERED=1 makes Python write logs straight
# to stdout/stderr without buffering.
ENV HOST=0.0.0.0 \
    PORT=7860 \
    PYTHONUNBUFFERED=1

# Expose the port HF Spaces expects (documentation only; does not publish it).
EXPOSE 7860

# Start the FastAPI app. Exec form keeps uvicorn as PID 1 so it receives
# SIGTERM directly; host/port are literal because exec form does no $VAR
# expansion.
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860", "--workers", "1"]