# ndc8
# Update Dockerfile and application entry point for GGUF backend; optimize memory usage in model parameters and requirements
# 358e717
# Image for the GGUF backend application, laid out for Hugging Face (HF) Spaces.
# Starts from the slim Python 3.10 image.
FROM python:3.10-slim

# HF Spaces requires a user with UID 1000; -m also creates /home/user.
RUN useradd -m -u 1000 user

# Drop privileges now: dependency installation, file copies and the server
# itself all run as "user" from here on.
USER user

# Runtime environment.
#   HOME / PATH  - point at the new user's home; /home/user/.local/bin is put on
#                  PATH so console scripts from the non-root pip install resolve.
#                  The path is spelled out instead of using $HOME because values
#                  set inside one ENV instruction are not visible to each other.
#   HF_HOME      - Hugging Face cache directory, kept under /tmp.
#   TRANSFORMERS_NO_ADVISORY_WARNINGS - suppresses transformers advisory warnings.
#   PYTHONUNBUFFERED - stdout is block-buffered when not attached to a TTY;
#                  disabling buffering makes application output reach the
#                  container logs immediately.
ENV HOME=/home/user \
    PATH=/home/user/.local/bin:$PATH \
    HF_HOME=/tmp/.cache/huggingface \
    TRANSFORMERS_NO_ADVISORY_WARNINGS=1 \
    PYTHONUNBUFFERED=1

# Application directory inside the user's home; WORKDIR creates it if missing.
WORKDIR $HOME/app

# Copy only the dependency manifest first so the install layer below stays
# cached until requirements.txt itself changes.
COPY --chown=user requirements.txt .

# Upgrade pip, then install the pinned requirements; --no-cache-dir keeps the
# pip download cache out of the image layer.
RUN pip install --no-cache-dir --upgrade pip && \
    pip install --no-cache-dir -r requirements.txt

# Copy the rest of the build context (application code), owned by "user".
COPY --chown=user . .

# Port the server listens on (HF Spaces default). EXPOSE is documentation only.
EXPOSE 7860

# Start the GGUF backend: serve the `app` object from the `app` module with
# uvicorn on all interfaces. Exec form keeps the Python process as PID 1 so it
# receives stop signals directly.
CMD ["python", "-m", "uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]