Hebrew
meirk committed
Commit d3f8264 · verified · 1 Parent(s): 4604f0d

Update Dockerfile

Files changed (1): Dockerfile (+11, -13)
Dockerfile CHANGED
@@ -1,21 +1,19 @@
-# Use an official NVIDIA base image with PyTorch, CUDA, and cuDNN pre-installed
-# We choose a version with Python 3.11 to match your previous environment
+# 1. Start from the same great NVIDIA base image
 FROM nvcr.io/nvidia/pytorch:24.04-py3
 
-# Set the working directory
+# 2. Set the working directory
 WORKDIR /repository
 
-# Copy the requirements file into the container
-COPY requirements.txt .
+# 3. Add Hugging Face specific environment variables
+ENV PROTOCOL_BUFFERS_PYTHON_IMPLEMENTATION=python
+ENV PORT=80
 
-# Install your Python dependencies
-# Using --no-cache-dir is good practice for smaller image sizes
-RUN pip install --no-cache-dir -r requirements.txt
+# 4. Copy and install requirements AND the HF toolkit
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt huggingface_inference_toolkit
 
-# Copy the rest of your application code (e.g., your handler.py)
+# 5. Copy the rest of your application code
 COPY . .
 
-# (Optional) Set an environment variable if needed by your platform
-# ENV TRANSFORMERS_CACHE="/repository/cache"
-
-# Your inference platform will typically handle the CMD or ENTRYPOINT
+# 6. THE CRUCIAL PART: Set the command to run the inference server
+CMD ["python", "-m", "huggingface_inference_toolkit.main", "--model_dir", "."]