Spaces:

lastmass
/

Qwen3_Medical

Sleeping

App Files Files Community

lastmass committed on Sep 1

Commit

242707c

verified ·

1 Parent(s): 5ec6cc3

Update Dockerfile

Browse files

Files changed (1) hide show

Dockerfile +30 -13

Dockerfile CHANGED Viewed

@@ -1,36 +1,53 @@
-# Use the same base image as the original version
 FROM python:3.11-slim
-# 1. Install the required runtime dependencies and, as requested, add the build tools
 RUN apt-get update && apt-get install -y \
     wget \
     git \
     build-essential \
     cmake \
     && rm -rf /var/lib/apt/lists/*
-# 2. Upgrade pip itself
 RUN pip install --upgrade pip
-# 3. Install all packages via the official extra-index-url; this is the key to making it work
-RUN pip install --no-cache-dir --only-binary :all: \
-    gradio \
-    huggingface-hub \
-    llama-cpp-python \
-    --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cpu
-# 4. Set the model paths (unchanged)
 ENV MODEL_REPO="mradermacher/Qwen3_Medical_GRPO-i1-GGUF"
 ENV MODEL_FILE="Qwen3_Medical_GRPO.i1-Q4_K_M.gguf"
 ENV MODEL_DIR="/models"
 ENV MODEL_PATH="${MODEL_DIR}/${MODEL_FILE}"
-# 5. Create the model directory (unchanged)
 RUN mkdir -p /models
-# 6. Copy the application file
 COPY app.py /app/app.py
 WORKDIR /app
-# 7. Launch the Gradio app
 CMD ["python", "app.py"]

+# ------------------------------------------------------------------
+# Dockerfile based on building from source with OpenBLAS
+# ------------------------------------------------------------------
 FROM python:3.11-slim
+# 1. Install all dependencies: runtime dependencies + build tools + OpenBLAS development library
 RUN apt-get update && apt-get install -y \
+    # Runtime
     wget \
     git \
+    # Build time
     build-essential \
     cmake \
+    # BLAS acceleration library
+    libopenblas-dev \
     && rm -rf /var/lib/apt/lists/*
+# 2. Upgrade pip
 RUN pip install --upgrade pip
+# 3. Clone the source and build/install it with specific flags (this is the core step)
+#    All commands are kept in a single RUN layer so that the environment variables take effect
+RUN set -e && \
+    # Clone the latest source into /tmp
+    cd /tmp && \
+    git clone --recursive https://github.com/abetlen/llama-cpp-python.git && \
+    cd llama-cpp-python && \
+    # Update the underlying llama.cpp submodule to the latest
+    git submodule update --remote vendor/llama.cpp && \
+    # Set the environment variables and install from the local source
+    FORCE_CMAKE=1 CMAKE_ARGS="-DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DLLAMA_CURL=OFF" \
+    pip install . --upgrade --force-reinstall --no-cache-dir && \
+    # Remove the source tree to reduce image size
+    rm -rf /tmp/llama-cpp-python
+# 4. Install the remaining Python dependencies
+RUN pip install --no-cache-dir gradio huggingface-hub
+# 5. Set the model paths (unchanged)
 ENV MODEL_REPO="mradermacher/Qwen3_Medical_GRPO-i1-GGUF"
 ENV MODEL_FILE="Qwen3_Medical_GRPO.i1-Q4_K_M.gguf"
 ENV MODEL_DIR="/models"
 ENV MODEL_PATH="${MODEL_DIR}/${MODEL_FILE}"
+# 6. Create the model directory (unchanged)
 RUN mkdir -p /models
+# 7. Copy the application file
 COPY app.py /app/app.py
 WORKDIR /app
+# 8. Launch the Gradio app
 CMD ["python", "app.py"]