Spaces:

Lyte
/

DeepSeek-R1-Distill-Qwen-1.5B-Demo-GGUF

Running

codebyam committed on Jul 5

Commit

551d27d

verified ·

1 Parent(s): c98b1e7

Update Dockerfile

Further improves inference performance by building llama.cpp with OpenBLAS.

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -6,25 +6,36 @@ RUN apt-get update && \
     build-essential \
     libssl-dev \
     zlib1g-dev \
     libboost-system-dev \
     libboost-filesystem-dev \
     cmake \
     git \
     python3-pip \
     curl \
     wget && \
     rm -rf /var/lib/apt/lists/*
 # Install Python dependencies
 RUN pip3 install huggingface-hub openai gradio
-# Build llama.cpp
 RUN git clone https://github.com/ggerganov/llama.cpp && \
     cd llama.cpp && \
-    mkdir build && \
-    cd build && \
-    cmake .. -DLLAMA_BUILD_SERVER=ON -DLLAMA_BUILD_EXAMPLES=ON -DCMAKE_BUILD_TYPE=Release && \
-    cmake --build . --config Release --target llama-server -j $(nproc)
 # Download model
 RUN mkdir -p /models && \

     build-essential \
     libssl-dev \
     zlib1g-dev \
+    libboost-math-dev \
+    libboost-python-dev \
+    libboost-timer-dev \
+    libboost-thread-dev \
     libboost-system-dev \
     libboost-filesystem-dev \
+    libopenblas-dev \
+    libomp-dev \
     cmake \
+    pkg-config \
     git \
     python3-pip \
     curl \
+    libcurl4-openssl-dev \
     wget && \
     rm -rf /var/lib/apt/lists/*
 # Install Python dependencies
 RUN pip3 install huggingface-hub openai gradio
+# Build llama.cpp with OpenBLAS
 RUN git clone https://github.com/ggerganov/llama.cpp && \
     cd llama.cpp && \
+    cmake -B build -S . \
+        -DLLAMA_BUILD_SERVER=ON \
+        -DLLAMA_BUILD_EXAMPLES=ON \
+        -DGGML_BLAS=ON \
+        -DGGML_BLAS_VENDOR=OpenBLAS \
+        -DCMAKE_BUILD_TYPE=Release && \
+    cmake --build build --config Release --target llama-server -j $(nproc)
 # Download model
 RUN mkdir -p /models && \