Spaces:

Luka512
/

Qwen3

Runtime error

Tim Luka Horstmann committed on May 12

Commit

c2b5e84

1 Parent(s): f32e6b8

Fix

Files changed (2) hide show

.gitignore ADDED Viewed

File without changes

Dockerfile CHANGED Viewed

@@ -47,7 +47,9 @@ RUN pip install --no-cache-dir huggingface_hub
 # 9) Clone llama.cpp for quantize tool
 RUN git clone https://github.com/ggerganov/llama.cpp.git /tmp/llama.cpp && \
-    cd /tmp/llama.cpp && Cmake quantize
 # 10) Download & pre-quantize model (no runtime repack)
 RUN python3 - <<EOF

 # 9) Clone llama.cpp for quantize tool
 RUN git clone https://github.com/ggerganov/llama.cpp.git /tmp/llama.cpp && \
+    cd /tmp/llama.cpp && \
+    cmake -B build -DLLAMA_BUILD_QUANTIZE=ON . && \
+    cmake --build build --target quantize
 # 10) Download & pre-quantize model (no runtime repack)
 RUN python3 - <<EOF