Tim Luka Horstmann
committed on
Commit
·
f32e6b8
1
Parent(s):
470d3ad
Fix cmake
Browse files
- Dockerfile +1 -1
Dockerfile
CHANGED
|
@@ -47,7 +47,7 @@ RUN pip install --no-cache-dir huggingface_hub
|
|
| 47 |
|
| 48 |
# 9) Clone llama.cpp for quantize tool
|
| 49 |
RUN git clone https://github.com/ggerganov/llama.cpp.git /tmp/llama.cpp && \
|
| 50 |
-
cd /tmp/llama.cpp &&
|
| 51 |
|
| 52 |
# 10) Download & pre-quantize model (no runtime repack)
|
| 53 |
RUN python3 - <<EOF
|
|
|
|
| 47 |
|
| 48 |
# 9) Clone llama.cpp for quantize tool
|
| 49 |
RUN git clone https://github.com/ggerganov/llama.cpp.git /tmp/llama.cpp && \
|
| 50 |
+
cd /tmp/llama.cpp && Cmake quantize
|
| 51 |
|
| 52 |
# 10) Download & pre-quantize model (no runtime repack)
|
| 53 |
RUN python3 - <<EOF
|