Create Dockerfile
Browse files- Dockerfile +7 -0
Dockerfile
ADDED
|
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Serve a GGUF model with the llama.cpp HTTP server (CUDA build of the
# upstream image). No files are added to the image: the server is configured
# entirely through the LLAMA_ARG_* environment variables set below.
# NOTE(review): `server-cuda` is a moving tag; pin a build tag or digest if
# reproducible builds are required.
FROM ghcr.io/ggerganov/llama.cpp:server-cuda

# Server settings, grouped in one instruction because they are all read
# together at startup:
#   LLAMA_ARG_CTX_SIZE    - context size, in tokens
#   LLAMA_ARG_FLASH_ATTN  - flash-attention switch (1 = enabled)
#   LLAMA_ARG_HF_REPO     - Hugging Face repository the model comes from
#   LLAMA_ARG_HF_FILE     - GGUF file to use from that repository
#   LLAMA_ARG_N_PARALLEL  - number of parallel server slots
# NOTE(review): depending on the server version the context may be shared
# between the parallel slots - confirm 10000 is the intended total.
ENV LLAMA_ARG_CTX_SIZE=10000 \
    LLAMA_ARG_FLASH_ATTN=1 \
    LLAMA_ARG_HF_REPO=bartowski/Qwen2.5-Coder-14B-GGUF \
    LLAMA_ARG_HF_FILE=Qwen2.5-Coder-14B-Q4_K_M.gguf \
    LLAMA_ARG_N_PARALLEL=2