File size: 483 Bytes
435f6db 00fa67d 45c1114 00fa67d 45c1114 33f9f12 00fa67d de362e9 e9669da |
1 2 3 4 5 6 7 8 9 10 11 12 |
FROM ghcr.io/ggerganov/llama.cpp:server-cuda
RUN apt update && apt install -y curl
RUN mkdir /models
RUN curl -L https://huggingface.co/TheBloke/deepseek-coder-6.7B-instruct-GGUF/resolve/main/deepseek-coder-6.7b-instruct.Q6_K.gguf --output /models/deepseek-coder-6.7b-instruct.Q6_K.gguf
ENTRYPOINT [ "/server" ]
CMD [ "-ngl", "32", "--host", "0.0.0.0", "--port", "7860", "--model", "/models/deepseek-coder-6.7b-instruct.Q6_K.gguf", "-c", "8192", "--chat-template", "deepseek" ]
|