File size: 467 Bytes
c230d0d
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
# Builds the llama.cpp HTTP server from source, downloads a Qwen-1.8B GGUF
# model, and serves it on port 7860.
FROM ubuntu:22.04

# Ubuntu ships apt, not Alpine's apk. update + install share one layer so the
# package index is never stale, and the index is removed in the same layer.
# ca-certificates is required for the HTTPS clone/download below, make is the
# default CMake generator backend, and wget performs the model download.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        clang \
        cmake \
        git \
        make \
        wget \
    && rm -rf /var/lib/apt/lists/*

WORKDIR /app

# Configure and build out-of-tree with -S/-B instead of `cd`, then copy the
# binary from repo/build/bin (the build directory lives inside the clone).
# CMAKE_BUILD_TYPE is set explicitly because `--config` only affects
# multi-config generators.
# NOTE(review): the clone is unpinned, so the `server` target must exist at
# upstream HEAD -- confirm, or pin a known-good tag with `--branch <tag>`.
# The source tree is kept in place in case the binary links against libraries
# produced inside the build directory.
RUN git clone --depth 1 https://github.com/ggerganov/llama.cpp repo \
    && cmake -S repo -B repo/build -DCMAKE_BUILD_TYPE=Release \
    && cmake --build repo/build --config Release --target server \
    && cp repo/build/bin/server /app/server

# -O (uppercase) names the output document; lowercase -o would only redirect
# wget's log messages into model.gguf.
RUN wget -q -O model.gguf "https://huggingface.co/zhangtao103239/Qwen-1.8B-GGUF/resolve/main/qwen-1.8b-q5_k_m.gguf"

EXPOSE 7860

# Exec form must be a valid JSON array (every element comma-separated);
# otherwise Docker falls back to shell form and the container fails to start.
# The relative model path resolves against WORKDIR /app.
CMD ["/app/server", "-m", "model.gguf", "--host", "0.0.0.0", "--port", "7860"]