Spaces:

rapacious
/

LLaMA_Server

Running

LLaMA_Server / Dockerfile

Update Dockerfile

54dbd2f verified 2 months ago

741 Bytes

	# Base image: Ubuntu 22.04
	FROM ubuntu:22.04

	# Install the required system packages.
	# - The apt package lists are deleted in the same layer that downloads them;
	#   removing them in a later layer would not shrink the image.
	# - DEBIAN_FRONTEND is set inline so it does not leak into the runtime env.
	# NOTE(review): --no-install-recommends is intentionally NOT used here. The
	# prebuilt server binary may depend on shared libraries that arrive only as
	# recommended packages, and wget needs ca-certificates for HTTPS — confirm
	# the binary's runtime dependencies before trimming this further.
	RUN apt-get update \
	&& DEBIAN_FRONTEND=noninteractive apt-get install -y \
	curl \
	python3 \
	python3-pip \
	unzip \
	wget \
	&& rm -rf /var/lib/apt/lists/*

	# Unpack the prebuilt LLaMA binaries into /app and mark the server executable.
	# The archive is bind-mounted from the build context for this single step
	# instead of being COPY'd and deleted afterwards: a file removed in a later
	# layer still occupies space in the layer that added it, so the zip would
	# otherwise stay in the image. RUN --mount requires BuildKit.
	WORKDIR /app
	RUN --mount=type=bind,source=llama_bin.zip,target=/tmp/llama_bin.zip \
	unzip /tmp/llama_bin.zip && chmod +x bin/server

	# Create /models and download the Qwen2.5-0.5B-Instruct GGUF model
	# (q5_k_m file) into it, in a single layer.
	# --progress=dot:giga keeps wget's progress output from flooding the build
	# log during the large download.
	# NOTE(review): the URL follows the "main" revision, so the downloaded file
	# can change between builds — consider pinning a commit hash and verifying
	# a checksum.
	RUN mkdir -p /models \
	&& wget --progress=dot:giga \
	-O /models/qwen2.5-0.5b-instruct-q5_k_m.gguf \
	https://huggingface.co/Qwen/Qwen2.5-0.5B-Instruct-GGUF/resolve/main/qwen2.5-0.5b-instruct-q5_k_m.gguf

	# Start the server with the Qwen model.
	# Exec (JSON-array) form: the server binary is launched directly, without a shell.
	# NOTE(review): "-p 8000" is presumably meant as the listening port; upstream
	# llama.cpp documents "--port" for that purpose — confirm this build accepts "-p".
	CMD ["./bin/server", "-m", "/models/qwen2.5-0.5b-instruct-q5_k_m.gguf", "-p", "8000"]