Spaces:

rapacious
/

LLaMA_Server

Running

LLaMA_Server / Dockerfile

Create Dockerfile

03c48e3 verified 2 months ago

702 Bytes

	# Chọn image cơ bản (có CUDA nếu cần GPU)
	FROM ubuntu:22.04

	# Cài đặt các thư viện cần thiết
	RUN apt-get update && apt-get install -y \
	unzip wget curl python3 python3-pip

	# Sao chép file binary đã build vào container
	COPY llama_bin.zip /app/llama_bin.zip
	WORKDIR /app

	# Giải nén binaries
	RUN unzip llama_bin.zip && rm llama_bin.zip && chmod +x bin/server

	# Sao chép model (hoặc tải nếu cần)
	COPY models /models
	# Hoặc tải nếu mô hình chưa có
	# RUN wget -O /models/llama-7b.gguf https://huggingface.co/TheBloke/Llama-2-7B-GGUF/resolve/main/llama-2-7b.Q4_K_M.gguf

	# Chạy server
	CMD ["./bin/server", "-m", "/models/llama-7b.gguf", "-p", "8000"]