nllb-api-v3 / Dockerfile
winstxnhdw's picture
feat: use only a single worker with 2 translators
e01c6a6
raw
history blame
190 Bytes
# Thin configuration layer on top of the published nllb-api image: it adds no
# files or packages, only runtime environment variables and the port contract.
# NOTE(review): `main` is a moving tag; consider pinning a digest if
# reproducible builds matter for this deployment.
FROM ghcr.io/winstxnhdw/nllb-api:main

# Runtime settings, grouped in a single ENV instruction.
#   SERVER_PORT                      port advertised by EXPOSE below; presumably
#                                    also read by the server in the base image
#                                    (TODO confirm).
#   OMP_NUM_THREADS                  OpenMP thread count.
#   CT2_USE_EXPERIMENTAL_PACKED_GEMM CTranslate2 toggle (see CTranslate2 docs).
#   CT2_FORCE_CPU_ISA                CTranslate2 CPU instruction-set override.
#                                    NOTE(review): AVX512 presumably requires
#                                    host CPU support; confirm for the target.
#   WORKER_COUNT                     presumably the number of server workers
#                                    started by the base image (verify there).
ENV SERVER_PORT=7860 \
    OMP_NUM_THREADS=2 \
    CT2_USE_EXPERIMENTAL_PACKED_GEMM=1 \
    CT2_FORCE_CPU_ISA=AVX512 \
    WORKER_COUNT=1

# EXPOSE is documentation only; it records the port declared in SERVER_PORT.
EXPOSE ${SERVER_PORT}