nllb-api / Dockerfile
winstxnhdw's picture
perf/build/docs: use translator threads instead of workers
1cc3f06
raw
history blame
196 Bytes
# Thin configuration layer over the prebuilt nllb-api image: nothing is
# installed or copied here, only runtime environment variables are set.
# NOTE(review): `main` is a mutable tag, so rebuilds may resolve to a different
# base image — consider pinning a release tag or digest if reproducibility matters.
FROM ghcr.io/winstxnhdw/nllb-api:main

# Runtime settings, declared in a single ENV instruction:
#   SERVER_PORT                      - reused by EXPOSE below; presumably the port
#                                      the API server binds to (confirm in base image).
#   OMP_NUM_THREADS                  - standard OpenMP variable capping the number
#                                      of threads per parallel region.
#   CT2_USE_EXPERIMENTAL_PACKED_GEMM - CTranslate2 switch for its experimental
#                                      packed GEMM path.
#   CT2_FORCE_CPU_ISA                - CTranslate2 override of CPU ISA detection.
#                                      NOTE(review): assumes the host CPU supports
#                                      AVX512 — confirm for the deployment target.
#   TRANSLATOR_THREADS               - application-specific; presumably the number
#                                      of translator threads the server starts.
ENV SERVER_PORT=7860 \
    OMP_NUM_THREADS=1 \
    CT2_USE_EXPERIMENTAL_PACKED_GEMM=1 \
    CT2_FORCE_CPU_ISA=AVX512 \
    TRANSLATOR_THREADS=4

# EXPOSE is documentation only; it records the port without publishing it.
EXPOSE ${SERVER_PORT}