LibreTranslate/docker/cuda.Dockerfile
2026-02-10 15:22:34 -05:00

60 lines
1.8 KiB
Docker

FROM nvidia/cuda:12.4.1-runtime-ubuntu22.04 AS builder
WORKDIR /app
ARG DEBIAN_FRONTEND=noninteractive
RUN apt-get update -qq \
&& apt-get -qqq install --no-install-recommends -y pkg-config gcc g++ python3-dev python3-pip python3-venv git \
&& apt-get upgrade --assume-yes \
&& apt-get clean \
&& rm -rf /var/lib/apt
RUN python3 -m venv venv && ./venv/bin/pip install --no-cache-dir --upgrade pip
COPY . .
# Install package from source code, compile translations
RUN ./venv/bin/pip install Babel==2.12.1 && ./venv/bin/python scripts/compile_locales.py \
&& ./venv/bin/pip install "numpy<2" \
&& ./venv/bin/pip install . \
&& ./venv/bin/pip uninstall -y onnxruntime && ./venv/bin/pip install --no-cache-dir onnxruntime-gpu>=1.10.0 \
&& ./venv/bin/pip cache purge
FROM nvidia/cuda:12.4.1-runtime-ubuntu22.04
ENV ARGOS_DEVICE_TYPE auto
ARG with_models=false
ARG models=""
WORKDIR /app
ARG DEBIAN_FRONTEND=noninteractive
RUN apt-get update -qq \
&& apt-get -qqq install --no-install-recommends -y python3 python3-pip \
&& apt-get clean \
&& rm -rf /var/lib/apt
RUN ln -s /usr/bin/python3 /usr/bin/python
COPY --from=builder /app /app
ENV PATH="/app/venv/bin:$PATH"
COPY --from=builder /app/venv/bin/ltmanage /usr/bin/
RUN if [ "$with_models" = "true" ]; then \
# initialize the language models
if [ ! -z "$models" ]; then \
python scripts/install_models.py --load_only_lang_codes "$models"; \
else \
python scripts/install_models.py; \
fi \
fi
# Depending on your cuda install you may need to uncomment this line to allow the container to access the cuda libraries
# See: https://docs.nvidia.com/cuda/cuda-installation-guide-linux/index.html#post-installation-actions
# ENV LD_LIBRARY_PATH=/usr/local/cuda/lib:/usr/local/cuda/lib64
EXPOSE 5000
ENTRYPOINT [ "libretranslate", "--host", "*" ]