2024-02-08 19:12:51 +00:00
# Base images. BASE_IMAGE is the default for every stage; the gRPC and Intel
# stages can each be pointed at a different image through their own ARG.
ARG BASE_IMAGE=ubuntu:22.04
ARG GRPC_BASE_IMAGE=${BASE_IMAGE}
ARG INTEL_BASE_IMAGE=${BASE_IMAGE}

# The requirements target installs the packages inherited by the driver,
# build and final stages below.
FROM ${BASE_IMAGE} AS requirements

ENV DEBIAN_FRONTEND=noninteractive

RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        ca-certificates \
        curl \
        espeak-ng \
        ffmpeg \
        libgomp1 \
        python-is-python3 \
        python3 \
        wget && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*
2023-10-16 19:46:29 +00:00
2024-04-30 08:12:19 +00:00
# The requirements-drivers target is for BUILD_TYPE specific items.
# Anything that is specific to CUDA, ROCm, Vulkan or CLBlast goes here.
FROM requirements AS requirements-drivers

# BUILD_TYPE selects which of the conditional driver installs below runs;
# SKIP_DRIVERS must be "false" for any of them to run.
ARG BUILD_TYPE
ARG SKIP_DRIVERS=false

# CUDA package version suffix used by the CuBLAS install (e.g. cuda-nvcc-12-0).
ARG CUDA_MAJOR_VERSION=12
ARG CUDA_MINOR_VERSION=0

# Platform arguments; TARGETARCH picks the NVIDIA repository for CuBLAS.
ARG TARGETARCH
ARG TARGETVARIANT

# Persist BUILD_TYPE into the environment so later stages and RUN steps see it.
ENV BUILD_TYPE=${BUILD_TYPE}
2024-06-24 18:04:58 +00:00
# Vulkan requirements
# Registers the LunarG signing key and jammy package list, then installs the
# Vulkan SDK. Only runs when BUILD_TYPE is "vulkan" and drivers are not skipped.
RUN <<EOT bash
    if [ "${BUILD_TYPE}" = "vulkan" ] && [ "${SKIP_DRIVERS}" = "false" ]; then
        apt-get update && \
        apt-get install -y --no-install-recommends \
            software-properties-common \
            pciutils \
            wget \
            gpg-agent && \
        wget -qO - https://packages.lunarg.com/lunarg-signing-key-pub.asc | apt-key add - && \
        wget -qO /etc/apt/sources.list.d/lunarg-vulkan-jammy.list https://packages.lunarg.com/vulkan/lunarg-vulkan-jammy.list && \
        apt-get update && \
        apt-get install -y vulkan-sdk && \
        apt-get clean && \
        rm -rf /var/lib/apt/lists/*
    fi
EOT
2024-04-30 08:12:19 +00:00
# CuBLAS requirements
# Registers NVIDIA's CUDA apt repository for the target architecture and
# installs the CUDA compiler plus the math library development packages.
# Only runs when BUILD_TYPE is "cublas" and drivers are not skipped.
RUN <<EOT bash
    # Stop at the first failing command. Previously the prerequisite install
    # was not chained to the rest of the script, so its failure was ignored.
    set -e
    if [ "${BUILD_TYPE}" = "cublas" ] && [ "${SKIP_DRIVERS}" = "false" ]; then
        apt-get update
        apt-get install -y --no-install-recommends \
            software-properties-common \
            pciutils

        # The keyring package lives under an architecture-specific repository path.
        # -f makes curl fail on an HTTP error instead of saving the error page.
        case "${TARGETARCH}" in
            amd64)
                curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/cuda-keyring_1.1-1_all.deb
                ;;
            arm64)
                curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/arm64/cuda-keyring_1.1-1_all.deb
                ;;
            *)
                echo "error: no CUDA keyring known for TARGETARCH='${TARGETARCH}'" >&2
                exit 1
                ;;
        esac

        dpkg -i cuda-keyring_1.1-1_all.deb
        rm -f cuda-keyring_1.1-1_all.deb
        apt-get update
        apt-get install -y --no-install-recommends \
            cuda-nvcc-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION} \
            libcufft-dev-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION} \
            libcurand-dev-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION} \
            libcublas-dev-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION} \
            libcusparse-dev-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION} \
            libcusolver-dev-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION}
        apt-get clean
        rm -rf /var/lib/apt/lists/*
    fi
EOT
2024-04-30 08:12:19 +00:00
# CLBlast requirements
# When building with clblas support, the CLBlast development library is
# needed by the builds.
RUN if [ "${BUILD_TYPE}" = "clblas" ] && [ "${SKIP_DRIVERS}" = "false" ]; then \
        apt-get update && \
        apt-get install -y --no-install-recommends libclblast-dev && \
        apt-get clean && \
        rm -rf /var/lib/apt/lists/*; \
    fi
2024-12-22 20:28:38 +00:00
# HipBLAS requirements
# The ROCm lib packages don't trigger ldconfig after they install, which
# results in local-ai and others not being able to locate the libraries.
# ldconfig is run explicitly at the end to work around this packaging deficiency.
RUN if [ "${BUILD_TYPE}" = "hipblas" ] && [ "${SKIP_DRIVERS}" = "false" ]; then \
        apt-get update && \
        apt-get install -y --no-install-recommends \
            hipblas-dev \
            rocblas-dev && \
        apt-get clean && \
        rm -rf /var/lib/apt/lists/* && \
        ldconfig; \
    fi
2025-06-26 16:41:38 +00:00
# Put the ROCm (HipBLAS) and CUDA tool directories at the front of PATH,
# ROCm first, followed by CUDA, followed by the inherited PATH.
ENV PATH=/opt/rocm/bin:/usr/local/cuda/bin:${PATH}
###################################
###################################
# The build-requirements target adds the compiler toolchain and build tools on
# top of requirements-drivers. Nothing should be placed here unless every
# single build will use it.
FROM requirements-drivers AS build-requirements

# Versions consumed by the Go and CMake install steps of this stage.
ARG GO_VERSION=1.22.6
ARG CMAKE_VERSION=3.26.4
ARG CMAKE_FROM_SOURCE=false
ARG TARGETARCH
ARG TARGETVARIANT

RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        ccache \
        curl \
        espeak-ng \
        git \
        git-lfs \
        libssl-dev \
        python-is-python3 \
        python3 \
        unzip \
        upx-ucl && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*
# Install CMake (the version in 22.04 is too old)
# With CMAKE_FROM_SOURCE=true, CMAKE_VERSION is built from the Kitware release
# tarball; otherwise the distribution's cmake package is installed.
# The comparison previously read "${CMAKE_FROM_SOURCE}}" (stray brace), which
# could never equal "true", so the from-source branch was unreachable.
RUN <<EOT bash
    if [ "${CMAKE_FROM_SOURCE}" = "true" ]; then
        curl -L -s https://github.com/Kitware/CMake/releases/download/v${CMAKE_VERSION}/cmake-${CMAKE_VERSION}.tar.gz -o cmake.tar.gz && tar xvf cmake.tar.gz && cd cmake-${CMAKE_VERSION} && ./configure && make && make install
    else
        apt-get update && \
        apt-get install -y \
            cmake && \
        apt-get clean && \
        rm -rf /var/lib/apt/lists/*
    fi
EOT
# Install Go
# Streams the official tarball for GO_VERSION / TARGETARCH straight into /usr/local.
RUN curl -L -s https://go.dev/dl/go${GO_VERSION}.linux-${TARGETARCH}.tar.gz \
    | tar -C /usr/local -xz

# Make both the Go toolchain and binaries produced by `go install` reachable.
ENV PATH=$PATH:/root/go/bin:/usr/local/go/bin

# Install grpc compilers and rice
# protoc-gen-go and protoc-gen-go-grpc are pinned; rice follows @latest.
RUN go install google.golang.org/protobuf/cmd/protoc-gen-go@v1.34.2 && \
    go install google.golang.org/grpc/cmd/protoc-gen-go-grpc@1958fcbe2ca8bd93af633f11e97d44e567e945af && \
    go install github.com/GeertJohan/go.rice/rice@latest
# Add any custom CA certificates from the build context to the system trust store
COPY --chmod=644 custom-ca-certs/* /usr/local/share/ca-certificates/
RUN update-ca-certificates

# OpenBLAS requirements and stable diffusion
RUN apt-get update && \
    apt-get install -y --no-install-recommends libopenblas-dev && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*
# Warn (without failing the build) when TARGETARCH was not provided
RUN if [ -z "$TARGETARCH" ]; then \
        echo 'warn: missing $TARGETARCH, either set this `ARG` manually, or run using `docker buildkit`'; \
    fi

# Print the platform variables so they show up in the build log
RUN echo "Target Architecture: $TARGETARCH"
RUN echo "Target Variant: $TARGETVARIANT"

WORKDIR /build
2023-06-26 20:34:03 +00:00
###################################
###################################
2024-05-22 21:35:39 +00:00
# Temporary workaround for Intel's apt repository, to be removed once Intel fixes it. See:
# https://community.intel.com/t5/Intel-oneAPI-Math-Kernel-Library/APT-Repository-not-working-signatures-invalid/m-p/1599436/highlight/true#M36143
FROM ${INTEL_BASE_IMAGE} AS intel

# Fetch Intel's graphics signing key and store it de-armored as an apt keyring
RUN wget -qO - https://repositories.intel.com/gpu/intel-graphics.key | \
    gpg --yes --dearmor --output /usr/share/keyrings/intel-graphics.gpg

# Register the Intel GPU repository, verified against the keyring written above
RUN echo "deb [arch=amd64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" > /etc/apt/sources.list.d/intel-graphics.list
###################################
###################################
2024-04-30 08:12:19 +00:00
# The grpc target does one thing: it builds and installs GRPC. It lives in its
# own stage so that it can be effectively cached by CI. You probably don't need
# to change anything here, and if you do, make sure that CI is adjusted so that
# the cache continues to work.
FROM ${GRPC_BASE_IMAGE} AS grpc

# This is a bit of a hack, but it's required in order to be able to effectively
# cache this layer in CI
ARG GRPC_MAKEFLAGS="-j4 -Otarget"
ARG GRPC_VERSION=v1.65.0
ARG CMAKE_FROM_SOURCE=false
ARG CMAKE_VERSION=3.26.4

# Passed to make through the environment for the GRPC build below
ENV MAKEFLAGS=${GRPC_MAKEFLAGS}

WORKDIR /build

RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        curl \
        git \
        libssl-dev && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*
2024-10-07 09:22:55 +00:00
# Install CMake (the version in 22.04 is too old)
# With CMAKE_FROM_SOURCE=true, CMAKE_VERSION is built from the Kitware release
# tarball; otherwise the distribution's cmake package is installed.
# The comparison previously read "${CMAKE_FROM_SOURCE}}" (stray brace), which
# could never equal "true", so the from-source branch was unreachable.
RUN <<EOT bash
    if [ "${CMAKE_FROM_SOURCE}" = "true" ]; then
        curl -L -s https://github.com/Kitware/CMake/releases/download/v${CMAKE_VERSION}/cmake-${CMAKE_VERSION}.tar.gz -o cmake.tar.gz && tar xvf cmake.tar.gz && cd cmake-${CMAKE_VERSION} && ./configure && make && make install
    else
        apt-get update && \
        apt-get install -y \
            cmake && \
        apt-get clean && \
        rm -rf /var/lib/apt/lists/*
    fi
EOT
2024-10-07 09:22:55 +00:00
2024-04-27 17:48:20 +00:00
# GRPC is installed to a separate prefix (/opt/grpc) so that later stages can
# copy in only the build artifacts. This saves several hundred MB on the final
# docker image size compared with copying in the entire GRPC source tree and
# running make install in the target container.
#
# The sed step inserts a "TESTONLY" line at line 216 of abseil's container
# CMakeLists.txt before configuring (NOTE(review): presumably to keep a
# test-only target out of the build; confirm against the abseil sources for
# GRPC_VERSION). The whole /build tree is removed once the install is done.
RUN git clone --recurse-submodules --jobs 4 -b ${GRPC_VERSION} --depth 1 --shallow-submodules https://github.com/grpc/grpc && \
    mkdir -p /build/grpc/cmake/build && \
    cd /build/grpc/cmake/build && \
    sed -i "216i\ TESTONLY" "../../third_party/abseil-cpp/absl/container/CMakeLists.txt" && \
    cmake -DgRPC_INSTALL=ON -DgRPC_BUILD_TESTS=OFF -DCMAKE_INSTALL_PREFIX:PATH=/opt/grpc ../.. && \
    make && \
    make install && \
    rm -rf /build
2024-03-29 21:32:40 +00:00
###################################
###################################
2024-08-14 07:06:41 +00:00
# The builder-base target has the arguments, variables, and copies shared
# between full builder images and the uncompiled devcontainer
FROM build-requirements AS builder-base

# Build-time knobs
ARG GO_TAGS="tts p2p"
ARG GRPC_BACKENDS
ARG MAKEFLAGS
ARG LD_FLAGS="-s -w"
ARG TARGETARCH
ARG TARGETVARIANT

# Export the knobs so that make sees them in the builder stages
ENV GRPC_BACKENDS=${GRPC_BACKENDS}
ENV GO_TAGS=${GO_TAGS}
ENV MAKEFLAGS=${MAKEFLAGS}
ENV LD_FLAGS=${LD_FLAGS}

# NVIDIA container runtime settings
ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility \
    NVIDIA_REQUIRE_CUDA="cuda>=${CUDA_MAJOR_VERSION}.0" \
    NVIDIA_VISIBLE_DEVICES=all

# Record the effective tags and architecture in the build log
RUN echo "GO_TAGS: $GO_TAGS" && echo "TARGETARCH: $TARGETARCH"

WORKDIR /build
2024-04-13 07:37:32 +00:00
2023-07-02 09:14:09 +00:00
2024-04-27 17:48:20 +00:00
# We need protoc installed, and the version in 22.04 is too old. We will create
# one as part of installing the GRPC build below, but that will also bring in a
# newer version of absl which stablediffusion cannot compile with. This version
# of protoc is only here so that we can generate the grpc code for the
# stablediffusion build.
#
# Only amd64 and arm64 have a download; any other TARGETARCH is skipped.
RUN <<EOT bash
    # Stop at the first failing command. Previously a failed amd64 download was
    # masked because the trailing arm64 check still ended the script with 0.
    set -e
    case "${TARGETARCH}" in
        amd64)
            # -f makes curl fail on an HTTP error instead of saving the error page
            curl -fsSL https://github.com/protocolbuffers/protobuf/releases/download/v27.1/protoc-27.1-linux-x86_64.zip -o protoc.zip
            unzip -j -d /usr/local/bin protoc.zip bin/protoc
            rm protoc.zip
            ;;
        arm64)
            curl -fsSL https://github.com/protocolbuffers/protobuf/releases/download/v27.1/protoc-27.1-linux-aarch_64.zip -o protoc.zip
            unzip -j -d /usr/local/bin protoc.zip bin/protoc
            rm protoc.zip
            ;;
    esac
EOT
2024-04-27 17:48:20 +00:00
2024-08-20 10:16:21 +00:00
###################################
###################################
2025-05-25 20:25:05 +00:00
# Compile backends first in a separate stage
FROM builder-base AS builder-backends

ARG TARGETARCH
ARG TARGETVARIANT

# Bring in the GRPC artifacts produced by the grpc stage
COPY --from=grpc /opt/grpc /usr/local

WORKDIR /build

# Copy only what the backend build needs, ahead of the full source tree
COPY ./Makefile .
COPY ./backend ./backend
COPY ./go.mod .
COPY ./go.sum .
COPY ./.git ./.git

# Some of the Go backends use libs from the main src, we could further optimize
# the caching by building the CPP backends before here
COPY ./pkg/grpc ./pkg/grpc
COPY ./pkg/utils ./pkg/utils
COPY ./pkg/langchain ./pkg/langchain

RUN ls -l ./
RUN make backend-assets
RUN make prepare

# Build every backend, except on arm64 or hipblas builds where the
# AVX-specific llama-cpp variants are skipped
RUN if [ "${TARGETARCH}" != "arm64" ] && [ "${BUILD_TYPE}" != "hipblas" ]; then \
        make grpcs; \
    else \
        SKIP_GRPC_BACKEND="backend-assets/grpc/llama-cpp-avx512 backend-assets/grpc/llama-cpp-avx backend-assets/grpc/llama-cpp-avx2" make grpcs; \
    fi
# The builder target compiles LocalAI. This target is not the target that will
# be uploaded to the registry. Adjustments to the build process should likely
# be made here.
FROM builder-backends AS builder

WORKDIR /build

COPY . .

## Build the binary
## If we're on arm64 OR building for hipblas, skip the AVX-specific llama-cpp
## backends to save space. Otherwise just run the normal build.
RUN if [ "${TARGETARCH}" != "arm64" ] && [ "${BUILD_TYPE}" != "hipblas" ]; then \
        make build; \
    else \
        SKIP_GRPC_BACKEND="backend-assets/grpc/llama-cpp-avx512 backend-assets/grpc/llama-cpp-avx backend-assets/grpc/llama-cpp-avx2" make build; \
    fi
2023-05-30 13:53:37 +00:00
2023-12-07 21:58:41 +00:00
# Make sure the piper library directory exists and contains at least one entry,
# so the final stage's wildcard COPY from it always has something to match.
# mkdir and touch are now chained with &&; without it, "touch" and the keep
# path were passed to mkdir as additional directory names.
RUN if [ ! -d "/build/sources/go-piper/piper-phonemize/pi/lib/" ]; then \
        mkdir -p /build/sources/go-piper/piper-phonemize/pi/lib/ && \
        touch /build/sources/go-piper/piper-phonemize/pi/lib/keep; \
    fi
2023-06-26 20:34:03 +00:00
###################################
###################################
2024-08-14 07:06:41 +00:00
# The devcontainer target is not used on CI. It is a target for developers to
# use locally - rather than copying files it mounts them locally and leaves
# building to the developer
FROM builder-base AS devcontainer

COPY --from=grpc /opt/grpc /usr/local
COPY .devcontainer-scripts /.devcontainer-scripts

# For the devcontainer, leave apt functional in case additional devtools are
# needed at runtime (no apt-get clean / list removal here).
RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        less \
        ssh

# Developer tooling: the delve debugger and yq
RUN go install github.com/go-delve/delve/cmd/dlv@latest
RUN go install github.com/mikefarah/yq/v4@latest
2024-08-14 07:06:41 +00:00
###################################
###################################
2024-04-30 08:12:19 +00:00
# This is the final target. The result of this target will be the image
# uploaded to the registry. If you cannot find a more suitable place for an
# addition, this layer is a suitable place for it.
FROM requirements-drivers

ARG CUDA_MAJOR_VERSION=12

# URL polled by the HEALTHCHECK defined for this image
ENV HEALTHCHECK_ENDPOINT=http://localhost:8080/readyz

# NVIDIA container runtime settings
ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility \
    NVIDIA_REQUIRE_CUDA="cuda>=${CUDA_MAJOR_VERSION}.0" \
    NVIDIA_VISIBLE_DEVICES=all
2025-06-26 16:41:38 +00:00
WORKDIR /

COPY ./entrypoint.sh .

# Copy the binary
COPY --from=builder /build/local-ai ./

# Copy shared libraries for piper
COPY --from=builder /build/sources/go-piper/piper-phonemize/pi/lib/* /usr/lib/

# Make sure the models and backends directories exist
RUN mkdir -p /models /backends

# Define the health check command
HEALTHCHECK --interval=1m --timeout=10m --retries=10 \
    CMD curl -f ${HEALTHCHECK_ENDPOINT} || exit 1

VOLUME /models /backends

EXPOSE 8080

ENTRYPOINT ["/entrypoint.sh"]