# Multi-stage image build that compiles the project in the build context with
# -DGGML_OPENVINO=ON against a downloaded OpenVINO toolkit.
#
# Stages:
#   build  - installs the toolchain and OpenVINO, compiles the project, and
#            collects shared libraries in /app/lib and binaries/tools in /app/full
#   base   - runtime image carrying the collected shared libraries in /app
#   full   - base + everything from /app/full and a Python venv (tools.sh entrypoint)
#   light  - base + llama-cli only
#   server - base + llama-server only, with a curl-based health check

# Global build arguments; each stage re-declares the ones it uses.
ARG OPENVINO_VERSION_MAJOR=2025.2
ARG OPENVINO_VERSION_FULL=2025.2.0.19140.c01cd93e24d
ARG UBUNTU_VERSION=24.04

# Optional proxy build arguments - empty by default
ARG http_proxy=
ARG https_proxy=

## Build Image
FROM ubuntu:${UBUNTU_VERSION} AS build

# Pass proxy args to build stage
ARG http_proxy
ARG https_proxy

RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        ca-certificates \
        gnupg \
        wget \
        git \
        cmake \
        ninja-build \
        build-essential \
        libtbb12 \
        libcurl4-openssl-dev && \
    rm -rf /var/lib/apt/lists/*

# Install OpenVINO for Ubuntu 24.04
ARG OPENVINO_VERSION_MAJOR
ARG OPENVINO_VERSION_FULL
# Download and unpack the toolkit archive, move it to a versioned directory
# under /opt/intel, run its dependency installer (answering "Y" to its prompt),
# and expose it through the version-independent symlink /opt/intel/openvino.
RUN mkdir -p /opt/intel && \
    wget https://storage.openvinotoolkit.org/repositories/openvino/packages/${OPENVINO_VERSION_MAJOR}/linux/openvino_toolkit_ubuntu24_${OPENVINO_VERSION_FULL}_x86_64.tgz && \
    tar -xf openvino_toolkit_ubuntu24_${OPENVINO_VERSION_FULL}_x86_64.tgz && \
    mv openvino_toolkit_ubuntu24_${OPENVINO_VERSION_FULL}_x86_64 /opt/intel/openvino_${OPENVINO_VERSION_MAJOR} && \
    cd /opt/intel/openvino_${OPENVINO_VERSION_MAJOR} && \
    echo "Y" | ./install_dependencies/install_openvino_dependencies.sh && \
    cd - && \
    ln -s /opt/intel/openvino_${OPENVINO_VERSION_MAJOR} /opt/intel/openvino

ENV OpenVINO_DIR=/opt/intel/openvino

WORKDIR /app

COPY . .

# Build Stage
# setupvars.sh is sourced in the same bash process that runs cmake, so the
# environment it sets up is visible to both the configure and the build step.
RUN bash -c "source ${OpenVINO_DIR}/setupvars.sh && \
    cmake -B build/ReleaseOV -G Ninja \
        -DCMAKE_BUILD_TYPE=Release \
        -DGGML_OPENVINO=ON && \
    cmake --build build/ReleaseOV -j$(nproc)"

# Copy all necessary libraries
# OpenVINO libraries are taken from runtime/lib/intel64 when that directory
# exists and from lib/intel64 otherwise. An explicit directory test is used
# rather than an `a && b || c` chain so that a failing mkdir or build-tree
# find aborts the step instead of being masked by the fallback.
# `cp -P` keeps symbolic links as links for the OpenVINO libraries.
RUN mkdir -p /app/lib && \
    find build/ReleaseOV -name '*.so*' -exec cp {} /app/lib \; && \
    if [ -d "${OpenVINO_DIR}/runtime/lib/intel64" ]; then \
        find "${OpenVINO_DIR}/runtime/lib/intel64" -name '*.so*' -exec cp -P {} /app/lib \; ; \
    else \
        find "${OpenVINO_DIR}/lib/intel64" -name '*.so*' -exec cp -P {} /app/lib \; ; \
    fi

# Create runtime directories and copy binaries
RUN mkdir -p /app/full \
    && cp build/ReleaseOV/bin/* /app/full/ \
    && cp *.py /app/full \
    && cp -r gguf-py /app/full \
    && cp -r requirements /app/full \
    && cp requirements.txt /app/full \
    && cp .devops/tools.sh /app/full/tools.sh

## Base Runtime Image
FROM ubuntu:${UBUNTU_VERSION} AS base

# Pass proxy args to runtime stage
ARG http_proxy
ARG https_proxy

# Install runtime packages, then strip apt caches and temp files from the layer.
# apt-get is used throughout (matching the other stages).
RUN apt-get update \
    && apt-get install -y libgomp1 libtbb12 curl \
    && apt-get autoremove -y \
    && apt-get clean -y \
    && rm -rf /tmp/* /var/tmp/* \
    && find /var/cache/apt/archives /var/lib/apt/lists -not -name lock -type f -delete \
    && find /var/cache -type f -delete

# Shared libraries collected by the build stage live next to the binaries in /app.
COPY --from=build /app/lib/ /app/

### Full (all binaries)
FROM base AS full

ARG http_proxy
ARG https_proxy

COPY --from=build /app/full /app/

WORKDIR /app

# Python tooling is installed into a dedicated virtualenv at /ov-venv.
RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        git \
        python3 \
        python3-venv \
        python3-pip && \
    python3 -m venv /ov-venv && \
    /ov-venv/bin/pip install --no-cache-dir --upgrade pip setuptools wheel && \
    /ov-venv/bin/pip install --no-cache-dir -r requirements.txt && \
    apt-get autoremove -y && \
    apt-get clean && \
    rm -rf /tmp/* /var/tmp/* && \
    find /var/cache/apt/archives /var/lib/apt/lists -not -name lock -type f -delete && \
    find /var/cache -type f -delete

# Activate the venv, then replace the shell with tools.sh; the trailing "--"
# becomes $0 so that container arguments arrive intact in "$@".
ENTRYPOINT ["/bin/bash", "-c", "source /ov-venv/bin/activate && exec /app/tools.sh \"$@\"", "--"]

### Light, CLI only
FROM base AS light

COPY --from=build /app/full/llama-cli /app/

WORKDIR /app

ENTRYPOINT [ "/app/llama-cli" ]

### Server, Server only
FROM base AS server

ENV LLAMA_ARG_HOST=0.0.0.0

COPY --from=build /app/full/llama-server /app/

WORKDIR /app

# Health check probes the server's /health endpoint on port 8080.
HEALTHCHECK CMD [ "curl", "-f", "http://localhost:8080/health" ]

ENTRYPOINT [ "/app/llama-server" ]