dockerfile(backend): initial working version of llama.cpp container
This commit is contained in:
parent
02cd6fe427
commit
daf1631e09
|
@ -15,8 +15,10 @@ COPY router router
|
||||||
RUN cargo chef prepare --recipe-path recipe.json
|
RUN cargo chef prepare --recipe-path recipe.json
|
||||||
|
|
||||||
FROM chef AS builder
|
FROM chef AS builder
|
||||||
ENV CMAKE_INSTALL_PREFIX=${CWD}/dist
|
ENV CMAKE_INSTALL_PREFIX=/usr/src/text-generation-inference/dist
|
||||||
RUN apt update && DEBIAN_FRONTEND=noninteractive apt install -y \
|
RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
|
||||||
|
--mount=type=cache,target=/var/lib/apt,sharing=locked \
|
||||||
|
apt update && DEBIAN_FRONTEND=noninteractive apt install -y \
|
||||||
clang \
|
clang \
|
||||||
cmake \
|
cmake \
|
||||||
gcc g++ \
|
gcc g++ \
|
||||||
|
@ -48,8 +50,23 @@ COPY launcher launcher
|
||||||
COPY router router
|
COPY router router
|
||||||
|
|
||||||
ENV RUSTFLAGS="-L/usr/lib"
|
ENV RUSTFLAGS="-L/usr/lib"
|
||||||
|
ENV CMAKE_INSTALL_PREFIX=/usr/src/text-generation-inference/dist
|
||||||
RUN cargo build --profile release-opt --package text-generation-backend-llamacpp --bin text-generation-backend-llamacpp --frozen
|
RUN cargo build --profile release-opt --package text-generation-backend-llamacpp --bin text-generation-backend-llamacpp --frozen
|
||||||
|
|
||||||
FROM ubuntu:24.04
|
FROM ubuntu:22.04
|
||||||
|
ENV DEBIAN_FRONTEND=noninteractive
|
||||||
|
|
||||||
|
RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
|
||||||
|
--mount=type=cache,target=/var/lib/apt,sharing=locked \
|
||||||
|
apt update && \
|
||||||
|
apt upgrade -y && \
|
||||||
|
apt install -y \
|
||||||
|
openssl \
|
||||||
|
python3.11-dev
|
||||||
|
|
||||||
COPY --from=builder /usr/src/text-generation-inference/target/release-opt/text-generation-backend-llamacpp /usr/src/text-generation-inference/text-generation-launcher
|
COPY --from=builder /usr/src/text-generation-inference/target/release-opt/text-generation-backend-llamacpp /usr/src/text-generation-inference/text-generation-launcher
|
||||||
COPY --from=builder /usr/src/text-generation-inference/dist /usr/
|
COPY --from=builder /usr/src/text-generation-inference/dist /usr/
|
||||||
|
|
||||||
|
ENV PORT=8080
|
||||||
|
WORKDIR /usr/src/text-generation-inference
|
||||||
|
ENTRYPOINT ["text-generation-launcher"]
|
Loading…
Reference in New Issue