From 11d7af730bf42cb277dde2be754d83716f88da9f Mon Sep 17 00:00:00 2001
From: Mohit Sharma
Date: Fri, 4 Oct 2024 17:41:02 +0000
Subject: [PATCH] add cloning in Dockerfile

---
 .github/workflows/build.yaml |  2 --
 Dockerfile_amd               | 11 ++++++++++-
 2 files changed, 10 insertions(+), 3 deletions(-)

diff --git a/.github/workflows/build.yaml b/.github/workflows/build.yaml
index 23946173..ce1cdc33 100644
--- a/.github/workflows/build.yaml
+++ b/.github/workflows/build.yaml
@@ -35,8 +35,6 @@ jobs:
     steps:
       - name: Checkout repository
         uses: actions/checkout@v4
-        with:
-          lfs: true
       - name: Inject slug/short variables
         uses: rlespinasse/github-slug-action@v4.4.1
       - name: Construct harware variables
diff --git a/Dockerfile_amd b/Dockerfile_amd
index e4665004..049fa8b1 100644
--- a/Dockerfile_amd
+++ b/Dockerfile_amd
@@ -265,6 +265,15 @@ COPY server/exllamav2_kernels/ .

 RUN python setup.py build

+# Throwaway stage: clone the repository and pull its git-lfs objects so the
+# tuned-ops CSV can be copied from here rather than from the build context.
+FROM base AS get_tuned_ops
+# -y is required: docker build has no TTY to answer apt's confirmation prompt.
+RUN apt-get update && apt-get install -y git-lfs
+RUN git clone https://github.com/huggingface/text-generation-inference.git
+WORKDIR /text-generation-inference
+RUN git checkout add_tunable_prefill && git lfs pull
+
 FROM install_deps AS base-copy

 # Text Generation Inference base env
@@ -328,6 +337,6 @@ ENV ATTENTION=paged
 ENV USE_PREFIX_CACHING=0
 ENV ROCM_USE_SKINNY_GEMM=1

-COPY ./rocm_tuned_ops/afo_tune_device_0_full.csv /afo_tune/
+COPY --from=get_tuned_ops /text-generation-inference/rocm_tuned_ops/afo_tune_device_0_full.csv /afo_tune/afo_tune_device_0_full.csv
 RUN seq 1 7 | xargs -I{} cp /afo_tune/afo_tune_device_0_full.csv /afo_tune/afo_tune_device_{}_full.csv
 ENV PYTORCH_TUNABLEOP_FILENAME=/afo_tune/afo_tune_device_%d_full.csv