diff --git a/Dockerfile_trtllm b/Dockerfile_trtllm index 3ccb0310..8f0c549c 100644 --- a/Dockerfile_trtllm +++ b/Dockerfile_trtllm @@ -1,5 +1,5 @@ ARG CUDA_ARCH_LIST="75-real;80-real;86-real;89-real;90-real" -ARG OMPI_VERSION="4.1.6" +ARG OMPI_VERSION="4.1.7rc1" # Build dependencies resolver stage FROM lukemathwalker/cargo-chef:latest AS chef diff --git a/backends/trtllm/lib/backend.cpp b/backends/trtllm/lib/backend.cpp index ad22b0c7..b5364001 100644 --- a/backends/trtllm/lib/backend.cpp +++ b/backends/trtllm/lib/backend.cpp @@ -52,7 +52,7 @@ huggingface::tgi::backends::GetParallelConfig(const size_t worldSize, const std: if (worldSize > 1) { SPDLOG_INFO("Detected sharded engine deployment, using orchestrator mode"); mode = tle::CommunicationMode::kORCHESTRATOR; - orchestratorConfig = std::make_optional(true, workerPath, nullptr, true); + orchestratorConfig = std::make_optional(true, workerPath); } else { SPDLOG_INFO("Detected single engine deployment, using leader mode"); }