From 0c478846c5002a4053b0349d6557bafb9cedc935 Mon Sep 17 00:00:00 2001
From: Nicolas Patry
Date: Fri, 11 Oct 2024 21:47:03 +0200
Subject: [PATCH] Fixing intel Supports windowing. (#2637)

---
 server/text_generation_server/layers/attention/common.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/server/text_generation_server/layers/attention/common.py b/server/text_generation_server/layers/attention/common.py
index d6e512c0..c8ac0c2a 100644
--- a/server/text_generation_server/layers/attention/common.py
+++ b/server/text_generation_server/layers/attention/common.py
@@ -68,5 +68,5 @@ else:
         def clamp(self, max):
             if SYSTEM == "rocm":
                 return self
-            raise NotImplementedError("Not implemented seqlen for paged")
-            return Seqlen(torch.clamp(self.input_lengths, max=max))
+            self.input_lengths = torch.clamp(self.input_lengths, max=max)
+            return self