Fixing rocm gptq by using triton code too (renamed cuda into triton). (#2691)

This commit is contained in:
Nicolas Patry 2024-10-25 09:17:57 +02:00 committed by GitHub
parent 43df056eee
commit cece8635f8
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 2 additions and 2 deletions

View File

@@ -10,8 +10,8 @@ from text_generation_server.utils.weights import Weight, Weights, WeightsLoader
 if SYSTEM == "ipex":
     from .ipex import QuantLinear
-elif SYSTEM == "cuda":
-    from .cuda import QuantLinear
+elif SYSTEM in {"cuda", "rocm"}:
+    from .triton import QuantLinear
@dataclass