parent
2358c2bb54
commit
0da4df4b96
|
@ -26,8 +26,8 @@ class KVCache:
|
||||||
|
|
||||||
if (
|
if (
|
||||||
dtype == torch.float8_e5m2
|
dtype == torch.float8_e5m2
|
||||||
and ATTENTION != "flashinfer"
|
and (ATTENTION != "flashinfer"
|
||||||
and SYSTEM != "cuda"
|
or SYSTEM != "cuda")
|
||||||
):
|
):
|
||||||
raise ValueError(
|
raise ValueError(
|
||||||
"float8_e5m2 KV cache is currently only supported for flashinfer on CUDA"
|
"float8_e5m2 KV cache is currently only supported for flashinfer on CUDA"
|
||||||
|
|
Loading…
Reference in New Issue