[IPEX] Fix SDPA attn_mask dtype

This commit is contained in:
Nuullll 2024-01-06 16:32:18 +08:00
parent 8b6848c6db
commit 16b4d2cf3f
1 changed file with 2 additions and 0 deletions

View File

@@ -41,6 +41,8 @@ def torch_xpu_scaled_dot_product_attention(
# cast to same dtype first
key = key.to(query.dtype)
value = value.to(query.dtype)
if attn_mask is not None and attn_mask.dtype != torch.bool:
attn_mask = attn_mask.to(query.dtype)
N = query.shape[:-2] # Batch size
L = query.size(-2) # Target sequence length