[MFMA] [FA] Keep bf16 results of FA dot operations in registers (#298)

This PR enables the optimization that keeps bf16 values in registers between dot operations (previously it was applied only to f16).
This commit is contained in:
Alexander Efimov
2023-08-18 14:33:00 +02:00
committed by GitHub
parent 9ab335196f
commit 01b0108c94
2 changed files with 4 additions and 3 deletions

View File

@@ -228,7 +228,7 @@ bool isMfmaToDotShortcut(RankedTensorType &srcTy, RankedTensorType &dstTy) {
return mfmaLayout.getWarpsPerCTA()[1] == 1 &&
dotOperandLayout.getOpIdx() == 0 &&
dotOperandLayout.getParent() == mfmaLayout &&
mfmaLayout.getIsTransposed() && srcTy.getElementType().isF16();
mfmaLayout.getIsTransposed() && (srcTy.getElementType().isF16() || srcTy.getElementType().isBF16());
}
#endif