[Triton] Mfma16 support (#251)

* [MFMA] Support mfma with NM size 16

This PR adds code emission of MFMA instructions with size 16.

* add control over mfma type with MFMA_TYPE=16 env var
This commit is contained in:
Alexander Efimov
2023-10-09 20:59:54 +02:00
committed by GitHub
parent e801638b40
commit 7e34c244c2
11 changed files with 252 additions and 107 deletions

View File

@@ -257,7 +257,8 @@ private:
SmallVector<SmallVector<unsigned>> offsets;
assert(rank == 2);
SmallVector<Value> multiDimOffset(rank);
emitMfmaOffsetForCTA(mfmaLayout, offsets, multiDimCTAInRepId[0], multiDimCTAInRepId[1]);
emitMfmaOffsetForCTA(mfmaLayout, offsets, multiDimCTAInRepId[0],
multiDimCTAInRepId[1]);
multiDimOffset[0] = add(multiDimBase[0], i32_val(offsets[elemId][0]));
multiDimOffset[1] = add(multiDimBase[1], i32_val(offsets[elemId][1]));
return multiDimOffset;