mirror of
https://github.com/ROCm/ROCm.git
synced 2026-04-05 03:01:17 -04:00
[Triton] Mfma16 support (#251)
* [MFMA] Support mfma with NM size 16. This PR adds code emission of MFMA instructions with size 16. * Add control over mfma type with the MFMA_TYPE=16 env var
This commit is contained in:
@@ -257,7 +257,8 @@ private:
|
||||
SmallVector<SmallVector<unsigned>> offsets;
|
||||
assert(rank == 2);
|
||||
SmallVector<Value> multiDimOffset(rank);
|
||||
emitMfmaOffsetForCTA(mfmaLayout, offsets, multiDimCTAInRepId[0], multiDimCTAInRepId[1]);
|
||||
emitMfmaOffsetForCTA(mfmaLayout, offsets, multiDimCTAInRepId[0],
|
||||
multiDimCTAInRepId[1]);
|
||||
multiDimOffset[0] = add(multiDimBase[0], i32_val(offsets[elemId][0]));
|
||||
multiDimOffset[1] = add(multiDimBase[1], i32_val(offsets[elemId][1]));
|
||||
return multiDimOffset;
|
||||
|
||||
Reference in New Issue
Block a user