mirror of
https://github.com/ROCm/ROCm.git
synced 2026-04-05 03:01:17 -04:00
ROCM IFU: Fix test_core_amd.py::test_reduce_layouts
This commit is contained in:
@@ -2968,7 +2968,7 @@ def test_reduce_layouts(M, N, src_layout, axis, device='cuda'):
|
||||
%14 = triton_gpu.convert_layout %13 : (tensor<{M}x{N}xf32, #blocked>) -> tensor<{M}x{N}xf32, #src>
|
||||
%15 = "tt.reduce"(%14) ({{
|
||||
^bb0(%arg3: f32, %arg4: f32):
|
||||
- %16 = "triton_gpu.cmpf"(%arg3, %arg4) {{predicate = 2 : i64}} : (f32, f32) -> i1
|
||||
+ %16 = "arith.cmpf"(%arg3, %arg4) {{predicate = 2 : i64}} : (f32, f32) -> i1
|
||||
%17 = arith.select %16, %arg3, %arg4 : f32
|
||||
tt.reduce.return %17 : f32
|
||||
}}) {{axis = {axis} : i32}} : (tensor<{M}x{N}xf32, #src>) -> tensor<{rdims_1d}xf32, #triton_gpu.slice<{{dim = {axis}, parent = #src}}>>
|
||||
|
||||
Reference in New Issue
Block a user