Add fix for attention slicing fp16 (#1217)

2026-04-03 03:00:17 -04:00 · 2023-03-20 22:11:29 -04:00
parent d105246b9c
commit 7899e1803a
1 changed file with 1 addition and 0 deletions
--- a/shark/shark_importer.py
+++ b/shark/shark_importer.py
@@ -297,6 +297,7 @@ def transform_fx(fx_g):
            if node.target in [
                torch.ops.aten.arange,
                torch.ops.aten.empty,
+                torch.ops.aten.zeros,
            ]:
                node.kwargs = kwargs_dict
            # Inputs and outputs of aten.var.mean should be upcasted to fp32.