[BACKEND] Solidify f8e4m3 (#2105)

Co-authored-by: Philippe Tillet <phil@openai.com>
This commit is contained in:
Zahi Moudallal
2023-08-18 19:12:09 -07:00
committed by GitHub
parent 23ef2615d2
commit 23dd11d471
18 changed files with 171 additions and 172 deletions

View File

@@ -381,7 +381,7 @@ def get_max_tensorcore_tflops(dtype, backend=None, device=None, clock_rate=None)
ops_per_sub_core = 256
elif dtype in [torch.float16, torch.bfloat16, torch.int16]:
ops_per_sub_core = 512
elif dtype in [torch.int8, tl.float8e4, tl.float8e4b15, tl.float8e5]:
elif dtype in [torch.int8, tl.float8e4nv, tl.float8e4b15, tl.float8e5]:
ops_per_sub_core = 1024
else:
raise RuntimeError("dtype not supported")