wmma: add CUDA tensor core (#3464)

This commit is contained in:
Francis Lam
2024-02-22 02:57:08 -08:00
committed by GitHub
parent 57678012e1
commit e9cef13f0b
7 changed files with 54 additions and 32 deletions

View File

@@ -45,6 +45,7 @@ jobs:
run: |
DEBUG=2 EMULATE_METAL=1 FORWARD_ONLY=1 PYTHON=1 python3 ./test/test_linearizer.py TestLinearizer.test_tensor_cores
DEBUG=2 EMULATE_HIP=1 FORWARD_ONLY=1 PYTHON=1 python3 ./test/test_linearizer.py TestLinearizer.test_tensor_cores
DEBUG=2 EMULATE_CUDA=1 FORWARD_ONLY=1 PYTHON=1 python3 ./test/test_linearizer.py TestLinearizer.test_tensor_cores
- name: Test dtype with Python emulator
run: DEBUG=2 PYTHON=1 python3 test/test_dtype.py
- name: Test ops with Python emulator