[CODEGEN] Bugfixes with FP32 async copy

This commit is contained in:
Philippe Tillet
2021-02-24 13:36:26 -05:00
parent bfe92a5d91
commit db6bf71564
3 changed files with 12 additions and 11 deletions

View File

@@ -44,7 +44,7 @@ import torch
(128, 128, 32, 1, 4, 384, 128, 640, AT, BT, DTYPE),
(128, 128, 32, 1, 4, 107, 233, 256, AT, BT, DTYPE),
(128, 128, 32, 1, 4, 107, 233, 311, AT, BT, DTYPE),
-] for DTYPE in ["float16"] for AT in [False, True] for BT in [False, True]
+] for DTYPE in ["float16", "float32"] for AT in [False, True] for BT in [False, True]
]),
)
def test_op(TM, TN, TK, SPLITK, NWARP, M, N, K, AT, BT, DTYPE):