[codegen] bugfix in alignment inference

This commit is contained in:
Philippe Tillet
2019-06-25 15:06:15 -07:00
parent edc31cabb0
commit d52abc9379
7 changed files with 170 additions and 52 deletions

View File

@@ -26,9 +26,9 @@ const tunable int32 TN = {64, 128};
const tunable int32 TK = {16};
const tunable int32 GZ = {1};
-void matmul(restrict read_only align(4) fp16 *A,
-restrict read_only align(4) fp16 *B,
-align(4) fp32 *C,
+void matmul(restrict read_only align(16) fp16 *A,
+restrict read_only align(16) fp16 *B,
+align(16) fp32 *C,
int32 M, int32 N, int32 K,
multiple_of(4) int32 lda, multiple_of(4) int32 ldb, multiple_of(4) int32 ldc,
int32 *locks, int32 grid0, int32 grid1) {