no performance regression
This commit is contained in:
@@ -64,7 +64,7 @@ void dot(TYPE * A, TYPE * B, TYPE * C,
|
|||||||
// epilogue
|
// epilogue
|
||||||
int rxc[TM] = ridx * TM + 0 ... TM;
|
int rxc[TM] = ridx * TM + 0 ... TM;
|
||||||
int ryc[TN] = ridy * TN + 0 ... TN;
|
int ryc[TN] = ridy * TN + 0 ... TN;
|
||||||
TYPE* pc[TM, TN] = C + ryc[newaxis, :] + rxc[:, newaxis] * ldc;
|
TYPE* pc[TM, TN] = C + rxc[:, newaxis] * ldc + ryc[newaxis, :];
|
||||||
*pc = c;
|
*pc = c;
|
||||||
}
|
}
|
||||||
)";
|
)";
|
||||||
|
Reference in New Issue
Block a user