[examples] debugging matrix multiplication code
This commit is contained in:
@@ -40,7 +40,7 @@ void test(fp32 *a, fp32 *b, fp32 *c, int32 M, int32 N, int32 K){\
|
|||||||
fp32* pa[32, 8] = a + rx[:, newaxis] + rka[newaxis, :]*M;\
|
fp32* pa[32, 8] = a + rx[:, newaxis] + rka[newaxis, :]*M;\
|
||||||
fp32* pb[32, 8] = b + ry[:, newaxis] + rkb[newaxis, :]*K;\
|
fp32* pb[32, 8] = b + ry[:, newaxis] + rkb[newaxis, :]*K;\
|
||||||
fp32* pc[32, 32] = c + rx[:, newaxis] + ry[newaxis, :]*M;\
|
fp32* pc[32, 32] = c + rx[:, newaxis] + ry[newaxis, :]*M;\
|
||||||
for(k = K; k >= 0; k = k - 8){\
|
for(k = K; k > 0; k = k - 8){\
|
||||||
fp32 a[32, 8] = *pa;\
|
fp32 a[32, 8] = *pa;\
|
||||||
fp32 b[32, 8] = *pb;\
|
fp32 b[32, 8] = *pb;\
|
||||||
C = C + 1;\
|
C = C + 1;\
|
||||||
@@ -228,5 +228,8 @@ int main() {
|
|||||||
// Write back
|
// Write back
|
||||||
checkCudaErrors(cuMemcpyDtoH(c.data(), d_c, sizeof(numeric_t) * c.size()));
|
checkCudaErrors(cuMemcpyDtoH(c.data(), d_c, sizeof(numeric_t) * c.size()));
|
||||||
|
|
||||||
|
for(size_t i = 0; i < M*N; i++)
|
||||||
|
if(c[i] == 32)
|
||||||
|
std::cout << i << " " << "success" << std::endl;
|
||||||
return 0;
|
return 0;
|
||||||
}
|
}
|
||||||
|
Reference in New Issue
Block a user