[codegen/selection] tensor cores now used for transposed layouts

This commit is contained in:
Philippe Tillet
2019-07-17 17:20:38 -07:00
parent bfa39b8992
commit 2f0817b2cd
5 changed files with 57 additions and 14 deletions

View File

@@ -25,6 +25,7 @@ def run_dot():
# Test
hresult = np.dot(ha.T, hb.T).T
dif = np.abs(result - hresult)
np.savetxt('dif.dat', dif, '%2.4f')
print(hresult)
print(result)
print("dif: %f" % np.max(dif))