[DOCS] Updates and improvements (#87)
This commit is contained in:
committed by
Philippe Tillet
parent
39f4730305
commit
29e33e50b7
@@ -100,7 +100,7 @@ def softmax(x):
|
||||
# Allocate output
|
||||
y = torch.empty_like(x)
|
||||
# Enqueue kernel. The launch grid is simple: we have one kernel instance per row of the input matrix
|
||||
- _softmax[(M, )](y, x, x.stride(0), y.stride(0), M, N, BLOCK=BLOCK)
|
||||
+ _softmax[(M, )](y, x, x.stride(0), y.stride(0), M, N, num_warps=num_warps, BLOCK=BLOCK)
|
||||
return y
|
||||
|
||||
|
||||
|
Reference in New Issue
Block a user