[GH-PAGES] Updated website

This commit is contained in:
Philippe Tillet
2022-04-09 00:42:33 +00:00
parent 0c570c178d
commit 226c24346e
158 changed files with 288 additions and 288 deletions

View File

@@ -564,42 +564,42 @@ torch_output=tensor([[ 1.1045, -36.9688, 31.4688, ..., -11.3906, 24.4531, -3
<p class="sphx-glr-script-out">Out:</p>
<div class="sphx-glr-script-out highlight-none notranslate"><div class="highlight"><pre><span></span>matmul-performance:
M cuBLAS ... Triton Triton (+ LeakyReLU)
0 256.0 2.730667 ... 3.276800 2.978909
1 384.0 7.372800 ... 7.899428 8.507077
2 512.0 14.563555 ... 15.420235 15.420235
0 256.0 2.730667 ... 2.978909 2.978909
1 384.0 7.372800 ... 8.507077 8.507077
2 512.0 14.563555 ... 16.384000 16.384000
3 640.0 22.260869 ... 24.380953 24.380953
4 768.0 32.768000 ... 35.389441 34.028308
5 896.0 37.971025 ... 40.140799 39.025776
5 896.0 37.971025 ... 40.140799 40.140799
6 1024.0 49.932191 ... 53.773130 53.773130
7 1152.0 45.242181 ... 48.161033 47.396572
8 1280.0 51.200001 ... 57.690139 57.690139
9 1408.0 64.138541 ... 69.009825 67.305878
10 1536.0 79.526831 ... 80.430545 79.526831
11 1664.0 63.372618 ... 63.372618 62.929456
12 1792.0 72.983276 ... 63.142831 63.142831
13 1920.0 69.120002 ... 71.626943 70.892307
14 2048.0 73.584279 ... 78.033565 77.672296
15 2176.0 83.500614 ... 87.115360 86.739860
8 1280.0 51.200001 ... 58.514284 57.690139
9 1408.0 64.138541 ... 69.009825 68.147202
10 1536.0 80.430545 ... 80.430545 80.430545
11 1664.0 62.929456 ... 63.372618 62.929456
12 1792.0 72.983276 ... 63.499573 63.142831
13 1920.0 69.467336 ... 71.257735 71.257735
14 2048.0 73.908442 ... 78.398206 78.033565
15 2176.0 83.155572 ... 87.115360 86.739860
16 2304.0 68.446623 ... 77.810656 77.307030
17 2432.0 71.125224 ... 75.522751 75.320281
18 2560.0 77.833728 ... 81.715711 81.512437
19 2688.0 83.737433 ... 90.966561 90.532356
20 2816.0 79.443003 ... 82.916747 84.035084
21 2944.0 81.832567 ... 83.198715 82.102191
22 3072.0 81.121923 ... 88.197981 87.381335
23 3200.0 83.116885 ... 96.385543 96.096095
24 3328.0 82.939284 ... 84.895397 85.096096
25 3456.0 77.745004 ... 86.596744 84.332184
26 3584.0 86.540320 ... 91.380335 97.416461
27 3712.0 85.748791 ... 88.404730 86.341700
28 3840.0 84.874902 ... 93.247896 85.300426
29 3968.0 92.372393 ... 80.015697 78.220472
30 4096.0 93.990003 ... 93.206754 86.036145
17 2432.0 71.125224 ... 75.522751 75.118889
18 2560.0 77.833728 ... 82.331658 81.715711
19 2688.0 83.552988 ... 90.102270 90.748936
20 2816.0 79.587973 ... 83.552120 83.552120
21 2944.0 82.237674 ... 82.646820 82.784108
22 3072.0 82.181572 ... 89.310890 87.246694
23 3200.0 78.817733 ... 96.240602 96.096095
24 3328.0 82.939284 ... 85.602017 85.806075
25 3456.0 78.655188 ... 92.086311 90.994998
26 3584.0 83.101104 ... 90.276496 95.249353
27 3712.0 85.675250 ... 85.091436 89.114488
28 3840.0 79.562590 ... 91.322872 85.136259
29 3968.0 93.076994 ... 79.133552 85.510815
30 4096.0 87.666706 ... 92.723821 87.267706
[31 rows x 5 columns]
</pre></div>
</div>
<p class="sphx-glr-timing"><strong>Total running time of the script:</strong> ( 6 minutes 48.521 seconds)</p>
<p class="sphx-glr-timing"><strong>Total running time of the script:</strong> ( 6 minutes 12.272 seconds)</p>
<div class="sphx-glr-footer class sphx-glr-footer-example docutils container" id="sphx-glr-download-getting-started-tutorials-03-matrix-multiplication-py">
<div class="sphx-glr-download sphx-glr-download-python docutils container">
<p><a class="reference download internal" download="" href="../../_downloads/d5fee5b55a64e47f1b5724ec39adf171/03-matrix-multiplication.py"><code class="xref download docutils literal notranslate"><span class="pre">Download</span> <span class="pre">Python</span> <span class="pre">source</span> <span class="pre">code:</span> <span class="pre">03-matrix-multiplication.py</span></code></a></p>