[GH-PAGES] Updated website

This commit is contained in:
Philippe Tillet
2022-02-14 00:38:35 +00:00
parent 13537582ad
commit 819da42584
158 changed files with 248 additions and 248 deletions

View File

@@ -564,9 +564,9 @@ torch_output=tensor([[ 1.1045, -36.9688, 31.4688, ..., -11.3906, 24.4531, -3
<p class="sphx-glr-script-out">Out:</p>
<div class="sphx-glr-script-out highlight-none notranslate"><div class="highlight"><pre><span></span>matmul-performance:
M cuBLAS ... Triton Triton (+ LeakyReLU)
0 256.0 2.978909 ... 2.978909 2.978909
1 384.0 7.372800 ... 8.507077 8.192000
2 512.0 14.563555 ... 16.384000 16.384000
0 256.0 2.730667 ... 2.978909 2.978909
1 384.0 7.372800 ... 8.507077 8.507077
2 512.0 14.563555 ... 15.420235 16.384000
3 640.0 22.260869 ... 24.380953 24.380953
4 768.0 32.768000 ... 34.028308 34.028308
5 896.0 39.025776 ... 40.140799 39.025776
@@ -574,32 +574,32 @@ torch_output=tensor([[ 1.1045, -36.9688, 31.4688, ..., -11.3906, 24.4531, -3
7 1152.0 45.242181 ... 46.656000 46.656000
8 1280.0 51.200001 ... 56.888887 56.888887
9 1408.0 64.138541 ... 67.305878 66.485074
10 1536.0 79.526831 ... 79.526831 78.643199
10 1536.0 80.430545 ... 79.526831 78.643199
11 1664.0 62.929456 ... 62.492442 62.061463
12 1792.0 72.512412 ... 71.588687 72.047592
13 1920.0 69.120002 ... 70.172588 70.172588
14 2048.0 73.908442 ... 76.959706 76.260072
15 2176.0 83.155572 ... 85.998493 85.998493
16 2304.0 68.643310 ... 76.809875 76.076024
17 2432.0 71.125224 ... 84.877538 85.134737
18 2560.0 78.019048 ... 80.908642 81.108913
19 2688.0 82.642823 ... 89.995386 89.464755
20 2816.0 83.074685 ... 83.552120 82.680963
21 2944.0 81.832567 ... 81.564701 81.967162
22 3072.0 81.707223 ... 88.060814 88.612060
23 3200.0 80.706181 ... 95.167286 94.814812
24 3328.0 83.226931 ... 84.003845 84.298943
25 3456.0 79.430113 ... 84.909497 89.380896
26 3584.0 87.466332 ... 97.734120 98.160909
27 3712.0 79.917877 ... 86.942857 89.035062
28 3840.0 84.292684 ... 91.473945 86.467555
29 3968.0 90.791620 ... 80.864108 86.572497
30 4096.0 88.592559 ... 86.928580 91.366730
12 1792.0 72.512412 ... 72.047592 71.588687
13 1920.0 68.776119 ... 70.172588 70.172588
14 2048.0 73.262953 ... 76.608294 76.260072
15 2176.0 83.155572 ... 85.998493 85.632545
16 2304.0 68.643310 ... 76.563695 76.319081
17 2432.0 71.487187 ... 84.621881 85.134737
18 2560.0 78.019048 ... 81.310171 81.108913
19 2688.0 83.369354 ... 89.254248 89.464755
20 2816.0 81.218262 ... 82.135981 83.392363
21 2944.0 82.102191 ... 82.509987 82.373605
22 3072.0 81.707223 ... 86.845249 84.135370
23 3200.0 84.880639 ... 87.795257 90.780140
24 3328.0 79.990330 ... 84.101981 84.596116
25 3456.0 81.600781 ... 90.943675 84.775569
26 3584.0 85.715344 ... 93.661869 95.047985
27 3712.0 81.615477 ... 88.365630 83.982636
28 3840.0 82.592983 ... 87.286505 91.322872
29 3968.0 86.973584 ... 90.926929 83.982489
30 4096.0 92.500158 ... 88.417474 85.271746
[31 rows x 5 columns]
</pre></div>
</div>
<p class="sphx-glr-timing"><strong>Total running time of the script:</strong> ( 6 minutes 8.357 seconds)</p>
<p class="sphx-glr-timing"><strong>Total running time of the script:</strong> ( 6 minutes 4.120 seconds)</p>
<div class="sphx-glr-footer class sphx-glr-footer-example docutils container" id="sphx-glr-download-getting-started-tutorials-03-matrix-multiplication-py">
<div class="sphx-glr-download sphx-glr-download-python docutils container">
<p><a class="reference download internal" download="" href="../../_downloads/d5fee5b55a64e47f1b5724ec39adf171/03-matrix-multiplication.py"><code class="xref download docutils literal notranslate"><span class="pre">Download</span> <span class="pre">Python</span> <span class="pre">source</span> <span class="pre">code:</span> <span class="pre">03-matrix-multiplication.py</span></code></a></p>