Files
triton/searchindex.js
2021-04-21 01:58:48 -04:00

1 line
14 KiB
JavaScript

Search.setIndex({docnames:["getting-started/tutorials/01-vector-add","getting-started/tutorials/02-fused-softmax","getting-started/tutorials/03-matrix-multiplication","getting-started/tutorials/index","getting-started/tutorials/sg_execution_times","index","language-reference/python-api/generated/triton.arange","language-reference/python-api/generated/triton.atomic_cas","language-reference/python-api/generated/triton.atomic_xchg","language-reference/python-api/generated/triton.broadcast_to","language-reference/python-api/generated/triton.dot","language-reference/python-api/generated/triton.exp","language-reference/python-api/generated/triton.load","language-reference/python-api/generated/triton.log","language-reference/python-api/generated/triton.max","language-reference/python-api/generated/triton.maximum","language-reference/python-api/generated/triton.min","language-reference/python-api/generated/triton.minimum","language-reference/python-api/generated/triton.multiple_of","language-reference/python-api/generated/triton.num_programs","language-reference/python-api/generated/triton.program_id","language-reference/python-api/generated/triton.ravel","language-reference/python-api/generated/triton.reshape","language-reference/python-api/generated/triton.sigmoid","language-reference/python-api/generated/triton.softmax","language-reference/python-api/generated/triton.store","language-reference/python-api/generated/triton.sum","language-reference/python-api/generated/triton.where","language-reference/python-api/generated/triton.zeros"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":3,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":2,"sphinx.domains.rst":2,"sphinx.domains.std":2,sphinx:56},filenames:["getting-started/tutorials/01-vector-add.rst","getting-started/tutorials/02-fused-softmax.rst","getting-started/tutorials/03-matrix-multiplication.rst","getting-started/tutorials/index.rst","getting-started/tutorials/sg_execution_times.rst","index.rst","language-reference/python-api/generated/triton.arange.rst","language-reference/python-api/generated/triton.atomic_cas.rst","language-reference/python-api/generated/triton.atomic_xchg.rst","language-reference/python-api/generated/triton.broadcast_to.rst","language-reference/python-api/generated/triton.dot.rst","language-reference/python-api/generated/triton.exp.rst","language-reference/python-api/generated/triton.load.rst","language-reference/python-api/generated/triton.log.rst","language-reference/python-api/generated/triton.max.rst","language-reference/python-api/generated/triton.maximum.rst","language-reference/python-api/generated/triton.min.rst","language-reference/python-api/generated/triton.minimum.rst","language-reference/python-api/generated/triton.multiple_of.rst","language-reference/python-api/generated/triton.num_programs.rst","language-reference/python-api/generated/triton.program_id.rst","language-reference/python-api/generated/triton.ravel.rst","language-reference/python-api/generated/triton.reshape.rst","language-reference/python-api/generated/triton.sigmoid.rst","language-reference/python-api/generated/triton.softmax.rst","language-reference/python-api/generated/triton.store.rst","language-reference/python-api/generated/triton.sum.rst","language-reference/python-api/generated/triton.where.rst","language-reference/python-api/generated/triton.zeros.rst"],objects:{triton:{arange:[6,0,1,""],atomic_cas:[7,0,1,""],atomic_xchg:[8,0,1,""],broadcast_to:[9,0,1,""],dot:[10,0,1,""],exp:[11,0,1,""],load:[12,0,1,""],log:[13,0,1,""],max:[14,0,1,""],maximum:[15,1,1,""],min:[16,0,1,""],minimum:[17,1,1,""],multiple_of:[18,0,1,""],num_programs:[19,0,1,""],program_id:[20,0,1,""],ravel:[21,1,1,""],reshape:[22,0,1,""],sigmoid:[23,1,1,""],softmax:[24,1,1,""],store:[25,0,1,""],sum:[26,0,1,""],where:[27,0,1,""],zeros:[28,0,1,""]}},objnames:{"0":["py","function","Python function"],"1":["py","data","Python data"]},objtypes:{"0":"py:function","1":"py:data"},terms:{"0000e":2,"002304":2,"003930":2,"0220e":2,"028568":2,"032234":2,"044":[0,4],"057027":2,"078047":2,"0876e":2,"096276":2,"1024":[0,2],"1094e":2,"10mn":1,"1133e":2,"117":2,"1238e":2,"128":2,"1280":2,"137481":2,"144":2,"152":2,"153":2,"1536":2,"1539e":2,"154":4,"157":2,"157204":2,"161678":2,"164923":2,"172024":2,"173747":2,"176":[1,4],"1778e":2,"178":2,"178785":2,"1792":2,"180520":2,"1823":1,"184001":2,"190":2,"198":2,"199":2,"2048":[1,2],"205983":2,"206935":2,"208":2,"210":2,"2141":0,"215":2,"215272":2,"2156e":2,"220":2,"221":2,"222":2,"229":2,"230":2,"2304":2,"231":2,"232":2,"233":2,"235":2,"236":2,"238":2,"239":2,"241":2,"242":2,"244":2,"245":2,"246":2,"246398":2,"248":2,"249":2,"250":2,"251":2,"2510e":2,"252":2,"253":2,"254":2,"256":[1,2],"2560":2,"257":2,"259":2,"2598e":2,"2605e":2,"2617e":2,"263":2,"264":2,"2658e":2,"266":2,"266731":2,"267699":2,"270":2,"276":2,"2816":2,"282797":2,"293068":2,"2mn":1,"3072":2,"3076":0,"307632":2,"3094e":2,"315584":2,"3328":2,"3375e":2,"3584":2,"360005":2,"366501":2,"3713":0,"377264":2,"3836e":2,"3840":2,"385067":2,"3mn":1,"4096":[1,2],"420235":2,"4277e":2,"4352":2,"4375e":2,"441481":2,"446699":2,"4608":2,"4864":2,"4940":0,"498706":2,"500857":2,"511113":2,"512":2,"5120":2,"514009":2,"519114":2,"520144":2,"527241":2,"5332e":2,"5376":2,"538463":2,"552287":2,"560014":2,"5632":2,"578957":2,"5888":2,"595626":2,"606284":2,"614125":2,"6144":2,"6387e":2,"6400":2,"6547e":2,"6562e":2,"6656":2,"6724":0,"676487":2,"6865e":2,"6875e":2,"6891e":2,"6907e":2,"6912":2,"692102":2,"699140":2,"7100e":2,"7168":2,"728763":2,"7295e":2,"740709":2,"741014":2,"7424":2,"768":2,"7680":2,"7684e":2,"781":1,"7936":2,"7mn":1,"803966":2,"8125e":2,"8192":2,"8340e":2,"844029":2,"8477e":2,"8537e":2,"8632e":2,"8644e":2,"867127":2,"868505":2,"916752":2,"917998":2,"933":[2,4],"9414e":2,"9453e":2,"9605e":2,"9733":0,"982401":2,"98432":0,"9844e":2,"988932":2,"990461":2,"byte":1,"case":[1,2],"float":1,"function":[0,1,2,6,9,10,12,19,20,22,25,27,28],"import":[0,1,2],"int":[0,6,9,19,20,28],"new":[9,22,28],"return":[0,1,2,6,10,12,19,20,27,28],"super":2,"switch":2,"true":[0,1,2,27],"try":2,For:2,Has:[19,20],One:2,The:[0,1,2,9,10,19,20,25,27],These:2,Used:[0,1,2],__expf:1,_add:0,_matmul:2,_softmax:1,a100:2,about:[0,1,2,5],abov:[0,1,2],abs:0,acc:2,accept:2,access:0,accomod:2,achiev:2,activ:2,actual:2,add:[0,4],addit:[1,3,4],address:1,affect:2,against:[0,1,2,5],aggress:1,aim:5,algorithm:2,all:[1,2,3],allclos:[1,2],alloc:[0,1,2],allow:[0,1],almost:1,along:[0,19,20],also:[0,1,2],alwai:27,amount:1,analog:0,ani:[1,2],anoth:1,api:5,approxim:1,arang:[0,1,2],arbitrari:2,architectur:2,arg:[0,1,2],argument:[0,1,2,27],around:1,arrai:28,arrang:2,ask:1,assert:2,assum:1,asynchron:0,auto:[1,2],automat:2,autotun:2,avoid:27,axi:[0,1,2,14,16,19,20,26],back:[0,1],bandwidth:1,basic:[0,3],been:0,befor:2,below:3,benefit:1,best:0,better:2,between:0,bit:1,block:[0,1,2,9,10,12,22,25,27,28],block_k:2,block_m:2,block_n:2,bool:[12,25,27],both:27,bound:[0,1],broadcast:[9,27],build:2,builder:[6,7,8,9,10,11,12,13,14,16,18,19,20,22,25,26,27,28],built:0,c_0:2,c_1:2,cach:1,call:[0,2],callabl:0,can:[0,1,2],cannot:2,capabl:5,cdiv:[0,2],chang:2,chapter:5,check:[2,5],checkout:5,chip:1,choic:5,click:[0,1,2],close:2,cmp:7,code:[0,1,2,3,6,9,10,12,19,20,22,25,27,28],code_gen:[15,17,21,23,24],col:1,column:[1,2],come:[1,2],compar:[1,2,5],compat:10,compil:[1,2,5],comput:5,concis:0,condit:27,config:2,configur:2,consid:1,consist:1,constitut:0,constraint:2,consum:2,contigu:[2,6],conveni:2,convert:0,correspond:[0,1,2],could:1,creat:[0,1,2],csv:0,cubla:2,cuda:[0,1,2],current:20,custom:[0,1,2,5],cutlass:2,data:[0,1,2,12,27,28],declara:0,decor:[0,2],deep:2,def:[0,1,2],defin:[1,2,12],denom:1,denomin:1,denot:0,depend:27,devic:[0,1,2],differ:[0,1,2,20],difficulti:2,dimens:[2,10],dimension:[2,10],disk:0,dnn:5,do_bench:[0,1,2],doe:[0,1],don:[0,1],done:2,dot:2,doubli:2,download:[0,1,2,3],dram:1,dsl:5,dtype:[0,1,2,28],each:[1,2],easi:2,easier:[0,1],easili:2,education:1,effici:2,either:[0,19,20,27],element:[0,1,2,25,27],element_s:1,elementwis:[1,12],empti:2,empty_lik:[0,1],end:6,enqueu:[0,1],entir:1,entri:0,environ:5,etc:2,evalu:[2,27],exampl:[0,1,2,3],execut:[0,4],exp:[1,2],expect:1,expert:2,exponenti:1,extend:2,extract:2,fairli:2,fals:[12,25,27],far:1,fast:1,faster:1,feel:2,file:[0,1,2,4],fill:28,first:[0,5,10],fit:1,float16:[2,10,28],float32:[0,1,2,10],focu:2,follow:[1,2,5],forget:0,free:2,from:[1,2,6,9,10,12,19,20,22,25,27,28],full:[0,1,2],fuse:[2,3,4],fusion:1,galleri:[0,1,2,3],gbp:[0,1],gener:[0,1,2,3,6,9,10,12,19,20,22,25,27,28],get:[0,1,4],given:[1,2,19,20,28],good:0,gpu:[0,1,2,5],greater:1,grid:[0,1,2,19,20],grid_m:2,grid_n:2,group:2,group_id:2,group_m:2,group_siz:2,guard:[0,1],guess:1,handl:[0,1,2],hard:2,hardwar:[2,5],has:0,hasn:0,have:[1,10,27],helper:[0,1],henc:2,here:[0,1,2],heurist:1,high:2,hit:2,how:[0,1,2,5],howev:2,ident:1,idx:[12,25],imper:5,implement:[0,1,2],implicitli:0,improv:2,incompat:2,increas:0,index:1,indic:[1,27],inf:1,initi:2,inner:[2,10],input:[0,1,2,9,10,14,16,22,26],instal:5,instanc:[0,1,2,19,20],instead:[1,12,27],instruct:5,intern:1,interv:6,introduct:5,ipynb:[0,1,2],irregular:1,is_contigu:2,iter:2,its:1,jit:[0,1,2,6,9,10,12,19,20,22,25,27,28],jitfunct:[15,17,21,23,24],jupyt:[0,1,2,3],kei:[0,1,2],kernel:5,keyword:0,label:[0,1,2],lambda:[0,1,2],larg:1,launch:[0,1,2,19,20],learn:[0,1,2,5],less:1,let:1,level:2,librari:2,like:0,limit:1,line:[0,1,2],list:2,load:[0,1,2,27],locat:[2,12,25],logarithm:0,longer:1,look:[1,5],loop:2,main:[0,2],maintain:1,major:2,make:[0,1],manual:1,manual_se:[0,1,2],mask:[0,1,2,12,25,27],matmul:2,matric:[1,2],matrix:[1,3,4,10],matter:2,max:[0,1],max_m:[0,1,2],maxim:5,maximum:[0,1],mean:[1,2],mechan:1,memori:[0,1,2,12,25,27],mention:2,meta:[0,1,2],metaparamet:[0,2],min:2,min_m:[0,1,2],minut:[0,1,2],mixtur:2,model:[0,20],modern:[2,5],more:[1,5],most:2,move:1,multi:2,multipl:[3,4],multipli:10,must:[1,2,10,27],naiv:[1,2],naive_softmax:1,name:[0,1,2],nativ:[0,2],natur:1,necessari:1,need:[1,2],nelement:1,nest:2,next:[1,2],next_power_of_2:1,none:[1,2,6,7,8,9,10,11,12,13,14,16,18,19,20,22,25,26,27,28],nonzero:27,normal:[1,2],note:[0,1,27],notebook:[0,1,2,3],notori:2,now:[0,2],num:1,num_warp:[1,2],number:[0,1,19],numer:1,object:[0,2,15,17,21,23,24],obtain:0,obvious:1,offset:0,often:2,onc:1,one:[1,3],onli:[1,2],open:6,oper:[0,1,2,3,27],operand:2,ops:0,option:[0,2,6,9,10,12,19,20,22,25,27,28],order:[2,3],other:[1,2,5,10,12],otherwis:27,our:[0,1,2],out:[0,1,2,5],outperform:1,output:[0,1,2],pad:1,parallel:[0,1,2,5,20],param:22,paramet:[0,2,6,9,10,12,19,20,25,27,28],part:2,partial:1,pass:0,path:0,peak:2,per:1,perf:2,perf_report:[0,1,2],perform:[0,1],pid:[0,2],pid_m:2,pid_n:2,platform:5,plot:[0,1,2],plot_nam:[0,1,2],point:0,pointer:[0,12,25],possibl:[0,1,2],power:1,practic:[0,1,2],predict:1,prefer:1,present:2,print:[0,1,2],print_data:2,problem:0,process:0,product:[5,10],program:[0,1,2,5,19,20],program_id:[0,1,2],promot:2,properli:1,proprietari:2,provid:[0,1,2,5],pseudo:2,ptr:[7,8],python:[0,1,2,3,5],pytorch:[0,1],rand:0,randn:[1,2],rang:[0,1,2],rate:2,raw:0,read:[1,2,3],reason:2,recommend:3,reduct:1,refer:0,regardless:27,regist:2,rel:0,relat:5,remateri:2,requir:1,result:[0,1],ret:1,ret_fals:2,ret_tru:2,reus:2,roughli:2,row:[1,2],run:[0,1,2,5,20],save:[0,1,2],save_path:0,scalar:[10,28],script:[0,1,2],second:[0,1,2,10],see:[0,1],seem:0,select:27,sens:0,set:0,shape:[0,1,2,9,22,27,28],share:1,should:0,show:2,show_plot:[0,1],sigmoid:2,significantli:1,silu:2,simpl:[0,1],simplest:3,sinc:[0,2],size:[0,1],smallest:1,softmax:[3,4],solut:[1,2],some:2,sourc:[0,1,2,3],speak:2,specif:2,specifi:[2,25],speed:1,sphinx:[0,1,2,3],spmd:[0,20],stabil:1,start:[3,6],started_tutori:4,still:0,stop:6,store:[0,1,2,27],straightforward:2,stride:[1,2],stride_a_0:2,stride_a_1:2,stride_ak:2,stride_am:2,stride_b_0:2,stride_b_1:2,stride_bk:2,stride_bn:2,stride_cm:2,stride_cn:2,stride_x_0:2,stride_x_1:2,stride_xm:1,stride_ym:1,subscript:0,substract:1,sum:[0,1],sure:1,swish:2,synchron:0,system:2,take:[2,5],techniqu:2,temporari:1,tensor:[0,1,2],test:0,tflop:2,than:1,thei:2,them:0,themselv:2,theoret:1,therefor:2,thi:[0,1,2],thing:0,think:1,though:1,through:3,throughput:5,tile:1,time:[0,1,2],too:1,torch:[0,1,2],total:[0,1,2,4],transfer:1,tri:9,trick:1,trigger:2,triton:[0,1,2,3],tune:[1,2],tupl:[0,9,28],tutori:[0,1,2,5],tutorials_jupyt:3,tutorials_python:3,twice:1,two:[0,1,2,10],type:[10,22,27,28],typic:2,understand:1,unfortun:2,unint:27,unlik:2,updat:2,use:[0,1,2,27],used:0,uses:20,using:[0,2],util:0,val:[7,8],valid:0,valu:[0,1,2,6,9,12,18,25,27,28],valuabl:1,variou:3,vector:[1,3,4],vendor:2,veri:1,verifi:1,via:2,wai:[1,2],want:[1,27],warp:1,wast:1,when:[1,27],where:[2,25],which:[0,1,2,20],whose:[0,1,2,12],width:2,wise:[1,2,25],wish:2,within:[6,9,10,12,19,20,22,25,27,28],won:1,work:[1,5],workload:2,would:1,wrapper:2,write:[0,1,2,3,5],wrote:1,x_log:0,x_max:1,x_name:[0,1,2],x_val:[0,1,2],y_line:[0,1,2],y_name:[0,1,2],y_ref:1,y_tri:1,y_val:[0,1,2],yield:27,ylabel:[0,1,2],you:[0,1,2,3,27],your:5,yourself:[1,2],zero:2,zip:3},titles:["Vector Addition","Fused Softmax","Matrix Multiplication","Tutorials","Computation times","Welcome to Triton\u2019s documentation!","triton.arange","triton.atomic_cas","triton.atomic_xchg","triton.broadcast_to","triton.dot","triton.exp","triton.load","triton.log","triton.max","triton.maximum","triton.min","triton.minimum","triton.multiple_of","triton.num_programs","triton.program_id","triton.ravel","triton.reshape","triton.sigmoid","triton.softmax","triton.store","triton.sum","triton.where","triton.zeros"],titleterms:{"final":2,Going:5,addit:0,arang:6,arithmet:2,atomic_ca:7,atomic_xchg:8,benchmark:[0,1,2],broadcast_to:9,cach:2,comput:[0,1,2,4],document:5,dot:10,exp:11,further:5,fuse:1,get:5,kernel:[0,1,2],languag:5,load:12,log:13,matrix:2,max:14,maximum:15,min:16,minimum:17,motiv:[1,2],multipl:2,multiple_of:18,num_program:19,optim:2,perform:2,pointer:2,program_id:20,ravel:21,refer:5,reshap:22,result:2,sigmoid:23,softmax:[1,24],squar:2,start:5,store:25,sum:26,test:[1,2],time:4,triton:[5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28],tutori:3,unit:[1,2],vector:0,welcom:5,where:27,zero:28}})