1 line
21 KiB
JavaScript
1 line
21 KiB
JavaScript
Search.setIndex({docnames:["getting-started/installation","getting-started/tutorials/01-vector-add","getting-started/tutorials/02-fused-softmax","getting-started/tutorials/03-matrix-multiplication","getting-started/tutorials/index","getting-started/tutorials/sg_execution_times","index","language-reference/python-api/generated/triton.arange","language-reference/python-api/generated/triton.atomic_cas","language-reference/python-api/generated/triton.atomic_xchg","language-reference/python-api/generated/triton.broadcast_to","language-reference/python-api/generated/triton.dot","language-reference/python-api/generated/triton.exp","language-reference/python-api/generated/triton.load","language-reference/python-api/generated/triton.log","language-reference/python-api/generated/triton.max","language-reference/python-api/generated/triton.maximum","language-reference/python-api/generated/triton.min","language-reference/python-api/generated/triton.minimum","language-reference/python-api/generated/triton.multiple_of","language-reference/python-api/generated/triton.num_programs","language-reference/python-api/generated/triton.program_id","language-reference/python-api/generated/triton.ravel","language-reference/python-api/generated/triton.reshape","language-reference/python-api/generated/triton.sigmoid","language-reference/python-api/generated/triton.softmax","language-reference/python-api/generated/triton.store","language-reference/python-api/generated/triton.sum","language-reference/python-api/generated/triton.where","language-reference/python-api/generated/triton.zeros","language-reference/python-api/index","programming-guide/chapter-1/introduction","programming-guide/chapter-2/related-work"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":3,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":2,"sphinx.domains.rst":2,"sphinx.domains.std":2,sphinx:56},filenames:["getting-started/installation.rst","getting-started/tutorials/01-vector-add.rst","getting-started/tutorials/02-fused-softmax.rst","getting-started/tutorials/03-matrix-multiplication.rst","getting-started/tutorials/index.rst","getting-started/tutorials/sg_execution_times.rst","index.rst","language-reference/python-api/generated/triton.arange.rst","language-reference/python-api/generated/triton.atomic_cas.rst","language-reference/python-api/generated/triton.atomic_xchg.rst","language-reference/python-api/generated/triton.broadcast_to.rst","language-reference/python-api/generated/triton.dot.rst","language-reference/python-api/generated/triton.exp.rst","language-reference/python-api/generated/triton.load.rst","language-reference/python-api/generated/triton.log.rst","language-reference/python-api/generated/triton.max.rst","language-reference/python-api/generated/triton.maximum.rst","language-reference/python-api/generated/triton.min.rst","language-reference/python-api/generated/triton.minimum.rst","language-reference/python-api/generated/triton.multiple_of.rst","language-reference/python-api/generated/triton.num_programs.rst","language-reference/python-api/generated/triton.program_id.rst","language-reference/python-api/generated/triton.ravel.rst","language-reference/python-api/generated/triton.reshape.rst","language-reference/python-api/generated/triton.sigmoid.rst","language-reference/python-api/generated/triton.softmax.rst","language-reference/python-api/generated/triton.store.rst","language-reference/python-api/generated/triton.sum.rst","language-reference/python-api/generated/triton.where.rst","language-reference/python-api/generated/triton.zeros.rst","language-reference/python-api/index.rst","programming-guide/chapter-1/introduction.rst","programming-guide/chapter-2/related-work.rst"],objects:{triton:{arange:[7,0,1,""],atomic_cas:[8,0,1,""],atomic_xchg:[9,0,1,""],broadcast_to:[10,0,1,""],dot:[11,0,1,""],exp:[12,0,1,""],load:[13,0,1,""],log:[14,0,1,""],max:[15,0,1,""],maximum:[16,1,1,""],min:[17,0,1,""],minimum:[18,1,1,""],multiple_of:[19,0,1,""],num_programs:[20,0,1,""],program_id:[21,0,1,""],ravel:[22,1,1,""],reshape:[23,0,1,""],sigmoid:[24,1,1,""],softmax:[25,1,1,""],store:[26,0,1,""],sum:[27,0,1,""],where:[28,0,1,""],zeros:[29,0,1,""]}},objnames:{"0":["py","function","Python function"],"1":["py","data","Python data"]},objtypes:{"0":"py:function","1":"py:data"},terms:{"0000e":3,"002304":3,"003930":3,"0220e":3,"028568":3,"032234":3,"044":[1,5],"057027":3,"078047":3,"0876e":3,"096276":3,"1024":[1,3],"1094e":3,"10mn":2,"1133e":3,"117":3,"1238e":3,"128":3,"1280":3,"137481":3,"144":3,"152":3,"153":3,"1536":3,"1539e":3,"154":5,"157":3,"157204":3,"161678":3,"164923":3,"172024":3,"173747":3,"176":[2,5],"1778e":3,"178":3,"178785":3,"1792":3,"180520":3,"1823":2,"184001":3,"190":3,"198":3,"1983":31,"1984":32,"1989":32,"199":3,"1991":[31,32],"1999":32,"2004":32,"2006":32,"2012":32,"2013":31,"2014":31,"2016":[31,32],"2017":31,"2018":[31,32],"2019":32,"2021":[31,32],"2048":[2,3],"205983":3,"206935":3,"208":3,"210":3,"2141":1,"215":3,"215272":3,"2156e":3,"220":3,"221":3,"222":3,"229":3,"230":3,"2304":3,"231":3,"232":3,"233":3,"235":3,"236":3,"238":3,"239":3,"241":3,"242":3,"244":3,"245":3,"246":3,"246398":3,"248":3,"249":3,"250":3,"251":3,"2510e":3,"252":3,"253":3,"254":3,"256":[2,3],"2560":3,"257":3,"259":3,"2598e":3,"2605e":3,"2617e":3,"263":3,"264":3,"2658e":3,"266":3,"266731":3,"267699":3,"270":3,"276":3,"2816":3,"282797":3,"293068":3,"2mn":2,"3072":3,"3076":1,"307632":3,"3094e":3,"315584":3,"3328":3,"3375e":3,"3584":3,"360005":3,"366501":3,"3713":1,"377264":3,"3836e":3,"3840":3,"385067":3,"3mn":2,"4096":[2,3],"420235":3,"4277e":3,"4352":3,"4375e":3,"441481":3,"446699":3,"4608":3,"4864":3,"4940":1,"498706":3,"500857":3,"511113":3,"512":3,"5120":3,"514009":3,"519114":3,"520144":3,"527241":3,"5332e":3,"5376":3,"538463":3,"552287":3,"560014":3,"5632":3,"578957":3,"5888":3,"595626":3,"606284":3,"614125":3,"6144":3,"6387e":3,"6400":3,"6547e":3,"6562e":3,"6656":3,"6724":1,"676487":3,"6865e":3,"6875e":3,"6891e":3,"6907e":3,"6912":3,"692102":3,"699140":3,"7100e":3,"7168":3,"728763":3,"7295e":3,"740709":3,"741014":3,"7424":3,"768":3,"7680":3,"7684e":3,"781":2,"7936":3,"7mn":2,"803966":3,"8125e":3,"8192":3,"8340e":3,"844029":3,"8477e":3,"8537e":3,"8632e":3,"8644e":3,"867127":3,"868505":3,"916752":3,"917998":3,"933":[3,5],"9414e":3,"9453e":3,"9605e":3,"9733":1,"982401":3,"98432":1,"9844e":3,"988932":3,"990461":3,"abstract":[31,32],"break":32,"byte":2,"case":[2,3,31,32],"class":[31,32],"float":[2,31,32],"function":[1,2,3,7,10,11,13,20,21,23,26,28,29,32],"import":[1,2,3,31,32],"int":[1,7,10,20,21,29,31,32],"new":[10,23,29],"return":[1,2,3,7,11,13,20,21,28,29],"static":[31,32],"super":3,"switch":3,"true":[1,2,3,28],"try":3,"var":32,"while":[0,31],For:[3,31,32],Has:[20,21],One:3,SMs:32,T_S:32,The:[1,2,3,10,11,20,21,26,28,31,32],These:[3,32],Used:[1,2,3],__expf:2,_add:1,_matmul:3,_softmax:2,a100:[3,32],abl:32,about:[1,2,3,6],abov:[1,2,3,32],abs:1,academ:31,acc:[3,31,32],acceler:31,accept:3,access:[1,31,32],accomod:3,accordingli:32,account:32,accumul:32,accuraci:31,achiev:[3,31,32],across:[31,32],activ:3,actual:[3,31,32],add:[1,5],addit:[2,4,5,31],addition:32,address:[2,31],adopt:32,advanc:31,advoc:32,affect:3,affin:32,against:[1,2,3,6],aggress:[2,31,32],agnost:[31,32],ahead:32,aim:6,algebra:32,algorithm:[3,31,32],alia:32,all:[2,3,4,31,32],allclos:[2,3],allen1984:32,allen:32,alloc:[1,2,3,31],allow:[1,2,31,32],almost:2,along:[1,20,21],also:[1,2,3,31,32],alwai:[28,32],amd:31,amen:32,amount:[2,31],ampl:32,analog:1,analysi:[31,32],analyz:32,ancourt1991:32,ancourt:32,ani:[2,3,32],anoth:[2,32],apart:32,api:[0,6],appli:[31,32],applic:32,approach:[31,32],approxim:2,arang:[1,2,3],arbitrari:3,architectur:[3,31],area:32,arg:[1,2,3],argument:[1,2,3,28],around:2,arrai:[29,32],arrang:3,art:[31,32],arxiv:[31,32],ask:2,aspect:32,asplo:31,assert:3,assum:2,asynchron:[1,31],auguin1983:31,auguin:31,auto:[2,3,32],autom:31,automat:[3,31,32],autotun:[3,32],avail:[31,32],avoid:28,awar:31,axi:[1,2,3,15,17,20,21,27],back:[1,2],baghdadi2021:[31,32],baghdadi:[31,32],balanc:32,bandwidth:2,base:[31,32],basic:[1,4,32],becom:31,been:[1,31,32],befor:3,begin:32,behavior:32,believ:32,below:[4,32],bench:0,benchmark:0,benefit:[2,31,32],best:[1,31],better:3,between:[1,31],bit:2,block:[1,2,3,10,11,13,23,26,28,29,31,32],block_k:3,block_m:3,block_n:3,block_siz:32,boil:32,bool:[13,26,28],both:[28,32],bound:[1,2,32],branch:32,broad:31,broadcast:[10,28],build:[0,3],builder:[7,8,9,10,11,12,13,14,15,17,19,20,21,23,26,27,28,29],built:[1,32],c_0:3,c_1:3,cach:[2,31,32],call:[1,3,32],callabl:1,can:[0,1,2,3,31,32],cannot:[3,31,32],capabl:[6,31],cdiv:[1,3],cgo:[31,32],chang:3,chapter:6,characterist:32,cheap:31,check:[3,6],checkout:6,chen2018:31,chen:31,chip:2,choic:6,cite:32,click:[1,2,3],clone:0,close:[3,32],cmake:0,cmp:8,coalesc:31,code:[1,2,3,4,7,10,11,13,20,21,23,26,28,29,31,32],code_gen:[16,18,22,24,25],codegen:0,col:[2,32],column:[2,3],com:[0,32],combin:31,come:[2,3,32],command:0,common:32,commonli:32,compar:[2,3,6,32],compat:11,compil:[0,2,3,6,31],complet:32,complex:32,compos:31,composit:32,comprehens:[31,32],comput:[6,31,32],computation:[31,32],concern:32,concis:1,condit:[28,32],config:3,configur:3,connectom:31,consecut:32,consequ:31,consid:2,consist:2,constitut:1,constraint:[3,32],construct:31,consum:3,contain:32,contextu:32,contigu:[3,7],control:[31,32],conveni:3,convert:1,convolut:31,copi:31,core:[31,32],correspond:[1,2,3],cost:32,could:[2,32],cours:31,creat:[1,2,3,31],csv:1,cubla:[3,31],cuda:[1,2,3,31],cudnn:31,current:21,custom:[1,2,3,6],cutlass:3,cvpr:31,dart:32,darte1999:32,data:[1,2,3,13,28,29,31,32],dataflow:32,decad:31,declara:1,decompos:32,decor:[1,3],deep:[3,31,32],def:[1,2,3],defin:[2,3,13,32],definit:32,denom:2,denomin:2,denot:1,dens:32,depend:[28,32],deploi:31,describ:32,design:32,detail:32,detect:31,develop:[31,32],devic:[1,2,3],dialect:32,diesel:32,differ:[1,2,3,21,31,32],difficult:32,difficulti:[3,31],dijkstra82:32,dim:32,dimens:[3,11],dimension:[3,11,32],dir:0,direct:0,directli:0,disjoint:32,disk:1,dissert:32,distribut:32,dnn:[6,31,32],do_bench:[1,2,3],doe:[1,2,32],doesn:32,doing:31,domain:[31,32],don:[1,2],done:[0,3,31],dot:3,doubli:3,doubt:32,down:32,download:[0,1,2,3,4],dram:2,driver:0,dsl:[6,31,32],dtype:[1,2,3,29],each:[2,3,31,32],eas:32,easi:3,easier:[1,2,31],easili:3,education:2,effect:32,effici:[3,31],effort:32,either:[1,20,21,28],elango2018:32,elango:32,element:[1,2,3,26,28],element_s:2,elementwis:[2,13],emerg:31,empti:3,empty_lik:[1,2],enabl:32,encod:32,end:[7,31,32],enforc:32,engin:32,enqueu:[1,2],ensur:32,entir:[2,32],entri:1,environ:6,equal:32,especi:31,etc:3,euromicro:31,evalu:[3,28],even:32,evidenc:31,evolv:31,exampl:[1,2,3,4,31,32],execut:[1,5,31,32],exist:[31,32],exp:[2,3],expect:2,expens:[31,32],expert:3,explor:31,exponenti:2,express:[31,32],extend:3,extract:3,extrem:32,facilit:[31,32],fact:32,fairli:3,fals:[13,26,28],far:2,fast:[2,31,32],faster:2,fastest:32,feel:3,fetch:31,few:32,field:31,figur:32,file:[1,2,3,5],fill:29,first:[1,6,11,32],fit:2,flexibl:31,float16:[3,11,29],float32:[1,2,3,11],flow:[31,32],focu:[3,32],follow:[0,2,3,6,31,32],forget:1,formal:32,format:32,found:0,foundat:32,framework:[31,32],free:3,from:[2,3,7,10,11,13,20,21,23,26,28,29,31,32],full:[1,2,3],fulli:32,func:32,fundament:32,further:32,fuse:[3,4,5],fusion:[2,32],galleri:[1,2,3,4],gbp:[1,2],gener:[1,2,3,4,7,10,11,13,20,21,23,26,28,29,31,32],geq:32,get:[1,2,5],girbal2006:32,girbal:32,git:0,github:0,give:31,given:[2,3,20,21,29],global:32,good:[1,32],gpgpu:31,gpu:[1,2,3,6,31,32],grammat:32,graphic:31,greater:2,grid:[1,2,3,20,21],grid_m:3,grid_n:3,grosser2012:32,grosser:32,group:3,group_id:3,group_m:3,group_siz:3,grow:32,guard:[1,2],guess:2,guid:31,halid:[31,32],hand:32,handl:[1,2,3,32],handwritten:31,hard:3,harder:32,hardwar:[3,6,32],has:[1,31,32],hasn:1,have:[2,11,28,31,32],heavi:31,helper:[1,2],henc:3,here:[0,1,2,3],heurist:2,hierarch:31,hierarchi:32,high:[3,31,32],highli:31,highlight:32,hint:32,hit:3,how:[1,2,3,6,31],howev:[3,32],http:0,idea:31,ident:2,idx:[13,26],imag:[31,32],imper:6,implement:[1,2,3,31,32],implicitli:1,importantli:32,impos:32,improv:3,incompat:[3,32],increas:1,incred:31,increment:32,inde:32,independ:32,index:2,indic:[2,28,32],induc:32,industri:31,inequ:32,inf:2,inform:32,infrastructur:32,initi:3,inner:[3,11],input:[1,2,3,10,11,15,17,23,27,32],instal:6,instanc:[1,2,3,20,21,31],instead:[2,13,28],instruct:[6,31],integ:32,integr:0,interchang:32,interest:[0,31,32],intermedi:[0,32],intern:[0,2,32],interv:7,intrins:32,introduct:6,invari:32,ipynb:[1,2,3],irregular:[2,32],is_contigu:3,issu:[31,32],iter:[3,31,32],its:[2,32],jit:[1,2,3,7,10,11,13,20,21,23,26,28,29],jitfunct:[16,18,22,24,25],journal:32,jrk2013:31,jupyt:[1,2,3,4],just:32,kei:[1,2,3,31],kellei:31,kernel:[6,31],keyword:1,known:32,label:[1,2,3],lam1991:31,lam:31,lambda:[1,2,3],languag:31,larg:[2,31,32],later:32,latest:0,lattner2004:32,lattner2019:32,lattner:32,launch:[1,2,3,20,21],law:32,layer:[31,32],lead:[31,32],learn:[1,2,3,6,31,32],least:32,lee2017:31,lee:31,left:32,legal:32,less:[2,31,32],let:2,letter:32,level:[3,31,32],librari:[3,31,32],lies:31,lifelong:32,like:[1,31,32],limit:2,line:[1,2,3,32],linear:[31,32],list:3,litteratur:32,llvm:[0,32],load:[1,2,3,28,32],local:[31,32],locat:[3,13,26],logarithm:1,longer:2,look:[2,6,31],loop:[3,32],low:32,machin:[31,32],machineri:[31,32],made:31,mai:[0,32],main:[1,3,31,32],maintain:[2,32],major:[3,32],make:[0,1,2,31,32],manag:31,mani:[31,32],manual:[2,32],manual_se:[1,2,3],mapl:32,markedli:31,mask:[1,2,3,13,26,28],mathbb:32,mathbf:32,mathcal:32,mathemat:32,matmul:[3,32],matric:[2,3],matrix:[2,4,5,11,31,32],matrix_s:32,matter:[3,31,32],max:[1,2],max_m:[1,2,3],maxim:[6,32],maximum:[1,2],mean:[2,3,32],mechan:[2,32],memori:[1,2,3,13,26,28,31,32],mention:3,meta:[1,2,3],metaparamet:[1,3],method:32,methodolog:32,micro:31,min:3,min_m:[1,2,3],minut:[0,1,2,3],miss:32,mitig:32,mixtur:3,mkdir:0,mlir:32,model:[1,21,31,32],modern:[3,6,31,32],modular:32,moor:32,more:[2,6,31,32],most:[3,32],move:2,mullapudi2016:32,mullapudi:32,multi:[3,31,32],multipl:[4,5,31,32],multipli:[11,32],must:[2,3,11,28],naiv:[2,3],naive_softmax:2,name:[1,2,3],nativ:[1,3],natur:[2,31],necessari:2,need:[2,3],nelement:2,nest:[3,32],net:32,network:[31,32],neural:[31,32],neurosci:31,next:[2,3],next_power_of_2:2,nightli:0,nip:31,non:31,none:[2,3,7,8,9,10,11,12,13,14,15,17,19,20,21,23,26,27,28,29],nonzero:28,normal:[2,3],note:[0,1,2,28,32],notebook:[1,2,3,4],notic:32,notori:[3,31],novel:31,now:[1,3],num:2,num_warp:[2,3],number:[1,2,20,32],numer:[2,31],nvidia:31,object:[1,3,16,18,22,24,25,31],obtain:1,obvious:2,occur:32,offer:31,offici:0,offset:1,often:3,omega:32,onc:[2,31,32],one:[2,4,31,32],onli:[2,3,31,32],open:7,opencl:31,oper:[1,2,3,4,28,31],operand:3,opportun:31,ops:1,opsila:31,optim:[31,32],option:[1,3,7,10,11,13,20,21,23,26,28,29],order:[3,4,32],origin:32,osdi:31,other:[2,3,6,11,13,32],otherwis:28,our:[1,2,3,31],out:[1,2,3,6,32],outlin:32,outperform:2,output:[1,2,3],over:[31,32],pact:32,pad:2,paradigm:[31,32],parallel:[1,2,3,6,21,31,32],paralleliz:31,param:23,paramet:[1,3,7,10,11,13,20,21,26,28,29,32],parametr:31,parser:0,part:[3,32],partial:2,particularli:[31,32],partit:31,pass:[1,32],past:[31,32],path:1,pattern:31,peak:[3,32],per:2,perf:3,perf_report:[1,2,3],perform:[1,2,31,32],phase:32,philosophi:32,pid:[1,3],pid_m:3,pid_n:3,pip:0,pipelin:[31,32],platform:[6,32],pldi:31,plot:[0,1,2,3],plot_nam:[1,2,3],pmatrix:32,point:[1,32],pointer:[1,13,26],polli:32,polyhedr:31,polyhedra:32,popular:32,portabl:[31,32],pose:31,possibl:[1,2,3,32],power:[2,32],ppopp:32,practic:[1,2,3,31],pragma:31,pre:[0,31],predict:[2,32],prefer:2,premis:31,present:3,preserv:32,prevent:32,primer:32,primit:31,principl:32,print:[1,2,3],print_data:3,probabl:32,problem:1,problemat:32,procedur:32,process:[1,31,32],processor:31,product:[6,11,32],program:[1,2,3,6,20,21,31],program_id:[1,2,3],programm:[31,32],project:31,promot:[3,32],properli:2,properti:32,propos:31,proprietari:3,provid:[1,2,3,6,32],pseudo:3,ptillet:0,ptr:[8,9],purpos:[31,32],push:32,putat:32,pytest:0,python:[1,2,3,4,6],pytorch:[1,2],qquad:32,ragan:31,rand:1,randn:[2,3],rang:[1,2,3,31,32],rapidli:[31,32],rate:3,rather:31,raw:1,rdom:32,read:[2,3,4],reader:32,real:31,reason:[3,32],recent:31,recommend:4,recomput:31,rectifi:31,redmon2016:31,redmon:31,reduct:2,refer:1,regardless:28,regist:3,regrett:31,regular:32,rel:[1,32],relat:6,releas:[0,31],reli:32,remain:31,remateri:3,reorder:32,repres:32,represent:0,requir:[2,32],research:[31,32],resolut:32,resourc:31,resp:32,respect:32,restrict:32,result:[0,1,2,31,32],ret:2,ret_fals:3,ret_tru:3,retriev:32,reus:3,revisit:31,right:32,rise:32,roughli:3,row:[2,3],run:[0,1,2,3,6,21,32],runtim:[0,32],rvar:32,said:32,same:31,sato2019:32,sato:32,save:[1,2,3],save_path:1,scalabl:32,scalar:[11,29,31],scan:32,schedul:31,scienc:32,scop:32,scope:32,script:[1,2,3],second:[1,2,3,11,32],section:32,see:[1,2,32],seem:[1,32],select:[28,31],semant:32,semi:32,sens:[1,31,32],separ:32,sequenc:31,set:[1,32],sever:[31,32],shall:32,shape:[1,2,3,10,23,28,29,32],share:[2,31],should:[1,31,32],show:3,show_plot:[1,2],shown:32,side:32,sight:32,sigmoid:3,signal:31,significantli:2,sigplan:32,silu:3,simd:31,simpl:[1,2],simplest:4,simpli:32,sinc:[1,3],singl:31,size:[1,2,32],slower:[31,32],slowest:32,smallest:2,snemi3d:31,softmax:[4,5],solid:32,solut:[2,3],solv:32,some:3,sometim:32,sourc:[1,2,3,4,32],space:[31,32],spars:[31,32],spatial:32,speak:3,special:31,specif:[3,31],specifi:[3,26,32],speed:2,sphinx:[1,2,3,4],split:32,spmd:[1,21,31,32],stabil:2,standard:32,start:[4,7],started_tutori:5,state:[31,32],statement:32,step:32,still:[1,32],stop:7,store:[1,2,3,28],straightforward:3,strategi:32,strength:31,stride:[2,3],stride_a_0:3,stride_a_1:3,stride_ak:3,stride_am:3,stride_b_0:3,stride_b_1:3,stride_bk:3,stride_bn:3,stride_cm:3,stride_cn:3,stride_x_0:3,stride_x_1:3,stride_xm:2,stride_ym:2,structur:[31,32],subscript:[1,32],substanti:31,substract:2,successfulli:32,suffer:32,suit:31,sum:[1,2],superhuman:31,support:[0,32],sure:2,surprisingli:31,surround:32,sutskev:31,sutskever2014:31,swish:3,swizzl:31,synchron:[1,31],system:[3,31,32],taco:32,take:[0,3,6],taken:32,target:31,techniqu:[3,31,32],tempor:32,temporari:2,tend:32,tension:31,tensor:[1,2,3,31,32],tensorrt:31,test:[0,1],text:32,tflop:3,than:[2,31,32],thei:[3,31,32],them:1,themselv:3,theoret:2,therebi:32,therefor:3,theta:32,theta_:32,thi:[0,1,2,3,31,32],thing:1,think:2,those:0,though:[2,31,32],thread:31,through:[4,32],throughout:32,throughput:6,tile:[2,32],time:[1,2,3,31,32],tiramisu:[31,32],tmp:0,tog:32,too:2,topic:32,torch:[1,2,3],total:[1,2,3,5],tradit:[31,32],transfer:2,transform:32,travers:32,trend:31,tri:10,trick:2,trigger:3,triton:[0,1,2,3,4,31,32],trivial:31,tune:[2,3,32],tupl:[1,10,29],tutori:[0,1,2,3,6],tutorials_jupyt:4,tutorials_python:4,tvm:[31,32],twice:2,two:[1,2,3,11,32],type:[11,23,28,29],typic:[3,32],uncommon:32,underneath:32,understand:2,unfortun:[3,32],unifi:31,unint:28,unit:[0,31],univers:32,unlik:3,unrol:32,updat:[3,32],usag:0,use:[0,1,2,3,28,31,32],used:1,uses:21,using:[1,3,31,32],util:1,v100:32,val:[8,9],valid:1,valu:[1,2,3,7,10,13,19,26,28,29],valuabl:2,variant:31,variou:4,vasilach:[31,32],vasilache2018:[31,32],vast:32,vec:32,vector:[2,4,5,31,32],vendor:3,veri:[2,32],verif:32,verifi:[2,32],via:[3,32],visibl:32,vision:31,wai:[2,3],want:[0,2,28],warp:2,wast:2,well:[31,32],when:[2,28,31,32],where:[3,26,32],whether:31,which:[1,2,3,21,31,32],whose:[1,2,3,13,32],wide:32,width:3,wise:[2,3,26],wish:[3,32],within:[7,10,11,13,20,21,23,26,28,29],without:32,wolf:32,wolfe1989:32,won:2,word:32,work:[2,6,31],workload:3,wors:[31,32],would:2,wouldn:32,wrapper:3,write:[1,2,3,4,6,32],wrote:2,x_log:1,x_max:2,x_name:[1,2,3],x_val:[1,2,3],xii:32,y_line:[1,2,3],y_name:[1,2,3],y_ref:2,y_tri:2,y_val:[1,2,3],year:32,yet:[31,32],yield:28,yii:32,ylabel:[1,2,3],you:[0,1,2,3,4,28,31],your:[0,6],yourself:[2,3],zero:3,zip:4},titles:["Installation","Vector Addition","Fused Softmax","Matrix Multiplication","Tutorials","Computation times","Welcome to Triton\u2019s documentation!","triton.arange","triton.atomic_cas","triton.atomic_xchg","triton.broadcast_to","triton.dot","triton.exp","triton.load","triton.log","triton.max","triton.maximum","triton.min","triton.minimum","triton.multiple_of","triton.num_programs","triton.program_id","triton.ravel","triton.reshape","triton.sigmoid","triton.softmax","triton.store","triton.sum","triton.where","triton.zeros","Python API","Introduction","Related Work"],titleterms:{"final":3,Going:6,Ops:30,addit:1,advantag:32,algebra:30,api:30,arang:7,arithmet:3,atomic_ca:8,atomic_xchg:9,benchmark:[1,2,3],binari:0,broadcast_to:10,cach:3,challeng:31,comparison:30,compil:[30,32],comput:[1,2,3,5],creation:30,distribut:0,document:6,dot:11,exp:12,from:0,further:6,fuse:2,get:6,hint:30,index:30,instal:0,introduct:31,kernel:[1,2,3],languag:[6,32],limit:32,linear:30,load:13,log:14,manipul:30,math:30,matrix:3,max:15,maximum:16,memori:30,min:17,minimum:18,model:30,motiv:[2,3,31],multipl:3,multiple_of:19,num_program:20,ops:30,optim:3,packag:0,perform:3,pointer:3,polyhedr:32,program:[30,32],program_id:21,python:[0,30],ravel:22,reduct:30,refer:[6,31,32],relat:32,represent:32,reshap:23,result:3,schedul:32,shape:30,sigmoid:24,softmax:[2,25],sourc:0,squar:3,start:6,store:26,sum:27,test:[2,3],time:5,triton:[6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29],tutori:4,unit:[2,3],vector:1,welcom:6,where:28,work:32,zero:29}}) |