1 line
20 KiB
JavaScript
1 line
20 KiB
JavaScript
Search.setIndex({docnames:["getting-started/installation","index","programming-guide/chapter-1/introduction","programming-guide/chapter-2/related-work","python-api/generated/triton.Config","python-api/generated/triton.autotune","python-api/generated/triton.heuristics","python-api/generated/triton.jit","python-api/generated/triton.language.arange","python-api/generated/triton.language.atomic_add","python-api/generated/triton.language.atomic_cas","python-api/generated/triton.language.atomic_max","python-api/generated/triton.language.atomic_min","python-api/generated/triton.language.atomic_xchg","python-api/generated/triton.language.broadcast_to","python-api/generated/triton.language.cos","python-api/generated/triton.language.dot","python-api/generated/triton.language.exp","python-api/generated/triton.language.load","python-api/generated/triton.language.log","python-api/generated/triton.language.max","python-api/generated/triton.language.maximum","python-api/generated/triton.language.min","python-api/generated/triton.language.minimum","python-api/generated/triton.language.multiple_of","python-api/generated/triton.language.num_programs","python-api/generated/triton.language.program_id","python-api/generated/triton.language.rand","python-api/generated/triton.language.randint","python-api/generated/triton.language.randint4x","python-api/generated/triton.language.randn","python-api/generated/triton.language.ravel","python-api/generated/triton.language.reshape","python-api/generated/triton.language.sigmoid","python-api/generated/triton.language.sin","python-api/generated/triton.language.softmax","python-api/generated/triton.language.sqrt","python-api/generated/triton.language.store","python-api/generated/triton.language.sum","python-api/generated/triton.language.where","python-api/generated/triton.language.zeros","python-api/generated/triton.testing.Benchmark","python-api/generated/triton.testing.do_bench","python-api/generated/triton.testing.perf_report","python-api/triton","python-api/triton.language","python-api/triton.testing"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":4,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":3,"sphinx.domains.rst":2,"sphinx.domains.std":2,"sphinx.ext.intersphinx":1,sphinx:56},filenames:["getting-started/installation.rst","index.rst","programming-guide/chapter-1/introduction.rst","programming-guide/chapter-2/related-work.rst","python-api/generated/triton.Config.rst","python-api/generated/triton.autotune.rst","python-api/generated/triton.heuristics.rst","python-api/generated/triton.jit.rst","python-api/generated/triton.language.arange.rst","python-api/generated/triton.language.atomic_add.rst","python-api/generated/triton.language.atomic_cas.rst","python-api/generated/triton.language.atomic_max.rst","python-api/generated/triton.language.atomic_min.rst","python-api/generated/triton.language.atomic_xchg.rst","python-api/generated/triton.language.broadcast_to.rst","python-api/generated/triton.language.cos.rst","python-api/generated/triton.language.dot.rst","python-api/generated/triton.language.exp.rst","python-api/generated/triton.language.load.rst","python-api/generated/triton.language.log.rst","python-api/generated/triton.language.max.rst","python-api/generated/triton.language.maximum.rst","python-api/generated/triton.language.min.rst","python-api/generated/triton.language.minimum.rst","python-api/generated/triton.language.multiple_of.rst","python-api/generated/triton.language.num_programs.rst","python-api/generated/triton.language.program_id.rst","python-api/generated/triton.language.rand.rst","python-api/generated/triton.language.randint.rst","python-api/generated/triton.language.randint4x.rst","python-api/generated/triton.language.randn.rst","python-api/generated/triton.language.ravel.rst","python-api/generated/triton.language.reshape.rst","python-api/generated/triton.language.sigmoid.rst","python-api/generated/triton.language.sin.rst","python-api/generated/triton.language.softmax.rst","python-api/generated/triton.language.sqrt.rst","python-api/generated/triton.language.store.rst","python-api/generated/triton.language.sum.rst","python-api/generated/triton.language.where.rst","python-api/generated/triton.language.zeros.rst","python-api/generated/triton.testing.Benchmark.rst","python-api/generated/triton.testing.do_bench.rst","python-api/generated/triton.testing.perf_report.rst","python-api/triton.rst","python-api/triton.language.rst","python-api/triton.testing.rst"],objects:{"triton.Config":{__init__:[4,1,1,""]},"triton.language":{arange:[8,2,1,""],atomic_add:[9,2,1,""],atomic_cas:[10,2,1,""],atomic_max:[11,2,1,""],atomic_min:[12,2,1,""],atomic_xchg:[13,2,1,""],broadcast_to:[14,2,1,""],cos:[15,2,1,""],dot:[16,2,1,""],exp:[17,2,1,""],load:[18,2,1,""],log:[19,2,1,""],max:[20,2,1,""],maximum:[21,2,1,""],min:[22,2,1,""],minimum:[23,2,1,""],multiple_of:[24,2,1,""],num_programs:[25,2,1,""],program_id:[26,2,1,""],rand:[27,2,1,""],randint4x:[29,2,1,""],randint:[28,2,1,""],randn:[30,2,1,""],ravel:[31,2,1,""],reshape:[32,2,1,""],sigmoid:[33,2,1,""],sin:[34,2,1,""],softmax:[35,2,1,""],sqrt:[36,2,1,""],store:[37,2,1,""],sum:[38,2,1,""],where:[39,2,1,""],zeros:[40,2,1,""]},"triton.testing":{Benchmark:[41,0,1,""],do_bench:[42,2,1,""],perf_report:[43,2,1,""]},"triton.testing.Benchmark":{__init__:[41,1,1,""]},triton:{Config:[4,0,1,""],autotune:[5,2,1,""],heuristics:[6,2,1,""],jit:[7,2,1,""]}},objnames:{"0":["py","class","Python class"],"1":["py","method","Python method"],"2":["py","function","Python function"]},objtypes:{"0":"py:class","1":"py:method","2":"py:function"},terms:{"0":[2,3,25,26,27,30,40,42],"0f":3,"1":[1,3,6,25,26,27,30],"10":[27,28,29,30],"100":42,"1024":5,"11":0,"128":5,"16":[3,40],"1982":3,"1983":2,"1984":3,"1989":3,"1991":[2,3],"1999":3,"2":[1,3,4,6,25,26,42],"20":42,"2004":3,"2006":3,"2012":3,"2013":2,"2014":2,"2016":[2,3],"2017":2,"2018":[2,3],"2019":3,"2021":[2,3],"25":42,"256":4,"2d":16,"3":[0,3],"32":4,"3d":[25,26],"4":[3,4,5,28],"5":[3,42],"6":0,"7":[0,3],"8":[3,4,5,40,42],"80":42,"9":0,"abstract":[2,3],"break":3,"case":[2,3,6,9,10,11,12,13],"class":[2,3,4,41],"default":42,"do":[2,3,18,37],"float":[2,3,42],"function":[3,4,5,6,7,41,42,43],"import":[2,3],"int":[2,3,6,8,14,25,26,32,40,42],"new":[14,32,40],"return":[5,8,9,10,11,12,13,16,18,20,22,25,26,27,28,29,30,31,38,39,40,42,43],"static":[0,2,3],"true":[16,39],"try":4,"var":3,"while":2,A:[2,3],And:0,As:[2,3],At:3,By:42,For:[2,3,4],If:[3,28,37,39,41],In:3,It:[1,3,5,7],Of:2,On:3,The:[2,3,9,10,11,12,13,14,16,25,26,27,28,29,30,32,37,39,43],These:3,To:[2,3,5],__init__:[4,41],a100:3,abl:3,about:1,abov:[3,5],academ:2,acc:[2,3],acceler:2,access:[2,3,7],accordingli:3,account:3,accumul:3,accuraci:2,achiev:[2,3],across:[2,3],actual:[2,3],add:9,addit:[2,42],addition:3,address:[2,18],adopt:3,advanc:2,advoc:3,affin:3,against:[0,1],aggress:[2,3],agnost:[2,3],ahead:3,aim:1,al:[2,3],algebra:3,algorithm:[2,3],alia:3,all:[2,3,5,20,22,24,38,41],allen1984:3,allen:3,alloc:2,allow:[2,3],allow_tf32:16,along:[20,22,25,26,38,42],also:[2,3],alwai:[3,39],amd:2,amen:3,amount:2,ampl:3,an:[2,3,4,9,10,11,12,13,27,28,29,30],analysi:[2,3],analyz:3,ancourt1991:3,ancourt:3,ani:[3,5,6,41],anoth:3,anytim:5,apart:3,api:41,appear:41,appli:[2,3],applic:[3,6],approach:[2,3],ar:[0,2,3,4,5,7,18,24,37,39,41],architectur:2,area:3,arg:[4,6,7,41],argument:[4,5,6,7,39,41],arrai:[3,40],art:[2,3],arxiv:[2,3],aspect:3,asplo:2,assum:41,asynchron:2,atom:[9,10,11,12,13],auguin1983:2,auguin:2,auto:[3,4,5,6],autom:2,automat:[2,3,4],autotun:3,avail:[0,2,3],avoid:[5,39],awar:2,axi:[20,22,25,26,38,41],b:[2,3],baghdadi2021:[2,3],baghdadi:[2,3],balanc:3,base:[1,2,3],basic:3,becom:2,been:[2,3],befor:[4,5,9,10,11,12,13],begin:3,behavior:[3,5],believ:3,below:3,bench:[0,5],benchmark:[0,42,43],benefit:[2,3],best:2,between:2,bfloat16:16,block:[2,3,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,27,28,29,30,31,32,33,34,35,36,37,38,39,40],block_siz:[3,5,6],boil:3,bool:[39,41],both:[3,39],bound:3,branch:3,broad:2,broadcast:[14,18,37,39],build:0,built:3,c:[2,3],cach:[2,3,18],cache_modifi:18,call:[3,4,7,28],callabl:[6,7,42],can:[0,2,3,5,43],cannot:[2,3],capabl:[1,2],cd:0,ceil:6,certain:6,cgo:[2,3],chang:[5,18],chapter:1,characterist:3,cheap:2,check:1,chen2018:2,chen:2,choic:1,clone:0,close:3,cmake:0,cmp:[9,10,11,12,13],coalesc:2,code:[2,3],col:3,color:41,com:0,combin:2,come:3,command:0,common:3,commonli:3,compar:[1,3,9,10,11,12,13],compat:16,compil:[1,2,4,7,24],complet:3,complex:3,compos:2,composit:3,comprehens:[2,3],comput:[1,2,3,6,15,17,19,21,23,33,34,35,36],computation:[2,3],concern:3,concis:41,condit:[3,39],config:5,configur:[4,5,43],connectom:2,consecut:3,consequ:2,constexpr:[27,28,29,30],constraint:3,construct:2,constructor:41,contain:[3,9,10,11,12,13,41],contextu:3,contigu:[8,31],control:[2,3],convert:7,convolut:2,cooper:4,copi:[2,9,10,11,12,13],core:[2,3,27,28,29,30],correspond:41,cosin:15,cost:3,could:3,cours:2,cpython:0,creat:2,cubla:2,cuda:2,cudnn:2,current:26,custom:1,cvpr:2,d:[5,7],dart:3,darte1999:3,data:[2,3,9,10,11,12,13,18,39,40],data_ptr:7,dataflow:3,decad:2,decompos:3,decor:[5,6,7],deep:[2,3],def:[5,6],defin:[3,18],definit:3,dens:3,depend:[0,3,39],deploi:2,describ:3,design:3,desir:[14,32],detail:3,detect:2,develop:[2,3],dialect:3,dict:[5,6],dictionari:[4,6],diesel:3,differ:[2,3,5,41],difficult:3,difficulti:2,dijkstra82:3,dijkstra:3,dim:3,dimens:[16,20,22,38],dimension:[3,16],dir:0,disjoint:3,dissert:3,distribut:3,dnn:[1,2,3],doe:3,doesn:3,domain:[2,3],done:[2,20,22,38],doubt:3,down:3,download:0,dsl:[1,2,3],dtype:[9,10,11,12,13,18,37,40],e:[0,2,3,40],each:[2,3,4,6],eas:3,easier:2,effect:3,effici:[2,29],effort:3,either:[25,26,39],elango2018:3,elango:3,element:[15,17,19,20,21,22,23,33,34,35,36,37,38,39,41],element_ti:[9,10,11,12,13,18,37],elementwis:18,emerg:2,enabl:3,encod:3,end:[2,3,8],enforc:3,engin:3,ensur:3,entir:3,entri:29,environ:1,equal:3,especi:2,et:[2,3],euromicro:2,evalu:[5,39],even:3,evidenc:2,evolv:2,exampl:[2,3,4],exchang:13,execut:[2,3,4,43],exist:[2,3],expect:[9,10,11,12,13],expens:[2,3,6],explor:2,exponenti:17,express:[2,3],extrem:3,f:3,facilit:[2,3],fact:3,fals:[18,35,37,39,41,42],fast:[2,3],faster:28,fastest:3,fetch:2,few:3,field:[2,5],figur:3,fill:40,first:[1,3,16,21,23],fix:41,flatten:31,flexibl:2,float16:[16,40],float32:[16,27,30],flow:[2,3],fn:[7,42],focu:3,follow:[0,1,2,3],formal:3,format:3,found:[9,10,11,12,13],foundat:3,four:29,framework:[2,3],from:[2,3,18,39],fulli:3,func:3,fundament:3,further:3,fusion:3,g:[2,3,40],gener:[2,3,27,28,29,30,41],geq:3,girbal2006:3,girbal:3,git:0,github:0,give:2,given:[14,25,26,27,28,29,30,32,40],global:3,go:3,good:3,gpgpu:2,gpu:[1,2,3,4,7],grad_to_non:42,gradient:42,grammat:3,graphic:2,grid:[25,26],grosser2012:3,grosser:3,grow:3,guid:2,ha:[2,3,25,26],halid:[2,3],hand:3,handl:3,handwritten:2,harder:3,hardwar:[1,3],have:[2,3,7,16,39,41],heavi:2,hierarch:2,hierarchi:3,high:[2,3],highli:2,highlight:3,hint:3,how:[1,2,6],howev:3,http:0,i:[2,3],id:26,idea:2,idx:[18,37],ieee_round:35,imag:[2,3],implement:[2,3],implicitli:[7,18,37],importantli:3,impos:3,incompat:3,incred:2,increment:3,inde:3,independ:3,indic:[3,39],induc:3,industri:2,inequ:3,inform:3,infrastructur:3,inner:16,input:[3,5,6,14,15,16,17,19,20,21,22,23,24,31,32,33,34,35,36,38],instal:1,instanc:[2,4,25,26],instead:39,instruct:[1,2],int1:[18,37],int32:[28,29],integ:3,interchang:3,interest:[2,3],intermedi:3,intern:3,interv:8,intrins:3,introduct:1,invari:3,ir:3,irregular:3,issu:[2,3],iter:[2,3],its:[3,5],j:[2,3],jit:[5,6],journal:3,jrk2013:2,just:[3,6],k:[2,3],kb:2,kei:[2,5],kellei:2,kernel:[1,2,4,5,6],keyword:4,ki:3,know:24,known:3,kwarg:[4,7],label:41,lam1991:2,lam:2,lambda:6,languag:[1,2,7],larg:[2,3],later:3,latest:0,lattner2004:3,lattner2019:3,lattner:3,launch:[25,26],law:3,layer:[2,3],lead:[2,3],learn:[1,2,3],least:3,lee2017:2,lee:2,left:3,legal:3,less:[2,3],let:24,letter:3,level:[2,3],li:2,librari:[0,2,3],lifelong:3,like:[2,3,28],line:[3,41],line_arg:41,line_nam:41,line_v:41,linear:[2,3],link:0,list:[5,6,41,42,43],litteratur:3,llvm11:0,llvm:[0,3],load:[3,39],local:[2,3],locat:[9,10,11,12,13,18,37],log2:6,log:41,logarithm:19,look:[1,2],loop:[3,4],low:3,m:[0,2],machin:[2,3],machineri:[2,3],made:2,mai:[3,6],main:[2,3],maintain:3,major:3,make:[2,3],manag:2,mani:[2,3],manual:3,mapl:3,mark:43,markedli:2,mask:[9,11,12,13,18,37,39],match:[9,10,11,12,13],math:6,mathbb:3,mathbf:3,mathcal:[3,30],mathemat:3,matmul:3,matrix:[2,3,4,16],matrix_s:3,matter:[2,3],max:11,maxim:[1,3,29],maximum:20,mb:2,mean:[3,5],mechan:3,median:42,memori:[2,3,9,10,11,12,13,18,37,39],meta:[4,5,6],method:[3,4,7,41,43],methodolog:3,micro:2,min:12,minimum:22,miss:3,mitig:3,ml:2,mlir:3,model:[2,3,5],modern:[1,2,3],modular:3,moor:3,more:[1,2,3,41],most:3,mostli:4,ms:42,mullapudi2016:3,mullapudi:3,multi:[2,3],multipl:[2,3,4,5,24,28],multipli:[3,16],must:[8,16,39],n:[2,30],n_round:[27,28,29,30],name:[5,6,41],natur:[2,19],nb:2,need:28,nest:3,net:3,network:[2,3],neural:[2,3],neurosci:2,nightli:0,nip:2,non:2,none:[4,5,9,11,12,13,18,37,41,42],nonzero:39,note:[0,3,5,7,39],notic:3,notori:2,novel:2,num_stag:[4,5],num_warp:[4,5],number:[3,4,5,25,27,28,29,30],numer:2,nvidia:[2,18],object:[2,4,5,7,9,10,11,12,13],occur:3,offer:2,offici:0,offset:[27,28,29,30],omega:3,onc:[2,3],one:[2,3,41],onli:[2,3,7],open:8,openai:0,opencl:2,oper:[2,9,10,11,12,13,39],opportun:2,opsila:2,optim:[2,3],option:[5,18,37,41,42],order:3,origin:3,osdi:2,other:[1,3,7,16,18,21,23],otherwis:39,our:2,out:[1,3],outlin:3,over:[2,3],p:3,packag:7,pact:3,paradigm:[2,3],parallel:[1,2,3,4],paralleliz:2,param:6,paramet:[3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43],parametr:2,part:3,particularli:[2,3],partit:2,pass:[3,4],past:[2,3],pattern:2,peak:3,percentil:42,perf_model:5,perf_report:41,perform:[2,3,5,9,10,11,12,13,42],person:3,perspect:3,phase:3,philosophi:3,philox:29,pip:0,pipelin:[2,3,4],platform:[1,3],pldi:2,plot:[0,41],plot_nam:41,pmatrix:3,point:[3,29],pointer:[7,9,10,11,12,13,18,37],pointerdtyp:[9,10,11,12,13,18,37],polli:3,polyhedr:2,polyhedra:3,popular:3,portabl:[2,3],pose:2,posit:6,possibl:[3,4],power:[3,6,8],ppopp:3,practic:2,pragma:2,pre:[0,2],pre_hook:4,predic:5,predict:3,premis:2,present:0,preserv:3,prevent:3,primer:3,primit:[2,7],principl:3,probabl:3,problemat:3,procedur:3,process:[2,3],processor:2,product:[1,3,16],program:[1,2,25,26],programm:[2,3],prohibitev:6,project:2,promot:3,properti:3,propos:2,provid:[1,3,5,20,22,38,42],prune:5,prune_configs_bi:5,prune_num_stages_bi:5,pseudo:29,ptx:18,purpos:[2,3],push:3,py:0,pypi:0,pytest:0,python:7,qquad:3,ragan:2,randint4x:28,random:[27,28,29,30],rang:[2,3],rapidli:[2,3],rather:2,rdom:3,reader:3,real:2,reason:3,recent:2,recomput:2,record_clock:42,rectifi:2,redmon2016:2,redmon:2,reduct:[20,22,38],regardless:39,regrett:2,regular:3,rel:3,relat:1,releas:[0,2],reli:3,remain:[2,41],reorder:3,rep:42,repetit:42,repres:[3,4],requir:3,research:[2,3],reset:[5,42],reset_to_zero:5,resolut:3,resourc:2,resp:3,respect:3,restrict:3,result:[0,2,3],retriev:3,revisit:2,right:3,rise:3,role:3,root:36,run:[0,1,3,5,7,43],runtim:[3,42],rvar:3,s:[3,29],said:3,same:[2,41],sato2019:3,sato:3,sc:3,scalabl:3,scalar:[2,16,27,28,29,30,40],scale:41,scan:3,schedul:2,scienc:3,scientif:3,scop:3,scope:3,script:0,second:[3,16,21,23],section:3,see:3,seed:[27,28,29,30],seem:3,select:[2,3,39],self:[4,41],semant:3,semi:3,sens:[2,3],separ:3,sequenc:2,set:3,setup:0,sever:[2,3],shall:3,shape:[3,14,18,32,37,39,40],share:2,should:[2,3,4,20,22,38,41],shown:3,side:3,sight:3,signal:2,sigplan:3,simd:2,simpli:3,sine:34,singl:[2,28],size:3,slower:[2,3],slowest:3,sm80:4,sm:3,smallest:6,snemi3d:2,so:3,softwar:4,solid:3,solv:3,sometim:3,sourc:3,space:[2,3],spars:[2,3],spatial:3,special:2,specif:2,specifi:[3,6,9,10,11,12,13,37],split:3,spmd:[2,3],squar:36,stabl:0,stage:4,standard:3,start:8,state:[2,3],statement:3,step:3,still:3,stop:8,store:[9,10,11,12,13,39],str:[5,6,18,41],strategi:3,stream:28,strength:2,structur:[2,3],style:41,subscript:3,substanti:2,successfulli:3,suffer:3,suit:2,superhuman:2,support:3,surprisingli:2,surround:3,sutskev:2,sutskever2014:2,swap:[9,10,11,12,13],swizzl:2,synchron:2,system:[0,2,3],t:3,t_:3,taco:3,take:[1,5,6],taken:3,target:2,techniqu:[2,3],tempor:3,tend:3,tension:2,tensor:[2,3,5,7,42],tensorrt:2,test:[0,1],text:3,th:42,than:[2,3,28,41],thei:[2,3],therebi:3,theta:3,theta_:3,thi:[2,3,4,5,6,7,29,41],though:[2,3],thought:3,thread:[2,4],through:3,throughout:[3,41],throughput:1,tile:3,time:[0,2,3,5,28,42],tiramisu:[2,3],tl:40,tmp:0,tog:3,top_k:5,topic:3,torch:[7,42],tradit:[2,3],transform:3,travers:3,trend:2,tri:[14,32],trigger:5,triton:[0,2,3],trivial:2,tune:[3,5,6],tuner:4,tupl:[14,32,40],tutori:1,tvm:[2,3],two:[3,5,6,8,16],type:[6,16,18,39,40],typecast:[18,37],typic:3,u:[0,27],un:3,uncommon:3,underneath:3,undesir:5,unfortun:3,unifi:2,unint:39,unit:[0,2],univers:3,unrol:3,updat:[3,5],us:[2,3,4,5,6,7,28,39,41,43],v100:3,val:[9,10,11,12,13],valu:[5,6,8,9,10,11,12,13,15,17,18,19,20,22,24,33,34,35,36,37,38,39,40,41,43],variabl:4,variant:2,vasilach:[2,3],vasilache2018:[2,3],vast:3,vec:3,vector:[2,3],veri:3,verif:3,verifi:3,via:3,view:31,visibl:3,vision:2,volatil:18,vs:0,w:3,want:39,warmup:42,warp:4,we:[2,3],well:[2,3],whatev:5,wheel:0,when:[2,3,4,5,7,39],where:[3,6,37],whether:[2,41],which:[2,3,5,20,22,38,41],whose:[3,5,18],wide:3,wise:[15,17,19,21,23,33,34,35,36,37],wish:3,within:[7,8],without:3,wolf:3,wolfe1989:3,word:3,work:[1,2],workload:4,wors:[2,3],wouldn:3,write:[1,3],x:[3,15,17,19,21,23,31,33,34,35,36,39,41],x_log:41,x_name:41,x_ptr:[5,6],x_size:[5,6],x_val:41,xi:3,xii:3,xlabel:41,xo:3,y:[3,21,23,39,41],y_log:41,year:3,yet:[2,3],yi:3,yield:39,yii:3,ylabel:41,yo:3,you:[0,2,5,28,39],your:[0,1],z:3,zero:5},titles:["Installation","Welcome to Triton\u2019s documentation!","Introduction","Related Work","triton.Config","triton.autotune","triton.heuristics","triton.jit","triton.language.arange","triton.language.atomic_add","triton.language.atomic_cas","triton.language.atomic_max","triton.language.atomic_min","triton.language.atomic_xchg","triton.language.broadcast_to","triton.language.cos","triton.language.dot","triton.language.exp","triton.language.load","triton.language.log","triton.language.max","triton.language.maximum","triton.language.min","triton.language.minimum","triton.language.multiple_of","triton.language.num_programs","triton.language.program_id","triton.language.rand","triton.language.randint","triton.language.randint4x","triton.language.randn","triton.language.ravel","triton.language.reshape","triton.language.sigmoid","triton.language.sin","triton.language.softmax","triton.language.sqrt","triton.language.store","triton.language.sum","triton.language.where","triton.language.zeros","triton.testing.Benchmark","triton.testing.do_bench","triton.testing.perf_report","triton","triton.language","triton.testing"],titleterms:{advantag:3,algebra:45,api:1,arang:8,atom:45,atomic_add:9,atomic_ca:10,atomic_max:11,atomic_min:12,atomic_xchg:13,autotun:5,benchmark:41,binari:0,broadcast_to:14,challeng:2,co:15,comparison:45,compil:[3,45],config:4,creation:45,distribut:0,do_bench:42,document:1,dot:16,exp:17,from:0,further:1,gener:45,get:1,go:1,heurist:6,hint:45,index:45,instal:0,introduct:2,jit:7,languag:[3,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,45],limit:3,linear:45,load:18,log:19,manipul:45,math:45,max:20,maximum:21,memori:45,min:22,minimum:23,model:45,motiv:2,multiple_of:24,num_program:25,number:45,op:45,packag:0,perf_report:43,polyhedr:3,program:[3,45],program_id:26,python:[0,1],rand:27,randint4x:29,randint:28,randn:30,random:45,ravel:31,reduct:45,refer:[2,3],relat:3,represent:3,reshap:32,s:1,schedul:3,shape:45,sigmoid:33,sin:34,softmax:35,sourc:0,sqrt:36,start:1,store:37,sum:38,test:[41,42,43,46],triton:[1,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46],welcom:1,where:39,work:3,zero:40}}) |