Search.setIndex({docnames:["api/empty_workspace_list","api/index","api/methods","api/operators","api/traits","index","introduction","performance","release_notes","requirements_func","warnings/bit_identical","warnings/bit_identical_sm"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":4,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":3,"sphinx.domains.rst":2,"sphinx.domains.std":2,sphinx:56},filenames:["api/empty_workspace_list.rst","api/index.rst","api/methods.rst","api/operators.rst","api/traits.rst","index.rst","introduction.rst","performance.rst","release_notes.rst","requirements_func.rst","warnings/bit_identical.rst","warnings/bit_identical_sm.rst"],objects:{},objnames:{},objtypes:{},terms:{"0":[2,4,5,6,9],"1":[2,3,4,5,6,7],"10":[0,2,9],"10000":[0,2,9],"11":[0,2,6,9],"12":[0,2,9],"128":[2,3,4,6],"1296":[0,2,9],"1331":[0,2,9],"151":6,"15625":[0,2,9],"16":[3,6,9],"16384":[3,9],"17":9,"1728":[0,2,9],"18":9,"194":9,"19683":[0,2,9],"2":[0,2,3,4,6,7,9],"2048":9,"2401":[0,2,9],"2d":3,"3":[0,2,5,6,7,9],"32":[3,8,9],"32768":[0,2,3,9],"3d":3,"4":[2,4,7],"4096":9,"5":[0,2,7,9],"6":[0,2,4,7,9],"64":8,"7":[0,2,7,9],"70":9,"700":[3,6],"72":9,"720":3,"75":9,"750":3,"8":[2,3,4,6],"80":9,"800":3,"8192":9,"86":9,"860":3,"9":9,"abstract":6,"boolean":4,"byte":[2,4],"case":[6,7],"class":[2,6],"const":6,"default":[3,4,7,8],"do":[0,2,6,9],"final":6,"float":[2,3,4,6,9],"function":[1,3,4,5,6,7,8],"int":[3,4,6],"long":2,"new":6,"return":[2,4],"true":[2,3,4,6],"try":7,"void":[2,6],"while":6,A:[2,5,6],By:6,For:[2,3,4,6,7],If:[2,3,4,6],In:[0,6,7,9],Is:3,It:[2,3,6,10,11],Not:3,On:6,One:[3,4],The:[2,3,4,5,6,8,9],There:[3,4],These:2,To:6,With:3,__global__:[2,6],__half:[3,4],__launch_bounds__:[2,6],__shared__:[2,6],_valuetyp:4,a100:8,abi:6,abil:[5,7],abl:4,about:[4,6,8,9],access:8,achiev:5,ad:[3,4,6,8,9],adapt:6,add:6,addit:[2,6,9],address:8,address_s:8,adjac:7,adjust:[5,7],advanc:5,advantag:6,advic:5,affect:6,after:[2,6],aim:6,align:2,alignof:2,all:[2,4,6,9],alloc:[2,4,6,9],allow:[3,6],along:6,also:[2,4,6],alwai:[4,7],amount:6,amper:[3,7],an:[2,3,4,5,6,7],analysi:7,ani:[2,4,6],anymor:8,api:[5,6,7,8],appear:8,appli:6,applic:[5,7],approach:6,ar:[2,3,4,6,7,9],arch:6,architectur:[2,3,6,9,11],architecur:[3,6],argument:[2,6],around:8,arrai:[2,6],ask:6,assum:3,attach:6,auto:[2,4,6],automat:6,avail:[2,4,6,7,8,9],avoid:[7,8],back:[2,6],baselin:7,batch:[2,5],becaus:6,been:[2,4,6],being:6,below:7,best:7,better:7,between:[2,4],bi:9,bit:[2,3,8,10,11],block:[1,6,7,8,9,10],block_dim:[2,3,4,6],block_fft_kernel:[2,6],blockdim:[2,4,9,10],both:[4,6],bound:7,build:[4,6],built:[4,6],burden:6,c2c:[2,3,4,6],c2r:[2,3,4],c:[6,7,9],calcul:[2,3,4,5,6,7,10],call:[2,6],can:[1,2,3,4,5,6,9],cast:[2,4],cc:3,certain:6,chang:[6,7,8],check:[4,6,9],choic:6,clang:9,cmake:9,coalesc:7,code:[2,6,7],collabor:9,collect:[3,4,6,9],com:7,combin:[3,6,9],commun:2,compat:[5,6],compil:[3,4,5,8],complet:[3,6],complex:[2,3,4,6,7,9],complex_typ:[2,4,6],compon:[1,5],comprehens:5,comput:[2,3,4,6,7,9],concurr:[2,3],configur:[0,2,4,6,9],conflict:8,consid:7,consist:[3,5,6],construct:[2,3,4,6],contain:[2,6],context:[3,4],continu:[0,2,9],control:6,cooper:3,copi:[2,6],correct:[6,9],correctli:[2,6],cost:6,cout:4,creat:[2,3,4,6,9],cu:6,cuda:[2,3,4,5,6,7,9,10,11],cudaerror_t:[2,4,6],cudamallocmanag:4,cudaoccupancymaxactiveblockspermultiprocessor:7,cudasuccess:[2,6],cuffdx:[3,6],cufft:[5,6,7],cufftdx:[0,2,3,4,7,8,9],cufftdx_ignore_deprecated_compil:9,cufftdx_ignore_deprecated_dialect:9,cufttdx:9,custom:[3,5,7,9],customiz:5,data:[3,4,5,6,7,9],decltyp:[2,3,4,6],decoupl:6,decreas:5,defer:6,defin:[2,3,4,6,9],definit:6,depend:[4,6,7,9],describ:[2,3,6],descript:[1,2,6],descriptor:[2,3,4,6,9],design:6,destruct:2,detail:[4,6,9],determin:[3,4,6,7],devic:[4,5,6],differ:[2,3,4,5,6,10,11],dim3:4,dimens:[2,3,9,10],direct:[2,6,9,10],direction_of:4,directli:4,directori:6,divid:[3,4],divisor:3,doc:7,document:[5,8],doe:[4,6,8],doesn:[2,4],don:2,done:7,doubl:[2,3,4,6,9],double2:2,driver:6,dure:9,e:[2,3],ea:8,each:[2,3,4,6],earli:8,either:[3,4,6],element:[2,6,7,9,10],elements_per_thread:[3,4,6],elementsperthread:[2,3,4,6,8,10],embedd:5,emit:9,empti:[2,4,6],enabl:[5,7,9],encod:6,endl:4,enough:7,ensur:7,entir:7,equal:[2,4],equival:6,error:[2,4,9],error_cod:6,etc:[5,6],evalu:6,everi:9,evolv:6,exact:6,exactli:[2,3,11],exampl:[1,3,6],exclus:3,execut:[1,5,6,8,10,11],exist:[6,7],expect:[2,4],experiment:[6,9],expertis:9,expos:6,express:6,extend:4,extens:[5,6],extern:[2,6],extra:[4,7],f:3,fail:[3,4],fals:[2,3,4],fast:[3,5],featur:6,fft:[0,2,5,7,8,9,10,11],fft_128_float:6,fft_direct:[2,3,4,6],fft_input_size_in_byt:2,fft_output_size_in_byt:2,fft_type:[2,3,4,6],fftcomplet:6,fftexecut:6,ffts_per_block:[2,3,4],fftsperblock:[2,3,4,6,8,10],file:[4,6],fill:7,find:1,fine:9,first:[2,5,8],fit:2,fix:6,float2:[2,6],flow:9,follow:[0,2,3,4,6,9],form:[3,4,6],format:4,forward:[2,3,4,6],fourier:[3,5],fp16:2,free:2,freed:2,from:[2,4,5,6,7,9],full:[6,8],fulli:6,further:5,fuse:5,fusion:5,futur:[0,2,4,5,6,9],ga:8,gcc:9,gener:[3,5,8],get:6,given:9,global:[2,4,5,6,7,9],go:4,gpu:[2,3,6,7,9,11],grain:9,greater:[3,4,9],greatli:7,group:3,group__cudart__occup:7,guarante:[2,3,9,10,11],guid:7,ha:[2,4,6],half:[2,9],hand:6,handl:6,happen:5,hardwar:6,have:[2,4,6],header:[4,6,9],held:4,help:7,helper:[2,4],here:1,heurist:[3,4],high:5,higher:[4,9],hood:5,host:[6,9],how:[3,4,6,7],howev:[2,9],hpp:[2,3,4,6],html:7,http:7,i:[2,6],ident:[2,3,7,10,11],identifi:6,ie:7,imaginari:2,imaginary_1:2,imaginary_2:2,impact:8,implement:[3,4,6],implicit_type_batch:[2,4],implicitli:2,improv:[5,7,8],includ:[2,3,4,6,8,9],increas:7,independ:3,index:[2,7],indic:6,influenc:6,inform:[4,6,9],inlin:6,input:[3,6,9],input_typ:4,insid:[3,5,6],instanti:6,invalid:2,invers:[3,4,6],iostream:4,is_complet:4,is_complete_fft:[4,6],is_complete_fft_execut:[2,4],is_fft:4,is_fft_execut:4,its:[2,4,6],kernel:[2,5,8],know:6,label:[4,6],last:[2,6,8],latenc:5,later:2,launch:[6,7],let:6,level:6,librari:[1,5,6,7,8,9],lifetim:[2,4],like:6,line:[6,8],linux:9,list:[6,7,8,9],load:[2,7],local:[2,6,9],locat:6,logic:2,lose:7,magnitud:7,mai:[0,2,4,6,7,8,9],main:[1,5],major:6,make:[1,4,9],make_workspac:[2,4,6],manag:[4,5,6],mani:6,manner:6,map:6,match:7,max_siz:9,max_threads_per_block:[2,4,6],maxim:[4,6],maximum:[2,4,6],mean:[2,4,6],mechan:6,memori:[5,6,9],merg:7,messag:4,method:[1,4,5,6,8],might:[7,9],miss:4,modifi:6,more:[2,3,4,6,7,9],most:9,move:6,movement:5,msvc:9,much:4,multipl:[4,6],must:[2,3,4,6,9],mutual:3,my_fft_kernel_128:6,n:2,namespac:6,natur:2,necessari:[3,4],need:[5,6,7,9],never:2,newer:9,next:5,none:4,note:[4,5],nsight:7,nsightcomput:7,number:[2,3,4,6,10],nvcc:[6,9],nvidia:7,nvrtc:[6,9],o3:6,o:6,object:[2,3,4,6],obtain:[6,9],occup:7,offer:[6,7,8],onc:6,one:[3,4,6,7,9],onli:[2,3,4,6,9],oper:[1,2,4,5,6,7,9],optim:[6,7,8],optimum:7,option:[5,7,9],order:[2,6,7,9],organ:6,other:[0,2,4,5,6,9],otherwis:[2,4],our:6,output:[3,6,9],output_typ:4,over:6,overload:2,overview:5,p:3,parallel:[3,4,6,7],paramet:[4,6,7,9],part:[2,4],particip:2,particular:6,pass:[2,4,6],path_to_cufftdx_loc:6,peak:7,per:[2,6,7,9,10],perform:[3,4,5,6,8,9],pick:6,piec:6,place:2,platform:6,pleas:4,point:[2,3,4],pointer:[2,6,8],port:7,post:7,potenti:[6,7],power:[0,2,3,8,9],practic:7,pre:7,precis:[2,5,6,9,10],precision_of:4,preliminari:9,preserv:6,previou:6,problem:6,process:[2,7],produc:[2,3,10,11],program:8,proof:6,propag:6,properti:6,provid:[4,5,6,7],ptx:6,ptxa:8,queri:6,quick:5,quickli:6,r2c:[2,3,4],race:2,rang:[3,9],read:5,real:[2,3,6,9],real_1:2,real_2:2,reason:7,recompil:6,refer:[2,5],regist:[6,7,9],regular:7,rel:9,releas:[4,5,6],remov:[0,2,9],replac:4,request:[3,6],requir:[0,2,3,5,6,7],requires_workspac:[2,3,4,6,9],requiresworkspac:6,resourc:[6,7],respons:2,restor:8,restrict:3,result:[2,3,6,9,10,11],retriev:[4,6],routin:[5,6],rule:2,run:[2,3,4,6,7,9],runtim:7,s:[2,3,4],same:[2,3,4,6,10,11],save:[5,6,7],second:[2,6],section:[2,8],see:[2,3,4,8,9],seen:6,select:[5,6,9],separ:[3,7],set:[3,4,7],share:[6,7,8,9],shared_mem:[2,6],shared_memori:2,shared_memory_input:2,shared_memory_s:[2,4,6],ship:6,should:[2,3,4,6,7,8],shouldn:8,side:4,signific:8,silenc:9,simpl:[6,7],simultan:3,sinc:[2,6],singl:[2,3,6,9],size:[0,2,5,6,7,8,9,10],size_byt:4,size_of:[3,4,6],sizeof:4,sm70:8,sm80:8,sm:[4,6,9],sm_70:[3,6],sm_72:3,sm_75:3,sm_80:3,sm_86:3,small:9,smaller:[2,3],so:[0,2,6,9],softwar:9,solv:3,some:6,sourc:[6,7],specif:9,specifi:[3,6],standalon:6,standard:9,start:[5,6,7],std:[4,6],storage_s:[2,4,6],store:[2,7,9],stream:7,stride:[2,6,8],struct:3,suggest:[6,9],suggested_ffts_per_block:[4,6],summar:9,support:[3,5,6],t:[2,4,8],tabl:9,take:7,target:[3,4,6,7,8,9],techniqu:6,templat:[2,6],temporari:7,th:[2,4],than:[2,3,4,6],thei:[3,4],them:6,therefor:[6,9],thi:[2,3,4,6,7,8,9],those:2,thread:[1,6,7,9,10],thread_data:[2,6],threadidx:6,three:6,thu:2,time:6,toolkit:[5,6,9],total:4,track:[2,4],trait:[1,2,5,6,9],transform:[3,5,6],trip:[5,7],tune:[3,7],ture:[3,7],tweak:7,two:[2,3,5,6,8],type:[2,6,9,10],type_of:4,typenam:[2,4,6],u:3,under:5,underli:[2,3,4],unless:[3,4,8],unlik:6,unnecessari:5,unnorm:3,unsign:[3,4],unsupport:9,up:[0,2,6,7,9],upcom:7,upon:2,us:[2,3,4,5,7,8,9],usabl:6,usag:1,user:[2,3,4,6,7,9],v100:8,valid:[2,4],valu:[3,6,7,8],value_typ:[2,4,6],variat:6,variou:8,verifi:6,version:[0,2,5,6,7,9],via:9,volta:[3,6,7],wa:[2,4,6],wai:6,want:6,warn:8,we:[4,6,7,8],well:3,what:[5,7],when:[2,3,4,6,8],where:[2,6,9],which:[2,3,4,6,8,9],why:5,window:9,within:[2,3,4],without:7,won:4,work:[8,9],workspac:[0,1,6,9],workspace_s:[2,4],workspace_typ:[2,4,6],world:6,wors:7,would:6,write:7,wsl2:9,x:[3,4,6],xxx:8,y:[3,4,6],yet:[3,9],you:[1,5,6,9],your:5,z:[3,4],zero:4},titles:["&lt;no title&gt;","cuFFTDx API Reference","Execution Methods","Operators","Traits","NVIDIA cuFFTDx","First FFT using cuFFTDx","Achieving high performance","Release Notes","Requirements and Functionality","&lt;no title&gt;","&lt;no title&gt;"],titleterms:{"0":8,"1":8,"3":8,"function":[2,9],"new":8,In:2,Is:4,achiev:7,advanc:7,advic:7,api:1,batch:4,block:[2,3,4],blockdim:3,compil:[6,9],complet:4,configur:3,cufftdx:[1,5,6],custom:6,data:2,descript:[3,4],dim:4,direct:[3,4],element:[3,4],exampl:[2,4],execut:[2,3,4],featur:8,fft:[3,4,6],first:6,format:2,further:7,fusion:7,gener:7,guid:5,happen:6,high:7,highlight:5,hood:6,implicit:4,input:[2,4],issu:8,kernel:[6,7],known:8,make:2,manag:7,max:4,memori:[2,4,7],method:2,next:6,note:8,nvidia:5,oper:3,output:[2,4],per:[3,4],perform:7,precis:[3,4],read:7,refer:[1,7],regist:2,releas:8,requir:[4,9],resolv:8,share:[2,4],size:[3,4],sm:3,storag:4,stride:4,suggest:4,support:9,thread:[2,3,4],trait:4,type:[3,4],under:6,us:6,user:5,valu:[2,4],what:6,why:6,workspac:[2,4],your:6}})