GlslangToSpv.cpp 494 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477
74778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527
75278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314531553165317531853195320532153225323532453255326532753285329533053315332533353345335533653375338533953405341534253435344534553465347534853495350535153525353535453555356535753585359536053615362536353645365536653675368536953705371537253735374537553765377537853795380538153825383538453855386538753885389539053915392539353945395539653975398539954005401540254035404540554065407540854095410541154125413541454155416541754185419542054215422542354245425542654275428542954305431543254335434543554365437543854395440544154425443544454455446544754485449545054515452545354545455545654575458545954605461546254635464546554665467546854695470547154725473547454755476547754785479548054815482548354845485548654875488548954905491549254935494549554965497549854995500550155025503550455055506550755085509551055115512551355145515551655175518551955205521552255235524552555265527552855295530553155325533553455355536553755385539554055415542554355445545554655475548554955505551555255535554555555565557555855595560556155625563556455655566556755685569557055715572557355745575557655775578557955805581558255835584558555865587558855895590559155925593559455955596559755985599560056015602560356045605560656075608560956105611561256135614561556165617561856195620562156225623562456255626562756285629563056315632563356345635563656375638563956405641564256435644564556465647564856495650565156525653565456555656565756585659566056615662566356645665566656675668566956705671567256735674567556765677567856795680568156825683568456855686568756885689569056915692569356945695569656975698569957005701570257035704570557065707570857095710571157125713571457155716571757185719572057215722572357245725572657275728572957305731573257335734573557365737573857395740574157425743574457455746574757485749575057515752575357545755575657575758575957605761576257635764576557665767576857695770577157725773577457755776577
75778577957805781578257835784578557865787578857895790579157925793579457955796579757985799580058015802580358045805580658075808580958105811581258135814581558165817581858195820582158225823582458255826582758285829583058315832583358345835583658375838583958405841584258435844584558465847584858495850585158525853585458555856585758585859586058615862586358645865586658675868586958705871587258735874587558765877587858795880588158825883588458855886588758885889589058915892589358945895589658975898589959005901590259035904590559065907590859095910591159125913591459155916591759185919592059215922592359245925592659275928592959305931593259335934593559365937593859395940594159425943594459455946594759485949595059515952595359545955595659575958595959605961596259635964596559665967596859695970597159725973597459755976597759785979598059815982598359845985598659875988598959905991599259935994599559965997599859996000600160026003600460056006600760086009601060116012601360146015601660176018601960206021602260236024602560266027602860296030603160326033603460356036603760386039604060416042604360446045604660476048604960506051605260536054605560566057605860596060606160626063606460656066606760686069607060716072607360746075607660776078607960806081608260836084608560866087608860896090609160926093609460956096609760986099610061016102610361046105610661076108610961106111611261136114611561166117611861196120612161226123612461256126612761286129613061316132613361346135613661376138613961406141614261436144614561466147614861496150615161526153615461556156615761586159616061616162616361646165616661676168616961706171617261736174617561766177617861796180618161826183618461856186618761886189619061916192619361946195619661976198619962006201620262036204620562066207620862096210621162126213621462156216621762186219622062216222622362246225622662276228622962306231623262336234623562366237623862396240624162426243624462456246624762486249625062516252625362546255625662576258625962606261626262636264626562666267626862696270627162726273627462756276627
76278627962806281628262836284628562866287628862896290629162926293629462956296629762986299630063016302630363046305630663076308630963106311631263136314631563166317631863196320632163226323632463256326632763286329633063316332633363346335633663376338633963406341634263436344634563466347634863496350635163526353635463556356635763586359636063616362636363646365636663676368636963706371637263736374637563766377637863796380638163826383638463856386638763886389639063916392639363946395639663976398639964006401640264036404640564066407640864096410641164126413641464156416641764186419642064216422642364246425642664276428642964306431643264336434643564366437643864396440644164426443644464456446644764486449645064516452645364546455645664576458645964606461646264636464646564666467646864696470647164726473647464756476647764786479648064816482648364846485648664876488648964906491649264936494649564966497649864996500650165026503650465056506650765086509651065116512651365146515651665176518651965206521652265236524652565266527652865296530653165326533653465356536653765386539654065416542654365446545654665476548654965506551655265536554655565566557655865596560656165626563656465656566656765686569657065716572657365746575657665776578657965806581658265836584658565866587658865896590659165926593659465956596659765986599660066016602660366046605660666076608660966106611661266136614661566166617661866196620662166226623662466256626662766286629663066316632663366346635663666376638663966406641664266436644664566466647664866496650665166526653665466556656665766586659666066616662666366646665666666676668666966706671667266736674667566766677667866796680668166826683668466856686668766886689669066916692669366946695669666976698669967006701670267036704670567066707670867096710671167126713671467156716671767186719672067216722672367246725672667276728672967306731673267336734673567366737673867396740674167426743674467456746674767486749675067516752675367546755675667576758675967606761676267636764676567666767676867696770677167726773677467756776677
76778677967806781678267836784678567866787678867896790679167926793679467956796679767986799680068016802680368046805680668076808680968106811681268136814681568166817681868196820682168226823682468256826682768286829683068316832683368346835683668376838683968406841684268436844684568466847684868496850685168526853685468556856685768586859686068616862686368646865686668676868686968706871687268736874687568766877687868796880688168826883688468856886688768886889689068916892689368946895689668976898689969006901690269036904690569066907690869096910691169126913691469156916691769186919692069216922692369246925692669276928692969306931693269336934693569366937693869396940694169426943694469456946694769486949695069516952695369546955695669576958695969606961696269636964696569666967696869696970697169726973697469756976697769786979698069816982698369846985698669876988698969906991699269936994699569966997699869997000700170027003700470057006700770087009701070117012701370147015701670177018701970207021702270237024702570267027702870297030703170327033703470357036703770387039704070417042704370447045704670477048704970507051705270537054705570567057705870597060706170627063706470657066706770687069707070717072707370747075707670777078707970807081708270837084708570867087708870897090709170927093709470957096709770987099710071017102710371047105710671077108710971107111711271137114711571167117711871197120712171227123712471257126712771287129713071317132713371347135713671377138713971407141714271437144714571467147714871497150715171527153715471557156715771587159716071617162716371647165716671677168716971707171717271737174717571767177717871797180718171827183718471857186718771887189719071917192719371947195719671977198719972007201720272037204720572067207720872097210721172127213721472157216721772187219722072217222722372247225722672277228722972307231723272337234723572367237723872397240724172427243724472457246724772487249725072517252725372547255725672577258725972607261726272637264726572667267726872697270727172727273727472757276727
77278727972807281728272837284728572867287728872897290729172927293729472957296729772987299730073017302730373047305730673077308730973107311731273137314731573167317731873197320732173227323732473257326732773287329733073317332733373347335733673377338733973407341734273437344734573467347734873497350735173527353735473557356735773587359736073617362736373647365736673677368736973707371737273737374737573767377737873797380738173827383738473857386738773887389739073917392739373947395739673977398739974007401740274037404740574067407740874097410741174127413741474157416741774187419742074217422742374247425742674277428742974307431743274337434743574367437743874397440744174427443744474457446744774487449745074517452745374547455745674577458745974607461746274637464746574667467746874697470747174727473747474757476747774787479748074817482748374847485748674877488748974907491749274937494749574967497749874997500750175027503750475057506750775087509751075117512751375147515751675177518751975207521752275237524752575267527752875297530753175327533753475357536753775387539754075417542754375447545754675477548754975507551755275537554755575567557755875597560756175627563756475657566756775687569757075717572757375747575757675777578757975807581758275837584758575867587758875897590759175927593759475957596759775987599760076017602760376047605760676077608760976107611761276137614761576167617761876197620762176227623762476257626762776287629763076317632763376347635763676377638763976407641764276437644764576467647764876497650765176527653765476557656765776587659766076617662766376647665766676677668766976707671767276737674767576767677767876797680768176827683768476857686768776887689769076917692769376947695769676977698769977007701770277037704770577067707770877097710771177127713771477157716771777187719772077217722772377247725772677277728772977307731773277337734773577367737773877397740774177427743774477457746774777487749775077517752775377547755775677577758775977607761776277637764776577667767776877697770777177727773777477757776777
77778777977807781778277837784778577867787778877897790779177927793779477957796779777987799780078017802780378047805780678077808780978107811781278137814781578167817781878197820782178227823782478257826782778287829783078317832783378347835783678377838783978407841784278437844784578467847784878497850785178527853785478557856785778587859786078617862786378647865786678677868786978707871787278737874787578767877787878797880788178827883788478857886788778887889789078917892789378947895789678977898789979007901790279037904790579067907790879097910791179127913791479157916791779187919792079217922792379247925792679277928792979307931793279337934793579367937793879397940794179427943794479457946794779487949795079517952795379547955795679577958795979607961796279637964796579667967796879697970797179727973797479757976797779787979798079817982798379847985798679877988798979907991799279937994799579967997799879998000800180028003800480058006800780088009801080118012801380148015801680178018801980208021802280238024802580268027802880298030803180328033803480358036803780388039804080418042804380448045804680478048804980508051805280538054805580568057805880598060806180628063806480658066806780688069807080718072807380748075807680778078807980808081808280838084808580868087808880898090809180928093809480958096809780988099810081018102810381048105810681078108810981108111811281138114811581168117811881198120812181228123812481258126812781288129813081318132813381348135813681378138813981408141814281438144814581468147814881498150815181528153815481558156815781588159816081618162816381648165816681678168816981708171817281738174817581768177817881798180818181828183818481858186818781888189819081918192819381948195819681978198819982008201820282038204820582068207820882098210821182128213821482158216821782188219822082218222822382248225822682278228822982308231823282338234823582368237823882398240824182428243824482458246824782488249825082518252825382548255825682578258825982608261826282638264826582668267826882698270827182728273827482758276827
78278827982808281828282838284828582868287828882898290829182928293829482958296829782988299830083018302830383048305830683078308830983108311831283138314831583168317831883198320832183228323832483258326832783288329833083318332833383348335833683378338833983408341834283438344834583468347834883498350835183528353835483558356835783588359836083618362836383648365836683678368836983708371837283738374837583768377837883798380838183828383838483858386838783888389839083918392839383948395839683978398839984008401840284038404840584068407840884098410841184128413841484158416841784188419842084218422842384248425842684278428842984308431843284338434843584368437843884398440844184428443844484458446844784488449845084518452845384548455845684578458845984608461846284638464846584668467846884698470847184728473847484758476847784788479848084818482848384848485848684878488848984908491849284938494849584968497849884998500850185028503850485058506850785088509851085118512851385148515851685178518851985208521852285238524852585268527852885298530853185328533853485358536853785388539854085418542854385448545854685478548854985508551855285538554855585568557855885598560856185628563856485658566856785688569857085718572857385748575857685778578857985808581858285838584858585868587858885898590859185928593859485958596859785988599860086018602860386048605860686078608860986108611861286138614861586168617861886198620862186228623862486258626862786288629863086318632863386348635863686378638863986408641864286438644864586468647864886498650865186528653865486558656865786588659866086618662866386648665866686678668866986708671867286738674867586768677867886798680868186828683868486858686868786888689869086918692869386948695869686978698869987008701870287038704870587068707870887098710871187128713871487158716871787188719872087218722872387248725872687278728872987308731873287338734873587368737873887398740874187428743874487458746874787488749875087518752875387548755875687578758875987608761876287638764876587668767876887698770877187728773877487758776877
78778877987808781878287838784878587868787878887898790879187928793879487958796879787988799880088018802880388048805880688078808880988108811881288138814881588168817881888198820882188228823882488258826882788288829883088318832883388348835883688378838883988408841884288438844884588468847884888498850885188528853885488558856885788588859886088618862886388648865886688678868886988708871887288738874887588768877887888798880888188828883888488858886888788888889889088918892889388948895889688978898889989008901890289038904890589068907890889098910891189128913891489158916891789188919892089218922892389248925892689278928892989308931893289338934893589368937893889398940894189428943894489458946894789488949895089518952895389548955895689578958895989608961896289638964896589668967896889698970897189728973897489758976897789788979898089818982898389848985898689878988898989908991899289938994899589968997899889999000900190029003900490059006900790089009901090119012901390149015901690179018901990209021902290239024902590269027902890299030903190329033903490359036903790389039904090419042904390449045904690479048904990509051905290539054905590569057905890599060906190629063906490659066906790689069907090719072907390749075907690779078907990809081908290839084908590869087908890899090909190929093909490959096909790989099910091019102910391049105910691079108910991109111911291139114911591169117911891199120912191229123912491259126912791289129913091319132913391349135913691379138913991409141914291439144914591469147914891499150915191529153915491559156915791589159916091619162916391649165916691679168916991709171917291739174917591769177917891799180918191829183918491859186918791889189919091919192919391949195919691979198919992009201920292039204920592069207920892099210921192129213921492159216921792189219922092219222922392249225922692279228922992309231923292339234923592369237923892399240924192429243924492459246924792489249925092519252925392549255925692579258925992609261926292639264926592669267926892699270927192729273927492759276927
79278927992809281928292839284928592869287928892899290929192929293929492959296929792989299930093019302930393049305930693079308930993109311931293139314931593169317931893199320932193229323932493259326932793289329933093319332933393349335933693379338933993409341934293439344934593469347934893499350935193529353935493559356935793589359936093619362936393649365936693679368936993709371937293739374937593769377937893799380938193829383938493859386938793889389939093919392939393949395939693979398939994009401940294039404940594069407940894099410941194129413941494159416941794189419942094219422942394249425942694279428942994309431943294339434943594369437943894399440944194429443944494459446944794489449945094519452945394549455945694579458945994609461946294639464946594669467946894699470947194729473947494759476947794789479948094819482948394849485948694879488948994909491949294939494949594969497949894999500950195029503950495059506950795089509951095119512951395149515951695179518951995209521952295239524952595269527952895299530953195329533953495359536953795389539954095419542954395449545954695479548954995509551955295539554955595569557955895599560956195629563956495659566956795689569957095719572957395749575957695779578957995809581958295839584958595869587958895899590959195929593959495959596959795989599960096019602960396049605960696079608960996109611961296139614961596169617961896199620962196229623962496259626962796289629963096319632963396349635963696379638963996409641964296439644964596469647964896499650965196529653965496559656965796589659966096619662966396649665966696679668966996709671967296739674967596769677967896799680968196829683968496859686968796889689969096919692969396949695969696979698969997009701970297039704970597069707970897099710971197129713971497159716971797189719972097219722972397249725972697279728972997309731973297339734973597369737973897399740974197429743974497459746974797489749975097519752975397549755975697579758975997609761976297639764976597669767976897699770977197729773977497759776977
79778977997809781978297839784978597869787978897899790979197929793979497959796979797989799980098019802980398049805980698079808980998109811981298139814981598169817981898199820982198229823982498259826982798289829983098319832983398349835983698379838983998409841984298439844984598469847984898499850985198529853985498559856985798589859986098619862986398649865986698679868986998709871987298739874987598769877987898799880988198829883988498859886988798889889989098919892989398949895989698979898989999009901990299039904990599069907990899099910991199129913991499159916991799189919992099219922992399249925992699279928992999309931993299339934993599369937993899399940994199429943994499459946994799489949995099519952995399549955995699579958995999609961996299639964996599669967996899699970997199729973997499759976997799789979998099819982998399849985998699879988998999909991999299939994999599969997999899991000010001100021000310004100051000610007100081000910010100111001210013100141001510016100171001810019100201002110022100231002410025100261002710028100291003010031100321003310034100351003610037100381003910040100411004210043100441004510046100471004810049100501005110052100531005410055100561005710058100591006010061100621006310064100651006610067100681006910070100711007210073100741007510076100771007810079100801008110082100831008410085100861008710088100891009010091100921009310094100951009610097100981009910100101011010210103101041010510106101071010810109101101011110112101131011410115101161011710118101191012010121101221012310124101251012610127101281012910130101311013210133101341013510136101371013810139101401014110142101431014410145101461014710148101491015010151101521015310154101551015610157101581015910160101611016210163101641016510166101671016810169101701017110172101731017410175101761017710178101791018010181101821018310184101851018610187101881018910190101911019210193101941019510196101971019810199102001020110202102031020410205102061020710208102091021010211102121021310214102151021610217102181021910220102211
02221022310224102251022610227102281022910230102311023210233102341023510236102371023810239102401024110242102431024410245102461024710248102491025010251102521025310254102551025610257102581025910260102611026210263102641026510266102671026810269102701027110272102731027410275102761027710278102791028010281102821028310284102851028610287102881028910290102911029210293102941029510296102971029810299103001030110302103031030410305103061030710308103091031010311103121031310314103151031610317103181031910320103211032210323103241032510326103271032810329103301033110332103331033410335103361033710338103391034010341103421034310344103451034610347103481034910350103511035210353103541035510356103571035810359103601036110362103631036410365103661036710368103691037010371103721037310374103751037610377103781037910380103811038210383103841038510386103871038810389103901039110392103931039410395103961039710398103991040010401104021040310404104051040610407104081040910410104111041210413104141041510416104171041810419104201042110422104231042410425104261042710428104291043010431104321043310434104351043610437104381043910440104411044210443104441044510446104471044810449104501045110452104531045410455104561045710458104591046010461104621046310464104651046610467104681046910470104711047210473104741047510476104771047810479104801048110482104831048410485104861048710488104891049010491104921049310494104951049610497104981049910500105011050210503105041050510506105071050810509105101051110512105131051410515105161051710518105191052010521105221052310524105251052610527105281052910530105311053210533105341053510536105371053810539105401054110542105431054410545105461054710548105491055010551105521055310554105551055610557105581055910560105611056210563105641056510566105671056810569105701057110572105731057410575105761057710578105791058010581105821058310584105851058610587105881058910590105911059210593105941059510596105971059810599106001060110602106031060410605106061060710608106091061010611106121061310614106151061610617106181061910620106211
06221062310624106251062610627106281062910630106311063210633106341063510636106371063810639106401064110642106431064410645106461064710648106491065010651106521065310654106551065610657106581065910660106611066210663106641066510666106671066810669106701067110672106731067410675106761067710678106791068010681106821068310684106851068610687106881068910690106911069210693106941069510696106971069810699107001070110702107031070410705107061070710708107091071010711107121071310714107151071610717107181071910720107211072210723107241072510726107271072810729107301073110732107331073410735107361073710738107391074010741107421074310744107451074610747107481074910750107511075210753107541075510756107571075810759107601076110762107631076410765107661076710768107691077010771107721077310774107751077610777107781077910780107811078210783107841078510786107871078810789107901079110792107931079410795107961079710798107991080010801108021080310804108051080610807108081080910810108111081210813108141081510816108171081810819108201082110822108231082410825108261082710828108291083010831108321083310834108351083610837108381083910840108411084210843108441084510846108471084810849108501085110852108531085410855108561085710858108591086010861108621086310864108651086610867108681086910870108711087210873108741087510876108771087810879108801088110882108831088410885108861088710888108891089010891108921089310894108951089610897108981089910900109011090210903109041090510906109071090810909109101091110912109131091410915109161091710918109191092010921109221092310924109251092610927109281092910930109311093210933109341093510936109371093810939109401094110942109431094410945109461094710948109491095010951109521095310954109551095610957109581095910960109611096210963109641096510966109671096810969109701097110972109731097410975109761097710978109791098010981109821098310984109851098610987109881098910990109911099210993109941099510996109971099810999110001100111002110031100411005110061100711008110091101011011110121101311014110151101611017110181101911020110211
1022110231102411025110261102711028110291103011031110321103311034110351103611037110381103911040110411104211043110441104511046110471104811049110501105111052110531105411055110561105711058110591106011061110621106311064110651106611067110681106911070110711107211073110741107511076110771107811079110801108111082110831108411085110861108711088110891109011091110921109311094110951109611097110981109911100111011110211103111041110511106111071110811109111101111111112
  1. //
  2. // Copyright (C) 2014-2016 LunarG, Inc.
  3. // Copyright (C) 2015-2020 Google, Inc.
  4. // Copyright (C) 2017, 2022-2025 Arm Limited.
  5. // Modifications Copyright (C) 2020 Advanced Micro Devices, Inc. All rights reserved.
  6. //
  7. // All rights reserved.
  8. //
  9. // Redistribution and use in source and binary forms, with or without
  10. // modification, are permitted provided that the following conditions
  11. // are met:
  12. //
  13. // Redistributions of source code must retain the above copyright
  14. // notice, this list of conditions and the following disclaimer.
  15. //
  16. // Redistributions in binary form must reproduce the above
  17. // copyright notice, this list of conditions and the following
  18. // disclaimer in the documentation and/or other materials provided
  19. // with the distribution.
  20. //
  21. // Neither the name of 3Dlabs Inc. Ltd. nor the names of its
  22. // contributors may be used to endorse or promote products derived
  23. // from this software without specific prior written permission.
  24. //
  25. // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  26. // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  27. // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
  28. // FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
  29. // COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
  30. // INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
  31. // BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  32. // LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  33. // CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  34. // LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
  35. // ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  36. // POSSIBILITY OF SUCH DAMAGE.
  37. //
  38. // Visit the nodes in the glslang intermediate tree representation to
  39. // translate them to SPIR-V.
  40. //
  41. #include "spirv.hpp11"
  42. #include "GlslangToSpv.h"
  43. #include "SpvBuilder.h"
  44. #include "SpvTools.h"
  45. #include "spvUtil.h"
  46. namespace spv {
  47. #include "GLSL.std.450.h"
  48. #include "GLSL.ext.KHR.h"
  49. #include "GLSL.ext.EXT.h"
  50. #include "GLSL.ext.AMD.h"
  51. #include "GLSL.ext.NV.h"
  52. #include "GLSL.ext.ARM.h"
  53. #include "GLSL.ext.QCOM.h"
  54. #include "NonSemanticDebugPrintf.h"
  55. }
  56. // Glslang includes
  57. #include "../glslang/MachineIndependent/localintermediate.h"
  58. #include "../glslang/MachineIndependent/SymbolTable.h"
  59. #include "../glslang/Include/Common.h"
  60. // Build-time generated includes
  61. #include "glslang/build_info.h"
  62. #include <fstream>
  63. #include <iomanip>
  64. #include <list>
  65. #include <map>
  66. #include <optional>
  67. #include <stack>
  68. #include <string>
  69. #include <vector>
  70. namespace {
  71. namespace {
  72. class SpecConstantOpModeGuard {
  73. public:
  74. SpecConstantOpModeGuard(spv::Builder* builder)
  75. : builder_(builder) {
  76. previous_flag_ = builder->isInSpecConstCodeGenMode();
  77. }
  78. ~SpecConstantOpModeGuard() {
  79. previous_flag_ ? builder_->setToSpecConstCodeGenMode()
  80. : builder_->setToNormalCodeGenMode();
  81. }
  82. void turnOnSpecConstantOpMode() {
  83. builder_->setToSpecConstCodeGenMode();
  84. }
  85. private:
  86. spv::Builder* builder_;
  87. bool previous_flag_;
  88. };
  89. struct OpDecorations {
  90. public:
  91. OpDecorations(spv::Decoration precision, spv::Decoration noContraction, spv::Decoration nonUniform) :
  92. precision(precision)
  93. ,
  94. noContraction(noContraction),
  95. nonUniform(nonUniform)
  96. { }
  97. spv::Decoration precision;
  98. void addNoContraction(spv::Builder& builder, spv::Id t) { builder.addDecoration(t, noContraction); }
  99. void addNonUniform(spv::Builder& builder, spv::Id t) { builder.addDecoration(t, nonUniform); }
  100. protected:
  101. spv::Decoration noContraction;
  102. spv::Decoration nonUniform;
  103. };
  104. } // namespace
  105. //
  106. // The main holder of information for translating glslang to SPIR-V.
  107. //
  108. // Derives from the AST walking base class.
  109. //
  110. class TGlslangToSpvTraverser : public glslang::TIntermTraverser {
  111. public:
  112. TGlslangToSpvTraverser(unsigned int spvVersion, const glslang::TIntermediate*, spv::SpvBuildLogger* logger,
  113. glslang::SpvOptions& options);
  114. virtual ~TGlslangToSpvTraverser() { }
  115. bool visitAggregate(glslang::TVisit, glslang::TIntermAggregate*);
  116. bool visitBinary(glslang::TVisit, glslang::TIntermBinary*);
  117. void visitConstantUnion(glslang::TIntermConstantUnion*);
  118. bool visitSelection(glslang::TVisit, glslang::TIntermSelection*);
  119. bool visitSwitch(glslang::TVisit, glslang::TIntermSwitch*);
  120. void visitSymbol(glslang::TIntermSymbol* symbol);
  121. bool visitUnary(glslang::TVisit, glslang::TIntermUnary*);
  122. bool visitLoop(glslang::TVisit, glslang::TIntermLoop*);
  123. bool visitBranch(glslang::TVisit visit, glslang::TIntermBranch*);
  124. void finishSpv(bool compileOnly);
  125. void dumpSpv(std::vector<unsigned int>& out);
  126. protected:
  127. TGlslangToSpvTraverser(TGlslangToSpvTraverser&);
  128. TGlslangToSpvTraverser& operator=(TGlslangToSpvTraverser&);
  129. spv::Decoration TranslateInterpolationDecoration(const glslang::TQualifier& qualifier);
  130. spv::Decoration TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier);
  131. spv::Decoration TranslateNonUniformDecoration(const glslang::TQualifier& qualifier);
  132. spv::Decoration TranslateNonUniformDecoration(const spv::Builder::AccessChain::CoherentFlags& coherentFlags);
  133. spv::Builder::AccessChain::CoherentFlags TranslateCoherent(const glslang::TType& type);
  134. spv::MemoryAccessMask TranslateMemoryAccess(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  135. spv::ImageOperandsMask TranslateImageOperands(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  136. spv::Scope TranslateMemoryScope(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  137. spv::BuiltIn TranslateBuiltInDecoration(glslang::TBuiltInVariable, bool memberDeclaration);
  138. spv::ImageFormat TranslateImageFormat(const glslang::TType& type);
  139. spv::SelectionControlMask TranslateSelectionControl(const glslang::TIntermSelection&) const;
  140. spv::SelectionControlMask TranslateSwitchControl(const glslang::TIntermSwitch&) const;
  141. spv::LoopControlMask TranslateLoopControl(const glslang::TIntermLoop&, std::vector<unsigned int>& operands) const;
  142. spv::StorageClass TranslateStorageClass(const glslang::TType&);
  143. void TranslateLiterals(const glslang::TVector<const glslang::TIntermConstantUnion*>&, std::vector<unsigned>&) const;
  144. void addIndirectionIndexCapabilities(const glslang::TType& baseType, const glslang::TType& indexType);
  145. spv::Id createSpvVariable(const glslang::TIntermSymbol*, spv::Id forcedType);
  146. spv::Id getSampledType(const glslang::TSampler&);
  147. spv::Id getInvertedSwizzleType(const glslang::TIntermTyped&);
  148. spv::Id createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped&, spv::Id parentResult);
  149. void convertSwizzle(const glslang::TIntermAggregate&, std::vector<unsigned>& swizzle);
  150. spv::Id convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly = false);
  151. spv::Id convertGlslangToSpvType(const glslang::TType& type, glslang::TLayoutPacking, const glslang::TQualifier&,
  152. bool lastBufferBlockMember, bool forwardReferenceOnly = false);
  153. void applySpirvDecorate(const glslang::TType& type, spv::Id id, std::optional<int> member);
  154. bool filterMember(const glslang::TType& member);
  155. spv::Id convertGlslangStructToSpvType(const glslang::TType&, const glslang::TTypeList* glslangStruct,
  156. glslang::TLayoutPacking, const glslang::TQualifier&);
  157. spv::LinkageType convertGlslangLinkageToSpv(glslang::TLinkType glslangLinkType);
  158. void decorateStructType(const glslang::TType&, const glslang::TTypeList* glslangStruct, glslang::TLayoutPacking,
  159. const glslang::TQualifier&, spv::Id, const std::vector<spv::Id>& spvMembers);
  160. spv::Id makeArraySizeId(const glslang::TArraySizes&, int dim, bool allowZero = false, bool boolType = false);
  161. spv::Id accessChainLoad(const glslang::TType& type);
  162. void accessChainStore(const glslang::TType& type, spv::Id rvalue);
  163. void multiTypeStore(const glslang::TType&, spv::Id rValue);
  164. spv::Id convertLoadedBoolInUniformToUint(const glslang::TType& type, spv::Id nominalTypeId, spv::Id loadedId);
  165. glslang::TLayoutPacking getExplicitLayout(const glslang::TType& type) const;
  166. int getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  167. int getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  168. void updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType, int& currentOffset,
  169. int& nextOffset, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  170. void declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember);
  171. bool isShaderEntryPoint(const glslang::TIntermAggregate* node);
  172. bool writableParam(glslang::TStorageQualifier) const;
  173. bool originalParam(glslang::TStorageQualifier, const glslang::TType&, bool implicitThisParam);
  174. void makeFunctions(const glslang::TIntermSequence&);
  175. void makeGlobalInitializers(const glslang::TIntermSequence&);
  176. void collectRayTracingLinkerObjects();
  177. void visitFunctions(const glslang::TIntermSequence&);
  178. void handleFunctionEntry(const glslang::TIntermAggregate* node);
  179. void translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments,
  180. spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags);
  181. void translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments);
  182. spv::Id createImageTextureFunctionCall(glslang::TIntermOperator* node);
  183. spv::Id handleUserFunctionCall(const glslang::TIntermAggregate*);
  184. spv::Id createBinaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right,
  185. glslang::TBasicType typeProxy, bool reduceComparison = true);
  186. spv::Id createBinaryMatrixOperation(spv::Op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right);
  187. spv::Id createUnaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id operand,
  188. glslang::TBasicType typeProxy,
  189. const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
  190. const glslang::TType &opType);
  191. spv::Id createUnaryMatrixOperation(spv::Op op, OpDecorations&, spv::Id typeId, spv::Id operand,
  192. glslang::TBasicType typeProxy);
  193. spv::Id createConversion(glslang::TOperator op, OpDecorations&, spv::Id destTypeId, spv::Id operand,
  194. glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType);
  195. spv::Id createIntWidthConversion(spv::Id operand, int vectorSize, spv::Id destType,
  196. glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType);
  197. spv::Id makeSmearedConstant(spv::Id constant, int vectorSize);
  198. spv::Id createAtomicOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId,
  199. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy,
  200. const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
  201. const glslang::TType &opType);
  202. spv::Id createInvocationsOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands,
  203. glslang::TBasicType typeProxy);
  204. spv::Id CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,
  205. spv::Id typeId, std::vector<spv::Id>& operands);
  206. spv::Id createSubgroupOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands,
  207. glslang::TBasicType typeProxy);
  208. spv::Id createMiscOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId,
  209. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy);
  210. spv::Id createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId);
  211. spv::Id getSymbolId(const glslang::TIntermSymbol* node);
  212. void addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier & qualifier);
  213. bool hasQCOMImageProceessingDecoration(spv::Id id, spv::Decoration decor);
  214. void addImageProcessingQCOMDecoration(spv::Id id, spv::Decoration decor);
  215. void addImageProcessing2QCOMDecoration(spv::Id id, bool isForGather);
  216. spv::Id createSpvConstant(const glslang::TIntermTyped&);
  217. spv::Id createSpvConstantFromConstUnionArray(const glslang::TType& type, const glslang::TConstUnionArray&,
  218. int& nextConst, bool specConstant);
  219. bool isTrivialLeaf(const glslang::TIntermTyped* node);
  220. bool isTrivial(const glslang::TIntermTyped* node);
  221. spv::Id createShortCircuit(glslang::TOperator, glslang::TIntermTyped& left, glslang::TIntermTyped& right);
  222. spv::Id getExtBuiltins(const char* name);
  223. std::pair<spv::Id, spv::Id> getForcedType(glslang::TBuiltInVariable builtIn, const glslang::TType&);
  224. spv::Id translateForcedType(spv::Id object);
  225. spv::Id createCompositeConstruct(spv::Id typeId, std::vector<spv::Id> constituents);
  226. glslang::SpvOptions& options;
  227. spv::Function* shaderEntry;
  228. spv::Function* currentFunction;
  229. spv::Instruction* entryPoint;
  230. int sequenceDepth;
  231. spv::SpvBuildLogger* logger;
  232. // There is a 1:1 mapping between a spv builder and a module; this is thread safe
  233. spv::Builder builder;
  234. bool inEntryPoint;
  235. bool entryPointTerminated;
  236. bool linkageOnly; // true when visiting the set of objects in the AST present only for
  237. // establishing interface, whether or not they were statically used
  238. std::set<spv::Id> iOSet; // all input/output variables from either static use or declaration of interface
  239. const glslang::TIntermediate* glslangIntermediate;
  240. bool nanMinMaxClamp; // true if use NMin/NMax/NClamp instead of FMin/FMax/FClamp
  241. spv::Id stdBuiltins;
  242. spv::Id nonSemanticDebugPrintf;
  243. std::unordered_map<std::string, spv::Id> extBuiltinMap;
  244. std::unordered_map<long long, spv::Id> symbolValues;
  245. std::unordered_map<uint32_t, spv::Id> builtInVariableIds;
  246. std::unordered_set<long long> rValueParameters; // set of formal function parameters passed as rValues,
  247. // rather than a pointer
  248. std::unordered_map<std::string, spv::Function*> functionMap;
  249. std::unordered_map<const glslang::TTypeList*, spv::Id> structMap[glslang::ElpCount][glslang::ElmCount];
  250. // for mapping glslang block indices to spv indices (e.g., due to hidden members):
  251. std::unordered_map<long long, std::vector<int>> memberRemapper;
  252. // for mapping glslang symbol struct to symbol Id
  253. std::unordered_map<const glslang::TTypeList*, long long> glslangTypeToIdMap;
  254. std::stack<bool> breakForLoop; // false means break for switch
  255. std::unordered_map<std::string, const glslang::TIntermSymbol*> counterOriginator;
  256. // Map pointee types for EbtReference to their forward pointers
  257. std::map<const glslang::TType *, spv::Id> forwardPointers;
  258. // Type forcing, for when SPIR-V wants a different type than the AST,
  259. // requiring local translation to and from SPIR-V type on every access.
  260. // Maps <builtin-variable-id -> AST-required-type-id>
  261. std::unordered_map<spv::Id, spv::Id> forceType;
  262. // Used by Task shader while generating opearnds for OpEmitMeshTasksEXT
  263. spv::Id taskPayloadID;
  264. // Used later for generating OpTraceKHR/OpExecuteCallableKHR/OpHitObjectRecordHit*/OpHitObjectGetShaderBindingTableData
  265. std::unordered_map<unsigned int, glslang::TIntermSymbol *> locationToSymbol[4];
  266. std::unordered_map<spv::Id, std::vector<spv::Decoration> > idToQCOMDecorations;
  267. };
  268. //
  269. // Helper functions for translating glslang representations to SPIR-V enumerants.
  270. //
  271. // Translate glslang profile to SPIR-V source language.
  272. spv::SourceLanguage TranslateSourceLanguage(glslang::EShSource source, EProfile profile)
  273. {
  274. switch (source) {
  275. case glslang::EShSourceGlsl:
  276. switch (profile) {
  277. case ENoProfile:
  278. case ECoreProfile:
  279. case ECompatibilityProfile:
  280. return spv::SourceLanguage::GLSL;
  281. case EEsProfile:
  282. return spv::SourceLanguage::ESSL;
  283. default:
  284. return spv::SourceLanguage::Unknown;
  285. }
  286. case glslang::EShSourceHlsl:
  287. return spv::SourceLanguage::HLSL;
  288. default:
  289. return spv::SourceLanguage::Unknown;
  290. }
  291. }
  292. // Translate glslang language (stage) to SPIR-V execution model.
  293. spv::ExecutionModel TranslateExecutionModel(EShLanguage stage, bool isMeshShaderEXT = false)
  294. {
  295. switch (stage) {
  296. case EShLangVertex: return spv::ExecutionModel::Vertex;
  297. case EShLangFragment: return spv::ExecutionModel::Fragment;
  298. case EShLangCompute: return spv::ExecutionModel::GLCompute;
  299. case EShLangTessControl: return spv::ExecutionModel::TessellationControl;
  300. case EShLangTessEvaluation: return spv::ExecutionModel::TessellationEvaluation;
  301. case EShLangGeometry: return spv::ExecutionModel::Geometry;
  302. case EShLangRayGen: return spv::ExecutionModel::RayGenerationKHR;
  303. case EShLangIntersect: return spv::ExecutionModel::IntersectionKHR;
  304. case EShLangAnyHit: return spv::ExecutionModel::AnyHitKHR;
  305. case EShLangClosestHit: return spv::ExecutionModel::ClosestHitKHR;
  306. case EShLangMiss: return spv::ExecutionModel::MissKHR;
  307. case EShLangCallable: return spv::ExecutionModel::CallableKHR;
  308. case EShLangTask: return (isMeshShaderEXT)? spv::ExecutionModel::TaskEXT : spv::ExecutionModel::TaskNV;
  309. case EShLangMesh: return (isMeshShaderEXT)? spv::ExecutionModel::MeshEXT : spv::ExecutionModel::MeshNV;
  310. default:
  311. assert(0);
  312. return spv::ExecutionModel::Fragment;
  313. }
  314. }
  315. // Translate glslang sampler type to SPIR-V dimensionality.
  316. spv::Dim TranslateDimensionality(const glslang::TSampler& sampler)
  317. {
  318. switch (sampler.dim) {
  319. case glslang::Esd1D: return spv::Dim::Dim1D;
  320. case glslang::Esd2D: return spv::Dim::Dim2D;
  321. case glslang::Esd3D: return spv::Dim::Dim3D;
  322. case glslang::EsdCube: return spv::Dim::Cube;
  323. case glslang::EsdRect: return spv::Dim::Rect;
  324. case glslang::EsdBuffer: return spv::Dim::Buffer;
  325. case glslang::EsdSubpass: return spv::Dim::SubpassData;
  326. case glslang::EsdAttachmentEXT: return spv::Dim::TileImageDataEXT;
  327. default:
  328. assert(0);
  329. return spv::Dim::Dim2D;
  330. }
  331. }
  332. // Translate glslang precision to SPIR-V precision decorations.
  333. spv::Decoration TranslatePrecisionDecoration(glslang::TPrecisionQualifier glslangPrecision)
  334. {
  335. switch (glslangPrecision) {
  336. case glslang::EpqLow: return spv::Decoration::RelaxedPrecision;
  337. case glslang::EpqMedium: return spv::Decoration::RelaxedPrecision;
  338. default:
  339. return spv::NoPrecision;
  340. }
  341. }
  342. // Translate glslang type to SPIR-V precision decorations.
  343. spv::Decoration TranslatePrecisionDecoration(const glslang::TType& type)
  344. {
  345. return TranslatePrecisionDecoration(type.getQualifier().precision);
  346. }
  347. // Translate glslang type to SPIR-V block decorations.
  348. spv::Decoration TranslateBlockDecoration(const glslang::TStorageQualifier storage, bool useStorageBuffer)
  349. {
  350. switch (storage) {
  351. case glslang::EvqUniform: return spv::Decoration::Block;
  352. case glslang::EvqBuffer: return useStorageBuffer ? spv::Decoration::Block : spv::Decoration::BufferBlock;
  353. case glslang::EvqVaryingIn: return spv::Decoration::Block;
  354. case glslang::EvqVaryingOut: return spv::Decoration::Block;
  355. case glslang::EvqShared: return spv::Decoration::Block;
  356. case glslang::EvqPayload: return spv::Decoration::Block;
  357. case glslang::EvqPayloadIn: return spv::Decoration::Block;
  358. case glslang::EvqHitAttr: return spv::Decoration::Block;
  359. case glslang::EvqCallableData: return spv::Decoration::Block;
  360. case glslang::EvqCallableDataIn: return spv::Decoration::Block;
  361. case glslang::EvqHitObjectAttrNV: return spv::Decoration::Block;
  362. default:
  363. assert(0);
  364. break;
  365. }
  366. return spv::Decoration::Max;
  367. }
  368. // Translate glslang type to SPIR-V memory decorations.
  369. void TranslateMemoryDecoration(const glslang::TQualifier& qualifier, std::vector<spv::Decoration>& memory,
  370. bool useVulkanMemoryModel)
  371. {
  372. if (!useVulkanMemoryModel) {
  373. if (qualifier.isVolatile()) {
  374. memory.push_back(spv::Decoration::Volatile);
  375. memory.push_back(spv::Decoration::Coherent);
  376. } else if (qualifier.isCoherent()) {
  377. memory.push_back(spv::Decoration::Coherent);
  378. }
  379. }
  380. if (qualifier.isRestrict())
  381. memory.push_back(spv::Decoration::Restrict);
  382. if (qualifier.isReadOnly())
  383. memory.push_back(spv::Decoration::NonWritable);
  384. if (qualifier.isWriteOnly())
  385. memory.push_back(spv::Decoration::NonReadable);
  386. }
  387. // Translate glslang type to SPIR-V layout decorations.
  388. spv::Decoration TranslateLayoutDecoration(const glslang::TType& type, glslang::TLayoutMatrix matrixLayout)
  389. {
  390. if (type.isMatrix()) {
  391. switch (matrixLayout) {
  392. case glslang::ElmRowMajor:
  393. return spv::Decoration::RowMajor;
  394. case glslang::ElmColumnMajor:
  395. return spv::Decoration::ColMajor;
  396. default:
  397. // opaque layouts don't need a majorness
  398. return spv::Decoration::Max;
  399. }
  400. } else {
  401. switch (type.getBasicType()) {
  402. default:
  403. return spv::Decoration::Max;
  404. break;
  405. case glslang::EbtBlock:
  406. switch (type.getQualifier().storage) {
  407. case glslang::EvqShared:
  408. case glslang::EvqUniform:
  409. case glslang::EvqBuffer:
  410. switch (type.getQualifier().layoutPacking) {
  411. case glslang::ElpShared: return spv::Decoration::GLSLShared;
  412. case glslang::ElpPacked: return spv::Decoration::GLSLPacked;
  413. default:
  414. return spv::Decoration::Max;
  415. }
  416. case glslang::EvqVaryingIn:
  417. case glslang::EvqVaryingOut:
  418. if (type.getQualifier().isTaskMemory()) {
  419. switch (type.getQualifier().layoutPacking) {
  420. case glslang::ElpShared: return spv::Decoration::GLSLShared;
  421. case glslang::ElpPacked: return spv::Decoration::GLSLPacked;
  422. default: break;
  423. }
  424. } else {
  425. assert(type.getQualifier().layoutPacking == glslang::ElpNone);
  426. }
  427. return spv::Decoration::Max;
  428. case glslang::EvqPayload:
  429. case glslang::EvqPayloadIn:
  430. case glslang::EvqHitAttr:
  431. case glslang::EvqCallableData:
  432. case glslang::EvqCallableDataIn:
  433. case glslang::EvqHitObjectAttrNV:
  434. return spv::Decoration::Max;
  435. default:
  436. assert(0);
  437. return spv::Decoration::Max;
  438. }
  439. }
  440. }
  441. }
  442. // Translate glslang type to SPIR-V interpolation decorations.
  443. // Returns spv::Decoration::Max when no decoration
  444. // should be applied.
  445. spv::Decoration TGlslangToSpvTraverser::TranslateInterpolationDecoration(const glslang::TQualifier& qualifier)
  446. {
  447. if (qualifier.smooth)
  448. // Smooth decoration doesn't exist in SPIR-V 1.0
  449. return spv::Decoration::Max;
  450. else if (qualifier.isNonPerspective())
  451. return spv::Decoration::NoPerspective;
  452. else if (qualifier.flat)
  453. return spv::Decoration::Flat;
  454. else if (qualifier.isExplicitInterpolation()) {
  455. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  456. return spv::Decoration::ExplicitInterpAMD;
  457. }
  458. else
  459. return spv::Decoration::Max;
  460. }
  461. // Translate glslang type to SPIR-V auxiliary storage decorations.
  462. // Returns spv::Decoration::Max when no decoration
  463. // should be applied.
  464. spv::Decoration TGlslangToSpvTraverser::TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier)
  465. {
  466. if (qualifier.centroid)
  467. return spv::Decoration::Centroid;
  468. else if (qualifier.patch)
  469. return spv::Decoration::Patch;
  470. else if (qualifier.sample) {
  471. builder.addCapability(spv::Capability::SampleRateShading);
  472. return spv::Decoration::Sample;
  473. }
  474. return spv::Decoration::Max;
  475. }
  476. // If glslang type is invariant, return SPIR-V invariant decoration.
  477. spv::Decoration TranslateInvariantDecoration(const glslang::TQualifier& qualifier)
  478. {
  479. if (qualifier.invariant)
  480. return spv::Decoration::Invariant;
  481. else
  482. return spv::Decoration::Max;
  483. }
  484. // If glslang type is noContraction, return SPIR-V NoContraction decoration.
  485. spv::Decoration TranslateNoContractionDecoration(const glslang::TQualifier& qualifier)
  486. {
  487. if (qualifier.isNoContraction())
  488. return spv::Decoration::NoContraction;
  489. else
  490. return spv::Decoration::Max;
  491. }
  492. // If glslang type is nonUniform, return SPIR-V NonUniform decoration.
  493. spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(const glslang::TQualifier& qualifier)
  494. {
  495. if (qualifier.isNonUniform()) {
  496. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  497. builder.addCapability(spv::Capability::ShaderNonUniformEXT);
  498. return spv::Decoration::NonUniformEXT;
  499. } else
  500. return spv::Decoration::Max;
  501. }
  502. // If lvalue flags contains nonUniform, return SPIR-V NonUniform decoration.
  503. spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(
  504. const spv::Builder::AccessChain::CoherentFlags& coherentFlags)
  505. {
  506. if (coherentFlags.isNonUniform()) {
  507. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  508. builder.addCapability(spv::Capability::ShaderNonUniformEXT);
  509. return spv::Decoration::NonUniformEXT;
  510. } else
  511. return spv::Decoration::Max;
  512. }
  513. spv::MemoryAccessMask TGlslangToSpvTraverser::TranslateMemoryAccess(
  514. const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  515. {
  516. spv::MemoryAccessMask mask = spv::MemoryAccessMask::MaskNone;
  517. if (!glslangIntermediate->usingVulkanMemoryModel() || coherentFlags.isImage)
  518. return mask;
  519. if (coherentFlags.isVolatile() || coherentFlags.anyCoherent()) {
  520. mask = mask | spv::MemoryAccessMask::MakePointerAvailableKHR |
  521. spv::MemoryAccessMask::MakePointerVisibleKHR;
  522. }
  523. if (coherentFlags.nonprivate) {
  524. mask = mask | spv::MemoryAccessMask::NonPrivatePointerKHR;
  525. }
  526. if (coherentFlags.volatil) {
  527. mask = mask | spv::MemoryAccessMask::Volatile;
  528. }
  529. if (coherentFlags.nontemporal) {
  530. mask = mask | spv::MemoryAccessMask::Nontemporal;
  531. }
  532. if (mask != spv::MemoryAccessMask::MaskNone) {
  533. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  534. }
  535. return mask;
  536. }
  537. spv::ImageOperandsMask TGlslangToSpvTraverser::TranslateImageOperands(
  538. const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  539. {
  540. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  541. if (!glslangIntermediate->usingVulkanMemoryModel())
  542. return mask;
  543. if (coherentFlags.volatil ||
  544. coherentFlags.anyCoherent()) {
  545. mask = mask | spv::ImageOperandsMask::MakeTexelAvailableKHR |
  546. spv::ImageOperandsMask::MakeTexelVisibleKHR;
  547. }
  548. if (coherentFlags.nonprivate) {
  549. mask = mask | spv::ImageOperandsMask::NonPrivateTexelKHR;
  550. }
  551. if (coherentFlags.volatil) {
  552. mask = mask | spv::ImageOperandsMask::VolatileTexelKHR;
  553. }
  554. if (coherentFlags.nontemporal && builder.getSpvVersion() >= spv::Spv_1_6) {
  555. mask = mask | spv::ImageOperandsMask::Nontemporal;
  556. }
  557. if (mask != spv::ImageOperandsMask::MaskNone) {
  558. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  559. }
  560. return mask;
  561. }
  562. spv::Builder::AccessChain::CoherentFlags TGlslangToSpvTraverser::TranslateCoherent(const glslang::TType& type)
  563. {
  564. spv::Builder::AccessChain::CoherentFlags flags = {};
  565. flags.coherent = type.getQualifier().coherent;
  566. flags.devicecoherent = type.getQualifier().devicecoherent;
  567. flags.queuefamilycoherent = type.getQualifier().queuefamilycoherent;
  568. // shared variables are implicitly workgroupcoherent in GLSL.
  569. flags.workgroupcoherent = type.getQualifier().workgroupcoherent ||
  570. type.getQualifier().storage == glslang::EvqShared;
  571. flags.subgroupcoherent = type.getQualifier().subgroupcoherent;
  572. flags.shadercallcoherent = type.getQualifier().shadercallcoherent;
  573. flags.volatil = type.getQualifier().volatil;
  574. flags.nontemporal = type.getQualifier().nontemporal;
  575. // *coherent variables are implicitly nonprivate in GLSL
  576. flags.nonprivate = type.getQualifier().nonprivate ||
  577. flags.anyCoherent() ||
  578. flags.volatil;
  579. flags.isImage = type.getBasicType() == glslang::EbtSampler;
  580. flags.nonUniform = type.getQualifier().nonUniform;
  581. return flags;
  582. }
  583. spv::Scope TGlslangToSpvTraverser::TranslateMemoryScope(
  584. const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  585. {
  586. spv::Scope scope = spv::Scope::Max;
  587. if (coherentFlags.volatil || coherentFlags.coherent) {
  588. // coherent defaults to Device scope in the old model, QueueFamilyKHR scope in the new model
  589. scope = glslangIntermediate->usingVulkanMemoryModel() ? spv::Scope::QueueFamilyKHR : spv::Scope::Device;
  590. } else if (coherentFlags.devicecoherent) {
  591. scope = spv::Scope::Device;
  592. } else if (coherentFlags.queuefamilycoherent) {
  593. scope = spv::Scope::QueueFamilyKHR;
  594. } else if (coherentFlags.workgroupcoherent) {
  595. scope = spv::Scope::Workgroup;
  596. } else if (coherentFlags.subgroupcoherent) {
  597. scope = spv::Scope::Subgroup;
  598. } else if (coherentFlags.shadercallcoherent) {
  599. scope = spv::Scope::ShaderCallKHR;
  600. }
  601. if (glslangIntermediate->usingVulkanMemoryModel() && scope == spv::Scope::Device) {
  602. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  603. }
  604. return scope;
  605. }
  606. // Translate a glslang built-in variable to a SPIR-V built in decoration. Also generate
  607. // associated capabilities when required. For some built-in variables, a capability
  608. // is generated only when using the variable in an executable instruction, but not when
  609. // just declaring a struct member variable with it. This is true for PointSize,
  610. // ClipDistance, and CullDistance.
  611. spv::BuiltIn TGlslangToSpvTraverser::TranslateBuiltInDecoration(glslang::TBuiltInVariable builtIn,
  612. bool memberDeclaration)
  613. {
  614. switch (builtIn) {
  615. case glslang::EbvPointSize:
  616. // Defer adding the capability until the built-in is actually used.
  617. if (! memberDeclaration) {
  618. switch (glslangIntermediate->getStage()) {
  619. case EShLangGeometry:
  620. builder.addCapability(spv::Capability::GeometryPointSize);
  621. break;
  622. case EShLangTessControl:
  623. case EShLangTessEvaluation:
  624. builder.addCapability(spv::Capability::TessellationPointSize);
  625. break;
  626. default:
  627. break;
  628. }
  629. }
  630. return spv::BuiltIn::PointSize;
  631. case glslang::EbvPosition: return spv::BuiltIn::Position;
  632. case glslang::EbvVertexId: return spv::BuiltIn::VertexId;
  633. case glslang::EbvInstanceId: return spv::BuiltIn::InstanceId;
  634. case glslang::EbvVertexIndex: return spv::BuiltIn::VertexIndex;
  635. case glslang::EbvInstanceIndex: return spv::BuiltIn::InstanceIndex;
  636. case glslang::EbvFragCoord: return spv::BuiltIn::FragCoord;
  637. case glslang::EbvPointCoord: return spv::BuiltIn::PointCoord;
  638. case glslang::EbvFace: return spv::BuiltIn::FrontFacing;
  639. case glslang::EbvFragDepth: return spv::BuiltIn::FragDepth;
  640. case glslang::EbvNumWorkGroups: return spv::BuiltIn::NumWorkgroups;
  641. case glslang::EbvWorkGroupSize: return spv::BuiltIn::WorkgroupSize;
  642. case glslang::EbvWorkGroupId: return spv::BuiltIn::WorkgroupId;
  643. case glslang::EbvLocalInvocationId: return spv::BuiltIn::LocalInvocationId;
  644. case glslang::EbvLocalInvocationIndex: return spv::BuiltIn::LocalInvocationIndex;
  645. case glslang::EbvGlobalInvocationId: return spv::BuiltIn::GlobalInvocationId;
  646. // These *Distance capabilities logically belong here, but if the member is declared and
  647. // then never used, consumers of SPIR-V prefer the capability not be declared.
  648. // They are now generated when used, rather than here when declared.
  649. // Potentially, the specification should be more clear what the minimum
  650. // use needed is to trigger the capability.
  651. //
  652. case glslang::EbvClipDistance:
  653. if (!memberDeclaration)
  654. builder.addCapability(spv::Capability::ClipDistance);
  655. return spv::BuiltIn::ClipDistance;
  656. case glslang::EbvCullDistance:
  657. if (!memberDeclaration)
  658. builder.addCapability(spv::Capability::CullDistance);
  659. return spv::BuiltIn::CullDistance;
  660. case glslang::EbvViewportIndex:
  661. if (glslangIntermediate->getStage() == EShLangGeometry ||
  662. glslangIntermediate->getStage() == EShLangFragment) {
  663. builder.addCapability(spv::Capability::MultiViewport);
  664. }
  665. if (glslangIntermediate->getStage() == EShLangVertex ||
  666. glslangIntermediate->getStage() == EShLangTessControl ||
  667. glslangIntermediate->getStage() == EShLangTessEvaluation) {
  668. if (builder.getSpvVersion() < spv::Spv_1_5) {
  669. builder.addIncorporatedExtension(spv::E_SPV_EXT_shader_viewport_index_layer, spv::Spv_1_5);
  670. builder.addCapability(spv::Capability::ShaderViewportIndexLayerEXT);
  671. }
  672. else
  673. builder.addCapability(spv::Capability::ShaderViewportIndex);
  674. }
  675. return spv::BuiltIn::ViewportIndex;
  676. case glslang::EbvSampleId:
  677. builder.addCapability(spv::Capability::SampleRateShading);
  678. return spv::BuiltIn::SampleId;
  679. case glslang::EbvSamplePosition:
  680. builder.addCapability(spv::Capability::SampleRateShading);
  681. return spv::BuiltIn::SamplePosition;
  682. case glslang::EbvSampleMask:
  683. return spv::BuiltIn::SampleMask;
  684. case glslang::EbvLayer:
  685. if (glslangIntermediate->getStage() == EShLangMesh) {
  686. return spv::BuiltIn::Layer;
  687. }
  688. if (glslangIntermediate->getStage() == EShLangGeometry ||
  689. glslangIntermediate->getStage() == EShLangFragment) {
  690. builder.addCapability(spv::Capability::Geometry);
  691. }
  692. if (glslangIntermediate->getStage() == EShLangVertex ||
  693. glslangIntermediate->getStage() == EShLangTessControl ||
  694. glslangIntermediate->getStage() == EShLangTessEvaluation) {
  695. if (builder.getSpvVersion() < spv::Spv_1_5) {
  696. builder.addIncorporatedExtension(spv::E_SPV_EXT_shader_viewport_index_layer, spv::Spv_1_5);
  697. builder.addCapability(spv::Capability::ShaderViewportIndexLayerEXT);
  698. } else
  699. builder.addCapability(spv::Capability::ShaderLayer);
  700. }
  701. return spv::BuiltIn::Layer;
  702. case glslang::EbvBaseVertex:
  703. builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);
  704. builder.addCapability(spv::Capability::DrawParameters);
  705. return spv::BuiltIn::BaseVertex;
  706. case glslang::EbvBaseInstance:
  707. builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);
  708. builder.addCapability(spv::Capability::DrawParameters);
  709. return spv::BuiltIn::BaseInstance;
  710. case glslang::EbvDrawId:
  711. builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);
  712. builder.addCapability(spv::Capability::DrawParameters);
  713. return spv::BuiltIn::DrawIndex;
  714. case glslang::EbvPrimitiveId:
  715. if (glslangIntermediate->getStage() == EShLangFragment)
  716. builder.addCapability(spv::Capability::Geometry);
  717. return spv::BuiltIn::PrimitiveId;
  718. case glslang::EbvFragStencilRef:
  719. builder.addExtension(spv::E_SPV_EXT_shader_stencil_export);
  720. builder.addCapability(spv::Capability::StencilExportEXT);
  721. return spv::BuiltIn::FragStencilRefEXT;
  722. case glslang::EbvShadingRateKHR:
  723. builder.addExtension(spv::E_SPV_KHR_fragment_shading_rate);
  724. builder.addCapability(spv::Capability::FragmentShadingRateKHR);
  725. return spv::BuiltIn::ShadingRateKHR;
  726. case glslang::EbvPrimitiveShadingRateKHR:
  727. builder.addExtension(spv::E_SPV_KHR_fragment_shading_rate);
  728. builder.addCapability(spv::Capability::FragmentShadingRateKHR);
  729. return spv::BuiltIn::PrimitiveShadingRateKHR;
  730. case glslang::EbvInvocationId: return spv::BuiltIn::InvocationId;
  731. case glslang::EbvTessLevelInner: return spv::BuiltIn::TessLevelInner;
  732. case glslang::EbvTessLevelOuter: return spv::BuiltIn::TessLevelOuter;
  733. case glslang::EbvTessCoord: return spv::BuiltIn::TessCoord;
  734. case glslang::EbvPatchVertices: return spv::BuiltIn::PatchVertices;
  735. case glslang::EbvHelperInvocation: return spv::BuiltIn::HelperInvocation;
  736. case glslang::EbvSubGroupSize:
  737. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  738. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  739. return spv::BuiltIn::SubgroupSize;
  740. case glslang::EbvSubGroupInvocation:
  741. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  742. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  743. return spv::BuiltIn::SubgroupLocalInvocationId;
  744. case glslang::EbvSubGroupEqMask:
  745. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  746. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  747. return spv::BuiltIn::SubgroupEqMask;
  748. case glslang::EbvSubGroupGeMask:
  749. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  750. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  751. return spv::BuiltIn::SubgroupGeMask;
  752. case glslang::EbvSubGroupGtMask:
  753. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  754. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  755. return spv::BuiltIn::SubgroupGtMask;
  756. case glslang::EbvSubGroupLeMask:
  757. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  758. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  759. return spv::BuiltIn::SubgroupLeMask;
  760. case glslang::EbvSubGroupLtMask:
  761. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  762. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  763. return spv::BuiltIn::SubgroupLtMask;
  764. case glslang::EbvNumSubgroups:
  765. builder.addCapability(spv::Capability::GroupNonUniform);
  766. return spv::BuiltIn::NumSubgroups;
  767. case glslang::EbvSubgroupID:
  768. builder.addCapability(spv::Capability::GroupNonUniform);
  769. return spv::BuiltIn::SubgroupId;
  770. case glslang::EbvSubgroupSize2:
  771. builder.addCapability(spv::Capability::GroupNonUniform);
  772. return spv::BuiltIn::SubgroupSize;
  773. case glslang::EbvSubgroupInvocation2:
  774. builder.addCapability(spv::Capability::GroupNonUniform);
  775. return spv::BuiltIn::SubgroupLocalInvocationId;
  776. case glslang::EbvSubgroupEqMask2:
  777. builder.addCapability(spv::Capability::GroupNonUniform);
  778. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  779. return spv::BuiltIn::SubgroupEqMask;
  780. case glslang::EbvSubgroupGeMask2:
  781. builder.addCapability(spv::Capability::GroupNonUniform);
  782. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  783. return spv::BuiltIn::SubgroupGeMask;
  784. case glslang::EbvSubgroupGtMask2:
  785. builder.addCapability(spv::Capability::GroupNonUniform);
  786. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  787. return spv::BuiltIn::SubgroupGtMask;
  788. case glslang::EbvSubgroupLeMask2:
  789. builder.addCapability(spv::Capability::GroupNonUniform);
  790. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  791. return spv::BuiltIn::SubgroupLeMask;
  792. case glslang::EbvSubgroupLtMask2:
  793. builder.addCapability(spv::Capability::GroupNonUniform);
  794. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  795. return spv::BuiltIn::SubgroupLtMask;
  796. case glslang::EbvBaryCoordNoPersp:
  797. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  798. return spv::BuiltIn::BaryCoordNoPerspAMD;
  799. case glslang::EbvBaryCoordNoPerspCentroid:
  800. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  801. return spv::BuiltIn::BaryCoordNoPerspCentroidAMD;
  802. case glslang::EbvBaryCoordNoPerspSample:
  803. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  804. return spv::BuiltIn::BaryCoordNoPerspSampleAMD;
  805. case glslang::EbvBaryCoordSmooth:
  806. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  807. return spv::BuiltIn::BaryCoordSmoothAMD;
  808. case glslang::EbvBaryCoordSmoothCentroid:
  809. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  810. return spv::BuiltIn::BaryCoordSmoothCentroidAMD;
  811. case glslang::EbvBaryCoordSmoothSample:
  812. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  813. return spv::BuiltIn::BaryCoordSmoothSampleAMD;
  814. case glslang::EbvBaryCoordPullModel:
  815. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  816. return spv::BuiltIn::BaryCoordPullModelAMD;
  817. case glslang::EbvDeviceIndex:
  818. builder.addIncorporatedExtension(spv::E_SPV_KHR_device_group, spv::Spv_1_3);
  819. builder.addCapability(spv::Capability::DeviceGroup);
  820. return spv::BuiltIn::DeviceIndex;
  821. case glslang::EbvViewIndex:
  822. builder.addIncorporatedExtension(spv::E_SPV_KHR_multiview, spv::Spv_1_3);
  823. builder.addCapability(spv::Capability::MultiView);
  824. return spv::BuiltIn::ViewIndex;
  825. case glslang::EbvFragSizeEXT:
  826. builder.addExtension(spv::E_SPV_EXT_fragment_invocation_density);
  827. builder.addCapability(spv::Capability::FragmentDensityEXT);
  828. return spv::BuiltIn::FragSizeEXT;
  829. case glslang::EbvFragInvocationCountEXT:
  830. builder.addExtension(spv::E_SPV_EXT_fragment_invocation_density);
  831. builder.addCapability(spv::Capability::FragmentDensityEXT);
  832. return spv::BuiltIn::FragInvocationCountEXT;
  833. case glslang::EbvViewportMaskNV:
  834. if (!memberDeclaration) {
  835. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  836. builder.addCapability(spv::Capability::ShaderViewportMaskNV);
  837. }
  838. return spv::BuiltIn::ViewportMaskNV;
  839. case glslang::EbvSecondaryPositionNV:
  840. if (!memberDeclaration) {
  841. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  842. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  843. }
  844. return spv::BuiltIn::SecondaryPositionNV;
  845. case glslang::EbvSecondaryViewportMaskNV:
  846. if (!memberDeclaration) {
  847. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  848. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  849. }
  850. return spv::BuiltIn::SecondaryViewportMaskNV;
  851. case glslang::EbvPositionPerViewNV:
  852. if (!memberDeclaration) {
  853. builder.addExtension(spv::E_SPV_NVX_multiview_per_view_attributes);
  854. builder.addCapability(spv::Capability::PerViewAttributesNV);
  855. }
  856. return spv::BuiltIn::PositionPerViewNV;
  857. case glslang::EbvViewportMaskPerViewNV:
  858. if (!memberDeclaration) {
  859. builder.addExtension(spv::E_SPV_NVX_multiview_per_view_attributes);
  860. builder.addCapability(spv::Capability::PerViewAttributesNV);
  861. }
  862. return spv::BuiltIn::ViewportMaskPerViewNV;
  863. case glslang::EbvFragFullyCoveredNV:
  864. builder.addExtension(spv::E_SPV_EXT_fragment_fully_covered);
  865. builder.addCapability(spv::Capability::FragmentFullyCoveredEXT);
  866. return spv::BuiltIn::FullyCoveredEXT;
  867. case glslang::EbvFragmentSizeNV:
  868. builder.addExtension(spv::E_SPV_NV_shading_rate);
  869. builder.addCapability(spv::Capability::ShadingRateNV);
  870. return spv::BuiltIn::FragmentSizeNV;
  871. case glslang::EbvInvocationsPerPixelNV:
  872. builder.addExtension(spv::E_SPV_NV_shading_rate);
  873. builder.addCapability(spv::Capability::ShadingRateNV);
  874. return spv::BuiltIn::InvocationsPerPixelNV;
  875. // ray tracing
  876. case glslang::EbvLaunchId:
  877. return spv::BuiltIn::LaunchIdKHR;
  878. case glslang::EbvLaunchSize:
  879. return spv::BuiltIn::LaunchSizeKHR;
  880. case glslang::EbvWorldRayOrigin:
  881. return spv::BuiltIn::WorldRayOriginKHR;
  882. case glslang::EbvWorldRayDirection:
  883. return spv::BuiltIn::WorldRayDirectionKHR;
  884. case glslang::EbvObjectRayOrigin:
  885. return spv::BuiltIn::ObjectRayOriginKHR;
  886. case glslang::EbvObjectRayDirection:
  887. return spv::BuiltIn::ObjectRayDirectionKHR;
  888. case glslang::EbvRayTmin:
  889. return spv::BuiltIn::RayTminKHR;
  890. case glslang::EbvRayTmax:
  891. return spv::BuiltIn::RayTmaxKHR;
  892. case glslang::EbvCullMask:
  893. return spv::BuiltIn::CullMaskKHR;
  894. case glslang::EbvPositionFetch:
  895. return spv::BuiltIn::HitTriangleVertexPositionsKHR;
  896. case glslang::EbvInstanceCustomIndex:
  897. return spv::BuiltIn::InstanceCustomIndexKHR;
  898. case glslang::EbvHitKind:
  899. return spv::BuiltIn::HitKindKHR;
  900. case glslang::EbvObjectToWorld:
  901. case glslang::EbvObjectToWorld3x4:
  902. return spv::BuiltIn::ObjectToWorldKHR;
  903. case glslang::EbvWorldToObject:
  904. case glslang::EbvWorldToObject3x4:
  905. return spv::BuiltIn::WorldToObjectKHR;
  906. case glslang::EbvIncomingRayFlags:
  907. return spv::BuiltIn::IncomingRayFlagsKHR;
  908. case glslang::EbvGeometryIndex:
  909. return spv::BuiltIn::RayGeometryIndexKHR;
  910. case glslang::EbvCurrentRayTimeNV:
  911. builder.addExtension(spv::E_SPV_NV_ray_tracing_motion_blur);
  912. builder.addCapability(spv::Capability::RayTracingMotionBlurNV);
  913. return spv::BuiltIn::CurrentRayTimeNV;
  914. case glslang::EbvMicroTrianglePositionNV:
  915. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  916. builder.addExtension("SPV_NV_displacement_micromap");
  917. return spv::BuiltIn::HitMicroTriangleVertexPositionsNV;
  918. case glslang::EbvMicroTriangleBaryNV:
  919. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  920. builder.addExtension("SPV_NV_displacement_micromap");
  921. return spv::BuiltIn::HitMicroTriangleVertexBarycentricsNV;
  922. case glslang::EbvHitKindFrontFacingMicroTriangleNV:
  923. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  924. builder.addExtension("SPV_NV_displacement_micromap");
  925. return spv::BuiltIn::HitKindFrontFacingMicroTriangleNV;
  926. case glslang::EbvHitKindBackFacingMicroTriangleNV:
  927. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  928. builder.addExtension("SPV_NV_displacement_micromap");
  929. return spv::BuiltIn::HitKindBackFacingMicroTriangleNV;
  930. case glslang::EbvClusterIDNV:
  931. builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
  932. builder.addExtension("SPV_NV_cluster_acceleration_structure");
  933. return spv::BuiltIn::ClusterIDNV;
  934. case glslang::EbvHitIsSphereNV:
  935. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  936. builder.addExtension("SPV_NV_linear_swept_spheres");
  937. return spv::BuiltIn::HitIsSphereNV;
  938. case glslang::EbvHitIsLSSNV:
  939. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  940. builder.addExtension("SPV_NV_linear_swept_spheres");
  941. return spv::BuiltIn::HitIsLSSNV;
  942. case glslang::EbvHitSpherePositionNV:
  943. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  944. builder.addExtension("SPV_NV_linear_swept_spheres");
  945. return spv::BuiltIn::HitSpherePositionNV;
  946. case glslang::EbvHitSphereRadiusNV:
  947. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  948. builder.addExtension("SPV_NV_linear_swept_spheres");
  949. return spv::BuiltIn::HitSphereRadiusNV;
  950. case glslang::EbvHitLSSPositionsNV:
  951. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  952. builder.addExtension("SPV_NV_linear_swept_spheres");
  953. return spv::BuiltIn::HitLSSPositionsNV;
  954. case glslang::EbvHitLSSRadiiNV:
  955. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  956. builder.addExtension("SPV_NV_linear_swept_spheres");
  957. return spv::BuiltIn::HitLSSRadiiNV;
  958. // barycentrics
  959. case glslang::EbvBaryCoordNV:
  960. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  961. builder.addCapability(spv::Capability::FragmentBarycentricNV);
  962. return spv::BuiltIn::BaryCoordNV;
  963. case glslang::EbvBaryCoordNoPerspNV:
  964. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  965. builder.addCapability(spv::Capability::FragmentBarycentricNV);
  966. return spv::BuiltIn::BaryCoordNoPerspNV;
  967. case glslang::EbvBaryCoordEXT:
  968. builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
  969. builder.addCapability(spv::Capability::FragmentBarycentricKHR);
  970. return spv::BuiltIn::BaryCoordKHR;
  971. case glslang::EbvBaryCoordNoPerspEXT:
  972. builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
  973. builder.addCapability(spv::Capability::FragmentBarycentricKHR);
  974. return spv::BuiltIn::BaryCoordNoPerspKHR;
  975. // mesh shaders
  976. case glslang::EbvTaskCountNV:
  977. return spv::BuiltIn::TaskCountNV;
  978. case glslang::EbvPrimitiveCountNV:
  979. return spv::BuiltIn::PrimitiveCountNV;
  980. case glslang::EbvPrimitiveIndicesNV:
  981. return spv::BuiltIn::PrimitiveIndicesNV;
  982. case glslang::EbvClipDistancePerViewNV:
  983. return spv::BuiltIn::ClipDistancePerViewNV;
  984. case glslang::EbvCullDistancePerViewNV:
  985. return spv::BuiltIn::CullDistancePerViewNV;
  986. case glslang::EbvLayerPerViewNV:
  987. return spv::BuiltIn::LayerPerViewNV;
  988. case glslang::EbvMeshViewCountNV:
  989. return spv::BuiltIn::MeshViewCountNV;
  990. case glslang::EbvMeshViewIndicesNV:
  991. return spv::BuiltIn::MeshViewIndicesNV;
  992. // SPV_EXT_mesh_shader
  993. case glslang::EbvPrimitivePointIndicesEXT:
  994. return spv::BuiltIn::PrimitivePointIndicesEXT;
  995. case glslang::EbvPrimitiveLineIndicesEXT:
  996. return spv::BuiltIn::PrimitiveLineIndicesEXT;
  997. case glslang::EbvPrimitiveTriangleIndicesEXT:
  998. return spv::BuiltIn::PrimitiveTriangleIndicesEXT;
  999. case glslang::EbvCullPrimitiveEXT:
  1000. return spv::BuiltIn::CullPrimitiveEXT;
  1001. // sm builtins
  1002. case glslang::EbvWarpsPerSM:
  1003. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1004. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1005. return spv::BuiltIn::WarpsPerSMNV;
  1006. case glslang::EbvSMCount:
  1007. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1008. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1009. return spv::BuiltIn::SMCountNV;
  1010. case glslang::EbvWarpID:
  1011. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1012. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1013. return spv::BuiltIn::WarpIDNV;
  1014. case glslang::EbvSMID:
  1015. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1016. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1017. return spv::BuiltIn::SMIDNV;
  1018. // ARM builtins
  1019. case glslang::EbvCoreCountARM:
  1020. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1021. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1022. return spv::BuiltIn::CoreCountARM;
  1023. case glslang::EbvCoreIDARM:
  1024. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1025. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1026. return spv::BuiltIn::CoreIDARM;
  1027. case glslang::EbvCoreMaxIDARM:
  1028. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1029. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1030. return spv::BuiltIn::CoreMaxIDARM;
  1031. case glslang::EbvWarpIDARM:
  1032. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1033. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1034. return spv::BuiltIn::WarpIDARM;
  1035. case glslang::EbvWarpMaxIDARM:
  1036. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1037. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1038. return spv::BuiltIn::WarpMaxIDARM;
  1039. // QCOM builtins
  1040. case glslang::EbvTileOffsetQCOM:
  1041. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1042. return spv::BuiltIn::TileOffsetQCOM;
  1043. case glslang::EbvTileDimensionQCOM:
  1044. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1045. return spv::BuiltIn::TileDimensionQCOM;
  1046. case glslang::EbvTileApronSizeQCOM:
  1047. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1048. return spv::BuiltIn::TileApronSizeQCOM;
  1049. default:
  1050. return spv::BuiltIn::Max;
  1051. }
  1052. }
  1053. // Translate glslang image layout format to SPIR-V image format.
  1054. spv::ImageFormat TGlslangToSpvTraverser::TranslateImageFormat(const glslang::TType& type)
  1055. {
  1056. assert(type.getBasicType() == glslang::EbtSampler);
  1057. // Check for capabilities
  1058. switch (type.getQualifier().getFormat()) {
  1059. case glslang::ElfRg32f:
  1060. case glslang::ElfRg16f:
  1061. case glslang::ElfR11fG11fB10f:
  1062. case glslang::ElfR16f:
  1063. case glslang::ElfRgba16:
  1064. case glslang::ElfRgb10A2:
  1065. case glslang::ElfRg16:
  1066. case glslang::ElfRg8:
  1067. case glslang::ElfR16:
  1068. case glslang::ElfR8:
  1069. case glslang::ElfRgba16Snorm:
  1070. case glslang::ElfRg16Snorm:
  1071. case glslang::ElfRg8Snorm:
  1072. case glslang::ElfR16Snorm:
  1073. case glslang::ElfR8Snorm:
  1074. case glslang::ElfRg32i:
  1075. case glslang::ElfRg16i:
  1076. case glslang::ElfRg8i:
  1077. case glslang::ElfR16i:
  1078. case glslang::ElfR8i:
  1079. case glslang::ElfRgb10a2ui:
  1080. case glslang::ElfRg32ui:
  1081. case glslang::ElfRg16ui:
  1082. case glslang::ElfRg8ui:
  1083. case glslang::ElfR16ui:
  1084. case glslang::ElfR8ui:
  1085. builder.addCapability(spv::Capability::StorageImageExtendedFormats);
  1086. break;
  1087. case glslang::ElfR64ui:
  1088. case glslang::ElfR64i:
  1089. builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
  1090. builder.addCapability(spv::Capability::Int64ImageEXT);
  1091. break;
  1092. default:
  1093. break;
  1094. }
  1095. // do the translation
  1096. switch (type.getQualifier().getFormat()) {
  1097. case glslang::ElfNone: return spv::ImageFormat::Unknown;
  1098. case glslang::ElfRgba32f: return spv::ImageFormat::Rgba32f;
  1099. case glslang::ElfRgba16f: return spv::ImageFormat::Rgba16f;
  1100. case glslang::ElfR32f: return spv::ImageFormat::R32f;
  1101. case glslang::ElfRgba8: return spv::ImageFormat::Rgba8;
  1102. case glslang::ElfRgba8Snorm: return spv::ImageFormat::Rgba8Snorm;
  1103. case glslang::ElfRg32f: return spv::ImageFormat::Rg32f;
  1104. case glslang::ElfRg16f: return spv::ImageFormat::Rg16f;
  1105. case glslang::ElfR11fG11fB10f: return spv::ImageFormat::R11fG11fB10f;
  1106. case glslang::ElfR16f: return spv::ImageFormat::R16f;
  1107. case glslang::ElfRgba16: return spv::ImageFormat::Rgba16;
  1108. case glslang::ElfRgb10A2: return spv::ImageFormat::Rgb10A2;
  1109. case glslang::ElfRg16: return spv::ImageFormat::Rg16;
  1110. case glslang::ElfRg8: return spv::ImageFormat::Rg8;
  1111. case glslang::ElfR16: return spv::ImageFormat::R16;
  1112. case glslang::ElfR8: return spv::ImageFormat::R8;
  1113. case glslang::ElfRgba16Snorm: return spv::ImageFormat::Rgba16Snorm;
  1114. case glslang::ElfRg16Snorm: return spv::ImageFormat::Rg16Snorm;
  1115. case glslang::ElfRg8Snorm: return spv::ImageFormat::Rg8Snorm;
  1116. case glslang::ElfR16Snorm: return spv::ImageFormat::R16Snorm;
  1117. case glslang::ElfR8Snorm: return spv::ImageFormat::R8Snorm;
  1118. case glslang::ElfRgba32i: return spv::ImageFormat::Rgba32i;
  1119. case glslang::ElfRgba16i: return spv::ImageFormat::Rgba16i;
  1120. case glslang::ElfRgba8i: return spv::ImageFormat::Rgba8i;
  1121. case glslang::ElfR32i: return spv::ImageFormat::R32i;
  1122. case glslang::ElfRg32i: return spv::ImageFormat::Rg32i;
  1123. case glslang::ElfRg16i: return spv::ImageFormat::Rg16i;
  1124. case glslang::ElfRg8i: return spv::ImageFormat::Rg8i;
  1125. case glslang::ElfR16i: return spv::ImageFormat::R16i;
  1126. case glslang::ElfR8i: return spv::ImageFormat::R8i;
  1127. case glslang::ElfRgba32ui: return spv::ImageFormat::Rgba32ui;
  1128. case glslang::ElfRgba16ui: return spv::ImageFormat::Rgba16ui;
  1129. case glslang::ElfRgba8ui: return spv::ImageFormat::Rgba8ui;
  1130. case glslang::ElfR32ui: return spv::ImageFormat::R32ui;
  1131. case glslang::ElfRg32ui: return spv::ImageFormat::Rg32ui;
  1132. case glslang::ElfRg16ui: return spv::ImageFormat::Rg16ui;
  1133. case glslang::ElfRgb10a2ui: return spv::ImageFormat::Rgb10a2ui;
  1134. case glslang::ElfRg8ui: return spv::ImageFormat::Rg8ui;
  1135. case glslang::ElfR16ui: return spv::ImageFormat::R16ui;
  1136. case glslang::ElfR8ui: return spv::ImageFormat::R8ui;
  1137. case glslang::ElfR64ui: return spv::ImageFormat::R64ui;
  1138. case glslang::ElfR64i: return spv::ImageFormat::R64i;
  1139. default: return spv::ImageFormat::Max;
  1140. }
  1141. }
  1142. spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSelectionControl(
  1143. const glslang::TIntermSelection& selectionNode) const
  1144. {
  1145. if (selectionNode.getFlatten())
  1146. return spv::SelectionControlMask::Flatten;
  1147. if (selectionNode.getDontFlatten())
  1148. return spv::SelectionControlMask::DontFlatten;
  1149. return spv::SelectionControlMask::MaskNone;
  1150. }
  1151. spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSwitchControl(const glslang::TIntermSwitch& switchNode)
  1152. const
  1153. {
  1154. if (switchNode.getFlatten())
  1155. return spv::SelectionControlMask::Flatten;
  1156. if (switchNode.getDontFlatten())
  1157. return spv::SelectionControlMask::DontFlatten;
  1158. return spv::SelectionControlMask::MaskNone;
  1159. }
  1160. // return a non-0 dependency if the dependency argument must be set
  1161. spv::LoopControlMask TGlslangToSpvTraverser::TranslateLoopControl(const glslang::TIntermLoop& loopNode,
  1162. std::vector<unsigned int>& operands) const
  1163. {
  1164. spv::LoopControlMask control = spv::LoopControlMask::MaskNone;
  1165. if (loopNode.getDontUnroll())
  1166. control = control | spv::LoopControlMask::DontUnroll;
  1167. if (loopNode.getUnroll())
  1168. control = control | spv::LoopControlMask::Unroll;
  1169. if (unsigned(loopNode.getLoopDependency()) == glslang::TIntermLoop::dependencyInfinite)
  1170. control = control | spv::LoopControlMask::DependencyInfinite;
  1171. else if (loopNode.getLoopDependency() > 0) {
  1172. control = control | spv::LoopControlMask::DependencyLength;
  1173. operands.push_back((unsigned int)loopNode.getLoopDependency());
  1174. }
  1175. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  1176. if (loopNode.getMinIterations() > 0) {
  1177. control = control | spv::LoopControlMask::MinIterations;
  1178. operands.push_back(loopNode.getMinIterations());
  1179. }
  1180. if (loopNode.getMaxIterations() < glslang::TIntermLoop::iterationsInfinite) {
  1181. control = control | spv::LoopControlMask::MaxIterations;
  1182. operands.push_back(loopNode.getMaxIterations());
  1183. }
  1184. if (loopNode.getIterationMultiple() > 1) {
  1185. control = control | spv::LoopControlMask::IterationMultiple;
  1186. operands.push_back(loopNode.getIterationMultiple());
  1187. }
  1188. if (loopNode.getPeelCount() > 0) {
  1189. control = control | spv::LoopControlMask::PeelCount;
  1190. operands.push_back(loopNode.getPeelCount());
  1191. }
  1192. if (loopNode.getPartialCount() > 0) {
  1193. control = control | spv::LoopControlMask::PartialCount;
  1194. operands.push_back(loopNode.getPartialCount());
  1195. }
  1196. }
  1197. return control;
  1198. }
  1199. // Translate glslang type to SPIR-V storage class.
  1200. spv::StorageClass TGlslangToSpvTraverser::TranslateStorageClass(const glslang::TType& type)
  1201. {
  1202. if (type.getBasicType() == glslang::EbtRayQuery || type.getBasicType() == glslang::EbtHitObjectNV)
  1203. return spv::StorageClass::Private;
  1204. if (type.getQualifier().isSpirvByReference()) {
  1205. if (type.getQualifier().isParamInput() || type.getQualifier().isParamOutput())
  1206. return spv::StorageClass::Function;
  1207. }
  1208. if (type.getQualifier().isPipeInput())
  1209. return spv::StorageClass::Input;
  1210. if (type.getQualifier().isPipeOutput())
  1211. return spv::StorageClass::Output;
  1212. if (type.getQualifier().storage == glslang::EvqTileImageEXT || type.isAttachmentEXT()) {
  1213. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1214. builder.addCapability(spv::Capability::TileImageColorReadAccessEXT);
  1215. return spv::StorageClass::TileImageEXT;
  1216. }
  1217. if (type.getQualifier().isTileAttachmentQCOM()) {
  1218. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1219. builder.addCapability(spv::Capability::TileShadingQCOM);
  1220. return spv::StorageClass::TileAttachmentQCOM;
  1221. }
  1222. if (glslangIntermediate->getSource() != glslang::EShSourceHlsl ||
  1223. type.getQualifier().storage == glslang::EvqUniform) {
  1224. if (type.isAtomic())
  1225. return spv::StorageClass::AtomicCounter;
  1226. if (type.containsOpaque() && !glslangIntermediate->getBindlessMode())
  1227. return spv::StorageClass::UniformConstant;
  1228. }
  1229. if (type.getQualifier().isUniformOrBuffer() &&
  1230. type.getQualifier().isShaderRecord()) {
  1231. return spv::StorageClass::ShaderRecordBufferKHR;
  1232. }
  1233. if (glslangIntermediate->usingStorageBuffer() && type.getQualifier().storage == glslang::EvqBuffer) {
  1234. builder.addIncorporatedExtension(spv::E_SPV_KHR_storage_buffer_storage_class, spv::Spv_1_3);
  1235. return spv::StorageClass::StorageBuffer;
  1236. }
  1237. if (type.getQualifier().isUniformOrBuffer()) {
  1238. if (type.getQualifier().isPushConstant())
  1239. return spv::StorageClass::PushConstant;
  1240. if (type.getBasicType() == glslang::EbtBlock)
  1241. return spv::StorageClass::Uniform;
  1242. return spv::StorageClass::UniformConstant;
  1243. }
  1244. if (type.getQualifier().storage == glslang::EvqShared && type.getBasicType() == glslang::EbtBlock) {
  1245. builder.addExtension(spv::E_SPV_KHR_workgroup_memory_explicit_layout);
  1246. builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayoutKHR);
  1247. return spv::StorageClass::Workgroup;
  1248. }
  1249. switch (type.getQualifier().storage) {
  1250. case glslang::EvqGlobal: return spv::StorageClass::Private;
  1251. case glslang::EvqConstReadOnly: return spv::StorageClass::Function;
  1252. case glslang::EvqTemporary: return spv::StorageClass::Function;
  1253. case glslang::EvqShared: return spv::StorageClass::Workgroup;
  1254. case glslang::EvqPayload: return spv::StorageClass::RayPayloadKHR;
  1255. case glslang::EvqPayloadIn: return spv::StorageClass::IncomingRayPayloadKHR;
  1256. case glslang::EvqHitAttr: return spv::StorageClass::HitAttributeKHR;
  1257. case glslang::EvqCallableData: return spv::StorageClass::CallableDataKHR;
  1258. case glslang::EvqCallableDataIn: return spv::StorageClass::IncomingCallableDataKHR;
  1259. case glslang::EvqtaskPayloadSharedEXT : return spv::StorageClass::TaskPayloadWorkgroupEXT;
  1260. case glslang::EvqHitObjectAttrNV: return spv::StorageClass::HitObjectAttributeNV;
  1261. case glslang::EvqSpirvStorageClass: return static_cast<spv::StorageClass>(type.getQualifier().spirvStorageClass);
  1262. default:
  1263. assert(0);
  1264. break;
  1265. }
  1266. return spv::StorageClass::Function;
  1267. }
  1268. // Translate glslang constants to SPIR-V literals
  1269. void TGlslangToSpvTraverser::TranslateLiterals(const glslang::TVector<const glslang::TIntermConstantUnion*>& constants,
  1270. std::vector<unsigned>& literals) const
  1271. {
  1272. for (auto constant : constants) {
  1273. if (constant->getBasicType() == glslang::EbtFloat) {
  1274. float floatValue = static_cast<float>(constant->getConstArray()[0].getDConst());
  1275. unsigned literal;
  1276. static_assert(sizeof(literal) == sizeof(floatValue), "sizeof(unsigned) != sizeof(float)");
  1277. memcpy(&literal, &floatValue, sizeof(literal));
  1278. literals.push_back(literal);
  1279. } else if (constant->getBasicType() == glslang::EbtInt) {
  1280. unsigned literal = constant->getConstArray()[0].getIConst();
  1281. literals.push_back(literal);
  1282. } else if (constant->getBasicType() == glslang::EbtUint) {
  1283. unsigned literal = constant->getConstArray()[0].getUConst();
  1284. literals.push_back(literal);
  1285. } else if (constant->getBasicType() == glslang::EbtBool) {
  1286. unsigned literal = constant->getConstArray()[0].getBConst();
  1287. literals.push_back(literal);
  1288. } else if (constant->getBasicType() == glslang::EbtString) {
  1289. auto str = constant->getConstArray()[0].getSConst()->c_str();
  1290. unsigned literal = 0;
  1291. char* literalPtr = reinterpret_cast<char*>(&literal);
  1292. unsigned charCount = 0;
  1293. char ch = 0;
  1294. do {
  1295. ch = *(str++);
  1296. *(literalPtr++) = ch;
  1297. ++charCount;
  1298. if (charCount == 4) {
  1299. literals.push_back(literal);
  1300. literalPtr = reinterpret_cast<char*>(&literal);
  1301. charCount = 0;
  1302. }
  1303. } while (ch != 0);
  1304. // Partial literal is padded with 0
  1305. if (charCount > 0) {
  1306. for (; charCount < 4; ++charCount)
  1307. *(literalPtr++) = 0;
  1308. literals.push_back(literal);
  1309. }
  1310. } else
  1311. assert(0); // Unexpected type
  1312. }
  1313. }
  1314. // Add capabilities pertaining to how an array is indexed.
  1315. void TGlslangToSpvTraverser::addIndirectionIndexCapabilities(const glslang::TType& baseType,
  1316. const glslang::TType& indexType)
  1317. {
  1318. if (indexType.getQualifier().isNonUniform()) {
  1319. // deal with an asserted non-uniform index
  1320. // SPV_EXT_descriptor_indexing already added in TranslateNonUniformDecoration
  1321. if (baseType.getBasicType() == glslang::EbtSampler) {
  1322. if (baseType.getQualifier().hasAttachment())
  1323. builder.addCapability(spv::Capability::InputAttachmentArrayNonUniformIndexingEXT);
  1324. else if (baseType.isImage() && baseType.getSampler().isBuffer())
  1325. builder.addCapability(spv::Capability::StorageTexelBufferArrayNonUniformIndexingEXT);
  1326. else if (baseType.isTexture() && baseType.getSampler().isBuffer())
  1327. builder.addCapability(spv::Capability::UniformTexelBufferArrayNonUniformIndexingEXT);
  1328. else if (baseType.isImage())
  1329. builder.addCapability(spv::Capability::StorageImageArrayNonUniformIndexingEXT);
  1330. else if (baseType.isTexture())
  1331. builder.addCapability(spv::Capability::SampledImageArrayNonUniformIndexingEXT);
  1332. } else if (baseType.getBasicType() == glslang::EbtBlock) {
  1333. if (baseType.getQualifier().storage == glslang::EvqBuffer)
  1334. builder.addCapability(spv::Capability::StorageBufferArrayNonUniformIndexingEXT);
  1335. else if (baseType.getQualifier().storage == glslang::EvqUniform)
  1336. builder.addCapability(spv::Capability::UniformBufferArrayNonUniformIndexingEXT);
  1337. }
  1338. } else {
  1339. // assume a dynamically uniform index
  1340. if (baseType.getBasicType() == glslang::EbtSampler) {
  1341. if (baseType.getQualifier().hasAttachment()) {
  1342. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  1343. builder.addCapability(spv::Capability::InputAttachmentArrayDynamicIndexingEXT);
  1344. } else if (baseType.isImage() && baseType.getSampler().isBuffer()) {
  1345. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  1346. builder.addCapability(spv::Capability::StorageTexelBufferArrayDynamicIndexingEXT);
  1347. } else if (baseType.isTexture() && baseType.getSampler().isBuffer()) {
  1348. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  1349. builder.addCapability(spv::Capability::UniformTexelBufferArrayDynamicIndexingEXT);
  1350. }
  1351. }
  1352. }
  1353. }
  1354. // Return whether or not the given type is something that should be tied to a
  1355. // descriptor set.
  1356. bool IsDescriptorResource(const glslang::TType& type)
  1357. {
  1358. // uniform and buffer blocks are included, unless it is a push_constant
  1359. if (type.getBasicType() == glslang::EbtBlock)
  1360. return type.getQualifier().isUniformOrBuffer() &&
  1361. ! type.getQualifier().isShaderRecord() &&
  1362. ! type.getQualifier().isPushConstant();
  1363. // non block...
  1364. // basically samplerXXX/subpass/sampler/texture are all included
  1365. // if they are the global-scope-class, not the function parameter
  1366. // (or local, if they ever exist) class.
  1367. if (type.getBasicType() == glslang::EbtSampler ||
  1368. type.getBasicType() == glslang::EbtAccStruct)
  1369. return type.getQualifier().isUniformOrBuffer();
  1370. // Tensors are tied to a descriptor.
  1371. if (type.isTensorARM())
  1372. return true;
  1373. // None of the above.
  1374. return false;
  1375. }
  1376. void InheritQualifiers(glslang::TQualifier& child, const glslang::TQualifier& parent)
  1377. {
  1378. if (child.layoutMatrix == glslang::ElmNone)
  1379. child.layoutMatrix = parent.layoutMatrix;
  1380. if (parent.invariant)
  1381. child.invariant = true;
  1382. if (parent.flat)
  1383. child.flat = true;
  1384. if (parent.centroid)
  1385. child.centroid = true;
  1386. if (parent.nopersp)
  1387. child.nopersp = true;
  1388. if (parent.explicitInterp)
  1389. child.explicitInterp = true;
  1390. if (parent.perPrimitiveNV)
  1391. child.perPrimitiveNV = true;
  1392. if (parent.perViewNV)
  1393. child.perViewNV = true;
  1394. if (parent.perTaskNV)
  1395. child.perTaskNV = true;
  1396. if (parent.storage == glslang::EvqtaskPayloadSharedEXT)
  1397. child.storage = glslang::EvqtaskPayloadSharedEXT;
  1398. if (parent.patch)
  1399. child.patch = true;
  1400. if (parent.sample)
  1401. child.sample = true;
  1402. if (parent.coherent)
  1403. child.coherent = true;
  1404. if (parent.devicecoherent)
  1405. child.devicecoherent = true;
  1406. if (parent.queuefamilycoherent)
  1407. child.queuefamilycoherent = true;
  1408. if (parent.workgroupcoherent)
  1409. child.workgroupcoherent = true;
  1410. if (parent.subgroupcoherent)
  1411. child.subgroupcoherent = true;
  1412. if (parent.shadercallcoherent)
  1413. child.shadercallcoherent = true;
  1414. if (parent.nonprivate)
  1415. child.nonprivate = true;
  1416. if (parent.volatil)
  1417. child.volatil = true;
  1418. if (parent.nontemporal)
  1419. child.nontemporal = true;
  1420. if (parent.restrict)
  1421. child.restrict = true;
  1422. if (parent.readonly)
  1423. child.readonly = true;
  1424. if (parent.writeonly)
  1425. child.writeonly = true;
  1426. if (parent.nonUniform)
  1427. child.nonUniform = true;
  1428. }
  1429. bool HasNonLayoutQualifiers(const glslang::TType& type, const glslang::TQualifier& qualifier)
  1430. {
  1431. // This should list qualifiers that simultaneous satisfy:
  1432. // - struct members might inherit from a struct declaration
  1433. // (note that non-block structs don't explicitly inherit,
  1434. // only implicitly, meaning no decoration involved)
  1435. // - affect decorations on the struct members
  1436. // (note smooth does not, and expecting something like volatile
  1437. // to effect the whole object)
  1438. // - are not part of the offset/st430/etc or row/column-major layout
  1439. return qualifier.invariant || (qualifier.hasLocation() && type.getBasicType() == glslang::EbtBlock);
  1440. }
  1441. //
  1442. // Implement the TGlslangToSpvTraverser class.
  1443. //
  1444. TGlslangToSpvTraverser::TGlslangToSpvTraverser(unsigned int spvVersion,
  1445. const glslang::TIntermediate* glslangIntermediate,
  1446. spv::SpvBuildLogger* buildLogger, glslang::SpvOptions& options) :
  1447. TIntermTraverser(true, false, true),
  1448. options(options),
  1449. shaderEntry(nullptr), currentFunction(nullptr),
  1450. sequenceDepth(0), logger(buildLogger),
  1451. builder(spvVersion, (glslang::GetKhronosToolId() << 16) | glslang::GetSpirvGeneratorVersion(), logger),
  1452. inEntryPoint(false), entryPointTerminated(false), linkageOnly(false),
  1453. glslangIntermediate(glslangIntermediate),
  1454. nanMinMaxClamp(glslangIntermediate->getNanMinMaxClamp()),
  1455. nonSemanticDebugPrintf(0),
  1456. taskPayloadID(0)
  1457. {
  1458. bool isMeshShaderExt = (glslangIntermediate->getRequestedExtensions().find(glslang::E_GL_EXT_mesh_shader) !=
  1459. glslangIntermediate->getRequestedExtensions().end());
  1460. spv::ExecutionModel executionModel = TranslateExecutionModel(glslangIntermediate->getStage(), isMeshShaderExt);
  1461. builder.clearAccessChain();
  1462. builder.setSource(TranslateSourceLanguage(glslangIntermediate->getSource(), glslangIntermediate->getProfile()),
  1463. glslangIntermediate->getVersion());
  1464. if (options.emitNonSemanticShaderDebugSource)
  1465. this->options.emitNonSemanticShaderDebugInfo = true;
  1466. if (options.emitNonSemanticShaderDebugInfo)
  1467. this->options.generateDebugInfo = true;
  1468. if (this->options.generateDebugInfo) {
  1469. if (this->options.emitNonSemanticShaderDebugInfo) {
  1470. builder.setEmitNonSemanticShaderDebugInfo(this->options.emitNonSemanticShaderDebugSource);
  1471. }
  1472. else {
  1473. builder.setEmitSpirvDebugInfo();
  1474. }
  1475. builder.setDebugMainSourceFile(glslangIntermediate->getSourceFile());
  1476. // Set the source shader's text. If for SPV version 1.0, include
  1477. // a preamble in comments stating the OpModuleProcessed instructions.
  1478. // Otherwise, emit those as actual instructions.
  1479. std::string text;
  1480. const std::vector<std::string>& processes = glslangIntermediate->getProcesses();
  1481. for (int p = 0; p < (int)processes.size(); ++p) {
  1482. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1) {
  1483. text.append("// OpModuleProcessed ");
  1484. text.append(processes[p]);
  1485. text.append("\n");
  1486. } else
  1487. builder.addModuleProcessed(processes[p]);
  1488. }
  1489. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1 && (int)processes.size() > 0)
  1490. text.append("#line 1\n");
  1491. text.append(glslangIntermediate->getSourceText());
  1492. builder.setSourceText(text);
  1493. // Pass name and text for all included files
  1494. const std::map<std::string, std::string>& include_txt = glslangIntermediate->getIncludeText();
  1495. for (auto iItr = include_txt.begin(); iItr != include_txt.end(); ++iItr)
  1496. builder.addInclude(iItr->first, iItr->second);
  1497. }
  1498. builder.setUseReplicatedComposites(glslangIntermediate->usingReplicatedComposites());
  1499. stdBuiltins = builder.import("GLSL.std.450");
  1500. spv::AddressingModel addressingModel = spv::AddressingModel::Logical;
  1501. spv::MemoryModel memoryModel = spv::MemoryModel::GLSL450;
  1502. if (glslangIntermediate->usingPhysicalStorageBuffer()) {
  1503. addressingModel = spv::AddressingModel::PhysicalStorageBuffer64EXT;
  1504. builder.addIncorporatedExtension(spv::E_SPV_KHR_physical_storage_buffer, spv::Spv_1_5);
  1505. builder.addCapability(spv::Capability::PhysicalStorageBufferAddressesEXT);
  1506. }
  1507. if (glslangIntermediate->usingVulkanMemoryModel()) {
  1508. memoryModel = spv::MemoryModel::VulkanKHR;
  1509. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  1510. builder.addIncorporatedExtension(spv::E_SPV_KHR_vulkan_memory_model, spv::Spv_1_5);
  1511. }
  1512. builder.setMemoryModel(addressingModel, memoryModel);
  1513. if (glslangIntermediate->usingVariablePointers()) {
  1514. builder.addCapability(spv::Capability::VariablePointers);
  1515. }
  1516. // If not linking, there is no entry point
  1517. if (!options.compileOnly) {
  1518. shaderEntry = builder.makeEntryPoint(glslangIntermediate->getEntryPointName().c_str());
  1519. entryPoint =
  1520. builder.addEntryPoint(executionModel, shaderEntry, glslangIntermediate->getEntryPointName().c_str());
  1521. }
  1522. // Add the source extensions
  1523. const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();
  1524. for (auto it = sourceExtensions.begin(); it != sourceExtensions.end(); ++it)
  1525. builder.addSourceExtension(it->c_str());
  1526. // Add the top-level modes for this shader.
  1527. if (glslangIntermediate->getXfbMode()) {
  1528. builder.addCapability(spv::Capability::TransformFeedback);
  1529. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Xfb);
  1530. }
  1531. if (glslangIntermediate->getLayoutPrimitiveCulling()) {
  1532. builder.addCapability(spv::Capability::RayTraversalPrimitiveCullingKHR);
  1533. }
  1534. if (glslangIntermediate->getSubgroupUniformControlFlow()) {
  1535. builder.addExtension(spv::E_SPV_KHR_subgroup_uniform_control_flow);
  1536. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::SubgroupUniformControlFlowKHR);
  1537. }
  1538. if (glslangIntermediate->getMaximallyReconverges()) {
  1539. builder.addExtension(spv::E_SPV_KHR_maximal_reconvergence);
  1540. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::MaximallyReconvergesKHR);
  1541. }
  1542. if (glslangIntermediate->getQuadDerivMode())
  1543. {
  1544. builder.addCapability(spv::Capability::QuadControlKHR);
  1545. builder.addExtension(spv::E_SPV_KHR_quad_control);
  1546. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::QuadDerivativesKHR);
  1547. }
  1548. if (glslangIntermediate->getReqFullQuadsMode())
  1549. {
  1550. builder.addCapability(spv::Capability::QuadControlKHR);
  1551. builder.addExtension(spv::E_SPV_KHR_quad_control);
  1552. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::RequireFullQuadsKHR);
  1553. }
  1554. spv::ExecutionMode mode;
  1555. switch (glslangIntermediate->getStage()) {
  1556. case EShLangVertex:
  1557. builder.addCapability(spv::Capability::Shader);
  1558. break;
  1559. case EShLangFragment:
  1560. builder.addCapability(spv::Capability::Shader);
  1561. if (glslangIntermediate->getPixelCenterInteger())
  1562. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PixelCenterInteger);
  1563. if (glslangIntermediate->getOriginUpperLeft())
  1564. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OriginUpperLeft);
  1565. else
  1566. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OriginLowerLeft);
  1567. if (glslangIntermediate->getEarlyFragmentTests())
  1568. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::EarlyFragmentTests);
  1569. if (glslangIntermediate->getEarlyAndLateFragmentTestsAMD())
  1570. {
  1571. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::EarlyAndLateFragmentTestsAMD);
  1572. builder.addExtension(spv::E_SPV_AMD_shader_early_and_late_fragment_tests);
  1573. }
  1574. if (glslangIntermediate->getPostDepthCoverage()) {
  1575. builder.addCapability(spv::Capability::SampleMaskPostDepthCoverage);
  1576. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PostDepthCoverage);
  1577. builder.addExtension(spv::E_SPV_KHR_post_depth_coverage);
  1578. }
  1579. if (glslangIntermediate->getNonCoherentColorAttachmentReadEXT()) {
  1580. builder.addCapability(spv::Capability::TileImageColorReadAccessEXT);
  1581. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentColorAttachmentReadEXT);
  1582. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1583. }
  1584. if (glslangIntermediate->getNonCoherentDepthAttachmentReadEXT()) {
  1585. builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
  1586. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentDepthAttachmentReadEXT);
  1587. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1588. }
  1589. if (glslangIntermediate->getNonCoherentStencilAttachmentReadEXT()) {
  1590. builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
  1591. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentStencilAttachmentReadEXT);
  1592. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1593. }
  1594. if (glslangIntermediate->getNonCoherentTileAttachmentReadQCOM()) {
  1595. builder.addCapability(spv::Capability::TileShadingQCOM);
  1596. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentTileAttachmentReadQCOM);
  1597. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1598. }
  1599. if (glslangIntermediate->isDepthReplacing())
  1600. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DepthReplacing);
  1601. if (glslangIntermediate->isStencilReplacing())
  1602. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::StencilRefReplacingEXT);
  1603. switch(glslangIntermediate->getDepth()) {
  1604. case glslang::EldGreater: mode = spv::ExecutionMode::DepthGreater; break;
  1605. case glslang::EldLess: mode = spv::ExecutionMode::DepthLess; break;
  1606. case glslang::EldUnchanged: mode = spv::ExecutionMode::DepthUnchanged; break;
  1607. default: mode = spv::ExecutionMode::Max; break;
  1608. }
  1609. if (mode != spv::ExecutionMode::Max)
  1610. builder.addExecutionMode(shaderEntry, mode);
  1611. switch (glslangIntermediate->getStencil()) {
  1612. case glslang::ElsRefUnchangedFrontAMD: mode = spv::ExecutionMode::StencilRefUnchangedFrontAMD; break;
  1613. case glslang::ElsRefGreaterFrontAMD: mode = spv::ExecutionMode::StencilRefGreaterFrontAMD; break;
  1614. case glslang::ElsRefLessFrontAMD: mode = spv::ExecutionMode::StencilRefLessFrontAMD; break;
  1615. case glslang::ElsRefUnchangedBackAMD: mode = spv::ExecutionMode::StencilRefUnchangedBackAMD; break;
  1616. case glslang::ElsRefGreaterBackAMD: mode = spv::ExecutionMode::StencilRefGreaterBackAMD; break;
  1617. case glslang::ElsRefLessBackAMD: mode = spv::ExecutionMode::StencilRefLessBackAMD; break;
  1618. default: mode = spv::ExecutionMode::Max; break;
  1619. }
  1620. if (mode != spv::ExecutionMode::Max)
  1621. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1622. switch (glslangIntermediate->getInterlockOrdering()) {
  1623. case glslang::EioPixelInterlockOrdered: mode = spv::ExecutionMode::PixelInterlockOrderedEXT;
  1624. break;
  1625. case glslang::EioPixelInterlockUnordered: mode = spv::ExecutionMode::PixelInterlockUnorderedEXT;
  1626. break;
  1627. case glslang::EioSampleInterlockOrdered: mode = spv::ExecutionMode::SampleInterlockOrderedEXT;
  1628. break;
  1629. case glslang::EioSampleInterlockUnordered: mode = spv::ExecutionMode::SampleInterlockUnorderedEXT;
  1630. break;
  1631. case glslang::EioShadingRateInterlockOrdered: mode = spv::ExecutionMode::ShadingRateInterlockOrderedEXT;
  1632. break;
  1633. case glslang::EioShadingRateInterlockUnordered: mode = spv::ExecutionMode::ShadingRateInterlockUnorderedEXT;
  1634. break;
  1635. default: mode = spv::ExecutionMode::Max;
  1636. break;
  1637. }
  1638. if (mode != spv::ExecutionMode::Max) {
  1639. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1640. if (mode == spv::ExecutionMode::ShadingRateInterlockOrderedEXT ||
  1641. mode == spv::ExecutionMode::ShadingRateInterlockUnorderedEXT) {
  1642. builder.addCapability(spv::Capability::FragmentShaderShadingRateInterlockEXT);
  1643. } else if (mode == spv::ExecutionMode::PixelInterlockOrderedEXT ||
  1644. mode == spv::ExecutionMode::PixelInterlockUnorderedEXT) {
  1645. builder.addCapability(spv::Capability::FragmentShaderPixelInterlockEXT);
  1646. } else {
  1647. builder.addCapability(spv::Capability::FragmentShaderSampleInterlockEXT);
  1648. }
  1649. builder.addExtension(spv::E_SPV_EXT_fragment_shader_interlock);
  1650. }
  1651. break;
  1652. case EShLangCompute: {
  1653. builder.addCapability(spv::Capability::Shader);
  1654. bool needSizeId = false;
  1655. for (int dim = 0; dim < 3; ++dim) {
  1656. if ((glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet)) {
  1657. needSizeId = true;
  1658. break;
  1659. }
  1660. }
  1661. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6 && needSizeId) {
  1662. std::vector<spv::Id> dimConstId;
  1663. for (int dim = 0; dim < 3; ++dim) {
  1664. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  1665. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  1666. if (specConst) {
  1667. builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
  1668. glslangIntermediate->getLocalSizeSpecId(dim));
  1669. needSizeId = true;
  1670. }
  1671. }
  1672. builder.addExecutionModeId(shaderEntry, spv::ExecutionMode::LocalSizeId, dimConstId);
  1673. } else {
  1674. if (glslangIntermediate->getTileShadingRateQCOM(0) >= 1 || glslangIntermediate->getTileShadingRateQCOM(1) >= 1 || glslangIntermediate->getTileShadingRateQCOM(2) >= 1) {
  1675. auto rate_x = glslangIntermediate->getTileShadingRateQCOM(0);
  1676. auto rate_y = glslangIntermediate->getTileShadingRateQCOM(1);
  1677. auto rate_z = glslangIntermediate->getTileShadingRateQCOM(2);
  1678. rate_x = ( rate_x == 0 ? 1 : rate_x );
  1679. rate_y = ( rate_y == 0 ? 1 : rate_y );
  1680. rate_z = ( rate_z == 0 ? 1 : rate_z );
  1681. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::TileShadingRateQCOM, rate_x, rate_y, rate_z);
  1682. } else {
  1683. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::LocalSize, glslangIntermediate->getLocalSize(0),
  1684. glslangIntermediate->getLocalSize(1),
  1685. glslangIntermediate->getLocalSize(2));
  1686. }
  1687. }
  1688. if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupQuads) {
  1689. builder.addCapability(spv::Capability::ComputeDerivativeGroupQuadsNV);
  1690. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DerivativeGroupQuadsNV);
  1691. builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);
  1692. } else if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupLinear) {
  1693. builder.addCapability(spv::Capability::ComputeDerivativeGroupLinearNV);
  1694. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DerivativeGroupLinearNV);
  1695. builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);
  1696. }
  1697. if (glslangIntermediate->getNonCoherentTileAttachmentReadQCOM()) {
  1698. builder.addCapability(spv::Capability::TileShadingQCOM);
  1699. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentTileAttachmentReadQCOM);
  1700. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1701. }
  1702. break;
  1703. }
  1704. case EShLangTessEvaluation:
  1705. case EShLangTessControl:
  1706. builder.addCapability(spv::Capability::Tessellation);
  1707. glslang::TLayoutGeometry primitive;
  1708. if (glslangIntermediate->getStage() == EShLangTessControl) {
  1709. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices,
  1710. glslangIntermediate->getVertices());
  1711. primitive = glslangIntermediate->getOutputPrimitive();
  1712. } else {
  1713. primitive = glslangIntermediate->getInputPrimitive();
  1714. }
  1715. switch (primitive) {
  1716. case glslang::ElgTriangles: mode = spv::ExecutionMode::Triangles; break;
  1717. case glslang::ElgQuads: mode = spv::ExecutionMode::Quads; break;
  1718. case glslang::ElgIsolines: mode = spv::ExecutionMode::Isolines; break;
  1719. default: mode = spv::ExecutionMode::Max; break;
  1720. }
  1721. if (mode != spv::ExecutionMode::Max)
  1722. builder.addExecutionMode(shaderEntry, mode);
  1723. switch (glslangIntermediate->getVertexSpacing()) {
  1724. case glslang::EvsEqual: mode = spv::ExecutionMode::SpacingEqual; break;
  1725. case glslang::EvsFractionalEven: mode = spv::ExecutionMode::SpacingFractionalEven; break;
  1726. case glslang::EvsFractionalOdd: mode = spv::ExecutionMode::SpacingFractionalOdd; break;
  1727. default: mode = spv::ExecutionMode::Max; break;
  1728. }
  1729. if (mode != spv::ExecutionMode::Max)
  1730. builder.addExecutionMode(shaderEntry, mode);
  1731. switch (glslangIntermediate->getVertexOrder()) {
  1732. case glslang::EvoCw: mode = spv::ExecutionMode::VertexOrderCw; break;
  1733. case glslang::EvoCcw: mode = spv::ExecutionMode::VertexOrderCcw; break;
  1734. default: mode = spv::ExecutionMode::Max; break;
  1735. }
  1736. if (mode != spv::ExecutionMode::Max)
  1737. builder.addExecutionMode(shaderEntry, mode);
  1738. if (glslangIntermediate->getPointMode())
  1739. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PointMode);
  1740. break;
  1741. case EShLangGeometry:
  1742. builder.addCapability(spv::Capability::Geometry);
  1743. switch (glslangIntermediate->getInputPrimitive()) {
  1744. case glslang::ElgPoints: mode = spv::ExecutionMode::InputPoints; break;
  1745. case glslang::ElgLines: mode = spv::ExecutionMode::InputLines; break;
  1746. case glslang::ElgLinesAdjacency: mode = spv::ExecutionMode::InputLinesAdjacency; break;
  1747. case glslang::ElgTriangles: mode = spv::ExecutionMode::Triangles; break;
  1748. case glslang::ElgTrianglesAdjacency: mode = spv::ExecutionMode::InputTrianglesAdjacency; break;
  1749. default: mode = spv::ExecutionMode::Max; break;
  1750. }
  1751. if (mode != spv::ExecutionMode::Max)
  1752. builder.addExecutionMode(shaderEntry, mode);
  1753. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Invocations, glslangIntermediate->getInvocations());
  1754. switch (glslangIntermediate->getOutputPrimitive()) {
  1755. case glslang::ElgPoints: mode = spv::ExecutionMode::OutputPoints; break;
  1756. case glslang::ElgLineStrip: mode = spv::ExecutionMode::OutputLineStrip; break;
  1757. case glslang::ElgTriangleStrip: mode = spv::ExecutionMode::OutputTriangleStrip; break;
  1758. default: mode = spv::ExecutionMode::Max; break;
  1759. }
  1760. if (mode != spv::ExecutionMode::Max)
  1761. builder.addExecutionMode(shaderEntry, mode);
  1762. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices, glslangIntermediate->getVertices());
  1763. break;
  1764. case EShLangRayGen:
  1765. case EShLangIntersect:
  1766. case EShLangAnyHit:
  1767. case EShLangClosestHit:
  1768. case EShLangMiss:
  1769. case EShLangCallable:
  1770. {
  1771. auto& extensions = glslangIntermediate->getRequestedExtensions();
  1772. if (extensions.find("GL_EXT_opacity_micromap") != extensions.end()) {
  1773. builder.addCapability(spv::Capability::RayTracingOpacityMicromapEXT);
  1774. builder.addExtension("SPV_EXT_opacity_micromap");
  1775. }
  1776. if (extensions.find("GL_NV_ray_tracing") == extensions.end()) {
  1777. builder.addCapability(spv::Capability::RayTracingKHR);
  1778. builder.addExtension("SPV_KHR_ray_tracing");
  1779. }
  1780. else {
  1781. builder.addCapability(spv::Capability::RayTracingNV);
  1782. builder.addExtension("SPV_NV_ray_tracing");
  1783. }
  1784. if (glslangIntermediate->getStage() != EShLangRayGen && glslangIntermediate->getStage() != EShLangCallable) {
  1785. if (extensions.find("GL_EXT_ray_cull_mask") != extensions.end()) {
  1786. builder.addCapability(spv::Capability::RayCullMaskKHR);
  1787. builder.addExtension("SPV_KHR_ray_cull_mask");
  1788. }
  1789. if (extensions.find("GL_EXT_ray_tracing_position_fetch") != extensions.end()) {
  1790. builder.addCapability(spv::Capability::RayTracingPositionFetchKHR);
  1791. builder.addExtension("SPV_KHR_ray_tracing_position_fetch");
  1792. }
  1793. }
  1794. break;
  1795. }
  1796. case EShLangTask:
  1797. case EShLangMesh:
  1798. if(isMeshShaderExt) {
  1799. builder.addCapability(spv::Capability::MeshShadingEXT);
  1800. builder.addExtension(spv::E_SPV_EXT_mesh_shader);
  1801. } else {
  1802. builder.addCapability(spv::Capability::MeshShadingNV);
  1803. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  1804. }
  1805. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  1806. std::vector<spv::Id> dimConstId;
  1807. for (int dim = 0; dim < 3; ++dim) {
  1808. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  1809. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  1810. if (specConst) {
  1811. builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
  1812. glslangIntermediate->getLocalSizeSpecId(dim));
  1813. }
  1814. }
  1815. builder.addExecutionModeId(shaderEntry, spv::ExecutionMode::LocalSizeId, dimConstId);
  1816. } else {
  1817. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::LocalSize, glslangIntermediate->getLocalSize(0),
  1818. glslangIntermediate->getLocalSize(1),
  1819. glslangIntermediate->getLocalSize(2));
  1820. }
  1821. if (glslangIntermediate->getStage() == EShLangMesh) {
  1822. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices,
  1823. glslangIntermediate->getVertices());
  1824. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputPrimitivesNV,
  1825. glslangIntermediate->getPrimitives());
  1826. switch (glslangIntermediate->getOutputPrimitive()) {
  1827. case glslang::ElgPoints: mode = spv::ExecutionMode::OutputPoints; break;
  1828. case glslang::ElgLines: mode = spv::ExecutionMode::OutputLinesNV; break;
  1829. case glslang::ElgTriangles: mode = spv::ExecutionMode::OutputTrianglesNV; break;
  1830. default: mode = spv::ExecutionMode::Max; break;
  1831. }
  1832. if (mode != spv::ExecutionMode::Max)
  1833. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1834. }
  1835. break;
  1836. default:
  1837. break;
  1838. }
  1839. //
  1840. // Add SPIR-V requirements (GL_EXT_spirv_intrinsics)
  1841. //
  1842. if (glslangIntermediate->hasSpirvRequirement()) {
  1843. const glslang::TSpirvRequirement& spirvRequirement = glslangIntermediate->getSpirvRequirement();
  1844. // Add SPIR-V extension requirement
  1845. for (auto& extension : spirvRequirement.extensions)
  1846. builder.addExtension(extension.c_str());
  1847. // Add SPIR-V capability requirement
  1848. for (auto capability : spirvRequirement.capabilities)
  1849. builder.addCapability(static_cast<spv::Capability>(capability));
  1850. }
  1851. //
  1852. // Add SPIR-V execution mode qualifiers (GL_EXT_spirv_intrinsics)
  1853. //
  1854. if (glslangIntermediate->hasSpirvExecutionMode()) {
  1855. const glslang::TSpirvExecutionMode spirvExecutionMode = glslangIntermediate->getSpirvExecutionMode();
  1856. // Add spirv_execution_mode
  1857. for (auto& mode : spirvExecutionMode.modes) {
  1858. if (!mode.second.empty()) {
  1859. std::vector<unsigned> literals;
  1860. TranslateLiterals(mode.second, literals);
  1861. builder.addExecutionMode(shaderEntry, static_cast<spv::ExecutionMode>(mode.first), literals);
  1862. } else
  1863. builder.addExecutionMode(shaderEntry, static_cast<spv::ExecutionMode>(mode.first));
  1864. }
  1865. // Add spirv_execution_mode_id
  1866. for (auto& modeId : spirvExecutionMode.modeIds) {
  1867. std::vector<spv::Id> operandIds;
  1868. assert(!modeId.second.empty());
  1869. for (auto extraOperand : modeId.second) {
  1870. if (extraOperand->getType().getQualifier().isSpecConstant())
  1871. operandIds.push_back(getSymbolId(extraOperand->getAsSymbolNode()));
  1872. else
  1873. operandIds.push_back(createSpvConstant(*extraOperand));
  1874. }
  1875. builder.addExecutionModeId(shaderEntry, static_cast<spv::ExecutionMode>(modeId.first), operandIds);
  1876. }
  1877. }
  1878. }
  1879. // Finish creating SPV, after the traversal is complete.
  1880. void TGlslangToSpvTraverser::finishSpv(bool compileOnly)
  1881. {
  1882. // If not linking, an entry point is not expected
  1883. if (!compileOnly) {
  1884. // Finish the entry point function
  1885. if (!entryPointTerminated) {
  1886. builder.setBuildPoint(shaderEntry->getLastBlock());
  1887. builder.leaveFunction();
  1888. }
  1889. // finish off the entry-point SPV instruction by adding the Input/Output <id>
  1890. entryPoint->reserveOperands(iOSet.size());
  1891. for (auto id : iOSet)
  1892. entryPoint->addIdOperand(id);
  1893. }
  1894. // Add capabilities, extensions, remove unneeded decorations, etc.,
  1895. // based on the resulting SPIR-V.
  1896. // Note: WebGPU code generation must have the opportunity to aggressively
  1897. // prune unreachable merge blocks and continue targets.
  1898. builder.postProcess(compileOnly);
  1899. }
  1900. // Write the SPV into 'out'.
  1901. void TGlslangToSpvTraverser::dumpSpv(std::vector<unsigned int>& out)
  1902. {
  1903. builder.dump(out);
  1904. }
  1905. //
  1906. // Implement the traversal functions.
  1907. //
  1908. // Return true from interior nodes to have the external traversal
  1909. // continue on to children. Return false if children were
  1910. // already processed.
  1911. //
  1912. //
  1913. // Symbols can turn into
  1914. // - uniform/input reads
  1915. // - output writes
  1916. // - complex lvalue base setups: foo.bar[3].... , where we see foo and start up an access chain
  1917. // - something simple that degenerates into the last bullet
  1918. //
  1919. void TGlslangToSpvTraverser::visitSymbol(glslang::TIntermSymbol* symbol)
  1920. {
  1921. // We update the line information even though no code might be generated here
  1922. // This is helpful to yield correct lines for control flow instructions
  1923. if (!linkageOnly) {
  1924. builder.setDebugSourceLocation(symbol->getLoc().line, symbol->getLoc().getFilename());
  1925. }
  1926. if (symbol->getBasicType() == glslang::EbtFunction) {
  1927. return;
  1928. }
  1929. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  1930. if (symbol->getType().isStruct())
  1931. glslangTypeToIdMap[symbol->getType().getStruct()] = symbol->getId();
  1932. if (symbol->getType().getQualifier().isSpecConstant())
  1933. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  1934. #ifdef ENABLE_HLSL
  1935. // Skip symbol handling if it is string-typed
  1936. if (symbol->getBasicType() == glslang::EbtString)
  1937. return;
  1938. #endif
  1939. // getSymbolId() will set up all the IO decorations on the first call.
  1940. // Formal function parameters were mapped during makeFunctions().
  1941. spv::Id id = getSymbolId(symbol);
  1942. if (symbol->getType().getQualifier().isTaskPayload())
  1943. taskPayloadID = id; // cache the taskPayloadID to be used it as operand for OpEmitMeshTasksEXT
  1944. if (builder.isPointer(id)) {
  1945. if (!symbol->getType().getQualifier().isParamInput() &&
  1946. !symbol->getType().getQualifier().isParamOutput()) {
  1947. // Include all "static use" and "linkage only" interface variables on the OpEntryPoint instruction
  1948. // Consider adding to the OpEntryPoint interface list.
  1949. // Only looking at structures if they have at least one member.
  1950. if (!symbol->getType().isStruct() || symbol->getType().getStruct()->size() > 0) {
  1951. spv::StorageClass sc = builder.getStorageClass(id);
  1952. // Before SPIR-V 1.4, we only want to include Input and Output.
  1953. // Starting with SPIR-V 1.4, we want all globals.
  1954. if ((glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4 && builder.isGlobalVariable(id)) ||
  1955. (sc == spv::StorageClass::Input || sc == spv::StorageClass::Output)) {
  1956. iOSet.insert(id);
  1957. }
  1958. }
  1959. }
  1960. // If the SPIR-V type is required to be different than the AST type
  1961. // (for ex SubgroupMasks or 3x4 ObjectToWorld/WorldToObject matrices),
  1962. // translate now from the SPIR-V type to the AST type, for the consuming
  1963. // operation.
  1964. // Note this turns it from an l-value to an r-value.
  1965. // Currently, all symbols needing this are inputs; avoid the map lookup when non-input.
  1966. if (symbol->getType().getQualifier().storage == glslang::EvqVaryingIn)
  1967. id = translateForcedType(id);
  1968. }
  1969. // Only process non-linkage-only nodes for generating actual static uses
  1970. if (! linkageOnly || symbol->getQualifier().isSpecConstant()) {
  1971. // Prepare to generate code for the access
  1972. // L-value chains will be computed left to right. We're on the symbol now,
  1973. // which is the left-most part of the access chain, so now is "clear" time,
  1974. // followed by setting the base.
  1975. builder.clearAccessChain();
  1976. // For now, we consider all user variables as being in memory, so they are pointers,
  1977. // except for
  1978. // A) R-Value arguments to a function, which are an intermediate object.
  1979. // See comments in handleUserFunctionCall().
  1980. // B) Specialization constants (normal constants don't even come in as a variable),
  1981. // These are also pure R-values.
  1982. // C) R-Values from type translation, see above call to translateForcedType()
  1983. glslang::TQualifier qualifier = symbol->getQualifier();
  1984. if (qualifier.isSpecConstant() || rValueParameters.find(symbol->getId()) != rValueParameters.end() ||
  1985. !builder.isPointerType(builder.getTypeId(id)))
  1986. builder.setAccessChainRValue(id);
  1987. else
  1988. builder.setAccessChainLValue(id);
  1989. }
  1990. #ifdef ENABLE_HLSL
  1991. // Process linkage-only nodes for any special additional interface work.
  1992. if (linkageOnly) {
  1993. if (glslangIntermediate->getHlslFunctionality1()) {
  1994. // Map implicit counter buffers to their originating buffers, which should have been
  1995. // seen by now, given earlier pruning of unused counters, and preservation of order
  1996. // of declaration.
  1997. if (symbol->getType().getQualifier().isUniformOrBuffer()) {
  1998. if (!glslangIntermediate->hasCounterBufferName(symbol->getName())) {
  1999. // Save possible originating buffers for counter buffers, keyed by
  2000. // making the potential counter-buffer name.
  2001. std::string keyName = symbol->getName().c_str();
  2002. keyName = glslangIntermediate->addCounterBufferName(keyName);
  2003. counterOriginator[keyName] = symbol;
  2004. } else {
  2005. // Handle a counter buffer, by finding the saved originating buffer.
  2006. std::string keyName = symbol->getName().c_str();
  2007. auto it = counterOriginator.find(keyName);
  2008. if (it != counterOriginator.end()) {
  2009. id = getSymbolId(it->second);
  2010. if (id != spv::NoResult) {
  2011. spv::Id counterId = getSymbolId(symbol);
  2012. if (counterId != spv::NoResult) {
  2013. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  2014. builder.addDecorationId(id, spv::Decoration::HlslCounterBufferGOOGLE, counterId);
  2015. }
  2016. }
  2017. }
  2018. }
  2019. }
  2020. }
  2021. }
  2022. #endif
  2023. }
  2024. bool TGlslangToSpvTraverser::visitBinary(glslang::TVisit /* visit */, glslang::TIntermBinary* node)
  2025. {
  2026. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2027. if (node->getLeft()->getAsSymbolNode() != nullptr && node->getLeft()->getType().isStruct()) {
  2028. glslangTypeToIdMap[node->getLeft()->getType().getStruct()] = node->getLeft()->getAsSymbolNode()->getId();
  2029. }
  2030. if (node->getRight()->getAsSymbolNode() != nullptr && node->getRight()->getType().isStruct()) {
  2031. glslangTypeToIdMap[node->getRight()->getType().getStruct()] = node->getRight()->getAsSymbolNode()->getId();
  2032. }
  2033. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2034. if (node->getType().getQualifier().isSpecConstant())
  2035. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2036. // First, handle special cases
  2037. switch (node->getOp()) {
  2038. case glslang::EOpAssign:
  2039. case glslang::EOpAddAssign:
  2040. case glslang::EOpSubAssign:
  2041. case glslang::EOpMulAssign:
  2042. case glslang::EOpVectorTimesMatrixAssign:
  2043. case glslang::EOpVectorTimesScalarAssign:
  2044. case glslang::EOpMatrixTimesScalarAssign:
  2045. case glslang::EOpMatrixTimesMatrixAssign:
  2046. case glslang::EOpDivAssign:
  2047. case glslang::EOpModAssign:
  2048. case glslang::EOpAndAssign:
  2049. case glslang::EOpInclusiveOrAssign:
  2050. case glslang::EOpExclusiveOrAssign:
  2051. case glslang::EOpLeftShiftAssign:
  2052. case glslang::EOpRightShiftAssign:
  2053. // A bin-op assign "a += b" means the same thing as "a = a + b"
  2054. // where a is evaluated before b. For a simple assignment, GLSL
  2055. // says to evaluate the left before the right. So, always, left
  2056. // node then right node.
  2057. {
  2058. // get the left l-value, save it away
  2059. builder.clearAccessChain();
  2060. node->getLeft()->traverse(this);
  2061. spv::Builder::AccessChain lValue = builder.getAccessChain();
  2062. // evaluate the right
  2063. builder.clearAccessChain();
  2064. node->getRight()->traverse(this);
  2065. spv::Id rValue = accessChainLoad(node->getRight()->getType());
  2066. // reset line number for assignment
  2067. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2068. if (node->getOp() != glslang::EOpAssign) {
  2069. // the left is also an r-value
  2070. builder.setAccessChain(lValue);
  2071. spv::Id leftRValue = accessChainLoad(node->getLeft()->getType());
  2072. // do the operation
  2073. spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(node->getLeft()->getType());
  2074. coherentFlags |= TranslateCoherent(node->getRight()->getType());
  2075. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2076. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2077. TranslateNonUniformDecoration(coherentFlags) };
  2078. rValue = createBinaryOperation(node->getOp(), decorations,
  2079. convertGlslangToSpvType(node->getType()), leftRValue, rValue,
  2080. node->getType().getBasicType());
  2081. // these all need their counterparts in createBinaryOperation()
  2082. assert(rValue != spv::NoResult);
  2083. }
  2084. // store the result
  2085. builder.setAccessChain(lValue);
  2086. multiTypeStore(node->getLeft()->getType(), rValue);
  2087. // assignments are expressions having an rValue after they are evaluated...
  2088. builder.clearAccessChain();
  2089. builder.setAccessChainRValue(rValue);
  2090. }
  2091. return false;
  2092. case glslang::EOpIndexDirect:
  2093. case glslang::EOpIndexDirectStruct:
  2094. {
  2095. // Structure, array, matrix, or vector indirection with statically known index.
  2096. // Get the left part of the access chain.
  2097. node->getLeft()->traverse(this);
  2098. // Add the next element in the chain
  2099. const int glslangIndex = node->getRight()->getAsConstantUnion()->getConstArray()[0].getIConst();
  2100. if (! node->getLeft()->getType().isArray() &&
  2101. node->getLeft()->getType().isVector() &&
  2102. node->getOp() == glslang::EOpIndexDirect) {
  2103. // Swizzle is uniform so propagate uniform into access chain
  2104. spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(node->getLeft()->getType());
  2105. coherentFlags.nonUniform = 0;
  2106. // This is essentially a hard-coded vector swizzle of size 1,
  2107. // so short circuit the access-chain stuff with a swizzle.
  2108. std::vector<unsigned> swizzle;
  2109. swizzle.push_back(glslangIndex);
  2110. int dummySize;
  2111. builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(node->getLeft()->getType()),
  2112. coherentFlags,
  2113. glslangIntermediate->getBaseAlignmentScalar(
  2114. node->getLeft()->getType(), dummySize));
  2115. } else {
  2116. // Load through a block reference is performed with a dot operator that
  2117. // is mapped to EOpIndexDirectStruct. When we get to the actual reference,
  2118. // do a load and reset the access chain.
  2119. if (node->getLeft()->isReference() &&
  2120. !node->getLeft()->getType().isArray() &&
  2121. node->getOp() == glslang::EOpIndexDirectStruct)
  2122. {
  2123. spv::Id left = accessChainLoad(node->getLeft()->getType());
  2124. builder.clearAccessChain();
  2125. builder.setAccessChainLValue(left);
  2126. }
  2127. int spvIndex = glslangIndex;
  2128. if (node->getLeft()->getBasicType() == glslang::EbtBlock &&
  2129. node->getOp() == glslang::EOpIndexDirectStruct)
  2130. {
  2131. // This may be, e.g., an anonymous block-member selection, which generally need
  2132. // index remapping due to hidden members in anonymous blocks.
  2133. long long glslangId = glslangTypeToIdMap[node->getLeft()->getType().getStruct()];
  2134. if (memberRemapper.find(glslangId) != memberRemapper.end()) {
  2135. std::vector<int>& remapper = memberRemapper[glslangId];
  2136. assert(remapper.size() > 0);
  2137. spvIndex = remapper[glslangIndex];
  2138. }
  2139. }
  2140. // Struct reference propagates uniform lvalue
  2141. spv::Builder::AccessChain::CoherentFlags coherentFlags =
  2142. TranslateCoherent(node->getLeft()->getType());
  2143. coherentFlags.nonUniform = 0;
  2144. // normal case for indexing array or structure or block
  2145. builder.accessChainPush(builder.makeIntConstant(spvIndex),
  2146. coherentFlags,
  2147. node->getLeft()->getType().getBufferReferenceAlignment());
  2148. // Add capabilities here for accessing PointSize and clip/cull distance.
  2149. // We have deferred generation of associated capabilities until now.
  2150. if (node->getLeft()->getType().isStruct() && ! node->getLeft()->getType().isArray())
  2151. declareUseOfStructMember(*(node->getLeft()->getType().getStruct()), glslangIndex);
  2152. }
  2153. }
  2154. return false;
  2155. case glslang::EOpIndexIndirect:
  2156. {
  2157. // Array, matrix, or vector indirection with variable index.
  2158. // Will use native SPIR-V access-chain for and array indirection;
  2159. // matrices are arrays of vectors, so will also work for a matrix.
  2160. // Will use the access chain's 'component' for variable index into a vector.
  2161. // This adapter is building access chains left to right.
  2162. // Set up the access chain to the left.
  2163. node->getLeft()->traverse(this);
  2164. // save it so that computing the right side doesn't trash it
  2165. spv::Builder::AccessChain partial = builder.getAccessChain();
  2166. // compute the next index in the chain
  2167. builder.clearAccessChain();
  2168. node->getRight()->traverse(this);
  2169. spv::Id index = accessChainLoad(node->getRight()->getType());
  2170. // Zero-extend smaller unsigned integer types for array indexing.
  2171. // SPIR-V OpAccessChain treats indices as signed, so we need to zero-extend
  2172. // unsigned types to preserve their values (signed types are fine as-is).
  2173. spv::Id indexType = builder.getTypeId(index);
  2174. if (builder.isUintType(indexType) && builder.getScalarTypeWidth(indexType) < 32) {
  2175. // Zero-extend unsigned types to preserve their values
  2176. spv::Id uintType = builder.makeUintType(32);
  2177. index = builder.createUnaryOp(spv::Op::OpUConvert, uintType, index);
  2178. }
  2179. addIndirectionIndexCapabilities(node->getLeft()->getType(), node->getRight()->getType());
  2180. // restore the saved access chain
  2181. builder.setAccessChain(partial);
  2182. // Only if index is nonUniform should we propagate nonUniform into access chain
  2183. spv::Builder::AccessChain::CoherentFlags index_flags = TranslateCoherent(node->getRight()->getType());
  2184. spv::Builder::AccessChain::CoherentFlags coherent_flags = TranslateCoherent(node->getLeft()->getType());
  2185. coherent_flags.nonUniform = index_flags.nonUniform;
  2186. if (! node->getLeft()->getType().isArray() && node->getLeft()->getType().isVector()) {
  2187. int dummySize;
  2188. builder.accessChainPushComponent(
  2189. index, convertGlslangToSpvType(node->getLeft()->getType()), coherent_flags,
  2190. glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(),
  2191. dummySize));
  2192. } else
  2193. builder.accessChainPush(index, coherent_flags,
  2194. node->getLeft()->getType().getBufferReferenceAlignment());
  2195. }
  2196. return false;
  2197. case glslang::EOpVectorSwizzle:
  2198. {
  2199. node->getLeft()->traverse(this);
  2200. std::vector<unsigned> swizzle;
  2201. convertSwizzle(*node->getRight()->getAsAggregate(), swizzle);
  2202. int dummySize;
  2203. builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(node->getLeft()->getType()),
  2204. TranslateCoherent(node->getLeft()->getType()),
  2205. glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(),
  2206. dummySize));
  2207. }
  2208. return false;
  2209. case glslang::EOpMatrixSwizzle:
  2210. logger->missingFunctionality("matrix swizzle");
  2211. return true;
  2212. case glslang::EOpLogicalOr:
  2213. case glslang::EOpLogicalAnd:
  2214. {
  2215. // These may require short circuiting, but can sometimes be done as straight
  2216. // binary operations. The right operand must be short circuited if it has
  2217. // side effects, and should probably be if it is complex.
  2218. if (isTrivial(node->getRight()->getAsTyped()))
  2219. break; // handle below as a normal binary operation
  2220. // otherwise, we need to do dynamic short circuiting on the right operand
  2221. spv::Id result = createShortCircuit(node->getOp(), *node->getLeft()->getAsTyped(),
  2222. *node->getRight()->getAsTyped());
  2223. builder.clearAccessChain();
  2224. builder.setAccessChainRValue(result);
  2225. }
  2226. return false;
  2227. default:
  2228. break;
  2229. }
  2230. // Assume generic binary op...
  2231. // get right operand
  2232. builder.clearAccessChain();
  2233. node->getLeft()->traverse(this);
  2234. spv::Id left = accessChainLoad(node->getLeft()->getType());
  2235. // get left operand
  2236. builder.clearAccessChain();
  2237. node->getRight()->traverse(this);
  2238. spv::Id right = accessChainLoad(node->getRight()->getType());
  2239. // get result
  2240. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2241. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2242. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  2243. spv::Id result = createBinaryOperation(node->getOp(), decorations,
  2244. convertGlslangToSpvType(node->getType()), left, right,
  2245. node->getLeft()->getType().getBasicType());
  2246. builder.clearAccessChain();
  2247. if (! result) {
  2248. logger->missingFunctionality("unknown glslang binary operation");
  2249. return true; // pick up a child as the place-holder result
  2250. } else {
  2251. builder.setAccessChainRValue(result);
  2252. return false;
  2253. }
  2254. }
  2255. spv::Id TGlslangToSpvTraverser::convertLoadedBoolInUniformToUint(const glslang::TType& type,
  2256. spv::Id nominalTypeId,
  2257. spv::Id loadedId)
  2258. {
  2259. if (builder.isScalarType(nominalTypeId)) {
  2260. // Conversion for bool
  2261. spv::Id boolType = builder.makeBoolType();
  2262. if (nominalTypeId != boolType)
  2263. return builder.createBinOp(spv::Op::OpINotEqual, boolType, loadedId, builder.makeUintConstant(0));
  2264. } else if (builder.isVectorType(nominalTypeId)) {
  2265. // Conversion for bvec
  2266. int vecSize = builder.getNumTypeComponents(nominalTypeId);
  2267. spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);
  2268. if (nominalTypeId != bvecType)
  2269. loadedId = builder.createBinOp(spv::Op::OpINotEqual, bvecType, loadedId,
  2270. makeSmearedConstant(builder.makeUintConstant(0), vecSize));
  2271. } else if (builder.isArrayType(nominalTypeId)) {
  2272. // Conversion for bool array
  2273. spv::Id boolArrayTypeId = convertGlslangToSpvType(type);
  2274. if (nominalTypeId != boolArrayTypeId)
  2275. {
  2276. // Use OpCopyLogical from SPIR-V 1.4 if available.
  2277. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4)
  2278. return builder.createUnaryOp(spv::Op::OpCopyLogical, boolArrayTypeId, loadedId);
  2279. glslang::TType glslangElementType(type, 0);
  2280. spv::Id elementNominalTypeId = builder.getContainedTypeId(nominalTypeId);
  2281. std::vector<spv::Id> constituents;
  2282. for (int index = 0; index < type.getOuterArraySize(); ++index) {
  2283. // get the element
  2284. spv::Id elementValue = builder.createCompositeExtract(loadedId, elementNominalTypeId, index);
  2285. // recursively convert it
  2286. spv::Id elementConvertedValue = convertLoadedBoolInUniformToUint(glslangElementType, elementNominalTypeId, elementValue);
  2287. constituents.push_back(elementConvertedValue);
  2288. }
  2289. return builder.createCompositeConstruct(boolArrayTypeId, constituents);
  2290. }
  2291. }
  2292. return loadedId;
  2293. }
  2294. // Figure out what, if any, type changes are needed when accessing a specific built-in.
  2295. // Returns <the type SPIR-V requires for declarion, the type to translate to on use>.
  2296. // Also see comment for 'forceType', regarding tracking SPIR-V-required types.
  2297. std::pair<spv::Id, spv::Id> TGlslangToSpvTraverser::getForcedType(glslang::TBuiltInVariable glslangBuiltIn,
  2298. const glslang::TType& glslangType)
  2299. {
  2300. switch(glslangBuiltIn)
  2301. {
  2302. case glslang::EbvSubGroupEqMask:
  2303. case glslang::EbvSubGroupGeMask:
  2304. case glslang::EbvSubGroupGtMask:
  2305. case glslang::EbvSubGroupLeMask:
  2306. case glslang::EbvSubGroupLtMask: {
  2307. // these require changing a 64-bit scaler -> a vector of 32-bit components
  2308. if (glslangType.isVector())
  2309. break;
  2310. spv::Id ivec4_type = builder.makeVectorType(builder.makeUintType(32), 4);
  2311. spv::Id uint64_type = builder.makeUintType(64);
  2312. std::pair<spv::Id, spv::Id> ret(ivec4_type, uint64_type);
  2313. return ret;
  2314. }
  2315. // There are no SPIR-V builtins defined for these and map onto original non-transposed
  2316. // builtins. During visitBinary we insert a transpose
  2317. case glslang::EbvWorldToObject3x4:
  2318. case glslang::EbvObjectToWorld3x4: {
  2319. spv::Id mat43 = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  2320. spv::Id mat34 = builder.makeMatrixType(builder.makeFloatType(32), 3, 4);
  2321. std::pair<spv::Id, spv::Id> ret(mat43, mat34);
  2322. return ret;
  2323. }
  2324. default:
  2325. break;
  2326. }
  2327. std::pair<spv::Id, spv::Id> ret(spv::NoType, spv::NoType);
  2328. return ret;
  2329. }
  2330. // For an object previously identified (see getForcedType() and forceType)
  2331. // as needing type translations, do the translation needed for a load, turning
  2332. // an L-value into in R-value.
  2333. spv::Id TGlslangToSpvTraverser::translateForcedType(spv::Id object)
  2334. {
  2335. const auto forceIt = forceType.find(object);
  2336. if (forceIt == forceType.end())
  2337. return object;
  2338. spv::Id desiredTypeId = forceIt->second;
  2339. spv::Id objectTypeId = builder.getTypeId(object);
  2340. assert(builder.isPointerType(objectTypeId));
  2341. objectTypeId = builder.getContainedTypeId(objectTypeId);
  2342. if (builder.isVectorType(objectTypeId) &&
  2343. builder.getScalarTypeWidth(builder.getContainedTypeId(objectTypeId)) == 32) {
  2344. if (builder.getScalarTypeWidth(desiredTypeId) == 64) {
  2345. // handle 32-bit v.xy* -> 64-bit
  2346. builder.clearAccessChain();
  2347. builder.setAccessChainLValue(object);
  2348. object = builder.accessChainLoad(spv::NoPrecision, spv::Decoration::Max, spv::Decoration::Max, objectTypeId);
  2349. std::vector<spv::Id> components;
  2350. components.push_back(builder.createCompositeExtract(object, builder.getContainedTypeId(objectTypeId), 0));
  2351. components.push_back(builder.createCompositeExtract(object, builder.getContainedTypeId(objectTypeId), 1));
  2352. spv::Id vecType = builder.makeVectorType(builder.getContainedTypeId(objectTypeId), 2);
  2353. return builder.createUnaryOp(spv::Op::OpBitcast, desiredTypeId,
  2354. builder.createCompositeConstruct(vecType, components));
  2355. } else {
  2356. logger->missingFunctionality("forcing 32-bit vector type to non 64-bit scalar");
  2357. }
  2358. } else if (builder.isMatrixType(objectTypeId)) {
  2359. // There are no SPIR-V builtins defined for 3x4 variants of ObjectToWorld/WorldToObject
  2360. // and we insert a transpose after loading the original non-transposed builtins
  2361. builder.clearAccessChain();
  2362. builder.setAccessChainLValue(object);
  2363. object = builder.accessChainLoad(spv::NoPrecision, spv::Decoration::Max, spv::Decoration::Max, objectTypeId);
  2364. return builder.createUnaryOp(spv::Op::OpTranspose, desiredTypeId, object);
  2365. } else {
  2366. logger->missingFunctionality("forcing non 32-bit vector type");
  2367. }
  2368. return object;
  2369. }
  2370. bool TGlslangToSpvTraverser::visitUnary(glslang::TVisit /* visit */, glslang::TIntermUnary* node)
  2371. {
  2372. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2373. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2374. if (node->getType().getQualifier().isSpecConstant())
  2375. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2376. spv::Id result = spv::NoResult;
  2377. // try texturing first
  2378. result = createImageTextureFunctionCall(node);
  2379. if (result != spv::NoResult) {
  2380. builder.clearAccessChain();
  2381. builder.setAccessChainRValue(result);
  2382. return false; // done with this node
  2383. }
  2384. // Non-texturing.
  2385. if (node->getOp() == glslang::EOpArrayLength) {
  2386. // Quite special; won't want to evaluate the operand.
  2387. // Currently, the front-end does not allow .length() on an array until it is sized,
  2388. // except for the last block membeor of an SSBO.
  2389. // TODO: If this changes, link-time sized arrays might show up here, and need their
  2390. // size extracted.
  2391. // Normal .length() would have been constant folded by the front-end.
  2392. // So, this has to be block.lastMember.length().
  2393. // SPV wants "block" and member number as the operands, go get them.
  2394. spv::Id length;
  2395. if (node->getOperand()->getType().isCoopMat()) {
  2396. spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());
  2397. assert(builder.isCooperativeMatrixType(typeId));
  2398. if (node->getOperand()->getType().isCoopMatKHR()) {
  2399. length = builder.createCooperativeMatrixLengthKHR(typeId);
  2400. } else {
  2401. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2402. length = builder.createCooperativeMatrixLengthNV(typeId);
  2403. }
  2404. } else if (node->getOperand()->getType().isCoopVecNV()) {
  2405. spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());
  2406. length = builder.getCooperativeVectorNumComponents(typeId);
  2407. } else {
  2408. glslang::TIntermTyped* block = node->getOperand()->getAsBinaryNode()->getLeft();
  2409. block->traverse(this);
  2410. unsigned int member = node->getOperand()->getAsBinaryNode()->getRight()->getAsConstantUnion()
  2411. ->getConstArray()[0].getUConst();
  2412. length = builder.createArrayLength(builder.accessChainGetLValue(), member);
  2413. }
  2414. // GLSL semantics say the result of .length() is an int, while SPIR-V says
  2415. // signedness must be 0. So, convert from SPIR-V unsigned back to GLSL's
  2416. // AST expectation of a signed result.
  2417. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
  2418. if (builder.isInSpecConstCodeGenMode()) {
  2419. length = builder.createBinOp(spv::Op::OpIAdd, builder.makeIntType(32), length, builder.makeIntConstant(0));
  2420. } else {
  2421. length = builder.createUnaryOp(spv::Op::OpBitcast, builder.makeIntType(32), length);
  2422. }
  2423. }
  2424. builder.clearAccessChain();
  2425. builder.setAccessChainRValue(length);
  2426. return false;
  2427. }
  2428. // Force variable declaration - Debug Mode Only
  2429. if (node->getOp() == glslang::EOpDeclare) {
  2430. builder.clearAccessChain();
  2431. node->getOperand()->traverse(this);
  2432. builder.clearAccessChain();
  2433. return false;
  2434. }
  2435. // Start by evaluating the operand
  2436. // Does it need a swizzle inversion? If so, evaluation is inverted;
  2437. // operate first on the swizzle base, then apply the swizzle.
  2438. spv::Id invertedType = spv::NoType;
  2439. auto resultType = [&invertedType, &node, this](){ return invertedType != spv::NoType ?
  2440. invertedType : convertGlslangToSpvType(node->getType()); };
  2441. if (node->getOp() == glslang::EOpInterpolateAtCentroid)
  2442. invertedType = getInvertedSwizzleType(*node->getOperand());
  2443. builder.clearAccessChain();
  2444. TIntermNode *operandNode;
  2445. if (invertedType != spv::NoType)
  2446. operandNode = node->getOperand()->getAsBinaryNode()->getLeft();
  2447. else
  2448. operandNode = node->getOperand();
  2449. operandNode->traverse(this);
  2450. spv::Id operand = spv::NoResult;
  2451. spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
  2452. const auto hitObjectOpsWithLvalue = [](glslang::TOperator op) {
  2453. switch(op) {
  2454. case glslang::EOpReorderThreadNV:
  2455. case glslang::EOpHitObjectGetCurrentTimeNV:
  2456. case glslang::EOpHitObjectGetHitKindNV:
  2457. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  2458. case glslang::EOpHitObjectGetGeometryIndexNV:
  2459. case glslang::EOpHitObjectGetInstanceIdNV:
  2460. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  2461. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  2462. case glslang::EOpHitObjectGetObjectRayOriginNV:
  2463. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  2464. case glslang::EOpHitObjectGetWorldRayOriginNV:
  2465. case glslang::EOpHitObjectGetWorldToObjectNV:
  2466. case glslang::EOpHitObjectGetObjectToWorldNV:
  2467. case glslang::EOpHitObjectGetRayTMaxNV:
  2468. case glslang::EOpHitObjectGetRayTMinNV:
  2469. case glslang::EOpHitObjectIsEmptyNV:
  2470. case glslang::EOpHitObjectIsHitNV:
  2471. case glslang::EOpHitObjectIsMissNV:
  2472. case glslang::EOpHitObjectRecordEmptyNV:
  2473. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  2474. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  2475. case glslang::EOpHitObjectGetClusterIdNV:
  2476. case glslang::EOpHitObjectGetSpherePositionNV:
  2477. case glslang::EOpHitObjectGetSphereRadiusNV:
  2478. case glslang::EOpHitObjectIsSphereHitNV:
  2479. case glslang::EOpHitObjectIsLSSHitNV:
  2480. return true;
  2481. default:
  2482. return false;
  2483. }
  2484. };
  2485. if (node->getOp() == glslang::EOpAtomicCounterIncrement ||
  2486. node->getOp() == glslang::EOpAtomicCounterDecrement ||
  2487. node->getOp() == glslang::EOpAtomicCounter ||
  2488. (node->getOp() == glslang::EOpInterpolateAtCentroid &&
  2489. glslangIntermediate->getSource() != glslang::EShSourceHlsl) ||
  2490. node->getOp() == glslang::EOpRayQueryProceed ||
  2491. node->getOp() == glslang::EOpRayQueryGetRayTMin ||
  2492. node->getOp() == glslang::EOpRayQueryGetRayFlags ||
  2493. node->getOp() == glslang::EOpRayQueryGetWorldRayOrigin ||
  2494. node->getOp() == glslang::EOpRayQueryGetWorldRayDirection ||
  2495. node->getOp() == glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque ||
  2496. node->getOp() == glslang::EOpRayQueryTerminate ||
  2497. node->getOp() == glslang::EOpRayQueryConfirmIntersection ||
  2498. (node->getOp() == glslang::EOpSpirvInst && operandNode->getAsTyped()->getQualifier().isSpirvByReference()) ||
  2499. hitObjectOpsWithLvalue(node->getOp())) {
  2500. operand = builder.accessChainGetLValue(); // Special case l-value operands
  2501. lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
  2502. lvalueCoherentFlags |= TranslateCoherent(operandNode->getAsTyped()->getType());
  2503. } else if (operandNode->getAsTyped()->getQualifier().isSpirvLiteral()) {
  2504. // Will be translated to a literal value, make a placeholder here
  2505. operand = spv::NoResult;
  2506. } else {
  2507. operand = accessChainLoad(node->getOperand()->getType());
  2508. }
  2509. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2510. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2511. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  2512. // it could be a conversion
  2513. if (! result) {
  2514. result = createConversion(node->getOp(), decorations, resultType(), operand,
  2515. node->getType().getBasicType(), node->getOperand()->getBasicType());
  2516. if (result) {
  2517. if (node->getType().isCoopMatKHR() && node->getOperand()->getAsTyped()->getType().isCoopMatKHR() &&
  2518. !node->getAsTyped()->getType().sameCoopMatUse(node->getOperand()->getAsTyped()->getType())) {
  2519. // Conversions that change use need CapabilityCooperativeMatrixConversionsNV
  2520. builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
  2521. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  2522. }
  2523. }
  2524. }
  2525. // if not, then possibly an operation
  2526. if (! result)
  2527. result = createUnaryOperation(node->getOp(), decorations, resultType(), operand,
  2528. node->getOperand()->getBasicType(), lvalueCoherentFlags, node->getType());
  2529. // it could be attached to a SPIR-V intruction
  2530. if (!result) {
  2531. if (node->getOp() == glslang::EOpSpirvInst) {
  2532. const auto& spirvInst = node->getSpirvInstruction();
  2533. if (spirvInst.set == "") {
  2534. spv::IdImmediate idImmOp = {true, operand};
  2535. if (operandNode->getAsTyped()->getQualifier().isSpirvLiteral()) {
  2536. // Translate the constant to a literal value
  2537. std::vector<unsigned> literals;
  2538. glslang::TVector<const glslang::TIntermConstantUnion*> constants;
  2539. constants.push_back(operandNode->getAsConstantUnion());
  2540. TranslateLiterals(constants, literals);
  2541. idImmOp = {false, literals[0]};
  2542. }
  2543. if (node->getBasicType() == glslang::EbtVoid)
  2544. builder.createNoResultOp(static_cast<spv::Op>(spirvInst.id), {idImmOp});
  2545. else
  2546. result = builder.createOp(static_cast<spv::Op>(spirvInst.id), resultType(), {idImmOp});
  2547. } else {
  2548. result = builder.createBuiltinCall(
  2549. resultType(), spirvInst.set == "GLSL.std.450" ? stdBuiltins : getExtBuiltins(spirvInst.set.c_str()),
  2550. spirvInst.id, {operand});
  2551. }
  2552. if (node->getBasicType() == glslang::EbtVoid)
  2553. return false; // done with this node
  2554. }
  2555. }
  2556. if (result) {
  2557. if (invertedType) {
  2558. result = createInvertedSwizzle(decorations.precision, *node->getOperand(), result);
  2559. decorations.addNonUniform(builder, result);
  2560. }
  2561. builder.clearAccessChain();
  2562. builder.setAccessChainRValue(result);
  2563. return false; // done with this node
  2564. }
  2565. // it must be a special case, check...
  2566. switch (node->getOp()) {
  2567. case glslang::EOpPostIncrement:
  2568. case glslang::EOpPostDecrement:
  2569. case glslang::EOpPreIncrement:
  2570. case glslang::EOpPreDecrement:
  2571. {
  2572. // we need the integer value "1" or the floating point "1.0" to add/subtract
  2573. spv::Id one = 0;
  2574. if (node->getBasicType() == glslang::EbtFloat)
  2575. one = builder.makeFloatConstant(1.0F);
  2576. else if (node->getBasicType() == glslang::EbtDouble)
  2577. one = builder.makeDoubleConstant(1.0);
  2578. else if (node->getBasicType() == glslang::EbtFloat16)
  2579. one = builder.makeFloat16Constant(1.0F);
  2580. else if (node->getBasicType() == glslang::EbtBFloat16)
  2581. one = builder.makeBFloat16Constant(1.0F);
  2582. else if (node->getBasicType() == glslang::EbtFloatE5M2)
  2583. one = builder.makeFloatE5M2Constant(1.0F);
  2584. else if (node->getBasicType() == glslang::EbtFloatE4M3)
  2585. one = builder.makeFloatE4M3Constant(1.0F);
  2586. else if (node->getBasicType() == glslang::EbtInt8 || node->getBasicType() == glslang::EbtUint8)
  2587. one = builder.makeInt8Constant(1);
  2588. else if (node->getBasicType() == glslang::EbtInt16 || node->getBasicType() == glslang::EbtUint16)
  2589. one = builder.makeInt16Constant(1);
  2590. else if (node->getBasicType() == glslang::EbtInt64 || node->getBasicType() == glslang::EbtUint64)
  2591. one = builder.makeInt64Constant(1);
  2592. else
  2593. one = builder.makeIntConstant(1);
  2594. glslang::TOperator op;
  2595. if (node->getOp() == glslang::EOpPreIncrement ||
  2596. node->getOp() == glslang::EOpPostIncrement)
  2597. op = glslang::EOpAdd;
  2598. else
  2599. op = glslang::EOpSub;
  2600. spv::Id result = createBinaryOperation(op, decorations,
  2601. convertGlslangToSpvType(node->getType()), operand, one,
  2602. node->getType().getBasicType());
  2603. assert(result != spv::NoResult);
  2604. // The result of operation is always stored, but conditionally the
  2605. // consumed result. The consumed result is always an r-value.
  2606. builder.accessChainStore(result,
  2607. TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags));
  2608. builder.clearAccessChain();
  2609. if (node->getOp() == glslang::EOpPreIncrement ||
  2610. node->getOp() == glslang::EOpPreDecrement)
  2611. builder.setAccessChainRValue(result);
  2612. else
  2613. builder.setAccessChainRValue(operand);
  2614. }
  2615. return false;
  2616. case glslang::EOpAssumeEXT:
  2617. builder.addCapability(spv::Capability::ExpectAssumeKHR);
  2618. builder.addExtension(spv::E_SPV_KHR_expect_assume);
  2619. builder.createNoResultOp(spv::Op::OpAssumeTrueKHR, operand);
  2620. return false;
  2621. case glslang::EOpEmitStreamVertex:
  2622. builder.createNoResultOp(spv::Op::OpEmitStreamVertex, operand);
  2623. return false;
  2624. case glslang::EOpEndStreamPrimitive:
  2625. builder.createNoResultOp(spv::Op::OpEndStreamPrimitive, operand);
  2626. return false;
  2627. case glslang::EOpRayQueryTerminate:
  2628. builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR, operand);
  2629. return false;
  2630. case glslang::EOpRayQueryConfirmIntersection:
  2631. builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR, operand);
  2632. return false;
  2633. case glslang::EOpReorderThreadNV:
  2634. builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectNV, operand);
  2635. return false;
  2636. case glslang::EOpHitObjectRecordEmptyNV:
  2637. builder.createNoResultOp(spv::Op::OpHitObjectRecordEmptyNV, operand);
  2638. return false;
  2639. case glslang::EOpCreateTensorLayoutNV:
  2640. result = builder.createOp(spv::Op::OpCreateTensorLayoutNV, resultType(), std::vector<spv::Id>{});
  2641. builder.clearAccessChain();
  2642. builder.setAccessChainRValue(result);
  2643. return false;
  2644. case glslang::EOpCreateTensorViewNV:
  2645. result = builder.createOp(spv::Op::OpCreateTensorViewNV, resultType(), std::vector<spv::Id>{});
  2646. builder.clearAccessChain();
  2647. builder.setAccessChainRValue(result);
  2648. return false;
  2649. default:
  2650. logger->missingFunctionality("unknown glslang unary");
  2651. return true; // pick up operand as placeholder result
  2652. }
  2653. }
  2654. // Construct a composite object, recursively copying members if their types don't match
  2655. spv::Id TGlslangToSpvTraverser::createCompositeConstruct(spv::Id resultTypeId, std::vector<spv::Id> constituents)
  2656. {
  2657. for (int c = 0; c < (int)constituents.size(); ++c) {
  2658. spv::Id& constituent = constituents[c];
  2659. spv::Id lType = builder.getContainedTypeId(resultTypeId, c);
  2660. spv::Id rType = builder.getTypeId(constituent);
  2661. if (lType != rType) {
  2662. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  2663. constituent = builder.createUnaryOp(spv::Op::OpCopyLogical, lType, constituent);
  2664. } else if (builder.isStructType(rType)) {
  2665. std::vector<spv::Id> rTypeConstituents;
  2666. int numrTypeConstituents = builder.getNumTypeConstituents(rType);
  2667. for (int i = 0; i < numrTypeConstituents; ++i) {
  2668. rTypeConstituents.push_back(builder.createCompositeExtract(constituent,
  2669. builder.getContainedTypeId(rType, i), i));
  2670. }
  2671. constituents[c] = createCompositeConstruct(lType, rTypeConstituents);
  2672. } else {
  2673. assert(builder.isArrayType(rType));
  2674. std::vector<spv::Id> rTypeConstituents;
  2675. int numrTypeConstituents = builder.getNumTypeConstituents(rType);
  2676. spv::Id elementRType = builder.getContainedTypeId(rType);
  2677. for (int i = 0; i < numrTypeConstituents; ++i) {
  2678. rTypeConstituents.push_back(builder.createCompositeExtract(constituent, elementRType, i));
  2679. }
  2680. constituents[c] = createCompositeConstruct(lType, rTypeConstituents);
  2681. }
  2682. }
  2683. }
  2684. return builder.createCompositeConstruct(resultTypeId, constituents);
  2685. }
  2686. bool TGlslangToSpvTraverser::visitAggregate(glslang::TVisit visit, glslang::TIntermAggregate* node)
  2687. {
  2688. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2689. if (node->getType().getQualifier().isSpecConstant())
  2690. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2691. spv::Id result = spv::NoResult;
  2692. spv::Id invertedType = spv::NoType; // to use to override the natural type of the node
  2693. std::vector<spv::Builder::AccessChain> complexLvalues; // for holding swizzling l-values too complex for
  2694. // SPIR-V, for an out parameter
  2695. std::vector<spv::Id> temporaryLvalues; // temporaries to pass, as proxies for complexLValues
  2696. auto resultType = [&invertedType, &node, this](){
  2697. if (invertedType != spv::NoType) {
  2698. return invertedType;
  2699. } else {
  2700. auto ret = convertGlslangToSpvType(node->getType());
  2701. // convertGlslangToSpvType may clobber the debug location, reset it
  2702. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2703. return ret;
  2704. }
  2705. };
  2706. // try texturing
  2707. result = createImageTextureFunctionCall(node);
  2708. if (result != spv::NoResult) {
  2709. builder.clearAccessChain();
  2710. builder.setAccessChainRValue(result);
  2711. return false;
  2712. } else if (node->getOp() == glslang::EOpImageStore ||
  2713. node->getOp() == glslang::EOpImageStoreLod ||
  2714. node->getOp() == glslang::EOpImageAtomicStore) {
  2715. // "imageStore" is a special case, which has no result
  2716. return false;
  2717. }
  2718. glslang::TOperator binOp = glslang::EOpNull;
  2719. bool reduceComparison = true;
  2720. bool isMatrix = false;
  2721. bool noReturnValue = false;
  2722. bool atomic = false;
  2723. spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
  2724. assert(node->getOp());
  2725. spv::Decoration precision = TranslatePrecisionDecoration(node->getOperationPrecision());
  2726. switch (node->getOp()) {
  2727. case glslang::EOpScope:
  2728. case glslang::EOpSequence:
  2729. {
  2730. if (visit == glslang::EvPreVisit) {
  2731. ++sequenceDepth;
  2732. if (sequenceDepth == 1) {
  2733. // If this is the parent node of all the functions, we want to see them
  2734. // early, so all call points have actual SPIR-V functions to reference.
  2735. // In all cases, still let the traverser visit the children for us.
  2736. makeFunctions(node->getAsAggregate()->getSequence());
  2737. // Global initializers is specific to the shader entry point, which does not exist in compile-only mode
  2738. if (!options.compileOnly) {
  2739. // Also, we want all globals initializers to go into the beginning of the entry point, before
  2740. // anything else gets there, so visit out of order, doing them all now.
  2741. makeGlobalInitializers(node->getAsAggregate()->getSequence());
  2742. }
  2743. //Pre process linker objects for ray tracing stages
  2744. if (glslangIntermediate->isRayTracingStage())
  2745. collectRayTracingLinkerObjects();
  2746. // Initializers are done, don't want to visit again, but functions and link objects need to be processed,
  2747. // so do them manually.
  2748. visitFunctions(node->getAsAggregate()->getSequence());
  2749. return false;
  2750. } else {
  2751. if (node->getOp() == glslang::EOpScope) {
  2752. auto loc = node->getLoc();
  2753. builder.enterLexicalBlock(loc.line, loc.column);
  2754. }
  2755. }
  2756. } else {
  2757. if (sequenceDepth > 1 && node->getOp() == glslang::EOpScope)
  2758. builder.leaveLexicalBlock();
  2759. --sequenceDepth;
  2760. }
  2761. return true;
  2762. }
  2763. case glslang::EOpLinkerObjects:
  2764. {
  2765. if (visit == glslang::EvPreVisit)
  2766. linkageOnly = true;
  2767. else
  2768. linkageOnly = false;
  2769. return true;
  2770. }
  2771. case glslang::EOpComma:
  2772. {
  2773. // processing from left to right naturally leaves the right-most
  2774. // lying around in the access chain
  2775. glslang::TIntermSequence& glslangOperands = node->getSequence();
  2776. for (int i = 0; i < (int)glslangOperands.size(); ++i)
  2777. glslangOperands[i]->traverse(this);
  2778. return false;
  2779. }
  2780. case glslang::EOpFunction:
  2781. if (visit == glslang::EvPreVisit) {
  2782. if (options.generateDebugInfo) {
  2783. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2784. }
  2785. if (isShaderEntryPoint(node)) {
  2786. inEntryPoint = true;
  2787. builder.setBuildPoint(shaderEntry->getLastBlock());
  2788. builder.enterFunction(shaderEntry);
  2789. currentFunction = shaderEntry;
  2790. } else {
  2791. handleFunctionEntry(node);
  2792. }
  2793. if (options.generateDebugInfo && !options.emitNonSemanticShaderDebugInfo) {
  2794. const auto& loc = node->getLoc();
  2795. const char* sourceFileName = loc.getFilename();
  2796. spv::Id sourceFileId = sourceFileName ? builder.getStringId(sourceFileName) : builder.getMainFileId();
  2797. currentFunction->setDebugLineInfo(sourceFileId, loc.line, loc.column);
  2798. }
  2799. } else {
  2800. if (options.generateDebugInfo) {
  2801. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl && node->getSequence().size() > 1) {
  2802. auto endLoc = node->getSequence()[1]->getAsAggregate()->getEndLoc();
  2803. builder.setDebugSourceLocation(endLoc.line, endLoc.getFilename());
  2804. }
  2805. }
  2806. if (inEntryPoint)
  2807. entryPointTerminated = true;
  2808. builder.leaveFunction();
  2809. inEntryPoint = false;
  2810. }
  2811. return true;
  2812. case glslang::EOpParameters:
  2813. // Parameters will have been consumed by EOpFunction processing, but not
  2814. // the body, so we still visited the function node's children, making this
  2815. // child redundant.
  2816. return false;
  2817. case glslang::EOpFunctionCall:
  2818. {
  2819. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2820. if (node->isUserDefined())
  2821. result = handleUserFunctionCall(node);
  2822. if (result) {
  2823. builder.clearAccessChain();
  2824. builder.setAccessChainRValue(result);
  2825. } else
  2826. logger->missingFunctionality("missing user function; linker needs to catch that");
  2827. return false;
  2828. }
  2829. case glslang::EOpConstructMat2x2:
  2830. case glslang::EOpConstructMat2x3:
  2831. case glslang::EOpConstructMat2x4:
  2832. case glslang::EOpConstructMat3x2:
  2833. case glslang::EOpConstructMat3x3:
  2834. case glslang::EOpConstructMat3x4:
  2835. case glslang::EOpConstructMat4x2:
  2836. case glslang::EOpConstructMat4x3:
  2837. case glslang::EOpConstructMat4x4:
  2838. case glslang::EOpConstructDMat2x2:
  2839. case glslang::EOpConstructDMat2x3:
  2840. case glslang::EOpConstructDMat2x4:
  2841. case glslang::EOpConstructDMat3x2:
  2842. case glslang::EOpConstructDMat3x3:
  2843. case glslang::EOpConstructDMat3x4:
  2844. case glslang::EOpConstructDMat4x2:
  2845. case glslang::EOpConstructDMat4x3:
  2846. case glslang::EOpConstructDMat4x4:
  2847. case glslang::EOpConstructIMat2x2:
  2848. case glslang::EOpConstructIMat2x3:
  2849. case glslang::EOpConstructIMat2x4:
  2850. case glslang::EOpConstructIMat3x2:
  2851. case glslang::EOpConstructIMat3x3:
  2852. case glslang::EOpConstructIMat3x4:
  2853. case glslang::EOpConstructIMat4x2:
  2854. case glslang::EOpConstructIMat4x3:
  2855. case glslang::EOpConstructIMat4x4:
  2856. case glslang::EOpConstructUMat2x2:
  2857. case glslang::EOpConstructUMat2x3:
  2858. case glslang::EOpConstructUMat2x4:
  2859. case glslang::EOpConstructUMat3x2:
  2860. case glslang::EOpConstructUMat3x3:
  2861. case glslang::EOpConstructUMat3x4:
  2862. case glslang::EOpConstructUMat4x2:
  2863. case glslang::EOpConstructUMat4x3:
  2864. case glslang::EOpConstructUMat4x4:
  2865. case glslang::EOpConstructBMat2x2:
  2866. case glslang::EOpConstructBMat2x3:
  2867. case glslang::EOpConstructBMat2x4:
  2868. case glslang::EOpConstructBMat3x2:
  2869. case glslang::EOpConstructBMat3x3:
  2870. case glslang::EOpConstructBMat3x4:
  2871. case glslang::EOpConstructBMat4x2:
  2872. case glslang::EOpConstructBMat4x3:
  2873. case glslang::EOpConstructBMat4x4:
  2874. case glslang::EOpConstructF16Mat2x2:
  2875. case glslang::EOpConstructF16Mat2x3:
  2876. case glslang::EOpConstructF16Mat2x4:
  2877. case glslang::EOpConstructF16Mat3x2:
  2878. case glslang::EOpConstructF16Mat3x3:
  2879. case glslang::EOpConstructF16Mat3x4:
  2880. case glslang::EOpConstructF16Mat4x2:
  2881. case glslang::EOpConstructF16Mat4x3:
  2882. case glslang::EOpConstructF16Mat4x4:
  2883. isMatrix = true;
  2884. [[fallthrough]];
  2885. case glslang::EOpConstructFloat:
  2886. case glslang::EOpConstructVec2:
  2887. case glslang::EOpConstructVec3:
  2888. case glslang::EOpConstructVec4:
  2889. case glslang::EOpConstructDouble:
  2890. case glslang::EOpConstructDVec2:
  2891. case glslang::EOpConstructDVec3:
  2892. case glslang::EOpConstructDVec4:
  2893. case glslang::EOpConstructFloat16:
  2894. case glslang::EOpConstructF16Vec2:
  2895. case glslang::EOpConstructF16Vec3:
  2896. case glslang::EOpConstructF16Vec4:
  2897. case glslang::EOpConstructBFloat16:
  2898. case glslang::EOpConstructBF16Vec2:
  2899. case glslang::EOpConstructBF16Vec3:
  2900. case glslang::EOpConstructBF16Vec4:
  2901. case glslang::EOpConstructFloatE5M2:
  2902. case glslang::EOpConstructFloatE5M2Vec2:
  2903. case glslang::EOpConstructFloatE5M2Vec3:
  2904. case glslang::EOpConstructFloatE5M2Vec4:
  2905. case glslang::EOpConstructFloatE4M3:
  2906. case glslang::EOpConstructFloatE4M3Vec2:
  2907. case glslang::EOpConstructFloatE4M3Vec3:
  2908. case glslang::EOpConstructFloatE4M3Vec4:
  2909. case glslang::EOpConstructBool:
  2910. case glslang::EOpConstructBVec2:
  2911. case glslang::EOpConstructBVec3:
  2912. case glslang::EOpConstructBVec4:
  2913. case glslang::EOpConstructInt8:
  2914. case glslang::EOpConstructI8Vec2:
  2915. case glslang::EOpConstructI8Vec3:
  2916. case glslang::EOpConstructI8Vec4:
  2917. case glslang::EOpConstructUint8:
  2918. case glslang::EOpConstructU8Vec2:
  2919. case glslang::EOpConstructU8Vec3:
  2920. case glslang::EOpConstructU8Vec4:
  2921. case glslang::EOpConstructInt16:
  2922. case glslang::EOpConstructI16Vec2:
  2923. case glslang::EOpConstructI16Vec3:
  2924. case glslang::EOpConstructI16Vec4:
  2925. case glslang::EOpConstructUint16:
  2926. case glslang::EOpConstructU16Vec2:
  2927. case glslang::EOpConstructU16Vec3:
  2928. case glslang::EOpConstructU16Vec4:
  2929. case glslang::EOpConstructInt:
  2930. case glslang::EOpConstructIVec2:
  2931. case glslang::EOpConstructIVec3:
  2932. case glslang::EOpConstructIVec4:
  2933. case glslang::EOpConstructUint:
  2934. case glslang::EOpConstructUVec2:
  2935. case glslang::EOpConstructUVec3:
  2936. case glslang::EOpConstructUVec4:
  2937. case glslang::EOpConstructInt64:
  2938. case glslang::EOpConstructI64Vec2:
  2939. case glslang::EOpConstructI64Vec3:
  2940. case glslang::EOpConstructI64Vec4:
  2941. case glslang::EOpConstructUint64:
  2942. case glslang::EOpConstructU64Vec2:
  2943. case glslang::EOpConstructU64Vec3:
  2944. case glslang::EOpConstructU64Vec4:
  2945. case glslang::EOpConstructStruct:
  2946. case glslang::EOpConstructTextureSampler:
  2947. case glslang::EOpConstructReference:
  2948. case glslang::EOpConstructCooperativeMatrixNV:
  2949. case glslang::EOpConstructCooperativeMatrixKHR:
  2950. case glslang::EOpConstructCooperativeVectorNV:
  2951. case glslang::EOpConstructSaturated:
  2952. {
  2953. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2954. std::vector<spv::Id> arguments;
  2955. translateArguments(*node, arguments, lvalueCoherentFlags);
  2956. spv::Id constructed;
  2957. if (node->getOp() == glslang::EOpConstructTextureSampler) {
  2958. const glslang::TType& texType = node->getSequence()[0]->getAsTyped()->getType();
  2959. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6 &&
  2960. texType.getSampler().isBuffer()) {
  2961. // SamplerBuffer is not supported in spirv1.6 so
  2962. // `samplerBuffer(textureBuffer, sampler)` is a no-op
  2963. // and textureBuffer is the result going forward
  2964. constructed = arguments[0];
  2965. } else
  2966. constructed = builder.createOp(spv::Op::OpSampledImage, resultType(), arguments);
  2967. } else if (node->getOp() == glslang::EOpConstructCooperativeMatrixKHR &&
  2968. node->getType().isCoopMatKHR() && node->getSequence()[0]->getAsTyped()->getType().isCoopMatKHR()) {
  2969. builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
  2970. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  2971. constructed = builder.createCooperativeMatrixConversion(resultType(), arguments[0]);
  2972. } else if (node->getOp() == glslang::EOpConstructCooperativeVectorNV &&
  2973. arguments.size() == 1 &&
  2974. builder.getTypeId(arguments[0]) == resultType()) {
  2975. constructed = arguments[0];
  2976. } else if (node->getOp() == glslang::EOpConstructStruct ||
  2977. node->getOp() == glslang::EOpConstructCooperativeMatrixNV ||
  2978. node->getOp() == glslang::EOpConstructCooperativeMatrixKHR ||
  2979. node->getType().isArray() ||
  2980. // Handle constructing coopvec from one component here, to avoid the component
  2981. // getting smeared
  2982. (node->getOp() == glslang::EOpConstructCooperativeVectorNV && arguments.size() == 1 && builder.isScalar(arguments[0]))) {
  2983. std::vector<spv::Id> constituents;
  2984. for (int c = 0; c < (int)arguments.size(); ++c)
  2985. constituents.push_back(arguments[c]);
  2986. constructed = createCompositeConstruct(resultType(), constituents);
  2987. } else if (isMatrix)
  2988. constructed = builder.createMatrixConstructor(precision, arguments, resultType());
  2989. else if (node->getOp() == glslang::EOpConstructSaturated) {
  2990. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2991. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2992. TranslateNonUniformDecoration(lvalueCoherentFlags) };
  2993. constructed = createConversion(node->getOp(), decorations, resultType(), arguments[1],
  2994. node->getType().getBasicType(), node->getSequence()[1]->getAsTyped()->getBasicType());
  2995. builder.addDecoration(constructed, spv::Decoration::SaturatedToLargestFloat8NormalConversionEXT);
  2996. builder.createStore(constructed, arguments[0]);
  2997. }
  2998. else
  2999. constructed = builder.createConstructor(precision, arguments, resultType());
  3000. if (node->getType().getQualifier().isNonUniform()) {
  3001. builder.addDecoration(constructed, spv::Decoration::NonUniformEXT);
  3002. }
  3003. builder.clearAccessChain();
  3004. builder.setAccessChainRValue(constructed);
  3005. return false;
  3006. }
  3007. // These six are component-wise compares with component-wise results.
  3008. // Forward on to createBinaryOperation(), requesting a vector result.
  3009. case glslang::EOpLessThan:
  3010. case glslang::EOpGreaterThan:
  3011. case glslang::EOpLessThanEqual:
  3012. case glslang::EOpGreaterThanEqual:
  3013. case glslang::EOpVectorEqual:
  3014. case glslang::EOpVectorNotEqual:
  3015. {
  3016. // Map the operation to a binary
  3017. binOp = node->getOp();
  3018. reduceComparison = false;
  3019. switch (node->getOp()) {
  3020. case glslang::EOpVectorEqual: binOp = glslang::EOpVectorEqual; break;
  3021. case glslang::EOpVectorNotEqual: binOp = glslang::EOpVectorNotEqual; break;
  3022. default: binOp = node->getOp(); break;
  3023. }
  3024. break;
  3025. }
  3026. case glslang::EOpMul:
  3027. // component-wise matrix multiply
  3028. binOp = glslang::EOpMul;
  3029. break;
  3030. case glslang::EOpOuterProduct:
  3031. // two vectors multiplied to make a matrix
  3032. binOp = glslang::EOpOuterProduct;
  3033. break;
  3034. case glslang::EOpDot:
  3035. {
  3036. // for scalar dot product, use multiply
  3037. glslang::TIntermSequence& glslangOperands = node->getSequence();
  3038. if (glslangOperands[0]->getAsTyped()->getVectorSize() == 1)
  3039. binOp = glslang::EOpMul;
  3040. break;
  3041. }
  3042. case glslang::EOpMod:
  3043. // when an aggregate, this is the floating-point mod built-in function,
  3044. // which can be emitted by the one in createBinaryOperation()
  3045. binOp = glslang::EOpMod;
  3046. break;
  3047. case glslang::EOpEmitVertex:
  3048. case glslang::EOpEndPrimitive:
  3049. case glslang::EOpBarrier:
  3050. case glslang::EOpMemoryBarrier:
  3051. case glslang::EOpMemoryBarrierAtomicCounter:
  3052. case glslang::EOpMemoryBarrierBuffer:
  3053. case glslang::EOpMemoryBarrierImage:
  3054. case glslang::EOpMemoryBarrierShared:
  3055. case glslang::EOpGroupMemoryBarrier:
  3056. case glslang::EOpDeviceMemoryBarrier:
  3057. case glslang::EOpAllMemoryBarrierWithGroupSync:
  3058. case glslang::EOpDeviceMemoryBarrierWithGroupSync:
  3059. case glslang::EOpWorkgroupMemoryBarrier:
  3060. case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:
  3061. case glslang::EOpSubgroupBarrier:
  3062. case glslang::EOpSubgroupMemoryBarrier:
  3063. case glslang::EOpSubgroupMemoryBarrierBuffer:
  3064. case glslang::EOpSubgroupMemoryBarrierImage:
  3065. case glslang::EOpSubgroupMemoryBarrierShared:
  3066. noReturnValue = true;
  3067. // These all have 0 operands and will naturally finish up in the code below for 0 operands
  3068. break;
  3069. case glslang::EOpAtomicAdd:
  3070. case glslang::EOpAtomicSubtract:
  3071. case glslang::EOpAtomicMin:
  3072. case glslang::EOpAtomicMax:
  3073. case glslang::EOpAtomicAnd:
  3074. case glslang::EOpAtomicOr:
  3075. case glslang::EOpAtomicXor:
  3076. case glslang::EOpAtomicExchange:
  3077. case glslang::EOpAtomicCompSwap:
  3078. atomic = true;
  3079. break;
  3080. case glslang::EOpAtomicStore:
  3081. noReturnValue = true;
  3082. [[fallthrough]];
  3083. case glslang::EOpAtomicLoad:
  3084. atomic = true;
  3085. break;
  3086. case glslang::EOpAtomicCounterAdd:
  3087. case glslang::EOpAtomicCounterSubtract:
  3088. case glslang::EOpAtomicCounterMin:
  3089. case glslang::EOpAtomicCounterMax:
  3090. case glslang::EOpAtomicCounterAnd:
  3091. case glslang::EOpAtomicCounterOr:
  3092. case glslang::EOpAtomicCounterXor:
  3093. case glslang::EOpAtomicCounterExchange:
  3094. case glslang::EOpAtomicCounterCompSwap:
  3095. builder.addExtension("SPV_KHR_shader_atomic_counter_ops");
  3096. builder.addCapability(spv::Capability::AtomicStorageOps);
  3097. atomic = true;
  3098. break;
  3099. case glslang::EOpAbsDifference:
  3100. case glslang::EOpAddSaturate:
  3101. case glslang::EOpSubSaturate:
  3102. case glslang::EOpAverage:
  3103. case glslang::EOpAverageRounded:
  3104. case glslang::EOpMul32x16:
  3105. builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
  3106. builder.addExtension("SPV_INTEL_shader_integer_functions2");
  3107. binOp = node->getOp();
  3108. break;
  3109. case glslang::EOpExpectEXT:
  3110. builder.addCapability(spv::Capability::ExpectAssumeKHR);
  3111. builder.addExtension(spv::E_SPV_KHR_expect_assume);
  3112. binOp = node->getOp();
  3113. break;
  3114. case glslang::EOpIgnoreIntersectionNV:
  3115. case glslang::EOpTerminateRayNV:
  3116. case glslang::EOpTraceNV:
  3117. case glslang::EOpTraceRayMotionNV:
  3118. case glslang::EOpTraceKHR:
  3119. case glslang::EOpExecuteCallableNV:
  3120. case glslang::EOpExecuteCallableKHR:
  3121. case glslang::EOpWritePackedPrimitiveIndices4x8NV:
  3122. case glslang::EOpEmitMeshTasksEXT:
  3123. case glslang::EOpSetMeshOutputsEXT:
  3124. noReturnValue = true;
  3125. break;
  3126. case glslang::EOpRayQueryInitialize:
  3127. case glslang::EOpRayQueryTerminate:
  3128. case glslang::EOpRayQueryGenerateIntersection:
  3129. case glslang::EOpRayQueryConfirmIntersection:
  3130. builder.addExtension("SPV_KHR_ray_query");
  3131. builder.addCapability(spv::Capability::RayQueryKHR);
  3132. noReturnValue = true;
  3133. break;
  3134. case glslang::EOpRayQueryProceed:
  3135. case glslang::EOpRayQueryGetIntersectionType:
  3136. case glslang::EOpRayQueryGetRayTMin:
  3137. case glslang::EOpRayQueryGetRayFlags:
  3138. case glslang::EOpRayQueryGetIntersectionT:
  3139. case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
  3140. case glslang::EOpRayQueryGetIntersectionInstanceId:
  3141. case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
  3142. case glslang::EOpRayQueryGetIntersectionGeometryIndex:
  3143. case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
  3144. case glslang::EOpRayQueryGetIntersectionBarycentrics:
  3145. case glslang::EOpRayQueryGetIntersectionFrontFace:
  3146. case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
  3147. case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
  3148. case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
  3149. case glslang::EOpRayQueryGetWorldRayDirection:
  3150. case glslang::EOpRayQueryGetWorldRayOrigin:
  3151. case glslang::EOpRayQueryGetIntersectionObjectToWorld:
  3152. case glslang::EOpRayQueryGetIntersectionWorldToObject:
  3153. builder.addExtension("SPV_KHR_ray_query");
  3154. builder.addCapability(spv::Capability::RayQueryKHR);
  3155. break;
  3156. case glslang::EOpCooperativeMatrixLoad:
  3157. case glslang::EOpCooperativeMatrixStore:
  3158. case glslang::EOpCooperativeMatrixLoadNV:
  3159. case glslang::EOpCooperativeMatrixStoreNV:
  3160. case glslang::EOpCooperativeMatrixLoadTensorNV:
  3161. case glslang::EOpCooperativeMatrixStoreTensorNV:
  3162. case glslang::EOpCooperativeMatrixReduceNV:
  3163. case glslang::EOpCooperativeMatrixPerElementOpNV:
  3164. case glslang::EOpCooperativeMatrixTransposeNV:
  3165. case glslang::EOpCooperativeVectorMatMulNV:
  3166. case glslang::EOpCooperativeVectorMatMulAddNV:
  3167. case glslang::EOpCooperativeVectorLoadNV:
  3168. case glslang::EOpCooperativeVectorStoreNV:
  3169. case glslang::EOpCooperativeVectorOuterProductAccumulateNV:
  3170. case glslang::EOpCooperativeVectorReduceSumAccumulateNV:
  3171. noReturnValue = true;
  3172. break;
  3173. case glslang::EOpBeginInvocationInterlock:
  3174. case glslang::EOpEndInvocationInterlock:
  3175. builder.addExtension(spv::E_SPV_EXT_fragment_shader_interlock);
  3176. noReturnValue = true;
  3177. break;
  3178. case glslang::EOpHitObjectTraceRayNV:
  3179. case glslang::EOpHitObjectTraceRayMotionNV:
  3180. case glslang::EOpHitObjectGetAttributesNV:
  3181. case glslang::EOpHitObjectExecuteShaderNV:
  3182. case glslang::EOpHitObjectRecordEmptyNV:
  3183. case glslang::EOpHitObjectRecordMissNV:
  3184. case glslang::EOpHitObjectRecordMissMotionNV:
  3185. case glslang::EOpHitObjectRecordHitNV:
  3186. case glslang::EOpHitObjectRecordHitMotionNV:
  3187. case glslang::EOpHitObjectRecordHitWithIndexNV:
  3188. case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
  3189. case glslang::EOpReorderThreadNV:
  3190. noReturnValue = true;
  3191. [[fallthrough]];
  3192. case glslang::EOpHitObjectIsEmptyNV:
  3193. case glslang::EOpHitObjectIsMissNV:
  3194. case glslang::EOpHitObjectIsHitNV:
  3195. case glslang::EOpHitObjectGetRayTMinNV:
  3196. case glslang::EOpHitObjectGetRayTMaxNV:
  3197. case glslang::EOpHitObjectGetObjectRayOriginNV:
  3198. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  3199. case glslang::EOpHitObjectGetWorldRayOriginNV:
  3200. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  3201. case glslang::EOpHitObjectGetObjectToWorldNV:
  3202. case glslang::EOpHitObjectGetWorldToObjectNV:
  3203. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  3204. case glslang::EOpHitObjectGetInstanceIdNV:
  3205. case glslang::EOpHitObjectGetGeometryIndexNV:
  3206. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  3207. case glslang::EOpHitObjectGetHitKindNV:
  3208. case glslang::EOpHitObjectGetCurrentTimeNV:
  3209. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  3210. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  3211. builder.addExtension(spv::E_SPV_NV_shader_invocation_reorder);
  3212. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  3213. break;
  3214. case glslang::EOpHitObjectGetLSSPositionsNV:
  3215. case glslang::EOpHitObjectGetLSSRadiiNV:
  3216. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3217. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  3218. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3219. noReturnValue = true;
  3220. break;
  3221. case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
  3222. case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
  3223. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3224. builder.addCapability(spv::Capability::RayQueryKHR);
  3225. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3226. noReturnValue = true;
  3227. break;
  3228. case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
  3229. case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
  3230. case glslang::EOpRayQueryIsSphereHitNV:
  3231. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3232. builder.addCapability(spv::Capability::RayQueryKHR);
  3233. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  3234. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3235. break;
  3236. case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
  3237. case glslang::EOpRayQueryIsLSSHitNV:
  3238. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3239. builder.addCapability(spv::Capability::RayQueryKHR);
  3240. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3241. break;
  3242. case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
  3243. builder.addExtension(spv::E_SPV_KHR_ray_tracing_position_fetch);
  3244. builder.addCapability(spv::Capability::RayQueryPositionFetchKHR);
  3245. noReturnValue = true;
  3246. break;
  3247. case glslang::EOpImageSampleWeightedQCOM:
  3248. builder.addCapability(spv::Capability::TextureSampleWeightedQCOM);
  3249. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3250. break;
  3251. case glslang::EOpImageBoxFilterQCOM:
  3252. builder.addCapability(spv::Capability::TextureBoxFilterQCOM);
  3253. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3254. break;
  3255. case glslang::EOpImageBlockMatchSADQCOM:
  3256. case glslang::EOpImageBlockMatchSSDQCOM:
  3257. builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
  3258. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3259. break;
  3260. case glslang::EOpTensorWriteARM:
  3261. noReturnValue = true;
  3262. break;
  3263. case glslang::EOpImageBlockMatchWindowSSDQCOM:
  3264. case glslang::EOpImageBlockMatchWindowSADQCOM:
  3265. builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
  3266. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3267. builder.addCapability(spv::Capability::TextureBlockMatch2QCOM);
  3268. builder.addExtension(spv::E_SPV_QCOM_image_processing2);
  3269. break;
  3270. case glslang::EOpImageBlockMatchGatherSSDQCOM:
  3271. case glslang::EOpImageBlockMatchGatherSADQCOM:
  3272. builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
  3273. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3274. builder.addCapability(spv::Capability::TextureBlockMatch2QCOM);
  3275. builder.addExtension(spv::E_SPV_QCOM_image_processing2);
  3276. break;
  3277. case glslang::EOpFetchMicroTriangleVertexPositionNV:
  3278. case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
  3279. builder.addExtension(spv::E_SPV_NV_displacement_micromap);
  3280. builder.addCapability(spv::Capability::DisplacementMicromapNV);
  3281. break;
  3282. case glslang::EOpRayQueryGetIntersectionClusterIdNV:
  3283. builder.addExtension(spv::E_SPV_NV_cluster_acceleration_structure);
  3284. builder.addCapability(spv::Capability::RayQueryKHR);
  3285. builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
  3286. break;
  3287. case glslang::EOpDebugPrintf:
  3288. noReturnValue = true;
  3289. break;
  3290. default:
  3291. break;
  3292. }
  3293. //
  3294. // See if it maps to a regular operation.
  3295. //
  3296. if (binOp != glslang::EOpNull) {
  3297. glslang::TIntermTyped* left = node->getSequence()[0]->getAsTyped();
  3298. glslang::TIntermTyped* right = node->getSequence()[1]->getAsTyped();
  3299. assert(left && right);
  3300. builder.clearAccessChain();
  3301. left->traverse(this);
  3302. spv::Id leftId = accessChainLoad(left->getType());
  3303. builder.clearAccessChain();
  3304. right->traverse(this);
  3305. spv::Id rightId = accessChainLoad(right->getType());
  3306. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3307. OpDecorations decorations = { precision,
  3308. TranslateNoContractionDecoration(node->getType().getQualifier()),
  3309. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  3310. result = createBinaryOperation(binOp, decorations,
  3311. resultType(), leftId, rightId,
  3312. left->getType().getBasicType(), reduceComparison);
  3313. // code above should only make binOp that exists in createBinaryOperation
  3314. assert(result != spv::NoResult);
  3315. builder.clearAccessChain();
  3316. builder.setAccessChainRValue(result);
  3317. return false;
  3318. }
  3319. //
  3320. // Create the list of operands.
  3321. //
  3322. glslang::TIntermSequence& glslangOperands = node->getSequence();
  3323. std::vector<spv::Id> operands;
  3324. std::vector<spv::IdImmediate> memoryAccessOperands;
  3325. for (int arg = 0; arg < (int)glslangOperands.size(); ++arg) {
  3326. // special case l-value operands; there are just a few
  3327. bool lvalue = false;
  3328. switch (node->getOp()) {
  3329. case glslang::EOpModf:
  3330. if (arg == 1)
  3331. lvalue = true;
  3332. break;
  3333. case glslang::EOpHitObjectRecordHitNV:
  3334. case glslang::EOpHitObjectRecordHitMotionNV:
  3335. case glslang::EOpHitObjectRecordHitWithIndexNV:
  3336. case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
  3337. case glslang::EOpHitObjectTraceRayNV:
  3338. case glslang::EOpHitObjectTraceRayMotionNV:
  3339. case glslang::EOpHitObjectExecuteShaderNV:
  3340. case glslang::EOpHitObjectRecordMissNV:
  3341. case glslang::EOpHitObjectRecordMissMotionNV:
  3342. case glslang::EOpHitObjectGetAttributesNV:
  3343. case glslang::EOpHitObjectGetClusterIdNV:
  3344. if (arg == 0)
  3345. lvalue = true;
  3346. break;
  3347. case glslang::EOpHitObjectGetLSSPositionsNV:
  3348. case glslang::EOpHitObjectGetLSSRadiiNV:
  3349. lvalue = true;
  3350. break;
  3351. case glslang::EOpRayQueryInitialize:
  3352. case glslang::EOpRayQueryTerminate:
  3353. case glslang::EOpRayQueryConfirmIntersection:
  3354. case glslang::EOpRayQueryProceed:
  3355. case glslang::EOpRayQueryGenerateIntersection:
  3356. case glslang::EOpRayQueryGetIntersectionType:
  3357. case glslang::EOpRayQueryGetIntersectionT:
  3358. case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
  3359. case glslang::EOpRayQueryGetIntersectionInstanceId:
  3360. case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
  3361. case glslang::EOpRayQueryGetIntersectionGeometryIndex:
  3362. case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
  3363. case glslang::EOpRayQueryGetIntersectionBarycentrics:
  3364. case glslang::EOpRayQueryGetIntersectionFrontFace:
  3365. case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
  3366. case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
  3367. case glslang::EOpRayQueryGetIntersectionObjectToWorld:
  3368. case glslang::EOpRayQueryGetIntersectionWorldToObject:
  3369. case glslang::EOpRayQueryGetIntersectionClusterIdNV:
  3370. case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
  3371. case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
  3372. case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
  3373. case glslang::EOpRayQueryIsSphereHitNV:
  3374. case glslang::EOpRayQueryIsLSSHitNV:
  3375. if (arg == 0)
  3376. lvalue = true;
  3377. break;
  3378. case glslang::EOpAtomicAdd:
  3379. case glslang::EOpAtomicSubtract:
  3380. case glslang::EOpAtomicMin:
  3381. case glslang::EOpAtomicMax:
  3382. case glslang::EOpAtomicAnd:
  3383. case glslang::EOpAtomicOr:
  3384. case glslang::EOpAtomicXor:
  3385. case glslang::EOpAtomicExchange:
  3386. case glslang::EOpAtomicCompSwap:
  3387. if (arg == 0)
  3388. lvalue = true;
  3389. break;
  3390. case glslang::EOpFrexp:
  3391. if (arg == 1)
  3392. lvalue = true;
  3393. break;
  3394. case glslang::EOpInterpolateAtSample:
  3395. case glslang::EOpInterpolateAtOffset:
  3396. case glslang::EOpInterpolateAtVertex:
  3397. if (arg == 0) {
  3398. // If GLSL, use the address of the interpolant argument.
  3399. // If HLSL, use an internal version of OpInterpolates that takes
  3400. // the rvalue of the interpolant. A fixup pass in spirv-opt
  3401. // legalization will remove the OpLoad and convert to an lvalue.
  3402. // Had to do this because legalization will only propagate a
  3403. // builtin into an rvalue.
  3404. lvalue = glslangIntermediate->getSource() != glslang::EShSourceHlsl;
  3405. // Does it need a swizzle inversion? If so, evaluation is inverted;
  3406. // operate first on the swizzle base, then apply the swizzle.
  3407. // That is, we transform
  3408. //
  3409. // interpolate(v.zy) -> interpolate(v).zy
  3410. //
  3411. if (glslangOperands[0]->getAsOperator() &&
  3412. glslangOperands[0]->getAsOperator()->getOp() == glslang::EOpVectorSwizzle)
  3413. invertedType = convertGlslangToSpvType(
  3414. glslangOperands[0]->getAsBinaryNode()->getLeft()->getType());
  3415. }
  3416. break;
  3417. case glslang::EOpAtomicLoad:
  3418. case glslang::EOpAtomicStore:
  3419. case glslang::EOpAtomicCounterAdd:
  3420. case glslang::EOpAtomicCounterSubtract:
  3421. case glslang::EOpAtomicCounterMin:
  3422. case glslang::EOpAtomicCounterMax:
  3423. case glslang::EOpAtomicCounterAnd:
  3424. case glslang::EOpAtomicCounterOr:
  3425. case glslang::EOpAtomicCounterXor:
  3426. case glslang::EOpAtomicCounterExchange:
  3427. case glslang::EOpAtomicCounterCompSwap:
  3428. if (arg == 0)
  3429. lvalue = true;
  3430. break;
  3431. case glslang::EOpAddCarry:
  3432. case glslang::EOpSubBorrow:
  3433. if (arg == 2)
  3434. lvalue = true;
  3435. break;
  3436. case glslang::EOpUMulExtended:
  3437. case glslang::EOpIMulExtended:
  3438. if (arg >= 2)
  3439. lvalue = true;
  3440. break;
  3441. case glslang::EOpCooperativeMatrixLoad:
  3442. case glslang::EOpCooperativeMatrixLoadNV:
  3443. case glslang::EOpCooperativeMatrixLoadTensorNV:
  3444. case glslang::EOpCooperativeVectorLoadNV:
  3445. if (arg == 0 || arg == 1)
  3446. lvalue = true;
  3447. break;
  3448. case glslang::EOpCooperativeMatrixStore:
  3449. case glslang::EOpCooperativeMatrixStoreNV:
  3450. case glslang::EOpCooperativeMatrixStoreTensorNV:
  3451. case glslang::EOpCooperativeVectorStoreNV:
  3452. if (arg == 1)
  3453. lvalue = true;
  3454. break;
  3455. case glslang::EOpCooperativeVectorMatMulNV:
  3456. if (arg == 0 || arg == 3)
  3457. lvalue = true;
  3458. break;
  3459. case glslang::EOpCooperativeVectorMatMulAddNV:
  3460. if (arg == 0 || arg == 3 || arg == 6)
  3461. lvalue = true;
  3462. break;
  3463. case glslang::EOpCooperativeVectorOuterProductAccumulateNV:
  3464. if (arg == 2)
  3465. lvalue = true;
  3466. break;
  3467. case glslang::EOpCooperativeVectorReduceSumAccumulateNV:
  3468. if (arg == 1)
  3469. lvalue = true;
  3470. break;
  3471. case glslang::EOpCooperativeMatrixReduceNV:
  3472. case glslang::EOpCooperativeMatrixPerElementOpNV:
  3473. case glslang::EOpCooperativeMatrixTransposeNV:
  3474. if (arg == 0)
  3475. lvalue = true;
  3476. break;
  3477. case glslang::EOpSpirvInst:
  3478. if (glslangOperands[arg]->getAsTyped()->getQualifier().isSpirvByReference())
  3479. lvalue = true;
  3480. break;
  3481. case glslang::EOpReorderThreadNV:
  3482. //Three variants of reorderThreadNV, two of them use hitObjectNV
  3483. if (arg == 0 && glslangOperands.size() != 2)
  3484. lvalue = true;
  3485. break;
  3486. case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
  3487. case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
  3488. case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
  3489. if (arg == 0 || arg == 2)
  3490. lvalue = true;
  3491. break;
  3492. case glslang::EOpTensorReadARM:
  3493. if (arg == 2)
  3494. lvalue = true;
  3495. break;
  3496. default:
  3497. break;
  3498. }
  3499. builder.clearAccessChain();
  3500. if (invertedType != spv::NoType && arg == 0)
  3501. glslangOperands[0]->getAsBinaryNode()->getLeft()->traverse(this);
  3502. else
  3503. glslangOperands[arg]->traverse(this);
  3504. bool isCoopMat = node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  3505. node->getOp() == glslang::EOpCooperativeMatrixStore ||
  3506. node->getOp() == glslang::EOpCooperativeMatrixLoadNV ||
  3507. node->getOp() == glslang::EOpCooperativeMatrixStoreNV ||
  3508. node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV ||
  3509. node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV;
  3510. bool isCoopVec = node->getOp() == glslang::EOpCooperativeVectorLoadNV ||
  3511. node->getOp() == glslang::EOpCooperativeVectorStoreNV;
  3512. if (isCoopMat || isCoopVec) {
  3513. if (arg == 1) {
  3514. spv::Builder::AccessChain::CoherentFlags coherentFlags {};
  3515. unsigned int alignment {};
  3516. if (isCoopMat) {
  3517. // fold "element" parameter into the access chain
  3518. spv::Builder::AccessChain save = builder.getAccessChain();
  3519. builder.clearAccessChain();
  3520. glslangOperands[2]->traverse(this);
  3521. spv::Id elementId = accessChainLoad(glslangOperands[2]->getAsTyped()->getType());
  3522. builder.setAccessChain(save);
  3523. // Point to the first element of the array.
  3524. builder.accessChainPush(elementId,
  3525. TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType()),
  3526. glslangOperands[arg]->getAsTyped()->getType().getBufferReferenceAlignment());
  3527. coherentFlags = builder.getAccessChain().coherentFlags;
  3528. alignment = builder.getAccessChain().alignment;
  3529. } else {
  3530. coherentFlags = builder.getAccessChain().coherentFlags;
  3531. coherentFlags |= TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType());
  3532. alignment = 16;
  3533. }
  3534. spv::MemoryAccessMask memoryAccess = TranslateMemoryAccess(coherentFlags);
  3535. if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  3536. node->getOp() == glslang::EOpCooperativeMatrixLoadNV ||
  3537. node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV ||
  3538. node->getOp() == glslang::EOpCooperativeVectorLoadNV)
  3539. memoryAccess = (memoryAccess & ~spv::MemoryAccessMask::MakePointerAvailableKHR);
  3540. if (node->getOp() == glslang::EOpCooperativeMatrixStore ||
  3541. node->getOp() == glslang::EOpCooperativeMatrixStoreNV ||
  3542. node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV ||
  3543. node->getOp() == glslang::EOpCooperativeVectorStoreNV)
  3544. memoryAccess = (memoryAccess & ~spv::MemoryAccessMask::MakePointerVisibleKHR);
  3545. if (builder.getStorageClass(builder.getAccessChain().base) ==
  3546. spv::StorageClass::PhysicalStorageBufferEXT) {
  3547. memoryAccess = (spv::MemoryAccessMask)(memoryAccess | spv::MemoryAccessMask::Aligned);
  3548. }
  3549. memoryAccessOperands.push_back(spv::IdImmediate(false, memoryAccess));
  3550. if (anySet(memoryAccess, spv::MemoryAccessMask::Aligned)) {
  3551. memoryAccessOperands.push_back(spv::IdImmediate(false, alignment));
  3552. }
  3553. if (anySet(memoryAccess,
  3554. spv::MemoryAccessMask::MakePointerAvailableKHR | spv::MemoryAccessMask::MakePointerVisibleKHR)) {
  3555. memoryAccessOperands.push_back(spv::IdImmediate(true,
  3556. builder.makeUintConstant(TranslateMemoryScope(coherentFlags))));
  3557. }
  3558. } else if (isCoopMat && arg == 2) {
  3559. continue;
  3560. }
  3561. }
  3562. // for l-values, pass the address, for r-values, pass the value
  3563. if (lvalue) {
  3564. if (invertedType == spv::NoType && !builder.isSpvLvalue()) {
  3565. // SPIR-V cannot represent an l-value containing a swizzle that doesn't
  3566. // reduce to a simple access chain. So, we need a temporary vector to
  3567. // receive the result, and must later swizzle that into the original
  3568. // l-value.
  3569. complexLvalues.push_back(builder.getAccessChain());
  3570. temporaryLvalues.push_back(builder.createVariable(
  3571. spv::NoPrecision, spv::StorageClass::Function,
  3572. builder.accessChainGetInferredType(), "swizzleTemp"));
  3573. operands.push_back(temporaryLvalues.back());
  3574. } else {
  3575. operands.push_back(builder.accessChainGetLValue());
  3576. }
  3577. lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
  3578. lvalueCoherentFlags |= TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType());
  3579. } else {
  3580. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3581. glslang::TOperator glslangOp = node->getOp();
  3582. if (arg == 1 &&
  3583. (glslangOp == glslang::EOpRayQueryGetIntersectionType ||
  3584. glslangOp == glslang::EOpRayQueryGetIntersectionT ||
  3585. glslangOp == glslang::EOpRayQueryGetIntersectionInstanceCustomIndex ||
  3586. glslangOp == glslang::EOpRayQueryGetIntersectionInstanceId ||
  3587. glslangOp == glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset ||
  3588. glslangOp == glslang::EOpRayQueryGetIntersectionGeometryIndex ||
  3589. glslangOp == glslang::EOpRayQueryGetIntersectionPrimitiveIndex ||
  3590. glslangOp == glslang::EOpRayQueryGetIntersectionBarycentrics ||
  3591. glslangOp == glslang::EOpRayQueryGetIntersectionFrontFace ||
  3592. glslangOp == glslang::EOpRayQueryGetIntersectionObjectRayDirection ||
  3593. glslangOp == glslang::EOpRayQueryGetIntersectionObjectRayOrigin ||
  3594. glslangOp == glslang::EOpRayQueryGetIntersectionObjectToWorld ||
  3595. glslangOp == glslang::EOpRayQueryGetIntersectionWorldToObject ||
  3596. glslangOp == glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT ||
  3597. glslangOp == glslang::EOpRayQueryGetIntersectionClusterIdNV ||
  3598. glslangOp == glslang::EOpRayQueryGetIntersectionSpherePositionNV ||
  3599. glslangOp == glslang::EOpRayQueryGetIntersectionSphereRadiusNV ||
  3600. glslangOp == glslang::EOpRayQueryGetIntersectionLSSHitValueNV ||
  3601. glslangOp == glslang::EOpRayQueryGetIntersectionLSSPositionsNV ||
  3602. glslangOp == glslang::EOpRayQueryGetIntersectionLSSRadiiNV ||
  3603. glslangOp == glslang::EOpRayQueryIsLSSHitNV ||
  3604. glslangOp == glslang::EOpRayQueryIsSphereHitNV
  3605. )) {
  3606. bool cond = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getBConst();
  3607. operands.push_back(builder.makeIntConstant(cond ? 1 : 0));
  3608. } else if ((arg == 10 && glslangOp == glslang::EOpTraceKHR) ||
  3609. (arg == 11 && glslangOp == glslang::EOpTraceRayMotionNV) ||
  3610. (arg == 1 && glslangOp == glslang::EOpExecuteCallableKHR) ||
  3611. (arg == 1 && glslangOp == glslang::EOpHitObjectExecuteShaderNV) ||
  3612. (arg == 11 && glslangOp == glslang::EOpHitObjectTraceRayNV) ||
  3613. (arg == 12 && glslangOp == glslang::EOpHitObjectTraceRayMotionNV)) {
  3614. const int set = glslangOp == glslang::EOpExecuteCallableKHR ? 1 : 0;
  3615. const int location = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getUConst();
  3616. auto itNode = locationToSymbol[set].find(location);
  3617. visitSymbol(itNode->second);
  3618. spv::Id symId = getSymbolId(itNode->second);
  3619. operands.push_back(symId);
  3620. } else if ((arg == 12 && glslangOp == glslang::EOpHitObjectRecordHitNV) ||
  3621. (arg == 13 && glslangOp == glslang::EOpHitObjectRecordHitMotionNV) ||
  3622. (arg == 11 && glslangOp == glslang::EOpHitObjectRecordHitWithIndexNV) ||
  3623. (arg == 12 && glslangOp == glslang::EOpHitObjectRecordHitWithIndexMotionNV) ||
  3624. (arg == 1 && glslangOp == glslang::EOpHitObjectGetAttributesNV)) {
  3625. const int location = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getUConst();
  3626. const int set = 2;
  3627. auto itNode = locationToSymbol[set].find(location);
  3628. visitSymbol(itNode->second);
  3629. spv::Id symId = getSymbolId(itNode->second);
  3630. operands.push_back(symId);
  3631. } else if (glslangOperands[arg]->getAsTyped()->getQualifier().isSpirvLiteral()) {
  3632. // Will be translated to a literal value, make a placeholder here
  3633. operands.push_back(spv::NoResult);
  3634. } else if (glslangOperands[arg]->getAsTyped()->getBasicType() == glslang::EbtFunction) {
  3635. spv::Function* function = functionMap[glslangOperands[arg]->getAsSymbolNode()->getMangledName().c_str()];
  3636. assert(function);
  3637. operands.push_back(function->getId());
  3638. } else {
  3639. operands.push_back(accessChainLoad(glslangOperands[arg]->getAsTyped()->getType()));
  3640. }
  3641. }
  3642. }
  3643. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3644. if (node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV) {
  3645. std::vector<spv::IdImmediate> idImmOps;
  3646. builder.addCapability(spv::Capability::CooperativeMatrixTensorAddressingNV);
  3647. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3648. spv::Id object = builder.createLoad(operands[0], spv::NoPrecision);
  3649. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // Pointer
  3650. idImmOps.push_back(spv::IdImmediate(true, object)); // Object
  3651. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // tensorLayout
  3652. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end()); // memoryaccess
  3653. // initialize tensor operands to zero, then OR in flags based on the operands
  3654. size_t tensorOpIdx = idImmOps.size();
  3655. idImmOps.push_back(spv::IdImmediate(false, 0));
  3656. for (uint32_t i = 3; i < operands.size(); ++i) {
  3657. if (builder.isTensorView(operands[i])) {
  3658. addMask(idImmOps[tensorOpIdx].word, spv::TensorAddressingOperandsMask::TensorView);
  3659. } else {
  3660. // must be the decode func
  3661. addMask(idImmOps[tensorOpIdx].word, spv::TensorAddressingOperandsMask::DecodeFunc);
  3662. builder.addCapability(spv::Capability::CooperativeMatrixBlockLoadsNV);
  3663. }
  3664. idImmOps.push_back(spv::IdImmediate(true, operands[i])); // tensorView or decodeFunc
  3665. }
  3666. // get the pointee type
  3667. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3668. assert(builder.isCooperativeMatrixType(typeId));
  3669. // do the op
  3670. spv::Id result = builder.createOp(spv::Op::OpCooperativeMatrixLoadTensorNV, typeId, idImmOps);
  3671. // store the result to the pointer (out param 'm')
  3672. builder.createStore(result, operands[0]);
  3673. result = 0;
  3674. } else if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  3675. node->getOp() == glslang::EOpCooperativeMatrixLoadNV) {
  3676. std::vector<spv::IdImmediate> idImmOps;
  3677. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3678. if (node->getOp() == glslang::EOpCooperativeMatrixLoad) {
  3679. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // matrixLayout
  3680. auto layout = (spv::CooperativeMatrixLayout)builder.getConstantScalar(operands[3]);
  3681. if (layout == spv::CooperativeMatrixLayout::RowBlockedInterleavedARM ||
  3682. layout == spv::CooperativeMatrixLayout::ColumnBlockedInterleavedARM) {
  3683. builder.addExtension(spv::E_SPV_ARM_cooperative_matrix_layouts);
  3684. builder.addCapability(spv::Capability::CooperativeMatrixLayoutsARM);
  3685. }
  3686. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3687. } else {
  3688. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3689. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor
  3690. }
  3691. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  3692. // get the pointee type
  3693. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3694. assert(builder.isCooperativeMatrixType(typeId));
  3695. // do the op
  3696. spv::Id result = node->getOp() == glslang::EOpCooperativeMatrixLoad
  3697. ? builder.createOp(spv::Op::OpCooperativeMatrixLoadKHR, typeId, idImmOps)
  3698. : builder.createOp(spv::Op::OpCooperativeMatrixLoadNV, typeId, idImmOps);
  3699. // store the result to the pointer (out param 'm')
  3700. builder.createStore(result, operands[0]);
  3701. result = 0;
  3702. } else if (node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV) {
  3703. std::vector<spv::IdImmediate> idImmOps;
  3704. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3705. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  3706. builder.addCapability(spv::Capability::CooperativeMatrixTensorAddressingNV);
  3707. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3708. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // tensorLayout
  3709. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end()); // memoryaccess
  3710. if (operands.size() > 3) {
  3711. idImmOps.push_back(spv::IdImmediate(false, spv::TensorAddressingOperandsMask::TensorView));
  3712. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // tensorView
  3713. } else {
  3714. idImmOps.push_back(spv::IdImmediate(false, 0));
  3715. }
  3716. builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreTensorNV, idImmOps);
  3717. result = 0;
  3718. } else if (node->getOp() == glslang::EOpCooperativeMatrixStore ||
  3719. node->getOp() == glslang::EOpCooperativeMatrixStoreNV) {
  3720. std::vector<spv::IdImmediate> idImmOps;
  3721. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3722. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  3723. if (node->getOp() == glslang::EOpCooperativeMatrixStore) {
  3724. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // matrixLayout
  3725. auto layout = (spv::CooperativeMatrixLayout)builder.getConstantScalar(operands[3]);
  3726. if (layout == spv::CooperativeMatrixLayout::RowBlockedInterleavedARM ||
  3727. layout == spv::CooperativeMatrixLayout::ColumnBlockedInterleavedARM) {
  3728. builder.addExtension(spv::E_SPV_ARM_cooperative_matrix_layouts);
  3729. builder.addCapability(spv::Capability::CooperativeMatrixLayoutsARM);
  3730. }
  3731. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3732. } else {
  3733. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3734. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor
  3735. }
  3736. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  3737. if (node->getOp() == glslang::EOpCooperativeMatrixStore)
  3738. builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreKHR, idImmOps);
  3739. else
  3740. builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreNV, idImmOps);
  3741. result = 0;
  3742. } else if (node->getOp() == glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT) {
  3743. std::vector<spv::IdImmediate> idImmOps;
  3744. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
  3745. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
  3746. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  3747. builder.makeUintConstant(3), 0);
  3748. // do the op
  3749. spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionTriangleVertexPositionsKHR;
  3750. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3751. // store the result to the pointer (out param 'm')
  3752. builder.createStore(result, operands[2]);
  3753. result = 0;
  3754. } else if (node->getOp() == glslang::EOpRayQueryGetIntersectionLSSPositionsNV) {
  3755. std::vector<spv::IdImmediate> idImmOps;
  3756. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
  3757. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
  3758. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  3759. builder.makeUintConstant(2), 0);
  3760. // do the op
  3761. spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionLSSPositionsNV;
  3762. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3763. // store the result to the pointer (out param 'm')
  3764. builder.createStore(result, operands[2]);
  3765. result = 0;
  3766. } else if (node->getOp() == glslang::EOpRayQueryGetIntersectionLSSRadiiNV) {
  3767. std::vector<spv::IdImmediate> idImmOps;
  3768. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
  3769. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
  3770. spv::Id typeId = builder.makeArrayType(builder.makeFloatType(32),
  3771. builder.makeUintConstant(2), 0);
  3772. // do the op
  3773. spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionLSSRadiiNV;
  3774. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3775. // store the result to the pointer (out param 'm')
  3776. builder.createStore(result, operands[2]);
  3777. result = 0;
  3778. } else if (node->getOp() == glslang::EOpHitObjectGetLSSPositionsNV) {
  3779. std::vector<spv::IdImmediate> idImmOps;
  3780. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
  3781. spv::Op spvOp = spv::Op::OpHitObjectGetLSSPositionsNV;
  3782. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  3783. builder.makeUintConstant(2), 0);
  3784. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3785. // store the result to the pointer (out param 'm')
  3786. builder.createStore(result, operands[1]);
  3787. result = 0;
  3788. } else if (node->getOp() == glslang::EOpHitObjectGetLSSRadiiNV) {
  3789. std::vector<spv::IdImmediate> idImmOps;
  3790. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
  3791. spv::Op spvOp = spv::Op::OpHitObjectGetLSSRadiiNV;
  3792. spv::Id typeId = builder.makeArrayType(builder.makeFloatType(32),
  3793. builder.makeUintConstant(2), 0);
  3794. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3795. // store the result to the pointer (out param 'm')
  3796. builder.createStore(result, operands[1]);
  3797. result = 0;
  3798. } else if (node->getOp() == glslang::EOpCooperativeMatrixMulAdd) {
  3799. auto matrixOperands = spv::CooperativeMatrixOperandsMask::MaskNone;
  3800. // If the optional operand is present, initialize matrixOperands to that value.
  3801. if (glslangOperands.size() == 4 && glslangOperands[3]->getAsConstantUnion()) {
  3802. matrixOperands = (spv::CooperativeMatrixOperandsMask)glslangOperands[3]->getAsConstantUnion()->getConstArray()[0].getIConst();
  3803. }
  3804. // Determine Cooperative Matrix Operands bits from the signedness of the types.
  3805. if (isTypeSignedInt(glslangOperands[0]->getAsTyped()->getBasicType()))
  3806. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixASignedComponentsKHR);
  3807. if (isTypeSignedInt(glslangOperands[1]->getAsTyped()->getBasicType()))
  3808. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixBSignedComponentsKHR);
  3809. if (isTypeSignedInt(glslangOperands[2]->getAsTyped()->getBasicType()))
  3810. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixCSignedComponentsKHR);
  3811. if (isTypeSignedInt(node->getBasicType()))
  3812. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixResultSignedComponentsKHR);
  3813. std::vector<spv::IdImmediate> idImmOps;
  3814. idImmOps.push_back(spv::IdImmediate(true, operands[0]));
  3815. idImmOps.push_back(spv::IdImmediate(true, operands[1]));
  3816. idImmOps.push_back(spv::IdImmediate(true, operands[2]));
  3817. if (matrixOperands != spv::CooperativeMatrixOperandsMask::MaskNone)
  3818. idImmOps.push_back(spv::IdImmediate(false, matrixOperands));
  3819. result = builder.createOp(spv::Op::OpCooperativeMatrixMulAddKHR, resultType(), idImmOps);
  3820. } else if (node->getOp() == glslang::EOpCooperativeMatrixReduceNV) {
  3821. builder.addCapability(spv::Capability::CooperativeMatrixReductionsNV);
  3822. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3823. spv::Op opcode = spv::Op::OpCooperativeMatrixReduceNV;
  3824. unsigned mask = glslangOperands[2]->getAsConstantUnion()->getConstArray()[0].getUConst();
  3825. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3826. assert(builder.isCooperativeMatrixType(typeId));
  3827. result = builder.createCooperativeMatrixReduce(opcode, typeId, operands[1], mask, operands[3]);
  3828. // store the result to the pointer (out param 'm')
  3829. builder.createStore(result, operands[0]);
  3830. result = 0;
  3831. } else if (node->getOp() == glslang::EOpCooperativeMatrixPerElementOpNV) {
  3832. builder.addCapability(spv::Capability::CooperativeMatrixPerElementOperationsNV);
  3833. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3834. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3835. assert(builder.isCooperativeMatrixType(typeId));
  3836. result = builder.createCooperativeMatrixPerElementOp(typeId, operands);
  3837. // store the result to the pointer
  3838. builder.createStore(result, operands[0]);
  3839. result = 0;
  3840. } else if (node->getOp() == glslang::EOpCooperativeMatrixTransposeNV) {
  3841. builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
  3842. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3843. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3844. assert(builder.isCooperativeMatrixType(typeId));
  3845. result = builder.createUnaryOp(spv::Op::OpCooperativeMatrixTransposeNV, typeId, operands[1]);
  3846. // store the result to the pointer
  3847. builder.createStore(result, operands[0]);
  3848. result = 0;
  3849. } else if (node->getOp() == glslang::EOpBitCastArrayQCOM) {
  3850. builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
  3851. builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
  3852. result = builder.createUnaryOp(spv::Op::OpBitCastArrayQCOM, resultType(), operands[0]);
  3853. } else if (node->getOp() == glslang::EOpCompositeConstructCoopMatQCOM) {
  3854. builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
  3855. builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
  3856. result = builder.createUnaryOp(spv::Op::OpCompositeConstructCoopMatQCOM, resultType(), operands[0]);
  3857. } else if (node->getOp() == glslang::EOpCompositeExtractCoopMatQCOM) {
  3858. builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
  3859. builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
  3860. result = builder.createUnaryOp(spv::Op::OpCompositeExtractCoopMatQCOM, resultType(), operands[0]);
  3861. } else if (node->getOp() == glslang::EOpExtractSubArrayQCOM) {
  3862. builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
  3863. builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
  3864. std::vector<spv::Id> arguments { operands[0], operands[1] };;
  3865. result = builder.createOp(spv::Op::OpExtractSubArrayQCOM, resultType(), arguments);
  3866. } else if (node->getOp() == glslang::EOpCooperativeVectorMatMulNV ||
  3867. node->getOp() == glslang::EOpCooperativeVectorMatMulAddNV) {
  3868. auto matrixOperands = spv::CooperativeMatrixOperandsMask::MaskNone;
  3869. bool isMulAdd = node->getOp() == glslang::EOpCooperativeVectorMatMulAddNV;
  3870. // Determine Cooperative Matrix Operands bits from the signedness of the types.
  3871. if (isTypeSignedInt(glslangOperands[1]->getAsTyped()->getBasicType()))
  3872. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixBSignedComponentsKHR);
  3873. if (isTypeSignedInt(glslangOperands[0]->getAsTyped()->getBasicType()))
  3874. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixResultSignedComponentsKHR);
  3875. uint32_t opIdx = 1;
  3876. std::vector<spv::IdImmediate> idImmOps;
  3877. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Input
  3878. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // InputInterpretation
  3879. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Matrix
  3880. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixOffset
  3881. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixInterpretation
  3882. if (isMulAdd) {
  3883. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Bias
  3884. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // BiasOffset
  3885. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // BiasInterpretation
  3886. }
  3887. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // M
  3888. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // K
  3889. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MemoryLayout
  3890. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Transpose
  3891. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixStride
  3892. if (matrixOperands != spv::CooperativeMatrixOperandsMask::MaskNone)
  3893. idImmOps.push_back(spv::IdImmediate(false, matrixOperands)); // Cooperative Matrix Operands
  3894. // get the pointee type
  3895. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3896. assert(builder.isCooperativeVectorType(typeId));
  3897. // do the op
  3898. spv::Id result = builder.createOp(isMulAdd ? spv::Op::OpCooperativeVectorMatrixMulAddNV : spv::Op::OpCooperativeVectorMatrixMulNV, typeId, idImmOps);
  3899. // store the result to the pointer (out param 'res')
  3900. builder.createStore(result, operands[0]);
  3901. result = 0;
  3902. } else if (node->getOp() == glslang::EOpCooperativeVectorLoadNV) {
  3903. std::vector<spv::IdImmediate> idImmOps;
  3904. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3905. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // offset
  3906. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  3907. // get the pointee type
  3908. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3909. assert(builder.isCooperativeVectorType(typeId));
  3910. // do the op
  3911. spv::Id result = builder.createOp(spv::Op::OpCooperativeVectorLoadNV, typeId, idImmOps);
  3912. // store the result to the pointer (out param 'v')
  3913. builder.createStore(result, operands[0]);
  3914. result = 0;
  3915. } else if (node->getOp() == glslang::EOpCooperativeVectorStoreNV) {
  3916. std::vector<spv::IdImmediate> idImmOps;
  3917. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3918. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // offset
  3919. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  3920. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  3921. builder.createNoResultOp(spv::Op::OpCooperativeVectorStoreNV, idImmOps);
  3922. result = 0;
  3923. } else if (node->getOp() == glslang::EOpCooperativeVectorOuterProductAccumulateNV) {
  3924. builder.addCapability(spv::Capability::CooperativeVectorTrainingNV);
  3925. builder.addExtension(spv::E_SPV_NV_cooperative_vector);
  3926. std::vector<spv::IdImmediate> idImmOps;
  3927. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // Matrix
  3928. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // Offset
  3929. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // A
  3930. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // B
  3931. idImmOps.push_back(spv::IdImmediate(true, operands[5])); // MemoryLayout
  3932. idImmOps.push_back(spv::IdImmediate(true, operands[6])); // MatrixInterpretation
  3933. idImmOps.push_back(spv::IdImmediate(true, operands[4])); // Stride
  3934. builder.createNoResultOp(spv::Op::OpCooperativeVectorOuterProductAccumulateNV, idImmOps);
  3935. result = 0;
  3936. } else if (node->getOp() == glslang::EOpCooperativeVectorReduceSumAccumulateNV) {
  3937. builder.addCapability(spv::Capability::CooperativeVectorTrainingNV);
  3938. builder.addExtension(spv::E_SPV_NV_cooperative_vector);
  3939. std::vector<spv::IdImmediate> idImmOps;
  3940. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // Buf
  3941. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // Offset
  3942. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // A
  3943. builder.createNoResultOp(spv::Op::OpCooperativeVectorReduceSumAccumulateNV, idImmOps);
  3944. result = 0;
  3945. } else if (node->getOp() == glslang::EOpTensorReadARM ||
  3946. node->getOp() == glslang::EOpTensorWriteARM) {
  3947. const bool isWrite = node->getOp() == glslang::EOpTensorWriteARM;
  3948. const unsigned int tensorMinOperandCount = 3;
  3949. assert(operands.size() >= tensorMinOperandCount);
  3950. std::vector<spv::IdImmediate> idImmOps;
  3951. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // tensor
  3952. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // coords
  3953. if (isWrite) {
  3954. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // value
  3955. }
  3956. // Analyze the tensor operands
  3957. spv::IdImmediate tensorOperands = { false, uint32_t(spv::TensorOperandsMask::MaskNone) };
  3958. bool pushExtraArg = false;
  3959. if (operands.size() > tensorMinOperandCount) {
  3960. auto enumVal = builder.getConstantScalar(operands[tensorMinOperandCount]);
  3961. if (enumVal & uint32_t(spv::TensorOperandsMask::NontemporalARM)) {
  3962. tensorOperands.word |= uint32_t(spv::TensorOperandsMask::NontemporalARM);
  3963. }
  3964. if (enumVal & uint32_t(spv::TensorOperandsMask::OutOfBoundsValueARM)) {
  3965. tensorOperands.word |= uint32_t(spv::TensorOperandsMask::OutOfBoundsValueARM);
  3966. assert(operands.size() >= tensorMinOperandCount + 2 &&
  3967. "TensorOperandsOutOfBoundsValueMask requires an additional value");
  3968. pushExtraArg = true;
  3969. }
  3970. }
  3971. // Append optional tensor operands if the mask was non-zero.
  3972. if (tensorOperands.word) {
  3973. idImmOps.push_back(tensorOperands);
  3974. if (pushExtraArg)
  3975. idImmOps.push_back(spv::IdImmediate(true, operands[tensorMinOperandCount + 1]));
  3976. }
  3977. if (isWrite) {
  3978. builder.createNoResultOp(spv::Op::OpTensorWriteARM, idImmOps);
  3979. result = 0;
  3980. } else {
  3981. // Use the result argument type as the OpTensorReadARM result type.
  3982. const glslang::TType &resArgType = glslangOperands[2]->getAsTyped()->getType();
  3983. spv::Id retType = convertGlslangToSpvType(resArgType);
  3984. result = builder.createOp(spv::Op::OpTensorReadARM, retType, idImmOps);
  3985. // Store the result to the result argument.
  3986. builder.createStore(result, operands[2]);
  3987. }
  3988. } else if (node->getOp() == glslang::EOpTensorSizeARM) {
  3989. // Expected operands are (tensor, dimension)
  3990. assert(operands.size() == 2);
  3991. spv::Id tensorOp = operands[0];
  3992. spv::Id dimOp = operands[1];
  3993. assert(builder.isTensorTypeARM(builder.getTypeId(tensorOp)) && "operand #0 must be a tensor");
  3994. std::vector<spv::IdImmediate> idImmOps;
  3995. idImmOps.push_back(spv::IdImmediate(true, tensorOp));
  3996. idImmOps.push_back(spv::IdImmediate(true, dimOp));
  3997. result = builder.createOp(spv::Op::OpTensorQuerySizeARM, resultType(), idImmOps);
  3998. } else if (atomic) {
  3999. // Handle all atomics
  4000. glslang::TBasicType typeProxy = (node->getOp() == glslang::EOpAtomicStore)
  4001. ? node->getSequence()[0]->getAsTyped()->getBasicType() : node->getBasicType();
  4002. result = createAtomicOperation(node->getOp(), precision, resultType(), operands, typeProxy,
  4003. lvalueCoherentFlags, node->getType());
  4004. } else if (node->getOp() == glslang::EOpSpirvInst) {
  4005. const auto& spirvInst = node->getSpirvInstruction();
  4006. if (spirvInst.set == "") {
  4007. std::vector<spv::IdImmediate> idImmOps;
  4008. for (unsigned int i = 0; i < glslangOperands.size(); ++i) {
  4009. if (glslangOperands[i]->getAsTyped()->getQualifier().isSpirvLiteral()) {
  4010. // Translate the constant to a literal value
  4011. std::vector<unsigned> literals;
  4012. glslang::TVector<const glslang::TIntermConstantUnion*> constants;
  4013. constants.push_back(glslangOperands[i]->getAsConstantUnion());
  4014. TranslateLiterals(constants, literals);
  4015. idImmOps.push_back({false, literals[0]});
  4016. } else
  4017. idImmOps.push_back({true, operands[i]});
  4018. }
  4019. if (node->getBasicType() == glslang::EbtVoid)
  4020. builder.createNoResultOp(static_cast<spv::Op>(spirvInst.id), idImmOps);
  4021. else
  4022. result = builder.createOp(static_cast<spv::Op>(spirvInst.id), resultType(), idImmOps);
  4023. } else {
  4024. result = builder.createBuiltinCall(
  4025. resultType(), spirvInst.set == "GLSL.std.450" ? stdBuiltins : getExtBuiltins(spirvInst.set.c_str()),
  4026. spirvInst.id, operands);
  4027. }
  4028. noReturnValue = node->getBasicType() == glslang::EbtVoid;
  4029. } else if (node->getOp() == glslang::EOpDebugPrintf) {
  4030. if (!nonSemanticDebugPrintf) {
  4031. nonSemanticDebugPrintf = builder.import("NonSemantic.DebugPrintf");
  4032. }
  4033. result = builder.createBuiltinCall(builder.makeVoidType(), nonSemanticDebugPrintf, spv::NonSemanticDebugPrintfDebugPrintf, operands);
  4034. builder.addExtension(spv::E_SPV_KHR_non_semantic_info);
  4035. } else {
  4036. // Pass through to generic operations.
  4037. switch (glslangOperands.size()) {
  4038. case 0:
  4039. result = createNoArgOperation(node->getOp(), precision, resultType());
  4040. break;
  4041. case 1:
  4042. {
  4043. OpDecorations decorations = { precision,
  4044. TranslateNoContractionDecoration(node->getType().getQualifier()),
  4045. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  4046. result = createUnaryOperation(
  4047. node->getOp(), decorations,
  4048. resultType(), operands.front(),
  4049. glslangOperands[0]->getAsTyped()->getBasicType(), lvalueCoherentFlags, node->getType());
  4050. }
  4051. break;
  4052. default:
  4053. result = createMiscOperation(node->getOp(), precision, resultType(), operands, node->getBasicType());
  4054. break;
  4055. }
  4056. if (invertedType != spv::NoResult)
  4057. result = createInvertedSwizzle(precision, *glslangOperands[0]->getAsBinaryNode(), result);
  4058. for (unsigned int i = 0; i < temporaryLvalues.size(); ++i) {
  4059. builder.setAccessChain(complexLvalues[i]);
  4060. builder.accessChainStore(builder.createLoad(temporaryLvalues[i], spv::NoPrecision),
  4061. TranslateNonUniformDecoration(complexLvalues[i].coherentFlags));
  4062. }
  4063. }
  4064. if (noReturnValue)
  4065. return false;
  4066. if (! result) {
  4067. logger->missingFunctionality("unknown glslang aggregate");
  4068. return true; // pick up a child as a placeholder operand
  4069. } else {
  4070. builder.clearAccessChain();
  4071. builder.setAccessChainRValue(result);
  4072. return false;
  4073. }
  4074. }
  4075. // This path handles both if-then-else and ?:
  4076. // The if-then-else has a node type of void, while
  4077. // ?: has either a void or a non-void node type
  4078. //
  4079. // Leaving the result, when not void:
  4080. // GLSL only has r-values as the result of a ?:, but
  4081. // if we have an l-value, that can be more efficient if it will
  4082. // become the base of a complex r-value expression, because the
  4083. // next layer copies r-values into memory to use the access-chain mechanism
  4084. bool TGlslangToSpvTraverser::visitSelection(glslang::TVisit /* visit */, glslang::TIntermSelection* node)
  4085. {
  4086. // see if OpSelect can handle it
  4087. const auto isOpSelectable = [&]() {
  4088. if (node->getBasicType() == glslang::EbtVoid)
  4089. return false;
  4090. // OpSelect can do all other types starting with SPV 1.4
  4091. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_4) {
  4092. // pre-1.4, only scalars and vectors can be handled
  4093. if ((!node->getType().isScalar() && !node->getType().isVector()))
  4094. return false;
  4095. }
  4096. return true;
  4097. };
  4098. // See if it simple and safe, or required, to execute both sides.
  4099. // Crucially, side effects must be either semantically required or avoided,
  4100. // and there are performance trade-offs.
  4101. // Return true if required or a good idea (and safe) to execute both sides,
  4102. // false otherwise.
  4103. const auto bothSidesPolicy = [&]() -> bool {
  4104. // do we have both sides?
  4105. if (node->getTrueBlock() == nullptr ||
  4106. node->getFalseBlock() == nullptr)
  4107. return false;
  4108. // required? (unless we write additional code to look for side effects
  4109. // and make performance trade-offs if none are present)
  4110. if (!node->getShortCircuit())
  4111. return true;
  4112. // if not required to execute both, decide based on performance/practicality...
  4113. if (!isOpSelectable())
  4114. return false;
  4115. assert(node->getType() == node->getTrueBlock() ->getAsTyped()->getType() &&
  4116. node->getType() == node->getFalseBlock()->getAsTyped()->getType());
  4117. // return true if a single operand to ? : is okay for OpSelect
  4118. const auto operandOkay = [](glslang::TIntermTyped* node) {
  4119. return node->getAsSymbolNode() || node->getType().getQualifier().isConstant();
  4120. };
  4121. return operandOkay(node->getTrueBlock() ->getAsTyped()) &&
  4122. operandOkay(node->getFalseBlock()->getAsTyped());
  4123. };
  4124. spv::Id result = spv::NoResult; // upcoming result selecting between trueValue and falseValue
  4125. // emit the condition before doing anything with selection
  4126. node->getCondition()->traverse(this);
  4127. spv::Id condition = accessChainLoad(node->getCondition()->getType());
  4128. // Find a way of executing both sides and selecting the right result.
  4129. const auto executeBothSides = [&]() -> void {
  4130. // execute both sides
  4131. spv::Id resultType = convertGlslangToSpvType(node->getType());
  4132. node->getTrueBlock()->traverse(this);
  4133. spv::Id trueValue = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
  4134. node->getFalseBlock()->traverse(this);
  4135. spv::Id falseValue = accessChainLoad(node->getFalseBlock()->getAsTyped()->getType());
  4136. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4137. // done if void
  4138. if (node->getBasicType() == glslang::EbtVoid)
  4139. return;
  4140. // emit code to select between trueValue and falseValue
  4141. // see if OpSelect can handle the result type, and that the SPIR-V types
  4142. // of the inputs match the result type.
  4143. if (isOpSelectable()) {
  4144. // Emit OpSelect for this selection.
  4145. // smear condition to vector, if necessary (AST is always scalar)
  4146. // Before 1.4, smear like for mix(), starting with 1.4, keep it scalar
  4147. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_4 && builder.isVector(trueValue)) {
  4148. condition = builder.smearScalar(spv::NoPrecision, condition,
  4149. builder.makeVectorType(builder.makeBoolType(),
  4150. builder.getNumComponents(trueValue)));
  4151. }
  4152. // If the types do not match, it is because of mismatched decorations on aggregates.
  4153. // Since isOpSelectable only lets us get here for SPIR-V >= 1.4, we can use OpCopyObject
  4154. // to get matching types.
  4155. if (builder.getTypeId(trueValue) != resultType) {
  4156. trueValue = builder.createUnaryOp(spv::Op::OpCopyLogical, resultType, trueValue);
  4157. }
  4158. if (builder.getTypeId(falseValue) != resultType) {
  4159. falseValue = builder.createUnaryOp(spv::Op::OpCopyLogical, resultType, falseValue);
  4160. }
  4161. // OpSelect
  4162. result = builder.createTriOp(spv::Op::OpSelect, resultType, condition, trueValue, falseValue);
  4163. builder.clearAccessChain();
  4164. builder.setAccessChainRValue(result);
  4165. } else {
  4166. // We need control flow to select the result.
  4167. // TODO: Once SPIR-V OpSelect allows arbitrary types, eliminate this path.
  4168. result = builder.createVariable(TranslatePrecisionDecoration(node->getType()),
  4169. spv::StorageClass::Function, resultType);
  4170. // Selection control:
  4171. const spv::SelectionControlMask control = TranslateSelectionControl(*node);
  4172. // make an "if" based on the value created by the condition
  4173. spv::Builder::If ifBuilder(condition, control, builder);
  4174. // emit the "then" statement
  4175. builder.clearAccessChain();
  4176. builder.setAccessChainLValue(result);
  4177. multiTypeStore(node->getType(), trueValue);
  4178. ifBuilder.makeBeginElse();
  4179. // emit the "else" statement
  4180. builder.clearAccessChain();
  4181. builder.setAccessChainLValue(result);
  4182. multiTypeStore(node->getType(), falseValue);
  4183. // finish off the control flow
  4184. ifBuilder.makeEndIf();
  4185. builder.clearAccessChain();
  4186. builder.setAccessChainLValue(result);
  4187. }
  4188. };
  4189. // Execute the one side needed, as per the condition
  4190. const auto executeOneSide = [&]() {
  4191. // Always emit control flow.
  4192. if (node->getBasicType() != glslang::EbtVoid) {
  4193. result = builder.createVariable(TranslatePrecisionDecoration(node->getType()), spv::StorageClass::Function,
  4194. convertGlslangToSpvType(node->getType()));
  4195. }
  4196. // Selection control:
  4197. const spv::SelectionControlMask control = TranslateSelectionControl(*node);
  4198. // make an "if" based on the value created by the condition
  4199. spv::Builder::If ifBuilder(condition, control, builder);
  4200. // emit the "then" statement
  4201. if (node->getTrueBlock() != nullptr) {
  4202. node->getTrueBlock()->traverse(this);
  4203. if (result != spv::NoResult) {
  4204. spv::Id load = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
  4205. builder.clearAccessChain();
  4206. builder.setAccessChainLValue(result);
  4207. multiTypeStore(node->getType(), load);
  4208. }
  4209. }
  4210. if (node->getFalseBlock() != nullptr) {
  4211. ifBuilder.makeBeginElse();
  4212. // emit the "else" statement
  4213. node->getFalseBlock()->traverse(this);
  4214. if (result != spv::NoResult) {
  4215. spv::Id load = accessChainLoad(node->getFalseBlock()->getAsTyped()->getType());
  4216. builder.clearAccessChain();
  4217. builder.setAccessChainLValue(result);
  4218. multiTypeStore(node->getType(), load);
  4219. }
  4220. }
  4221. // finish off the control flow
  4222. ifBuilder.makeEndIf();
  4223. if (result != spv::NoResult) {
  4224. builder.clearAccessChain();
  4225. builder.setAccessChainLValue(result);
  4226. }
  4227. };
  4228. // Try for OpSelect (or a requirement to execute both sides)
  4229. if (bothSidesPolicy()) {
  4230. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  4231. if (node->getType().getQualifier().isSpecConstant())
  4232. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  4233. executeBothSides();
  4234. } else
  4235. executeOneSide();
  4236. return false;
  4237. }
  4238. bool TGlslangToSpvTraverser::visitSwitch(glslang::TVisit /* visit */, glslang::TIntermSwitch* node)
  4239. {
  4240. // emit and get the condition before doing anything with switch
  4241. node->getCondition()->traverse(this);
  4242. spv::Id selector = accessChainLoad(node->getCondition()->getAsTyped()->getType());
  4243. // Selection control:
  4244. const spv::SelectionControlMask control = TranslateSwitchControl(*node);
  4245. // browse the children to sort out code segments
  4246. int defaultSegment = -1;
  4247. std::vector<TIntermNode*> codeSegments;
  4248. glslang::TIntermSequence& sequence = node->getBody()->getSequence();
  4249. std::vector<int> caseValues;
  4250. std::vector<int> valueIndexToSegment(sequence.size()); // note: probably not all are used, it is an overestimate
  4251. for (glslang::TIntermSequence::iterator c = sequence.begin(); c != sequence.end(); ++c) {
  4252. TIntermNode* child = *c;
  4253. if (child->getAsBranchNode() && child->getAsBranchNode()->getFlowOp() == glslang::EOpDefault)
  4254. defaultSegment = (int)codeSegments.size();
  4255. else if (child->getAsBranchNode() && child->getAsBranchNode()->getFlowOp() == glslang::EOpCase) {
  4256. valueIndexToSegment[caseValues.size()] = (int)codeSegments.size();
  4257. caseValues.push_back(child->getAsBranchNode()->getExpression()->getAsConstantUnion()
  4258. ->getConstArray()[0].getIConst());
  4259. } else
  4260. codeSegments.push_back(child);
  4261. }
  4262. // handle the case where the last code segment is missing, due to no code
  4263. // statements between the last case and the end of the switch statement
  4264. if ((caseValues.size() && (int)codeSegments.size() == valueIndexToSegment[caseValues.size() - 1]) ||
  4265. (int)codeSegments.size() == defaultSegment)
  4266. codeSegments.push_back(nullptr);
  4267. // make the switch statement
  4268. std::vector<spv::Block*> segmentBlocks; // returned, as the blocks allocated in the call
  4269. builder.makeSwitch(selector, control, (int)codeSegments.size(), caseValues, valueIndexToSegment, defaultSegment,
  4270. segmentBlocks);
  4271. // emit all the code in the segments
  4272. breakForLoop.push(false);
  4273. for (unsigned int s = 0; s < codeSegments.size(); ++s) {
  4274. builder.nextSwitchSegment(segmentBlocks, s);
  4275. if (codeSegments[s])
  4276. codeSegments[s]->traverse(this);
  4277. else
  4278. builder.addSwitchBreak(true);
  4279. }
  4280. breakForLoop.pop();
  4281. builder.endSwitch(segmentBlocks);
  4282. return false;
  4283. }
  4284. void TGlslangToSpvTraverser::visitConstantUnion(glslang::TIntermConstantUnion* node)
  4285. {
  4286. if (node->getQualifier().isSpirvLiteral())
  4287. return; // Translated to a literal value, skip further processing
  4288. int nextConst = 0;
  4289. spv::Id constant = createSpvConstantFromConstUnionArray(node->getType(), node->getConstArray(), nextConst, false);
  4290. builder.clearAccessChain();
  4291. builder.setAccessChainRValue(constant);
  4292. }
  4293. bool TGlslangToSpvTraverser::visitLoop(glslang::TVisit /* visit */, glslang::TIntermLoop* node)
  4294. {
  4295. auto blocks = builder.makeNewLoop();
  4296. builder.createBranch(true, &blocks.head);
  4297. // Loop control:
  4298. std::vector<unsigned int> operands;
  4299. const spv::LoopControlMask control = TranslateLoopControl(*node, operands);
  4300. // Spec requires back edges to target header blocks, and every header block
  4301. // must dominate its merge block. Make a header block first to ensure these
  4302. // conditions are met. By definition, it will contain OpLoopMerge, followed
  4303. // by a block-ending branch. But we don't want to put any other body/test
  4304. // instructions in it, since the body/test may have arbitrary instructions,
  4305. // including merges of its own.
  4306. builder.setBuildPoint(&blocks.head);
  4307. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4308. builder.createLoopMerge(&blocks.merge, &blocks.continue_target, control, operands);
  4309. if (node->testFirst() && node->getTest()) {
  4310. spv::Block& test = builder.makeNewBlock();
  4311. builder.createBranch(true, &test);
  4312. builder.setBuildPoint(&test);
  4313. node->getTest()->traverse(this);
  4314. spv::Id condition = accessChainLoad(node->getTest()->getType());
  4315. builder.createConditionalBranch(condition, &blocks.body, &blocks.merge);
  4316. builder.setBuildPoint(&blocks.body);
  4317. breakForLoop.push(true);
  4318. if (node->getBody())
  4319. node->getBody()->traverse(this);
  4320. builder.createBranch(true, &blocks.continue_target);
  4321. breakForLoop.pop();
  4322. builder.setBuildPoint(&blocks.continue_target);
  4323. if (node->getTerminal())
  4324. node->getTerminal()->traverse(this);
  4325. builder.createBranch(true, &blocks.head);
  4326. } else {
  4327. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4328. builder.createBranch(true, &blocks.body);
  4329. breakForLoop.push(true);
  4330. builder.setBuildPoint(&blocks.body);
  4331. if (node->getBody())
  4332. node->getBody()->traverse(this);
  4333. builder.createBranch(true, &blocks.continue_target);
  4334. breakForLoop.pop();
  4335. builder.setBuildPoint(&blocks.continue_target);
  4336. if (node->getTerminal())
  4337. node->getTerminal()->traverse(this);
  4338. if (node->getTest()) {
  4339. node->getTest()->traverse(this);
  4340. spv::Id condition =
  4341. accessChainLoad(node->getTest()->getType());
  4342. builder.createConditionalBranch(condition, &blocks.head, &blocks.merge);
  4343. } else {
  4344. // TODO: unless there was a break/return/discard instruction
  4345. // somewhere in the body, this is an infinite loop, so we should
  4346. // issue a warning.
  4347. builder.createBranch(true, &blocks.head);
  4348. }
  4349. }
  4350. builder.setBuildPoint(&blocks.merge);
  4351. builder.closeLoop();
  4352. return false;
  4353. }
  4354. bool TGlslangToSpvTraverser::visitBranch(glslang::TVisit /* visit */, glslang::TIntermBranch* node)
  4355. {
  4356. if (node->getExpression())
  4357. node->getExpression()->traverse(this);
  4358. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4359. switch (node->getFlowOp()) {
  4360. case glslang::EOpKill:
  4361. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  4362. builder.addCapability(spv::Capability::DemoteToHelperInvocation);
  4363. builder.createNoResultOp(spv::Op::OpDemoteToHelperInvocationEXT);
  4364. } else {
  4365. builder.makeStatementTerminator(spv::Op::OpKill, "post-discard");
  4366. }
  4367. break;
  4368. case glslang::EOpTerminateInvocation:
  4369. builder.addExtension(spv::E_SPV_KHR_terminate_invocation);
  4370. builder.makeStatementTerminator(spv::Op::OpTerminateInvocation, "post-terminate-invocation");
  4371. break;
  4372. case glslang::EOpBreak:
  4373. if (breakForLoop.top())
  4374. builder.createLoopExit();
  4375. else
  4376. builder.addSwitchBreak(false);
  4377. break;
  4378. case glslang::EOpContinue:
  4379. builder.createLoopContinue();
  4380. break;
  4381. case glslang::EOpReturn:
  4382. if (node->getExpression() != nullptr) {
  4383. const glslang::TType& glslangReturnType = node->getExpression()->getType();
  4384. spv::Id returnId = accessChainLoad(glslangReturnType);
  4385. if (builder.getTypeId(returnId) != currentFunction->getReturnType() ||
  4386. TranslatePrecisionDecoration(glslangReturnType) != currentFunction->getReturnPrecision()) {
  4387. builder.clearAccessChain();
  4388. spv::Id copyId = builder.createVariable(currentFunction->getReturnPrecision(),
  4389. spv::StorageClass::Function, currentFunction->getReturnType());
  4390. builder.setAccessChainLValue(copyId);
  4391. multiTypeStore(glslangReturnType, returnId);
  4392. returnId = builder.createLoad(copyId, currentFunction->getReturnPrecision());
  4393. }
  4394. builder.makeReturn(false, returnId);
  4395. } else
  4396. builder.makeReturn(false);
  4397. builder.clearAccessChain();
  4398. break;
  4399. case glslang::EOpDemote:
  4400. builder.createNoResultOp(spv::Op::OpDemoteToHelperInvocationEXT);
  4401. builder.addExtension(spv::E_SPV_EXT_demote_to_helper_invocation);
  4402. builder.addCapability(spv::Capability::DemoteToHelperInvocationEXT);
  4403. break;
  4404. case glslang::EOpTerminateRayKHR:
  4405. builder.makeStatementTerminator(spv::Op::OpTerminateRayKHR, "post-terminateRayKHR");
  4406. break;
  4407. case glslang::EOpIgnoreIntersectionKHR:
  4408. builder.makeStatementTerminator(spv::Op::OpIgnoreIntersectionKHR, "post-ignoreIntersectionKHR");
  4409. break;
  4410. default:
  4411. assert(0);
  4412. break;
  4413. }
  4414. return false;
  4415. }
  4416. spv::Id TGlslangToSpvTraverser::createSpvVariable(const glslang::TIntermSymbol* node, spv::Id forcedType)
  4417. {
  4418. // First, steer off constants, which are not SPIR-V variables, but
  4419. // can still have a mapping to a SPIR-V Id.
  4420. // This includes specialization constants.
  4421. if (node->getQualifier().isConstant()) {
  4422. spv::Id result = createSpvConstant(*node);
  4423. if (result != spv::NoResult)
  4424. return result;
  4425. }
  4426. // Now, handle actual variables
  4427. spv::StorageClass storageClass = TranslateStorageClass(node->getType());
  4428. spv::Id spvType = forcedType == spv::NoType ? convertGlslangToSpvType(node->getType())
  4429. : forcedType;
  4430. const bool contains16BitType = node->getType().contains16BitFloat() ||
  4431. node->getType().contains16BitInt();
  4432. if (contains16BitType) {
  4433. switch (storageClass) {
  4434. case spv::StorageClass::Input:
  4435. case spv::StorageClass::Output:
  4436. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4437. builder.addCapability(spv::Capability::StorageInputOutput16);
  4438. break;
  4439. case spv::StorageClass::Uniform:
  4440. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4441. if (node->getType().getQualifier().storage == glslang::EvqBuffer)
  4442. builder.addCapability(spv::Capability::StorageUniformBufferBlock16);
  4443. else
  4444. builder.addCapability(spv::Capability::StorageUniform16);
  4445. break;
  4446. case spv::StorageClass::PushConstant:
  4447. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4448. builder.addCapability(spv::Capability::StoragePushConstant16);
  4449. break;
  4450. case spv::StorageClass::StorageBuffer:
  4451. case spv::StorageClass::PhysicalStorageBufferEXT:
  4452. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4453. builder.addCapability(spv::Capability::StorageUniformBufferBlock16);
  4454. break;
  4455. case spv::StorageClass::TileAttachmentQCOM:
  4456. builder.addCapability(spv::Capability::TileShadingQCOM);
  4457. break;
  4458. default:
  4459. if (storageClass == spv::StorageClass::Workgroup &&
  4460. node->getType().getBasicType() == glslang::EbtBlock) {
  4461. builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayout16BitAccessKHR);
  4462. break;
  4463. }
  4464. if (node->getType().contains16BitFloat())
  4465. builder.addCapability(spv::Capability::Float16);
  4466. if (node->getType().contains16BitInt())
  4467. builder.addCapability(spv::Capability::Int16);
  4468. break;
  4469. }
  4470. }
  4471. if (node->getType().contains8BitInt()) {
  4472. if (storageClass == spv::StorageClass::PushConstant) {
  4473. builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
  4474. builder.addCapability(spv::Capability::StoragePushConstant8);
  4475. } else if (storageClass == spv::StorageClass::Uniform) {
  4476. builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
  4477. builder.addCapability(spv::Capability::UniformAndStorageBuffer8BitAccess);
  4478. } else if (storageClass == spv::StorageClass::StorageBuffer) {
  4479. builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
  4480. builder.addCapability(spv::Capability::StorageBuffer8BitAccess);
  4481. } else if (storageClass == spv::StorageClass::Workgroup &&
  4482. node->getType().getBasicType() == glslang::EbtBlock) {
  4483. builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayout8BitAccessKHR);
  4484. } else {
  4485. builder.addCapability(spv::Capability::Int8);
  4486. }
  4487. }
  4488. const char* name = node->getName().c_str();
  4489. if (glslang::IsAnonymous(name))
  4490. name = "";
  4491. spv::Id initializer = spv::NoResult;
  4492. if (node->getType().getQualifier().storage == glslang::EvqUniform && !node->getConstArray().empty()) {
  4493. int nextConst = 0;
  4494. initializer = createSpvConstantFromConstUnionArray(node->getType(),
  4495. node->getConstArray(),
  4496. nextConst,
  4497. false /* specConst */);
  4498. } else if (node->getType().getQualifier().isNullInit()) {
  4499. initializer = builder.makeNullConstant(spvType);
  4500. }
  4501. spv::Id var = builder.createVariable(spv::NoPrecision, storageClass, spvType, name, initializer, false);
  4502. std::vector<spv::Decoration> topLevelDecorations;
  4503. glslang::TQualifier typeQualifier = node->getType().getQualifier();
  4504. TranslateMemoryDecoration(typeQualifier, topLevelDecorations, glslangIntermediate->usingVulkanMemoryModel());
  4505. for (auto deco : topLevelDecorations) {
  4506. builder.addDecoration(var, deco);
  4507. }
  4508. return var;
  4509. }
  4510. // Return type Id of the sampled type.
  4511. spv::Id TGlslangToSpvTraverser::getSampledType(const glslang::TSampler& sampler)
  4512. {
  4513. switch (sampler.type) {
  4514. case glslang::EbtInt: return builder.makeIntType(32);
  4515. case glslang::EbtUint: return builder.makeUintType(32);
  4516. case glslang::EbtFloat: return builder.makeFloatType(32);
  4517. case glslang::EbtFloat16:
  4518. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float_fetch);
  4519. builder.addCapability(spv::Capability::Float16ImageAMD);
  4520. return builder.makeFloatType(16);
  4521. case glslang::EbtInt64:
  4522. builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
  4523. builder.addCapability(spv::Capability::Int64ImageEXT);
  4524. return builder.makeIntType(64);
  4525. case glslang::EbtUint64:
  4526. builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
  4527. builder.addCapability(spv::Capability::Int64ImageEXT);
  4528. return builder.makeUintType(64);
  4529. default:
  4530. assert(0);
  4531. return builder.makeFloatType(32);
  4532. }
  4533. }
  4534. // If node is a swizzle operation, return the type that should be used if
  4535. // the swizzle base is first consumed by another operation, before the swizzle
  4536. // is applied.
  4537. spv::Id TGlslangToSpvTraverser::getInvertedSwizzleType(const glslang::TIntermTyped& node)
  4538. {
  4539. if (node.getAsOperator() &&
  4540. node.getAsOperator()->getOp() == glslang::EOpVectorSwizzle)
  4541. return convertGlslangToSpvType(node.getAsBinaryNode()->getLeft()->getType());
  4542. else
  4543. return spv::NoType;
  4544. }
  4545. // When inverting a swizzle with a parent op, this function
  4546. // will apply the swizzle operation to a completed parent operation.
  4547. spv::Id TGlslangToSpvTraverser::createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped& node,
  4548. spv::Id parentResult)
  4549. {
  4550. std::vector<unsigned> swizzle;
  4551. convertSwizzle(*node.getAsBinaryNode()->getRight()->getAsAggregate(), swizzle);
  4552. return builder.createRvalueSwizzle(precision, convertGlslangToSpvType(node.getType()), parentResult, swizzle);
  4553. }
  4554. // Convert a glslang AST swizzle node to a swizzle vector for building SPIR-V.
  4555. void TGlslangToSpvTraverser::convertSwizzle(const glslang::TIntermAggregate& node, std::vector<unsigned>& swizzle)
  4556. {
  4557. const glslang::TIntermSequence& swizzleSequence = node.getSequence();
  4558. for (int i = 0; i < (int)swizzleSequence.size(); ++i)
  4559. swizzle.push_back(swizzleSequence[i]->getAsConstantUnion()->getConstArray()[0].getIConst());
  4560. }
  4561. // Convert from a glslang type to an SPV type, by calling into a
  4562. // recursive version of this function. This establishes the inherited
  4563. // layout state rooted from the top-level type.
  4564. spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly)
  4565. {
  4566. return convertGlslangToSpvType(type, getExplicitLayout(type), type.getQualifier(), false, forwardReferenceOnly);
  4567. }
  4568. spv::LinkageType TGlslangToSpvTraverser::convertGlslangLinkageToSpv(glslang::TLinkType linkType)
  4569. {
  4570. switch (linkType) {
  4571. case glslang::ELinkExport:
  4572. return spv::LinkageType::Export;
  4573. default:
  4574. return spv::LinkageType::Max;
  4575. }
  4576. }
  4577. // Do full recursive conversion of an arbitrary glslang type to a SPIR-V Id.
  4578. // explicitLayout can be kept the same throughout the hierarchical recursive walk.
  4579. // Mutually recursive with convertGlslangStructToSpvType().
  4580. spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type,
  4581. glslang::TLayoutPacking explicitLayout, const glslang::TQualifier& qualifier,
  4582. bool lastBufferBlockMember, bool forwardReferenceOnly)
  4583. {
  4584. spv::Id spvType = spv::NoResult;
  4585. switch (type.getBasicType()) {
  4586. case glslang::EbtVoid:
  4587. spvType = builder.makeVoidType();
  4588. assert (! type.isArray());
  4589. break;
  4590. case glslang::EbtBool:
  4591. // "transparent" bool doesn't exist in SPIR-V. The GLSL convention is
  4592. // a 32-bit int where non-0 means true.
  4593. if (explicitLayout != glslang::ElpNone)
  4594. spvType = builder.makeUintType(32);
  4595. else
  4596. spvType = builder.makeBoolType();
  4597. break;
  4598. case glslang::EbtInt:
  4599. spvType = builder.makeIntType(32);
  4600. break;
  4601. case glslang::EbtUint:
  4602. spvType = builder.makeUintType(32);
  4603. break;
  4604. case glslang::EbtFloat:
  4605. spvType = builder.makeFloatType(32);
  4606. break;
  4607. case glslang::EbtDouble:
  4608. spvType = builder.makeFloatType(64);
  4609. break;
  4610. case glslang::EbtFloat16:
  4611. spvType = builder.makeFloatType(16);
  4612. break;
  4613. case glslang::EbtBFloat16:
  4614. spvType = builder.makeBFloat16Type();
  4615. break;
  4616. case glslang::EbtFloatE5M2:
  4617. spvType = builder.makeFloatE5M2Type();
  4618. break;
  4619. case glslang::EbtFloatE4M3:
  4620. spvType = builder.makeFloatE4M3Type();
  4621. break;
  4622. case glslang::EbtInt8:
  4623. spvType = builder.makeIntType(8);
  4624. break;
  4625. case glslang::EbtUint8:
  4626. spvType = builder.makeUintType(8);
  4627. break;
  4628. case glslang::EbtInt16:
  4629. spvType = builder.makeIntType(16);
  4630. break;
  4631. case glslang::EbtUint16:
  4632. spvType = builder.makeUintType(16);
  4633. break;
  4634. case glslang::EbtInt64:
  4635. spvType = builder.makeIntType(64);
  4636. break;
  4637. case glslang::EbtUint64:
  4638. spvType = builder.makeUintType(64);
  4639. break;
  4640. case glslang::EbtAtomicUint:
  4641. builder.addCapability(spv::Capability::AtomicStorage);
  4642. spvType = builder.makeUintType(32);
  4643. break;
  4644. case glslang::EbtAccStruct:
  4645. switch (glslangIntermediate->getStage()) {
  4646. case EShLangRayGen:
  4647. case EShLangIntersect:
  4648. case EShLangAnyHit:
  4649. case EShLangClosestHit:
  4650. case EShLangMiss:
  4651. case EShLangCallable:
  4652. // these all should have the RayTracingNV/KHR capability already
  4653. break;
  4654. default:
  4655. {
  4656. auto& extensions = glslangIntermediate->getRequestedExtensions();
  4657. if (extensions.find("GL_EXT_ray_query") != extensions.end()) {
  4658. builder.addExtension(spv::E_SPV_KHR_ray_query);
  4659. builder.addCapability(spv::Capability::RayQueryKHR);
  4660. }
  4661. }
  4662. break;
  4663. }
  4664. spvType = builder.makeAccelerationStructureType();
  4665. break;
  4666. case glslang::EbtRayQuery:
  4667. {
  4668. auto& extensions = glslangIntermediate->getRequestedExtensions();
  4669. if (extensions.find("GL_EXT_ray_query") != extensions.end()) {
  4670. builder.addExtension(spv::E_SPV_KHR_ray_query);
  4671. builder.addCapability(spv::Capability::RayQueryKHR);
  4672. }
  4673. spvType = builder.makeRayQueryType();
  4674. }
  4675. break;
  4676. case glslang::EbtReference:
  4677. {
  4678. // Make the forward pointer, then recurse to convert the structure type, then
  4679. // patch up the forward pointer with a real pointer type.
  4680. if (forwardPointers.find(type.getReferentType()) == forwardPointers.end()) {
  4681. spv::Id forwardId = builder.makeForwardPointer(spv::StorageClass::PhysicalStorageBufferEXT);
  4682. forwardPointers[type.getReferentType()] = forwardId;
  4683. }
  4684. spvType = forwardPointers[type.getReferentType()];
  4685. if (!forwardReferenceOnly) {
  4686. spv::Id referentType = convertGlslangToSpvType(*type.getReferentType());
  4687. builder.makePointerFromForwardPointer(spv::StorageClass::PhysicalStorageBufferEXT,
  4688. forwardPointers[type.getReferentType()],
  4689. referentType);
  4690. }
  4691. }
  4692. break;
  4693. case glslang::EbtSampler:
  4694. {
  4695. const glslang::TSampler& sampler = type.getSampler();
  4696. if (sampler.isPureSampler()) {
  4697. spvType = builder.makeSamplerType();
  4698. } else {
  4699. // an image is present, make its type
  4700. spvType = builder.makeImageType(getSampledType(sampler), TranslateDimensionality(sampler),
  4701. sampler.isShadow(), sampler.isArrayed(), sampler.isMultiSample(),
  4702. sampler.isImageClass() ? 2 : 1, TranslateImageFormat(type));
  4703. if (sampler.isCombined() &&
  4704. (!sampler.isBuffer() || glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_6)) {
  4705. // Already has both image and sampler, make the combined type. Only combine sampler to
  4706. // buffer if before SPIR-V 1.6.
  4707. spvType = builder.makeSampledImageType(spvType);
  4708. }
  4709. }
  4710. }
  4711. break;
  4712. case glslang::EbtStruct:
  4713. case glslang::EbtBlock:
  4714. {
  4715. // If we've seen this struct type, return it
  4716. const glslang::TTypeList* glslangMembers = type.getStruct();
  4717. // Try to share structs for different layouts, but not yet for other
  4718. // kinds of qualification (primarily not yet including interpolant qualification).
  4719. if (! HasNonLayoutQualifiers(type, qualifier))
  4720. spvType = structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers];
  4721. if (spvType != spv::NoResult)
  4722. break;
  4723. // else, we haven't seen it...
  4724. if (type.getBasicType() == glslang::EbtBlock)
  4725. memberRemapper[glslangTypeToIdMap[glslangMembers]].resize(glslangMembers->size());
  4726. spvType = convertGlslangStructToSpvType(type, glslangMembers, explicitLayout, qualifier);
  4727. }
  4728. break;
  4729. case glslang::EbtString:
  4730. // no type used for OpString
  4731. return 0;
  4732. case glslang::EbtHitObjectNV: {
  4733. builder.addExtension(spv::E_SPV_NV_shader_invocation_reorder);
  4734. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  4735. spvType = builder.makeHitObjectNVType();
  4736. }
  4737. break;
  4738. case glslang::EbtSpirvType: {
  4739. // GL_EXT_spirv_intrinsics
  4740. const auto& spirvType = type.getSpirvType();
  4741. const auto& spirvInst = spirvType.spirvInst;
  4742. std::vector<spv::IdImmediate> operands;
  4743. for (const auto& typeParam : spirvType.typeParams) {
  4744. if (typeParam.getAsConstant() != nullptr) {
  4745. // Constant expression
  4746. auto constant = typeParam.getAsConstant();
  4747. if (constant->isLiteral()) {
  4748. if (constant->getBasicType() == glslang::EbtFloat) {
  4749. float floatValue = static_cast<float>(constant->getConstArray()[0].getDConst());
  4750. unsigned literal;
  4751. static_assert(sizeof(literal) == sizeof(floatValue), "sizeof(unsigned) != sizeof(float)");
  4752. memcpy(&literal, &floatValue, sizeof(literal));
  4753. operands.push_back({false, literal});
  4754. } else if (constant->getBasicType() == glslang::EbtInt) {
  4755. unsigned literal = constant->getConstArray()[0].getIConst();
  4756. operands.push_back({false, literal});
  4757. } else if (constant->getBasicType() == glslang::EbtUint) {
  4758. unsigned literal = constant->getConstArray()[0].getUConst();
  4759. operands.push_back({false, literal});
  4760. } else if (constant->getBasicType() == glslang::EbtBool) {
  4761. unsigned literal = constant->getConstArray()[0].getBConst();
  4762. operands.push_back({false, literal});
  4763. } else if (constant->getBasicType() == glslang::EbtString) {
  4764. auto str = constant->getConstArray()[0].getSConst()->c_str();
  4765. unsigned literal = 0;
  4766. char* literalPtr = reinterpret_cast<char*>(&literal);
  4767. unsigned charCount = 0;
  4768. char ch = 0;
  4769. do {
  4770. ch = *(str++);
  4771. *(literalPtr++) = ch;
  4772. ++charCount;
  4773. if (charCount == 4) {
  4774. operands.push_back({false, literal});
  4775. literalPtr = reinterpret_cast<char*>(&literal);
  4776. charCount = 0;
  4777. }
  4778. } while (ch != 0);
  4779. // Partial literal is padded with 0
  4780. if (charCount > 0) {
  4781. for (; charCount < 4; ++charCount)
  4782. *(literalPtr++) = 0;
  4783. operands.push_back({false, literal});
  4784. }
  4785. } else
  4786. assert(0); // Unexpected type
  4787. } else
  4788. operands.push_back({true, createSpvConstant(*constant)});
  4789. } else {
  4790. // Type specifier
  4791. assert(typeParam.getAsType() != nullptr);
  4792. operands.push_back({true, convertGlslangToSpvType(*typeParam.getAsType())});
  4793. }
  4794. }
  4795. assert(spirvInst.set == ""); // Currently, couldn't be extended instructions.
  4796. spvType = builder.makeGenericType(static_cast<spv::Op>(spirvInst.id), operands);
  4797. break;
  4798. }
  4799. case glslang::EbtTensorLayoutNV:
  4800. {
  4801. builder.addCapability(spv::Capability::TensorAddressingNV);
  4802. builder.addExtension(spv::E_SPV_NV_tensor_addressing);
  4803. std::vector<spv::IdImmediate> operands;
  4804. for (uint32_t i = 0; i < 2; ++i) {
  4805. operands.push_back({true, makeArraySizeId(*type.getTypeParameters()->arraySizes, i, true)});
  4806. }
  4807. spvType = builder.makeGenericType(spv::Op::OpTypeTensorLayoutNV, operands);
  4808. break;
  4809. }
  4810. case glslang::EbtTensorViewNV:
  4811. {
  4812. builder.addCapability(spv::Capability::TensorAddressingNV);
  4813. builder.addExtension(spv::E_SPV_NV_tensor_addressing);
  4814. uint32_t dim = type.getTypeParameters()->arraySizes->getDimSize(0);
  4815. assert(dim >= 1 && dim <= 5);
  4816. std::vector<spv::IdImmediate> operands;
  4817. for (uint32_t i = 0; i < dim + 2; ++i) {
  4818. operands.push_back({true, makeArraySizeId(*type.getTypeParameters()->arraySizes, i, true, i==1)});
  4819. }
  4820. spvType = builder.makeGenericType(spv::Op::OpTypeTensorViewNV, operands);
  4821. break;
  4822. }
  4823. default:
  4824. assert(0);
  4825. break;
  4826. }
  4827. if (type.isMatrix())
  4828. spvType = builder.makeMatrixType(spvType, type.getMatrixCols(), type.getMatrixRows());
  4829. else {
  4830. // If this variable has a vector element count greater than 1, create a SPIR-V vector
  4831. if (type.getVectorSize() > 1)
  4832. spvType = builder.makeVectorType(spvType, type.getVectorSize());
  4833. }
  4834. if (type.isCoopMatNV()) {
  4835. builder.addCapability(spv::Capability::CooperativeMatrixNV);
  4836. builder.addExtension(spv::E_SPV_NV_cooperative_matrix);
  4837. if (type.getBasicType() == glslang::EbtFloat16)
  4838. builder.addCapability(spv::Capability::Float16);
  4839. if (type.getBasicType() == glslang::EbtUint8 ||
  4840. type.getBasicType() == glslang::EbtInt8) {
  4841. builder.addCapability(spv::Capability::Int8);
  4842. }
  4843. spv::Id scope = makeArraySizeId(*type.getTypeParameters()->arraySizes, 1);
  4844. spv::Id rows = makeArraySizeId(*type.getTypeParameters()->arraySizes, 2);
  4845. spv::Id cols = makeArraySizeId(*type.getTypeParameters()->arraySizes, 3);
  4846. spvType = builder.makeCooperativeMatrixTypeNV(spvType, scope, rows, cols);
  4847. }
  4848. if (type.isCoopMatKHR()) {
  4849. builder.addCapability(spv::Capability::CooperativeMatrixKHR);
  4850. builder.addExtension(spv::E_SPV_KHR_cooperative_matrix);
  4851. if (type.getBasicType() == glslang::EbtBFloat16) {
  4852. builder.addExtension(spv::E_SPV_KHR_bfloat16);
  4853. builder.addCapability(spv::Capability::BFloat16CooperativeMatrixKHR);
  4854. }
  4855. if (type.getBasicType() == glslang::EbtFloatE5M2 || type.getBasicType() == glslang::EbtFloatE4M3) {
  4856. builder.addExtension(spv::E_SPV_EXT_float8);
  4857. builder.addCapability(spv::Capability::Float8CooperativeMatrixEXT);
  4858. }
  4859. if (type.getBasicType() == glslang::EbtFloat16)
  4860. builder.addCapability(spv::Capability::Float16);
  4861. if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == glslang::EbtInt8) {
  4862. builder.addCapability(spv::Capability::Int8);
  4863. }
  4864. spv::Id scope = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  4865. spv::Id rows = makeArraySizeId(*type.getTypeParameters()->arraySizes, 1);
  4866. spv::Id cols = makeArraySizeId(*type.getTypeParameters()->arraySizes, 2);
  4867. spv::Id use = makeArraySizeId(*type.getTypeParameters()->arraySizes, 3, true);
  4868. spvType = builder.makeCooperativeMatrixTypeKHR(spvType, scope, rows, cols, use);
  4869. }
  4870. else if (type.isTensorARM()) {
  4871. builder.addCapability(spv::Capability::TensorsARM);
  4872. builder.addExtension(spv::E_SPV_ARM_tensors);
  4873. if (type.getBasicType() == glslang::EbtInt8 || type.getBasicType() == glslang::EbtUint8) {
  4874. builder.addCapability(spv::Capability::Int8);
  4875. } else if (type.getBasicType() == glslang::EbtInt16 ||
  4876. type.getBasicType() == glslang::EbtUint16) {
  4877. builder.addCapability(spv::Capability::Int16);
  4878. } else if (type.getBasicType() == glslang::EbtInt64 ||
  4879. type.getBasicType() == glslang::EbtUint64) {
  4880. builder.addCapability(spv::Capability::Int64);
  4881. } else if (type.getBasicType() == glslang::EbtFloat16) {
  4882. builder.addCapability(spv::Capability::Float16);
  4883. }
  4884. spv::Id rank = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  4885. spvType = builder.makeTensorTypeARM(spvType, rank);
  4886. }
  4887. if (type.isCoopVecNV()) {
  4888. builder.addCapability(spv::Capability::CooperativeVectorNV);
  4889. builder.addExtension(spv::E_SPV_NV_cooperative_vector);
  4890. if (type.getBasicType() == glslang::EbtFloat16)
  4891. builder.addCapability(spv::Capability::Float16);
  4892. if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == glslang::EbtInt8) {
  4893. builder.addCapability(spv::Capability::Int8);
  4894. }
  4895. spv::Id components = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  4896. spvType = builder.makeCooperativeVectorTypeNV(spvType, components);
  4897. }
  4898. if (type.isArray()) {
  4899. int stride = 0; // keep this 0 unless doing an explicit layout; 0 will mean no decoration, no stride
  4900. // Do all but the outer dimension
  4901. if (type.getArraySizes()->getNumDims() > 1) {
  4902. // We need to decorate array strides for types needing explicit layout, except blocks.
  4903. if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock) {
  4904. // Use a dummy glslang type for querying internal strides of
  4905. // arrays of arrays, but using just a one-dimensional array.
  4906. glslang::TType simpleArrayType(type, 0); // deference type of the array
  4907. while (simpleArrayType.getArraySizes()->getNumDims() > 1)
  4908. simpleArrayType.getArraySizes()->dereference();
  4909. // Will compute the higher-order strides here, rather than making a whole
  4910. // pile of types and doing repetitive recursion on their contents.
  4911. stride = getArrayStride(simpleArrayType, explicitLayout, qualifier.layoutMatrix);
  4912. }
  4913. // make the arrays
  4914. for (int dim = type.getArraySizes()->getNumDims() - 1; dim > 0; --dim) {
  4915. spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), dim), stride);
  4916. if (stride > 0)
  4917. builder.addDecoration(spvType, spv::Decoration::ArrayStride, stride);
  4918. stride *= type.getArraySizes()->getDimSize(dim);
  4919. }
  4920. } else {
  4921. // single-dimensional array, and don't yet have stride
  4922. // We need to decorate array strides for types needing explicit layout, except blocks.
  4923. if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock)
  4924. stride = getArrayStride(type, explicitLayout, qualifier.layoutMatrix);
  4925. }
  4926. // Do the outer dimension, which might not be known for a runtime-sized array.
  4927. // (Unsized arrays that survive through linking will be runtime-sized arrays)
  4928. if (type.isSizedArray())
  4929. spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), 0), stride);
  4930. else {
  4931. if (!lastBufferBlockMember) {
  4932. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  4933. builder.addCapability(spv::Capability::RuntimeDescriptorArrayEXT);
  4934. }
  4935. spvType = builder.makeRuntimeArray(spvType);
  4936. }
  4937. if (stride > 0)
  4938. builder.addDecoration(spvType, spv::Decoration::ArrayStride, stride);
  4939. }
  4940. return spvType;
  4941. }
  4942. // Apply SPIR-V decorations to the SPIR-V object (provided by SPIR-V ID). If member index is provided, the
  4943. // decorations are applied to this member.
  4944. void TGlslangToSpvTraverser::applySpirvDecorate(const glslang::TType& type, spv::Id id, std::optional<int> member)
  4945. {
  4946. assert(type.getQualifier().hasSpirvDecorate());
  4947. const glslang::TSpirvDecorate& spirvDecorate = type.getQualifier().getSpirvDecorate();
  4948. // Add spirv_decorate
  4949. for (auto& decorate : spirvDecorate.decorates) {
  4950. if (!decorate.second.empty()) {
  4951. std::vector<unsigned> literals;
  4952. TranslateLiterals(decorate.second, literals);
  4953. if (member.has_value())
  4954. builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorate.first), literals);
  4955. else
  4956. builder.addDecoration(id, static_cast<spv::Decoration>(decorate.first), literals);
  4957. } else {
  4958. if (member.has_value())
  4959. builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorate.first));
  4960. else
  4961. builder.addDecoration(id, static_cast<spv::Decoration>(decorate.first));
  4962. }
  4963. }
  4964. // Add spirv_decorate_id
  4965. if (member.has_value()) {
  4966. // spirv_decorate_id not applied to members
  4967. assert(spirvDecorate.decorateIds.empty());
  4968. } else {
  4969. for (auto& decorateId : spirvDecorate.decorateIds) {
  4970. std::vector<spv::Id> operandIds;
  4971. assert(!decorateId.second.empty());
  4972. for (auto extraOperand : decorateId.second) {
  4973. if (extraOperand->getQualifier().isFrontEndConstant())
  4974. operandIds.push_back(createSpvConstant(*extraOperand));
  4975. else
  4976. operandIds.push_back(getSymbolId(extraOperand->getAsSymbolNode()));
  4977. }
  4978. builder.addDecorationId(id, static_cast<spv::Decoration>(decorateId.first), operandIds);
  4979. }
  4980. }
  4981. // Add spirv_decorate_string
  4982. for (auto& decorateString : spirvDecorate.decorateStrings) {
  4983. std::vector<const char*> strings;
  4984. assert(!decorateString.second.empty());
  4985. for (auto extraOperand : decorateString.second) {
  4986. const char* string = extraOperand->getConstArray()[0].getSConst()->c_str();
  4987. strings.push_back(string);
  4988. }
  4989. if (member.has_value())
  4990. builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorateString.first), strings);
  4991. else
  4992. builder.addDecoration(id, static_cast<spv::Decoration>(decorateString.first), strings);
  4993. }
  4994. }
  4995. // TODO: this functionality should exist at a higher level, in creating the AST
  4996. //
  4997. // Identify interface members that don't have their required extension turned on.
  4998. //
  4999. bool TGlslangToSpvTraverser::filterMember(const glslang::TType& member)
  5000. {
  5001. auto& extensions = glslangIntermediate->getRequestedExtensions();
  5002. if (member.getFieldName() == "gl_SecondaryViewportMaskNV" &&
  5003. extensions.find("GL_NV_stereo_view_rendering") == extensions.end())
  5004. return true;
  5005. if (member.getFieldName() == "gl_SecondaryPositionNV" &&
  5006. extensions.find("GL_NV_stereo_view_rendering") == extensions.end())
  5007. return true;
  5008. if (glslangIntermediate->getStage() == EShLangMesh) {
  5009. if (member.getFieldName() == "gl_PrimitiveShadingRateEXT" &&
  5010. extensions.find("GL_EXT_fragment_shading_rate") == extensions.end())
  5011. return true;
  5012. }
  5013. if (glslangIntermediate->getStage() != EShLangMesh) {
  5014. if (member.getFieldName() == "gl_ViewportMask" &&
  5015. extensions.find("GL_NV_viewport_array2") == extensions.end())
  5016. return true;
  5017. if (member.getFieldName() == "gl_PositionPerViewNV" &&
  5018. extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())
  5019. return true;
  5020. if (member.getFieldName() == "gl_ViewportMaskPerViewNV" &&
  5021. extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())
  5022. return true;
  5023. }
  5024. return false;
  5025. }
  5026. // Do full recursive conversion of a glslang structure (or block) type to a SPIR-V Id.
  5027. // explicitLayout can be kept the same throughout the hierarchical recursive walk.
  5028. // Mutually recursive with convertGlslangToSpvType().
  5029. spv::Id TGlslangToSpvTraverser::convertGlslangStructToSpvType(const glslang::TType& type,
  5030. const glslang::TTypeList* glslangMembers,
  5031. glslang::TLayoutPacking explicitLayout,
  5032. const glslang::TQualifier& qualifier)
  5033. {
  5034. // Create a vector of struct types for SPIR-V to consume
  5035. std::vector<spv::Id> spvMembers;
  5036. int memberDelta = 0; // how much the member's index changes from glslang to SPIR-V, normally 0,
  5037. // except sometimes for blocks
  5038. std::vector<std::pair<glslang::TType*, glslang::TQualifier> > deferredForwardPointers;
  5039. for (int i = 0; i < (int)glslangMembers->size(); i++) {
  5040. auto& glslangMember = (*glslangMembers)[i];
  5041. if (glslangMember.type->hiddenMember()) {
  5042. ++memberDelta;
  5043. if (type.getBasicType() == glslang::EbtBlock)
  5044. memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = -1;
  5045. } else {
  5046. if (type.getBasicType() == glslang::EbtBlock) {
  5047. if (filterMember(*glslangMember.type)) {
  5048. memberDelta++;
  5049. memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = -1;
  5050. continue;
  5051. }
  5052. memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = i - memberDelta;
  5053. }
  5054. // modify just this child's view of the qualifier
  5055. glslang::TQualifier memberQualifier = glslangMember.type->getQualifier();
  5056. InheritQualifiers(memberQualifier, qualifier);
  5057. // manually inherit location
  5058. if (! memberQualifier.hasLocation() && qualifier.hasLocation())
  5059. memberQualifier.layoutLocation = qualifier.layoutLocation;
  5060. // recurse
  5061. bool lastBufferBlockMember = qualifier.storage == glslang::EvqBuffer &&
  5062. i == (int)glslangMembers->size() - 1;
  5063. // Make forward pointers for any pointer members.
  5064. if (glslangMember.type->isReference() &&
  5065. forwardPointers.find(glslangMember.type->getReferentType()) == forwardPointers.end()) {
  5066. deferredForwardPointers.push_back(std::make_pair(glslangMember.type, memberQualifier));
  5067. }
  5068. // Create the member type.
  5069. auto const spvMember = convertGlslangToSpvType(*glslangMember.type, explicitLayout, memberQualifier, lastBufferBlockMember,
  5070. glslangMember.type->isReference());
  5071. spvMembers.push_back(spvMember);
  5072. // Update the builder with the type's location so that we can create debug types for the structure members.
  5073. // There doesn't exist a "clean" entry point for this information to be passed along to the builder so, for now,
  5074. // it is stored in the builder and consumed during the construction of composite debug types.
  5075. // TODO: This probably warrants further investigation. This approach was decided to be the least ugly of the
  5076. // quick and dirty approaches that were tried.
  5077. // Advantages of this approach:
  5078. // + Relatively clean. No direct calls into debug type system.
  5079. // + Handles nested recursive structures.
  5080. // Disadvantages of this approach:
  5081. // + Not as clean as desired. Traverser queries/sets persistent state. This is fragile.
  5082. // + Table lookup during creation of composite debug types. This really shouldn't be necessary.
  5083. if(options.emitNonSemanticShaderDebugInfo) {
  5084. builder.debugTypeLocs[spvMember].name = glslangMember.type->getFieldName().c_str();
  5085. builder.debugTypeLocs[spvMember].line = glslangMember.loc.line;
  5086. builder.debugTypeLocs[spvMember].column = glslangMember.loc.column;
  5087. }
  5088. }
  5089. }
  5090. // Make the SPIR-V type
  5091. spv::Id spvType = builder.makeStructType(spvMembers, type.getTypeName().c_str(), false);
  5092. if (! HasNonLayoutQualifiers(type, qualifier))
  5093. structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers] = spvType;
  5094. // Decorate it
  5095. decorateStructType(type, glslangMembers, explicitLayout, qualifier, spvType, spvMembers);
  5096. for (int i = 0; i < (int)deferredForwardPointers.size(); ++i) {
  5097. auto it = deferredForwardPointers[i];
  5098. convertGlslangToSpvType(*it.first, explicitLayout, it.second, false);
  5099. }
  5100. return spvType;
  5101. }
  5102. void TGlslangToSpvTraverser::decorateStructType(const glslang::TType& type,
  5103. const glslang::TTypeList* glslangMembers,
  5104. glslang::TLayoutPacking explicitLayout,
  5105. const glslang::TQualifier& qualifier,
  5106. spv::Id spvType,
  5107. const std::vector<spv::Id>& spvMembers)
  5108. {
  5109. // Name and decorate the non-hidden members
  5110. int offset = -1;
  5111. bool memberLocationInvalid = type.isArrayOfArrays() ||
  5112. (type.isArray() && (type.getQualifier().isArrayedIo(glslangIntermediate->getStage()) == false));
  5113. for (int i = 0; i < (int)glslangMembers->size(); i++) {
  5114. glslang::TType& glslangMember = *(*glslangMembers)[i].type;
  5115. int member = i;
  5116. if (type.getBasicType() == glslang::EbtBlock) {
  5117. member = memberRemapper[glslangTypeToIdMap[glslangMembers]][i];
  5118. if (filterMember(glslangMember))
  5119. continue;
  5120. }
  5121. // modify just this child's view of the qualifier
  5122. glslang::TQualifier memberQualifier = glslangMember.getQualifier();
  5123. InheritQualifiers(memberQualifier, qualifier);
  5124. // using -1 above to indicate a hidden member
  5125. if (member < 0)
  5126. continue;
  5127. builder.addMemberName(spvType, member, glslangMember.getFieldName().c_str());
  5128. builder.addMemberDecoration(spvType, member,
  5129. TranslateLayoutDecoration(glslangMember, memberQualifier.layoutMatrix));
  5130. builder.addMemberDecoration(spvType, member, TranslatePrecisionDecoration(glslangMember));
  5131. // Add interpolation and auxiliary storage decorations only to
  5132. // top-level members of Input and Output storage classes
  5133. if (type.getQualifier().storage == glslang::EvqVaryingIn ||
  5134. type.getQualifier().storage == glslang::EvqVaryingOut) {
  5135. if (type.getBasicType() == glslang::EbtBlock ||
  5136. glslangIntermediate->getSource() == glslang::EShSourceHlsl) {
  5137. builder.addMemberDecoration(spvType, member, TranslateInterpolationDecoration(memberQualifier));
  5138. builder.addMemberDecoration(spvType, member, TranslateAuxiliaryStorageDecoration(memberQualifier));
  5139. addMeshNVDecoration(spvType, member, memberQualifier);
  5140. }
  5141. }
  5142. builder.addMemberDecoration(spvType, member, TranslateInvariantDecoration(memberQualifier));
  5143. if (type.getBasicType() == glslang::EbtBlock &&
  5144. qualifier.storage == glslang::EvqBuffer) {
  5145. // Add memory decorations only to top-level members of shader storage block
  5146. std::vector<spv::Decoration> memory;
  5147. TranslateMemoryDecoration(memberQualifier, memory, glslangIntermediate->usingVulkanMemoryModel());
  5148. for (unsigned int i = 0; i < memory.size(); ++i)
  5149. builder.addMemberDecoration(spvType, member, memory[i]);
  5150. }
  5151. // Location assignment was already completed correctly by the front end,
  5152. // just track whether a member needs to be decorated.
  5153. // Ignore member locations if the container is an array, as that's
  5154. // ill-specified and decisions have been made to not allow this.
  5155. if (!memberLocationInvalid && memberQualifier.hasLocation())
  5156. builder.addMemberDecoration(spvType, member, spv::Decoration::Location, memberQualifier.layoutLocation);
  5157. // component, XFB, others
  5158. if (glslangMember.getQualifier().hasComponent())
  5159. builder.addMemberDecoration(spvType, member, spv::Decoration::Component,
  5160. glslangMember.getQualifier().layoutComponent);
  5161. if (glslangMember.getQualifier().hasXfbOffset())
  5162. builder.addMemberDecoration(spvType, member, spv::Decoration::Offset,
  5163. glslangMember.getQualifier().layoutXfbOffset);
  5164. else if (explicitLayout != glslang::ElpNone) {
  5165. // figure out what to do with offset, which is accumulating
  5166. int nextOffset;
  5167. updateMemberOffset(type, glslangMember, offset, nextOffset, explicitLayout, memberQualifier.layoutMatrix);
  5168. if (offset >= 0)
  5169. builder.addMemberDecoration(spvType, member, spv::Decoration::Offset, offset);
  5170. offset = nextOffset;
  5171. }
  5172. if (glslangMember.isMatrix() && explicitLayout != glslang::ElpNone)
  5173. builder.addMemberDecoration(spvType, member, spv::Decoration::MatrixStride,
  5174. getMatrixStride(glslangMember, explicitLayout, memberQualifier.layoutMatrix));
  5175. // built-in variable decorations
  5176. spv::BuiltIn builtIn = TranslateBuiltInDecoration(glslangMember.getQualifier().builtIn, true);
  5177. if (builtIn != spv::BuiltIn::Max)
  5178. builder.addMemberDecoration(spvType, member, spv::Decoration::BuiltIn, (int)builtIn);
  5179. // nonuniform
  5180. builder.addMemberDecoration(spvType, member, TranslateNonUniformDecoration(glslangMember.getQualifier()));
  5181. if (glslangIntermediate->getHlslFunctionality1() && memberQualifier.semanticName != nullptr) {
  5182. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  5183. builder.addMemberDecoration(spvType, member, spv::Decoration::HlslSemanticGOOGLE,
  5184. memberQualifier.semanticName);
  5185. }
  5186. if (builtIn == spv::BuiltIn::Layer) {
  5187. // SPV_NV_viewport_array2 extension
  5188. if (glslangMember.getQualifier().layoutViewportRelative){
  5189. builder.addMemberDecoration(spvType, member, spv::Decoration::ViewportRelativeNV);
  5190. builder.addCapability(spv::Capability::ShaderViewportMaskNV);
  5191. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  5192. }
  5193. if (glslangMember.getQualifier().layoutSecondaryViewportRelativeOffset != -2048){
  5194. builder.addMemberDecoration(spvType, member,
  5195. spv::Decoration::SecondaryViewportRelativeNV,
  5196. glslangMember.getQualifier().layoutSecondaryViewportRelativeOffset);
  5197. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  5198. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  5199. }
  5200. }
  5201. if (glslangMember.getQualifier().layoutPassthrough) {
  5202. builder.addMemberDecoration(spvType, member, spv::Decoration::PassthroughNV);
  5203. builder.addCapability(spv::Capability::GeometryShaderPassthroughNV);
  5204. builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);
  5205. }
  5206. // Add SPIR-V decorations (GL_EXT_spirv_intrinsics)
  5207. if (glslangMember.getQualifier().hasSpirvDecorate())
  5208. applySpirvDecorate(glslangMember, spvType, member);
  5209. }
  5210. // Decorate the structure
  5211. builder.addDecoration(spvType, TranslateLayoutDecoration(type, qualifier.layoutMatrix));
  5212. const auto basicType = type.getBasicType();
  5213. const auto typeStorageQualifier = type.getQualifier().storage;
  5214. if (basicType == glslang::EbtBlock) {
  5215. builder.addDecoration(spvType, TranslateBlockDecoration(typeStorageQualifier, glslangIntermediate->usingStorageBuffer()));
  5216. } else if (basicType == glslang::EbtStruct && glslangIntermediate->getSpv().vulkan > 0) {
  5217. const auto hasRuntimeArray = !spvMembers.empty() && builder.getOpCode(spvMembers.back()) == spv::Op::OpTypeRuntimeArray;
  5218. if (hasRuntimeArray) {
  5219. builder.addDecoration(spvType, TranslateBlockDecoration(typeStorageQualifier, glslangIntermediate->usingStorageBuffer()));
  5220. }
  5221. }
  5222. if (qualifier.hasHitObjectShaderRecordNV())
  5223. builder.addDecoration(spvType, spv::Decoration::HitObjectShaderRecordBufferNV);
  5224. }
  5225. // Turn the expression forming the array size into an id.
  5226. // This is not quite trivial, because of specialization constants.
  5227. // Sometimes, a raw constant is turned into an Id, and sometimes
  5228. // a specialization constant expression is.
  5229. spv::Id TGlslangToSpvTraverser::makeArraySizeId(const glslang::TArraySizes& arraySizes, int dim, bool allowZero, bool boolType)
  5230. {
  5231. // First, see if this is sized with a node, meaning a specialization constant:
  5232. glslang::TIntermTyped* specNode = arraySizes.getDimNode(dim);
  5233. if (specNode != nullptr) {
  5234. builder.clearAccessChain();
  5235. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  5236. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  5237. specNode->traverse(this);
  5238. return accessChainLoad(specNode->getAsTyped()->getType());
  5239. }
  5240. // Otherwise, need a compile-time (front end) size, get it:
  5241. int size = arraySizes.getDimSize(dim);
  5242. if (!allowZero)
  5243. assert(size > 0);
  5244. if (boolType) {
  5245. return builder.makeBoolConstant(size);
  5246. } else {
  5247. return builder.makeUintConstant(size);
  5248. }
  5249. }
  5250. // Wrap the builder's accessChainLoad to:
  5251. // - localize handling of RelaxedPrecision
  5252. // - use the SPIR-V inferred type instead of another conversion of the glslang type
  5253. // (avoids unnecessary work and possible type punning for structures)
  5254. // - do conversion of concrete to abstract type
  5255. spv::Id TGlslangToSpvTraverser::accessChainLoad(const glslang::TType& type)
  5256. {
  5257. spv::Id nominalTypeId = builder.accessChainGetInferredType();
  5258. spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
  5259. coherentFlags |= TranslateCoherent(type);
  5260. spv::MemoryAccessMask accessMask = spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) & ~spv::MemoryAccessMask::MakePointerAvailableKHR);
  5261. // If the value being loaded is HelperInvocation, SPIR-V 1.6 is being generated (so that
  5262. // SPV_EXT_demote_to_helper_invocation is in core) and the memory model is in use, add
  5263. // the Volatile MemoryAccess semantic.
  5264. if (type.getQualifier().builtIn == glslang::EbvHelperInvocation &&
  5265. glslangIntermediate->usingVulkanMemoryModel() &&
  5266. glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  5267. accessMask = spv::MemoryAccessMask(accessMask | spv::MemoryAccessMask::Volatile);
  5268. }
  5269. unsigned int alignment = builder.getAccessChain().alignment;
  5270. alignment |= type.getBufferReferenceAlignment();
  5271. spv::Id loadedId = builder.accessChainLoad(TranslatePrecisionDecoration(type),
  5272. TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags),
  5273. TranslateNonUniformDecoration(type.getQualifier()),
  5274. nominalTypeId,
  5275. accessMask,
  5276. TranslateMemoryScope(coherentFlags),
  5277. alignment);
  5278. // Need to convert to abstract types when necessary
  5279. if (type.getBasicType() == glslang::EbtBool) {
  5280. loadedId = convertLoadedBoolInUniformToUint(type, nominalTypeId, loadedId);
  5281. }
  5282. return loadedId;
  5283. }
  5284. // Wrap the builder's accessChainStore to:
  5285. // - do conversion of concrete to abstract type
  5286. //
  5287. // Implicitly uses the existing builder.accessChain as the storage target.
  5288. void TGlslangToSpvTraverser::accessChainStore(const glslang::TType& type, spv::Id rvalue)
  5289. {
  5290. // Need to convert to abstract types when necessary
  5291. if (type.getBasicType() == glslang::EbtBool) {
  5292. spv::Id nominalTypeId = builder.accessChainGetInferredType();
  5293. if (builder.isScalarType(nominalTypeId)) {
  5294. // Conversion for bool
  5295. spv::Id boolType = builder.makeBoolType();
  5296. if (nominalTypeId != boolType) {
  5297. // keep these outside arguments, for determinant order-of-evaluation
  5298. spv::Id one = builder.makeUintConstant(1);
  5299. spv::Id zero = builder.makeUintConstant(0);
  5300. rvalue = builder.createTriOp(spv::Op::OpSelect, nominalTypeId, rvalue, one, zero);
  5301. } else if (builder.getTypeId(rvalue) != boolType)
  5302. rvalue = builder.createBinOp(spv::Op::OpINotEqual, boolType, rvalue, builder.makeUintConstant(0));
  5303. } else if (builder.isVectorType(nominalTypeId)) {
  5304. // Conversion for bvec
  5305. int vecSize = builder.getNumTypeComponents(nominalTypeId);
  5306. spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);
  5307. if (nominalTypeId != bvecType) {
  5308. // keep these outside arguments, for determinant order-of-evaluation
  5309. spv::Id one = makeSmearedConstant(builder.makeUintConstant(1), vecSize);
  5310. spv::Id zero = makeSmearedConstant(builder.makeUintConstant(0), vecSize);
  5311. rvalue = builder.createTriOp(spv::Op::OpSelect, nominalTypeId, rvalue, one, zero);
  5312. } else if (builder.getTypeId(rvalue) != bvecType)
  5313. rvalue = builder.createBinOp(spv::Op::OpINotEqual, bvecType, rvalue,
  5314. makeSmearedConstant(builder.makeUintConstant(0), vecSize));
  5315. }
  5316. }
  5317. spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
  5318. coherentFlags |= TranslateCoherent(type);
  5319. unsigned int alignment = builder.getAccessChain().alignment;
  5320. alignment |= type.getBufferReferenceAlignment();
  5321. builder.accessChainStore(rvalue, TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags),
  5322. spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) &
  5323. ~spv::MemoryAccessMask::MakePointerVisibleKHR),
  5324. TranslateMemoryScope(coherentFlags), alignment);
  5325. }
  5326. // For storing when types match at the glslang level, but might not match at the
  5327. // SPIR-V level.
  5328. //
  5329. // This especially happens when a single glslang type expands to multiple
  5330. // SPIR-V types, like a struct that is used in a member-undecorated way as well
  5331. // as in a member-decorated way.
  5332. //
  5333. // NOTE: This function can handle any store request; if it's not special it
  5334. // simplifies to a simple OpStore.
  5335. //
  5336. // Implicitly uses the existing builder.accessChain as the storage target.
  5337. void TGlslangToSpvTraverser::multiTypeStore(const glslang::TType& type, spv::Id rValue)
  5338. {
  5339. // we only do the complex path here if it's an aggregate
  5340. if (! type.isStruct() && ! type.isArray()) {
  5341. accessChainStore(type, rValue);
  5342. return;
  5343. }
  5344. // and, it has to be a case of type aliasing
  5345. spv::Id rType = builder.getTypeId(rValue);
  5346. spv::Id lValue = builder.accessChainGetLValue();
  5347. spv::Id lType = builder.getContainedTypeId(builder.getTypeId(lValue));
  5348. if (lType == rType) {
  5349. accessChainStore(type, rValue);
  5350. return;
  5351. }
  5352. // Recursively (as needed) copy an aggregate type to a different aggregate type,
  5353. // where the two types were the same type in GLSL. This requires member
  5354. // by member copy, recursively.
  5355. // SPIR-V 1.4 added an instruction to do help do this.
  5356. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  5357. // However, bool in uniform space is changed to int, so
  5358. // OpCopyLogical does not work for that.
  5359. // TODO: It would be more robust to do a full recursive verification of the types satisfying SPIR-V rules.
  5360. bool rBool = builder.containsType(builder.getTypeId(rValue), spv::Op::OpTypeBool, 0);
  5361. bool lBool = builder.containsType(lType, spv::Op::OpTypeBool, 0);
  5362. if (lBool == rBool) {
  5363. spv::Id logicalCopy = builder.createUnaryOp(spv::Op::OpCopyLogical, lType, rValue);
  5364. accessChainStore(type, logicalCopy);
  5365. return;
  5366. }
  5367. }
  5368. // If an array, copy element by element.
  5369. if (type.isArray()) {
  5370. glslang::TType glslangElementType(type, 0);
  5371. spv::Id elementRType = builder.getContainedTypeId(rType);
  5372. for (int index = 0; index < type.getOuterArraySize(); ++index) {
  5373. // get the source member
  5374. spv::Id elementRValue = builder.createCompositeExtract(rValue, elementRType, index);
  5375. // set up the target storage
  5376. builder.clearAccessChain();
  5377. builder.setAccessChainLValue(lValue);
  5378. builder.accessChainPush(builder.makeIntConstant(index), TranslateCoherent(type),
  5379. type.getBufferReferenceAlignment());
  5380. // store the member
  5381. multiTypeStore(glslangElementType, elementRValue);
  5382. }
  5383. } else {
  5384. assert(type.isStruct());
  5385. // loop over structure members
  5386. const glslang::TTypeList& members = *type.getStruct();
  5387. for (int m = 0; m < (int)members.size(); ++m) {
  5388. const glslang::TType& glslangMemberType = *members[m].type;
  5389. // get the source member
  5390. spv::Id memberRType = builder.getContainedTypeId(rType, m);
  5391. spv::Id memberRValue = builder.createCompositeExtract(rValue, memberRType, m);
  5392. // set up the target storage
  5393. builder.clearAccessChain();
  5394. builder.setAccessChainLValue(lValue);
  5395. builder.accessChainPush(builder.makeIntConstant(m), TranslateCoherent(type),
  5396. type.getBufferReferenceAlignment());
  5397. // store the member
  5398. multiTypeStore(glslangMemberType, memberRValue);
  5399. }
  5400. }
  5401. }
  5402. // Decide whether or not this type should be
  5403. // decorated with offsets and strides, and if so
  5404. // whether std140 or std430 rules should be applied.
  5405. glslang::TLayoutPacking TGlslangToSpvTraverser::getExplicitLayout(const glslang::TType& type) const
  5406. {
  5407. // has to be a block
  5408. if (type.getBasicType() != glslang::EbtBlock)
  5409. return glslang::ElpNone;
  5410. // has to be a uniform or buffer block or task in/out blocks
  5411. if (type.getQualifier().storage != glslang::EvqUniform &&
  5412. type.getQualifier().storage != glslang::EvqBuffer &&
  5413. type.getQualifier().storage != glslang::EvqShared &&
  5414. !type.getQualifier().isTaskMemory())
  5415. return glslang::ElpNone;
  5416. // return the layout to use
  5417. switch (type.getQualifier().layoutPacking) {
  5418. case glslang::ElpStd140:
  5419. case glslang::ElpStd430:
  5420. case glslang::ElpScalar:
  5421. return type.getQualifier().layoutPacking;
  5422. default:
  5423. return glslang::ElpNone;
  5424. }
  5425. }
  5426. // Given an array type, returns the integer stride required for that array
  5427. int TGlslangToSpvTraverser::getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking explicitLayout,
  5428. glslang::TLayoutMatrix matrixLayout)
  5429. {
  5430. int size;
  5431. int stride;
  5432. glslangIntermediate->getMemberAlignment(arrayType, size, stride, explicitLayout,
  5433. matrixLayout == glslang::ElmRowMajor);
  5434. return stride;
  5435. }
  5436. // Given a matrix type, or array (of array) of matrixes type, returns the integer stride required for that matrix
  5437. // when used as a member of an interface block
  5438. int TGlslangToSpvTraverser::getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking explicitLayout,
  5439. glslang::TLayoutMatrix matrixLayout)
  5440. {
  5441. glslang::TType elementType;
  5442. elementType.shallowCopy(matrixType);
  5443. elementType.clearArraySizes();
  5444. int size;
  5445. int stride;
  5446. glslangIntermediate->getMemberAlignment(elementType, size, stride, explicitLayout,
  5447. matrixLayout == glslang::ElmRowMajor);
  5448. return stride;
  5449. }
  5450. // Given a member type of a struct, realign the current offset for it, and compute
  5451. // the next (not yet aligned) offset for the next member, which will get aligned
  5452. // on the next call.
  5453. // 'currentOffset' should be passed in already initialized, ready to modify, and reflecting
  5454. // the migration of data from nextOffset -> currentOffset. It should be -1 on the first call.
  5455. // -1 means a non-forced member offset (no decoration needed).
  5456. void TGlslangToSpvTraverser::updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType,
  5457. int& currentOffset, int& nextOffset, glslang::TLayoutPacking explicitLayout, glslang::TLayoutMatrix matrixLayout)
  5458. {
  5459. // this will get a positive value when deemed necessary
  5460. nextOffset = -1;
  5461. // override anything in currentOffset with user-set offset
  5462. if (memberType.getQualifier().hasOffset())
  5463. currentOffset = memberType.getQualifier().layoutOffset;
  5464. // It could be that current linker usage in glslang updated all the layoutOffset,
  5465. // in which case the following code does not matter. But, that's not quite right
  5466. // once cross-compilation unit GLSL validation is done, as the original user
  5467. // settings are needed in layoutOffset, and then the following will come into play.
  5468. if (explicitLayout == glslang::ElpNone) {
  5469. if (! memberType.getQualifier().hasOffset())
  5470. currentOffset = -1;
  5471. return;
  5472. }
  5473. // Getting this far means we need explicit offsets
  5474. if (currentOffset < 0)
  5475. currentOffset = 0;
  5476. // Now, currentOffset is valid (either 0, or from a previous nextOffset),
  5477. // but possibly not yet correctly aligned.
  5478. int memberSize;
  5479. int dummyStride;
  5480. int memberAlignment = glslangIntermediate->getMemberAlignment(memberType, memberSize, dummyStride, explicitLayout,
  5481. matrixLayout == glslang::ElmRowMajor);
  5482. bool isVectorLike = memberType.isVector();
  5483. if (memberType.isMatrix()) {
  5484. if (matrixLayout == glslang::ElmRowMajor)
  5485. isVectorLike = memberType.getMatrixRows() == 1;
  5486. else
  5487. isVectorLike = memberType.getMatrixCols() == 1;
  5488. }
  5489. // Adjust alignment for HLSL rules
  5490. // TODO: make this consistent in early phases of code:
  5491. // adjusting this late means inconsistencies with earlier code, which for reflection is an issue
  5492. // Until reflection is brought in sync with these adjustments, don't apply to $Global,
  5493. // which is the most likely to rely on reflection, and least likely to rely implicit layouts
  5494. if (glslangIntermediate->usingHlslOffsets() &&
  5495. ! memberType.isStruct() && structType.getTypeName().compare("$Global") != 0) {
  5496. int componentSize;
  5497. int componentAlignment = glslangIntermediate->getBaseAlignmentScalar(memberType, componentSize);
  5498. if (! memberType.isArray() && isVectorLike && componentAlignment <= 4)
  5499. memberAlignment = componentAlignment;
  5500. // Don't add unnecessary padding after this member
  5501. // (undo std140 bumping size to a mutliple of vec4)
  5502. if (explicitLayout == glslang::ElpStd140) {
  5503. if (memberType.isMatrix()) {
  5504. if (matrixLayout == glslang::ElmRowMajor)
  5505. memberSize -= componentSize * (4 - memberType.getMatrixCols());
  5506. else
  5507. memberSize -= componentSize * (4 - memberType.getMatrixRows());
  5508. } else if (memberType.isArray())
  5509. memberSize -= componentSize * (4 - memberType.getVectorSize());
  5510. }
  5511. }
  5512. // Bump up to member alignment
  5513. glslang::RoundToPow2(currentOffset, memberAlignment);
  5514. // Bump up to vec4 if there is a bad straddle
  5515. if (explicitLayout != glslang::ElpScalar && glslangIntermediate->improperStraddle(memberType, memberSize,
  5516. currentOffset, isVectorLike))
  5517. glslang::RoundToPow2(currentOffset, 16);
  5518. nextOffset = currentOffset + memberSize;
  5519. }
  5520. void TGlslangToSpvTraverser::declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember)
  5521. {
  5522. const glslang::TBuiltInVariable glslangBuiltIn = members[glslangMember].type->getQualifier().builtIn;
  5523. switch (glslangBuiltIn)
  5524. {
  5525. case glslang::EbvPointSize:
  5526. case glslang::EbvClipDistance:
  5527. case glslang::EbvCullDistance:
  5528. case glslang::EbvViewportMaskNV:
  5529. case glslang::EbvSecondaryPositionNV:
  5530. case glslang::EbvSecondaryViewportMaskNV:
  5531. case glslang::EbvPositionPerViewNV:
  5532. case glslang::EbvViewportMaskPerViewNV:
  5533. case glslang::EbvTaskCountNV:
  5534. case glslang::EbvPrimitiveCountNV:
  5535. case glslang::EbvPrimitiveIndicesNV:
  5536. case glslang::EbvClipDistancePerViewNV:
  5537. case glslang::EbvCullDistancePerViewNV:
  5538. case glslang::EbvLayerPerViewNV:
  5539. case glslang::EbvMeshViewCountNV:
  5540. case glslang::EbvMeshViewIndicesNV:
  5541. // Generate the associated capability. Delegate to TranslateBuiltInDecoration.
  5542. // Alternately, we could just call this for any glslang built-in, since the
  5543. // capability already guards against duplicates.
  5544. TranslateBuiltInDecoration(glslangBuiltIn, false);
  5545. break;
  5546. default:
  5547. // Capabilities were already generated when the struct was declared.
  5548. break;
  5549. }
  5550. }
  5551. bool TGlslangToSpvTraverser::isShaderEntryPoint(const glslang::TIntermAggregate* node)
  5552. {
  5553. return node->getName().compare(glslangIntermediate->getEntryPointMangledName().c_str()) == 0;
  5554. }
  5555. // Does parameter need a place to keep writes, separate from the original?
  5556. // Assumes called after originalParam(), which filters out block/buffer/opaque-based
  5557. // qualifiers such that we should have only in/out/inout/constreadonly here.
  5558. bool TGlslangToSpvTraverser::writableParam(glslang::TStorageQualifier qualifier) const
  5559. {
  5560. assert(qualifier == glslang::EvqIn ||
  5561. qualifier == glslang::EvqOut ||
  5562. qualifier == glslang::EvqInOut ||
  5563. qualifier == glslang::EvqUniform ||
  5564. qualifier == glslang::EvqConstReadOnly);
  5565. return qualifier != glslang::EvqConstReadOnly &&
  5566. qualifier != glslang::EvqUniform;
  5567. }
  5568. // Is parameter pass-by-original?
  5569. bool TGlslangToSpvTraverser::originalParam(glslang::TStorageQualifier qualifier, const glslang::TType& paramType,
  5570. bool implicitThisParam)
  5571. {
  5572. if (implicitThisParam) // implicit this
  5573. return true;
  5574. if (glslangIntermediate->getSource() == glslang::EShSourceHlsl)
  5575. return paramType.getBasicType() == glslang::EbtBlock;
  5576. return (paramType.containsOpaque() && !glslangIntermediate->getBindlessMode()) || // sampler, etc.
  5577. paramType.getQualifier().isSpirvByReference() || // spirv_by_reference
  5578. (paramType.getBasicType() == glslang::EbtBlock && qualifier == glslang::EvqBuffer); // SSBO
  5579. }
  5580. // Make all the functions, skeletally, without actually visiting their bodies.
  5581. void TGlslangToSpvTraverser::makeFunctions(const glslang::TIntermSequence& glslFunctions)
  5582. {
  5583. const auto getParamDecorations = [&](std::vector<spv::Decoration>& decorations, const glslang::TType& type,
  5584. bool useVulkanMemoryModel) {
  5585. spv::Decoration paramPrecision = TranslatePrecisionDecoration(type);
  5586. if (paramPrecision != spv::NoPrecision)
  5587. decorations.push_back(paramPrecision);
  5588. TranslateMemoryDecoration(type.getQualifier(), decorations, useVulkanMemoryModel);
  5589. if (type.isReference()) {
  5590. // Original and non-writable params pass the pointer directly and
  5591. // use restrict/aliased, others are stored to a pointer in Function
  5592. // memory and use RestrictPointer/AliasedPointer.
  5593. if (originalParam(type.getQualifier().storage, type, false) ||
  5594. !writableParam(type.getQualifier().storage)) {
  5595. // TranslateMemoryDecoration added Restrict decoration already.
  5596. if (!type.getQualifier().isRestrict()) {
  5597. decorations.push_back(spv::Decoration::Aliased);
  5598. }
  5599. } else {
  5600. decorations.push_back(type.getQualifier().isRestrict() ? spv::Decoration::RestrictPointerEXT :
  5601. spv::Decoration::AliasedPointerEXT);
  5602. }
  5603. }
  5604. };
  5605. for (int f = 0; f < (int)glslFunctions.size(); ++f) {
  5606. glslang::TIntermAggregate* glslFunction = glslFunctions[f]->getAsAggregate();
  5607. if (! glslFunction || glslFunction->getOp() != glslang::EOpFunction)
  5608. continue;
  5609. builder.setDebugSourceLocation(glslFunction->getLoc().line, glslFunction->getLoc().getFilename());
  5610. if (isShaderEntryPoint(glslFunction)) {
  5611. // For HLSL, the entry function is actually a compiler generated function to resolve the difference of
  5612. // entry function signature between HLSL and SPIR-V. So we don't emit debug information for that.
  5613. if (glslangIntermediate->getSource() != glslang::EShSourceHlsl) {
  5614. builder.setupFunctionDebugInfo(shaderEntry, glslangIntermediate->getEntryPointMangledName().c_str(),
  5615. std::vector<spv::Id>(), // main function has no param
  5616. std::vector<char const*>());
  5617. }
  5618. continue;
  5619. }
  5620. // We're on a user function. Set up the basic interface for the function now,
  5621. // so that it's available to call. Translating the body will happen later.
  5622. //
  5623. // Typically (except for a "const in" parameter), an address will be passed to the
  5624. // function. What it is an address of varies:
  5625. //
  5626. // - "in" parameters not marked as "const" can be written to without modifying the calling
  5627. // argument so that write needs to be to a copy, hence the address of a copy works.
  5628. //
  5629. // - "const in" parameters can just be the r-value, as no writes need occur.
  5630. //
  5631. // - "out" and "inout" arguments can't be done as pointers to the calling argument, because
  5632. // GLSL has copy-in/copy-out semantics. They can be handled though with a pointer to a copy.
  5633. std::vector<spv::Id> paramTypes;
  5634. std::vector<char const*> paramNames;
  5635. std::vector<std::vector<spv::Decoration>> paramDecorations; // list of decorations per parameter
  5636. glslang::TIntermSequence& parameters = glslFunction->getSequence()[0]->getAsAggregate()->getSequence();
  5637. #ifdef ENABLE_HLSL
  5638. bool implicitThis = (int)parameters.size() > 0 && parameters[0]->getAsSymbolNode()->getName() ==
  5639. glslangIntermediate->implicitThisName;
  5640. #else
  5641. bool implicitThis = false;
  5642. #endif
  5643. paramDecorations.resize(parameters.size());
  5644. for (int p = 0; p < (int)parameters.size(); ++p) {
  5645. const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();
  5646. spv::Id typeId = convertGlslangToSpvType(paramType);
  5647. if (originalParam(paramType.getQualifier().storage, paramType, implicitThis && p == 0))
  5648. typeId = builder.makePointer(TranslateStorageClass(paramType), typeId);
  5649. else if (writableParam(paramType.getQualifier().storage))
  5650. typeId = builder.makePointer(spv::StorageClass::Function, typeId);
  5651. else
  5652. rValueParameters.insert(parameters[p]->getAsSymbolNode()->getId());
  5653. getParamDecorations(paramDecorations[p], paramType, glslangIntermediate->usingVulkanMemoryModel());
  5654. paramTypes.push_back(typeId);
  5655. }
  5656. for (auto const parameter:parameters) {
  5657. paramNames.push_back(parameter->getAsSymbolNode()->getName().c_str());
  5658. }
  5659. spv::Block* functionBlock;
  5660. spv::Function* function = builder.makeFunctionEntry(
  5661. TranslatePrecisionDecoration(glslFunction->getType()), convertGlslangToSpvType(glslFunction->getType()),
  5662. glslFunction->getName().c_str(), convertGlslangLinkageToSpv(glslFunction->getLinkType()), paramTypes,
  5663. paramDecorations, &functionBlock);
  5664. builder.setupFunctionDebugInfo(function, glslFunction->getName().c_str(), paramTypes, paramNames);
  5665. if (implicitThis)
  5666. function->setImplicitThis();
  5667. // Track function to emit/call later
  5668. functionMap[glslFunction->getName().c_str()] = function;
  5669. // Set the parameter id's
  5670. for (int p = 0; p < (int)parameters.size(); ++p) {
  5671. symbolValues[parameters[p]->getAsSymbolNode()->getId()] = function->getParamId(p);
  5672. // give a name too
  5673. builder.addName(function->getParamId(p), parameters[p]->getAsSymbolNode()->getName().c_str());
  5674. const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();
  5675. if (paramType.contains8BitInt())
  5676. builder.addCapability(spv::Capability::Int8);
  5677. if (paramType.contains16BitInt())
  5678. builder.addCapability(spv::Capability::Int16);
  5679. if (paramType.contains16BitFloat())
  5680. builder.addCapability(spv::Capability::Float16);
  5681. }
  5682. }
  5683. }
  5684. // Process all the initializers, while skipping the functions and link objects
  5685. void TGlslangToSpvTraverser::makeGlobalInitializers(const glslang::TIntermSequence& initializers)
  5686. {
  5687. builder.setBuildPoint(shaderEntry->getLastBlock());
  5688. for (int i = 0; i < (int)initializers.size(); ++i) {
  5689. glslang::TIntermAggregate* initializer = initializers[i]->getAsAggregate();
  5690. if (initializer && initializer->getOp() != glslang::EOpFunction && initializer->getOp() !=
  5691. glslang::EOpLinkerObjects) {
  5692. // We're on a top-level node that's not a function. Treat as an initializer, whose
  5693. // code goes into the beginning of the entry point.
  5694. initializer->traverse(this);
  5695. }
  5696. }
  5697. }
  5698. // Walk over all linker objects to create a map for payload and callable data linker objects
  5699. // and their location to be used during codegen for OpTraceKHR and OpExecuteCallableKHR
  5700. // This is done here since it is possible that these linker objects are not be referenced in the AST
  5701. void TGlslangToSpvTraverser::collectRayTracingLinkerObjects()
  5702. {
  5703. glslang::TIntermAggregate* linkerObjects = glslangIntermediate->findLinkerObjects();
  5704. for (auto& objSeq : linkerObjects->getSequence()) {
  5705. auto objNode = objSeq->getAsSymbolNode();
  5706. if (objNode != nullptr) {
  5707. if (objNode->getQualifier().hasLocation()) {
  5708. unsigned int location = objNode->getQualifier().layoutLocation;
  5709. auto st = objNode->getQualifier().storage;
  5710. int set;
  5711. switch (st)
  5712. {
  5713. case glslang::EvqPayload:
  5714. case glslang::EvqPayloadIn:
  5715. set = 0;
  5716. break;
  5717. case glslang::EvqCallableData:
  5718. case glslang::EvqCallableDataIn:
  5719. set = 1;
  5720. break;
  5721. case glslang::EvqHitObjectAttrNV:
  5722. set = 2;
  5723. break;
  5724. default:
  5725. set = -1;
  5726. }
  5727. if (set != -1)
  5728. locationToSymbol[set].insert(std::make_pair(location, objNode));
  5729. }
  5730. }
  5731. }
  5732. }
  5733. // Process all the functions, while skipping initializers.
  5734. void TGlslangToSpvTraverser::visitFunctions(const glslang::TIntermSequence& glslFunctions)
  5735. {
  5736. for (int f = 0; f < (int)glslFunctions.size(); ++f) {
  5737. glslang::TIntermAggregate* node = glslFunctions[f]->getAsAggregate();
  5738. if (node && (node->getOp() == glslang::EOpFunction || node->getOp() == glslang::EOpLinkerObjects))
  5739. node->traverse(this);
  5740. }
  5741. }
  5742. void TGlslangToSpvTraverser::handleFunctionEntry(const glslang::TIntermAggregate* node)
  5743. {
  5744. // SPIR-V functions should already be in the functionMap from the prepass
  5745. // that called makeFunctions().
  5746. currentFunction = functionMap[node->getName().c_str()];
  5747. spv::Block* functionBlock = currentFunction->getEntryBlock();
  5748. builder.setBuildPoint(functionBlock);
  5749. builder.enterFunction(currentFunction);
  5750. }
  5751. void TGlslangToSpvTraverser::translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments,
  5752. spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags)
  5753. {
  5754. const glslang::TIntermSequence& glslangArguments = node.getSequence();
  5755. glslang::TSampler sampler = {};
  5756. bool cubeCompare = false;
  5757. bool f16ShadowCompare = false;
  5758. if (node.isTexture() || node.isImage()) {
  5759. sampler = glslangArguments[0]->getAsTyped()->getType().getSampler();
  5760. cubeCompare = sampler.dim == glslang::EsdCube && sampler.arrayed && sampler.shadow;
  5761. f16ShadowCompare = sampler.shadow &&
  5762. glslangArguments[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16;
  5763. }
  5764. for (int i = 0; i < (int)glslangArguments.size(); ++i) {
  5765. builder.clearAccessChain();
  5766. glslangArguments[i]->traverse(this);
  5767. // Special case l-value operands
  5768. bool lvalue = false;
  5769. switch (node.getOp()) {
  5770. case glslang::EOpImageAtomicAdd:
  5771. case glslang::EOpImageAtomicMin:
  5772. case glslang::EOpImageAtomicMax:
  5773. case glslang::EOpImageAtomicAnd:
  5774. case glslang::EOpImageAtomicOr:
  5775. case glslang::EOpImageAtomicXor:
  5776. case glslang::EOpImageAtomicExchange:
  5777. case glslang::EOpImageAtomicCompSwap:
  5778. case glslang::EOpImageAtomicLoad:
  5779. case glslang::EOpImageAtomicStore:
  5780. if (i == 0)
  5781. lvalue = true;
  5782. break;
  5783. case glslang::EOpSparseImageLoad:
  5784. if ((sampler.ms && i == 3) || (! sampler.ms && i == 2))
  5785. lvalue = true;
  5786. break;
  5787. case glslang::EOpSparseTexture:
  5788. if (((cubeCompare || f16ShadowCompare) && i == 3) || (! (cubeCompare || f16ShadowCompare) && i == 2))
  5789. lvalue = true;
  5790. break;
  5791. case glslang::EOpSparseTextureClamp:
  5792. if (((cubeCompare || f16ShadowCompare) && i == 4) || (! (cubeCompare || f16ShadowCompare) && i == 3))
  5793. lvalue = true;
  5794. break;
  5795. case glslang::EOpSparseTextureLod:
  5796. case glslang::EOpSparseTextureOffset:
  5797. if ((f16ShadowCompare && i == 4) || (! f16ShadowCompare && i == 3))
  5798. lvalue = true;
  5799. break;
  5800. case glslang::EOpSparseTextureFetch:
  5801. if ((sampler.dim != glslang::EsdRect && i == 3) || (sampler.dim == glslang::EsdRect && i == 2))
  5802. lvalue = true;
  5803. break;
  5804. case glslang::EOpSparseTextureFetchOffset:
  5805. if ((sampler.dim != glslang::EsdRect && i == 4) || (sampler.dim == glslang::EsdRect && i == 3))
  5806. lvalue = true;
  5807. break;
  5808. case glslang::EOpSparseTextureLodOffset:
  5809. case glslang::EOpSparseTextureGrad:
  5810. case glslang::EOpSparseTextureOffsetClamp:
  5811. if ((f16ShadowCompare && i == 5) || (! f16ShadowCompare && i == 4))
  5812. lvalue = true;
  5813. break;
  5814. case glslang::EOpSparseTextureGradOffset:
  5815. case glslang::EOpSparseTextureGradClamp:
  5816. if ((f16ShadowCompare && i == 6) || (! f16ShadowCompare && i == 5))
  5817. lvalue = true;
  5818. break;
  5819. case glslang::EOpSparseTextureGradOffsetClamp:
  5820. if ((f16ShadowCompare && i == 7) || (! f16ShadowCompare && i == 6))
  5821. lvalue = true;
  5822. break;
  5823. case glslang::EOpSparseTextureGather:
  5824. if ((sampler.shadow && i == 3) || (! sampler.shadow && i == 2))
  5825. lvalue = true;
  5826. break;
  5827. case glslang::EOpSparseTextureGatherOffset:
  5828. case glslang::EOpSparseTextureGatherOffsets:
  5829. if ((sampler.shadow && i == 4) || (! sampler.shadow && i == 3))
  5830. lvalue = true;
  5831. break;
  5832. case glslang::EOpSparseTextureGatherLod:
  5833. if (i == 3)
  5834. lvalue = true;
  5835. break;
  5836. case glslang::EOpSparseTextureGatherLodOffset:
  5837. case glslang::EOpSparseTextureGatherLodOffsets:
  5838. if (i == 4)
  5839. lvalue = true;
  5840. break;
  5841. case glslang::EOpSparseImageLoadLod:
  5842. if (i == 3)
  5843. lvalue = true;
  5844. break;
  5845. case glslang::EOpImageSampleFootprintNV:
  5846. if (i == 4)
  5847. lvalue = true;
  5848. break;
  5849. case glslang::EOpImageSampleFootprintClampNV:
  5850. case glslang::EOpImageSampleFootprintLodNV:
  5851. if (i == 5)
  5852. lvalue = true;
  5853. break;
  5854. case glslang::EOpImageSampleFootprintGradNV:
  5855. if (i == 6)
  5856. lvalue = true;
  5857. break;
  5858. case glslang::EOpImageSampleFootprintGradClampNV:
  5859. if (i == 7)
  5860. lvalue = true;
  5861. break;
  5862. case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
  5863. case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
  5864. case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
  5865. if (i == 2)
  5866. lvalue = true;
  5867. break;
  5868. case glslang::EOpConstructSaturated:
  5869. if (i == 0)
  5870. lvalue = true;
  5871. break;
  5872. default:
  5873. break;
  5874. }
  5875. if (lvalue) {
  5876. spv::Id lvalue_id = builder.accessChainGetLValue();
  5877. arguments.push_back(lvalue_id);
  5878. lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
  5879. builder.addDecoration(lvalue_id, TranslateNonUniformDecoration(lvalueCoherentFlags));
  5880. lvalueCoherentFlags |= TranslateCoherent(glslangArguments[i]->getAsTyped()->getType());
  5881. } else {
  5882. if (i > 0 &&
  5883. glslangArguments[i]->getAsSymbolNode() && glslangArguments[i-1]->getAsSymbolNode() &&
  5884. glslangArguments[i]->getAsSymbolNode()->getId() == glslangArguments[i-1]->getAsSymbolNode()->getId()) {
  5885. // Reuse the id if possible
  5886. arguments.push_back(arguments[i-1]);
  5887. } else {
  5888. arguments.push_back(accessChainLoad(glslangArguments[i]->getAsTyped()->getType()));
  5889. }
  5890. }
  5891. }
  5892. }
  5893. void TGlslangToSpvTraverser::translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments)
  5894. {
  5895. builder.clearAccessChain();
  5896. node.getOperand()->traverse(this);
  5897. arguments.push_back(accessChainLoad(node.getOperand()->getType()));
  5898. }
  5899. spv::Id TGlslangToSpvTraverser::createImageTextureFunctionCall(glslang::TIntermOperator* node)
  5900. {
  5901. if (! node->isImage() && ! node->isTexture())
  5902. return spv::NoResult;
  5903. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  5904. // Process a GLSL texturing op (will be SPV image)
  5905. const glslang::TType &imageType = node->getAsAggregate()
  5906. ? node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType()
  5907. : node->getAsUnaryNode()->getOperand()->getAsTyped()->getType();
  5908. const glslang::TSampler sampler = imageType.getSampler();
  5909. bool f16ShadowCompare = (sampler.shadow && node->getAsAggregate())
  5910. ? node->getAsAggregate()->getSequence()[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16
  5911. : false;
  5912. const auto signExtensionMask = [&]() {
  5913. if (builder.getSpvVersion() >= spv::Spv_1_4) {
  5914. if (sampler.type == glslang::EbtUint)
  5915. return spv::ImageOperandsMask::ZeroExtend;
  5916. else if (sampler.type == glslang::EbtInt)
  5917. return spv::ImageOperandsMask::SignExtend;
  5918. }
  5919. return spv::ImageOperandsMask::MaskNone;
  5920. };
  5921. spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
  5922. std::vector<spv::Id> arguments;
  5923. if (node->getAsAggregate())
  5924. translateArguments(*node->getAsAggregate(), arguments, lvalueCoherentFlags);
  5925. else
  5926. translateArguments(*node->getAsUnaryNode(), arguments);
  5927. spv::Decoration precision = TranslatePrecisionDecoration(node->getType());
  5928. spv::Builder::TextureParameters params = { };
  5929. params.sampler = arguments[0];
  5930. glslang::TCrackedTextureOp cracked;
  5931. node->crackTexture(sampler, cracked);
  5932. const bool isUnsignedResult = node->getType().getBasicType() == glslang::EbtUint;
  5933. if (builder.isSampledImage(params.sampler) &&
  5934. ((cracked.query && node->getOp() != glslang::EOpTextureQueryLod) || cracked.fragMask || cracked.fetch)) {
  5935. params.sampler = builder.createUnaryOp(spv::Op::OpImage, builder.getImageType(params.sampler), params.sampler);
  5936. if (imageType.getQualifier().isNonUniform()) {
  5937. builder.addDecoration(params.sampler, spv::Decoration::NonUniformEXT);
  5938. }
  5939. }
  5940. // Check for queries
  5941. if (cracked.query) {
  5942. switch (node->getOp()) {
  5943. case glslang::EOpImageQuerySize:
  5944. case glslang::EOpTextureQuerySize:
  5945. if (arguments.size() > 1) {
  5946. params.lod = arguments[1];
  5947. return builder.createTextureQueryCall(spv::Op::OpImageQuerySizeLod, params, isUnsignedResult);
  5948. } else
  5949. return builder.createTextureQueryCall(spv::Op::OpImageQuerySize, params, isUnsignedResult);
  5950. case glslang::EOpImageQuerySamples:
  5951. case glslang::EOpTextureQuerySamples:
  5952. return builder.createTextureQueryCall(spv::Op::OpImageQuerySamples, params, isUnsignedResult);
  5953. case glslang::EOpTextureQueryLod:
  5954. params.coords = arguments[1];
  5955. return builder.createTextureQueryCall(spv::Op::OpImageQueryLod, params, isUnsignedResult);
  5956. case glslang::EOpTextureQueryLevels:
  5957. return builder.createTextureQueryCall(spv::Op::OpImageQueryLevels, params, isUnsignedResult);
  5958. case glslang::EOpSparseTexelsResident:
  5959. return builder.createUnaryOp(spv::Op::OpImageSparseTexelsResident, builder.makeBoolType(), arguments[0]);
  5960. default:
  5961. assert(0);
  5962. break;
  5963. }
  5964. }
  5965. int components = node->getType().getVectorSize();
  5966. if (node->getOp() == glslang::EOpImageLoad ||
  5967. node->getOp() == glslang::EOpImageLoadLod ||
  5968. node->getOp() == glslang::EOpTextureFetch ||
  5969. node->getOp() == glslang::EOpTextureFetchOffset) {
  5970. // These must produce 4 components, per SPIR-V spec. We'll add a conversion constructor if needed.
  5971. // This will only happen through the HLSL path for operator[], so we do not have to handle e.g.
  5972. // the EOpTexture/Proj/Lod/etc family. It would be harmless to do so, but would need more logic
  5973. // here around e.g. which ones return scalars or other types.
  5974. components = 4;
  5975. }
  5976. glslang::TType returnType(node->getType().getBasicType(), glslang::EvqTemporary, components);
  5977. auto resultType = [&returnType,this]{ return convertGlslangToSpvType(returnType); };
  5978. // Check for image functions other than queries
  5979. if (node->isImage()) {
  5980. std::vector<spv::IdImmediate> operands;
  5981. auto opIt = arguments.begin();
  5982. spv::IdImmediate image = { true, *(opIt++) };
  5983. operands.push_back(image);
  5984. // Handle subpass operations
  5985. // TODO: GLSL should change to have the "MS" only on the type rather than the
  5986. // built-in function.
  5987. if (cracked.subpass) {
  5988. // add on the (0,0) coordinate
  5989. spv::Id zero = builder.makeIntConstant(0);
  5990. std::vector<spv::Id> comps;
  5991. comps.push_back(zero);
  5992. comps.push_back(zero);
  5993. spv::IdImmediate coord = { true,
  5994. builder.makeCompositeConstant(builder.makeVectorType(builder.makeIntType(32), 2), comps) };
  5995. operands.push_back(coord);
  5996. spv::IdImmediate imageOperands = { false, spv::ImageOperandsMask::MaskNone };
  5997. imageOperands.word = imageOperands.word | (unsigned)signExtensionMask();
  5998. if (sampler.isMultiSample()) {
  5999. imageOperands.word = imageOperands.word | (unsigned)spv::ImageOperandsMask::Sample;
  6000. }
  6001. if (imageOperands.word != (unsigned)spv::ImageOperandsMask::MaskNone) {
  6002. operands.push_back(imageOperands);
  6003. if (sampler.isMultiSample()) {
  6004. spv::IdImmediate imageOperand = { true, *(opIt++) };
  6005. operands.push_back(imageOperand);
  6006. }
  6007. }
  6008. spv::Id result = builder.createOp(spv::Op::OpImageRead, resultType(), operands);
  6009. builder.setPrecision(result, precision);
  6010. return result;
  6011. }
  6012. if (cracked.attachmentEXT) {
  6013. if (opIt != arguments.end()) {
  6014. spv::IdImmediate sample = { true, *opIt };
  6015. operands.push_back(sample);
  6016. }
  6017. spv::Id result = builder.createOp(spv::Op::OpColorAttachmentReadEXT, resultType(), operands);
  6018. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  6019. builder.setPrecision(result, precision);
  6020. return result;
  6021. }
  6022. spv::IdImmediate coord = { true, *(opIt++) };
  6023. operands.push_back(coord);
  6024. if (node->getOp() == glslang::EOpImageLoad || node->getOp() == glslang::EOpImageLoadLod) {
  6025. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  6026. if (sampler.isMultiSample()) {
  6027. mask = mask | spv::ImageOperandsMask::Sample;
  6028. }
  6029. if (cracked.lod) {
  6030. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  6031. builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
  6032. mask = mask | spv::ImageOperandsMask::Lod;
  6033. }
  6034. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  6035. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelAvailableKHR);
  6036. mask = mask | signExtensionMask();
  6037. if (mask != spv::ImageOperandsMask::MaskNone) {
  6038. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  6039. operands.push_back(imageOperands);
  6040. }
  6041. if (anySet(mask, spv::ImageOperandsMask::Sample)) {
  6042. spv::IdImmediate imageOperand = { true, *opIt++ };
  6043. operands.push_back(imageOperand);
  6044. }
  6045. if (anySet(mask, spv::ImageOperandsMask::Lod)) {
  6046. spv::IdImmediate imageOperand = { true, *opIt++ };
  6047. operands.push_back(imageOperand);
  6048. }
  6049. if (anySet(mask, spv::ImageOperandsMask::MakeTexelVisibleKHR)) {
  6050. spv::IdImmediate imageOperand = { true,
  6051. builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
  6052. operands.push_back(imageOperand);
  6053. }
  6054. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
  6055. builder.addCapability(spv::Capability::StorageImageReadWithoutFormat);
  6056. std::vector<spv::Id> result(1, builder.createOp(spv::Op::OpImageRead, resultType(), operands));
  6057. builder.setPrecision(result[0], precision);
  6058. // If needed, add a conversion constructor to the proper size.
  6059. if (components != node->getType().getVectorSize())
  6060. result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));
  6061. return result[0];
  6062. } else if (node->getOp() == glslang::EOpImageStore || node->getOp() == glslang::EOpImageStoreLod) {
  6063. // Push the texel value before the operands
  6064. if (sampler.isMultiSample() || cracked.lod) {
  6065. spv::IdImmediate texel = { true, *(opIt + 1) };
  6066. operands.push_back(texel);
  6067. } else {
  6068. spv::IdImmediate texel = { true, *opIt };
  6069. operands.push_back(texel);
  6070. }
  6071. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  6072. if (sampler.isMultiSample()) {
  6073. mask = mask | spv::ImageOperandsMask::Sample;
  6074. }
  6075. if (cracked.lod) {
  6076. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  6077. builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
  6078. mask = mask | spv::ImageOperandsMask::Lod;
  6079. }
  6080. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  6081. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelVisibleKHR);
  6082. mask = mask | signExtensionMask();
  6083. if (mask != spv::ImageOperandsMask::MaskNone) {
  6084. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  6085. operands.push_back(imageOperands);
  6086. }
  6087. if (anySet(mask, spv::ImageOperandsMask::Sample)) {
  6088. spv::IdImmediate imageOperand = { true, *opIt++ };
  6089. operands.push_back(imageOperand);
  6090. }
  6091. if (anySet(mask, spv::ImageOperandsMask::Lod)) {
  6092. spv::IdImmediate imageOperand = { true, *opIt++ };
  6093. operands.push_back(imageOperand);
  6094. }
  6095. if (anySet(mask, spv::ImageOperandsMask::MakeTexelAvailableKHR)) {
  6096. spv::IdImmediate imageOperand = { true,
  6097. builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
  6098. operands.push_back(imageOperand);
  6099. }
  6100. builder.createNoResultOp(spv::Op::OpImageWrite, operands);
  6101. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
  6102. builder.addCapability(spv::Capability::StorageImageWriteWithoutFormat);
  6103. return spv::NoResult;
  6104. } else if (node->getOp() == glslang::EOpSparseImageLoad ||
  6105. node->getOp() == glslang::EOpSparseImageLoadLod) {
  6106. builder.addCapability(spv::Capability::SparseResidency);
  6107. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
  6108. builder.addCapability(spv::Capability::StorageImageReadWithoutFormat);
  6109. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  6110. if (sampler.isMultiSample()) {
  6111. mask = mask | spv::ImageOperandsMask::Sample;
  6112. }
  6113. if (cracked.lod) {
  6114. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  6115. builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
  6116. mask = mask | spv::ImageOperandsMask::Lod;
  6117. }
  6118. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  6119. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelAvailableKHR);
  6120. mask = mask | signExtensionMask();
  6121. if (mask != spv::ImageOperandsMask::MaskNone) {
  6122. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  6123. operands.push_back(imageOperands);
  6124. }
  6125. if (anySet(mask, spv::ImageOperandsMask::Sample)) {
  6126. spv::IdImmediate imageOperand = { true, *opIt++ };
  6127. operands.push_back(imageOperand);
  6128. }
  6129. if (anySet(mask, spv::ImageOperandsMask::Lod)) {
  6130. spv::IdImmediate imageOperand = { true, *opIt++ };
  6131. operands.push_back(imageOperand);
  6132. }
  6133. if (anySet(mask, spv::ImageOperandsMask::MakeTexelVisibleKHR)) {
  6134. spv::IdImmediate imageOperand = { true, builder.makeUintConstant(TranslateMemoryScope(
  6135. TranslateCoherent(imageType))) };
  6136. operands.push_back(imageOperand);
  6137. }
  6138. // Create the return type that was a special structure
  6139. spv::Id texelOut = *opIt;
  6140. spv::Id typeId0 = resultType();
  6141. spv::Id typeId1 = builder.getDerefTypeId(texelOut);
  6142. spv::Id resultTypeId = builder.makeStructResultType(typeId0, typeId1);
  6143. spv::Id resultId = builder.createOp(spv::Op::OpImageSparseRead, resultTypeId, operands);
  6144. // Decode the return type
  6145. builder.createStore(builder.createCompositeExtract(resultId, typeId1, 1), texelOut);
  6146. return builder.createCompositeExtract(resultId, typeId0, 0);
  6147. } else {
  6148. // Process image atomic operations
  6149. // GLSL "IMAGE_PARAMS" will involve in constructing an image texel pointer and this pointer,
  6150. // as the first source operand, is required by SPIR-V atomic operations.
  6151. // For non-MS, the sample value should be 0
  6152. spv::IdImmediate sample = { true, sampler.isMultiSample() ? *(opIt++) : builder.makeUintConstant(0) };
  6153. operands.push_back(sample);
  6154. spv::Id resultTypeId;
  6155. glslang::TBasicType typeProxy = node->getBasicType();
  6156. // imageAtomicStore has a void return type so base the pointer type on
  6157. // the type of the value operand.
  6158. if (node->getOp() == glslang::EOpImageAtomicStore) {
  6159. resultTypeId = builder.makePointer(spv::StorageClass::Image, builder.getTypeId(*opIt));
  6160. typeProxy = node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType().getSampler().type;
  6161. } else {
  6162. resultTypeId = builder.makePointer(spv::StorageClass::Image, resultType());
  6163. }
  6164. spv::Id pointer = builder.createOp(spv::Op::OpImageTexelPointer, resultTypeId, operands);
  6165. if (imageType.getQualifier().nonUniform) {
  6166. builder.addDecoration(pointer, spv::Decoration::NonUniformEXT);
  6167. }
  6168. std::vector<spv::Id> operands;
  6169. operands.push_back(pointer);
  6170. for (; opIt != arguments.end(); ++opIt)
  6171. operands.push_back(*opIt);
  6172. return createAtomicOperation(node->getOp(), precision, resultType(), operands, typeProxy,
  6173. lvalueCoherentFlags, node->getType());
  6174. }
  6175. }
  6176. // Check for fragment mask functions other than queries
  6177. if (cracked.fragMask) {
  6178. assert(sampler.ms);
  6179. auto opIt = arguments.begin();
  6180. std::vector<spv::Id> operands;
  6181. operands.push_back(params.sampler);
  6182. ++opIt;
  6183. if (sampler.isSubpass()) {
  6184. // add on the (0,0) coordinate
  6185. spv::Id zero = builder.makeIntConstant(0);
  6186. std::vector<spv::Id> comps;
  6187. comps.push_back(zero);
  6188. comps.push_back(zero);
  6189. operands.push_back(builder.makeCompositeConstant(
  6190. builder.makeVectorType(builder.makeIntType(32), 2), comps));
  6191. }
  6192. for (; opIt != arguments.end(); ++opIt)
  6193. operands.push_back(*opIt);
  6194. spv::Op fragMaskOp = spv::Op::OpNop;
  6195. if (node->getOp() == glslang::EOpFragmentMaskFetch)
  6196. fragMaskOp = spv::Op::OpFragmentMaskFetchAMD;
  6197. else if (node->getOp() == glslang::EOpFragmentFetch)
  6198. fragMaskOp = spv::Op::OpFragmentFetchAMD;
  6199. builder.addExtension(spv::E_SPV_AMD_shader_fragment_mask);
  6200. builder.addCapability(spv::Capability::FragmentMaskAMD);
  6201. return builder.createOp(fragMaskOp, resultType(), operands);
  6202. }
  6203. // Check for texture functions other than queries
  6204. bool sparse = node->isSparseTexture();
  6205. bool imageFootprint = node->isImageFootprint();
  6206. bool cubeCompare = sampler.dim == glslang::EsdCube && sampler.isArrayed() && sampler.isShadow();
  6207. // check for bias argument
  6208. bool bias = false;
  6209. if (! cracked.lod && ! cracked.grad && ! cracked.fetch && ! cubeCompare) {
  6210. int nonBiasArgCount = 2;
  6211. if (cracked.gather)
  6212. ++nonBiasArgCount; // comp argument should be present when bias argument is present
  6213. if (f16ShadowCompare)
  6214. ++nonBiasArgCount;
  6215. if (cracked.offset)
  6216. ++nonBiasArgCount;
  6217. else if (cracked.offsets)
  6218. ++nonBiasArgCount;
  6219. if (cracked.grad)
  6220. nonBiasArgCount += 2;
  6221. if (cracked.lodClamp)
  6222. ++nonBiasArgCount;
  6223. if (sparse)
  6224. ++nonBiasArgCount;
  6225. if (imageFootprint)
  6226. //Following three extra arguments
  6227. // int granularity, bool coarse, out gl_TextureFootprint2DNV footprint
  6228. nonBiasArgCount += 3;
  6229. if ((int)arguments.size() > nonBiasArgCount)
  6230. bias = true;
  6231. }
  6232. if (cracked.gather) {
  6233. const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();
  6234. if (bias || cracked.lod ||
  6235. sourceExtensions.find(glslang::E_GL_AMD_texture_gather_bias_lod) != sourceExtensions.end()) {
  6236. builder.addExtension(spv::E_SPV_AMD_texture_gather_bias_lod);
  6237. builder.addCapability(spv::Capability::ImageGatherBiasLodAMD);
  6238. }
  6239. }
  6240. // set the rest of the arguments
  6241. params.coords = arguments[1];
  6242. int extraArgs = 0;
  6243. bool noImplicitLod = false;
  6244. // sort out where Dref is coming from
  6245. if (cubeCompare || f16ShadowCompare) {
  6246. params.Dref = arguments[2];
  6247. ++extraArgs;
  6248. } else if (sampler.shadow && cracked.gather) {
  6249. params.Dref = arguments[2];
  6250. ++extraArgs;
  6251. } else if (sampler.shadow) {
  6252. std::vector<spv::Id> indexes;
  6253. int dRefComp;
  6254. if (cracked.proj)
  6255. dRefComp = 2; // "The resulting 3rd component of P in the shadow forms is used as Dref"
  6256. else
  6257. dRefComp = builder.getNumComponents(params.coords) - 1;
  6258. indexes.push_back(dRefComp);
  6259. params.Dref = builder.createCompositeExtract(params.coords,
  6260. builder.getScalarTypeId(builder.getTypeId(params.coords)), indexes);
  6261. }
  6262. // lod
  6263. if (cracked.lod) {
  6264. params.lod = arguments[2 + extraArgs];
  6265. ++extraArgs;
  6266. } else if (glslangIntermediate->getStage() != EShLangFragment &&
  6267. !(glslangIntermediate->getStage() == EShLangCompute &&
  6268. glslangIntermediate->hasLayoutDerivativeModeNone())) {
  6269. // we need to invent the default lod for an explicit lod instruction for a non-fragment stage
  6270. noImplicitLod = true;
  6271. }
  6272. // multisample
  6273. if (sampler.isMultiSample()) {
  6274. params.sample = arguments[2 + extraArgs]; // For MS, "sample" should be specified
  6275. ++extraArgs;
  6276. }
  6277. // gradient
  6278. if (cracked.grad) {
  6279. params.gradX = arguments[2 + extraArgs];
  6280. params.gradY = arguments[3 + extraArgs];
  6281. extraArgs += 2;
  6282. }
  6283. // offset and offsets
  6284. if (cracked.offset) {
  6285. params.offset = arguments[2 + extraArgs];
  6286. ++extraArgs;
  6287. } else if (cracked.offsets) {
  6288. params.offsets = arguments[2 + extraArgs];
  6289. ++extraArgs;
  6290. }
  6291. // lod clamp
  6292. if (cracked.lodClamp) {
  6293. params.lodClamp = arguments[2 + extraArgs];
  6294. ++extraArgs;
  6295. }
  6296. // sparse
  6297. if (sparse) {
  6298. params.texelOut = arguments[2 + extraArgs];
  6299. ++extraArgs;
  6300. }
  6301. // gather component
  6302. if (cracked.gather && ! sampler.shadow) {
  6303. // default component is 0, if missing, otherwise an argument
  6304. if (2 + extraArgs < (int)arguments.size()) {
  6305. params.component = arguments[2 + extraArgs];
  6306. ++extraArgs;
  6307. } else
  6308. params.component = builder.makeIntConstant(0);
  6309. }
  6310. spv::Id resultStruct = spv::NoResult;
  6311. if (imageFootprint) {
  6312. //Following three extra arguments
  6313. // int granularity, bool coarse, out gl_TextureFootprint2DNV footprint
  6314. params.granularity = arguments[2 + extraArgs];
  6315. params.coarse = arguments[3 + extraArgs];
  6316. resultStruct = arguments[4 + extraArgs];
  6317. extraArgs += 3;
  6318. }
  6319. // bias
  6320. if (bias) {
  6321. params.bias = arguments[2 + extraArgs];
  6322. ++extraArgs;
  6323. }
  6324. if (imageFootprint) {
  6325. builder.addExtension(spv::E_SPV_NV_shader_image_footprint);
  6326. builder.addCapability(spv::Capability::ImageFootprintNV);
  6327. //resultStructType(OpenGL type) contains 5 elements:
  6328. //struct gl_TextureFootprint2DNV {
  6329. // uvec2 anchor;
  6330. // uvec2 offset;
  6331. // uvec2 mask;
  6332. // uint lod;
  6333. // uint granularity;
  6334. //};
  6335. //or
  6336. //struct gl_TextureFootprint3DNV {
  6337. // uvec3 anchor;
  6338. // uvec3 offset;
  6339. // uvec2 mask;
  6340. // uint lod;
  6341. // uint granularity;
  6342. //};
  6343. spv::Id resultStructType = builder.getContainedTypeId(builder.getTypeId(resultStruct));
  6344. assert(builder.isStructType(resultStructType));
  6345. //resType (SPIR-V type) contains 6 elements:
  6346. //Member 0 must be a Boolean type scalar(LOD),
  6347. //Member 1 must be a vector of integer type, whose Signedness operand is 0(anchor),
  6348. //Member 2 must be a vector of integer type, whose Signedness operand is 0(offset),
  6349. //Member 3 must be a vector of integer type, whose Signedness operand is 0(mask),
  6350. //Member 4 must be a scalar of integer type, whose Signedness operand is 0(lod),
  6351. //Member 5 must be a scalar of integer type, whose Signedness operand is 0(granularity).
  6352. std::vector<spv::Id> members;
  6353. members.push_back(resultType());
  6354. for (int i = 0; i < 5; i++) {
  6355. members.push_back(builder.getContainedTypeId(resultStructType, i));
  6356. }
  6357. spv::Id resType = builder.makeStructType(members, "ResType");
  6358. //call ImageFootprintNV
  6359. spv::Id res = builder.createTextureCall(precision, resType, sparse, cracked.fetch, cracked.proj,
  6360. cracked.gather, noImplicitLod, params, signExtensionMask());
  6361. //copy resType (SPIR-V type) to resultStructType(OpenGL type)
  6362. for (int i = 0; i < 5; i++) {
  6363. builder.clearAccessChain();
  6364. builder.setAccessChainLValue(resultStruct);
  6365. //Accessing to a struct we created, no coherent flag is set
  6366. spv::Builder::AccessChain::CoherentFlags flags;
  6367. flags.clear();
  6368. builder.accessChainPush(builder.makeIntConstant(i), flags, 0);
  6369. builder.accessChainStore(builder.createCompositeExtract(res, builder.getContainedTypeId(resType, i+1),
  6370. i+1), TranslateNonUniformDecoration(imageType.getQualifier()));
  6371. }
  6372. return builder.createCompositeExtract(res, resultType(), 0);
  6373. }
  6374. // projective component (might not to move)
  6375. // GLSL: "The texture coordinates consumed from P, not including the last component of P,
  6376. // are divided by the last component of P."
  6377. // SPIR-V: "... (u [, v] [, w], q)... It may be a vector larger than needed, but all
  6378. // unused components will appear after all used components."
  6379. if (cracked.proj) {
  6380. int projSourceComp = builder.getNumComponents(params.coords) - 1;
  6381. int projTargetComp;
  6382. switch (sampler.dim) {
  6383. case glslang::Esd1D: projTargetComp = 1; break;
  6384. case glslang::Esd2D: projTargetComp = 2; break;
  6385. case glslang::EsdRect: projTargetComp = 2; break;
  6386. default: projTargetComp = projSourceComp; break;
  6387. }
  6388. // copy the projective coordinate if we have to
  6389. if (projTargetComp != projSourceComp) {
  6390. spv::Id projComp = builder.createCompositeExtract(params.coords,
  6391. builder.getScalarTypeId(builder.getTypeId(params.coords)), projSourceComp);
  6392. params.coords = builder.createCompositeInsert(projComp, params.coords,
  6393. builder.getTypeId(params.coords), projTargetComp);
  6394. }
  6395. }
  6396. // nonprivate
  6397. if (imageType.getQualifier().nonprivate) {
  6398. params.nonprivate = true;
  6399. }
  6400. // volatile
  6401. if (imageType.getQualifier().volatil) {
  6402. params.volatil = true;
  6403. }
  6404. if (imageType.getQualifier().nontemporal) {
  6405. params.nontemporal = true;
  6406. }
  6407. std::vector<spv::Id> result( 1,
  6408. builder.createTextureCall(precision, resultType(), sparse, cracked.fetch, cracked.proj, cracked.gather,
  6409. noImplicitLod, params, signExtensionMask())
  6410. );
  6411. if (components != node->getType().getVectorSize())
  6412. result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));
  6413. return result[0];
  6414. }
  6415. spv::Id TGlslangToSpvTraverser::handleUserFunctionCall(const glslang::TIntermAggregate* node)
  6416. {
  6417. // Grab the function's pointer from the previously created function
  6418. spv::Function* function = functionMap[node->getName().c_str()];
  6419. if (! function)
  6420. return 0;
  6421. const glslang::TIntermSequence& glslangArgs = node->getSequence();
  6422. const glslang::TQualifierList& qualifiers = node->getQualifierList();
  6423. // See comments in makeFunctions() for details about the semantics for parameter passing.
  6424. //
  6425. // These imply we need a four step process:
  6426. // 1. Evaluate the arguments
  6427. // 2. Allocate and make copies of in, out, and inout arguments
  6428. // 3. Make the call
  6429. // 4. Copy back the results
  6430. // 1. Evaluate the arguments and their types
  6431. std::vector<spv::Builder::AccessChain> lValues;
  6432. std::vector<spv::Id> rValues;
  6433. std::vector<const glslang::TType*> argTypes;
  6434. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  6435. argTypes.push_back(&glslangArgs[a]->getAsTyped()->getType());
  6436. // build l-value
  6437. builder.clearAccessChain();
  6438. glslangArgs[a]->traverse(this);
  6439. // keep outputs and pass-by-originals as l-values, evaluate others as r-values
  6440. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0) ||
  6441. writableParam(qualifiers[a])) {
  6442. // save l-value
  6443. lValues.push_back(builder.getAccessChain());
  6444. } else {
  6445. // process r-value
  6446. rValues.push_back(accessChainLoad(*argTypes.back()));
  6447. }
  6448. }
  6449. // Reset source location to the function call location after argument evaluation
  6450. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  6451. // 2. Allocate space for anything needing a copy, and if it's "in" or "inout"
  6452. // copy the original into that space.
  6453. //
  6454. // Also, build up the list of actual arguments to pass in for the call
  6455. int lValueCount = 0;
  6456. int rValueCount = 0;
  6457. std::vector<spv::Id> spvArgs;
  6458. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  6459. spv::Id arg;
  6460. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0)) {
  6461. builder.setAccessChain(lValues[lValueCount]);
  6462. arg = builder.accessChainGetLValue();
  6463. ++lValueCount;
  6464. } else if (writableParam(qualifiers[a])) {
  6465. // need space to hold the copy
  6466. arg = builder.createVariable(function->getParamPrecision(a), spv::StorageClass::Function,
  6467. builder.getContainedTypeId(function->getParamType(a)), "param");
  6468. if (qualifiers[a] == glslang::EvqIn || qualifiers[a] == glslang::EvqInOut) {
  6469. // need to copy the input into output space
  6470. builder.setAccessChain(lValues[lValueCount]);
  6471. spv::Id copy = accessChainLoad(*argTypes[a]);
  6472. builder.clearAccessChain();
  6473. builder.setAccessChainLValue(arg);
  6474. multiTypeStore(*argTypes[a], copy);
  6475. }
  6476. ++lValueCount;
  6477. } else {
  6478. // process r-value, which involves a copy for a type mismatch
  6479. if (function->getParamType(a) != builder.getTypeId(rValues[rValueCount]) ||
  6480. TranslatePrecisionDecoration(*argTypes[a]) != function->getParamPrecision(a))
  6481. {
  6482. spv::Id argCopy = builder.createVariable(function->getParamPrecision(a), spv::StorageClass::Function, function->getParamType(a), "arg");
  6483. builder.clearAccessChain();
  6484. builder.setAccessChainLValue(argCopy);
  6485. multiTypeStore(*argTypes[a], rValues[rValueCount]);
  6486. arg = builder.createLoad(argCopy, function->getParamPrecision(a));
  6487. } else
  6488. arg = rValues[rValueCount];
  6489. ++rValueCount;
  6490. }
  6491. spvArgs.push_back(arg);
  6492. }
  6493. // 3. Make the call.
  6494. spv::Id result = builder.createFunctionCall(function, spvArgs);
  6495. builder.setPrecision(result, TranslatePrecisionDecoration(node->getType()));
  6496. builder.addDecoration(result, TranslateNonUniformDecoration(node->getType().getQualifier()));
  6497. // 4. Copy back out an "out" arguments.
  6498. lValueCount = 0;
  6499. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  6500. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0))
  6501. ++lValueCount;
  6502. else if (writableParam(qualifiers[a])) {
  6503. if (qualifiers[a] == glslang::EvqOut || qualifiers[a] == glslang::EvqInOut) {
  6504. spv::Id copy = builder.createLoad(spvArgs[a], spv::NoPrecision);
  6505. builder.addDecoration(copy, TranslateNonUniformDecoration(argTypes[a]->getQualifier()));
  6506. builder.setAccessChain(lValues[lValueCount]);
  6507. multiTypeStore(*argTypes[a], copy);
  6508. }
  6509. ++lValueCount;
  6510. }
  6511. }
  6512. return result;
  6513. }
  6514. // Translate AST operation to SPV operation, already having SPV-based operands/types.
  6515. spv::Id TGlslangToSpvTraverser::createBinaryOperation(glslang::TOperator op, OpDecorations& decorations,
  6516. spv::Id typeId, spv::Id left, spv::Id right,
  6517. glslang::TBasicType typeProxy, bool reduceComparison)
  6518. {
  6519. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  6520. bool isFloat = isTypeFloat(typeProxy);
  6521. bool isBool = typeProxy == glslang::EbtBool;
  6522. spv::Op binOp = spv::Op::OpNop;
  6523. bool needMatchingVectors = true; // for non-matrix ops, would a scalar need to smear to match a vector?
  6524. bool comparison = false;
  6525. switch (op) {
  6526. case glslang::EOpAdd:
  6527. case glslang::EOpAddAssign:
  6528. if (isFloat)
  6529. binOp = spv::Op::OpFAdd;
  6530. else
  6531. binOp = spv::Op::OpIAdd;
  6532. break;
  6533. case glslang::EOpSub:
  6534. case glslang::EOpSubAssign:
  6535. if (isFloat)
  6536. binOp = spv::Op::OpFSub;
  6537. else
  6538. binOp = spv::Op::OpISub;
  6539. break;
  6540. case glslang::EOpMul:
  6541. case glslang::EOpMulAssign:
  6542. if (isFloat)
  6543. binOp = spv::Op::OpFMul;
  6544. else
  6545. binOp = spv::Op::OpIMul;
  6546. break;
  6547. case glslang::EOpVectorTimesScalar:
  6548. case glslang::EOpVectorTimesScalarAssign:
  6549. if (isFloat && (builder.isVector(left) || builder.isVector(right) || builder.isCooperativeVector(left) || builder.isCooperativeVector(right))) {
  6550. if (builder.isVector(right) || builder.isCooperativeVector(right))
  6551. std::swap(left, right);
  6552. assert(builder.isScalar(right));
  6553. needMatchingVectors = false;
  6554. binOp = spv::Op::OpVectorTimesScalar;
  6555. } else if (isFloat) {
  6556. binOp = spv::Op::OpFMul;
  6557. } else if (builder.isCooperativeVector(left) || builder.isCooperativeVector(right)) {
  6558. if (builder.isCooperativeVector(right))
  6559. std::swap(left, right);
  6560. assert(builder.isScalar(right));
  6561. // Construct a cooperative vector from the scalar
  6562. right = builder.createCompositeConstruct(builder.getTypeId(left), { right });
  6563. binOp = spv::Op::OpIMul;
  6564. } else {
  6565. binOp = spv::Op::OpIMul;
  6566. }
  6567. break;
  6568. case glslang::EOpVectorTimesMatrix:
  6569. case glslang::EOpVectorTimesMatrixAssign:
  6570. binOp = spv::Op::OpVectorTimesMatrix;
  6571. break;
  6572. case glslang::EOpMatrixTimesVector:
  6573. binOp = spv::Op::OpMatrixTimesVector;
  6574. break;
  6575. case glslang::EOpMatrixTimesScalar:
  6576. case glslang::EOpMatrixTimesScalarAssign:
  6577. binOp = spv::Op::OpMatrixTimesScalar;
  6578. break;
  6579. case glslang::EOpMatrixTimesMatrix:
  6580. case glslang::EOpMatrixTimesMatrixAssign:
  6581. binOp = spv::Op::OpMatrixTimesMatrix;
  6582. break;
  6583. case glslang::EOpOuterProduct:
  6584. binOp = spv::Op::OpOuterProduct;
  6585. needMatchingVectors = false;
  6586. break;
  6587. case glslang::EOpDiv:
  6588. case glslang::EOpDivAssign:
  6589. if (isFloat)
  6590. binOp = spv::Op::OpFDiv;
  6591. else if (isUnsigned)
  6592. binOp = spv::Op::OpUDiv;
  6593. else
  6594. binOp = spv::Op::OpSDiv;
  6595. break;
  6596. case glslang::EOpMod:
  6597. case glslang::EOpModAssign:
  6598. if (isFloat)
  6599. binOp = spv::Op::OpFMod;
  6600. else if (isUnsigned)
  6601. binOp = spv::Op::OpUMod;
  6602. else
  6603. binOp = spv::Op::OpSMod;
  6604. break;
  6605. case glslang::EOpRightShift:
  6606. case glslang::EOpRightShiftAssign:
  6607. if (isUnsigned)
  6608. binOp = spv::Op::OpShiftRightLogical;
  6609. else
  6610. binOp = spv::Op::OpShiftRightArithmetic;
  6611. break;
  6612. case glslang::EOpLeftShift:
  6613. case glslang::EOpLeftShiftAssign:
  6614. binOp = spv::Op::OpShiftLeftLogical;
  6615. break;
  6616. case glslang::EOpAnd:
  6617. case glslang::EOpAndAssign:
  6618. binOp = spv::Op::OpBitwiseAnd;
  6619. break;
  6620. case glslang::EOpLogicalAnd:
  6621. needMatchingVectors = false;
  6622. binOp = spv::Op::OpLogicalAnd;
  6623. break;
  6624. case glslang::EOpInclusiveOr:
  6625. case glslang::EOpInclusiveOrAssign:
  6626. binOp = spv::Op::OpBitwiseOr;
  6627. break;
  6628. case glslang::EOpLogicalOr:
  6629. needMatchingVectors = false;
  6630. binOp = spv::Op::OpLogicalOr;
  6631. break;
  6632. case glslang::EOpExclusiveOr:
  6633. case glslang::EOpExclusiveOrAssign:
  6634. binOp = spv::Op::OpBitwiseXor;
  6635. break;
  6636. case glslang::EOpLogicalXor:
  6637. needMatchingVectors = false;
  6638. binOp = spv::Op::OpLogicalNotEqual;
  6639. break;
  6640. case glslang::EOpAbsDifference:
  6641. binOp = isUnsigned ? spv::Op::OpAbsUSubINTEL : spv::Op::OpAbsISubINTEL;
  6642. break;
  6643. case glslang::EOpAddSaturate:
  6644. binOp = isUnsigned ? spv::Op::OpUAddSatINTEL : spv::Op::OpIAddSatINTEL;
  6645. break;
  6646. case glslang::EOpSubSaturate:
  6647. binOp = isUnsigned ? spv::Op::OpUSubSatINTEL : spv::Op::OpISubSatINTEL;
  6648. break;
  6649. case glslang::EOpAverage:
  6650. binOp = isUnsigned ? spv::Op::OpUAverageINTEL : spv::Op::OpIAverageINTEL;
  6651. break;
  6652. case glslang::EOpAverageRounded:
  6653. binOp = isUnsigned ? spv::Op::OpUAverageRoundedINTEL : spv::Op::OpIAverageRoundedINTEL;
  6654. break;
  6655. case glslang::EOpMul32x16:
  6656. binOp = isUnsigned ? spv::Op::OpUMul32x16INTEL : spv::Op::OpIMul32x16INTEL;
  6657. break;
  6658. case glslang::EOpExpectEXT:
  6659. binOp = spv::Op::OpExpectKHR;
  6660. break;
  6661. case glslang::EOpLessThan:
  6662. case glslang::EOpGreaterThan:
  6663. case glslang::EOpLessThanEqual:
  6664. case glslang::EOpGreaterThanEqual:
  6665. case glslang::EOpEqual:
  6666. case glslang::EOpNotEqual:
  6667. case glslang::EOpVectorEqual:
  6668. case glslang::EOpVectorNotEqual:
  6669. comparison = true;
  6670. break;
  6671. default:
  6672. break;
  6673. }
  6674. // handle mapped binary operations (should be non-comparison)
  6675. if (binOp != spv::Op::OpNop) {
  6676. assert(comparison == false);
  6677. if (builder.isMatrix(left) || builder.isMatrix(right) ||
  6678. builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))
  6679. return createBinaryMatrixOperation(binOp, decorations, typeId, left, right);
  6680. // No matrix involved; make both operands be the same number of components, if needed
  6681. if (needMatchingVectors)
  6682. builder.promoteScalar(decorations.precision, left, right);
  6683. spv::Id result = builder.createBinOp(binOp, typeId, left, right);
  6684. decorations.addNoContraction(builder, result);
  6685. decorations.addNonUniform(builder, result);
  6686. return builder.setPrecision(result, decorations.precision);
  6687. }
  6688. if (! comparison)
  6689. return 0;
  6690. // Handle comparison instructions
  6691. if (reduceComparison && (op == glslang::EOpEqual || op == glslang::EOpNotEqual)
  6692. && (builder.isVector(left) || builder.isMatrix(left) || builder.isAggregate(left))) {
  6693. spv::Id result = builder.createCompositeCompare(decorations.precision, left, right, op == glslang::EOpEqual);
  6694. decorations.addNonUniform(builder, result);
  6695. return result;
  6696. }
  6697. switch (op) {
  6698. case glslang::EOpLessThan:
  6699. if (isFloat)
  6700. binOp = spv::Op::OpFOrdLessThan;
  6701. else if (isUnsigned)
  6702. binOp = spv::Op::OpULessThan;
  6703. else
  6704. binOp = spv::Op::OpSLessThan;
  6705. break;
  6706. case glslang::EOpGreaterThan:
  6707. if (isFloat)
  6708. binOp = spv::Op::OpFOrdGreaterThan;
  6709. else if (isUnsigned)
  6710. binOp = spv::Op::OpUGreaterThan;
  6711. else
  6712. binOp = spv::Op::OpSGreaterThan;
  6713. break;
  6714. case glslang::EOpLessThanEqual:
  6715. if (isFloat)
  6716. binOp = spv::Op::OpFOrdLessThanEqual;
  6717. else if (isUnsigned)
  6718. binOp = spv::Op::OpULessThanEqual;
  6719. else
  6720. binOp = spv::Op::OpSLessThanEqual;
  6721. break;
  6722. case glslang::EOpGreaterThanEqual:
  6723. if (isFloat)
  6724. binOp = spv::Op::OpFOrdGreaterThanEqual;
  6725. else if (isUnsigned)
  6726. binOp = spv::Op::OpUGreaterThanEqual;
  6727. else
  6728. binOp = spv::Op::OpSGreaterThanEqual;
  6729. break;
  6730. case glslang::EOpEqual:
  6731. case glslang::EOpVectorEqual:
  6732. if (isFloat)
  6733. binOp = spv::Op::OpFOrdEqual;
  6734. else if (isBool)
  6735. binOp = spv::Op::OpLogicalEqual;
  6736. else
  6737. binOp = spv::Op::OpIEqual;
  6738. break;
  6739. case glslang::EOpNotEqual:
  6740. case glslang::EOpVectorNotEqual:
  6741. if (isFloat)
  6742. binOp = spv::Op::OpFUnordNotEqual;
  6743. else if (isBool)
  6744. binOp = spv::Op::OpLogicalNotEqual;
  6745. else
  6746. binOp = spv::Op::OpINotEqual;
  6747. break;
  6748. default:
  6749. break;
  6750. }
  6751. if (binOp != spv::Op::OpNop) {
  6752. spv::Id result = builder.createBinOp(binOp, typeId, left, right);
  6753. decorations.addNoContraction(builder, result);
  6754. decorations.addNonUniform(builder, result);
  6755. return builder.setPrecision(result, decorations.precision);
  6756. }
  6757. return 0;
  6758. }
  6759. //
  6760. // Translate AST matrix operation to SPV operation, already having SPV-based operands/types.
  6761. // These can be any of:
  6762. //
  6763. // matrix * scalar
  6764. // scalar * matrix
  6765. // matrix * matrix linear algebraic
  6766. // matrix * vector
  6767. // vector * matrix
  6768. // matrix * matrix componentwise
  6769. // matrix op matrix op in {+, -, /}
  6770. // matrix op scalar op in {+, -, /}
  6771. // scalar op matrix op in {+, -, /}
  6772. //
  6773. spv::Id TGlslangToSpvTraverser::createBinaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,
  6774. spv::Id left, spv::Id right)
  6775. {
  6776. bool firstClass = true;
  6777. // First, handle first-class matrix operations (* and matrix/scalar)
  6778. switch (op) {
  6779. case spv::Op::OpFDiv:
  6780. if (builder.isMatrix(left) && builder.isScalar(right)) {
  6781. // turn matrix / scalar into a multiply...
  6782. spv::Id resultType = builder.getTypeId(right);
  6783. right = builder.createBinOp(spv::Op::OpFDiv, resultType, builder.makeFpConstant(resultType, 1.0), right);
  6784. op = spv::Op::OpMatrixTimesScalar;
  6785. } else
  6786. firstClass = false;
  6787. break;
  6788. case spv::Op::OpMatrixTimesScalar:
  6789. if (builder.isMatrix(right) || builder.isCooperativeMatrix(right))
  6790. std::swap(left, right);
  6791. assert(builder.isScalar(right));
  6792. break;
  6793. case spv::Op::OpVectorTimesMatrix:
  6794. assert(builder.isVector(left));
  6795. assert(builder.isMatrix(right));
  6796. break;
  6797. case spv::Op::OpMatrixTimesVector:
  6798. assert(builder.isMatrix(left));
  6799. assert(builder.isVector(right));
  6800. break;
  6801. case spv::Op::OpMatrixTimesMatrix:
  6802. assert(builder.isMatrix(left));
  6803. assert(builder.isMatrix(right));
  6804. break;
  6805. default:
  6806. firstClass = false;
  6807. break;
  6808. }
  6809. if (builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))
  6810. firstClass = true;
  6811. if (firstClass) {
  6812. spv::Id result = builder.createBinOp(op, typeId, left, right);
  6813. decorations.addNoContraction(builder, result);
  6814. decorations.addNonUniform(builder, result);
  6815. return builder.setPrecision(result, decorations.precision);
  6816. }
  6817. // Handle component-wise +, -, *, %, and / for all combinations of type.
  6818. // The result type of all of them is the same type as the (a) matrix operand.
  6819. // The algorithm is to:
  6820. // - break the matrix(es) into vectors
  6821. // - smear any scalar to a vector
  6822. // - do vector operations
  6823. // - make a matrix out the vector results
  6824. switch (op) {
  6825. case spv::Op::OpFAdd:
  6826. case spv::Op::OpFSub:
  6827. case spv::Op::OpFDiv:
  6828. case spv::Op::OpFMod:
  6829. case spv::Op::OpFMul:
  6830. {
  6831. // one time set up...
  6832. bool leftMat = builder.isMatrix(left);
  6833. bool rightMat = builder.isMatrix(right);
  6834. unsigned int numCols = leftMat ? builder.getNumColumns(left) : builder.getNumColumns(right);
  6835. int numRows = leftMat ? builder.getNumRows(left) : builder.getNumRows(right);
  6836. spv::Id scalarType = builder.getScalarTypeId(typeId);
  6837. spv::Id vecType = builder.makeVectorType(scalarType, numRows);
  6838. std::vector<spv::Id> results;
  6839. spv::Id smearVec = spv::NoResult;
  6840. if (builder.isScalar(left))
  6841. smearVec = builder.smearScalar(decorations.precision, left, vecType);
  6842. else if (builder.isScalar(right))
  6843. smearVec = builder.smearScalar(decorations.precision, right, vecType);
  6844. // do each vector op
  6845. for (unsigned int c = 0; c < numCols; ++c) {
  6846. std::vector<unsigned int> indexes;
  6847. indexes.push_back(c);
  6848. spv::Id leftVec = leftMat ? builder.createCompositeExtract( left, vecType, indexes) : smearVec;
  6849. spv::Id rightVec = rightMat ? builder.createCompositeExtract(right, vecType, indexes) : smearVec;
  6850. spv::Id result = builder.createBinOp(op, vecType, leftVec, rightVec);
  6851. decorations.addNoContraction(builder, result);
  6852. decorations.addNonUniform(builder, result);
  6853. results.push_back(builder.setPrecision(result, decorations.precision));
  6854. }
  6855. // put the pieces together
  6856. spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);
  6857. decorations.addNonUniform(builder, result);
  6858. return result;
  6859. }
  6860. default:
  6861. assert(0);
  6862. return spv::NoResult;
  6863. }
  6864. }
  6865. spv::Id TGlslangToSpvTraverser::createUnaryOperation(glslang::TOperator op, OpDecorations& decorations, spv::Id typeId,
  6866. spv::Id operand, glslang::TBasicType typeProxy, const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
  6867. const glslang::TType &opType)
  6868. {
  6869. spv::Op unaryOp = spv::Op::OpNop;
  6870. int extBuiltins = -1;
  6871. int libCall = -1;
  6872. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  6873. bool isFloat = isTypeFloat(typeProxy);
  6874. switch (op) {
  6875. case glslang::EOpNegative:
  6876. if (isFloat) {
  6877. unaryOp = spv::Op::OpFNegate;
  6878. if (builder.isMatrixType(typeId))
  6879. return createUnaryMatrixOperation(unaryOp, decorations, typeId, operand, typeProxy);
  6880. } else
  6881. unaryOp = spv::Op::OpSNegate;
  6882. break;
  6883. case glslang::EOpLogicalNot:
  6884. case glslang::EOpVectorLogicalNot:
  6885. unaryOp = spv::Op::OpLogicalNot;
  6886. break;
  6887. case glslang::EOpBitwiseNot:
  6888. unaryOp = spv::Op::OpNot;
  6889. break;
  6890. case glslang::EOpDeterminant:
  6891. libCall = spv::GLSLstd450Determinant;
  6892. break;
  6893. case glslang::EOpMatrixInverse:
  6894. libCall = spv::GLSLstd450MatrixInverse;
  6895. break;
  6896. case glslang::EOpTranspose:
  6897. unaryOp = spv::Op::OpTranspose;
  6898. break;
  6899. case glslang::EOpRadians:
  6900. libCall = spv::GLSLstd450Radians;
  6901. break;
  6902. case glslang::EOpDegrees:
  6903. libCall = spv::GLSLstd450Degrees;
  6904. break;
  6905. case glslang::EOpSin:
  6906. libCall = spv::GLSLstd450Sin;
  6907. break;
  6908. case glslang::EOpCos:
  6909. libCall = spv::GLSLstd450Cos;
  6910. break;
  6911. case glslang::EOpTan:
  6912. libCall = spv::GLSLstd450Tan;
  6913. break;
  6914. case glslang::EOpAcos:
  6915. libCall = spv::GLSLstd450Acos;
  6916. break;
  6917. case glslang::EOpAsin:
  6918. libCall = spv::GLSLstd450Asin;
  6919. break;
  6920. case glslang::EOpAtan:
  6921. libCall = spv::GLSLstd450Atan;
  6922. break;
  6923. case glslang::EOpAcosh:
  6924. libCall = spv::GLSLstd450Acosh;
  6925. break;
  6926. case glslang::EOpAsinh:
  6927. libCall = spv::GLSLstd450Asinh;
  6928. break;
  6929. case glslang::EOpAtanh:
  6930. libCall = spv::GLSLstd450Atanh;
  6931. break;
  6932. case glslang::EOpTanh:
  6933. libCall = spv::GLSLstd450Tanh;
  6934. break;
  6935. case glslang::EOpCosh:
  6936. libCall = spv::GLSLstd450Cosh;
  6937. break;
  6938. case glslang::EOpSinh:
  6939. libCall = spv::GLSLstd450Sinh;
  6940. break;
  6941. case glslang::EOpLength:
  6942. libCall = spv::GLSLstd450Length;
  6943. break;
  6944. case glslang::EOpNormalize:
  6945. libCall = spv::GLSLstd450Normalize;
  6946. break;
  6947. case glslang::EOpExp:
  6948. libCall = spv::GLSLstd450Exp;
  6949. break;
  6950. case glslang::EOpLog:
  6951. libCall = spv::GLSLstd450Log;
  6952. break;
  6953. case glslang::EOpExp2:
  6954. libCall = spv::GLSLstd450Exp2;
  6955. break;
  6956. case glslang::EOpLog2:
  6957. libCall = spv::GLSLstd450Log2;
  6958. break;
  6959. case glslang::EOpSqrt:
  6960. libCall = spv::GLSLstd450Sqrt;
  6961. break;
  6962. case glslang::EOpInverseSqrt:
  6963. libCall = spv::GLSLstd450InverseSqrt;
  6964. break;
  6965. case glslang::EOpFloor:
  6966. libCall = spv::GLSLstd450Floor;
  6967. break;
  6968. case glslang::EOpTrunc:
  6969. libCall = spv::GLSLstd450Trunc;
  6970. break;
  6971. case glslang::EOpRound:
  6972. libCall = spv::GLSLstd450Round;
  6973. break;
  6974. case glslang::EOpRoundEven:
  6975. libCall = spv::GLSLstd450RoundEven;
  6976. break;
  6977. case glslang::EOpCeil:
  6978. libCall = spv::GLSLstd450Ceil;
  6979. break;
  6980. case glslang::EOpFract:
  6981. libCall = spv::GLSLstd450Fract;
  6982. break;
  6983. case glslang::EOpIsNan:
  6984. unaryOp = spv::Op::OpIsNan;
  6985. break;
  6986. case glslang::EOpIsInf:
  6987. unaryOp = spv::Op::OpIsInf;
  6988. break;
  6989. case glslang::EOpIsFinite:
  6990. unaryOp = spv::Op::OpIsFinite;
  6991. break;
  6992. case glslang::EOpFloatBitsToInt:
  6993. case glslang::EOpFloatBitsToUint:
  6994. case glslang::EOpIntBitsToFloat:
  6995. case glslang::EOpUintBitsToFloat:
  6996. case glslang::EOpDoubleBitsToInt64:
  6997. case glslang::EOpDoubleBitsToUint64:
  6998. case glslang::EOpInt64BitsToDouble:
  6999. case glslang::EOpUint64BitsToDouble:
  7000. case glslang::EOpFloat16BitsToInt16:
  7001. case glslang::EOpFloat16BitsToUint16:
  7002. case glslang::EOpInt16BitsToFloat16:
  7003. case glslang::EOpUint16BitsToFloat16:
  7004. unaryOp = spv::Op::OpBitcast;
  7005. break;
  7006. case glslang::EOpPackSnorm2x16:
  7007. libCall = spv::GLSLstd450PackSnorm2x16;
  7008. break;
  7009. case glslang::EOpUnpackSnorm2x16:
  7010. libCall = spv::GLSLstd450UnpackSnorm2x16;
  7011. break;
  7012. case glslang::EOpPackUnorm2x16:
  7013. libCall = spv::GLSLstd450PackUnorm2x16;
  7014. break;
  7015. case glslang::EOpUnpackUnorm2x16:
  7016. libCall = spv::GLSLstd450UnpackUnorm2x16;
  7017. break;
  7018. case glslang::EOpPackHalf2x16:
  7019. libCall = spv::GLSLstd450PackHalf2x16;
  7020. break;
  7021. case glslang::EOpUnpackHalf2x16:
  7022. libCall = spv::GLSLstd450UnpackHalf2x16;
  7023. break;
  7024. case glslang::EOpPackSnorm4x8:
  7025. libCall = spv::GLSLstd450PackSnorm4x8;
  7026. break;
  7027. case glslang::EOpUnpackSnorm4x8:
  7028. libCall = spv::GLSLstd450UnpackSnorm4x8;
  7029. break;
  7030. case glslang::EOpPackUnorm4x8:
  7031. libCall = spv::GLSLstd450PackUnorm4x8;
  7032. break;
  7033. case glslang::EOpUnpackUnorm4x8:
  7034. libCall = spv::GLSLstd450UnpackUnorm4x8;
  7035. break;
  7036. case glslang::EOpPackDouble2x32:
  7037. libCall = spv::GLSLstd450PackDouble2x32;
  7038. break;
  7039. case glslang::EOpUnpackDouble2x32:
  7040. libCall = spv::GLSLstd450UnpackDouble2x32;
  7041. break;
  7042. case glslang::EOpPackInt2x32:
  7043. case glslang::EOpUnpackInt2x32:
  7044. case glslang::EOpPackUint2x32:
  7045. case glslang::EOpUnpackUint2x32:
  7046. case glslang::EOpPack16:
  7047. case glslang::EOpPack32:
  7048. case glslang::EOpPack64:
  7049. case glslang::EOpUnpack32:
  7050. case glslang::EOpUnpack16:
  7051. case glslang::EOpUnpack8:
  7052. case glslang::EOpPackInt2x16:
  7053. case glslang::EOpUnpackInt2x16:
  7054. case glslang::EOpPackUint2x16:
  7055. case glslang::EOpUnpackUint2x16:
  7056. case glslang::EOpPackInt4x16:
  7057. case glslang::EOpUnpackInt4x16:
  7058. case glslang::EOpPackUint4x16:
  7059. case glslang::EOpUnpackUint4x16:
  7060. case glslang::EOpPackFloat2x16:
  7061. case glslang::EOpUnpackFloat2x16:
  7062. unaryOp = spv::Op::OpBitcast;
  7063. break;
  7064. case glslang::EOpDPdx:
  7065. unaryOp = spv::Op::OpDPdx;
  7066. break;
  7067. case glslang::EOpDPdy:
  7068. unaryOp = spv::Op::OpDPdy;
  7069. break;
  7070. case glslang::EOpFwidth:
  7071. unaryOp = spv::Op::OpFwidth;
  7072. break;
  7073. case glslang::EOpAny:
  7074. unaryOp = spv::Op::OpAny;
  7075. break;
  7076. case glslang::EOpAll:
  7077. unaryOp = spv::Op::OpAll;
  7078. break;
  7079. case glslang::EOpAbs:
  7080. if (isFloat)
  7081. libCall = spv::GLSLstd450FAbs;
  7082. else
  7083. libCall = spv::GLSLstd450SAbs;
  7084. break;
  7085. case glslang::EOpSign:
  7086. if (isFloat)
  7087. libCall = spv::GLSLstd450FSign;
  7088. else
  7089. libCall = spv::GLSLstd450SSign;
  7090. break;
  7091. case glslang::EOpDPdxFine:
  7092. unaryOp = spv::Op::OpDPdxFine;
  7093. break;
  7094. case glslang::EOpDPdyFine:
  7095. unaryOp = spv::Op::OpDPdyFine;
  7096. break;
  7097. case glslang::EOpFwidthFine:
  7098. unaryOp = spv::Op::OpFwidthFine;
  7099. break;
  7100. case glslang::EOpDPdxCoarse:
  7101. unaryOp = spv::Op::OpDPdxCoarse;
  7102. break;
  7103. case glslang::EOpDPdyCoarse:
  7104. unaryOp = spv::Op::OpDPdyCoarse;
  7105. break;
  7106. case glslang::EOpFwidthCoarse:
  7107. unaryOp = spv::Op::OpFwidthCoarse;
  7108. break;
  7109. case glslang::EOpRayQueryProceed:
  7110. unaryOp = spv::Op::OpRayQueryProceedKHR;
  7111. break;
  7112. case glslang::EOpRayQueryGetRayTMin:
  7113. unaryOp = spv::Op::OpRayQueryGetRayTMinKHR;
  7114. break;
  7115. case glslang::EOpRayQueryGetRayFlags:
  7116. unaryOp = spv::Op::OpRayQueryGetRayFlagsKHR;
  7117. break;
  7118. case glslang::EOpRayQueryGetWorldRayOrigin:
  7119. unaryOp = spv::Op::OpRayQueryGetWorldRayOriginKHR;
  7120. break;
  7121. case glslang::EOpRayQueryGetWorldRayDirection:
  7122. unaryOp = spv::Op::OpRayQueryGetWorldRayDirectionKHR;
  7123. break;
  7124. case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
  7125. unaryOp = spv::Op::OpRayQueryGetIntersectionCandidateAABBOpaqueKHR;
  7126. break;
  7127. case glslang::EOpInterpolateAtCentroid:
  7128. if (typeProxy == glslang::EbtFloat16)
  7129. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  7130. libCall = spv::GLSLstd450InterpolateAtCentroid;
  7131. break;
  7132. case glslang::EOpAtomicCounterIncrement:
  7133. case glslang::EOpAtomicCounterDecrement:
  7134. case glslang::EOpAtomicCounter:
  7135. {
  7136. // Handle all of the atomics in one place, in createAtomicOperation()
  7137. std::vector<spv::Id> operands;
  7138. operands.push_back(operand);
  7139. return createAtomicOperation(op, decorations.precision, typeId, operands, typeProxy, lvalueCoherentFlags, opType);
  7140. }
  7141. case glslang::EOpBitFieldReverse:
  7142. unaryOp = spv::Op::OpBitReverse;
  7143. break;
  7144. case glslang::EOpBitCount:
  7145. unaryOp = spv::Op::OpBitCount;
  7146. break;
  7147. case glslang::EOpFindLSB:
  7148. libCall = spv::GLSLstd450FindILsb;
  7149. break;
  7150. case glslang::EOpFindMSB:
  7151. if (isUnsigned)
  7152. libCall = spv::GLSLstd450FindUMsb;
  7153. else
  7154. libCall = spv::GLSLstd450FindSMsb;
  7155. break;
  7156. case glslang::EOpCountLeadingZeros:
  7157. builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
  7158. builder.addExtension("SPV_INTEL_shader_integer_functions2");
  7159. unaryOp = spv::Op::OpUCountLeadingZerosINTEL;
  7160. break;
  7161. case glslang::EOpCountTrailingZeros:
  7162. builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
  7163. builder.addExtension("SPV_INTEL_shader_integer_functions2");
  7164. unaryOp = spv::Op::OpUCountTrailingZerosINTEL;
  7165. break;
  7166. case glslang::EOpBallot:
  7167. case glslang::EOpReadFirstInvocation:
  7168. case glslang::EOpAnyInvocation:
  7169. case glslang::EOpAllInvocations:
  7170. case glslang::EOpAllInvocationsEqual:
  7171. case glslang::EOpMinInvocations:
  7172. case glslang::EOpMaxInvocations:
  7173. case glslang::EOpAddInvocations:
  7174. case glslang::EOpMinInvocationsNonUniform:
  7175. case glslang::EOpMaxInvocationsNonUniform:
  7176. case glslang::EOpAddInvocationsNonUniform:
  7177. case glslang::EOpMinInvocationsInclusiveScan:
  7178. case glslang::EOpMaxInvocationsInclusiveScan:
  7179. case glslang::EOpAddInvocationsInclusiveScan:
  7180. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  7181. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  7182. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  7183. case glslang::EOpMinInvocationsExclusiveScan:
  7184. case glslang::EOpMaxInvocationsExclusiveScan:
  7185. case glslang::EOpAddInvocationsExclusiveScan:
  7186. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  7187. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  7188. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  7189. {
  7190. std::vector<spv::Id> operands;
  7191. operands.push_back(operand);
  7192. return createInvocationsOperation(op, typeId, operands, typeProxy);
  7193. }
  7194. case glslang::EOpSubgroupAll:
  7195. case glslang::EOpSubgroupAny:
  7196. case glslang::EOpSubgroupAllEqual:
  7197. case glslang::EOpSubgroupBroadcastFirst:
  7198. case glslang::EOpSubgroupBallot:
  7199. case glslang::EOpSubgroupInverseBallot:
  7200. case glslang::EOpSubgroupBallotBitCount:
  7201. case glslang::EOpSubgroupBallotInclusiveBitCount:
  7202. case glslang::EOpSubgroupBallotExclusiveBitCount:
  7203. case glslang::EOpSubgroupBallotFindLSB:
  7204. case glslang::EOpSubgroupBallotFindMSB:
  7205. case glslang::EOpSubgroupAdd:
  7206. case glslang::EOpSubgroupMul:
  7207. case glslang::EOpSubgroupMin:
  7208. case glslang::EOpSubgroupMax:
  7209. case glslang::EOpSubgroupAnd:
  7210. case glslang::EOpSubgroupOr:
  7211. case glslang::EOpSubgroupXor:
  7212. case glslang::EOpSubgroupInclusiveAdd:
  7213. case glslang::EOpSubgroupInclusiveMul:
  7214. case glslang::EOpSubgroupInclusiveMin:
  7215. case glslang::EOpSubgroupInclusiveMax:
  7216. case glslang::EOpSubgroupInclusiveAnd:
  7217. case glslang::EOpSubgroupInclusiveOr:
  7218. case glslang::EOpSubgroupInclusiveXor:
  7219. case glslang::EOpSubgroupExclusiveAdd:
  7220. case glslang::EOpSubgroupExclusiveMul:
  7221. case glslang::EOpSubgroupExclusiveMin:
  7222. case glslang::EOpSubgroupExclusiveMax:
  7223. case glslang::EOpSubgroupExclusiveAnd:
  7224. case glslang::EOpSubgroupExclusiveOr:
  7225. case glslang::EOpSubgroupExclusiveXor:
  7226. case glslang::EOpSubgroupQuadSwapHorizontal:
  7227. case glslang::EOpSubgroupQuadSwapVertical:
  7228. case glslang::EOpSubgroupQuadSwapDiagonal:
  7229. case glslang::EOpSubgroupQuadAll:
  7230. case glslang::EOpSubgroupQuadAny: {
  7231. std::vector<spv::Id> operands;
  7232. operands.push_back(operand);
  7233. return createSubgroupOperation(op, typeId, operands, typeProxy);
  7234. }
  7235. case glslang::EOpMbcnt:
  7236. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  7237. libCall = spv::MbcntAMD;
  7238. break;
  7239. case glslang::EOpCubeFaceIndex:
  7240. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);
  7241. libCall = spv::CubeFaceIndexAMD;
  7242. break;
  7243. case glslang::EOpCubeFaceCoord:
  7244. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);
  7245. libCall = spv::CubeFaceCoordAMD;
  7246. break;
  7247. case glslang::EOpSubgroupPartition:
  7248. unaryOp = spv::Op::OpGroupNonUniformPartitionNV;
  7249. break;
  7250. case glslang::EOpConstructReference:
  7251. unaryOp = spv::Op::OpBitcast;
  7252. break;
  7253. case glslang::EOpConvUint64ToAccStruct:
  7254. case glslang::EOpConvUvec2ToAccStruct:
  7255. unaryOp = spv::Op::OpConvertUToAccelerationStructureKHR;
  7256. break;
  7257. case glslang::EOpHitObjectIsEmptyNV:
  7258. unaryOp = spv::Op::OpHitObjectIsEmptyNV;
  7259. break;
  7260. case glslang::EOpHitObjectIsMissNV:
  7261. unaryOp = spv::Op::OpHitObjectIsMissNV;
  7262. break;
  7263. case glslang::EOpHitObjectIsHitNV:
  7264. unaryOp = spv::Op::OpHitObjectIsHitNV;
  7265. break;
  7266. case glslang::EOpHitObjectGetObjectRayOriginNV:
  7267. unaryOp = spv::Op::OpHitObjectGetObjectRayOriginNV;
  7268. break;
  7269. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  7270. unaryOp = spv::Op::OpHitObjectGetObjectRayDirectionNV;
  7271. break;
  7272. case glslang::EOpHitObjectGetWorldRayOriginNV:
  7273. unaryOp = spv::Op::OpHitObjectGetWorldRayOriginNV;
  7274. break;
  7275. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  7276. unaryOp = spv::Op::OpHitObjectGetWorldRayDirectionNV;
  7277. break;
  7278. case glslang::EOpHitObjectGetObjectToWorldNV:
  7279. unaryOp = spv::Op::OpHitObjectGetObjectToWorldNV;
  7280. break;
  7281. case glslang::EOpHitObjectGetWorldToObjectNV:
  7282. unaryOp = spv::Op::OpHitObjectGetWorldToObjectNV;
  7283. break;
  7284. case glslang::EOpHitObjectGetRayTMinNV:
  7285. unaryOp = spv::Op::OpHitObjectGetRayTMinNV;
  7286. break;
  7287. case glslang::EOpHitObjectGetRayTMaxNV:
  7288. unaryOp = spv::Op::OpHitObjectGetRayTMaxNV;
  7289. break;
  7290. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  7291. unaryOp = spv::Op::OpHitObjectGetPrimitiveIndexNV;
  7292. break;
  7293. case glslang::EOpHitObjectGetInstanceIdNV:
  7294. unaryOp = spv::Op::OpHitObjectGetInstanceIdNV;
  7295. break;
  7296. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  7297. unaryOp = spv::Op::OpHitObjectGetInstanceCustomIndexNV;
  7298. break;
  7299. case glslang::EOpHitObjectGetGeometryIndexNV:
  7300. unaryOp = spv::Op::OpHitObjectGetGeometryIndexNV;
  7301. break;
  7302. case glslang::EOpHitObjectGetHitKindNV:
  7303. unaryOp = spv::Op::OpHitObjectGetHitKindNV;
  7304. break;
  7305. case glslang::EOpHitObjectGetCurrentTimeNV:
  7306. unaryOp = spv::Op::OpHitObjectGetCurrentTimeNV;
  7307. break;
  7308. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  7309. unaryOp = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexNV;
  7310. break;
  7311. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  7312. unaryOp = spv::Op::OpHitObjectGetShaderRecordBufferHandleNV;
  7313. break;
  7314. case glslang::EOpHitObjectGetClusterIdNV:
  7315. unaryOp = spv::Op::OpHitObjectGetClusterIdNV;
  7316. builder.addExtension(spv::E_SPV_NV_cluster_acceleration_structure);
  7317. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7318. builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
  7319. break;
  7320. case glslang::EOpHitObjectGetSpherePositionNV:
  7321. unaryOp = spv::Op::OpHitObjectGetSpherePositionNV;
  7322. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7323. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7324. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  7325. break;
  7326. case glslang::EOpHitObjectGetSphereRadiusNV:
  7327. unaryOp = spv::Op::OpHitObjectGetSphereRadiusNV;
  7328. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7329. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7330. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  7331. break;
  7332. case glslang::EOpHitObjectIsSphereHitNV:
  7333. unaryOp = spv::Op::OpHitObjectIsSphereHitNV;
  7334. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7335. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7336. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  7337. break;
  7338. case glslang::EOpHitObjectIsLSSHitNV:
  7339. unaryOp = spv::Op::OpHitObjectIsLSSHitNV;
  7340. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7341. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7342. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  7343. break;
  7344. case glslang::EOpFetchMicroTriangleVertexPositionNV:
  7345. unaryOp = spv::Op::OpFetchMicroTriangleVertexPositionNV;
  7346. break;
  7347. case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
  7348. unaryOp = spv::Op::OpFetchMicroTriangleVertexBarycentricNV;
  7349. break;
  7350. case glslang::EOpCopyObject:
  7351. unaryOp = spv::Op::OpCopyObject;
  7352. break;
  7353. case glslang::EOpDepthAttachmentReadEXT:
  7354. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  7355. builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
  7356. unaryOp = spv::Op::OpDepthAttachmentReadEXT;
  7357. decorations.precision = spv::NoPrecision;
  7358. break;
  7359. case glslang::EOpStencilAttachmentReadEXT:
  7360. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  7361. builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
  7362. unaryOp = spv::Op::OpStencilAttachmentReadEXT;
  7363. decorations.precision = spv::Decoration::RelaxedPrecision;
  7364. break;
  7365. default:
  7366. return 0;
  7367. }
  7368. spv::Id id;
  7369. if (libCall >= 0) {
  7370. std::vector<spv::Id> args;
  7371. args.push_back(operand);
  7372. id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, args);
  7373. } else {
  7374. id = builder.createUnaryOp(unaryOp, typeId, operand);
  7375. }
  7376. decorations.addNoContraction(builder, id);
  7377. decorations.addNonUniform(builder, id);
  7378. return builder.setPrecision(id, decorations.precision);
  7379. }
  7380. // Create a unary operation on a matrix
  7381. spv::Id TGlslangToSpvTraverser::createUnaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,
  7382. spv::Id operand, glslang::TBasicType /* typeProxy */)
  7383. {
  7384. // Handle unary operations vector by vector.
  7385. // The result type is the same type as the original type.
  7386. // The algorithm is to:
  7387. // - break the matrix into vectors
  7388. // - apply the operation to each vector
  7389. // - make a matrix out the vector results
  7390. // get the types sorted out
  7391. int numCols = builder.getNumColumns(operand);
  7392. int numRows = builder.getNumRows(operand);
  7393. spv::Id srcVecType = builder.makeVectorType(builder.getScalarTypeId(builder.getTypeId(operand)), numRows);
  7394. spv::Id destVecType = builder.makeVectorType(builder.getScalarTypeId(typeId), numRows);
  7395. std::vector<spv::Id> results;
  7396. // do each vector op
  7397. for (int c = 0; c < numCols; ++c) {
  7398. std::vector<unsigned int> indexes;
  7399. indexes.push_back(c);
  7400. spv::Id srcVec = builder.createCompositeExtract(operand, srcVecType, indexes);
  7401. spv::Id destVec = builder.createUnaryOp(op, destVecType, srcVec);
  7402. decorations.addNoContraction(builder, destVec);
  7403. decorations.addNonUniform(builder, destVec);
  7404. results.push_back(builder.setPrecision(destVec, decorations.precision));
  7405. }
  7406. // put the pieces together
  7407. spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);
  7408. decorations.addNonUniform(builder, result);
  7409. return result;
  7410. }
  7411. // For converting integers where both the bitwidth and the signedness could
  7412. // change, but only do the width change here. The caller is still responsible
  7413. // for the signedness conversion.
  7414. // destType is the final type that will be converted to, but this function
  7415. // may only be doing part of that conversion.
  7416. spv::Id TGlslangToSpvTraverser::createIntWidthConversion(spv::Id operand, int vectorSize, spv::Id destType,
  7417. glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType)
  7418. {
  7419. // Get the result type width, based on the type to convert to.
  7420. int width = GetNumBits(resultBasicType);
  7421. // Get the conversion operation and result type,
  7422. // based on the target width, but the source type.
  7423. spv::Id type = spv::NoType;
  7424. spv::Op convOp = spv::Op::OpNop;
  7425. if (isTypeSignedInt(operandBasicType)) {
  7426. convOp = spv::Op::OpSConvert;
  7427. type = builder.makeIntType(width);
  7428. } else {
  7429. convOp = spv::Op::OpUConvert;
  7430. type = builder.makeUintType(width);
  7431. }
  7432. if (builder.getOpCode(destType) == spv::Op::OpTypeCooperativeVectorNV) {
  7433. type = builder.makeCooperativeVectorTypeNV(type, builder.getCooperativeVectorNumComponents(destType));
  7434. } else if (vectorSize > 0)
  7435. type = builder.makeVectorType(type, vectorSize);
  7436. else if (builder.getOpCode(destType) == spv::Op::OpTypeCooperativeMatrixKHR ||
  7437. builder.getOpCode(destType) == spv::Op::OpTypeCooperativeMatrixNV) {
  7438. type = builder.makeCooperativeMatrixTypeWithSameShape(type, destType);
  7439. }
  7440. return builder.createUnaryOp(convOp, type, operand);
  7441. }
  7442. spv::Id TGlslangToSpvTraverser::createConversion(glslang::TOperator op, OpDecorations& decorations, spv::Id destType,
  7443. spv::Id operand, glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType)
  7444. {
  7445. spv::Op convOp = spv::Op::OpNop;
  7446. spv::Id zero = 0;
  7447. spv::Id one = 0;
  7448. int vectorSize = builder.isVectorType(destType) ? builder.getNumTypeComponents(destType) : 0;
  7449. if (IsOpNumericConv(op) || op == glslang::EOpConstructSaturated) {
  7450. if (isTypeSignedInt(operandBasicType) && isTypeFloat(resultBasicType)) {
  7451. convOp = spv::Op::OpConvertSToF;
  7452. }
  7453. if (isTypeUnsignedInt(operandBasicType) && isTypeFloat(resultBasicType)) {
  7454. convOp = spv::Op::OpConvertUToF;
  7455. }
  7456. if (isTypeFloat(operandBasicType) && isTypeSignedInt(resultBasicType)) {
  7457. convOp = spv::Op::OpConvertFToS;
  7458. }
  7459. if (isTypeFloat(operandBasicType) && isTypeUnsignedInt(resultBasicType)) {
  7460. convOp = spv::Op::OpConvertFToU;
  7461. }
  7462. if (isTypeSignedInt(operandBasicType) && isTypeSignedInt(resultBasicType)) {
  7463. convOp = spv::Op::OpSConvert;
  7464. }
  7465. if (isTypeUnsignedInt(operandBasicType) && isTypeUnsignedInt(resultBasicType)) {
  7466. convOp = spv::Op::OpUConvert;
  7467. }
  7468. if (isTypeFloat(operandBasicType) && isTypeFloat(resultBasicType)) {
  7469. convOp = spv::Op::OpFConvert;
  7470. if (builder.isMatrixType(destType))
  7471. return createUnaryMatrixOperation(convOp, decorations, destType, operand, operandBasicType);
  7472. }
  7473. if (isTypeInt(operandBasicType) && isTypeInt(resultBasicType) &&
  7474. isTypeUnsignedInt(operandBasicType) != isTypeUnsignedInt(resultBasicType)) {
  7475. if (GetNumBits(operandBasicType) != GetNumBits(resultBasicType)) {
  7476. // OpSConvert/OpUConvert + OpBitCast
  7477. operand = createIntWidthConversion(operand, vectorSize, destType, resultBasicType, operandBasicType);
  7478. }
  7479. if (builder.isInSpecConstCodeGenMode()) {
  7480. uint32_t bits = GetNumBits(resultBasicType);
  7481. spv::Id zeroType = builder.makeUintType(bits);
  7482. if (bits == 64) {
  7483. zero = builder.makeInt64Constant(zeroType, 0, false);
  7484. } else {
  7485. zero = builder.makeIntConstant(zeroType, 0, false);
  7486. }
  7487. zero = makeSmearedConstant(zero, vectorSize);
  7488. // Use OpIAdd, instead of OpBitcast to do the conversion when
  7489. // generating for OpSpecConstantOp instruction.
  7490. return builder.createBinOp(spv::Op::OpIAdd, destType, operand, zero);
  7491. }
  7492. // For normal run-time conversion instruction, use OpBitcast.
  7493. convOp = spv::Op::OpBitcast;
  7494. }
  7495. if (resultBasicType == glslang::EbtBool) {
  7496. uint32_t bits = GetNumBits(operandBasicType);
  7497. if (isTypeInt(operandBasicType)) {
  7498. spv::Id zeroType = builder.makeUintType(bits);
  7499. if (bits == 64) {
  7500. zero = builder.makeInt64Constant(zeroType, 0, false);
  7501. } else {
  7502. zero = builder.makeIntConstant(zeroType, 0, false);
  7503. }
  7504. zero = makeSmearedConstant(zero, vectorSize);
  7505. return builder.createBinOp(spv::Op::OpINotEqual, destType, operand, zero);
  7506. } else {
  7507. assert(isTypeFloat(operandBasicType));
  7508. if (bits == 64) {
  7509. zero = builder.makeDoubleConstant(0.0);
  7510. } else if (bits == 32) {
  7511. zero = builder.makeFloatConstant(0.0);
  7512. } else {
  7513. assert(bits == 16);
  7514. zero = builder.makeFloat16Constant(0.0);
  7515. }
  7516. zero = makeSmearedConstant(zero, vectorSize);
  7517. return builder.createBinOp(spv::Op::OpFUnordNotEqual, destType, operand, zero);
  7518. }
  7519. }
  7520. if (operandBasicType == glslang::EbtBool) {
  7521. uint32_t bits = GetNumBits(resultBasicType);
  7522. convOp = spv::Op::OpSelect;
  7523. if (isTypeInt(resultBasicType)) {
  7524. spv::Id zeroType = isTypeSignedInt(resultBasicType) ? builder.makeIntType(bits) : builder.makeUintType(bits);
  7525. if (bits == 64) {
  7526. zero = builder.makeInt64Constant(zeroType, 0, false);
  7527. one = builder.makeInt64Constant(zeroType, 1, false);
  7528. } else {
  7529. zero = builder.makeIntConstant(zeroType, 0, false);
  7530. one = builder.makeIntConstant(zeroType, 1, false);
  7531. }
  7532. } else {
  7533. assert(isTypeFloat(resultBasicType));
  7534. if (bits == 64) {
  7535. zero = builder.makeDoubleConstant(0.0);
  7536. one = builder.makeDoubleConstant(1.0);
  7537. } else if (bits == 32) {
  7538. zero = builder.makeFloatConstant(0.0);
  7539. one = builder.makeFloatConstant(1.0);
  7540. } else {
  7541. assert(bits == 16);
  7542. zero = builder.makeFloat16Constant(0.0);
  7543. one = builder.makeFloat16Constant(1.0);
  7544. }
  7545. }
  7546. }
  7547. }
  7548. if (convOp == spv::Op::OpNop) {
  7549. switch (op) {
  7550. case glslang::EOpConvUint64ToPtr:
  7551. convOp = spv::Op::OpConvertUToPtr;
  7552. break;
  7553. case glslang::EOpConvPtrToUint64:
  7554. convOp = spv::Op::OpConvertPtrToU;
  7555. break;
  7556. case glslang::EOpConvPtrToUvec2:
  7557. case glslang::EOpConvUvec2ToPtr:
  7558. convOp = spv::Op::OpBitcast;
  7559. break;
  7560. default:
  7561. break;
  7562. }
  7563. }
  7564. spv::Id result = 0;
  7565. if (convOp == spv::Op::OpNop)
  7566. return result;
  7567. if (convOp == spv::Op::OpSelect) {
  7568. zero = makeSmearedConstant(zero, vectorSize);
  7569. one = makeSmearedConstant(one, vectorSize);
  7570. result = builder.createTriOp(convOp, destType, operand, one, zero);
  7571. } else
  7572. result = builder.createUnaryOp(convOp, destType, operand);
  7573. result = builder.setPrecision(result, decorations.precision);
  7574. decorations.addNonUniform(builder, result);
  7575. return result;
  7576. }
  7577. spv::Id TGlslangToSpvTraverser::makeSmearedConstant(spv::Id constant, int vectorSize)
  7578. {
  7579. if (vectorSize == 0)
  7580. return constant;
  7581. spv::Id vectorTypeId = builder.makeVectorType(builder.getTypeId(constant), vectorSize);
  7582. std::vector<spv::Id> components;
  7583. for (int c = 0; c < vectorSize; ++c)
  7584. components.push_back(constant);
  7585. return builder.makeCompositeConstant(vectorTypeId, components);
  7586. }
  7587. // For glslang ops that map to SPV atomic opCodes
  7588. spv::Id TGlslangToSpvTraverser::createAtomicOperation(glslang::TOperator op, spv::Decoration /*precision*/,
  7589. spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy,
  7590. const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags, const glslang::TType &opType)
  7591. {
  7592. spv::Op opCode = spv::Op::OpNop;
  7593. switch (op) {
  7594. case glslang::EOpAtomicAdd:
  7595. case glslang::EOpImageAtomicAdd:
  7596. case glslang::EOpAtomicCounterAdd:
  7597. opCode = spv::Op::OpAtomicIAdd;
  7598. if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
  7599. opCode = spv::Op::OpAtomicFAddEXT;
  7600. if (typeProxy == glslang::EbtFloat16 &&
  7601. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  7602. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  7603. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  7604. } else {
  7605. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_add);
  7606. if (typeProxy == glslang::EbtFloat16) {
  7607. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float16_add);
  7608. builder.addCapability(spv::Capability::AtomicFloat16AddEXT);
  7609. } else if (typeProxy == glslang::EbtFloat) {
  7610. builder.addCapability(spv::Capability::AtomicFloat32AddEXT);
  7611. } else {
  7612. builder.addCapability(spv::Capability::AtomicFloat64AddEXT);
  7613. }
  7614. }
  7615. }
  7616. break;
  7617. case glslang::EOpAtomicSubtract:
  7618. case glslang::EOpAtomicCounterSubtract:
  7619. opCode = spv::Op::OpAtomicISub;
  7620. break;
  7621. case glslang::EOpAtomicMin:
  7622. case glslang::EOpImageAtomicMin:
  7623. case glslang::EOpAtomicCounterMin:
  7624. if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
  7625. opCode = spv::Op::OpAtomicFMinEXT;
  7626. if (typeProxy == glslang::EbtFloat16 &&
  7627. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  7628. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  7629. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  7630. } else {
  7631. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_min_max);
  7632. if (typeProxy == glslang::EbtFloat16)
  7633. builder.addCapability(spv::Capability::AtomicFloat16MinMaxEXT);
  7634. else if (typeProxy == glslang::EbtFloat)
  7635. builder.addCapability(spv::Capability::AtomicFloat32MinMaxEXT);
  7636. else
  7637. builder.addCapability(spv::Capability::AtomicFloat64MinMaxEXT);
  7638. }
  7639. } else if (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) {
  7640. opCode = spv::Op::OpAtomicUMin;
  7641. } else {
  7642. opCode = spv::Op::OpAtomicSMin;
  7643. }
  7644. break;
  7645. case glslang::EOpAtomicMax:
  7646. case glslang::EOpImageAtomicMax:
  7647. case glslang::EOpAtomicCounterMax:
  7648. if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
  7649. opCode = spv::Op::OpAtomicFMaxEXT;
  7650. if (typeProxy == glslang::EbtFloat16 &&
  7651. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  7652. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  7653. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  7654. } else {
  7655. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_min_max);
  7656. if (typeProxy == glslang::EbtFloat16)
  7657. builder.addCapability(spv::Capability::AtomicFloat16MinMaxEXT);
  7658. else if (typeProxy == glslang::EbtFloat)
  7659. builder.addCapability(spv::Capability::AtomicFloat32MinMaxEXT);
  7660. else
  7661. builder.addCapability(spv::Capability::AtomicFloat64MinMaxEXT);
  7662. }
  7663. } else if (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) {
  7664. opCode = spv::Op::OpAtomicUMax;
  7665. } else {
  7666. opCode = spv::Op::OpAtomicSMax;
  7667. }
  7668. break;
  7669. case glslang::EOpAtomicAnd:
  7670. case glslang::EOpImageAtomicAnd:
  7671. case glslang::EOpAtomicCounterAnd:
  7672. opCode = spv::Op::OpAtomicAnd;
  7673. break;
  7674. case glslang::EOpAtomicOr:
  7675. case glslang::EOpImageAtomicOr:
  7676. case glslang::EOpAtomicCounterOr:
  7677. opCode = spv::Op::OpAtomicOr;
  7678. break;
  7679. case glslang::EOpAtomicXor:
  7680. case glslang::EOpImageAtomicXor:
  7681. case glslang::EOpAtomicCounterXor:
  7682. opCode = spv::Op::OpAtomicXor;
  7683. break;
  7684. case glslang::EOpAtomicExchange:
  7685. case glslang::EOpImageAtomicExchange:
  7686. case glslang::EOpAtomicCounterExchange:
  7687. if ((typeProxy == glslang::EbtFloat16) &&
  7688. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  7689. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  7690. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  7691. }
  7692. opCode = spv::Op::OpAtomicExchange;
  7693. break;
  7694. case glslang::EOpAtomicCompSwap:
  7695. case glslang::EOpImageAtomicCompSwap:
  7696. case glslang::EOpAtomicCounterCompSwap:
  7697. opCode = spv::Op::OpAtomicCompareExchange;
  7698. break;
  7699. case glslang::EOpAtomicCounterIncrement:
  7700. opCode = spv::Op::OpAtomicIIncrement;
  7701. break;
  7702. case glslang::EOpAtomicCounterDecrement:
  7703. opCode = spv::Op::OpAtomicIDecrement;
  7704. break;
  7705. case glslang::EOpAtomicCounter:
  7706. case glslang::EOpImageAtomicLoad:
  7707. case glslang::EOpAtomicLoad:
  7708. opCode = spv::Op::OpAtomicLoad;
  7709. break;
  7710. case glslang::EOpAtomicStore:
  7711. case glslang::EOpImageAtomicStore:
  7712. opCode = spv::Op::OpAtomicStore;
  7713. break;
  7714. default:
  7715. assert(0);
  7716. break;
  7717. }
  7718. if (typeProxy == glslang::EbtInt64 || typeProxy == glslang::EbtUint64)
  7719. builder.addCapability(spv::Capability::Int64Atomics);
  7720. // Sort out the operands
  7721. // - mapping from glslang -> SPV
  7722. // - there are extra SPV operands that are optional in glslang
  7723. // - compare-exchange swaps the value and comparator
  7724. // - compare-exchange has an extra memory semantics
  7725. // - EOpAtomicCounterDecrement needs a post decrement
  7726. spv::Id pointerId = 0, compareId = 0, valueId = 0;
  7727. // scope defaults to Device in the old model, QueueFamilyKHR in the new model
  7728. spv::Id scopeId;
  7729. if (glslangIntermediate->usingVulkanMemoryModel()) {
  7730. scopeId = builder.makeUintConstant(spv::Scope::QueueFamilyKHR);
  7731. } else {
  7732. scopeId = builder.makeUintConstant(spv::Scope::Device);
  7733. }
  7734. // semantics default to relaxed
  7735. spv::Id semanticsId = builder.makeUintConstant(lvalueCoherentFlags.isVolatile() &&
  7736. glslangIntermediate->usingVulkanMemoryModel() ?
  7737. spv::MemorySemanticsMask::Volatile :
  7738. spv::MemorySemanticsMask::MaskNone);
  7739. spv::Id semanticsId2 = semanticsId;
  7740. pointerId = operands[0];
  7741. if (opCode == spv::Op::OpAtomicIIncrement || opCode == spv::Op::OpAtomicIDecrement) {
  7742. // no additional operands
  7743. } else if (opCode == spv::Op::OpAtomicCompareExchange) {
  7744. compareId = operands[1];
  7745. valueId = operands[2];
  7746. if (operands.size() > 3) {
  7747. scopeId = operands[3];
  7748. semanticsId = builder.makeUintConstant(
  7749. builder.getConstantScalar(operands[4]) | builder.getConstantScalar(operands[5]));
  7750. semanticsId2 = builder.makeUintConstant(
  7751. builder.getConstantScalar(operands[6]) | builder.getConstantScalar(operands[7]));
  7752. }
  7753. } else if (opCode == spv::Op::OpAtomicLoad) {
  7754. if (operands.size() > 1) {
  7755. scopeId = operands[1];
  7756. semanticsId = builder.makeUintConstant(
  7757. builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));
  7758. }
  7759. } else {
  7760. // atomic store or RMW
  7761. valueId = operands[1];
  7762. if (operands.size() > 2) {
  7763. scopeId = operands[2];
  7764. semanticsId = builder.makeUintConstant
  7765. (builder.getConstantScalar(operands[3]) | builder.getConstantScalar(operands[4]));
  7766. }
  7767. }
  7768. // Check for capabilities
  7769. auto const semanticsImmediate = (spv::MemorySemanticsMask)(builder.getConstantScalar(semanticsId) | builder.getConstantScalar(semanticsId2));
  7770. if (anySet(semanticsImmediate, spv::MemorySemanticsMask::MakeAvailableKHR |
  7771. spv::MemorySemanticsMask::MakeVisibleKHR |
  7772. spv::MemorySemanticsMask::OutputMemoryKHR |
  7773. spv::MemorySemanticsMask::Volatile)) {
  7774. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  7775. }
  7776. auto const scope = (spv::Scope)builder.getConstantScalar(scopeId);
  7777. if (scope == spv::Scope::QueueFamily) {
  7778. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  7779. }
  7780. if (glslangIntermediate->usingVulkanMemoryModel() && scope == spv::Scope::Device) {
  7781. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  7782. }
  7783. std::vector<spv::Id> spvAtomicOperands; // hold the spv operands
  7784. spvAtomicOperands.reserve(6);
  7785. spvAtomicOperands.push_back(pointerId);
  7786. spvAtomicOperands.push_back(scopeId);
  7787. spvAtomicOperands.push_back(semanticsId);
  7788. if (opCode == spv::Op::OpAtomicCompareExchange) {
  7789. spvAtomicOperands.push_back(semanticsId2);
  7790. spvAtomicOperands.push_back(valueId);
  7791. spvAtomicOperands.push_back(compareId);
  7792. } else if (opCode != spv::Op::OpAtomicLoad && opCode != spv::Op::OpAtomicIIncrement && opCode != spv::Op::OpAtomicIDecrement) {
  7793. spvAtomicOperands.push_back(valueId);
  7794. }
  7795. if (opCode == spv::Op::OpAtomicStore) {
  7796. builder.createNoResultOp(opCode, spvAtomicOperands);
  7797. return 0;
  7798. } else {
  7799. spv::Id resultId = builder.createOp(opCode, typeId, spvAtomicOperands);
  7800. // GLSL and HLSL atomic-counter decrement return post-decrement value,
  7801. // while SPIR-V returns pre-decrement value. Translate between these semantics.
  7802. if (op == glslang::EOpAtomicCounterDecrement)
  7803. resultId = builder.createBinOp(spv::Op::OpISub, typeId, resultId, builder.makeIntConstant(1));
  7804. return resultId;
  7805. }
  7806. }
  7807. // Create group invocation operations.
  7808. spv::Id TGlslangToSpvTraverser::createInvocationsOperation(glslang::TOperator op, spv::Id typeId,
  7809. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  7810. {
  7811. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  7812. bool isFloat = isTypeFloat(typeProxy);
  7813. spv::Op opCode = spv::Op::OpNop;
  7814. std::vector<spv::IdImmediate> spvGroupOperands;
  7815. spv::GroupOperation groupOperation = spv::GroupOperation::Max;
  7816. if (op == glslang::EOpBallot || op == glslang::EOpReadFirstInvocation ||
  7817. op == glslang::EOpReadInvocation) {
  7818. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  7819. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  7820. } else if (op == glslang::EOpAnyInvocation ||
  7821. op == glslang::EOpAllInvocations ||
  7822. op == glslang::EOpAllInvocationsEqual) {
  7823. builder.addExtension(spv::E_SPV_KHR_subgroup_vote);
  7824. builder.addCapability(spv::Capability::SubgroupVoteKHR);
  7825. } else {
  7826. builder.addCapability(spv::Capability::Groups);
  7827. if (op == glslang::EOpMinInvocationsNonUniform ||
  7828. op == glslang::EOpMaxInvocationsNonUniform ||
  7829. op == glslang::EOpAddInvocationsNonUniform ||
  7830. op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||
  7831. op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||
  7832. op == glslang::EOpAddInvocationsInclusiveScanNonUniform ||
  7833. op == glslang::EOpMinInvocationsExclusiveScanNonUniform ||
  7834. op == glslang::EOpMaxInvocationsExclusiveScanNonUniform ||
  7835. op == glslang::EOpAddInvocationsExclusiveScanNonUniform)
  7836. builder.addExtension(spv::E_SPV_AMD_shader_ballot);
  7837. switch (op) {
  7838. case glslang::EOpMinInvocations:
  7839. case glslang::EOpMaxInvocations:
  7840. case glslang::EOpAddInvocations:
  7841. case glslang::EOpMinInvocationsNonUniform:
  7842. case glslang::EOpMaxInvocationsNonUniform:
  7843. case glslang::EOpAddInvocationsNonUniform:
  7844. groupOperation = spv::GroupOperation::Reduce;
  7845. break;
  7846. case glslang::EOpMinInvocationsInclusiveScan:
  7847. case glslang::EOpMaxInvocationsInclusiveScan:
  7848. case glslang::EOpAddInvocationsInclusiveScan:
  7849. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  7850. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  7851. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  7852. groupOperation = spv::GroupOperation::InclusiveScan;
  7853. break;
  7854. case glslang::EOpMinInvocationsExclusiveScan:
  7855. case glslang::EOpMaxInvocationsExclusiveScan:
  7856. case glslang::EOpAddInvocationsExclusiveScan:
  7857. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  7858. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  7859. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  7860. groupOperation = spv::GroupOperation::ExclusiveScan;
  7861. break;
  7862. default:
  7863. break;
  7864. }
  7865. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  7866. spvGroupOperands.push_back(scope);
  7867. if (groupOperation != spv::GroupOperation::Max) {
  7868. spv::IdImmediate groupOp = { false, (unsigned)groupOperation };
  7869. spvGroupOperands.push_back(groupOp);
  7870. }
  7871. }
  7872. for (auto opIt = operands.begin(); opIt != operands.end(); ++opIt) {
  7873. spv::IdImmediate op = { true, *opIt };
  7874. spvGroupOperands.push_back(op);
  7875. }
  7876. switch (op) {
  7877. case glslang::EOpAnyInvocation:
  7878. opCode = spv::Op::OpSubgroupAnyKHR;
  7879. break;
  7880. case glslang::EOpAllInvocations:
  7881. opCode = spv::Op::OpSubgroupAllKHR;
  7882. break;
  7883. case glslang::EOpAllInvocationsEqual:
  7884. opCode = spv::Op::OpSubgroupAllEqualKHR;
  7885. break;
  7886. case glslang::EOpReadInvocation:
  7887. opCode = spv::Op::OpSubgroupReadInvocationKHR;
  7888. if (builder.isVectorType(typeId))
  7889. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  7890. break;
  7891. case glslang::EOpReadFirstInvocation:
  7892. opCode = spv::Op::OpSubgroupFirstInvocationKHR;
  7893. if (builder.isVectorType(typeId))
  7894. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  7895. break;
  7896. case glslang::EOpBallot:
  7897. {
  7898. // NOTE: According to the spec, the result type of "OpSubgroupBallotKHR" must be a 4 component vector of 32
  7899. // bit integer types. The GLSL built-in function "ballotARB()" assumes the maximum number of invocations in
  7900. // a subgroup is 64. Thus, we have to convert uvec4.xy to uint64_t as follow:
  7901. //
  7902. // result = Bitcast(SubgroupBallotKHR(Predicate).xy)
  7903. //
  7904. spv::Id uintType = builder.makeUintType(32);
  7905. spv::Id uvec4Type = builder.makeVectorType(uintType, 4);
  7906. spv::Id result = builder.createOp(spv::Op::OpSubgroupBallotKHR, uvec4Type, spvGroupOperands);
  7907. std::vector<spv::Id> components;
  7908. components.push_back(builder.createCompositeExtract(result, uintType, 0));
  7909. components.push_back(builder.createCompositeExtract(result, uintType, 1));
  7910. spv::Id uvec2Type = builder.makeVectorType(uintType, 2);
  7911. return builder.createUnaryOp(spv::Op::OpBitcast, typeId,
  7912. builder.createCompositeConstruct(uvec2Type, components));
  7913. }
  7914. case glslang::EOpMinInvocations:
  7915. case glslang::EOpMaxInvocations:
  7916. case glslang::EOpAddInvocations:
  7917. case glslang::EOpMinInvocationsInclusiveScan:
  7918. case glslang::EOpMaxInvocationsInclusiveScan:
  7919. case glslang::EOpAddInvocationsInclusiveScan:
  7920. case glslang::EOpMinInvocationsExclusiveScan:
  7921. case glslang::EOpMaxInvocationsExclusiveScan:
  7922. case glslang::EOpAddInvocationsExclusiveScan:
  7923. if (op == glslang::EOpMinInvocations ||
  7924. op == glslang::EOpMinInvocationsInclusiveScan ||
  7925. op == glslang::EOpMinInvocationsExclusiveScan) {
  7926. if (isFloat)
  7927. opCode = spv::Op::OpGroupFMin;
  7928. else {
  7929. if (isUnsigned)
  7930. opCode = spv::Op::OpGroupUMin;
  7931. else
  7932. opCode = spv::Op::OpGroupSMin;
  7933. }
  7934. } else if (op == glslang::EOpMaxInvocations ||
  7935. op == glslang::EOpMaxInvocationsInclusiveScan ||
  7936. op == glslang::EOpMaxInvocationsExclusiveScan) {
  7937. if (isFloat)
  7938. opCode = spv::Op::OpGroupFMax;
  7939. else {
  7940. if (isUnsigned)
  7941. opCode = spv::Op::OpGroupUMax;
  7942. else
  7943. opCode = spv::Op::OpGroupSMax;
  7944. }
  7945. } else {
  7946. if (isFloat)
  7947. opCode = spv::Op::OpGroupFAdd;
  7948. else
  7949. opCode = spv::Op::OpGroupIAdd;
  7950. }
  7951. if (builder.isVectorType(typeId))
  7952. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  7953. break;
  7954. case glslang::EOpMinInvocationsNonUniform:
  7955. case glslang::EOpMaxInvocationsNonUniform:
  7956. case glslang::EOpAddInvocationsNonUniform:
  7957. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  7958. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  7959. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  7960. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  7961. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  7962. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  7963. if (op == glslang::EOpMinInvocationsNonUniform ||
  7964. op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||
  7965. op == glslang::EOpMinInvocationsExclusiveScanNonUniform) {
  7966. if (isFloat)
  7967. opCode = spv::Op::OpGroupFMinNonUniformAMD;
  7968. else {
  7969. if (isUnsigned)
  7970. opCode = spv::Op::OpGroupUMinNonUniformAMD;
  7971. else
  7972. opCode = spv::Op::OpGroupSMinNonUniformAMD;
  7973. }
  7974. }
  7975. else if (op == glslang::EOpMaxInvocationsNonUniform ||
  7976. op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||
  7977. op == glslang::EOpMaxInvocationsExclusiveScanNonUniform) {
  7978. if (isFloat)
  7979. opCode = spv::Op::OpGroupFMaxNonUniformAMD;
  7980. else {
  7981. if (isUnsigned)
  7982. opCode = spv::Op::OpGroupUMaxNonUniformAMD;
  7983. else
  7984. opCode = spv::Op::OpGroupSMaxNonUniformAMD;
  7985. }
  7986. }
  7987. else {
  7988. if (isFloat)
  7989. opCode = spv::Op::OpGroupFAddNonUniformAMD;
  7990. else
  7991. opCode = spv::Op::OpGroupIAddNonUniformAMD;
  7992. }
  7993. if (builder.isVectorType(typeId))
  7994. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  7995. break;
  7996. default:
  7997. logger->missingFunctionality("invocation operation");
  7998. return spv::NoResult;
  7999. }
  8000. assert(opCode != spv::Op::OpNop);
  8001. return builder.createOp(opCode, typeId, spvGroupOperands);
  8002. }
  8003. // Create group invocation operations on a vector
  8004. spv::Id TGlslangToSpvTraverser::CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,
  8005. spv::Id typeId, std::vector<spv::Id>& operands)
  8006. {
  8007. assert(op == spv::Op::OpGroupFMin || op == spv::Op::OpGroupUMin || op == spv::Op::OpGroupSMin ||
  8008. op == spv::Op::OpGroupFMax || op == spv::Op::OpGroupUMax || op == spv::Op::OpGroupSMax ||
  8009. op == spv::Op::OpGroupFAdd || op == spv::Op::OpGroupIAdd || op == spv::Op::OpGroupBroadcast ||
  8010. op == spv::Op::OpSubgroupReadInvocationKHR || op == spv::Op::OpSubgroupFirstInvocationKHR ||
  8011. op == spv::Op::OpGroupFMinNonUniformAMD || op == spv::Op::OpGroupUMinNonUniformAMD ||
  8012. op == spv::Op::OpGroupSMinNonUniformAMD ||
  8013. op == spv::Op::OpGroupFMaxNonUniformAMD || op == spv::Op::OpGroupUMaxNonUniformAMD ||
  8014. op == spv::Op::OpGroupSMaxNonUniformAMD ||
  8015. op == spv::Op::OpGroupFAddNonUniformAMD || op == spv::Op::OpGroupIAddNonUniformAMD);
  8016. // Handle group invocation operations scalar by scalar.
  8017. // The result type is the same type as the original type.
  8018. // The algorithm is to:
  8019. // - break the vector into scalars
  8020. // - apply the operation to each scalar
  8021. // - make a vector out the scalar results
  8022. // get the types sorted out
  8023. int numComponents = builder.getNumComponents(operands[0]);
  8024. spv::Id scalarType = builder.getScalarTypeId(builder.getTypeId(operands[0]));
  8025. std::vector<spv::Id> results;
  8026. // do each scalar op
  8027. for (int comp = 0; comp < numComponents; ++comp) {
  8028. std::vector<unsigned int> indexes;
  8029. indexes.push_back(comp);
  8030. spv::IdImmediate scalar = { true, builder.createCompositeExtract(operands[0], scalarType, indexes) };
  8031. std::vector<spv::IdImmediate> spvGroupOperands;
  8032. if (op == spv::Op::OpSubgroupReadInvocationKHR) {
  8033. spvGroupOperands.push_back(scalar);
  8034. spv::IdImmediate operand = { true, operands[1] };
  8035. spvGroupOperands.push_back(operand);
  8036. } else if (op == spv::Op::OpSubgroupFirstInvocationKHR) {
  8037. spvGroupOperands.push_back(scalar);
  8038. } else if (op == spv::Op::OpGroupBroadcast) {
  8039. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8040. spvGroupOperands.push_back(scope);
  8041. spvGroupOperands.push_back(scalar);
  8042. spv::IdImmediate operand = { true, operands[1] };
  8043. spvGroupOperands.push_back(operand);
  8044. } else {
  8045. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8046. spvGroupOperands.push_back(scope);
  8047. spv::IdImmediate groupOp = { false, (unsigned)groupOperation };
  8048. spvGroupOperands.push_back(groupOp);
  8049. spvGroupOperands.push_back(scalar);
  8050. }
  8051. results.push_back(builder.createOp(op, scalarType, spvGroupOperands));
  8052. }
  8053. // put the pieces together
  8054. return builder.createCompositeConstruct(typeId, results);
  8055. }
  8056. // Create subgroup invocation operations.
  8057. spv::Id TGlslangToSpvTraverser::createSubgroupOperation(glslang::TOperator op, spv::Id typeId,
  8058. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  8059. {
  8060. // Add the required capabilities.
  8061. switch (op) {
  8062. case glslang::EOpSubgroupElect:
  8063. builder.addCapability(spv::Capability::GroupNonUniform);
  8064. break;
  8065. case glslang::EOpSubgroupQuadAll:
  8066. case glslang::EOpSubgroupQuadAny:
  8067. builder.addExtension(spv::E_SPV_KHR_quad_control);
  8068. builder.addCapability(spv::Capability::QuadControlKHR);
  8069. [[fallthrough]];
  8070. case glslang::EOpSubgroupAll:
  8071. case glslang::EOpSubgroupAny:
  8072. case glslang::EOpSubgroupAllEqual:
  8073. builder.addCapability(spv::Capability::GroupNonUniform);
  8074. builder.addCapability(spv::Capability::GroupNonUniformVote);
  8075. break;
  8076. case glslang::EOpSubgroupBroadcast:
  8077. case glslang::EOpSubgroupBroadcastFirst:
  8078. case glslang::EOpSubgroupBallot:
  8079. case glslang::EOpSubgroupInverseBallot:
  8080. case glslang::EOpSubgroupBallotBitExtract:
  8081. case glslang::EOpSubgroupBallotBitCount:
  8082. case glslang::EOpSubgroupBallotInclusiveBitCount:
  8083. case glslang::EOpSubgroupBallotExclusiveBitCount:
  8084. case glslang::EOpSubgroupBallotFindLSB:
  8085. case glslang::EOpSubgroupBallotFindMSB:
  8086. builder.addCapability(spv::Capability::GroupNonUniform);
  8087. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  8088. break;
  8089. case glslang::EOpSubgroupRotate:
  8090. case glslang::EOpSubgroupClusteredRotate:
  8091. builder.addExtension(spv::E_SPV_KHR_subgroup_rotate);
  8092. builder.addCapability(spv::Capability::GroupNonUniformRotateKHR);
  8093. break;
  8094. case glslang::EOpSubgroupShuffle:
  8095. case glslang::EOpSubgroupShuffleXor:
  8096. builder.addCapability(spv::Capability::GroupNonUniform);
  8097. builder.addCapability(spv::Capability::GroupNonUniformShuffle);
  8098. break;
  8099. case glslang::EOpSubgroupShuffleUp:
  8100. case glslang::EOpSubgroupShuffleDown:
  8101. builder.addCapability(spv::Capability::GroupNonUniform);
  8102. builder.addCapability(spv::Capability::GroupNonUniformShuffleRelative);
  8103. break;
  8104. case glslang::EOpSubgroupAdd:
  8105. case glslang::EOpSubgroupMul:
  8106. case glslang::EOpSubgroupMin:
  8107. case glslang::EOpSubgroupMax:
  8108. case glslang::EOpSubgroupAnd:
  8109. case glslang::EOpSubgroupOr:
  8110. case glslang::EOpSubgroupXor:
  8111. case glslang::EOpSubgroupInclusiveAdd:
  8112. case glslang::EOpSubgroupInclusiveMul:
  8113. case glslang::EOpSubgroupInclusiveMin:
  8114. case glslang::EOpSubgroupInclusiveMax:
  8115. case glslang::EOpSubgroupInclusiveAnd:
  8116. case glslang::EOpSubgroupInclusiveOr:
  8117. case glslang::EOpSubgroupInclusiveXor:
  8118. case glslang::EOpSubgroupExclusiveAdd:
  8119. case glslang::EOpSubgroupExclusiveMul:
  8120. case glslang::EOpSubgroupExclusiveMin:
  8121. case glslang::EOpSubgroupExclusiveMax:
  8122. case glslang::EOpSubgroupExclusiveAnd:
  8123. case glslang::EOpSubgroupExclusiveOr:
  8124. case glslang::EOpSubgroupExclusiveXor:
  8125. builder.addCapability(spv::Capability::GroupNonUniform);
  8126. builder.addCapability(spv::Capability::GroupNonUniformArithmetic);
  8127. break;
  8128. case glslang::EOpSubgroupClusteredAdd:
  8129. case glslang::EOpSubgroupClusteredMul:
  8130. case glslang::EOpSubgroupClusteredMin:
  8131. case glslang::EOpSubgroupClusteredMax:
  8132. case glslang::EOpSubgroupClusteredAnd:
  8133. case glslang::EOpSubgroupClusteredOr:
  8134. case glslang::EOpSubgroupClusteredXor:
  8135. builder.addCapability(spv::Capability::GroupNonUniform);
  8136. builder.addCapability(spv::Capability::GroupNonUniformClustered);
  8137. break;
  8138. case glslang::EOpSubgroupQuadBroadcast:
  8139. case glslang::EOpSubgroupQuadSwapHorizontal:
  8140. case glslang::EOpSubgroupQuadSwapVertical:
  8141. case glslang::EOpSubgroupQuadSwapDiagonal:
  8142. builder.addCapability(spv::Capability::GroupNonUniform);
  8143. builder.addCapability(spv::Capability::GroupNonUniformQuad);
  8144. break;
  8145. case glslang::EOpSubgroupPartitionedAdd:
  8146. case glslang::EOpSubgroupPartitionedMul:
  8147. case glslang::EOpSubgroupPartitionedMin:
  8148. case glslang::EOpSubgroupPartitionedMax:
  8149. case glslang::EOpSubgroupPartitionedAnd:
  8150. case glslang::EOpSubgroupPartitionedOr:
  8151. case glslang::EOpSubgroupPartitionedXor:
  8152. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8153. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8154. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8155. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8156. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8157. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8158. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8159. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8160. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8161. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8162. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8163. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8164. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8165. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8166. builder.addExtension(spv::E_SPV_NV_shader_subgroup_partitioned);
  8167. builder.addCapability(spv::Capability::GroupNonUniformPartitionedNV);
  8168. break;
  8169. default: assert(0 && "Unhandled subgroup operation!");
  8170. }
  8171. const bool isUnsigned = isTypeUnsignedInt(typeProxy);
  8172. const bool isFloat = isTypeFloat(typeProxy);
  8173. const bool isBool = typeProxy == glslang::EbtBool;
  8174. spv::Op opCode = spv::Op::OpNop;
  8175. // Figure out which opcode to use.
  8176. switch (op) {
  8177. case glslang::EOpSubgroupElect: opCode = spv::Op::OpGroupNonUniformElect; break;
  8178. case glslang::EOpSubgroupQuadAll: opCode = spv::Op::OpGroupNonUniformQuadAllKHR; break;
  8179. case glslang::EOpSubgroupAll: opCode = spv::Op::OpGroupNonUniformAll; break;
  8180. case glslang::EOpSubgroupQuadAny: opCode = spv::Op::OpGroupNonUniformQuadAnyKHR; break;
  8181. case glslang::EOpSubgroupAny: opCode = spv::Op::OpGroupNonUniformAny; break;
  8182. case glslang::EOpSubgroupAllEqual: opCode = spv::Op::OpGroupNonUniformAllEqual; break;
  8183. case glslang::EOpSubgroupBroadcast: opCode = spv::Op::OpGroupNonUniformBroadcast; break;
  8184. case glslang::EOpSubgroupBroadcastFirst: opCode = spv::Op::OpGroupNonUniformBroadcastFirst; break;
  8185. case glslang::EOpSubgroupBallot: opCode = spv::Op::OpGroupNonUniformBallot; break;
  8186. case glslang::EOpSubgroupInverseBallot: opCode = spv::Op::OpGroupNonUniformInverseBallot; break;
  8187. case glslang::EOpSubgroupBallotBitExtract: opCode = spv::Op::OpGroupNonUniformBallotBitExtract; break;
  8188. case glslang::EOpSubgroupBallotBitCount:
  8189. case glslang::EOpSubgroupBallotInclusiveBitCount:
  8190. case glslang::EOpSubgroupBallotExclusiveBitCount: opCode = spv::Op::OpGroupNonUniformBallotBitCount; break;
  8191. case glslang::EOpSubgroupBallotFindLSB: opCode = spv::Op::OpGroupNonUniformBallotFindLSB; break;
  8192. case glslang::EOpSubgroupBallotFindMSB: opCode = spv::Op::OpGroupNonUniformBallotFindMSB; break;
  8193. case glslang::EOpSubgroupShuffle: opCode = spv::Op::OpGroupNonUniformShuffle; break;
  8194. case glslang::EOpSubgroupShuffleXor: opCode = spv::Op::OpGroupNonUniformShuffleXor; break;
  8195. case glslang::EOpSubgroupShuffleUp: opCode = spv::Op::OpGroupNonUniformShuffleUp; break;
  8196. case glslang::EOpSubgroupShuffleDown: opCode = spv::Op::OpGroupNonUniformShuffleDown; break;
  8197. case glslang::EOpSubgroupRotate:
  8198. case glslang::EOpSubgroupClusteredRotate: opCode = spv::Op::OpGroupNonUniformRotateKHR; break;
  8199. case glslang::EOpSubgroupAdd:
  8200. case glslang::EOpSubgroupInclusiveAdd:
  8201. case glslang::EOpSubgroupExclusiveAdd:
  8202. case glslang::EOpSubgroupClusteredAdd:
  8203. case glslang::EOpSubgroupPartitionedAdd:
  8204. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8205. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8206. if (isFloat) {
  8207. opCode = spv::Op::OpGroupNonUniformFAdd;
  8208. } else {
  8209. opCode = spv::Op::OpGroupNonUniformIAdd;
  8210. }
  8211. break;
  8212. case glslang::EOpSubgroupMul:
  8213. case glslang::EOpSubgroupInclusiveMul:
  8214. case glslang::EOpSubgroupExclusiveMul:
  8215. case glslang::EOpSubgroupClusteredMul:
  8216. case glslang::EOpSubgroupPartitionedMul:
  8217. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8218. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8219. if (isFloat) {
  8220. opCode = spv::Op::OpGroupNonUniformFMul;
  8221. } else {
  8222. opCode = spv::Op::OpGroupNonUniformIMul;
  8223. }
  8224. break;
  8225. case glslang::EOpSubgroupMin:
  8226. case glslang::EOpSubgroupInclusiveMin:
  8227. case glslang::EOpSubgroupExclusiveMin:
  8228. case glslang::EOpSubgroupClusteredMin:
  8229. case glslang::EOpSubgroupPartitionedMin:
  8230. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8231. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8232. if (isFloat) {
  8233. opCode = spv::Op::OpGroupNonUniformFMin;
  8234. } else if (isUnsigned) {
  8235. opCode = spv::Op::OpGroupNonUniformUMin;
  8236. } else {
  8237. opCode = spv::Op::OpGroupNonUniformSMin;
  8238. }
  8239. break;
  8240. case glslang::EOpSubgroupMax:
  8241. case glslang::EOpSubgroupInclusiveMax:
  8242. case glslang::EOpSubgroupExclusiveMax:
  8243. case glslang::EOpSubgroupClusteredMax:
  8244. case glslang::EOpSubgroupPartitionedMax:
  8245. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8246. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8247. if (isFloat) {
  8248. opCode = spv::Op::OpGroupNonUniformFMax;
  8249. } else if (isUnsigned) {
  8250. opCode = spv::Op::OpGroupNonUniformUMax;
  8251. } else {
  8252. opCode = spv::Op::OpGroupNonUniformSMax;
  8253. }
  8254. break;
  8255. case glslang::EOpSubgroupAnd:
  8256. case glslang::EOpSubgroupInclusiveAnd:
  8257. case glslang::EOpSubgroupExclusiveAnd:
  8258. case glslang::EOpSubgroupClusteredAnd:
  8259. case glslang::EOpSubgroupPartitionedAnd:
  8260. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8261. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8262. if (isBool) {
  8263. opCode = spv::Op::OpGroupNonUniformLogicalAnd;
  8264. } else {
  8265. opCode = spv::Op::OpGroupNonUniformBitwiseAnd;
  8266. }
  8267. break;
  8268. case glslang::EOpSubgroupOr:
  8269. case glslang::EOpSubgroupInclusiveOr:
  8270. case glslang::EOpSubgroupExclusiveOr:
  8271. case glslang::EOpSubgroupClusteredOr:
  8272. case glslang::EOpSubgroupPartitionedOr:
  8273. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8274. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8275. if (isBool) {
  8276. opCode = spv::Op::OpGroupNonUniformLogicalOr;
  8277. } else {
  8278. opCode = spv::Op::OpGroupNonUniformBitwiseOr;
  8279. }
  8280. break;
  8281. case glslang::EOpSubgroupXor:
  8282. case glslang::EOpSubgroupInclusiveXor:
  8283. case glslang::EOpSubgroupExclusiveXor:
  8284. case glslang::EOpSubgroupClusteredXor:
  8285. case glslang::EOpSubgroupPartitionedXor:
  8286. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8287. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8288. if (isBool) {
  8289. opCode = spv::Op::OpGroupNonUniformLogicalXor;
  8290. } else {
  8291. opCode = spv::Op::OpGroupNonUniformBitwiseXor;
  8292. }
  8293. break;
  8294. case glslang::EOpSubgroupQuadBroadcast: opCode = spv::Op::OpGroupNonUniformQuadBroadcast; break;
  8295. case glslang::EOpSubgroupQuadSwapHorizontal:
  8296. case glslang::EOpSubgroupQuadSwapVertical:
  8297. case glslang::EOpSubgroupQuadSwapDiagonal: opCode = spv::Op::OpGroupNonUniformQuadSwap; break;
  8298. default: assert(0 && "Unhandled subgroup operation!");
  8299. }
  8300. // get the right Group Operation
  8301. spv::GroupOperation groupOperation = spv::GroupOperation::Max;
  8302. switch (op) {
  8303. default:
  8304. break;
  8305. case glslang::EOpSubgroupBallotBitCount:
  8306. case glslang::EOpSubgroupAdd:
  8307. case glslang::EOpSubgroupMul:
  8308. case glslang::EOpSubgroupMin:
  8309. case glslang::EOpSubgroupMax:
  8310. case glslang::EOpSubgroupAnd:
  8311. case glslang::EOpSubgroupOr:
  8312. case glslang::EOpSubgroupXor:
  8313. groupOperation = spv::GroupOperation::Reduce;
  8314. break;
  8315. case glslang::EOpSubgroupBallotInclusiveBitCount:
  8316. case glslang::EOpSubgroupInclusiveAdd:
  8317. case glslang::EOpSubgroupInclusiveMul:
  8318. case glslang::EOpSubgroupInclusiveMin:
  8319. case glslang::EOpSubgroupInclusiveMax:
  8320. case glslang::EOpSubgroupInclusiveAnd:
  8321. case glslang::EOpSubgroupInclusiveOr:
  8322. case glslang::EOpSubgroupInclusiveXor:
  8323. groupOperation = spv::GroupOperation::InclusiveScan;
  8324. break;
  8325. case glslang::EOpSubgroupBallotExclusiveBitCount:
  8326. case glslang::EOpSubgroupExclusiveAdd:
  8327. case glslang::EOpSubgroupExclusiveMul:
  8328. case glslang::EOpSubgroupExclusiveMin:
  8329. case glslang::EOpSubgroupExclusiveMax:
  8330. case glslang::EOpSubgroupExclusiveAnd:
  8331. case glslang::EOpSubgroupExclusiveOr:
  8332. case glslang::EOpSubgroupExclusiveXor:
  8333. groupOperation = spv::GroupOperation::ExclusiveScan;
  8334. break;
  8335. case glslang::EOpSubgroupClusteredAdd:
  8336. case glslang::EOpSubgroupClusteredMul:
  8337. case glslang::EOpSubgroupClusteredMin:
  8338. case glslang::EOpSubgroupClusteredMax:
  8339. case glslang::EOpSubgroupClusteredAnd:
  8340. case glslang::EOpSubgroupClusteredOr:
  8341. case glslang::EOpSubgroupClusteredXor:
  8342. groupOperation = spv::GroupOperation::ClusteredReduce;
  8343. break;
  8344. case glslang::EOpSubgroupPartitionedAdd:
  8345. case glslang::EOpSubgroupPartitionedMul:
  8346. case glslang::EOpSubgroupPartitionedMin:
  8347. case glslang::EOpSubgroupPartitionedMax:
  8348. case glslang::EOpSubgroupPartitionedAnd:
  8349. case glslang::EOpSubgroupPartitionedOr:
  8350. case glslang::EOpSubgroupPartitionedXor:
  8351. groupOperation = spv::GroupOperation::PartitionedReduceNV;
  8352. break;
  8353. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8354. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8355. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8356. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8357. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8358. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8359. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8360. groupOperation = spv::GroupOperation::PartitionedInclusiveScanNV;
  8361. break;
  8362. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8363. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8364. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8365. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8366. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8367. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8368. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8369. groupOperation = spv::GroupOperation::PartitionedExclusiveScanNV;
  8370. break;
  8371. }
  8372. // build the instruction
  8373. std::vector<spv::IdImmediate> spvGroupOperands;
  8374. // Every operation begins with the Execution Scope operand.
  8375. spv::IdImmediate executionScope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8376. // All other ops need the execution scope. Quad Control Ops don't need scope, it's always Quad.
  8377. if (opCode != spv::Op::OpGroupNonUniformQuadAllKHR && opCode != spv::Op::OpGroupNonUniformQuadAnyKHR) {
  8378. spvGroupOperands.push_back(executionScope);
  8379. }
  8380. // Next, for all operations that use a Group Operation, push that as an operand.
  8381. if (groupOperation != spv::GroupOperation::Max) {
  8382. spv::IdImmediate groupOperand = { false, (unsigned)groupOperation };
  8383. spvGroupOperands.push_back(groupOperand);
  8384. }
  8385. // Push back the operands next.
  8386. for (auto opIt = operands.cbegin(); opIt != operands.cend(); ++opIt) {
  8387. spv::IdImmediate operand = { true, *opIt };
  8388. spvGroupOperands.push_back(operand);
  8389. }
  8390. // Some opcodes have additional operands.
  8391. spv::Id directionId = spv::NoResult;
  8392. switch (op) {
  8393. default: break;
  8394. case glslang::EOpSubgroupQuadSwapHorizontal: directionId = builder.makeUintConstant(0); break;
  8395. case glslang::EOpSubgroupQuadSwapVertical: directionId = builder.makeUintConstant(1); break;
  8396. case glslang::EOpSubgroupQuadSwapDiagonal: directionId = builder.makeUintConstant(2); break;
  8397. }
  8398. if (directionId != spv::NoResult) {
  8399. spv::IdImmediate direction = { true, directionId };
  8400. spvGroupOperands.push_back(direction);
  8401. }
  8402. return builder.createOp(opCode, typeId, spvGroupOperands);
  8403. }
  8404. spv::Id TGlslangToSpvTraverser::createMiscOperation(glslang::TOperator op, spv::Decoration precision,
  8405. spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  8406. {
  8407. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  8408. bool isFloat = isTypeFloat(typeProxy);
  8409. spv::Op opCode = spv::Op::OpNop;
  8410. int extBuiltins = -1;
  8411. int libCall = -1;
  8412. size_t consumedOperands = operands.size();
  8413. spv::Id typeId0 = 0;
  8414. if (consumedOperands > 0)
  8415. typeId0 = builder.getTypeId(operands[0]);
  8416. spv::Id typeId1 = 0;
  8417. if (consumedOperands > 1)
  8418. typeId1 = builder.getTypeId(operands[1]);
  8419. spv::Id frexpIntType = 0;
  8420. switch (op) {
  8421. case glslang::EOpMin:
  8422. if (isFloat)
  8423. libCall = nanMinMaxClamp ? spv::GLSLstd450NMin : spv::GLSLstd450FMin;
  8424. else if (isUnsigned)
  8425. libCall = spv::GLSLstd450UMin;
  8426. else
  8427. libCall = spv::GLSLstd450SMin;
  8428. builder.promoteScalar(precision, operands.front(), operands.back());
  8429. break;
  8430. case glslang::EOpModf:
  8431. {
  8432. libCall = spv::GLSLstd450ModfStruct;
  8433. assert(builder.isFloatType(builder.getScalarTypeId(typeId0)));
  8434. // The returned struct has two members of the same type as the first argument
  8435. typeId = builder.makeStructResultType(typeId0, typeId0);
  8436. consumedOperands = 1;
  8437. }
  8438. break;
  8439. case glslang::EOpMax:
  8440. if (isFloat)
  8441. libCall = nanMinMaxClamp ? spv::GLSLstd450NMax : spv::GLSLstd450FMax;
  8442. else if (isUnsigned)
  8443. libCall = spv::GLSLstd450UMax;
  8444. else
  8445. libCall = spv::GLSLstd450SMax;
  8446. builder.promoteScalar(precision, operands.front(), operands.back());
  8447. break;
  8448. case glslang::EOpPow:
  8449. libCall = spv::GLSLstd450Pow;
  8450. break;
  8451. case glslang::EOpDot:
  8452. case glslang::EOpDotPackedEXT:
  8453. case glslang::EOpDotAccSatEXT:
  8454. case glslang::EOpDotPackedAccSatEXT:
  8455. {
  8456. if (builder.isFloatType(builder.getScalarTypeId(typeId0)) ||
  8457. // HLSL supports dot(int,int) which is just a multiply
  8458. glslangIntermediate->getSource() == glslang::EShSourceHlsl) {
  8459. if (typeProxy == glslang::EbtBFloat16) {
  8460. builder.addExtension(spv::E_SPV_KHR_bfloat16);
  8461. builder.addCapability(spv::Capability::BFloat16DotProductKHR);
  8462. }
  8463. opCode = spv::Op::OpDot;
  8464. } else {
  8465. builder.addExtension(spv::E_SPV_KHR_integer_dot_product);
  8466. builder.addCapability(spv::Capability::DotProductKHR);
  8467. const unsigned int vectorSize = builder.getNumComponents(operands[0]);
  8468. if (op == glslang::EOpDotPackedEXT || op == glslang::EOpDotPackedAccSatEXT) {
  8469. builder.addCapability(spv::Capability::DotProductInput4x8BitPackedKHR);
  8470. } else if (vectorSize == 4 && builder.getScalarTypeWidth(typeId0) == 8) {
  8471. builder.addCapability(spv::Capability::DotProductInput4x8BitKHR);
  8472. } else {
  8473. builder.addCapability(spv::Capability::DotProductInputAllKHR);
  8474. }
  8475. const bool type0isSigned = builder.isIntType(builder.getScalarTypeId(typeId0));
  8476. const bool type1isSigned = builder.isIntType(builder.getScalarTypeId(typeId1));
  8477. const bool accSat = (op == glslang::EOpDotAccSatEXT || op == glslang::EOpDotPackedAccSatEXT);
  8478. if (!type0isSigned && !type1isSigned) {
  8479. opCode = accSat ? spv::Op::OpUDotAccSatKHR : spv::Op::OpUDotKHR;
  8480. } else if (type0isSigned && type1isSigned) {
  8481. opCode = accSat ? spv::Op::OpSDotAccSatKHR : spv::Op::OpSDotKHR;
  8482. } else {
  8483. opCode = accSat ? spv::Op::OpSUDotAccSatKHR : spv::Op::OpSUDotKHR;
  8484. // the spir-v opcode assumes the operands to be "signed, unsigned" in that order, so swap if needed
  8485. if (type1isSigned) {
  8486. std::swap(operands[0], operands[1]);
  8487. }
  8488. }
  8489. std::vector<spv::IdImmediate> operands2;
  8490. for (auto &o : operands) {
  8491. operands2.push_back({true, o});
  8492. }
  8493. if (op == glslang::EOpDotPackedEXT || op == glslang::EOpDotPackedAccSatEXT) {
  8494. operands2.push_back({false, 0});
  8495. }
  8496. return builder.createOp(opCode, typeId, operands2);
  8497. }
  8498. }
  8499. break;
  8500. case glslang::EOpAtan:
  8501. libCall = spv::GLSLstd450Atan2;
  8502. break;
  8503. case glslang::EOpClamp:
  8504. if (isFloat)
  8505. libCall = nanMinMaxClamp ? spv::GLSLstd450NClamp : spv::GLSLstd450FClamp;
  8506. else if (isUnsigned)
  8507. libCall = spv::GLSLstd450UClamp;
  8508. else
  8509. libCall = spv::GLSLstd450SClamp;
  8510. builder.promoteScalar(precision, operands.front(), operands[1]);
  8511. builder.promoteScalar(precision, operands.front(), operands[2]);
  8512. break;
  8513. case glslang::EOpMix:
  8514. if (! builder.isBoolType(builder.getScalarTypeId(builder.getTypeId(operands.back())))) {
  8515. assert(isFloat);
  8516. libCall = spv::GLSLstd450FMix;
  8517. } else {
  8518. opCode = spv::Op::OpSelect;
  8519. std::swap(operands.front(), operands.back());
  8520. }
  8521. builder.promoteScalar(precision, operands.front(), operands.back());
  8522. break;
  8523. case glslang::EOpStep:
  8524. libCall = spv::GLSLstd450Step;
  8525. builder.promoteScalar(precision, operands.front(), operands.back());
  8526. break;
  8527. case glslang::EOpSmoothStep:
  8528. libCall = spv::GLSLstd450SmoothStep;
  8529. builder.promoteScalar(precision, operands[0], operands[2]);
  8530. builder.promoteScalar(precision, operands[1], operands[2]);
  8531. break;
  8532. case glslang::EOpDistance:
  8533. libCall = spv::GLSLstd450Distance;
  8534. break;
  8535. case glslang::EOpCross:
  8536. libCall = spv::GLSLstd450Cross;
  8537. break;
  8538. case glslang::EOpFaceForward:
  8539. libCall = spv::GLSLstd450FaceForward;
  8540. break;
  8541. case glslang::EOpReflect:
  8542. libCall = spv::GLSLstd450Reflect;
  8543. break;
  8544. case glslang::EOpRefract:
  8545. libCall = spv::GLSLstd450Refract;
  8546. break;
  8547. case glslang::EOpBarrier:
  8548. {
  8549. // This is for the extended controlBarrier function, with four operands.
  8550. // The unextended barrier() goes through createNoArgOperation.
  8551. assert(operands.size() == 4);
  8552. auto const executionScope = (spv::Scope)builder.getConstantScalar(operands[0]);
  8553. auto const memoryScope = (spv::Scope)builder.getConstantScalar(operands[1]);
  8554. auto const semantics = (spv::MemorySemanticsMask)(builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));
  8555. builder.createControlBarrier(executionScope, memoryScope,
  8556. semantics);
  8557. if (anySet(semantics, spv::MemorySemanticsMask::MakeAvailableKHR |
  8558. spv::MemorySemanticsMask::MakeVisibleKHR |
  8559. spv::MemorySemanticsMask::OutputMemoryKHR |
  8560. spv::MemorySemanticsMask::Volatile)) {
  8561. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  8562. }
  8563. if (glslangIntermediate->usingVulkanMemoryModel() && (executionScope == spv::Scope::Device ||
  8564. memoryScope == spv::Scope::Device)) {
  8565. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  8566. }
  8567. return 0;
  8568. }
  8569. break;
  8570. case glslang::EOpMemoryBarrier:
  8571. {
  8572. // This is for the extended memoryBarrier function, with three operands.
  8573. // The unextended memoryBarrier() goes through createNoArgOperation.
  8574. assert(operands.size() == 3);
  8575. auto const memoryScope = (spv::Scope)builder.getConstantScalar(operands[0]);
  8576. auto const semantics = (spv::MemorySemanticsMask)(builder.getConstantScalar(operands[1]) | builder.getConstantScalar(operands[2]));
  8577. builder.createMemoryBarrier(memoryScope, semantics);
  8578. if (anySet(semantics, spv::MemorySemanticsMask::MakeAvailableKHR |
  8579. spv::MemorySemanticsMask::MakeVisibleKHR |
  8580. spv::MemorySemanticsMask::OutputMemoryKHR |
  8581. spv::MemorySemanticsMask::Volatile)) {
  8582. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  8583. }
  8584. if (glslangIntermediate->usingVulkanMemoryModel() && memoryScope == spv::Scope::Device) {
  8585. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  8586. }
  8587. return 0;
  8588. }
  8589. break;
  8590. case glslang::EOpInterpolateAtSample:
  8591. if (typeProxy == glslang::EbtFloat16)
  8592. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  8593. libCall = spv::GLSLstd450InterpolateAtSample;
  8594. break;
  8595. case glslang::EOpInterpolateAtOffset:
  8596. if (typeProxy == glslang::EbtFloat16)
  8597. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  8598. libCall = spv::GLSLstd450InterpolateAtOffset;
  8599. break;
  8600. case glslang::EOpAddCarry:
  8601. opCode = spv::Op::OpIAddCarry;
  8602. typeId = builder.makeStructResultType(typeId0, typeId0);
  8603. consumedOperands = 2;
  8604. break;
  8605. case glslang::EOpSubBorrow:
  8606. opCode = spv::Op::OpISubBorrow;
  8607. typeId = builder.makeStructResultType(typeId0, typeId0);
  8608. consumedOperands = 2;
  8609. break;
  8610. case glslang::EOpUMulExtended:
  8611. opCode = spv::Op::OpUMulExtended;
  8612. typeId = builder.makeStructResultType(typeId0, typeId0);
  8613. consumedOperands = 2;
  8614. break;
  8615. case glslang::EOpIMulExtended:
  8616. opCode = spv::Op::OpSMulExtended;
  8617. typeId = builder.makeStructResultType(typeId0, typeId0);
  8618. consumedOperands = 2;
  8619. break;
  8620. case glslang::EOpBitfieldExtract:
  8621. if (isUnsigned)
  8622. opCode = spv::Op::OpBitFieldUExtract;
  8623. else
  8624. opCode = spv::Op::OpBitFieldSExtract;
  8625. break;
  8626. case glslang::EOpBitfieldInsert:
  8627. opCode = spv::Op::OpBitFieldInsert;
  8628. break;
  8629. case glslang::EOpFma:
  8630. libCall = spv::GLSLstd450Fma;
  8631. break;
  8632. case glslang::EOpFrexp:
  8633. {
  8634. libCall = spv::GLSLstd450FrexpStruct;
  8635. assert(builder.isPointerType(typeId1));
  8636. typeId1 = builder.getContainedTypeId(typeId1);
  8637. int width = builder.getScalarTypeWidth(typeId1);
  8638. if (width == 16)
  8639. // Using 16-bit exp operand, enable extension SPV_AMD_gpu_shader_int16
  8640. builder.addExtension(spv::E_SPV_AMD_gpu_shader_int16);
  8641. if (builder.getNumComponents(operands[0]) == 1)
  8642. frexpIntType = builder.makeIntegerType(width, true);
  8643. else
  8644. frexpIntType = builder.makeVectorType(builder.makeIntegerType(width, true),
  8645. builder.getNumComponents(operands[0]));
  8646. typeId = builder.makeStructResultType(typeId0, frexpIntType);
  8647. consumedOperands = 1;
  8648. }
  8649. break;
  8650. case glslang::EOpLdexp:
  8651. libCall = spv::GLSLstd450Ldexp;
  8652. break;
  8653. case glslang::EOpReadInvocation:
  8654. return createInvocationsOperation(op, typeId, operands, typeProxy);
  8655. case glslang::EOpSubgroupBroadcast:
  8656. case glslang::EOpSubgroupBallotBitExtract:
  8657. case glslang::EOpSubgroupShuffle:
  8658. case glslang::EOpSubgroupShuffleXor:
  8659. case glslang::EOpSubgroupShuffleUp:
  8660. case glslang::EOpSubgroupShuffleDown:
  8661. case glslang::EOpSubgroupRotate:
  8662. case glslang::EOpSubgroupClusteredRotate:
  8663. case glslang::EOpSubgroupClusteredAdd:
  8664. case glslang::EOpSubgroupClusteredMul:
  8665. case glslang::EOpSubgroupClusteredMin:
  8666. case glslang::EOpSubgroupClusteredMax:
  8667. case glslang::EOpSubgroupClusteredAnd:
  8668. case glslang::EOpSubgroupClusteredOr:
  8669. case glslang::EOpSubgroupClusteredXor:
  8670. case glslang::EOpSubgroupQuadBroadcast:
  8671. case glslang::EOpSubgroupPartitionedAdd:
  8672. case glslang::EOpSubgroupPartitionedMul:
  8673. case glslang::EOpSubgroupPartitionedMin:
  8674. case glslang::EOpSubgroupPartitionedMax:
  8675. case glslang::EOpSubgroupPartitionedAnd:
  8676. case glslang::EOpSubgroupPartitionedOr:
  8677. case glslang::EOpSubgroupPartitionedXor:
  8678. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8679. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8680. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8681. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8682. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8683. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8684. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8685. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8686. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8687. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8688. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8689. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8690. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8691. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8692. return createSubgroupOperation(op, typeId, operands, typeProxy);
  8693. case glslang::EOpSwizzleInvocations:
  8694. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  8695. libCall = spv::SwizzleInvocationsAMD;
  8696. break;
  8697. case glslang::EOpSwizzleInvocationsMasked:
  8698. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  8699. libCall = spv::SwizzleInvocationsMaskedAMD;
  8700. break;
  8701. case glslang::EOpWriteInvocation:
  8702. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  8703. libCall = spv::WriteInvocationAMD;
  8704. break;
  8705. case glslang::EOpMin3:
  8706. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  8707. if (isFloat)
  8708. libCall = spv::FMin3AMD;
  8709. else {
  8710. if (isUnsigned)
  8711. libCall = spv::UMin3AMD;
  8712. else
  8713. libCall = spv::SMin3AMD;
  8714. }
  8715. break;
  8716. case glslang::EOpMax3:
  8717. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  8718. if (isFloat)
  8719. libCall = spv::FMax3AMD;
  8720. else {
  8721. if (isUnsigned)
  8722. libCall = spv::UMax3AMD;
  8723. else
  8724. libCall = spv::SMax3AMD;
  8725. }
  8726. break;
  8727. case glslang::EOpMid3:
  8728. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  8729. if (isFloat)
  8730. libCall = spv::FMid3AMD;
  8731. else {
  8732. if (isUnsigned)
  8733. libCall = spv::UMid3AMD;
  8734. else
  8735. libCall = spv::SMid3AMD;
  8736. }
  8737. break;
  8738. case glslang::EOpInterpolateAtVertex:
  8739. if (typeProxy == glslang::EbtFloat16)
  8740. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  8741. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  8742. libCall = spv::InterpolateAtVertexAMD;
  8743. break;
  8744. case glslang::EOpReportIntersection:
  8745. typeId = builder.makeBoolType();
  8746. opCode = spv::Op::OpReportIntersectionKHR;
  8747. break;
  8748. case glslang::EOpTraceNV:
  8749. builder.createNoResultOp(spv::Op::OpTraceNV, operands);
  8750. return 0;
  8751. case glslang::EOpTraceRayMotionNV:
  8752. builder.addExtension(spv::E_SPV_NV_ray_tracing_motion_blur);
  8753. builder.addCapability(spv::Capability::RayTracingMotionBlurNV);
  8754. builder.createNoResultOp(spv::Op::OpTraceRayMotionNV, operands);
  8755. return 0;
  8756. case glslang::EOpTraceKHR:
  8757. builder.createNoResultOp(spv::Op::OpTraceRayKHR, operands);
  8758. return 0;
  8759. case glslang::EOpExecuteCallableNV:
  8760. builder.createNoResultOp(spv::Op::OpExecuteCallableNV, operands);
  8761. return 0;
  8762. case glslang::EOpExecuteCallableKHR:
  8763. builder.createNoResultOp(spv::Op::OpExecuteCallableKHR, operands);
  8764. return 0;
  8765. case glslang::EOpRayQueryInitialize:
  8766. builder.createNoResultOp(spv::Op::OpRayQueryInitializeKHR, operands);
  8767. return 0;
  8768. case glslang::EOpRayQueryTerminate:
  8769. builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR, operands);
  8770. return 0;
  8771. case glslang::EOpRayQueryGenerateIntersection:
  8772. builder.createNoResultOp(spv::Op::OpRayQueryGenerateIntersectionKHR, operands);
  8773. return 0;
  8774. case glslang::EOpRayQueryConfirmIntersection:
  8775. builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR, operands);
  8776. return 0;
  8777. case glslang::EOpRayQueryProceed:
  8778. typeId = builder.makeBoolType();
  8779. opCode = spv::Op::OpRayQueryProceedKHR;
  8780. break;
  8781. case glslang::EOpRayQueryGetIntersectionType:
  8782. typeId = builder.makeUintType(32);
  8783. opCode = spv::Op::OpRayQueryGetIntersectionTypeKHR;
  8784. break;
  8785. case glslang::EOpRayQueryGetRayTMin:
  8786. typeId = builder.makeFloatType(32);
  8787. opCode = spv::Op::OpRayQueryGetRayTMinKHR;
  8788. break;
  8789. case glslang::EOpRayQueryGetRayFlags:
  8790. typeId = builder.makeIntType(32);
  8791. opCode = spv::Op::OpRayQueryGetRayFlagsKHR;
  8792. break;
  8793. case glslang::EOpRayQueryGetIntersectionT:
  8794. typeId = builder.makeFloatType(32);
  8795. opCode = spv::Op::OpRayQueryGetIntersectionTKHR;
  8796. break;
  8797. case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
  8798. typeId = builder.makeIntType(32);
  8799. opCode = spv::Op::OpRayQueryGetIntersectionInstanceCustomIndexKHR;
  8800. break;
  8801. case glslang::EOpRayQueryGetIntersectionInstanceId:
  8802. typeId = builder.makeIntType(32);
  8803. opCode = spv::Op::OpRayQueryGetIntersectionInstanceIdKHR;
  8804. break;
  8805. case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
  8806. typeId = builder.makeUintType(32);
  8807. opCode = spv::Op::OpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffsetKHR;
  8808. break;
  8809. case glslang::EOpRayQueryGetIntersectionGeometryIndex:
  8810. typeId = builder.makeIntType(32);
  8811. opCode = spv::Op::OpRayQueryGetIntersectionGeometryIndexKHR;
  8812. break;
  8813. case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
  8814. typeId = builder.makeIntType(32);
  8815. opCode = spv::Op::OpRayQueryGetIntersectionPrimitiveIndexKHR;
  8816. break;
  8817. case glslang::EOpRayQueryGetIntersectionBarycentrics:
  8818. typeId = builder.makeVectorType(builder.makeFloatType(32), 2);
  8819. opCode = spv::Op::OpRayQueryGetIntersectionBarycentricsKHR;
  8820. break;
  8821. case glslang::EOpRayQueryGetIntersectionFrontFace:
  8822. typeId = builder.makeBoolType();
  8823. opCode = spv::Op::OpRayQueryGetIntersectionFrontFaceKHR;
  8824. break;
  8825. case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
  8826. typeId = builder.makeBoolType();
  8827. opCode = spv::Op::OpRayQueryGetIntersectionCandidateAABBOpaqueKHR;
  8828. break;
  8829. case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
  8830. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8831. opCode = spv::Op::OpRayQueryGetIntersectionObjectRayDirectionKHR;
  8832. break;
  8833. case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
  8834. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8835. opCode = spv::Op::OpRayQueryGetIntersectionObjectRayOriginKHR;
  8836. break;
  8837. case glslang::EOpRayQueryGetWorldRayDirection:
  8838. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8839. opCode = spv::Op::OpRayQueryGetWorldRayDirectionKHR;
  8840. break;
  8841. case glslang::EOpRayQueryGetWorldRayOrigin:
  8842. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8843. opCode = spv::Op::OpRayQueryGetWorldRayOriginKHR;
  8844. break;
  8845. case glslang::EOpRayQueryGetIntersectionObjectToWorld:
  8846. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  8847. opCode = spv::Op::OpRayQueryGetIntersectionObjectToWorldKHR;
  8848. break;
  8849. case glslang::EOpRayQueryGetIntersectionClusterIdNV:
  8850. typeId = builder.makeIntegerType(32, 1);
  8851. opCode = spv::Op::OpRayQueryGetClusterIdNV;
  8852. break;
  8853. case glslang::EOpRayQueryGetIntersectionWorldToObject:
  8854. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  8855. opCode = spv::Op::OpRayQueryGetIntersectionWorldToObjectKHR;
  8856. break;
  8857. case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
  8858. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8859. opCode = spv::Op::OpRayQueryGetIntersectionSpherePositionNV;
  8860. break;
  8861. case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
  8862. typeId = builder.makeFloatType(32);
  8863. opCode = spv::Op::OpRayQueryGetIntersectionSphereRadiusNV;
  8864. break;
  8865. case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
  8866. typeId = builder.makeFloatType(32);
  8867. opCode = spv::Op::OpRayQueryGetIntersectionLSSHitValueNV;
  8868. break;
  8869. case glslang::EOpRayQueryIsSphereHitNV:
  8870. typeId = builder.makeBoolType();
  8871. opCode = spv::Op::OpRayQueryIsSphereHitNV;
  8872. break;
  8873. case glslang::EOpRayQueryIsLSSHitNV:
  8874. typeId = builder.makeBoolType();
  8875. opCode = spv::Op::OpRayQueryIsLSSHitNV;
  8876. break;
  8877. case glslang::EOpWritePackedPrimitiveIndices4x8NV:
  8878. builder.createNoResultOp(spv::Op::OpWritePackedPrimitiveIndices4x8NV, operands);
  8879. return 0;
  8880. case glslang::EOpEmitMeshTasksEXT:
  8881. if (taskPayloadID)
  8882. operands.push_back(taskPayloadID);
  8883. // As per SPV_EXT_mesh_shader make it a terminating instruction in the current block
  8884. builder.makeStatementTerminator(spv::Op::OpEmitMeshTasksEXT, operands, "post-OpEmitMeshTasksEXT");
  8885. return 0;
  8886. case glslang::EOpSetMeshOutputsEXT:
  8887. builder.createNoResultOp(spv::Op::OpSetMeshOutputsEXT, operands);
  8888. return 0;
  8889. case glslang::EOpCooperativeMatrixMulAddNV:
  8890. opCode = spv::Op::OpCooperativeMatrixMulAddNV;
  8891. break;
  8892. case glslang::EOpHitObjectTraceRayNV:
  8893. builder.createNoResultOp(spv::Op::OpHitObjectTraceRayNV, operands);
  8894. return 0;
  8895. case glslang::EOpHitObjectTraceRayMotionNV:
  8896. builder.createNoResultOp(spv::Op::OpHitObjectTraceRayMotionNV, operands);
  8897. return 0;
  8898. case glslang::EOpHitObjectRecordHitNV:
  8899. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitNV, operands);
  8900. return 0;
  8901. case glslang::EOpHitObjectRecordHitMotionNV:
  8902. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitMotionNV, operands);
  8903. return 0;
  8904. case glslang::EOpHitObjectRecordHitWithIndexNV:
  8905. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitWithIndexNV, operands);
  8906. return 0;
  8907. case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
  8908. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitWithIndexMotionNV, operands);
  8909. return 0;
  8910. case glslang::EOpHitObjectRecordMissNV:
  8911. builder.createNoResultOp(spv::Op::OpHitObjectRecordMissNV, operands);
  8912. return 0;
  8913. case glslang::EOpHitObjectRecordMissMotionNV:
  8914. builder.createNoResultOp(spv::Op::OpHitObjectRecordMissMotionNV, operands);
  8915. return 0;
  8916. case glslang::EOpHitObjectExecuteShaderNV:
  8917. builder.createNoResultOp(spv::Op::OpHitObjectExecuteShaderNV, operands);
  8918. return 0;
  8919. case glslang::EOpHitObjectIsEmptyNV:
  8920. typeId = builder.makeBoolType();
  8921. opCode = spv::Op::OpHitObjectIsEmptyNV;
  8922. break;
  8923. case glslang::EOpHitObjectIsMissNV:
  8924. typeId = builder.makeBoolType();
  8925. opCode = spv::Op::OpHitObjectIsMissNV;
  8926. break;
  8927. case glslang::EOpHitObjectIsHitNV:
  8928. typeId = builder.makeBoolType();
  8929. opCode = spv::Op::OpHitObjectIsHitNV;
  8930. break;
  8931. case glslang::EOpHitObjectIsSphereHitNV:
  8932. typeId = builder.makeBoolType();
  8933. opCode = spv::Op::OpHitObjectIsSphereHitNV;
  8934. break;
  8935. case glslang::EOpHitObjectIsLSSHitNV:
  8936. typeId = builder.makeBoolType();
  8937. opCode = spv::Op::OpHitObjectIsLSSHitNV;
  8938. break;
  8939. case glslang::EOpHitObjectGetRayTMinNV:
  8940. typeId = builder.makeFloatType(32);
  8941. opCode = spv::Op::OpHitObjectGetRayTMinNV;
  8942. break;
  8943. case glslang::EOpHitObjectGetRayTMaxNV:
  8944. typeId = builder.makeFloatType(32);
  8945. opCode = spv::Op::OpHitObjectGetRayTMaxNV;
  8946. break;
  8947. case glslang::EOpHitObjectGetObjectRayOriginNV:
  8948. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8949. opCode = spv::Op::OpHitObjectGetObjectRayOriginNV;
  8950. break;
  8951. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  8952. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8953. opCode = spv::Op::OpHitObjectGetObjectRayDirectionNV;
  8954. break;
  8955. case glslang::EOpHitObjectGetWorldRayOriginNV:
  8956. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8957. opCode = spv::Op::OpHitObjectGetWorldRayOriginNV;
  8958. break;
  8959. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  8960. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8961. opCode = spv::Op::OpHitObjectGetWorldRayDirectionNV;
  8962. break;
  8963. case glslang::EOpHitObjectGetWorldToObjectNV:
  8964. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  8965. opCode = spv::Op::OpHitObjectGetWorldToObjectNV;
  8966. break;
  8967. case glslang::EOpHitObjectGetObjectToWorldNV:
  8968. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  8969. opCode = spv::Op::OpHitObjectGetObjectToWorldNV;
  8970. break;
  8971. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  8972. typeId = builder.makeIntegerType(32, 1);
  8973. opCode = spv::Op::OpHitObjectGetInstanceCustomIndexNV;
  8974. break;
  8975. case glslang::EOpHitObjectGetInstanceIdNV:
  8976. typeId = builder.makeIntegerType(32, 1);
  8977. opCode = spv::Op::OpHitObjectGetInstanceIdNV;
  8978. break;
  8979. case glslang::EOpHitObjectGetGeometryIndexNV:
  8980. typeId = builder.makeIntegerType(32, 1);
  8981. opCode = spv::Op::OpHitObjectGetGeometryIndexNV;
  8982. break;
  8983. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  8984. typeId = builder.makeIntegerType(32, 1);
  8985. opCode = spv::Op::OpHitObjectGetPrimitiveIndexNV;
  8986. break;
  8987. case glslang::EOpHitObjectGetHitKindNV:
  8988. typeId = builder.makeIntegerType(32, 0);
  8989. opCode = spv::Op::OpHitObjectGetHitKindNV;
  8990. break;
  8991. case glslang::EOpHitObjectGetCurrentTimeNV:
  8992. typeId = builder.makeFloatType(32);
  8993. opCode = spv::Op::OpHitObjectGetCurrentTimeNV;
  8994. break;
  8995. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  8996. typeId = builder.makeIntegerType(32, 0);
  8997. opCode = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexNV;
  8998. return 0;
  8999. case glslang::EOpHitObjectGetAttributesNV:
  9000. builder.createNoResultOp(spv::Op::OpHitObjectGetAttributesNV, operands);
  9001. return 0;
  9002. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  9003. typeId = builder.makeVectorType(builder.makeUintType(32), 2);
  9004. opCode = spv::Op::OpHitObjectGetShaderRecordBufferHandleNV;
  9005. break;
  9006. case glslang::EOpHitObjectGetClusterIdNV:
  9007. typeId = builder.makeIntegerType(32, 1);
  9008. opCode = spv::Op::OpHitObjectGetClusterIdNV;
  9009. break;
  9010. case glslang::EOpReorderThreadNV: {
  9011. if (operands.size() == 2) {
  9012. builder.createNoResultOp(spv::Op::OpReorderThreadWithHintNV, operands);
  9013. } else {
  9014. builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectNV, operands);
  9015. }
  9016. return 0;
  9017. }
  9018. case glslang::EOpImageSampleWeightedQCOM:
  9019. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9020. opCode = spv::Op::OpImageSampleWeightedQCOM;
  9021. addImageProcessingQCOMDecoration(operands[2], spv::Decoration::WeightTextureQCOM);
  9022. break;
  9023. case glslang::EOpImageBoxFilterQCOM:
  9024. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9025. opCode = spv::Op::OpImageBoxFilterQCOM;
  9026. break;
  9027. case glslang::EOpImageBlockMatchSADQCOM:
  9028. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9029. opCode = spv::Op::OpImageBlockMatchSADQCOM;
  9030. addImageProcessingQCOMDecoration(operands[0], spv::Decoration::BlockMatchTextureQCOM);
  9031. addImageProcessingQCOMDecoration(operands[2], spv::Decoration::BlockMatchTextureQCOM);
  9032. break;
  9033. case glslang::EOpImageBlockMatchSSDQCOM:
  9034. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9035. opCode = spv::Op::OpImageBlockMatchSSDQCOM;
  9036. addImageProcessingQCOMDecoration(operands[0], spv::Decoration::BlockMatchTextureQCOM);
  9037. addImageProcessingQCOMDecoration(operands[2], spv::Decoration::BlockMatchTextureQCOM);
  9038. break;
  9039. case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
  9040. typeId = builder.makeVectorType(builder.makeFloatType(32), 2);
  9041. opCode = spv::Op::OpFetchMicroTriangleVertexBarycentricNV;
  9042. break;
  9043. case glslang::EOpFetchMicroTriangleVertexPositionNV:
  9044. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9045. opCode = spv::Op::OpFetchMicroTriangleVertexPositionNV;
  9046. break;
  9047. case glslang::EOpImageBlockMatchWindowSSDQCOM:
  9048. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9049. opCode = spv::Op::OpImageBlockMatchWindowSSDQCOM;
  9050. addImageProcessing2QCOMDecoration(operands[0], false);
  9051. addImageProcessing2QCOMDecoration(operands[2], false);
  9052. break;
  9053. case glslang::EOpImageBlockMatchWindowSADQCOM:
  9054. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9055. opCode = spv::Op::OpImageBlockMatchWindowSADQCOM;
  9056. addImageProcessing2QCOMDecoration(operands[0], false);
  9057. addImageProcessing2QCOMDecoration(operands[2], false);
  9058. break;
  9059. case glslang::EOpImageBlockMatchGatherSSDQCOM:
  9060. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9061. opCode = spv::Op::OpImageBlockMatchGatherSSDQCOM;
  9062. addImageProcessing2QCOMDecoration(operands[0], true);
  9063. addImageProcessing2QCOMDecoration(operands[2], true);
  9064. break;
  9065. case glslang::EOpImageBlockMatchGatherSADQCOM:
  9066. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9067. opCode = spv::Op::OpImageBlockMatchGatherSADQCOM;
  9068. addImageProcessing2QCOMDecoration(operands[0], true);
  9069. addImageProcessing2QCOMDecoration(operands[2], true);
  9070. break;
  9071. case glslang::EOpCreateTensorLayoutNV:
  9072. return builder.createOp(spv::Op::OpCreateTensorLayoutNV, typeId, std::vector<spv::Id>{});
  9073. case glslang::EOpCreateTensorViewNV:
  9074. return builder.createOp(spv::Op::OpCreateTensorViewNV, typeId, std::vector<spv::Id>{});
  9075. case glslang::EOpTensorLayoutSetBlockSizeNV:
  9076. opCode = spv::Op::OpTensorLayoutSetBlockSizeNV;
  9077. break;
  9078. case glslang::EOpTensorLayoutSetDimensionNV:
  9079. opCode = spv::Op::OpTensorLayoutSetDimensionNV;
  9080. break;
  9081. case glslang::EOpTensorLayoutSetStrideNV:
  9082. opCode = spv::Op::OpTensorLayoutSetStrideNV;
  9083. break;
  9084. case glslang::EOpTensorLayoutSliceNV:
  9085. opCode = spv::Op::OpTensorLayoutSliceNV;
  9086. break;
  9087. case glslang::EOpTensorLayoutSetClampValueNV:
  9088. opCode = spv::Op::OpTensorLayoutSetClampValueNV;
  9089. break;
  9090. case glslang::EOpTensorViewSetDimensionNV:
  9091. opCode = spv::Op::OpTensorViewSetDimensionNV;
  9092. break;
  9093. case glslang::EOpTensorViewSetStrideNV:
  9094. opCode = spv::Op::OpTensorViewSetStrideNV;
  9095. break;
  9096. case glslang::EOpTensorViewSetClipNV:
  9097. opCode = spv::Op::OpTensorViewSetClipNV;
  9098. break;
  9099. default:
  9100. return 0;
  9101. }
  9102. spv::Id id = 0;
  9103. if (libCall >= 0) {
  9104. // Use an extended instruction from the standard library.
  9105. // Construct the call arguments, without modifying the original operands vector.
  9106. // We might need the remaining arguments, e.g. in the EOpFrexp case.
  9107. std::vector<spv::Id> callArguments(operands.begin(), operands.begin() + consumedOperands);
  9108. id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, callArguments);
  9109. } else if (opCode == spv::Op::OpDot && !isFloat) {
  9110. // int dot(int, int)
  9111. // NOTE: never called for scalar/vector1, this is turned into simple mul before this can be reached
  9112. const int componentCount = builder.getNumComponents(operands[0]);
  9113. spv::Id mulOp = builder.createBinOp(spv::Op::OpIMul, builder.getTypeId(operands[0]), operands[0], operands[1]);
  9114. builder.setPrecision(mulOp, precision);
  9115. id = builder.createCompositeExtract(mulOp, typeId, 0);
  9116. for (int i = 1; i < componentCount; ++i) {
  9117. builder.setPrecision(id, precision);
  9118. id = builder.createBinOp(spv::Op::OpIAdd, typeId, id, builder.createCompositeExtract(mulOp, typeId, i));
  9119. }
  9120. } else {
  9121. switch (consumedOperands) {
  9122. case 0:
  9123. // should all be handled by visitAggregate and createNoArgOperation
  9124. assert(0);
  9125. return 0;
  9126. case 1:
  9127. // should all be handled by createUnaryOperation
  9128. assert(0);
  9129. return 0;
  9130. case 2:
  9131. id = builder.createBinOp(opCode, typeId, operands[0], operands[1]);
  9132. break;
  9133. default:
  9134. // anything 3 or over doesn't have l-value operands, so all should be consumed
  9135. assert(consumedOperands == operands.size());
  9136. id = builder.createOp(opCode, typeId, operands);
  9137. break;
  9138. }
  9139. }
  9140. // Decode the return types that were structures
  9141. switch (op) {
  9142. case glslang::EOpAddCarry:
  9143. case glslang::EOpSubBorrow:
  9144. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);
  9145. id = builder.createCompositeExtract(id, typeId0, 0);
  9146. break;
  9147. case glslang::EOpUMulExtended:
  9148. case glslang::EOpIMulExtended:
  9149. builder.createStore(builder.createCompositeExtract(id, typeId0, 0), operands[3]);
  9150. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);
  9151. break;
  9152. case glslang::EOpModf:
  9153. {
  9154. assert(operands.size() == 2);
  9155. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[1]);
  9156. id = builder.createCompositeExtract(id, typeId0, 0);
  9157. }
  9158. break;
  9159. case glslang::EOpFrexp:
  9160. {
  9161. assert(operands.size() == 2);
  9162. if (builder.isFloatType(builder.getScalarTypeId(typeId1))) {
  9163. // "exp" is floating-point type (from HLSL intrinsic)
  9164. spv::Id member1 = builder.createCompositeExtract(id, frexpIntType, 1);
  9165. member1 = builder.createUnaryOp(spv::Op::OpConvertSToF, typeId1, member1);
  9166. builder.createStore(member1, operands[1]);
  9167. } else
  9168. // "exp" is integer type (from GLSL built-in function)
  9169. builder.createStore(builder.createCompositeExtract(id, frexpIntType, 1), operands[1]);
  9170. id = builder.createCompositeExtract(id, typeId0, 0);
  9171. }
  9172. break;
  9173. default:
  9174. break;
  9175. }
  9176. return builder.setPrecision(id, precision);
  9177. }
  9178. // Intrinsics with no arguments (or no return value, and no precision).
  9179. spv::Id TGlslangToSpvTraverser::createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId)
  9180. {
  9181. // GLSL memory barriers use queuefamily scope in new model, device scope in old model
  9182. spv::Scope memoryBarrierScope = glslangIntermediate->usingVulkanMemoryModel() ?
  9183. spv::Scope::QueueFamilyKHR : spv::Scope::Device;
  9184. switch (op) {
  9185. case glslang::EOpBarrier:
  9186. if (glslangIntermediate->getStage() == EShLangTessControl) {
  9187. if (glslangIntermediate->usingVulkanMemoryModel()) {
  9188. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
  9189. spv::MemorySemanticsMask::OutputMemoryKHR |
  9190. spv::MemorySemanticsMask::AcquireRelease);
  9191. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  9192. } else {
  9193. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Invocation, spv::MemorySemanticsMask::MaskNone);
  9194. }
  9195. } else {
  9196. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
  9197. spv::MemorySemanticsMask::WorkgroupMemory |
  9198. spv::MemorySemanticsMask::AcquireRelease);
  9199. }
  9200. return 0;
  9201. case glslang::EOpMemoryBarrier:
  9202. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsAllMemory |
  9203. spv::MemorySemanticsMask::AcquireRelease);
  9204. return 0;
  9205. case glslang::EOpMemoryBarrierBuffer:
  9206. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::UniformMemory |
  9207. spv::MemorySemanticsMask::AcquireRelease);
  9208. return 0;
  9209. case glslang::EOpMemoryBarrierShared:
  9210. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::WorkgroupMemory |
  9211. spv::MemorySemanticsMask::AcquireRelease);
  9212. return 0;
  9213. case glslang::EOpGroupMemoryBarrier:
  9214. builder.createMemoryBarrier(spv::Scope::Workgroup, spv::MemorySemanticsAllMemory |
  9215. spv::MemorySemanticsMask::AcquireRelease);
  9216. return 0;
  9217. case glslang::EOpMemoryBarrierAtomicCounter:
  9218. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::AtomicCounterMemory |
  9219. spv::MemorySemanticsMask::AcquireRelease);
  9220. return 0;
  9221. case glslang::EOpMemoryBarrierImage:
  9222. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::ImageMemory |
  9223. spv::MemorySemanticsMask::AcquireRelease);
  9224. return 0;
  9225. case glslang::EOpAllMemoryBarrierWithGroupSync:
  9226. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Device,
  9227. spv::MemorySemanticsAllMemory |
  9228. spv::MemorySemanticsMask::AcquireRelease);
  9229. return 0;
  9230. case glslang::EOpDeviceMemoryBarrier:
  9231. builder.createMemoryBarrier(spv::Scope::Device, spv::MemorySemanticsMask::UniformMemory |
  9232. spv::MemorySemanticsMask::ImageMemory |
  9233. spv::MemorySemanticsMask::AcquireRelease);
  9234. return 0;
  9235. case glslang::EOpDeviceMemoryBarrierWithGroupSync:
  9236. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Device, spv::MemorySemanticsMask::UniformMemory |
  9237. spv::MemorySemanticsMask::ImageMemory |
  9238. spv::MemorySemanticsMask::AcquireRelease);
  9239. return 0;
  9240. case glslang::EOpWorkgroupMemoryBarrier:
  9241. builder.createMemoryBarrier(spv::Scope::Workgroup, spv::MemorySemanticsMask::WorkgroupMemory |
  9242. spv::MemorySemanticsMask::AcquireRelease);
  9243. return 0;
  9244. case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:
  9245. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
  9246. spv::MemorySemanticsMask::WorkgroupMemory |
  9247. spv::MemorySemanticsMask::AcquireRelease);
  9248. return 0;
  9249. case glslang::EOpSubgroupBarrier:
  9250. builder.createControlBarrier(spv::Scope::Subgroup, spv::Scope::Subgroup, spv::MemorySemanticsAllMemory |
  9251. spv::MemorySemanticsMask::AcquireRelease);
  9252. return spv::NoResult;
  9253. case glslang::EOpSubgroupMemoryBarrier:
  9254. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsAllMemory |
  9255. spv::MemorySemanticsMask::AcquireRelease);
  9256. return spv::NoResult;
  9257. case glslang::EOpSubgroupMemoryBarrierBuffer:
  9258. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::UniformMemory |
  9259. spv::MemorySemanticsMask::AcquireRelease);
  9260. return spv::NoResult;
  9261. case glslang::EOpSubgroupMemoryBarrierImage:
  9262. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::ImageMemory |
  9263. spv::MemorySemanticsMask::AcquireRelease);
  9264. return spv::NoResult;
  9265. case glslang::EOpSubgroupMemoryBarrierShared:
  9266. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::WorkgroupMemory |
  9267. spv::MemorySemanticsMask::AcquireRelease);
  9268. return spv::NoResult;
  9269. case glslang::EOpEmitVertex:
  9270. builder.createNoResultOp(spv::Op::OpEmitVertex);
  9271. return 0;
  9272. case glslang::EOpEndPrimitive:
  9273. builder.createNoResultOp(spv::Op::OpEndPrimitive);
  9274. return 0;
  9275. case glslang::EOpSubgroupElect: {
  9276. std::vector<spv::Id> operands;
  9277. return createSubgroupOperation(op, typeId, operands, glslang::EbtVoid);
  9278. }
  9279. case glslang::EOpTime:
  9280. {
  9281. std::vector<spv::Id> args; // Dummy arguments
  9282. spv::Id id = builder.createBuiltinCall(typeId, getExtBuiltins(spv::E_SPV_AMD_gcn_shader), spv::TimeAMD, args);
  9283. return builder.setPrecision(id, precision);
  9284. }
  9285. case glslang::EOpIgnoreIntersectionNV:
  9286. builder.createNoResultOp(spv::Op::OpIgnoreIntersectionNV);
  9287. return 0;
  9288. case glslang::EOpTerminateRayNV:
  9289. builder.createNoResultOp(spv::Op::OpTerminateRayNV);
  9290. return 0;
  9291. case glslang::EOpRayQueryInitialize:
  9292. builder.createNoResultOp(spv::Op::OpRayQueryInitializeKHR);
  9293. return 0;
  9294. case glslang::EOpRayQueryTerminate:
  9295. builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR);
  9296. return 0;
  9297. case glslang::EOpRayQueryGenerateIntersection:
  9298. builder.createNoResultOp(spv::Op::OpRayQueryGenerateIntersectionKHR);
  9299. return 0;
  9300. case glslang::EOpRayQueryConfirmIntersection:
  9301. builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR);
  9302. return 0;
  9303. case glslang::EOpBeginInvocationInterlock:
  9304. builder.createNoResultOp(spv::Op::OpBeginInvocationInterlockEXT);
  9305. return 0;
  9306. case glslang::EOpEndInvocationInterlock:
  9307. builder.createNoResultOp(spv::Op::OpEndInvocationInterlockEXT);
  9308. return 0;
  9309. case glslang::EOpIsHelperInvocation:
  9310. {
  9311. std::vector<spv::Id> args; // Dummy arguments
  9312. builder.addExtension(spv::E_SPV_EXT_demote_to_helper_invocation);
  9313. builder.addCapability(spv::Capability::DemoteToHelperInvocationEXT);
  9314. return builder.createOp(spv::Op::OpIsHelperInvocationEXT, typeId, args);
  9315. }
  9316. case glslang::EOpReadClockSubgroupKHR: {
  9317. std::vector<spv::Id> args;
  9318. args.push_back(builder.makeUintConstant(spv::Scope::Subgroup));
  9319. builder.addExtension(spv::E_SPV_KHR_shader_clock);
  9320. builder.addCapability(spv::Capability::ShaderClockKHR);
  9321. return builder.createOp(spv::Op::OpReadClockKHR, typeId, args);
  9322. }
  9323. case glslang::EOpReadClockDeviceKHR: {
  9324. std::vector<spv::Id> args;
  9325. args.push_back(builder.makeUintConstant(spv::Scope::Device));
  9326. builder.addExtension(spv::E_SPV_KHR_shader_clock);
  9327. builder.addCapability(spv::Capability::ShaderClockKHR);
  9328. return builder.createOp(spv::Op::OpReadClockKHR, typeId, args);
  9329. }
  9330. case glslang::EOpStencilAttachmentReadEXT:
  9331. case glslang::EOpDepthAttachmentReadEXT:
  9332. {
  9333. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  9334. spv::Decoration precision;
  9335. spv::Op spv_op;
  9336. if (op == glslang::EOpStencilAttachmentReadEXT)
  9337. {
  9338. precision = spv::Decoration::RelaxedPrecision;
  9339. spv_op = spv::Op::OpStencilAttachmentReadEXT;
  9340. builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
  9341. }
  9342. else
  9343. {
  9344. precision = spv::NoPrecision;
  9345. spv_op = spv::Op::OpDepthAttachmentReadEXT;
  9346. builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
  9347. }
  9348. std::vector<spv::Id> args; // Dummy args
  9349. spv::Id result = builder.createOp(spv_op, typeId, args);
  9350. return builder.setPrecision(result, precision);
  9351. }
  9352. default:
  9353. break;
  9354. }
  9355. logger->missingFunctionality("unknown operation with no arguments");
  9356. return 0;
  9357. }
  9358. spv::Id TGlslangToSpvTraverser::getSymbolId(const glslang::TIntermSymbol* symbol)
  9359. {
  9360. auto iter = symbolValues.find(symbol->getId());
  9361. spv::Id id;
  9362. if (symbolValues.end() != iter) {
  9363. id = iter->second;
  9364. return id;
  9365. }
  9366. // it was not found, create it
  9367. spv::BuiltIn builtIn = TranslateBuiltInDecoration(symbol->getQualifier().builtIn, false);
  9368. auto forcedType = getForcedType(symbol->getQualifier().builtIn, symbol->getType());
  9369. // There are pairs of symbols that map to the same SPIR-V built-in:
  9370. // gl_ObjectToWorldEXT and gl_ObjectToWorld3x4EXT, and gl_WorldToObjectEXT
  9371. // and gl_WorldToObject3x4EXT. SPIR-V forbids having two OpVariables
  9372. // with the same BuiltIn in the same storage class, so we must re-use one.
  9373. const bool mayNeedToReuseBuiltIn =
  9374. builtIn == spv::BuiltIn::ObjectToWorldKHR ||
  9375. builtIn == spv::BuiltIn::WorldToObjectKHR;
  9376. if (mayNeedToReuseBuiltIn) {
  9377. auto iter = builtInVariableIds.find(uint32_t(builtIn));
  9378. if (builtInVariableIds.end() != iter) {
  9379. id = iter->second;
  9380. symbolValues[symbol->getId()] = id;
  9381. if (forcedType.second != spv::NoType)
  9382. forceType[id] = forcedType.second;
  9383. return id;
  9384. }
  9385. }
  9386. if (symbol->getBasicType() == glslang::EbtFunction) {
  9387. return 0;
  9388. }
  9389. id = createSpvVariable(symbol, forcedType.first);
  9390. if (mayNeedToReuseBuiltIn) {
  9391. builtInVariableIds.insert({uint32_t(builtIn), id});
  9392. }
  9393. symbolValues[symbol->getId()] = id;
  9394. if (forcedType.second != spv::NoType)
  9395. forceType[id] = forcedType.second;
  9396. if (symbol->getBasicType() != glslang::EbtBlock) {
  9397. builder.addDecoration(id, TranslatePrecisionDecoration(symbol->getType()));
  9398. builder.addDecoration(id, TranslateInterpolationDecoration(symbol->getType().getQualifier()));
  9399. builder.addDecoration(id, TranslateAuxiliaryStorageDecoration(symbol->getType().getQualifier()));
  9400. addMeshNVDecoration(id, /*member*/ -1, symbol->getType().getQualifier());
  9401. if (symbol->getQualifier().hasComponent())
  9402. builder.addDecoration(id, spv::Decoration::Component, symbol->getQualifier().layoutComponent);
  9403. if (symbol->getQualifier().hasIndex())
  9404. builder.addDecoration(id, spv::Decoration::Index, symbol->getQualifier().layoutIndex);
  9405. if (symbol->getType().getQualifier().hasSpecConstantId())
  9406. builder.addDecoration(id, spv::Decoration::SpecId, symbol->getType().getQualifier().layoutSpecConstantId);
  9407. // atomic counters use this:
  9408. if (symbol->getQualifier().hasOffset())
  9409. builder.addDecoration(id, spv::Decoration::Offset, symbol->getQualifier().layoutOffset);
  9410. }
  9411. if (symbol->getQualifier().hasLocation()) {
  9412. if (!(glslangIntermediate->isRayTracingStage() &&
  9413. (glslangIntermediate->IsRequestedExtension(glslang::E_GL_EXT_ray_tracing) ||
  9414. glslangIntermediate->IsRequestedExtension(glslang::E_GL_NV_shader_invocation_reorder))
  9415. && (builder.getStorageClass(id) == spv::StorageClass::RayPayloadKHR ||
  9416. builder.getStorageClass(id) == spv::StorageClass::IncomingRayPayloadKHR ||
  9417. builder.getStorageClass(id) == spv::StorageClass::CallableDataKHR ||
  9418. builder.getStorageClass(id) == spv::StorageClass::IncomingCallableDataKHR ||
  9419. builder.getStorageClass(id) == spv::StorageClass::HitObjectAttributeNV))) {
  9420. // Location values are used to link TraceRayKHR/ExecuteCallableKHR/HitObjectGetAttributesNV
  9421. // to corresponding variables but are not valid in SPIRV since they are supported only
  9422. // for Input/Output Storage classes.
  9423. builder.addDecoration(id, spv::Decoration::Location, symbol->getQualifier().layoutLocation);
  9424. }
  9425. }
  9426. builder.addDecoration(id, TranslateInvariantDecoration(symbol->getType().getQualifier()));
  9427. if (symbol->getQualifier().hasStream() && glslangIntermediate->isMultiStream()) {
  9428. builder.addCapability(spv::Capability::GeometryStreams);
  9429. builder.addDecoration(id, spv::Decoration::Stream, symbol->getQualifier().layoutStream);
  9430. }
  9431. if (symbol->getQualifier().hasSet())
  9432. builder.addDecoration(id, spv::Decoration::DescriptorSet, symbol->getQualifier().layoutSet);
  9433. else if (IsDescriptorResource(symbol->getType())) {
  9434. // default to 0
  9435. builder.addDecoration(id, spv::Decoration::DescriptorSet, 0);
  9436. }
  9437. if (symbol->getQualifier().hasBinding())
  9438. builder.addDecoration(id, spv::Decoration::Binding, symbol->getQualifier().layoutBinding);
  9439. else if (IsDescriptorResource(symbol->getType())) {
  9440. // default to 0
  9441. builder.addDecoration(id, spv::Decoration::Binding, 0);
  9442. }
  9443. if (symbol->getQualifier().hasAttachment())
  9444. builder.addDecoration(id, spv::Decoration::InputAttachmentIndex, symbol->getQualifier().layoutAttachment);
  9445. if (glslangIntermediate->getXfbMode()) {
  9446. builder.addCapability(spv::Capability::TransformFeedback);
  9447. if (symbol->getQualifier().hasXfbBuffer()) {
  9448. builder.addDecoration(id, spv::Decoration::XfbBuffer, symbol->getQualifier().layoutXfbBuffer);
  9449. unsigned stride = glslangIntermediate->getXfbStride(symbol->getQualifier().layoutXfbBuffer);
  9450. if (stride != glslang::TQualifier::layoutXfbStrideEnd)
  9451. builder.addDecoration(id, spv::Decoration::XfbStride, stride);
  9452. }
  9453. if (symbol->getQualifier().hasXfbOffset())
  9454. builder.addDecoration(id, spv::Decoration::Offset, symbol->getQualifier().layoutXfbOffset);
  9455. }
  9456. // add built-in variable decoration
  9457. if (builtIn != spv::BuiltIn::Max) {
  9458. // WorkgroupSize deprecated in spirv1.6
  9459. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_6 ||
  9460. builtIn != spv::BuiltIn::WorkgroupSize)
  9461. builder.addDecoration(id, spv::Decoration::BuiltIn, (int)builtIn);
  9462. }
  9463. // Add volatile decoration to HelperInvocation for spirv1.6 and beyond
  9464. if (builtIn == spv::BuiltIn::HelperInvocation &&
  9465. !glslangIntermediate->usingVulkanMemoryModel() &&
  9466. glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  9467. builder.addDecoration(id, spv::Decoration::Volatile);
  9468. }
  9469. // Subgroup builtins which have input storage class are volatile for ray tracing stages.
  9470. if (symbol->getType().isImage() || symbol->getQualifier().isPipeInput()) {
  9471. std::vector<spv::Decoration> memory;
  9472. TranslateMemoryDecoration(symbol->getType().getQualifier(), memory,
  9473. glslangIntermediate->usingVulkanMemoryModel());
  9474. for (unsigned int i = 0; i < memory.size(); ++i)
  9475. builder.addDecoration(id, memory[i]);
  9476. }
  9477. if (builtIn == spv::BuiltIn::SampleMask) {
  9478. spv::Decoration decoration;
  9479. // GL_NV_sample_mask_override_coverage extension
  9480. if (glslangIntermediate->getLayoutOverrideCoverage())
  9481. decoration = spv::Decoration::OverrideCoverageNV;
  9482. else
  9483. decoration = spv::Decoration::Max;
  9484. builder.addDecoration(id, decoration);
  9485. if (decoration != spv::Decoration::Max) {
  9486. builder.addCapability(spv::Capability::SampleMaskOverrideCoverageNV);
  9487. builder.addExtension(spv::E_SPV_NV_sample_mask_override_coverage);
  9488. }
  9489. }
  9490. else if (builtIn == spv::BuiltIn::Layer) {
  9491. // SPV_NV_viewport_array2 extension
  9492. if (symbol->getQualifier().layoutViewportRelative) {
  9493. builder.addDecoration(id, spv::Decoration::ViewportRelativeNV);
  9494. builder.addCapability(spv::Capability::ShaderViewportMaskNV);
  9495. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  9496. }
  9497. if (symbol->getQualifier().layoutSecondaryViewportRelativeOffset != -2048) {
  9498. builder.addDecoration(id, spv::Decoration::SecondaryViewportRelativeNV,
  9499. symbol->getQualifier().layoutSecondaryViewportRelativeOffset);
  9500. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  9501. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  9502. }
  9503. }
  9504. if (symbol->getQualifier().layoutPassthrough) {
  9505. builder.addDecoration(id, spv::Decoration::PassthroughNV);
  9506. builder.addCapability(spv::Capability::GeometryShaderPassthroughNV);
  9507. builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);
  9508. }
  9509. if (symbol->getQualifier().pervertexNV) {
  9510. builder.addDecoration(id, spv::Decoration::PerVertexNV);
  9511. builder.addCapability(spv::Capability::FragmentBarycentricNV);
  9512. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  9513. }
  9514. if (symbol->getQualifier().pervertexEXT) {
  9515. builder.addDecoration(id, spv::Decoration::PerVertexKHR);
  9516. builder.addCapability(spv::Capability::FragmentBarycentricKHR);
  9517. builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
  9518. }
  9519. if (glslangIntermediate->getHlslFunctionality1() && symbol->getType().getQualifier().semanticName != nullptr) {
  9520. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  9521. builder.addDecoration(id, spv::Decoration::HlslSemanticGOOGLE,
  9522. symbol->getType().getQualifier().semanticName);
  9523. }
  9524. if (symbol->isReference()) {
  9525. builder.addDecoration(id, symbol->getType().getQualifier().restrict ?
  9526. spv::Decoration::RestrictPointerEXT : spv::Decoration::AliasedPointerEXT);
  9527. }
  9528. // Add SPIR-V decorations (GL_EXT_spirv_intrinsics)
  9529. if (symbol->getType().getQualifier().hasSpirvDecorate())
  9530. applySpirvDecorate(symbol->getType(), id, {});
  9531. return id;
  9532. }
  9533. // add per-primitive, per-view. per-task decorations to a struct member (member >= 0) or an object
  9534. void TGlslangToSpvTraverser::addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier& qualifier)
  9535. {
  9536. bool isMeshShaderExt = (glslangIntermediate->getRequestedExtensions().find(glslang::E_GL_EXT_mesh_shader) !=
  9537. glslangIntermediate->getRequestedExtensions().end());
  9538. if (member >= 0) {
  9539. if (qualifier.perPrimitiveNV) {
  9540. // Need to add capability/extension for fragment shader.
  9541. // Mesh shader already adds this by default.
  9542. if (glslangIntermediate->getStage() == EShLangFragment) {
  9543. if(isMeshShaderExt) {
  9544. builder.addCapability(spv::Capability::MeshShadingEXT);
  9545. builder.addExtension(spv::E_SPV_EXT_mesh_shader);
  9546. } else {
  9547. builder.addCapability(spv::Capability::MeshShadingNV);
  9548. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  9549. }
  9550. }
  9551. builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerPrimitiveNV);
  9552. }
  9553. if (qualifier.perViewNV)
  9554. builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerViewNV);
  9555. if (qualifier.perTaskNV)
  9556. builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerTaskNV);
  9557. } else {
  9558. if (qualifier.perPrimitiveNV) {
  9559. // Need to add capability/extension for fragment shader.
  9560. // Mesh shader already adds this by default.
  9561. if (glslangIntermediate->getStage() == EShLangFragment) {
  9562. if(isMeshShaderExt) {
  9563. builder.addCapability(spv::Capability::MeshShadingEXT);
  9564. builder.addExtension(spv::E_SPV_EXT_mesh_shader);
  9565. } else {
  9566. builder.addCapability(spv::Capability::MeshShadingNV);
  9567. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  9568. }
  9569. }
  9570. builder.addDecoration(id, spv::Decoration::PerPrimitiveNV);
  9571. }
  9572. if (qualifier.perViewNV)
  9573. builder.addDecoration(id, spv::Decoration::PerViewNV);
  9574. if (qualifier.perTaskNV)
  9575. builder.addDecoration(id, spv::Decoration::PerTaskNV);
  9576. }
  9577. }
  9578. bool TGlslangToSpvTraverser::hasQCOMImageProceessingDecoration(spv::Id id, spv::Decoration decor)
  9579. {
  9580. std::vector<spv::Decoration> &decoVec = idToQCOMDecorations[id];
  9581. for ( auto d : decoVec ) {
  9582. if ( d == decor )
  9583. return true;
  9584. }
  9585. return false;
  9586. }
  9587. void TGlslangToSpvTraverser::addImageProcessingQCOMDecoration(spv::Id id, spv::Decoration decor)
  9588. {
  9589. spv::Op opc = builder.getOpCode(id);
  9590. if (opc == spv::Op::OpSampledImage) {
  9591. id = builder.getIdOperand(id, 0);
  9592. opc = builder.getOpCode(id);
  9593. }
  9594. if (opc == spv::Op::OpLoad) {
  9595. spv::Id texid = builder.getIdOperand(id, 0);
  9596. if (!hasQCOMImageProceessingDecoration(texid, decor)) {//
  9597. builder.addDecoration(texid, decor);
  9598. idToQCOMDecorations[texid].push_back(decor);
  9599. }
  9600. }
  9601. }
  9602. void TGlslangToSpvTraverser::addImageProcessing2QCOMDecoration(spv::Id id, bool isForGather)
  9603. {
  9604. if (isForGather) {
  9605. return addImageProcessingQCOMDecoration(id, spv::Decoration::BlockMatchTextureQCOM);
  9606. }
  9607. auto addDecor =
  9608. [this](spv::Id id, spv::Decoration decor) {
  9609. spv::Op tsopc = this->builder.getOpCode(id);
  9610. if (tsopc == spv::Op::OpLoad) {
  9611. spv::Id tsid = this->builder.getIdOperand(id, 0);
  9612. if (this->glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  9613. assert(iOSet.count(tsid) > 0);
  9614. }
  9615. if (!hasQCOMImageProceessingDecoration(tsid, decor)) {
  9616. this->builder.addDecoration(tsid, decor);
  9617. idToQCOMDecorations[tsid].push_back(decor);
  9618. }
  9619. }
  9620. };
  9621. spv::Op opc = builder.getOpCode(id);
  9622. bool isInterfaceObject = (opc != spv::Op::OpSampledImage);
  9623. if (!isInterfaceObject) {
  9624. addDecor(builder.getIdOperand(id, 0), spv::Decoration::BlockMatchTextureQCOM);
  9625. addDecor(builder.getIdOperand(id, 1), spv::Decoration::BlockMatchSamplerQCOM);
  9626. } else {
  9627. addDecor(id, spv::Decoration::BlockMatchTextureQCOM);
  9628. addDecor(id, spv::Decoration::BlockMatchSamplerQCOM);
  9629. }
  9630. }
  9631. // Make a full tree of instructions to build a SPIR-V specialization constant,
  9632. // or regular constant if possible.
  9633. //
  9634. // TBD: this is not yet done, nor verified to be the best design, it does do the leaf symbols though
  9635. //
  9636. // Recursively walk the nodes. The nodes form a tree whose leaves are
  9637. // regular constants, which themselves are trees that createSpvConstant()
  9638. // recursively walks. So, this function walks the "top" of the tree:
  9639. // - emit specialization constant-building instructions for specConstant
  9640. // - when running into a non-spec-constant, switch to createSpvConstant()
  9641. spv::Id TGlslangToSpvTraverser::createSpvConstant(const glslang::TIntermTyped& node)
  9642. {
  9643. assert(node.getQualifier().isConstant());
  9644. // Handle front-end constants first (non-specialization constants).
  9645. if (! node.getQualifier().specConstant) {
  9646. // hand off to the non-spec-constant path
  9647. assert(node.getAsConstantUnion() != nullptr || node.getAsSymbolNode() != nullptr);
  9648. int nextConst = 0;
  9649. return createSpvConstantFromConstUnionArray(node.getType(), node.getAsConstantUnion() ?
  9650. node.getAsConstantUnion()->getConstArray() : node.getAsSymbolNode()->getConstArray(),
  9651. nextConst, false);
  9652. }
  9653. // We now know we have a specialization constant to build
  9654. // Extra capabilities may be needed.
  9655. if (node.getType().contains8BitInt())
  9656. builder.addCapability(spv::Capability::Int8);
  9657. if (node.getType().contains16BitFloat())
  9658. builder.addCapability(spv::Capability::Float16);
  9659. if (node.getType().contains16BitInt())
  9660. builder.addCapability(spv::Capability::Int16);
  9661. if (node.getType().contains64BitInt())
  9662. builder.addCapability(spv::Capability::Int64);
  9663. if (node.getType().containsDouble())
  9664. builder.addCapability(spv::Capability::Float64);
  9665. // gl_WorkGroupSize is a special case until the front-end handles hierarchical specialization constants,
  9666. // even then, it's specialization ids are handled by special case syntax in GLSL: layout(local_size_x = ...
  9667. if (node.getType().getQualifier().builtIn == glslang::EbvWorkGroupSize) {
  9668. std::vector<spv::Id> dimConstId;
  9669. for (int dim = 0; dim < 3; ++dim) {
  9670. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  9671. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  9672. if (specConst) {
  9673. builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
  9674. glslangIntermediate->getLocalSizeSpecId(dim));
  9675. }
  9676. }
  9677. return builder.makeCompositeConstant(builder.makeVectorType(builder.makeUintType(32), 3), dimConstId, true);
  9678. }
  9679. // An AST node labelled as specialization constant should be a symbol node.
  9680. // Its initializer should either be a sub tree with constant nodes, or a constant union array.
  9681. if (auto* sn = node.getAsSymbolNode()) {
  9682. spv::Id result;
  9683. if (auto* sub_tree = sn->getConstSubtree()) {
  9684. // Traverse the constant constructor sub tree like generating normal run-time instructions.
  9685. // During the AST traversal, if the node is marked as 'specConstant', SpecConstantOpModeGuard
  9686. // will set the builder into spec constant op instruction generating mode.
  9687. sub_tree->traverse(this);
  9688. result = accessChainLoad(sub_tree->getType());
  9689. } else if (auto* const_union_array = &sn->getConstArray()) {
  9690. int nextConst = 0;
  9691. result = createSpvConstantFromConstUnionArray(sn->getType(), *const_union_array, nextConst, true);
  9692. } else {
  9693. logger->missingFunctionality("Invalid initializer for spec onstant.");
  9694. return spv::NoResult;
  9695. }
  9696. builder.addName(result, sn->getName().c_str());
  9697. return result;
  9698. }
  9699. // Neither a front-end constant node, nor a specialization constant node with constant union array or
  9700. // constant sub tree as initializer.
  9701. logger->missingFunctionality("Neither a front-end constant nor a spec constant.");
  9702. return spv::NoResult;
  9703. }
  9704. // Use 'consts' as the flattened glslang source of scalar constants to recursively
  9705. // build the aggregate SPIR-V constant.
  9706. //
  9707. // If there are not enough elements present in 'consts', 0 will be substituted;
  9708. // an empty 'consts' can be used to create a fully zeroed SPIR-V constant.
  9709. //
  9710. spv::Id TGlslangToSpvTraverser::createSpvConstantFromConstUnionArray(const glslang::TType& glslangType,
  9711. const glslang::TConstUnionArray& consts, int& nextConst, bool specConstant)
  9712. {
  9713. // vector of constants for SPIR-V
  9714. std::vector<spv::Id> spvConsts;
  9715. // Type is used for struct and array constants
  9716. spv::Id typeId = convertGlslangToSpvType(glslangType);
  9717. if (glslangType.isArray()) {
  9718. glslang::TType elementType(glslangType, 0);
  9719. for (int i = 0; i < glslangType.getOuterArraySize(); ++i)
  9720. spvConsts.push_back(createSpvConstantFromConstUnionArray(elementType, consts, nextConst, false));
  9721. } else if (glslangType.isMatrix()) {
  9722. glslang::TType vectorType(glslangType, 0);
  9723. for (int col = 0; col < glslangType.getMatrixCols(); ++col)
  9724. spvConsts.push_back(createSpvConstantFromConstUnionArray(vectorType, consts, nextConst, false));
  9725. } else if (glslangType.isCoopMat()) {
  9726. glslang::TType componentType(glslangType.getBasicType());
  9727. spvConsts.push_back(createSpvConstantFromConstUnionArray(componentType, consts, nextConst, false));
  9728. } else if (glslangType.isStruct()) {
  9729. glslang::TVector<glslang::TTypeLoc>::const_iterator iter;
  9730. for (iter = glslangType.getStruct()->begin(); iter != glslangType.getStruct()->end(); ++iter)
  9731. spvConsts.push_back(createSpvConstantFromConstUnionArray(*iter->type, consts, nextConst, false));
  9732. } else if (glslangType.getVectorSize() > 1 || glslangType.isCoopVecNV()) {
  9733. unsigned int numComponents = glslangType.isCoopVecNV() ? glslangType.getTypeParameters()->arraySizes->getDimSize(0) : glslangType.getVectorSize();
  9734. for (unsigned int i = 0; i < numComponents; ++i) {
  9735. bool zero = nextConst >= consts.size();
  9736. switch (glslangType.getBasicType()) {
  9737. case glslang::EbtInt:
  9738. spvConsts.push_back(builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst()));
  9739. break;
  9740. case glslang::EbtUint:
  9741. spvConsts.push_back(builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst()));
  9742. break;
  9743. case glslang::EbtFloat:
  9744. spvConsts.push_back(builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  9745. break;
  9746. case glslang::EbtBool:
  9747. spvConsts.push_back(builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst()));
  9748. break;
  9749. case glslang::EbtInt8:
  9750. builder.addCapability(spv::Capability::Int8);
  9751. spvConsts.push_back(builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const()));
  9752. break;
  9753. case glslang::EbtUint8:
  9754. builder.addCapability(spv::Capability::Int8);
  9755. spvConsts.push_back(builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const()));
  9756. break;
  9757. case glslang::EbtInt16:
  9758. builder.addCapability(spv::Capability::Int16);
  9759. spvConsts.push_back(builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const()));
  9760. break;
  9761. case glslang::EbtUint16:
  9762. builder.addCapability(spv::Capability::Int16);
  9763. spvConsts.push_back(builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const()));
  9764. break;
  9765. case glslang::EbtInt64:
  9766. spvConsts.push_back(builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const()));
  9767. break;
  9768. case glslang::EbtUint64:
  9769. spvConsts.push_back(builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const()));
  9770. break;
  9771. case glslang::EbtDouble:
  9772. spvConsts.push_back(builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst()));
  9773. break;
  9774. case glslang::EbtFloat16:
  9775. builder.addCapability(spv::Capability::Float16);
  9776. spvConsts.push_back(builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  9777. break;
  9778. case glslang::EbtBFloat16:
  9779. spvConsts.push_back(builder.makeBFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  9780. break;
  9781. case glslang::EbtFloatE5M2:
  9782. spvConsts.push_back(builder.makeFloatE5M2Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  9783. break;
  9784. case glslang::EbtFloatE4M3:
  9785. spvConsts.push_back(builder.makeFloatE4M3Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  9786. break;
  9787. default:
  9788. assert(0);
  9789. break;
  9790. }
  9791. ++nextConst;
  9792. }
  9793. } else {
  9794. // we have a non-aggregate (scalar) constant
  9795. bool zero = nextConst >= consts.size();
  9796. spv::Id scalar = 0;
  9797. switch (glslangType.getBasicType()) {
  9798. case glslang::EbtInt:
  9799. scalar = builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst(), specConstant);
  9800. break;
  9801. case glslang::EbtUint:
  9802. scalar = builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst(), specConstant);
  9803. break;
  9804. case glslang::EbtFloat:
  9805. scalar = builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  9806. break;
  9807. case glslang::EbtBool:
  9808. scalar = builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst(), specConstant);
  9809. break;
  9810. case glslang::EbtInt8:
  9811. builder.addCapability(spv::Capability::Int8);
  9812. scalar = builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const(), specConstant);
  9813. break;
  9814. case glslang::EbtUint8:
  9815. builder.addCapability(spv::Capability::Int8);
  9816. scalar = builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const(), specConstant);
  9817. break;
  9818. case glslang::EbtInt16:
  9819. builder.addCapability(spv::Capability::Int16);
  9820. scalar = builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const(), specConstant);
  9821. break;
  9822. case glslang::EbtUint16:
  9823. builder.addCapability(spv::Capability::Int16);
  9824. scalar = builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const(), specConstant);
  9825. break;
  9826. case glslang::EbtInt64:
  9827. scalar = builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const(), specConstant);
  9828. break;
  9829. case glslang::EbtUint64:
  9830. scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);
  9831. break;
  9832. case glslang::EbtDouble:
  9833. scalar = builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst(), specConstant);
  9834. break;
  9835. case glslang::EbtFloat16:
  9836. builder.addCapability(spv::Capability::Float16);
  9837. scalar = builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  9838. break;
  9839. case glslang::EbtBFloat16:
  9840. scalar = builder.makeBFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  9841. break;
  9842. case glslang::EbtFloatE5M2:
  9843. scalar = builder.makeFloatE5M2Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  9844. break;
  9845. case glslang::EbtFloatE4M3:
  9846. scalar = builder.makeFloatE4M3Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  9847. break;
  9848. case glslang::EbtReference:
  9849. scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);
  9850. scalar = builder.createUnaryOp(spv::Op::OpBitcast, typeId, scalar);
  9851. break;
  9852. case glslang::EbtString:
  9853. scalar = builder.getStringId(consts[nextConst].getSConst()->c_str());
  9854. break;
  9855. default:
  9856. assert(0);
  9857. break;
  9858. }
  9859. ++nextConst;
  9860. return scalar;
  9861. }
  9862. return builder.makeCompositeConstant(typeId, spvConsts);
  9863. }
  9864. // Return true if the node is a constant or symbol whose reading has no
  9865. // non-trivial observable cost or effect.
  9866. bool TGlslangToSpvTraverser::isTrivialLeaf(const glslang::TIntermTyped* node)
  9867. {
  9868. // don't know what this is
  9869. if (node == nullptr)
  9870. return false;
  9871. // a constant is safe
  9872. if (node->getAsConstantUnion() != nullptr)
  9873. return true;
  9874. // not a symbol means non-trivial
  9875. if (node->getAsSymbolNode() == nullptr)
  9876. return false;
  9877. // a symbol, depends on what's being read
  9878. switch (node->getType().getQualifier().storage) {
  9879. case glslang::EvqTemporary:
  9880. case glslang::EvqGlobal:
  9881. case glslang::EvqIn:
  9882. case glslang::EvqInOut:
  9883. case glslang::EvqConst:
  9884. case glslang::EvqConstReadOnly:
  9885. case glslang::EvqUniform:
  9886. return true;
  9887. default:
  9888. return false;
  9889. }
  9890. }
  9891. // A node is trivial if it is a single operation with no side effects.
  9892. // HLSL (and/or vectors) are always trivial, as it does not short circuit.
  9893. // Otherwise, error on the side of saying non-trivial.
  9894. // Return true if trivial.
  9895. bool TGlslangToSpvTraverser::isTrivial(const glslang::TIntermTyped* node)
  9896. {
  9897. if (node == nullptr)
  9898. return false;
  9899. // count non scalars as trivial, as well as anything coming from HLSL
  9900. if (! node->getType().isScalarOrVec1() || glslangIntermediate->getSource() == glslang::EShSourceHlsl)
  9901. return true;
  9902. // symbols and constants are trivial
  9903. if (isTrivialLeaf(node))
  9904. return true;
  9905. // otherwise, it needs to be a simple operation or one or two leaf nodes
  9906. // not a simple operation
  9907. const glslang::TIntermBinary* binaryNode = node->getAsBinaryNode();
  9908. const glslang::TIntermUnary* unaryNode = node->getAsUnaryNode();
  9909. if (binaryNode == nullptr && unaryNode == nullptr)
  9910. return false;
  9911. // not on leaf nodes
  9912. if (binaryNode && (! isTrivialLeaf(binaryNode->getLeft()) || ! isTrivialLeaf(binaryNode->getRight())))
  9913. return false;
  9914. if (unaryNode && ! isTrivialLeaf(unaryNode->getOperand())) {
  9915. return false;
  9916. }
  9917. if (IsOpNumericConv(node->getAsOperator()->getOp()) &&
  9918. node->getType().getBasicType() == glslang::EbtBool) {
  9919. return true;
  9920. }
  9921. switch (node->getAsOperator()->getOp()) {
  9922. case glslang::EOpLogicalNot:
  9923. case glslang::EOpEqual:
  9924. case glslang::EOpNotEqual:
  9925. case glslang::EOpLessThan:
  9926. case glslang::EOpGreaterThan:
  9927. case glslang::EOpLessThanEqual:
  9928. case glslang::EOpGreaterThanEqual:
  9929. case glslang::EOpIndexDirect:
  9930. case glslang::EOpIndexDirectStruct:
  9931. case glslang::EOpLogicalXor:
  9932. case glslang::EOpAny:
  9933. case glslang::EOpAll:
  9934. return true;
  9935. default:
  9936. return false;
  9937. }
  9938. }
  9939. // Emit short-circuiting code, where 'right' is never evaluated unless
  9940. // the left side is true (for &&) or false (for ||).
  9941. spv::Id TGlslangToSpvTraverser::createShortCircuit(glslang::TOperator op, glslang::TIntermTyped& left,
  9942. glslang::TIntermTyped& right)
  9943. {
  9944. spv::Id boolTypeId = builder.makeBoolType();
  9945. // emit left operand
  9946. builder.clearAccessChain();
  9947. left.traverse(this);
  9948. spv::Id leftId = accessChainLoad(left.getType());
  9949. // Operands to accumulate OpPhi operands
  9950. std::vector<spv::Id> phiOperands;
  9951. phiOperands.reserve(4);
  9952. // accumulate left operand's phi information
  9953. phiOperands.push_back(leftId);
  9954. phiOperands.push_back(builder.getBuildPoint()->getId());
  9955. // Make the two kinds of operation symmetric with a "!"
  9956. // || => emit "if (! left) result = right"
  9957. // && => emit "if ( left) result = right"
  9958. //
  9959. // TODO: this runtime "not" for || could be avoided by adding functionality
  9960. // to 'builder' to have an "else" without an "then"
  9961. if (op == glslang::EOpLogicalOr)
  9962. leftId = builder.createUnaryOp(spv::Op::OpLogicalNot, boolTypeId, leftId);
  9963. // make an "if" based on the left value
  9964. spv::Builder::If ifBuilder(leftId, spv::SelectionControlMask::MaskNone, builder);
  9965. // emit right operand as the "then" part of the "if"
  9966. builder.clearAccessChain();
  9967. right.traverse(this);
  9968. spv::Id rightId = accessChainLoad(right.getType());
  9969. // accumulate left operand's phi information
  9970. phiOperands.push_back(rightId);
  9971. phiOperands.push_back(builder.getBuildPoint()->getId());
  9972. // finish the "if"
  9973. ifBuilder.makeEndIf();
  9974. // phi together the two results
  9975. return builder.createOp(spv::Op::OpPhi, boolTypeId, phiOperands);
  9976. }
  9977. // Return type Id of the imported set of extended instructions corresponds to the name.
  9978. // Import this set if it has not been imported yet.
  9979. spv::Id TGlslangToSpvTraverser::getExtBuiltins(const char* name)
  9980. {
  9981. if (extBuiltinMap.find(name) != extBuiltinMap.end())
  9982. return extBuiltinMap[name];
  9983. else {
  9984. spv::Id extBuiltins = builder.import(name);
  9985. extBuiltinMap[name] = extBuiltins;
  9986. return extBuiltins;
  9987. }
  9988. }
  9989. } // end anonymous namespace
  9990. namespace glslang {
  9991. void GetSpirvVersion(std::string& version)
  9992. {
  9993. const int bufSize = 100;
  9994. char buf[bufSize];
  9995. snprintf(buf, bufSize, "0x%08x, Revision %d", spv::Version, spv::Revision);
  9996. version = buf;
  9997. }
  9998. // For low-order part of the generator's magic number. Bump up
  9999. // when there is a change in the style (e.g., if SSA form changes,
  10000. // or a different instruction sequence to do something gets used).
  10001. int GetSpirvGeneratorVersion()
  10002. {
  10003. // return 1; // start
  10004. // return 2; // EOpAtomicCounterDecrement gets a post decrement, to map between GLSL -> SPIR-V
  10005. // return 3; // change/correct barrier-instruction operands, to match memory model group decisions
  10006. // return 4; // some deeper access chains: for dynamic vector component, and local Boolean component
  10007. // return 5; // make OpArrayLength result type be an int with signedness of 0
  10008. // return 6; // revert version 5 change, which makes a different (new) kind of incorrect code,
  10009. // versions 4 and 6 each generate OpArrayLength as it has long been done
  10010. // return 7; // GLSL volatile keyword maps to both SPIR-V decorations Volatile and Coherent
  10011. // return 8; // switch to new dead block eliminator; use OpUnreachable
  10012. // return 9; // don't include opaque function parameters in OpEntryPoint global's operand list
  10013. // return 10; // Generate OpFUnordNotEqual for != comparisons
  10014. return 11; // Make OpEmitMeshTasksEXT a terminal instruction
  10015. }
  10016. // Write SPIR-V out to a binary file
  10017. bool OutputSpvBin(const std::vector<unsigned int>& spirv, const char* baseName)
  10018. {
  10019. std::ofstream out;
  10020. out.open(baseName, std::ios::binary | std::ios::out);
  10021. if (out.fail()) {
  10022. printf("ERROR: Failed to open file: %s\n", baseName);
  10023. return false;
  10024. }
  10025. for (int i = 0; i < (int)spirv.size(); ++i) {
  10026. unsigned int word = spirv[i];
  10027. out.write((const char*)&word, 4);
  10028. }
  10029. out.close();
  10030. return true;
  10031. }
  10032. // Write SPIR-V out to a text file with 32-bit hexadecimal words
  10033. bool OutputSpvHex(const std::vector<unsigned int>& spirv, const char* baseName, const char* varName)
  10034. {
  10035. std::ofstream out;
  10036. out.open(baseName, std::ios::binary | std::ios::out);
  10037. if (out.fail()) {
  10038. printf("ERROR: Failed to open file: %s\n", baseName);
  10039. return false;
  10040. }
  10041. out << "\t// " <<
  10042. GetSpirvGeneratorVersion() <<
  10043. GLSLANG_VERSION_MAJOR << "." << GLSLANG_VERSION_MINOR << "." << GLSLANG_VERSION_PATCH <<
  10044. GLSLANG_VERSION_FLAVOR << std::endl;
  10045. if (varName != nullptr) {
  10046. out << "\t #pragma once" << std::endl;
  10047. out << "const uint32_t " << varName << "[] = {" << std::endl;
  10048. }
  10049. const int WORDS_PER_LINE = 8;
  10050. for (int i = 0; i < (int)spirv.size(); i += WORDS_PER_LINE) {
  10051. out << "\t";
  10052. for (int j = 0; j < WORDS_PER_LINE && i + j < (int)spirv.size(); ++j) {
  10053. const unsigned int word = spirv[i + j];
  10054. out << "0x" << std::hex << std::setw(8) << std::setfill('0') << word;
  10055. if (i + j + 1 < (int)spirv.size()) {
  10056. out << ",";
  10057. }
  10058. }
  10059. out << std::endl;
  10060. }
  10061. if (varName != nullptr) {
  10062. out << "};";
  10063. out << std::endl;
  10064. }
  10065. out.close();
  10066. return true;
  10067. }
  10068. //
  10069. // Set up the glslang traversal
  10070. //
  10071. void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv, SpvOptions* options)
  10072. {
  10073. spv::SpvBuildLogger logger;
  10074. GlslangToSpv(intermediate, spirv, &logger, options);
  10075. }
  10076. void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv,
  10077. spv::SpvBuildLogger* logger, SpvOptions* options)
  10078. {
  10079. TIntermNode* root = intermediate.getTreeRoot();
  10080. if (root == nullptr)
  10081. return;
  10082. SpvOptions defaultOptions;
  10083. if (options == nullptr)
  10084. options = &defaultOptions;
  10085. GetThreadPoolAllocator().push();
  10086. TGlslangToSpvTraverser it(intermediate.getSpv().spv, &intermediate, logger, *options);
  10087. root->traverse(&it);
  10088. it.finishSpv(options->compileOnly);
  10089. it.dumpSpv(spirv);
  10090. #if ENABLE_OPT
  10091. // If from HLSL, run spirv-opt to "legalize" the SPIR-V for Vulkan
  10092. // eg. forward and remove memory writes of opaque types.
  10093. bool prelegalization = intermediate.getSource() == EShSourceHlsl;
  10094. if ((prelegalization || options->optimizeSize) && !options->disableOptimizer) {
  10095. SpirvToolsTransform(intermediate, spirv, logger, options);
  10096. prelegalization = false;
  10097. }
  10098. else if (options->stripDebugInfo) {
  10099. // Strip debug info even if optimization is disabled.
  10100. SpirvToolsStripDebugInfo(intermediate, spirv, logger);
  10101. }
  10102. if (options->validate)
  10103. SpirvToolsValidate(intermediate, spirv, logger, prelegalization);
  10104. if (options->disassemble)
  10105. SpirvToolsDisassemble(std::cout, spirv);
  10106. #endif
  10107. GetThreadPoolAllocator().pop();
  10108. }
  10109. } // end namespace glslang