GlslangToSpv.cpp 517 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477
74778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527
75278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314531553165317531853195320532153225323532453255326532753285329533053315332533353345335533653375338533953405341534253435344534553465347534853495350535153525353535453555356535753585359536053615362536353645365536653675368536953705371537253735374537553765377537853795380538153825383538453855386538753885389539053915392539353945395539653975398539954005401540254035404540554065407540854095410541154125413541454155416541754185419542054215422542354245425542654275428542954305431543254335434543554365437543854395440544154425443544454455446544754485449545054515452545354545455545654575458545954605461546254635464546554665467546854695470547154725473547454755476547754785479548054815482548354845485548654875488548954905491549254935494549554965497549854995500550155025503550455055506550755085509551055115512551355145515551655175518551955205521552255235524552555265527552855295530553155325533553455355536553755385539554055415542554355445545554655475548554955505551555255535554555555565557555855595560556155625563556455655566556755685569557055715572557355745575557655775578557955805581558255835584558555865587558855895590559155925593559455955596559755985599560056015602560356045605560656075608560956105611561256135614561556165617561856195620562156225623562456255626562756285629563056315632563356345635563656375638563956405641564256435644564556465647564856495650565156525653565456555656565756585659566056615662566356645665566656675668566956705671567256735674567556765677567856795680568156825683568456855686568756885689569056915692569356945695569656975698569957005701570257035704570557065707570857095710571157125713571457155716571757185719572057215722572357245725572657275728572957305731573257335734573557365737573857395740574157425743574457455746574757485749575057515752575357545755575657575758575957605761576257635764576557665767576857695770577157725773577457755776577
75778577957805781578257835784578557865787578857895790579157925793579457955796579757985799580058015802580358045805580658075808580958105811581258135814581558165817581858195820582158225823582458255826582758285829583058315832583358345835583658375838583958405841584258435844584558465847584858495850585158525853585458555856585758585859586058615862586358645865586658675868586958705871587258735874587558765877587858795880588158825883588458855886588758885889589058915892589358945895589658975898589959005901590259035904590559065907590859095910591159125913591459155916591759185919592059215922592359245925592659275928592959305931593259335934593559365937593859395940594159425943594459455946594759485949595059515952595359545955595659575958595959605961596259635964596559665967596859695970597159725973597459755976597759785979598059815982598359845985598659875988598959905991599259935994599559965997599859996000600160026003600460056006600760086009601060116012601360146015601660176018601960206021602260236024602560266027602860296030603160326033603460356036603760386039604060416042604360446045604660476048604960506051605260536054605560566057605860596060606160626063606460656066606760686069607060716072607360746075607660776078607960806081608260836084608560866087608860896090609160926093609460956096609760986099610061016102610361046105610661076108610961106111611261136114611561166117611861196120612161226123612461256126612761286129613061316132613361346135613661376138613961406141614261436144614561466147614861496150615161526153615461556156615761586159616061616162616361646165616661676168616961706171617261736174617561766177617861796180618161826183618461856186618761886189619061916192619361946195619661976198619962006201620262036204620562066207620862096210621162126213621462156216621762186219622062216222622362246225622662276228622962306231623262336234623562366237623862396240624162426243624462456246624762486249625062516252625362546255625662576258625962606261626262636264626562666267626862696270627162726273627462756276627
76278627962806281628262836284628562866287628862896290629162926293629462956296629762986299630063016302630363046305630663076308630963106311631263136314631563166317631863196320632163226323632463256326632763286329633063316332633363346335633663376338633963406341634263436344634563466347634863496350635163526353635463556356635763586359636063616362636363646365636663676368636963706371637263736374637563766377637863796380638163826383638463856386638763886389639063916392639363946395639663976398639964006401640264036404640564066407640864096410641164126413641464156416641764186419642064216422642364246425642664276428642964306431643264336434643564366437643864396440644164426443644464456446644764486449645064516452645364546455645664576458645964606461646264636464646564666467646864696470647164726473647464756476647764786479648064816482648364846485648664876488648964906491649264936494649564966497649864996500650165026503650465056506650765086509651065116512651365146515651665176518651965206521652265236524652565266527652865296530653165326533653465356536653765386539654065416542654365446545654665476548654965506551655265536554655565566557655865596560656165626563656465656566656765686569657065716572657365746575657665776578657965806581658265836584658565866587658865896590659165926593659465956596659765986599660066016602660366046605660666076608660966106611661266136614661566166617661866196620662166226623662466256626662766286629663066316632663366346635663666376638663966406641664266436644664566466647664866496650665166526653665466556656665766586659666066616662666366646665666666676668666966706671667266736674667566766677667866796680668166826683668466856686668766886689669066916692669366946695669666976698669967006701670267036704670567066707670867096710671167126713671467156716671767186719672067216722672367246725672667276728672967306731673267336734673567366737673867396740674167426743674467456746674767486749675067516752675367546755675667576758675967606761676267636764676567666767676867696770677167726773677467756776677
76778677967806781678267836784678567866787678867896790679167926793679467956796679767986799680068016802680368046805680668076808680968106811681268136814681568166817681868196820682168226823682468256826682768286829683068316832683368346835683668376838683968406841684268436844684568466847684868496850685168526853685468556856685768586859686068616862686368646865686668676868686968706871687268736874687568766877687868796880688168826883688468856886688768886889689068916892689368946895689668976898689969006901690269036904690569066907690869096910691169126913691469156916691769186919692069216922692369246925692669276928692969306931693269336934693569366937693869396940694169426943694469456946694769486949695069516952695369546955695669576958695969606961696269636964696569666967696869696970697169726973697469756976697769786979698069816982698369846985698669876988698969906991699269936994699569966997699869997000700170027003700470057006700770087009701070117012701370147015701670177018701970207021702270237024702570267027702870297030703170327033703470357036703770387039704070417042704370447045704670477048704970507051705270537054705570567057705870597060706170627063706470657066706770687069707070717072707370747075707670777078707970807081708270837084708570867087708870897090709170927093709470957096709770987099710071017102710371047105710671077108710971107111711271137114711571167117711871197120712171227123712471257126712771287129713071317132713371347135713671377138713971407141714271437144714571467147714871497150715171527153715471557156715771587159716071617162716371647165716671677168716971707171717271737174717571767177717871797180718171827183718471857186718771887189719071917192719371947195719671977198719972007201720272037204720572067207720872097210721172127213721472157216721772187219722072217222722372247225722672277228722972307231723272337234723572367237723872397240724172427243724472457246724772487249725072517252725372547255725672577258725972607261726272637264726572667267726872697270727172727273727472757276727
77278727972807281728272837284728572867287728872897290729172927293729472957296729772987299730073017302730373047305730673077308730973107311731273137314731573167317731873197320732173227323732473257326732773287329733073317332733373347335733673377338733973407341734273437344734573467347734873497350735173527353735473557356735773587359736073617362736373647365736673677368736973707371737273737374737573767377737873797380738173827383738473857386738773887389739073917392739373947395739673977398739974007401740274037404740574067407740874097410741174127413741474157416741774187419742074217422742374247425742674277428742974307431743274337434743574367437743874397440744174427443744474457446744774487449745074517452745374547455745674577458745974607461746274637464746574667467746874697470747174727473747474757476747774787479748074817482748374847485748674877488748974907491749274937494749574967497749874997500750175027503750475057506750775087509751075117512751375147515751675177518751975207521752275237524752575267527752875297530753175327533753475357536753775387539754075417542754375447545754675477548754975507551755275537554755575567557755875597560756175627563756475657566756775687569757075717572757375747575757675777578757975807581758275837584758575867587758875897590759175927593759475957596759775987599760076017602760376047605760676077608760976107611761276137614761576167617761876197620762176227623762476257626762776287629763076317632763376347635763676377638763976407641764276437644764576467647764876497650765176527653765476557656765776587659766076617662766376647665766676677668766976707671767276737674767576767677767876797680768176827683768476857686768776887689769076917692769376947695769676977698769977007701770277037704770577067707770877097710771177127713771477157716771777187719772077217722772377247725772677277728772977307731773277337734773577367737773877397740774177427743774477457746774777487749775077517752775377547755775677577758775977607761776277637764776577667767776877697770777177727773777477757776777
77778777977807781778277837784778577867787778877897790779177927793779477957796779777987799780078017802780378047805780678077808780978107811781278137814781578167817781878197820782178227823782478257826782778287829783078317832783378347835783678377838783978407841784278437844784578467847784878497850785178527853785478557856785778587859786078617862786378647865786678677868786978707871787278737874787578767877787878797880788178827883788478857886788778887889789078917892789378947895789678977898789979007901790279037904790579067907790879097910791179127913791479157916791779187919792079217922792379247925792679277928792979307931793279337934793579367937793879397940794179427943794479457946794779487949795079517952795379547955795679577958795979607961796279637964796579667967796879697970797179727973797479757976797779787979798079817982798379847985798679877988798979907991799279937994799579967997799879998000800180028003800480058006800780088009801080118012801380148015801680178018801980208021802280238024802580268027802880298030803180328033803480358036803780388039804080418042804380448045804680478048804980508051805280538054805580568057805880598060806180628063806480658066806780688069807080718072807380748075807680778078807980808081808280838084808580868087808880898090809180928093809480958096809780988099810081018102810381048105810681078108810981108111811281138114811581168117811881198120812181228123812481258126812781288129813081318132813381348135813681378138813981408141814281438144814581468147814881498150815181528153815481558156815781588159816081618162816381648165816681678168816981708171817281738174817581768177817881798180818181828183818481858186818781888189819081918192819381948195819681978198819982008201820282038204820582068207820882098210821182128213821482158216821782188219822082218222822382248225822682278228822982308231823282338234823582368237823882398240824182428243824482458246824782488249825082518252825382548255825682578258825982608261826282638264826582668267826882698270827182728273827482758276827
78278827982808281828282838284828582868287828882898290829182928293829482958296829782988299830083018302830383048305830683078308830983108311831283138314831583168317831883198320832183228323832483258326832783288329833083318332833383348335833683378338833983408341834283438344834583468347834883498350835183528353835483558356835783588359836083618362836383648365836683678368836983708371837283738374837583768377837883798380838183828383838483858386838783888389839083918392839383948395839683978398839984008401840284038404840584068407840884098410841184128413841484158416841784188419842084218422842384248425842684278428842984308431843284338434843584368437843884398440844184428443844484458446844784488449845084518452845384548455845684578458845984608461846284638464846584668467846884698470847184728473847484758476847784788479848084818482848384848485848684878488848984908491849284938494849584968497849884998500850185028503850485058506850785088509851085118512851385148515851685178518851985208521852285238524852585268527852885298530853185328533853485358536853785388539854085418542854385448545854685478548854985508551855285538554855585568557855885598560856185628563856485658566856785688569857085718572857385748575857685778578857985808581858285838584858585868587858885898590859185928593859485958596859785988599860086018602860386048605860686078608860986108611861286138614861586168617861886198620862186228623862486258626862786288629863086318632863386348635863686378638863986408641864286438644864586468647864886498650865186528653865486558656865786588659866086618662866386648665866686678668866986708671867286738674867586768677867886798680868186828683868486858686868786888689869086918692869386948695869686978698869987008701870287038704870587068707870887098710871187128713871487158716871787188719872087218722872387248725872687278728872987308731873287338734873587368737873887398740874187428743874487458746874787488749875087518752875387548755875687578758875987608761876287638764876587668767876887698770877187728773877487758776877
78778877987808781878287838784878587868787878887898790879187928793879487958796879787988799880088018802880388048805880688078808880988108811881288138814881588168817881888198820882188228823882488258826882788288829883088318832883388348835883688378838883988408841884288438844884588468847884888498850885188528853885488558856885788588859886088618862886388648865886688678868886988708871887288738874887588768877887888798880888188828883888488858886888788888889889088918892889388948895889688978898889989008901890289038904890589068907890889098910891189128913891489158916891789188919892089218922892389248925892689278928892989308931893289338934893589368937893889398940894189428943894489458946894789488949895089518952895389548955895689578958895989608961896289638964896589668967896889698970897189728973897489758976897789788979898089818982898389848985898689878988898989908991899289938994899589968997899889999000900190029003900490059006900790089009901090119012901390149015901690179018901990209021902290239024902590269027902890299030903190329033903490359036903790389039904090419042904390449045904690479048904990509051905290539054905590569057905890599060906190629063906490659066906790689069907090719072907390749075907690779078907990809081908290839084908590869087908890899090909190929093909490959096909790989099910091019102910391049105910691079108910991109111911291139114911591169117911891199120912191229123912491259126912791289129913091319132913391349135913691379138913991409141914291439144914591469147914891499150915191529153915491559156915791589159916091619162916391649165916691679168916991709171917291739174917591769177917891799180918191829183918491859186918791889189919091919192919391949195919691979198919992009201920292039204920592069207920892099210921192129213921492159216921792189219922092219222922392249225922692279228922992309231923292339234923592369237923892399240924192429243924492459246924792489249925092519252925392549255925692579258925992609261926292639264926592669267926892699270927192729273927492759276927
79278927992809281928292839284928592869287928892899290929192929293929492959296929792989299930093019302930393049305930693079308930993109311931293139314931593169317931893199320932193229323932493259326932793289329933093319332933393349335933693379338933993409341934293439344934593469347934893499350935193529353935493559356935793589359936093619362936393649365936693679368936993709371937293739374937593769377937893799380938193829383938493859386938793889389939093919392939393949395939693979398939994009401940294039404940594069407940894099410941194129413941494159416941794189419942094219422942394249425942694279428942994309431943294339434943594369437943894399440944194429443944494459446944794489449945094519452945394549455945694579458945994609461946294639464946594669467946894699470947194729473947494759476947794789479948094819482948394849485948694879488948994909491949294939494949594969497949894999500950195029503950495059506950795089509951095119512951395149515951695179518951995209521952295239524952595269527952895299530953195329533953495359536953795389539954095419542954395449545954695479548954995509551955295539554955595569557955895599560956195629563956495659566956795689569957095719572957395749575957695779578957995809581958295839584958595869587958895899590959195929593959495959596959795989599960096019602960396049605960696079608960996109611961296139614961596169617961896199620962196229623962496259626962796289629963096319632963396349635963696379638963996409641964296439644964596469647964896499650965196529653965496559656965796589659966096619662966396649665966696679668966996709671967296739674967596769677967896799680968196829683968496859686968796889689969096919692969396949695969696979698969997009701970297039704970597069707970897099710971197129713971497159716971797189719972097219722972397249725972697279728972997309731973297339734973597369737973897399740974197429743974497459746974797489749975097519752975397549755975697579758975997609761976297639764976597669767976897699770977197729773977497759776977
79778977997809781978297839784978597869787978897899790979197929793979497959796979797989799980098019802980398049805980698079808980998109811981298139814981598169817981898199820982198229823982498259826982798289829983098319832983398349835983698379838983998409841984298439844984598469847984898499850985198529853985498559856985798589859986098619862986398649865986698679868986998709871987298739874987598769877987898799880988198829883988498859886988798889889989098919892989398949895989698979898989999009901990299039904990599069907990899099910991199129913991499159916991799189919992099219922992399249925992699279928992999309931993299339934993599369937993899399940994199429943994499459946994799489949995099519952995399549955995699579958995999609961996299639964996599669967996899699970997199729973997499759976997799789979998099819982998399849985998699879988998999909991999299939994999599969997999899991000010001100021000310004100051000610007100081000910010100111001210013100141001510016100171001810019100201002110022100231002410025100261002710028100291003010031100321003310034100351003610037100381003910040100411004210043100441004510046100471004810049100501005110052100531005410055100561005710058100591006010061100621006310064100651006610067100681006910070100711007210073100741007510076100771007810079100801008110082100831008410085100861008710088100891009010091100921009310094100951009610097100981009910100101011010210103101041010510106101071010810109101101011110112101131011410115101161011710118101191012010121101221012310124101251012610127101281012910130101311013210133101341013510136101371013810139101401014110142101431014410145101461014710148101491015010151101521015310154101551015610157101581015910160101611016210163101641016510166101671016810169101701017110172101731017410175101761017710178101791018010181101821018310184101851018610187101881018910190101911019210193101941019510196101971019810199102001020110202102031020410205102061020710208102091021010211102121021310214102151021610217102181021910220102211
02221022310224102251022610227102281022910230102311023210233102341023510236102371023810239102401024110242102431024410245102461024710248102491025010251102521025310254102551025610257102581025910260102611026210263102641026510266102671026810269102701027110272102731027410275102761027710278102791028010281102821028310284102851028610287102881028910290102911029210293102941029510296102971029810299103001030110302103031030410305103061030710308103091031010311103121031310314103151031610317103181031910320103211032210323103241032510326103271032810329103301033110332103331033410335103361033710338103391034010341103421034310344103451034610347103481034910350103511035210353103541035510356103571035810359103601036110362103631036410365103661036710368103691037010371103721037310374103751037610377103781037910380103811038210383103841038510386103871038810389103901039110392103931039410395103961039710398103991040010401104021040310404104051040610407104081040910410104111041210413104141041510416104171041810419104201042110422104231042410425104261042710428104291043010431104321043310434104351043610437104381043910440104411044210443104441044510446104471044810449104501045110452104531045410455104561045710458104591046010461104621046310464104651046610467104681046910470104711047210473104741047510476104771047810479104801048110482104831048410485104861048710488104891049010491104921049310494104951049610497104981049910500105011050210503105041050510506105071050810509105101051110512105131051410515105161051710518105191052010521105221052310524105251052610527105281052910530105311053210533105341053510536105371053810539105401054110542105431054410545105461054710548105491055010551105521055310554105551055610557105581055910560105611056210563105641056510566105671056810569105701057110572105731057410575105761057710578105791058010581105821058310584105851058610587105881058910590105911059210593105941059510596105971059810599106001060110602106031060410605106061060710608106091061010611106121061310614106151061610617106181061910620106211
06221062310624106251062610627106281062910630106311063210633106341063510636106371063810639106401064110642106431064410645106461064710648106491065010651106521065310654106551065610657106581065910660106611066210663106641066510666106671066810669106701067110672106731067410675106761067710678106791068010681106821068310684106851068610687106881068910690106911069210693106941069510696106971069810699107001070110702107031070410705107061070710708107091071010711107121071310714107151071610717107181071910720107211072210723107241072510726107271072810729107301073110732107331073410735107361073710738107391074010741107421074310744107451074610747107481074910750107511075210753107541075510756107571075810759107601076110762107631076410765107661076710768107691077010771107721077310774107751077610777107781077910780107811078210783107841078510786107871078810789107901079110792107931079410795107961079710798107991080010801108021080310804108051080610807108081080910810108111081210813108141081510816108171081810819108201082110822108231082410825108261082710828108291083010831108321083310834108351083610837108381083910840108411084210843108441084510846108471084810849108501085110852108531085410855108561085710858108591086010861108621086310864108651086610867108681086910870108711087210873108741087510876108771087810879108801088110882108831088410885108861088710888108891089010891108921089310894108951089610897108981089910900109011090210903109041090510906109071090810909109101091110912109131091410915109161091710918109191092010921109221092310924109251092610927109281092910930109311093210933109341093510936109371093810939109401094110942109431094410945109461094710948109491095010951109521095310954109551095610957109581095910960109611096210963109641096510966109671096810969109701097110972109731097410975109761097710978109791098010981109821098310984109851098610987109881098910990109911099210993109941099510996109971099810999110001100111002110031100411005110061100711008110091101011011110121101311014110151101611017110181101911020110211
10221102311024110251102611027110281102911030110311103211033110341103511036110371103811039110401104111042110431104411045110461104711048110491105011051110521105311054110551105611057110581105911060110611106211063110641106511066110671106811069110701107111072110731107411075110761107711078110791108011081110821108311084110851108611087110881108911090110911109211093110941109511096110971109811099111001110111102111031110411105111061110711108111091111011111111121111311114111151111611117111181111911120111211112211123111241112511126111271112811129111301113111132111331113411135111361113711138111391114011141111421114311144111451114611147111481114911150111511115211153111541115511156111571115811159111601116111162111631116411165111661116711168111691117011171111721117311174111751117611177111781117911180111811118211183111841118511186111871118811189111901119111192111931119411195111961119711198111991120011201112021120311204112051120611207112081120911210112111121211213112141121511216112171121811219112201122111222112231122411225112261122711228112291123011231112321123311234112351123611237112381123911240112411124211243112441124511246112471124811249112501125111252112531125411255112561125711258112591126011261112621126311264112651126611267112681126911270112711127211273112741127511276112771127811279112801128111282112831128411285112861128711288112891129011291112921129311294112951129611297112981129911300113011130211303113041130511306113071130811309113101131111312113131131411315113161131711318113191132011321113221132311324113251132611327113281132911330113311133211333113341133511336113371133811339113401134111342113431134411345113461134711348113491135011351113521135311354113551135611357113581135911360113611136211363113641136511366113671136811369113701137111372113731137411375113761137711378113791138011381113821138311384113851138611387113881138911390113911139211393113941139511396113971139811399114001140111402114031140411405114061140711408114091141011411114121141311414114151141611417114181141911420114211
14221142311424114251142611427114281142911430114311143211433114341143511436114371143811439114401144111442114431144411445114461144711448114491145011451114521145311454114551145611457114581145911460114611146211463114641146511466114671146811469114701147111472114731147411475114761147711478114791148011481114821148311484114851148611487114881148911490114911149211493114941149511496114971149811499115001150111502115031150411505115061150711508115091151011511115121151311514115151151611517115181151911520115211152211523115241152511526115271152811529115301153111532115331153411535115361153711538115391154011541115421154311544115451154611547115481154911550115511155211553115541155511556115571155811559115601156111562115631156411565115661156711568115691157011571
  1. //
  2. // Copyright (C) 2014-2016 LunarG, Inc.
  3. // Copyright (C) 2015-2020 Google, Inc.
  4. // Copyright (C) 2017, 2022-2025 Arm Limited.
  5. // Modifications Copyright (C) 2020 Advanced Micro Devices, Inc. All rights reserved.
  6. //
  7. // All rights reserved.
  8. //
  9. // Redistribution and use in source and binary forms, with or without
  10. // modification, are permitted provided that the following conditions
  11. // are met:
  12. //
  13. // Redistributions of source code must retain the above copyright
  14. // notice, this list of conditions and the following disclaimer.
  15. //
  16. // Redistributions in binary form must reproduce the above
  17. // copyright notice, this list of conditions and the following
  18. // disclaimer in the documentation and/or other materials provided
  19. // with the distribution.
  20. //
  21. // Neither the name of 3Dlabs Inc. Ltd. nor the names of its
  22. // contributors may be used to endorse or promote products derived
  23. // from this software without specific prior written permission.
  24. //
  25. // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  26. // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  27. // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
  28. // FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
  29. // COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
  30. // INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
  31. // BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  32. // LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  33. // CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  34. // LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
  35. // ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  36. // POSSIBILITY OF SUCH DAMAGE.
  37. //
  38. // Visit the nodes in the glslang intermediate tree representation to
  39. // translate them to SPIR-V.
  40. //
  41. #include "spirv.hpp11"
  42. #include "GlslangToSpv.h"
  43. #include "SpvBuilder.h"
  44. #include "SpvTools.h"
  45. #include "spvUtil.h"
  46. namespace spv {
  47. #include "GLSL.std.450.h"
  48. #include "GLSL.ext.KHR.h"
  49. #include "GLSL.ext.EXT.h"
  50. #include "GLSL.ext.AMD.h"
  51. #include "GLSL.ext.NV.h"
  52. #include "GLSL.ext.ARM.h"
  53. #include "GLSL.ext.QCOM.h"
  54. #include "NonSemanticDebugPrintf.h"
  55. }
  56. // Glslang includes
  57. #include "../glslang/MachineIndependent/localintermediate.h"
  58. #include "../glslang/MachineIndependent/SymbolTable.h"
  59. #include "../glslang/Include/Common.h"
  60. // Build-time generated includes
  61. #include "glslang/build_info.h"
  62. #include <fstream>
  63. #include <iomanip>
  64. #include <list>
  65. #include <map>
  66. #include <optional>
  67. #include <stack>
  68. #include <string>
  69. #include <vector>
  70. namespace {
  71. namespace {
  72. class SpecConstantOpModeGuard {
  73. public:
  74. SpecConstantOpModeGuard(spv::Builder* builder)
  75. : builder_(builder) {
  76. previous_flag_ = builder->isInSpecConstCodeGenMode();
  77. }
  78. ~SpecConstantOpModeGuard() {
  79. previous_flag_ ? builder_->setToSpecConstCodeGenMode()
  80. : builder_->setToNormalCodeGenMode();
  81. }
  82. void turnOnSpecConstantOpMode() {
  83. builder_->setToSpecConstCodeGenMode();
  84. }
  85. private:
  86. spv::Builder* builder_;
  87. bool previous_flag_;
  88. };
  89. struct OpDecorations {
  90. public:
  91. OpDecorations(spv::Decoration precision, spv::Decoration noContraction, spv::Decoration nonUniform) :
  92. precision(precision)
  93. ,
  94. noContraction(noContraction),
  95. nonUniform(nonUniform)
  96. { }
  97. spv::Decoration precision;
  98. void addNoContraction(spv::Builder& builder, spv::Id t) { builder.addDecoration(t, noContraction); }
  99. void addNonUniform(spv::Builder& builder, spv::Id t) { builder.addDecoration(t, nonUniform); }
  100. protected:
  101. spv::Decoration noContraction;
  102. spv::Decoration nonUniform;
  103. };
  104. } // namespace
  105. //
  106. // The main holder of information for translating glslang to SPIR-V.
  107. //
  108. // Derives from the AST walking base class.
  109. //
  110. class TGlslangToSpvTraverser : public glslang::TIntermTraverser {
  111. public:
  112. TGlslangToSpvTraverser(unsigned int spvVersion, const glslang::TIntermediate*, spv::SpvBuildLogger* logger,
  113. glslang::SpvOptions& options);
  114. virtual ~TGlslangToSpvTraverser() { }
  115. bool visitAggregate(glslang::TVisit, glslang::TIntermAggregate*) override;
  116. bool visitBinary(glslang::TVisit, glslang::TIntermBinary*) override;
  117. void visitConstantUnion(glslang::TIntermConstantUnion*) override;
  118. bool visitSelection(glslang::TVisit, glslang::TIntermSelection*) override;
  119. bool visitSwitch(glslang::TVisit, glslang::TIntermSwitch*) override;
  120. void visitSymbol(glslang::TIntermSymbol* symbol) override;
  121. bool visitUnary(glslang::TVisit, glslang::TIntermUnary*) override;
  122. bool visitLoop(glslang::TVisit, glslang::TIntermLoop*) override;
  123. bool visitBranch(glslang::TVisit visit, glslang::TIntermBranch*) override;
  124. bool visitVariableDecl(glslang::TVisit, glslang::TIntermVariableDecl*) override;
  125. void finishSpv(bool compileOnly);
  126. void dumpSpv(std::vector<unsigned int>& out);
  127. protected:
  128. TGlslangToSpvTraverser(TGlslangToSpvTraverser&);
  129. TGlslangToSpvTraverser& operator=(TGlslangToSpvTraverser&);
  130. spv::Decoration TranslateInterpolationDecoration(const glslang::TQualifier& qualifier);
  131. spv::Decoration TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier);
  132. spv::Decoration TranslateNonUniformDecoration(const glslang::TQualifier& qualifier);
  133. spv::Decoration TranslateNonUniformDecoration(const spv::Builder::AccessChain::CoherentFlags& coherentFlags);
  134. spv::Builder::AccessChain::CoherentFlags TranslateCoherent(const glslang::TType& type);
  135. spv::MemoryAccessMask TranslateMemoryAccess(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  136. spv::ImageOperandsMask TranslateImageOperands(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  137. spv::Scope TranslateMemoryScope(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  138. spv::BuiltIn TranslateBuiltInDecoration(glslang::TBuiltInVariable, bool memberDeclaration);
  139. spv::ImageFormat TranslateImageFormat(const glslang::TType& type);
  140. spv::SelectionControlMask TranslateSelectionControl(const glslang::TIntermSelection&) const;
  141. spv::SelectionControlMask TranslateSwitchControl(const glslang::TIntermSwitch&) const;
  142. spv::LoopControlMask TranslateLoopControl(const glslang::TIntermLoop&, std::vector<unsigned int>& operands) const;
  143. spv::StorageClass TranslateStorageClass(const glslang::TType&);
  144. void TranslateLiterals(const glslang::TVector<const glslang::TIntermConstantUnion*>&, std::vector<unsigned>&) const;
  145. void addIndirectionIndexCapabilities(const glslang::TType& baseType, const glslang::TType& indexType);
  146. spv::Id createSpvVariable(const glslang::TIntermSymbol*, spv::Id forcedType);
  147. spv::Id getSampledType(const glslang::TSampler&);
  148. spv::Id getInvertedSwizzleType(const glslang::TIntermTyped&);
  149. spv::Id createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped&, spv::Id parentResult);
  150. void convertSwizzle(const glslang::TIntermAggregate&, std::vector<unsigned>& swizzle);
  151. spv::Id convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly = false);
  152. spv::Id convertGlslangToSpvType(const glslang::TType& type, glslang::TLayoutPacking, const glslang::TQualifier&,
  153. bool lastBufferBlockMember, bool forwardReferenceOnly = false);
  154. void applySpirvDecorate(const glslang::TType& type, spv::Id id, std::optional<int> member);
  155. bool filterMember(const glslang::TType& member);
  156. spv::Id convertGlslangStructToSpvType(const glslang::TType&, const glslang::TTypeList* glslangStruct,
  157. glslang::TLayoutPacking, const glslang::TQualifier&);
  158. spv::LinkageType convertGlslangLinkageToSpv(glslang::TLinkType glslangLinkType);
  159. void decorateStructType(const glslang::TType&, const glslang::TTypeList* glslangStruct, glslang::TLayoutPacking,
  160. const glslang::TQualifier&, spv::Id, const std::vector<spv::Id>& spvMembers);
  161. spv::Id makeArraySizeId(const glslang::TArraySizes&, int dim, bool allowZero = false, bool boolType = false);
  162. spv::Id accessChainLoad(const glslang::TType& type);
  163. void accessChainStore(const glslang::TType& type, spv::Id rvalue);
  164. void multiTypeStore(const glslang::TType&, spv::Id rValue);
  165. spv::Id convertLoadedBoolInUniformToUint(const glslang::TType& type, spv::Id nominalTypeId, spv::Id loadedId);
  166. glslang::TLayoutPacking getExplicitLayout(const glslang::TType& type) const;
  167. int getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  168. int getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  169. void updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType, int& currentOffset,
  170. int& nextOffset, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  171. void declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember);
  172. bool isShaderEntryPoint(const glslang::TIntermAggregate* node);
  173. bool writableParam(glslang::TStorageQualifier) const;
  174. bool originalParam(glslang::TStorageQualifier, const glslang::TType&, bool implicitThisParam);
  175. void makeFunctions(const glslang::TIntermSequence&);
  176. void makeGlobalInitializers(const glslang::TIntermSequence&);
  177. void collectRayTracingLinkerObjects();
  178. void visitFunctions(const glslang::TIntermSequence&);
  179. void translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments,
  180. spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags);
  181. void translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments);
  182. spv::Id createImageTextureFunctionCall(glslang::TIntermOperator* node);
  183. spv::Id handleUserFunctionCall(const glslang::TIntermAggregate*);
  184. spv::Id createBinaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right,
  185. glslang::TBasicType typeProxy, bool reduceComparison = true);
  186. spv::Id createBinaryMatrixOperation(spv::Op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right);
  187. spv::Id createUnaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id operand,
  188. glslang::TBasicType typeProxy,
  189. const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
  190. const glslang::TType &opType);
  191. spv::Id createUnaryMatrixOperation(spv::Op op, OpDecorations&, spv::Id typeId, spv::Id operand,
  192. glslang::TBasicType typeProxy);
  193. spv::Id createConversion(glslang::TOperator op, OpDecorations&, spv::Id destTypeId, spv::Id operand,
  194. glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType);
  195. spv::Id createIntWidthConversion(spv::Id operand, int vectorSize, spv::Id destType,
  196. glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType);
  197. spv::Id makeSmearedConstant(spv::Id constant, int vectorSize);
  198. spv::Id createAtomicOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId,
  199. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy,
  200. const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
  201. const glslang::TType &opType);
  202. spv::Id createInvocationsOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands,
  203. glslang::TBasicType typeProxy);
  204. spv::Id CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,
  205. spv::Id typeId, std::vector<spv::Id>& operands);
  206. spv::Id createSubgroupOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands,
  207. glslang::TBasicType typeProxy);
  208. spv::Id createMiscOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId,
  209. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy);
  210. spv::Id createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId);
  211. spv::Id getSymbolId(const glslang::TIntermSymbol* node);
  212. void addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier & qualifier);
  213. bool hasQCOMImageProceessingDecoration(spv::Id id, spv::Decoration decor);
  214. void addImageProcessingQCOMDecoration(spv::Id id, spv::Decoration decor);
  215. void addImageProcessing2QCOMDecoration(spv::Id id, bool isForGather);
  216. spv::Id createSpvConstant(const glslang::TIntermTyped&);
  217. spv::Id createSpvConstantFromConstUnionArray(const glslang::TType& type, const glslang::TConstUnionArray&,
  218. int& nextConst, bool specConstant);
  219. bool isTrivialLeaf(const glslang::TIntermTyped* node);
  220. bool isTrivial(const glslang::TIntermTyped* node);
  221. spv::Id createShortCircuit(glslang::TOperator, glslang::TIntermTyped& left, glslang::TIntermTyped& right);
  222. spv::Id getExtBuiltins(const char* name);
  223. std::pair<spv::Id, spv::Id> getForcedType(glslang::TBuiltInVariable builtIn, const glslang::TType&);
  224. spv::Id translateForcedType(spv::Id object);
  225. spv::Id createCompositeConstruct(spv::Id typeId, std::vector<spv::Id> constituents);
  226. glslang::SpvOptions& options;
  227. spv::Function* shaderEntry;
  228. spv::Function* currentFunction;
  229. spv::Instruction* entryPoint;
  230. int sequenceDepth;
  231. spv::SpvBuildLogger* logger;
  232. // There is a 1:1 mapping between a spv builder and a module; this is thread safe
  233. spv::Builder builder;
  234. bool inEntryPoint;
  235. bool entryPointTerminated;
  236. bool linkageOnly; // true when visiting the set of objects in the AST present only for
  237. // establishing interface, whether or not they were statically used
  238. std::set<spv::Id> iOSet; // all input/output variables from either static use or declaration of interface
  239. const glslang::TIntermediate* glslangIntermediate;
  240. bool nanMinMaxClamp; // true if use NMin/NMax/NClamp instead of FMin/FMax/FClamp
  241. spv::Id stdBuiltins;
  242. spv::Id nonSemanticDebugPrintf;
  243. std::unordered_map<std::string, spv::Id> extBuiltinMap;
  244. std::unordered_map<long long, spv::Id> symbolValues;
  245. std::unordered_map<uint32_t, spv::Id> builtInVariableIds;
  246. std::unordered_set<long long> rValueParameters; // set of formal function parameters passed as rValues,
  247. // rather than a pointer
  248. std::unordered_map<std::string, spv::Function*> functionMap;
  249. std::unordered_map<const glslang::TTypeList*, spv::Id> structMap[glslang::ElpCount][glslang::ElmCount];
  250. // for mapping glslang block indices to spv indices (e.g., due to hidden members):
  251. std::unordered_map<long long, std::vector<int>> memberRemapper;
  252. // for mapping glslang symbol struct to symbol Id
  253. std::unordered_map<const glslang::TTypeList*, long long> glslangTypeToIdMap;
  254. std::stack<bool> breakForLoop; // false means break for switch
  255. std::unordered_map<std::string, const glslang::TIntermSymbol*> counterOriginator;
  256. // Map pointee types for EbtReference to their forward pointers
  257. std::map<const glslang::TType *, spv::Id> forwardPointers;
  258. // Type forcing, for when SPIR-V wants a different type than the AST,
  259. // requiring local translation to and from SPIR-V type on every access.
  260. // Maps <builtin-variable-id -> AST-required-type-id>
  261. std::unordered_map<spv::Id, spv::Id> forceType;
  262. // Used by Task shader while generating opearnds for OpEmitMeshTasksEXT
  263. spv::Id taskPayloadID;
  264. // Used later for generating OpTraceKHR/OpExecuteCallableKHR/OpHitObjectRecordHit*/OpHitObjectGetShaderBindingTableData
  265. std::unordered_map<unsigned int, glslang::TIntermSymbol *> locationToSymbol[4];
  266. std::unordered_map<spv::Id, std::vector<spv::Decoration> > idToQCOMDecorations;
  267. };
  268. //
  269. // Helper functions for translating glslang representations to SPIR-V enumerants.
  270. //
  271. // Translate glslang profile to SPIR-V source language.
  272. spv::SourceLanguage TranslateSourceLanguage(glslang::EShSource source, EProfile profile)
  273. {
  274. switch (source) {
  275. case glslang::EShSourceGlsl:
  276. switch (profile) {
  277. case ENoProfile:
  278. case ECoreProfile:
  279. case ECompatibilityProfile:
  280. return spv::SourceLanguage::GLSL;
  281. case EEsProfile:
  282. return spv::SourceLanguage::ESSL;
  283. default:
  284. return spv::SourceLanguage::Unknown;
  285. }
  286. case glslang::EShSourceHlsl:
  287. return spv::SourceLanguage::HLSL;
  288. default:
  289. return spv::SourceLanguage::Unknown;
  290. }
  291. }
  292. // Translate glslang language (stage) to SPIR-V execution model.
  293. spv::ExecutionModel TranslateExecutionModel(EShLanguage stage, bool isMeshShaderEXT = false)
  294. {
  295. switch (stage) {
  296. case EShLangVertex: return spv::ExecutionModel::Vertex;
  297. case EShLangFragment: return spv::ExecutionModel::Fragment;
  298. case EShLangCompute: return spv::ExecutionModel::GLCompute;
  299. case EShLangTessControl: return spv::ExecutionModel::TessellationControl;
  300. case EShLangTessEvaluation: return spv::ExecutionModel::TessellationEvaluation;
  301. case EShLangGeometry: return spv::ExecutionModel::Geometry;
  302. case EShLangRayGen: return spv::ExecutionModel::RayGenerationKHR;
  303. case EShLangIntersect: return spv::ExecutionModel::IntersectionKHR;
  304. case EShLangAnyHit: return spv::ExecutionModel::AnyHitKHR;
  305. case EShLangClosestHit: return spv::ExecutionModel::ClosestHitKHR;
  306. case EShLangMiss: return spv::ExecutionModel::MissKHR;
  307. case EShLangCallable: return spv::ExecutionModel::CallableKHR;
  308. case EShLangTask: return (isMeshShaderEXT)? spv::ExecutionModel::TaskEXT : spv::ExecutionModel::TaskNV;
  309. case EShLangMesh: return (isMeshShaderEXT)? spv::ExecutionModel::MeshEXT : spv::ExecutionModel::MeshNV;
  310. default:
  311. assert(0);
  312. return spv::ExecutionModel::Fragment;
  313. }
  314. }
  315. // Translate glslang sampler type to SPIR-V dimensionality.
  316. spv::Dim TranslateDimensionality(const glslang::TSampler& sampler)
  317. {
  318. switch (sampler.dim) {
  319. case glslang::Esd1D: return spv::Dim::Dim1D;
  320. case glslang::Esd2D: return spv::Dim::Dim2D;
  321. case glslang::Esd3D: return spv::Dim::Dim3D;
  322. case glslang::EsdCube: return spv::Dim::Cube;
  323. case glslang::EsdRect: return spv::Dim::Rect;
  324. case glslang::EsdBuffer: return spv::Dim::Buffer;
  325. case glslang::EsdSubpass: return spv::Dim::SubpassData;
  326. case glslang::EsdAttachmentEXT: return spv::Dim::TileImageDataEXT;
  327. default:
  328. assert(0);
  329. return spv::Dim::Dim2D;
  330. }
  331. }
  332. // Translate glslang precision to SPIR-V precision decorations.
  333. spv::Decoration TranslatePrecisionDecoration(glslang::TPrecisionQualifier glslangPrecision)
  334. {
  335. switch (glslangPrecision) {
  336. case glslang::EpqLow: return spv::Decoration::RelaxedPrecision;
  337. case glslang::EpqMedium: return spv::Decoration::RelaxedPrecision;
  338. default:
  339. return spv::NoPrecision;
  340. }
  341. }
  342. // Translate glslang type to SPIR-V precision decorations.
  343. spv::Decoration TranslatePrecisionDecoration(const glslang::TType& type)
  344. {
  345. return TranslatePrecisionDecoration(type.getQualifier().precision);
  346. }
  347. // Translate glslang type to SPIR-V block decorations.
  348. spv::Decoration TranslateBlockDecoration(const glslang::TStorageQualifier storage, bool useStorageBuffer)
  349. {
  350. switch (storage) {
  351. case glslang::EvqUniform: return spv::Decoration::Block;
  352. case glslang::EvqBuffer: return useStorageBuffer ? spv::Decoration::Block : spv::Decoration::BufferBlock;
  353. case glslang::EvqVaryingIn: return spv::Decoration::Block;
  354. case glslang::EvqVaryingOut: return spv::Decoration::Block;
  355. case glslang::EvqShared: return spv::Decoration::Block;
  356. case glslang::EvqPayload: return spv::Decoration::Block;
  357. case glslang::EvqPayloadIn: return spv::Decoration::Block;
  358. case glslang::EvqHitAttr: return spv::Decoration::Block;
  359. case glslang::EvqCallableData: return spv::Decoration::Block;
  360. case glslang::EvqCallableDataIn: return spv::Decoration::Block;
  361. case glslang::EvqHitObjectAttrNV: return spv::Decoration::Block;
  362. case glslang::EvqHitObjectAttrEXT: return spv::Decoration::Block;
  363. default:
  364. assert(0);
  365. break;
  366. }
  367. return spv::Decoration::Max;
  368. }
  369. // Translate glslang type to SPIR-V memory decorations.
  370. void TranslateMemoryDecoration(const glslang::TQualifier& qualifier, std::vector<spv::Decoration>& memory,
  371. bool useVulkanMemoryModel)
  372. {
  373. if (!useVulkanMemoryModel) {
  374. if (qualifier.isVolatile()) {
  375. memory.push_back(spv::Decoration::Volatile);
  376. memory.push_back(spv::Decoration::Coherent);
  377. } else if (qualifier.isCoherent()) {
  378. memory.push_back(spv::Decoration::Coherent);
  379. }
  380. }
  381. if (qualifier.isRestrict())
  382. memory.push_back(spv::Decoration::Restrict);
  383. if (qualifier.isReadOnly())
  384. memory.push_back(spv::Decoration::NonWritable);
  385. if (qualifier.isWriteOnly())
  386. memory.push_back(spv::Decoration::NonReadable);
  387. }
  388. // Translate glslang type to SPIR-V layout decorations.
  389. spv::Decoration TranslateLayoutDecoration(const glslang::TType& type, glslang::TLayoutMatrix matrixLayout)
  390. {
  391. if (type.isMatrix()) {
  392. switch (matrixLayout) {
  393. case glslang::ElmRowMajor:
  394. return spv::Decoration::RowMajor;
  395. case glslang::ElmColumnMajor:
  396. return spv::Decoration::ColMajor;
  397. default:
  398. // opaque layouts don't need a majorness
  399. return spv::Decoration::Max;
  400. }
  401. } else {
  402. switch (type.getBasicType()) {
  403. default:
  404. return spv::Decoration::Max;
  405. break;
  406. case glslang::EbtBlock:
  407. switch (type.getQualifier().storage) {
  408. case glslang::EvqShared:
  409. case glslang::EvqUniform:
  410. case glslang::EvqBuffer:
  411. switch (type.getQualifier().layoutPacking) {
  412. case glslang::ElpShared: return spv::Decoration::GLSLShared;
  413. case glslang::ElpPacked: return spv::Decoration::GLSLPacked;
  414. default:
  415. return spv::Decoration::Max;
  416. }
  417. case glslang::EvqVaryingIn:
  418. case glslang::EvqVaryingOut:
  419. if (type.getQualifier().isTaskMemory()) {
  420. switch (type.getQualifier().layoutPacking) {
  421. case glslang::ElpShared: return spv::Decoration::GLSLShared;
  422. case glslang::ElpPacked: return spv::Decoration::GLSLPacked;
  423. default: break;
  424. }
  425. } else {
  426. assert(type.getQualifier().layoutPacking == glslang::ElpNone);
  427. }
  428. return spv::Decoration::Max;
  429. case glslang::EvqPayload:
  430. case glslang::EvqPayloadIn:
  431. case glslang::EvqHitAttr:
  432. case glslang::EvqCallableData:
  433. case glslang::EvqCallableDataIn:
  434. case glslang::EvqHitObjectAttrNV:
  435. case glslang::EvqHitObjectAttrEXT:
  436. return spv::Decoration::Max;
  437. default:
  438. assert(0);
  439. return spv::Decoration::Max;
  440. }
  441. }
  442. }
  443. }
  444. // Translate glslang type to SPIR-V interpolation decorations.
  445. // Returns spv::Decoration::Max when no decoration
  446. // should be applied.
  447. spv::Decoration TGlslangToSpvTraverser::TranslateInterpolationDecoration(const glslang::TQualifier& qualifier)
  448. {
  449. if (qualifier.smooth)
  450. // Smooth decoration doesn't exist in SPIR-V 1.0
  451. return spv::Decoration::Max;
  452. else if (qualifier.isNonPerspective())
  453. return spv::Decoration::NoPerspective;
  454. else if (qualifier.flat)
  455. return spv::Decoration::Flat;
  456. else if (qualifier.isExplicitInterpolation()) {
  457. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  458. return spv::Decoration::ExplicitInterpAMD;
  459. }
  460. else
  461. return spv::Decoration::Max;
  462. }
  463. // Translate glslang type to SPIR-V auxiliary storage decorations.
  464. // Returns spv::Decoration::Max when no decoration
  465. // should be applied.
  466. spv::Decoration TGlslangToSpvTraverser::TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier)
  467. {
  468. if (qualifier.centroid)
  469. return spv::Decoration::Centroid;
  470. else if (qualifier.patch)
  471. return spv::Decoration::Patch;
  472. else if (qualifier.sample) {
  473. builder.addCapability(spv::Capability::SampleRateShading);
  474. return spv::Decoration::Sample;
  475. }
  476. return spv::Decoration::Max;
  477. }
  478. // If glslang type is invariant, return SPIR-V invariant decoration.
  479. spv::Decoration TranslateInvariantDecoration(const glslang::TQualifier& qualifier)
  480. {
  481. if (qualifier.invariant)
  482. return spv::Decoration::Invariant;
  483. else
  484. return spv::Decoration::Max;
  485. }
  486. // If glslang type is noContraction, return SPIR-V NoContraction decoration.
  487. spv::Decoration TranslateNoContractionDecoration(const glslang::TQualifier& qualifier)
  488. {
  489. if (qualifier.isNoContraction())
  490. return spv::Decoration::NoContraction;
  491. else
  492. return spv::Decoration::Max;
  493. }
  494. // If glslang type is nonUniform, return SPIR-V NonUniform decoration.
  495. spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(const glslang::TQualifier& qualifier)
  496. {
  497. if (qualifier.isNonUniform()) {
  498. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  499. builder.addCapability(spv::Capability::ShaderNonUniformEXT);
  500. return spv::Decoration::NonUniformEXT;
  501. } else
  502. return spv::Decoration::Max;
  503. }
  504. // If lvalue flags contains nonUniform, return SPIR-V NonUniform decoration.
  505. spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(
  506. const spv::Builder::AccessChain::CoherentFlags& coherentFlags)
  507. {
  508. if (coherentFlags.isNonUniform()) {
  509. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  510. builder.addCapability(spv::Capability::ShaderNonUniformEXT);
  511. return spv::Decoration::NonUniformEXT;
  512. } else
  513. return spv::Decoration::Max;
  514. }
  515. spv::MemoryAccessMask TGlslangToSpvTraverser::TranslateMemoryAccess(
  516. const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  517. {
  518. spv::MemoryAccessMask mask = spv::MemoryAccessMask::MaskNone;
  519. if (!glslangIntermediate->usingVulkanMemoryModel() || coherentFlags.isImage)
  520. return mask;
  521. if (coherentFlags.isVolatile() || coherentFlags.anyCoherent()) {
  522. mask = mask | spv::MemoryAccessMask::MakePointerAvailableKHR |
  523. spv::MemoryAccessMask::MakePointerVisibleKHR;
  524. }
  525. if (coherentFlags.nonprivate) {
  526. mask = mask | spv::MemoryAccessMask::NonPrivatePointerKHR;
  527. }
  528. if (coherentFlags.volatil) {
  529. mask = mask | spv::MemoryAccessMask::Volatile;
  530. }
  531. if (coherentFlags.nontemporal) {
  532. mask = mask | spv::MemoryAccessMask::Nontemporal;
  533. }
  534. if (mask != spv::MemoryAccessMask::MaskNone) {
  535. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  536. }
  537. return mask;
  538. }
  539. spv::ImageOperandsMask TGlslangToSpvTraverser::TranslateImageOperands(
  540. const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  541. {
  542. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  543. if (!glslangIntermediate->usingVulkanMemoryModel())
  544. return mask;
  545. if (coherentFlags.volatil ||
  546. coherentFlags.anyCoherent()) {
  547. mask = mask | spv::ImageOperandsMask::MakeTexelAvailableKHR |
  548. spv::ImageOperandsMask::MakeTexelVisibleKHR;
  549. }
  550. if (coherentFlags.nonprivate) {
  551. mask = mask | spv::ImageOperandsMask::NonPrivateTexelKHR;
  552. }
  553. if (coherentFlags.volatil) {
  554. mask = mask | spv::ImageOperandsMask::VolatileTexelKHR;
  555. }
  556. if (coherentFlags.nontemporal && builder.getSpvVersion() >= spv::Spv_1_6) {
  557. mask = mask | spv::ImageOperandsMask::Nontemporal;
  558. }
  559. if (mask != spv::ImageOperandsMask::MaskNone) {
  560. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  561. }
  562. return mask;
  563. }
  564. spv::Builder::AccessChain::CoherentFlags TGlslangToSpvTraverser::TranslateCoherent(const glslang::TType& type)
  565. {
  566. spv::Builder::AccessChain::CoherentFlags flags = {};
  567. flags.coherent = type.getQualifier().coherent;
  568. flags.devicecoherent = type.getQualifier().devicecoherent;
  569. flags.queuefamilycoherent = type.getQualifier().queuefamilycoherent;
  570. // shared variables are implicitly workgroupcoherent in GLSL.
  571. flags.workgroupcoherent = type.getQualifier().workgroupcoherent ||
  572. type.getQualifier().storage == glslang::EvqShared;
  573. flags.subgroupcoherent = type.getQualifier().subgroupcoherent;
  574. flags.shadercallcoherent = type.getQualifier().shadercallcoherent;
  575. flags.volatil = type.getQualifier().volatil;
  576. flags.nontemporal = type.getQualifier().nontemporal;
  577. // *coherent variables are implicitly nonprivate in GLSL
  578. flags.nonprivate = type.getQualifier().nonprivate ||
  579. flags.anyCoherent() ||
  580. flags.volatil;
  581. flags.isImage = type.getBasicType() == glslang::EbtSampler;
  582. flags.nonUniform = type.getQualifier().nonUniform;
  583. return flags;
  584. }
  585. spv::Scope TGlslangToSpvTraverser::TranslateMemoryScope(
  586. const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  587. {
  588. spv::Scope scope = spv::Scope::Max;
  589. if (coherentFlags.volatil || coherentFlags.coherent) {
  590. // coherent defaults to Device scope in the old model, QueueFamilyKHR scope in the new model
  591. scope = glslangIntermediate->usingVulkanMemoryModel() ? spv::Scope::QueueFamilyKHR : spv::Scope::Device;
  592. } else if (coherentFlags.devicecoherent) {
  593. scope = spv::Scope::Device;
  594. } else if (coherentFlags.queuefamilycoherent) {
  595. scope = spv::Scope::QueueFamilyKHR;
  596. } else if (coherentFlags.workgroupcoherent) {
  597. scope = spv::Scope::Workgroup;
  598. } else if (coherentFlags.subgroupcoherent) {
  599. scope = spv::Scope::Subgroup;
  600. } else if (coherentFlags.shadercallcoherent) {
  601. scope = spv::Scope::ShaderCallKHR;
  602. }
  603. if (glslangIntermediate->usingVulkanMemoryModel() && scope == spv::Scope::Device) {
  604. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  605. }
  606. return scope;
  607. }
  608. // Translate a glslang built-in variable to a SPIR-V built in decoration. Also generate
  609. // associated capabilities when required. For some built-in variables, a capability
  610. // is generated only when using the variable in an executable instruction, but not when
  611. // just declaring a struct member variable with it. This is true for PointSize,
  612. // ClipDistance, and CullDistance.
  613. spv::BuiltIn TGlslangToSpvTraverser::TranslateBuiltInDecoration(glslang::TBuiltInVariable builtIn,
  614. bool memberDeclaration)
  615. {
  616. switch (builtIn) {
  617. case glslang::EbvPointSize:
  618. // Defer adding the capability until the built-in is actually used.
  619. if (! memberDeclaration) {
  620. switch (glslangIntermediate->getStage()) {
  621. case EShLangGeometry:
  622. builder.addCapability(spv::Capability::GeometryPointSize);
  623. break;
  624. case EShLangTessControl:
  625. case EShLangTessEvaluation:
  626. builder.addCapability(spv::Capability::TessellationPointSize);
  627. break;
  628. default:
  629. break;
  630. }
  631. }
  632. return spv::BuiltIn::PointSize;
  633. case glslang::EbvPosition: return spv::BuiltIn::Position;
  634. case glslang::EbvVertexId: return spv::BuiltIn::VertexId;
  635. case glslang::EbvInstanceId: return spv::BuiltIn::InstanceId;
  636. case glslang::EbvVertexIndex: return spv::BuiltIn::VertexIndex;
  637. case glslang::EbvInstanceIndex: return spv::BuiltIn::InstanceIndex;
  638. case glslang::EbvFragCoord: return spv::BuiltIn::FragCoord;
  639. case glslang::EbvPointCoord: return spv::BuiltIn::PointCoord;
  640. case glslang::EbvFace: return spv::BuiltIn::FrontFacing;
  641. case glslang::EbvFragDepth: return spv::BuiltIn::FragDepth;
  642. case glslang::EbvNumWorkGroups: return spv::BuiltIn::NumWorkgroups;
  643. case glslang::EbvWorkGroupSize: return spv::BuiltIn::WorkgroupSize;
  644. case glslang::EbvWorkGroupId: return spv::BuiltIn::WorkgroupId;
  645. case glslang::EbvLocalInvocationId: return spv::BuiltIn::LocalInvocationId;
  646. case glslang::EbvLocalInvocationIndex: return spv::BuiltIn::LocalInvocationIndex;
  647. case glslang::EbvGlobalInvocationId: return spv::BuiltIn::GlobalInvocationId;
  648. // These *Distance capabilities logically belong here, but if the member is declared and
  649. // then never used, consumers of SPIR-V prefer the capability not be declared.
  650. // They are now generated when used, rather than here when declared.
  651. // Potentially, the specification should be more clear what the minimum
  652. // use needed is to trigger the capability.
  653. //
  654. case glslang::EbvClipDistance:
  655. if (!memberDeclaration)
  656. builder.addCapability(spv::Capability::ClipDistance);
  657. return spv::BuiltIn::ClipDistance;
  658. case glslang::EbvCullDistance:
  659. if (!memberDeclaration)
  660. builder.addCapability(spv::Capability::CullDistance);
  661. return spv::BuiltIn::CullDistance;
  662. case glslang::EbvViewportIndex:
  663. if (glslangIntermediate->getStage() == EShLangGeometry ||
  664. glslangIntermediate->getStage() == EShLangFragment) {
  665. builder.addCapability(spv::Capability::MultiViewport);
  666. }
  667. if (glslangIntermediate->getStage() == EShLangVertex ||
  668. glslangIntermediate->getStage() == EShLangTessControl ||
  669. glslangIntermediate->getStage() == EShLangTessEvaluation) {
  670. if (builder.getSpvVersion() < spv::Spv_1_5) {
  671. builder.addIncorporatedExtension(spv::E_SPV_EXT_shader_viewport_index_layer, spv::Spv_1_5);
  672. builder.addCapability(spv::Capability::ShaderViewportIndexLayerEXT);
  673. }
  674. else
  675. builder.addCapability(spv::Capability::ShaderViewportIndex);
  676. }
  677. return spv::BuiltIn::ViewportIndex;
  678. case glslang::EbvSampleId:
  679. builder.addCapability(spv::Capability::SampleRateShading);
  680. return spv::BuiltIn::SampleId;
  681. case glslang::EbvSamplePosition:
  682. builder.addCapability(spv::Capability::SampleRateShading);
  683. return spv::BuiltIn::SamplePosition;
  684. case glslang::EbvSampleMask:
  685. return spv::BuiltIn::SampleMask;
  686. case glslang::EbvLayer:
  687. if (glslangIntermediate->getStage() == EShLangMesh) {
  688. return spv::BuiltIn::Layer;
  689. }
  690. if (glslangIntermediate->getStage() == EShLangGeometry ||
  691. glslangIntermediate->getStage() == EShLangFragment) {
  692. builder.addCapability(spv::Capability::Geometry);
  693. }
  694. if (glslangIntermediate->getStage() == EShLangVertex ||
  695. glslangIntermediate->getStage() == EShLangTessControl ||
  696. glslangIntermediate->getStage() == EShLangTessEvaluation) {
  697. if (builder.getSpvVersion() < spv::Spv_1_5) {
  698. builder.addIncorporatedExtension(spv::E_SPV_EXT_shader_viewport_index_layer, spv::Spv_1_5);
  699. builder.addCapability(spv::Capability::ShaderViewportIndexLayerEXT);
  700. } else
  701. builder.addCapability(spv::Capability::ShaderLayer);
  702. }
  703. return spv::BuiltIn::Layer;
  704. case glslang::EbvBaseVertex:
  705. builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);
  706. builder.addCapability(spv::Capability::DrawParameters);
  707. return spv::BuiltIn::BaseVertex;
  708. case glslang::EbvBaseInstance:
  709. builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);
  710. builder.addCapability(spv::Capability::DrawParameters);
  711. return spv::BuiltIn::BaseInstance;
  712. case glslang::EbvDrawId:
  713. builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);
  714. builder.addCapability(spv::Capability::DrawParameters);
  715. return spv::BuiltIn::DrawIndex;
  716. case glslang::EbvPrimitiveId:
  717. if (glslangIntermediate->getStage() == EShLangFragment)
  718. builder.addCapability(spv::Capability::Geometry);
  719. return spv::BuiltIn::PrimitiveId;
  720. case glslang::EbvFragStencilRef:
  721. builder.addExtension(spv::E_SPV_EXT_shader_stencil_export);
  722. builder.addCapability(spv::Capability::StencilExportEXT);
  723. return spv::BuiltIn::FragStencilRefEXT;
  724. case glslang::EbvShadingRateKHR:
  725. builder.addExtension(spv::E_SPV_KHR_fragment_shading_rate);
  726. builder.addCapability(spv::Capability::FragmentShadingRateKHR);
  727. return spv::BuiltIn::ShadingRateKHR;
  728. case glslang::EbvPrimitiveShadingRateKHR:
  729. builder.addExtension(spv::E_SPV_KHR_fragment_shading_rate);
  730. builder.addCapability(spv::Capability::FragmentShadingRateKHR);
  731. return spv::BuiltIn::PrimitiveShadingRateKHR;
  732. case glslang::EbvInvocationId: return spv::BuiltIn::InvocationId;
  733. case glslang::EbvTessLevelInner: return spv::BuiltIn::TessLevelInner;
  734. case glslang::EbvTessLevelOuter: return spv::BuiltIn::TessLevelOuter;
  735. case glslang::EbvTessCoord: return spv::BuiltIn::TessCoord;
  736. case glslang::EbvPatchVertices: return spv::BuiltIn::PatchVertices;
  737. case glslang::EbvHelperInvocation: return spv::BuiltIn::HelperInvocation;
  738. case glslang::EbvSubGroupSize:
  739. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  740. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  741. return spv::BuiltIn::SubgroupSize;
  742. case glslang::EbvSubGroupInvocation:
  743. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  744. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  745. return spv::BuiltIn::SubgroupLocalInvocationId;
  746. case glslang::EbvSubGroupEqMask:
  747. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  748. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  749. return spv::BuiltIn::SubgroupEqMask;
  750. case glslang::EbvSubGroupGeMask:
  751. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  752. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  753. return spv::BuiltIn::SubgroupGeMask;
  754. case glslang::EbvSubGroupGtMask:
  755. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  756. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  757. return spv::BuiltIn::SubgroupGtMask;
  758. case glslang::EbvSubGroupLeMask:
  759. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  760. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  761. return spv::BuiltIn::SubgroupLeMask;
  762. case glslang::EbvSubGroupLtMask:
  763. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  764. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  765. return spv::BuiltIn::SubgroupLtMask;
  766. case glslang::EbvNumSubgroups:
  767. builder.addCapability(spv::Capability::GroupNonUniform);
  768. return spv::BuiltIn::NumSubgroups;
  769. case glslang::EbvSubgroupID:
  770. builder.addCapability(spv::Capability::GroupNonUniform);
  771. return spv::BuiltIn::SubgroupId;
  772. case glslang::EbvSubgroupSize2:
  773. builder.addCapability(spv::Capability::GroupNonUniform);
  774. return spv::BuiltIn::SubgroupSize;
  775. case glslang::EbvSubgroupInvocation2:
  776. builder.addCapability(spv::Capability::GroupNonUniform);
  777. return spv::BuiltIn::SubgroupLocalInvocationId;
  778. case glslang::EbvSubgroupEqMask2:
  779. builder.addCapability(spv::Capability::GroupNonUniform);
  780. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  781. return spv::BuiltIn::SubgroupEqMask;
  782. case glslang::EbvSubgroupGeMask2:
  783. builder.addCapability(spv::Capability::GroupNonUniform);
  784. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  785. return spv::BuiltIn::SubgroupGeMask;
  786. case glslang::EbvSubgroupGtMask2:
  787. builder.addCapability(spv::Capability::GroupNonUniform);
  788. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  789. return spv::BuiltIn::SubgroupGtMask;
  790. case glslang::EbvSubgroupLeMask2:
  791. builder.addCapability(spv::Capability::GroupNonUniform);
  792. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  793. return spv::BuiltIn::SubgroupLeMask;
  794. case glslang::EbvSubgroupLtMask2:
  795. builder.addCapability(spv::Capability::GroupNonUniform);
  796. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  797. return spv::BuiltIn::SubgroupLtMask;
  798. case glslang::EbvBaryCoordNoPersp:
  799. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  800. return spv::BuiltIn::BaryCoordNoPerspAMD;
  801. case glslang::EbvBaryCoordNoPerspCentroid:
  802. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  803. return spv::BuiltIn::BaryCoordNoPerspCentroidAMD;
  804. case glslang::EbvBaryCoordNoPerspSample:
  805. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  806. return spv::BuiltIn::BaryCoordNoPerspSampleAMD;
  807. case glslang::EbvBaryCoordSmooth:
  808. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  809. return spv::BuiltIn::BaryCoordSmoothAMD;
  810. case glslang::EbvBaryCoordSmoothCentroid:
  811. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  812. return spv::BuiltIn::BaryCoordSmoothCentroidAMD;
  813. case glslang::EbvBaryCoordSmoothSample:
  814. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  815. return spv::BuiltIn::BaryCoordSmoothSampleAMD;
  816. case glslang::EbvBaryCoordPullModel:
  817. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  818. return spv::BuiltIn::BaryCoordPullModelAMD;
  819. case glslang::EbvDeviceIndex:
  820. builder.addIncorporatedExtension(spv::E_SPV_KHR_device_group, spv::Spv_1_3);
  821. builder.addCapability(spv::Capability::DeviceGroup);
  822. return spv::BuiltIn::DeviceIndex;
  823. case glslang::EbvViewIndex:
  824. builder.addIncorporatedExtension(spv::E_SPV_KHR_multiview, spv::Spv_1_3);
  825. builder.addCapability(spv::Capability::MultiView);
  826. return spv::BuiltIn::ViewIndex;
  827. case glslang::EbvFragSizeEXT:
  828. builder.addExtension(spv::E_SPV_EXT_fragment_invocation_density);
  829. builder.addCapability(spv::Capability::FragmentDensityEXT);
  830. return spv::BuiltIn::FragSizeEXT;
  831. case glslang::EbvFragInvocationCountEXT:
  832. builder.addExtension(spv::E_SPV_EXT_fragment_invocation_density);
  833. builder.addCapability(spv::Capability::FragmentDensityEXT);
  834. return spv::BuiltIn::FragInvocationCountEXT;
  835. case glslang::EbvViewportMaskNV:
  836. if (!memberDeclaration) {
  837. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  838. builder.addCapability(spv::Capability::ShaderViewportMaskNV);
  839. }
  840. return spv::BuiltIn::ViewportMaskNV;
  841. case glslang::EbvSecondaryPositionNV:
  842. if (!memberDeclaration) {
  843. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  844. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  845. }
  846. return spv::BuiltIn::SecondaryPositionNV;
  847. case glslang::EbvSecondaryViewportMaskNV:
  848. if (!memberDeclaration) {
  849. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  850. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  851. }
  852. return spv::BuiltIn::SecondaryViewportMaskNV;
  853. case glslang::EbvPositionPerViewNV:
  854. if (!memberDeclaration) {
  855. builder.addExtension(spv::E_SPV_NVX_multiview_per_view_attributes);
  856. builder.addCapability(spv::Capability::PerViewAttributesNV);
  857. }
  858. return spv::BuiltIn::PositionPerViewNV;
  859. case glslang::EbvViewportMaskPerViewNV:
  860. if (!memberDeclaration) {
  861. builder.addExtension(spv::E_SPV_NVX_multiview_per_view_attributes);
  862. builder.addCapability(spv::Capability::PerViewAttributesNV);
  863. }
  864. return spv::BuiltIn::ViewportMaskPerViewNV;
  865. case glslang::EbvFragFullyCoveredNV:
  866. builder.addExtension(spv::E_SPV_EXT_fragment_fully_covered);
  867. builder.addCapability(spv::Capability::FragmentFullyCoveredEXT);
  868. return spv::BuiltIn::FullyCoveredEXT;
  869. case glslang::EbvFragmentSizeNV:
  870. builder.addExtension(spv::E_SPV_NV_shading_rate);
  871. builder.addCapability(spv::Capability::ShadingRateNV);
  872. return spv::BuiltIn::FragmentSizeNV;
  873. case glslang::EbvInvocationsPerPixelNV:
  874. builder.addExtension(spv::E_SPV_NV_shading_rate);
  875. builder.addCapability(spv::Capability::ShadingRateNV);
  876. return spv::BuiltIn::InvocationsPerPixelNV;
  877. // ray tracing
  878. case glslang::EbvLaunchId:
  879. return spv::BuiltIn::LaunchIdKHR;
  880. case glslang::EbvLaunchSize:
  881. return spv::BuiltIn::LaunchSizeKHR;
  882. case glslang::EbvWorldRayOrigin:
  883. return spv::BuiltIn::WorldRayOriginKHR;
  884. case glslang::EbvWorldRayDirection:
  885. return spv::BuiltIn::WorldRayDirectionKHR;
  886. case glslang::EbvObjectRayOrigin:
  887. return spv::BuiltIn::ObjectRayOriginKHR;
  888. case glslang::EbvObjectRayDirection:
  889. return spv::BuiltIn::ObjectRayDirectionKHR;
  890. case glslang::EbvRayTmin:
  891. return spv::BuiltIn::RayTminKHR;
  892. case glslang::EbvRayTmax:
  893. return spv::BuiltIn::RayTmaxKHR;
  894. case glslang::EbvCullMask:
  895. return spv::BuiltIn::CullMaskKHR;
  896. case glslang::EbvPositionFetch:
  897. return spv::BuiltIn::HitTriangleVertexPositionsKHR;
  898. case glslang::EbvInstanceCustomIndex:
  899. return spv::BuiltIn::InstanceCustomIndexKHR;
  900. case glslang::EbvHitKind:
  901. return spv::BuiltIn::HitKindKHR;
  902. case glslang::EbvObjectToWorld:
  903. case glslang::EbvObjectToWorld3x4:
  904. return spv::BuiltIn::ObjectToWorldKHR;
  905. case glslang::EbvWorldToObject:
  906. case glslang::EbvWorldToObject3x4:
  907. return spv::BuiltIn::WorldToObjectKHR;
  908. case glslang::EbvIncomingRayFlags:
  909. return spv::BuiltIn::IncomingRayFlagsKHR;
  910. case glslang::EbvGeometryIndex:
  911. return spv::BuiltIn::RayGeometryIndexKHR;
  912. case glslang::EbvCurrentRayTimeNV:
  913. builder.addExtension(spv::E_SPV_NV_ray_tracing_motion_blur);
  914. builder.addCapability(spv::Capability::RayTracingMotionBlurNV);
  915. return spv::BuiltIn::CurrentRayTimeNV;
  916. case glslang::EbvMicroTrianglePositionNV:
  917. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  918. builder.addExtension("SPV_NV_displacement_micromap");
  919. return spv::BuiltIn::HitMicroTriangleVertexPositionsNV;
  920. case glslang::EbvMicroTriangleBaryNV:
  921. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  922. builder.addExtension("SPV_NV_displacement_micromap");
  923. return spv::BuiltIn::HitMicroTriangleVertexBarycentricsNV;
  924. case glslang::EbvHitKindFrontFacingMicroTriangleNV:
  925. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  926. builder.addExtension("SPV_NV_displacement_micromap");
  927. return spv::BuiltIn::HitKindFrontFacingMicroTriangleNV;
  928. case glslang::EbvHitKindBackFacingMicroTriangleNV:
  929. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  930. builder.addExtension("SPV_NV_displacement_micromap");
  931. return spv::BuiltIn::HitKindBackFacingMicroTriangleNV;
  932. case glslang::EbvClusterIDNV:
  933. builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
  934. builder.addExtension("SPV_NV_cluster_acceleration_structure");
  935. return spv::BuiltIn::ClusterIDNV;
  936. case glslang::EbvHitIsSphereNV:
  937. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  938. builder.addExtension("SPV_NV_linear_swept_spheres");
  939. return spv::BuiltIn::HitIsSphereNV;
  940. case glslang::EbvHitIsLSSNV:
  941. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  942. builder.addExtension("SPV_NV_linear_swept_spheres");
  943. return spv::BuiltIn::HitIsLSSNV;
  944. case glslang::EbvHitSpherePositionNV:
  945. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  946. builder.addExtension("SPV_NV_linear_swept_spheres");
  947. return spv::BuiltIn::HitSpherePositionNV;
  948. case glslang::EbvHitSphereRadiusNV:
  949. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  950. builder.addExtension("SPV_NV_linear_swept_spheres");
  951. return spv::BuiltIn::HitSphereRadiusNV;
  952. case glslang::EbvHitLSSPositionsNV:
  953. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  954. builder.addExtension("SPV_NV_linear_swept_spheres");
  955. return spv::BuiltIn::HitLSSPositionsNV;
  956. case glslang::EbvHitLSSRadiiNV:
  957. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  958. builder.addExtension("SPV_NV_linear_swept_spheres");
  959. return spv::BuiltIn::HitLSSRadiiNV;
  960. // barycentrics
  961. case glslang::EbvBaryCoordNV:
  962. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  963. builder.addCapability(spv::Capability::FragmentBarycentricNV);
  964. return spv::BuiltIn::BaryCoordNV;
  965. case glslang::EbvBaryCoordNoPerspNV:
  966. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  967. builder.addCapability(spv::Capability::FragmentBarycentricNV);
  968. return spv::BuiltIn::BaryCoordNoPerspNV;
  969. case glslang::EbvBaryCoordEXT:
  970. builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
  971. builder.addCapability(spv::Capability::FragmentBarycentricKHR);
  972. return spv::BuiltIn::BaryCoordKHR;
  973. case glslang::EbvBaryCoordNoPerspEXT:
  974. builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
  975. builder.addCapability(spv::Capability::FragmentBarycentricKHR);
  976. return spv::BuiltIn::BaryCoordNoPerspKHR;
  977. // mesh shaders
  978. case glslang::EbvTaskCountNV:
  979. return spv::BuiltIn::TaskCountNV;
  980. case glslang::EbvPrimitiveCountNV:
  981. return spv::BuiltIn::PrimitiveCountNV;
  982. case glslang::EbvPrimitiveIndicesNV:
  983. return spv::BuiltIn::PrimitiveIndicesNV;
  984. case glslang::EbvClipDistancePerViewNV:
  985. return spv::BuiltIn::ClipDistancePerViewNV;
  986. case glslang::EbvCullDistancePerViewNV:
  987. return spv::BuiltIn::CullDistancePerViewNV;
  988. case glslang::EbvLayerPerViewNV:
  989. return spv::BuiltIn::LayerPerViewNV;
  990. case glslang::EbvMeshViewCountNV:
  991. return spv::BuiltIn::MeshViewCountNV;
  992. case glslang::EbvMeshViewIndicesNV:
  993. return spv::BuiltIn::MeshViewIndicesNV;
  994. // SPV_EXT_mesh_shader
  995. case glslang::EbvPrimitivePointIndicesEXT:
  996. return spv::BuiltIn::PrimitivePointIndicesEXT;
  997. case glslang::EbvPrimitiveLineIndicesEXT:
  998. return spv::BuiltIn::PrimitiveLineIndicesEXT;
  999. case glslang::EbvPrimitiveTriangleIndicesEXT:
  1000. return spv::BuiltIn::PrimitiveTriangleIndicesEXT;
  1001. case glslang::EbvCullPrimitiveEXT:
  1002. return spv::BuiltIn::CullPrimitiveEXT;
  1003. // sm builtins
  1004. case glslang::EbvWarpsPerSM:
  1005. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1006. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1007. return spv::BuiltIn::WarpsPerSMNV;
  1008. case glslang::EbvSMCount:
  1009. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1010. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1011. return spv::BuiltIn::SMCountNV;
  1012. case glslang::EbvWarpID:
  1013. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1014. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1015. return spv::BuiltIn::WarpIDNV;
  1016. case glslang::EbvSMID:
  1017. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1018. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1019. return spv::BuiltIn::SMIDNV;
  1020. // ARM builtins
  1021. case glslang::EbvCoreCountARM:
  1022. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1023. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1024. return spv::BuiltIn::CoreCountARM;
  1025. case glslang::EbvCoreIDARM:
  1026. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1027. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1028. return spv::BuiltIn::CoreIDARM;
  1029. case glslang::EbvCoreMaxIDARM:
  1030. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1031. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1032. return spv::BuiltIn::CoreMaxIDARM;
  1033. case glslang::EbvWarpIDARM:
  1034. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1035. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1036. return spv::BuiltIn::WarpIDARM;
  1037. case glslang::EbvWarpMaxIDARM:
  1038. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1039. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1040. return spv::BuiltIn::WarpMaxIDARM;
  1041. // QCOM builtins
  1042. case glslang::EbvTileOffsetQCOM:
  1043. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1044. return spv::BuiltIn::TileOffsetQCOM;
  1045. case glslang::EbvTileDimensionQCOM:
  1046. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1047. return spv::BuiltIn::TileDimensionQCOM;
  1048. case glslang::EbvTileApronSizeQCOM:
  1049. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1050. return spv::BuiltIn::TileApronSizeQCOM;
  1051. default:
  1052. return spv::BuiltIn::Max;
  1053. }
  1054. }
  1055. // Translate glslang image layout format to SPIR-V image format.
  1056. spv::ImageFormat TGlslangToSpvTraverser::TranslateImageFormat(const glslang::TType& type)
  1057. {
  1058. assert(type.getBasicType() == glslang::EbtSampler);
  1059. // Check for capabilities
  1060. switch (type.getQualifier().getFormat()) {
  1061. case glslang::ElfRg32f:
  1062. case glslang::ElfRg16f:
  1063. case glslang::ElfR11fG11fB10f:
  1064. case glslang::ElfR16f:
  1065. case glslang::ElfRgba16:
  1066. case glslang::ElfRgb10A2:
  1067. case glslang::ElfRg16:
  1068. case glslang::ElfRg8:
  1069. case glslang::ElfR16:
  1070. case glslang::ElfR8:
  1071. case glslang::ElfRgba16Snorm:
  1072. case glslang::ElfRg16Snorm:
  1073. case glslang::ElfRg8Snorm:
  1074. case glslang::ElfR16Snorm:
  1075. case glslang::ElfR8Snorm:
  1076. case glslang::ElfRg32i:
  1077. case glslang::ElfRg16i:
  1078. case glslang::ElfRg8i:
  1079. case glslang::ElfR16i:
  1080. case glslang::ElfR8i:
  1081. case glslang::ElfRgb10a2ui:
  1082. case glslang::ElfRg32ui:
  1083. case glslang::ElfRg16ui:
  1084. case glslang::ElfRg8ui:
  1085. case glslang::ElfR16ui:
  1086. case glslang::ElfR8ui:
  1087. builder.addCapability(spv::Capability::StorageImageExtendedFormats);
  1088. break;
  1089. case glslang::ElfR64ui:
  1090. case glslang::ElfR64i:
  1091. builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
  1092. builder.addCapability(spv::Capability::Int64ImageEXT);
  1093. break;
  1094. default:
  1095. break;
  1096. }
  1097. // do the translation
  1098. switch (type.getQualifier().getFormat()) {
  1099. case glslang::ElfNone: return spv::ImageFormat::Unknown;
  1100. case glslang::ElfRgba32f: return spv::ImageFormat::Rgba32f;
  1101. case glslang::ElfRgba16f: return spv::ImageFormat::Rgba16f;
  1102. case glslang::ElfR32f: return spv::ImageFormat::R32f;
  1103. case glslang::ElfRgba8: return spv::ImageFormat::Rgba8;
  1104. case glslang::ElfRgba8Snorm: return spv::ImageFormat::Rgba8Snorm;
  1105. case glslang::ElfRg32f: return spv::ImageFormat::Rg32f;
  1106. case glslang::ElfRg16f: return spv::ImageFormat::Rg16f;
  1107. case glslang::ElfR11fG11fB10f: return spv::ImageFormat::R11fG11fB10f;
  1108. case glslang::ElfR16f: return spv::ImageFormat::R16f;
  1109. case glslang::ElfRgba16: return spv::ImageFormat::Rgba16;
  1110. case glslang::ElfRgb10A2: return spv::ImageFormat::Rgb10A2;
  1111. case glslang::ElfRg16: return spv::ImageFormat::Rg16;
  1112. case glslang::ElfRg8: return spv::ImageFormat::Rg8;
  1113. case glslang::ElfR16: return spv::ImageFormat::R16;
  1114. case glslang::ElfR8: return spv::ImageFormat::R8;
  1115. case glslang::ElfRgba16Snorm: return spv::ImageFormat::Rgba16Snorm;
  1116. case glslang::ElfRg16Snorm: return spv::ImageFormat::Rg16Snorm;
  1117. case glslang::ElfRg8Snorm: return spv::ImageFormat::Rg8Snorm;
  1118. case glslang::ElfR16Snorm: return spv::ImageFormat::R16Snorm;
  1119. case glslang::ElfR8Snorm: return spv::ImageFormat::R8Snorm;
  1120. case glslang::ElfRgba32i: return spv::ImageFormat::Rgba32i;
  1121. case glslang::ElfRgba16i: return spv::ImageFormat::Rgba16i;
  1122. case glslang::ElfRgba8i: return spv::ImageFormat::Rgba8i;
  1123. case glslang::ElfR32i: return spv::ImageFormat::R32i;
  1124. case glslang::ElfRg32i: return spv::ImageFormat::Rg32i;
  1125. case glslang::ElfRg16i: return spv::ImageFormat::Rg16i;
  1126. case glslang::ElfRg8i: return spv::ImageFormat::Rg8i;
  1127. case glslang::ElfR16i: return spv::ImageFormat::R16i;
  1128. case glslang::ElfR8i: return spv::ImageFormat::R8i;
  1129. case glslang::ElfRgba32ui: return spv::ImageFormat::Rgba32ui;
  1130. case glslang::ElfRgba16ui: return spv::ImageFormat::Rgba16ui;
  1131. case glslang::ElfRgba8ui: return spv::ImageFormat::Rgba8ui;
  1132. case glslang::ElfR32ui: return spv::ImageFormat::R32ui;
  1133. case glslang::ElfRg32ui: return spv::ImageFormat::Rg32ui;
  1134. case glslang::ElfRg16ui: return spv::ImageFormat::Rg16ui;
  1135. case glslang::ElfRgb10a2ui: return spv::ImageFormat::Rgb10a2ui;
  1136. case glslang::ElfRg8ui: return spv::ImageFormat::Rg8ui;
  1137. case glslang::ElfR16ui: return spv::ImageFormat::R16ui;
  1138. case glslang::ElfR8ui: return spv::ImageFormat::R8ui;
  1139. case glslang::ElfR64ui: return spv::ImageFormat::R64ui;
  1140. case glslang::ElfR64i: return spv::ImageFormat::R64i;
  1141. default: return spv::ImageFormat::Max;
  1142. }
  1143. }
  1144. spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSelectionControl(
  1145. const glslang::TIntermSelection& selectionNode) const
  1146. {
  1147. if (selectionNode.getFlatten())
  1148. return spv::SelectionControlMask::Flatten;
  1149. if (selectionNode.getDontFlatten())
  1150. return spv::SelectionControlMask::DontFlatten;
  1151. return spv::SelectionControlMask::MaskNone;
  1152. }
  1153. spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSwitchControl(const glslang::TIntermSwitch& switchNode)
  1154. const
  1155. {
  1156. if (switchNode.getFlatten())
  1157. return spv::SelectionControlMask::Flatten;
  1158. if (switchNode.getDontFlatten())
  1159. return spv::SelectionControlMask::DontFlatten;
  1160. return spv::SelectionControlMask::MaskNone;
  1161. }
  1162. // return a non-0 dependency if the dependency argument must be set
  1163. spv::LoopControlMask TGlslangToSpvTraverser::TranslateLoopControl(const glslang::TIntermLoop& loopNode,
  1164. std::vector<unsigned int>& operands) const
  1165. {
  1166. spv::LoopControlMask control = spv::LoopControlMask::MaskNone;
  1167. if (loopNode.getDontUnroll())
  1168. control = control | spv::LoopControlMask::DontUnroll;
  1169. if (loopNode.getUnroll())
  1170. control = control | spv::LoopControlMask::Unroll;
  1171. if (unsigned(loopNode.getLoopDependency()) == glslang::TIntermLoop::dependencyInfinite)
  1172. control = control | spv::LoopControlMask::DependencyInfinite;
  1173. else if (loopNode.getLoopDependency() > 0) {
  1174. control = control | spv::LoopControlMask::DependencyLength;
  1175. operands.push_back((unsigned int)loopNode.getLoopDependency());
  1176. }
  1177. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  1178. if (loopNode.getMinIterations() > 0) {
  1179. control = control | spv::LoopControlMask::MinIterations;
  1180. operands.push_back(loopNode.getMinIterations());
  1181. }
  1182. if (loopNode.getMaxIterations() < glslang::TIntermLoop::iterationsInfinite) {
  1183. control = control | spv::LoopControlMask::MaxIterations;
  1184. operands.push_back(loopNode.getMaxIterations());
  1185. }
  1186. if (loopNode.getIterationMultiple() > 1) {
  1187. control = control | spv::LoopControlMask::IterationMultiple;
  1188. operands.push_back(loopNode.getIterationMultiple());
  1189. }
  1190. if (loopNode.getPeelCount() > 0) {
  1191. control = control | spv::LoopControlMask::PeelCount;
  1192. operands.push_back(loopNode.getPeelCount());
  1193. }
  1194. if (loopNode.getPartialCount() > 0) {
  1195. control = control | spv::LoopControlMask::PartialCount;
  1196. operands.push_back(loopNode.getPartialCount());
  1197. }
  1198. }
  1199. return control;
  1200. }
  1201. // Translate glslang type to SPIR-V storage class.
  1202. spv::StorageClass TGlslangToSpvTraverser::TranslateStorageClass(const glslang::TType& type)
  1203. {
  1204. if (type.getBasicType() == glslang::EbtRayQuery || type.getBasicType() == glslang::EbtHitObjectNV
  1205. || type.getBasicType() == glslang::EbtHitObjectEXT)
  1206. return spv::StorageClass::Private;
  1207. if (type.getQualifier().isSpirvByReference()) {
  1208. if (type.getQualifier().isParamInput() || type.getQualifier().isParamOutput())
  1209. return spv::StorageClass::Function;
  1210. }
  1211. if (type.getQualifier().isPipeInput())
  1212. return spv::StorageClass::Input;
  1213. if (type.getQualifier().isPipeOutput())
  1214. return spv::StorageClass::Output;
  1215. if (type.getQualifier().storage == glslang::EvqTileImageEXT || type.isAttachmentEXT()) {
  1216. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1217. builder.addCapability(spv::Capability::TileImageColorReadAccessEXT);
  1218. return spv::StorageClass::TileImageEXT;
  1219. }
  1220. if (type.getQualifier().isTileAttachmentQCOM()) {
  1221. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1222. builder.addCapability(spv::Capability::TileShadingQCOM);
  1223. return spv::StorageClass::TileAttachmentQCOM;
  1224. }
  1225. if (glslangIntermediate->getSource() != glslang::EShSourceHlsl ||
  1226. type.getQualifier().storage == glslang::EvqUniform) {
  1227. if (type.isAtomic())
  1228. return spv::StorageClass::AtomicCounter;
  1229. if (type.containsOpaque() && !glslangIntermediate->getBindlessMode())
  1230. return spv::StorageClass::UniformConstant;
  1231. }
  1232. if (type.getQualifier().isUniformOrBuffer() &&
  1233. type.getQualifier().isShaderRecord()) {
  1234. return spv::StorageClass::ShaderRecordBufferKHR;
  1235. }
  1236. if (glslangIntermediate->usingStorageBuffer() && type.getQualifier().storage == glslang::EvqBuffer) {
  1237. builder.addIncorporatedExtension(spv::E_SPV_KHR_storage_buffer_storage_class, spv::Spv_1_3);
  1238. return spv::StorageClass::StorageBuffer;
  1239. }
  1240. if (type.getQualifier().isUniformOrBuffer()) {
  1241. if (type.getQualifier().isPushConstant())
  1242. return spv::StorageClass::PushConstant;
  1243. if (type.getBasicType() == glslang::EbtBlock)
  1244. return spv::StorageClass::Uniform;
  1245. return spv::StorageClass::UniformConstant;
  1246. }
  1247. if (type.getQualifier().storage == glslang::EvqShared && type.getBasicType() == glslang::EbtBlock) {
  1248. builder.addExtension(spv::E_SPV_KHR_workgroup_memory_explicit_layout);
  1249. builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayoutKHR);
  1250. return spv::StorageClass::Workgroup;
  1251. }
  1252. switch (type.getQualifier().storage) {
  1253. case glslang::EvqGlobal: return spv::StorageClass::Private;
  1254. case glslang::EvqConstReadOnly: return spv::StorageClass::Function;
  1255. case glslang::EvqTemporary: return spv::StorageClass::Function;
  1256. case glslang::EvqShared: return spv::StorageClass::Workgroup;
  1257. case glslang::EvqPayload: return spv::StorageClass::RayPayloadKHR;
  1258. case glslang::EvqPayloadIn: return spv::StorageClass::IncomingRayPayloadKHR;
  1259. case glslang::EvqHitAttr: return spv::StorageClass::HitAttributeKHR;
  1260. case glslang::EvqCallableData: return spv::StorageClass::CallableDataKHR;
  1261. case glslang::EvqCallableDataIn: return spv::StorageClass::IncomingCallableDataKHR;
  1262. case glslang::EvqtaskPayloadSharedEXT : return spv::StorageClass::TaskPayloadWorkgroupEXT;
  1263. case glslang::EvqHitObjectAttrNV: return spv::StorageClass::HitObjectAttributeNV;
  1264. case glslang::EvqHitObjectAttrEXT: return spv::StorageClass::HitObjectAttributeEXT;
  1265. case glslang::EvqSpirvStorageClass: return static_cast<spv::StorageClass>(type.getQualifier().spirvStorageClass);
  1266. default:
  1267. assert(0);
  1268. break;
  1269. }
  1270. return spv::StorageClass::Function;
  1271. }
  1272. // Translate glslang constants to SPIR-V literals
  1273. void TGlslangToSpvTraverser::TranslateLiterals(const glslang::TVector<const glslang::TIntermConstantUnion*>& constants,
  1274. std::vector<unsigned>& literals) const
  1275. {
  1276. for (auto constant : constants) {
  1277. if (constant->getBasicType() == glslang::EbtFloat) {
  1278. float floatValue = static_cast<float>(constant->getConstArray()[0].getDConst());
  1279. unsigned literal;
  1280. static_assert(sizeof(literal) == sizeof(floatValue), "sizeof(unsigned) != sizeof(float)");
  1281. memcpy(&literal, &floatValue, sizeof(literal));
  1282. literals.push_back(literal);
  1283. } else if (constant->getBasicType() == glslang::EbtInt) {
  1284. unsigned literal = constant->getConstArray()[0].getIConst();
  1285. literals.push_back(literal);
  1286. } else if (constant->getBasicType() == glslang::EbtUint) {
  1287. unsigned literal = constant->getConstArray()[0].getUConst();
  1288. literals.push_back(literal);
  1289. } else if (constant->getBasicType() == glslang::EbtBool) {
  1290. unsigned literal = constant->getConstArray()[0].getBConst();
  1291. literals.push_back(literal);
  1292. } else if (constant->getBasicType() == glslang::EbtString) {
  1293. auto str = constant->getConstArray()[0].getSConst()->c_str();
  1294. unsigned literal = 0;
  1295. char* literalPtr = reinterpret_cast<char*>(&literal);
  1296. unsigned charCount = 0;
  1297. char ch = 0;
  1298. do {
  1299. ch = *(str++);
  1300. *(literalPtr++) = ch;
  1301. ++charCount;
  1302. if (charCount == 4) {
  1303. literals.push_back(literal);
  1304. literalPtr = reinterpret_cast<char*>(&literal);
  1305. charCount = 0;
  1306. }
  1307. } while (ch != 0);
  1308. // Partial literal is padded with 0
  1309. if (charCount > 0) {
  1310. for (; charCount < 4; ++charCount)
  1311. *(literalPtr++) = 0;
  1312. literals.push_back(literal);
  1313. }
  1314. } else
  1315. assert(0); // Unexpected type
  1316. }
  1317. }
  1318. // Add capabilities pertaining to how an array is indexed.
  1319. void TGlslangToSpvTraverser::addIndirectionIndexCapabilities(const glslang::TType& baseType,
  1320. const glslang::TType& indexType)
  1321. {
  1322. if (indexType.getQualifier().isNonUniform()) {
  1323. // deal with an asserted non-uniform index
  1324. // SPV_EXT_descriptor_indexing already added in TranslateNonUniformDecoration
  1325. if (baseType.getBasicType() == glslang::EbtSampler) {
  1326. if (baseType.getQualifier().hasAttachment())
  1327. builder.addCapability(spv::Capability::InputAttachmentArrayNonUniformIndexingEXT);
  1328. else if (baseType.isImage() && baseType.getSampler().isBuffer())
  1329. builder.addCapability(spv::Capability::StorageTexelBufferArrayNonUniformIndexingEXT);
  1330. else if (baseType.isTexture() && baseType.getSampler().isBuffer())
  1331. builder.addCapability(spv::Capability::UniformTexelBufferArrayNonUniformIndexingEXT);
  1332. else if (baseType.isImage())
  1333. builder.addCapability(spv::Capability::StorageImageArrayNonUniformIndexingEXT);
  1334. else if (baseType.isTexture())
  1335. builder.addCapability(spv::Capability::SampledImageArrayNonUniformIndexingEXT);
  1336. } else if (baseType.getBasicType() == glslang::EbtBlock) {
  1337. if (baseType.getQualifier().storage == glslang::EvqBuffer)
  1338. builder.addCapability(spv::Capability::StorageBufferArrayNonUniformIndexingEXT);
  1339. else if (baseType.getQualifier().storage == glslang::EvqUniform)
  1340. builder.addCapability(spv::Capability::UniformBufferArrayNonUniformIndexingEXT);
  1341. }
  1342. } else {
  1343. // assume a dynamically uniform index
  1344. if (baseType.getBasicType() == glslang::EbtSampler) {
  1345. if (baseType.getQualifier().hasAttachment()) {
  1346. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  1347. builder.addCapability(spv::Capability::InputAttachmentArrayDynamicIndexingEXT);
  1348. } else if (baseType.isImage() && baseType.getSampler().isBuffer()) {
  1349. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  1350. builder.addCapability(spv::Capability::StorageTexelBufferArrayDynamicIndexingEXT);
  1351. } else if (baseType.isTexture() && baseType.getSampler().isBuffer()) {
  1352. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  1353. builder.addCapability(spv::Capability::UniformTexelBufferArrayDynamicIndexingEXT);
  1354. }
  1355. }
  1356. }
  1357. }
  1358. // Return whether or not the given type is something that should be tied to a
  1359. // descriptor set.
  1360. bool IsDescriptorResource(const glslang::TType& type)
  1361. {
  1362. // uniform and buffer blocks are included, unless it is a push_constant
  1363. if (type.getBasicType() == glslang::EbtBlock)
  1364. return type.getQualifier().isUniformOrBuffer() &&
  1365. ! type.getQualifier().isShaderRecord() &&
  1366. ! type.getQualifier().isPushConstant();
  1367. // non block...
  1368. // basically samplerXXX/subpass/sampler/texture are all included
  1369. // if they are the global-scope-class, not the function parameter
  1370. // (or local, if they ever exist) class.
  1371. if (type.getBasicType() == glslang::EbtSampler ||
  1372. type.getBasicType() == glslang::EbtAccStruct)
  1373. return type.getQualifier().isUniformOrBuffer();
  1374. // Tensors are tied to a descriptor.
  1375. if (type.isTensorARM())
  1376. return true;
  1377. // None of the above.
  1378. return false;
  1379. }
  1380. void InheritQualifiers(glslang::TQualifier& child, const glslang::TQualifier& parent)
  1381. {
  1382. if (child.layoutMatrix == glslang::ElmNone)
  1383. child.layoutMatrix = parent.layoutMatrix;
  1384. if (parent.invariant)
  1385. child.invariant = true;
  1386. if (parent.flat)
  1387. child.flat = true;
  1388. if (parent.centroid)
  1389. child.centroid = true;
  1390. if (parent.nopersp)
  1391. child.nopersp = true;
  1392. if (parent.explicitInterp)
  1393. child.explicitInterp = true;
  1394. if (parent.perPrimitiveNV)
  1395. child.perPrimitiveNV = true;
  1396. if (parent.perViewNV)
  1397. child.perViewNV = true;
  1398. if (parent.perTaskNV)
  1399. child.perTaskNV = true;
  1400. if (parent.storage == glslang::EvqtaskPayloadSharedEXT)
  1401. child.storage = glslang::EvqtaskPayloadSharedEXT;
  1402. if (parent.patch)
  1403. child.patch = true;
  1404. if (parent.sample)
  1405. child.sample = true;
  1406. if (parent.coherent)
  1407. child.coherent = true;
  1408. if (parent.devicecoherent)
  1409. child.devicecoherent = true;
  1410. if (parent.queuefamilycoherent)
  1411. child.queuefamilycoherent = true;
  1412. if (parent.workgroupcoherent)
  1413. child.workgroupcoherent = true;
  1414. if (parent.subgroupcoherent)
  1415. child.subgroupcoherent = true;
  1416. if (parent.shadercallcoherent)
  1417. child.shadercallcoherent = true;
  1418. if (parent.nonprivate)
  1419. child.nonprivate = true;
  1420. if (parent.volatil)
  1421. child.volatil = true;
  1422. if (parent.nontemporal)
  1423. child.nontemporal = true;
  1424. if (parent.restrict)
  1425. child.restrict = true;
  1426. if (parent.readonly)
  1427. child.readonly = true;
  1428. if (parent.writeonly)
  1429. child.writeonly = true;
  1430. if (parent.nonUniform)
  1431. child.nonUniform = true;
  1432. }
  1433. bool HasNonLayoutQualifiers(const glslang::TType& type, const glslang::TQualifier& qualifier)
  1434. {
  1435. // This should list qualifiers that simultaneous satisfy:
  1436. // - struct members might inherit from a struct declaration
  1437. // (note that non-block structs don't explicitly inherit,
  1438. // only implicitly, meaning no decoration involved)
  1439. // - affect decorations on the struct members
  1440. // (note smooth does not, and expecting something like volatile
  1441. // to effect the whole object)
  1442. // - are not part of the offset/st430/etc or row/column-major layout
  1443. return qualifier.invariant || (qualifier.hasLocation() && type.getBasicType() == glslang::EbtBlock);
  1444. }
  1445. //
  1446. // Implement the TGlslangToSpvTraverser class.
  1447. //
  1448. TGlslangToSpvTraverser::TGlslangToSpvTraverser(unsigned int spvVersion,
  1449. const glslang::TIntermediate* glslangIntermediate,
  1450. spv::SpvBuildLogger* buildLogger, glslang::SpvOptions& options) :
  1451. TIntermTraverser(true, false, true),
  1452. options(options),
  1453. shaderEntry(nullptr), currentFunction(nullptr),
  1454. sequenceDepth(0), logger(buildLogger),
  1455. builder(spvVersion, (glslang::GetKhronosToolId() << 16) | glslang::GetSpirvGeneratorVersion(), logger),
  1456. inEntryPoint(false), entryPointTerminated(false), linkageOnly(false),
  1457. glslangIntermediate(glslangIntermediate),
  1458. nanMinMaxClamp(glslangIntermediate->getNanMinMaxClamp()),
  1459. nonSemanticDebugPrintf(0),
  1460. taskPayloadID(0)
  1461. {
  1462. bool isMeshShaderExt = (glslangIntermediate->getRequestedExtensions().find(glslang::E_GL_EXT_mesh_shader) !=
  1463. glslangIntermediate->getRequestedExtensions().end());
  1464. spv::ExecutionModel executionModel = TranslateExecutionModel(glslangIntermediate->getStage(), isMeshShaderExt);
  1465. builder.clearAccessChain();
  1466. builder.setSource(TranslateSourceLanguage(glslangIntermediate->getSource(), glslangIntermediate->getProfile()),
  1467. glslangIntermediate->getVersion());
  1468. if (options.emitNonSemanticShaderDebugSource)
  1469. this->options.emitNonSemanticShaderDebugInfo = true;
  1470. if (options.emitNonSemanticShaderDebugInfo)
  1471. this->options.generateDebugInfo = true;
  1472. if (this->options.generateDebugInfo) {
  1473. if (this->options.emitNonSemanticShaderDebugInfo) {
  1474. builder.setEmitNonSemanticShaderDebugInfo(this->options.emitNonSemanticShaderDebugSource);
  1475. }
  1476. else {
  1477. builder.setEmitSpirvDebugInfo();
  1478. }
  1479. builder.setDebugMainSourceFile(glslangIntermediate->getSourceFile());
  1480. // Set the source shader's text. If for SPV version 1.0, include
  1481. // a preamble in comments stating the OpModuleProcessed instructions.
  1482. // Otherwise, emit those as actual instructions.
  1483. std::string text;
  1484. const std::vector<std::string>& processes = glslangIntermediate->getProcesses();
  1485. for (int p = 0; p < (int)processes.size(); ++p) {
  1486. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1) {
  1487. text.append("// OpModuleProcessed ");
  1488. text.append(processes[p]);
  1489. text.append("\n");
  1490. } else
  1491. builder.addModuleProcessed(processes[p]);
  1492. }
  1493. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1 && (int)processes.size() > 0)
  1494. text.append("#line 1\n");
  1495. text.append(glslangIntermediate->getSourceText());
  1496. builder.setSourceText(text);
  1497. // Pass name and text for all included files
  1498. const std::map<std::string, std::string>& include_txt = glslangIntermediate->getIncludeText();
  1499. for (auto iItr = include_txt.begin(); iItr != include_txt.end(); ++iItr)
  1500. builder.addInclude(iItr->first, iItr->second);
  1501. }
  1502. builder.setUseReplicatedComposites(glslangIntermediate->usingReplicatedComposites());
  1503. stdBuiltins = builder.import("GLSL.std.450");
  1504. spv::AddressingModel addressingModel = spv::AddressingModel::Logical;
  1505. spv::MemoryModel memoryModel = spv::MemoryModel::GLSL450;
  1506. if (glslangIntermediate->usingPhysicalStorageBuffer()) {
  1507. addressingModel = spv::AddressingModel::PhysicalStorageBuffer64EXT;
  1508. builder.addIncorporatedExtension(spv::E_SPV_KHR_physical_storage_buffer, spv::Spv_1_5);
  1509. builder.addCapability(spv::Capability::PhysicalStorageBufferAddressesEXT);
  1510. }
  1511. if (glslangIntermediate->usingVulkanMemoryModel()) {
  1512. memoryModel = spv::MemoryModel::VulkanKHR;
  1513. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  1514. builder.addIncorporatedExtension(spv::E_SPV_KHR_vulkan_memory_model, spv::Spv_1_5);
  1515. }
  1516. builder.setMemoryModel(addressingModel, memoryModel);
  1517. if (glslangIntermediate->usingVariablePointers()) {
  1518. builder.addCapability(spv::Capability::VariablePointers);
  1519. }
  1520. // If not linking, there is no entry point
  1521. if (!options.compileOnly) {
  1522. shaderEntry = builder.makeEntryPoint(glslangIntermediate->getEntryPointName().c_str());
  1523. entryPoint =
  1524. builder.addEntryPoint(executionModel, shaderEntry, glslangIntermediate->getEntryPointName().c_str());
  1525. }
  1526. // Add the source extensions
  1527. const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();
  1528. for (auto it = sourceExtensions.begin(); it != sourceExtensions.end(); ++it)
  1529. builder.addSourceExtension(it->c_str());
  1530. // Add the top-level modes for this shader.
  1531. if (glslangIntermediate->getXfbMode()) {
  1532. builder.addCapability(spv::Capability::TransformFeedback);
  1533. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Xfb);
  1534. }
  1535. if (glslangIntermediate->getLayoutPrimitiveCulling()) {
  1536. builder.addCapability(spv::Capability::RayTraversalPrimitiveCullingKHR);
  1537. }
  1538. if (glslangIntermediate->getSubgroupUniformControlFlow()) {
  1539. builder.addExtension(spv::E_SPV_KHR_subgroup_uniform_control_flow);
  1540. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::SubgroupUniformControlFlowKHR);
  1541. }
  1542. if (glslangIntermediate->getMaximallyReconverges()) {
  1543. builder.addExtension(spv::E_SPV_KHR_maximal_reconvergence);
  1544. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::MaximallyReconvergesKHR);
  1545. }
  1546. if (glslangIntermediate->getQuadDerivMode())
  1547. {
  1548. builder.addCapability(spv::Capability::QuadControlKHR);
  1549. builder.addExtension(spv::E_SPV_KHR_quad_control);
  1550. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::QuadDerivativesKHR);
  1551. }
  1552. if (glslangIntermediate->getReqFullQuadsMode())
  1553. {
  1554. builder.addCapability(spv::Capability::QuadControlKHR);
  1555. builder.addExtension(spv::E_SPV_KHR_quad_control);
  1556. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::RequireFullQuadsKHR);
  1557. }
  1558. if (glslangIntermediate->usingShader64BitIndexing())
  1559. {
  1560. builder.addCapability(spv::Capability::Shader64BitIndexingEXT);
  1561. builder.addExtension(spv::E_SPV_EXT_shader_64bit_indexing);
  1562. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Shader64BitIndexingEXT);
  1563. }
  1564. spv::ExecutionMode mode;
  1565. switch (glslangIntermediate->getStage()) {
  1566. case EShLangVertex:
  1567. builder.addCapability(spv::Capability::Shader);
  1568. break;
  1569. case EShLangFragment:
  1570. builder.addCapability(spv::Capability::Shader);
  1571. if (glslangIntermediate->getPixelCenterInteger())
  1572. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PixelCenterInteger);
  1573. if (glslangIntermediate->getOriginUpperLeft())
  1574. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OriginUpperLeft);
  1575. else
  1576. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OriginLowerLeft);
  1577. if (glslangIntermediate->getEarlyFragmentTests())
  1578. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::EarlyFragmentTests);
  1579. if (glslangIntermediate->getEarlyAndLateFragmentTestsAMD())
  1580. {
  1581. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::EarlyAndLateFragmentTestsAMD);
  1582. builder.addExtension(spv::E_SPV_AMD_shader_early_and_late_fragment_tests);
  1583. }
  1584. if (glslangIntermediate->getPostDepthCoverage()) {
  1585. builder.addCapability(spv::Capability::SampleMaskPostDepthCoverage);
  1586. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PostDepthCoverage);
  1587. builder.addExtension(spv::E_SPV_KHR_post_depth_coverage);
  1588. }
  1589. if (glslangIntermediate->getNonCoherentColorAttachmentReadEXT()) {
  1590. builder.addCapability(spv::Capability::TileImageColorReadAccessEXT);
  1591. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentColorAttachmentReadEXT);
  1592. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1593. }
  1594. if (glslangIntermediate->getNonCoherentDepthAttachmentReadEXT()) {
  1595. builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
  1596. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentDepthAttachmentReadEXT);
  1597. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1598. }
  1599. if (glslangIntermediate->getNonCoherentStencilAttachmentReadEXT()) {
  1600. builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
  1601. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentStencilAttachmentReadEXT);
  1602. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1603. }
  1604. if (glslangIntermediate->getNonCoherentTileAttachmentReadQCOM()) {
  1605. builder.addCapability(spv::Capability::TileShadingQCOM);
  1606. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentTileAttachmentReadQCOM);
  1607. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1608. }
  1609. if (glslangIntermediate->isDepthReplacing())
  1610. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DepthReplacing);
  1611. if (glslangIntermediate->isStencilReplacing())
  1612. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::StencilRefReplacingEXT);
  1613. switch(glslangIntermediate->getDepth()) {
  1614. case glslang::EldGreater: mode = spv::ExecutionMode::DepthGreater; break;
  1615. case glslang::EldLess: mode = spv::ExecutionMode::DepthLess; break;
  1616. case glslang::EldUnchanged: mode = spv::ExecutionMode::DepthUnchanged; break;
  1617. default: mode = spv::ExecutionMode::Max; break;
  1618. }
  1619. if (mode != spv::ExecutionMode::Max)
  1620. builder.addExecutionMode(shaderEntry, mode);
  1621. switch (glslangIntermediate->getStencil()) {
  1622. case glslang::ElsRefUnchangedFrontAMD: mode = spv::ExecutionMode::StencilRefUnchangedFrontAMD; break;
  1623. case glslang::ElsRefGreaterFrontAMD: mode = spv::ExecutionMode::StencilRefGreaterFrontAMD; break;
  1624. case glslang::ElsRefLessFrontAMD: mode = spv::ExecutionMode::StencilRefLessFrontAMD; break;
  1625. case glslang::ElsRefUnchangedBackAMD: mode = spv::ExecutionMode::StencilRefUnchangedBackAMD; break;
  1626. case glslang::ElsRefGreaterBackAMD: mode = spv::ExecutionMode::StencilRefGreaterBackAMD; break;
  1627. case glslang::ElsRefLessBackAMD: mode = spv::ExecutionMode::StencilRefLessBackAMD; break;
  1628. default: mode = spv::ExecutionMode::Max; break;
  1629. }
  1630. if (mode != spv::ExecutionMode::Max)
  1631. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1632. switch (glslangIntermediate->getInterlockOrdering()) {
  1633. case glslang::EioPixelInterlockOrdered: mode = spv::ExecutionMode::PixelInterlockOrderedEXT;
  1634. break;
  1635. case glslang::EioPixelInterlockUnordered: mode = spv::ExecutionMode::PixelInterlockUnorderedEXT;
  1636. break;
  1637. case glslang::EioSampleInterlockOrdered: mode = spv::ExecutionMode::SampleInterlockOrderedEXT;
  1638. break;
  1639. case glslang::EioSampleInterlockUnordered: mode = spv::ExecutionMode::SampleInterlockUnorderedEXT;
  1640. break;
  1641. case glslang::EioShadingRateInterlockOrdered: mode = spv::ExecutionMode::ShadingRateInterlockOrderedEXT;
  1642. break;
  1643. case glslang::EioShadingRateInterlockUnordered: mode = spv::ExecutionMode::ShadingRateInterlockUnorderedEXT;
  1644. break;
  1645. default: mode = spv::ExecutionMode::Max;
  1646. break;
  1647. }
  1648. if (mode != spv::ExecutionMode::Max) {
  1649. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1650. if (mode == spv::ExecutionMode::ShadingRateInterlockOrderedEXT ||
  1651. mode == spv::ExecutionMode::ShadingRateInterlockUnorderedEXT) {
  1652. builder.addCapability(spv::Capability::FragmentShaderShadingRateInterlockEXT);
  1653. } else if (mode == spv::ExecutionMode::PixelInterlockOrderedEXT ||
  1654. mode == spv::ExecutionMode::PixelInterlockUnorderedEXT) {
  1655. builder.addCapability(spv::Capability::FragmentShaderPixelInterlockEXT);
  1656. } else {
  1657. builder.addCapability(spv::Capability::FragmentShaderSampleInterlockEXT);
  1658. }
  1659. builder.addExtension(spv::E_SPV_EXT_fragment_shader_interlock);
  1660. }
  1661. break;
  1662. case EShLangCompute: {
  1663. builder.addCapability(spv::Capability::Shader);
  1664. bool needSizeId = false;
  1665. for (int dim = 0; dim < 3; ++dim) {
  1666. if ((glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet)) {
  1667. needSizeId = true;
  1668. break;
  1669. }
  1670. }
  1671. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6 && needSizeId) {
  1672. std::vector<spv::Id> dimConstId;
  1673. for (int dim = 0; dim < 3; ++dim) {
  1674. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  1675. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  1676. if (specConst) {
  1677. builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
  1678. glslangIntermediate->getLocalSizeSpecId(dim));
  1679. needSizeId = true;
  1680. }
  1681. }
  1682. builder.addExecutionModeId(shaderEntry, spv::ExecutionMode::LocalSizeId, dimConstId);
  1683. } else {
  1684. if (glslangIntermediate->getTileShadingRateQCOM(0) >= 1 || glslangIntermediate->getTileShadingRateQCOM(1) >= 1 || glslangIntermediate->getTileShadingRateQCOM(2) >= 1) {
  1685. auto rate_x = glslangIntermediate->getTileShadingRateQCOM(0);
  1686. auto rate_y = glslangIntermediate->getTileShadingRateQCOM(1);
  1687. auto rate_z = glslangIntermediate->getTileShadingRateQCOM(2);
  1688. rate_x = ( rate_x == 0 ? 1 : rate_x );
  1689. rate_y = ( rate_y == 0 ? 1 : rate_y );
  1690. rate_z = ( rate_z == 0 ? 1 : rate_z );
  1691. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::TileShadingRateQCOM, rate_x, rate_y, rate_z);
  1692. } else {
  1693. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::LocalSize, glslangIntermediate->getLocalSize(0),
  1694. glslangIntermediate->getLocalSize(1),
  1695. glslangIntermediate->getLocalSize(2));
  1696. }
  1697. }
  1698. if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupQuads) {
  1699. builder.addCapability(spv::Capability::ComputeDerivativeGroupQuadsNV);
  1700. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DerivativeGroupQuadsNV);
  1701. builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);
  1702. } else if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupLinear) {
  1703. builder.addCapability(spv::Capability::ComputeDerivativeGroupLinearNV);
  1704. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DerivativeGroupLinearNV);
  1705. builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);
  1706. }
  1707. if (glslangIntermediate->getNonCoherentTileAttachmentReadQCOM()) {
  1708. builder.addCapability(spv::Capability::TileShadingQCOM);
  1709. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentTileAttachmentReadQCOM);
  1710. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1711. }
  1712. break;
  1713. }
  1714. case EShLangTessEvaluation:
  1715. case EShLangTessControl:
  1716. builder.addCapability(spv::Capability::Tessellation);
  1717. glslang::TLayoutGeometry primitive;
  1718. if (glslangIntermediate->getStage() == EShLangTessControl) {
  1719. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices,
  1720. glslangIntermediate->getVertices());
  1721. primitive = glslangIntermediate->getOutputPrimitive();
  1722. } else {
  1723. primitive = glslangIntermediate->getInputPrimitive();
  1724. }
  1725. switch (primitive) {
  1726. case glslang::ElgTriangles: mode = spv::ExecutionMode::Triangles; break;
  1727. case glslang::ElgQuads: mode = spv::ExecutionMode::Quads; break;
  1728. case glslang::ElgIsolines: mode = spv::ExecutionMode::Isolines; break;
  1729. default: mode = spv::ExecutionMode::Max; break;
  1730. }
  1731. if (mode != spv::ExecutionMode::Max)
  1732. builder.addExecutionMode(shaderEntry, mode);
  1733. switch (glslangIntermediate->getVertexSpacing()) {
  1734. case glslang::EvsEqual: mode = spv::ExecutionMode::SpacingEqual; break;
  1735. case glslang::EvsFractionalEven: mode = spv::ExecutionMode::SpacingFractionalEven; break;
  1736. case glslang::EvsFractionalOdd: mode = spv::ExecutionMode::SpacingFractionalOdd; break;
  1737. default: mode = spv::ExecutionMode::Max; break;
  1738. }
  1739. if (mode != spv::ExecutionMode::Max)
  1740. builder.addExecutionMode(shaderEntry, mode);
  1741. switch (glslangIntermediate->getVertexOrder()) {
  1742. case glslang::EvoCw: mode = spv::ExecutionMode::VertexOrderCw; break;
  1743. case glslang::EvoCcw: mode = spv::ExecutionMode::VertexOrderCcw; break;
  1744. default: mode = spv::ExecutionMode::Max; break;
  1745. }
  1746. if (mode != spv::ExecutionMode::Max)
  1747. builder.addExecutionMode(shaderEntry, mode);
  1748. if (glslangIntermediate->getPointMode())
  1749. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PointMode);
  1750. break;
  1751. case EShLangGeometry:
  1752. builder.addCapability(spv::Capability::Geometry);
  1753. switch (glslangIntermediate->getInputPrimitive()) {
  1754. case glslang::ElgPoints: mode = spv::ExecutionMode::InputPoints; break;
  1755. case glslang::ElgLines: mode = spv::ExecutionMode::InputLines; break;
  1756. case glslang::ElgLinesAdjacency: mode = spv::ExecutionMode::InputLinesAdjacency; break;
  1757. case glslang::ElgTriangles: mode = spv::ExecutionMode::Triangles; break;
  1758. case glslang::ElgTrianglesAdjacency: mode = spv::ExecutionMode::InputTrianglesAdjacency; break;
  1759. default: mode = spv::ExecutionMode::Max; break;
  1760. }
  1761. if (mode != spv::ExecutionMode::Max)
  1762. builder.addExecutionMode(shaderEntry, mode);
  1763. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Invocations, glslangIntermediate->getInvocations());
  1764. switch (glslangIntermediate->getOutputPrimitive()) {
  1765. case glslang::ElgPoints: mode = spv::ExecutionMode::OutputPoints; break;
  1766. case glslang::ElgLineStrip: mode = spv::ExecutionMode::OutputLineStrip; break;
  1767. case glslang::ElgTriangleStrip: mode = spv::ExecutionMode::OutputTriangleStrip; break;
  1768. default: mode = spv::ExecutionMode::Max; break;
  1769. }
  1770. if (mode != spv::ExecutionMode::Max)
  1771. builder.addExecutionMode(shaderEntry, mode);
  1772. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices, glslangIntermediate->getVertices());
  1773. break;
  1774. case EShLangRayGen:
  1775. case EShLangIntersect:
  1776. case EShLangAnyHit:
  1777. case EShLangClosestHit:
  1778. case EShLangMiss:
  1779. case EShLangCallable:
  1780. {
  1781. auto& extensions = glslangIntermediate->getRequestedExtensions();
  1782. if (extensions.find("GL_EXT_opacity_micromap") != extensions.end()) {
  1783. builder.addCapability(spv::Capability::RayTracingOpacityMicromapEXT);
  1784. builder.addExtension("SPV_EXT_opacity_micromap");
  1785. }
  1786. if (extensions.find("GL_NV_ray_tracing") == extensions.end()) {
  1787. builder.addCapability(spv::Capability::RayTracingKHR);
  1788. builder.addExtension("SPV_KHR_ray_tracing");
  1789. }
  1790. else {
  1791. builder.addCapability(spv::Capability::RayTracingNV);
  1792. builder.addExtension("SPV_NV_ray_tracing");
  1793. }
  1794. if (glslangIntermediate->getStage() != EShLangRayGen && glslangIntermediate->getStage() != EShLangCallable) {
  1795. if (extensions.find("GL_EXT_ray_cull_mask") != extensions.end()) {
  1796. builder.addCapability(spv::Capability::RayCullMaskKHR);
  1797. builder.addExtension("SPV_KHR_ray_cull_mask");
  1798. }
  1799. if (extensions.find("GL_EXT_ray_tracing_position_fetch") != extensions.end()) {
  1800. builder.addCapability(spv::Capability::RayTracingPositionFetchKHR);
  1801. builder.addExtension("SPV_KHR_ray_tracing_position_fetch");
  1802. }
  1803. }
  1804. break;
  1805. }
  1806. case EShLangTask:
  1807. case EShLangMesh:
  1808. if(isMeshShaderExt) {
  1809. builder.addCapability(spv::Capability::MeshShadingEXT);
  1810. builder.addExtension(spv::E_SPV_EXT_mesh_shader);
  1811. } else {
  1812. builder.addCapability(spv::Capability::MeshShadingNV);
  1813. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  1814. }
  1815. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  1816. std::vector<spv::Id> dimConstId;
  1817. for (int dim = 0; dim < 3; ++dim) {
  1818. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  1819. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  1820. if (specConst) {
  1821. builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
  1822. glslangIntermediate->getLocalSizeSpecId(dim));
  1823. }
  1824. }
  1825. builder.addExecutionModeId(shaderEntry, spv::ExecutionMode::LocalSizeId, dimConstId);
  1826. } else {
  1827. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::LocalSize, glslangIntermediate->getLocalSize(0),
  1828. glslangIntermediate->getLocalSize(1),
  1829. glslangIntermediate->getLocalSize(2));
  1830. }
  1831. if (glslangIntermediate->getStage() == EShLangMesh) {
  1832. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices,
  1833. glslangIntermediate->getVertices());
  1834. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputPrimitivesNV,
  1835. glslangIntermediate->getPrimitives());
  1836. switch (glslangIntermediate->getOutputPrimitive()) {
  1837. case glslang::ElgPoints: mode = spv::ExecutionMode::OutputPoints; break;
  1838. case glslang::ElgLines: mode = spv::ExecutionMode::OutputLinesNV; break;
  1839. case glslang::ElgTriangles: mode = spv::ExecutionMode::OutputTrianglesNV; break;
  1840. default: mode = spv::ExecutionMode::Max; break;
  1841. }
  1842. if (mode != spv::ExecutionMode::Max)
  1843. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1844. }
  1845. break;
  1846. default:
  1847. break;
  1848. }
  1849. //
  1850. // Add SPIR-V requirements (GL_EXT_spirv_intrinsics)
  1851. //
  1852. if (glslangIntermediate->hasSpirvRequirement()) {
  1853. const glslang::TSpirvRequirement& spirvRequirement = glslangIntermediate->getSpirvRequirement();
  1854. // Add SPIR-V extension requirement
  1855. for (auto& extension : spirvRequirement.extensions)
  1856. builder.addExtension(extension.c_str());
  1857. // Add SPIR-V capability requirement
  1858. for (auto capability : spirvRequirement.capabilities)
  1859. builder.addCapability(static_cast<spv::Capability>(capability));
  1860. }
  1861. //
  1862. // Add SPIR-V execution mode qualifiers (GL_EXT_spirv_intrinsics)
  1863. //
  1864. if (glslangIntermediate->hasSpirvExecutionMode()) {
  1865. const glslang::TSpirvExecutionMode spirvExecutionMode = glslangIntermediate->getSpirvExecutionMode();
  1866. // Add spirv_execution_mode
  1867. for (auto& mode : spirvExecutionMode.modes) {
  1868. if (!mode.second.empty()) {
  1869. std::vector<unsigned> literals;
  1870. TranslateLiterals(mode.second, literals);
  1871. builder.addExecutionMode(shaderEntry, static_cast<spv::ExecutionMode>(mode.first), literals);
  1872. } else
  1873. builder.addExecutionMode(shaderEntry, static_cast<spv::ExecutionMode>(mode.first));
  1874. }
  1875. // Add spirv_execution_mode_id
  1876. for (auto& modeId : spirvExecutionMode.modeIds) {
  1877. std::vector<spv::Id> operandIds;
  1878. assert(!modeId.second.empty());
  1879. for (auto extraOperand : modeId.second) {
  1880. if (extraOperand->getType().getQualifier().isSpecConstant())
  1881. operandIds.push_back(getSymbolId(extraOperand->getAsSymbolNode()));
  1882. else
  1883. operandIds.push_back(createSpvConstant(*extraOperand));
  1884. }
  1885. builder.addExecutionModeId(shaderEntry, static_cast<spv::ExecutionMode>(modeId.first), operandIds);
  1886. }
  1887. }
  1888. }
  1889. // Finish creating SPV, after the traversal is complete.
  1890. void TGlslangToSpvTraverser::finishSpv(bool compileOnly)
  1891. {
  1892. // If not linking, an entry point is not expected
  1893. if (!compileOnly) {
  1894. // Finish the entry point function
  1895. if (!entryPointTerminated) {
  1896. builder.setBuildPoint(shaderEntry->getLastBlock());
  1897. builder.leaveFunction();
  1898. }
  1899. // finish off the entry-point SPV instruction by adding the Input/Output <id>
  1900. entryPoint->reserveOperands(iOSet.size());
  1901. for (auto id : iOSet)
  1902. entryPoint->addIdOperand(id);
  1903. }
  1904. // Add capabilities, extensions, remove unneeded decorations, etc.,
  1905. // based on the resulting SPIR-V.
  1906. // Note: WebGPU code generation must have the opportunity to aggressively
  1907. // prune unreachable merge blocks and continue targets.
  1908. builder.postProcess(compileOnly);
  1909. }
  1910. // Write the SPV into 'out'.
  1911. void TGlslangToSpvTraverser::dumpSpv(std::vector<unsigned int>& out)
  1912. {
  1913. builder.dump(out);
  1914. }
  1915. //
  1916. // Implement the traversal functions.
  1917. //
  1918. // Return true from interior nodes to have the external traversal
  1919. // continue on to children. Return false if children were
  1920. // already processed.
  1921. //
  1922. //
  1923. // Symbols can turn into
  1924. // - uniform/input reads
  1925. // - output writes
  1926. // - complex lvalue base setups: foo.bar[3].... , where we see foo and start up an access chain
  1927. // - something simple that degenerates into the last bullet
  1928. //
  1929. void TGlslangToSpvTraverser::visitSymbol(glslang::TIntermSymbol* symbol)
  1930. {
  1931. // We update the line information even though no code might be generated here
  1932. // This is helpful to yield correct lines for control flow instructions
  1933. if (!linkageOnly) {
  1934. builder.setDebugSourceLocation(symbol->getLoc().line, symbol->getLoc().getFilename());
  1935. }
  1936. if (symbol->getBasicType() == glslang::EbtFunction) {
  1937. return;
  1938. }
  1939. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  1940. if (symbol->getType().isStruct())
  1941. glslangTypeToIdMap[symbol->getType().getStruct()] = symbol->getId();
  1942. if (symbol->getType().getQualifier().isSpecConstant())
  1943. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  1944. #ifdef ENABLE_HLSL
  1945. // Skip symbol handling if it is string-typed
  1946. if (symbol->getBasicType() == glslang::EbtString)
  1947. return;
  1948. #endif
  1949. // getSymbolId() will set up all the IO decorations on the first call.
  1950. // Formal function parameters were mapped during makeFunctions().
  1951. spv::Id id = getSymbolId(symbol);
  1952. if (symbol->getType().getQualifier().isTaskPayload())
  1953. taskPayloadID = id; // cache the taskPayloadID to be used it as operand for OpEmitMeshTasksEXT
  1954. if (builder.isPointer(id)) {
  1955. if (!symbol->getType().getQualifier().isParamInput() &&
  1956. !symbol->getType().getQualifier().isParamOutput()) {
  1957. // Include all "static use" and "linkage only" interface variables on the OpEntryPoint instruction
  1958. // Consider adding to the OpEntryPoint interface list.
  1959. // Only looking at structures if they have at least one member.
  1960. if (!symbol->getType().isStruct() || symbol->getType().getStruct()->size() > 0) {
  1961. spv::StorageClass sc = builder.getStorageClass(id);
  1962. // Before SPIR-V 1.4, we only want to include Input and Output.
  1963. // Starting with SPIR-V 1.4, we want all globals.
  1964. if ((glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4 && builder.isGlobalVariable(id)) ||
  1965. (sc == spv::StorageClass::Input || sc == spv::StorageClass::Output)) {
  1966. iOSet.insert(id);
  1967. }
  1968. }
  1969. }
  1970. // If the SPIR-V type is required to be different than the AST type
  1971. // (for ex SubgroupMasks or 3x4 ObjectToWorld/WorldToObject matrices),
  1972. // translate now from the SPIR-V type to the AST type, for the consuming
  1973. // operation.
  1974. // Note this turns it from an l-value to an r-value.
  1975. // Currently, all symbols needing this are inputs; avoid the map lookup when non-input.
  1976. if (symbol->getType().getQualifier().storage == glslang::EvqVaryingIn)
  1977. id = translateForcedType(id);
  1978. }
  1979. // Only process non-linkage-only nodes for generating actual static uses
  1980. if (! linkageOnly || symbol->getQualifier().isSpecConstant()) {
  1981. // Prepare to generate code for the access
  1982. // L-value chains will be computed left to right. We're on the symbol now,
  1983. // which is the left-most part of the access chain, so now is "clear" time,
  1984. // followed by setting the base.
  1985. builder.clearAccessChain();
  1986. // For now, we consider all user variables as being in memory, so they are pointers,
  1987. // except for
  1988. // A) R-Value arguments to a function, which are an intermediate object.
  1989. // See comments in handleUserFunctionCall().
  1990. // B) Specialization constants (normal constants don't even come in as a variable),
  1991. // These are also pure R-values.
  1992. // C) R-Values from type translation, see above call to translateForcedType()
  1993. glslang::TQualifier qualifier = symbol->getQualifier();
  1994. if (qualifier.isSpecConstant() || rValueParameters.find(symbol->getId()) != rValueParameters.end() ||
  1995. !builder.isPointerType(builder.getTypeId(id)))
  1996. builder.setAccessChainRValue(id);
  1997. else
  1998. builder.setAccessChainLValue(id);
  1999. }
  2000. #ifdef ENABLE_HLSL
  2001. // Process linkage-only nodes for any special additional interface work.
  2002. if (linkageOnly) {
  2003. if (glslangIntermediate->getHlslFunctionality1()) {
  2004. // Map implicit counter buffers to their originating buffers, which should have been
  2005. // seen by now, given earlier pruning of unused counters, and preservation of order
  2006. // of declaration.
  2007. if (symbol->getType().getQualifier().isUniformOrBuffer()) {
  2008. if (!glslangIntermediate->hasCounterBufferName(symbol->getName())) {
  2009. // Save possible originating buffers for counter buffers, keyed by
  2010. // making the potential counter-buffer name.
  2011. std::string keyName = symbol->getName().c_str();
  2012. keyName = glslangIntermediate->addCounterBufferName(keyName);
  2013. counterOriginator[keyName] = symbol;
  2014. } else {
  2015. // Handle a counter buffer, by finding the saved originating buffer.
  2016. std::string keyName = symbol->getName().c_str();
  2017. auto it = counterOriginator.find(keyName);
  2018. if (it != counterOriginator.end()) {
  2019. id = getSymbolId(it->second);
  2020. if (id != spv::NoResult) {
  2021. spv::Id counterId = getSymbolId(symbol);
  2022. if (counterId != spv::NoResult) {
  2023. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  2024. builder.addDecorationId(id, spv::Decoration::HlslCounterBufferGOOGLE, counterId);
  2025. }
  2026. }
  2027. }
  2028. }
  2029. }
  2030. }
  2031. }
  2032. #endif
  2033. }
  2034. bool TGlslangToSpvTraverser::visitBinary(glslang::TVisit /* visit */, glslang::TIntermBinary* node)
  2035. {
  2036. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2037. if (node->getLeft()->getAsSymbolNode() != nullptr && node->getLeft()->getType().isStruct()) {
  2038. glslangTypeToIdMap[node->getLeft()->getType().getStruct()] = node->getLeft()->getAsSymbolNode()->getId();
  2039. }
  2040. if (node->getRight()->getAsSymbolNode() != nullptr && node->getRight()->getType().isStruct()) {
  2041. glslangTypeToIdMap[node->getRight()->getType().getStruct()] = node->getRight()->getAsSymbolNode()->getId();
  2042. }
  2043. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2044. if (node->getType().getQualifier().isSpecConstant())
  2045. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2046. // First, handle special cases
  2047. switch (node->getOp()) {
  2048. case glslang::EOpAssign:
  2049. case glslang::EOpAddAssign:
  2050. case glslang::EOpSubAssign:
  2051. case glslang::EOpMulAssign:
  2052. case glslang::EOpVectorTimesMatrixAssign:
  2053. case glslang::EOpVectorTimesScalarAssign:
  2054. case glslang::EOpMatrixTimesScalarAssign:
  2055. case glslang::EOpMatrixTimesMatrixAssign:
  2056. case glslang::EOpDivAssign:
  2057. case glslang::EOpModAssign:
  2058. case glslang::EOpAndAssign:
  2059. case glslang::EOpInclusiveOrAssign:
  2060. case glslang::EOpExclusiveOrAssign:
  2061. case glslang::EOpLeftShiftAssign:
  2062. case glslang::EOpRightShiftAssign:
  2063. // A bin-op assign "a += b" means the same thing as "a = a + b"
  2064. // where a is evaluated before b. For a simple assignment, GLSL
  2065. // says to evaluate the left before the right. So, always, left
  2066. // node then right node.
  2067. {
  2068. // get the left l-value, save it away
  2069. builder.clearAccessChain();
  2070. node->getLeft()->traverse(this);
  2071. spv::Builder::AccessChain lValue = builder.getAccessChain();
  2072. // evaluate the right
  2073. builder.clearAccessChain();
  2074. node->getRight()->traverse(this);
  2075. spv::Id rValue = accessChainLoad(node->getRight()->getType());
  2076. // reset line number for assignment
  2077. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2078. if (node->getOp() != glslang::EOpAssign) {
  2079. // the left is also an r-value
  2080. builder.setAccessChain(lValue);
  2081. spv::Id leftRValue = accessChainLoad(node->getLeft()->getType());
  2082. // do the operation
  2083. spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(node->getLeft()->getType());
  2084. coherentFlags |= TranslateCoherent(node->getRight()->getType());
  2085. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2086. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2087. TranslateNonUniformDecoration(coherentFlags) };
  2088. rValue = createBinaryOperation(node->getOp(), decorations,
  2089. convertGlslangToSpvType(node->getType()), leftRValue, rValue,
  2090. node->getType().getBasicType());
  2091. // these all need their counterparts in createBinaryOperation()
  2092. assert(rValue != spv::NoResult);
  2093. }
  2094. // store the result
  2095. builder.setAccessChain(lValue);
  2096. multiTypeStore(node->getLeft()->getType(), rValue);
  2097. // assignments are expressions having an rValue after they are evaluated...
  2098. builder.clearAccessChain();
  2099. builder.setAccessChainRValue(rValue);
  2100. }
  2101. return false;
  2102. case glslang::EOpIndexDirect:
  2103. case glslang::EOpIndexDirectStruct:
  2104. {
  2105. // Structure, array, matrix, or vector indirection with statically known index.
  2106. // Get the left part of the access chain.
  2107. node->getLeft()->traverse(this);
  2108. // Add the next element in the chain
  2109. const int glslangIndex = node->getRight()->getAsConstantUnion()->getConstArray()[0].getIConst();
  2110. if (! node->getLeft()->getType().isArray() &&
  2111. node->getLeft()->getType().isVector() &&
  2112. node->getOp() == glslang::EOpIndexDirect) {
  2113. // Swizzle is uniform so propagate uniform into access chain
  2114. spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(node->getLeft()->getType());
  2115. coherentFlags.nonUniform = 0;
  2116. // This is essentially a hard-coded vector swizzle of size 1,
  2117. // so short circuit the access-chain stuff with a swizzle.
  2118. std::vector<unsigned> swizzle;
  2119. swizzle.push_back(glslangIndex);
  2120. int dummySize;
  2121. builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(node->getLeft()->getType()),
  2122. coherentFlags,
  2123. glslangIntermediate->getBaseAlignmentScalar(
  2124. node->getLeft()->getType(), dummySize));
  2125. } else {
  2126. // Load through a block reference is performed with a dot operator that
  2127. // is mapped to EOpIndexDirectStruct. When we get to the actual reference,
  2128. // do a load and reset the access chain.
  2129. if (node->getLeft()->isReference() &&
  2130. !node->getLeft()->getType().isArray() &&
  2131. node->getOp() == glslang::EOpIndexDirectStruct)
  2132. {
  2133. spv::Id left = accessChainLoad(node->getLeft()->getType());
  2134. builder.clearAccessChain();
  2135. builder.setAccessChainLValue(left);
  2136. }
  2137. int spvIndex = glslangIndex;
  2138. if (node->getLeft()->getBasicType() == glslang::EbtBlock &&
  2139. node->getOp() == glslang::EOpIndexDirectStruct)
  2140. {
  2141. // This may be, e.g., an anonymous block-member selection, which generally need
  2142. // index remapping due to hidden members in anonymous blocks.
  2143. long long glslangId = glslangTypeToIdMap[node->getLeft()->getType().getStruct()];
  2144. if (memberRemapper.find(glslangId) != memberRemapper.end()) {
  2145. std::vector<int>& remapper = memberRemapper[glslangId];
  2146. assert(remapper.size() > 0);
  2147. spvIndex = remapper[glslangIndex];
  2148. }
  2149. }
  2150. // Struct reference propagates uniform lvalue
  2151. spv::Builder::AccessChain::CoherentFlags coherentFlags =
  2152. TranslateCoherent(node->getLeft()->getType());
  2153. coherentFlags.nonUniform = 0;
  2154. // normal case for indexing array or structure or block
  2155. if ((node->getRight()->getType().getBasicType() == glslang::EbtUint && glslangIntermediate->usingPromoteUint32Indices()) ||
  2156. node->getRight()->getType().contains64BitInt()) {
  2157. int64_t idx = node->getRight()->getType().contains64BitInt() ?
  2158. node->getRight()->getAsConstantUnion()->getConstArray()[0].getI64Const() :
  2159. node->getRight()->getAsConstantUnion()->getConstArray()[0].getUConst();
  2160. builder.accessChainPush(builder.makeInt64Constant(idx),
  2161. coherentFlags,
  2162. node->getLeft()->getType().getBufferReferenceAlignment());
  2163. } else {
  2164. builder.accessChainPush(builder.makeIntConstant(spvIndex),
  2165. coherentFlags,
  2166. node->getLeft()->getType().getBufferReferenceAlignment());
  2167. }
  2168. // Add capabilities here for accessing PointSize and clip/cull distance.
  2169. // We have deferred generation of associated capabilities until now.
  2170. if (node->getLeft()->getType().isStruct() && ! node->getLeft()->getType().isArray())
  2171. declareUseOfStructMember(*(node->getLeft()->getType().getStruct()), glslangIndex);
  2172. }
  2173. }
  2174. return false;
  2175. case glslang::EOpIndexIndirect:
  2176. {
  2177. // Array, matrix, or vector indirection with variable index.
  2178. // Will use native SPIR-V access-chain for and array indirection;
  2179. // matrices are arrays of vectors, so will also work for a matrix.
  2180. // Will use the access chain's 'component' for variable index into a vector.
  2181. // This adapter is building access chains left to right.
  2182. // Set up the access chain to the left.
  2183. node->getLeft()->traverse(this);
  2184. // save it so that computing the right side doesn't trash it
  2185. spv::Builder::AccessChain partial = builder.getAccessChain();
  2186. // compute the next index in the chain
  2187. builder.clearAccessChain();
  2188. node->getRight()->traverse(this);
  2189. spv::Id index = accessChainLoad(node->getRight()->getType());
  2190. // Zero-extend smaller unsigned integer types for array indexing.
  2191. // SPIR-V OpAccessChain treats indices as signed, so we need to zero-extend
  2192. // unsigned types to preserve their values (signed types are fine as-is).
  2193. spv::Id indexType = builder.getTypeId(index);
  2194. if (builder.isUintType(indexType) && builder.getScalarTypeWidth(indexType) < 32) {
  2195. // Zero-extend unsigned types to preserve their values
  2196. spv::Id uintType = builder.makeUintType(32);
  2197. index = builder.createUnaryOp(spv::Op::OpUConvert, uintType, index);
  2198. }
  2199. addIndirectionIndexCapabilities(node->getLeft()->getType(), node->getRight()->getType());
  2200. // restore the saved access chain
  2201. builder.setAccessChain(partial);
  2202. // Only if index is nonUniform should we propagate nonUniform into access chain
  2203. spv::Builder::AccessChain::CoherentFlags index_flags = TranslateCoherent(node->getRight()->getType());
  2204. spv::Builder::AccessChain::CoherentFlags coherent_flags = TranslateCoherent(node->getLeft()->getType());
  2205. coherent_flags.nonUniform = index_flags.nonUniform;
  2206. if (! node->getLeft()->getType().isArray() && node->getLeft()->getType().isVector()) {
  2207. int dummySize;
  2208. builder.accessChainPushComponent(
  2209. index, convertGlslangToSpvType(node->getLeft()->getType()), coherent_flags,
  2210. glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(),
  2211. dummySize));
  2212. } else {
  2213. if (glslangIntermediate->usingPromoteUint32Indices() &&
  2214. node->getRight()->getType().getBasicType() == glslang::EbtUint) {
  2215. index = createIntWidthConversion(index, 0, builder.makeIntegerType(64, true), glslang::EbtInt64, node->getRight()->getType().getBasicType());
  2216. }
  2217. builder.accessChainPush(index, coherent_flags,
  2218. node->getLeft()->getType().getBufferReferenceAlignment());
  2219. }
  2220. }
  2221. return false;
  2222. case glslang::EOpVectorSwizzle:
  2223. {
  2224. node->getLeft()->traverse(this);
  2225. std::vector<unsigned> swizzle;
  2226. convertSwizzle(*node->getRight()->getAsAggregate(), swizzle);
  2227. int dummySize;
  2228. builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(node->getLeft()->getType()),
  2229. TranslateCoherent(node->getLeft()->getType()),
  2230. glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(),
  2231. dummySize));
  2232. }
  2233. return false;
  2234. case glslang::EOpMatrixSwizzle:
  2235. logger->missingFunctionality("matrix swizzle");
  2236. return true;
  2237. case glslang::EOpLogicalOr:
  2238. case glslang::EOpLogicalAnd:
  2239. {
  2240. // These may require short circuiting, but can sometimes be done as straight
  2241. // binary operations. The right operand must be short circuited if it has
  2242. // side effects, and should probably be if it is complex.
  2243. if (isTrivial(node->getRight()->getAsTyped()))
  2244. break; // handle below as a normal binary operation
  2245. // otherwise, we need to do dynamic short circuiting on the right operand
  2246. spv::Id result = createShortCircuit(node->getOp(), *node->getLeft()->getAsTyped(),
  2247. *node->getRight()->getAsTyped());
  2248. builder.clearAccessChain();
  2249. builder.setAccessChainRValue(result);
  2250. }
  2251. return false;
  2252. default:
  2253. break;
  2254. }
  2255. // Assume generic binary op...
  2256. // get right operand
  2257. builder.clearAccessChain();
  2258. node->getLeft()->traverse(this);
  2259. spv::Id left = accessChainLoad(node->getLeft()->getType());
  2260. // get left operand
  2261. builder.clearAccessChain();
  2262. node->getRight()->traverse(this);
  2263. spv::Id right = accessChainLoad(node->getRight()->getType());
  2264. // get result
  2265. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2266. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2267. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  2268. spv::Id result = createBinaryOperation(node->getOp(), decorations,
  2269. convertGlslangToSpvType(node->getType()), left, right,
  2270. node->getLeft()->getType().getBasicType());
  2271. builder.clearAccessChain();
  2272. if (! result) {
  2273. logger->missingFunctionality("unknown glslang binary operation");
  2274. return true; // pick up a child as the place-holder result
  2275. } else {
  2276. builder.setAccessChainRValue(result);
  2277. return false;
  2278. }
  2279. }
  2280. spv::Id TGlslangToSpvTraverser::convertLoadedBoolInUniformToUint(const glslang::TType& type,
  2281. spv::Id nominalTypeId,
  2282. spv::Id loadedId)
  2283. {
  2284. if (builder.isScalarType(nominalTypeId)) {
  2285. // Conversion for bool
  2286. spv::Id boolType = builder.makeBoolType();
  2287. if (nominalTypeId != boolType)
  2288. return builder.createBinOp(spv::Op::OpINotEqual, boolType, loadedId, builder.makeUintConstant(0));
  2289. } else if (builder.isVectorType(nominalTypeId)) {
  2290. // Conversion for bvec
  2291. int vecSize = builder.getNumTypeComponents(nominalTypeId);
  2292. spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);
  2293. if (nominalTypeId != bvecType)
  2294. loadedId = builder.createBinOp(spv::Op::OpINotEqual, bvecType, loadedId,
  2295. makeSmearedConstant(builder.makeUintConstant(0), vecSize));
  2296. } else if (builder.isArrayType(nominalTypeId)) {
  2297. // Conversion for bool array
  2298. spv::Id boolArrayTypeId = convertGlslangToSpvType(type);
  2299. if (nominalTypeId != boolArrayTypeId)
  2300. {
  2301. // Use OpCopyLogical from SPIR-V 1.4 if available.
  2302. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4)
  2303. return builder.createUnaryOp(spv::Op::OpCopyLogical, boolArrayTypeId, loadedId);
  2304. glslang::TType glslangElementType(type, 0);
  2305. spv::Id elementNominalTypeId = builder.getContainedTypeId(nominalTypeId);
  2306. std::vector<spv::Id> constituents;
  2307. for (int index = 0; index < type.getOuterArraySize(); ++index) {
  2308. // get the element
  2309. spv::Id elementValue = builder.createCompositeExtract(loadedId, elementNominalTypeId, index);
  2310. // recursively convert it
  2311. spv::Id elementConvertedValue = convertLoadedBoolInUniformToUint(glslangElementType, elementNominalTypeId, elementValue);
  2312. constituents.push_back(elementConvertedValue);
  2313. }
  2314. return builder.createCompositeConstruct(boolArrayTypeId, constituents);
  2315. }
  2316. }
  2317. return loadedId;
  2318. }
  2319. // Figure out what, if any, type changes are needed when accessing a specific built-in.
  2320. // Returns <the type SPIR-V requires for declarion, the type to translate to on use>.
  2321. // Also see comment for 'forceType', regarding tracking SPIR-V-required types.
  2322. std::pair<spv::Id, spv::Id> TGlslangToSpvTraverser::getForcedType(glslang::TBuiltInVariable glslangBuiltIn,
  2323. const glslang::TType& glslangType)
  2324. {
  2325. switch(glslangBuiltIn)
  2326. {
  2327. case glslang::EbvSubGroupEqMask:
  2328. case glslang::EbvSubGroupGeMask:
  2329. case glslang::EbvSubGroupGtMask:
  2330. case glslang::EbvSubGroupLeMask:
  2331. case glslang::EbvSubGroupLtMask: {
  2332. // these require changing a 64-bit scaler -> a vector of 32-bit components
  2333. if (glslangType.isVector())
  2334. break;
  2335. spv::Id ivec4_type = builder.makeVectorType(builder.makeUintType(32), 4);
  2336. spv::Id uint64_type = builder.makeUintType(64);
  2337. std::pair<spv::Id, spv::Id> ret(ivec4_type, uint64_type);
  2338. return ret;
  2339. }
  2340. // There are no SPIR-V builtins defined for these and map onto original non-transposed
  2341. // builtins. During visitBinary we insert a transpose
  2342. case glslang::EbvWorldToObject3x4:
  2343. case glslang::EbvObjectToWorld3x4: {
  2344. spv::Id mat43 = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  2345. spv::Id mat34 = builder.makeMatrixType(builder.makeFloatType(32), 3, 4);
  2346. std::pair<spv::Id, spv::Id> ret(mat43, mat34);
  2347. return ret;
  2348. }
  2349. default:
  2350. break;
  2351. }
  2352. std::pair<spv::Id, spv::Id> ret(spv::NoType, spv::NoType);
  2353. return ret;
  2354. }
  2355. // For an object previously identified (see getForcedType() and forceType)
  2356. // as needing type translations, do the translation needed for a load, turning
  2357. // an L-value into in R-value.
  2358. spv::Id TGlslangToSpvTraverser::translateForcedType(spv::Id object)
  2359. {
  2360. const auto forceIt = forceType.find(object);
  2361. if (forceIt == forceType.end())
  2362. return object;
  2363. spv::Id desiredTypeId = forceIt->second;
  2364. spv::Id objectTypeId = builder.getTypeId(object);
  2365. assert(builder.isPointerType(objectTypeId));
  2366. objectTypeId = builder.getContainedTypeId(objectTypeId);
  2367. if (builder.isVectorType(objectTypeId) &&
  2368. builder.getScalarTypeWidth(builder.getContainedTypeId(objectTypeId)) == 32) {
  2369. if (builder.getScalarTypeWidth(desiredTypeId) == 64) {
  2370. // handle 32-bit v.xy* -> 64-bit
  2371. builder.clearAccessChain();
  2372. builder.setAccessChainLValue(object);
  2373. object = builder.accessChainLoad(spv::NoPrecision, spv::Decoration::Max, spv::Decoration::Max, objectTypeId);
  2374. std::vector<spv::Id> components;
  2375. components.push_back(builder.createCompositeExtract(object, builder.getContainedTypeId(objectTypeId), 0));
  2376. components.push_back(builder.createCompositeExtract(object, builder.getContainedTypeId(objectTypeId), 1));
  2377. spv::Id vecType = builder.makeVectorType(builder.getContainedTypeId(objectTypeId), 2);
  2378. return builder.createUnaryOp(spv::Op::OpBitcast, desiredTypeId,
  2379. builder.createCompositeConstruct(vecType, components));
  2380. } else {
  2381. logger->missingFunctionality("forcing 32-bit vector type to non 64-bit scalar");
  2382. }
  2383. } else if (builder.isMatrixType(objectTypeId)) {
  2384. // There are no SPIR-V builtins defined for 3x4 variants of ObjectToWorld/WorldToObject
  2385. // and we insert a transpose after loading the original non-transposed builtins
  2386. builder.clearAccessChain();
  2387. builder.setAccessChainLValue(object);
  2388. object = builder.accessChainLoad(spv::NoPrecision, spv::Decoration::Max, spv::Decoration::Max, objectTypeId);
  2389. return builder.createUnaryOp(spv::Op::OpTranspose, desiredTypeId, object);
  2390. } else {
  2391. logger->missingFunctionality("forcing non 32-bit vector type");
  2392. }
  2393. return object;
  2394. }
  2395. bool TGlslangToSpvTraverser::visitUnary(glslang::TVisit /* visit */, glslang::TIntermUnary* node)
  2396. {
  2397. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2398. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2399. if (node->getType().getQualifier().isSpecConstant())
  2400. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2401. spv::Id result = spv::NoResult;
  2402. // try texturing first
  2403. result = createImageTextureFunctionCall(node);
  2404. if (result != spv::NoResult) {
  2405. builder.clearAccessChain();
  2406. builder.setAccessChainRValue(result);
  2407. return false; // done with this node
  2408. }
  2409. // Non-texturing.
  2410. if (node->getOp() == glslang::EOpArrayLength) {
  2411. // Quite special; won't want to evaluate the operand.
  2412. // Currently, the front-end does not allow .length() on an array until it is sized,
  2413. // except for the last block membeor of an SSBO.
  2414. // TODO: If this changes, link-time sized arrays might show up here, and need their
  2415. // size extracted.
  2416. // Normal .length() would have been constant folded by the front-end.
  2417. // So, this has to be block.lastMember.length().
  2418. // SPV wants "block" and member number as the operands, go get them.
  2419. uint32_t bits = node->getType().contains64BitInt() ? 64 : 32;
  2420. spv::Id length;
  2421. if (node->getOperand()->getType().isCoopMat()) {
  2422. spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());
  2423. assert(builder.isCooperativeMatrixType(typeId));
  2424. if (node->getOperand()->getType().isCoopMatKHR()) {
  2425. length = builder.createCooperativeMatrixLengthKHR(typeId);
  2426. } else {
  2427. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2428. length = builder.createCooperativeMatrixLengthNV(typeId);
  2429. }
  2430. } else if (node->getOperand()->getType().isCoopVecNV()) {
  2431. spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());
  2432. length = builder.getCooperativeVectorNumComponents(typeId);
  2433. } else {
  2434. glslang::TIntermTyped* block = node->getOperand()->getAsBinaryNode()->getLeft();
  2435. block->traverse(this);
  2436. unsigned int member = node->getOperand()->getAsBinaryNode()->getRight()->getAsConstantUnion()
  2437. ->getConstArray()[0].getUConst();
  2438. length = builder.createArrayLength(builder.accessChainGetLValue(), member, bits);
  2439. }
  2440. // GLSL semantics say the result of .length() is an int, while SPIR-V says
  2441. // signedness must be 0. So, convert from SPIR-V unsigned back to GLSL's
  2442. // AST expectation of a signed result.
  2443. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
  2444. if (builder.isInSpecConstCodeGenMode()) {
  2445. length = builder.createBinOp(spv::Op::OpIAdd, builder.makeIntType(bits), length, builder.makeIntConstant(0));
  2446. } else {
  2447. length = builder.createUnaryOp(spv::Op::OpBitcast, builder.makeIntType(bits), length);
  2448. }
  2449. }
  2450. builder.clearAccessChain();
  2451. builder.setAccessChainRValue(length);
  2452. return false;
  2453. }
  2454. // Force variable declaration - Debug Mode Only
  2455. if (node->getOp() == glslang::EOpDeclare) {
  2456. builder.clearAccessChain();
  2457. node->getOperand()->traverse(this);
  2458. builder.clearAccessChain();
  2459. return false;
  2460. }
  2461. // Start by evaluating the operand
  2462. // Does it need a swizzle inversion? If so, evaluation is inverted;
  2463. // operate first on the swizzle base, then apply the swizzle.
  2464. spv::Id invertedType = spv::NoType;
  2465. auto resultType = [&invertedType, &node, this](){ return invertedType != spv::NoType ?
  2466. invertedType : convertGlslangToSpvType(node->getType()); };
  2467. if (node->getOp() == glslang::EOpInterpolateAtCentroid)
  2468. invertedType = getInvertedSwizzleType(*node->getOperand());
  2469. builder.clearAccessChain();
  2470. TIntermNode *operandNode;
  2471. if (invertedType != spv::NoType)
  2472. operandNode = node->getOperand()->getAsBinaryNode()->getLeft();
  2473. else
  2474. operandNode = node->getOperand();
  2475. operandNode->traverse(this);
  2476. spv::Id operand = spv::NoResult;
  2477. spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
  2478. const auto hitObjectOpsWithLvalue = [](glslang::TOperator op) {
  2479. switch(op) {
  2480. case glslang::EOpReorderThreadNV:
  2481. case glslang::EOpHitObjectGetCurrentTimeNV:
  2482. case glslang::EOpHitObjectGetHitKindNV:
  2483. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  2484. case glslang::EOpHitObjectGetGeometryIndexNV:
  2485. case glslang::EOpHitObjectGetInstanceIdNV:
  2486. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  2487. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  2488. case glslang::EOpHitObjectGetObjectRayOriginNV:
  2489. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  2490. case glslang::EOpHitObjectGetWorldRayOriginNV:
  2491. case glslang::EOpHitObjectGetWorldToObjectNV:
  2492. case glslang::EOpHitObjectGetObjectToWorldNV:
  2493. case glslang::EOpHitObjectGetRayTMaxNV:
  2494. case glslang::EOpHitObjectGetRayTMinNV:
  2495. case glslang::EOpHitObjectIsEmptyNV:
  2496. case glslang::EOpHitObjectIsHitNV:
  2497. case glslang::EOpHitObjectIsMissNV:
  2498. case glslang::EOpHitObjectRecordEmptyNV:
  2499. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  2500. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  2501. case glslang::EOpHitObjectGetClusterIdNV:
  2502. case glslang::EOpHitObjectGetSpherePositionNV:
  2503. case glslang::EOpHitObjectGetSphereRadiusNV:
  2504. case glslang::EOpHitObjectIsSphereHitNV:
  2505. case glslang::EOpHitObjectIsLSSHitNV:
  2506. case glslang::EOpReorderThreadEXT:
  2507. case glslang::EOpHitObjectGetCurrentTimeEXT:
  2508. case glslang::EOpHitObjectGetHitKindEXT:
  2509. case glslang::EOpHitObjectGetPrimitiveIndexEXT:
  2510. case glslang::EOpHitObjectGetGeometryIndexEXT:
  2511. case glslang::EOpHitObjectGetInstanceIdEXT:
  2512. case glslang::EOpHitObjectGetInstanceCustomIndexEXT:
  2513. case glslang::EOpHitObjectGetObjectRayDirectionEXT:
  2514. case glslang::EOpHitObjectGetObjectRayOriginEXT:
  2515. case glslang::EOpHitObjectGetWorldRayDirectionEXT:
  2516. case glslang::EOpHitObjectGetWorldRayOriginEXT:
  2517. case glslang::EOpHitObjectGetWorldToObjectEXT:
  2518. case glslang::EOpHitObjectGetObjectToWorldEXT:
  2519. case glslang::EOpHitObjectGetRayTMaxEXT:
  2520. case glslang::EOpHitObjectGetRayTMinEXT:
  2521. case glslang::EOpHitObjectGetRayFlagsEXT:
  2522. case glslang::EOpHitObjectIsEmptyEXT:
  2523. case glslang::EOpHitObjectIsHitEXT:
  2524. case glslang::EOpHitObjectIsMissEXT:
  2525. case glslang::EOpHitObjectRecordEmptyEXT:
  2526. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:
  2527. case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:
  2528. return true;
  2529. default:
  2530. return false;
  2531. }
  2532. };
  2533. if (node->getOp() == glslang::EOpAtomicCounterIncrement ||
  2534. node->getOp() == glslang::EOpAtomicCounterDecrement ||
  2535. node->getOp() == glslang::EOpAtomicCounter ||
  2536. (node->getOp() == glslang::EOpInterpolateAtCentroid &&
  2537. glslangIntermediate->getSource() != glslang::EShSourceHlsl) ||
  2538. node->getOp() == glslang::EOpRayQueryProceed ||
  2539. node->getOp() == glslang::EOpRayQueryGetRayTMin ||
  2540. node->getOp() == glslang::EOpRayQueryGetRayFlags ||
  2541. node->getOp() == glslang::EOpRayQueryGetWorldRayOrigin ||
  2542. node->getOp() == glslang::EOpRayQueryGetWorldRayDirection ||
  2543. node->getOp() == glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque ||
  2544. node->getOp() == glslang::EOpRayQueryTerminate ||
  2545. node->getOp() == glslang::EOpRayQueryConfirmIntersection ||
  2546. (node->getOp() == glslang::EOpSpirvInst && operandNode->getAsTyped()->getQualifier().isSpirvByReference()) ||
  2547. hitObjectOpsWithLvalue(node->getOp())) {
  2548. operand = builder.accessChainGetLValue(); // Special case l-value operands
  2549. lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
  2550. lvalueCoherentFlags |= TranslateCoherent(operandNode->getAsTyped()->getType());
  2551. } else if (operandNode->getAsTyped()->getQualifier().isSpirvLiteral()) {
  2552. // Will be translated to a literal value, make a placeholder here
  2553. operand = spv::NoResult;
  2554. } else {
  2555. operand = accessChainLoad(node->getOperand()->getType());
  2556. }
  2557. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2558. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2559. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  2560. // it could be a conversion
  2561. if (! result) {
  2562. result = createConversion(node->getOp(), decorations, resultType(), operand,
  2563. node->getType().getBasicType(), node->getOperand()->getBasicType());
  2564. if (result) {
  2565. if (node->getType().isCoopMatKHR() && node->getOperand()->getAsTyped()->getType().isCoopMatKHR() &&
  2566. !node->getAsTyped()->getType().sameCoopMatUse(node->getOperand()->getAsTyped()->getType())) {
  2567. // Conversions that change use need CapabilityCooperativeMatrixConversionsNV
  2568. builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
  2569. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  2570. }
  2571. }
  2572. }
  2573. // if not, then possibly an operation
  2574. if (! result)
  2575. result = createUnaryOperation(node->getOp(), decorations, resultType(), operand,
  2576. node->getOperand()->getBasicType(), lvalueCoherentFlags, node->getType());
  2577. // it could be attached to a SPIR-V intruction
  2578. if (!result) {
  2579. if (node->getOp() == glslang::EOpSpirvInst) {
  2580. const auto& spirvInst = node->getSpirvInstruction();
  2581. if (spirvInst.set == "") {
  2582. spv::IdImmediate idImmOp = {true, operand};
  2583. if (operandNode->getAsTyped()->getQualifier().isSpirvLiteral()) {
  2584. // Translate the constant to a literal value
  2585. std::vector<unsigned> literals;
  2586. glslang::TVector<const glslang::TIntermConstantUnion*> constants;
  2587. constants.push_back(operandNode->getAsConstantUnion());
  2588. TranslateLiterals(constants, literals);
  2589. idImmOp = {false, literals[0]};
  2590. }
  2591. if (node->getBasicType() == glslang::EbtVoid)
  2592. builder.createNoResultOp(static_cast<spv::Op>(spirvInst.id), {idImmOp});
  2593. else
  2594. result = builder.createOp(static_cast<spv::Op>(spirvInst.id), resultType(), {idImmOp});
  2595. } else {
  2596. result = builder.createBuiltinCall(
  2597. resultType(), spirvInst.set == "GLSL.std.450" ? stdBuiltins : getExtBuiltins(spirvInst.set.c_str()),
  2598. spirvInst.id, {operand});
  2599. }
  2600. if (node->getBasicType() == glslang::EbtVoid)
  2601. return false; // done with this node
  2602. }
  2603. }
  2604. if (result) {
  2605. if (invertedType) {
  2606. result = createInvertedSwizzle(decorations.precision, *node->getOperand(), result);
  2607. decorations.addNonUniform(builder, result);
  2608. }
  2609. builder.clearAccessChain();
  2610. builder.setAccessChainRValue(result);
  2611. return false; // done with this node
  2612. }
  2613. // it must be a special case, check...
  2614. switch (node->getOp()) {
  2615. case glslang::EOpPostIncrement:
  2616. case glslang::EOpPostDecrement:
  2617. case glslang::EOpPreIncrement:
  2618. case glslang::EOpPreDecrement:
  2619. {
  2620. // we need the integer value "1" or the floating point "1.0" to add/subtract
  2621. spv::Id one = 0;
  2622. if (node->getBasicType() == glslang::EbtFloat)
  2623. one = builder.makeFloatConstant(1.0F);
  2624. else if (node->getBasicType() == glslang::EbtDouble)
  2625. one = builder.makeDoubleConstant(1.0);
  2626. else if (node->getBasicType() == glslang::EbtFloat16)
  2627. one = builder.makeFloat16Constant(1.0F);
  2628. else if (node->getBasicType() == glslang::EbtBFloat16)
  2629. one = builder.makeBFloat16Constant(1.0F);
  2630. else if (node->getBasicType() == glslang::EbtFloatE5M2)
  2631. one = builder.makeFloatE5M2Constant(1.0F);
  2632. else if (node->getBasicType() == glslang::EbtFloatE4M3)
  2633. one = builder.makeFloatE4M3Constant(1.0F);
  2634. else if (node->getBasicType() == glslang::EbtInt8 || node->getBasicType() == glslang::EbtUint8)
  2635. one = builder.makeInt8Constant(1);
  2636. else if (node->getBasicType() == glslang::EbtInt16 || node->getBasicType() == glslang::EbtUint16)
  2637. one = builder.makeInt16Constant(1);
  2638. else if (node->getBasicType() == glslang::EbtInt64 || node->getBasicType() == glslang::EbtUint64)
  2639. one = builder.makeInt64Constant(1);
  2640. else
  2641. one = builder.makeIntConstant(1);
  2642. glslang::TOperator op;
  2643. if (node->getOp() == glslang::EOpPreIncrement ||
  2644. node->getOp() == glslang::EOpPostIncrement)
  2645. op = glslang::EOpAdd;
  2646. else
  2647. op = glslang::EOpSub;
  2648. spv::Id result = createBinaryOperation(op, decorations,
  2649. convertGlslangToSpvType(node->getType()), operand, one,
  2650. node->getType().getBasicType());
  2651. assert(result != spv::NoResult);
  2652. // The result of operation is always stored, but conditionally the
  2653. // consumed result. The consumed result is always an r-value.
  2654. builder.accessChainStore(result,
  2655. TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags));
  2656. builder.clearAccessChain();
  2657. if (node->getOp() == glslang::EOpPreIncrement ||
  2658. node->getOp() == glslang::EOpPreDecrement)
  2659. builder.setAccessChainRValue(result);
  2660. else
  2661. builder.setAccessChainRValue(operand);
  2662. }
  2663. return false;
  2664. case glslang::EOpAssumeEXT:
  2665. builder.addCapability(spv::Capability::ExpectAssumeKHR);
  2666. builder.addExtension(spv::E_SPV_KHR_expect_assume);
  2667. builder.createNoResultOp(spv::Op::OpAssumeTrueKHR, operand);
  2668. return false;
  2669. case glslang::EOpEmitStreamVertex:
  2670. builder.createNoResultOp(spv::Op::OpEmitStreamVertex, operand);
  2671. return false;
  2672. case glslang::EOpEndStreamPrimitive:
  2673. builder.createNoResultOp(spv::Op::OpEndStreamPrimitive, operand);
  2674. return false;
  2675. case glslang::EOpRayQueryTerminate:
  2676. builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR, operand);
  2677. return false;
  2678. case glslang::EOpRayQueryConfirmIntersection:
  2679. builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR, operand);
  2680. return false;
  2681. case glslang::EOpReorderThreadNV:
  2682. builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectNV, operand);
  2683. return false;
  2684. case glslang::EOpReorderThreadEXT:
  2685. builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectEXT, operand);
  2686. return false;
  2687. case glslang::EOpHitObjectRecordEmptyNV:
  2688. builder.createNoResultOp(spv::Op::OpHitObjectRecordEmptyNV, operand);
  2689. return false;
  2690. case glslang::EOpHitObjectRecordEmptyEXT:
  2691. builder.createNoResultOp(spv::Op::OpHitObjectRecordEmptyEXT, operand);
  2692. return false;
  2693. case glslang::EOpCreateTensorLayoutNV:
  2694. result = builder.createOp(spv::Op::OpCreateTensorLayoutNV, resultType(), std::vector<spv::Id>{});
  2695. builder.clearAccessChain();
  2696. builder.setAccessChainRValue(result);
  2697. return false;
  2698. case glslang::EOpCreateTensorViewNV:
  2699. result = builder.createOp(spv::Op::OpCreateTensorViewNV, resultType(), std::vector<spv::Id>{});
  2700. builder.clearAccessChain();
  2701. builder.setAccessChainRValue(result);
  2702. return false;
  2703. default:
  2704. logger->missingFunctionality("unknown glslang unary");
  2705. return true; // pick up operand as placeholder result
  2706. }
  2707. }
  2708. // Construct a composite object, recursively copying members if their types don't match
  2709. spv::Id TGlslangToSpvTraverser::createCompositeConstruct(spv::Id resultTypeId, std::vector<spv::Id> constituents)
  2710. {
  2711. for (int c = 0; c < (int)constituents.size(); ++c) {
  2712. spv::Id& constituent = constituents[c];
  2713. spv::Id lType = builder.getContainedTypeId(resultTypeId, c);
  2714. spv::Id rType = builder.getTypeId(constituent);
  2715. if (lType != rType) {
  2716. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  2717. constituent = builder.createUnaryOp(spv::Op::OpCopyLogical, lType, constituent);
  2718. } else if (builder.isStructType(rType)) {
  2719. std::vector<spv::Id> rTypeConstituents;
  2720. int numrTypeConstituents = builder.getNumTypeConstituents(rType);
  2721. for (int i = 0; i < numrTypeConstituents; ++i) {
  2722. rTypeConstituents.push_back(builder.createCompositeExtract(constituent,
  2723. builder.getContainedTypeId(rType, i), i));
  2724. }
  2725. constituents[c] = createCompositeConstruct(lType, rTypeConstituents);
  2726. } else {
  2727. assert(builder.isArrayType(rType));
  2728. std::vector<spv::Id> rTypeConstituents;
  2729. int numrTypeConstituents = builder.getNumTypeConstituents(rType);
  2730. spv::Id elementRType = builder.getContainedTypeId(rType);
  2731. for (int i = 0; i < numrTypeConstituents; ++i) {
  2732. rTypeConstituents.push_back(builder.createCompositeExtract(constituent, elementRType, i));
  2733. }
  2734. constituents[c] = createCompositeConstruct(lType, rTypeConstituents);
  2735. }
  2736. }
  2737. }
  2738. return builder.createCompositeConstruct(resultTypeId, constituents);
  2739. }
  2740. bool TGlslangToSpvTraverser::visitAggregate(glslang::TVisit visit, glslang::TIntermAggregate* node)
  2741. {
  2742. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2743. if (node->getType().getQualifier().isSpecConstant())
  2744. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2745. spv::Id result = spv::NoResult;
  2746. spv::Id invertedType = spv::NoType; // to use to override the natural type of the node
  2747. std::vector<spv::Builder::AccessChain> complexLvalues; // for holding swizzling l-values too complex for
  2748. // SPIR-V, for an out parameter
  2749. std::vector<spv::Id> temporaryLvalues; // temporaries to pass, as proxies for complexLValues
  2750. auto resultType = [&invertedType, &node, this](){
  2751. if (invertedType != spv::NoType) {
  2752. return invertedType;
  2753. } else {
  2754. auto ret = convertGlslangToSpvType(node->getType());
  2755. // convertGlslangToSpvType may clobber the debug location, reset it
  2756. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2757. return ret;
  2758. }
  2759. };
  2760. // try texturing
  2761. result = createImageTextureFunctionCall(node);
  2762. if (result != spv::NoResult) {
  2763. builder.clearAccessChain();
  2764. builder.setAccessChainRValue(result);
  2765. return false;
  2766. } else if (node->getOp() == glslang::EOpImageStore ||
  2767. node->getOp() == glslang::EOpImageStoreLod ||
  2768. node->getOp() == glslang::EOpImageAtomicStore) {
  2769. // "imageStore" is a special case, which has no result
  2770. return false;
  2771. }
  2772. glslang::TOperator binOp = glslang::EOpNull;
  2773. bool reduceComparison = true;
  2774. bool isMatrix = false;
  2775. bool noReturnValue = false;
  2776. bool atomic = false;
  2777. spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
  2778. assert(node->getOp());
  2779. spv::Decoration precision = TranslatePrecisionDecoration(node->getOperationPrecision());
  2780. switch (node->getOp()) {
  2781. case glslang::EOpScope:
  2782. case glslang::EOpSequence:
  2783. {
  2784. if (visit == glslang::EvPreVisit) {
  2785. ++sequenceDepth;
  2786. if (sequenceDepth == 1) {
  2787. // If this is the parent node of all the functions, we want to see them
  2788. // early, so all call points have actual SPIR-V functions to reference.
  2789. // In all cases, still let the traverser visit the children for us.
  2790. makeFunctions(node->getAsAggregate()->getSequence());
  2791. // Global initializers is specific to the shader entry point, which does not exist in compile-only mode
  2792. if (!options.compileOnly) {
  2793. // Also, we want all globals initializers to go into the beginning of the entry point, before
  2794. // anything else gets there, so visit out of order, doing them all now.
  2795. makeGlobalInitializers(node->getAsAggregate()->getSequence());
  2796. }
  2797. //Pre process linker objects for ray tracing stages
  2798. if (glslangIntermediate->isRayTracingStage())
  2799. collectRayTracingLinkerObjects();
  2800. // Initializers are done, don't want to visit again, but functions and link objects need to be processed,
  2801. // so do them manually.
  2802. visitFunctions(node->getAsAggregate()->getSequence());
  2803. return false;
  2804. } else {
  2805. if (node->getOp() == glslang::EOpScope) {
  2806. auto loc = node->getLoc();
  2807. builder.enterLexicalBlock(loc.line, loc.column);
  2808. }
  2809. }
  2810. } else {
  2811. if (sequenceDepth > 1 && node->getOp() == glslang::EOpScope)
  2812. builder.leaveLexicalBlock();
  2813. --sequenceDepth;
  2814. }
  2815. return true;
  2816. }
  2817. case glslang::EOpLinkerObjects:
  2818. {
  2819. if (visit == glslang::EvPreVisit)
  2820. linkageOnly = true;
  2821. else
  2822. linkageOnly = false;
  2823. return true;
  2824. }
  2825. case glslang::EOpComma:
  2826. {
  2827. // processing from left to right naturally leaves the right-most
  2828. // lying around in the access chain
  2829. glslang::TIntermSequence& glslangOperands = node->getSequence();
  2830. for (int i = 0; i < (int)glslangOperands.size(); ++i)
  2831. glslangOperands[i]->traverse(this);
  2832. return false;
  2833. }
  2834. case glslang::EOpFunction:
  2835. if (visit == glslang::EvPreVisit) {
  2836. if (options.generateDebugInfo) {
  2837. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2838. }
  2839. if (isShaderEntryPoint(node)) {
  2840. inEntryPoint = true;
  2841. builder.setBuildPoint(shaderEntry->getLastBlock());
  2842. builder.enterFunction(shaderEntry);
  2843. currentFunction = shaderEntry;
  2844. } else {
  2845. // SPIR-V functions should already be in the functionMap from the prepass
  2846. // that called makeFunctions().
  2847. currentFunction = functionMap[node->getName().c_str()];
  2848. spv::Block* functionBlock = currentFunction->getEntryBlock();
  2849. builder.setBuildPoint(functionBlock);
  2850. builder.enterFunction(currentFunction);
  2851. }
  2852. if (options.generateDebugInfo && !options.emitNonSemanticShaderDebugInfo) {
  2853. const auto& loc = node->getLoc();
  2854. const char* sourceFileName = loc.getFilename();
  2855. spv::Id sourceFileId = sourceFileName ? builder.getStringId(sourceFileName) : builder.getMainFileId();
  2856. currentFunction->setDebugLineInfo(sourceFileId, loc.line, loc.column);
  2857. }
  2858. } else {
  2859. // Here we have finished visiting the function (post-visit). Finalize it.
  2860. if (options.generateDebugInfo) {
  2861. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl && node->getSequence().size() > 1) {
  2862. auto endLoc = node->getSequence()[1]->getAsAggregate()->getEndLoc();
  2863. builder.setDebugSourceLocation(endLoc.line, endLoc.getFilename());
  2864. }
  2865. }
  2866. if (inEntryPoint)
  2867. entryPointTerminated = true;
  2868. builder.leaveFunction();
  2869. inEntryPoint = false;
  2870. currentFunction = nullptr;
  2871. }
  2872. return true;
  2873. case glslang::EOpParameters:
  2874. // Parameters will have been consumed by EOpFunction processing, but not
  2875. // the body, so we still visited the function node's children, making this
  2876. // child redundant.
  2877. return false;
  2878. case glslang::EOpFunctionCall:
  2879. {
  2880. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2881. if (node->isUserDefined())
  2882. result = handleUserFunctionCall(node);
  2883. if (result) {
  2884. builder.clearAccessChain();
  2885. builder.setAccessChainRValue(result);
  2886. } else
  2887. logger->missingFunctionality("missing user function; linker needs to catch that");
  2888. return false;
  2889. }
  2890. case glslang::EOpConstructMat2x2:
  2891. case glslang::EOpConstructMat2x3:
  2892. case glslang::EOpConstructMat2x4:
  2893. case glslang::EOpConstructMat3x2:
  2894. case glslang::EOpConstructMat3x3:
  2895. case glslang::EOpConstructMat3x4:
  2896. case glslang::EOpConstructMat4x2:
  2897. case glslang::EOpConstructMat4x3:
  2898. case glslang::EOpConstructMat4x4:
  2899. case glslang::EOpConstructDMat2x2:
  2900. case glslang::EOpConstructDMat2x3:
  2901. case glslang::EOpConstructDMat2x4:
  2902. case glslang::EOpConstructDMat3x2:
  2903. case glslang::EOpConstructDMat3x3:
  2904. case glslang::EOpConstructDMat3x4:
  2905. case glslang::EOpConstructDMat4x2:
  2906. case glslang::EOpConstructDMat4x3:
  2907. case glslang::EOpConstructDMat4x4:
  2908. case glslang::EOpConstructIMat2x2:
  2909. case glslang::EOpConstructIMat2x3:
  2910. case glslang::EOpConstructIMat2x4:
  2911. case glslang::EOpConstructIMat3x2:
  2912. case glslang::EOpConstructIMat3x3:
  2913. case glslang::EOpConstructIMat3x4:
  2914. case glslang::EOpConstructIMat4x2:
  2915. case glslang::EOpConstructIMat4x3:
  2916. case glslang::EOpConstructIMat4x4:
  2917. case glslang::EOpConstructUMat2x2:
  2918. case glslang::EOpConstructUMat2x3:
  2919. case glslang::EOpConstructUMat2x4:
  2920. case glslang::EOpConstructUMat3x2:
  2921. case glslang::EOpConstructUMat3x3:
  2922. case glslang::EOpConstructUMat3x4:
  2923. case glslang::EOpConstructUMat4x2:
  2924. case glslang::EOpConstructUMat4x3:
  2925. case glslang::EOpConstructUMat4x4:
  2926. case glslang::EOpConstructBMat2x2:
  2927. case glslang::EOpConstructBMat2x3:
  2928. case glslang::EOpConstructBMat2x4:
  2929. case glslang::EOpConstructBMat3x2:
  2930. case glslang::EOpConstructBMat3x3:
  2931. case glslang::EOpConstructBMat3x4:
  2932. case glslang::EOpConstructBMat4x2:
  2933. case glslang::EOpConstructBMat4x3:
  2934. case glslang::EOpConstructBMat4x4:
  2935. case glslang::EOpConstructF16Mat2x2:
  2936. case glslang::EOpConstructF16Mat2x3:
  2937. case glslang::EOpConstructF16Mat2x4:
  2938. case glslang::EOpConstructF16Mat3x2:
  2939. case glslang::EOpConstructF16Mat3x3:
  2940. case glslang::EOpConstructF16Mat3x4:
  2941. case glslang::EOpConstructF16Mat4x2:
  2942. case glslang::EOpConstructF16Mat4x3:
  2943. case glslang::EOpConstructF16Mat4x4:
  2944. isMatrix = true;
  2945. [[fallthrough]];
  2946. case glslang::EOpConstructFloat:
  2947. case glslang::EOpConstructVec2:
  2948. case glslang::EOpConstructVec3:
  2949. case glslang::EOpConstructVec4:
  2950. case glslang::EOpConstructDouble:
  2951. case glslang::EOpConstructDVec2:
  2952. case glslang::EOpConstructDVec3:
  2953. case glslang::EOpConstructDVec4:
  2954. case glslang::EOpConstructFloat16:
  2955. case glslang::EOpConstructF16Vec2:
  2956. case glslang::EOpConstructF16Vec3:
  2957. case glslang::EOpConstructF16Vec4:
  2958. case glslang::EOpConstructBFloat16:
  2959. case glslang::EOpConstructBF16Vec2:
  2960. case glslang::EOpConstructBF16Vec3:
  2961. case glslang::EOpConstructBF16Vec4:
  2962. case glslang::EOpConstructFloatE5M2:
  2963. case glslang::EOpConstructFloatE5M2Vec2:
  2964. case glslang::EOpConstructFloatE5M2Vec3:
  2965. case glslang::EOpConstructFloatE5M2Vec4:
  2966. case glslang::EOpConstructFloatE4M3:
  2967. case glslang::EOpConstructFloatE4M3Vec2:
  2968. case glslang::EOpConstructFloatE4M3Vec3:
  2969. case glslang::EOpConstructFloatE4M3Vec4:
  2970. case glslang::EOpConstructBool:
  2971. case glslang::EOpConstructBVec2:
  2972. case glslang::EOpConstructBVec3:
  2973. case glslang::EOpConstructBVec4:
  2974. case glslang::EOpConstructInt8:
  2975. case glslang::EOpConstructI8Vec2:
  2976. case glslang::EOpConstructI8Vec3:
  2977. case glslang::EOpConstructI8Vec4:
  2978. case glslang::EOpConstructUint8:
  2979. case glslang::EOpConstructU8Vec2:
  2980. case glslang::EOpConstructU8Vec3:
  2981. case glslang::EOpConstructU8Vec4:
  2982. case glslang::EOpConstructInt16:
  2983. case glslang::EOpConstructI16Vec2:
  2984. case glslang::EOpConstructI16Vec3:
  2985. case glslang::EOpConstructI16Vec4:
  2986. case glslang::EOpConstructUint16:
  2987. case glslang::EOpConstructU16Vec2:
  2988. case glslang::EOpConstructU16Vec3:
  2989. case glslang::EOpConstructU16Vec4:
  2990. case glslang::EOpConstructInt:
  2991. case glslang::EOpConstructIVec2:
  2992. case glslang::EOpConstructIVec3:
  2993. case glslang::EOpConstructIVec4:
  2994. case glslang::EOpConstructUint:
  2995. case glslang::EOpConstructUVec2:
  2996. case glslang::EOpConstructUVec3:
  2997. case glslang::EOpConstructUVec4:
  2998. case glslang::EOpConstructInt64:
  2999. case glslang::EOpConstructI64Vec2:
  3000. case glslang::EOpConstructI64Vec3:
  3001. case glslang::EOpConstructI64Vec4:
  3002. case glslang::EOpConstructUint64:
  3003. case glslang::EOpConstructU64Vec2:
  3004. case glslang::EOpConstructU64Vec3:
  3005. case glslang::EOpConstructU64Vec4:
  3006. case glslang::EOpConstructStruct:
  3007. case glslang::EOpConstructTextureSampler:
  3008. case glslang::EOpConstructReference:
  3009. case glslang::EOpConstructCooperativeMatrixNV:
  3010. case glslang::EOpConstructCooperativeMatrixKHR:
  3011. case glslang::EOpConstructCooperativeVectorNV:
  3012. case glslang::EOpConstructSaturated:
  3013. {
  3014. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3015. std::vector<spv::Id> arguments;
  3016. translateArguments(*node, arguments, lvalueCoherentFlags);
  3017. spv::Id constructed;
  3018. if (node->getOp() == glslang::EOpConstructTextureSampler) {
  3019. const glslang::TType& texType = node->getSequence()[0]->getAsTyped()->getType();
  3020. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6 &&
  3021. texType.getSampler().isBuffer()) {
  3022. // SamplerBuffer is not supported in spirv1.6 so
  3023. // `samplerBuffer(textureBuffer, sampler)` is a no-op
  3024. // and textureBuffer is the result going forward
  3025. constructed = arguments[0];
  3026. } else
  3027. constructed = builder.createOp(spv::Op::OpSampledImage, resultType(), arguments);
  3028. } else if (node->getOp() == glslang::EOpConstructCooperativeMatrixKHR &&
  3029. node->getType().isCoopMatKHR() && node->getSequence()[0]->getAsTyped()->getType().isCoopMatKHR()) {
  3030. builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
  3031. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3032. constructed = builder.createCooperativeMatrixConversion(resultType(), arguments[0]);
  3033. } else if (node->getOp() == glslang::EOpConstructCooperativeVectorNV &&
  3034. arguments.size() == 1 &&
  3035. builder.getTypeId(arguments[0]) == resultType()) {
  3036. constructed = arguments[0];
  3037. } else if (node->getOp() == glslang::EOpConstructStruct ||
  3038. node->getOp() == glslang::EOpConstructCooperativeMatrixNV ||
  3039. node->getOp() == glslang::EOpConstructCooperativeMatrixKHR ||
  3040. node->getType().isArray() ||
  3041. // Handle constructing coopvec from one component here, to avoid the component
  3042. // getting smeared
  3043. (node->getOp() == glslang::EOpConstructCooperativeVectorNV && arguments.size() == 1 && builder.isScalar(arguments[0]))) {
  3044. std::vector<spv::Id> constituents;
  3045. for (int c = 0; c < (int)arguments.size(); ++c)
  3046. constituents.push_back(arguments[c]);
  3047. constructed = createCompositeConstruct(resultType(), constituents);
  3048. } else if (isMatrix)
  3049. constructed = builder.createMatrixConstructor(precision, arguments, resultType());
  3050. else if (node->getOp() == glslang::EOpConstructSaturated) {
  3051. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  3052. TranslateNoContractionDecoration(node->getType().getQualifier()),
  3053. TranslateNonUniformDecoration(lvalueCoherentFlags) };
  3054. constructed = createConversion(node->getOp(), decorations, resultType(), arguments[1],
  3055. node->getType().getBasicType(), node->getSequence()[1]->getAsTyped()->getBasicType());
  3056. builder.addDecoration(constructed, spv::Decoration::SaturatedToLargestFloat8NormalConversionEXT);
  3057. builder.createStore(constructed, arguments[0]);
  3058. }
  3059. else
  3060. constructed = builder.createConstructor(precision, arguments, resultType());
  3061. if (node->getType().getQualifier().isNonUniform()) {
  3062. builder.addDecoration(constructed, spv::Decoration::NonUniformEXT);
  3063. }
  3064. builder.clearAccessChain();
  3065. builder.setAccessChainRValue(constructed);
  3066. return false;
  3067. }
  3068. // These six are component-wise compares with component-wise results.
  3069. // Forward on to createBinaryOperation(), requesting a vector result.
  3070. case glslang::EOpLessThan:
  3071. case glslang::EOpGreaterThan:
  3072. case glslang::EOpLessThanEqual:
  3073. case glslang::EOpGreaterThanEqual:
  3074. case glslang::EOpVectorEqual:
  3075. case glslang::EOpVectorNotEqual:
  3076. {
  3077. // Map the operation to a binary
  3078. binOp = node->getOp();
  3079. reduceComparison = false;
  3080. switch (node->getOp()) {
  3081. case glslang::EOpVectorEqual: binOp = glslang::EOpVectorEqual; break;
  3082. case glslang::EOpVectorNotEqual: binOp = glslang::EOpVectorNotEqual; break;
  3083. default: binOp = node->getOp(); break;
  3084. }
  3085. break;
  3086. }
  3087. case glslang::EOpMul:
  3088. // component-wise matrix multiply
  3089. binOp = glslang::EOpMul;
  3090. break;
  3091. case glslang::EOpOuterProduct:
  3092. // two vectors multiplied to make a matrix
  3093. binOp = glslang::EOpOuterProduct;
  3094. break;
  3095. case glslang::EOpDot:
  3096. {
  3097. // for scalar dot product, use multiply
  3098. glslang::TIntermSequence& glslangOperands = node->getSequence();
  3099. if (glslangOperands[0]->getAsTyped()->getVectorSize() == 1)
  3100. binOp = glslang::EOpMul;
  3101. break;
  3102. }
  3103. case glslang::EOpMod:
  3104. // when an aggregate, this is the floating-point mod built-in function,
  3105. // which can be emitted by the one in createBinaryOperation()
  3106. binOp = glslang::EOpMod;
  3107. break;
  3108. case glslang::EOpEmitVertex:
  3109. case glslang::EOpEndPrimitive:
  3110. case glslang::EOpBarrier:
  3111. case glslang::EOpMemoryBarrier:
  3112. case glslang::EOpMemoryBarrierAtomicCounter:
  3113. case glslang::EOpMemoryBarrierBuffer:
  3114. case glslang::EOpMemoryBarrierImage:
  3115. case glslang::EOpMemoryBarrierShared:
  3116. case glslang::EOpGroupMemoryBarrier:
  3117. case glslang::EOpDeviceMemoryBarrier:
  3118. case glslang::EOpAllMemoryBarrierWithGroupSync:
  3119. case glslang::EOpDeviceMemoryBarrierWithGroupSync:
  3120. case glslang::EOpWorkgroupMemoryBarrier:
  3121. case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:
  3122. case glslang::EOpSubgroupBarrier:
  3123. case glslang::EOpSubgroupMemoryBarrier:
  3124. case glslang::EOpSubgroupMemoryBarrierBuffer:
  3125. case glslang::EOpSubgroupMemoryBarrierImage:
  3126. case glslang::EOpSubgroupMemoryBarrierShared:
  3127. noReturnValue = true;
  3128. // These all have 0 operands and will naturally finish up in the code below for 0 operands
  3129. break;
  3130. case glslang::EOpAtomicAdd:
  3131. case glslang::EOpAtomicSubtract:
  3132. case glslang::EOpAtomicMin:
  3133. case glslang::EOpAtomicMax:
  3134. case glslang::EOpAtomicAnd:
  3135. case glslang::EOpAtomicOr:
  3136. case glslang::EOpAtomicXor:
  3137. case glslang::EOpAtomicExchange:
  3138. case glslang::EOpAtomicCompSwap:
  3139. atomic = true;
  3140. break;
  3141. case glslang::EOpAtomicStore:
  3142. noReturnValue = true;
  3143. [[fallthrough]];
  3144. case glslang::EOpAtomicLoad:
  3145. atomic = true;
  3146. break;
  3147. case glslang::EOpAtomicCounterAdd:
  3148. case glslang::EOpAtomicCounterSubtract:
  3149. case glslang::EOpAtomicCounterMin:
  3150. case glslang::EOpAtomicCounterMax:
  3151. case glslang::EOpAtomicCounterAnd:
  3152. case glslang::EOpAtomicCounterOr:
  3153. case glslang::EOpAtomicCounterXor:
  3154. case glslang::EOpAtomicCounterExchange:
  3155. case glslang::EOpAtomicCounterCompSwap:
  3156. builder.addExtension("SPV_KHR_shader_atomic_counter_ops");
  3157. builder.addCapability(spv::Capability::AtomicStorageOps);
  3158. atomic = true;
  3159. break;
  3160. case glslang::EOpAbsDifference:
  3161. case glslang::EOpAddSaturate:
  3162. case glslang::EOpSubSaturate:
  3163. case glslang::EOpAverage:
  3164. case glslang::EOpAverageRounded:
  3165. case glslang::EOpMul32x16:
  3166. builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
  3167. builder.addExtension("SPV_INTEL_shader_integer_functions2");
  3168. binOp = node->getOp();
  3169. break;
  3170. case glslang::EOpExpectEXT:
  3171. builder.addCapability(spv::Capability::ExpectAssumeKHR);
  3172. builder.addExtension(spv::E_SPV_KHR_expect_assume);
  3173. binOp = node->getOp();
  3174. break;
  3175. case glslang::EOpIgnoreIntersectionNV:
  3176. case glslang::EOpTerminateRayNV:
  3177. case glslang::EOpTraceNV:
  3178. case glslang::EOpTraceRayMotionNV:
  3179. case glslang::EOpTraceKHR:
  3180. case glslang::EOpExecuteCallableNV:
  3181. case glslang::EOpExecuteCallableKHR:
  3182. case glslang::EOpWritePackedPrimitiveIndices4x8NV:
  3183. case glslang::EOpEmitMeshTasksEXT:
  3184. case glslang::EOpSetMeshOutputsEXT:
  3185. noReturnValue = true;
  3186. break;
  3187. case glslang::EOpRayQueryInitialize:
  3188. case glslang::EOpRayQueryTerminate:
  3189. case glslang::EOpRayQueryGenerateIntersection:
  3190. case glslang::EOpRayQueryConfirmIntersection:
  3191. builder.addExtension("SPV_KHR_ray_query");
  3192. builder.addCapability(spv::Capability::RayQueryKHR);
  3193. noReturnValue = true;
  3194. break;
  3195. case glslang::EOpRayQueryProceed:
  3196. case glslang::EOpRayQueryGetIntersectionType:
  3197. case glslang::EOpRayQueryGetRayTMin:
  3198. case glslang::EOpRayQueryGetRayFlags:
  3199. case glslang::EOpRayQueryGetIntersectionT:
  3200. case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
  3201. case glslang::EOpRayQueryGetIntersectionInstanceId:
  3202. case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
  3203. case glslang::EOpRayQueryGetIntersectionGeometryIndex:
  3204. case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
  3205. case glslang::EOpRayQueryGetIntersectionBarycentrics:
  3206. case glslang::EOpRayQueryGetIntersectionFrontFace:
  3207. case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
  3208. case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
  3209. case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
  3210. case glslang::EOpRayQueryGetWorldRayDirection:
  3211. case glslang::EOpRayQueryGetWorldRayOrigin:
  3212. case glslang::EOpRayQueryGetIntersectionObjectToWorld:
  3213. case glslang::EOpRayQueryGetIntersectionWorldToObject:
  3214. builder.addExtension("SPV_KHR_ray_query");
  3215. builder.addCapability(spv::Capability::RayQueryKHR);
  3216. break;
  3217. case glslang::EOpCooperativeMatrixLoad:
  3218. case glslang::EOpCooperativeMatrixStore:
  3219. case glslang::EOpCooperativeMatrixLoadNV:
  3220. case glslang::EOpCooperativeMatrixStoreNV:
  3221. case glslang::EOpCooperativeMatrixLoadTensorNV:
  3222. case glslang::EOpCooperativeMatrixStoreTensorNV:
  3223. case glslang::EOpCooperativeMatrixReduceNV:
  3224. case glslang::EOpCooperativeMatrixPerElementOpNV:
  3225. case glslang::EOpCooperativeMatrixTransposeNV:
  3226. case glslang::EOpCooperativeVectorMatMulNV:
  3227. case glslang::EOpCooperativeVectorMatMulAddNV:
  3228. case glslang::EOpCooperativeVectorLoadNV:
  3229. case glslang::EOpCooperativeVectorStoreNV:
  3230. case glslang::EOpCooperativeVectorOuterProductAccumulateNV:
  3231. case glslang::EOpCooperativeVectorReduceSumAccumulateNV:
  3232. noReturnValue = true;
  3233. break;
  3234. case glslang::EOpBeginInvocationInterlock:
  3235. case glslang::EOpEndInvocationInterlock:
  3236. builder.addExtension(spv::E_SPV_EXT_fragment_shader_interlock);
  3237. noReturnValue = true;
  3238. break;
  3239. case glslang::EOpHitObjectTraceRayNV:
  3240. case glslang::EOpHitObjectTraceRayMotionNV:
  3241. case glslang::EOpHitObjectGetAttributesNV:
  3242. case glslang::EOpHitObjectExecuteShaderNV:
  3243. case glslang::EOpHitObjectRecordEmptyNV:
  3244. case glslang::EOpHitObjectRecordMissNV:
  3245. case glslang::EOpHitObjectRecordMissMotionNV:
  3246. case glslang::EOpHitObjectRecordHitNV:
  3247. case glslang::EOpHitObjectRecordHitMotionNV:
  3248. case glslang::EOpHitObjectRecordHitWithIndexNV:
  3249. case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
  3250. case glslang::EOpReorderThreadNV:
  3251. noReturnValue = true;
  3252. [[fallthrough]];
  3253. case glslang::EOpHitObjectIsEmptyNV:
  3254. case glslang::EOpHitObjectIsMissNV:
  3255. case glslang::EOpHitObjectIsHitNV:
  3256. case glslang::EOpHitObjectGetRayTMinNV:
  3257. case glslang::EOpHitObjectGetRayTMaxNV:
  3258. case glslang::EOpHitObjectGetObjectRayOriginNV:
  3259. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  3260. case glslang::EOpHitObjectGetWorldRayOriginNV:
  3261. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  3262. case glslang::EOpHitObjectGetObjectToWorldNV:
  3263. case glslang::EOpHitObjectGetWorldToObjectNV:
  3264. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  3265. case glslang::EOpHitObjectGetInstanceIdNV:
  3266. case glslang::EOpHitObjectGetGeometryIndexNV:
  3267. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  3268. case glslang::EOpHitObjectGetHitKindNV:
  3269. case glslang::EOpHitObjectGetCurrentTimeNV:
  3270. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  3271. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  3272. builder.addExtension(spv::E_SPV_NV_shader_invocation_reorder);
  3273. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  3274. break;
  3275. case glslang::EOpHitObjectGetLSSPositionsNV:
  3276. case glslang::EOpHitObjectGetLSSRadiiNV:
  3277. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3278. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  3279. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3280. noReturnValue = true;
  3281. break;
  3282. case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
  3283. case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
  3284. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3285. builder.addCapability(spv::Capability::RayQueryKHR);
  3286. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3287. noReturnValue = true;
  3288. break;
  3289. case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
  3290. case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
  3291. case glslang::EOpRayQueryIsSphereHitNV:
  3292. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3293. builder.addCapability(spv::Capability::RayQueryKHR);
  3294. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  3295. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3296. break;
  3297. case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
  3298. case glslang::EOpRayQueryIsLSSHitNV:
  3299. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3300. builder.addCapability(spv::Capability::RayQueryKHR);
  3301. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3302. break;
  3303. case glslang::EOpHitObjectTraceRayEXT:
  3304. case glslang::EOpHitObjectTraceRayMotionEXT:
  3305. case glslang::EOpHitObjectGetAttributesEXT:
  3306. case glslang::EOpHitObjectExecuteShaderEXT:
  3307. case glslang::EOpHitObjectRecordEmptyEXT:
  3308. case glslang::EOpHitObjectRecordMissEXT:
  3309. case glslang::EOpHitObjectRecordMissMotionEXT:
  3310. case glslang::EOpReorderThreadEXT:
  3311. case glslang::EOpHitObjectSetShaderBindingTableRecordIndexEXT:
  3312. case glslang::EOpHitObjectReorderExecuteEXT:
  3313. case glslang::EOpHitObjectTraceReorderExecuteEXT:
  3314. case glslang::EOpHitObjectTraceMotionReorderExecuteEXT:
  3315. case glslang::EOpHitObjectRecordFromQueryEXT:
  3316. case glslang::EOpHitObjectGetIntersectionTriangleVertexPositionsEXT:
  3317. noReturnValue = true;
  3318. [[fallthrough]];
  3319. case glslang::EOpHitObjectIsEmptyEXT:
  3320. case glslang::EOpHitObjectIsMissEXT:
  3321. case glslang::EOpHitObjectIsHitEXT:
  3322. case glslang::EOpHitObjectGetRayTMinEXT:
  3323. case glslang::EOpHitObjectGetRayTMaxEXT:
  3324. case glslang::EOpHitObjectGetRayFlagsEXT:
  3325. case glslang::EOpHitObjectGetObjectRayOriginEXT:
  3326. case glslang::EOpHitObjectGetObjectRayDirectionEXT:
  3327. case glslang::EOpHitObjectGetWorldRayOriginEXT:
  3328. case glslang::EOpHitObjectGetWorldRayDirectionEXT:
  3329. case glslang::EOpHitObjectGetObjectToWorldEXT:
  3330. case glslang::EOpHitObjectGetWorldToObjectEXT:
  3331. case glslang::EOpHitObjectGetInstanceCustomIndexEXT:
  3332. case glslang::EOpHitObjectGetInstanceIdEXT:
  3333. case glslang::EOpHitObjectGetGeometryIndexEXT:
  3334. case glslang::EOpHitObjectGetPrimitiveIndexEXT:
  3335. case glslang::EOpHitObjectGetHitKindEXT:
  3336. case glslang::EOpHitObjectGetCurrentTimeEXT:
  3337. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:
  3338. case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:
  3339. builder.addExtension(spv::E_SPV_EXT_shader_invocation_reorder);
  3340. builder.addCapability(spv::Capability::ShaderInvocationReorderEXT);
  3341. break;
  3342. case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
  3343. builder.addExtension(spv::E_SPV_KHR_ray_tracing_position_fetch);
  3344. builder.addCapability(spv::Capability::RayQueryPositionFetchKHR);
  3345. noReturnValue = true;
  3346. break;
  3347. case glslang::EOpImageSampleWeightedQCOM:
  3348. builder.addCapability(spv::Capability::TextureSampleWeightedQCOM);
  3349. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3350. break;
  3351. case glslang::EOpImageBoxFilterQCOM:
  3352. builder.addCapability(spv::Capability::TextureBoxFilterQCOM);
  3353. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3354. break;
  3355. case glslang::EOpImageBlockMatchSADQCOM:
  3356. case glslang::EOpImageBlockMatchSSDQCOM:
  3357. builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
  3358. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3359. break;
  3360. case glslang::EOpTensorWriteARM:
  3361. noReturnValue = true;
  3362. break;
  3363. case glslang::EOpImageBlockMatchWindowSSDQCOM:
  3364. case glslang::EOpImageBlockMatchWindowSADQCOM:
  3365. builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
  3366. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3367. builder.addCapability(spv::Capability::TextureBlockMatch2QCOM);
  3368. builder.addExtension(spv::E_SPV_QCOM_image_processing2);
  3369. break;
  3370. case glslang::EOpImageBlockMatchGatherSSDQCOM:
  3371. case glslang::EOpImageBlockMatchGatherSADQCOM:
  3372. builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
  3373. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3374. builder.addCapability(spv::Capability::TextureBlockMatch2QCOM);
  3375. builder.addExtension(spv::E_SPV_QCOM_image_processing2);
  3376. break;
  3377. case glslang::EOpFetchMicroTriangleVertexPositionNV:
  3378. case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
  3379. builder.addExtension(spv::E_SPV_NV_displacement_micromap);
  3380. builder.addCapability(spv::Capability::DisplacementMicromapNV);
  3381. break;
  3382. case glslang::EOpRayQueryGetIntersectionClusterIdNV:
  3383. builder.addExtension(spv::E_SPV_NV_cluster_acceleration_structure);
  3384. builder.addCapability(spv::Capability::RayQueryKHR);
  3385. builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
  3386. break;
  3387. case glslang::EOpDebugPrintf:
  3388. noReturnValue = true;
  3389. break;
  3390. default:
  3391. break;
  3392. }
  3393. //
  3394. // See if it maps to a regular operation.
  3395. //
  3396. if (binOp != glslang::EOpNull) {
  3397. glslang::TIntermTyped* left = node->getSequence()[0]->getAsTyped();
  3398. glslang::TIntermTyped* right = node->getSequence()[1]->getAsTyped();
  3399. assert(left && right);
  3400. builder.clearAccessChain();
  3401. left->traverse(this);
  3402. spv::Id leftId = accessChainLoad(left->getType());
  3403. builder.clearAccessChain();
  3404. right->traverse(this);
  3405. spv::Id rightId = accessChainLoad(right->getType());
  3406. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3407. OpDecorations decorations = { precision,
  3408. TranslateNoContractionDecoration(node->getType().getQualifier()),
  3409. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  3410. result = createBinaryOperation(binOp, decorations,
  3411. resultType(), leftId, rightId,
  3412. left->getType().getBasicType(), reduceComparison);
  3413. // code above should only make binOp that exists in createBinaryOperation
  3414. assert(result != spv::NoResult);
  3415. builder.clearAccessChain();
  3416. builder.setAccessChainRValue(result);
  3417. return false;
  3418. }
  3419. //
  3420. // Create the list of operands.
  3421. //
  3422. glslang::TIntermSequence& glslangOperands = node->getSequence();
  3423. std::vector<spv::Id> operands;
  3424. std::vector<spv::IdImmediate> memoryAccessOperands;
  3425. for (int arg = 0; arg < (int)glslangOperands.size(); ++arg) {
  3426. // special case l-value operands; there are just a few
  3427. bool lvalue = false;
  3428. switch (node->getOp()) {
  3429. case glslang::EOpModf:
  3430. if (arg == 1)
  3431. lvalue = true;
  3432. break;
  3433. case glslang::EOpHitObjectRecordFromQueryEXT:
  3434. case glslang::EOpHitObjectGetIntersectionTriangleVertexPositionsEXT:
  3435. if (arg == 0 || arg == 1)
  3436. lvalue = true;
  3437. break;
  3438. case glslang::EOpHitObjectRecordHitNV:
  3439. case glslang::EOpHitObjectRecordHitMotionNV:
  3440. case glslang::EOpHitObjectRecordHitWithIndexNV:
  3441. case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
  3442. case glslang::EOpHitObjectTraceRayNV:
  3443. case glslang::EOpHitObjectTraceRayMotionNV:
  3444. case glslang::EOpHitObjectExecuteShaderNV:
  3445. case glslang::EOpHitObjectRecordMissNV:
  3446. case glslang::EOpHitObjectRecordMissMotionNV:
  3447. case glslang::EOpHitObjectGetAttributesNV:
  3448. case glslang::EOpHitObjectGetClusterIdNV:
  3449. case glslang::EOpHitObjectTraceRayEXT:
  3450. case glslang::EOpHitObjectTraceRayMotionEXT:
  3451. case glslang::EOpHitObjectExecuteShaderEXT:
  3452. case glslang::EOpHitObjectRecordMissEXT:
  3453. case glslang::EOpHitObjectRecordMissMotionEXT:
  3454. case glslang::EOpHitObjectGetAttributesEXT:
  3455. case glslang::EOpHitObjectSetShaderBindingTableRecordIndexEXT:
  3456. case glslang::EOpHitObjectReorderExecuteEXT:
  3457. case glslang::EOpHitObjectTraceReorderExecuteEXT:
  3458. case glslang::EOpHitObjectTraceMotionReorderExecuteEXT:
  3459. if (arg == 0)
  3460. lvalue = true;
  3461. break;
  3462. case glslang::EOpHitObjectGetLSSPositionsNV:
  3463. case glslang::EOpHitObjectGetLSSRadiiNV:
  3464. lvalue = true;
  3465. break;
  3466. case glslang::EOpRayQueryInitialize:
  3467. case glslang::EOpRayQueryTerminate:
  3468. case glslang::EOpRayQueryConfirmIntersection:
  3469. case glslang::EOpRayQueryProceed:
  3470. case glslang::EOpRayQueryGenerateIntersection:
  3471. case glslang::EOpRayQueryGetIntersectionType:
  3472. case glslang::EOpRayQueryGetIntersectionT:
  3473. case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
  3474. case glslang::EOpRayQueryGetIntersectionInstanceId:
  3475. case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
  3476. case glslang::EOpRayQueryGetIntersectionGeometryIndex:
  3477. case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
  3478. case glslang::EOpRayQueryGetIntersectionBarycentrics:
  3479. case glslang::EOpRayQueryGetIntersectionFrontFace:
  3480. case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
  3481. case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
  3482. case glslang::EOpRayQueryGetIntersectionObjectToWorld:
  3483. case glslang::EOpRayQueryGetIntersectionWorldToObject:
  3484. case glslang::EOpRayQueryGetIntersectionClusterIdNV:
  3485. case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
  3486. case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
  3487. case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
  3488. case glslang::EOpRayQueryIsSphereHitNV:
  3489. case glslang::EOpRayQueryIsLSSHitNV:
  3490. if (arg == 0)
  3491. lvalue = true;
  3492. break;
  3493. case glslang::EOpAtomicAdd:
  3494. case glslang::EOpAtomicSubtract:
  3495. case glslang::EOpAtomicMin:
  3496. case glslang::EOpAtomicMax:
  3497. case glslang::EOpAtomicAnd:
  3498. case glslang::EOpAtomicOr:
  3499. case glslang::EOpAtomicXor:
  3500. case glslang::EOpAtomicExchange:
  3501. case glslang::EOpAtomicCompSwap:
  3502. if (arg == 0)
  3503. lvalue = true;
  3504. break;
  3505. case glslang::EOpFrexp:
  3506. if (arg == 1)
  3507. lvalue = true;
  3508. break;
  3509. case glslang::EOpInterpolateAtSample:
  3510. case glslang::EOpInterpolateAtOffset:
  3511. case glslang::EOpInterpolateAtVertex:
  3512. if (arg == 0) {
  3513. // If GLSL, use the address of the interpolant argument.
  3514. // If HLSL, use an internal version of OpInterpolates that takes
  3515. // the rvalue of the interpolant. A fixup pass in spirv-opt
  3516. // legalization will remove the OpLoad and convert to an lvalue.
  3517. // Had to do this because legalization will only propagate a
  3518. // builtin into an rvalue.
  3519. lvalue = glslangIntermediate->getSource() != glslang::EShSourceHlsl;
  3520. // Does it need a swizzle inversion? If so, evaluation is inverted;
  3521. // operate first on the swizzle base, then apply the swizzle.
  3522. // That is, we transform
  3523. //
  3524. // interpolate(v.zy) -> interpolate(v).zy
  3525. //
  3526. if (glslangOperands[0]->getAsOperator() &&
  3527. glslangOperands[0]->getAsOperator()->getOp() == glslang::EOpVectorSwizzle)
  3528. invertedType = convertGlslangToSpvType(
  3529. glslangOperands[0]->getAsBinaryNode()->getLeft()->getType());
  3530. }
  3531. break;
  3532. case glslang::EOpAtomicLoad:
  3533. case glslang::EOpAtomicStore:
  3534. case glslang::EOpAtomicCounterAdd:
  3535. case glslang::EOpAtomicCounterSubtract:
  3536. case glslang::EOpAtomicCounterMin:
  3537. case glslang::EOpAtomicCounterMax:
  3538. case glslang::EOpAtomicCounterAnd:
  3539. case glslang::EOpAtomicCounterOr:
  3540. case glslang::EOpAtomicCounterXor:
  3541. case glslang::EOpAtomicCounterExchange:
  3542. case glslang::EOpAtomicCounterCompSwap:
  3543. if (arg == 0)
  3544. lvalue = true;
  3545. break;
  3546. case glslang::EOpAddCarry:
  3547. case glslang::EOpSubBorrow:
  3548. if (arg == 2)
  3549. lvalue = true;
  3550. break;
  3551. case glslang::EOpUMulExtended:
  3552. case glslang::EOpIMulExtended:
  3553. if (arg >= 2)
  3554. lvalue = true;
  3555. break;
  3556. case glslang::EOpCooperativeMatrixLoad:
  3557. case glslang::EOpCooperativeMatrixLoadNV:
  3558. case glslang::EOpCooperativeMatrixLoadTensorNV:
  3559. case glslang::EOpCooperativeVectorLoadNV:
  3560. if (arg == 0 || arg == 1)
  3561. lvalue = true;
  3562. break;
  3563. case glslang::EOpCooperativeMatrixStore:
  3564. case glslang::EOpCooperativeMatrixStoreNV:
  3565. case glslang::EOpCooperativeMatrixStoreTensorNV:
  3566. case glslang::EOpCooperativeVectorStoreNV:
  3567. if (arg == 1)
  3568. lvalue = true;
  3569. break;
  3570. case glslang::EOpCooperativeVectorMatMulNV:
  3571. if (arg == 0 || arg == 3)
  3572. lvalue = true;
  3573. break;
  3574. case glslang::EOpCooperativeVectorMatMulAddNV:
  3575. if (arg == 0 || arg == 3 || arg == 6)
  3576. lvalue = true;
  3577. break;
  3578. case glslang::EOpCooperativeVectorOuterProductAccumulateNV:
  3579. if (arg == 2)
  3580. lvalue = true;
  3581. break;
  3582. case glslang::EOpCooperativeVectorReduceSumAccumulateNV:
  3583. if (arg == 1)
  3584. lvalue = true;
  3585. break;
  3586. case glslang::EOpCooperativeMatrixReduceNV:
  3587. case glslang::EOpCooperativeMatrixPerElementOpNV:
  3588. case glslang::EOpCooperativeMatrixTransposeNV:
  3589. if (arg == 0)
  3590. lvalue = true;
  3591. break;
  3592. case glslang::EOpSpirvInst:
  3593. if (glslangOperands[arg]->getAsTyped()->getQualifier().isSpirvByReference())
  3594. lvalue = true;
  3595. break;
  3596. case glslang::EOpReorderThreadNV:
  3597. case glslang::EOpReorderThreadEXT:
  3598. //Three variants of reorderThreadNV, two of them use hitObjectNV
  3599. if (arg == 0 && glslangOperands.size() != 2)
  3600. lvalue = true;
  3601. break;
  3602. case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
  3603. case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
  3604. case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
  3605. if (arg == 0 || arg == 2)
  3606. lvalue = true;
  3607. break;
  3608. case glslang::EOpTensorReadARM:
  3609. if (arg == 2)
  3610. lvalue = true;
  3611. break;
  3612. default:
  3613. break;
  3614. }
  3615. builder.clearAccessChain();
  3616. if (invertedType != spv::NoType && arg == 0)
  3617. glslangOperands[0]->getAsBinaryNode()->getLeft()->traverse(this);
  3618. else
  3619. glslangOperands[arg]->traverse(this);
  3620. bool isCoopMat = node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  3621. node->getOp() == glslang::EOpCooperativeMatrixStore ||
  3622. node->getOp() == glslang::EOpCooperativeMatrixLoadNV ||
  3623. node->getOp() == glslang::EOpCooperativeMatrixStoreNV ||
  3624. node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV ||
  3625. node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV;
  3626. bool isCoopVec = node->getOp() == glslang::EOpCooperativeVectorLoadNV ||
  3627. node->getOp() == glslang::EOpCooperativeVectorStoreNV;
  3628. if (isCoopMat || isCoopVec) {
  3629. if (arg == 1) {
  3630. spv::Builder::AccessChain::CoherentFlags coherentFlags {};
  3631. unsigned int alignment {};
  3632. if (isCoopMat) {
  3633. // fold "element" parameter into the access chain
  3634. spv::Builder::AccessChain save = builder.getAccessChain();
  3635. builder.clearAccessChain();
  3636. glslangOperands[2]->traverse(this);
  3637. spv::Id elementId = accessChainLoad(glslangOperands[2]->getAsTyped()->getType());
  3638. builder.setAccessChain(save);
  3639. // Point to the first element of the array.
  3640. builder.accessChainPush(elementId,
  3641. TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType()),
  3642. glslangOperands[arg]->getAsTyped()->getType().getBufferReferenceAlignment());
  3643. coherentFlags = builder.getAccessChain().coherentFlags;
  3644. alignment = builder.getAccessChain().alignment;
  3645. } else {
  3646. coherentFlags = builder.getAccessChain().coherentFlags;
  3647. coherentFlags |= TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType());
  3648. alignment = 16;
  3649. }
  3650. spv::MemoryAccessMask memoryAccess = TranslateMemoryAccess(coherentFlags);
  3651. if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  3652. node->getOp() == glslang::EOpCooperativeMatrixLoadNV ||
  3653. node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV ||
  3654. node->getOp() == glslang::EOpCooperativeVectorLoadNV)
  3655. memoryAccess = (memoryAccess & ~spv::MemoryAccessMask::MakePointerAvailableKHR);
  3656. if (node->getOp() == glslang::EOpCooperativeMatrixStore ||
  3657. node->getOp() == glslang::EOpCooperativeMatrixStoreNV ||
  3658. node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV ||
  3659. node->getOp() == glslang::EOpCooperativeVectorStoreNV)
  3660. memoryAccess = (memoryAccess & ~spv::MemoryAccessMask::MakePointerVisibleKHR);
  3661. if (builder.getStorageClass(builder.getAccessChain().base) ==
  3662. spv::StorageClass::PhysicalStorageBufferEXT) {
  3663. memoryAccess = (spv::MemoryAccessMask)(memoryAccess | spv::MemoryAccessMask::Aligned);
  3664. }
  3665. memoryAccessOperands.push_back(spv::IdImmediate(false, memoryAccess));
  3666. if (anySet(memoryAccess, spv::MemoryAccessMask::Aligned)) {
  3667. memoryAccessOperands.push_back(spv::IdImmediate(false, alignment));
  3668. }
  3669. if (anySet(memoryAccess,
  3670. spv::MemoryAccessMask::MakePointerAvailableKHR | spv::MemoryAccessMask::MakePointerVisibleKHR)) {
  3671. memoryAccessOperands.push_back(spv::IdImmediate(true,
  3672. builder.makeUintConstant(TranslateMemoryScope(coherentFlags))));
  3673. }
  3674. } else if (isCoopMat && arg == 2) {
  3675. continue;
  3676. }
  3677. }
  3678. // for l-values, pass the address, for r-values, pass the value
  3679. if (lvalue) {
  3680. if (invertedType == spv::NoType && !builder.isSpvLvalue()) {
  3681. // SPIR-V cannot represent an l-value containing a swizzle that doesn't
  3682. // reduce to a simple access chain. So, we need a temporary vector to
  3683. // receive the result, and must later swizzle that into the original
  3684. // l-value.
  3685. complexLvalues.push_back(builder.getAccessChain());
  3686. temporaryLvalues.push_back(builder.createVariable(
  3687. spv::NoPrecision, spv::StorageClass::Function,
  3688. builder.accessChainGetInferredType(), "swizzleTemp"));
  3689. operands.push_back(temporaryLvalues.back());
  3690. } else {
  3691. operands.push_back(builder.accessChainGetLValue());
  3692. }
  3693. lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
  3694. lvalueCoherentFlags |= TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType());
  3695. } else {
  3696. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3697. glslang::TOperator glslangOp = node->getOp();
  3698. if (arg == 1 &&
  3699. (glslangOp == glslang::EOpRayQueryGetIntersectionType ||
  3700. glslangOp == glslang::EOpRayQueryGetIntersectionT ||
  3701. glslangOp == glslang::EOpRayQueryGetIntersectionInstanceCustomIndex ||
  3702. glslangOp == glslang::EOpRayQueryGetIntersectionInstanceId ||
  3703. glslangOp == glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset ||
  3704. glslangOp == glslang::EOpRayQueryGetIntersectionGeometryIndex ||
  3705. glslangOp == glslang::EOpRayQueryGetIntersectionPrimitiveIndex ||
  3706. glslangOp == glslang::EOpRayQueryGetIntersectionBarycentrics ||
  3707. glslangOp == glslang::EOpRayQueryGetIntersectionFrontFace ||
  3708. glslangOp == glslang::EOpRayQueryGetIntersectionObjectRayDirection ||
  3709. glslangOp == glslang::EOpRayQueryGetIntersectionObjectRayOrigin ||
  3710. glslangOp == glslang::EOpRayQueryGetIntersectionObjectToWorld ||
  3711. glslangOp == glslang::EOpRayQueryGetIntersectionWorldToObject ||
  3712. glslangOp == glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT ||
  3713. glslangOp == glslang::EOpRayQueryGetIntersectionClusterIdNV ||
  3714. glslangOp == glslang::EOpRayQueryGetIntersectionSpherePositionNV ||
  3715. glslangOp == glslang::EOpRayQueryGetIntersectionSphereRadiusNV ||
  3716. glslangOp == glslang::EOpRayQueryGetIntersectionLSSHitValueNV ||
  3717. glslangOp == glslang::EOpRayQueryGetIntersectionLSSPositionsNV ||
  3718. glslangOp == glslang::EOpRayQueryGetIntersectionLSSRadiiNV ||
  3719. glslangOp == glslang::EOpRayQueryIsLSSHitNV ||
  3720. glslangOp == glslang::EOpRayQueryIsSphereHitNV
  3721. )) {
  3722. bool cond = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getBConst();
  3723. operands.push_back(builder.makeIntConstant(cond ? 1 : 0));
  3724. } else if ((arg == 10 && glslangOp == glslang::EOpTraceKHR) ||
  3725. (arg == 11 && glslangOp == glslang::EOpTraceRayMotionNV) ||
  3726. (arg == 1 && glslangOp == glslang::EOpExecuteCallableKHR) ||
  3727. (arg == 1 && glslangOp == glslang::EOpHitObjectExecuteShaderNV) ||
  3728. (arg == 1 && glslangOp == glslang::EOpHitObjectExecuteShaderEXT) ||
  3729. (arg == 11 && glslangOp == glslang::EOpHitObjectTraceRayNV) ||
  3730. (arg == 11 && glslangOp == glslang::EOpHitObjectTraceRayEXT) ||
  3731. (arg == 12 && glslangOp == glslang::EOpHitObjectTraceRayMotionNV) ||
  3732. (arg == 12 && glslangOp == glslang::EOpHitObjectTraceRayMotionEXT) ||
  3733. (arg == 12 && glslangOp == glslang::EOpHitObjectTraceMotionReorderExecuteEXT && glslangOperands.size() == 13) ||
  3734. (arg == 14 && glslangOp == glslang::EOpHitObjectTraceMotionReorderExecuteEXT && glslangOperands.size() == 15) ||
  3735. (arg == 11 && glslangOp == glslang::EOpHitObjectTraceReorderExecuteEXT && glslangOperands.size() == 12) ||
  3736. (arg == 13 && glslangOp == glslang::EOpHitObjectTraceReorderExecuteEXT && glslangOperands.size() == 14) ||
  3737. (arg == 1 && glslangOp == glslang::EOpHitObjectReorderExecuteEXT && glslangOperands.size() == 2) ||
  3738. (arg == 3 && glslangOp == glslang::EOpHitObjectReorderExecuteEXT && glslangOperands.size() == 4)) {
  3739. const int set = glslangOp == glslang::EOpExecuteCallableKHR ? 1 : 0;
  3740. const int location = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getUConst();
  3741. auto itNode = locationToSymbol[set].find(location);
  3742. visitSymbol(itNode->second);
  3743. spv::Id symId = getSymbolId(itNode->second);
  3744. operands.push_back(symId);
  3745. } else if ((arg == 12 && glslangOp == glslang::EOpHitObjectRecordHitNV) ||
  3746. (arg == 13 && glslangOp == glslang::EOpHitObjectRecordHitMotionNV) ||
  3747. (arg == 11 && glslangOp == glslang::EOpHitObjectRecordHitWithIndexNV) ||
  3748. (arg == 12 && glslangOp == glslang::EOpHitObjectRecordHitWithIndexMotionNV) ||
  3749. (arg == 3 && glslangOp == glslang::EOpHitObjectRecordFromQueryEXT) ||
  3750. (arg == 1 && glslangOp == glslang::EOpHitObjectGetAttributesEXT) ||
  3751. (arg == 1 && glslangOp == glslang::EOpHitObjectGetAttributesNV)) {
  3752. const int location = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getUConst();
  3753. const int set = 2;
  3754. auto itNode = locationToSymbol[set].find(location);
  3755. visitSymbol(itNode->second);
  3756. spv::Id symId = getSymbolId(itNode->second);
  3757. operands.push_back(symId);
  3758. } else if (glslangOperands[arg]->getAsTyped()->getQualifier().isSpirvLiteral()) {
  3759. // Will be translated to a literal value, make a placeholder here
  3760. operands.push_back(spv::NoResult);
  3761. } else if (glslangOperands[arg]->getAsTyped()->getBasicType() == glslang::EbtFunction) {
  3762. spv::Function* function = functionMap[glslangOperands[arg]->getAsSymbolNode()->getMangledName().c_str()];
  3763. assert(function);
  3764. operands.push_back(function->getId());
  3765. } else {
  3766. operands.push_back(accessChainLoad(glslangOperands[arg]->getAsTyped()->getType()));
  3767. }
  3768. }
  3769. }
  3770. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3771. if (node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV) {
  3772. std::vector<spv::IdImmediate> idImmOps;
  3773. builder.addCapability(spv::Capability::CooperativeMatrixTensorAddressingNV);
  3774. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3775. spv::Id object = builder.createLoad(operands[0], spv::NoPrecision);
  3776. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // Pointer
  3777. idImmOps.push_back(spv::IdImmediate(true, object)); // Object
  3778. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // tensorLayout
  3779. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end()); // memoryaccess
  3780. // initialize tensor operands to zero, then OR in flags based on the operands
  3781. size_t tensorOpIdx = idImmOps.size();
  3782. idImmOps.push_back(spv::IdImmediate(false, 0));
  3783. for (uint32_t i = 3; i < operands.size(); ++i) {
  3784. if (builder.isTensorView(operands[i])) {
  3785. addMask(idImmOps[tensorOpIdx].word, spv::TensorAddressingOperandsMask::TensorView);
  3786. } else {
  3787. // must be the decode func
  3788. addMask(idImmOps[tensorOpIdx].word, spv::TensorAddressingOperandsMask::DecodeFunc);
  3789. builder.addCapability(spv::Capability::CooperativeMatrixBlockLoadsNV);
  3790. }
  3791. idImmOps.push_back(spv::IdImmediate(true, operands[i])); // tensorView or decodeFunc
  3792. }
  3793. // get the pointee type
  3794. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3795. assert(builder.isCooperativeMatrixType(typeId));
  3796. // do the op
  3797. spv::Id result = builder.createOp(spv::Op::OpCooperativeMatrixLoadTensorNV, typeId, idImmOps);
  3798. // store the result to the pointer (out param 'm')
  3799. builder.createStore(result, operands[0]);
  3800. result = 0;
  3801. } else if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  3802. node->getOp() == glslang::EOpCooperativeMatrixLoadNV) {
  3803. std::vector<spv::IdImmediate> idImmOps;
  3804. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3805. if (node->getOp() == glslang::EOpCooperativeMatrixLoad) {
  3806. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // matrixLayout
  3807. auto layout = (spv::CooperativeMatrixLayout)builder.getConstantScalar(operands[3]);
  3808. if (layout == spv::CooperativeMatrixLayout::RowBlockedInterleavedARM ||
  3809. layout == spv::CooperativeMatrixLayout::ColumnBlockedInterleavedARM) {
  3810. builder.addExtension(spv::E_SPV_ARM_cooperative_matrix_layouts);
  3811. builder.addCapability(spv::Capability::CooperativeMatrixLayoutsARM);
  3812. }
  3813. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3814. } else {
  3815. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3816. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor
  3817. }
  3818. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  3819. // get the pointee type
  3820. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3821. assert(builder.isCooperativeMatrixType(typeId));
  3822. // do the op
  3823. spv::Id result = node->getOp() == glslang::EOpCooperativeMatrixLoad
  3824. ? builder.createOp(spv::Op::OpCooperativeMatrixLoadKHR, typeId, idImmOps)
  3825. : builder.createOp(spv::Op::OpCooperativeMatrixLoadNV, typeId, idImmOps);
  3826. // store the result to the pointer (out param 'm')
  3827. builder.createStore(result, operands[0]);
  3828. result = 0;
  3829. } else if (node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV) {
  3830. std::vector<spv::IdImmediate> idImmOps;
  3831. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3832. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  3833. builder.addCapability(spv::Capability::CooperativeMatrixTensorAddressingNV);
  3834. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3835. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // tensorLayout
  3836. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end()); // memoryaccess
  3837. if (operands.size() > 3) {
  3838. idImmOps.push_back(spv::IdImmediate(false, spv::TensorAddressingOperandsMask::TensorView));
  3839. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // tensorView
  3840. } else {
  3841. idImmOps.push_back(spv::IdImmediate(false, 0));
  3842. }
  3843. builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreTensorNV, idImmOps);
  3844. result = 0;
  3845. } else if (node->getOp() == glslang::EOpCooperativeMatrixStore ||
  3846. node->getOp() == glslang::EOpCooperativeMatrixStoreNV) {
  3847. std::vector<spv::IdImmediate> idImmOps;
  3848. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3849. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  3850. if (node->getOp() == glslang::EOpCooperativeMatrixStore) {
  3851. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // matrixLayout
  3852. auto layout = (spv::CooperativeMatrixLayout)builder.getConstantScalar(operands[3]);
  3853. if (layout == spv::CooperativeMatrixLayout::RowBlockedInterleavedARM ||
  3854. layout == spv::CooperativeMatrixLayout::ColumnBlockedInterleavedARM) {
  3855. builder.addExtension(spv::E_SPV_ARM_cooperative_matrix_layouts);
  3856. builder.addCapability(spv::Capability::CooperativeMatrixLayoutsARM);
  3857. }
  3858. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3859. } else {
  3860. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3861. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor
  3862. }
  3863. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  3864. if (node->getOp() == glslang::EOpCooperativeMatrixStore)
  3865. builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreKHR, idImmOps);
  3866. else
  3867. builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreNV, idImmOps);
  3868. result = 0;
  3869. } else if (node->getOp() == glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT) {
  3870. std::vector<spv::IdImmediate> idImmOps;
  3871. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
  3872. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
  3873. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  3874. builder.makeUintConstant(3), 0);
  3875. // do the op
  3876. spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionTriangleVertexPositionsKHR;
  3877. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3878. // store the result to the pointer (out param 'm')
  3879. builder.createStore(result, operands[2]);
  3880. result = 0;
  3881. } else if (node->getOp() == glslang::EOpRayQueryGetIntersectionLSSPositionsNV) {
  3882. std::vector<spv::IdImmediate> idImmOps;
  3883. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
  3884. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
  3885. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  3886. builder.makeUintConstant(2), 0);
  3887. // do the op
  3888. spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionLSSPositionsNV;
  3889. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3890. // store the result to the pointer (out param 'm')
  3891. builder.createStore(result, operands[2]);
  3892. result = 0;
  3893. } else if (node->getOp() == glslang::EOpRayQueryGetIntersectionLSSRadiiNV) {
  3894. std::vector<spv::IdImmediate> idImmOps;
  3895. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
  3896. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
  3897. spv::Id typeId = builder.makeArrayType(builder.makeFloatType(32),
  3898. builder.makeUintConstant(2), 0);
  3899. // do the op
  3900. spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionLSSRadiiNV;
  3901. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3902. // store the result to the pointer (out param 'm')
  3903. builder.createStore(result, operands[2]);
  3904. result = 0;
  3905. } else if (node->getOp() == glslang::EOpHitObjectGetLSSPositionsNV) {
  3906. std::vector<spv::IdImmediate> idImmOps;
  3907. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
  3908. spv::Op spvOp = spv::Op::OpHitObjectGetLSSPositionsNV;
  3909. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  3910. builder.makeUintConstant(2), 0);
  3911. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3912. // store the result to the pointer (out param 'm')
  3913. builder.createStore(result, operands[1]);
  3914. result = 0;
  3915. } else if (node->getOp() == glslang::EOpHitObjectGetLSSRadiiNV) {
  3916. std::vector<spv::IdImmediate> idImmOps;
  3917. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
  3918. spv::Op spvOp = spv::Op::OpHitObjectGetLSSRadiiNV;
  3919. spv::Id typeId = builder.makeArrayType(builder.makeFloatType(32),
  3920. builder.makeUintConstant(2), 0);
  3921. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3922. // store the result to the pointer (out param 'm')
  3923. builder.createStore(result, operands[1]);
  3924. result = 0;
  3925. } else if (node->getOp() == glslang::EOpHitObjectGetIntersectionTriangleVertexPositionsEXT) {
  3926. std::vector<spv::IdImmediate> idImmOps;
  3927. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
  3928. spv::Op spvOp = spv::Op::OpHitObjectGetIntersectionTriangleVertexPositionsEXT;
  3929. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  3930. builder.makeUintConstant(3), 0);
  3931. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3932. // store the result to the pointer (out param 'm')
  3933. builder.createStore(result, operands[1]);
  3934. result = 0;
  3935. } else if (node->getOp() == glslang::EOpCooperativeMatrixMulAdd) {
  3936. auto matrixOperands = spv::CooperativeMatrixOperandsMask::MaskNone;
  3937. // If the optional operand is present, initialize matrixOperands to that value.
  3938. if (glslangOperands.size() == 4 && glslangOperands[3]->getAsConstantUnion()) {
  3939. matrixOperands = (spv::CooperativeMatrixOperandsMask)glslangOperands[3]->getAsConstantUnion()->getConstArray()[0].getIConst();
  3940. }
  3941. // Determine Cooperative Matrix Operands bits from the signedness of the types.
  3942. if (isTypeSignedInt(glslangOperands[0]->getAsTyped()->getBasicType()))
  3943. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixASignedComponentsKHR);
  3944. if (isTypeSignedInt(glslangOperands[1]->getAsTyped()->getBasicType()))
  3945. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixBSignedComponentsKHR);
  3946. if (isTypeSignedInt(glslangOperands[2]->getAsTyped()->getBasicType()))
  3947. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixCSignedComponentsKHR);
  3948. if (isTypeSignedInt(node->getBasicType()))
  3949. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixResultSignedComponentsKHR);
  3950. std::vector<spv::IdImmediate> idImmOps;
  3951. idImmOps.push_back(spv::IdImmediate(true, operands[0]));
  3952. idImmOps.push_back(spv::IdImmediate(true, operands[1]));
  3953. idImmOps.push_back(spv::IdImmediate(true, operands[2]));
  3954. if (matrixOperands != spv::CooperativeMatrixOperandsMask::MaskNone)
  3955. idImmOps.push_back(spv::IdImmediate(false, matrixOperands));
  3956. result = builder.createOp(spv::Op::OpCooperativeMatrixMulAddKHR, resultType(), idImmOps);
  3957. } else if (node->getOp() == glslang::EOpCooperativeMatrixReduceNV) {
  3958. builder.addCapability(spv::Capability::CooperativeMatrixReductionsNV);
  3959. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3960. spv::Op opcode = spv::Op::OpCooperativeMatrixReduceNV;
  3961. unsigned mask = glslangOperands[2]->getAsConstantUnion()->getConstArray()[0].getUConst();
  3962. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3963. assert(builder.isCooperativeMatrixType(typeId));
  3964. result = builder.createCooperativeMatrixReduce(opcode, typeId, operands[1], mask, operands[3]);
  3965. // store the result to the pointer (out param 'm')
  3966. builder.createStore(result, operands[0]);
  3967. result = 0;
  3968. } else if (node->getOp() == glslang::EOpCooperativeMatrixPerElementOpNV) {
  3969. builder.addCapability(spv::Capability::CooperativeMatrixPerElementOperationsNV);
  3970. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3971. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3972. assert(builder.isCooperativeMatrixType(typeId));
  3973. result = builder.createCooperativeMatrixPerElementOp(typeId, operands);
  3974. // store the result to the pointer
  3975. builder.createStore(result, operands[0]);
  3976. result = 0;
  3977. } else if (node->getOp() == glslang::EOpCooperativeMatrixTransposeNV) {
  3978. builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
  3979. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3980. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3981. assert(builder.isCooperativeMatrixType(typeId));
  3982. result = builder.createUnaryOp(spv::Op::OpCooperativeMatrixTransposeNV, typeId, operands[1]);
  3983. // store the result to the pointer
  3984. builder.createStore(result, operands[0]);
  3985. result = 0;
  3986. } else if (node->getOp() == glslang::EOpBitCastArrayQCOM) {
  3987. builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
  3988. builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
  3989. result = builder.createUnaryOp(spv::Op::OpBitCastArrayQCOM, resultType(), operands[0]);
  3990. } else if (node->getOp() == glslang::EOpCompositeConstructCoopMatQCOM) {
  3991. builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
  3992. builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
  3993. result = builder.createUnaryOp(spv::Op::OpCompositeConstructCoopMatQCOM, resultType(), operands[0]);
  3994. } else if (node->getOp() == glslang::EOpCompositeExtractCoopMatQCOM) {
  3995. builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
  3996. builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
  3997. result = builder.createUnaryOp(spv::Op::OpCompositeExtractCoopMatQCOM, resultType(), operands[0]);
  3998. } else if (node->getOp() == glslang::EOpExtractSubArrayQCOM) {
  3999. builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
  4000. builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
  4001. std::vector<spv::Id> arguments { operands[0], operands[1] };;
  4002. result = builder.createOp(spv::Op::OpExtractSubArrayQCOM, resultType(), arguments);
  4003. } else if (node->getOp() == glslang::EOpCooperativeVectorMatMulNV ||
  4004. node->getOp() == glslang::EOpCooperativeVectorMatMulAddNV) {
  4005. auto matrixOperands = spv::CooperativeMatrixOperandsMask::MaskNone;
  4006. bool isMulAdd = node->getOp() == glslang::EOpCooperativeVectorMatMulAddNV;
  4007. // Determine Cooperative Matrix Operands bits from the signedness of the types.
  4008. if (isTypeSignedInt(glslangOperands[1]->getAsTyped()->getBasicType()))
  4009. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixBSignedComponentsKHR);
  4010. if (isTypeSignedInt(glslangOperands[0]->getAsTyped()->getBasicType()))
  4011. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixResultSignedComponentsKHR);
  4012. uint32_t opIdx = 1;
  4013. std::vector<spv::IdImmediate> idImmOps;
  4014. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Input
  4015. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // InputInterpretation
  4016. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Matrix
  4017. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixOffset
  4018. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixInterpretation
  4019. if (isMulAdd) {
  4020. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Bias
  4021. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // BiasOffset
  4022. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // BiasInterpretation
  4023. }
  4024. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // M
  4025. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // K
  4026. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MemoryLayout
  4027. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Transpose
  4028. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixStride
  4029. if (matrixOperands != spv::CooperativeMatrixOperandsMask::MaskNone)
  4030. idImmOps.push_back(spv::IdImmediate(false, matrixOperands)); // Cooperative Matrix Operands
  4031. // get the pointee type
  4032. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  4033. assert(builder.isCooperativeVectorType(typeId));
  4034. // do the op
  4035. spv::Id result = builder.createOp(isMulAdd ? spv::Op::OpCooperativeVectorMatrixMulAddNV : spv::Op::OpCooperativeVectorMatrixMulNV, typeId, idImmOps);
  4036. // store the result to the pointer (out param 'res')
  4037. builder.createStore(result, operands[0]);
  4038. result = 0;
  4039. } else if (node->getOp() == glslang::EOpCooperativeVectorLoadNV) {
  4040. std::vector<spv::IdImmediate> idImmOps;
  4041. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  4042. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // offset
  4043. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  4044. // get the pointee type
  4045. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  4046. assert(builder.isCooperativeVectorType(typeId));
  4047. // do the op
  4048. spv::Id result = builder.createOp(spv::Op::OpCooperativeVectorLoadNV, typeId, idImmOps);
  4049. // store the result to the pointer (out param 'v')
  4050. builder.createStore(result, operands[0]);
  4051. result = 0;
  4052. } else if (node->getOp() == glslang::EOpCooperativeVectorStoreNV) {
  4053. std::vector<spv::IdImmediate> idImmOps;
  4054. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  4055. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // offset
  4056. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  4057. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  4058. builder.createNoResultOp(spv::Op::OpCooperativeVectorStoreNV, idImmOps);
  4059. result = 0;
  4060. } else if (node->getOp() == glslang::EOpCooperativeVectorOuterProductAccumulateNV) {
  4061. builder.addCapability(spv::Capability::CooperativeVectorTrainingNV);
  4062. builder.addExtension(spv::E_SPV_NV_cooperative_vector);
  4063. std::vector<spv::IdImmediate> idImmOps;
  4064. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // Matrix
  4065. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // Offset
  4066. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // A
  4067. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // B
  4068. idImmOps.push_back(spv::IdImmediate(true, operands[5])); // MemoryLayout
  4069. idImmOps.push_back(spv::IdImmediate(true, operands[6])); // MatrixInterpretation
  4070. idImmOps.push_back(spv::IdImmediate(true, operands[4])); // Stride
  4071. builder.createNoResultOp(spv::Op::OpCooperativeVectorOuterProductAccumulateNV, idImmOps);
  4072. result = 0;
  4073. } else if (node->getOp() == glslang::EOpCooperativeVectorReduceSumAccumulateNV) {
  4074. builder.addCapability(spv::Capability::CooperativeVectorTrainingNV);
  4075. builder.addExtension(spv::E_SPV_NV_cooperative_vector);
  4076. std::vector<spv::IdImmediate> idImmOps;
  4077. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // Buf
  4078. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // Offset
  4079. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // A
  4080. builder.createNoResultOp(spv::Op::OpCooperativeVectorReduceSumAccumulateNV, idImmOps);
  4081. result = 0;
  4082. } else if (node->getOp() == glslang::EOpTensorReadARM ||
  4083. node->getOp() == glslang::EOpTensorWriteARM) {
  4084. const bool isWrite = node->getOp() == glslang::EOpTensorWriteARM;
  4085. const unsigned int tensorMinOperandCount = 3;
  4086. assert(operands.size() >= tensorMinOperandCount);
  4087. std::vector<spv::IdImmediate> idImmOps;
  4088. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // tensor
  4089. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // coords
  4090. if (isWrite) {
  4091. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // value
  4092. }
  4093. // Analyze the tensor operands
  4094. spv::IdImmediate tensorOperands = { false, uint32_t(spv::TensorOperandsMask::MaskNone) };
  4095. bool pushExtraArg = false;
  4096. if (operands.size() > tensorMinOperandCount) {
  4097. auto enumVal = builder.getConstantScalar(operands[tensorMinOperandCount]);
  4098. if (enumVal & uint32_t(spv::TensorOperandsMask::NontemporalARM)) {
  4099. tensorOperands.word |= uint32_t(spv::TensorOperandsMask::NontemporalARM);
  4100. }
  4101. if (enumVal & uint32_t(spv::TensorOperandsMask::OutOfBoundsValueARM)) {
  4102. tensorOperands.word |= uint32_t(spv::TensorOperandsMask::OutOfBoundsValueARM);
  4103. assert(operands.size() >= tensorMinOperandCount + 2 &&
  4104. "TensorOperandsOutOfBoundsValueMask requires an additional value");
  4105. pushExtraArg = true;
  4106. }
  4107. }
  4108. // Append optional tensor operands if the mask was non-zero.
  4109. if (tensorOperands.word) {
  4110. idImmOps.push_back(tensorOperands);
  4111. if (pushExtraArg)
  4112. idImmOps.push_back(spv::IdImmediate(true, operands[tensorMinOperandCount + 1]));
  4113. }
  4114. if (isWrite) {
  4115. builder.createNoResultOp(spv::Op::OpTensorWriteARM, idImmOps);
  4116. result = 0;
  4117. } else {
  4118. // Use the result argument type as the OpTensorReadARM result type.
  4119. const glslang::TType &resArgType = glslangOperands[2]->getAsTyped()->getType();
  4120. spv::Id retType = convertGlslangToSpvType(resArgType);
  4121. result = builder.createOp(spv::Op::OpTensorReadARM, retType, idImmOps);
  4122. // Store the result to the result argument.
  4123. builder.createStore(result, operands[2]);
  4124. }
  4125. } else if (node->getOp() == glslang::EOpTensorSizeARM) {
  4126. // Expected operands are (tensor, dimension)
  4127. assert(operands.size() == 2);
  4128. spv::Id tensorOp = operands[0];
  4129. spv::Id dimOp = operands[1];
  4130. assert(builder.isTensorTypeARM(builder.getTypeId(tensorOp)) && "operand #0 must be a tensor");
  4131. std::vector<spv::IdImmediate> idImmOps;
  4132. idImmOps.push_back(spv::IdImmediate(true, tensorOp));
  4133. idImmOps.push_back(spv::IdImmediate(true, dimOp));
  4134. result = builder.createOp(spv::Op::OpTensorQuerySizeARM, resultType(), idImmOps);
  4135. } else if (atomic) {
  4136. // Handle all atomics
  4137. glslang::TBasicType typeProxy = (node->getOp() == glslang::EOpAtomicStore)
  4138. ? node->getSequence()[0]->getAsTyped()->getBasicType() : node->getBasicType();
  4139. result = createAtomicOperation(node->getOp(), precision, resultType(), operands, typeProxy,
  4140. lvalueCoherentFlags, node->getType());
  4141. } else if (node->getOp() == glslang::EOpSpirvInst) {
  4142. const auto& spirvInst = node->getSpirvInstruction();
  4143. if (spirvInst.set == "") {
  4144. std::vector<spv::IdImmediate> idImmOps;
  4145. for (unsigned int i = 0; i < glslangOperands.size(); ++i) {
  4146. if (glslangOperands[i]->getAsTyped()->getQualifier().isSpirvLiteral()) {
  4147. // Translate the constant to a literal value
  4148. std::vector<unsigned> literals;
  4149. glslang::TVector<const glslang::TIntermConstantUnion*> constants;
  4150. constants.push_back(glslangOperands[i]->getAsConstantUnion());
  4151. TranslateLiterals(constants, literals);
  4152. idImmOps.push_back({false, literals[0]});
  4153. } else
  4154. idImmOps.push_back({true, operands[i]});
  4155. }
  4156. if (node->getBasicType() == glslang::EbtVoid)
  4157. builder.createNoResultOp(static_cast<spv::Op>(spirvInst.id), idImmOps);
  4158. else
  4159. result = builder.createOp(static_cast<spv::Op>(spirvInst.id), resultType(), idImmOps);
  4160. } else {
  4161. result = builder.createBuiltinCall(
  4162. resultType(), spirvInst.set == "GLSL.std.450" ? stdBuiltins : getExtBuiltins(spirvInst.set.c_str()),
  4163. spirvInst.id, operands);
  4164. }
  4165. noReturnValue = node->getBasicType() == glslang::EbtVoid;
  4166. } else if (node->getOp() == glslang::EOpDebugPrintf) {
  4167. if (!nonSemanticDebugPrintf) {
  4168. nonSemanticDebugPrintf = builder.import("NonSemantic.DebugPrintf");
  4169. }
  4170. result = builder.createBuiltinCall(builder.makeVoidType(), nonSemanticDebugPrintf, spv::NonSemanticDebugPrintfDebugPrintf, operands);
  4171. builder.addExtension(spv::E_SPV_KHR_non_semantic_info);
  4172. } else {
  4173. // Pass through to generic operations.
  4174. switch (glslangOperands.size()) {
  4175. case 0:
  4176. result = createNoArgOperation(node->getOp(), precision, resultType());
  4177. break;
  4178. case 1:
  4179. {
  4180. OpDecorations decorations = { precision,
  4181. TranslateNoContractionDecoration(node->getType().getQualifier()),
  4182. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  4183. result = createUnaryOperation(
  4184. node->getOp(), decorations,
  4185. resultType(), operands.front(),
  4186. glslangOperands[0]->getAsTyped()->getBasicType(), lvalueCoherentFlags, node->getType());
  4187. }
  4188. break;
  4189. default:
  4190. result = createMiscOperation(node->getOp(), precision, resultType(), operands, node->getBasicType());
  4191. break;
  4192. }
  4193. if (invertedType != spv::NoResult)
  4194. result = createInvertedSwizzle(precision, *glslangOperands[0]->getAsBinaryNode(), result);
  4195. for (unsigned int i = 0; i < temporaryLvalues.size(); ++i) {
  4196. builder.setAccessChain(complexLvalues[i]);
  4197. builder.accessChainStore(builder.createLoad(temporaryLvalues[i], spv::NoPrecision),
  4198. TranslateNonUniformDecoration(complexLvalues[i].coherentFlags));
  4199. }
  4200. }
  4201. if (noReturnValue)
  4202. return false;
  4203. if (! result) {
  4204. logger->missingFunctionality("unknown glslang aggregate");
  4205. return true; // pick up a child as a placeholder operand
  4206. } else {
  4207. builder.clearAccessChain();
  4208. builder.setAccessChainRValue(result);
  4209. return false;
  4210. }
  4211. }
  4212. // This path handles both if-then-else and ?:
  4213. // The if-then-else has a node type of void, while
  4214. // ?: has either a void or a non-void node type
  4215. //
  4216. // Leaving the result, when not void:
  4217. // GLSL only has r-values as the result of a :?, but
  4218. // if we have an l-value, that can be more efficient if it will
  4219. // become the base of a complex r-value expression, because the
  4220. // next layer copies r-values into memory to use the access-chain mechanism
  4221. bool TGlslangToSpvTraverser::visitSelection(glslang::TVisit /* visit */, glslang::TIntermSelection* node)
  4222. {
  4223. // see if OpSelect can handle it
  4224. const auto isOpSelectable = [&]() {
  4225. if (node->getBasicType() == glslang::EbtVoid)
  4226. return false;
  4227. // OpSelect can do all other types starting with SPV 1.4
  4228. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_4) {
  4229. // pre-1.4, only scalars and vectors can be handled
  4230. if ((!node->getType().isScalar() && !node->getType().isVector()))
  4231. return false;
  4232. }
  4233. return true;
  4234. };
  4235. // See if it simple and safe, or required, to execute both sides.
  4236. // Crucially, side effects must be either semantically required or avoided,
  4237. // and there are performance trade-offs.
  4238. // Return true if required or a good idea (and safe) to execute both sides,
  4239. // false otherwise.
  4240. const auto bothSidesPolicy = [&]() -> bool {
  4241. // do we have both sides?
  4242. if (node->getTrueBlock() == nullptr ||
  4243. node->getFalseBlock() == nullptr)
  4244. return false;
  4245. // required? (unless we write additional code to look for side effects
  4246. // and make performance trade-offs if none are present)
  4247. if (!node->getShortCircuit())
  4248. return true;
  4249. // if not required to execute both, decide based on performance/practicality...
  4250. if (!isOpSelectable())
  4251. return false;
  4252. assert(node->getType() == node->getTrueBlock() ->getAsTyped()->getType() &&
  4253. node->getType() == node->getFalseBlock()->getAsTyped()->getType());
  4254. // return true if a single operand to ? : is okay for OpSelect
  4255. const auto operandOkay = [](glslang::TIntermTyped* node) {
  4256. return node->getAsSymbolNode() || node->getType().getQualifier().isConstant();
  4257. };
  4258. return operandOkay(node->getTrueBlock() ->getAsTyped()) &&
  4259. operandOkay(node->getFalseBlock()->getAsTyped());
  4260. };
  4261. spv::Id result = spv::NoResult; // upcoming result selecting between trueValue and falseValue
  4262. // emit the condition before doing anything with selection
  4263. node->getCondition()->traverse(this);
  4264. spv::Id condition = accessChainLoad(node->getCondition()->getType());
  4265. // Find a way of executing both sides and selecting the right result.
  4266. const auto executeBothSides = [&]() -> void {
  4267. // execute both sides
  4268. spv::Id resultType = convertGlslangToSpvType(node->getType());
  4269. node->getTrueBlock()->traverse(this);
  4270. spv::Id trueValue = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
  4271. node->getFalseBlock()->traverse(this);
  4272. spv::Id falseValue = accessChainLoad(node->getFalseBlock()->getAsTyped()->getType());
  4273. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4274. // done if void
  4275. if (node->getBasicType() == glslang::EbtVoid)
  4276. return;
  4277. // emit code to select between trueValue and falseValue
  4278. // see if OpSelect can handle the result type, and that the SPIR-V types
  4279. // of the inputs match the result type.
  4280. if (isOpSelectable()) {
  4281. // Emit OpSelect for this selection.
  4282. // smear condition to vector, if necessary (AST is always scalar)
  4283. // Before 1.4, smear like for mix(), starting with 1.4, keep it scalar
  4284. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_4 && builder.isVector(trueValue)) {
  4285. condition = builder.smearScalar(spv::NoPrecision, condition,
  4286. builder.makeVectorType(builder.makeBoolType(),
  4287. builder.getNumComponents(trueValue)));
  4288. }
  4289. // If the types do not match, it is because of mismatched decorations on aggregates.
  4290. // Since isOpSelectable only lets us get here for SPIR-V >= 1.4, we can use OpCopyObject
  4291. // to get matching types.
  4292. if (builder.getTypeId(trueValue) != resultType) {
  4293. trueValue = builder.createUnaryOp(spv::Op::OpCopyLogical, resultType, trueValue);
  4294. }
  4295. if (builder.getTypeId(falseValue) != resultType) {
  4296. falseValue = builder.createUnaryOp(spv::Op::OpCopyLogical, resultType, falseValue);
  4297. }
  4298. // OpSelect
  4299. result = builder.createTriOp(spv::Op::OpSelect, resultType, condition, trueValue, falseValue);
  4300. builder.clearAccessChain();
  4301. builder.setAccessChainRValue(result);
  4302. } else {
  4303. // We need control flow to select the result.
  4304. // TODO: Once SPIR-V OpSelect allows arbitrary types, eliminate this path.
  4305. result = builder.createVariable(TranslatePrecisionDecoration(node->getType()),
  4306. spv::StorageClass::Function, resultType);
  4307. // Selection control:
  4308. const spv::SelectionControlMask control = TranslateSelectionControl(*node);
  4309. // make an "if" based on the value created by the condition
  4310. spv::Builder::If ifBuilder(condition, control, builder);
  4311. // emit the "then" statement
  4312. builder.clearAccessChain();
  4313. builder.setAccessChainLValue(result);
  4314. multiTypeStore(node->getType(), trueValue);
  4315. ifBuilder.makeBeginElse();
  4316. // emit the "else" statement
  4317. builder.clearAccessChain();
  4318. builder.setAccessChainLValue(result);
  4319. multiTypeStore(node->getType(), falseValue);
  4320. // finish off the control flow
  4321. ifBuilder.makeEndIf();
  4322. builder.clearAccessChain();
  4323. builder.setAccessChainLValue(result);
  4324. }
  4325. };
  4326. // Execute the one side needed, as per the condition
  4327. const auto executeOneSide = [&]() {
  4328. // Always emit control flow.
  4329. if (node->getBasicType() != glslang::EbtVoid) {
  4330. result = builder.createVariable(TranslatePrecisionDecoration(node->getType()), spv::StorageClass::Function,
  4331. convertGlslangToSpvType(node->getType()));
  4332. }
  4333. // Selection control:
  4334. const spv::SelectionControlMask control = TranslateSelectionControl(*node);
  4335. // make an "if" based on the value created by the condition
  4336. spv::Builder::If ifBuilder(condition, control, builder);
  4337. // emit the "then" statement
  4338. if (node->getTrueBlock() != nullptr) {
  4339. node->getTrueBlock()->traverse(this);
  4340. if (result != spv::NoResult) {
  4341. spv::Id load = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
  4342. builder.clearAccessChain();
  4343. builder.setAccessChainLValue(result);
  4344. multiTypeStore(node->getType(), load);
  4345. }
  4346. }
  4347. if (node->getFalseBlock() != nullptr) {
  4348. ifBuilder.makeBeginElse();
  4349. // emit the "else" statement
  4350. node->getFalseBlock()->traverse(this);
  4351. if (result != spv::NoResult) {
  4352. spv::Id load = accessChainLoad(node->getFalseBlock()->getAsTyped()->getType());
  4353. builder.clearAccessChain();
  4354. builder.setAccessChainLValue(result);
  4355. multiTypeStore(node->getType(), load);
  4356. }
  4357. }
  4358. // finish off the control flow
  4359. ifBuilder.makeEndIf();
  4360. if (result != spv::NoResult) {
  4361. builder.clearAccessChain();
  4362. builder.setAccessChainLValue(result);
  4363. }
  4364. };
  4365. // Try for OpSelect (or a requirement to execute both sides)
  4366. if (bothSidesPolicy()) {
  4367. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  4368. if (node->getType().getQualifier().isSpecConstant())
  4369. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  4370. executeBothSides();
  4371. } else
  4372. executeOneSide();
  4373. return false;
  4374. }
  4375. bool TGlslangToSpvTraverser::visitSwitch(glslang::TVisit /* visit */, glslang::TIntermSwitch* node)
  4376. {
  4377. // emit and get the condition before doing anything with switch
  4378. node->getCondition()->traverse(this);
  4379. spv::Id selector = accessChainLoad(node->getCondition()->getAsTyped()->getType());
  4380. // Selection control:
  4381. const spv::SelectionControlMask control = TranslateSwitchControl(*node);
  4382. // browse the children to sort out code segments
  4383. int defaultSegment = -1;
  4384. std::vector<TIntermNode*> codeSegments;
  4385. glslang::TIntermSequence& sequence = node->getBody()->getSequence();
  4386. std::vector<int> caseValues;
  4387. std::vector<int> valueIndexToSegment(sequence.size()); // note: probably not all are used, it is an overestimate
  4388. for (glslang::TIntermSequence::iterator c = sequence.begin(); c != sequence.end(); ++c) {
  4389. TIntermNode* child = *c;
  4390. if (child->getAsBranchNode() && child->getAsBranchNode()->getFlowOp() == glslang::EOpDefault)
  4391. defaultSegment = (int)codeSegments.size();
  4392. else if (child->getAsBranchNode() && child->getAsBranchNode()->getFlowOp() == glslang::EOpCase) {
  4393. valueIndexToSegment[caseValues.size()] = (int)codeSegments.size();
  4394. caseValues.push_back(child->getAsBranchNode()->getExpression()->getAsConstantUnion()
  4395. ->getConstArray()[0].getIConst());
  4396. } else
  4397. codeSegments.push_back(child);
  4398. }
  4399. // handle the case where the last code segment is missing, due to no code
  4400. // statements between the last case and the end of the switch statement
  4401. if ((caseValues.size() && (int)codeSegments.size() == valueIndexToSegment[caseValues.size() - 1]) ||
  4402. (int)codeSegments.size() == defaultSegment)
  4403. codeSegments.push_back(nullptr);
  4404. // make the switch statement
  4405. std::vector<spv::Block*> segmentBlocks; // returned, as the blocks allocated in the call
  4406. builder.makeSwitch(selector, control, (int)codeSegments.size(), caseValues, valueIndexToSegment, defaultSegment,
  4407. segmentBlocks);
  4408. // emit all the code in the segments
  4409. breakForLoop.push(false);
  4410. for (unsigned int s = 0; s < codeSegments.size(); ++s) {
  4411. builder.nextSwitchSegment(segmentBlocks, s);
  4412. if (codeSegments[s])
  4413. codeSegments[s]->traverse(this);
  4414. else
  4415. builder.addSwitchBreak(true);
  4416. }
  4417. breakForLoop.pop();
  4418. builder.endSwitch(segmentBlocks);
  4419. return false;
  4420. }
  4421. void TGlslangToSpvTraverser::visitConstantUnion(glslang::TIntermConstantUnion* node)
  4422. {
  4423. if (node->getQualifier().isSpirvLiteral())
  4424. return; // Translated to a literal value, skip further processing
  4425. int nextConst = 0;
  4426. spv::Id constant = createSpvConstantFromConstUnionArray(node->getType(), node->getConstArray(), nextConst, false);
  4427. builder.clearAccessChain();
  4428. builder.setAccessChainRValue(constant);
  4429. }
  4430. bool TGlslangToSpvTraverser::visitLoop(glslang::TVisit /* visit */, glslang::TIntermLoop* node)
  4431. {
  4432. auto blocks = builder.makeNewLoop();
  4433. builder.createBranch(true, &blocks.head);
  4434. // Loop control:
  4435. std::vector<unsigned int> operands;
  4436. const spv::LoopControlMask control = TranslateLoopControl(*node, operands);
  4437. // Spec requires back edges to target header blocks, and every header block
  4438. // must dominate its merge block. Make a header block first to ensure these
  4439. // conditions are met. By definition, it will contain OpLoopMerge, followed
  4440. // by a block-ending branch. But we don't want to put any other body/test
  4441. // instructions in it, since the body/test may have arbitrary instructions,
  4442. // including merges of its own.
  4443. builder.setBuildPoint(&blocks.head);
  4444. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4445. builder.createLoopMerge(&blocks.merge, &blocks.continue_target, control, operands);
  4446. if (node->testFirst() && node->getTest()) {
  4447. spv::Block& test = builder.makeNewBlock();
  4448. builder.createBranch(true, &test);
  4449. builder.setBuildPoint(&test);
  4450. node->getTest()->traverse(this);
  4451. spv::Id condition = accessChainLoad(node->getTestExpr()->getType());
  4452. builder.createConditionalBranch(condition, &blocks.body, &blocks.merge);
  4453. builder.setBuildPoint(&blocks.body);
  4454. breakForLoop.push(true);
  4455. if (node->getBody())
  4456. node->getBody()->traverse(this);
  4457. builder.createBranch(true, &blocks.continue_target);
  4458. breakForLoop.pop();
  4459. builder.setBuildPoint(&blocks.continue_target);
  4460. if (node->getTerminal())
  4461. node->getTerminal()->traverse(this);
  4462. builder.createBranch(true, &blocks.head);
  4463. } else {
  4464. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4465. builder.createBranch(true, &blocks.body);
  4466. breakForLoop.push(true);
  4467. builder.setBuildPoint(&blocks.body);
  4468. if (node->getBody())
  4469. node->getBody()->traverse(this);
  4470. builder.createBranch(true, &blocks.continue_target);
  4471. breakForLoop.pop();
  4472. builder.setBuildPoint(&blocks.continue_target);
  4473. if (node->getTerminal())
  4474. node->getTerminal()->traverse(this);
  4475. if (node->getTest()) {
  4476. node->getTest()->traverse(this);
  4477. spv::Id condition =
  4478. accessChainLoad(node->getTestExpr()->getType());
  4479. builder.createConditionalBranch(condition, &blocks.head, &blocks.merge);
  4480. } else {
  4481. // TODO: unless there was a break/return/discard instruction
  4482. // somewhere in the body, this is an infinite loop, so we should
  4483. // issue a warning.
  4484. builder.createBranch(true, &blocks.head);
  4485. }
  4486. }
  4487. builder.setBuildPoint(&blocks.merge);
  4488. builder.closeLoop();
  4489. return false;
  4490. }
  4491. bool TGlslangToSpvTraverser::visitBranch(glslang::TVisit /* visit */, glslang::TIntermBranch* node)
  4492. {
  4493. if (node->getExpression())
  4494. node->getExpression()->traverse(this);
  4495. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4496. switch (node->getFlowOp()) {
  4497. case glslang::EOpKill:
  4498. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  4499. builder.addCapability(spv::Capability::DemoteToHelperInvocation);
  4500. builder.createNoResultOp(spv::Op::OpDemoteToHelperInvocationEXT);
  4501. } else {
  4502. builder.makeStatementTerminator(spv::Op::OpKill, "post-discard");
  4503. }
  4504. break;
  4505. case glslang::EOpTerminateInvocation:
  4506. builder.addExtension(spv::E_SPV_KHR_terminate_invocation);
  4507. builder.makeStatementTerminator(spv::Op::OpTerminateInvocation, "post-terminate-invocation");
  4508. break;
  4509. case glslang::EOpBreak:
  4510. if (breakForLoop.top())
  4511. builder.createLoopExit();
  4512. else
  4513. builder.addSwitchBreak(false);
  4514. break;
  4515. case glslang::EOpContinue:
  4516. builder.createLoopContinue();
  4517. break;
  4518. case glslang::EOpReturn:
  4519. if (node->getExpression() != nullptr) {
  4520. const glslang::TType& glslangReturnType = node->getExpression()->getType();
  4521. spv::Id returnId = accessChainLoad(glslangReturnType);
  4522. if (builder.getTypeId(returnId) != currentFunction->getReturnType() ||
  4523. TranslatePrecisionDecoration(glslangReturnType) != currentFunction->getReturnPrecision()) {
  4524. builder.clearAccessChain();
  4525. spv::Id copyId = builder.createVariable(currentFunction->getReturnPrecision(),
  4526. spv::StorageClass::Function, currentFunction->getReturnType());
  4527. builder.setAccessChainLValue(copyId);
  4528. multiTypeStore(glslangReturnType, returnId);
  4529. returnId = builder.createLoad(copyId, currentFunction->getReturnPrecision());
  4530. }
  4531. builder.makeReturn(false, returnId);
  4532. } else
  4533. builder.makeReturn(false);
  4534. builder.clearAccessChain();
  4535. break;
  4536. case glslang::EOpDemote:
  4537. builder.createNoResultOp(spv::Op::OpDemoteToHelperInvocationEXT);
  4538. builder.addExtension(spv::E_SPV_EXT_demote_to_helper_invocation);
  4539. builder.addCapability(spv::Capability::DemoteToHelperInvocationEXT);
  4540. break;
  4541. case glslang::EOpTerminateRayKHR:
  4542. builder.makeStatementTerminator(spv::Op::OpTerminateRayKHR, "post-terminateRayKHR");
  4543. break;
  4544. case glslang::EOpIgnoreIntersectionKHR:
  4545. builder.makeStatementTerminator(spv::Op::OpIgnoreIntersectionKHR, "post-ignoreIntersectionKHR");
  4546. break;
  4547. default:
  4548. assert(0);
  4549. break;
  4550. }
  4551. return false;
  4552. }
  4553. bool TGlslangToSpvTraverser::visitVariableDecl(glslang::TVisit visit, glslang::TIntermVariableDecl* node)
  4554. {
  4555. if (visit == glslang::EvPreVisit) {
  4556. builder.setDebugSourceLocation(node->getDeclSymbol()->getLoc().line, node->getDeclSymbol()->getLoc().getFilename());
  4557. // We touch the symbol once here to create the debug info.
  4558. getSymbolId(node->getDeclSymbol());
  4559. }
  4560. return true;
  4561. }
  4562. spv::Id TGlslangToSpvTraverser::createSpvVariable(const glslang::TIntermSymbol* node, spv::Id forcedType)
  4563. {
  4564. // First, steer off constants, which are not SPIR-V variables, but
  4565. // can still have a mapping to a SPIR-V Id.
  4566. // This includes specialization constants.
  4567. if (node->getQualifier().isConstant()) {
  4568. spv::Id result = createSpvConstant(*node);
  4569. if (result != spv::NoResult) {
  4570. auto name = node->getAsSymbolNode()->getAccessName().c_str();
  4571. auto typeId = convertGlslangToSpvType(node->getType());
  4572. builder.createConstVariable(typeId, name, result, currentFunction == nullptr);
  4573. return result;
  4574. }
  4575. }
  4576. // Now, handle actual variables
  4577. spv::StorageClass storageClass = TranslateStorageClass(node->getType());
  4578. spv::Id spvType = forcedType == spv::NoType ? convertGlslangToSpvType(node->getType())
  4579. : forcedType;
  4580. const bool contains16BitType = node->getType().contains16BitFloat() ||
  4581. node->getType().contains16BitInt();
  4582. if (contains16BitType) {
  4583. switch (storageClass) {
  4584. case spv::StorageClass::Input:
  4585. case spv::StorageClass::Output:
  4586. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4587. builder.addCapability(spv::Capability::StorageInputOutput16);
  4588. break;
  4589. case spv::StorageClass::Uniform:
  4590. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4591. if (node->getType().getQualifier().storage == glslang::EvqBuffer)
  4592. builder.addCapability(spv::Capability::StorageUniformBufferBlock16);
  4593. else
  4594. builder.addCapability(spv::Capability::StorageUniform16);
  4595. break;
  4596. case spv::StorageClass::PushConstant:
  4597. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4598. builder.addCapability(spv::Capability::StoragePushConstant16);
  4599. break;
  4600. case spv::StorageClass::StorageBuffer:
  4601. case spv::StorageClass::PhysicalStorageBufferEXT:
  4602. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4603. builder.addCapability(spv::Capability::StorageUniformBufferBlock16);
  4604. break;
  4605. case spv::StorageClass::TileAttachmentQCOM:
  4606. builder.addCapability(spv::Capability::TileShadingQCOM);
  4607. break;
  4608. default:
  4609. if (storageClass == spv::StorageClass::Workgroup &&
  4610. node->getType().getBasicType() == glslang::EbtBlock) {
  4611. builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayout16BitAccessKHR);
  4612. break;
  4613. }
  4614. if (node->getType().contains16BitFloat())
  4615. builder.addCapability(spv::Capability::Float16);
  4616. if (node->getType().contains16BitInt())
  4617. builder.addCapability(spv::Capability::Int16);
  4618. break;
  4619. }
  4620. }
  4621. if (node->getType().contains8BitInt()) {
  4622. if (storageClass == spv::StorageClass::PushConstant) {
  4623. builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
  4624. builder.addCapability(spv::Capability::StoragePushConstant8);
  4625. } else if (storageClass == spv::StorageClass::Uniform) {
  4626. builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
  4627. builder.addCapability(spv::Capability::UniformAndStorageBuffer8BitAccess);
  4628. } else if (storageClass == spv::StorageClass::StorageBuffer) {
  4629. builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
  4630. builder.addCapability(spv::Capability::StorageBuffer8BitAccess);
  4631. } else if (storageClass == spv::StorageClass::Workgroup &&
  4632. node->getType().getBasicType() == glslang::EbtBlock) {
  4633. builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayout8BitAccessKHR);
  4634. } else {
  4635. builder.addCapability(spv::Capability::Int8);
  4636. }
  4637. }
  4638. const char* name = node->getName().c_str();
  4639. if (glslang::IsAnonymous(name))
  4640. name = "";
  4641. spv::Id initializer = spv::NoResult;
  4642. if (node->getType().getQualifier().storage == glslang::EvqUniform && !node->getConstArray().empty()) {
  4643. int nextConst = 0;
  4644. initializer = createSpvConstantFromConstUnionArray(node->getType(),
  4645. node->getConstArray(),
  4646. nextConst,
  4647. false /* specConst */);
  4648. } else if (node->getType().getQualifier().isNullInit()) {
  4649. initializer = builder.makeNullConstant(spvType);
  4650. }
  4651. spv::Id var = builder.createVariable(spv::NoPrecision, storageClass, spvType, name, initializer, false);
  4652. if (options.emitNonSemanticShaderDebugInfo && storageClass != spv::StorageClass::Function) {
  4653. // Create variable alias for retargeted symbols if any.
  4654. // Notably, this is only applicable to built-in variables so that it is okay to only use name as the key.
  4655. auto [itBegin, itEnd] = glslangIntermediate->getBuiltinAliasLookup().equal_range(name);
  4656. for (auto it = itBegin; it != itEnd; ++it) {
  4657. builder.createDebugGlobalVariable(builder.getDebugType(spvType), it->second.c_str(), var);
  4658. }
  4659. }
  4660. std::vector<spv::Decoration> topLevelDecorations;
  4661. glslang::TQualifier typeQualifier = node->getType().getQualifier();
  4662. TranslateMemoryDecoration(typeQualifier, topLevelDecorations, glslangIntermediate->usingVulkanMemoryModel());
  4663. for (auto deco : topLevelDecorations) {
  4664. builder.addDecoration(var, deco);
  4665. }
  4666. return var;
  4667. }
  4668. // Return type Id of the sampled type.
  4669. spv::Id TGlslangToSpvTraverser::getSampledType(const glslang::TSampler& sampler)
  4670. {
  4671. switch (sampler.type) {
  4672. case glslang::EbtInt: return builder.makeIntType(32);
  4673. case glslang::EbtUint: return builder.makeUintType(32);
  4674. case glslang::EbtFloat: return builder.makeFloatType(32);
  4675. case glslang::EbtFloat16:
  4676. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float_fetch);
  4677. builder.addCapability(spv::Capability::Float16ImageAMD);
  4678. return builder.makeFloatType(16);
  4679. case glslang::EbtInt64:
  4680. builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
  4681. builder.addCapability(spv::Capability::Int64ImageEXT);
  4682. return builder.makeIntType(64);
  4683. case glslang::EbtUint64:
  4684. builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
  4685. builder.addCapability(spv::Capability::Int64ImageEXT);
  4686. return builder.makeUintType(64);
  4687. default:
  4688. assert(0);
  4689. return builder.makeFloatType(32);
  4690. }
  4691. }
  4692. // If node is a swizzle operation, return the type that should be used if
  4693. // the swizzle base is first consumed by another operation, before the swizzle
  4694. // is applied.
  4695. spv::Id TGlslangToSpvTraverser::getInvertedSwizzleType(const glslang::TIntermTyped& node)
  4696. {
  4697. if (node.getAsOperator() &&
  4698. node.getAsOperator()->getOp() == glslang::EOpVectorSwizzle)
  4699. return convertGlslangToSpvType(node.getAsBinaryNode()->getLeft()->getType());
  4700. else
  4701. return spv::NoType;
  4702. }
  4703. // When inverting a swizzle with a parent op, this function
  4704. // will apply the swizzle operation to a completed parent operation.
  4705. spv::Id TGlslangToSpvTraverser::createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped& node,
  4706. spv::Id parentResult)
  4707. {
  4708. std::vector<unsigned> swizzle;
  4709. convertSwizzle(*node.getAsBinaryNode()->getRight()->getAsAggregate(), swizzle);
  4710. return builder.createRvalueSwizzle(precision, convertGlslangToSpvType(node.getType()), parentResult, swizzle);
  4711. }
  4712. // Convert a glslang AST swizzle node to a swizzle vector for building SPIR-V.
  4713. void TGlslangToSpvTraverser::convertSwizzle(const glslang::TIntermAggregate& node, std::vector<unsigned>& swizzle)
  4714. {
  4715. const glslang::TIntermSequence& swizzleSequence = node.getSequence();
  4716. for (int i = 0; i < (int)swizzleSequence.size(); ++i)
  4717. swizzle.push_back(swizzleSequence[i]->getAsConstantUnion()->getConstArray()[0].getIConst());
  4718. }
  4719. // Convert from a glslang type to an SPV type, by calling into a
  4720. // recursive version of this function. This establishes the inherited
  4721. // layout state rooted from the top-level type.
  4722. spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly)
  4723. {
  4724. return convertGlslangToSpvType(type, getExplicitLayout(type), type.getQualifier(), false, forwardReferenceOnly);
  4725. }
  4726. spv::LinkageType TGlslangToSpvTraverser::convertGlslangLinkageToSpv(glslang::TLinkType linkType)
  4727. {
  4728. switch (linkType) {
  4729. case glslang::ELinkExport:
  4730. return spv::LinkageType::Export;
  4731. default:
  4732. return spv::LinkageType::Max;
  4733. }
  4734. }
  4735. // Do full recursive conversion of an arbitrary glslang type to a SPIR-V Id.
  4736. // explicitLayout can be kept the same throughout the hierarchical recursive walk.
  4737. // Mutually recursive with convertGlslangStructToSpvType().
  //
  // Parameters:
  //   type                  - the glslang type to convert.
  //   explicitLayout        - packing that selects the bool representation and whether array
  //                           strides are decorated; forwarded unchanged to struct conversion.
  //   qualifier             - qualifier consulted for struct sharing (layoutMatrix) and for
  //                           array-stride computation; forwarded to struct conversion.
  //   lastBufferBlockMember - when true, a runtime-sized array does not request the
  //                           RuntimeDescriptorArrayEXT capability.
  //   forwardReferenceOnly  - for EbtReference only: when true, just the forward pointer Id is
  //                           produced and the referent type is not converted here.
  //
  // Returns the resulting SPIR-V type Id; EbtString returns 0 because no type is used for it.
  //
  // The work is done in stages: the switch builds the element type from the basic type, then
  // matrix/vector, cooperative matrix/vector, tensor and finally array wrappers are applied.
  4738. spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type,
  4739. glslang::TLayoutPacking explicitLayout, const glslang::TQualifier& qualifier,
  4740. bool lastBufferBlockMember, bool forwardReferenceOnly)
  4741. {
  4742. spv::Id spvType = spv::NoResult;
  // Stage 1: element type selected by the glslang basic type.
  4743. switch (type.getBasicType()) {
  4744. case glslang::EbtVoid:
  4745. spvType = builder.makeVoidType();
  4746. assert (! type.isArray());
  4747. break;
  4748. case glslang::EbtBool:
  4749. // "transparent" bool doesn't exist in SPIR-V. The GLSL convention is
  4750. // a 32-bit int where non-0 means true.
  4751. if (explicitLayout != glslang::ElpNone)
  4752. spvType = builder.makeUintType(32);
  4753. else
  4754. spvType = builder.makeBoolType();
  4755. break;
  4756. case glslang::EbtInt:
  4757. spvType = builder.makeIntType(32);
  4758. break;
  4759. case glslang::EbtUint:
  4760. spvType = builder.makeUintType(32);
  4761. break;
  4762. case glslang::EbtFloat:
  4763. spvType = builder.makeFloatType(32);
  4764. break;
  4765. case glslang::EbtDouble:
  4766. spvType = builder.makeFloatType(64);
  4767. break;
  4768. case glslang::EbtFloat16:
  4769. spvType = builder.makeFloatType(16);
  4770. break;
  4771. case glslang::EbtBFloat16:
  4772. spvType = builder.makeBFloat16Type();
  4773. break;
  4774. case glslang::EbtFloatE5M2:
  4775. spvType = builder.makeFloatE5M2Type();
  4776. break;
  4777. case glslang::EbtFloatE4M3:
  4778. spvType = builder.makeFloatE4M3Type();
  4779. break;
  4780. case glslang::EbtInt8:
  4781. spvType = builder.makeIntType(8);
  4782. break;
  4783. case glslang::EbtUint8:
  4784. spvType = builder.makeUintType(8);
  4785. break;
  4786. case glslang::EbtInt16:
  4787. spvType = builder.makeIntType(16);
  4788. break;
  4789. case glslang::EbtUint16:
  4790. spvType = builder.makeUintType(16);
  4791. break;
  4792. case glslang::EbtInt64:
  4793. spvType = builder.makeIntType(64);
  4794. break;
  4795. case glslang::EbtUint64:
  4796. spvType = builder.makeUintType(64);
  4797. break;
  4798. case glslang::EbtAtomicUint:
  // Atomic counters are emitted as 32-bit unsigned ints and add the AtomicStorage capability.
  4799. builder.addCapability(spv::Capability::AtomicStorage);
  4800. spvType = builder.makeUintType(32);
  4801. break;
  4802. case glslang::EbtAccStruct:
  4803. switch (glslangIntermediate->getStage()) {
  4804. case EShLangRayGen:
  4805. case EShLangIntersect:
  4806. case EShLangAnyHit:
  4807. case EShLangClosestHit:
  4808. case EShLangMiss:
  4809. case EShLangCallable:
  4810. // these all should have the RayTracingNV/KHR capability already
  4811. break;
  4812. default:
  4813. {
  // Any other stage: add ray-query support only if the shader requested GL_EXT_ray_query.
  4814. auto& extensions = glslangIntermediate->getRequestedExtensions();
  4815. if (extensions.find("GL_EXT_ray_query") != extensions.end()) {
  4816. builder.addExtension(spv::E_SPV_KHR_ray_query);
  4817. builder.addCapability(spv::Capability::RayQueryKHR);
  4818. }
  4819. }
  4820. break;
  4821. }
  4822. spvType = builder.makeAccelerationStructureType();
  4823. break;
  4824. case glslang::EbtRayQuery:
  4825. {
  4826. auto& extensions = glslangIntermediate->getRequestedExtensions();
  4827. if (extensions.find("GL_EXT_ray_query") != extensions.end()) {
  4828. builder.addExtension(spv::E_SPV_KHR_ray_query);
  4829. builder.addCapability(spv::Capability::RayQueryKHR);
  4830. }
  4831. spvType = builder.makeRayQueryType();
  4832. }
  4833. break;
  4834. case glslang::EbtReference:
  4835. {
  4836. // Make the forward pointer, then recurse to convert the structure type, then
  4837. // patch up the forward pointer with a real pointer type.
  4838. if (forwardPointers.find(type.getReferentType()) == forwardPointers.end()) {
  4839. spv::Id forwardId = builder.makeForwardPointer(spv::StorageClass::PhysicalStorageBufferEXT);
  4840. forwardPointers[type.getReferentType()] = forwardId;
  4841. }
  4842. spvType = forwardPointers[type.getReferentType()];
  // With forwardReferenceOnly set, the referent is not converted here and the forward
  // pointer Id alone is returned as the type.
  4843. if (!forwardReferenceOnly) {
  4844. spv::Id referentType = convertGlslangToSpvType(*type.getReferentType());
  4845. builder.makePointerFromForwardPointer(spv::StorageClass::PhysicalStorageBufferEXT,
  4846. forwardPointers[type.getReferentType()],
  4847. referentType);
  4848. }
  4849. }
  4850. break;
  4851. case glslang::EbtSampler:
  4852. {
  4853. const glslang::TSampler& sampler = type.getSampler();
  // debugName stays empty unless non-semantic shader debug info is being emitted.
  // For GLSL sources it is the sampler's own string; otherwise a fixed "type.*" name.
  4854. std::string debugName;
  4855. if (sampler.isPureSampler()) {
  4856. if (options.emitNonSemanticShaderDebugInfo) {
  4857. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
  4858. debugName = sampler.getString();
  4859. }
  4860. else {
  4861. debugName = "type.sampler";
  4862. }
  4863. }
  4864. spvType = builder.makeSamplerType(debugName.c_str());
  4865. } else {
  4866. // an image is present, make its type
  4867. if (options.emitNonSemanticShaderDebugInfo) {
  4868. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
  4869. debugName = sampler.removeCombined().getString();
  4870. }
  4871. else {
  4872. switch (sampler.dim) {
  4873. case glslang::Esd1D: debugName = "type.1d.image"; break;
  4874. case glslang::Esd2D: debugName = "type.2d.image"; break;
  4875. case glslang::Esd3D: debugName = "type.3d.image"; break;
  4876. case glslang::EsdCube: debugName = "type.cube.image"; break;
  4877. default: debugName = "type.image"; break;
  4878. }
  4879. }
  4880. }
  // The sixth argument is 2 for image-class samplers and 1 otherwise.
  4881. spvType = builder.makeImageType(getSampledType(sampler), TranslateDimensionality(sampler),
  4882. sampler.isShadow(), sampler.isArrayed(), sampler.isMultiSample(),
  4883. sampler.isImageClass() ? 2 : 1, TranslateImageFormat(type), debugName.c_str());
  4884. if (sampler.isCombined() &&
  4885. (!sampler.isBuffer() || glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_6)) {
  4886. // Already has both image and sampler, make the combined type. Only combine sampler to
  4887. // buffer if before SPIR-V 1.6.
  4888. if (options.emitNonSemanticShaderDebugInfo) {
  4889. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
  4890. debugName = sampler.getString();
  4891. }
  4892. else {
  4893. debugName = "type.sampled.image";
  4894. }
  4895. }
  4896. spvType = builder.makeSampledImageType(spvType, debugName.c_str());
  4897. }
  4898. }
  4899. }
  4900. break;
  4901. case glslang::EbtStruct:
  4902. case glslang::EbtBlock:
  4903. {
  4904. // If we've seen this struct type, return it
  4905. const glslang::TTypeList* glslangMembers = type.getStruct();
  4906. // Try to share structs for different layouts, but not yet for other
  4907. // kinds of qualification (primarily not yet including interpolant qualification).
  // The cache is keyed by explicit layout, matrix layout and the member list.
  // NOTE(review): a miss presumably default-inserts an entry equal to spv::NoResult - confirm
  // against the declaration of structMap.
  4908. if (! HasNonLayoutQualifiers(type, qualifier))
  4909. spvType = structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers];
  4910. if (spvType != spv::NoResult)
  4911. break;
  4912. // else, we haven't seen it...
  // For blocks, size the member remap table to the glslang member count before converting.
  4913. if (type.getBasicType() == glslang::EbtBlock)
  4914. memberRemapper[glslangTypeToIdMap[glslangMembers]].resize(glslangMembers->size());
  4915. spvType = convertGlslangStructToSpvType(type, glslangMembers, explicitLayout, qualifier);
  4916. }
  4917. break;
  4918. case glslang::EbtString:
  4919. // no type used for OpString
  4920. return 0;
  4921. case glslang::EbtHitObjectNV: {
  4922. builder.addExtension(spv::E_SPV_NV_shader_invocation_reorder);
  4923. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  4924. spvType = builder.makeHitObjectNVType();
  4925. }
  4926. break;
  4927. case glslang::EbtHitObjectEXT: {
  4928. builder.addExtension(spv::E_SPV_EXT_shader_invocation_reorder);
  4929. builder.addCapability(spv::Capability::ShaderInvocationReorderEXT);
  4930. spvType = builder.makeHitObjectEXTType();
  4931. }
  4932. break;
  4933. case glslang::EbtSpirvType: {
  4934. // GL_EXT_spirv_intrinsics
  4935. const auto& spirvType = type.getSpirvType();
  4936. const auto& spirvInst = spirvType.spirvInst;
  // Each type parameter contributes operands: literal constants as raw 32-bit words,
  // non-literal constants and type specifiers as Ids.
  // NOTE(review): the bool in each {bool, value} operand presumably flags "value is an Id" -
  // confirm against spv::IdImmediate.
  4937. std::vector<spv::IdImmediate> operands;
  4938. for (const auto& typeParam : spirvType.typeParams) {
  4939. if (typeParam.getAsConstant() != nullptr) {
  4940. // Constant expression
  4941. auto constant = typeParam.getAsConstant();
  4942. if (constant->isLiteral()) {
  4943. if (constant->getBasicType() == glslang::EbtFloat) {
  // Narrow the stored double to float and emit its bit pattern as the literal word.
  4944. float floatValue = static_cast<float>(constant->getConstArray()[0].getDConst());
  4945. unsigned literal;
  4946. static_assert(sizeof(literal) == sizeof(floatValue), "sizeof(unsigned) != sizeof(float)");
  4947. memcpy(&literal, &floatValue, sizeof(literal));
  4948. operands.push_back({false, literal});
  4949. } else if (constant->getBasicType() == glslang::EbtInt) {
  4950. unsigned literal = constant->getConstArray()[0].getIConst();
  4951. operands.push_back({false, literal});
  4952. } else if (constant->getBasicType() == glslang::EbtUint) {
  4953. unsigned literal = constant->getConstArray()[0].getUConst();
  4954. operands.push_back({false, literal});
  4955. } else if (constant->getBasicType() == glslang::EbtBool) {
  4956. unsigned literal = constant->getConstArray()[0].getBConst();
  4957. operands.push_back({false, literal});
  4958. } else if (constant->getBasicType() == glslang::EbtString) {
  // Copy the characters, terminating 0 included, into successive words of
  // sizeof(unsigned) bytes; a word is emitted each time four characters are stored.
  4959. auto str = constant->getConstArray()[0].getSConst()->c_str();
  4960. unsigned literal = 0;
  4961. char* literalPtr = reinterpret_cast<char*>(&literal);
  4962. unsigned charCount = 0;
  4963. char ch = 0;
  4964. do {
  4965. ch = *(str++);
  4966. *(literalPtr++) = ch;
  4967. ++charCount;
  4968. if (charCount == 4) {
  4969. operands.push_back({false, literal});
  4970. literalPtr = reinterpret_cast<char*>(&literal);
  4971. charCount = 0;
  4972. }
  4973. } while (ch != 0);
  4974. // Partial literal is padded with 0
  4975. if (charCount > 0) {
  4976. for (; charCount < 4; ++charCount)
  4977. *(literalPtr++) = 0;
  4978. operands.push_back({false, literal});
  4979. }
  4980. } else
  4981. assert(0); // Unexpected type
  4982. } else
  4983. operands.push_back({true, createSpvConstant(*constant)});
  4984. } else {
  4985. // Type specifier
  4986. assert(typeParam.getAsType() != nullptr);
  4987. operands.push_back({true, convertGlslangToSpvType(*typeParam.getAsType())});
  4988. }
  4989. }
  4990. assert(spirvInst.set == ""); // Currently, couldn't be extended instructions.
  // The instruction id requested by the shader is used directly as the type opcode.
  4991. spvType = builder.makeGenericType(static_cast<spv::Op>(spirvInst.id), operands);
  4992. break;
  4993. }
  4994. case glslang::EbtTensorLayoutNV:
  4995. {
  4996. builder.addCapability(spv::Capability::TensorAddressingNV);
  4997. builder.addExtension(spv::E_SPV_NV_tensor_addressing);
  // Two operands, built from type parameters 0 and 1.
  4998. std::vector<spv::IdImmediate> operands;
  4999. for (uint32_t i = 0; i < 2; ++i) {
  5000. operands.push_back({true, makeArraySizeId(*type.getTypeParameters()->arraySizes, i, true)});
  5001. }
  5002. spvType = builder.makeGenericType(spv::Op::OpTypeTensorLayoutNV, operands);
  5003. break;
  5004. }
  5005. case glslang::EbtTensorViewNV:
  5006. {
  5007. builder.addCapability(spv::Capability::TensorAddressingNV);
  5008. builder.addExtension(spv::E_SPV_NV_tensor_addressing);
  // Type parameter 0 is the dimension count; dim + 2 operands are built from
  // parameters 0 .. dim + 1, with the extra flag of makeArraySizeId set only for parameter 1.
  5009. uint32_t dim = type.getTypeParameters()->arraySizes->getDimSize(0);
  5010. assert(dim >= 1 && dim <= 5);
  5011. std::vector<spv::IdImmediate> operands;
  5012. for (uint32_t i = 0; i < dim + 2; ++i) {
  5013. operands.push_back({true, makeArraySizeId(*type.getTypeParameters()->arraySizes, i, true, i==1)});
  5014. }
  5015. spvType = builder.makeGenericType(spv::Op::OpTypeTensorViewNV, operands);
  5016. break;
  5017. }
  5018. default:
  5019. assert(0);
  5020. break;
  5021. }
  // Stage 2: wrap the element type in a matrix or vector when the glslang type is one.
  5022. if (type.isMatrix())
  5023. spvType = builder.makeMatrixType(spvType, type.getMatrixCols(), type.getMatrixRows());
  5024. else {
  5025. // If this variable has a vector element count greater than 1, create a SPIR-V vector
  5026. if (type.getVectorSize() > 1)
  5027. spvType = builder.makeVectorType(spvType, type.getVectorSize());
  5028. }
  // Stage 3: cooperative matrix / tensor / cooperative vector wrappers, each adding the
  // capabilities and extension it needs plus element-type capabilities where listed.
  5029. if (type.isCoopMatNV()) {
  5030. builder.addCapability(spv::Capability::CooperativeMatrixNV);
  5031. builder.addExtension(spv::E_SPV_NV_cooperative_matrix);
  5032. if (type.getBasicType() == glslang::EbtFloat16)
  5033. builder.addCapability(spv::Capability::Float16);
  5034. if (type.getBasicType() == glslang::EbtUint8 ||
  5035. type.getBasicType() == glslang::EbtInt8) {
  5036. builder.addCapability(spv::Capability::Int8);
  5037. }
  // NV form: type parameters 1, 2, 3 provide scope, rows, cols.
  5038. spv::Id scope = makeArraySizeId(*type.getTypeParameters()->arraySizes, 1);
  5039. spv::Id rows = makeArraySizeId(*type.getTypeParameters()->arraySizes, 2);
  5040. spv::Id cols = makeArraySizeId(*type.getTypeParameters()->arraySizes, 3);
  5041. spvType = builder.makeCooperativeMatrixTypeNV(spvType, scope, rows, cols);
  5042. }
  5043. if (type.isCoopMatKHR()) {
  5044. builder.addCapability(spv::Capability::CooperativeMatrixKHR);
  5045. builder.addExtension(spv::E_SPV_KHR_cooperative_matrix);
  5046. if (type.getBasicType() == glslang::EbtBFloat16) {
  5047. builder.addExtension(spv::E_SPV_KHR_bfloat16);
  5048. builder.addCapability(spv::Capability::BFloat16CooperativeMatrixKHR);
  5049. }
  5050. if (type.getBasicType() == glslang::EbtFloatE5M2 || type.getBasicType() == glslang::EbtFloatE4M3) {
  5051. builder.addExtension(spv::E_SPV_EXT_float8);
  5052. builder.addCapability(spv::Capability::Float8CooperativeMatrixEXT);
  5053. }
  5054. if (type.getBasicType() == glslang::EbtFloat16)
  5055. builder.addCapability(spv::Capability::Float16);
  5056. if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == glslang::EbtInt8) {
  5057. builder.addCapability(spv::Capability::Int8);
  5058. }
  // KHR form: type parameters 0, 1, 2, 3 provide scope, rows, cols, use.
  5059. spv::Id scope = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  5060. spv::Id rows = makeArraySizeId(*type.getTypeParameters()->arraySizes, 1);
  5061. spv::Id cols = makeArraySizeId(*type.getTypeParameters()->arraySizes, 2);
  5062. spv::Id use = makeArraySizeId(*type.getTypeParameters()->arraySizes, 3, true);
  5063. spvType = builder.makeCooperativeMatrixTypeKHR(spvType, scope, rows, cols, use);
  5064. }
  // Note: the tensor branch is the 'else' of the KHR cooperative-matrix test above.
  5065. else if (type.isTensorARM()) {
  5066. builder.addCapability(spv::Capability::TensorsARM);
  5067. builder.addExtension(spv::E_SPV_ARM_tensors);
  5068. if (type.getBasicType() == glslang::EbtInt8 || type.getBasicType() == glslang::EbtUint8) {
  5069. builder.addCapability(spv::Capability::Int8);
  5070. } else if (type.getBasicType() == glslang::EbtInt16 ||
  5071. type.getBasicType() == glslang::EbtUint16) {
  5072. builder.addCapability(spv::Capability::Int16);
  5073. } else if (type.getBasicType() == glslang::EbtInt64 ||
  5074. type.getBasicType() == glslang::EbtUint64) {
  5075. builder.addCapability(spv::Capability::Int64);
  5076. } else if (type.getBasicType() == glslang::EbtFloat16) {
  5077. builder.addCapability(spv::Capability::Float16);
  5078. }
  // Type parameter 0 provides the tensor rank.
  5079. spv::Id rank = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  5080. spvType = builder.makeTensorTypeARM(spvType, rank);
  5081. }
  5082. if (type.isCoopVecNV()) {
  5083. builder.addCapability(spv::Capability::CooperativeVectorNV);
  5084. builder.addExtension(spv::E_SPV_NV_cooperative_vector);
  5085. if (type.getBasicType() == glslang::EbtFloat16)
  5086. builder.addCapability(spv::Capability::Float16);
  5087. if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == glslang::EbtInt8) {
  5088. builder.addCapability(spv::Capability::Int8);
  5089. }
  // Type parameter 0 provides the component count.
  5090. spv::Id components = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  5091. spvType = builder.makeCooperativeVectorTypeNV(spvType, components);
  5092. }
  // Stage 4: arrays. Inner dimensions are wrapped first (highest dimension index first),
  // the outermost dimension (index 0) last.
  5093. if (type.isArray()) {
  5094. int stride = 0; // keep this 0 unless doing an explicit layout; 0 will mean no decoration, no stride
  5095. // Do all but the outer dimension
  5096. if (type.getArraySizes()->getNumDims() > 1) {
  5097. // We need to decorate array strides for types needing explicit layout, except blocks.
  5098. if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock) {
  5099. // Use a dummy glslang type for querying internal strides of
  5100. // arrays of arrays, but using just a one-dimensional array.
  5101. glslang::TType simpleArrayType(type, 0); // dereferenced type of the array
  5102. while (simpleArrayType.getArraySizes()->getNumDims() > 1)
  5103. simpleArrayType.getArraySizes()->dereference();
  5104. // Will compute the higher-order strides here, rather than making a whole
  5105. // pile of types and doing repetitive recursion on their contents.
  5106. stride = getArrayStride(simpleArrayType, explicitLayout, qualifier.layoutMatrix);
  5107. }
  5108. // make the arrays
  5109. for (int dim = type.getArraySizes()->getNumDims() - 1; dim > 0; --dim) {
  5110. spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), dim), stride);
  5111. if (stride > 0)
  5112. builder.addDecoration(spvType, spv::Decoration::ArrayStride, stride);
  // The stride for the next-outer dimension is this stride times this dimension's size.
  5113. stride *= type.getArraySizes()->getDimSize(dim);
  5114. }
  5115. } else {
  5116. // single-dimensional array, and don't yet have stride
  5117. // We need to decorate array strides for types needing explicit layout, except blocks.
  5118. if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock)
  5119. stride = getArrayStride(type, explicitLayout, qualifier.layoutMatrix);
  5120. }
  5121. // Do the outer dimension, which might not be known for a runtime-sized array.
  5122. // (Unsized arrays that survive through linking will be runtime-sized arrays)
  5123. if (type.isSizedArray())
  5124. spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), 0), stride);
  5125. else {
  5126. // If we see a runtime array in a buffer_reference, it is not a descriptor
  // Likewise no descriptor-indexing capability is added for the last member of a buffer block.
  5127. if (!lastBufferBlockMember && type.getBasicType() != glslang::EbtReference) {
  5128. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  5129. builder.addCapability(spv::Capability::RuntimeDescriptorArrayEXT);
  5130. }
  5131. spvType = builder.makeRuntimeArray(spvType);
  5132. }
  // Decorate the outermost array type with its stride, if one was computed.
  5133. if (stride > 0)
  5134. builder.addDecoration(spvType, spv::Decoration::ArrayStride, stride);
  5135. }
  5136. return spvType;
  5137. }
  5138. // Apply SPIR-V decorations to the SPIR-V object (provided by SPIR-V ID). If member index is provided, the
  5139. // decorations are applied to this member.
  5140. void TGlslangToSpvTraverser::applySpirvDecorate(const glslang::TType& type, spv::Id id, std::optional<int> member)
  5141. {
  5142. assert(type.getQualifier().hasSpirvDecorate());
  5143. const glslang::TSpirvDecorate& spirvDecorate = type.getQualifier().getSpirvDecorate();
  5144. // Add spirv_decorate
  5145. for (auto& decorate : spirvDecorate.decorates) {
  5146. if (!decorate.second.empty()) {
  5147. std::vector<unsigned> literals;
  5148. TranslateLiterals(decorate.second, literals);
  5149. if (member.has_value())
  5150. builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorate.first), literals);
  5151. else
  5152. builder.addDecoration(id, static_cast<spv::Decoration>(decorate.first), literals);
  5153. } else {
  5154. if (member.has_value())
  5155. builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorate.first));
  5156. else
  5157. builder.addDecoration(id, static_cast<spv::Decoration>(decorate.first));
  5158. }
  5159. }
  5160. // Add spirv_decorate_id
  5161. if (member.has_value()) {
  5162. // spirv_decorate_id not applied to members
  5163. assert(spirvDecorate.decorateIds.empty());
  5164. } else {
  5165. for (auto& decorateId : spirvDecorate.decorateIds) {
  5166. std::vector<spv::Id> operandIds;
  5167. assert(!decorateId.second.empty());
  5168. for (auto extraOperand : decorateId.second) {
  5169. if (extraOperand->getQualifier().isFrontEndConstant())
  5170. operandIds.push_back(createSpvConstant(*extraOperand));
  5171. else
  5172. operandIds.push_back(getSymbolId(extraOperand->getAsSymbolNode()));
  5173. }
  5174. builder.addDecorationId(id, static_cast<spv::Decoration>(decorateId.first), operandIds);
  5175. }
  5176. }
  5177. // Add spirv_decorate_string
  5178. for (auto& decorateString : spirvDecorate.decorateStrings) {
  5179. std::vector<const char*> strings;
  5180. assert(!decorateString.second.empty());
  5181. for (auto extraOperand : decorateString.second) {
  5182. const char* string = extraOperand->getConstArray()[0].getSConst()->c_str();
  5183. strings.push_back(string);
  5184. }
  5185. if (member.has_value())
  5186. builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorateString.first), strings);
  5187. else
  5188. builder.addDecoration(id, static_cast<spv::Decoration>(decorateString.first), strings);
  5189. }
  5190. }
  5191. // TODO: this functionality should exist at a higher level, in creating the AST
  5192. //
  5193. // Identify interface members that don't have their required extension turned on.
  5194. //
  5195. bool TGlslangToSpvTraverser::filterMember(const glslang::TType& member)
  5196. {
  5197. auto& extensions = glslangIntermediate->getRequestedExtensions();
  5198. if (member.getFieldName() == "gl_SecondaryViewportMaskNV" &&
  5199. extensions.find("GL_NV_stereo_view_rendering") == extensions.end())
  5200. return true;
  5201. if (member.getFieldName() == "gl_SecondaryPositionNV" &&
  5202. extensions.find("GL_NV_stereo_view_rendering") == extensions.end())
  5203. return true;
  5204. if (glslangIntermediate->getStage() == EShLangMesh) {
  5205. if (member.getFieldName() == "gl_PrimitiveShadingRateEXT" &&
  5206. extensions.find("GL_EXT_fragment_shading_rate") == extensions.end())
  5207. return true;
  5208. }
  5209. if (glslangIntermediate->getStage() != EShLangMesh) {
  5210. if (member.getFieldName() == "gl_ViewportMask" &&
  5211. extensions.find("GL_NV_viewport_array2") == extensions.end())
  5212. return true;
  5213. if (member.getFieldName() == "gl_PositionPerViewNV" &&
  5214. extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())
  5215. return true;
  5216. if (member.getFieldName() == "gl_ViewportMaskPerViewNV" &&
  5217. extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())
  5218. return true;
  5219. }
  5220. return false;
  5221. }
  5222. // Do full recursive conversion of a glslang structure (or block) type to a SPIR-V Id.
  5223. // explicitLayout can be kept the same throughout the hierarchical recursive walk.
  5224. // Mutually recursive with convertGlslangToSpvType().
  5225. spv::Id TGlslangToSpvTraverser::convertGlslangStructToSpvType(const glslang::TType& type,
  5226. const glslang::TTypeList* glslangMembers,
  5227. glslang::TLayoutPacking explicitLayout,
  5228. const glslang::TQualifier& qualifier)
  5229. {
  5230. // Create a vector of struct types for SPIR-V to consume
  5231. std::vector<spv::Id> spvMembers;
  5232. int memberDelta = 0; // how much the member's index changes from glslang to SPIR-V, normally 0,
  5233. // except sometimes for blocks
  5234. std::vector<std::pair<glslang::TType*, glslang::TQualifier> > deferredForwardPointers;
  5235. std::vector<spv::StructMemberDebugInfo> memberDebugInfo;
  5236. for (int i = 0; i < (int)glslangMembers->size(); i++) {
  5237. auto& glslangMember = (*glslangMembers)[i];
  5238. if (glslangMember.type->hiddenMember()) {
  5239. ++memberDelta;
  5240. if (type.getBasicType() == glslang::EbtBlock)
  5241. memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = -1;
  5242. } else {
  5243. if (type.getBasicType() == glslang::EbtBlock) {
  5244. if (filterMember(*glslangMember.type)) {
  5245. memberDelta++;
  5246. memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = -1;
  5247. continue;
  5248. }
  5249. memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = i - memberDelta;
  5250. }
  5251. // modify just this child's view of the qualifier
  5252. glslang::TQualifier memberQualifier = glslangMember.type->getQualifier();
  5253. InheritQualifiers(memberQualifier, qualifier);
  5254. // manually inherit location
  5255. if (! memberQualifier.hasLocation() && qualifier.hasLocation())
  5256. memberQualifier.layoutLocation = qualifier.layoutLocation;
  5257. // recurse
  5258. bool lastBufferBlockMember = qualifier.storage == glslang::EvqBuffer &&
  5259. i == (int)glslangMembers->size() - 1;
  5260. // Make forward pointers for any pointer members.
  5261. if (glslangMember.type->isReference() &&
  5262. forwardPointers.find(glslangMember.type->getReferentType()) == forwardPointers.end()) {
  5263. deferredForwardPointers.push_back(std::make_pair(glslangMember.type, memberQualifier));
  5264. }
  5265. // Create the member type.
  5266. auto const spvMember = convertGlslangToSpvType(*glslangMember.type, explicitLayout, memberQualifier, lastBufferBlockMember,
  5267. glslangMember.type->isReference());
  5268. spvMembers.push_back(spvMember);
  5269. // Update the builder with the type's location so that we can create debug types for the structure members.
  5270. // There doesn't exist a "clean" entry point for this information to be passed along to the builder so, for now,
  5271. // it is stored in the builder and consumed during the construction of composite debug types.
  5272. // TODO: This probably warrants further investigation. This approach was decided to be the least ugly of the
  5273. // quick and dirty approaches that were tried.
  5274. // Advantages of this approach:
  5275. // + Relatively clean. No direct calls into debug type system.
  5276. // + Handles nested recursive structures.
  5277. // Disadvantages of this approach:
  5278. // + Not as clean as desired. Traverser queries/sets persistent state. This is fragile.
  5279. // + Table lookup during creation of composite debug types. This really shouldn't be necessary.
  5280. if(options.emitNonSemanticShaderDebugInfo) {
  5281. spv::StructMemberDebugInfo debugInfo{};
  5282. debugInfo.name = glslangMember.type->getFieldName();
  5283. debugInfo.line = glslangMember.loc.line;
  5284. debugInfo.column = glslangMember.loc.column;
  5285. // Per the GLSL spec, bool variables inside of a uniform or buffer block are generated as uint.
  5286. // But for debug info, we want to represent them as bool because that is the original type in
  5287. // the source code. The bool type can be nested within a vector or a multidimensional array,
  5288. // so we must construct the chain of types up from the scalar bool.
  5289. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl && explicitLayout != glslang::ElpNone &&
  5290. glslangMember.type->getBasicType() == glslang::EbtBool) {
  5291. auto typeId = builder.makeBoolType();
  5292. if (glslangMember.type->isVector()) {
  5293. typeId = builder.makeVectorType(typeId, glslangMember.type->getVectorSize());
  5294. }
  5295. if (glslangMember.type->isArray()) {
  5296. const auto* arraySizes = glslangMember.type->getArraySizes();
  5297. int dims = arraySizes->getNumDims();
  5298. for (int i = dims - 1; i >= 0; --i) {
  5299. spv::Id size = builder.makeIntConstant(arraySizes->getDimSize(i));
  5300. typeId = builder.makeArrayType(typeId, size, 0);
  5301. }
  5302. }
  5303. debugInfo.debugTypeOverride = builder.getDebugType(typeId);
  5304. }
  5305. memberDebugInfo.push_back(debugInfo);
  5306. }
  5307. }
  5308. }
  5309. // Make the SPIR-V type
  5310. spv::Id spvType = builder.makeStructType(spvMembers, memberDebugInfo, type.getTypeName().c_str(), false);
  5311. if (! HasNonLayoutQualifiers(type, qualifier))
  5312. structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers] = spvType;
  5313. // Decorate it
  5314. decorateStructType(type, glslangMembers, explicitLayout, qualifier, spvType, spvMembers);
  5315. for (int i = 0; i < (int)deferredForwardPointers.size(); ++i) {
  5316. auto it = deferredForwardPointers[i];
  5317. convertGlslangToSpvType(*it.first, explicitLayout, it.second, false);
  5318. }
  5319. return spvType;
  5320. }
  5321. void TGlslangToSpvTraverser::decorateStructType(const glslang::TType& type,
  5322. const glslang::TTypeList* glslangMembers,
  5323. glslang::TLayoutPacking explicitLayout,
  5324. const glslang::TQualifier& qualifier,
  5325. spv::Id spvType,
  5326. const std::vector<spv::Id>& spvMembers)
  5327. {
  5328. // Name and decorate the non-hidden members
  5329. int offset = -1;
  5330. bool memberLocationInvalid = type.isArrayOfArrays() ||
  5331. (type.isArray() && (type.getQualifier().isArrayedIo(glslangIntermediate->getStage()) == false));
  5332. for (int i = 0; i < (int)glslangMembers->size(); i++) {
  5333. glslang::TType& glslangMember = *(*glslangMembers)[i].type;
  5334. int member = i;
  5335. if (type.getBasicType() == glslang::EbtBlock) {
  5336. member = memberRemapper[glslangTypeToIdMap[glslangMembers]][i];
  5337. if (filterMember(glslangMember))
  5338. continue;
  5339. }
  5340. // modify just this child's view of the qualifier
  5341. glslang::TQualifier memberQualifier = glslangMember.getQualifier();
  5342. InheritQualifiers(memberQualifier, qualifier);
  5343. // using -1 above to indicate a hidden member
  5344. if (member < 0)
  5345. continue;
  5346. builder.addMemberName(spvType, member, glslangMember.getFieldName().c_str());
  5347. builder.addMemberDecoration(spvType, member,
  5348. TranslateLayoutDecoration(glslangMember, memberQualifier.layoutMatrix));
  5349. builder.addMemberDecoration(spvType, member, TranslatePrecisionDecoration(glslangMember));
  5350. // Add interpolation and auxiliary storage decorations only to
  5351. // top-level members of Input and Output storage classes
  5352. if (type.getQualifier().storage == glslang::EvqVaryingIn ||
  5353. type.getQualifier().storage == glslang::EvqVaryingOut) {
  5354. if (type.getBasicType() == glslang::EbtBlock ||
  5355. glslangIntermediate->getSource() == glslang::EShSourceHlsl) {
  5356. builder.addMemberDecoration(spvType, member, TranslateInterpolationDecoration(memberQualifier));
  5357. builder.addMemberDecoration(spvType, member, TranslateAuxiliaryStorageDecoration(memberQualifier));
  5358. addMeshNVDecoration(spvType, member, memberQualifier);
  5359. }
  5360. }
  5361. builder.addMemberDecoration(spvType, member, TranslateInvariantDecoration(memberQualifier));
  5362. if (type.getBasicType() == glslang::EbtBlock &&
  5363. qualifier.storage == glslang::EvqBuffer) {
  5364. // Add memory decorations only to top-level members of shader storage block
  5365. std::vector<spv::Decoration> memory;
  5366. TranslateMemoryDecoration(memberQualifier, memory, glslangIntermediate->usingVulkanMemoryModel());
  5367. for (unsigned int i = 0; i < memory.size(); ++i)
  5368. builder.addMemberDecoration(spvType, member, memory[i]);
  5369. }
  5370. // Location assignment was already completed correctly by the front end,
  5371. // just track whether a member needs to be decorated.
  5372. // Ignore member locations if the container is an array, as that's
  5373. // ill-specified and decisions have been made to not allow this.
  5374. if (!memberLocationInvalid && memberQualifier.hasLocation())
  5375. builder.addMemberDecoration(spvType, member, spv::Decoration::Location, memberQualifier.layoutLocation);
  5376. // component, XFB, others
  5377. if (glslangMember.getQualifier().hasComponent())
  5378. builder.addMemberDecoration(spvType, member, spv::Decoration::Component,
  5379. glslangMember.getQualifier().layoutComponent);
  5380. if (glslangMember.getQualifier().hasXfbOffset())
  5381. builder.addMemberDecoration(spvType, member, spv::Decoration::Offset,
  5382. glslangMember.getQualifier().layoutXfbOffset);
  5383. else if (explicitLayout != glslang::ElpNone) {
  5384. // figure out what to do with offset, which is accumulating
  5385. int nextOffset;
  5386. updateMemberOffset(type, glslangMember, offset, nextOffset, explicitLayout, memberQualifier.layoutMatrix);
  5387. if (offset >= 0)
  5388. builder.addMemberDecoration(spvType, member, spv::Decoration::Offset, offset);
  5389. offset = nextOffset;
  5390. }
  5391. if (glslangMember.isMatrix() && explicitLayout != glslang::ElpNone)
  5392. builder.addMemberDecoration(spvType, member, spv::Decoration::MatrixStride,
  5393. getMatrixStride(glslangMember, explicitLayout, memberQualifier.layoutMatrix));
  5394. // built-in variable decorations
  5395. spv::BuiltIn builtIn = TranslateBuiltInDecoration(glslangMember.getQualifier().builtIn, true);
  5396. if (builtIn != spv::BuiltIn::Max)
  5397. builder.addMemberDecoration(spvType, member, spv::Decoration::BuiltIn, (int)builtIn);
  5398. // nonuniform
  5399. builder.addMemberDecoration(spvType, member, TranslateNonUniformDecoration(glslangMember.getQualifier()));
  5400. if (glslangIntermediate->getHlslFunctionality1() && memberQualifier.semanticName != nullptr) {
  5401. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  5402. builder.addMemberDecoration(spvType, member, spv::Decoration::HlslSemanticGOOGLE,
  5403. memberQualifier.semanticName);
  5404. }
  5405. if (builtIn == spv::BuiltIn::Layer) {
  5406. // SPV_NV_viewport_array2 extension
  5407. if (glslangMember.getQualifier().layoutViewportRelative){
  5408. builder.addMemberDecoration(spvType, member, spv::Decoration::ViewportRelativeNV);
  5409. builder.addCapability(spv::Capability::ShaderViewportMaskNV);
  5410. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  5411. }
  5412. if (glslangMember.getQualifier().layoutSecondaryViewportRelativeOffset != -2048){
  5413. builder.addMemberDecoration(spvType, member,
  5414. spv::Decoration::SecondaryViewportRelativeNV,
  5415. glslangMember.getQualifier().layoutSecondaryViewportRelativeOffset);
  5416. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  5417. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  5418. }
  5419. }
  5420. if (glslangMember.getQualifier().layoutPassthrough) {
  5421. builder.addMemberDecoration(spvType, member, spv::Decoration::PassthroughNV);
  5422. builder.addCapability(spv::Capability::GeometryShaderPassthroughNV);
  5423. builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);
  5424. }
  5425. // Add SPIR-V decorations (GL_EXT_spirv_intrinsics)
  5426. if (glslangMember.getQualifier().hasSpirvDecorate())
  5427. applySpirvDecorate(glslangMember, spvType, member);
  5428. }
  5429. // Decorate the structure
  5430. builder.addDecoration(spvType, TranslateLayoutDecoration(type, qualifier.layoutMatrix));
  5431. const auto basicType = type.getBasicType();
  5432. const auto typeStorageQualifier = type.getQualifier().storage;
  5433. if (basicType == glslang::EbtBlock) {
  5434. builder.addDecoration(spvType, TranslateBlockDecoration(typeStorageQualifier, glslangIntermediate->usingStorageBuffer()));
  5435. } else if (basicType == glslang::EbtStruct && glslangIntermediate->getSpv().vulkan > 0) {
  5436. const auto hasRuntimeArray = !spvMembers.empty() && builder.getOpCode(spvMembers.back()) == spv::Op::OpTypeRuntimeArray;
  5437. if (hasRuntimeArray) {
  5438. builder.addDecoration(spvType, TranslateBlockDecoration(typeStorageQualifier, glslangIntermediate->usingStorageBuffer()));
  5439. }
  5440. }
  5441. if (qualifier.hasHitObjectShaderRecordNV())
  5442. builder.addDecoration(spvType, spv::Decoration::HitObjectShaderRecordBufferNV);
  5443. if (qualifier.hasHitObjectShaderRecordEXT())
  5444. builder.addDecoration(spvType, spv::Decoration::HitObjectShaderRecordBufferEXT);
  5445. }
  5446. // Turn the expression forming the array size into an id.
  5447. // This is not quite trivial, because of specialization constants.
  5448. // Sometimes, a raw constant is turned into an Id, and sometimes
  5449. // a specialization constant expression is.
  5450. spv::Id TGlslangToSpvTraverser::makeArraySizeId(const glslang::TArraySizes& arraySizes, int dim, bool allowZero, bool boolType)
  5451. {
  5452. // First, see if this is sized with a node, meaning a specialization constant:
  5453. glslang::TIntermTyped* specNode = arraySizes.getDimNode(dim);
  5454. if (specNode != nullptr) {
  5455. builder.clearAccessChain();
  5456. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  5457. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  5458. specNode->traverse(this);
  5459. return accessChainLoad(specNode->getAsTyped()->getType());
  5460. }
  5461. // Otherwise, need a compile-time (front end) size, get it:
  5462. int size = arraySizes.getDimSize(dim);
  5463. if (!allowZero)
  5464. assert(size > 0);
  5465. if (boolType) {
  5466. return builder.makeBoolConstant(size);
  5467. } else {
  5468. return builder.makeUintConstant(size);
  5469. }
  5470. }
  5471. // Wrap the builder's accessChainLoad to:
  5472. // - localize handling of RelaxedPrecision
  5473. // - use the SPIR-V inferred type instead of another conversion of the glslang type
  5474. // (avoids unnecessary work and possible type punning for structures)
  5475. // - do conversion of concrete to abstract type
  5476. spv::Id TGlslangToSpvTraverser::accessChainLoad(const glslang::TType& type)
  5477. {
  5478. spv::Id nominalTypeId = builder.accessChainGetInferredType();
  5479. spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
  5480. coherentFlags |= TranslateCoherent(type);
  5481. spv::MemoryAccessMask accessMask = spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) & ~spv::MemoryAccessMask::MakePointerAvailableKHR);
  5482. // If the value being loaded is HelperInvocation, SPIR-V 1.6 is being generated (so that
  5483. // SPV_EXT_demote_to_helper_invocation is in core) and the memory model is in use, add
  5484. // the Volatile MemoryAccess semantic.
  5485. if (type.getQualifier().builtIn == glslang::EbvHelperInvocation &&
  5486. glslangIntermediate->usingVulkanMemoryModel() &&
  5487. glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  5488. accessMask = spv::MemoryAccessMask(accessMask | spv::MemoryAccessMask::Volatile);
  5489. }
  5490. unsigned int alignment = builder.getAccessChain().alignment;
  5491. alignment |= type.getBufferReferenceAlignment();
  5492. spv::Id loadedId = builder.accessChainLoad(TranslatePrecisionDecoration(type),
  5493. TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags),
  5494. TranslateNonUniformDecoration(type.getQualifier()),
  5495. nominalTypeId,
  5496. accessMask,
  5497. TranslateMemoryScope(coherentFlags),
  5498. alignment);
  5499. // Need to convert to abstract types when necessary
  5500. if (type.getBasicType() == glslang::EbtBool) {
  5501. loadedId = convertLoadedBoolInUniformToUint(type, nominalTypeId, loadedId);
  5502. }
  5503. return loadedId;
  5504. }
  5505. // Wrap the builder's accessChainStore to:
  5506. // - do conversion of concrete to abstract type
  5507. //
  5508. // Implicitly uses the existing builder.accessChain as the storage target.
  5509. void TGlslangToSpvTraverser::accessChainStore(const glslang::TType& type, spv::Id rvalue)
  5510. {
  5511. // Need to convert to abstract types when necessary
  5512. if (type.getBasicType() == glslang::EbtBool) {
  5513. spv::Id nominalTypeId = builder.accessChainGetInferredType();
  5514. if (builder.isScalarType(nominalTypeId)) {
  5515. // Conversion for bool
  5516. spv::Id boolType = builder.makeBoolType();
  5517. if (nominalTypeId != boolType) {
  5518. // keep these outside arguments, for determinant order-of-evaluation
  5519. spv::Id one = builder.makeUintConstant(1);
  5520. spv::Id zero = builder.makeUintConstant(0);
  5521. rvalue = builder.createTriOp(spv::Op::OpSelect, nominalTypeId, rvalue, one, zero);
  5522. } else if (builder.getTypeId(rvalue) != boolType)
  5523. rvalue = builder.createBinOp(spv::Op::OpINotEqual, boolType, rvalue, builder.makeUintConstant(0));
  5524. } else if (builder.isVectorType(nominalTypeId)) {
  5525. // Conversion for bvec
  5526. int vecSize = builder.getNumTypeComponents(nominalTypeId);
  5527. spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);
  5528. if (nominalTypeId != bvecType) {
  5529. // keep these outside arguments, for determinant order-of-evaluation
  5530. spv::Id one = makeSmearedConstant(builder.makeUintConstant(1), vecSize);
  5531. spv::Id zero = makeSmearedConstant(builder.makeUintConstant(0), vecSize);
  5532. rvalue = builder.createTriOp(spv::Op::OpSelect, nominalTypeId, rvalue, one, zero);
  5533. } else if (builder.getTypeId(rvalue) != bvecType)
  5534. rvalue = builder.createBinOp(spv::Op::OpINotEqual, bvecType, rvalue,
  5535. makeSmearedConstant(builder.makeUintConstant(0), vecSize));
  5536. }
  5537. }
  5538. spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
  5539. coherentFlags |= TranslateCoherent(type);
  5540. unsigned int alignment = builder.getAccessChain().alignment;
  5541. alignment |= type.getBufferReferenceAlignment();
  5542. builder.accessChainStore(rvalue, TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags),
  5543. spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) &
  5544. ~spv::MemoryAccessMask::MakePointerVisibleKHR),
  5545. TranslateMemoryScope(coherentFlags), alignment);
  5546. }
  5547. // For storing when types match at the glslang level, but not might match at the
  5548. // SPIR-V level.
  5549. //
  5550. // This especially happens when a single glslang type expands to multiple
  5551. // SPIR-V types, like a struct that is used in a member-undecorated way as well
  5552. // as in a member-decorated way.
  5553. //
  5554. // NOTE: This function can handle any store request; if it's not special it
  5555. // simplifies to a simple OpStore.
  5556. //
  5557. // Implicitly uses the existing builder.accessChain as the storage target.
  5558. void TGlslangToSpvTraverser::multiTypeStore(const glslang::TType& type, spv::Id rValue)
  5559. {
  5560. // we only do the complex path here if it's an aggregate
  5561. if (! type.isStruct() && ! type.isArray()) {
  5562. accessChainStore(type, rValue);
  5563. return;
  5564. }
  5565. // and, it has to be a case of type aliasing
  5566. spv::Id rType = builder.getTypeId(rValue);
  5567. spv::Id lValue = builder.accessChainGetLValue();
  5568. spv::Id lType = builder.getContainedTypeId(builder.getTypeId(lValue));
  5569. if (lType == rType) {
  5570. accessChainStore(type, rValue);
  5571. return;
  5572. }
  5573. // Recursively (as needed) copy an aggregate type to a different aggregate type,
  5574. // where the two types were the same type in GLSL. This requires member
  5575. // by member copy, recursively.
  5576. // SPIR-V 1.4 added an instruction to do help do this.
  5577. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  5578. // However, bool in uniform space is changed to int, so
  5579. // OpCopyLogical does not work for that.
  5580. // TODO: It would be more robust to do a full recursive verification of the types satisfying SPIR-V rules.
  5581. bool rBool = builder.containsType(builder.getTypeId(rValue), spv::Op::OpTypeBool, 0);
  5582. bool lBool = builder.containsType(lType, spv::Op::OpTypeBool, 0);
  5583. if (lBool == rBool) {
  5584. spv::Id logicalCopy = builder.createUnaryOp(spv::Op::OpCopyLogical, lType, rValue);
  5585. accessChainStore(type, logicalCopy);
  5586. return;
  5587. }
  5588. }
  5589. // If an array, copy element by element.
  5590. if (type.isArray()) {
  5591. glslang::TType glslangElementType(type, 0);
  5592. spv::Id elementRType = builder.getContainedTypeId(rType);
  5593. for (int index = 0; index < type.getOuterArraySize(); ++index) {
  5594. // get the source member
  5595. spv::Id elementRValue = builder.createCompositeExtract(rValue, elementRType, index);
  5596. // set up the target storage
  5597. builder.clearAccessChain();
  5598. builder.setAccessChainLValue(lValue);
  5599. builder.accessChainPush(builder.makeIntConstant(index), TranslateCoherent(type),
  5600. type.getBufferReferenceAlignment());
  5601. // store the member
  5602. multiTypeStore(glslangElementType, elementRValue);
  5603. }
  5604. } else {
  5605. assert(type.isStruct());
  5606. // loop over structure members
  5607. const glslang::TTypeList& members = *type.getStruct();
  5608. for (int m = 0; m < (int)members.size(); ++m) {
  5609. const glslang::TType& glslangMemberType = *members[m].type;
  5610. // get the source member
  5611. spv::Id memberRType = builder.getContainedTypeId(rType, m);
  5612. spv::Id memberRValue = builder.createCompositeExtract(rValue, memberRType, m);
  5613. // set up the target storage
  5614. builder.clearAccessChain();
  5615. builder.setAccessChainLValue(lValue);
  5616. builder.accessChainPush(builder.makeIntConstant(m), TranslateCoherent(type),
  5617. type.getBufferReferenceAlignment());
  5618. // store the member
  5619. multiTypeStore(glslangMemberType, memberRValue);
  5620. }
  5621. }
  5622. }
  5623. // Decide whether or not this type should be
  5624. // decorated with offsets and strides, and if so
  5625. // whether std140 or std430 rules should be applied.
  5626. glslang::TLayoutPacking TGlslangToSpvTraverser::getExplicitLayout(const glslang::TType& type) const
  5627. {
  5628. // has to be a block
  5629. if (type.getBasicType() != glslang::EbtBlock)
  5630. return glslang::ElpNone;
  5631. // has to be a uniform or buffer block or task in/out blocks
  5632. if (type.getQualifier().storage != glslang::EvqUniform &&
  5633. type.getQualifier().storage != glslang::EvqBuffer &&
  5634. type.getQualifier().storage != glslang::EvqShared &&
  5635. !type.getQualifier().isTaskMemory())
  5636. return glslang::ElpNone;
  5637. // return the layout to use
  5638. switch (type.getQualifier().layoutPacking) {
  5639. case glslang::ElpStd140:
  5640. case glslang::ElpStd430:
  5641. case glslang::ElpScalar:
  5642. return type.getQualifier().layoutPacking;
  5643. default:
  5644. return glslang::ElpNone;
  5645. }
  5646. }
  5647. // Given an array type, returns the integer stride required for that array
  5648. int TGlslangToSpvTraverser::getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking explicitLayout,
  5649. glslang::TLayoutMatrix matrixLayout)
  5650. {
  5651. int size;
  5652. int stride;
  5653. glslangIntermediate->getMemberAlignment(arrayType, size, stride, explicitLayout,
  5654. matrixLayout == glslang::ElmRowMajor);
  5655. return stride;
  5656. }
  5657. // Given a matrix type, or array (of array) of matrixes type, returns the integer stride required for that matrix
  5658. // when used as a member of an interface block
  5659. int TGlslangToSpvTraverser::getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking explicitLayout,
  5660. glslang::TLayoutMatrix matrixLayout)
  5661. {
  5662. glslang::TType elementType;
  5663. elementType.shallowCopy(matrixType);
  5664. elementType.clearArraySizes();
  5665. int size;
  5666. int stride;
  5667. glslangIntermediate->getMemberAlignment(elementType, size, stride, explicitLayout,
  5668. matrixLayout == glslang::ElmRowMajor);
  5669. return stride;
  5670. }
  5671. // Given a member type of a struct, realign the current offset for it, and compute
  5672. // the next (not yet aligned) offset for the next member, which will get aligned
  5673. // on the next call.
  5674. // 'currentOffset' should be passed in already initialized, ready to modify, and reflecting
  5675. // the migration of data from nextOffset -> currentOffset. It should be -1 on the first call.
  5676. // -1 means a non-forced member offset (no decoration needed).
  5677. void TGlslangToSpvTraverser::updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType,
  5678. int& currentOffset, int& nextOffset, glslang::TLayoutPacking explicitLayout, glslang::TLayoutMatrix matrixLayout)
  5679. {
  5680. // this will get a positive value when deemed necessary
  5681. nextOffset = -1;
  5682. // override anything in currentOffset with user-set offset
  5683. if (memberType.getQualifier().hasOffset())
  5684. currentOffset = memberType.getQualifier().layoutOffset;
  5685. // It could be that current linker usage in glslang updated all the layoutOffset,
  5686. // in which case the following code does not matter. But, that's not quite right
  5687. // once cross-compilation unit GLSL validation is done, as the original user
  5688. // settings are needed in layoutOffset, and then the following will come into play.
  5689. if (explicitLayout == glslang::ElpNone) {
  5690. if (! memberType.getQualifier().hasOffset())
  5691. currentOffset = -1;
  5692. return;
  5693. }
  5694. // Getting this far means we need explicit offsets
  5695. if (currentOffset < 0)
  5696. currentOffset = 0;
  5697. // Now, currentOffset is valid (either 0, or from a previous nextOffset),
  5698. // but possibly not yet correctly aligned.
  5699. int memberSize;
  5700. int dummyStride;
  5701. int memberAlignment = glslangIntermediate->getMemberAlignment(memberType, memberSize, dummyStride, explicitLayout,
  5702. matrixLayout == glslang::ElmRowMajor);
  5703. bool isVectorLike = memberType.isVector();
  5704. if (memberType.isMatrix()) {
  5705. if (matrixLayout == glslang::ElmRowMajor)
  5706. isVectorLike = memberType.getMatrixRows() == 1;
  5707. else
  5708. isVectorLike = memberType.getMatrixCols() == 1;
  5709. }
  5710. // Adjust alignment for HLSL rules
  5711. // TODO: make this consistent in early phases of code:
  5712. // adjusting this late means inconsistencies with earlier code, which for reflection is an issue
  5713. // Until reflection is brought in sync with these adjustments, don't apply to $Global,
  5714. // which is the most likely to rely on reflection, and least likely to rely implicit layouts
  5715. if (glslangIntermediate->usingHlslOffsets() &&
  5716. ! memberType.isStruct() && structType.getTypeName().compare("$Global") != 0) {
  5717. int componentSize;
  5718. int componentAlignment = glslangIntermediate->getBaseAlignmentScalar(memberType, componentSize);
  5719. if (! memberType.isArray() && isVectorLike && componentAlignment <= 4)
  5720. memberAlignment = componentAlignment;
  5721. // Don't add unnecessary padding after this member
  5722. // (undo std140 bumping size to a mutliple of vec4)
  5723. if (explicitLayout == glslang::ElpStd140) {
  5724. if (memberType.isMatrix()) {
  5725. if (matrixLayout == glslang::ElmRowMajor)
  5726. memberSize -= componentSize * (4 - memberType.getMatrixCols());
  5727. else
  5728. memberSize -= componentSize * (4 - memberType.getMatrixRows());
  5729. } else if (memberType.isArray())
  5730. memberSize -= componentSize * (4 - memberType.getVectorSize());
  5731. }
  5732. }
  5733. // Bump up to member alignment
  5734. glslang::RoundToPow2(currentOffset, memberAlignment);
  5735. // Bump up to vec4 if there is a bad straddle
  5736. if (explicitLayout != glslang::ElpScalar && glslangIntermediate->improperStraddle(memberType, memberSize,
  5737. currentOffset, isVectorLike))
  5738. glslang::RoundToPow2(currentOffset, 16);
  5739. nextOffset = currentOffset + memberSize;
  5740. }
  5741. void TGlslangToSpvTraverser::declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember)
  5742. {
  5743. const glslang::TBuiltInVariable glslangBuiltIn = members[glslangMember].type->getQualifier().builtIn;
  5744. switch (glslangBuiltIn)
  5745. {
  5746. case glslang::EbvPointSize:
  5747. case glslang::EbvClipDistance:
  5748. case glslang::EbvCullDistance:
  5749. case glslang::EbvViewportMaskNV:
  5750. case glslang::EbvSecondaryPositionNV:
  5751. case glslang::EbvSecondaryViewportMaskNV:
  5752. case glslang::EbvPositionPerViewNV:
  5753. case glslang::EbvViewportMaskPerViewNV:
  5754. case glslang::EbvTaskCountNV:
  5755. case glslang::EbvPrimitiveCountNV:
  5756. case glslang::EbvPrimitiveIndicesNV:
  5757. case glslang::EbvClipDistancePerViewNV:
  5758. case glslang::EbvCullDistancePerViewNV:
  5759. case glslang::EbvLayerPerViewNV:
  5760. case glslang::EbvMeshViewCountNV:
  5761. case glslang::EbvMeshViewIndicesNV:
  5762. // Generate the associated capability. Delegate to TranslateBuiltInDecoration.
  5763. // Alternately, we could just call this for any glslang built-in, since the
  5764. // capability already guards against duplicates.
  5765. TranslateBuiltInDecoration(glslangBuiltIn, false);
  5766. break;
  5767. default:
  5768. // Capabilities were already generated when the struct was declared.
  5769. break;
  5770. }
  5771. }
  5772. bool TGlslangToSpvTraverser::isShaderEntryPoint(const glslang::TIntermAggregate* node)
  5773. {
  5774. return node->getName().compare(glslangIntermediate->getEntryPointMangledName().c_str()) == 0;
  5775. }
  5776. // Does parameter need a place to keep writes, separate from the original?
  5777. // Assumes called after originalParam(), which filters out block/buffer/opaque-based
  5778. // qualifiers such that we should have only in/out/inout/constreadonly here.
  5779. bool TGlslangToSpvTraverser::writableParam(glslang::TStorageQualifier qualifier) const
  5780. {
  5781. assert(qualifier == glslang::EvqIn ||
  5782. qualifier == glslang::EvqOut ||
  5783. qualifier == glslang::EvqInOut ||
  5784. qualifier == glslang::EvqUniform ||
  5785. qualifier == glslang::EvqConstReadOnly);
  5786. return qualifier != glslang::EvqConstReadOnly &&
  5787. qualifier != glslang::EvqUniform;
  5788. }
  5789. // Is parameter pass-by-original?
  5790. bool TGlslangToSpvTraverser::originalParam(glslang::TStorageQualifier qualifier, const glslang::TType& paramType,
  5791. bool implicitThisParam)
  5792. {
  5793. if (implicitThisParam) // implicit this
  5794. return true;
  5795. if (glslangIntermediate->getSource() == glslang::EShSourceHlsl)
  5796. return paramType.getBasicType() == glslang::EbtBlock;
  5797. return (paramType.containsOpaque() && !glslangIntermediate->getBindlessMode()) || // sampler, etc.
  5798. paramType.getQualifier().isSpirvByReference() || // spirv_by_reference
  5799. (paramType.getBasicType() == glslang::EbtBlock && qualifier == glslang::EvqBuffer); // SSBO
  5800. }
  5801. // Make all the functions, skeletally, without actually visiting their bodies.
  5802. void TGlslangToSpvTraverser::makeFunctions(const glslang::TIntermSequence& glslFunctions)
  5803. {
  5804. const auto getParamDecorations = [&](std::vector<spv::Decoration>& decorations, const glslang::TType& type,
  5805. bool useVulkanMemoryModel) {
  5806. spv::Decoration paramPrecision = TranslatePrecisionDecoration(type);
  5807. if (paramPrecision != spv::NoPrecision)
  5808. decorations.push_back(paramPrecision);
  5809. TranslateMemoryDecoration(type.getQualifier(), decorations, useVulkanMemoryModel);
  5810. if (type.isReference()) {
  5811. // Original and non-writable params pass the pointer directly and
  5812. // use restrict/aliased, others are stored to a pointer in Function
  5813. // memory and use RestrictPointer/AliasedPointer.
  5814. if (originalParam(type.getQualifier().storage, type, false) ||
  5815. !writableParam(type.getQualifier().storage)) {
  5816. // TranslateMemoryDecoration added Restrict decoration already.
  5817. if (!type.getQualifier().isRestrict()) {
  5818. decorations.push_back(spv::Decoration::Aliased);
  5819. }
  5820. } else {
  5821. decorations.push_back(type.getQualifier().isRestrict() ? spv::Decoration::RestrictPointerEXT :
  5822. spv::Decoration::AliasedPointerEXT);
  5823. }
  5824. }
  5825. };
  5826. for (int f = 0; f < (int)glslFunctions.size(); ++f) {
  5827. glslang::TIntermAggregate* glslFunction = glslFunctions[f]->getAsAggregate();
  5828. if (! glslFunction || glslFunction->getOp() != glslang::EOpFunction)
  5829. continue;
  5830. builder.setDebugSourceLocation(glslFunction->getLoc().line, glslFunction->getLoc().getFilename());
  5831. if (isShaderEntryPoint(glslFunction)) {
  5832. // For HLSL, the entry function is actually a compiler generated function to resolve the difference of
  5833. // entry function signature between HLSL and SPIR-V. So we don't emit debug information for that.
  5834. if (glslangIntermediate->getSource() != glslang::EShSourceHlsl) {
  5835. builder.setupFunctionDebugInfo(shaderEntry, glslangIntermediate->getEntryPointMangledName().c_str(),
  5836. std::vector<spv::Id>(), // main function has no param
  5837. std::vector<char const*>());
  5838. }
  5839. continue;
  5840. }
  5841. // We're on a user function. Set up the basic interface for the function now,
  5842. // so that it's available to call. Translating the body will happen later.
  5843. //
  5844. // Typically (except for a "const in" parameter), an address will be passed to the
  5845. // function. What it is an address of varies:
  5846. //
  5847. // - "in" parameters not marked as "const" can be written to without modifying the calling
  5848. // argument so that write needs to be to a copy, hence the address of a copy works.
  5849. //
  5850. // - "const in" parameters can just be the r-value, as no writes need occur.
  5851. //
  5852. // - "out" and "inout" arguments can't be done as pointers to the calling argument, because
  5853. // GLSL has copy-in/copy-out semantics. They can be handled though with a pointer to a copy.
  5854. std::vector<spv::Id> paramTypes;
  5855. std::vector<char const*> paramNames;
  5856. std::vector<std::vector<spv::Decoration>> paramDecorations; // list of decorations per parameter
  5857. glslang::TIntermSequence& parameters = glslFunction->getSequence()[0]->getAsAggregate()->getSequence();
  5858. #ifdef ENABLE_HLSL
  5859. bool implicitThis = (int)parameters.size() > 0 && parameters[0]->getAsSymbolNode()->getName() ==
  5860. glslangIntermediate->implicitThisName;
  5861. #else
  5862. bool implicitThis = false;
  5863. #endif
  5864. paramDecorations.resize(parameters.size());
  5865. for (int p = 0; p < (int)parameters.size(); ++p) {
  5866. const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();
  5867. spv::Id typeId = convertGlslangToSpvType(paramType);
  5868. if (originalParam(paramType.getQualifier().storage, paramType, implicitThis && p == 0))
  5869. typeId = builder.makePointer(TranslateStorageClass(paramType), typeId);
  5870. else if (writableParam(paramType.getQualifier().storage))
  5871. typeId = builder.makePointer(spv::StorageClass::Function, typeId);
  5872. else
  5873. rValueParameters.insert(parameters[p]->getAsSymbolNode()->getId());
  5874. getParamDecorations(paramDecorations[p], paramType, glslangIntermediate->usingVulkanMemoryModel());
  5875. paramTypes.push_back(typeId);
  5876. }
  5877. for (auto const parameter:parameters) {
  5878. paramNames.push_back(parameter->getAsSymbolNode()->getName().c_str());
  5879. }
  5880. spv::Block* functionBlock;
  5881. spv::Function* function = builder.makeFunctionEntry(
  5882. TranslatePrecisionDecoration(glslFunction->getType()), convertGlslangToSpvType(glslFunction->getType()),
  5883. glslFunction->getName().c_str(), convertGlslangLinkageToSpv(glslFunction->getLinkType()), paramTypes,
  5884. paramDecorations, &functionBlock);
  5885. builder.setupFunctionDebugInfo(function, glslFunction->getName().c_str(), paramTypes, paramNames);
  5886. if (implicitThis)
  5887. function->setImplicitThis();
  5888. // Track function to emit/call later
  5889. functionMap[glslFunction->getName().c_str()] = function;
  5890. // Set the parameter id's
  5891. for (int p = 0; p < (int)parameters.size(); ++p) {
  5892. symbolValues[parameters[p]->getAsSymbolNode()->getId()] = function->getParamId(p);
  5893. // give a name too
  5894. builder.addName(function->getParamId(p), parameters[p]->getAsSymbolNode()->getName().c_str());
  5895. const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();
  5896. if (paramType.contains8BitInt())
  5897. builder.addCapability(spv::Capability::Int8);
  5898. if (paramType.contains16BitInt())
  5899. builder.addCapability(spv::Capability::Int16);
  5900. if (paramType.contains16BitFloat())
  5901. builder.addCapability(spv::Capability::Float16);
  5902. }
  5903. }
  5904. }
  5905. // Process all the initializers, while skipping the functions and link objects
  5906. void TGlslangToSpvTraverser::makeGlobalInitializers(const glslang::TIntermSequence& initializers)
  5907. {
  5908. builder.setBuildPoint(shaderEntry->getLastBlock());
  5909. for (int i = 0; i < (int)initializers.size(); ++i) {
  5910. glslang::TIntermAggregate* initializer = initializers[i]->getAsAggregate();
  5911. if (initializer && initializer->getOp() != glslang::EOpFunction && initializer->getOp() !=
  5912. glslang::EOpLinkerObjects) {
  5913. // We're on a top-level node that's not a function. Treat as an initializer, whose
  5914. // code goes into the beginning of the entry point.
  5915. initializer->traverse(this);
  5916. }
  5917. }
  5918. }
  5919. // Walk over all linker objects to create a map for payload and callable data linker objects
  5920. // and their location to be used during codegen for OpTraceKHR and OpExecuteCallableKHR
  5921. // This is done here since it is possible that these linker objects are not be referenced in the AST
  5922. void TGlslangToSpvTraverser::collectRayTracingLinkerObjects()
  5923. {
  5924. glslang::TIntermAggregate* linkerObjects = glslangIntermediate->findLinkerObjects();
  5925. for (auto& objSeq : linkerObjects->getSequence()) {
  5926. auto objNode = objSeq->getAsSymbolNode();
  5927. if (objNode != nullptr) {
  5928. if (objNode->getQualifier().hasLocation()) {
  5929. unsigned int location = objNode->getQualifier().layoutLocation;
  5930. auto st = objNode->getQualifier().storage;
  5931. int set;
  5932. switch (st)
  5933. {
  5934. case glslang::EvqPayload:
  5935. case glslang::EvqPayloadIn:
  5936. set = 0;
  5937. break;
  5938. case glslang::EvqCallableData:
  5939. case glslang::EvqCallableDataIn:
  5940. set = 1;
  5941. break;
  5942. case glslang::EvqHitObjectAttrNV:
  5943. case glslang::EvqHitObjectAttrEXT:
  5944. set = 2;
  5945. break;
  5946. default:
  5947. set = -1;
  5948. }
  5949. if (set != -1)
  5950. locationToSymbol[set].insert(std::make_pair(location, objNode));
  5951. }
  5952. }
  5953. }
  5954. }
  5955. // Process all the functions, while skipping initializers.
  5956. void TGlslangToSpvTraverser::visitFunctions(const glslang::TIntermSequence& glslFunctions)
  5957. {
  5958. for (int f = 0; f < (int)glslFunctions.size(); ++f) {
  5959. glslang::TIntermAggregate* node = glslFunctions[f]->getAsAggregate();
  5960. if (node && (node->getOp() == glslang::EOpFunction || node->getOp() == glslang::EOpLinkerObjects))
  5961. node->traverse(this);
  5962. }
  5963. }
  5964. void TGlslangToSpvTraverser::translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments,
  5965. spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags)
  5966. {
  5967. const glslang::TIntermSequence& glslangArguments = node.getSequence();
  5968. glslang::TSampler sampler = {};
  5969. bool cubeCompare = false;
  5970. bool f16ShadowCompare = false;
  5971. if (node.isTexture() || node.isImage()) {
  5972. sampler = glslangArguments[0]->getAsTyped()->getType().getSampler();
  5973. cubeCompare = sampler.dim == glslang::EsdCube && sampler.arrayed && sampler.shadow;
  5974. f16ShadowCompare = sampler.shadow &&
  5975. glslangArguments[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16;
  5976. }
  5977. for (int i = 0; i < (int)glslangArguments.size(); ++i) {
  5978. builder.clearAccessChain();
  5979. glslangArguments[i]->traverse(this);
  5980. // Special case l-value operands
  5981. bool lvalue = false;
  5982. switch (node.getOp()) {
  5983. case glslang::EOpImageAtomicAdd:
  5984. case glslang::EOpImageAtomicMin:
  5985. case glslang::EOpImageAtomicMax:
  5986. case glslang::EOpImageAtomicAnd:
  5987. case glslang::EOpImageAtomicOr:
  5988. case glslang::EOpImageAtomicXor:
  5989. case glslang::EOpImageAtomicExchange:
  5990. case glslang::EOpImageAtomicCompSwap:
  5991. case glslang::EOpImageAtomicLoad:
  5992. case glslang::EOpImageAtomicStore:
  5993. if (i == 0)
  5994. lvalue = true;
  5995. break;
  5996. case glslang::EOpSparseImageLoad:
  5997. if ((sampler.ms && i == 3) || (! sampler.ms && i == 2))
  5998. lvalue = true;
  5999. break;
  6000. case glslang::EOpSparseTexture:
  6001. if (((cubeCompare || f16ShadowCompare) && i == 3) || (! (cubeCompare || f16ShadowCompare) && i == 2))
  6002. lvalue = true;
  6003. break;
  6004. case glslang::EOpSparseTextureClamp:
  6005. if (((cubeCompare || f16ShadowCompare) && i == 4) || (! (cubeCompare || f16ShadowCompare) && i == 3))
  6006. lvalue = true;
  6007. break;
  6008. case glslang::EOpSparseTextureLod:
  6009. case glslang::EOpSparseTextureOffset:
  6010. if ((f16ShadowCompare && i == 4) || (! f16ShadowCompare && i == 3))
  6011. lvalue = true;
  6012. break;
  6013. case glslang::EOpSparseTextureFetch:
  6014. if ((sampler.dim != glslang::EsdRect && i == 3) || (sampler.dim == glslang::EsdRect && i == 2))
  6015. lvalue = true;
  6016. break;
  6017. case glslang::EOpSparseTextureFetchOffset:
  6018. if ((sampler.dim != glslang::EsdRect && i == 4) || (sampler.dim == glslang::EsdRect && i == 3))
  6019. lvalue = true;
  6020. break;
  6021. case glslang::EOpSparseTextureLodOffset:
  6022. case glslang::EOpSparseTextureGrad:
  6023. case glslang::EOpSparseTextureOffsetClamp:
  6024. if ((f16ShadowCompare && i == 5) || (! f16ShadowCompare && i == 4))
  6025. lvalue = true;
  6026. break;
  6027. case glslang::EOpSparseTextureGradOffset:
  6028. case glslang::EOpSparseTextureGradClamp:
  6029. if ((f16ShadowCompare && i == 6) || (! f16ShadowCompare && i == 5))
  6030. lvalue = true;
  6031. break;
  6032. case glslang::EOpSparseTextureGradOffsetClamp:
  6033. if ((f16ShadowCompare && i == 7) || (! f16ShadowCompare && i == 6))
  6034. lvalue = true;
  6035. break;
  6036. case glslang::EOpSparseTextureGather:
  6037. if ((sampler.shadow && i == 3) || (! sampler.shadow && i == 2))
  6038. lvalue = true;
  6039. break;
  6040. case glslang::EOpSparseTextureGatherOffset:
  6041. case glslang::EOpSparseTextureGatherOffsets:
  6042. if ((sampler.shadow && i == 4) || (! sampler.shadow && i == 3))
  6043. lvalue = true;
  6044. break;
  6045. case glslang::EOpSparseTextureGatherLod:
  6046. if (i == 3)
  6047. lvalue = true;
  6048. break;
  6049. case glslang::EOpSparseTextureGatherLodOffset:
  6050. case glslang::EOpSparseTextureGatherLodOffsets:
  6051. if (i == 4)
  6052. lvalue = true;
  6053. break;
  6054. case glslang::EOpSparseImageLoadLod:
  6055. if (i == 3)
  6056. lvalue = true;
  6057. break;
  6058. case glslang::EOpImageSampleFootprintNV:
  6059. if (i == 4)
  6060. lvalue = true;
  6061. break;
  6062. case glslang::EOpImageSampleFootprintClampNV:
  6063. case glslang::EOpImageSampleFootprintLodNV:
  6064. if (i == 5)
  6065. lvalue = true;
  6066. break;
  6067. case glslang::EOpImageSampleFootprintGradNV:
  6068. if (i == 6)
  6069. lvalue = true;
  6070. break;
  6071. case glslang::EOpImageSampleFootprintGradClampNV:
  6072. if (i == 7)
  6073. lvalue = true;
  6074. break;
  6075. case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
  6076. case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
  6077. case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
  6078. if (i == 2)
  6079. lvalue = true;
  6080. break;
  6081. case glslang::EOpConstructSaturated:
  6082. if (i == 0)
  6083. lvalue = true;
  6084. break;
  6085. default:
  6086. break;
  6087. }
  6088. if (lvalue) {
  6089. spv::Id lvalue_id = builder.accessChainGetLValue();
  6090. arguments.push_back(lvalue_id);
  6091. lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
  6092. builder.addDecoration(lvalue_id, TranslateNonUniformDecoration(lvalueCoherentFlags));
  6093. lvalueCoherentFlags |= TranslateCoherent(glslangArguments[i]->getAsTyped()->getType());
  6094. } else {
  6095. if (i > 0 &&
  6096. glslangArguments[i]->getAsSymbolNode() && glslangArguments[i-1]->getAsSymbolNode() &&
  6097. glslangArguments[i]->getAsSymbolNode()->getId() == glslangArguments[i-1]->getAsSymbolNode()->getId()) {
  6098. // Reuse the id if possible
  6099. arguments.push_back(arguments[i-1]);
  6100. } else {
  6101. arguments.push_back(accessChainLoad(glslangArguments[i]->getAsTyped()->getType()));
  6102. }
  6103. }
  6104. }
  6105. }
  6106. void TGlslangToSpvTraverser::translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments)
  6107. {
  6108. builder.clearAccessChain();
  6109. node.getOperand()->traverse(this);
  6110. arguments.push_back(accessChainLoad(node.getOperand()->getType()));
  6111. }
  6112. spv::Id TGlslangToSpvTraverser::createImageTextureFunctionCall(glslang::TIntermOperator* node)
  6113. {
  6114. if (! node->isImage() && ! node->isTexture())
  6115. return spv::NoResult;
  6116. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  6117. // Process a GLSL texturing op (will be SPV image)
  6118. const glslang::TType &imageType = node->getAsAggregate()
  6119. ? node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType()
  6120. : node->getAsUnaryNode()->getOperand()->getAsTyped()->getType();
  6121. const glslang::TSampler sampler = imageType.getSampler();
  6122. bool f16ShadowCompare = (sampler.shadow && node->getAsAggregate())
  6123. ? node->getAsAggregate()->getSequence()[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16
  6124. : false;
  6125. const auto signExtensionMask = [&]() {
  6126. if (builder.getSpvVersion() >= spv::Spv_1_4) {
  6127. if (sampler.type == glslang::EbtUint)
  6128. return spv::ImageOperandsMask::ZeroExtend;
  6129. else if (sampler.type == glslang::EbtInt)
  6130. return spv::ImageOperandsMask::SignExtend;
  6131. }
  6132. return spv::ImageOperandsMask::MaskNone;
  6133. };
  6134. spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
  6135. std::vector<spv::Id> arguments;
  6136. if (node->getAsAggregate())
  6137. translateArguments(*node->getAsAggregate(), arguments, lvalueCoherentFlags);
  6138. else
  6139. translateArguments(*node->getAsUnaryNode(), arguments);
  6140. spv::Decoration precision = TranslatePrecisionDecoration(node->getType());
  6141. spv::Builder::TextureParameters params = { };
  6142. params.sampler = arguments[0];
  6143. glslang::TCrackedTextureOp cracked;
  6144. node->crackTexture(sampler, cracked);
  6145. const bool isUnsignedResult = node->getType().getBasicType() == glslang::EbtUint;
  6146. if (builder.isSampledImage(params.sampler) &&
  6147. ((cracked.query && node->getOp() != glslang::EOpTextureQueryLod) || cracked.fragMask || cracked.fetch)) {
  6148. params.sampler = builder.createUnaryOp(spv::Op::OpImage, builder.getImageType(params.sampler), params.sampler);
  6149. if (imageType.getQualifier().isNonUniform()) {
  6150. builder.addDecoration(params.sampler, spv::Decoration::NonUniformEXT);
  6151. }
  6152. }
  6153. // Check for queries
  6154. if (cracked.query) {
  6155. switch (node->getOp()) {
  6156. case glslang::EOpImageQuerySize:
  6157. case glslang::EOpTextureQuerySize:
  6158. if (arguments.size() > 1) {
  6159. params.lod = arguments[1];
  6160. return builder.createTextureQueryCall(spv::Op::OpImageQuerySizeLod, params, isUnsignedResult);
  6161. } else
  6162. return builder.createTextureQueryCall(spv::Op::OpImageQuerySize, params, isUnsignedResult);
  6163. case glslang::EOpImageQuerySamples:
  6164. case glslang::EOpTextureQuerySamples:
  6165. return builder.createTextureQueryCall(spv::Op::OpImageQuerySamples, params, isUnsignedResult);
  6166. case glslang::EOpTextureQueryLod:
  6167. params.coords = arguments[1];
  6168. return builder.createTextureQueryCall(spv::Op::OpImageQueryLod, params, isUnsignedResult);
  6169. case glslang::EOpTextureQueryLevels:
  6170. return builder.createTextureQueryCall(spv::Op::OpImageQueryLevels, params, isUnsignedResult);
  6171. case glslang::EOpSparseTexelsResident:
  6172. return builder.createUnaryOp(spv::Op::OpImageSparseTexelsResident, builder.makeBoolType(), arguments[0]);
  6173. default:
  6174. assert(0);
  6175. break;
  6176. }
  6177. }
  6178. int components = node->getType().getVectorSize();
  6179. if (node->getOp() == glslang::EOpImageLoad ||
  6180. node->getOp() == glslang::EOpImageLoadLod ||
  6181. node->getOp() == glslang::EOpTextureFetch ||
  6182. node->getOp() == glslang::EOpTextureFetchOffset) {
  6183. // These must produce 4 components, per SPIR-V spec. We'll add a conversion constructor if needed.
  6184. // This will only happen through the HLSL path for operator[], so we do not have to handle e.g.
  6185. // the EOpTexture/Proj/Lod/etc family. It would be harmless to do so, but would need more logic
  6186. // here around e.g. which ones return scalars or other types.
  6187. components = 4;
  6188. }
  6189. glslang::TType returnType(node->getType().getBasicType(), glslang::EvqTemporary, components);
  6190. auto resultType = [&returnType,this]{ return convertGlslangToSpvType(returnType); };
  6191. // Check for image functions other than queries
  6192. if (node->isImage()) {
  6193. std::vector<spv::IdImmediate> operands;
  6194. auto opIt = arguments.begin();
  6195. spv::IdImmediate image = { true, *(opIt++) };
  6196. operands.push_back(image);
  6197. // Handle subpass operations
  6198. // TODO: GLSL should change to have the "MS" only on the type rather than the
  6199. // built-in function.
  6200. if (cracked.subpass) {
  6201. // add on the (0,0) coordinate
  6202. spv::Id zero = builder.makeIntConstant(0);
  6203. std::vector<spv::Id> comps;
  6204. comps.push_back(zero);
  6205. comps.push_back(zero);
  6206. spv::IdImmediate coord = { true,
  6207. builder.makeCompositeConstant(builder.makeVectorType(builder.makeIntType(32), 2), comps) };
  6208. operands.push_back(coord);
  6209. spv::IdImmediate imageOperands = { false, spv::ImageOperandsMask::MaskNone };
  6210. imageOperands.word = imageOperands.word | (unsigned)signExtensionMask();
  6211. if (sampler.isMultiSample()) {
  6212. imageOperands.word = imageOperands.word | (unsigned)spv::ImageOperandsMask::Sample;
  6213. }
  6214. if (imageOperands.word != (unsigned)spv::ImageOperandsMask::MaskNone) {
  6215. operands.push_back(imageOperands);
  6216. if (sampler.isMultiSample()) {
  6217. spv::IdImmediate imageOperand = { true, *(opIt++) };
  6218. operands.push_back(imageOperand);
  6219. }
  6220. }
  6221. spv::Id result = builder.createOp(spv::Op::OpImageRead, resultType(), operands);
  6222. builder.setPrecision(result, precision);
  6223. return result;
  6224. }
  6225. if (cracked.attachmentEXT) {
  6226. if (opIt != arguments.end()) {
  6227. spv::IdImmediate sample = { true, *opIt };
  6228. operands.push_back(sample);
  6229. }
  6230. spv::Id result = builder.createOp(spv::Op::OpColorAttachmentReadEXT, resultType(), operands);
  6231. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  6232. builder.setPrecision(result, precision);
  6233. return result;
  6234. }
  6235. spv::IdImmediate coord = { true, *(opIt++) };
  6236. operands.push_back(coord);
  6237. if (node->getOp() == glslang::EOpImageLoad || node->getOp() == glslang::EOpImageLoadLod) {
  6238. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  6239. if (sampler.isMultiSample()) {
  6240. mask = mask | spv::ImageOperandsMask::Sample;
  6241. }
  6242. if (cracked.lod) {
  6243. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  6244. builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
  6245. mask = mask | spv::ImageOperandsMask::Lod;
  6246. }
  6247. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  6248. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelAvailableKHR);
  6249. mask = mask | signExtensionMask();
  6250. if (mask != spv::ImageOperandsMask::MaskNone) {
  6251. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  6252. operands.push_back(imageOperands);
  6253. }
  6254. if (anySet(mask, spv::ImageOperandsMask::Sample)) {
  6255. spv::IdImmediate imageOperand = { true, *opIt++ };
  6256. operands.push_back(imageOperand);
  6257. }
  6258. if (anySet(mask, spv::ImageOperandsMask::Lod)) {
  6259. spv::IdImmediate imageOperand = { true, *opIt++ };
  6260. operands.push_back(imageOperand);
  6261. }
  6262. if (anySet(mask, spv::ImageOperandsMask::MakeTexelVisibleKHR)) {
  6263. spv::IdImmediate imageOperand = { true,
  6264. builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
  6265. operands.push_back(imageOperand);
  6266. }
  6267. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
  6268. builder.addCapability(spv::Capability::StorageImageReadWithoutFormat);
  6269. std::vector<spv::Id> result(1, builder.createOp(spv::Op::OpImageRead, resultType(), operands));
  6270. builder.setPrecision(result[0], precision);
  6271. // If needed, add a conversion constructor to the proper size.
  6272. if (components != node->getType().getVectorSize())
  6273. result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));
  6274. return result[0];
  6275. } else if (node->getOp() == glslang::EOpImageStore || node->getOp() == glslang::EOpImageStoreLod) {
  6276. // Push the texel value before the operands
  6277. if (sampler.isMultiSample() || cracked.lod) {
  6278. spv::IdImmediate texel = { true, *(opIt + 1) };
  6279. operands.push_back(texel);
  6280. } else {
  6281. spv::IdImmediate texel = { true, *opIt };
  6282. operands.push_back(texel);
  6283. }
  6284. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  6285. if (sampler.isMultiSample()) {
  6286. mask = mask | spv::ImageOperandsMask::Sample;
  6287. }
  6288. if (cracked.lod) {
  6289. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  6290. builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
  6291. mask = mask | spv::ImageOperandsMask::Lod;
  6292. }
  6293. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  6294. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelVisibleKHR);
  6295. mask = mask | signExtensionMask();
  6296. if (mask != spv::ImageOperandsMask::MaskNone) {
  6297. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  6298. operands.push_back(imageOperands);
  6299. }
  6300. if (anySet(mask, spv::ImageOperandsMask::Sample)) {
  6301. spv::IdImmediate imageOperand = { true, *opIt++ };
  6302. operands.push_back(imageOperand);
  6303. }
  6304. if (anySet(mask, spv::ImageOperandsMask::Lod)) {
  6305. spv::IdImmediate imageOperand = { true, *opIt++ };
  6306. operands.push_back(imageOperand);
  6307. }
  6308. if (anySet(mask, spv::ImageOperandsMask::MakeTexelAvailableKHR)) {
  6309. spv::IdImmediate imageOperand = { true,
  6310. builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
  6311. operands.push_back(imageOperand);
  6312. }
  6313. builder.createNoResultOp(spv::Op::OpImageWrite, operands);
  6314. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
  6315. builder.addCapability(spv::Capability::StorageImageWriteWithoutFormat);
  6316. return spv::NoResult;
  6317. } else if (node->getOp() == glslang::EOpSparseImageLoad ||
  6318. node->getOp() == glslang::EOpSparseImageLoadLod) {
  6319. builder.addCapability(spv::Capability::SparseResidency);
  6320. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
  6321. builder.addCapability(spv::Capability::StorageImageReadWithoutFormat);
  6322. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  6323. if (sampler.isMultiSample()) {
  6324. mask = mask | spv::ImageOperandsMask::Sample;
  6325. }
  6326. if (cracked.lod) {
  6327. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  6328. builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
  6329. mask = mask | spv::ImageOperandsMask::Lod;
  6330. }
  6331. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  6332. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelAvailableKHR);
  6333. mask = mask | signExtensionMask();
  6334. if (mask != spv::ImageOperandsMask::MaskNone) {
  6335. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  6336. operands.push_back(imageOperands);
  6337. }
  6338. if (anySet(mask, spv::ImageOperandsMask::Sample)) {
  6339. spv::IdImmediate imageOperand = { true, *opIt++ };
  6340. operands.push_back(imageOperand);
  6341. }
  6342. if (anySet(mask, spv::ImageOperandsMask::Lod)) {
  6343. spv::IdImmediate imageOperand = { true, *opIt++ };
  6344. operands.push_back(imageOperand);
  6345. }
  6346. if (anySet(mask, spv::ImageOperandsMask::MakeTexelVisibleKHR)) {
  6347. spv::IdImmediate imageOperand = { true, builder.makeUintConstant(TranslateMemoryScope(
  6348. TranslateCoherent(imageType))) };
  6349. operands.push_back(imageOperand);
  6350. }
  6351. // Create the return type that was a special structure
  6352. spv::Id texelOut = *opIt;
  6353. spv::Id typeId0 = resultType();
  6354. spv::Id typeId1 = builder.getDerefTypeId(texelOut);
  6355. spv::Id resultTypeId = builder.makeStructResultType(typeId0, typeId1);
  6356. spv::Id resultId = builder.createOp(spv::Op::OpImageSparseRead, resultTypeId, operands);
  6357. // Decode the return type
  6358. builder.createStore(builder.createCompositeExtract(resultId, typeId1, 1), texelOut);
  6359. return builder.createCompositeExtract(resultId, typeId0, 0);
  6360. } else {
  6361. // Process image atomic operations
  6362. // GLSL "IMAGE_PARAMS" will involve in constructing an image texel pointer and this pointer,
  6363. // as the first source operand, is required by SPIR-V atomic operations.
  6364. // For non-MS, the sample value should be 0
  6365. spv::IdImmediate sample = { true, sampler.isMultiSample() ? *(opIt++) : builder.makeUintConstant(0) };
  6366. operands.push_back(sample);
  6367. spv::Id resultTypeId;
  6368. glslang::TBasicType typeProxy = node->getBasicType();
  6369. // imageAtomicStore has a void return type so base the pointer type on
  6370. // the type of the value operand.
  6371. if (node->getOp() == glslang::EOpImageAtomicStore) {
  6372. resultTypeId = builder.makePointer(spv::StorageClass::Image, builder.getTypeId(*opIt));
  6373. typeProxy = node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType().getSampler().type;
  6374. } else {
  6375. resultTypeId = builder.makePointer(spv::StorageClass::Image, resultType());
  6376. }
  6377. spv::Id pointer = builder.createOp(spv::Op::OpImageTexelPointer, resultTypeId, operands);
  6378. if (imageType.getQualifier().nonUniform) {
  6379. builder.addDecoration(pointer, spv::Decoration::NonUniformEXT);
  6380. }
  6381. std::vector<spv::Id> operands;
  6382. operands.push_back(pointer);
  6383. for (; opIt != arguments.end(); ++opIt)
  6384. operands.push_back(*opIt);
  6385. return createAtomicOperation(node->getOp(), precision, resultType(), operands, typeProxy,
  6386. lvalueCoherentFlags, node->getType());
  6387. }
  6388. }
  6389. // Check for fragment mask functions other than queries
  6390. if (cracked.fragMask) {
  6391. assert(sampler.ms);
  6392. auto opIt = arguments.begin();
  6393. std::vector<spv::Id> operands;
  6394. operands.push_back(params.sampler);
  6395. ++opIt;
  6396. if (sampler.isSubpass()) {
  6397. // add on the (0,0) coordinate
  6398. spv::Id zero = builder.makeIntConstant(0);
  6399. std::vector<spv::Id> comps;
  6400. comps.push_back(zero);
  6401. comps.push_back(zero);
  6402. operands.push_back(builder.makeCompositeConstant(
  6403. builder.makeVectorType(builder.makeIntType(32), 2), comps));
  6404. }
  6405. for (; opIt != arguments.end(); ++opIt)
  6406. operands.push_back(*opIt);
  6407. spv::Op fragMaskOp = spv::Op::OpNop;
  6408. if (node->getOp() == glslang::EOpFragmentMaskFetch)
  6409. fragMaskOp = spv::Op::OpFragmentMaskFetchAMD;
  6410. else if (node->getOp() == glslang::EOpFragmentFetch)
  6411. fragMaskOp = spv::Op::OpFragmentFetchAMD;
  6412. builder.addExtension(spv::E_SPV_AMD_shader_fragment_mask);
  6413. builder.addCapability(spv::Capability::FragmentMaskAMD);
  6414. return builder.createOp(fragMaskOp, resultType(), operands);
  6415. }
  6416. // Check for texture functions other than queries
  6417. bool sparse = node->isSparseTexture();
  6418. bool imageFootprint = node->isImageFootprint();
  6419. bool cubeCompare = sampler.dim == glslang::EsdCube && sampler.isArrayed() && sampler.isShadow();
  6420. // check for bias argument
  6421. bool bias = false;
  6422. if (! cracked.lod && ! cracked.grad && ! cracked.fetch && ! cubeCompare) {
  6423. int nonBiasArgCount = 2;
  6424. if (cracked.gather)
  6425. ++nonBiasArgCount; // comp argument should be present when bias argument is present
  6426. if (f16ShadowCompare)
  6427. ++nonBiasArgCount;
  6428. if (cracked.offset)
  6429. ++nonBiasArgCount;
  6430. else if (cracked.offsets)
  6431. ++nonBiasArgCount;
  6432. if (cracked.grad)
  6433. nonBiasArgCount += 2;
  6434. if (cracked.lodClamp)
  6435. ++nonBiasArgCount;
  6436. if (sparse)
  6437. ++nonBiasArgCount;
  6438. if (imageFootprint)
  6439. //Following three extra arguments
  6440. // int granularity, bool coarse, out gl_TextureFootprint2DNV footprint
  6441. nonBiasArgCount += 3;
  6442. if ((int)arguments.size() > nonBiasArgCount)
  6443. bias = true;
  6444. }
  6445. if (cracked.gather) {
  6446. const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();
  6447. if (bias || cracked.lod ||
  6448. sourceExtensions.find(glslang::E_GL_AMD_texture_gather_bias_lod) != sourceExtensions.end()) {
  6449. builder.addExtension(spv::E_SPV_AMD_texture_gather_bias_lod);
  6450. builder.addCapability(spv::Capability::ImageGatherBiasLodAMD);
  6451. }
  6452. }
  6453. // set the rest of the arguments
  6454. params.coords = arguments[1];
  6455. int extraArgs = 0;
  6456. bool noImplicitLod = false;
  6457. // sort out where Dref is coming from
  6458. if (cubeCompare || f16ShadowCompare) {
  6459. params.Dref = arguments[2];
  6460. ++extraArgs;
  6461. } else if (sampler.shadow && cracked.gather) {
  6462. params.Dref = arguments[2];
  6463. ++extraArgs;
  6464. } else if (sampler.shadow) {
  6465. std::vector<spv::Id> indexes;
  6466. int dRefComp;
  6467. if (cracked.proj)
  6468. dRefComp = 2; // "The resulting 3rd component of P in the shadow forms is used as Dref"
  6469. else
  6470. dRefComp = builder.getNumComponents(params.coords) - 1;
  6471. indexes.push_back(dRefComp);
  6472. params.Dref = builder.createCompositeExtract(params.coords,
  6473. builder.getScalarTypeId(builder.getTypeId(params.coords)), indexes);
  6474. }
  6475. // lod
  6476. if (cracked.lod) {
  6477. params.lod = arguments[2 + extraArgs];
  6478. ++extraArgs;
  6479. } else if (glslangIntermediate->getStage() != EShLangFragment &&
  6480. !(glslangIntermediate->getStage() == EShLangCompute &&
  6481. glslangIntermediate->hasLayoutDerivativeModeNone())) {
  6482. // we need to invent the default lod for an explicit lod instruction for a non-fragment stage
  6483. noImplicitLod = true;
  6484. }
  6485. // multisample
  6486. if (sampler.isMultiSample()) {
  6487. params.sample = arguments[2 + extraArgs]; // For MS, "sample" should be specified
  6488. ++extraArgs;
  6489. }
  6490. // gradient
  6491. if (cracked.grad) {
  6492. params.gradX = arguments[2 + extraArgs];
  6493. params.gradY = arguments[3 + extraArgs];
  6494. extraArgs += 2;
  6495. }
  6496. // offset and offsets
  6497. if (cracked.offset) {
  6498. params.offset = arguments[2 + extraArgs];
  6499. ++extraArgs;
  6500. } else if (cracked.offsets) {
  6501. params.offsets = arguments[2 + extraArgs];
  6502. ++extraArgs;
  6503. }
  6504. // lod clamp
  6505. if (cracked.lodClamp) {
  6506. params.lodClamp = arguments[2 + extraArgs];
  6507. ++extraArgs;
  6508. }
  6509. // sparse
  6510. if (sparse) {
  6511. params.texelOut = arguments[2 + extraArgs];
  6512. ++extraArgs;
  6513. }
  6514. // gather component
  6515. if (cracked.gather && ! sampler.shadow) {
  6516. // default component is 0, if missing, otherwise an argument
  6517. if (2 + extraArgs < (int)arguments.size()) {
  6518. params.component = arguments[2 + extraArgs];
  6519. ++extraArgs;
  6520. } else
  6521. params.component = builder.makeIntConstant(0);
  6522. }
  6523. spv::Id resultStruct = spv::NoResult;
  6524. if (imageFootprint) {
  6525. //Following three extra arguments
  6526. // int granularity, bool coarse, out gl_TextureFootprint2DNV footprint
  6527. params.granularity = arguments[2 + extraArgs];
  6528. params.coarse = arguments[3 + extraArgs];
  6529. resultStruct = arguments[4 + extraArgs];
  6530. extraArgs += 3;
  6531. }
  6532. // bias
  6533. if (bias) {
  6534. params.bias = arguments[2 + extraArgs];
  6535. ++extraArgs;
  6536. }
  6537. if (imageFootprint) {
  6538. builder.addExtension(spv::E_SPV_NV_shader_image_footprint);
  6539. builder.addCapability(spv::Capability::ImageFootprintNV);
  6540. //resultStructType(OpenGL type) contains 5 elements:
  6541. //struct gl_TextureFootprint2DNV {
  6542. // uvec2 anchor;
  6543. // uvec2 offset;
  6544. // uvec2 mask;
  6545. // uint lod;
  6546. // uint granularity;
  6547. //};
  6548. //or
  6549. //struct gl_TextureFootprint3DNV {
  6550. // uvec3 anchor;
  6551. // uvec3 offset;
  6552. // uvec2 mask;
  6553. // uint lod;
  6554. // uint granularity;
  6555. //};
  6556. spv::Id resultStructType = builder.getContainedTypeId(builder.getTypeId(resultStruct));
  6557. assert(builder.isStructType(resultStructType));
  6558. //resType (SPIR-V type) contains 6 elements:
  6559. //Member 0 must be a Boolean type scalar(LOD),
  6560. //Member 1 must be a vector of integer type, whose Signedness operand is 0(anchor),
  6561. //Member 2 must be a vector of integer type, whose Signedness operand is 0(offset),
  6562. //Member 3 must be a vector of integer type, whose Signedness operand is 0(mask),
  6563. //Member 4 must be a scalar of integer type, whose Signedness operand is 0(lod),
  6564. //Member 5 must be a scalar of integer type, whose Signedness operand is 0(granularity).
  6565. std::vector<spv::Id> members;
  6566. members.push_back(resultType());
  6567. for (int i = 0; i < 5; i++) {
  6568. members.push_back(builder.getContainedTypeId(resultStructType, i));
  6569. }
  6570. spv::Id resType = builder.makeStructType(members, {}, "ResType");
  6571. //call ImageFootprintNV
  6572. spv::Id res = builder.createTextureCall(precision, resType, sparse, cracked.fetch, cracked.proj,
  6573. cracked.gather, noImplicitLod, params, signExtensionMask());
  6574. //copy resType (SPIR-V type) to resultStructType(OpenGL type)
  6575. for (int i = 0; i < 5; i++) {
  6576. builder.clearAccessChain();
  6577. builder.setAccessChainLValue(resultStruct);
  6578. //Accessing to a struct we created, no coherent flag is set
  6579. spv::Builder::AccessChain::CoherentFlags flags;
  6580. flags.clear();
  6581. builder.accessChainPush(builder.makeIntConstant(i), flags, 0);
  6582. builder.accessChainStore(builder.createCompositeExtract(res, builder.getContainedTypeId(resType, i+1),
  6583. i+1), TranslateNonUniformDecoration(imageType.getQualifier()));
  6584. }
  6585. return builder.createCompositeExtract(res, resultType(), 0);
  6586. }
  6587. // projective component (might not need to move)
  6588. // GLSL: "The texture coordinates consumed from P, not including the last component of P,
  6589. // are divided by the last component of P."
  6590. // SPIR-V: "... (u [, v] [, w], q)... It may be a vector larger than needed, but all
  6591. // unused components will appear after all used components."
  6592. if (cracked.proj) {
  6593. int projSourceComp = builder.getNumComponents(params.coords) - 1;
  6594. int projTargetComp;
  6595. switch (sampler.dim) {
  6596. case glslang::Esd1D: projTargetComp = 1; break;
  6597. case glslang::Esd2D: projTargetComp = 2; break;
  6598. case glslang::EsdRect: projTargetComp = 2; break;
  6599. default: projTargetComp = projSourceComp; break;
  6600. }
  6601. // copy the projective coordinate if we have to
  6602. if (projTargetComp != projSourceComp) {
  6603. spv::Id projComp = builder.createCompositeExtract(params.coords,
  6604. builder.getScalarTypeId(builder.getTypeId(params.coords)), projSourceComp);
  6605. params.coords = builder.createCompositeInsert(projComp, params.coords,
  6606. builder.getTypeId(params.coords), projTargetComp);
  6607. }
  6608. }
  6609. // nonprivate
  6610. if (imageType.getQualifier().nonprivate) {
  6611. params.nonprivate = true;
  6612. }
  6613. // volatile
  6614. if (imageType.getQualifier().volatil) {
  6615. params.volatil = true;
  6616. }
  6617. if (imageType.getQualifier().nontemporal) {
  6618. params.nontemporal = true;
  6619. }
  6620. std::vector<spv::Id> result( 1,
  6621. builder.createTextureCall(precision, resultType(), sparse, cracked.fetch, cracked.proj, cracked.gather,
  6622. noImplicitLod, params, signExtensionMask())
  6623. );
  6624. if (components != node->getType().getVectorSize())
  6625. result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));
  6626. return result[0];
  6627. }
  6628. spv::Id TGlslangToSpvTraverser::handleUserFunctionCall(const glslang::TIntermAggregate* node)
  6629. {
  6630. // Grab the function's pointer from the previously created function
  6631. spv::Function* function = functionMap[node->getName().c_str()];
  6632. if (! function)
  6633. return 0;
  6634. const glslang::TIntermSequence& glslangArgs = node->getSequence();
  6635. const glslang::TQualifierList& qualifiers = node->getQualifierList();
  6636. // See comments in makeFunctions() for details about the semantics for parameter passing.
  6637. //
  6638. // These imply we need a four step process:
  6639. // 1. Evaluate the arguments
  6640. // 2. Allocate and make copies of in, out, and inout arguments
  6641. // 3. Make the call
  6642. // 4. Copy back the results
  6643. // 1. Evaluate the arguments and their types
  6644. std::vector<spv::Builder::AccessChain> lValues;
  6645. std::vector<spv::Id> rValues;
  6646. std::vector<const glslang::TType*> argTypes;
  6647. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  6648. argTypes.push_back(&glslangArgs[a]->getAsTyped()->getType());
  6649. // build l-value
  6650. builder.clearAccessChain();
  6651. glslangArgs[a]->traverse(this);
  6652. // keep outputs and pass-by-originals as l-values, evaluate others as r-values
  6653. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0) ||
  6654. writableParam(qualifiers[a])) {
  6655. // save l-value
  6656. lValues.push_back(builder.getAccessChain());
  6657. } else {
  6658. // process r-value
  6659. rValues.push_back(accessChainLoad(*argTypes.back()));
  6660. }
  6661. }
  6662. // Reset source location to the function call location after argument evaluation
  6663. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  6664. // 2. Allocate space for anything needing a copy, and if it's "in" or "inout"
  6665. // copy the original into that space.
  6666. //
  6667. // Also, build up the list of actual arguments to pass in for the call
  6668. int lValueCount = 0;
  6669. int rValueCount = 0;
  6670. std::vector<spv::Id> spvArgs;
  6671. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  6672. spv::Id arg;
  6673. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0)) {
  6674. builder.setAccessChain(lValues[lValueCount]);
  6675. arg = builder.accessChainGetLValue();
  6676. ++lValueCount;
  6677. } else if (writableParam(qualifiers[a])) {
  6678. // need space to hold the copy
  6679. arg = builder.createVariable(function->getParamPrecision(a), spv::StorageClass::Function,
  6680. builder.getContainedTypeId(function->getParamType(a)), "param");
  6681. if (qualifiers[a] == glslang::EvqIn || qualifiers[a] == glslang::EvqInOut) {
  6682. // need to copy the input into output space
  6683. builder.setAccessChain(lValues[lValueCount]);
  6684. spv::Id copy = accessChainLoad(*argTypes[a]);
  6685. builder.clearAccessChain();
  6686. builder.setAccessChainLValue(arg);
  6687. multiTypeStore(*argTypes[a], copy);
  6688. }
  6689. ++lValueCount;
  6690. } else {
  6691. // process r-value, which involves a copy for a type mismatch
  6692. if (function->getParamType(a) != builder.getTypeId(rValues[rValueCount]) ||
  6693. TranslatePrecisionDecoration(*argTypes[a]) != function->getParamPrecision(a))
  6694. {
  6695. spv::Id argCopy = builder.createVariable(function->getParamPrecision(a), spv::StorageClass::Function, function->getParamType(a), "arg");
  6696. builder.clearAccessChain();
  6697. builder.setAccessChainLValue(argCopy);
  6698. multiTypeStore(*argTypes[a], rValues[rValueCount]);
  6699. arg = builder.createLoad(argCopy, function->getParamPrecision(a));
  6700. } else
  6701. arg = rValues[rValueCount];
  6702. ++rValueCount;
  6703. }
  6704. spvArgs.push_back(arg);
  6705. }
  6706. // 3. Make the call.
  6707. spv::Id result = builder.createFunctionCall(function, spvArgs);
  6708. builder.setPrecision(result, TranslatePrecisionDecoration(node->getType()));
  6709. builder.addDecoration(result, TranslateNonUniformDecoration(node->getType().getQualifier()));
  6710. // 4. Copy back out an "out" arguments.
  6711. lValueCount = 0;
  6712. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  6713. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0))
  6714. ++lValueCount;
  6715. else if (writableParam(qualifiers[a])) {
  6716. if (qualifiers[a] == glslang::EvqOut || qualifiers[a] == glslang::EvqInOut) {
  6717. spv::Id copy = builder.createLoad(spvArgs[a], spv::NoPrecision);
  6718. builder.addDecoration(copy, TranslateNonUniformDecoration(argTypes[a]->getQualifier()));
  6719. builder.setAccessChain(lValues[lValueCount]);
  6720. multiTypeStore(*argTypes[a], copy);
  6721. }
  6722. ++lValueCount;
  6723. }
  6724. }
  6725. return result;
  6726. }
  6727. // Translate AST operation to SPV operation, already having SPV-based operands/types.
  6728. spv::Id TGlslangToSpvTraverser::createBinaryOperation(glslang::TOperator op, OpDecorations& decorations,
  6729. spv::Id typeId, spv::Id left, spv::Id right,
  6730. glslang::TBasicType typeProxy, bool reduceComparison)
  6731. {
  6732. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  6733. bool isFloat = isTypeFloat(typeProxy);
  6734. bool isBool = typeProxy == glslang::EbtBool;
  6735. spv::Op binOp = spv::Op::OpNop;
  6736. bool needMatchingVectors = true; // for non-matrix ops, would a scalar need to smear to match a vector?
  6737. bool comparison = false;
  6738. switch (op) {
  6739. case glslang::EOpAdd:
  6740. case glslang::EOpAddAssign:
  6741. if (isFloat)
  6742. binOp = spv::Op::OpFAdd;
  6743. else
  6744. binOp = spv::Op::OpIAdd;
  6745. break;
  6746. case glslang::EOpSub:
  6747. case glslang::EOpSubAssign:
  6748. if (isFloat)
  6749. binOp = spv::Op::OpFSub;
  6750. else
  6751. binOp = spv::Op::OpISub;
  6752. break;
  6753. case glslang::EOpMul:
  6754. case glslang::EOpMulAssign:
  6755. if (isFloat)
  6756. binOp = spv::Op::OpFMul;
  6757. else
  6758. binOp = spv::Op::OpIMul;
  6759. break;
  6760. case glslang::EOpVectorTimesScalar:
  6761. case glslang::EOpVectorTimesScalarAssign:
  6762. if (isFloat && (builder.isVector(left) || builder.isVector(right) || builder.isCooperativeVector(left) || builder.isCooperativeVector(right))) {
  6763. if (builder.isVector(right) || builder.isCooperativeVector(right))
  6764. std::swap(left, right);
  6765. assert(builder.isScalar(right));
  6766. needMatchingVectors = false;
  6767. binOp = spv::Op::OpVectorTimesScalar;
  6768. } else if (isFloat) {
  6769. binOp = spv::Op::OpFMul;
  6770. } else if (builder.isCooperativeVector(left) || builder.isCooperativeVector(right)) {
  6771. if (builder.isCooperativeVector(right))
  6772. std::swap(left, right);
  6773. assert(builder.isScalar(right));
  6774. // Construct a cooperative vector from the scalar
  6775. right = builder.createCompositeConstruct(builder.getTypeId(left), { right });
  6776. binOp = spv::Op::OpIMul;
  6777. } else {
  6778. binOp = spv::Op::OpIMul;
  6779. }
  6780. break;
  6781. case glslang::EOpVectorTimesMatrix:
  6782. case glslang::EOpVectorTimesMatrixAssign:
  6783. binOp = spv::Op::OpVectorTimesMatrix;
  6784. break;
  6785. case glslang::EOpMatrixTimesVector:
  6786. binOp = spv::Op::OpMatrixTimesVector;
  6787. break;
  6788. case glslang::EOpMatrixTimesScalar:
  6789. case glslang::EOpMatrixTimesScalarAssign:
  6790. binOp = spv::Op::OpMatrixTimesScalar;
  6791. break;
  6792. case glslang::EOpMatrixTimesMatrix:
  6793. case glslang::EOpMatrixTimesMatrixAssign:
  6794. binOp = spv::Op::OpMatrixTimesMatrix;
  6795. break;
  6796. case glslang::EOpOuterProduct:
  6797. binOp = spv::Op::OpOuterProduct;
  6798. needMatchingVectors = false;
  6799. break;
  6800. case glslang::EOpDiv:
  6801. case glslang::EOpDivAssign:
  6802. if (isFloat)
  6803. binOp = spv::Op::OpFDiv;
  6804. else if (isUnsigned)
  6805. binOp = spv::Op::OpUDiv;
  6806. else
  6807. binOp = spv::Op::OpSDiv;
  6808. break;
  6809. case glslang::EOpMod:
  6810. case glslang::EOpModAssign:
  6811. if (isFloat)
  6812. binOp = spv::Op::OpFMod;
  6813. else if (isUnsigned)
  6814. binOp = spv::Op::OpUMod;
  6815. else
  6816. binOp = spv::Op::OpSMod;
  6817. break;
  6818. case glslang::EOpRightShift:
  6819. case glslang::EOpRightShiftAssign:
  6820. if (isUnsigned)
  6821. binOp = spv::Op::OpShiftRightLogical;
  6822. else
  6823. binOp = spv::Op::OpShiftRightArithmetic;
  6824. break;
  6825. case glslang::EOpLeftShift:
  6826. case glslang::EOpLeftShiftAssign:
  6827. binOp = spv::Op::OpShiftLeftLogical;
  6828. break;
  6829. case glslang::EOpAnd:
  6830. case glslang::EOpAndAssign:
  6831. binOp = spv::Op::OpBitwiseAnd;
  6832. break;
  6833. case glslang::EOpLogicalAnd:
  6834. needMatchingVectors = false;
  6835. binOp = spv::Op::OpLogicalAnd;
  6836. break;
  6837. case glslang::EOpInclusiveOr:
  6838. case glslang::EOpInclusiveOrAssign:
  6839. binOp = spv::Op::OpBitwiseOr;
  6840. break;
  6841. case glslang::EOpLogicalOr:
  6842. needMatchingVectors = false;
  6843. binOp = spv::Op::OpLogicalOr;
  6844. break;
  6845. case glslang::EOpExclusiveOr:
  6846. case glslang::EOpExclusiveOrAssign:
  6847. binOp = spv::Op::OpBitwiseXor;
  6848. break;
  6849. case glslang::EOpLogicalXor:
  6850. needMatchingVectors = false;
  6851. binOp = spv::Op::OpLogicalNotEqual;
  6852. break;
  6853. case glslang::EOpAbsDifference:
  6854. binOp = isUnsigned ? spv::Op::OpAbsUSubINTEL : spv::Op::OpAbsISubINTEL;
  6855. break;
  6856. case glslang::EOpAddSaturate:
  6857. binOp = isUnsigned ? spv::Op::OpUAddSatINTEL : spv::Op::OpIAddSatINTEL;
  6858. break;
  6859. case glslang::EOpSubSaturate:
  6860. binOp = isUnsigned ? spv::Op::OpUSubSatINTEL : spv::Op::OpISubSatINTEL;
  6861. break;
  6862. case glslang::EOpAverage:
  6863. binOp = isUnsigned ? spv::Op::OpUAverageINTEL : spv::Op::OpIAverageINTEL;
  6864. break;
  6865. case glslang::EOpAverageRounded:
  6866. binOp = isUnsigned ? spv::Op::OpUAverageRoundedINTEL : spv::Op::OpIAverageRoundedINTEL;
  6867. break;
  6868. case glslang::EOpMul32x16:
  6869. binOp = isUnsigned ? spv::Op::OpUMul32x16INTEL : spv::Op::OpIMul32x16INTEL;
  6870. break;
  6871. case glslang::EOpExpectEXT:
  6872. binOp = spv::Op::OpExpectKHR;
  6873. break;
  6874. case glslang::EOpLessThan:
  6875. case glslang::EOpGreaterThan:
  6876. case glslang::EOpLessThanEqual:
  6877. case glslang::EOpGreaterThanEqual:
  6878. case glslang::EOpEqual:
  6879. case glslang::EOpNotEqual:
  6880. case glslang::EOpVectorEqual:
  6881. case glslang::EOpVectorNotEqual:
  6882. comparison = true;
  6883. break;
  6884. default:
  6885. break;
  6886. }
  6887. // handle mapped binary operations (should be non-comparison)
  6888. if (binOp != spv::Op::OpNop) {
  6889. assert(comparison == false);
  6890. if (builder.isMatrix(left) || builder.isMatrix(right) ||
  6891. builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))
  6892. return createBinaryMatrixOperation(binOp, decorations, typeId, left, right);
  6893. // No matrix involved; make both operands be the same number of components, if needed
  6894. if (needMatchingVectors)
  6895. builder.promoteScalar(decorations.precision, left, right);
  6896. spv::Id result = builder.createBinOp(binOp, typeId, left, right);
  6897. decorations.addNoContraction(builder, result);
  6898. decorations.addNonUniform(builder, result);
  6899. return builder.setPrecision(result, decorations.precision);
  6900. }
  6901. if (! comparison)
  6902. return 0;
  6903. // Handle comparison instructions
  6904. if (reduceComparison && (op == glslang::EOpEqual || op == glslang::EOpNotEqual)
  6905. && (builder.isVector(left) || builder.isMatrix(left) || builder.isAggregate(left))) {
  6906. spv::Id result = builder.createCompositeCompare(decorations.precision, left, right, op == glslang::EOpEqual);
  6907. decorations.addNonUniform(builder, result);
  6908. return result;
  6909. }
  6910. switch (op) {
  6911. case glslang::EOpLessThan:
  6912. if (isFloat)
  6913. binOp = spv::Op::OpFOrdLessThan;
  6914. else if (isUnsigned)
  6915. binOp = spv::Op::OpULessThan;
  6916. else
  6917. binOp = spv::Op::OpSLessThan;
  6918. break;
  6919. case glslang::EOpGreaterThan:
  6920. if (isFloat)
  6921. binOp = spv::Op::OpFOrdGreaterThan;
  6922. else if (isUnsigned)
  6923. binOp = spv::Op::OpUGreaterThan;
  6924. else
  6925. binOp = spv::Op::OpSGreaterThan;
  6926. break;
  6927. case glslang::EOpLessThanEqual:
  6928. if (isFloat)
  6929. binOp = spv::Op::OpFOrdLessThanEqual;
  6930. else if (isUnsigned)
  6931. binOp = spv::Op::OpULessThanEqual;
  6932. else
  6933. binOp = spv::Op::OpSLessThanEqual;
  6934. break;
  6935. case glslang::EOpGreaterThanEqual:
  6936. if (isFloat)
  6937. binOp = spv::Op::OpFOrdGreaterThanEqual;
  6938. else if (isUnsigned)
  6939. binOp = spv::Op::OpUGreaterThanEqual;
  6940. else
  6941. binOp = spv::Op::OpSGreaterThanEqual;
  6942. break;
  6943. case glslang::EOpEqual:
  6944. case glslang::EOpVectorEqual:
  6945. if (isFloat)
  6946. binOp = spv::Op::OpFOrdEqual;
  6947. else if (isBool)
  6948. binOp = spv::Op::OpLogicalEqual;
  6949. else
  6950. binOp = spv::Op::OpIEqual;
  6951. break;
  6952. case glslang::EOpNotEqual:
  6953. case glslang::EOpVectorNotEqual:
  6954. if (isFloat)
  6955. binOp = spv::Op::OpFUnordNotEqual;
  6956. else if (isBool)
  6957. binOp = spv::Op::OpLogicalNotEqual;
  6958. else
  6959. binOp = spv::Op::OpINotEqual;
  6960. break;
  6961. default:
  6962. break;
  6963. }
  6964. if (binOp != spv::Op::OpNop) {
  6965. spv::Id result = builder.createBinOp(binOp, typeId, left, right);
  6966. decorations.addNoContraction(builder, result);
  6967. decorations.addNonUniform(builder, result);
  6968. return builder.setPrecision(result, decorations.precision);
  6969. }
  6970. return 0;
  6971. }
  6972. //
  6973. // Translate AST matrix operation to SPV operation, already having SPV-based operands/types.
  6974. // These can be any of:
  6975. //
  6976. // matrix * scalar
  6977. // scalar * matrix
  6978. // matrix * matrix linear algebraic
  6979. // matrix * vector
  6980. // vector * matrix
  6981. // matrix * matrix componentwise
  6982. // matrix op matrix op in {+, -, /}
  6983. // matrix op scalar op in {+, -, /}
  6984. // scalar op matrix op in {+, -, /}
  6985. //
  6986. spv::Id TGlslangToSpvTraverser::createBinaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,
  6987. spv::Id left, spv::Id right)
  6988. {
  6989. bool firstClass = true;
  6990. // First, handle first-class matrix operations (* and matrix/scalar)
  6991. switch (op) {
  6992. case spv::Op::OpFDiv:
  6993. if (builder.isMatrix(left) && builder.isScalar(right)) {
  6994. // turn matrix / scalar into a multiply...
  6995. spv::Id resultType = builder.getTypeId(right);
  6996. right = builder.createBinOp(spv::Op::OpFDiv, resultType, builder.makeFpConstant(resultType, 1.0), right);
  6997. op = spv::Op::OpMatrixTimesScalar;
  6998. } else
  6999. firstClass = false;
  7000. break;
  7001. case spv::Op::OpMatrixTimesScalar:
  7002. if (builder.isMatrix(right) || builder.isCooperativeMatrix(right))
  7003. std::swap(left, right);
  7004. assert(builder.isScalar(right));
  7005. break;
  7006. case spv::Op::OpVectorTimesMatrix:
  7007. assert(builder.isVector(left));
  7008. assert(builder.isMatrix(right));
  7009. break;
  7010. case spv::Op::OpMatrixTimesVector:
  7011. assert(builder.isMatrix(left));
  7012. assert(builder.isVector(right));
  7013. break;
  7014. case spv::Op::OpMatrixTimesMatrix:
  7015. assert(builder.isMatrix(left));
  7016. assert(builder.isMatrix(right));
  7017. break;
  7018. default:
  7019. firstClass = false;
  7020. break;
  7021. }
  7022. if (builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))
  7023. firstClass = true;
  7024. if (firstClass) {
  7025. spv::Id result = builder.createBinOp(op, typeId, left, right);
  7026. decorations.addNoContraction(builder, result);
  7027. decorations.addNonUniform(builder, result);
  7028. return builder.setPrecision(result, decorations.precision);
  7029. }
  7030. // Handle component-wise +, -, *, %, and / for all combinations of type.
  7031. // The result type of all of them is the same type as the (a) matrix operand.
  7032. // The algorithm is to:
  7033. // - break the matrix(es) into vectors
  7034. // - smear any scalar to a vector
  7035. // - do vector operations
  7036. // - make a matrix out the vector results
  7037. switch (op) {
  7038. case spv::Op::OpFAdd:
  7039. case spv::Op::OpFSub:
  7040. case spv::Op::OpFDiv:
  7041. case spv::Op::OpFMod:
  7042. case spv::Op::OpFMul:
  7043. {
  7044. // one time set up...
  7045. bool leftMat = builder.isMatrix(left);
  7046. bool rightMat = builder.isMatrix(right);
  7047. unsigned int numCols = leftMat ? builder.getNumColumns(left) : builder.getNumColumns(right);
  7048. int numRows = leftMat ? builder.getNumRows(left) : builder.getNumRows(right);
  7049. spv::Id scalarType = builder.getScalarTypeId(typeId);
  7050. spv::Id vecType = builder.makeVectorType(scalarType, numRows);
  7051. std::vector<spv::Id> results;
  7052. spv::Id smearVec = spv::NoResult;
  7053. if (builder.isScalar(left))
  7054. smearVec = builder.smearScalar(decorations.precision, left, vecType);
  7055. else if (builder.isScalar(right))
  7056. smearVec = builder.smearScalar(decorations.precision, right, vecType);
  7057. // do each vector op
  7058. for (unsigned int c = 0; c < numCols; ++c) {
  7059. std::vector<unsigned int> indexes;
  7060. indexes.push_back(c);
  7061. spv::Id leftVec = leftMat ? builder.createCompositeExtract( left, vecType, indexes) : smearVec;
  7062. spv::Id rightVec = rightMat ? builder.createCompositeExtract(right, vecType, indexes) : smearVec;
  7063. spv::Id result = builder.createBinOp(op, vecType, leftVec, rightVec);
  7064. decorations.addNoContraction(builder, result);
  7065. decorations.addNonUniform(builder, result);
  7066. results.push_back(builder.setPrecision(result, decorations.precision));
  7067. }
  7068. // put the pieces together
  7069. spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);
  7070. decorations.addNonUniform(builder, result);
  7071. return result;
  7072. }
  7073. default:
  7074. assert(0);
  7075. return spv::NoResult;
  7076. }
  7077. }
  7078. spv::Id TGlslangToSpvTraverser::createUnaryOperation(glslang::TOperator op, OpDecorations& decorations, spv::Id typeId,
  7079. spv::Id operand, glslang::TBasicType typeProxy, const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
  7080. const glslang::TType &opType)
  7081. {
  7082. spv::Op unaryOp = spv::Op::OpNop;
  7083. int extBuiltins = -1;
  7084. int libCall = -1;
  7085. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  7086. bool isFloat = isTypeFloat(typeProxy);
  7087. switch (op) {
  7088. case glslang::EOpNegative:
  7089. if (isFloat) {
  7090. unaryOp = spv::Op::OpFNegate;
  7091. if (builder.isMatrixType(typeId))
  7092. return createUnaryMatrixOperation(unaryOp, decorations, typeId, operand, typeProxy);
  7093. } else
  7094. unaryOp = spv::Op::OpSNegate;
  7095. break;
  7096. case glslang::EOpLogicalNot:
  7097. case glslang::EOpVectorLogicalNot:
  7098. unaryOp = spv::Op::OpLogicalNot;
  7099. break;
  7100. case glslang::EOpBitwiseNot:
  7101. unaryOp = spv::Op::OpNot;
  7102. break;
  7103. case glslang::EOpDeterminant:
  7104. libCall = spv::GLSLstd450Determinant;
  7105. break;
  7106. case glslang::EOpMatrixInverse:
  7107. libCall = spv::GLSLstd450MatrixInverse;
  7108. break;
  7109. case glslang::EOpTranspose:
  7110. unaryOp = spv::Op::OpTranspose;
  7111. break;
  7112. case glslang::EOpRadians:
  7113. libCall = spv::GLSLstd450Radians;
  7114. break;
  7115. case glslang::EOpDegrees:
  7116. libCall = spv::GLSLstd450Degrees;
  7117. break;
  7118. case glslang::EOpSin:
  7119. libCall = spv::GLSLstd450Sin;
  7120. break;
  7121. case glslang::EOpCos:
  7122. libCall = spv::GLSLstd450Cos;
  7123. break;
  7124. case glslang::EOpTan:
  7125. libCall = spv::GLSLstd450Tan;
  7126. break;
  7127. case glslang::EOpAcos:
  7128. libCall = spv::GLSLstd450Acos;
  7129. break;
  7130. case glslang::EOpAsin:
  7131. libCall = spv::GLSLstd450Asin;
  7132. break;
  7133. case glslang::EOpAtan:
  7134. libCall = spv::GLSLstd450Atan;
  7135. break;
  7136. case glslang::EOpAcosh:
  7137. libCall = spv::GLSLstd450Acosh;
  7138. break;
  7139. case glslang::EOpAsinh:
  7140. libCall = spv::GLSLstd450Asinh;
  7141. break;
  7142. case glslang::EOpAtanh:
  7143. libCall = spv::GLSLstd450Atanh;
  7144. break;
  7145. case glslang::EOpTanh:
  7146. libCall = spv::GLSLstd450Tanh;
  7147. break;
  7148. case glslang::EOpCosh:
  7149. libCall = spv::GLSLstd450Cosh;
  7150. break;
  7151. case glslang::EOpSinh:
  7152. libCall = spv::GLSLstd450Sinh;
  7153. break;
  7154. case glslang::EOpLength:
  7155. libCall = spv::GLSLstd450Length;
  7156. break;
  7157. case glslang::EOpNormalize:
  7158. libCall = spv::GLSLstd450Normalize;
  7159. break;
  7160. case glslang::EOpExp:
  7161. libCall = spv::GLSLstd450Exp;
  7162. break;
  7163. case glslang::EOpLog:
  7164. libCall = spv::GLSLstd450Log;
  7165. break;
  7166. case glslang::EOpExp2:
  7167. libCall = spv::GLSLstd450Exp2;
  7168. break;
  7169. case glslang::EOpLog2:
  7170. libCall = spv::GLSLstd450Log2;
  7171. break;
  7172. case glslang::EOpSqrt:
  7173. libCall = spv::GLSLstd450Sqrt;
  7174. break;
  7175. case glslang::EOpInverseSqrt:
  7176. libCall = spv::GLSLstd450InverseSqrt;
  7177. break;
  7178. case glslang::EOpFloor:
  7179. libCall = spv::GLSLstd450Floor;
  7180. break;
  7181. case glslang::EOpTrunc:
  7182. libCall = spv::GLSLstd450Trunc;
  7183. break;
  7184. case glslang::EOpRound:
  7185. libCall = spv::GLSLstd450Round;
  7186. break;
  7187. case glslang::EOpRoundEven:
  7188. libCall = spv::GLSLstd450RoundEven;
  7189. break;
  7190. case glslang::EOpCeil:
  7191. libCall = spv::GLSLstd450Ceil;
  7192. break;
  7193. case glslang::EOpFract:
  7194. libCall = spv::GLSLstd450Fract;
  7195. break;
  7196. case glslang::EOpIsNan:
  7197. unaryOp = spv::Op::OpIsNan;
  7198. break;
  7199. case glslang::EOpIsInf:
  7200. unaryOp = spv::Op::OpIsInf;
  7201. break;
  7202. case glslang::EOpIsFinite:
  7203. unaryOp = spv::Op::OpIsFinite;
  7204. break;
  7205. case glslang::EOpFloatBitsToInt:
  7206. case glslang::EOpFloatBitsToUint:
  7207. case glslang::EOpIntBitsToFloat:
  7208. case glslang::EOpUintBitsToFloat:
  7209. case glslang::EOpDoubleBitsToInt64:
  7210. case glslang::EOpDoubleBitsToUint64:
  7211. case glslang::EOpInt64BitsToDouble:
  7212. case glslang::EOpUint64BitsToDouble:
  7213. case glslang::EOpFloat16BitsToInt16:
  7214. case glslang::EOpFloat16BitsToUint16:
  7215. case glslang::EOpInt16BitsToFloat16:
  7216. case glslang::EOpUint16BitsToFloat16:
  7217. unaryOp = spv::Op::OpBitcast;
  7218. break;
  7219. case glslang::EOpPackSnorm2x16:
  7220. libCall = spv::GLSLstd450PackSnorm2x16;
  7221. break;
  7222. case glslang::EOpUnpackSnorm2x16:
  7223. libCall = spv::GLSLstd450UnpackSnorm2x16;
  7224. break;
  7225. case glslang::EOpPackUnorm2x16:
  7226. libCall = spv::GLSLstd450PackUnorm2x16;
  7227. break;
  7228. case glslang::EOpUnpackUnorm2x16:
  7229. libCall = spv::GLSLstd450UnpackUnorm2x16;
  7230. break;
  7231. case glslang::EOpPackHalf2x16:
  7232. libCall = spv::GLSLstd450PackHalf2x16;
  7233. break;
  7234. case glslang::EOpUnpackHalf2x16:
  7235. libCall = spv::GLSLstd450UnpackHalf2x16;
  7236. break;
  7237. case glslang::EOpPackSnorm4x8:
  7238. libCall = spv::GLSLstd450PackSnorm4x8;
  7239. break;
  7240. case glslang::EOpUnpackSnorm4x8:
  7241. libCall = spv::GLSLstd450UnpackSnorm4x8;
  7242. break;
  7243. case glslang::EOpPackUnorm4x8:
  7244. libCall = spv::GLSLstd450PackUnorm4x8;
  7245. break;
  7246. case glslang::EOpUnpackUnorm4x8:
  7247. libCall = spv::GLSLstd450UnpackUnorm4x8;
  7248. break;
  7249. case glslang::EOpPackDouble2x32:
  7250. libCall = spv::GLSLstd450PackDouble2x32;
  7251. break;
  7252. case glslang::EOpUnpackDouble2x32:
  7253. libCall = spv::GLSLstd450UnpackDouble2x32;
  7254. break;
  7255. case glslang::EOpPackInt2x32:
  7256. case glslang::EOpUnpackInt2x32:
  7257. case glslang::EOpPackUint2x32:
  7258. case glslang::EOpUnpackUint2x32:
  7259. case glslang::EOpPack16:
  7260. case glslang::EOpPack32:
  7261. case glslang::EOpPack64:
  7262. case glslang::EOpUnpack32:
  7263. case glslang::EOpUnpack16:
  7264. case glslang::EOpUnpack8:
  7265. case glslang::EOpPackInt2x16:
  7266. case glslang::EOpUnpackInt2x16:
  7267. case glslang::EOpPackUint2x16:
  7268. case glslang::EOpUnpackUint2x16:
  7269. case glslang::EOpPackInt4x16:
  7270. case glslang::EOpUnpackInt4x16:
  7271. case glslang::EOpPackUint4x16:
  7272. case glslang::EOpUnpackUint4x16:
  7273. case glslang::EOpPackFloat2x16:
  7274. case glslang::EOpUnpackFloat2x16:
  7275. unaryOp = spv::Op::OpBitcast;
  7276. break;
  7277. case glslang::EOpDPdx:
  7278. unaryOp = spv::Op::OpDPdx;
  7279. break;
  7280. case glslang::EOpDPdy:
  7281. unaryOp = spv::Op::OpDPdy;
  7282. break;
  7283. case glslang::EOpFwidth:
  7284. unaryOp = spv::Op::OpFwidth;
  7285. break;
  7286. case glslang::EOpAny:
  7287. unaryOp = spv::Op::OpAny;
  7288. break;
  7289. case glslang::EOpAll:
  7290. unaryOp = spv::Op::OpAll;
  7291. break;
  7292. case glslang::EOpAbs:
  7293. if (isFloat)
  7294. libCall = spv::GLSLstd450FAbs;
  7295. else
  7296. libCall = spv::GLSLstd450SAbs;
  7297. break;
  7298. case glslang::EOpSign:
  7299. if (isFloat)
  7300. libCall = spv::GLSLstd450FSign;
  7301. else
  7302. libCall = spv::GLSLstd450SSign;
  7303. break;
  7304. case glslang::EOpDPdxFine:
  7305. unaryOp = spv::Op::OpDPdxFine;
  7306. break;
  7307. case glslang::EOpDPdyFine:
  7308. unaryOp = spv::Op::OpDPdyFine;
  7309. break;
  7310. case glslang::EOpFwidthFine:
  7311. unaryOp = spv::Op::OpFwidthFine;
  7312. break;
  7313. case glslang::EOpDPdxCoarse:
  7314. unaryOp = spv::Op::OpDPdxCoarse;
  7315. break;
  7316. case glslang::EOpDPdyCoarse:
  7317. unaryOp = spv::Op::OpDPdyCoarse;
  7318. break;
  7319. case glslang::EOpFwidthCoarse:
  7320. unaryOp = spv::Op::OpFwidthCoarse;
  7321. break;
  7322. case glslang::EOpRayQueryProceed:
  7323. unaryOp = spv::Op::OpRayQueryProceedKHR;
  7324. break;
  7325. case glslang::EOpRayQueryGetRayTMin:
  7326. unaryOp = spv::Op::OpRayQueryGetRayTMinKHR;
  7327. break;
  7328. case glslang::EOpRayQueryGetRayFlags:
  7329. unaryOp = spv::Op::OpRayQueryGetRayFlagsKHR;
  7330. break;
  7331. case glslang::EOpRayQueryGetWorldRayOrigin:
  7332. unaryOp = spv::Op::OpRayQueryGetWorldRayOriginKHR;
  7333. break;
  7334. case glslang::EOpRayQueryGetWorldRayDirection:
  7335. unaryOp = spv::Op::OpRayQueryGetWorldRayDirectionKHR;
  7336. break;
  7337. case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
  7338. unaryOp = spv::Op::OpRayQueryGetIntersectionCandidateAABBOpaqueKHR;
  7339. break;
  7340. case glslang::EOpInterpolateAtCentroid:
  7341. if (typeProxy == glslang::EbtFloat16)
  7342. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  7343. libCall = spv::GLSLstd450InterpolateAtCentroid;
  7344. break;
  7345. case glslang::EOpAtomicCounterIncrement:
  7346. case glslang::EOpAtomicCounterDecrement:
  7347. case glslang::EOpAtomicCounter:
  7348. {
  7349. // Handle all of the atomics in one place, in createAtomicOperation()
  7350. std::vector<spv::Id> operands;
  7351. operands.push_back(operand);
  7352. return createAtomicOperation(op, decorations.precision, typeId, operands, typeProxy, lvalueCoherentFlags, opType);
  7353. }
  7354. case glslang::EOpBitFieldReverse:
  7355. unaryOp = spv::Op::OpBitReverse;
  7356. break;
  7357. case glslang::EOpBitCount:
  7358. unaryOp = spv::Op::OpBitCount;
  7359. break;
  7360. case glslang::EOpFindLSB:
  7361. libCall = spv::GLSLstd450FindILsb;
  7362. break;
  7363. case glslang::EOpFindMSB:
  7364. if (isUnsigned)
  7365. libCall = spv::GLSLstd450FindUMsb;
  7366. else
  7367. libCall = spv::GLSLstd450FindSMsb;
  7368. break;
  7369. case glslang::EOpCountLeadingZeros:
  7370. builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
  7371. builder.addExtension("SPV_INTEL_shader_integer_functions2");
  7372. unaryOp = spv::Op::OpUCountLeadingZerosINTEL;
  7373. break;
  7374. case glslang::EOpCountTrailingZeros:
  7375. builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
  7376. builder.addExtension("SPV_INTEL_shader_integer_functions2");
  7377. unaryOp = spv::Op::OpUCountTrailingZerosINTEL;
  7378. break;
  7379. case glslang::EOpBallot:
  7380. case glslang::EOpReadFirstInvocation:
  7381. case glslang::EOpAnyInvocation:
  7382. case glslang::EOpAllInvocations:
  7383. case glslang::EOpAllInvocationsEqual:
  7384. case glslang::EOpMinInvocations:
  7385. case glslang::EOpMaxInvocations:
  7386. case glslang::EOpAddInvocations:
  7387. case glslang::EOpMinInvocationsNonUniform:
  7388. case glslang::EOpMaxInvocationsNonUniform:
  7389. case glslang::EOpAddInvocationsNonUniform:
  7390. case glslang::EOpMinInvocationsInclusiveScan:
  7391. case glslang::EOpMaxInvocationsInclusiveScan:
  7392. case glslang::EOpAddInvocationsInclusiveScan:
  7393. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  7394. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  7395. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  7396. case glslang::EOpMinInvocationsExclusiveScan:
  7397. case glslang::EOpMaxInvocationsExclusiveScan:
  7398. case glslang::EOpAddInvocationsExclusiveScan:
  7399. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  7400. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  7401. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  7402. {
  7403. std::vector<spv::Id> operands;
  7404. operands.push_back(operand);
  7405. return createInvocationsOperation(op, typeId, operands, typeProxy);
  7406. }
  7407. case glslang::EOpSubgroupAll:
  7408. case glslang::EOpSubgroupAny:
  7409. case glslang::EOpSubgroupAllEqual:
  7410. case glslang::EOpSubgroupBroadcastFirst:
  7411. case glslang::EOpSubgroupBallot:
  7412. case glslang::EOpSubgroupInverseBallot:
  7413. case glslang::EOpSubgroupBallotBitCount:
  7414. case glslang::EOpSubgroupBallotInclusiveBitCount:
  7415. case glslang::EOpSubgroupBallotExclusiveBitCount:
  7416. case glslang::EOpSubgroupBallotFindLSB:
  7417. case glslang::EOpSubgroupBallotFindMSB:
  7418. case glslang::EOpSubgroupAdd:
  7419. case glslang::EOpSubgroupMul:
  7420. case glslang::EOpSubgroupMin:
  7421. case glslang::EOpSubgroupMax:
  7422. case glslang::EOpSubgroupAnd:
  7423. case glslang::EOpSubgroupOr:
  7424. case glslang::EOpSubgroupXor:
  7425. case glslang::EOpSubgroupInclusiveAdd:
  7426. case glslang::EOpSubgroupInclusiveMul:
  7427. case glslang::EOpSubgroupInclusiveMin:
  7428. case glslang::EOpSubgroupInclusiveMax:
  7429. case glslang::EOpSubgroupInclusiveAnd:
  7430. case glslang::EOpSubgroupInclusiveOr:
  7431. case glslang::EOpSubgroupInclusiveXor:
  7432. case glslang::EOpSubgroupExclusiveAdd:
  7433. case glslang::EOpSubgroupExclusiveMul:
  7434. case glslang::EOpSubgroupExclusiveMin:
  7435. case glslang::EOpSubgroupExclusiveMax:
  7436. case glslang::EOpSubgroupExclusiveAnd:
  7437. case glslang::EOpSubgroupExclusiveOr:
  7438. case glslang::EOpSubgroupExclusiveXor:
  7439. case glslang::EOpSubgroupQuadSwapHorizontal:
  7440. case glslang::EOpSubgroupQuadSwapVertical:
  7441. case glslang::EOpSubgroupQuadSwapDiagonal:
  7442. case glslang::EOpSubgroupQuadAll:
  7443. case glslang::EOpSubgroupQuadAny: {
  7444. std::vector<spv::Id> operands;
  7445. operands.push_back(operand);
  7446. return createSubgroupOperation(op, typeId, operands, typeProxy);
  7447. }
  7448. case glslang::EOpMbcnt:
  7449. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  7450. libCall = spv::MbcntAMD;
  7451. break;
  7452. case glslang::EOpCubeFaceIndex:
  7453. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);
  7454. libCall = spv::CubeFaceIndexAMD;
  7455. break;
  7456. case glslang::EOpCubeFaceCoord:
  7457. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);
  7458. libCall = spv::CubeFaceCoordAMD;
  7459. break;
  7460. case glslang::EOpSubgroupPartition:
  7461. unaryOp = spv::Op::OpGroupNonUniformPartitionNV;
  7462. break;
  7463. case glslang::EOpConstructReference:
  7464. unaryOp = spv::Op::OpBitcast;
  7465. break;
  7466. case glslang::EOpConvUint64ToAccStruct:
  7467. case glslang::EOpConvUvec2ToAccStruct:
  7468. unaryOp = spv::Op::OpConvertUToAccelerationStructureKHR;
  7469. break;
  7470. case glslang::EOpHitObjectIsEmptyNV:
  7471. unaryOp = spv::Op::OpHitObjectIsEmptyNV;
  7472. break;
  7473. case glslang::EOpHitObjectIsEmptyEXT:
  7474. unaryOp = spv::Op::OpHitObjectIsEmptyEXT;
  7475. break;
  7476. case glslang::EOpHitObjectIsMissNV:
  7477. unaryOp = spv::Op::OpHitObjectIsMissNV;
  7478. break;
  7479. case glslang::EOpHitObjectIsMissEXT:
  7480. unaryOp = spv::Op::OpHitObjectIsMissEXT;
  7481. break;
  7482. case glslang::EOpHitObjectIsHitNV:
  7483. unaryOp = spv::Op::OpHitObjectIsHitNV;
  7484. break;
  7485. case glslang::EOpHitObjectIsHitEXT:
  7486. unaryOp = spv::Op::OpHitObjectIsHitEXT;
  7487. break;
  7488. case glslang::EOpHitObjectGetObjectRayOriginNV:
  7489. unaryOp = spv::Op::OpHitObjectGetObjectRayOriginNV;
  7490. break;
  7491. case glslang::EOpHitObjectGetObjectRayOriginEXT:
  7492. unaryOp = spv::Op::OpHitObjectGetObjectRayOriginEXT;
  7493. break;
  7494. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  7495. unaryOp = spv::Op::OpHitObjectGetObjectRayDirectionNV;
  7496. break;
  7497. case glslang::EOpHitObjectGetObjectRayDirectionEXT:
  7498. unaryOp = spv::Op::OpHitObjectGetObjectRayDirectionEXT;
  7499. break;
  7500. case glslang::EOpHitObjectGetWorldRayOriginNV:
  7501. unaryOp = spv::Op::OpHitObjectGetWorldRayOriginNV;
  7502. break;
  7503. case glslang::EOpHitObjectGetWorldRayOriginEXT:
  7504. unaryOp = spv::Op::OpHitObjectGetWorldRayOriginEXT;
  7505. break;
  7506. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  7507. unaryOp = spv::Op::OpHitObjectGetWorldRayDirectionNV;
  7508. break;
  7509. case glslang::EOpHitObjectGetWorldRayDirectionEXT:
  7510. unaryOp = spv::Op::OpHitObjectGetWorldRayDirectionEXT;
  7511. break;
  7512. case glslang::EOpHitObjectGetObjectToWorldNV:
  7513. unaryOp = spv::Op::OpHitObjectGetObjectToWorldNV;
  7514. break;
  7515. case glslang::EOpHitObjectGetObjectToWorldEXT:
  7516. unaryOp = spv::Op::OpHitObjectGetObjectToWorldEXT;
  7517. break;
  7518. case glslang::EOpHitObjectGetWorldToObjectNV:
  7519. unaryOp = spv::Op::OpHitObjectGetWorldToObjectNV;
  7520. break;
  7521. case glslang::EOpHitObjectGetWorldToObjectEXT:
  7522. unaryOp = spv::Op::OpHitObjectGetWorldToObjectEXT;
  7523. break;
  7524. case glslang::EOpHitObjectGetRayTMinNV:
  7525. unaryOp = spv::Op::OpHitObjectGetRayTMinNV;
  7526. break;
  7527. case glslang::EOpHitObjectGetRayTMinEXT:
  7528. unaryOp = spv::Op::OpHitObjectGetRayTMinEXT;
  7529. break;
  7530. case glslang::EOpHitObjectGetRayTMaxNV:
  7531. unaryOp = spv::Op::OpHitObjectGetRayTMaxNV;
  7532. break;
  7533. case glslang::EOpHitObjectGetRayTMaxEXT:
  7534. unaryOp = spv::Op::OpHitObjectGetRayTMaxEXT;
  7535. break;
  7536. case glslang::EOpHitObjectGetRayFlagsEXT:
  7537. unaryOp = spv::Op::OpHitObjectGetRayFlagsEXT;
  7538. break;
  7539. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  7540. unaryOp = spv::Op::OpHitObjectGetPrimitiveIndexNV;
  7541. break;
  7542. case glslang::EOpHitObjectGetPrimitiveIndexEXT:
  7543. unaryOp = spv::Op::OpHitObjectGetPrimitiveIndexEXT;
  7544. break;
  7545. case glslang::EOpHitObjectGetInstanceIdNV:
  7546. unaryOp = spv::Op::OpHitObjectGetInstanceIdNV;
  7547. break;
  7548. case glslang::EOpHitObjectGetInstanceIdEXT:
  7549. unaryOp = spv::Op::OpHitObjectGetInstanceIdEXT;
  7550. break;
  7551. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  7552. unaryOp = spv::Op::OpHitObjectGetInstanceCustomIndexNV;
  7553. break;
  7554. case glslang::EOpHitObjectGetInstanceCustomIndexEXT:
  7555. unaryOp = spv::Op::OpHitObjectGetInstanceCustomIndexEXT;
  7556. break;
  7557. case glslang::EOpHitObjectGetGeometryIndexNV:
  7558. unaryOp = spv::Op::OpHitObjectGetGeometryIndexNV;
  7559. break;
  7560. case glslang::EOpHitObjectGetGeometryIndexEXT:
  7561. unaryOp = spv::Op::OpHitObjectGetGeometryIndexEXT;
  7562. break;
  7563. case glslang::EOpHitObjectGetHitKindNV:
  7564. unaryOp = spv::Op::OpHitObjectGetHitKindNV;
  7565. break;
  7566. case glslang::EOpHitObjectGetHitKindEXT:
  7567. unaryOp = spv::Op::OpHitObjectGetHitKindEXT;
  7568. break;
  7569. case glslang::EOpHitObjectGetCurrentTimeNV:
  7570. unaryOp = spv::Op::OpHitObjectGetCurrentTimeNV;
  7571. break;
  7572. case glslang::EOpHitObjectGetCurrentTimeEXT:
  7573. unaryOp = spv::Op::OpHitObjectGetCurrentTimeEXT;
  7574. break;
  7575. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  7576. unaryOp = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexNV;
  7577. break;
  7578. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:
  7579. unaryOp = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexEXT;
  7580. break;
  7581. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  7582. unaryOp = spv::Op::OpHitObjectGetShaderRecordBufferHandleNV;
  7583. break;
  7584. case glslang::EOpHitObjectGetClusterIdNV:
  7585. unaryOp = spv::Op::OpHitObjectGetClusterIdNV;
  7586. builder.addExtension(spv::E_SPV_NV_cluster_acceleration_structure);
  7587. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7588. builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
  7589. break;
  7590. case glslang::EOpHitObjectGetSpherePositionNV:
  7591. unaryOp = spv::Op::OpHitObjectGetSpherePositionNV;
  7592. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7593. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7594. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  7595. break;
  7596. case glslang::EOpHitObjectGetSphereRadiusNV:
  7597. unaryOp = spv::Op::OpHitObjectGetSphereRadiusNV;
  7598. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7599. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7600. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  7601. break;
  7602. case glslang::EOpHitObjectIsSphereHitNV:
  7603. unaryOp = spv::Op::OpHitObjectIsSphereHitNV;
  7604. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7605. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7606. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  7607. break;
  7608. case glslang::EOpHitObjectIsLSSHitNV:
  7609. unaryOp = spv::Op::OpHitObjectIsLSSHitNV;
  7610. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7611. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7612. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  7613. break;
  7614. case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:
  7615. unaryOp = spv::Op::OpHitObjectGetShaderRecordBufferHandleEXT;
  7616. break;
  7617. case glslang::EOpFetchMicroTriangleVertexPositionNV:
  7618. unaryOp = spv::Op::OpFetchMicroTriangleVertexPositionNV;
  7619. break;
  7620. case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
  7621. unaryOp = spv::Op::OpFetchMicroTriangleVertexBarycentricNV;
  7622. break;
  7623. case glslang::EOpCopyObject:
  7624. unaryOp = spv::Op::OpCopyObject;
  7625. break;
  7626. case glslang::EOpDepthAttachmentReadEXT:
  7627. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  7628. builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
  7629. unaryOp = spv::Op::OpDepthAttachmentReadEXT;
  7630. decorations.precision = spv::NoPrecision;
  7631. break;
  7632. case glslang::EOpStencilAttachmentReadEXT:
  7633. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  7634. builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
  7635. unaryOp = spv::Op::OpStencilAttachmentReadEXT;
  7636. decorations.precision = spv::Decoration::RelaxedPrecision;
  7637. break;
  7638. default:
  7639. return 0;
  7640. }
  7641. spv::Id id;
  7642. if (libCall >= 0) {
  7643. std::vector<spv::Id> args;
  7644. args.push_back(operand);
  7645. id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, args);
  7646. } else {
  7647. id = builder.createUnaryOp(unaryOp, typeId, operand);
  7648. }
  7649. decorations.addNoContraction(builder, id);
  7650. decorations.addNonUniform(builder, id);
  7651. return builder.setPrecision(id, decorations.precision);
  7652. }
  7653. // Create a unary operation on a matrix
  7654. spv::Id TGlslangToSpvTraverser::createUnaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,
  7655. spv::Id operand, glslang::TBasicType /* typeProxy */)
  7656. {
  7657. // Handle unary operations vector by vector.
  7658. // The result type is the same type as the original type.
  7659. // The algorithm is to:
  7660. // - break the matrix into vectors
  7661. // - apply the operation to each vector
  7662. // - make a matrix out the vector results
  7663. // get the types sorted out
  7664. int numCols = builder.getNumColumns(operand);
  7665. int numRows = builder.getNumRows(operand);
  7666. spv::Id srcVecType = builder.makeVectorType(builder.getScalarTypeId(builder.getTypeId(operand)), numRows);
  7667. spv::Id destVecType = builder.makeVectorType(builder.getScalarTypeId(typeId), numRows);
  7668. std::vector<spv::Id> results;
  7669. // do each vector op
  7670. for (int c = 0; c < numCols; ++c) {
  7671. std::vector<unsigned int> indexes;
  7672. indexes.push_back(c);
  7673. spv::Id srcVec = builder.createCompositeExtract(operand, srcVecType, indexes);
  7674. spv::Id destVec = builder.createUnaryOp(op, destVecType, srcVec);
  7675. decorations.addNoContraction(builder, destVec);
  7676. decorations.addNonUniform(builder, destVec);
  7677. results.push_back(builder.setPrecision(destVec, decorations.precision));
  7678. }
  7679. // put the pieces together
  7680. spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);
  7681. decorations.addNonUniform(builder, result);
  7682. return result;
  7683. }
  7684. // For converting integers where both the bitwidth and the signedness could
  7685. // change, but only do the width change here. The caller is still responsible
  7686. // for the signedness conversion.
  7687. // destType is the final type that will be converted to, but this function
  7688. // may only be doing part of that conversion.
  7689. spv::Id TGlslangToSpvTraverser::createIntWidthConversion(spv::Id operand, int vectorSize, spv::Id destType,
  7690. glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType)
  7691. {
  7692. // Get the result type width, based on the type to convert to.
  7693. int width = GetNumBits(resultBasicType);
  7694. // Get the conversion operation and result type,
  7695. // based on the target width, but the source type.
  7696. spv::Id type = spv::NoType;
  7697. spv::Op convOp = spv::Op::OpNop;
  7698. if (isTypeSignedInt(operandBasicType)) {
  7699. convOp = spv::Op::OpSConvert;
  7700. type = builder.makeIntType(width);
  7701. } else {
  7702. convOp = spv::Op::OpUConvert;
  7703. type = builder.makeUintType(width);
  7704. }
  7705. if (builder.getOpCode(destType) == spv::Op::OpTypeCooperativeVectorNV) {
  7706. type = builder.makeCooperativeVectorTypeNV(type, builder.getCooperativeVectorNumComponents(destType));
  7707. } else if (vectorSize > 0)
  7708. type = builder.makeVectorType(type, vectorSize);
  7709. else if (builder.getOpCode(destType) == spv::Op::OpTypeCooperativeMatrixKHR ||
  7710. builder.getOpCode(destType) == spv::Op::OpTypeCooperativeMatrixNV) {
  7711. type = builder.makeCooperativeMatrixTypeWithSameShape(type, destType);
  7712. }
  7713. return builder.createUnaryOp(convOp, type, operand);
  7714. }
  7715. spv::Id TGlslangToSpvTraverser::createConversion(glslang::TOperator op, OpDecorations& decorations, spv::Id destType,
  7716. spv::Id operand, glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType)
  7717. {
  7718. spv::Op convOp = spv::Op::OpNop;
  7719. spv::Id zero = 0;
  7720. spv::Id one = 0;
  7721. int vectorSize = builder.isVectorType(destType) ? builder.getNumTypeComponents(destType) : 0;
  7722. if (IsOpNumericConv(op) || op == glslang::EOpConstructSaturated) {
  7723. if (isTypeSignedInt(operandBasicType) && isTypeFloat(resultBasicType)) {
  7724. convOp = spv::Op::OpConvertSToF;
  7725. }
  7726. if (isTypeUnsignedInt(operandBasicType) && isTypeFloat(resultBasicType)) {
  7727. convOp = spv::Op::OpConvertUToF;
  7728. }
  7729. if (isTypeFloat(operandBasicType) && isTypeSignedInt(resultBasicType)) {
  7730. convOp = spv::Op::OpConvertFToS;
  7731. }
  7732. if (isTypeFloat(operandBasicType) && isTypeUnsignedInt(resultBasicType)) {
  7733. convOp = spv::Op::OpConvertFToU;
  7734. }
  7735. if (isTypeSignedInt(operandBasicType) && isTypeSignedInt(resultBasicType)) {
  7736. convOp = spv::Op::OpSConvert;
  7737. }
  7738. if (isTypeUnsignedInt(operandBasicType) && isTypeUnsignedInt(resultBasicType)) {
  7739. convOp = spv::Op::OpUConvert;
  7740. }
  7741. if (isTypeFloat(operandBasicType) && isTypeFloat(resultBasicType)) {
  7742. convOp = spv::Op::OpFConvert;
  7743. if (builder.isMatrixType(destType))
  7744. return createUnaryMatrixOperation(convOp, decorations, destType, operand, operandBasicType);
  7745. }
  7746. if (isTypeInt(operandBasicType) && isTypeInt(resultBasicType) &&
  7747. isTypeUnsignedInt(operandBasicType) != isTypeUnsignedInt(resultBasicType)) {
  7748. if (GetNumBits(operandBasicType) != GetNumBits(resultBasicType)) {
  7749. // OpSConvert/OpUConvert + OpBitCast
  7750. operand = createIntWidthConversion(operand, vectorSize, destType, resultBasicType, operandBasicType);
  7751. }
  7752. if (builder.isInSpecConstCodeGenMode()) {
  7753. uint32_t bits = GetNumBits(resultBasicType);
  7754. spv::Id zeroType = builder.makeUintType(bits);
  7755. if (bits == 64) {
  7756. zero = builder.makeInt64Constant(zeroType, 0, false);
  7757. } else {
  7758. zero = builder.makeIntConstant(zeroType, 0, false);
  7759. }
  7760. zero = makeSmearedConstant(zero, vectorSize);
  7761. // Use OpIAdd, instead of OpBitcast to do the conversion when
  7762. // generating for OpSpecConstantOp instruction.
  7763. return builder.createBinOp(spv::Op::OpIAdd, destType, operand, zero);
  7764. }
  7765. // For normal run-time conversion instruction, use OpBitcast.
  7766. convOp = spv::Op::OpBitcast;
  7767. }
  7768. if (resultBasicType == glslang::EbtBool) {
  7769. uint32_t bits = GetNumBits(operandBasicType);
  7770. if (isTypeInt(operandBasicType)) {
  7771. spv::Id zeroType = builder.makeUintType(bits);
  7772. if (bits == 64) {
  7773. zero = builder.makeInt64Constant(zeroType, 0, false);
  7774. } else {
  7775. zero = builder.makeIntConstant(zeroType, 0, false);
  7776. }
  7777. zero = makeSmearedConstant(zero, vectorSize);
  7778. return builder.createBinOp(spv::Op::OpINotEqual, destType, operand, zero);
  7779. } else {
  7780. assert(isTypeFloat(operandBasicType));
  7781. if (bits == 64) {
  7782. zero = builder.makeDoubleConstant(0.0);
  7783. } else if (bits == 32) {
  7784. zero = builder.makeFloatConstant(0.0);
  7785. } else {
  7786. assert(bits == 16);
  7787. zero = builder.makeFloat16Constant(0.0);
  7788. }
  7789. zero = makeSmearedConstant(zero, vectorSize);
  7790. return builder.createBinOp(spv::Op::OpFUnordNotEqual, destType, operand, zero);
  7791. }
  7792. }
  7793. if (operandBasicType == glslang::EbtBool) {
  7794. uint32_t bits = GetNumBits(resultBasicType);
  7795. convOp = spv::Op::OpSelect;
  7796. if (isTypeInt(resultBasicType)) {
  7797. spv::Id zeroType = isTypeSignedInt(resultBasicType) ? builder.makeIntType(bits) : builder.makeUintType(bits);
  7798. if (bits == 64) {
  7799. zero = builder.makeInt64Constant(zeroType, 0, false);
  7800. one = builder.makeInt64Constant(zeroType, 1, false);
  7801. } else {
  7802. zero = builder.makeIntConstant(zeroType, 0, false);
  7803. one = builder.makeIntConstant(zeroType, 1, false);
  7804. }
  7805. } else {
  7806. assert(isTypeFloat(resultBasicType));
  7807. if (bits == 64) {
  7808. zero = builder.makeDoubleConstant(0.0);
  7809. one = builder.makeDoubleConstant(1.0);
  7810. } else if (bits == 32) {
  7811. zero = builder.makeFloatConstant(0.0);
  7812. one = builder.makeFloatConstant(1.0);
  7813. } else {
  7814. assert(bits == 16);
  7815. zero = builder.makeFloat16Constant(0.0);
  7816. one = builder.makeFloat16Constant(1.0);
  7817. }
  7818. }
  7819. }
  7820. }
  7821. if (convOp == spv::Op::OpNop) {
  7822. switch (op) {
  7823. case glslang::EOpConvUint64ToPtr:
  7824. convOp = spv::Op::OpConvertUToPtr;
  7825. break;
  7826. case glslang::EOpConvPtrToUint64:
  7827. convOp = spv::Op::OpConvertPtrToU;
  7828. break;
  7829. case glslang::EOpConvPtrToUvec2:
  7830. case glslang::EOpConvUvec2ToPtr:
  7831. convOp = spv::Op::OpBitcast;
  7832. break;
  7833. default:
  7834. break;
  7835. }
  7836. }
  7837. spv::Id result = 0;
  7838. if (convOp == spv::Op::OpNop)
  7839. return result;
  7840. if (convOp == spv::Op::OpSelect) {
  7841. zero = makeSmearedConstant(zero, vectorSize);
  7842. one = makeSmearedConstant(one, vectorSize);
  7843. result = builder.createTriOp(convOp, destType, operand, one, zero);
  7844. } else
  7845. result = builder.createUnaryOp(convOp, destType, operand);
  7846. result = builder.setPrecision(result, decorations.precision);
  7847. decorations.addNonUniform(builder, result);
  7848. return result;
  7849. }
  7850. spv::Id TGlslangToSpvTraverser::makeSmearedConstant(spv::Id constant, int vectorSize)
  7851. {
  7852. if (vectorSize == 0)
  7853. return constant;
  7854. spv::Id vectorTypeId = builder.makeVectorType(builder.getTypeId(constant), vectorSize);
  7855. std::vector<spv::Id> components;
  7856. for (int c = 0; c < vectorSize; ++c)
  7857. components.push_back(constant);
  7858. return builder.makeCompositeConstant(vectorTypeId, components);
  7859. }
  7860. // For glslang ops that map to SPV atomic opCodes
  7861. spv::Id TGlslangToSpvTraverser::createAtomicOperation(glslang::TOperator op, spv::Decoration /*precision*/,
  7862. spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy,
  7863. const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags, const glslang::TType &opType)
  7864. {
  7865. spv::Op opCode = spv::Op::OpNop;
  7866. switch (op) {
  7867. case glslang::EOpAtomicAdd:
  7868. case glslang::EOpImageAtomicAdd:
  7869. case glslang::EOpAtomicCounterAdd:
  7870. opCode = spv::Op::OpAtomicIAdd;
  7871. if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
  7872. opCode = spv::Op::OpAtomicFAddEXT;
  7873. if (typeProxy == glslang::EbtFloat16 &&
  7874. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  7875. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  7876. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  7877. } else {
  7878. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_add);
  7879. if (typeProxy == glslang::EbtFloat16) {
  7880. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float16_add);
  7881. builder.addCapability(spv::Capability::AtomicFloat16AddEXT);
  7882. } else if (typeProxy == glslang::EbtFloat) {
  7883. builder.addCapability(spv::Capability::AtomicFloat32AddEXT);
  7884. } else {
  7885. builder.addCapability(spv::Capability::AtomicFloat64AddEXT);
  7886. }
  7887. }
  7888. }
  7889. break;
  7890. case glslang::EOpAtomicSubtract:
  7891. case glslang::EOpAtomicCounterSubtract:
  7892. opCode = spv::Op::OpAtomicISub;
  7893. break;
  7894. case glslang::EOpAtomicMin:
  7895. case glslang::EOpImageAtomicMin:
  7896. case glslang::EOpAtomicCounterMin:
  7897. if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
  7898. opCode = spv::Op::OpAtomicFMinEXT;
  7899. if (typeProxy == glslang::EbtFloat16 &&
  7900. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  7901. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  7902. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  7903. } else {
  7904. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_min_max);
  7905. if (typeProxy == glslang::EbtFloat16)
  7906. builder.addCapability(spv::Capability::AtomicFloat16MinMaxEXT);
  7907. else if (typeProxy == glslang::EbtFloat)
  7908. builder.addCapability(spv::Capability::AtomicFloat32MinMaxEXT);
  7909. else
  7910. builder.addCapability(spv::Capability::AtomicFloat64MinMaxEXT);
  7911. }
  7912. } else if (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) {
  7913. opCode = spv::Op::OpAtomicUMin;
  7914. } else {
  7915. opCode = spv::Op::OpAtomicSMin;
  7916. }
  7917. break;
  7918. case glslang::EOpAtomicMax:
  7919. case glslang::EOpImageAtomicMax:
  7920. case glslang::EOpAtomicCounterMax:
  7921. if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
  7922. opCode = spv::Op::OpAtomicFMaxEXT;
  7923. if (typeProxy == glslang::EbtFloat16 &&
  7924. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  7925. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  7926. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  7927. } else {
  7928. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_min_max);
  7929. if (typeProxy == glslang::EbtFloat16)
  7930. builder.addCapability(spv::Capability::AtomicFloat16MinMaxEXT);
  7931. else if (typeProxy == glslang::EbtFloat)
  7932. builder.addCapability(spv::Capability::AtomicFloat32MinMaxEXT);
  7933. else
  7934. builder.addCapability(spv::Capability::AtomicFloat64MinMaxEXT);
  7935. }
  7936. } else if (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) {
  7937. opCode = spv::Op::OpAtomicUMax;
  7938. } else {
  7939. opCode = spv::Op::OpAtomicSMax;
  7940. }
  7941. break;
  7942. case glslang::EOpAtomicAnd:
  7943. case glslang::EOpImageAtomicAnd:
  7944. case glslang::EOpAtomicCounterAnd:
  7945. opCode = spv::Op::OpAtomicAnd;
  7946. break;
  7947. case glslang::EOpAtomicOr:
  7948. case glslang::EOpImageAtomicOr:
  7949. case glslang::EOpAtomicCounterOr:
  7950. opCode = spv::Op::OpAtomicOr;
  7951. break;
  7952. case glslang::EOpAtomicXor:
  7953. case glslang::EOpImageAtomicXor:
  7954. case glslang::EOpAtomicCounterXor:
  7955. opCode = spv::Op::OpAtomicXor;
  7956. break;
  7957. case glslang::EOpAtomicExchange:
  7958. case glslang::EOpImageAtomicExchange:
  7959. case glslang::EOpAtomicCounterExchange:
  7960. if ((typeProxy == glslang::EbtFloat16) &&
  7961. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  7962. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  7963. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  7964. }
  7965. opCode = spv::Op::OpAtomicExchange;
  7966. break;
  7967. case glslang::EOpAtomicCompSwap:
  7968. case glslang::EOpImageAtomicCompSwap:
  7969. case glslang::EOpAtomicCounterCompSwap:
  7970. opCode = spv::Op::OpAtomicCompareExchange;
  7971. break;
  7972. case glslang::EOpAtomicCounterIncrement:
  7973. opCode = spv::Op::OpAtomicIIncrement;
  7974. break;
  7975. case glslang::EOpAtomicCounterDecrement:
  7976. opCode = spv::Op::OpAtomicIDecrement;
  7977. break;
  7978. case glslang::EOpAtomicCounter:
  7979. case glslang::EOpImageAtomicLoad:
  7980. case glslang::EOpAtomicLoad:
  7981. opCode = spv::Op::OpAtomicLoad;
  7982. break;
  7983. case glslang::EOpAtomicStore:
  7984. case glslang::EOpImageAtomicStore:
  7985. opCode = spv::Op::OpAtomicStore;
  7986. break;
  7987. default:
  7988. assert(0);
  7989. break;
  7990. }
  7991. if (typeProxy == glslang::EbtInt64 || typeProxy == glslang::EbtUint64)
  7992. builder.addCapability(spv::Capability::Int64Atomics);
  7993. // Sort out the operands
  7994. // - mapping from glslang -> SPV
  7995. // - there are extra SPV operands that are optional in glslang
  7996. // - compare-exchange swaps the value and comparator
  7997. // - compare-exchange has an extra memory semantics
  7998. // - EOpAtomicCounterDecrement needs a post decrement
  7999. spv::Id pointerId = 0, compareId = 0, valueId = 0;
  8000. // scope defaults to Device in the old model, QueueFamilyKHR in the new model
  8001. spv::Id scopeId;
  8002. if (glslangIntermediate->usingVulkanMemoryModel()) {
  8003. scopeId = builder.makeUintConstant(spv::Scope::QueueFamilyKHR);
  8004. } else {
  8005. scopeId = builder.makeUintConstant(spv::Scope::Device);
  8006. }
  8007. // semantics default to relaxed
  8008. spv::Id semanticsId = builder.makeUintConstant(lvalueCoherentFlags.isVolatile() &&
  8009. glslangIntermediate->usingVulkanMemoryModel() ?
  8010. spv::MemorySemanticsMask::Volatile :
  8011. spv::MemorySemanticsMask::MaskNone);
  8012. spv::Id semanticsId2 = semanticsId;
  8013. pointerId = operands[0];
  8014. if (opCode == spv::Op::OpAtomicIIncrement || opCode == spv::Op::OpAtomicIDecrement) {
  8015. // no additional operands
  8016. } else if (opCode == spv::Op::OpAtomicCompareExchange) {
  8017. compareId = operands[1];
  8018. valueId = operands[2];
  8019. if (operands.size() > 3) {
  8020. scopeId = operands[3];
  8021. semanticsId = builder.makeUintConstant(
  8022. builder.getConstantScalar(operands[4]) | builder.getConstantScalar(operands[5]));
  8023. semanticsId2 = builder.makeUintConstant(
  8024. builder.getConstantScalar(operands[6]) | builder.getConstantScalar(operands[7]));
  8025. }
  8026. } else if (opCode == spv::Op::OpAtomicLoad) {
  8027. if (operands.size() > 1) {
  8028. scopeId = operands[1];
  8029. semanticsId = builder.makeUintConstant(
  8030. builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));
  8031. }
  8032. } else {
  8033. // atomic store or RMW
  8034. valueId = operands[1];
  8035. if (operands.size() > 2) {
  8036. scopeId = operands[2];
  8037. semanticsId = builder.makeUintConstant
  8038. (builder.getConstantScalar(operands[3]) | builder.getConstantScalar(operands[4]));
  8039. }
  8040. }
  8041. // Check for capabilities
  8042. auto const semanticsImmediate = (spv::MemorySemanticsMask)(builder.getConstantScalar(semanticsId) | builder.getConstantScalar(semanticsId2));
  8043. if (anySet(semanticsImmediate, spv::MemorySemanticsMask::MakeAvailableKHR |
  8044. spv::MemorySemanticsMask::MakeVisibleKHR |
  8045. spv::MemorySemanticsMask::OutputMemoryKHR |
  8046. spv::MemorySemanticsMask::Volatile)) {
  8047. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  8048. }
  8049. auto const scope = (spv::Scope)builder.getConstantScalar(scopeId);
  8050. if (scope == spv::Scope::QueueFamily) {
  8051. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  8052. }
  8053. if (glslangIntermediate->usingVulkanMemoryModel() && scope == spv::Scope::Device) {
  8054. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  8055. }
  8056. std::vector<spv::Id> spvAtomicOperands; // hold the spv operands
  8057. spvAtomicOperands.reserve(6);
  8058. spvAtomicOperands.push_back(pointerId);
  8059. spvAtomicOperands.push_back(scopeId);
  8060. spvAtomicOperands.push_back(semanticsId);
  8061. if (opCode == spv::Op::OpAtomicCompareExchange) {
  8062. spvAtomicOperands.push_back(semanticsId2);
  8063. spvAtomicOperands.push_back(valueId);
  8064. spvAtomicOperands.push_back(compareId);
  8065. } else if (opCode != spv::Op::OpAtomicLoad && opCode != spv::Op::OpAtomicIIncrement && opCode != spv::Op::OpAtomicIDecrement) {
  8066. spvAtomicOperands.push_back(valueId);
  8067. }
  8068. if (opCode == spv::Op::OpAtomicStore) {
  8069. builder.createNoResultOp(opCode, spvAtomicOperands);
  8070. return 0;
  8071. } else {
  8072. spv::Id resultId = builder.createOp(opCode, typeId, spvAtomicOperands);
  8073. // GLSL and HLSL atomic-counter decrement return post-decrement value,
  8074. // while SPIR-V returns pre-decrement value. Translate between these semantics.
  8075. if (op == glslang::EOpAtomicCounterDecrement)
  8076. resultId = builder.createBinOp(spv::Op::OpISub, typeId, resultId, builder.makeIntConstant(1));
  8077. return resultId;
  8078. }
  8079. }
  8080. // Create group invocation operations.
  8081. spv::Id TGlslangToSpvTraverser::createInvocationsOperation(glslang::TOperator op, spv::Id typeId,
  8082. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  8083. {
  8084. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  8085. bool isFloat = isTypeFloat(typeProxy);
  8086. spv::Op opCode = spv::Op::OpNop;
  8087. std::vector<spv::IdImmediate> spvGroupOperands;
  8088. spv::GroupOperation groupOperation = spv::GroupOperation::Max;
  8089. if (op == glslang::EOpBallot || op == glslang::EOpReadFirstInvocation ||
  8090. op == glslang::EOpReadInvocation) {
  8091. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  8092. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  8093. } else if (op == glslang::EOpAnyInvocation ||
  8094. op == glslang::EOpAllInvocations ||
  8095. op == glslang::EOpAllInvocationsEqual) {
  8096. builder.addExtension(spv::E_SPV_KHR_subgroup_vote);
  8097. builder.addCapability(spv::Capability::SubgroupVoteKHR);
  8098. } else {
  8099. builder.addCapability(spv::Capability::Groups);
  8100. if (op == glslang::EOpMinInvocationsNonUniform ||
  8101. op == glslang::EOpMaxInvocationsNonUniform ||
  8102. op == glslang::EOpAddInvocationsNonUniform ||
  8103. op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||
  8104. op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||
  8105. op == glslang::EOpAddInvocationsInclusiveScanNonUniform ||
  8106. op == glslang::EOpMinInvocationsExclusiveScanNonUniform ||
  8107. op == glslang::EOpMaxInvocationsExclusiveScanNonUniform ||
  8108. op == glslang::EOpAddInvocationsExclusiveScanNonUniform)
  8109. builder.addExtension(spv::E_SPV_AMD_shader_ballot);
  8110. switch (op) {
  8111. case glslang::EOpMinInvocations:
  8112. case glslang::EOpMaxInvocations:
  8113. case glslang::EOpAddInvocations:
  8114. case glslang::EOpMinInvocationsNonUniform:
  8115. case glslang::EOpMaxInvocationsNonUniform:
  8116. case glslang::EOpAddInvocationsNonUniform:
  8117. groupOperation = spv::GroupOperation::Reduce;
  8118. break;
  8119. case glslang::EOpMinInvocationsInclusiveScan:
  8120. case glslang::EOpMaxInvocationsInclusiveScan:
  8121. case glslang::EOpAddInvocationsInclusiveScan:
  8122. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  8123. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  8124. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  8125. groupOperation = spv::GroupOperation::InclusiveScan;
  8126. break;
  8127. case glslang::EOpMinInvocationsExclusiveScan:
  8128. case glslang::EOpMaxInvocationsExclusiveScan:
  8129. case glslang::EOpAddInvocationsExclusiveScan:
  8130. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  8131. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  8132. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  8133. groupOperation = spv::GroupOperation::ExclusiveScan;
  8134. break;
  8135. default:
  8136. break;
  8137. }
  8138. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8139. spvGroupOperands.push_back(scope);
  8140. if (groupOperation != spv::GroupOperation::Max) {
  8141. spv::IdImmediate groupOp = { false, (unsigned)groupOperation };
  8142. spvGroupOperands.push_back(groupOp);
  8143. }
  8144. }
  8145. for (auto opIt = operands.begin(); opIt != operands.end(); ++opIt) {
  8146. spv::IdImmediate op = { true, *opIt };
  8147. spvGroupOperands.push_back(op);
  8148. }
  8149. switch (op) {
  8150. case glslang::EOpAnyInvocation:
  8151. opCode = spv::Op::OpSubgroupAnyKHR;
  8152. break;
  8153. case glslang::EOpAllInvocations:
  8154. opCode = spv::Op::OpSubgroupAllKHR;
  8155. break;
  8156. case glslang::EOpAllInvocationsEqual:
  8157. opCode = spv::Op::OpSubgroupAllEqualKHR;
  8158. break;
  8159. case glslang::EOpReadInvocation:
  8160. opCode = spv::Op::OpSubgroupReadInvocationKHR;
  8161. if (builder.isVectorType(typeId))
  8162. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  8163. break;
  8164. case glslang::EOpReadFirstInvocation:
  8165. opCode = spv::Op::OpSubgroupFirstInvocationKHR;
  8166. if (builder.isVectorType(typeId))
  8167. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  8168. break;
  8169. case glslang::EOpBallot:
  8170. {
  8171. // NOTE: According to the spec, the result type of "OpSubgroupBallotKHR" must be a 4 component vector of 32
  8172. // bit integer types. The GLSL built-in function "ballotARB()" assumes the maximum number of invocations in
  8173. // a subgroup is 64. Thus, we have to convert uvec4.xy to uint64_t as follow:
  8174. //
  8175. // result = Bitcast(SubgroupBallotKHR(Predicate).xy)
  8176. //
  8177. spv::Id uintType = builder.makeUintType(32);
  8178. spv::Id uvec4Type = builder.makeVectorType(uintType, 4);
  8179. spv::Id result = builder.createOp(spv::Op::OpSubgroupBallotKHR, uvec4Type, spvGroupOperands);
  8180. std::vector<spv::Id> components;
  8181. components.push_back(builder.createCompositeExtract(result, uintType, 0));
  8182. components.push_back(builder.createCompositeExtract(result, uintType, 1));
  8183. spv::Id uvec2Type = builder.makeVectorType(uintType, 2);
  8184. return builder.createUnaryOp(spv::Op::OpBitcast, typeId,
  8185. builder.createCompositeConstruct(uvec2Type, components));
  8186. }
  8187. case glslang::EOpMinInvocations:
  8188. case glslang::EOpMaxInvocations:
  8189. case glslang::EOpAddInvocations:
  8190. case glslang::EOpMinInvocationsInclusiveScan:
  8191. case glslang::EOpMaxInvocationsInclusiveScan:
  8192. case glslang::EOpAddInvocationsInclusiveScan:
  8193. case glslang::EOpMinInvocationsExclusiveScan:
  8194. case glslang::EOpMaxInvocationsExclusiveScan:
  8195. case glslang::EOpAddInvocationsExclusiveScan:
  8196. if (op == glslang::EOpMinInvocations ||
  8197. op == glslang::EOpMinInvocationsInclusiveScan ||
  8198. op == glslang::EOpMinInvocationsExclusiveScan) {
  8199. if (isFloat)
  8200. opCode = spv::Op::OpGroupFMin;
  8201. else {
  8202. if (isUnsigned)
  8203. opCode = spv::Op::OpGroupUMin;
  8204. else
  8205. opCode = spv::Op::OpGroupSMin;
  8206. }
  8207. } else if (op == glslang::EOpMaxInvocations ||
  8208. op == glslang::EOpMaxInvocationsInclusiveScan ||
  8209. op == glslang::EOpMaxInvocationsExclusiveScan) {
  8210. if (isFloat)
  8211. opCode = spv::Op::OpGroupFMax;
  8212. else {
  8213. if (isUnsigned)
  8214. opCode = spv::Op::OpGroupUMax;
  8215. else
  8216. opCode = spv::Op::OpGroupSMax;
  8217. }
  8218. } else {
  8219. if (isFloat)
  8220. opCode = spv::Op::OpGroupFAdd;
  8221. else
  8222. opCode = spv::Op::OpGroupIAdd;
  8223. }
  8224. if (builder.isVectorType(typeId))
  8225. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  8226. break;
  8227. case glslang::EOpMinInvocationsNonUniform:
  8228. case glslang::EOpMaxInvocationsNonUniform:
  8229. case glslang::EOpAddInvocationsNonUniform:
  8230. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  8231. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  8232. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  8233. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  8234. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  8235. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  8236. if (op == glslang::EOpMinInvocationsNonUniform ||
  8237. op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||
  8238. op == glslang::EOpMinInvocationsExclusiveScanNonUniform) {
  8239. if (isFloat)
  8240. opCode = spv::Op::OpGroupFMinNonUniformAMD;
  8241. else {
  8242. if (isUnsigned)
  8243. opCode = spv::Op::OpGroupUMinNonUniformAMD;
  8244. else
  8245. opCode = spv::Op::OpGroupSMinNonUniformAMD;
  8246. }
  8247. }
  8248. else if (op == glslang::EOpMaxInvocationsNonUniform ||
  8249. op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||
  8250. op == glslang::EOpMaxInvocationsExclusiveScanNonUniform) {
  8251. if (isFloat)
  8252. opCode = spv::Op::OpGroupFMaxNonUniformAMD;
  8253. else {
  8254. if (isUnsigned)
  8255. opCode = spv::Op::OpGroupUMaxNonUniformAMD;
  8256. else
  8257. opCode = spv::Op::OpGroupSMaxNonUniformAMD;
  8258. }
  8259. }
  8260. else {
  8261. if (isFloat)
  8262. opCode = spv::Op::OpGroupFAddNonUniformAMD;
  8263. else
  8264. opCode = spv::Op::OpGroupIAddNonUniformAMD;
  8265. }
  8266. if (builder.isVectorType(typeId))
  8267. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  8268. break;
  8269. default:
  8270. logger->missingFunctionality("invocation operation");
  8271. return spv::NoResult;
  8272. }
  8273. assert(opCode != spv::Op::OpNop);
  8274. return builder.createOp(opCode, typeId, spvGroupOperands);
  8275. }
  8276. // Create group invocation operations on a vector
  8277. spv::Id TGlslangToSpvTraverser::CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,
  8278. spv::Id typeId, std::vector<spv::Id>& operands)
  8279. {
  8280. assert(op == spv::Op::OpGroupFMin || op == spv::Op::OpGroupUMin || op == spv::Op::OpGroupSMin ||
  8281. op == spv::Op::OpGroupFMax || op == spv::Op::OpGroupUMax || op == spv::Op::OpGroupSMax ||
  8282. op == spv::Op::OpGroupFAdd || op == spv::Op::OpGroupIAdd || op == spv::Op::OpGroupBroadcast ||
  8283. op == spv::Op::OpSubgroupReadInvocationKHR || op == spv::Op::OpSubgroupFirstInvocationKHR ||
  8284. op == spv::Op::OpGroupFMinNonUniformAMD || op == spv::Op::OpGroupUMinNonUniformAMD ||
  8285. op == spv::Op::OpGroupSMinNonUniformAMD ||
  8286. op == spv::Op::OpGroupFMaxNonUniformAMD || op == spv::Op::OpGroupUMaxNonUniformAMD ||
  8287. op == spv::Op::OpGroupSMaxNonUniformAMD ||
  8288. op == spv::Op::OpGroupFAddNonUniformAMD || op == spv::Op::OpGroupIAddNonUniformAMD);
  8289. // Handle group invocation operations scalar by scalar.
  8290. // The result type is the same type as the original type.
  8291. // The algorithm is to:
  8292. // - break the vector into scalars
  8293. // - apply the operation to each scalar
  8294. // - make a vector out the scalar results
  8295. // get the types sorted out
  8296. int numComponents = builder.getNumComponents(operands[0]);
  8297. spv::Id scalarType = builder.getScalarTypeId(builder.getTypeId(operands[0]));
  8298. std::vector<spv::Id> results;
  8299. // do each scalar op
  8300. for (int comp = 0; comp < numComponents; ++comp) {
  8301. std::vector<unsigned int> indexes;
  8302. indexes.push_back(comp);
  8303. spv::IdImmediate scalar = { true, builder.createCompositeExtract(operands[0], scalarType, indexes) };
  8304. std::vector<spv::IdImmediate> spvGroupOperands;
  8305. if (op == spv::Op::OpSubgroupReadInvocationKHR) {
  8306. spvGroupOperands.push_back(scalar);
  8307. spv::IdImmediate operand = { true, operands[1] };
  8308. spvGroupOperands.push_back(operand);
  8309. } else if (op == spv::Op::OpSubgroupFirstInvocationKHR) {
  8310. spvGroupOperands.push_back(scalar);
  8311. } else if (op == spv::Op::OpGroupBroadcast) {
  8312. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8313. spvGroupOperands.push_back(scope);
  8314. spvGroupOperands.push_back(scalar);
  8315. spv::IdImmediate operand = { true, operands[1] };
  8316. spvGroupOperands.push_back(operand);
  8317. } else {
  8318. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8319. spvGroupOperands.push_back(scope);
  8320. spv::IdImmediate groupOp = { false, (unsigned)groupOperation };
  8321. spvGroupOperands.push_back(groupOp);
  8322. spvGroupOperands.push_back(scalar);
  8323. }
  8324. results.push_back(builder.createOp(op, scalarType, spvGroupOperands));
  8325. }
  8326. // put the pieces together
  8327. return builder.createCompositeConstruct(typeId, results);
  8328. }
  8329. // Create subgroup invocation operations.
  8330. spv::Id TGlslangToSpvTraverser::createSubgroupOperation(glslang::TOperator op, spv::Id typeId,
  8331. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  8332. {
  8333. // Add the required capabilities.
  8334. switch (op) {
  8335. case glslang::EOpSubgroupElect:
  8336. builder.addCapability(spv::Capability::GroupNonUniform);
  8337. break;
  8338. case glslang::EOpSubgroupQuadAll:
  8339. case glslang::EOpSubgroupQuadAny:
  8340. builder.addExtension(spv::E_SPV_KHR_quad_control);
  8341. builder.addCapability(spv::Capability::QuadControlKHR);
  8342. [[fallthrough]];
  8343. case glslang::EOpSubgroupAll:
  8344. case glslang::EOpSubgroupAny:
  8345. case glslang::EOpSubgroupAllEqual:
  8346. builder.addCapability(spv::Capability::GroupNonUniform);
  8347. builder.addCapability(spv::Capability::GroupNonUniformVote);
  8348. break;
  8349. case glslang::EOpSubgroupBroadcast:
  8350. case glslang::EOpSubgroupBroadcastFirst:
  8351. case glslang::EOpSubgroupBallot:
  8352. case glslang::EOpSubgroupInverseBallot:
  8353. case glslang::EOpSubgroupBallotBitExtract:
  8354. case glslang::EOpSubgroupBallotBitCount:
  8355. case glslang::EOpSubgroupBallotInclusiveBitCount:
  8356. case glslang::EOpSubgroupBallotExclusiveBitCount:
  8357. case glslang::EOpSubgroupBallotFindLSB:
  8358. case glslang::EOpSubgroupBallotFindMSB:
  8359. builder.addCapability(spv::Capability::GroupNonUniform);
  8360. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  8361. break;
  8362. case glslang::EOpSubgroupRotate:
  8363. case glslang::EOpSubgroupClusteredRotate:
  8364. builder.addExtension(spv::E_SPV_KHR_subgroup_rotate);
  8365. builder.addCapability(spv::Capability::GroupNonUniformRotateKHR);
  8366. break;
  8367. case glslang::EOpSubgroupShuffle:
  8368. case glslang::EOpSubgroupShuffleXor:
  8369. builder.addCapability(spv::Capability::GroupNonUniform);
  8370. builder.addCapability(spv::Capability::GroupNonUniformShuffle);
  8371. break;
  8372. case glslang::EOpSubgroupShuffleUp:
  8373. case glslang::EOpSubgroupShuffleDown:
  8374. builder.addCapability(spv::Capability::GroupNonUniform);
  8375. builder.addCapability(spv::Capability::GroupNonUniformShuffleRelative);
  8376. break;
  8377. case glslang::EOpSubgroupAdd:
  8378. case glslang::EOpSubgroupMul:
  8379. case glslang::EOpSubgroupMin:
  8380. case glslang::EOpSubgroupMax:
  8381. case glslang::EOpSubgroupAnd:
  8382. case glslang::EOpSubgroupOr:
  8383. case glslang::EOpSubgroupXor:
  8384. case glslang::EOpSubgroupInclusiveAdd:
  8385. case glslang::EOpSubgroupInclusiveMul:
  8386. case glslang::EOpSubgroupInclusiveMin:
  8387. case glslang::EOpSubgroupInclusiveMax:
  8388. case glslang::EOpSubgroupInclusiveAnd:
  8389. case glslang::EOpSubgroupInclusiveOr:
  8390. case glslang::EOpSubgroupInclusiveXor:
  8391. case glslang::EOpSubgroupExclusiveAdd:
  8392. case glslang::EOpSubgroupExclusiveMul:
  8393. case glslang::EOpSubgroupExclusiveMin:
  8394. case glslang::EOpSubgroupExclusiveMax:
  8395. case glslang::EOpSubgroupExclusiveAnd:
  8396. case glslang::EOpSubgroupExclusiveOr:
  8397. case glslang::EOpSubgroupExclusiveXor:
  8398. builder.addCapability(spv::Capability::GroupNonUniform);
  8399. builder.addCapability(spv::Capability::GroupNonUniformArithmetic);
  8400. break;
  8401. case glslang::EOpSubgroupClusteredAdd:
  8402. case glslang::EOpSubgroupClusteredMul:
  8403. case glslang::EOpSubgroupClusteredMin:
  8404. case glslang::EOpSubgroupClusteredMax:
  8405. case glslang::EOpSubgroupClusteredAnd:
  8406. case glslang::EOpSubgroupClusteredOr:
  8407. case glslang::EOpSubgroupClusteredXor:
  8408. builder.addCapability(spv::Capability::GroupNonUniform);
  8409. builder.addCapability(spv::Capability::GroupNonUniformClustered);
  8410. break;
  8411. case glslang::EOpSubgroupQuadBroadcast:
  8412. case glslang::EOpSubgroupQuadSwapHorizontal:
  8413. case glslang::EOpSubgroupQuadSwapVertical:
  8414. case glslang::EOpSubgroupQuadSwapDiagonal:
  8415. builder.addCapability(spv::Capability::GroupNonUniform);
  8416. builder.addCapability(spv::Capability::GroupNonUniformQuad);
  8417. break;
  8418. case glslang::EOpSubgroupPartitionedAdd:
  8419. case glslang::EOpSubgroupPartitionedMul:
  8420. case glslang::EOpSubgroupPartitionedMin:
  8421. case glslang::EOpSubgroupPartitionedMax:
  8422. case glslang::EOpSubgroupPartitionedAnd:
  8423. case glslang::EOpSubgroupPartitionedOr:
  8424. case glslang::EOpSubgroupPartitionedXor:
  8425. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8426. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8427. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8428. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8429. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8430. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8431. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8432. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8433. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8434. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8435. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8436. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8437. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8438. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8439. builder.addExtension(spv::E_SPV_NV_shader_subgroup_partitioned);
  8440. builder.addCapability(spv::Capability::GroupNonUniformPartitionedNV);
  8441. break;
  8442. default: assert(0 && "Unhandled subgroup operation!");
  8443. }
  8444. const bool isUnsigned = isTypeUnsignedInt(typeProxy);
  8445. const bool isFloat = isTypeFloat(typeProxy);
  8446. const bool isBool = typeProxy == glslang::EbtBool;
  8447. spv::Op opCode = spv::Op::OpNop;
  8448. // Figure out which opcode to use.
  8449. switch (op) {
  8450. case glslang::EOpSubgroupElect: opCode = spv::Op::OpGroupNonUniformElect; break;
  8451. case glslang::EOpSubgroupQuadAll: opCode = spv::Op::OpGroupNonUniformQuadAllKHR; break;
  8452. case glslang::EOpSubgroupAll: opCode = spv::Op::OpGroupNonUniformAll; break;
  8453. case glslang::EOpSubgroupQuadAny: opCode = spv::Op::OpGroupNonUniformQuadAnyKHR; break;
  8454. case glslang::EOpSubgroupAny: opCode = spv::Op::OpGroupNonUniformAny; break;
  8455. case glslang::EOpSubgroupAllEqual: opCode = spv::Op::OpGroupNonUniformAllEqual; break;
  8456. case glslang::EOpSubgroupBroadcast: opCode = spv::Op::OpGroupNonUniformBroadcast; break;
  8457. case glslang::EOpSubgroupBroadcastFirst: opCode = spv::Op::OpGroupNonUniformBroadcastFirst; break;
  8458. case glslang::EOpSubgroupBallot: opCode = spv::Op::OpGroupNonUniformBallot; break;
  8459. case glslang::EOpSubgroupInverseBallot: opCode = spv::Op::OpGroupNonUniformInverseBallot; break;
  8460. case glslang::EOpSubgroupBallotBitExtract: opCode = spv::Op::OpGroupNonUniformBallotBitExtract; break;
  8461. case glslang::EOpSubgroupBallotBitCount:
  8462. case glslang::EOpSubgroupBallotInclusiveBitCount:
  8463. case glslang::EOpSubgroupBallotExclusiveBitCount: opCode = spv::Op::OpGroupNonUniformBallotBitCount; break;
  8464. case glslang::EOpSubgroupBallotFindLSB: opCode = spv::Op::OpGroupNonUniformBallotFindLSB; break;
  8465. case glslang::EOpSubgroupBallotFindMSB: opCode = spv::Op::OpGroupNonUniformBallotFindMSB; break;
  8466. case glslang::EOpSubgroupShuffle: opCode = spv::Op::OpGroupNonUniformShuffle; break;
  8467. case glslang::EOpSubgroupShuffleXor: opCode = spv::Op::OpGroupNonUniformShuffleXor; break;
  8468. case glslang::EOpSubgroupShuffleUp: opCode = spv::Op::OpGroupNonUniformShuffleUp; break;
  8469. case glslang::EOpSubgroupShuffleDown: opCode = spv::Op::OpGroupNonUniformShuffleDown; break;
  8470. case glslang::EOpSubgroupRotate:
  8471. case glslang::EOpSubgroupClusteredRotate: opCode = spv::Op::OpGroupNonUniformRotateKHR; break;
  8472. case glslang::EOpSubgroupAdd:
  8473. case glslang::EOpSubgroupInclusiveAdd:
  8474. case glslang::EOpSubgroupExclusiveAdd:
  8475. case glslang::EOpSubgroupClusteredAdd:
  8476. case glslang::EOpSubgroupPartitionedAdd:
  8477. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8478. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8479. if (isFloat) {
  8480. opCode = spv::Op::OpGroupNonUniformFAdd;
  8481. } else {
  8482. opCode = spv::Op::OpGroupNonUniformIAdd;
  8483. }
  8484. break;
  8485. case glslang::EOpSubgroupMul:
  8486. case glslang::EOpSubgroupInclusiveMul:
  8487. case glslang::EOpSubgroupExclusiveMul:
  8488. case glslang::EOpSubgroupClusteredMul:
  8489. case glslang::EOpSubgroupPartitionedMul:
  8490. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8491. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8492. if (isFloat) {
  8493. opCode = spv::Op::OpGroupNonUniformFMul;
  8494. } else {
  8495. opCode = spv::Op::OpGroupNonUniformIMul;
  8496. }
  8497. break;
  8498. case glslang::EOpSubgroupMin:
  8499. case glslang::EOpSubgroupInclusiveMin:
  8500. case glslang::EOpSubgroupExclusiveMin:
  8501. case glslang::EOpSubgroupClusteredMin:
  8502. case glslang::EOpSubgroupPartitionedMin:
  8503. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8504. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8505. if (isFloat) {
  8506. opCode = spv::Op::OpGroupNonUniformFMin;
  8507. } else if (isUnsigned) {
  8508. opCode = spv::Op::OpGroupNonUniformUMin;
  8509. } else {
  8510. opCode = spv::Op::OpGroupNonUniformSMin;
  8511. }
  8512. break;
  8513. case glslang::EOpSubgroupMax:
  8514. case glslang::EOpSubgroupInclusiveMax:
  8515. case glslang::EOpSubgroupExclusiveMax:
  8516. case glslang::EOpSubgroupClusteredMax:
  8517. case glslang::EOpSubgroupPartitionedMax:
  8518. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8519. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8520. if (isFloat) {
  8521. opCode = spv::Op::OpGroupNonUniformFMax;
  8522. } else if (isUnsigned) {
  8523. opCode = spv::Op::OpGroupNonUniformUMax;
  8524. } else {
  8525. opCode = spv::Op::OpGroupNonUniformSMax;
  8526. }
  8527. break;
  8528. case glslang::EOpSubgroupAnd:
  8529. case glslang::EOpSubgroupInclusiveAnd:
  8530. case glslang::EOpSubgroupExclusiveAnd:
  8531. case glslang::EOpSubgroupClusteredAnd:
  8532. case glslang::EOpSubgroupPartitionedAnd:
  8533. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8534. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8535. if (isBool) {
  8536. opCode = spv::Op::OpGroupNonUniformLogicalAnd;
  8537. } else {
  8538. opCode = spv::Op::OpGroupNonUniformBitwiseAnd;
  8539. }
  8540. break;
  8541. case glslang::EOpSubgroupOr:
  8542. case glslang::EOpSubgroupInclusiveOr:
  8543. case glslang::EOpSubgroupExclusiveOr:
  8544. case glslang::EOpSubgroupClusteredOr:
  8545. case glslang::EOpSubgroupPartitionedOr:
  8546. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8547. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8548. if (isBool) {
  8549. opCode = spv::Op::OpGroupNonUniformLogicalOr;
  8550. } else {
  8551. opCode = spv::Op::OpGroupNonUniformBitwiseOr;
  8552. }
  8553. break;
  8554. case glslang::EOpSubgroupXor:
  8555. case glslang::EOpSubgroupInclusiveXor:
  8556. case glslang::EOpSubgroupExclusiveXor:
  8557. case glslang::EOpSubgroupClusteredXor:
  8558. case glslang::EOpSubgroupPartitionedXor:
  8559. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8560. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8561. if (isBool) {
  8562. opCode = spv::Op::OpGroupNonUniformLogicalXor;
  8563. } else {
  8564. opCode = spv::Op::OpGroupNonUniformBitwiseXor;
  8565. }
  8566. break;
  8567. case glslang::EOpSubgroupQuadBroadcast: opCode = spv::Op::OpGroupNonUniformQuadBroadcast; break;
  8568. case glslang::EOpSubgroupQuadSwapHorizontal:
  8569. case glslang::EOpSubgroupQuadSwapVertical:
  8570. case glslang::EOpSubgroupQuadSwapDiagonal: opCode = spv::Op::OpGroupNonUniformQuadSwap; break;
  8571. default: assert(0 && "Unhandled subgroup operation!");
  8572. }
  8573. // get the right Group Operation
  8574. spv::GroupOperation groupOperation = spv::GroupOperation::Max;
  8575. switch (op) {
  8576. default:
  8577. break;
  8578. case glslang::EOpSubgroupBallotBitCount:
  8579. case glslang::EOpSubgroupAdd:
  8580. case glslang::EOpSubgroupMul:
  8581. case glslang::EOpSubgroupMin:
  8582. case glslang::EOpSubgroupMax:
  8583. case glslang::EOpSubgroupAnd:
  8584. case glslang::EOpSubgroupOr:
  8585. case glslang::EOpSubgroupXor:
  8586. groupOperation = spv::GroupOperation::Reduce;
  8587. break;
  8588. case glslang::EOpSubgroupBallotInclusiveBitCount:
  8589. case glslang::EOpSubgroupInclusiveAdd:
  8590. case glslang::EOpSubgroupInclusiveMul:
  8591. case glslang::EOpSubgroupInclusiveMin:
  8592. case glslang::EOpSubgroupInclusiveMax:
  8593. case glslang::EOpSubgroupInclusiveAnd:
  8594. case glslang::EOpSubgroupInclusiveOr:
  8595. case glslang::EOpSubgroupInclusiveXor:
  8596. groupOperation = spv::GroupOperation::InclusiveScan;
  8597. break;
  8598. case glslang::EOpSubgroupBallotExclusiveBitCount:
  8599. case glslang::EOpSubgroupExclusiveAdd:
  8600. case glslang::EOpSubgroupExclusiveMul:
  8601. case glslang::EOpSubgroupExclusiveMin:
  8602. case glslang::EOpSubgroupExclusiveMax:
  8603. case glslang::EOpSubgroupExclusiveAnd:
  8604. case glslang::EOpSubgroupExclusiveOr:
  8605. case glslang::EOpSubgroupExclusiveXor:
  8606. groupOperation = spv::GroupOperation::ExclusiveScan;
  8607. break;
  8608. case glslang::EOpSubgroupClusteredAdd:
  8609. case glslang::EOpSubgroupClusteredMul:
  8610. case glslang::EOpSubgroupClusteredMin:
  8611. case glslang::EOpSubgroupClusteredMax:
  8612. case glslang::EOpSubgroupClusteredAnd:
  8613. case glslang::EOpSubgroupClusteredOr:
  8614. case glslang::EOpSubgroupClusteredXor:
  8615. groupOperation = spv::GroupOperation::ClusteredReduce;
  8616. break;
  8617. case glslang::EOpSubgroupPartitionedAdd:
  8618. case glslang::EOpSubgroupPartitionedMul:
  8619. case glslang::EOpSubgroupPartitionedMin:
  8620. case glslang::EOpSubgroupPartitionedMax:
  8621. case glslang::EOpSubgroupPartitionedAnd:
  8622. case glslang::EOpSubgroupPartitionedOr:
  8623. case glslang::EOpSubgroupPartitionedXor:
  8624. groupOperation = spv::GroupOperation::PartitionedReduceNV;
  8625. break;
  8626. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8627. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8628. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8629. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8630. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8631. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8632. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8633. groupOperation = spv::GroupOperation::PartitionedInclusiveScanNV;
  8634. break;
  8635. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8636. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8637. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8638. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8639. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8640. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8641. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8642. groupOperation = spv::GroupOperation::PartitionedExclusiveScanNV;
  8643. break;
  8644. }
  8645. // build the instruction
  8646. std::vector<spv::IdImmediate> spvGroupOperands;
  8647. // Every operation begins with the Execution Scope operand.
  8648. spv::IdImmediate executionScope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8649. // All other ops need the execution scope. Quad Control Ops don't need scope, it's always Quad.
  8650. if (opCode != spv::Op::OpGroupNonUniformQuadAllKHR && opCode != spv::Op::OpGroupNonUniformQuadAnyKHR) {
  8651. spvGroupOperands.push_back(executionScope);
  8652. }
  8653. // Next, for all operations that use a Group Operation, push that as an operand.
  8654. if (groupOperation != spv::GroupOperation::Max) {
  8655. spv::IdImmediate groupOperand = { false, (unsigned)groupOperation };
  8656. spvGroupOperands.push_back(groupOperand);
  8657. }
  8658. // Push back the operands next.
  8659. for (auto opIt = operands.cbegin(); opIt != operands.cend(); ++opIt) {
  8660. spv::IdImmediate operand = { true, *opIt };
  8661. spvGroupOperands.push_back(operand);
  8662. }
  8663. // Some opcodes have additional operands.
  8664. spv::Id directionId = spv::NoResult;
  8665. switch (op) {
  8666. default: break;
  8667. case glslang::EOpSubgroupQuadSwapHorizontal: directionId = builder.makeUintConstant(0); break;
  8668. case glslang::EOpSubgroupQuadSwapVertical: directionId = builder.makeUintConstant(1); break;
  8669. case glslang::EOpSubgroupQuadSwapDiagonal: directionId = builder.makeUintConstant(2); break;
  8670. }
  8671. if (directionId != spv::NoResult) {
  8672. spv::IdImmediate direction = { true, directionId };
  8673. spvGroupOperands.push_back(direction);
  8674. }
  8675. return builder.createOp(opCode, typeId, spvGroupOperands);
  8676. }
  8677. spv::Id TGlslangToSpvTraverser::createMiscOperation(glslang::TOperator op, spv::Decoration precision,
  8678. spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  8679. {
  8680. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  8681. bool isFloat = isTypeFloat(typeProxy);
  8682. spv::Op opCode = spv::Op::OpNop;
  8683. int extBuiltins = -1;
  8684. int libCall = -1;
  8685. size_t consumedOperands = operands.size();
  8686. spv::Id typeId0 = 0;
  8687. if (consumedOperands > 0)
  8688. typeId0 = builder.getTypeId(operands[0]);
  8689. spv::Id typeId1 = 0;
  8690. if (consumedOperands > 1)
  8691. typeId1 = builder.getTypeId(operands[1]);
  8692. spv::Id frexpIntType = 0;
  8693. switch (op) {
  8694. case glslang::EOpMin:
  8695. if (isFloat)
  8696. libCall = nanMinMaxClamp ? spv::GLSLstd450NMin : spv::GLSLstd450FMin;
  8697. else if (isUnsigned)
  8698. libCall = spv::GLSLstd450UMin;
  8699. else
  8700. libCall = spv::GLSLstd450SMin;
  8701. builder.promoteScalar(precision, operands.front(), operands.back());
  8702. break;
  8703. case glslang::EOpModf:
  8704. {
  8705. libCall = spv::GLSLstd450ModfStruct;
  8706. assert(builder.isFloatType(builder.getScalarTypeId(typeId0)));
  8707. // The returned struct has two members of the same type as the first argument
  8708. typeId = builder.makeStructResultType(typeId0, typeId0);
  8709. consumedOperands = 1;
  8710. }
  8711. break;
  8712. case glslang::EOpMax:
  8713. if (isFloat)
  8714. libCall = nanMinMaxClamp ? spv::GLSLstd450NMax : spv::GLSLstd450FMax;
  8715. else if (isUnsigned)
  8716. libCall = spv::GLSLstd450UMax;
  8717. else
  8718. libCall = spv::GLSLstd450SMax;
  8719. builder.promoteScalar(precision, operands.front(), operands.back());
  8720. break;
  8721. case glslang::EOpPow:
  8722. libCall = spv::GLSLstd450Pow;
  8723. break;
  8724. case glslang::EOpDot:
  8725. case glslang::EOpDotPackedEXT:
  8726. case glslang::EOpDotAccSatEXT:
  8727. case glslang::EOpDotPackedAccSatEXT:
  8728. {
  8729. if (builder.isFloatType(builder.getScalarTypeId(typeId0)) ||
  8730. // HLSL supports dot(int,int) which is just a multiply
  8731. glslangIntermediate->getSource() == glslang::EShSourceHlsl) {
  8732. if (typeProxy == glslang::EbtBFloat16) {
  8733. builder.addExtension(spv::E_SPV_KHR_bfloat16);
  8734. builder.addCapability(spv::Capability::BFloat16DotProductKHR);
  8735. }
  8736. opCode = spv::Op::OpDot;
  8737. } else {
  8738. builder.addExtension(spv::E_SPV_KHR_integer_dot_product);
  8739. builder.addCapability(spv::Capability::DotProductKHR);
  8740. const unsigned int vectorSize = builder.getNumComponents(operands[0]);
  8741. if (op == glslang::EOpDotPackedEXT || op == glslang::EOpDotPackedAccSatEXT) {
  8742. builder.addCapability(spv::Capability::DotProductInput4x8BitPackedKHR);
  8743. } else if (vectorSize == 4 && builder.getScalarTypeWidth(typeId0) == 8) {
  8744. builder.addCapability(spv::Capability::DotProductInput4x8BitKHR);
  8745. } else {
  8746. builder.addCapability(spv::Capability::DotProductInputAllKHR);
  8747. }
  8748. const bool type0isSigned = builder.isIntType(builder.getScalarTypeId(typeId0));
  8749. const bool type1isSigned = builder.isIntType(builder.getScalarTypeId(typeId1));
  8750. const bool accSat = (op == glslang::EOpDotAccSatEXT || op == glslang::EOpDotPackedAccSatEXT);
  8751. if (!type0isSigned && !type1isSigned) {
  8752. opCode = accSat ? spv::Op::OpUDotAccSatKHR : spv::Op::OpUDotKHR;
  8753. } else if (type0isSigned && type1isSigned) {
  8754. opCode = accSat ? spv::Op::OpSDotAccSatKHR : spv::Op::OpSDotKHR;
  8755. } else {
  8756. opCode = accSat ? spv::Op::OpSUDotAccSatKHR : spv::Op::OpSUDotKHR;
  8757. // the spir-v opcode assumes the operands to be "signed, unsigned" in that order, so swap if needed
  8758. if (type1isSigned) {
  8759. std::swap(operands[0], operands[1]);
  8760. }
  8761. }
  8762. std::vector<spv::IdImmediate> operands2;
  8763. for (auto &o : operands) {
  8764. operands2.push_back({true, o});
  8765. }
  8766. if (op == glslang::EOpDotPackedEXT || op == glslang::EOpDotPackedAccSatEXT) {
  8767. operands2.push_back({false, 0});
  8768. }
  8769. return builder.createOp(opCode, typeId, operands2);
  8770. }
  8771. }
  8772. break;
  8773. case glslang::EOpAtan:
  8774. libCall = spv::GLSLstd450Atan2;
  8775. break;
  8776. case glslang::EOpClamp:
  8777. if (isFloat)
  8778. libCall = nanMinMaxClamp ? spv::GLSLstd450NClamp : spv::GLSLstd450FClamp;
  8779. else if (isUnsigned)
  8780. libCall = spv::GLSLstd450UClamp;
  8781. else
  8782. libCall = spv::GLSLstd450SClamp;
  8783. builder.promoteScalar(precision, operands.front(), operands[1]);
  8784. builder.promoteScalar(precision, operands.front(), operands[2]);
  8785. break;
  8786. case glslang::EOpMix:
  8787. if (! builder.isBoolType(builder.getScalarTypeId(builder.getTypeId(operands.back())))) {
  8788. assert(isFloat);
  8789. libCall = spv::GLSLstd450FMix;
  8790. } else {
  8791. opCode = spv::Op::OpSelect;
  8792. std::swap(operands.front(), operands.back());
  8793. }
  8794. builder.promoteScalar(precision, operands.front(), operands.back());
  8795. break;
  8796. case glslang::EOpStep:
  8797. libCall = spv::GLSLstd450Step;
  8798. builder.promoteScalar(precision, operands.front(), operands.back());
  8799. break;
  8800. case glslang::EOpSmoothStep:
  8801. libCall = spv::GLSLstd450SmoothStep;
  8802. builder.promoteScalar(precision, operands[0], operands[2]);
  8803. builder.promoteScalar(precision, operands[1], operands[2]);
  8804. break;
  8805. case glslang::EOpDistance:
  8806. libCall = spv::GLSLstd450Distance;
  8807. break;
  8808. case glslang::EOpCross:
  8809. libCall = spv::GLSLstd450Cross;
  8810. break;
  8811. case glslang::EOpFaceForward:
  8812. libCall = spv::GLSLstd450FaceForward;
  8813. break;
  8814. case glslang::EOpReflect:
  8815. libCall = spv::GLSLstd450Reflect;
  8816. break;
  8817. case glslang::EOpRefract:
  8818. libCall = spv::GLSLstd450Refract;
  8819. break;
  8820. case glslang::EOpBarrier:
  8821. {
  8822. // This is for the extended controlBarrier function, with four operands.
  8823. // The unextended barrier() goes through createNoArgOperation.
  8824. assert(operands.size() == 4);
  8825. auto const executionScope = (spv::Scope)builder.getConstantScalar(operands[0]);
  8826. auto const memoryScope = (spv::Scope)builder.getConstantScalar(operands[1]);
  8827. auto const semantics = (spv::MemorySemanticsMask)(builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));
  8828. builder.createControlBarrier(executionScope, memoryScope,
  8829. semantics);
  8830. if (anySet(semantics, spv::MemorySemanticsMask::MakeAvailableKHR |
  8831. spv::MemorySemanticsMask::MakeVisibleKHR |
  8832. spv::MemorySemanticsMask::OutputMemoryKHR |
  8833. spv::MemorySemanticsMask::Volatile)) {
  8834. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  8835. }
  8836. if (glslangIntermediate->usingVulkanMemoryModel() && (executionScope == spv::Scope::Device ||
  8837. memoryScope == spv::Scope::Device)) {
  8838. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  8839. }
  8840. return 0;
  8841. }
  8842. break;
  8843. case glslang::EOpMemoryBarrier:
  8844. {
  8845. // This is for the extended memoryBarrier function, with three operands.
  8846. // The unextended memoryBarrier() goes through createNoArgOperation.
  8847. assert(operands.size() == 3);
  8848. auto const memoryScope = (spv::Scope)builder.getConstantScalar(operands[0]);
  8849. auto const semantics = (spv::MemorySemanticsMask)(builder.getConstantScalar(operands[1]) | builder.getConstantScalar(operands[2]));
  8850. builder.createMemoryBarrier(memoryScope, semantics);
  8851. if (anySet(semantics, spv::MemorySemanticsMask::MakeAvailableKHR |
  8852. spv::MemorySemanticsMask::MakeVisibleKHR |
  8853. spv::MemorySemanticsMask::OutputMemoryKHR |
  8854. spv::MemorySemanticsMask::Volatile)) {
  8855. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  8856. }
  8857. if (glslangIntermediate->usingVulkanMemoryModel() && memoryScope == spv::Scope::Device) {
  8858. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  8859. }
  8860. return 0;
  8861. }
  8862. break;
  8863. case glslang::EOpInterpolateAtSample:
  8864. if (typeProxy == glslang::EbtFloat16)
  8865. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  8866. libCall = spv::GLSLstd450InterpolateAtSample;
  8867. break;
  8868. case glslang::EOpInterpolateAtOffset:
  8869. if (typeProxy == glslang::EbtFloat16)
  8870. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  8871. libCall = spv::GLSLstd450InterpolateAtOffset;
  8872. break;
  8873. case glslang::EOpAddCarry:
  8874. opCode = spv::Op::OpIAddCarry;
  8875. typeId = builder.makeStructResultType(typeId0, typeId0);
  8876. consumedOperands = 2;
  8877. break;
  8878. case glslang::EOpSubBorrow:
  8879. opCode = spv::Op::OpISubBorrow;
  8880. typeId = builder.makeStructResultType(typeId0, typeId0);
  8881. consumedOperands = 2;
  8882. break;
  8883. case glslang::EOpUMulExtended:
  8884. opCode = spv::Op::OpUMulExtended;
  8885. typeId = builder.makeStructResultType(typeId0, typeId0);
  8886. consumedOperands = 2;
  8887. break;
  8888. case glslang::EOpIMulExtended:
  8889. opCode = spv::Op::OpSMulExtended;
  8890. typeId = builder.makeStructResultType(typeId0, typeId0);
  8891. consumedOperands = 2;
  8892. break;
  8893. case glslang::EOpBitfieldExtract:
  8894. if (isUnsigned)
  8895. opCode = spv::Op::OpBitFieldUExtract;
  8896. else
  8897. opCode = spv::Op::OpBitFieldSExtract;
  8898. break;
  8899. case glslang::EOpBitfieldInsert:
  8900. opCode = spv::Op::OpBitFieldInsert;
  8901. break;
  8902. case glslang::EOpFma:
  8903. libCall = spv::GLSLstd450Fma;
  8904. break;
  8905. case glslang::EOpFrexp:
  8906. {
  8907. libCall = spv::GLSLstd450FrexpStruct;
  8908. assert(builder.isPointerType(typeId1));
  8909. typeId1 = builder.getContainedTypeId(typeId1);
  8910. int width = builder.getScalarTypeWidth(typeId1);
  8911. if (width == 16)
  8912. // Using 16-bit exp operand, enable extension SPV_AMD_gpu_shader_int16
  8913. builder.addExtension(spv::E_SPV_AMD_gpu_shader_int16);
  8914. if (builder.getNumComponents(operands[0]) == 1)
  8915. frexpIntType = builder.makeIntegerType(width, true);
  8916. else
  8917. frexpIntType = builder.makeVectorType(builder.makeIntegerType(width, true),
  8918. builder.getNumComponents(operands[0]));
  8919. typeId = builder.makeStructResultType(typeId0, frexpIntType);
  8920. consumedOperands = 1;
  8921. }
  8922. break;
  8923. case glslang::EOpLdexp:
  8924. libCall = spv::GLSLstd450Ldexp;
  8925. break;
  8926. case glslang::EOpReadInvocation:
  8927. return createInvocationsOperation(op, typeId, operands, typeProxy);
  8928. case glslang::EOpSubgroupBroadcast:
  8929. case glslang::EOpSubgroupBallotBitExtract:
  8930. case glslang::EOpSubgroupShuffle:
  8931. case glslang::EOpSubgroupShuffleXor:
  8932. case glslang::EOpSubgroupShuffleUp:
  8933. case glslang::EOpSubgroupShuffleDown:
  8934. case glslang::EOpSubgroupRotate:
  8935. case glslang::EOpSubgroupClusteredRotate:
  8936. case glslang::EOpSubgroupClusteredAdd:
  8937. case glslang::EOpSubgroupClusteredMul:
  8938. case glslang::EOpSubgroupClusteredMin:
  8939. case glslang::EOpSubgroupClusteredMax:
  8940. case glslang::EOpSubgroupClusteredAnd:
  8941. case glslang::EOpSubgroupClusteredOr:
  8942. case glslang::EOpSubgroupClusteredXor:
  8943. case glslang::EOpSubgroupQuadBroadcast:
  8944. case glslang::EOpSubgroupPartitionedAdd:
  8945. case glslang::EOpSubgroupPartitionedMul:
  8946. case glslang::EOpSubgroupPartitionedMin:
  8947. case glslang::EOpSubgroupPartitionedMax:
  8948. case glslang::EOpSubgroupPartitionedAnd:
  8949. case glslang::EOpSubgroupPartitionedOr:
  8950. case glslang::EOpSubgroupPartitionedXor:
  8951. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8952. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8953. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8954. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8955. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8956. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8957. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8958. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8959. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8960. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8961. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8962. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8963. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8964. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8965. return createSubgroupOperation(op, typeId, operands, typeProxy);
  8966. case glslang::EOpSwizzleInvocations:
  8967. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  8968. libCall = spv::SwizzleInvocationsAMD;
  8969. break;
  8970. case glslang::EOpSwizzleInvocationsMasked:
  8971. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  8972. libCall = spv::SwizzleInvocationsMaskedAMD;
  8973. break;
  8974. case glslang::EOpWriteInvocation:
  8975. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  8976. libCall = spv::WriteInvocationAMD;
  8977. break;
  8978. case glslang::EOpMin3:
  8979. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  8980. if (isFloat)
  8981. libCall = spv::FMin3AMD;
  8982. else {
  8983. if (isUnsigned)
  8984. libCall = spv::UMin3AMD;
  8985. else
  8986. libCall = spv::SMin3AMD;
  8987. }
  8988. break;
  8989. case glslang::EOpMax3:
  8990. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  8991. if (isFloat)
  8992. libCall = spv::FMax3AMD;
  8993. else {
  8994. if (isUnsigned)
  8995. libCall = spv::UMax3AMD;
  8996. else
  8997. libCall = spv::SMax3AMD;
  8998. }
  8999. break;
  9000. case glslang::EOpMid3:
  9001. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  9002. if (isFloat)
  9003. libCall = spv::FMid3AMD;
  9004. else {
  9005. if (isUnsigned)
  9006. libCall = spv::UMid3AMD;
  9007. else
  9008. libCall = spv::SMid3AMD;
  9009. }
  9010. break;
  9011. case glslang::EOpInterpolateAtVertex:
  9012. if (typeProxy == glslang::EbtFloat16)
  9013. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  9014. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  9015. libCall = spv::InterpolateAtVertexAMD;
  9016. break;
  9017. case glslang::EOpReportIntersection:
  9018. typeId = builder.makeBoolType();
  9019. opCode = spv::Op::OpReportIntersectionKHR;
  9020. break;
  9021. case glslang::EOpTraceNV:
  9022. builder.createNoResultOp(spv::Op::OpTraceNV, operands);
  9023. return 0;
  9024. case glslang::EOpTraceRayMotionNV:
  9025. builder.addExtension(spv::E_SPV_NV_ray_tracing_motion_blur);
  9026. builder.addCapability(spv::Capability::RayTracingMotionBlurNV);
  9027. builder.createNoResultOp(spv::Op::OpTraceRayMotionNV, operands);
  9028. return 0;
  9029. case glslang::EOpTraceKHR:
  9030. builder.createNoResultOp(spv::Op::OpTraceRayKHR, operands);
  9031. return 0;
  9032. case glslang::EOpExecuteCallableNV:
  9033. builder.createNoResultOp(spv::Op::OpExecuteCallableNV, operands);
  9034. return 0;
  9035. case glslang::EOpExecuteCallableKHR:
  9036. builder.createNoResultOp(spv::Op::OpExecuteCallableKHR, operands);
  9037. return 0;
  9038. case glslang::EOpRayQueryInitialize:
  9039. builder.createNoResultOp(spv::Op::OpRayQueryInitializeKHR, operands);
  9040. return 0;
  9041. case glslang::EOpRayQueryTerminate:
  9042. builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR, operands);
  9043. return 0;
  9044. case glslang::EOpRayQueryGenerateIntersection:
  9045. builder.createNoResultOp(spv::Op::OpRayQueryGenerateIntersectionKHR, operands);
  9046. return 0;
  9047. case glslang::EOpRayQueryConfirmIntersection:
  9048. builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR, operands);
  9049. return 0;
  9050. case glslang::EOpRayQueryProceed:
  9051. typeId = builder.makeBoolType();
  9052. opCode = spv::Op::OpRayQueryProceedKHR;
  9053. break;
  9054. case glslang::EOpRayQueryGetIntersectionType:
  9055. typeId = builder.makeUintType(32);
  9056. opCode = spv::Op::OpRayQueryGetIntersectionTypeKHR;
  9057. break;
  9058. case glslang::EOpRayQueryGetRayTMin:
  9059. typeId = builder.makeFloatType(32);
  9060. opCode = spv::Op::OpRayQueryGetRayTMinKHR;
  9061. break;
  9062. case glslang::EOpRayQueryGetRayFlags:
  9063. typeId = builder.makeIntType(32);
  9064. opCode = spv::Op::OpRayQueryGetRayFlagsKHR;
  9065. break;
  9066. case glslang::EOpRayQueryGetIntersectionT:
  9067. typeId = builder.makeFloatType(32);
  9068. opCode = spv::Op::OpRayQueryGetIntersectionTKHR;
  9069. break;
  9070. case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
  9071. typeId = builder.makeIntType(32);
  9072. opCode = spv::Op::OpRayQueryGetIntersectionInstanceCustomIndexKHR;
  9073. break;
  9074. case glslang::EOpRayQueryGetIntersectionInstanceId:
  9075. typeId = builder.makeIntType(32);
  9076. opCode = spv::Op::OpRayQueryGetIntersectionInstanceIdKHR;
  9077. break;
  9078. case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
  9079. typeId = builder.makeUintType(32);
  9080. opCode = spv::Op::OpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffsetKHR;
  9081. break;
  9082. case glslang::EOpRayQueryGetIntersectionGeometryIndex:
  9083. typeId = builder.makeIntType(32);
  9084. opCode = spv::Op::OpRayQueryGetIntersectionGeometryIndexKHR;
  9085. break;
  9086. case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
  9087. typeId = builder.makeIntType(32);
  9088. opCode = spv::Op::OpRayQueryGetIntersectionPrimitiveIndexKHR;
  9089. break;
  9090. case glslang::EOpRayQueryGetIntersectionBarycentrics:
  9091. typeId = builder.makeVectorType(builder.makeFloatType(32), 2);
  9092. opCode = spv::Op::OpRayQueryGetIntersectionBarycentricsKHR;
  9093. break;
  9094. case glslang::EOpRayQueryGetIntersectionFrontFace:
  9095. typeId = builder.makeBoolType();
  9096. opCode = spv::Op::OpRayQueryGetIntersectionFrontFaceKHR;
  9097. break;
  9098. case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
  9099. typeId = builder.makeBoolType();
  9100. opCode = spv::Op::OpRayQueryGetIntersectionCandidateAABBOpaqueKHR;
  9101. break;
  9102. case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
  9103. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9104. opCode = spv::Op::OpRayQueryGetIntersectionObjectRayDirectionKHR;
  9105. break;
  9106. case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
  9107. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9108. opCode = spv::Op::OpRayQueryGetIntersectionObjectRayOriginKHR;
  9109. break;
  9110. case glslang::EOpRayQueryGetWorldRayDirection:
  9111. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9112. opCode = spv::Op::OpRayQueryGetWorldRayDirectionKHR;
  9113. break;
  9114. case glslang::EOpRayQueryGetWorldRayOrigin:
  9115. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9116. opCode = spv::Op::OpRayQueryGetWorldRayOriginKHR;
  9117. break;
  9118. case glslang::EOpRayQueryGetIntersectionObjectToWorld:
  9119. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  9120. opCode = spv::Op::OpRayQueryGetIntersectionObjectToWorldKHR;
  9121. break;
  9122. case glslang::EOpRayQueryGetIntersectionClusterIdNV:
  9123. typeId = builder.makeIntegerType(32, 1);
  9124. opCode = spv::Op::OpRayQueryGetClusterIdNV;
  9125. break;
  9126. case glslang::EOpRayQueryGetIntersectionWorldToObject:
  9127. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  9128. opCode = spv::Op::OpRayQueryGetIntersectionWorldToObjectKHR;
  9129. break;
  9130. case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
  9131. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9132. opCode = spv::Op::OpRayQueryGetIntersectionSpherePositionNV;
  9133. break;
  9134. case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
  9135. typeId = builder.makeFloatType(32);
  9136. opCode = spv::Op::OpRayQueryGetIntersectionSphereRadiusNV;
  9137. break;
  9138. case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
  9139. typeId = builder.makeFloatType(32);
  9140. opCode = spv::Op::OpRayQueryGetIntersectionLSSHitValueNV;
  9141. break;
  9142. case glslang::EOpRayQueryIsSphereHitNV:
  9143. typeId = builder.makeBoolType();
  9144. opCode = spv::Op::OpRayQueryIsSphereHitNV;
  9145. break;
  9146. case glslang::EOpRayQueryIsLSSHitNV:
  9147. typeId = builder.makeBoolType();
  9148. opCode = spv::Op::OpRayQueryIsLSSHitNV;
  9149. break;
  9150. case glslang::EOpWritePackedPrimitiveIndices4x8NV:
  9151. builder.createNoResultOp(spv::Op::OpWritePackedPrimitiveIndices4x8NV, operands);
  9152. return 0;
  9153. case glslang::EOpEmitMeshTasksEXT:
  9154. if (taskPayloadID)
  9155. operands.push_back(taskPayloadID);
  9156. // As per SPV_EXT_mesh_shader make it a terminating instruction in the current block
  9157. builder.makeStatementTerminator(spv::Op::OpEmitMeshTasksEXT, operands, "post-OpEmitMeshTasksEXT");
  9158. return 0;
  9159. case glslang::EOpSetMeshOutputsEXT:
  9160. builder.createNoResultOp(spv::Op::OpSetMeshOutputsEXT, operands);
  9161. return 0;
  9162. case glslang::EOpCooperativeMatrixMulAddNV:
  9163. opCode = spv::Op::OpCooperativeMatrixMulAddNV;
  9164. break;
  9165. case glslang::EOpHitObjectTraceRayNV:
  9166. builder.createNoResultOp(spv::Op::OpHitObjectTraceRayNV, operands);
  9167. return 0;
  9168. case glslang::EOpHitObjectTraceRayEXT:
  9169. builder.createNoResultOp(spv::Op::OpHitObjectTraceRayEXT, operands);
  9170. return 0;
  9171. case glslang::EOpHitObjectTraceRayMotionNV:
  9172. builder.createNoResultOp(spv::Op::OpHitObjectTraceRayMotionNV, operands);
  9173. return 0;
  9174. case glslang::EOpHitObjectTraceRayMotionEXT:
  9175. builder.createNoResultOp(spv::Op::OpHitObjectTraceRayMotionEXT, operands);
  9176. return 0;
  9177. case glslang::EOpHitObjectRecordHitNV:
  9178. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitNV, operands);
  9179. return 0;
  9180. case glslang::EOpHitObjectRecordHitMotionNV:
  9181. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitMotionNV, operands);
  9182. return 0;
  9183. case glslang::EOpHitObjectRecordHitWithIndexNV:
  9184. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitWithIndexNV, operands);
  9185. return 0;
  9186. case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
  9187. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitWithIndexMotionNV, operands);
  9188. return 0;
  9189. case glslang::EOpHitObjectRecordMissNV:
  9190. builder.createNoResultOp(spv::Op::OpHitObjectRecordMissNV, operands);
  9191. return 0;
  9192. case glslang::EOpHitObjectRecordMissEXT:
  9193. builder.createNoResultOp(spv::Op::OpHitObjectRecordMissEXT, operands);
  9194. return 0;
  9195. case glslang::EOpHitObjectRecordMissMotionNV:
  9196. builder.createNoResultOp(spv::Op::OpHitObjectRecordMissMotionNV, operands);
  9197. return 0;
  9198. case glslang::EOpHitObjectRecordMissMotionEXT:
  9199. builder.createNoResultOp(spv::Op::OpHitObjectRecordMissMotionEXT, operands);
  9200. return 0;
  9201. case glslang::EOpHitObjectExecuteShaderNV:
  9202. builder.createNoResultOp(spv::Op::OpHitObjectExecuteShaderNV, operands);
  9203. return 0;
  9204. case glslang::EOpHitObjectExecuteShaderEXT:
  9205. builder.createNoResultOp(spv::Op::OpHitObjectExecuteShaderEXT, operands);
  9206. return 0;
  9207. case glslang::EOpHitObjectIsEmptyNV:
  9208. typeId = builder.makeBoolType();
  9209. opCode = spv::Op::OpHitObjectIsEmptyNV;
  9210. break;
  9211. case glslang::EOpHitObjectIsEmptyEXT:
  9212. typeId = builder.makeBoolType();
  9213. opCode = spv::Op::OpHitObjectIsEmptyEXT;
  9214. break;
  9215. case glslang::EOpHitObjectIsMissNV:
  9216. typeId = builder.makeBoolType();
  9217. opCode = spv::Op::OpHitObjectIsMissNV;
  9218. break;
  9219. case glslang::EOpHitObjectIsMissEXT:
  9220. typeId = builder.makeBoolType();
  9221. opCode = spv::Op::OpHitObjectIsMissEXT;
  9222. break;
  9223. case glslang::EOpHitObjectIsHitNV:
  9224. typeId = builder.makeBoolType();
  9225. opCode = spv::Op::OpHitObjectIsHitNV;
  9226. break;
  9227. case glslang::EOpHitObjectIsSphereHitNV:
  9228. typeId = builder.makeBoolType();
  9229. opCode = spv::Op::OpHitObjectIsSphereHitNV;
  9230. break;
  9231. case glslang::EOpHitObjectIsLSSHitNV:
  9232. typeId = builder.makeBoolType();
  9233. opCode = spv::Op::OpHitObjectIsLSSHitNV;
  9234. break;
  9235. case glslang::EOpHitObjectIsHitEXT:
  9236. typeId = builder.makeBoolType();
  9237. opCode = spv::Op::OpHitObjectIsHitEXT;
  9238. break;
  9239. case glslang::EOpHitObjectGetRayTMinNV:
  9240. typeId = builder.makeFloatType(32);
  9241. opCode = spv::Op::OpHitObjectGetRayTMinNV;
  9242. break;
  9243. case glslang::EOpHitObjectGetRayTMinEXT:
  9244. typeId = builder.makeFloatType(32);
  9245. opCode = spv::Op::OpHitObjectGetRayTMinEXT;
  9246. break;
  9247. case glslang::EOpHitObjectGetRayTMaxNV:
  9248. typeId = builder.makeFloatType(32);
  9249. opCode = spv::Op::OpHitObjectGetRayTMaxNV;
  9250. break;
  9251. case glslang::EOpHitObjectGetRayTMaxEXT:
  9252. typeId = builder.makeFloatType(32);
  9253. opCode = spv::Op::OpHitObjectGetRayTMaxEXT;
  9254. break;
  9255. case glslang::EOpHitObjectGetRayFlagsEXT:
  9256. typeId = builder.makeIntegerType(32, 0);
  9257. opCode = spv::Op::OpHitObjectGetRayFlagsEXT;
  9258. break;
  9259. case glslang::EOpHitObjectGetObjectRayOriginNV:
  9260. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9261. opCode = spv::Op::OpHitObjectGetObjectRayOriginNV;
  9262. break;
  9263. case glslang::EOpHitObjectGetObjectRayOriginEXT:
  9264. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9265. opCode = spv::Op::OpHitObjectGetObjectRayOriginEXT;
  9266. break;
  9267. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  9268. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9269. opCode = spv::Op::OpHitObjectGetObjectRayDirectionNV;
  9270. break;
  9271. case glslang::EOpHitObjectGetObjectRayDirectionEXT:
  9272. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9273. opCode = spv::Op::OpHitObjectGetObjectRayDirectionEXT;
  9274. break;
  9275. case glslang::EOpHitObjectGetWorldRayOriginNV:
  9276. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9277. opCode = spv::Op::OpHitObjectGetWorldRayOriginNV;
  9278. break;
  9279. case glslang::EOpHitObjectGetWorldRayOriginEXT:
  9280. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9281. opCode = spv::Op::OpHitObjectGetWorldRayOriginEXT;
  9282. break;
  9283. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  9284. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9285. opCode = spv::Op::OpHitObjectGetWorldRayDirectionNV;
  9286. break;
  9287. case glslang::EOpHitObjectGetWorldRayDirectionEXT:
  9288. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9289. opCode = spv::Op::OpHitObjectGetWorldRayDirectionEXT;
  9290. break;
  9291. case glslang::EOpHitObjectGetWorldToObjectNV:
  9292. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  9293. opCode = spv::Op::OpHitObjectGetWorldToObjectNV;
  9294. break;
  9295. case glslang::EOpHitObjectGetWorldToObjectEXT:
  9296. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  9297. opCode = spv::Op::OpHitObjectGetWorldToObjectEXT;
  9298. break;
  9299. case glslang::EOpHitObjectGetObjectToWorldNV:
  9300. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  9301. opCode = spv::Op::OpHitObjectGetObjectToWorldNV;
  9302. break;
  9303. case glslang::EOpHitObjectGetObjectToWorldEXT:
  9304. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  9305. opCode = spv::Op::OpHitObjectGetObjectToWorldEXT;
  9306. break;
  9307. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  9308. typeId = builder.makeIntegerType(32, 1);
  9309. opCode = spv::Op::OpHitObjectGetInstanceCustomIndexNV;
  9310. break;
  9311. case glslang::EOpHitObjectGetInstanceCustomIndexEXT:
  9312. typeId = builder.makeIntegerType(32, 1);
  9313. opCode = spv::Op::OpHitObjectGetInstanceCustomIndexEXT;
  9314. break;
  9315. case glslang::EOpHitObjectGetInstanceIdNV:
  9316. typeId = builder.makeIntegerType(32, 1);
  9317. opCode = spv::Op::OpHitObjectGetInstanceIdNV;
  9318. break;
  9319. case glslang::EOpHitObjectGetInstanceIdEXT:
  9320. typeId = builder.makeIntegerType(32, 1);
  9321. opCode = spv::Op::OpHitObjectGetInstanceIdEXT;
  9322. break;
  9323. case glslang::EOpHitObjectGetGeometryIndexNV:
  9324. typeId = builder.makeIntegerType(32, 1);
  9325. opCode = spv::Op::OpHitObjectGetGeometryIndexNV;
  9326. break;
  9327. case glslang::EOpHitObjectGetGeometryIndexEXT:
  9328. typeId = builder.makeIntegerType(32, 1);
  9329. opCode = spv::Op::OpHitObjectGetGeometryIndexEXT;
  9330. break;
  9331. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  9332. typeId = builder.makeIntegerType(32, 1);
  9333. opCode = spv::Op::OpHitObjectGetPrimitiveIndexNV;
  9334. break;
  9335. case glslang::EOpHitObjectGetPrimitiveIndexEXT:
  9336. typeId = builder.makeIntegerType(32, 1);
  9337. opCode = spv::Op::OpHitObjectGetPrimitiveIndexEXT;
  9338. break;
  9339. case glslang::EOpHitObjectGetHitKindNV:
  9340. typeId = builder.makeIntegerType(32, 0);
  9341. opCode = spv::Op::OpHitObjectGetHitKindNV;
  9342. break;
  9343. case glslang::EOpHitObjectGetHitKindEXT:
  9344. typeId = builder.makeIntegerType(32, 0);
  9345. opCode = spv::Op::OpHitObjectGetHitKindEXT;
  9346. break;
  9347. case glslang::EOpHitObjectGetCurrentTimeNV:
  9348. typeId = builder.makeFloatType(32);
  9349. opCode = spv::Op::OpHitObjectGetCurrentTimeNV;
  9350. break;
  9351. case glslang::EOpHitObjectGetCurrentTimeEXT:
  9352. typeId = builder.makeFloatType(32);
  9353. opCode = spv::Op::OpHitObjectGetCurrentTimeEXT;
  9354. break;
  9355. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  9356. typeId = builder.makeIntegerType(32, 0);
  9357. opCode = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexNV;
  9358. return 0;
  9359. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:
  9360. typeId = builder.makeIntegerType(32, 0);
  9361. opCode = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexEXT;
  9362. return 0;
  9363. case glslang::EOpHitObjectGetAttributesNV:
  9364. builder.createNoResultOp(spv::Op::OpHitObjectGetAttributesNV, operands);
  9365. return 0;
  9366. case glslang::EOpHitObjectGetAttributesEXT:
  9367. builder.createNoResultOp(spv::Op::OpHitObjectGetAttributesEXT, operands);
  9368. return 0;
  9369. case glslang::EOpHitObjectRecordFromQueryEXT:
  9370. builder.createNoResultOp(spv::Op::OpHitObjectRecordFromQueryEXT, operands);
  9371. return 0;
  9372. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  9373. typeId = builder.makeVectorType(builder.makeUintType(32), 2);
  9374. opCode = spv::Op::OpHitObjectGetShaderRecordBufferHandleNV;
  9375. break;
  9376. case glslang::EOpHitObjectGetClusterIdNV:
  9377. typeId = builder.makeIntegerType(32, 1);
  9378. opCode = spv::Op::OpHitObjectGetClusterIdNV;
  9379. break;
  9380. case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:
  9381. typeId = builder.makeVectorType(builder.makeUintType(32), 2);
  9382. opCode = spv::Op::OpHitObjectGetShaderRecordBufferHandleEXT;
  9383. break;
  9384. case glslang::EOpHitObjectSetShaderBindingTableRecordIndexEXT:
  9385. builder.createNoResultOp(spv::Op::OpHitObjectSetShaderBindingTableRecordIndexEXT, operands);
  9386. return 0;
  9387. case glslang::EOpReorderThreadNV: {
  9388. if (operands.size() == 2) {
  9389. builder.createNoResultOp(spv::Op::OpReorderThreadWithHintNV, operands);
  9390. } else {
  9391. builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectNV, operands);
  9392. }
  9393. return 0;
  9394. }
  9395. case glslang::EOpReorderThreadEXT: {
  9396. if (operands.size() == 2) {
  9397. builder.createNoResultOp(spv::Op::OpReorderThreadWithHintEXT, operands);
  9398. } else {
  9399. builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectEXT, operands);
  9400. }
  9401. return 0;
  9402. }
  9403. case glslang::EOpHitObjectReorderExecuteEXT: {
  9404. if (operands.size() == 2) {
  9405. builder.createNoResultOp(spv::Op::OpHitObjectReorderExecuteShaderEXT, operands);
  9406. } else {
  9407. // GLSL intrinsic is
  9408. // hitObjectReorderExecuteEXT(hitObjectEXT hitObject, uint hint, uint bits,int payload) while
  9409. // SPIRV is hitObject id , payload id, optional hint id, optional bits id hence reorder operands
  9410. builder.createNoResultOp(spv::Op::OpHitObjectReorderExecuteShaderEXT, {operands[0], operands[3], operands[1], operands[2]});
  9411. }
  9412. return 0;
  9413. }
  9414. case glslang::EOpHitObjectTraceReorderExecuteEXT: {
  9415. if (operands.size() == 12) {
  9416. builder.createNoResultOp(spv::Op::OpHitObjectTraceReorderExecuteEXT, operands);
  9417. } else {
  9418. std::vector<spv::Id> argOperands;
  9419. std::copy(operands.begin(), operands.begin() + 11, std::back_inserter(argOperands));
  9420. argOperands.push_back(operands[13]);
  9421. argOperands.push_back(operands[11]);
  9422. argOperands.push_back(operands[12]);
  9423. builder.createNoResultOp(spv::Op::OpHitObjectTraceReorderExecuteEXT, argOperands);
  9424. }
  9425. return 0;
  9426. }
  9427. case glslang::EOpHitObjectTraceMotionReorderExecuteEXT: {
  9428. if (operands.size() == 13) {
  9429. builder.createNoResultOp(spv::Op::OpHitObjectTraceMotionReorderExecuteEXT, operands);
  9430. } else {
  9431. std::vector<spv::Id> argOperands;
  9432. std::copy(operands.begin(), operands.begin() + 12, std::back_inserter(argOperands));
  9433. argOperands.push_back(operands[14]);
  9434. argOperands.push_back(operands[12]);
  9435. argOperands.push_back(operands[13]);
  9436. builder.createNoResultOp(spv::Op::OpHitObjectTraceMotionReorderExecuteEXT, argOperands);
  9437. }
  9438. return 0;
  9439. }
  9440. case glslang::EOpImageSampleWeightedQCOM:
  9441. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9442. opCode = spv::Op::OpImageSampleWeightedQCOM;
  9443. addImageProcessingQCOMDecoration(operands[2], spv::Decoration::WeightTextureQCOM);
  9444. break;
  9445. case glslang::EOpImageBoxFilterQCOM:
  9446. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9447. opCode = spv::Op::OpImageBoxFilterQCOM;
  9448. break;
  9449. case glslang::EOpImageBlockMatchSADQCOM:
  9450. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9451. opCode = spv::Op::OpImageBlockMatchSADQCOM;
  9452. addImageProcessingQCOMDecoration(operands[0], spv::Decoration::BlockMatchTextureQCOM);
  9453. addImageProcessingQCOMDecoration(operands[2], spv::Decoration::BlockMatchTextureQCOM);
  9454. break;
  9455. case glslang::EOpImageBlockMatchSSDQCOM:
  9456. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9457. opCode = spv::Op::OpImageBlockMatchSSDQCOM;
  9458. addImageProcessingQCOMDecoration(operands[0], spv::Decoration::BlockMatchTextureQCOM);
  9459. addImageProcessingQCOMDecoration(operands[2], spv::Decoration::BlockMatchTextureQCOM);
  9460. break;
  9461. case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
  9462. typeId = builder.makeVectorType(builder.makeFloatType(32), 2);
  9463. opCode = spv::Op::OpFetchMicroTriangleVertexBarycentricNV;
  9464. break;
  9465. case glslang::EOpFetchMicroTriangleVertexPositionNV:
  9466. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9467. opCode = spv::Op::OpFetchMicroTriangleVertexPositionNV;
  9468. break;
  9469. case glslang::EOpImageBlockMatchWindowSSDQCOM:
  9470. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9471. opCode = spv::Op::OpImageBlockMatchWindowSSDQCOM;
  9472. addImageProcessing2QCOMDecoration(operands[0], false);
  9473. addImageProcessing2QCOMDecoration(operands[2], false);
  9474. break;
  9475. case glslang::EOpImageBlockMatchWindowSADQCOM:
  9476. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9477. opCode = spv::Op::OpImageBlockMatchWindowSADQCOM;
  9478. addImageProcessing2QCOMDecoration(operands[0], false);
  9479. addImageProcessing2QCOMDecoration(operands[2], false);
  9480. break;
  9481. case glslang::EOpImageBlockMatchGatherSSDQCOM:
  9482. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9483. opCode = spv::Op::OpImageBlockMatchGatherSSDQCOM;
  9484. addImageProcessing2QCOMDecoration(operands[0], true);
  9485. addImageProcessing2QCOMDecoration(operands[2], true);
  9486. break;
  9487. case glslang::EOpImageBlockMatchGatherSADQCOM:
  9488. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9489. opCode = spv::Op::OpImageBlockMatchGatherSADQCOM;
  9490. addImageProcessing2QCOMDecoration(operands[0], true);
  9491. addImageProcessing2QCOMDecoration(operands[2], true);
  9492. break;
  9493. case glslang::EOpCreateTensorLayoutNV:
  9494. return builder.createOp(spv::Op::OpCreateTensorLayoutNV, typeId, std::vector<spv::Id>{});
  9495. case glslang::EOpCreateTensorViewNV:
  9496. return builder.createOp(spv::Op::OpCreateTensorViewNV, typeId, std::vector<spv::Id>{});
  9497. case glslang::EOpTensorLayoutSetBlockSizeNV:
  9498. opCode = spv::Op::OpTensorLayoutSetBlockSizeNV;
  9499. break;
  9500. case glslang::EOpTensorLayoutSetDimensionNV:
  9501. opCode = spv::Op::OpTensorLayoutSetDimensionNV;
  9502. break;
  9503. case glslang::EOpTensorLayoutSetStrideNV:
  9504. opCode = spv::Op::OpTensorLayoutSetStrideNV;
  9505. break;
  9506. case glslang::EOpTensorLayoutSliceNV:
  9507. opCode = spv::Op::OpTensorLayoutSliceNV;
  9508. break;
  9509. case glslang::EOpTensorLayoutSetClampValueNV:
  9510. opCode = spv::Op::OpTensorLayoutSetClampValueNV;
  9511. break;
  9512. case glslang::EOpTensorViewSetDimensionNV:
  9513. opCode = spv::Op::OpTensorViewSetDimensionNV;
  9514. break;
  9515. case glslang::EOpTensorViewSetStrideNV:
  9516. opCode = spv::Op::OpTensorViewSetStrideNV;
  9517. break;
  9518. case glslang::EOpTensorViewSetClipNV:
  9519. opCode = spv::Op::OpTensorViewSetClipNV;
  9520. break;
  9521. default:
  9522. return 0;
  9523. }
  9524. spv::Id id = 0;
  9525. if (libCall >= 0) {
  9526. // Use an extended instruction from the standard library.
  9527. // Construct the call arguments, without modifying the original operands vector.
  9528. // We might need the remaining arguments, e.g. in the EOpFrexp case.
  9529. std::vector<spv::Id> callArguments(operands.begin(), operands.begin() + consumedOperands);
  9530. id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, callArguments);
  9531. } else if (opCode == spv::Op::OpDot && !isFloat) {
  9532. // int dot(int, int)
  9533. // NOTE: never called for scalar/vector1, this is turned into simple mul before this can be reached
  9534. const int componentCount = builder.getNumComponents(operands[0]);
  9535. spv::Id mulOp = builder.createBinOp(spv::Op::OpIMul, builder.getTypeId(operands[0]), operands[0], operands[1]);
  9536. builder.setPrecision(mulOp, precision);
  9537. id = builder.createCompositeExtract(mulOp, typeId, 0);
  9538. for (int i = 1; i < componentCount; ++i) {
  9539. builder.setPrecision(id, precision);
  9540. id = builder.createBinOp(spv::Op::OpIAdd, typeId, id, builder.createCompositeExtract(mulOp, typeId, i));
  9541. }
  9542. } else {
  9543. switch (consumedOperands) {
  9544. case 0:
  9545. // should all be handled by visitAggregate and createNoArgOperation
  9546. assert(0);
  9547. return 0;
  9548. case 1:
  9549. // should all be handled by createUnaryOperation
  9550. assert(0);
  9551. return 0;
  9552. case 2:
  9553. id = builder.createBinOp(opCode, typeId, operands[0], operands[1]);
  9554. break;
  9555. default:
  9556. // anything 3 or over doesn't have l-value operands, so all should be consumed
  9557. assert(consumedOperands == operands.size());
  9558. id = builder.createOp(opCode, typeId, operands);
  9559. break;
  9560. }
  9561. }
  9562. // Decode the return types that were structures
  9563. switch (op) {
  9564. case glslang::EOpAddCarry:
  9565. case glslang::EOpSubBorrow:
  9566. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);
  9567. id = builder.createCompositeExtract(id, typeId0, 0);
  9568. break;
  9569. case glslang::EOpUMulExtended:
  9570. case glslang::EOpIMulExtended:
  9571. builder.createStore(builder.createCompositeExtract(id, typeId0, 0), operands[3]);
  9572. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);
  9573. break;
  9574. case glslang::EOpModf:
  9575. {
  9576. assert(operands.size() == 2);
  9577. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[1]);
  9578. id = builder.createCompositeExtract(id, typeId0, 0);
  9579. }
  9580. break;
  9581. case glslang::EOpFrexp:
  9582. {
  9583. assert(operands.size() == 2);
  9584. if (builder.isFloatType(builder.getScalarTypeId(typeId1))) {
  9585. // "exp" is floating-point type (from HLSL intrinsic)
  9586. spv::Id member1 = builder.createCompositeExtract(id, frexpIntType, 1);
  9587. member1 = builder.createUnaryOp(spv::Op::OpConvertSToF, typeId1, member1);
  9588. builder.createStore(member1, operands[1]);
  9589. } else
  9590. // "exp" is integer type (from GLSL built-in function)
  9591. builder.createStore(builder.createCompositeExtract(id, frexpIntType, 1), operands[1]);
  9592. id = builder.createCompositeExtract(id, typeId0, 0);
  9593. }
  9594. break;
  9595. default:
  9596. break;
  9597. }
  9598. return builder.setPrecision(id, precision);
  9599. }
  9600. // Intrinsics with no arguments (or no return value, and no precision).
  9601. spv::Id TGlslangToSpvTraverser::createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId)
  9602. {
  9603. // GLSL memory barriers use queuefamily scope in new model, device scope in old model
  9604. spv::Scope memoryBarrierScope = glslangIntermediate->usingVulkanMemoryModel() ?
  9605. spv::Scope::QueueFamilyKHR : spv::Scope::Device;
  9606. switch (op) {
  9607. case glslang::EOpBarrier:
  9608. if (glslangIntermediate->getStage() == EShLangTessControl) {
  9609. if (glslangIntermediate->usingVulkanMemoryModel()) {
  9610. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
  9611. spv::MemorySemanticsMask::OutputMemoryKHR |
  9612. spv::MemorySemanticsMask::AcquireRelease);
  9613. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  9614. } else {
  9615. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Invocation, spv::MemorySemanticsMask::MaskNone);
  9616. }
  9617. } else {
  9618. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
  9619. spv::MemorySemanticsMask::WorkgroupMemory |
  9620. spv::MemorySemanticsMask::AcquireRelease);
  9621. }
  9622. return 0;
  9623. case glslang::EOpMemoryBarrier:
  9624. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsAllMemory |
  9625. spv::MemorySemanticsMask::AcquireRelease);
  9626. return 0;
  9627. case glslang::EOpMemoryBarrierBuffer:
  9628. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::UniformMemory |
  9629. spv::MemorySemanticsMask::AcquireRelease);
  9630. return 0;
  9631. case glslang::EOpMemoryBarrierShared:
  9632. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::WorkgroupMemory |
  9633. spv::MemorySemanticsMask::AcquireRelease);
  9634. return 0;
  9635. case glslang::EOpGroupMemoryBarrier:
  9636. builder.createMemoryBarrier(spv::Scope::Workgroup, spv::MemorySemanticsAllMemory |
  9637. spv::MemorySemanticsMask::AcquireRelease);
  9638. return 0;
  9639. case glslang::EOpMemoryBarrierAtomicCounter:
  9640. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::AtomicCounterMemory |
  9641. spv::MemorySemanticsMask::AcquireRelease);
  9642. return 0;
  9643. case glslang::EOpMemoryBarrierImage:
  9644. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::ImageMemory |
  9645. spv::MemorySemanticsMask::AcquireRelease);
  9646. return 0;
  9647. case glslang::EOpAllMemoryBarrierWithGroupSync:
  9648. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Device,
  9649. spv::MemorySemanticsAllMemory |
  9650. spv::MemorySemanticsMask::AcquireRelease);
  9651. return 0;
  9652. case glslang::EOpDeviceMemoryBarrier:
  9653. builder.createMemoryBarrier(spv::Scope::Device, spv::MemorySemanticsMask::UniformMemory |
  9654. spv::MemorySemanticsMask::ImageMemory |
  9655. spv::MemorySemanticsMask::AcquireRelease);
  9656. return 0;
  9657. case glslang::EOpDeviceMemoryBarrierWithGroupSync:
  9658. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Device, spv::MemorySemanticsMask::UniformMemory |
  9659. spv::MemorySemanticsMask::ImageMemory |
  9660. spv::MemorySemanticsMask::AcquireRelease);
  9661. return 0;
  9662. case glslang::EOpWorkgroupMemoryBarrier:
  9663. builder.createMemoryBarrier(spv::Scope::Workgroup, spv::MemorySemanticsMask::WorkgroupMemory |
  9664. spv::MemorySemanticsMask::AcquireRelease);
  9665. return 0;
  9666. case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:
  9667. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
  9668. spv::MemorySemanticsMask::WorkgroupMemory |
  9669. spv::MemorySemanticsMask::AcquireRelease);
  9670. return 0;
  9671. case glslang::EOpSubgroupBarrier:
  9672. builder.createControlBarrier(spv::Scope::Subgroup, spv::Scope::Subgroup, spv::MemorySemanticsAllMemory |
  9673. spv::MemorySemanticsMask::AcquireRelease);
  9674. return spv::NoResult;
  9675. case glslang::EOpSubgroupMemoryBarrier:
  9676. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsAllMemory |
  9677. spv::MemorySemanticsMask::AcquireRelease);
  9678. return spv::NoResult;
  9679. case glslang::EOpSubgroupMemoryBarrierBuffer:
  9680. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::UniformMemory |
  9681. spv::MemorySemanticsMask::AcquireRelease);
  9682. return spv::NoResult;
  9683. case glslang::EOpSubgroupMemoryBarrierImage:
  9684. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::ImageMemory |
  9685. spv::MemorySemanticsMask::AcquireRelease);
  9686. return spv::NoResult;
  9687. case glslang::EOpSubgroupMemoryBarrierShared:
  9688. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::WorkgroupMemory |
  9689. spv::MemorySemanticsMask::AcquireRelease);
  9690. return spv::NoResult;
  9691. case glslang::EOpEmitVertex:
  9692. builder.createNoResultOp(spv::Op::OpEmitVertex);
  9693. return 0;
  9694. case glslang::EOpEndPrimitive:
  9695. builder.createNoResultOp(spv::Op::OpEndPrimitive);
  9696. return 0;
  9697. case glslang::EOpSubgroupElect: {
  9698. std::vector<spv::Id> operands;
  9699. return createSubgroupOperation(op, typeId, operands, glslang::EbtVoid);
  9700. }
  9701. case glslang::EOpTime:
  9702. {
  9703. std::vector<spv::Id> args; // Dummy arguments
  9704. spv::Id id = builder.createBuiltinCall(typeId, getExtBuiltins(spv::E_SPV_AMD_gcn_shader), spv::TimeAMD, args);
  9705. return builder.setPrecision(id, precision);
  9706. }
  9707. case glslang::EOpIgnoreIntersectionNV:
  9708. builder.createNoResultOp(spv::Op::OpIgnoreIntersectionNV);
  9709. return 0;
  9710. case glslang::EOpTerminateRayNV:
  9711. builder.createNoResultOp(spv::Op::OpTerminateRayNV);
  9712. return 0;
  9713. case glslang::EOpRayQueryInitialize:
  9714. builder.createNoResultOp(spv::Op::OpRayQueryInitializeKHR);
  9715. return 0;
  9716. case glslang::EOpRayQueryTerminate:
  9717. builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR);
  9718. return 0;
  9719. case glslang::EOpRayQueryGenerateIntersection:
  9720. builder.createNoResultOp(spv::Op::OpRayQueryGenerateIntersectionKHR);
  9721. return 0;
  9722. case glslang::EOpRayQueryConfirmIntersection:
  9723. builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR);
  9724. return 0;
  9725. case glslang::EOpBeginInvocationInterlock:
  9726. builder.createNoResultOp(spv::Op::OpBeginInvocationInterlockEXT);
  9727. return 0;
  9728. case glslang::EOpEndInvocationInterlock:
  9729. builder.createNoResultOp(spv::Op::OpEndInvocationInterlockEXT);
  9730. return 0;
  9731. case glslang::EOpIsHelperInvocation:
  9732. {
  9733. std::vector<spv::Id> args; // Dummy arguments
  9734. builder.addExtension(spv::E_SPV_EXT_demote_to_helper_invocation);
  9735. builder.addCapability(spv::Capability::DemoteToHelperInvocationEXT);
  9736. return builder.createOp(spv::Op::OpIsHelperInvocationEXT, typeId, args);
  9737. }
  9738. case glslang::EOpReadClockSubgroupKHR: {
  9739. std::vector<spv::Id> args;
  9740. args.push_back(builder.makeUintConstant(spv::Scope::Subgroup));
  9741. builder.addExtension(spv::E_SPV_KHR_shader_clock);
  9742. builder.addCapability(spv::Capability::ShaderClockKHR);
  9743. return builder.createOp(spv::Op::OpReadClockKHR, typeId, args);
  9744. }
  9745. case glslang::EOpReadClockDeviceKHR: {
  9746. std::vector<spv::Id> args;
  9747. args.push_back(builder.makeUintConstant(spv::Scope::Device));
  9748. builder.addExtension(spv::E_SPV_KHR_shader_clock);
  9749. builder.addCapability(spv::Capability::ShaderClockKHR);
  9750. return builder.createOp(spv::Op::OpReadClockKHR, typeId, args);
  9751. }
  9752. case glslang::EOpStencilAttachmentReadEXT:
  9753. case glslang::EOpDepthAttachmentReadEXT:
  9754. {
  9755. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  9756. spv::Decoration precision;
  9757. spv::Op spv_op;
  9758. if (op == glslang::EOpStencilAttachmentReadEXT)
  9759. {
  9760. precision = spv::Decoration::RelaxedPrecision;
  9761. spv_op = spv::Op::OpStencilAttachmentReadEXT;
  9762. builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
  9763. }
  9764. else
  9765. {
  9766. precision = spv::NoPrecision;
  9767. spv_op = spv::Op::OpDepthAttachmentReadEXT;
  9768. builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
  9769. }
  9770. std::vector<spv::Id> args; // Dummy args
  9771. spv::Id result = builder.createOp(spv_op, typeId, args);
  9772. return builder.setPrecision(result, precision);
  9773. }
  9774. default:
  9775. break;
  9776. }
  9777. logger->missingFunctionality("unknown operation with no arguments");
  9778. return 0;
  9779. }
  9780. spv::Id TGlslangToSpvTraverser::getSymbolId(const glslang::TIntermSymbol* symbol)
  9781. {
  9782. auto iter = symbolValues.find(symbol->getId());
  9783. spv::Id id;
  9784. if (symbolValues.end() != iter) {
  9785. id = iter->second;
  9786. return id;
  9787. }
  9788. // it was not found, create it
  9789. spv::BuiltIn builtIn = TranslateBuiltInDecoration(symbol->getQualifier().builtIn, false);
  9790. auto forcedType = getForcedType(symbol->getQualifier().builtIn, symbol->getType());
  9791. // There are pairs of symbols that map to the same SPIR-V built-in:
  9792. // gl_ObjectToWorldEXT and gl_ObjectToWorld3x4EXT, and gl_WorldToObjectEXT
  9793. // and gl_WorldToObject3x4EXT. SPIR-V forbids having two OpVariables
  9794. // with the same BuiltIn in the same storage class, so we must re-use one.
  9795. const bool mayNeedToReuseBuiltIn =
  9796. builtIn == spv::BuiltIn::ObjectToWorldKHR ||
  9797. builtIn == spv::BuiltIn::WorldToObjectKHR;
  9798. if (mayNeedToReuseBuiltIn) {
  9799. auto iter = builtInVariableIds.find(uint32_t(builtIn));
  9800. if (builtInVariableIds.end() != iter) {
  9801. id = iter->second;
  9802. symbolValues[symbol->getId()] = id;
  9803. if (forcedType.second != spv::NoType)
  9804. forceType[id] = forcedType.second;
  9805. return id;
  9806. }
  9807. }
  9808. if (symbol->getBasicType() == glslang::EbtFunction) {
  9809. return 0;
  9810. }
  9811. id = createSpvVariable(symbol, forcedType.first);
  9812. if (mayNeedToReuseBuiltIn) {
  9813. builtInVariableIds.insert({uint32_t(builtIn), id});
  9814. }
  9815. symbolValues[symbol->getId()] = id;
  9816. if (forcedType.second != spv::NoType)
  9817. forceType[id] = forcedType.second;
  9818. if (symbol->getBasicType() != glslang::EbtBlock) {
  9819. builder.addDecoration(id, TranslatePrecisionDecoration(symbol->getType()));
  9820. builder.addDecoration(id, TranslateInterpolationDecoration(symbol->getType().getQualifier()));
  9821. builder.addDecoration(id, TranslateAuxiliaryStorageDecoration(symbol->getType().getQualifier()));
  9822. addMeshNVDecoration(id, /*member*/ -1, symbol->getType().getQualifier());
  9823. if (symbol->getQualifier().hasComponent())
  9824. builder.addDecoration(id, spv::Decoration::Component, symbol->getQualifier().layoutComponent);
  9825. if (symbol->getQualifier().hasIndex())
  9826. builder.addDecoration(id, spv::Decoration::Index, symbol->getQualifier().layoutIndex);
  9827. if (symbol->getType().getQualifier().hasSpecConstantId())
  9828. builder.addDecoration(id, spv::Decoration::SpecId, symbol->getType().getQualifier().layoutSpecConstantId);
  9829. // atomic counters use this:
  9830. if (symbol->getQualifier().hasOffset())
  9831. builder.addDecoration(id, spv::Decoration::Offset, symbol->getQualifier().layoutOffset);
  9832. }
  9833. if (symbol->getQualifier().hasLocation()) {
  9834. if (!(glslangIntermediate->isRayTracingStage() &&
  9835. (glslangIntermediate->IsRequestedExtension(glslang::E_GL_EXT_ray_tracing) ||
  9836. glslangIntermediate->IsRequestedExtension(glslang::E_GL_NV_shader_invocation_reorder) ||
  9837. glslangIntermediate->IsRequestedExtension(glslang::E_GL_EXT_shader_invocation_reorder))
  9838. && (builder.getStorageClass(id) == spv::StorageClass::RayPayloadKHR ||
  9839. builder.getStorageClass(id) == spv::StorageClass::IncomingRayPayloadKHR ||
  9840. builder.getStorageClass(id) == spv::StorageClass::CallableDataKHR ||
  9841. builder.getStorageClass(id) == spv::StorageClass::IncomingCallableDataKHR ||
  9842. builder.getStorageClass(id) == spv::StorageClass::HitObjectAttributeEXT ||
  9843. builder.getStorageClass(id) == spv::StorageClass::HitObjectAttributeNV))) {
  9844. // Location values are used to link TraceRayKHR/ExecuteCallableKHR/HitObjectGetAttributesNV
  9845. // to corresponding variables but are not valid in SPIRV since they are supported only
  9846. // for Input/Output Storage classes.
  9847. builder.addDecoration(id, spv::Decoration::Location, symbol->getQualifier().layoutLocation);
  9848. }
  9849. }
  9850. builder.addDecoration(id, TranslateInvariantDecoration(symbol->getType().getQualifier()));
  9851. if (symbol->getQualifier().hasStream() && glslangIntermediate->isMultiStream()) {
  9852. builder.addCapability(spv::Capability::GeometryStreams);
  9853. builder.addDecoration(id, spv::Decoration::Stream, symbol->getQualifier().layoutStream);
  9854. }
  9855. if (symbol->getQualifier().hasSet())
  9856. builder.addDecoration(id, spv::Decoration::DescriptorSet, symbol->getQualifier().layoutSet);
  9857. else if (IsDescriptorResource(symbol->getType())) {
  9858. // default to 0
  9859. builder.addDecoration(id, spv::Decoration::DescriptorSet, 0);
  9860. }
  9861. if (symbol->getQualifier().hasBinding())
  9862. builder.addDecoration(id, spv::Decoration::Binding, symbol->getQualifier().layoutBinding);
  9863. else if (IsDescriptorResource(symbol->getType())) {
  9864. // default to 0
  9865. builder.addDecoration(id, spv::Decoration::Binding, 0);
  9866. }
  9867. if (symbol->getQualifier().hasAttachment())
  9868. builder.addDecoration(id, spv::Decoration::InputAttachmentIndex, symbol->getQualifier().layoutAttachment);
  9869. if (glslangIntermediate->getXfbMode()) {
  9870. builder.addCapability(spv::Capability::TransformFeedback);
  9871. if (symbol->getQualifier().hasXfbBuffer()) {
  9872. builder.addDecoration(id, spv::Decoration::XfbBuffer, symbol->getQualifier().layoutXfbBuffer);
  9873. unsigned stride = glslangIntermediate->getXfbStride(symbol->getQualifier().layoutXfbBuffer);
  9874. if (stride != glslang::TQualifier::layoutXfbStrideEnd)
  9875. builder.addDecoration(id, spv::Decoration::XfbStride, stride);
  9876. }
  9877. if (symbol->getQualifier().hasXfbOffset())
  9878. builder.addDecoration(id, spv::Decoration::Offset, symbol->getQualifier().layoutXfbOffset);
  9879. }
  9880. // add built-in variable decoration
  9881. if (builtIn != spv::BuiltIn::Max) {
  9882. // WorkgroupSize deprecated in spirv1.6
  9883. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_6 ||
  9884. builtIn != spv::BuiltIn::WorkgroupSize)
  9885. builder.addDecoration(id, spv::Decoration::BuiltIn, (int)builtIn);
  9886. }
  9887. // Add volatile decoration to HelperInvocation for spirv1.6 and beyond
  9888. if (builtIn == spv::BuiltIn::HelperInvocation &&
  9889. !glslangIntermediate->usingVulkanMemoryModel() &&
  9890. glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  9891. builder.addDecoration(id, spv::Decoration::Volatile);
  9892. }
  9893. // Subgroup builtins which have input storage class are volatile for ray tracing stages.
  9894. if (symbol->getType().isImage() || symbol->getQualifier().isPipeInput()) {
  9895. std::vector<spv::Decoration> memory;
  9896. TranslateMemoryDecoration(symbol->getType().getQualifier(), memory,
  9897. glslangIntermediate->usingVulkanMemoryModel());
  9898. for (unsigned int i = 0; i < memory.size(); ++i)
  9899. builder.addDecoration(id, memory[i]);
  9900. }
  9901. if (builtIn == spv::BuiltIn::SampleMask) {
  9902. spv::Decoration decoration;
  9903. // GL_NV_sample_mask_override_coverage extension
  9904. if (glslangIntermediate->getLayoutOverrideCoverage())
  9905. decoration = spv::Decoration::OverrideCoverageNV;
  9906. else
  9907. decoration = spv::Decoration::Max;
  9908. builder.addDecoration(id, decoration);
  9909. if (decoration != spv::Decoration::Max) {
  9910. builder.addCapability(spv::Capability::SampleMaskOverrideCoverageNV);
  9911. builder.addExtension(spv::E_SPV_NV_sample_mask_override_coverage);
  9912. }
  9913. }
  9914. else if (builtIn == spv::BuiltIn::Layer) {
  9915. // SPV_NV_viewport_array2 extension
  9916. if (symbol->getQualifier().layoutViewportRelative) {
  9917. builder.addDecoration(id, spv::Decoration::ViewportRelativeNV);
  9918. builder.addCapability(spv::Capability::ShaderViewportMaskNV);
  9919. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  9920. }
  9921. if (symbol->getQualifier().layoutSecondaryViewportRelativeOffset != -2048) {
  9922. builder.addDecoration(id, spv::Decoration::SecondaryViewportRelativeNV,
  9923. symbol->getQualifier().layoutSecondaryViewportRelativeOffset);
  9924. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  9925. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  9926. }
  9927. }
  9928. if (symbol->getQualifier().layoutPassthrough) {
  9929. builder.addDecoration(id, spv::Decoration::PassthroughNV);
  9930. builder.addCapability(spv::Capability::GeometryShaderPassthroughNV);
  9931. builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);
  9932. }
  9933. if (symbol->getQualifier().pervertexNV) {
  9934. builder.addDecoration(id, spv::Decoration::PerVertexNV);
  9935. builder.addCapability(spv::Capability::FragmentBarycentricNV);
  9936. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  9937. }
  9938. if (symbol->getQualifier().pervertexEXT) {
  9939. builder.addDecoration(id, spv::Decoration::PerVertexKHR);
  9940. builder.addCapability(spv::Capability::FragmentBarycentricKHR);
  9941. builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
  9942. }
  9943. if (glslangIntermediate->getHlslFunctionality1() && symbol->getType().getQualifier().semanticName != nullptr) {
  9944. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  9945. builder.addDecoration(id, spv::Decoration::HlslSemanticGOOGLE,
  9946. symbol->getType().getQualifier().semanticName);
  9947. }
  9948. if (symbol->isReference()) {
  9949. builder.addDecoration(id, symbol->getType().getQualifier().restrict ?
  9950. spv::Decoration::RestrictPointerEXT : spv::Decoration::AliasedPointerEXT);
  9951. }
  9952. // Add SPIR-V decorations (GL_EXT_spirv_intrinsics)
  9953. if (symbol->getType().getQualifier().hasSpirvDecorate())
  9954. applySpirvDecorate(symbol->getType(), id, {});
  9955. return id;
  9956. }
  9957. // add per-primitive, per-view. per-task decorations to a struct member (member >= 0) or an object
  9958. void TGlslangToSpvTraverser::addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier& qualifier)
  9959. {
  9960. bool isMeshShaderExt = (glslangIntermediate->getRequestedExtensions().find(glslang::E_GL_EXT_mesh_shader) !=
  9961. glslangIntermediate->getRequestedExtensions().end());
  9962. if (member >= 0) {
  9963. if (qualifier.perPrimitiveNV) {
  9964. // Need to add capability/extension for fragment shader.
  9965. // Mesh shader already adds this by default.
  9966. if (glslangIntermediate->getStage() == EShLangFragment) {
  9967. if(isMeshShaderExt) {
  9968. builder.addCapability(spv::Capability::MeshShadingEXT);
  9969. builder.addExtension(spv::E_SPV_EXT_mesh_shader);
  9970. } else {
  9971. builder.addCapability(spv::Capability::MeshShadingNV);
  9972. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  9973. }
  9974. }
  9975. builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerPrimitiveNV);
  9976. }
  9977. if (qualifier.perViewNV)
  9978. builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerViewNV);
  9979. if (qualifier.perTaskNV)
  9980. builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerTaskNV);
  9981. } else {
  9982. if (qualifier.perPrimitiveNV) {
  9983. // Need to add capability/extension for fragment shader.
  9984. // Mesh shader already adds this by default.
  9985. if (glslangIntermediate->getStage() == EShLangFragment) {
  9986. if(isMeshShaderExt) {
  9987. builder.addCapability(spv::Capability::MeshShadingEXT);
  9988. builder.addExtension(spv::E_SPV_EXT_mesh_shader);
  9989. } else {
  9990. builder.addCapability(spv::Capability::MeshShadingNV);
  9991. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  9992. }
  9993. }
  9994. builder.addDecoration(id, spv::Decoration::PerPrimitiveNV);
  9995. }
  9996. if (qualifier.perViewNV)
  9997. builder.addDecoration(id, spv::Decoration::PerViewNV);
  9998. if (qualifier.perTaskNV)
  9999. builder.addDecoration(id, spv::Decoration::PerTaskNV);
  10000. }
  10001. }
  10002. bool TGlslangToSpvTraverser::hasQCOMImageProceessingDecoration(spv::Id id, spv::Decoration decor)
  10003. {
  10004. std::vector<spv::Decoration> &decoVec = idToQCOMDecorations[id];
  10005. for ( auto d : decoVec ) {
  10006. if ( d == decor )
  10007. return true;
  10008. }
  10009. return false;
  10010. }
  10011. void TGlslangToSpvTraverser::addImageProcessingQCOMDecoration(spv::Id id, spv::Decoration decor)
  10012. {
  10013. spv::Op opc = builder.getOpCode(id);
  10014. if (opc == spv::Op::OpSampledImage) {
  10015. id = builder.getIdOperand(id, 0);
  10016. opc = builder.getOpCode(id);
  10017. }
  10018. if (opc == spv::Op::OpLoad) {
  10019. spv::Id texid = builder.getIdOperand(id, 0);
  10020. if (!hasQCOMImageProceessingDecoration(texid, decor)) {//
  10021. builder.addDecoration(texid, decor);
  10022. idToQCOMDecorations[texid].push_back(decor);
  10023. }
  10024. }
  10025. }
  10026. void TGlslangToSpvTraverser::addImageProcessing2QCOMDecoration(spv::Id id, bool isForGather)
  10027. {
  10028. if (isForGather) {
  10029. return addImageProcessingQCOMDecoration(id, spv::Decoration::BlockMatchTextureQCOM);
  10030. }
  10031. auto addDecor =
  10032. [this](spv::Id id, spv::Decoration decor) {
  10033. spv::Op tsopc = this->builder.getOpCode(id);
  10034. if (tsopc == spv::Op::OpLoad) {
  10035. spv::Id tsid = this->builder.getIdOperand(id, 0);
  10036. if (this->glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  10037. assert(iOSet.count(tsid) > 0);
  10038. }
  10039. if (!hasQCOMImageProceessingDecoration(tsid, decor)) {
  10040. this->builder.addDecoration(tsid, decor);
  10041. idToQCOMDecorations[tsid].push_back(decor);
  10042. }
  10043. }
  10044. };
  10045. spv::Op opc = builder.getOpCode(id);
  10046. bool isInterfaceObject = (opc != spv::Op::OpSampledImage);
  10047. if (!isInterfaceObject) {
  10048. addDecor(builder.getIdOperand(id, 0), spv::Decoration::BlockMatchTextureQCOM);
  10049. addDecor(builder.getIdOperand(id, 1), spv::Decoration::BlockMatchSamplerQCOM);
  10050. } else {
  10051. addDecor(id, spv::Decoration::BlockMatchTextureQCOM);
  10052. addDecor(id, spv::Decoration::BlockMatchSamplerQCOM);
  10053. }
  10054. }
  10055. // Make a full tree of instructions to build a SPIR-V specialization constant,
  10056. // or regular constant if possible.
  10057. //
  10058. // TBD: this is not yet done, nor verified to be the best design, it does do the leaf symbols though
  10059. //
  10060. // Recursively walk the nodes. The nodes form a tree whose leaves are
  10061. // regular constants, which themselves are trees that createSpvConstant()
  10062. // recursively walks. So, this function walks the "top" of the tree:
  10063. // - emit specialization constant-building instructions for specConstant
  10064. // - when running into a non-spec-constant, switch to createSpvConstant()
  10065. spv::Id TGlslangToSpvTraverser::createSpvConstant(const glslang::TIntermTyped& node)
  10066. {
  10067. assert(node.getQualifier().isConstant());
  10068. // Handle front-end constants first (non-specialization constants).
  10069. if (! node.getQualifier().specConstant) {
  10070. // hand off to the non-spec-constant path
  10071. assert(node.getAsConstantUnion() != nullptr || node.getAsSymbolNode() != nullptr);
  10072. int nextConst = 0;
  10073. return createSpvConstantFromConstUnionArray(node.getType(), node.getAsConstantUnion() ?
  10074. node.getAsConstantUnion()->getConstArray() : node.getAsSymbolNode()->getConstArray(),
  10075. nextConst, false);
  10076. }
  10077. // We now know we have a specialization constant to build
  10078. // Extra capabilities may be needed.
  10079. if (node.getType().contains8BitInt())
  10080. builder.addCapability(spv::Capability::Int8);
  10081. if (node.getType().contains16BitFloat())
  10082. builder.addCapability(spv::Capability::Float16);
  10083. if (node.getType().contains16BitInt())
  10084. builder.addCapability(spv::Capability::Int16);
  10085. if (node.getType().contains64BitInt())
  10086. builder.addCapability(spv::Capability::Int64);
  10087. if (node.getType().containsDouble())
  10088. builder.addCapability(spv::Capability::Float64);
  10089. // gl_WorkGroupSize is a special case until the front-end handles hierarchical specialization constants,
  10090. // even then, it's specialization ids are handled by special case syntax in GLSL: layout(local_size_x = ...
  10091. if (node.getType().getQualifier().builtIn == glslang::EbvWorkGroupSize) {
  10092. std::vector<spv::Id> dimConstId;
  10093. for (int dim = 0; dim < 3; ++dim) {
  10094. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  10095. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  10096. if (specConst) {
  10097. builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
  10098. glslangIntermediate->getLocalSizeSpecId(dim));
  10099. }
  10100. }
  10101. return builder.makeCompositeConstant(builder.makeVectorType(builder.makeUintType(32), 3), dimConstId, true);
  10102. }
  10103. // An AST node labelled as specialization constant should be a symbol node.
  10104. // Its initializer should either be a sub tree with constant nodes, or a constant union array.
  10105. if (auto* sn = node.getAsSymbolNode()) {
  10106. spv::Id result;
  10107. if (auto* sub_tree = sn->getConstSubtree()) {
  10108. // Traverse the constant constructor sub tree like generating normal run-time instructions.
  10109. // During the AST traversal, if the node is marked as 'specConstant', SpecConstantOpModeGuard
  10110. // will set the builder into spec constant op instruction generating mode.
  10111. sub_tree->traverse(this);
  10112. result = accessChainLoad(sub_tree->getType());
  10113. } else if (auto* const_union_array = &sn->getConstArray()) {
  10114. int nextConst = 0;
  10115. result = createSpvConstantFromConstUnionArray(sn->getType(), *const_union_array, nextConst, true);
  10116. } else {
  10117. logger->missingFunctionality("Invalid initializer for spec constant.");
  10118. return spv::NoResult;
  10119. }
  10120. builder.addName(result, sn->getName().c_str());
  10121. return result;
  10122. }
  10123. // Neither a front-end constant node, nor a specialization constant node with constant union array or
  10124. // constant sub tree as initializer.
  10125. logger->missingFunctionality("Neither a front-end constant nor a spec constant.");
  10126. return spv::NoResult;
  10127. }
  10128. // Use 'consts' as the flattened glslang source of scalar constants to recursively
  10129. // build the aggregate SPIR-V constant.
  10130. //
  10131. // If there are not enough elements present in 'consts', 0 will be substituted;
  10132. // an empty 'consts' can be used to create a fully zeroed SPIR-V constant.
  10133. //
  10134. spv::Id TGlslangToSpvTraverser::createSpvConstantFromConstUnionArray(const glslang::TType& glslangType,
  10135. const glslang::TConstUnionArray& consts, int& nextConst, bool specConstant)
  10136. {
  10137. // vector of constants for SPIR-V
  10138. std::vector<spv::Id> spvConsts;
  10139. // Type is used for struct and array constants
  10140. spv::Id typeId = convertGlslangToSpvType(glslangType);
  10141. if (glslangType.isArray()) {
  10142. glslang::TType elementType(glslangType, 0);
  10143. for (int i = 0; i < glslangType.getOuterArraySize(); ++i)
  10144. spvConsts.push_back(createSpvConstantFromConstUnionArray(elementType, consts, nextConst, false));
  10145. } else if (glslangType.isMatrix()) {
  10146. glslang::TType vectorType(glslangType, 0);
  10147. for (int col = 0; col < glslangType.getMatrixCols(); ++col)
  10148. spvConsts.push_back(createSpvConstantFromConstUnionArray(vectorType, consts, nextConst, false));
  10149. } else if (glslangType.isCoopMat()) {
  10150. glslang::TType componentType(glslangType.getBasicType());
  10151. spvConsts.push_back(createSpvConstantFromConstUnionArray(componentType, consts, nextConst, false));
  10152. } else if (glslangType.isStruct()) {
  10153. glslang::TVector<glslang::TTypeLoc>::const_iterator iter;
  10154. for (iter = glslangType.getStruct()->begin(); iter != glslangType.getStruct()->end(); ++iter)
  10155. spvConsts.push_back(createSpvConstantFromConstUnionArray(*iter->type, consts, nextConst, false));
  10156. } else if (glslangType.getVectorSize() > 1 || glslangType.isCoopVecNV()) {
  10157. unsigned int numComponents = glslangType.isCoopVecNV() ? glslangType.getTypeParameters()->arraySizes->getDimSize(0) : glslangType.getVectorSize();
  10158. for (unsigned int i = 0; i < numComponents; ++i) {
  10159. bool zero = nextConst >= consts.size();
  10160. switch (glslangType.getBasicType()) {
  10161. case glslang::EbtInt:
  10162. spvConsts.push_back(builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst()));
  10163. break;
  10164. case glslang::EbtUint:
  10165. spvConsts.push_back(builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst()));
  10166. break;
  10167. case glslang::EbtFloat:
  10168. spvConsts.push_back(builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  10169. break;
  10170. case glslang::EbtBool:
  10171. spvConsts.push_back(builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst()));
  10172. break;
  10173. case glslang::EbtInt8:
  10174. builder.addCapability(spv::Capability::Int8);
  10175. spvConsts.push_back(builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const()));
  10176. break;
  10177. case glslang::EbtUint8:
  10178. builder.addCapability(spv::Capability::Int8);
  10179. spvConsts.push_back(builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const()));
  10180. break;
  10181. case glslang::EbtInt16:
  10182. builder.addCapability(spv::Capability::Int16);
  10183. spvConsts.push_back(builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const()));
  10184. break;
  10185. case glslang::EbtUint16:
  10186. builder.addCapability(spv::Capability::Int16);
  10187. spvConsts.push_back(builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const()));
  10188. break;
  10189. case glslang::EbtInt64:
  10190. spvConsts.push_back(builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const()));
  10191. break;
  10192. case glslang::EbtUint64:
  10193. spvConsts.push_back(builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const()));
  10194. break;
  10195. case glslang::EbtDouble:
  10196. spvConsts.push_back(builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst()));
  10197. break;
  10198. case glslang::EbtFloat16:
  10199. builder.addCapability(spv::Capability::Float16);
  10200. spvConsts.push_back(builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  10201. break;
  10202. case glslang::EbtBFloat16:
  10203. spvConsts.push_back(builder.makeBFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  10204. break;
  10205. case glslang::EbtFloatE5M2:
  10206. spvConsts.push_back(builder.makeFloatE5M2Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  10207. break;
  10208. case glslang::EbtFloatE4M3:
  10209. spvConsts.push_back(builder.makeFloatE4M3Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  10210. break;
  10211. default:
  10212. assert(0);
  10213. break;
  10214. }
  10215. ++nextConst;
  10216. }
  10217. } else {
  10218. // we have a non-aggregate (scalar) constant
  10219. bool zero = nextConst >= consts.size();
  10220. spv::Id scalar = 0;
  10221. switch (glslangType.getBasicType()) {
  10222. case glslang::EbtInt:
  10223. scalar = builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst(), specConstant);
  10224. break;
  10225. case glslang::EbtUint:
  10226. scalar = builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst(), specConstant);
  10227. break;
  10228. case glslang::EbtFloat:
  10229. scalar = builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  10230. break;
  10231. case glslang::EbtBool:
  10232. scalar = builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst(), specConstant);
  10233. break;
  10234. case glslang::EbtInt8:
  10235. builder.addCapability(spv::Capability::Int8);
  10236. scalar = builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const(), specConstant);
  10237. break;
  10238. case glslang::EbtUint8:
  10239. builder.addCapability(spv::Capability::Int8);
  10240. scalar = builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const(), specConstant);
  10241. break;
  10242. case glslang::EbtInt16:
  10243. builder.addCapability(spv::Capability::Int16);
  10244. scalar = builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const(), specConstant);
  10245. break;
  10246. case glslang::EbtUint16:
  10247. builder.addCapability(spv::Capability::Int16);
  10248. scalar = builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const(), specConstant);
  10249. break;
  10250. case glslang::EbtInt64:
  10251. scalar = builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const(), specConstant);
  10252. break;
  10253. case glslang::EbtUint64:
  10254. scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);
  10255. break;
  10256. case glslang::EbtDouble:
  10257. scalar = builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst(), specConstant);
  10258. break;
  10259. case glslang::EbtFloat16:
  10260. builder.addCapability(spv::Capability::Float16);
  10261. scalar = builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  10262. break;
  10263. case glslang::EbtBFloat16:
  10264. scalar = builder.makeBFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  10265. break;
  10266. case glslang::EbtFloatE5M2:
  10267. scalar = builder.makeFloatE5M2Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  10268. break;
  10269. case glslang::EbtFloatE4M3:
  10270. scalar = builder.makeFloatE4M3Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  10271. break;
  10272. case glslang::EbtReference:
  10273. scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);
  10274. scalar = builder.createUnaryOp(spv::Op::OpBitcast, typeId, scalar);
  10275. break;
  10276. case glslang::EbtString:
  10277. scalar = builder.getStringId(consts[nextConst].getSConst()->c_str());
  10278. break;
  10279. default:
  10280. assert(0);
  10281. break;
  10282. }
  10283. ++nextConst;
  10284. return scalar;
  10285. }
  10286. return builder.makeCompositeConstant(typeId, spvConsts);
  10287. }
  10288. // Return true if the node is a constant or symbol whose reading has no
  10289. // non-trivial observable cost or effect.
  10290. bool TGlslangToSpvTraverser::isTrivialLeaf(const glslang::TIntermTyped* node)
  10291. {
  10292. // don't know what this is
  10293. if (node == nullptr)
  10294. return false;
  10295. // a constant is safe
  10296. if (node->getAsConstantUnion() != nullptr)
  10297. return true;
  10298. // not a symbol means non-trivial
  10299. if (node->getAsSymbolNode() == nullptr)
  10300. return false;
  10301. // a symbol, depends on what's being read
  10302. switch (node->getType().getQualifier().storage) {
  10303. case glslang::EvqTemporary:
  10304. case glslang::EvqGlobal:
  10305. case glslang::EvqIn:
  10306. case glslang::EvqInOut:
  10307. case glslang::EvqConst:
  10308. case glslang::EvqConstReadOnly:
  10309. case glslang::EvqUniform:
  10310. return true;
  10311. default:
  10312. return false;
  10313. }
  10314. }
  10315. // A node is trivial if it is a single operation with no side effects.
  10316. // HLSL (and/or vectors) are always trivial, as it does not short circuit.
  10317. // Otherwise, error on the side of saying non-trivial.
  10318. // Return true if trivial.
  10319. bool TGlslangToSpvTraverser::isTrivial(const glslang::TIntermTyped* node)
  10320. {
  10321. if (node == nullptr)
  10322. return false;
  10323. // count non scalars as trivial, as well as anything coming from HLSL
  10324. if (! node->getType().isScalarOrVec1() || glslangIntermediate->getSource() == glslang::EShSourceHlsl)
  10325. return true;
  10326. // symbols and constants are trivial
  10327. if (isTrivialLeaf(node))
  10328. return true;
  10329. // otherwise, it needs to be a simple operation or one or two leaf nodes
  10330. // not a simple operation
  10331. const glslang::TIntermBinary* binaryNode = node->getAsBinaryNode();
  10332. const glslang::TIntermUnary* unaryNode = node->getAsUnaryNode();
  10333. if (binaryNode == nullptr && unaryNode == nullptr)
  10334. return false;
  10335. // not on leaf nodes
  10336. if (binaryNode && (! isTrivialLeaf(binaryNode->getLeft()) || ! isTrivialLeaf(binaryNode->getRight())))
  10337. return false;
  10338. if (unaryNode && ! isTrivialLeaf(unaryNode->getOperand())) {
  10339. return false;
  10340. }
  10341. if (IsOpNumericConv(node->getAsOperator()->getOp()) &&
  10342. node->getType().getBasicType() == glslang::EbtBool) {
  10343. return true;
  10344. }
  10345. switch (node->getAsOperator()->getOp()) {
  10346. case glslang::EOpLogicalNot:
  10347. case glslang::EOpEqual:
  10348. case glslang::EOpNotEqual:
  10349. case glslang::EOpLessThan:
  10350. case glslang::EOpGreaterThan:
  10351. case glslang::EOpLessThanEqual:
  10352. case glslang::EOpGreaterThanEqual:
  10353. case glslang::EOpIndexDirect:
  10354. case glslang::EOpIndexDirectStruct:
  10355. case glslang::EOpLogicalXor:
  10356. case glslang::EOpAny:
  10357. case glslang::EOpAll:
  10358. return true;
  10359. default:
  10360. return false;
  10361. }
  10362. }
  10363. // Emit short-circuiting code, where 'right' is never evaluated unless
  10364. // the left side is true (for &&) or false (for ||).
  10365. spv::Id TGlslangToSpvTraverser::createShortCircuit(glslang::TOperator op, glslang::TIntermTyped& left,
  10366. glslang::TIntermTyped& right)
  10367. {
  10368. spv::Id boolTypeId = builder.makeBoolType();
  10369. // emit left operand
  10370. builder.clearAccessChain();
  10371. left.traverse(this);
  10372. spv::Id leftId = accessChainLoad(left.getType());
  10373. // Operands to accumulate OpPhi operands
  10374. std::vector<spv::Id> phiOperands;
  10375. phiOperands.reserve(4);
  10376. // accumulate left operand's phi information
  10377. phiOperands.push_back(leftId);
  10378. phiOperands.push_back(builder.getBuildPoint()->getId());
  10379. // Make the two kinds of operation symmetric with a "!"
  10380. // || => emit "if (! left) result = right"
  10381. // && => emit "if ( left) result = right"
  10382. //
  10383. // TODO: this runtime "not" for || could be avoided by adding functionality
  10384. // to 'builder' to have an "else" without an "then"
  10385. if (op == glslang::EOpLogicalOr)
  10386. leftId = builder.createUnaryOp(spv::Op::OpLogicalNot, boolTypeId, leftId);
  10387. // make an "if" based on the left value
  10388. spv::Builder::If ifBuilder(leftId, spv::SelectionControlMask::MaskNone, builder);
  10389. // emit right operand as the "then" part of the "if"
  10390. builder.clearAccessChain();
  10391. right.traverse(this);
  10392. spv::Id rightId = accessChainLoad(right.getType());
  10393. // accumulate left operand's phi information
  10394. phiOperands.push_back(rightId);
  10395. phiOperands.push_back(builder.getBuildPoint()->getId());
  10396. // finish the "if"
  10397. ifBuilder.makeEndIf();
  10398. // phi together the two results
  10399. return builder.createOp(spv::Op::OpPhi, boolTypeId, phiOperands);
  10400. }
  10401. // Return type Id of the imported set of extended instructions corresponds to the name.
  10402. // Import this set if it has not been imported yet.
  10403. spv::Id TGlslangToSpvTraverser::getExtBuiltins(const char* name)
  10404. {
  10405. if (extBuiltinMap.find(name) != extBuiltinMap.end())
  10406. return extBuiltinMap[name];
  10407. else {
  10408. spv::Id extBuiltins = builder.import(name);
  10409. extBuiltinMap[name] = extBuiltins;
  10410. return extBuiltins;
  10411. }
  10412. }
  10413. } // end anonymous namespace
  10414. namespace glslang {
  10415. void GetSpirvVersion(std::string& version)
  10416. {
  10417. const int bufSize = 100;
  10418. char buf[bufSize];
  10419. snprintf(buf, bufSize, "0x%08x, Revision %d", spv::Version, spv::Revision);
  10420. version = buf;
  10421. }
  10422. // For low-order part of the generator's magic number. Bump up
  10423. // when there is a change in the style (e.g., if SSA form changes,
  10424. // or a different instruction sequence to do something gets used).
  10425. int GetSpirvGeneratorVersion()
  10426. {
  10427. // return 1; // start
  10428. // return 2; // EOpAtomicCounterDecrement gets a post decrement, to map between GLSL -> SPIR-V
  10429. // return 3; // change/correct barrier-instruction operands, to match memory model group decisions
  10430. // return 4; // some deeper access chains: for dynamic vector component, and local Boolean component
  10431. // return 5; // make OpArrayLength result type be an int with signedness of 0
  10432. // return 6; // revert version 5 change, which makes a different (new) kind of incorrect code,
  10433. // versions 4 and 6 each generate OpArrayLength as it has long been done
  10434. // return 7; // GLSL volatile keyword maps to both SPIR-V decorations Volatile and Coherent
  10435. // return 8; // switch to new dead block eliminator; use OpUnreachable
  10436. // return 9; // don't include opaque function parameters in OpEntryPoint global's operand list
  10437. // return 10; // Generate OpFUnordNotEqual for != comparisons
  10438. return 11; // Make OpEmitMeshTasksEXT a terminal instruction
  10439. }
  10440. // Write SPIR-V out to a binary file
  10441. bool OutputSpvBin(const std::vector<unsigned int>& spirv, const char* baseName)
  10442. {
  10443. std::ofstream out;
  10444. out.open(baseName, std::ios::binary | std::ios::out);
  10445. if (out.fail()) {
  10446. printf("ERROR: Failed to open file: %s\n", baseName);
  10447. return false;
  10448. }
  10449. for (int i = 0; i < (int)spirv.size(); ++i) {
  10450. unsigned int word = spirv[i];
  10451. out.write((const char*)&word, 4);
  10452. }
  10453. out.close();
  10454. return true;
  10455. }
  10456. // Write SPIR-V out to a text file with 32-bit hexadecimal words
  10457. bool OutputSpvHex(const std::vector<unsigned int>& spirv, const char* baseName, const char* varName)
  10458. {
  10459. std::ofstream out;
  10460. out.open(baseName, std::ios::binary | std::ios::out);
  10461. if (out.fail()) {
  10462. printf("ERROR: Failed to open file: %s\n", baseName);
  10463. return false;
  10464. }
  10465. out << "\t// " <<
  10466. GetSpirvGeneratorVersion() <<
  10467. GLSLANG_VERSION_MAJOR << "." << GLSLANG_VERSION_MINOR << "." << GLSLANG_VERSION_PATCH <<
  10468. GLSLANG_VERSION_FLAVOR << std::endl;
  10469. if (varName != nullptr) {
  10470. out << "\t #pragma once" << std::endl;
  10471. out << "const uint32_t " << varName << "[] = {" << std::endl;
  10472. }
  10473. const int WORDS_PER_LINE = 8;
  10474. for (int i = 0; i < (int)spirv.size(); i += WORDS_PER_LINE) {
  10475. out << "\t";
  10476. for (int j = 0; j < WORDS_PER_LINE && i + j < (int)spirv.size(); ++j) {
  10477. const unsigned int word = spirv[i + j];
  10478. out << "0x" << std::hex << std::setw(8) << std::setfill('0') << word;
  10479. if (i + j + 1 < (int)spirv.size()) {
  10480. out << ",";
  10481. }
  10482. }
  10483. out << std::endl;
  10484. }
  10485. if (varName != nullptr) {
  10486. out << "};";
  10487. out << std::endl;
  10488. }
  10489. out.close();
  10490. return true;
  10491. }
  10492. //
  10493. // Set up the glslang traversal
  10494. //
  10495. void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv, SpvOptions* options)
  10496. {
  10497. spv::SpvBuildLogger logger;
  10498. GlslangToSpv(intermediate, spirv, &logger, options);
  10499. }
  10500. void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv,
  10501. spv::SpvBuildLogger* logger, SpvOptions* options)
  10502. {
  10503. TIntermNode* root = intermediate.getTreeRoot();
  10504. if (root == nullptr)
  10505. return;
  10506. SpvOptions defaultOptions;
  10507. if (options == nullptr)
  10508. options = &defaultOptions;
  10509. GetThreadPoolAllocator().push();
  10510. TGlslangToSpvTraverser it(intermediate.getSpv().spv, &intermediate, logger, *options);
  10511. root->traverse(&it);
  10512. it.finishSpv(options->compileOnly);
  10513. it.dumpSpv(spirv);
  10514. #if ENABLE_OPT
  10515. // If from HLSL, run spirv-opt to "legalize" the SPIR-V for Vulkan
  10516. // eg. forward and remove memory writes of opaque types.
  10517. bool prelegalization = intermediate.getSource() == EShSourceHlsl;
  10518. if ((prelegalization || options->optimizeSize) && !options->disableOptimizer) {
  10519. SpirvToolsTransform(intermediate, spirv, logger, options);
  10520. prelegalization = false;
  10521. }
  10522. else if (options->stripDebugInfo) {
  10523. // Strip debug info even if optimization is disabled.
  10524. SpirvToolsStripDebugInfo(intermediate, spirv, logger);
  10525. }
  10526. if (options->validate)
  10527. SpirvToolsValidate(intermediate, spirv, logger, prelegalization);
  10528. if (options->disassemble)
  10529. SpirvToolsDisassemble(std::cout, spirv);
  10530. #endif
  10531. GetThreadPoolAllocator().pop();
  10532. }
  10533. } // end namespace glslang