GlslangToSpv.cpp 492 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477
74778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527
75278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314531553165317531853195320532153225323532453255326532753285329533053315332533353345335533653375338533953405341534253435344534553465347534853495350535153525353535453555356535753585359536053615362536353645365536653675368536953705371537253735374537553765377537853795380538153825383538453855386538753885389539053915392539353945395539653975398539954005401540254035404540554065407540854095410541154125413541454155416541754185419542054215422542354245425542654275428542954305431543254335434543554365437543854395440544154425443544454455446544754485449545054515452545354545455545654575458545954605461546254635464546554665467546854695470547154725473547454755476547754785479548054815482548354845485548654875488548954905491549254935494549554965497549854995500550155025503550455055506550755085509551055115512551355145515551655175518551955205521552255235524552555265527552855295530553155325533553455355536553755385539554055415542554355445545554655475548554955505551555255535554555555565557555855595560556155625563556455655566556755685569557055715572557355745575557655775578557955805581558255835584558555865587558855895590559155925593559455955596559755985599560056015602560356045605560656075608560956105611561256135614561556165617561856195620562156225623562456255626562756285629563056315632563356345635563656375638563956405641564256435644564556465647564856495650565156525653565456555656565756585659566056615662566356645665566656675668566956705671567256735674567556765677567856795680568156825683568456855686568756885689569056915692569356945695569656975698569957005701570257035704570557065707570857095710571157125713571457155716571757185719572057215722572357245725572657275728572957305731573257335734573557365737573857395740574157425743574457455746574757485749575057515752575357545755575657575758575957605761576257635764576557665767576857695770577157725773577457755776577
75778577957805781578257835784578557865787578857895790579157925793579457955796579757985799580058015802580358045805580658075808580958105811581258135814581558165817581858195820582158225823582458255826582758285829583058315832583358345835583658375838583958405841584258435844584558465847584858495850585158525853585458555856585758585859586058615862586358645865586658675868586958705871587258735874587558765877587858795880588158825883588458855886588758885889589058915892589358945895589658975898589959005901590259035904590559065907590859095910591159125913591459155916591759185919592059215922592359245925592659275928592959305931593259335934593559365937593859395940594159425943594459455946594759485949595059515952595359545955595659575958595959605961596259635964596559665967596859695970597159725973597459755976597759785979598059815982598359845985598659875988598959905991599259935994599559965997599859996000600160026003600460056006600760086009601060116012601360146015601660176018601960206021602260236024602560266027602860296030603160326033603460356036603760386039604060416042604360446045604660476048604960506051605260536054605560566057605860596060606160626063606460656066606760686069607060716072607360746075607660776078607960806081608260836084608560866087608860896090609160926093609460956096609760986099610061016102610361046105610661076108610961106111611261136114611561166117611861196120612161226123612461256126612761286129613061316132613361346135613661376138613961406141614261436144614561466147614861496150615161526153615461556156615761586159616061616162616361646165616661676168616961706171617261736174617561766177617861796180618161826183618461856186618761886189619061916192619361946195619661976198619962006201620262036204620562066207620862096210621162126213621462156216621762186219622062216222622362246225622662276228622962306231623262336234623562366237623862396240624162426243624462456246624762486249625062516252625362546255625662576258625962606261626262636264626562666267626862696270627162726273627462756276627
76278627962806281628262836284628562866287628862896290629162926293629462956296629762986299630063016302630363046305630663076308630963106311631263136314631563166317631863196320632163226323632463256326632763286329633063316332633363346335633663376338633963406341634263436344634563466347634863496350635163526353635463556356635763586359636063616362636363646365636663676368636963706371637263736374637563766377637863796380638163826383638463856386638763886389639063916392639363946395639663976398639964006401640264036404640564066407640864096410641164126413641464156416641764186419642064216422642364246425642664276428642964306431643264336434643564366437643864396440644164426443644464456446644764486449645064516452645364546455645664576458645964606461646264636464646564666467646864696470647164726473647464756476647764786479648064816482648364846485648664876488648964906491649264936494649564966497649864996500650165026503650465056506650765086509651065116512651365146515651665176518651965206521652265236524652565266527652865296530653165326533653465356536653765386539654065416542654365446545654665476548654965506551655265536554655565566557655865596560656165626563656465656566656765686569657065716572657365746575657665776578657965806581658265836584658565866587658865896590659165926593659465956596659765986599660066016602660366046605660666076608660966106611661266136614661566166617661866196620662166226623662466256626662766286629663066316632663366346635663666376638663966406641664266436644664566466647664866496650665166526653665466556656665766586659666066616662666366646665666666676668666966706671667266736674667566766677667866796680668166826683668466856686668766886689669066916692669366946695669666976698669967006701670267036704670567066707670867096710671167126713671467156716671767186719672067216722672367246725672667276728672967306731673267336734673567366737673867396740674167426743674467456746674767486749675067516752675367546755675667576758675967606761676267636764676567666767676867696770677167726773677467756776677
76778677967806781678267836784678567866787678867896790679167926793679467956796679767986799680068016802680368046805680668076808680968106811681268136814681568166817681868196820682168226823682468256826682768286829683068316832683368346835683668376838683968406841684268436844684568466847684868496850685168526853685468556856685768586859686068616862686368646865686668676868686968706871687268736874687568766877687868796880688168826883688468856886688768886889689068916892689368946895689668976898689969006901690269036904690569066907690869096910691169126913691469156916691769186919692069216922692369246925692669276928692969306931693269336934693569366937693869396940694169426943694469456946694769486949695069516952695369546955695669576958695969606961696269636964696569666967696869696970697169726973697469756976697769786979698069816982698369846985698669876988698969906991699269936994699569966997699869997000700170027003700470057006700770087009701070117012701370147015701670177018701970207021702270237024702570267027702870297030703170327033703470357036703770387039704070417042704370447045704670477048704970507051705270537054705570567057705870597060706170627063706470657066706770687069707070717072707370747075707670777078707970807081708270837084708570867087708870897090709170927093709470957096709770987099710071017102710371047105710671077108710971107111711271137114711571167117711871197120712171227123712471257126712771287129713071317132713371347135713671377138713971407141714271437144714571467147714871497150715171527153715471557156715771587159716071617162716371647165716671677168716971707171717271737174717571767177717871797180718171827183718471857186718771887189719071917192719371947195719671977198719972007201720272037204720572067207720872097210721172127213721472157216721772187219722072217222722372247225722672277228722972307231723272337234723572367237723872397240724172427243724472457246724772487249725072517252725372547255725672577258725972607261726272637264726572667267726872697270727172727273727472757276727
77278727972807281728272837284728572867287728872897290729172927293729472957296729772987299730073017302730373047305730673077308730973107311731273137314731573167317731873197320732173227323732473257326732773287329733073317332733373347335733673377338733973407341734273437344734573467347734873497350735173527353735473557356735773587359736073617362736373647365736673677368736973707371737273737374737573767377737873797380738173827383738473857386738773887389739073917392739373947395739673977398739974007401740274037404740574067407740874097410741174127413741474157416741774187419742074217422742374247425742674277428742974307431743274337434743574367437743874397440744174427443744474457446744774487449745074517452745374547455745674577458745974607461746274637464746574667467746874697470747174727473747474757476747774787479748074817482748374847485748674877488748974907491749274937494749574967497749874997500750175027503750475057506750775087509751075117512751375147515751675177518751975207521752275237524752575267527752875297530753175327533753475357536753775387539754075417542754375447545754675477548754975507551755275537554755575567557755875597560756175627563756475657566756775687569757075717572757375747575757675777578757975807581758275837584758575867587758875897590759175927593759475957596759775987599760076017602760376047605760676077608760976107611761276137614761576167617761876197620762176227623762476257626762776287629763076317632763376347635763676377638763976407641764276437644764576467647764876497650765176527653765476557656765776587659766076617662766376647665766676677668766976707671767276737674767576767677767876797680768176827683768476857686768776887689769076917692769376947695769676977698769977007701770277037704770577067707770877097710771177127713771477157716771777187719772077217722772377247725772677277728772977307731773277337734773577367737773877397740774177427743774477457746774777487749775077517752775377547755775677577758775977607761776277637764776577667767776877697770777177727773777477757776777
77778777977807781778277837784778577867787778877897790779177927793779477957796779777987799780078017802780378047805780678077808780978107811781278137814781578167817781878197820782178227823782478257826782778287829783078317832783378347835783678377838783978407841784278437844784578467847784878497850785178527853785478557856785778587859786078617862786378647865786678677868786978707871787278737874787578767877787878797880788178827883788478857886788778887889789078917892789378947895789678977898789979007901790279037904790579067907790879097910791179127913791479157916791779187919792079217922792379247925792679277928792979307931793279337934793579367937793879397940794179427943794479457946794779487949795079517952795379547955795679577958795979607961796279637964796579667967796879697970797179727973797479757976797779787979798079817982798379847985798679877988798979907991799279937994799579967997799879998000800180028003800480058006800780088009801080118012801380148015801680178018801980208021802280238024802580268027802880298030803180328033803480358036803780388039804080418042804380448045804680478048804980508051805280538054805580568057805880598060806180628063806480658066806780688069807080718072807380748075807680778078807980808081808280838084808580868087808880898090809180928093809480958096809780988099810081018102810381048105810681078108810981108111811281138114811581168117811881198120812181228123812481258126812781288129813081318132813381348135813681378138813981408141814281438144814581468147814881498150815181528153815481558156815781588159816081618162816381648165816681678168816981708171817281738174817581768177817881798180818181828183818481858186818781888189819081918192819381948195819681978198819982008201820282038204820582068207820882098210821182128213821482158216821782188219822082218222822382248225822682278228822982308231823282338234823582368237823882398240824182428243824482458246824782488249825082518252825382548255825682578258825982608261826282638264826582668267826882698270827182728273827482758276827
78278827982808281828282838284828582868287828882898290829182928293829482958296829782988299830083018302830383048305830683078308830983108311831283138314831583168317831883198320832183228323832483258326832783288329833083318332833383348335833683378338833983408341834283438344834583468347834883498350835183528353835483558356835783588359836083618362836383648365836683678368836983708371837283738374837583768377837883798380838183828383838483858386838783888389839083918392839383948395839683978398839984008401840284038404840584068407840884098410841184128413841484158416841784188419842084218422842384248425842684278428842984308431843284338434843584368437843884398440844184428443844484458446844784488449845084518452845384548455845684578458845984608461846284638464846584668467846884698470847184728473847484758476847784788479848084818482848384848485848684878488848984908491849284938494849584968497849884998500850185028503850485058506850785088509851085118512851385148515851685178518851985208521852285238524852585268527852885298530853185328533853485358536853785388539854085418542854385448545854685478548854985508551855285538554855585568557855885598560856185628563856485658566856785688569857085718572857385748575857685778578857985808581858285838584858585868587858885898590859185928593859485958596859785988599860086018602860386048605860686078608860986108611861286138614861586168617861886198620862186228623862486258626862786288629863086318632863386348635863686378638863986408641864286438644864586468647864886498650865186528653865486558656865786588659866086618662866386648665866686678668866986708671867286738674867586768677867886798680868186828683868486858686868786888689869086918692869386948695869686978698869987008701870287038704870587068707870887098710871187128713871487158716871787188719872087218722872387248725872687278728872987308731873287338734873587368737873887398740874187428743874487458746874787488749875087518752875387548755875687578758875987608761876287638764876587668767876887698770877187728773877487758776877
78778877987808781878287838784878587868787878887898790879187928793879487958796879787988799880088018802880388048805880688078808880988108811881288138814881588168817881888198820882188228823882488258826882788288829883088318832883388348835883688378838883988408841884288438844884588468847884888498850885188528853885488558856885788588859886088618862886388648865886688678868886988708871887288738874887588768877887888798880888188828883888488858886888788888889889088918892889388948895889688978898889989008901890289038904890589068907890889098910891189128913891489158916891789188919892089218922892389248925892689278928892989308931893289338934893589368937893889398940894189428943894489458946894789488949895089518952895389548955895689578958895989608961896289638964896589668967896889698970897189728973897489758976897789788979898089818982898389848985898689878988898989908991899289938994899589968997899889999000900190029003900490059006900790089009901090119012901390149015901690179018901990209021902290239024902590269027902890299030903190329033903490359036903790389039904090419042904390449045904690479048904990509051905290539054905590569057905890599060906190629063906490659066906790689069907090719072907390749075907690779078907990809081908290839084908590869087908890899090909190929093909490959096909790989099910091019102910391049105910691079108910991109111911291139114911591169117911891199120912191229123912491259126912791289129913091319132913391349135913691379138913991409141914291439144914591469147914891499150915191529153915491559156915791589159916091619162916391649165916691679168916991709171917291739174917591769177917891799180918191829183918491859186918791889189919091919192919391949195919691979198919992009201920292039204920592069207920892099210921192129213921492159216921792189219922092219222922392249225922692279228922992309231923292339234923592369237923892399240924192429243924492459246924792489249925092519252925392549255925692579258925992609261926292639264926592669267926892699270927192729273927492759276927
79278927992809281928292839284928592869287928892899290929192929293929492959296929792989299930093019302930393049305930693079308930993109311931293139314931593169317931893199320932193229323932493259326932793289329933093319332933393349335933693379338933993409341934293439344934593469347934893499350935193529353935493559356935793589359936093619362936393649365936693679368936993709371937293739374937593769377937893799380938193829383938493859386938793889389939093919392939393949395939693979398939994009401940294039404940594069407940894099410941194129413941494159416941794189419942094219422942394249425942694279428942994309431943294339434943594369437943894399440944194429443944494459446944794489449945094519452945394549455945694579458945994609461946294639464946594669467946894699470947194729473947494759476947794789479948094819482948394849485948694879488948994909491949294939494949594969497949894999500950195029503950495059506950795089509951095119512951395149515951695179518951995209521952295239524952595269527952895299530953195329533953495359536953795389539954095419542954395449545954695479548954995509551955295539554955595569557955895599560956195629563956495659566956795689569957095719572957395749575957695779578957995809581958295839584958595869587958895899590959195929593959495959596959795989599960096019602960396049605960696079608960996109611961296139614961596169617961896199620962196229623962496259626962796289629963096319632963396349635963696379638963996409641964296439644964596469647964896499650965196529653965496559656965796589659966096619662966396649665966696679668966996709671967296739674967596769677967896799680968196829683968496859686968796889689969096919692969396949695969696979698969997009701970297039704970597069707970897099710971197129713971497159716971797189719972097219722972397249725972697279728972997309731973297339734973597369737973897399740974197429743974497459746974797489749975097519752975397549755975697579758975997609761976297639764976597669767976897699770977197729773977497759776977
79778977997809781978297839784978597869787978897899790979197929793979497959796979797989799980098019802980398049805980698079808980998109811981298139814981598169817981898199820982198229823982498259826982798289829983098319832983398349835983698379838983998409841984298439844984598469847984898499850985198529853985498559856985798589859986098619862986398649865986698679868986998709871987298739874987598769877987898799880988198829883988498859886988798889889989098919892989398949895989698979898989999009901990299039904990599069907990899099910991199129913991499159916991799189919992099219922992399249925992699279928992999309931993299339934993599369937993899399940994199429943994499459946994799489949995099519952995399549955995699579958995999609961996299639964996599669967996899699970997199729973997499759976997799789979998099819982998399849985998699879988998999909991999299939994999599969997999899991000010001100021000310004100051000610007100081000910010100111001210013100141001510016100171001810019100201002110022100231002410025100261002710028100291003010031100321003310034100351003610037100381003910040100411004210043100441004510046100471004810049100501005110052100531005410055100561005710058100591006010061100621006310064100651006610067100681006910070100711007210073100741007510076100771007810079100801008110082100831008410085100861008710088100891009010091100921009310094100951009610097100981009910100101011010210103101041010510106101071010810109101101011110112101131011410115101161011710118101191012010121101221012310124101251012610127101281012910130101311013210133101341013510136101371013810139101401014110142101431014410145101461014710148101491015010151101521015310154101551015610157101581015910160101611016210163101641016510166101671016810169101701017110172101731017410175101761017710178101791018010181101821018310184101851018610187101881018910190101911019210193101941019510196101971019810199102001020110202102031020410205102061020710208102091021010211102121021310214102151021610217102181021910220102211
02221022310224102251022610227102281022910230102311023210233102341023510236102371023810239102401024110242102431024410245102461024710248102491025010251102521025310254102551025610257102581025910260102611026210263102641026510266102671026810269102701027110272102731027410275102761027710278102791028010281102821028310284102851028610287102881028910290102911029210293102941029510296102971029810299103001030110302103031030410305103061030710308103091031010311103121031310314103151031610317103181031910320103211032210323103241032510326103271032810329103301033110332103331033410335103361033710338103391034010341103421034310344103451034610347103481034910350103511035210353103541035510356103571035810359103601036110362103631036410365103661036710368103691037010371103721037310374103751037610377103781037910380103811038210383103841038510386103871038810389103901039110392103931039410395103961039710398103991040010401104021040310404104051040610407104081040910410104111041210413104141041510416104171041810419104201042110422104231042410425104261042710428104291043010431104321043310434104351043610437104381043910440104411044210443104441044510446104471044810449104501045110452104531045410455104561045710458104591046010461104621046310464104651046610467104681046910470104711047210473104741047510476104771047810479104801048110482104831048410485104861048710488104891049010491104921049310494104951049610497104981049910500105011050210503105041050510506105071050810509105101051110512105131051410515105161051710518105191052010521105221052310524105251052610527105281052910530105311053210533105341053510536105371053810539105401054110542105431054410545105461054710548105491055010551105521055310554105551055610557105581055910560105611056210563105641056510566105671056810569105701057110572105731057410575105761057710578105791058010581105821058310584105851058610587105881058910590105911059210593105941059510596105971059810599106001060110602106031060410605106061060710608106091061010611106121061310614106151061610617106181061910620106211
06221062310624106251062610627106281062910630106311063210633106341063510636106371063810639106401064110642106431064410645106461064710648106491065010651106521065310654106551065610657106581065910660106611066210663106641066510666106671066810669106701067110672106731067410675106761067710678106791068010681106821068310684106851068610687106881068910690106911069210693106941069510696106971069810699107001070110702107031070410705107061070710708107091071010711107121071310714107151071610717107181071910720107211072210723107241072510726107271072810729107301073110732107331073410735107361073710738107391074010741107421074310744107451074610747107481074910750107511075210753107541075510756107571075810759107601076110762107631076410765107661076710768107691077010771107721077310774107751077610777107781077910780107811078210783107841078510786107871078810789107901079110792107931079410795107961079710798107991080010801108021080310804108051080610807108081080910810108111081210813108141081510816108171081810819108201082110822108231082410825108261082710828108291083010831108321083310834108351083610837108381083910840108411084210843108441084510846108471084810849108501085110852108531085410855108561085710858108591086010861108621086310864108651086610867108681086910870108711087210873108741087510876108771087810879108801088110882108831088410885108861088710888108891089010891108921089310894108951089610897108981089910900109011090210903109041090510906109071090810909109101091110912109131091410915109161091710918109191092010921109221092310924109251092610927109281092910930109311093210933109341093510936109371093810939109401094110942109431094410945109461094710948109491095010951109521095310954109551095610957109581095910960109611096210963109641096510966109671096810969109701097110972109731097410975109761097710978109791098010981109821098310984109851098610987109881098910990109911099210993109941099510996109971099810999110001100111002110031100411005110061100711008110091101011011110121101311014110151101611017110181101911020110211
10221102311024110251102611027110281102911030110311103211033110341103511036110371103811039110401104111042110431104411045110461104711048110491105011051110521105311054110551105611057110581105911060110611106211063110641106511066110671106811069110701107111072110731107411075110761107711078110791108011081110821108311084
  1. //
  2. // Copyright (C) 2014-2016 LunarG, Inc.
  3. // Copyright (C) 2015-2020 Google, Inc.
  4. // Copyright (C) 2017, 2022-2025 Arm Limited.
  5. // Modifications Copyright (C) 2020 Advanced Micro Devices, Inc. All rights reserved.
  6. //
  7. // All rights reserved.
  8. //
  9. // Redistribution and use in source and binary forms, with or without
  10. // modification, are permitted provided that the following conditions
  11. // are met:
  12. //
  13. // Redistributions of source code must retain the above copyright
  14. // notice, this list of conditions and the following disclaimer.
  15. //
  16. // Redistributions in binary form must reproduce the above
  17. // copyright notice, this list of conditions and the following
  18. // disclaimer in the documentation and/or other materials provided
  19. // with the distribution.
  20. //
  21. // Neither the name of 3Dlabs Inc. Ltd. nor the names of its
  22. // contributors may be used to endorse or promote products derived
  23. // from this software without specific prior written permission.
  24. //
  25. // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  26. // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  27. // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
  28. // FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
  29. // COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
  30. // INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
  31. // BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  32. // LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  33. // CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  34. // LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
  35. // ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  36. // POSSIBILITY OF SUCH DAMAGE.
  37. //
  38. // Visit the nodes in the glslang intermediate tree representation to
  39. // translate them to SPIR-V.
  40. //
  41. #include "spirv.hpp11"
  42. #include "GlslangToSpv.h"
  43. #include "SpvBuilder.h"
  44. #include "SpvTools.h"
  45. #include "spvUtil.h"
  46. namespace spv {
  47. #include "GLSL.std.450.h"
  48. #include "GLSL.ext.KHR.h"
  49. #include "GLSL.ext.EXT.h"
  50. #include "GLSL.ext.AMD.h"
  51. #include "GLSL.ext.NV.h"
  52. #include "GLSL.ext.ARM.h"
  53. #include "GLSL.ext.QCOM.h"
  54. #include "NonSemanticDebugPrintf.h"
  55. }
  56. // Glslang includes
  57. #include "../glslang/MachineIndependent/localintermediate.h"
  58. #include "../glslang/MachineIndependent/SymbolTable.h"
  59. #include "../glslang/Include/Common.h"
  60. // Build-time generated includes
  61. #include "glslang/build_info.h"
  62. #include <fstream>
  63. #include <iomanip>
  64. #include <list>
  65. #include <map>
  66. #include <optional>
  67. #include <stack>
  68. #include <string>
  69. #include <vector>
  70. namespace {
  71. namespace {
  72. class SpecConstantOpModeGuard {
  73. public:
  74. SpecConstantOpModeGuard(spv::Builder* builder)
  75. : builder_(builder) {
  76. previous_flag_ = builder->isInSpecConstCodeGenMode();
  77. }
  78. ~SpecConstantOpModeGuard() {
  79. previous_flag_ ? builder_->setToSpecConstCodeGenMode()
  80. : builder_->setToNormalCodeGenMode();
  81. }
  82. void turnOnSpecConstantOpMode() {
  83. builder_->setToSpecConstCodeGenMode();
  84. }
  85. private:
  86. spv::Builder* builder_;
  87. bool previous_flag_;
  88. };
  89. struct OpDecorations {
  90. public:
  91. OpDecorations(spv::Decoration precision, spv::Decoration noContraction, spv::Decoration nonUniform) :
  92. precision(precision)
  93. ,
  94. noContraction(noContraction),
  95. nonUniform(nonUniform)
  96. { }
  97. spv::Decoration precision;
  98. void addNoContraction(spv::Builder& builder, spv::Id t) { builder.addDecoration(t, noContraction); }
  99. void addNonUniform(spv::Builder& builder, spv::Id t) { builder.addDecoration(t, nonUniform); }
  100. protected:
  101. spv::Decoration noContraction;
  102. spv::Decoration nonUniform;
  103. };
  104. } // namespace
  105. //
  106. // The main holder of information for translating glslang to SPIR-V.
  107. //
  108. // Derives from the AST walking base class.
  109. //
  110. class TGlslangToSpvTraverser : public glslang::TIntermTraverser {
  111. public:
  112. TGlslangToSpvTraverser(unsigned int spvVersion, const glslang::TIntermediate*, spv::SpvBuildLogger* logger,
  113. glslang::SpvOptions& options);
  114. virtual ~TGlslangToSpvTraverser() { }
  115. bool visitAggregate(glslang::TVisit, glslang::TIntermAggregate*);
  116. bool visitBinary(glslang::TVisit, glslang::TIntermBinary*);
  117. void visitConstantUnion(glslang::TIntermConstantUnion*);
  118. bool visitSelection(glslang::TVisit, glslang::TIntermSelection*);
  119. bool visitSwitch(glslang::TVisit, glslang::TIntermSwitch*);
  120. void visitSymbol(glslang::TIntermSymbol* symbol);
  121. bool visitUnary(glslang::TVisit, glslang::TIntermUnary*);
  122. bool visitLoop(glslang::TVisit, glslang::TIntermLoop*);
  123. bool visitBranch(glslang::TVisit visit, glslang::TIntermBranch*);
  124. void finishSpv(bool compileOnly);
  125. void dumpSpv(std::vector<unsigned int>& out);
  126. protected:
  127. TGlslangToSpvTraverser(TGlslangToSpvTraverser&);
  128. TGlslangToSpvTraverser& operator=(TGlslangToSpvTraverser&);
  129. spv::Decoration TranslateInterpolationDecoration(const glslang::TQualifier& qualifier);
  130. spv::Decoration TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier);
  131. spv::Decoration TranslateNonUniformDecoration(const glslang::TQualifier& qualifier);
  132. spv::Decoration TranslateNonUniformDecoration(const spv::Builder::AccessChain::CoherentFlags& coherentFlags);
  133. spv::Builder::AccessChain::CoherentFlags TranslateCoherent(const glslang::TType& type);
  134. spv::MemoryAccessMask TranslateMemoryAccess(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  135. spv::ImageOperandsMask TranslateImageOperands(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  136. spv::Scope TranslateMemoryScope(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  137. spv::BuiltIn TranslateBuiltInDecoration(glslang::TBuiltInVariable, bool memberDeclaration);
  138. spv::ImageFormat TranslateImageFormat(const glslang::TType& type);
  139. spv::SelectionControlMask TranslateSelectionControl(const glslang::TIntermSelection&) const;
  140. spv::SelectionControlMask TranslateSwitchControl(const glslang::TIntermSwitch&) const;
  141. spv::LoopControlMask TranslateLoopControl(const glslang::TIntermLoop&, std::vector<unsigned int>& operands) const;
  142. spv::StorageClass TranslateStorageClass(const glslang::TType&);
  143. void TranslateLiterals(const glslang::TVector<const glslang::TIntermConstantUnion*>&, std::vector<unsigned>&) const;
  144. void addIndirectionIndexCapabilities(const glslang::TType& baseType, const glslang::TType& indexType);
  145. spv::Id createSpvVariable(const glslang::TIntermSymbol*, spv::Id forcedType);
  146. spv::Id getSampledType(const glslang::TSampler&);
  147. spv::Id getInvertedSwizzleType(const glslang::TIntermTyped&);
  148. spv::Id createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped&, spv::Id parentResult);
  149. void convertSwizzle(const glslang::TIntermAggregate&, std::vector<unsigned>& swizzle);
  150. spv::Id convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly = false);
  151. spv::Id convertGlslangToSpvType(const glslang::TType& type, glslang::TLayoutPacking, const glslang::TQualifier&,
  152. bool lastBufferBlockMember, bool forwardReferenceOnly = false);
  153. void applySpirvDecorate(const glslang::TType& type, spv::Id id, std::optional<int> member);
  154. bool filterMember(const glslang::TType& member);
  155. spv::Id convertGlslangStructToSpvType(const glslang::TType&, const glslang::TTypeList* glslangStruct,
  156. glslang::TLayoutPacking, const glslang::TQualifier&);
  157. spv::LinkageType convertGlslangLinkageToSpv(glslang::TLinkType glslangLinkType);
  158. void decorateStructType(const glslang::TType&, const glslang::TTypeList* glslangStruct, glslang::TLayoutPacking,
  159. const glslang::TQualifier&, spv::Id, const std::vector<spv::Id>& spvMembers);
  160. spv::Id makeArraySizeId(const glslang::TArraySizes&, int dim, bool allowZero = false, bool boolType = false);
  161. spv::Id accessChainLoad(const glslang::TType& type);
  162. void accessChainStore(const glslang::TType& type, spv::Id rvalue);
  163. void multiTypeStore(const glslang::TType&, spv::Id rValue);
  164. spv::Id convertLoadedBoolInUniformToUint(const glslang::TType& type, spv::Id nominalTypeId, spv::Id loadedId);
  165. glslang::TLayoutPacking getExplicitLayout(const glslang::TType& type) const;
  166. int getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  167. int getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  168. void updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType, int& currentOffset,
  169. int& nextOffset, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  170. void declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember);
  171. bool isShaderEntryPoint(const glslang::TIntermAggregate* node);
  172. bool writableParam(glslang::TStorageQualifier) const;
  173. bool originalParam(glslang::TStorageQualifier, const glslang::TType&, bool implicitThisParam);
  174. void makeFunctions(const glslang::TIntermSequence&);
  175. void makeGlobalInitializers(const glslang::TIntermSequence&);
  176. void collectRayTracingLinkerObjects();
  177. void visitFunctions(const glslang::TIntermSequence&);
  178. void handleFunctionEntry(const glslang::TIntermAggregate* node);
  179. void translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments,
  180. spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags);
  181. void translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments);
  182. spv::Id createImageTextureFunctionCall(glslang::TIntermOperator* node);
  183. spv::Id handleUserFunctionCall(const glslang::TIntermAggregate*);
  184. spv::Id createBinaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right,
  185. glslang::TBasicType typeProxy, bool reduceComparison = true);
  186. spv::Id createBinaryMatrixOperation(spv::Op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right);
  187. spv::Id createUnaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id operand,
  188. glslang::TBasicType typeProxy,
  189. const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
  190. const glslang::TType &opType);
  191. spv::Id createUnaryMatrixOperation(spv::Op op, OpDecorations&, spv::Id typeId, spv::Id operand,
  192. glslang::TBasicType typeProxy);
  193. spv::Id createConversion(glslang::TOperator op, OpDecorations&, spv::Id destTypeId, spv::Id operand,
  194. glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType);
  195. spv::Id createIntWidthConversion(spv::Id operand, int vectorSize, spv::Id destType,
  196. glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType);
  197. spv::Id makeSmearedConstant(spv::Id constant, int vectorSize);
  198. spv::Id createAtomicOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId,
  199. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy,
  200. const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
  201. const glslang::TType &opType);
  202. spv::Id createInvocationsOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands,
  203. glslang::TBasicType typeProxy);
  204. spv::Id CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,
  205. spv::Id typeId, std::vector<spv::Id>& operands);
  206. spv::Id createSubgroupOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands,
  207. glslang::TBasicType typeProxy);
  208. spv::Id createMiscOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId,
  209. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy);
  210. spv::Id createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId);
  211. spv::Id getSymbolId(const glslang::TIntermSymbol* node);
  212. void addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier & qualifier);
  213. bool hasQCOMImageProceessingDecoration(spv::Id id, spv::Decoration decor);
  214. void addImageProcessingQCOMDecoration(spv::Id id, spv::Decoration decor);
  215. void addImageProcessing2QCOMDecoration(spv::Id id, bool isForGather);
  216. spv::Id createSpvConstant(const glslang::TIntermTyped&);
  217. spv::Id createSpvConstantFromConstUnionArray(const glslang::TType& type, const glslang::TConstUnionArray&,
  218. int& nextConst, bool specConstant);
  219. bool isTrivialLeaf(const glslang::TIntermTyped* node);
  220. bool isTrivial(const glslang::TIntermTyped* node);
  221. spv::Id createShortCircuit(glslang::TOperator, glslang::TIntermTyped& left, glslang::TIntermTyped& right);
  222. spv::Id getExtBuiltins(const char* name);
  223. std::pair<spv::Id, spv::Id> getForcedType(glslang::TBuiltInVariable builtIn, const glslang::TType&);
  224. spv::Id translateForcedType(spv::Id object);
  225. spv::Id createCompositeConstruct(spv::Id typeId, std::vector<spv::Id> constituents);
  226. glslang::SpvOptions& options;
  227. spv::Function* shaderEntry;
  228. spv::Function* currentFunction;
  229. spv::Instruction* entryPoint;
  230. int sequenceDepth;
  231. spv::SpvBuildLogger* logger;
  232. // There is a 1:1 mapping between a spv builder and a module; this is thread safe
  233. spv::Builder builder;
  234. bool inEntryPoint;
  235. bool entryPointTerminated;
  236. bool linkageOnly; // true when visiting the set of objects in the AST present only for
  237. // establishing interface, whether or not they were statically used
  238. std::set<spv::Id> iOSet; // all input/output variables from either static use or declaration of interface
  239. const glslang::TIntermediate* glslangIntermediate;
  240. bool nanMinMaxClamp; // true if use NMin/NMax/NClamp instead of FMin/FMax/FClamp
  241. spv::Id stdBuiltins;
  242. spv::Id nonSemanticDebugPrintf;
  243. std::unordered_map<std::string, spv::Id> extBuiltinMap;
  244. std::unordered_map<long long, spv::Id> symbolValues;
  245. std::unordered_map<uint32_t, spv::Id> builtInVariableIds;
  246. std::unordered_set<long long> rValueParameters; // set of formal function parameters passed as rValues,
  247. // rather than a pointer
  248. std::unordered_map<std::string, spv::Function*> functionMap;
  249. std::unordered_map<const glslang::TTypeList*, spv::Id> structMap[glslang::ElpCount][glslang::ElmCount];
  250. // for mapping glslang block indices to spv indices (e.g., due to hidden members):
  251. std::unordered_map<long long, std::vector<int>> memberRemapper;
  252. // for mapping glslang symbol struct to symbol Id
  253. std::unordered_map<const glslang::TTypeList*, long long> glslangTypeToIdMap;
  254. std::stack<bool> breakForLoop; // false means break for switch
  255. std::unordered_map<std::string, const glslang::TIntermSymbol*> counterOriginator;
  256. // Map pointee types for EbtReference to their forward pointers
  257. std::map<const glslang::TType *, spv::Id> forwardPointers;
  258. // Type forcing, for when SPIR-V wants a different type than the AST,
  259. // requiring local translation to and from SPIR-V type on every access.
  260. // Maps <builtin-variable-id -> AST-required-type-id>
  261. std::unordered_map<spv::Id, spv::Id> forceType;
  262. // Used by Task shader while generating opearnds for OpEmitMeshTasksEXT
  263. spv::Id taskPayloadID;
  264. // Used later for generating OpTraceKHR/OpExecuteCallableKHR/OpHitObjectRecordHit*/OpHitObjectGetShaderBindingTableData
  265. std::unordered_map<unsigned int, glslang::TIntermSymbol *> locationToSymbol[4];
  266. std::unordered_map<spv::Id, std::vector<spv::Decoration> > idToQCOMDecorations;
  267. };
  268. //
  269. // Helper functions for translating glslang representations to SPIR-V enumerants.
  270. //
  271. // Translate glslang profile to SPIR-V source language.
  272. spv::SourceLanguage TranslateSourceLanguage(glslang::EShSource source, EProfile profile)
  273. {
  274. switch (source) {
  275. case glslang::EShSourceGlsl:
  276. switch (profile) {
  277. case ENoProfile:
  278. case ECoreProfile:
  279. case ECompatibilityProfile:
  280. return spv::SourceLanguage::GLSL;
  281. case EEsProfile:
  282. return spv::SourceLanguage::ESSL;
  283. default:
  284. return spv::SourceLanguage::Unknown;
  285. }
  286. case glslang::EShSourceHlsl:
  287. return spv::SourceLanguage::HLSL;
  288. default:
  289. return spv::SourceLanguage::Unknown;
  290. }
  291. }
  292. // Translate glslang language (stage) to SPIR-V execution model.
  293. spv::ExecutionModel TranslateExecutionModel(EShLanguage stage, bool isMeshShaderEXT = false)
  294. {
  295. switch (stage) {
  296. case EShLangVertex: return spv::ExecutionModel::Vertex;
  297. case EShLangFragment: return spv::ExecutionModel::Fragment;
  298. case EShLangCompute: return spv::ExecutionModel::GLCompute;
  299. case EShLangTessControl: return spv::ExecutionModel::TessellationControl;
  300. case EShLangTessEvaluation: return spv::ExecutionModel::TessellationEvaluation;
  301. case EShLangGeometry: return spv::ExecutionModel::Geometry;
  302. case EShLangRayGen: return spv::ExecutionModel::RayGenerationKHR;
  303. case EShLangIntersect: return spv::ExecutionModel::IntersectionKHR;
  304. case EShLangAnyHit: return spv::ExecutionModel::AnyHitKHR;
  305. case EShLangClosestHit: return spv::ExecutionModel::ClosestHitKHR;
  306. case EShLangMiss: return spv::ExecutionModel::MissKHR;
  307. case EShLangCallable: return spv::ExecutionModel::CallableKHR;
  308. case EShLangTask: return (isMeshShaderEXT)? spv::ExecutionModel::TaskEXT : spv::ExecutionModel::TaskNV;
  309. case EShLangMesh: return (isMeshShaderEXT)? spv::ExecutionModel::MeshEXT : spv::ExecutionModel::MeshNV;
  310. default:
  311. assert(0);
  312. return spv::ExecutionModel::Fragment;
  313. }
  314. }
  315. // Translate glslang sampler type to SPIR-V dimensionality.
  316. spv::Dim TranslateDimensionality(const glslang::TSampler& sampler)
  317. {
  318. switch (sampler.dim) {
  319. case glslang::Esd1D: return spv::Dim::Dim1D;
  320. case glslang::Esd2D: return spv::Dim::Dim2D;
  321. case glslang::Esd3D: return spv::Dim::Dim3D;
  322. case glslang::EsdCube: return spv::Dim::Cube;
  323. case glslang::EsdRect: return spv::Dim::Rect;
  324. case glslang::EsdBuffer: return spv::Dim::Buffer;
  325. case glslang::EsdSubpass: return spv::Dim::SubpassData;
  326. case glslang::EsdAttachmentEXT: return spv::Dim::TileImageDataEXT;
  327. default:
  328. assert(0);
  329. return spv::Dim::Dim2D;
  330. }
  331. }
  332. // Translate glslang precision to SPIR-V precision decorations.
  333. spv::Decoration TranslatePrecisionDecoration(glslang::TPrecisionQualifier glslangPrecision)
  334. {
  335. switch (glslangPrecision) {
  336. case glslang::EpqLow: return spv::Decoration::RelaxedPrecision;
  337. case glslang::EpqMedium: return spv::Decoration::RelaxedPrecision;
  338. default:
  339. return spv::NoPrecision;
  340. }
  341. }
  342. // Translate glslang type to SPIR-V precision decorations.
  343. spv::Decoration TranslatePrecisionDecoration(const glslang::TType& type)
  344. {
  345. return TranslatePrecisionDecoration(type.getQualifier().precision);
  346. }
  347. // Translate glslang type to SPIR-V block decorations.
  348. spv::Decoration TranslateBlockDecoration(const glslang::TStorageQualifier storage, bool useStorageBuffer)
  349. {
  350. switch (storage) {
  351. case glslang::EvqUniform: return spv::Decoration::Block;
  352. case glslang::EvqBuffer: return useStorageBuffer ? spv::Decoration::Block : spv::Decoration::BufferBlock;
  353. case glslang::EvqVaryingIn: return spv::Decoration::Block;
  354. case glslang::EvqVaryingOut: return spv::Decoration::Block;
  355. case glslang::EvqShared: return spv::Decoration::Block;
  356. case glslang::EvqPayload: return spv::Decoration::Block;
  357. case glslang::EvqPayloadIn: return spv::Decoration::Block;
  358. case glslang::EvqHitAttr: return spv::Decoration::Block;
  359. case glslang::EvqCallableData: return spv::Decoration::Block;
  360. case glslang::EvqCallableDataIn: return spv::Decoration::Block;
  361. case glslang::EvqHitObjectAttrNV: return spv::Decoration::Block;
  362. default:
  363. assert(0);
  364. break;
  365. }
  366. return spv::Decoration::Max;
  367. }
  368. // Translate glslang type to SPIR-V memory decorations.
  369. void TranslateMemoryDecoration(const glslang::TQualifier& qualifier, std::vector<spv::Decoration>& memory,
  370. bool useVulkanMemoryModel)
  371. {
  372. if (!useVulkanMemoryModel) {
  373. if (qualifier.isVolatile()) {
  374. memory.push_back(spv::Decoration::Volatile);
  375. memory.push_back(spv::Decoration::Coherent);
  376. } else if (qualifier.isCoherent()) {
  377. memory.push_back(spv::Decoration::Coherent);
  378. }
  379. }
  380. if (qualifier.isRestrict())
  381. memory.push_back(spv::Decoration::Restrict);
  382. if (qualifier.isReadOnly())
  383. memory.push_back(spv::Decoration::NonWritable);
  384. if (qualifier.isWriteOnly())
  385. memory.push_back(spv::Decoration::NonReadable);
  386. }
  387. // Translate glslang type to SPIR-V layout decorations.
  388. spv::Decoration TranslateLayoutDecoration(const glslang::TType& type, glslang::TLayoutMatrix matrixLayout)
  389. {
  390. if (type.isMatrix()) {
  391. switch (matrixLayout) {
  392. case glslang::ElmRowMajor:
  393. return spv::Decoration::RowMajor;
  394. case glslang::ElmColumnMajor:
  395. return spv::Decoration::ColMajor;
  396. default:
  397. // opaque layouts don't need a majorness
  398. return spv::Decoration::Max;
  399. }
  400. } else {
  401. switch (type.getBasicType()) {
  402. default:
  403. return spv::Decoration::Max;
  404. break;
  405. case glslang::EbtBlock:
  406. switch (type.getQualifier().storage) {
  407. case glslang::EvqShared:
  408. case glslang::EvqUniform:
  409. case glslang::EvqBuffer:
  410. switch (type.getQualifier().layoutPacking) {
  411. case glslang::ElpShared: return spv::Decoration::GLSLShared;
  412. case glslang::ElpPacked: return spv::Decoration::GLSLPacked;
  413. default:
  414. return spv::Decoration::Max;
  415. }
  416. case glslang::EvqVaryingIn:
  417. case glslang::EvqVaryingOut:
  418. if (type.getQualifier().isTaskMemory()) {
  419. switch (type.getQualifier().layoutPacking) {
  420. case glslang::ElpShared: return spv::Decoration::GLSLShared;
  421. case glslang::ElpPacked: return spv::Decoration::GLSLPacked;
  422. default: break;
  423. }
  424. } else {
  425. assert(type.getQualifier().layoutPacking == glslang::ElpNone);
  426. }
  427. return spv::Decoration::Max;
  428. case glslang::EvqPayload:
  429. case glslang::EvqPayloadIn:
  430. case glslang::EvqHitAttr:
  431. case glslang::EvqCallableData:
  432. case glslang::EvqCallableDataIn:
  433. case glslang::EvqHitObjectAttrNV:
  434. return spv::Decoration::Max;
  435. default:
  436. assert(0);
  437. return spv::Decoration::Max;
  438. }
  439. }
  440. }
  441. }
  442. // Translate glslang type to SPIR-V interpolation decorations.
  443. // Returns spv::Decoration::Max when no decoration
  444. // should be applied.
  445. spv::Decoration TGlslangToSpvTraverser::TranslateInterpolationDecoration(const glslang::TQualifier& qualifier)
  446. {
  447. if (qualifier.smooth)
  448. // Smooth decoration doesn't exist in SPIR-V 1.0
  449. return spv::Decoration::Max;
  450. else if (qualifier.isNonPerspective())
  451. return spv::Decoration::NoPerspective;
  452. else if (qualifier.flat)
  453. return spv::Decoration::Flat;
  454. else if (qualifier.isExplicitInterpolation()) {
  455. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  456. return spv::Decoration::ExplicitInterpAMD;
  457. }
  458. else
  459. return spv::Decoration::Max;
  460. }
  461. // Translate glslang type to SPIR-V auxiliary storage decorations.
  462. // Returns spv::Decoration::Max when no decoration
  463. // should be applied.
  464. spv::Decoration TGlslangToSpvTraverser::TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier)
  465. {
  466. if (qualifier.centroid)
  467. return spv::Decoration::Centroid;
  468. else if (qualifier.patch)
  469. return spv::Decoration::Patch;
  470. else if (qualifier.sample) {
  471. builder.addCapability(spv::Capability::SampleRateShading);
  472. return spv::Decoration::Sample;
  473. }
  474. return spv::Decoration::Max;
  475. }
  476. // If glslang type is invariant, return SPIR-V invariant decoration.
  477. spv::Decoration TranslateInvariantDecoration(const glslang::TQualifier& qualifier)
  478. {
  479. if (qualifier.invariant)
  480. return spv::Decoration::Invariant;
  481. else
  482. return spv::Decoration::Max;
  483. }
  484. // If glslang type is noContraction, return SPIR-V NoContraction decoration.
  485. spv::Decoration TranslateNoContractionDecoration(const glslang::TQualifier& qualifier)
  486. {
  487. if (qualifier.isNoContraction())
  488. return spv::Decoration::NoContraction;
  489. else
  490. return spv::Decoration::Max;
  491. }
  492. // If glslang type is nonUniform, return SPIR-V NonUniform decoration.
  493. spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(const glslang::TQualifier& qualifier)
  494. {
  495. if (qualifier.isNonUniform()) {
  496. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  497. builder.addCapability(spv::Capability::ShaderNonUniformEXT);
  498. return spv::Decoration::NonUniformEXT;
  499. } else
  500. return spv::Decoration::Max;
  501. }
  502. // If lvalue flags contains nonUniform, return SPIR-V NonUniform decoration.
  503. spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(
  504. const spv::Builder::AccessChain::CoherentFlags& coherentFlags)
  505. {
  506. if (coherentFlags.isNonUniform()) {
  507. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  508. builder.addCapability(spv::Capability::ShaderNonUniformEXT);
  509. return spv::Decoration::NonUniformEXT;
  510. } else
  511. return spv::Decoration::Max;
  512. }
  513. spv::MemoryAccessMask TGlslangToSpvTraverser::TranslateMemoryAccess(
  514. const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  515. {
  516. spv::MemoryAccessMask mask = spv::MemoryAccessMask::MaskNone;
  517. if (!glslangIntermediate->usingVulkanMemoryModel() || coherentFlags.isImage)
  518. return mask;
  519. if (coherentFlags.isVolatile() || coherentFlags.anyCoherent()) {
  520. mask = mask | spv::MemoryAccessMask::MakePointerAvailableKHR |
  521. spv::MemoryAccessMask::MakePointerVisibleKHR;
  522. }
  523. if (coherentFlags.nonprivate) {
  524. mask = mask | spv::MemoryAccessMask::NonPrivatePointerKHR;
  525. }
  526. if (coherentFlags.volatil) {
  527. mask = mask | spv::MemoryAccessMask::Volatile;
  528. }
  529. if (coherentFlags.nontemporal) {
  530. mask = mask | spv::MemoryAccessMask::Nontemporal;
  531. }
  532. if (mask != spv::MemoryAccessMask::MaskNone) {
  533. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  534. }
  535. return mask;
  536. }
  537. spv::ImageOperandsMask TGlslangToSpvTraverser::TranslateImageOperands(
  538. const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  539. {
  540. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  541. if (!glslangIntermediate->usingVulkanMemoryModel())
  542. return mask;
  543. if (coherentFlags.volatil ||
  544. coherentFlags.anyCoherent()) {
  545. mask = mask | spv::ImageOperandsMask::MakeTexelAvailableKHR |
  546. spv::ImageOperandsMask::MakeTexelVisibleKHR;
  547. }
  548. if (coherentFlags.nonprivate) {
  549. mask = mask | spv::ImageOperandsMask::NonPrivateTexelKHR;
  550. }
  551. if (coherentFlags.volatil) {
  552. mask = mask | spv::ImageOperandsMask::VolatileTexelKHR;
  553. }
  554. if (coherentFlags.nontemporal && builder.getSpvVersion() >= spv::Spv_1_6) {
  555. mask = mask | spv::ImageOperandsMask::Nontemporal;
  556. }
  557. if (mask != spv::ImageOperandsMask::MaskNone) {
  558. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  559. }
  560. return mask;
  561. }
  562. spv::Builder::AccessChain::CoherentFlags TGlslangToSpvTraverser::TranslateCoherent(const glslang::TType& type)
  563. {
  564. spv::Builder::AccessChain::CoherentFlags flags = {};
  565. flags.coherent = type.getQualifier().coherent;
  566. flags.devicecoherent = type.getQualifier().devicecoherent;
  567. flags.queuefamilycoherent = type.getQualifier().queuefamilycoherent;
  568. // shared variables are implicitly workgroupcoherent in GLSL.
  569. flags.workgroupcoherent = type.getQualifier().workgroupcoherent ||
  570. type.getQualifier().storage == glslang::EvqShared;
  571. flags.subgroupcoherent = type.getQualifier().subgroupcoherent;
  572. flags.shadercallcoherent = type.getQualifier().shadercallcoherent;
  573. flags.volatil = type.getQualifier().volatil;
  574. flags.nontemporal = type.getQualifier().nontemporal;
  575. // *coherent variables are implicitly nonprivate in GLSL
  576. flags.nonprivate = type.getQualifier().nonprivate ||
  577. flags.anyCoherent() ||
  578. flags.volatil;
  579. flags.isImage = type.getBasicType() == glslang::EbtSampler;
  580. flags.nonUniform = type.getQualifier().nonUniform;
  581. return flags;
  582. }
  583. spv::Scope TGlslangToSpvTraverser::TranslateMemoryScope(
  584. const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  585. {
  586. spv::Scope scope = spv::Scope::Max;
  587. if (coherentFlags.volatil || coherentFlags.coherent) {
  588. // coherent defaults to Device scope in the old model, QueueFamilyKHR scope in the new model
  589. scope = glslangIntermediate->usingVulkanMemoryModel() ? spv::Scope::QueueFamilyKHR : spv::Scope::Device;
  590. } else if (coherentFlags.devicecoherent) {
  591. scope = spv::Scope::Device;
  592. } else if (coherentFlags.queuefamilycoherent) {
  593. scope = spv::Scope::QueueFamilyKHR;
  594. } else if (coherentFlags.workgroupcoherent) {
  595. scope = spv::Scope::Workgroup;
  596. } else if (coherentFlags.subgroupcoherent) {
  597. scope = spv::Scope::Subgroup;
  598. } else if (coherentFlags.shadercallcoherent) {
  599. scope = spv::Scope::ShaderCallKHR;
  600. }
  601. if (glslangIntermediate->usingVulkanMemoryModel() && scope == spv::Scope::Device) {
  602. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  603. }
  604. return scope;
  605. }
  606. // Translate a glslang built-in variable to a SPIR-V built in decoration. Also generate
  607. // associated capabilities when required. For some built-in variables, a capability
  608. // is generated only when using the variable in an executable instruction, but not when
  609. // just declaring a struct member variable with it. This is true for PointSize,
  610. // ClipDistance, and CullDistance.
  611. spv::BuiltIn TGlslangToSpvTraverser::TranslateBuiltInDecoration(glslang::TBuiltInVariable builtIn,
  612. bool memberDeclaration)
  613. {
  614. switch (builtIn) {
  615. case glslang::EbvPointSize:
  616. // Defer adding the capability until the built-in is actually used.
  617. if (! memberDeclaration) {
  618. switch (glslangIntermediate->getStage()) {
  619. case EShLangGeometry:
  620. builder.addCapability(spv::Capability::GeometryPointSize);
  621. break;
  622. case EShLangTessControl:
  623. case EShLangTessEvaluation:
  624. builder.addCapability(spv::Capability::TessellationPointSize);
  625. break;
  626. default:
  627. break;
  628. }
  629. }
  630. return spv::BuiltIn::PointSize;
  631. case glslang::EbvPosition: return spv::BuiltIn::Position;
  632. case glslang::EbvVertexId: return spv::BuiltIn::VertexId;
  633. case glslang::EbvInstanceId: return spv::BuiltIn::InstanceId;
  634. case glslang::EbvVertexIndex: return spv::BuiltIn::VertexIndex;
  635. case glslang::EbvInstanceIndex: return spv::BuiltIn::InstanceIndex;
  636. case glslang::EbvFragCoord: return spv::BuiltIn::FragCoord;
  637. case glslang::EbvPointCoord: return spv::BuiltIn::PointCoord;
  638. case glslang::EbvFace: return spv::BuiltIn::FrontFacing;
  639. case glslang::EbvFragDepth: return spv::BuiltIn::FragDepth;
  640. case glslang::EbvNumWorkGroups: return spv::BuiltIn::NumWorkgroups;
  641. case glslang::EbvWorkGroupSize: return spv::BuiltIn::WorkgroupSize;
  642. case glslang::EbvWorkGroupId: return spv::BuiltIn::WorkgroupId;
  643. case glslang::EbvLocalInvocationId: return spv::BuiltIn::LocalInvocationId;
  644. case glslang::EbvLocalInvocationIndex: return spv::BuiltIn::LocalInvocationIndex;
  645. case glslang::EbvGlobalInvocationId: return spv::BuiltIn::GlobalInvocationId;
  646. // These *Distance capabilities logically belong here, but if the member is declared and
  647. // then never used, consumers of SPIR-V prefer the capability not be declared.
  648. // They are now generated when used, rather than here when declared.
  649. // Potentially, the specification should be more clear what the minimum
  650. // use needed is to trigger the capability.
  651. //
  652. case glslang::EbvClipDistance:
  653. if (!memberDeclaration)
  654. builder.addCapability(spv::Capability::ClipDistance);
  655. return spv::BuiltIn::ClipDistance;
  656. case glslang::EbvCullDistance:
  657. if (!memberDeclaration)
  658. builder.addCapability(spv::Capability::CullDistance);
  659. return spv::BuiltIn::CullDistance;
  660. case glslang::EbvViewportIndex:
  661. if (glslangIntermediate->getStage() == EShLangGeometry ||
  662. glslangIntermediate->getStage() == EShLangFragment) {
  663. builder.addCapability(spv::Capability::MultiViewport);
  664. }
  665. if (glslangIntermediate->getStage() == EShLangVertex ||
  666. glslangIntermediate->getStage() == EShLangTessControl ||
  667. glslangIntermediate->getStage() == EShLangTessEvaluation) {
  668. if (builder.getSpvVersion() < spv::Spv_1_5) {
  669. builder.addIncorporatedExtension(spv::E_SPV_EXT_shader_viewport_index_layer, spv::Spv_1_5);
  670. builder.addCapability(spv::Capability::ShaderViewportIndexLayerEXT);
  671. }
  672. else
  673. builder.addCapability(spv::Capability::ShaderViewportIndex);
  674. }
  675. return spv::BuiltIn::ViewportIndex;
  676. case glslang::EbvSampleId:
  677. builder.addCapability(spv::Capability::SampleRateShading);
  678. return spv::BuiltIn::SampleId;
  679. case glslang::EbvSamplePosition:
  680. builder.addCapability(spv::Capability::SampleRateShading);
  681. return spv::BuiltIn::SamplePosition;
  682. case glslang::EbvSampleMask:
  683. return spv::BuiltIn::SampleMask;
  684. case glslang::EbvLayer:
  685. if (glslangIntermediate->getStage() == EShLangMesh) {
  686. return spv::BuiltIn::Layer;
  687. }
  688. if (glslangIntermediate->getStage() == EShLangGeometry ||
  689. glslangIntermediate->getStage() == EShLangFragment) {
  690. builder.addCapability(spv::Capability::Geometry);
  691. }
  692. if (glslangIntermediate->getStage() == EShLangVertex ||
  693. glslangIntermediate->getStage() == EShLangTessControl ||
  694. glslangIntermediate->getStage() == EShLangTessEvaluation) {
  695. if (builder.getSpvVersion() < spv::Spv_1_5) {
  696. builder.addIncorporatedExtension(spv::E_SPV_EXT_shader_viewport_index_layer, spv::Spv_1_5);
  697. builder.addCapability(spv::Capability::ShaderViewportIndexLayerEXT);
  698. } else
  699. builder.addCapability(spv::Capability::ShaderLayer);
  700. }
  701. return spv::BuiltIn::Layer;
  702. case glslang::EbvBaseVertex:
  703. builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);
  704. builder.addCapability(spv::Capability::DrawParameters);
  705. return spv::BuiltIn::BaseVertex;
  706. case glslang::EbvBaseInstance:
  707. builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);
  708. builder.addCapability(spv::Capability::DrawParameters);
  709. return spv::BuiltIn::BaseInstance;
  710. case glslang::EbvDrawId:
  711. builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);
  712. builder.addCapability(spv::Capability::DrawParameters);
  713. return spv::BuiltIn::DrawIndex;
  714. case glslang::EbvPrimitiveId:
  715. if (glslangIntermediate->getStage() == EShLangFragment)
  716. builder.addCapability(spv::Capability::Geometry);
  717. return spv::BuiltIn::PrimitiveId;
  718. case glslang::EbvFragStencilRef:
  719. builder.addExtension(spv::E_SPV_EXT_shader_stencil_export);
  720. builder.addCapability(spv::Capability::StencilExportEXT);
  721. return spv::BuiltIn::FragStencilRefEXT;
  722. case glslang::EbvShadingRateKHR:
  723. builder.addExtension(spv::E_SPV_KHR_fragment_shading_rate);
  724. builder.addCapability(spv::Capability::FragmentShadingRateKHR);
  725. return spv::BuiltIn::ShadingRateKHR;
  726. case glslang::EbvPrimitiveShadingRateKHR:
  727. builder.addExtension(spv::E_SPV_KHR_fragment_shading_rate);
  728. builder.addCapability(spv::Capability::FragmentShadingRateKHR);
  729. return spv::BuiltIn::PrimitiveShadingRateKHR;
  730. case glslang::EbvInvocationId: return spv::BuiltIn::InvocationId;
  731. case glslang::EbvTessLevelInner: return spv::BuiltIn::TessLevelInner;
  732. case glslang::EbvTessLevelOuter: return spv::BuiltIn::TessLevelOuter;
  733. case glslang::EbvTessCoord: return spv::BuiltIn::TessCoord;
  734. case glslang::EbvPatchVertices: return spv::BuiltIn::PatchVertices;
  735. case glslang::EbvHelperInvocation: return spv::BuiltIn::HelperInvocation;
  736. case glslang::EbvSubGroupSize:
  737. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  738. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  739. return spv::BuiltIn::SubgroupSize;
  740. case glslang::EbvSubGroupInvocation:
  741. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  742. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  743. return spv::BuiltIn::SubgroupLocalInvocationId;
  744. case glslang::EbvSubGroupEqMask:
  745. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  746. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  747. return spv::BuiltIn::SubgroupEqMask;
  748. case glslang::EbvSubGroupGeMask:
  749. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  750. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  751. return spv::BuiltIn::SubgroupGeMask;
  752. case glslang::EbvSubGroupGtMask:
  753. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  754. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  755. return spv::BuiltIn::SubgroupGtMask;
  756. case glslang::EbvSubGroupLeMask:
  757. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  758. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  759. return spv::BuiltIn::SubgroupLeMask;
  760. case glslang::EbvSubGroupLtMask:
  761. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  762. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  763. return spv::BuiltIn::SubgroupLtMask;
  764. case glslang::EbvNumSubgroups:
  765. builder.addCapability(spv::Capability::GroupNonUniform);
  766. return spv::BuiltIn::NumSubgroups;
  767. case glslang::EbvSubgroupID:
  768. builder.addCapability(spv::Capability::GroupNonUniform);
  769. return spv::BuiltIn::SubgroupId;
  770. case glslang::EbvSubgroupSize2:
  771. builder.addCapability(spv::Capability::GroupNonUniform);
  772. return spv::BuiltIn::SubgroupSize;
  773. case glslang::EbvSubgroupInvocation2:
  774. builder.addCapability(spv::Capability::GroupNonUniform);
  775. return spv::BuiltIn::SubgroupLocalInvocationId;
  776. case glslang::EbvSubgroupEqMask2:
  777. builder.addCapability(spv::Capability::GroupNonUniform);
  778. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  779. return spv::BuiltIn::SubgroupEqMask;
  780. case glslang::EbvSubgroupGeMask2:
  781. builder.addCapability(spv::Capability::GroupNonUniform);
  782. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  783. return spv::BuiltIn::SubgroupGeMask;
  784. case glslang::EbvSubgroupGtMask2:
  785. builder.addCapability(spv::Capability::GroupNonUniform);
  786. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  787. return spv::BuiltIn::SubgroupGtMask;
  788. case glslang::EbvSubgroupLeMask2:
  789. builder.addCapability(spv::Capability::GroupNonUniform);
  790. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  791. return spv::BuiltIn::SubgroupLeMask;
  792. case glslang::EbvSubgroupLtMask2:
  793. builder.addCapability(spv::Capability::GroupNonUniform);
  794. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  795. return spv::BuiltIn::SubgroupLtMask;
  796. case glslang::EbvBaryCoordNoPersp:
  797. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  798. return spv::BuiltIn::BaryCoordNoPerspAMD;
  799. case glslang::EbvBaryCoordNoPerspCentroid:
  800. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  801. return spv::BuiltIn::BaryCoordNoPerspCentroidAMD;
  802. case glslang::EbvBaryCoordNoPerspSample:
  803. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  804. return spv::BuiltIn::BaryCoordNoPerspSampleAMD;
  805. case glslang::EbvBaryCoordSmooth:
  806. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  807. return spv::BuiltIn::BaryCoordSmoothAMD;
  808. case glslang::EbvBaryCoordSmoothCentroid:
  809. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  810. return spv::BuiltIn::BaryCoordSmoothCentroidAMD;
  811. case glslang::EbvBaryCoordSmoothSample:
  812. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  813. return spv::BuiltIn::BaryCoordSmoothSampleAMD;
  814. case glslang::EbvBaryCoordPullModel:
  815. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  816. return spv::BuiltIn::BaryCoordPullModelAMD;
  817. case glslang::EbvDeviceIndex:
  818. builder.addIncorporatedExtension(spv::E_SPV_KHR_device_group, spv::Spv_1_3);
  819. builder.addCapability(spv::Capability::DeviceGroup);
  820. return spv::BuiltIn::DeviceIndex;
  821. case glslang::EbvViewIndex:
  822. builder.addIncorporatedExtension(spv::E_SPV_KHR_multiview, spv::Spv_1_3);
  823. builder.addCapability(spv::Capability::MultiView);
  824. return spv::BuiltIn::ViewIndex;
  825. case glslang::EbvFragSizeEXT:
  826. builder.addExtension(spv::E_SPV_EXT_fragment_invocation_density);
  827. builder.addCapability(spv::Capability::FragmentDensityEXT);
  828. return spv::BuiltIn::FragSizeEXT;
  829. case glslang::EbvFragInvocationCountEXT:
  830. builder.addExtension(spv::E_SPV_EXT_fragment_invocation_density);
  831. builder.addCapability(spv::Capability::FragmentDensityEXT);
  832. return spv::BuiltIn::FragInvocationCountEXT;
  833. case glslang::EbvViewportMaskNV:
  834. if (!memberDeclaration) {
  835. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  836. builder.addCapability(spv::Capability::ShaderViewportMaskNV);
  837. }
  838. return spv::BuiltIn::ViewportMaskNV;
  839. case glslang::EbvSecondaryPositionNV:
  840. if (!memberDeclaration) {
  841. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  842. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  843. }
  844. return spv::BuiltIn::SecondaryPositionNV;
  845. case glslang::EbvSecondaryViewportMaskNV:
  846. if (!memberDeclaration) {
  847. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  848. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  849. }
  850. return spv::BuiltIn::SecondaryViewportMaskNV;
  851. case glslang::EbvPositionPerViewNV:
  852. if (!memberDeclaration) {
  853. builder.addExtension(spv::E_SPV_NVX_multiview_per_view_attributes);
  854. builder.addCapability(spv::Capability::PerViewAttributesNV);
  855. }
  856. return spv::BuiltIn::PositionPerViewNV;
  857. case glslang::EbvViewportMaskPerViewNV:
  858. if (!memberDeclaration) {
  859. builder.addExtension(spv::E_SPV_NVX_multiview_per_view_attributes);
  860. builder.addCapability(spv::Capability::PerViewAttributesNV);
  861. }
  862. return spv::BuiltIn::ViewportMaskPerViewNV;
  863. case glslang::EbvFragFullyCoveredNV:
  864. builder.addExtension(spv::E_SPV_EXT_fragment_fully_covered);
  865. builder.addCapability(spv::Capability::FragmentFullyCoveredEXT);
  866. return spv::BuiltIn::FullyCoveredEXT;
  867. case glslang::EbvFragmentSizeNV:
  868. builder.addExtension(spv::E_SPV_NV_shading_rate);
  869. builder.addCapability(spv::Capability::ShadingRateNV);
  870. return spv::BuiltIn::FragmentSizeNV;
  871. case glslang::EbvInvocationsPerPixelNV:
  872. builder.addExtension(spv::E_SPV_NV_shading_rate);
  873. builder.addCapability(spv::Capability::ShadingRateNV);
  874. return spv::BuiltIn::InvocationsPerPixelNV;
  875. // ray tracing
  876. case glslang::EbvLaunchId:
  877. return spv::BuiltIn::LaunchIdKHR;
  878. case glslang::EbvLaunchSize:
  879. return spv::BuiltIn::LaunchSizeKHR;
  880. case glslang::EbvWorldRayOrigin:
  881. return spv::BuiltIn::WorldRayOriginKHR;
  882. case glslang::EbvWorldRayDirection:
  883. return spv::BuiltIn::WorldRayDirectionKHR;
  884. case glslang::EbvObjectRayOrigin:
  885. return spv::BuiltIn::ObjectRayOriginKHR;
  886. case glslang::EbvObjectRayDirection:
  887. return spv::BuiltIn::ObjectRayDirectionKHR;
  888. case glslang::EbvRayTmin:
  889. return spv::BuiltIn::RayTminKHR;
  890. case glslang::EbvRayTmax:
  891. return spv::BuiltIn::RayTmaxKHR;
  892. case glslang::EbvCullMask:
  893. return spv::BuiltIn::CullMaskKHR;
  894. case glslang::EbvPositionFetch:
  895. return spv::BuiltIn::HitTriangleVertexPositionsKHR;
  896. case glslang::EbvInstanceCustomIndex:
  897. return spv::BuiltIn::InstanceCustomIndexKHR;
  898. case glslang::EbvHitKind:
  899. return spv::BuiltIn::HitKindKHR;
  900. case glslang::EbvObjectToWorld:
  901. case glslang::EbvObjectToWorld3x4:
  902. return spv::BuiltIn::ObjectToWorldKHR;
  903. case glslang::EbvWorldToObject:
  904. case glslang::EbvWorldToObject3x4:
  905. return spv::BuiltIn::WorldToObjectKHR;
  906. case glslang::EbvIncomingRayFlags:
  907. return spv::BuiltIn::IncomingRayFlagsKHR;
  908. case glslang::EbvGeometryIndex:
  909. return spv::BuiltIn::RayGeometryIndexKHR;
  910. case glslang::EbvCurrentRayTimeNV:
  911. builder.addExtension(spv::E_SPV_NV_ray_tracing_motion_blur);
  912. builder.addCapability(spv::Capability::RayTracingMotionBlurNV);
  913. return spv::BuiltIn::CurrentRayTimeNV;
  914. case glslang::EbvMicroTrianglePositionNV:
  915. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  916. builder.addExtension("SPV_NV_displacement_micromap");
  917. return spv::BuiltIn::HitMicroTriangleVertexPositionsNV;
  918. case glslang::EbvMicroTriangleBaryNV:
  919. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  920. builder.addExtension("SPV_NV_displacement_micromap");
  921. return spv::BuiltIn::HitMicroTriangleVertexBarycentricsNV;
  922. case glslang::EbvHitKindFrontFacingMicroTriangleNV:
  923. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  924. builder.addExtension("SPV_NV_displacement_micromap");
  925. return spv::BuiltIn::HitKindFrontFacingMicroTriangleNV;
  926. case glslang::EbvHitKindBackFacingMicroTriangleNV:
  927. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  928. builder.addExtension("SPV_NV_displacement_micromap");
  929. return spv::BuiltIn::HitKindBackFacingMicroTriangleNV;
  930. case glslang::EbvClusterIDNV:
  931. builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
  932. builder.addExtension("SPV_NV_cluster_acceleration_structure");
  933. return spv::BuiltIn::ClusterIDNV;
  934. case glslang::EbvHitIsSphereNV:
  935. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  936. builder.addExtension("SPV_NV_linear_swept_spheres");
  937. return spv::BuiltIn::HitIsSphereNV;
  938. case glslang::EbvHitIsLSSNV:
  939. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  940. builder.addExtension("SPV_NV_linear_swept_spheres");
  941. return spv::BuiltIn::HitIsLSSNV;
  942. case glslang::EbvHitSpherePositionNV:
  943. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  944. builder.addExtension("SPV_NV_linear_swept_spheres");
  945. return spv::BuiltIn::HitSpherePositionNV;
  946. case glslang::EbvHitSphereRadiusNV:
  947. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  948. builder.addExtension("SPV_NV_linear_swept_spheres");
  949. return spv::BuiltIn::HitSphereRadiusNV;
  950. case glslang::EbvHitLSSPositionsNV:
  951. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  952. builder.addExtension("SPV_NV_linear_swept_spheres");
  953. return spv::BuiltIn::HitLSSPositionsNV;
  954. case glslang::EbvHitLSSRadiiNV:
  955. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  956. builder.addExtension("SPV_NV_linear_swept_spheres");
  957. return spv::BuiltIn::HitLSSRadiiNV;
  958. // barycentrics
  959. case glslang::EbvBaryCoordNV:
  960. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  961. builder.addCapability(spv::Capability::FragmentBarycentricNV);
  962. return spv::BuiltIn::BaryCoordNV;
  963. case glslang::EbvBaryCoordNoPerspNV:
  964. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  965. builder.addCapability(spv::Capability::FragmentBarycentricNV);
  966. return spv::BuiltIn::BaryCoordNoPerspNV;
  967. case glslang::EbvBaryCoordEXT:
  968. builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
  969. builder.addCapability(spv::Capability::FragmentBarycentricKHR);
  970. return spv::BuiltIn::BaryCoordKHR;
  971. case glslang::EbvBaryCoordNoPerspEXT:
  972. builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
  973. builder.addCapability(spv::Capability::FragmentBarycentricKHR);
  974. return spv::BuiltIn::BaryCoordNoPerspKHR;
  975. // mesh shaders
  976. case glslang::EbvTaskCountNV:
  977. return spv::BuiltIn::TaskCountNV;
  978. case glslang::EbvPrimitiveCountNV:
  979. return spv::BuiltIn::PrimitiveCountNV;
  980. case glslang::EbvPrimitiveIndicesNV:
  981. return spv::BuiltIn::PrimitiveIndicesNV;
  982. case glslang::EbvClipDistancePerViewNV:
  983. return spv::BuiltIn::ClipDistancePerViewNV;
  984. case glslang::EbvCullDistancePerViewNV:
  985. return spv::BuiltIn::CullDistancePerViewNV;
  986. case glslang::EbvLayerPerViewNV:
  987. return spv::BuiltIn::LayerPerViewNV;
  988. case glslang::EbvMeshViewCountNV:
  989. return spv::BuiltIn::MeshViewCountNV;
  990. case glslang::EbvMeshViewIndicesNV:
  991. return spv::BuiltIn::MeshViewIndicesNV;
  992. // SPV_EXT_mesh_shader
  993. case glslang::EbvPrimitivePointIndicesEXT:
  994. return spv::BuiltIn::PrimitivePointIndicesEXT;
  995. case glslang::EbvPrimitiveLineIndicesEXT:
  996. return spv::BuiltIn::PrimitiveLineIndicesEXT;
  997. case glslang::EbvPrimitiveTriangleIndicesEXT:
  998. return spv::BuiltIn::PrimitiveTriangleIndicesEXT;
  999. case glslang::EbvCullPrimitiveEXT:
  1000. return spv::BuiltIn::CullPrimitiveEXT;
  1001. // sm builtins
  1002. case glslang::EbvWarpsPerSM:
  1003. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1004. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1005. return spv::BuiltIn::WarpsPerSMNV;
  1006. case glslang::EbvSMCount:
  1007. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1008. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1009. return spv::BuiltIn::SMCountNV;
  1010. case glslang::EbvWarpID:
  1011. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1012. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1013. return spv::BuiltIn::WarpIDNV;
  1014. case glslang::EbvSMID:
  1015. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1016. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1017. return spv::BuiltIn::SMIDNV;
  1018. // ARM builtins
  1019. case glslang::EbvCoreCountARM:
  1020. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1021. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1022. return spv::BuiltIn::CoreCountARM;
  1023. case glslang::EbvCoreIDARM:
  1024. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1025. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1026. return spv::BuiltIn::CoreIDARM;
  1027. case glslang::EbvCoreMaxIDARM:
  1028. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1029. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1030. return spv::BuiltIn::CoreMaxIDARM;
  1031. case glslang::EbvWarpIDARM:
  1032. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1033. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1034. return spv::BuiltIn::WarpIDARM;
  1035. case glslang::EbvWarpMaxIDARM:
  1036. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1037. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1038. return spv::BuiltIn::WarpMaxIDARM;
  1039. // QCOM builtins
  1040. case glslang::EbvTileOffsetQCOM:
  1041. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1042. return spv::BuiltIn::TileOffsetQCOM;
  1043. case glslang::EbvTileDimensionQCOM:
  1044. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1045. return spv::BuiltIn::TileDimensionQCOM;
  1046. case glslang::EbvTileApronSizeQCOM:
  1047. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1048. return spv::BuiltIn::TileApronSizeQCOM;
  1049. default:
  1050. return spv::BuiltIn::Max;
  1051. }
  1052. }
  1053. // Translate glslang image layout format to SPIR-V image format.
  1054. spv::ImageFormat TGlslangToSpvTraverser::TranslateImageFormat(const glslang::TType& type)
  1055. {
  1056. assert(type.getBasicType() == glslang::EbtSampler);
  1057. // Check for capabilities
  1058. switch (type.getQualifier().getFormat()) {
  1059. case glslang::ElfRg32f:
  1060. case glslang::ElfRg16f:
  1061. case glslang::ElfR11fG11fB10f:
  1062. case glslang::ElfR16f:
  1063. case glslang::ElfRgba16:
  1064. case glslang::ElfRgb10A2:
  1065. case glslang::ElfRg16:
  1066. case glslang::ElfRg8:
  1067. case glslang::ElfR16:
  1068. case glslang::ElfR8:
  1069. case glslang::ElfRgba16Snorm:
  1070. case glslang::ElfRg16Snorm:
  1071. case glslang::ElfRg8Snorm:
  1072. case glslang::ElfR16Snorm:
  1073. case glslang::ElfR8Snorm:
  1074. case glslang::ElfRg32i:
  1075. case glslang::ElfRg16i:
  1076. case glslang::ElfRg8i:
  1077. case glslang::ElfR16i:
  1078. case glslang::ElfR8i:
  1079. case glslang::ElfRgb10a2ui:
  1080. case glslang::ElfRg32ui:
  1081. case glslang::ElfRg16ui:
  1082. case glslang::ElfRg8ui:
  1083. case glslang::ElfR16ui:
  1084. case glslang::ElfR8ui:
  1085. builder.addCapability(spv::Capability::StorageImageExtendedFormats);
  1086. break;
  1087. case glslang::ElfR64ui:
  1088. case glslang::ElfR64i:
  1089. builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
  1090. builder.addCapability(spv::Capability::Int64ImageEXT);
  1091. break;
  1092. default:
  1093. break;
  1094. }
  1095. // do the translation
  1096. switch (type.getQualifier().getFormat()) {
  1097. case glslang::ElfNone: return spv::ImageFormat::Unknown;
  1098. case glslang::ElfRgba32f: return spv::ImageFormat::Rgba32f;
  1099. case glslang::ElfRgba16f: return spv::ImageFormat::Rgba16f;
  1100. case glslang::ElfR32f: return spv::ImageFormat::R32f;
  1101. case glslang::ElfRgba8: return spv::ImageFormat::Rgba8;
  1102. case glslang::ElfRgba8Snorm: return spv::ImageFormat::Rgba8Snorm;
  1103. case glslang::ElfRg32f: return spv::ImageFormat::Rg32f;
  1104. case glslang::ElfRg16f: return spv::ImageFormat::Rg16f;
  1105. case glslang::ElfR11fG11fB10f: return spv::ImageFormat::R11fG11fB10f;
  1106. case glslang::ElfR16f: return spv::ImageFormat::R16f;
  1107. case glslang::ElfRgba16: return spv::ImageFormat::Rgba16;
  1108. case glslang::ElfRgb10A2: return spv::ImageFormat::Rgb10A2;
  1109. case glslang::ElfRg16: return spv::ImageFormat::Rg16;
  1110. case glslang::ElfRg8: return spv::ImageFormat::Rg8;
  1111. case glslang::ElfR16: return spv::ImageFormat::R16;
  1112. case glslang::ElfR8: return spv::ImageFormat::R8;
  1113. case glslang::ElfRgba16Snorm: return spv::ImageFormat::Rgba16Snorm;
  1114. case glslang::ElfRg16Snorm: return spv::ImageFormat::Rg16Snorm;
  1115. case glslang::ElfRg8Snorm: return spv::ImageFormat::Rg8Snorm;
  1116. case glslang::ElfR16Snorm: return spv::ImageFormat::R16Snorm;
  1117. case glslang::ElfR8Snorm: return spv::ImageFormat::R8Snorm;
  1118. case glslang::ElfRgba32i: return spv::ImageFormat::Rgba32i;
  1119. case glslang::ElfRgba16i: return spv::ImageFormat::Rgba16i;
  1120. case glslang::ElfRgba8i: return spv::ImageFormat::Rgba8i;
  1121. case glslang::ElfR32i: return spv::ImageFormat::R32i;
  1122. case glslang::ElfRg32i: return spv::ImageFormat::Rg32i;
  1123. case glslang::ElfRg16i: return spv::ImageFormat::Rg16i;
  1124. case glslang::ElfRg8i: return spv::ImageFormat::Rg8i;
  1125. case glslang::ElfR16i: return spv::ImageFormat::R16i;
  1126. case glslang::ElfR8i: return spv::ImageFormat::R8i;
  1127. case glslang::ElfRgba32ui: return spv::ImageFormat::Rgba32ui;
  1128. case glslang::ElfRgba16ui: return spv::ImageFormat::Rgba16ui;
  1129. case glslang::ElfRgba8ui: return spv::ImageFormat::Rgba8ui;
  1130. case glslang::ElfR32ui: return spv::ImageFormat::R32ui;
  1131. case glslang::ElfRg32ui: return spv::ImageFormat::Rg32ui;
  1132. case glslang::ElfRg16ui: return spv::ImageFormat::Rg16ui;
  1133. case glslang::ElfRgb10a2ui: return spv::ImageFormat::Rgb10a2ui;
  1134. case glslang::ElfRg8ui: return spv::ImageFormat::Rg8ui;
  1135. case glslang::ElfR16ui: return spv::ImageFormat::R16ui;
  1136. case glslang::ElfR8ui: return spv::ImageFormat::R8ui;
  1137. case glslang::ElfR64ui: return spv::ImageFormat::R64ui;
  1138. case glslang::ElfR64i: return spv::ImageFormat::R64i;
  1139. default: return spv::ImageFormat::Max;
  1140. }
  1141. }
  1142. spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSelectionControl(
  1143. const glslang::TIntermSelection& selectionNode) const
  1144. {
  1145. if (selectionNode.getFlatten())
  1146. return spv::SelectionControlMask::Flatten;
  1147. if (selectionNode.getDontFlatten())
  1148. return spv::SelectionControlMask::DontFlatten;
  1149. return spv::SelectionControlMask::MaskNone;
  1150. }
  1151. spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSwitchControl(const glslang::TIntermSwitch& switchNode)
  1152. const
  1153. {
  1154. if (switchNode.getFlatten())
  1155. return spv::SelectionControlMask::Flatten;
  1156. if (switchNode.getDontFlatten())
  1157. return spv::SelectionControlMask::DontFlatten;
  1158. return spv::SelectionControlMask::MaskNone;
  1159. }
  1160. // return a non-0 dependency if the dependency argument must be set
  1161. spv::LoopControlMask TGlslangToSpvTraverser::TranslateLoopControl(const glslang::TIntermLoop& loopNode,
  1162. std::vector<unsigned int>& operands) const
  1163. {
  1164. spv::LoopControlMask control = spv::LoopControlMask::MaskNone;
  1165. if (loopNode.getDontUnroll())
  1166. control = control | spv::LoopControlMask::DontUnroll;
  1167. if (loopNode.getUnroll())
  1168. control = control | spv::LoopControlMask::Unroll;
  1169. if (unsigned(loopNode.getLoopDependency()) == glslang::TIntermLoop::dependencyInfinite)
  1170. control = control | spv::LoopControlMask::DependencyInfinite;
  1171. else if (loopNode.getLoopDependency() > 0) {
  1172. control = control | spv::LoopControlMask::DependencyLength;
  1173. operands.push_back((unsigned int)loopNode.getLoopDependency());
  1174. }
  1175. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  1176. if (loopNode.getMinIterations() > 0) {
  1177. control = control | spv::LoopControlMask::MinIterations;
  1178. operands.push_back(loopNode.getMinIterations());
  1179. }
  1180. if (loopNode.getMaxIterations() < glslang::TIntermLoop::iterationsInfinite) {
  1181. control = control | spv::LoopControlMask::MaxIterations;
  1182. operands.push_back(loopNode.getMaxIterations());
  1183. }
  1184. if (loopNode.getIterationMultiple() > 1) {
  1185. control = control | spv::LoopControlMask::IterationMultiple;
  1186. operands.push_back(loopNode.getIterationMultiple());
  1187. }
  1188. if (loopNode.getPeelCount() > 0) {
  1189. control = control | spv::LoopControlMask::PeelCount;
  1190. operands.push_back(loopNode.getPeelCount());
  1191. }
  1192. if (loopNode.getPartialCount() > 0) {
  1193. control = control | spv::LoopControlMask::PartialCount;
  1194. operands.push_back(loopNode.getPartialCount());
  1195. }
  1196. }
  1197. return control;
  1198. }
  1199. // Translate glslang type to SPIR-V storage class.
  1200. spv::StorageClass TGlslangToSpvTraverser::TranslateStorageClass(const glslang::TType& type)
  1201. {
  1202. if (type.getBasicType() == glslang::EbtRayQuery || type.getBasicType() == glslang::EbtHitObjectNV)
  1203. return spv::StorageClass::Private;
  1204. if (type.getQualifier().isSpirvByReference()) {
  1205. if (type.getQualifier().isParamInput() || type.getQualifier().isParamOutput())
  1206. return spv::StorageClass::Function;
  1207. }
  1208. if (type.getQualifier().isPipeInput())
  1209. return spv::StorageClass::Input;
  1210. if (type.getQualifier().isPipeOutput())
  1211. return spv::StorageClass::Output;
  1212. if (type.getQualifier().storage == glslang::EvqTileImageEXT || type.isAttachmentEXT()) {
  1213. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1214. builder.addCapability(spv::Capability::TileImageColorReadAccessEXT);
  1215. return spv::StorageClass::TileImageEXT;
  1216. }
  1217. if (type.getQualifier().isTileAttachmentQCOM()) {
  1218. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1219. builder.addCapability(spv::Capability::TileShadingQCOM);
  1220. return spv::StorageClass::TileAttachmentQCOM;
  1221. }
  1222. if (glslangIntermediate->getSource() != glslang::EShSourceHlsl ||
  1223. type.getQualifier().storage == glslang::EvqUniform) {
  1224. if (type.isAtomic())
  1225. return spv::StorageClass::AtomicCounter;
  1226. if (type.containsOpaque() && !glslangIntermediate->getBindlessMode())
  1227. return spv::StorageClass::UniformConstant;
  1228. }
  1229. if (type.getQualifier().isUniformOrBuffer() &&
  1230. type.getQualifier().isShaderRecord()) {
  1231. return spv::StorageClass::ShaderRecordBufferKHR;
  1232. }
  1233. if (glslangIntermediate->usingStorageBuffer() && type.getQualifier().storage == glslang::EvqBuffer) {
  1234. builder.addIncorporatedExtension(spv::E_SPV_KHR_storage_buffer_storage_class, spv::Spv_1_3);
  1235. return spv::StorageClass::StorageBuffer;
  1236. }
  1237. if (type.getQualifier().isUniformOrBuffer()) {
  1238. if (type.getQualifier().isPushConstant())
  1239. return spv::StorageClass::PushConstant;
  1240. if (type.getBasicType() == glslang::EbtBlock)
  1241. return spv::StorageClass::Uniform;
  1242. return spv::StorageClass::UniformConstant;
  1243. }
  1244. if (type.getQualifier().storage == glslang::EvqShared && type.getBasicType() == glslang::EbtBlock) {
  1245. builder.addExtension(spv::E_SPV_KHR_workgroup_memory_explicit_layout);
  1246. builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayoutKHR);
  1247. return spv::StorageClass::Workgroup;
  1248. }
  1249. switch (type.getQualifier().storage) {
  1250. case glslang::EvqGlobal: return spv::StorageClass::Private;
  1251. case glslang::EvqConstReadOnly: return spv::StorageClass::Function;
  1252. case glslang::EvqTemporary: return spv::StorageClass::Function;
  1253. case glslang::EvqShared: return spv::StorageClass::Workgroup;
  1254. case glslang::EvqPayload: return spv::StorageClass::RayPayloadKHR;
  1255. case glslang::EvqPayloadIn: return spv::StorageClass::IncomingRayPayloadKHR;
  1256. case glslang::EvqHitAttr: return spv::StorageClass::HitAttributeKHR;
  1257. case glslang::EvqCallableData: return spv::StorageClass::CallableDataKHR;
  1258. case glslang::EvqCallableDataIn: return spv::StorageClass::IncomingCallableDataKHR;
  1259. case glslang::EvqtaskPayloadSharedEXT : return spv::StorageClass::TaskPayloadWorkgroupEXT;
  1260. case glslang::EvqHitObjectAttrNV: return spv::StorageClass::HitObjectAttributeNV;
  1261. case glslang::EvqSpirvStorageClass: return static_cast<spv::StorageClass>(type.getQualifier().spirvStorageClass);
  1262. default:
  1263. assert(0);
  1264. break;
  1265. }
  1266. return spv::StorageClass::Function;
  1267. }
  1268. // Translate glslang constants to SPIR-V literals
  1269. void TGlslangToSpvTraverser::TranslateLiterals(const glslang::TVector<const glslang::TIntermConstantUnion*>& constants,
  1270. std::vector<unsigned>& literals) const
  1271. {
  1272. for (auto constant : constants) {
  1273. if (constant->getBasicType() == glslang::EbtFloat) {
  1274. float floatValue = static_cast<float>(constant->getConstArray()[0].getDConst());
  1275. unsigned literal;
  1276. static_assert(sizeof(literal) == sizeof(floatValue), "sizeof(unsigned) != sizeof(float)");
  1277. memcpy(&literal, &floatValue, sizeof(literal));
  1278. literals.push_back(literal);
  1279. } else if (constant->getBasicType() == glslang::EbtInt) {
  1280. unsigned literal = constant->getConstArray()[0].getIConst();
  1281. literals.push_back(literal);
  1282. } else if (constant->getBasicType() == glslang::EbtUint) {
  1283. unsigned literal = constant->getConstArray()[0].getUConst();
  1284. literals.push_back(literal);
  1285. } else if (constant->getBasicType() == glslang::EbtBool) {
  1286. unsigned literal = constant->getConstArray()[0].getBConst();
  1287. literals.push_back(literal);
  1288. } else if (constant->getBasicType() == glslang::EbtString) {
  1289. auto str = constant->getConstArray()[0].getSConst()->c_str();
  1290. unsigned literal = 0;
  1291. char* literalPtr = reinterpret_cast<char*>(&literal);
  1292. unsigned charCount = 0;
  1293. char ch = 0;
  1294. do {
  1295. ch = *(str++);
  1296. *(literalPtr++) = ch;
  1297. ++charCount;
  1298. if (charCount == 4) {
  1299. literals.push_back(literal);
  1300. literalPtr = reinterpret_cast<char*>(&literal);
  1301. charCount = 0;
  1302. }
  1303. } while (ch != 0);
  1304. // Partial literal is padded with 0
  1305. if (charCount > 0) {
  1306. for (; charCount < 4; ++charCount)
  1307. *(literalPtr++) = 0;
  1308. literals.push_back(literal);
  1309. }
  1310. } else
  1311. assert(0); // Unexpected type
  1312. }
  1313. }
  1314. // Add capabilities pertaining to how an array is indexed.
  1315. void TGlslangToSpvTraverser::addIndirectionIndexCapabilities(const glslang::TType& baseType,
  1316. const glslang::TType& indexType)
  1317. {
  1318. if (indexType.getQualifier().isNonUniform()) {
  1319. // deal with an asserted non-uniform index
  1320. // SPV_EXT_descriptor_indexing already added in TranslateNonUniformDecoration
  1321. if (baseType.getBasicType() == glslang::EbtSampler) {
  1322. if (baseType.getQualifier().hasAttachment())
  1323. builder.addCapability(spv::Capability::InputAttachmentArrayNonUniformIndexingEXT);
  1324. else if (baseType.isImage() && baseType.getSampler().isBuffer())
  1325. builder.addCapability(spv::Capability::StorageTexelBufferArrayNonUniformIndexingEXT);
  1326. else if (baseType.isTexture() && baseType.getSampler().isBuffer())
  1327. builder.addCapability(spv::Capability::UniformTexelBufferArrayNonUniformIndexingEXT);
  1328. else if (baseType.isImage())
  1329. builder.addCapability(spv::Capability::StorageImageArrayNonUniformIndexingEXT);
  1330. else if (baseType.isTexture())
  1331. builder.addCapability(spv::Capability::SampledImageArrayNonUniformIndexingEXT);
  1332. } else if (baseType.getBasicType() == glslang::EbtBlock) {
  1333. if (baseType.getQualifier().storage == glslang::EvqBuffer)
  1334. builder.addCapability(spv::Capability::StorageBufferArrayNonUniformIndexingEXT);
  1335. else if (baseType.getQualifier().storage == glslang::EvqUniform)
  1336. builder.addCapability(spv::Capability::UniformBufferArrayNonUniformIndexingEXT);
  1337. }
  1338. } else {
  1339. // assume a dynamically uniform index
  1340. if (baseType.getBasicType() == glslang::EbtSampler) {
  1341. if (baseType.getQualifier().hasAttachment()) {
  1342. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  1343. builder.addCapability(spv::Capability::InputAttachmentArrayDynamicIndexingEXT);
  1344. } else if (baseType.isImage() && baseType.getSampler().isBuffer()) {
  1345. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  1346. builder.addCapability(spv::Capability::StorageTexelBufferArrayDynamicIndexingEXT);
  1347. } else if (baseType.isTexture() && baseType.getSampler().isBuffer()) {
  1348. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  1349. builder.addCapability(spv::Capability::UniformTexelBufferArrayDynamicIndexingEXT);
  1350. }
  1351. }
  1352. }
  1353. }
  1354. // Return whether or not the given type is something that should be tied to a
  1355. // descriptor set.
  1356. bool IsDescriptorResource(const glslang::TType& type)
  1357. {
  1358. // uniform and buffer blocks are included, unless it is a push_constant
  1359. if (type.getBasicType() == glslang::EbtBlock)
  1360. return type.getQualifier().isUniformOrBuffer() &&
  1361. ! type.getQualifier().isShaderRecord() &&
  1362. ! type.getQualifier().isPushConstant();
  1363. // non block...
  1364. // basically samplerXXX/subpass/sampler/texture are all included
  1365. // if they are the global-scope-class, not the function parameter
  1366. // (or local, if they ever exist) class.
  1367. if (type.getBasicType() == glslang::EbtSampler ||
  1368. type.getBasicType() == glslang::EbtAccStruct)
  1369. return type.getQualifier().isUniformOrBuffer();
  1370. // Tensors are tied to a descriptor.
  1371. if (type.isTensorARM())
  1372. return true;
  1373. // None of the above.
  1374. return false;
  1375. }
  1376. void InheritQualifiers(glslang::TQualifier& child, const glslang::TQualifier& parent)
  1377. {
  1378. if (child.layoutMatrix == glslang::ElmNone)
  1379. child.layoutMatrix = parent.layoutMatrix;
  1380. if (parent.invariant)
  1381. child.invariant = true;
  1382. if (parent.flat)
  1383. child.flat = true;
  1384. if (parent.centroid)
  1385. child.centroid = true;
  1386. if (parent.nopersp)
  1387. child.nopersp = true;
  1388. if (parent.explicitInterp)
  1389. child.explicitInterp = true;
  1390. if (parent.perPrimitiveNV)
  1391. child.perPrimitiveNV = true;
  1392. if (parent.perViewNV)
  1393. child.perViewNV = true;
  1394. if (parent.perTaskNV)
  1395. child.perTaskNV = true;
  1396. if (parent.storage == glslang::EvqtaskPayloadSharedEXT)
  1397. child.storage = glslang::EvqtaskPayloadSharedEXT;
  1398. if (parent.patch)
  1399. child.patch = true;
  1400. if (parent.sample)
  1401. child.sample = true;
  1402. if (parent.coherent)
  1403. child.coherent = true;
  1404. if (parent.devicecoherent)
  1405. child.devicecoherent = true;
  1406. if (parent.queuefamilycoherent)
  1407. child.queuefamilycoherent = true;
  1408. if (parent.workgroupcoherent)
  1409. child.workgroupcoherent = true;
  1410. if (parent.subgroupcoherent)
  1411. child.subgroupcoherent = true;
  1412. if (parent.shadercallcoherent)
  1413. child.shadercallcoherent = true;
  1414. if (parent.nonprivate)
  1415. child.nonprivate = true;
  1416. if (parent.volatil)
  1417. child.volatil = true;
  1418. if (parent.nontemporal)
  1419. child.nontemporal = true;
  1420. if (parent.restrict)
  1421. child.restrict = true;
  1422. if (parent.readonly)
  1423. child.readonly = true;
  1424. if (parent.writeonly)
  1425. child.writeonly = true;
  1426. if (parent.nonUniform)
  1427. child.nonUniform = true;
  1428. }
  1429. bool HasNonLayoutQualifiers(const glslang::TType& type, const glslang::TQualifier& qualifier)
  1430. {
  1431. // This should list qualifiers that simultaneous satisfy:
  1432. // - struct members might inherit from a struct declaration
  1433. // (note that non-block structs don't explicitly inherit,
  1434. // only implicitly, meaning no decoration involved)
  1435. // - affect decorations on the struct members
  1436. // (note smooth does not, and expecting something like volatile
  1437. // to effect the whole object)
  1438. // - are not part of the offset/st430/etc or row/column-major layout
  1439. return qualifier.invariant || (qualifier.hasLocation() && type.getBasicType() == glslang::EbtBlock);
  1440. }
  1441. //
  1442. // Implement the TGlslangToSpvTraverser class.
  1443. //
  1444. TGlslangToSpvTraverser::TGlslangToSpvTraverser(unsigned int spvVersion,
  1445. const glslang::TIntermediate* glslangIntermediate,
  1446. spv::SpvBuildLogger* buildLogger, glslang::SpvOptions& options) :
  1447. TIntermTraverser(true, false, true),
  1448. options(options),
  1449. shaderEntry(nullptr), currentFunction(nullptr),
  1450. sequenceDepth(0), logger(buildLogger),
  1451. builder(spvVersion, (glslang::GetKhronosToolId() << 16) | glslang::GetSpirvGeneratorVersion(), logger),
  1452. inEntryPoint(false), entryPointTerminated(false), linkageOnly(false),
  1453. glslangIntermediate(glslangIntermediate),
  1454. nanMinMaxClamp(glslangIntermediate->getNanMinMaxClamp()),
  1455. nonSemanticDebugPrintf(0),
  1456. taskPayloadID(0)
  1457. {
  1458. bool isMeshShaderExt = (glslangIntermediate->getRequestedExtensions().find(glslang::E_GL_EXT_mesh_shader) !=
  1459. glslangIntermediate->getRequestedExtensions().end());
  1460. spv::ExecutionModel executionModel = TranslateExecutionModel(glslangIntermediate->getStage(), isMeshShaderExt);
  1461. builder.clearAccessChain();
  1462. builder.setSource(TranslateSourceLanguage(glslangIntermediate->getSource(), glslangIntermediate->getProfile()),
  1463. glslangIntermediate->getVersion());
  1464. if (options.emitNonSemanticShaderDebugSource)
  1465. this->options.emitNonSemanticShaderDebugInfo = true;
  1466. if (options.emitNonSemanticShaderDebugInfo)
  1467. this->options.generateDebugInfo = true;
  1468. if (this->options.generateDebugInfo) {
  1469. if (this->options.emitNonSemanticShaderDebugInfo) {
  1470. builder.setEmitNonSemanticShaderDebugInfo(this->options.emitNonSemanticShaderDebugSource);
  1471. }
  1472. else {
  1473. builder.setEmitSpirvDebugInfo();
  1474. }
  1475. builder.setDebugMainSourceFile(glslangIntermediate->getSourceFile());
  1476. // Set the source shader's text. If for SPV version 1.0, include
  1477. // a preamble in comments stating the OpModuleProcessed instructions.
  1478. // Otherwise, emit those as actual instructions.
  1479. std::string text;
  1480. const std::vector<std::string>& processes = glslangIntermediate->getProcesses();
  1481. for (int p = 0; p < (int)processes.size(); ++p) {
  1482. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1) {
  1483. text.append("// OpModuleProcessed ");
  1484. text.append(processes[p]);
  1485. text.append("\n");
  1486. } else
  1487. builder.addModuleProcessed(processes[p]);
  1488. }
  1489. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1 && (int)processes.size() > 0)
  1490. text.append("#line 1\n");
  1491. text.append(glslangIntermediate->getSourceText());
  1492. builder.setSourceText(text);
  1493. // Pass name and text for all included files
  1494. const std::map<std::string, std::string>& include_txt = glslangIntermediate->getIncludeText();
  1495. for (auto iItr = include_txt.begin(); iItr != include_txt.end(); ++iItr)
  1496. builder.addInclude(iItr->first, iItr->second);
  1497. }
  1498. builder.setUseReplicatedComposites(glslangIntermediate->usingReplicatedComposites());
  1499. stdBuiltins = builder.import("GLSL.std.450");
  1500. spv::AddressingModel addressingModel = spv::AddressingModel::Logical;
  1501. spv::MemoryModel memoryModel = spv::MemoryModel::GLSL450;
  1502. if (glslangIntermediate->usingPhysicalStorageBuffer()) {
  1503. addressingModel = spv::AddressingModel::PhysicalStorageBuffer64EXT;
  1504. builder.addIncorporatedExtension(spv::E_SPV_KHR_physical_storage_buffer, spv::Spv_1_5);
  1505. builder.addCapability(spv::Capability::PhysicalStorageBufferAddressesEXT);
  1506. }
  1507. if (glslangIntermediate->usingVulkanMemoryModel()) {
  1508. memoryModel = spv::MemoryModel::VulkanKHR;
  1509. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  1510. builder.addIncorporatedExtension(spv::E_SPV_KHR_vulkan_memory_model, spv::Spv_1_5);
  1511. }
  1512. builder.setMemoryModel(addressingModel, memoryModel);
  1513. if (glslangIntermediate->usingVariablePointers()) {
  1514. builder.addCapability(spv::Capability::VariablePointers);
  1515. }
  1516. // If not linking, there is no entry point
  1517. if (!options.compileOnly) {
  1518. shaderEntry = builder.makeEntryPoint(glslangIntermediate->getEntryPointName().c_str());
  1519. entryPoint =
  1520. builder.addEntryPoint(executionModel, shaderEntry, glslangIntermediate->getEntryPointName().c_str());
  1521. }
  1522. // Add the source extensions
  1523. const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();
  1524. for (auto it = sourceExtensions.begin(); it != sourceExtensions.end(); ++it)
  1525. builder.addSourceExtension(it->c_str());
  1526. // Add the top-level modes for this shader.
  1527. if (glslangIntermediate->getXfbMode()) {
  1528. builder.addCapability(spv::Capability::TransformFeedback);
  1529. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Xfb);
  1530. }
  1531. if (glslangIntermediate->getLayoutPrimitiveCulling()) {
  1532. builder.addCapability(spv::Capability::RayTraversalPrimitiveCullingKHR);
  1533. }
  1534. if (glslangIntermediate->getSubgroupUniformControlFlow()) {
  1535. builder.addExtension(spv::E_SPV_KHR_subgroup_uniform_control_flow);
  1536. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::SubgroupUniformControlFlowKHR);
  1537. }
  1538. if (glslangIntermediate->getMaximallyReconverges()) {
  1539. builder.addExtension(spv::E_SPV_KHR_maximal_reconvergence);
  1540. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::MaximallyReconvergesKHR);
  1541. }
  1542. if (glslangIntermediate->getQuadDerivMode())
  1543. {
  1544. builder.addCapability(spv::Capability::QuadControlKHR);
  1545. builder.addExtension(spv::E_SPV_KHR_quad_control);
  1546. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::QuadDerivativesKHR);
  1547. }
  1548. if (glslangIntermediate->getReqFullQuadsMode())
  1549. {
  1550. builder.addCapability(spv::Capability::QuadControlKHR);
  1551. builder.addExtension(spv::E_SPV_KHR_quad_control);
  1552. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::RequireFullQuadsKHR);
  1553. }
  1554. spv::ExecutionMode mode;
  1555. switch (glslangIntermediate->getStage()) {
  1556. case EShLangVertex:
  1557. builder.addCapability(spv::Capability::Shader);
  1558. break;
  1559. case EShLangFragment:
  1560. builder.addCapability(spv::Capability::Shader);
  1561. if (glslangIntermediate->getPixelCenterInteger())
  1562. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PixelCenterInteger);
  1563. if (glslangIntermediate->getOriginUpperLeft())
  1564. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OriginUpperLeft);
  1565. else
  1566. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OriginLowerLeft);
  1567. if (glslangIntermediate->getEarlyFragmentTests())
  1568. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::EarlyFragmentTests);
  1569. if (glslangIntermediate->getEarlyAndLateFragmentTestsAMD())
  1570. {
  1571. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::EarlyAndLateFragmentTestsAMD);
  1572. builder.addExtension(spv::E_SPV_AMD_shader_early_and_late_fragment_tests);
  1573. }
  1574. if (glslangIntermediate->getPostDepthCoverage()) {
  1575. builder.addCapability(spv::Capability::SampleMaskPostDepthCoverage);
  1576. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PostDepthCoverage);
  1577. builder.addExtension(spv::E_SPV_KHR_post_depth_coverage);
  1578. }
  1579. if (glslangIntermediate->getNonCoherentColorAttachmentReadEXT()) {
  1580. builder.addCapability(spv::Capability::TileImageColorReadAccessEXT);
  1581. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentColorAttachmentReadEXT);
  1582. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1583. }
  1584. if (glslangIntermediate->getNonCoherentDepthAttachmentReadEXT()) {
  1585. builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
  1586. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentDepthAttachmentReadEXT);
  1587. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1588. }
  1589. if (glslangIntermediate->getNonCoherentStencilAttachmentReadEXT()) {
  1590. builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
  1591. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentStencilAttachmentReadEXT);
  1592. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1593. }
  1594. if (glslangIntermediate->getNonCoherentTileAttachmentReadQCOM()) {
  1595. builder.addCapability(spv::Capability::TileShadingQCOM);
  1596. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentTileAttachmentReadQCOM);
  1597. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1598. }
  1599. if (glslangIntermediate->isDepthReplacing())
  1600. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DepthReplacing);
  1601. if (glslangIntermediate->isStencilReplacing())
  1602. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::StencilRefReplacingEXT);
  1603. switch(glslangIntermediate->getDepth()) {
  1604. case glslang::EldGreater: mode = spv::ExecutionMode::DepthGreater; break;
  1605. case glslang::EldLess: mode = spv::ExecutionMode::DepthLess; break;
  1606. case glslang::EldUnchanged: mode = spv::ExecutionMode::DepthUnchanged; break;
  1607. default: mode = spv::ExecutionMode::Max; break;
  1608. }
  1609. if (mode != spv::ExecutionMode::Max)
  1610. builder.addExecutionMode(shaderEntry, mode);
  1611. switch (glslangIntermediate->getStencil()) {
  1612. case glslang::ElsRefUnchangedFrontAMD: mode = spv::ExecutionMode::StencilRefUnchangedFrontAMD; break;
  1613. case glslang::ElsRefGreaterFrontAMD: mode = spv::ExecutionMode::StencilRefGreaterFrontAMD; break;
  1614. case glslang::ElsRefLessFrontAMD: mode = spv::ExecutionMode::StencilRefLessFrontAMD; break;
  1615. case glslang::ElsRefUnchangedBackAMD: mode = spv::ExecutionMode::StencilRefUnchangedBackAMD; break;
  1616. case glslang::ElsRefGreaterBackAMD: mode = spv::ExecutionMode::StencilRefGreaterBackAMD; break;
  1617. case glslang::ElsRefLessBackAMD: mode = spv::ExecutionMode::StencilRefLessBackAMD; break;
  1618. default: mode = spv::ExecutionMode::Max; break;
  1619. }
  1620. if (mode != spv::ExecutionMode::Max)
  1621. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1622. switch (glslangIntermediate->getInterlockOrdering()) {
  1623. case glslang::EioPixelInterlockOrdered: mode = spv::ExecutionMode::PixelInterlockOrderedEXT;
  1624. break;
  1625. case glslang::EioPixelInterlockUnordered: mode = spv::ExecutionMode::PixelInterlockUnorderedEXT;
  1626. break;
  1627. case glslang::EioSampleInterlockOrdered: mode = spv::ExecutionMode::SampleInterlockOrderedEXT;
  1628. break;
  1629. case glslang::EioSampleInterlockUnordered: mode = spv::ExecutionMode::SampleInterlockUnorderedEXT;
  1630. break;
  1631. case glslang::EioShadingRateInterlockOrdered: mode = spv::ExecutionMode::ShadingRateInterlockOrderedEXT;
  1632. break;
  1633. case glslang::EioShadingRateInterlockUnordered: mode = spv::ExecutionMode::ShadingRateInterlockUnorderedEXT;
  1634. break;
  1635. default: mode = spv::ExecutionMode::Max;
  1636. break;
  1637. }
  1638. if (mode != spv::ExecutionMode::Max) {
  1639. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1640. if (mode == spv::ExecutionMode::ShadingRateInterlockOrderedEXT ||
  1641. mode == spv::ExecutionMode::ShadingRateInterlockUnorderedEXT) {
  1642. builder.addCapability(spv::Capability::FragmentShaderShadingRateInterlockEXT);
  1643. } else if (mode == spv::ExecutionMode::PixelInterlockOrderedEXT ||
  1644. mode == spv::ExecutionMode::PixelInterlockUnorderedEXT) {
  1645. builder.addCapability(spv::Capability::FragmentShaderPixelInterlockEXT);
  1646. } else {
  1647. builder.addCapability(spv::Capability::FragmentShaderSampleInterlockEXT);
  1648. }
  1649. builder.addExtension(spv::E_SPV_EXT_fragment_shader_interlock);
  1650. }
  1651. break;
  1652. case EShLangCompute: {
  1653. builder.addCapability(spv::Capability::Shader);
  1654. bool needSizeId = false;
  1655. for (int dim = 0; dim < 3; ++dim) {
  1656. if ((glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet)) {
  1657. needSizeId = true;
  1658. break;
  1659. }
  1660. }
  1661. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6 && needSizeId) {
  1662. std::vector<spv::Id> dimConstId;
  1663. for (int dim = 0; dim < 3; ++dim) {
  1664. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  1665. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  1666. if (specConst) {
  1667. builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
  1668. glslangIntermediate->getLocalSizeSpecId(dim));
  1669. needSizeId = true;
  1670. }
  1671. }
  1672. builder.addExecutionModeId(shaderEntry, spv::ExecutionMode::LocalSizeId, dimConstId);
  1673. } else {
  1674. if (glslangIntermediate->getTileShadingRateQCOM(0) >= 1 || glslangIntermediate->getTileShadingRateQCOM(1) >= 1 || glslangIntermediate->getTileShadingRateQCOM(2) >= 1) {
  1675. auto rate_x = glslangIntermediate->getTileShadingRateQCOM(0);
  1676. auto rate_y = glslangIntermediate->getTileShadingRateQCOM(1);
  1677. auto rate_z = glslangIntermediate->getTileShadingRateQCOM(2);
  1678. rate_x = ( rate_x == 0 ? 1 : rate_x );
  1679. rate_y = ( rate_y == 0 ? 1 : rate_y );
  1680. rate_z = ( rate_z == 0 ? 1 : rate_z );
  1681. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::TileShadingRateQCOM, rate_x, rate_y, rate_z);
  1682. } else {
  1683. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::LocalSize, glslangIntermediate->getLocalSize(0),
  1684. glslangIntermediate->getLocalSize(1),
  1685. glslangIntermediate->getLocalSize(2));
  1686. }
  1687. }
  1688. if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupQuads) {
  1689. builder.addCapability(spv::Capability::ComputeDerivativeGroupQuadsNV);
  1690. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DerivativeGroupQuadsNV);
  1691. builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);
  1692. } else if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupLinear) {
  1693. builder.addCapability(spv::Capability::ComputeDerivativeGroupLinearNV);
  1694. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DerivativeGroupLinearNV);
  1695. builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);
  1696. }
  1697. if (glslangIntermediate->getNonCoherentTileAttachmentReadQCOM()) {
  1698. builder.addCapability(spv::Capability::TileShadingQCOM);
  1699. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentTileAttachmentReadQCOM);
  1700. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1701. }
  1702. break;
  1703. }
  1704. case EShLangTessEvaluation:
  1705. case EShLangTessControl:
  1706. builder.addCapability(spv::Capability::Tessellation);
  1707. glslang::TLayoutGeometry primitive;
  1708. if (glslangIntermediate->getStage() == EShLangTessControl) {
  1709. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices,
  1710. glslangIntermediate->getVertices());
  1711. primitive = glslangIntermediate->getOutputPrimitive();
  1712. } else {
  1713. primitive = glslangIntermediate->getInputPrimitive();
  1714. }
  1715. switch (primitive) {
  1716. case glslang::ElgTriangles: mode = spv::ExecutionMode::Triangles; break;
  1717. case glslang::ElgQuads: mode = spv::ExecutionMode::Quads; break;
  1718. case glslang::ElgIsolines: mode = spv::ExecutionMode::Isolines; break;
  1719. default: mode = spv::ExecutionMode::Max; break;
  1720. }
  1721. if (mode != spv::ExecutionMode::Max)
  1722. builder.addExecutionMode(shaderEntry, mode);
  1723. switch (glslangIntermediate->getVertexSpacing()) {
  1724. case glslang::EvsEqual: mode = spv::ExecutionMode::SpacingEqual; break;
  1725. case glslang::EvsFractionalEven: mode = spv::ExecutionMode::SpacingFractionalEven; break;
  1726. case glslang::EvsFractionalOdd: mode = spv::ExecutionMode::SpacingFractionalOdd; break;
  1727. default: mode = spv::ExecutionMode::Max; break;
  1728. }
  1729. if (mode != spv::ExecutionMode::Max)
  1730. builder.addExecutionMode(shaderEntry, mode);
  1731. switch (glslangIntermediate->getVertexOrder()) {
  1732. case glslang::EvoCw: mode = spv::ExecutionMode::VertexOrderCw; break;
  1733. case glslang::EvoCcw: mode = spv::ExecutionMode::VertexOrderCcw; break;
  1734. default: mode = spv::ExecutionMode::Max; break;
  1735. }
  1736. if (mode != spv::ExecutionMode::Max)
  1737. builder.addExecutionMode(shaderEntry, mode);
  1738. if (glslangIntermediate->getPointMode())
  1739. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PointMode);
  1740. break;
  1741. case EShLangGeometry:
  1742. builder.addCapability(spv::Capability::Geometry);
  1743. switch (glslangIntermediate->getInputPrimitive()) {
  1744. case glslang::ElgPoints: mode = spv::ExecutionMode::InputPoints; break;
  1745. case glslang::ElgLines: mode = spv::ExecutionMode::InputLines; break;
  1746. case glslang::ElgLinesAdjacency: mode = spv::ExecutionMode::InputLinesAdjacency; break;
  1747. case glslang::ElgTriangles: mode = spv::ExecutionMode::Triangles; break;
  1748. case glslang::ElgTrianglesAdjacency: mode = spv::ExecutionMode::InputTrianglesAdjacency; break;
  1749. default: mode = spv::ExecutionMode::Max; break;
  1750. }
  1751. if (mode != spv::ExecutionMode::Max)
  1752. builder.addExecutionMode(shaderEntry, mode);
  1753. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Invocations, glslangIntermediate->getInvocations());
  1754. switch (glslangIntermediate->getOutputPrimitive()) {
  1755. case glslang::ElgPoints: mode = spv::ExecutionMode::OutputPoints; break;
  1756. case glslang::ElgLineStrip: mode = spv::ExecutionMode::OutputLineStrip; break;
  1757. case glslang::ElgTriangleStrip: mode = spv::ExecutionMode::OutputTriangleStrip; break;
  1758. default: mode = spv::ExecutionMode::Max; break;
  1759. }
  1760. if (mode != spv::ExecutionMode::Max)
  1761. builder.addExecutionMode(shaderEntry, mode);
  1762. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices, glslangIntermediate->getVertices());
  1763. break;
  1764. case EShLangRayGen:
  1765. case EShLangIntersect:
  1766. case EShLangAnyHit:
  1767. case EShLangClosestHit:
  1768. case EShLangMiss:
  1769. case EShLangCallable:
  1770. {
  1771. auto& extensions = glslangIntermediate->getRequestedExtensions();
  1772. if (extensions.find("GL_EXT_opacity_micromap") != extensions.end()) {
  1773. builder.addCapability(spv::Capability::RayTracingOpacityMicromapEXT);
  1774. builder.addExtension("SPV_EXT_opacity_micromap");
  1775. }
  1776. if (extensions.find("GL_NV_ray_tracing") == extensions.end()) {
  1777. builder.addCapability(spv::Capability::RayTracingKHR);
  1778. builder.addExtension("SPV_KHR_ray_tracing");
  1779. }
  1780. else {
  1781. builder.addCapability(spv::Capability::RayTracingNV);
  1782. builder.addExtension("SPV_NV_ray_tracing");
  1783. }
  1784. if (glslangIntermediate->getStage() != EShLangRayGen && glslangIntermediate->getStage() != EShLangCallable) {
  1785. if (extensions.find("GL_EXT_ray_cull_mask") != extensions.end()) {
  1786. builder.addCapability(spv::Capability::RayCullMaskKHR);
  1787. builder.addExtension("SPV_KHR_ray_cull_mask");
  1788. }
  1789. if (extensions.find("GL_EXT_ray_tracing_position_fetch") != extensions.end()) {
  1790. builder.addCapability(spv::Capability::RayTracingPositionFetchKHR);
  1791. builder.addExtension("SPV_KHR_ray_tracing_position_fetch");
  1792. }
  1793. }
  1794. break;
  1795. }
  1796. case EShLangTask:
  1797. case EShLangMesh:
  1798. if(isMeshShaderExt) {
  1799. builder.addCapability(spv::Capability::MeshShadingEXT);
  1800. builder.addExtension(spv::E_SPV_EXT_mesh_shader);
  1801. } else {
  1802. builder.addCapability(spv::Capability::MeshShadingNV);
  1803. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  1804. }
  1805. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  1806. std::vector<spv::Id> dimConstId;
  1807. for (int dim = 0; dim < 3; ++dim) {
  1808. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  1809. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  1810. if (specConst) {
  1811. builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
  1812. glslangIntermediate->getLocalSizeSpecId(dim));
  1813. }
  1814. }
  1815. builder.addExecutionModeId(shaderEntry, spv::ExecutionMode::LocalSizeId, dimConstId);
  1816. } else {
  1817. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::LocalSize, glslangIntermediate->getLocalSize(0),
  1818. glslangIntermediate->getLocalSize(1),
  1819. glslangIntermediate->getLocalSize(2));
  1820. }
  1821. if (glslangIntermediate->getStage() == EShLangMesh) {
  1822. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices,
  1823. glslangIntermediate->getVertices());
  1824. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputPrimitivesNV,
  1825. glslangIntermediate->getPrimitives());
  1826. switch (glslangIntermediate->getOutputPrimitive()) {
  1827. case glslang::ElgPoints: mode = spv::ExecutionMode::OutputPoints; break;
  1828. case glslang::ElgLines: mode = spv::ExecutionMode::OutputLinesNV; break;
  1829. case glslang::ElgTriangles: mode = spv::ExecutionMode::OutputTrianglesNV; break;
  1830. default: mode = spv::ExecutionMode::Max; break;
  1831. }
  1832. if (mode != spv::ExecutionMode::Max)
  1833. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1834. }
  1835. break;
  1836. default:
  1837. break;
  1838. }
  1839. //
  1840. // Add SPIR-V requirements (GL_EXT_spirv_intrinsics)
  1841. //
  1842. if (glslangIntermediate->hasSpirvRequirement()) {
  1843. const glslang::TSpirvRequirement& spirvRequirement = glslangIntermediate->getSpirvRequirement();
  1844. // Add SPIR-V extension requirement
  1845. for (auto& extension : spirvRequirement.extensions)
  1846. builder.addExtension(extension.c_str());
  1847. // Add SPIR-V capability requirement
  1848. for (auto capability : spirvRequirement.capabilities)
  1849. builder.addCapability(static_cast<spv::Capability>(capability));
  1850. }
  1851. //
  1852. // Add SPIR-V execution mode qualifiers (GL_EXT_spirv_intrinsics)
  1853. //
  1854. if (glslangIntermediate->hasSpirvExecutionMode()) {
  1855. const glslang::TSpirvExecutionMode spirvExecutionMode = glslangIntermediate->getSpirvExecutionMode();
  1856. // Add spirv_execution_mode
  1857. for (auto& mode : spirvExecutionMode.modes) {
  1858. if (!mode.second.empty()) {
  1859. std::vector<unsigned> literals;
  1860. TranslateLiterals(mode.second, literals);
  1861. builder.addExecutionMode(shaderEntry, static_cast<spv::ExecutionMode>(mode.first), literals);
  1862. } else
  1863. builder.addExecutionMode(shaderEntry, static_cast<spv::ExecutionMode>(mode.first));
  1864. }
  1865. // Add spirv_execution_mode_id
  1866. for (auto& modeId : spirvExecutionMode.modeIds) {
  1867. std::vector<spv::Id> operandIds;
  1868. assert(!modeId.second.empty());
  1869. for (auto extraOperand : modeId.second) {
  1870. if (extraOperand->getType().getQualifier().isSpecConstant())
  1871. operandIds.push_back(getSymbolId(extraOperand->getAsSymbolNode()));
  1872. else
  1873. operandIds.push_back(createSpvConstant(*extraOperand));
  1874. }
  1875. builder.addExecutionModeId(shaderEntry, static_cast<spv::ExecutionMode>(modeId.first), operandIds);
  1876. }
  1877. }
  1878. }
  1879. // Finish creating SPV, after the traversal is complete.
  1880. void TGlslangToSpvTraverser::finishSpv(bool compileOnly)
  1881. {
  1882. // If not linking, an entry point is not expected
  1883. if (!compileOnly) {
  1884. // Finish the entry point function
  1885. if (!entryPointTerminated) {
  1886. builder.setBuildPoint(shaderEntry->getLastBlock());
  1887. builder.leaveFunction();
  1888. }
  1889. // finish off the entry-point SPV instruction by adding the Input/Output <id>
  1890. entryPoint->reserveOperands(iOSet.size());
  1891. for (auto id : iOSet)
  1892. entryPoint->addIdOperand(id);
  1893. }
  1894. // Add capabilities, extensions, remove unneeded decorations, etc.,
  1895. // based on the resulting SPIR-V.
  1896. // Note: WebGPU code generation must have the opportunity to aggressively
  1897. // prune unreachable merge blocks and continue targets.
  1898. builder.postProcess(compileOnly);
  1899. }
  1900. // Write the SPV into 'out'.
  1901. void TGlslangToSpvTraverser::dumpSpv(std::vector<unsigned int>& out)
  1902. {
  1903. builder.dump(out);
  1904. }
  1905. //
  1906. // Implement the traversal functions.
  1907. //
  1908. // Return true from interior nodes to have the external traversal
  1909. // continue on to children. Return false if children were
  1910. // already processed.
  1911. //
  1912. //
  1913. // Symbols can turn into
  1914. // - uniform/input reads
  1915. // - output writes
  1916. // - complex lvalue base setups: foo.bar[3].... , where we see foo and start up an access chain
  1917. // - something simple that degenerates into the last bullet
  1918. //
  1919. void TGlslangToSpvTraverser::visitSymbol(glslang::TIntermSymbol* symbol)
  1920. {
  1921. // We update the line information even though no code might be generated here
  1922. // This is helpful to yield correct lines for control flow instructions
  1923. if (!linkageOnly) {
  1924. builder.setDebugSourceLocation(symbol->getLoc().line, symbol->getLoc().getFilename());
  1925. }
  1926. if (symbol->getBasicType() == glslang::EbtFunction) {
  1927. return;
  1928. }
  1929. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  1930. if (symbol->getType().isStruct())
  1931. glslangTypeToIdMap[symbol->getType().getStruct()] = symbol->getId();
  1932. if (symbol->getType().getQualifier().isSpecConstant())
  1933. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  1934. #ifdef ENABLE_HLSL
  1935. // Skip symbol handling if it is string-typed
  1936. if (symbol->getBasicType() == glslang::EbtString)
  1937. return;
  1938. #endif
  1939. // getSymbolId() will set up all the IO decorations on the first call.
  1940. // Formal function parameters were mapped during makeFunctions().
  1941. spv::Id id = getSymbolId(symbol);
  1942. if (symbol->getType().getQualifier().isTaskPayload())
  1943. taskPayloadID = id; // cache the taskPayloadID to be used it as operand for OpEmitMeshTasksEXT
  1944. if (builder.isPointer(id)) {
  1945. if (!symbol->getType().getQualifier().isParamInput() &&
  1946. !symbol->getType().getQualifier().isParamOutput()) {
  1947. // Include all "static use" and "linkage only" interface variables on the OpEntryPoint instruction
  1948. // Consider adding to the OpEntryPoint interface list.
  1949. // Only looking at structures if they have at least one member.
  1950. if (!symbol->getType().isStruct() || symbol->getType().getStruct()->size() > 0) {
  1951. spv::StorageClass sc = builder.getStorageClass(id);
  1952. // Before SPIR-V 1.4, we only want to include Input and Output.
  1953. // Starting with SPIR-V 1.4, we want all globals.
  1954. if ((glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4 && builder.isGlobalVariable(id)) ||
  1955. (sc == spv::StorageClass::Input || sc == spv::StorageClass::Output)) {
  1956. iOSet.insert(id);
  1957. }
  1958. }
  1959. }
  1960. // If the SPIR-V type is required to be different than the AST type
  1961. // (for ex SubgroupMasks or 3x4 ObjectToWorld/WorldToObject matrices),
  1962. // translate now from the SPIR-V type to the AST type, for the consuming
  1963. // operation.
  1964. // Note this turns it from an l-value to an r-value.
  1965. // Currently, all symbols needing this are inputs; avoid the map lookup when non-input.
  1966. if (symbol->getType().getQualifier().storage == glslang::EvqVaryingIn)
  1967. id = translateForcedType(id);
  1968. }
  1969. // Only process non-linkage-only nodes for generating actual static uses
  1970. if (! linkageOnly || symbol->getQualifier().isSpecConstant()) {
  1971. // Prepare to generate code for the access
  1972. // L-value chains will be computed left to right. We're on the symbol now,
  1973. // which is the left-most part of the access chain, so now is "clear" time,
  1974. // followed by setting the base.
  1975. builder.clearAccessChain();
  1976. // For now, we consider all user variables as being in memory, so they are pointers,
  1977. // except for
  1978. // A) R-Value arguments to a function, which are an intermediate object.
  1979. // See comments in handleUserFunctionCall().
  1980. // B) Specialization constants (normal constants don't even come in as a variable),
  1981. // These are also pure R-values.
  1982. // C) R-Values from type translation, see above call to translateForcedType()
  1983. glslang::TQualifier qualifier = symbol->getQualifier();
  1984. if (qualifier.isSpecConstant() || rValueParameters.find(symbol->getId()) != rValueParameters.end() ||
  1985. !builder.isPointerType(builder.getTypeId(id)))
  1986. builder.setAccessChainRValue(id);
  1987. else
  1988. builder.setAccessChainLValue(id);
  1989. }
  1990. #ifdef ENABLE_HLSL
  1991. // Process linkage-only nodes for any special additional interface work.
  1992. if (linkageOnly) {
  1993. if (glslangIntermediate->getHlslFunctionality1()) {
  1994. // Map implicit counter buffers to their originating buffers, which should have been
  1995. // seen by now, given earlier pruning of unused counters, and preservation of order
  1996. // of declaration.
  1997. if (symbol->getType().getQualifier().isUniformOrBuffer()) {
  1998. if (!glslangIntermediate->hasCounterBufferName(symbol->getName())) {
  1999. // Save possible originating buffers for counter buffers, keyed by
  2000. // making the potential counter-buffer name.
  2001. std::string keyName = symbol->getName().c_str();
  2002. keyName = glslangIntermediate->addCounterBufferName(keyName);
  2003. counterOriginator[keyName] = symbol;
  2004. } else {
  2005. // Handle a counter buffer, by finding the saved originating buffer.
  2006. std::string keyName = symbol->getName().c_str();
  2007. auto it = counterOriginator.find(keyName);
  2008. if (it != counterOriginator.end()) {
  2009. id = getSymbolId(it->second);
  2010. if (id != spv::NoResult) {
  2011. spv::Id counterId = getSymbolId(symbol);
  2012. if (counterId != spv::NoResult) {
  2013. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  2014. builder.addDecorationId(id, spv::Decoration::HlslCounterBufferGOOGLE, counterId);
  2015. }
  2016. }
  2017. }
  2018. }
  2019. }
  2020. }
  2021. }
  2022. #endif
  2023. }
  2024. bool TGlslangToSpvTraverser::visitBinary(glslang::TVisit /* visit */, glslang::TIntermBinary* node)
  2025. {
  2026. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2027. if (node->getLeft()->getAsSymbolNode() != nullptr && node->getLeft()->getType().isStruct()) {
  2028. glslangTypeToIdMap[node->getLeft()->getType().getStruct()] = node->getLeft()->getAsSymbolNode()->getId();
  2029. }
  2030. if (node->getRight()->getAsSymbolNode() != nullptr && node->getRight()->getType().isStruct()) {
  2031. glslangTypeToIdMap[node->getRight()->getType().getStruct()] = node->getRight()->getAsSymbolNode()->getId();
  2032. }
  2033. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2034. if (node->getType().getQualifier().isSpecConstant())
  2035. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2036. // First, handle special cases
  2037. switch (node->getOp()) {
  2038. case glslang::EOpAssign:
  2039. case glslang::EOpAddAssign:
  2040. case glslang::EOpSubAssign:
  2041. case glslang::EOpMulAssign:
  2042. case glslang::EOpVectorTimesMatrixAssign:
  2043. case glslang::EOpVectorTimesScalarAssign:
  2044. case glslang::EOpMatrixTimesScalarAssign:
  2045. case glslang::EOpMatrixTimesMatrixAssign:
  2046. case glslang::EOpDivAssign:
  2047. case glslang::EOpModAssign:
  2048. case glslang::EOpAndAssign:
  2049. case glslang::EOpInclusiveOrAssign:
  2050. case glslang::EOpExclusiveOrAssign:
  2051. case glslang::EOpLeftShiftAssign:
  2052. case glslang::EOpRightShiftAssign:
  2053. // A bin-op assign "a += b" means the same thing as "a = a + b"
  2054. // where a is evaluated before b. For a simple assignment, GLSL
  2055. // says to evaluate the left before the right. So, always, left
  2056. // node then right node.
  2057. {
  2058. // get the left l-value, save it away
  2059. builder.clearAccessChain();
  2060. node->getLeft()->traverse(this);
  2061. spv::Builder::AccessChain lValue = builder.getAccessChain();
  2062. // evaluate the right
  2063. builder.clearAccessChain();
  2064. node->getRight()->traverse(this);
  2065. spv::Id rValue = accessChainLoad(node->getRight()->getType());
  2066. // reset line number for assignment
  2067. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2068. if (node->getOp() != glslang::EOpAssign) {
  2069. // the left is also an r-value
  2070. builder.setAccessChain(lValue);
  2071. spv::Id leftRValue = accessChainLoad(node->getLeft()->getType());
  2072. // do the operation
  2073. spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(node->getLeft()->getType());
  2074. coherentFlags |= TranslateCoherent(node->getRight()->getType());
  2075. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2076. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2077. TranslateNonUniformDecoration(coherentFlags) };
  2078. rValue = createBinaryOperation(node->getOp(), decorations,
  2079. convertGlslangToSpvType(node->getType()), leftRValue, rValue,
  2080. node->getType().getBasicType());
  2081. // these all need their counterparts in createBinaryOperation()
  2082. assert(rValue != spv::NoResult);
  2083. }
  2084. // store the result
  2085. builder.setAccessChain(lValue);
  2086. multiTypeStore(node->getLeft()->getType(), rValue);
  2087. // assignments are expressions having an rValue after they are evaluated...
  2088. builder.clearAccessChain();
  2089. builder.setAccessChainRValue(rValue);
  2090. }
  2091. return false;
  2092. case glslang::EOpIndexDirect:
  2093. case glslang::EOpIndexDirectStruct:
  2094. {
  2095. // Structure, array, matrix, or vector indirection with statically known index.
  2096. // Get the left part of the access chain.
  2097. node->getLeft()->traverse(this);
  2098. // Add the next element in the chain
  2099. const int glslangIndex = node->getRight()->getAsConstantUnion()->getConstArray()[0].getIConst();
  2100. if (! node->getLeft()->getType().isArray() &&
  2101. node->getLeft()->getType().isVector() &&
  2102. node->getOp() == glslang::EOpIndexDirect) {
  2103. // Swizzle is uniform so propagate uniform into access chain
  2104. spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(node->getLeft()->getType());
  2105. coherentFlags.nonUniform = 0;
  2106. // This is essentially a hard-coded vector swizzle of size 1,
  2107. // so short circuit the access-chain stuff with a swizzle.
  2108. std::vector<unsigned> swizzle;
  2109. swizzle.push_back(glslangIndex);
  2110. int dummySize;
  2111. builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(node->getLeft()->getType()),
  2112. coherentFlags,
  2113. glslangIntermediate->getBaseAlignmentScalar(
  2114. node->getLeft()->getType(), dummySize));
  2115. } else {
  2116. // Load through a block reference is performed with a dot operator that
  2117. // is mapped to EOpIndexDirectStruct. When we get to the actual reference,
  2118. // do a load and reset the access chain.
  2119. if (node->getLeft()->isReference() &&
  2120. !node->getLeft()->getType().isArray() &&
  2121. node->getOp() == glslang::EOpIndexDirectStruct)
  2122. {
  2123. spv::Id left = accessChainLoad(node->getLeft()->getType());
  2124. builder.clearAccessChain();
  2125. builder.setAccessChainLValue(left);
  2126. }
  2127. int spvIndex = glslangIndex;
  2128. if (node->getLeft()->getBasicType() == glslang::EbtBlock &&
  2129. node->getOp() == glslang::EOpIndexDirectStruct)
  2130. {
  2131. // This may be, e.g., an anonymous block-member selection, which generally need
  2132. // index remapping due to hidden members in anonymous blocks.
  2133. long long glslangId = glslangTypeToIdMap[node->getLeft()->getType().getStruct()];
  2134. if (memberRemapper.find(glslangId) != memberRemapper.end()) {
  2135. std::vector<int>& remapper = memberRemapper[glslangId];
  2136. assert(remapper.size() > 0);
  2137. spvIndex = remapper[glslangIndex];
  2138. }
  2139. }
  2140. // Struct reference propagates uniform lvalue
  2141. spv::Builder::AccessChain::CoherentFlags coherentFlags =
  2142. TranslateCoherent(node->getLeft()->getType());
  2143. coherentFlags.nonUniform = 0;
  2144. // normal case for indexing array or structure or block
  2145. builder.accessChainPush(builder.makeIntConstant(spvIndex),
  2146. coherentFlags,
  2147. node->getLeft()->getType().getBufferReferenceAlignment());
  2148. // Add capabilities here for accessing PointSize and clip/cull distance.
  2149. // We have deferred generation of associated capabilities until now.
  2150. if (node->getLeft()->getType().isStruct() && ! node->getLeft()->getType().isArray())
  2151. declareUseOfStructMember(*(node->getLeft()->getType().getStruct()), glslangIndex);
  2152. }
  2153. }
  2154. return false;
  2155. case glslang::EOpIndexIndirect:
  2156. {
  2157. // Array, matrix, or vector indirection with variable index.
  2158. // Will use native SPIR-V access-chain for and array indirection;
  2159. // matrices are arrays of vectors, so will also work for a matrix.
  2160. // Will use the access chain's 'component' for variable index into a vector.
  2161. // This adapter is building access chains left to right.
  2162. // Set up the access chain to the left.
  2163. node->getLeft()->traverse(this);
  2164. // save it so that computing the right side doesn't trash it
  2165. spv::Builder::AccessChain partial = builder.getAccessChain();
  2166. // compute the next index in the chain
  2167. builder.clearAccessChain();
  2168. node->getRight()->traverse(this);
  2169. spv::Id index = accessChainLoad(node->getRight()->getType());
  2170. addIndirectionIndexCapabilities(node->getLeft()->getType(), node->getRight()->getType());
  2171. // restore the saved access chain
  2172. builder.setAccessChain(partial);
  2173. // Only if index is nonUniform should we propagate nonUniform into access chain
  2174. spv::Builder::AccessChain::CoherentFlags index_flags = TranslateCoherent(node->getRight()->getType());
  2175. spv::Builder::AccessChain::CoherentFlags coherent_flags = TranslateCoherent(node->getLeft()->getType());
  2176. coherent_flags.nonUniform = index_flags.nonUniform;
  2177. if (! node->getLeft()->getType().isArray() && node->getLeft()->getType().isVector()) {
  2178. int dummySize;
  2179. builder.accessChainPushComponent(
  2180. index, convertGlslangToSpvType(node->getLeft()->getType()), coherent_flags,
  2181. glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(),
  2182. dummySize));
  2183. } else
  2184. builder.accessChainPush(index, coherent_flags,
  2185. node->getLeft()->getType().getBufferReferenceAlignment());
  2186. }
  2187. return false;
  2188. case glslang::EOpVectorSwizzle:
  2189. {
  2190. node->getLeft()->traverse(this);
  2191. std::vector<unsigned> swizzle;
  2192. convertSwizzle(*node->getRight()->getAsAggregate(), swizzle);
  2193. int dummySize;
  2194. builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(node->getLeft()->getType()),
  2195. TranslateCoherent(node->getLeft()->getType()),
  2196. glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(),
  2197. dummySize));
  2198. }
  2199. return false;
  2200. case glslang::EOpMatrixSwizzle:
  2201. logger->missingFunctionality("matrix swizzle");
  2202. return true;
  2203. case glslang::EOpLogicalOr:
  2204. case glslang::EOpLogicalAnd:
  2205. {
  2206. // These may require short circuiting, but can sometimes be done as straight
  2207. // binary operations. The right operand must be short circuited if it has
  2208. // side effects, and should probably be if it is complex.
  2209. if (isTrivial(node->getRight()->getAsTyped()))
  2210. break; // handle below as a normal binary operation
  2211. // otherwise, we need to do dynamic short circuiting on the right operand
  2212. spv::Id result = createShortCircuit(node->getOp(), *node->getLeft()->getAsTyped(),
  2213. *node->getRight()->getAsTyped());
  2214. builder.clearAccessChain();
  2215. builder.setAccessChainRValue(result);
  2216. }
  2217. return false;
  2218. default:
  2219. break;
  2220. }
  2221. // Assume generic binary op...
  2222. // get right operand
  2223. builder.clearAccessChain();
  2224. node->getLeft()->traverse(this);
  2225. spv::Id left = accessChainLoad(node->getLeft()->getType());
  2226. // get left operand
  2227. builder.clearAccessChain();
  2228. node->getRight()->traverse(this);
  2229. spv::Id right = accessChainLoad(node->getRight()->getType());
  2230. // get result
  2231. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2232. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2233. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  2234. spv::Id result = createBinaryOperation(node->getOp(), decorations,
  2235. convertGlslangToSpvType(node->getType()), left, right,
  2236. node->getLeft()->getType().getBasicType());
  2237. builder.clearAccessChain();
  2238. if (! result) {
  2239. logger->missingFunctionality("unknown glslang binary operation");
  2240. return true; // pick up a child as the place-holder result
  2241. } else {
  2242. builder.setAccessChainRValue(result);
  2243. return false;
  2244. }
  2245. }
  2246. spv::Id TGlslangToSpvTraverser::convertLoadedBoolInUniformToUint(const glslang::TType& type,
  2247. spv::Id nominalTypeId,
  2248. spv::Id loadedId)
  2249. {
  2250. if (builder.isScalarType(nominalTypeId)) {
  2251. // Conversion for bool
  2252. spv::Id boolType = builder.makeBoolType();
  2253. if (nominalTypeId != boolType)
  2254. return builder.createBinOp(spv::Op::OpINotEqual, boolType, loadedId, builder.makeUintConstant(0));
  2255. } else if (builder.isVectorType(nominalTypeId)) {
  2256. // Conversion for bvec
  2257. int vecSize = builder.getNumTypeComponents(nominalTypeId);
  2258. spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);
  2259. if (nominalTypeId != bvecType)
  2260. loadedId = builder.createBinOp(spv::Op::OpINotEqual, bvecType, loadedId,
  2261. makeSmearedConstant(builder.makeUintConstant(0), vecSize));
  2262. } else if (builder.isArrayType(nominalTypeId)) {
  2263. // Conversion for bool array
  2264. spv::Id boolArrayTypeId = convertGlslangToSpvType(type);
  2265. if (nominalTypeId != boolArrayTypeId)
  2266. {
  2267. // Use OpCopyLogical from SPIR-V 1.4 if available.
  2268. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4)
  2269. return builder.createUnaryOp(spv::Op::OpCopyLogical, boolArrayTypeId, loadedId);
  2270. glslang::TType glslangElementType(type, 0);
  2271. spv::Id elementNominalTypeId = builder.getContainedTypeId(nominalTypeId);
  2272. std::vector<spv::Id> constituents;
  2273. for (int index = 0; index < type.getOuterArraySize(); ++index) {
  2274. // get the element
  2275. spv::Id elementValue = builder.createCompositeExtract(loadedId, elementNominalTypeId, index);
  2276. // recursively convert it
  2277. spv::Id elementConvertedValue = convertLoadedBoolInUniformToUint(glslangElementType, elementNominalTypeId, elementValue);
  2278. constituents.push_back(elementConvertedValue);
  2279. }
  2280. return builder.createCompositeConstruct(boolArrayTypeId, constituents);
  2281. }
  2282. }
  2283. return loadedId;
  2284. }
  2285. // Figure out what, if any, type changes are needed when accessing a specific built-in.
  2286. // Returns <the type SPIR-V requires for declarion, the type to translate to on use>.
  2287. // Also see comment for 'forceType', regarding tracking SPIR-V-required types.
  2288. std::pair<spv::Id, spv::Id> TGlslangToSpvTraverser::getForcedType(glslang::TBuiltInVariable glslangBuiltIn,
  2289. const glslang::TType& glslangType)
  2290. {
  2291. switch(glslangBuiltIn)
  2292. {
  2293. case glslang::EbvSubGroupEqMask:
  2294. case glslang::EbvSubGroupGeMask:
  2295. case glslang::EbvSubGroupGtMask:
  2296. case glslang::EbvSubGroupLeMask:
  2297. case glslang::EbvSubGroupLtMask: {
  2298. // these require changing a 64-bit scaler -> a vector of 32-bit components
  2299. if (glslangType.isVector())
  2300. break;
  2301. spv::Id ivec4_type = builder.makeVectorType(builder.makeUintType(32), 4);
  2302. spv::Id uint64_type = builder.makeUintType(64);
  2303. std::pair<spv::Id, spv::Id> ret(ivec4_type, uint64_type);
  2304. return ret;
  2305. }
  2306. // There are no SPIR-V builtins defined for these and map onto original non-transposed
  2307. // builtins. During visitBinary we insert a transpose
  2308. case glslang::EbvWorldToObject3x4:
  2309. case glslang::EbvObjectToWorld3x4: {
  2310. spv::Id mat43 = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  2311. spv::Id mat34 = builder.makeMatrixType(builder.makeFloatType(32), 3, 4);
  2312. std::pair<spv::Id, spv::Id> ret(mat43, mat34);
  2313. return ret;
  2314. }
  2315. default:
  2316. break;
  2317. }
  2318. std::pair<spv::Id, spv::Id> ret(spv::NoType, spv::NoType);
  2319. return ret;
  2320. }
  2321. // For an object previously identified (see getForcedType() and forceType)
  2322. // as needing type translations, do the translation needed for a load, turning
  2323. // an L-value into in R-value.
  2324. spv::Id TGlslangToSpvTraverser::translateForcedType(spv::Id object)
  2325. {
  2326. const auto forceIt = forceType.find(object);
  2327. if (forceIt == forceType.end())
  2328. return object;
  2329. spv::Id desiredTypeId = forceIt->second;
  2330. spv::Id objectTypeId = builder.getTypeId(object);
  2331. assert(builder.isPointerType(objectTypeId));
  2332. objectTypeId = builder.getContainedTypeId(objectTypeId);
  2333. if (builder.isVectorType(objectTypeId) &&
  2334. builder.getScalarTypeWidth(builder.getContainedTypeId(objectTypeId)) == 32) {
  2335. if (builder.getScalarTypeWidth(desiredTypeId) == 64) {
  2336. // handle 32-bit v.xy* -> 64-bit
  2337. builder.clearAccessChain();
  2338. builder.setAccessChainLValue(object);
  2339. object = builder.accessChainLoad(spv::NoPrecision, spv::Decoration::Max, spv::Decoration::Max, objectTypeId);
  2340. std::vector<spv::Id> components;
  2341. components.push_back(builder.createCompositeExtract(object, builder.getContainedTypeId(objectTypeId), 0));
  2342. components.push_back(builder.createCompositeExtract(object, builder.getContainedTypeId(objectTypeId), 1));
  2343. spv::Id vecType = builder.makeVectorType(builder.getContainedTypeId(objectTypeId), 2);
  2344. return builder.createUnaryOp(spv::Op::OpBitcast, desiredTypeId,
  2345. builder.createCompositeConstruct(vecType, components));
  2346. } else {
  2347. logger->missingFunctionality("forcing 32-bit vector type to non 64-bit scalar");
  2348. }
  2349. } else if (builder.isMatrixType(objectTypeId)) {
  2350. // There are no SPIR-V builtins defined for 3x4 variants of ObjectToWorld/WorldToObject
  2351. // and we insert a transpose after loading the original non-transposed builtins
  2352. builder.clearAccessChain();
  2353. builder.setAccessChainLValue(object);
  2354. object = builder.accessChainLoad(spv::NoPrecision, spv::Decoration::Max, spv::Decoration::Max, objectTypeId);
  2355. return builder.createUnaryOp(spv::Op::OpTranspose, desiredTypeId, object);
  2356. } else {
  2357. logger->missingFunctionality("forcing non 32-bit vector type");
  2358. }
  2359. return object;
  2360. }
  2361. bool TGlslangToSpvTraverser::visitUnary(glslang::TVisit /* visit */, glslang::TIntermUnary* node)
  2362. {
  2363. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2364. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2365. if (node->getType().getQualifier().isSpecConstant())
  2366. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2367. spv::Id result = spv::NoResult;
  2368. // try texturing first
  2369. result = createImageTextureFunctionCall(node);
  2370. if (result != spv::NoResult) {
  2371. builder.clearAccessChain();
  2372. builder.setAccessChainRValue(result);
  2373. return false; // done with this node
  2374. }
  2375. // Non-texturing.
  2376. if (node->getOp() == glslang::EOpArrayLength) {
  2377. // Quite special; won't want to evaluate the operand.
  2378. // Currently, the front-end does not allow .length() on an array until it is sized,
  2379. // except for the last block membeor of an SSBO.
  2380. // TODO: If this changes, link-time sized arrays might show up here, and need their
  2381. // size extracted.
  2382. // Normal .length() would have been constant folded by the front-end.
  2383. // So, this has to be block.lastMember.length().
  2384. // SPV wants "block" and member number as the operands, go get them.
  2385. spv::Id length;
  2386. if (node->getOperand()->getType().isCoopMat()) {
  2387. spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());
  2388. assert(builder.isCooperativeMatrixType(typeId));
  2389. if (node->getOperand()->getType().isCoopMatKHR()) {
  2390. length = builder.createCooperativeMatrixLengthKHR(typeId);
  2391. } else {
  2392. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2393. length = builder.createCooperativeMatrixLengthNV(typeId);
  2394. }
  2395. } else if (node->getOperand()->getType().isCoopVecNV()) {
  2396. spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());
  2397. length = builder.getCooperativeVectorNumComponents(typeId);
  2398. } else {
  2399. glslang::TIntermTyped* block = node->getOperand()->getAsBinaryNode()->getLeft();
  2400. block->traverse(this);
  2401. unsigned int member = node->getOperand()->getAsBinaryNode()->getRight()->getAsConstantUnion()
  2402. ->getConstArray()[0].getUConst();
  2403. length = builder.createArrayLength(builder.accessChainGetLValue(), member);
  2404. }
  2405. // GLSL semantics say the result of .length() is an int, while SPIR-V says
  2406. // signedness must be 0. So, convert from SPIR-V unsigned back to GLSL's
  2407. // AST expectation of a signed result.
  2408. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
  2409. if (builder.isInSpecConstCodeGenMode()) {
  2410. length = builder.createBinOp(spv::Op::OpIAdd, builder.makeIntType(32), length, builder.makeIntConstant(0));
  2411. } else {
  2412. length = builder.createUnaryOp(spv::Op::OpBitcast, builder.makeIntType(32), length);
  2413. }
  2414. }
  2415. builder.clearAccessChain();
  2416. builder.setAccessChainRValue(length);
  2417. return false;
  2418. }
  2419. // Force variable declaration - Debug Mode Only
  2420. if (node->getOp() == glslang::EOpDeclare) {
  2421. builder.clearAccessChain();
  2422. node->getOperand()->traverse(this);
  2423. builder.clearAccessChain();
  2424. return false;
  2425. }
  2426. // Start by evaluating the operand
  2427. // Does it need a swizzle inversion? If so, evaluation is inverted;
  2428. // operate first on the swizzle base, then apply the swizzle.
  2429. spv::Id invertedType = spv::NoType;
  2430. auto resultType = [&invertedType, &node, this](){ return invertedType != spv::NoType ?
  2431. invertedType : convertGlslangToSpvType(node->getType()); };
  2432. if (node->getOp() == glslang::EOpInterpolateAtCentroid)
  2433. invertedType = getInvertedSwizzleType(*node->getOperand());
  2434. builder.clearAccessChain();
  2435. TIntermNode *operandNode;
  2436. if (invertedType != spv::NoType)
  2437. operandNode = node->getOperand()->getAsBinaryNode()->getLeft();
  2438. else
  2439. operandNode = node->getOperand();
  2440. operandNode->traverse(this);
  2441. spv::Id operand = spv::NoResult;
  2442. spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
  2443. const auto hitObjectOpsWithLvalue = [](glslang::TOperator op) {
  2444. switch(op) {
  2445. case glslang::EOpReorderThreadNV:
  2446. case glslang::EOpHitObjectGetCurrentTimeNV:
  2447. case glslang::EOpHitObjectGetHitKindNV:
  2448. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  2449. case glslang::EOpHitObjectGetGeometryIndexNV:
  2450. case glslang::EOpHitObjectGetInstanceIdNV:
  2451. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  2452. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  2453. case glslang::EOpHitObjectGetObjectRayOriginNV:
  2454. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  2455. case glslang::EOpHitObjectGetWorldRayOriginNV:
  2456. case glslang::EOpHitObjectGetWorldToObjectNV:
  2457. case glslang::EOpHitObjectGetObjectToWorldNV:
  2458. case glslang::EOpHitObjectGetRayTMaxNV:
  2459. case glslang::EOpHitObjectGetRayTMinNV:
  2460. case glslang::EOpHitObjectIsEmptyNV:
  2461. case glslang::EOpHitObjectIsHitNV:
  2462. case glslang::EOpHitObjectIsMissNV:
  2463. case glslang::EOpHitObjectRecordEmptyNV:
  2464. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  2465. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  2466. case glslang::EOpHitObjectGetClusterIdNV:
  2467. case glslang::EOpHitObjectGetSpherePositionNV:
  2468. case glslang::EOpHitObjectGetSphereRadiusNV:
  2469. case glslang::EOpHitObjectIsSphereHitNV:
  2470. case glslang::EOpHitObjectIsLSSHitNV:
  2471. return true;
  2472. default:
  2473. return false;
  2474. }
  2475. };
  2476. if (node->getOp() == glslang::EOpAtomicCounterIncrement ||
  2477. node->getOp() == glslang::EOpAtomicCounterDecrement ||
  2478. node->getOp() == glslang::EOpAtomicCounter ||
  2479. (node->getOp() == glslang::EOpInterpolateAtCentroid &&
  2480. glslangIntermediate->getSource() != glslang::EShSourceHlsl) ||
  2481. node->getOp() == glslang::EOpRayQueryProceed ||
  2482. node->getOp() == glslang::EOpRayQueryGetRayTMin ||
  2483. node->getOp() == glslang::EOpRayQueryGetRayFlags ||
  2484. node->getOp() == glslang::EOpRayQueryGetWorldRayOrigin ||
  2485. node->getOp() == glslang::EOpRayQueryGetWorldRayDirection ||
  2486. node->getOp() == glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque ||
  2487. node->getOp() == glslang::EOpRayQueryTerminate ||
  2488. node->getOp() == glslang::EOpRayQueryConfirmIntersection ||
  2489. (node->getOp() == glslang::EOpSpirvInst && operandNode->getAsTyped()->getQualifier().isSpirvByReference()) ||
  2490. hitObjectOpsWithLvalue(node->getOp())) {
  2491. operand = builder.accessChainGetLValue(); // Special case l-value operands
  2492. lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
  2493. lvalueCoherentFlags |= TranslateCoherent(operandNode->getAsTyped()->getType());
  2494. } else if (operandNode->getAsTyped()->getQualifier().isSpirvLiteral()) {
  2495. // Will be translated to a literal value, make a placeholder here
  2496. operand = spv::NoResult;
  2497. } else {
  2498. operand = accessChainLoad(node->getOperand()->getType());
  2499. }
  2500. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2501. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2502. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  2503. // it could be a conversion
  2504. if (! result) {
  2505. result = createConversion(node->getOp(), decorations, resultType(), operand,
  2506. node->getType().getBasicType(), node->getOperand()->getBasicType());
  2507. if (result) {
  2508. if (node->getType().isCoopMatKHR() && node->getOperand()->getAsTyped()->getType().isCoopMatKHR() &&
  2509. !node->getAsTyped()->getType().sameCoopMatUse(node->getOperand()->getAsTyped()->getType())) {
  2510. // Conversions that change use need CapabilityCooperativeMatrixConversionsNV
  2511. builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
  2512. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  2513. }
  2514. }
  2515. }
  2516. // if not, then possibly an operation
  2517. if (! result)
  2518. result = createUnaryOperation(node->getOp(), decorations, resultType(), operand,
  2519. node->getOperand()->getBasicType(), lvalueCoherentFlags, node->getType());
  2520. // it could be attached to a SPIR-V intruction
  2521. if (!result) {
  2522. if (node->getOp() == glslang::EOpSpirvInst) {
  2523. const auto& spirvInst = node->getSpirvInstruction();
  2524. if (spirvInst.set == "") {
  2525. spv::IdImmediate idImmOp = {true, operand};
  2526. if (operandNode->getAsTyped()->getQualifier().isSpirvLiteral()) {
  2527. // Translate the constant to a literal value
  2528. std::vector<unsigned> literals;
  2529. glslang::TVector<const glslang::TIntermConstantUnion*> constants;
  2530. constants.push_back(operandNode->getAsConstantUnion());
  2531. TranslateLiterals(constants, literals);
  2532. idImmOp = {false, literals[0]};
  2533. }
  2534. if (node->getBasicType() == glslang::EbtVoid)
  2535. builder.createNoResultOp(static_cast<spv::Op>(spirvInst.id), {idImmOp});
  2536. else
  2537. result = builder.createOp(static_cast<spv::Op>(spirvInst.id), resultType(), {idImmOp});
  2538. } else {
  2539. result = builder.createBuiltinCall(
  2540. resultType(), spirvInst.set == "GLSL.std.450" ? stdBuiltins : getExtBuiltins(spirvInst.set.c_str()),
  2541. spirvInst.id, {operand});
  2542. }
  2543. if (node->getBasicType() == glslang::EbtVoid)
  2544. return false; // done with this node
  2545. }
  2546. }
  2547. if (result) {
  2548. if (invertedType) {
  2549. result = createInvertedSwizzle(decorations.precision, *node->getOperand(), result);
  2550. decorations.addNonUniform(builder, result);
  2551. }
  2552. builder.clearAccessChain();
  2553. builder.setAccessChainRValue(result);
  2554. return false; // done with this node
  2555. }
  2556. // it must be a special case, check...
  2557. switch (node->getOp()) {
  2558. case glslang::EOpPostIncrement:
  2559. case glslang::EOpPostDecrement:
  2560. case glslang::EOpPreIncrement:
  2561. case glslang::EOpPreDecrement:
  2562. {
  2563. // we need the integer value "1" or the floating point "1.0" to add/subtract
  2564. spv::Id one = 0;
  2565. if (node->getBasicType() == glslang::EbtFloat)
  2566. one = builder.makeFloatConstant(1.0F);
  2567. else if (node->getBasicType() == glslang::EbtDouble)
  2568. one = builder.makeDoubleConstant(1.0);
  2569. else if (node->getBasicType() == glslang::EbtFloat16)
  2570. one = builder.makeFloat16Constant(1.0F);
  2571. else if (node->getBasicType() == glslang::EbtBFloat16)
  2572. one = builder.makeBFloat16Constant(1.0F);
  2573. else if (node->getBasicType() == glslang::EbtFloatE5M2)
  2574. one = builder.makeFloatE5M2Constant(1.0F);
  2575. else if (node->getBasicType() == glslang::EbtFloatE4M3)
  2576. one = builder.makeFloatE4M3Constant(1.0F);
  2577. else if (node->getBasicType() == glslang::EbtInt8 || node->getBasicType() == glslang::EbtUint8)
  2578. one = builder.makeInt8Constant(1);
  2579. else if (node->getBasicType() == glslang::EbtInt16 || node->getBasicType() == glslang::EbtUint16)
  2580. one = builder.makeInt16Constant(1);
  2581. else if (node->getBasicType() == glslang::EbtInt64 || node->getBasicType() == glslang::EbtUint64)
  2582. one = builder.makeInt64Constant(1);
  2583. else
  2584. one = builder.makeIntConstant(1);
  2585. glslang::TOperator op;
  2586. if (node->getOp() == glslang::EOpPreIncrement ||
  2587. node->getOp() == glslang::EOpPostIncrement)
  2588. op = glslang::EOpAdd;
  2589. else
  2590. op = glslang::EOpSub;
  2591. spv::Id result = createBinaryOperation(op, decorations,
  2592. convertGlslangToSpvType(node->getType()), operand, one,
  2593. node->getType().getBasicType());
  2594. assert(result != spv::NoResult);
  2595. // The result of operation is always stored, but conditionally the
  2596. // consumed result. The consumed result is always an r-value.
  2597. builder.accessChainStore(result,
  2598. TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags));
  2599. builder.clearAccessChain();
  2600. if (node->getOp() == glslang::EOpPreIncrement ||
  2601. node->getOp() == glslang::EOpPreDecrement)
  2602. builder.setAccessChainRValue(result);
  2603. else
  2604. builder.setAccessChainRValue(operand);
  2605. }
  2606. return false;
  2607. case glslang::EOpAssumeEXT:
  2608. builder.addCapability(spv::Capability::ExpectAssumeKHR);
  2609. builder.addExtension(spv::E_SPV_KHR_expect_assume);
  2610. builder.createNoResultOp(spv::Op::OpAssumeTrueKHR, operand);
  2611. return false;
  2612. case glslang::EOpEmitStreamVertex:
  2613. builder.createNoResultOp(spv::Op::OpEmitStreamVertex, operand);
  2614. return false;
  2615. case glslang::EOpEndStreamPrimitive:
  2616. builder.createNoResultOp(spv::Op::OpEndStreamPrimitive, operand);
  2617. return false;
  2618. case glslang::EOpRayQueryTerminate:
  2619. builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR, operand);
  2620. return false;
  2621. case glslang::EOpRayQueryConfirmIntersection:
  2622. builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR, operand);
  2623. return false;
  2624. case glslang::EOpReorderThreadNV:
  2625. builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectNV, operand);
  2626. return false;
  2627. case glslang::EOpHitObjectRecordEmptyNV:
  2628. builder.createNoResultOp(spv::Op::OpHitObjectRecordEmptyNV, operand);
  2629. return false;
  2630. case glslang::EOpCreateTensorLayoutNV:
  2631. result = builder.createOp(spv::Op::OpCreateTensorLayoutNV, resultType(), std::vector<spv::Id>{});
  2632. builder.clearAccessChain();
  2633. builder.setAccessChainRValue(result);
  2634. return false;
  2635. case glslang::EOpCreateTensorViewNV:
  2636. result = builder.createOp(spv::Op::OpCreateTensorViewNV, resultType(), std::vector<spv::Id>{});
  2637. builder.clearAccessChain();
  2638. builder.setAccessChainRValue(result);
  2639. return false;
  2640. default:
  2641. logger->missingFunctionality("unknown glslang unary");
  2642. return true; // pick up operand as placeholder result
  2643. }
  2644. }
  2645. // Construct a composite object, recursively copying members if their types don't match
  2646. spv::Id TGlslangToSpvTraverser::createCompositeConstruct(spv::Id resultTypeId, std::vector<spv::Id> constituents)
  2647. {
  2648. for (int c = 0; c < (int)constituents.size(); ++c) {
  2649. spv::Id& constituent = constituents[c];
  2650. spv::Id lType = builder.getContainedTypeId(resultTypeId, c);
  2651. spv::Id rType = builder.getTypeId(constituent);
  2652. if (lType != rType) {
  2653. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  2654. constituent = builder.createUnaryOp(spv::Op::OpCopyLogical, lType, constituent);
  2655. } else if (builder.isStructType(rType)) {
  2656. std::vector<spv::Id> rTypeConstituents;
  2657. int numrTypeConstituents = builder.getNumTypeConstituents(rType);
  2658. for (int i = 0; i < numrTypeConstituents; ++i) {
  2659. rTypeConstituents.push_back(builder.createCompositeExtract(constituent,
  2660. builder.getContainedTypeId(rType, i), i));
  2661. }
  2662. constituents[c] = createCompositeConstruct(lType, rTypeConstituents);
  2663. } else {
  2664. assert(builder.isArrayType(rType));
  2665. std::vector<spv::Id> rTypeConstituents;
  2666. int numrTypeConstituents = builder.getNumTypeConstituents(rType);
  2667. spv::Id elementRType = builder.getContainedTypeId(rType);
  2668. for (int i = 0; i < numrTypeConstituents; ++i) {
  2669. rTypeConstituents.push_back(builder.createCompositeExtract(constituent, elementRType, i));
  2670. }
  2671. constituents[c] = createCompositeConstruct(lType, rTypeConstituents);
  2672. }
  2673. }
  2674. }
  2675. return builder.createCompositeConstruct(resultTypeId, constituents);
  2676. }
  2677. bool TGlslangToSpvTraverser::visitAggregate(glslang::TVisit visit, glslang::TIntermAggregate* node)
  2678. {
  2679. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2680. if (node->getType().getQualifier().isSpecConstant())
  2681. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2682. spv::Id result = spv::NoResult;
  2683. spv::Id invertedType = spv::NoType; // to use to override the natural type of the node
  2684. std::vector<spv::Builder::AccessChain> complexLvalues; // for holding swizzling l-values too complex for
  2685. // SPIR-V, for an out parameter
  2686. std::vector<spv::Id> temporaryLvalues; // temporaries to pass, as proxies for complexLValues
  2687. auto resultType = [&invertedType, &node, this](){
  2688. if (invertedType != spv::NoType) {
  2689. return invertedType;
  2690. } else {
  2691. auto ret = convertGlslangToSpvType(node->getType());
  2692. // convertGlslangToSpvType may clobber the debug location, reset it
  2693. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2694. return ret;
  2695. }
  2696. };
  2697. // try texturing
  2698. result = createImageTextureFunctionCall(node);
  2699. if (result != spv::NoResult) {
  2700. builder.clearAccessChain();
  2701. builder.setAccessChainRValue(result);
  2702. return false;
  2703. } else if (node->getOp() == glslang::EOpImageStore ||
  2704. node->getOp() == glslang::EOpImageStoreLod ||
  2705. node->getOp() == glslang::EOpImageAtomicStore) {
  2706. // "imageStore" is a special case, which has no result
  2707. return false;
  2708. }
  2709. glslang::TOperator binOp = glslang::EOpNull;
  2710. bool reduceComparison = true;
  2711. bool isMatrix = false;
  2712. bool noReturnValue = false;
  2713. bool atomic = false;
  2714. spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
  2715. assert(node->getOp());
  2716. spv::Decoration precision = TranslatePrecisionDecoration(node->getOperationPrecision());
  2717. switch (node->getOp()) {
  2718. case glslang::EOpScope:
  2719. case glslang::EOpSequence:
  2720. {
  2721. if (visit == glslang::EvPreVisit) {
  2722. ++sequenceDepth;
  2723. if (sequenceDepth == 1) {
  2724. // If this is the parent node of all the functions, we want to see them
  2725. // early, so all call points have actual SPIR-V functions to reference.
  2726. // In all cases, still let the traverser visit the children for us.
  2727. makeFunctions(node->getAsAggregate()->getSequence());
  2728. // Global initializers is specific to the shader entry point, which does not exist in compile-only mode
  2729. if (!options.compileOnly) {
  2730. // Also, we want all globals initializers to go into the beginning of the entry point, before
  2731. // anything else gets there, so visit out of order, doing them all now.
  2732. makeGlobalInitializers(node->getAsAggregate()->getSequence());
  2733. }
  2734. //Pre process linker objects for ray tracing stages
  2735. if (glslangIntermediate->isRayTracingStage())
  2736. collectRayTracingLinkerObjects();
  2737. // Initializers are done, don't want to visit again, but functions and link objects need to be processed,
  2738. // so do them manually.
  2739. visitFunctions(node->getAsAggregate()->getSequence());
  2740. return false;
  2741. } else {
  2742. if (node->getOp() == glslang::EOpScope) {
  2743. auto loc = node->getLoc();
  2744. builder.enterLexicalBlock(loc.line, loc.column);
  2745. }
  2746. }
  2747. } else {
  2748. if (sequenceDepth > 1 && node->getOp() == glslang::EOpScope)
  2749. builder.leaveLexicalBlock();
  2750. --sequenceDepth;
  2751. }
  2752. return true;
  2753. }
  2754. case glslang::EOpLinkerObjects:
  2755. {
  2756. if (visit == glslang::EvPreVisit)
  2757. linkageOnly = true;
  2758. else
  2759. linkageOnly = false;
  2760. return true;
  2761. }
  2762. case glslang::EOpComma:
  2763. {
  2764. // processing from left to right naturally leaves the right-most
  2765. // lying around in the access chain
  2766. glslang::TIntermSequence& glslangOperands = node->getSequence();
  2767. for (int i = 0; i < (int)glslangOperands.size(); ++i)
  2768. glslangOperands[i]->traverse(this);
  2769. return false;
  2770. }
  2771. case glslang::EOpFunction:
  2772. if (visit == glslang::EvPreVisit) {
  2773. if (options.generateDebugInfo) {
  2774. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2775. }
  2776. if (isShaderEntryPoint(node)) {
  2777. inEntryPoint = true;
  2778. builder.setBuildPoint(shaderEntry->getLastBlock());
  2779. builder.enterFunction(shaderEntry);
  2780. currentFunction = shaderEntry;
  2781. } else {
  2782. handleFunctionEntry(node);
  2783. }
  2784. if (options.generateDebugInfo && !options.emitNonSemanticShaderDebugInfo) {
  2785. const auto& loc = node->getLoc();
  2786. const char* sourceFileName = loc.getFilename();
  2787. spv::Id sourceFileId = sourceFileName ? builder.getStringId(sourceFileName) : builder.getMainFileId();
  2788. currentFunction->setDebugLineInfo(sourceFileId, loc.line, loc.column);
  2789. }
  2790. } else {
  2791. if (options.generateDebugInfo) {
  2792. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl && node->getSequence().size() > 1) {
  2793. auto endLoc = node->getSequence()[1]->getAsAggregate()->getEndLoc();
  2794. builder.setDebugSourceLocation(endLoc.line, endLoc.getFilename());
  2795. }
  2796. }
  2797. if (inEntryPoint)
  2798. entryPointTerminated = true;
  2799. builder.leaveFunction();
  2800. inEntryPoint = false;
  2801. }
  2802. return true;
  2803. case glslang::EOpParameters:
  2804. // Parameters will have been consumed by EOpFunction processing, but not
  2805. // the body, so we still visited the function node's children, making this
  2806. // child redundant.
  2807. return false;
  2808. case glslang::EOpFunctionCall:
  2809. {
  2810. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2811. if (node->isUserDefined())
  2812. result = handleUserFunctionCall(node);
  2813. if (result) {
  2814. builder.clearAccessChain();
  2815. builder.setAccessChainRValue(result);
  2816. } else
  2817. logger->missingFunctionality("missing user function; linker needs to catch that");
  2818. return false;
  2819. }
  2820. case glslang::EOpConstructMat2x2:
  2821. case glslang::EOpConstructMat2x3:
  2822. case glslang::EOpConstructMat2x4:
  2823. case glslang::EOpConstructMat3x2:
  2824. case glslang::EOpConstructMat3x3:
  2825. case glslang::EOpConstructMat3x4:
  2826. case glslang::EOpConstructMat4x2:
  2827. case glslang::EOpConstructMat4x3:
  2828. case glslang::EOpConstructMat4x4:
  2829. case glslang::EOpConstructDMat2x2:
  2830. case glslang::EOpConstructDMat2x3:
  2831. case glslang::EOpConstructDMat2x4:
  2832. case glslang::EOpConstructDMat3x2:
  2833. case glslang::EOpConstructDMat3x3:
  2834. case glslang::EOpConstructDMat3x4:
  2835. case glslang::EOpConstructDMat4x2:
  2836. case glslang::EOpConstructDMat4x3:
  2837. case glslang::EOpConstructDMat4x4:
  2838. case glslang::EOpConstructIMat2x2:
  2839. case glslang::EOpConstructIMat2x3:
  2840. case glslang::EOpConstructIMat2x4:
  2841. case glslang::EOpConstructIMat3x2:
  2842. case glslang::EOpConstructIMat3x3:
  2843. case glslang::EOpConstructIMat3x4:
  2844. case glslang::EOpConstructIMat4x2:
  2845. case glslang::EOpConstructIMat4x3:
  2846. case glslang::EOpConstructIMat4x4:
  2847. case glslang::EOpConstructUMat2x2:
  2848. case glslang::EOpConstructUMat2x3:
  2849. case glslang::EOpConstructUMat2x4:
  2850. case glslang::EOpConstructUMat3x2:
  2851. case glslang::EOpConstructUMat3x3:
  2852. case glslang::EOpConstructUMat3x4:
  2853. case glslang::EOpConstructUMat4x2:
  2854. case glslang::EOpConstructUMat4x3:
  2855. case glslang::EOpConstructUMat4x4:
  2856. case glslang::EOpConstructBMat2x2:
  2857. case glslang::EOpConstructBMat2x3:
  2858. case glslang::EOpConstructBMat2x4:
  2859. case glslang::EOpConstructBMat3x2:
  2860. case glslang::EOpConstructBMat3x3:
  2861. case glslang::EOpConstructBMat3x4:
  2862. case glslang::EOpConstructBMat4x2:
  2863. case glslang::EOpConstructBMat4x3:
  2864. case glslang::EOpConstructBMat4x4:
  2865. case glslang::EOpConstructF16Mat2x2:
  2866. case glslang::EOpConstructF16Mat2x3:
  2867. case glslang::EOpConstructF16Mat2x4:
  2868. case glslang::EOpConstructF16Mat3x2:
  2869. case glslang::EOpConstructF16Mat3x3:
  2870. case glslang::EOpConstructF16Mat3x4:
  2871. case glslang::EOpConstructF16Mat4x2:
  2872. case glslang::EOpConstructF16Mat4x3:
  2873. case glslang::EOpConstructF16Mat4x4:
  2874. isMatrix = true;
  2875. [[fallthrough]];
  2876. case glslang::EOpConstructFloat:
  2877. case glslang::EOpConstructVec2:
  2878. case glslang::EOpConstructVec3:
  2879. case glslang::EOpConstructVec4:
  2880. case glslang::EOpConstructDouble:
  2881. case glslang::EOpConstructDVec2:
  2882. case glslang::EOpConstructDVec3:
  2883. case glslang::EOpConstructDVec4:
  2884. case glslang::EOpConstructFloat16:
  2885. case glslang::EOpConstructF16Vec2:
  2886. case glslang::EOpConstructF16Vec3:
  2887. case glslang::EOpConstructF16Vec4:
  2888. case glslang::EOpConstructBFloat16:
  2889. case glslang::EOpConstructBF16Vec2:
  2890. case glslang::EOpConstructBF16Vec3:
  2891. case glslang::EOpConstructBF16Vec4:
  2892. case glslang::EOpConstructFloatE5M2:
  2893. case glslang::EOpConstructFloatE5M2Vec2:
  2894. case glslang::EOpConstructFloatE5M2Vec3:
  2895. case glslang::EOpConstructFloatE5M2Vec4:
  2896. case glslang::EOpConstructFloatE4M3:
  2897. case glslang::EOpConstructFloatE4M3Vec2:
  2898. case glslang::EOpConstructFloatE4M3Vec3:
  2899. case glslang::EOpConstructFloatE4M3Vec4:
  2900. case glslang::EOpConstructBool:
  2901. case glslang::EOpConstructBVec2:
  2902. case glslang::EOpConstructBVec3:
  2903. case glslang::EOpConstructBVec4:
  2904. case glslang::EOpConstructInt8:
  2905. case glslang::EOpConstructI8Vec2:
  2906. case glslang::EOpConstructI8Vec3:
  2907. case glslang::EOpConstructI8Vec4:
  2908. case glslang::EOpConstructUint8:
  2909. case glslang::EOpConstructU8Vec2:
  2910. case glslang::EOpConstructU8Vec3:
  2911. case glslang::EOpConstructU8Vec4:
  2912. case glslang::EOpConstructInt16:
  2913. case glslang::EOpConstructI16Vec2:
  2914. case glslang::EOpConstructI16Vec3:
  2915. case glslang::EOpConstructI16Vec4:
  2916. case glslang::EOpConstructUint16:
  2917. case glslang::EOpConstructU16Vec2:
  2918. case glslang::EOpConstructU16Vec3:
  2919. case glslang::EOpConstructU16Vec4:
  2920. case glslang::EOpConstructInt:
  2921. case glslang::EOpConstructIVec2:
  2922. case glslang::EOpConstructIVec3:
  2923. case glslang::EOpConstructIVec4:
  2924. case glslang::EOpConstructUint:
  2925. case glslang::EOpConstructUVec2:
  2926. case glslang::EOpConstructUVec3:
  2927. case glslang::EOpConstructUVec4:
  2928. case glslang::EOpConstructInt64:
  2929. case glslang::EOpConstructI64Vec2:
  2930. case glslang::EOpConstructI64Vec3:
  2931. case glslang::EOpConstructI64Vec4:
  2932. case glslang::EOpConstructUint64:
  2933. case glslang::EOpConstructU64Vec2:
  2934. case glslang::EOpConstructU64Vec3:
  2935. case glslang::EOpConstructU64Vec4:
  2936. case glslang::EOpConstructStruct:
  2937. case glslang::EOpConstructTextureSampler:
  2938. case glslang::EOpConstructReference:
  2939. case glslang::EOpConstructCooperativeMatrixNV:
  2940. case glslang::EOpConstructCooperativeMatrixKHR:
  2941. case glslang::EOpConstructCooperativeVectorNV:
  2942. case glslang::EOpConstructSaturated:
  2943. {
  2944. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2945. std::vector<spv::Id> arguments;
  2946. translateArguments(*node, arguments, lvalueCoherentFlags);
  2947. spv::Id constructed;
  2948. if (node->getOp() == glslang::EOpConstructTextureSampler) {
  2949. const glslang::TType& texType = node->getSequence()[0]->getAsTyped()->getType();
  2950. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6 &&
  2951. texType.getSampler().isBuffer()) {
  2952. // SamplerBuffer is not supported in spirv1.6 so
  2953. // `samplerBuffer(textureBuffer, sampler)` is a no-op
  2954. // and textureBuffer is the result going forward
  2955. constructed = arguments[0];
  2956. } else
  2957. constructed = builder.createOp(spv::Op::OpSampledImage, resultType(), arguments);
  2958. } else if (node->getOp() == glslang::EOpConstructCooperativeMatrixKHR &&
  2959. node->getType().isCoopMatKHR() && node->getSequence()[0]->getAsTyped()->getType().isCoopMatKHR()) {
  2960. builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
  2961. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  2962. constructed = builder.createCooperativeMatrixConversion(resultType(), arguments[0]);
  2963. } else if (node->getOp() == glslang::EOpConstructCooperativeVectorNV &&
  2964. arguments.size() == 1 &&
  2965. builder.getTypeId(arguments[0]) == resultType()) {
  2966. constructed = arguments[0];
  2967. } else if (node->getOp() == glslang::EOpConstructStruct ||
  2968. node->getOp() == glslang::EOpConstructCooperativeMatrixNV ||
  2969. node->getOp() == glslang::EOpConstructCooperativeMatrixKHR ||
  2970. node->getType().isArray() ||
  2971. // Handle constructing coopvec from one component here, to avoid the component
  2972. // getting smeared
  2973. (node->getOp() == glslang::EOpConstructCooperativeVectorNV && arguments.size() == 1 && builder.isScalar(arguments[0]))) {
  2974. std::vector<spv::Id> constituents;
  2975. for (int c = 0; c < (int)arguments.size(); ++c)
  2976. constituents.push_back(arguments[c]);
  2977. constructed = createCompositeConstruct(resultType(), constituents);
  2978. } else if (isMatrix)
  2979. constructed = builder.createMatrixConstructor(precision, arguments, resultType());
  2980. else if (node->getOp() == glslang::EOpConstructSaturated) {
  2981. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2982. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2983. TranslateNonUniformDecoration(lvalueCoherentFlags) };
  2984. constructed = createConversion(node->getOp(), decorations, resultType(), arguments[1],
  2985. node->getType().getBasicType(), node->getSequence()[1]->getAsTyped()->getBasicType());
  2986. builder.addDecoration(constructed, spv::Decoration::SaturatedToLargestFloat8NormalConversionEXT);
  2987. builder.createStore(constructed, arguments[0]);
  2988. }
  2989. else
  2990. constructed = builder.createConstructor(precision, arguments, resultType());
  2991. if (node->getType().getQualifier().isNonUniform()) {
  2992. builder.addDecoration(constructed, spv::Decoration::NonUniformEXT);
  2993. }
  2994. builder.clearAccessChain();
  2995. builder.setAccessChainRValue(constructed);
  2996. return false;
  2997. }
  2998. // These six are component-wise compares with component-wise results.
  2999. // Forward on to createBinaryOperation(), requesting a vector result.
  3000. case glslang::EOpLessThan:
  3001. case glslang::EOpGreaterThan:
  3002. case glslang::EOpLessThanEqual:
  3003. case glslang::EOpGreaterThanEqual:
  3004. case glslang::EOpVectorEqual:
  3005. case glslang::EOpVectorNotEqual:
  3006. {
  3007. // Map the operation to a binary
  3008. binOp = node->getOp();
  3009. reduceComparison = false;
  3010. switch (node->getOp()) {
  3011. case glslang::EOpVectorEqual: binOp = glslang::EOpVectorEqual; break;
  3012. case glslang::EOpVectorNotEqual: binOp = glslang::EOpVectorNotEqual; break;
  3013. default: binOp = node->getOp(); break;
  3014. }
  3015. break;
  3016. }
  3017. case glslang::EOpMul:
  3018. // component-wise matrix multiply
  3019. binOp = glslang::EOpMul;
  3020. break;
  3021. case glslang::EOpOuterProduct:
  3022. // two vectors multiplied to make a matrix
  3023. binOp = glslang::EOpOuterProduct;
  3024. break;
  3025. case glslang::EOpDot:
  3026. {
  3027. // for scalar dot product, use multiply
  3028. glslang::TIntermSequence& glslangOperands = node->getSequence();
  3029. if (glslangOperands[0]->getAsTyped()->getVectorSize() == 1)
  3030. binOp = glslang::EOpMul;
  3031. break;
  3032. }
  3033. case glslang::EOpMod:
  3034. // when an aggregate, this is the floating-point mod built-in function,
  3035. // which can be emitted by the one in createBinaryOperation()
  3036. binOp = glslang::EOpMod;
  3037. break;
  3038. case glslang::EOpEmitVertex:
  3039. case glslang::EOpEndPrimitive:
  3040. case glslang::EOpBarrier:
  3041. case glslang::EOpMemoryBarrier:
  3042. case glslang::EOpMemoryBarrierAtomicCounter:
  3043. case glslang::EOpMemoryBarrierBuffer:
  3044. case glslang::EOpMemoryBarrierImage:
  3045. case glslang::EOpMemoryBarrierShared:
  3046. case glslang::EOpGroupMemoryBarrier:
  3047. case glslang::EOpDeviceMemoryBarrier:
  3048. case glslang::EOpAllMemoryBarrierWithGroupSync:
  3049. case glslang::EOpDeviceMemoryBarrierWithGroupSync:
  3050. case glslang::EOpWorkgroupMemoryBarrier:
  3051. case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:
  3052. case glslang::EOpSubgroupBarrier:
  3053. case glslang::EOpSubgroupMemoryBarrier:
  3054. case glslang::EOpSubgroupMemoryBarrierBuffer:
  3055. case glslang::EOpSubgroupMemoryBarrierImage:
  3056. case glslang::EOpSubgroupMemoryBarrierShared:
  3057. noReturnValue = true;
  3058. // These all have 0 operands and will naturally finish up in the code below for 0 operands
  3059. break;
  3060. case glslang::EOpAtomicAdd:
  3061. case glslang::EOpAtomicSubtract:
  3062. case glslang::EOpAtomicMin:
  3063. case glslang::EOpAtomicMax:
  3064. case glslang::EOpAtomicAnd:
  3065. case glslang::EOpAtomicOr:
  3066. case glslang::EOpAtomicXor:
  3067. case glslang::EOpAtomicExchange:
  3068. case glslang::EOpAtomicCompSwap:
  3069. atomic = true;
  3070. break;
  3071. case glslang::EOpAtomicStore:
  3072. noReturnValue = true;
  3073. [[fallthrough]];
  3074. case glslang::EOpAtomicLoad:
  3075. atomic = true;
  3076. break;
  3077. case glslang::EOpAtomicCounterAdd:
  3078. case glslang::EOpAtomicCounterSubtract:
  3079. case glslang::EOpAtomicCounterMin:
  3080. case glslang::EOpAtomicCounterMax:
  3081. case glslang::EOpAtomicCounterAnd:
  3082. case glslang::EOpAtomicCounterOr:
  3083. case glslang::EOpAtomicCounterXor:
  3084. case glslang::EOpAtomicCounterExchange:
  3085. case glslang::EOpAtomicCounterCompSwap:
  3086. builder.addExtension("SPV_KHR_shader_atomic_counter_ops");
  3087. builder.addCapability(spv::Capability::AtomicStorageOps);
  3088. atomic = true;
  3089. break;
  3090. case glslang::EOpAbsDifference:
  3091. case glslang::EOpAddSaturate:
  3092. case glslang::EOpSubSaturate:
  3093. case glslang::EOpAverage:
  3094. case glslang::EOpAverageRounded:
  3095. case glslang::EOpMul32x16:
  3096. builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
  3097. builder.addExtension("SPV_INTEL_shader_integer_functions2");
  3098. binOp = node->getOp();
  3099. break;
  3100. case glslang::EOpExpectEXT:
  3101. builder.addCapability(spv::Capability::ExpectAssumeKHR);
  3102. builder.addExtension(spv::E_SPV_KHR_expect_assume);
  3103. binOp = node->getOp();
  3104. break;
  3105. case glslang::EOpIgnoreIntersectionNV:
  3106. case glslang::EOpTerminateRayNV:
  3107. case glslang::EOpTraceNV:
  3108. case glslang::EOpTraceRayMotionNV:
  3109. case glslang::EOpTraceKHR:
  3110. case glslang::EOpExecuteCallableNV:
  3111. case glslang::EOpExecuteCallableKHR:
  3112. case glslang::EOpWritePackedPrimitiveIndices4x8NV:
  3113. case glslang::EOpEmitMeshTasksEXT:
  3114. case glslang::EOpSetMeshOutputsEXT:
  3115. noReturnValue = true;
  3116. break;
  3117. case glslang::EOpRayQueryInitialize:
  3118. case glslang::EOpRayQueryTerminate:
  3119. case glslang::EOpRayQueryGenerateIntersection:
  3120. case glslang::EOpRayQueryConfirmIntersection:
  3121. builder.addExtension("SPV_KHR_ray_query");
  3122. builder.addCapability(spv::Capability::RayQueryKHR);
  3123. noReturnValue = true;
  3124. break;
  3125. case glslang::EOpRayQueryProceed:
  3126. case glslang::EOpRayQueryGetIntersectionType:
  3127. case glslang::EOpRayQueryGetRayTMin:
  3128. case glslang::EOpRayQueryGetRayFlags:
  3129. case glslang::EOpRayQueryGetIntersectionT:
  3130. case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
  3131. case glslang::EOpRayQueryGetIntersectionInstanceId:
  3132. case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
  3133. case glslang::EOpRayQueryGetIntersectionGeometryIndex:
  3134. case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
  3135. case glslang::EOpRayQueryGetIntersectionBarycentrics:
  3136. case glslang::EOpRayQueryGetIntersectionFrontFace:
  3137. case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
  3138. case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
  3139. case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
  3140. case glslang::EOpRayQueryGetWorldRayDirection:
  3141. case glslang::EOpRayQueryGetWorldRayOrigin:
  3142. case glslang::EOpRayQueryGetIntersectionObjectToWorld:
  3143. case glslang::EOpRayQueryGetIntersectionWorldToObject:
  3144. builder.addExtension("SPV_KHR_ray_query");
  3145. builder.addCapability(spv::Capability::RayQueryKHR);
  3146. break;
  3147. case glslang::EOpCooperativeMatrixLoad:
  3148. case glslang::EOpCooperativeMatrixStore:
  3149. case glslang::EOpCooperativeMatrixLoadNV:
  3150. case glslang::EOpCooperativeMatrixStoreNV:
  3151. case glslang::EOpCooperativeMatrixLoadTensorNV:
  3152. case glslang::EOpCooperativeMatrixStoreTensorNV:
  3153. case glslang::EOpCooperativeMatrixReduceNV:
  3154. case glslang::EOpCooperativeMatrixPerElementOpNV:
  3155. case glslang::EOpCooperativeMatrixTransposeNV:
  3156. case glslang::EOpCooperativeVectorMatMulNV:
  3157. case glslang::EOpCooperativeVectorMatMulAddNV:
  3158. case glslang::EOpCooperativeVectorLoadNV:
  3159. case glslang::EOpCooperativeVectorStoreNV:
  3160. case glslang::EOpCooperativeVectorOuterProductAccumulateNV:
  3161. case glslang::EOpCooperativeVectorReduceSumAccumulateNV:
  3162. noReturnValue = true;
  3163. break;
  3164. case glslang::EOpBeginInvocationInterlock:
  3165. case glslang::EOpEndInvocationInterlock:
  3166. builder.addExtension(spv::E_SPV_EXT_fragment_shader_interlock);
  3167. noReturnValue = true;
  3168. break;
  3169. case glslang::EOpHitObjectTraceRayNV:
  3170. case glslang::EOpHitObjectTraceRayMotionNV:
  3171. case glslang::EOpHitObjectGetAttributesNV:
  3172. case glslang::EOpHitObjectExecuteShaderNV:
  3173. case glslang::EOpHitObjectRecordEmptyNV:
  3174. case glslang::EOpHitObjectRecordMissNV:
  3175. case glslang::EOpHitObjectRecordMissMotionNV:
  3176. case glslang::EOpHitObjectRecordHitNV:
  3177. case glslang::EOpHitObjectRecordHitMotionNV:
  3178. case glslang::EOpHitObjectRecordHitWithIndexNV:
  3179. case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
  3180. case glslang::EOpReorderThreadNV:
  3181. noReturnValue = true;
  3182. [[fallthrough]];
  3183. case glslang::EOpHitObjectIsEmptyNV:
  3184. case glslang::EOpHitObjectIsMissNV:
  3185. case glslang::EOpHitObjectIsHitNV:
  3186. case glslang::EOpHitObjectGetRayTMinNV:
  3187. case glslang::EOpHitObjectGetRayTMaxNV:
  3188. case glslang::EOpHitObjectGetObjectRayOriginNV:
  3189. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  3190. case glslang::EOpHitObjectGetWorldRayOriginNV:
  3191. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  3192. case glslang::EOpHitObjectGetObjectToWorldNV:
  3193. case glslang::EOpHitObjectGetWorldToObjectNV:
  3194. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  3195. case glslang::EOpHitObjectGetInstanceIdNV:
  3196. case glslang::EOpHitObjectGetGeometryIndexNV:
  3197. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  3198. case glslang::EOpHitObjectGetHitKindNV:
  3199. case glslang::EOpHitObjectGetCurrentTimeNV:
  3200. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  3201. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  3202. builder.addExtension(spv::E_SPV_NV_shader_invocation_reorder);
  3203. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  3204. break;
  3205. case glslang::EOpHitObjectGetLSSPositionsNV:
  3206. case glslang::EOpHitObjectGetLSSRadiiNV:
  3207. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3208. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  3209. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3210. noReturnValue = true;
  3211. break;
  3212. case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
  3213. case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
  3214. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3215. builder.addCapability(spv::Capability::RayQueryKHR);
  3216. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3217. noReturnValue = true;
  3218. break;
  3219. case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
  3220. case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
  3221. case glslang::EOpRayQueryIsSphereHitNV:
  3222. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3223. builder.addCapability(spv::Capability::RayQueryKHR);
  3224. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  3225. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3226. break;
  3227. case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
  3228. case glslang::EOpRayQueryIsLSSHitNV:
  3229. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3230. builder.addCapability(spv::Capability::RayQueryKHR);
  3231. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3232. break;
  3233. case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
  3234. builder.addExtension(spv::E_SPV_KHR_ray_tracing_position_fetch);
  3235. builder.addCapability(spv::Capability::RayQueryPositionFetchKHR);
  3236. noReturnValue = true;
  3237. break;
  3238. case glslang::EOpImageSampleWeightedQCOM:
  3239. builder.addCapability(spv::Capability::TextureSampleWeightedQCOM);
  3240. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3241. break;
  3242. case glslang::EOpImageBoxFilterQCOM:
  3243. builder.addCapability(spv::Capability::TextureBoxFilterQCOM);
  3244. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3245. break;
  3246. case glslang::EOpImageBlockMatchSADQCOM:
  3247. case glslang::EOpImageBlockMatchSSDQCOM:
  3248. builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
  3249. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3250. break;
  3251. case glslang::EOpTensorWriteARM:
  3252. noReturnValue = true;
  3253. break;
  3254. case glslang::EOpImageBlockMatchWindowSSDQCOM:
  3255. case glslang::EOpImageBlockMatchWindowSADQCOM:
  3256. builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
  3257. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3258. builder.addCapability(spv::Capability::TextureBlockMatch2QCOM);
  3259. builder.addExtension(spv::E_SPV_QCOM_image_processing2);
  3260. break;
  3261. case glslang::EOpImageBlockMatchGatherSSDQCOM:
  3262. case glslang::EOpImageBlockMatchGatherSADQCOM:
  3263. builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
  3264. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3265. builder.addCapability(spv::Capability::TextureBlockMatch2QCOM);
  3266. builder.addExtension(spv::E_SPV_QCOM_image_processing2);
  3267. break;
  3268. case glslang::EOpFetchMicroTriangleVertexPositionNV:
  3269. case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
  3270. builder.addExtension(spv::E_SPV_NV_displacement_micromap);
  3271. builder.addCapability(spv::Capability::DisplacementMicromapNV);
  3272. break;
  3273. case glslang::EOpRayQueryGetIntersectionClusterIdNV:
  3274. builder.addExtension(spv::E_SPV_NV_cluster_acceleration_structure);
  3275. builder.addCapability(spv::Capability::RayQueryKHR);
  3276. builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
  3277. break;
  3278. case glslang::EOpDebugPrintf:
  3279. noReturnValue = true;
  3280. break;
  3281. default:
  3282. break;
  3283. }
  3284. //
  3285. // See if it maps to a regular operation.
  3286. //
  3287. if (binOp != glslang::EOpNull) {
  3288. glslang::TIntermTyped* left = node->getSequence()[0]->getAsTyped();
  3289. glslang::TIntermTyped* right = node->getSequence()[1]->getAsTyped();
  3290. assert(left && right);
  3291. builder.clearAccessChain();
  3292. left->traverse(this);
  3293. spv::Id leftId = accessChainLoad(left->getType());
  3294. builder.clearAccessChain();
  3295. right->traverse(this);
  3296. spv::Id rightId = accessChainLoad(right->getType());
  3297. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3298. OpDecorations decorations = { precision,
  3299. TranslateNoContractionDecoration(node->getType().getQualifier()),
  3300. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  3301. result = createBinaryOperation(binOp, decorations,
  3302. resultType(), leftId, rightId,
  3303. left->getType().getBasicType(), reduceComparison);
  3304. // code above should only make binOp that exists in createBinaryOperation
  3305. assert(result != spv::NoResult);
  3306. builder.clearAccessChain();
  3307. builder.setAccessChainRValue(result);
  3308. return false;
  3309. }
  3310. //
  3311. // Create the list of operands.
  3312. //
  3313. glslang::TIntermSequence& glslangOperands = node->getSequence();
  3314. std::vector<spv::Id> operands;
  3315. std::vector<spv::IdImmediate> memoryAccessOperands;
  3316. for (int arg = 0; arg < (int)glslangOperands.size(); ++arg) {
  3317. // special case l-value operands; there are just a few
  3318. bool lvalue = false;
  3319. switch (node->getOp()) {
  3320. case glslang::EOpModf:
  3321. if (arg == 1)
  3322. lvalue = true;
  3323. break;
  3324. case glslang::EOpHitObjectRecordHitNV:
  3325. case glslang::EOpHitObjectRecordHitMotionNV:
  3326. case glslang::EOpHitObjectRecordHitWithIndexNV:
  3327. case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
  3328. case glslang::EOpHitObjectTraceRayNV:
  3329. case glslang::EOpHitObjectTraceRayMotionNV:
  3330. case glslang::EOpHitObjectExecuteShaderNV:
  3331. case glslang::EOpHitObjectRecordMissNV:
  3332. case glslang::EOpHitObjectRecordMissMotionNV:
  3333. case glslang::EOpHitObjectGetAttributesNV:
  3334. case glslang::EOpHitObjectGetClusterIdNV:
  3335. if (arg == 0)
  3336. lvalue = true;
  3337. break;
  3338. case glslang::EOpHitObjectGetLSSPositionsNV:
  3339. case glslang::EOpHitObjectGetLSSRadiiNV:
  3340. lvalue = true;
  3341. break;
  3342. case glslang::EOpRayQueryInitialize:
  3343. case glslang::EOpRayQueryTerminate:
  3344. case glslang::EOpRayQueryConfirmIntersection:
  3345. case glslang::EOpRayQueryProceed:
  3346. case glslang::EOpRayQueryGenerateIntersection:
  3347. case glslang::EOpRayQueryGetIntersectionType:
  3348. case glslang::EOpRayQueryGetIntersectionT:
  3349. case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
  3350. case glslang::EOpRayQueryGetIntersectionInstanceId:
  3351. case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
  3352. case glslang::EOpRayQueryGetIntersectionGeometryIndex:
  3353. case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
  3354. case glslang::EOpRayQueryGetIntersectionBarycentrics:
  3355. case glslang::EOpRayQueryGetIntersectionFrontFace:
  3356. case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
  3357. case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
  3358. case glslang::EOpRayQueryGetIntersectionObjectToWorld:
  3359. case glslang::EOpRayQueryGetIntersectionWorldToObject:
  3360. case glslang::EOpRayQueryGetIntersectionClusterIdNV:
  3361. case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
  3362. case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
  3363. case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
  3364. case glslang::EOpRayQueryIsSphereHitNV:
  3365. case glslang::EOpRayQueryIsLSSHitNV:
  3366. if (arg == 0)
  3367. lvalue = true;
  3368. break;
  3369. case glslang::EOpAtomicAdd:
  3370. case glslang::EOpAtomicSubtract:
  3371. case glslang::EOpAtomicMin:
  3372. case glslang::EOpAtomicMax:
  3373. case glslang::EOpAtomicAnd:
  3374. case glslang::EOpAtomicOr:
  3375. case glslang::EOpAtomicXor:
  3376. case glslang::EOpAtomicExchange:
  3377. case glslang::EOpAtomicCompSwap:
  3378. if (arg == 0)
  3379. lvalue = true;
  3380. break;
  3381. case glslang::EOpFrexp:
  3382. if (arg == 1)
  3383. lvalue = true;
  3384. break;
  3385. case glslang::EOpInterpolateAtSample:
  3386. case glslang::EOpInterpolateAtOffset:
  3387. case glslang::EOpInterpolateAtVertex:
  3388. if (arg == 0) {
  3389. // If GLSL, use the address of the interpolant argument.
  3390. // If HLSL, use an internal version of OpInterpolates that takes
  3391. // the rvalue of the interpolant. A fixup pass in spirv-opt
  3392. // legalization will remove the OpLoad and convert to an lvalue.
  3393. // Had to do this because legalization will only propagate a
  3394. // builtin into an rvalue.
  3395. lvalue = glslangIntermediate->getSource() != glslang::EShSourceHlsl;
  3396. // Does it need a swizzle inversion? If so, evaluation is inverted;
  3397. // operate first on the swizzle base, then apply the swizzle.
  3398. // That is, we transform
  3399. //
  3400. // interpolate(v.zy) -> interpolate(v).zy
  3401. //
  3402. if (glslangOperands[0]->getAsOperator() &&
  3403. glslangOperands[0]->getAsOperator()->getOp() == glslang::EOpVectorSwizzle)
  3404. invertedType = convertGlslangToSpvType(
  3405. glslangOperands[0]->getAsBinaryNode()->getLeft()->getType());
  3406. }
  3407. break;
  3408. case glslang::EOpAtomicLoad:
  3409. case glslang::EOpAtomicStore:
  3410. case glslang::EOpAtomicCounterAdd:
  3411. case glslang::EOpAtomicCounterSubtract:
  3412. case glslang::EOpAtomicCounterMin:
  3413. case glslang::EOpAtomicCounterMax:
  3414. case glslang::EOpAtomicCounterAnd:
  3415. case glslang::EOpAtomicCounterOr:
  3416. case glslang::EOpAtomicCounterXor:
  3417. case glslang::EOpAtomicCounterExchange:
  3418. case glslang::EOpAtomicCounterCompSwap:
  3419. if (arg == 0)
  3420. lvalue = true;
  3421. break;
  3422. case glslang::EOpAddCarry:
  3423. case glslang::EOpSubBorrow:
  3424. if (arg == 2)
  3425. lvalue = true;
  3426. break;
  3427. case glslang::EOpUMulExtended:
  3428. case glslang::EOpIMulExtended:
  3429. if (arg >= 2)
  3430. lvalue = true;
  3431. break;
  3432. case glslang::EOpCooperativeMatrixLoad:
  3433. case glslang::EOpCooperativeMatrixLoadNV:
  3434. case glslang::EOpCooperativeMatrixLoadTensorNV:
  3435. case glslang::EOpCooperativeVectorLoadNV:
  3436. if (arg == 0 || arg == 1)
  3437. lvalue = true;
  3438. break;
  3439. case glslang::EOpCooperativeMatrixStore:
  3440. case glslang::EOpCooperativeMatrixStoreNV:
  3441. case glslang::EOpCooperativeMatrixStoreTensorNV:
  3442. case glslang::EOpCooperativeVectorStoreNV:
  3443. if (arg == 1)
  3444. lvalue = true;
  3445. break;
  3446. case glslang::EOpCooperativeVectorMatMulNV:
  3447. if (arg == 0 || arg == 3)
  3448. lvalue = true;
  3449. break;
  3450. case glslang::EOpCooperativeVectorMatMulAddNV:
  3451. if (arg == 0 || arg == 3 || arg == 6)
  3452. lvalue = true;
  3453. break;
  3454. case glslang::EOpCooperativeVectorOuterProductAccumulateNV:
  3455. if (arg == 2)
  3456. lvalue = true;
  3457. break;
  3458. case glslang::EOpCooperativeVectorReduceSumAccumulateNV:
  3459. if (arg == 1)
  3460. lvalue = true;
  3461. break;
  3462. case glslang::EOpCooperativeMatrixReduceNV:
  3463. case glslang::EOpCooperativeMatrixPerElementOpNV:
  3464. case glslang::EOpCooperativeMatrixTransposeNV:
  3465. if (arg == 0)
  3466. lvalue = true;
  3467. break;
  3468. case glslang::EOpSpirvInst:
  3469. if (glslangOperands[arg]->getAsTyped()->getQualifier().isSpirvByReference())
  3470. lvalue = true;
  3471. break;
  3472. case glslang::EOpReorderThreadNV:
  3473. //Three variants of reorderThreadNV, two of them use hitObjectNV
  3474. if (arg == 0 && glslangOperands.size() != 2)
  3475. lvalue = true;
  3476. break;
  3477. case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
  3478. case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
  3479. case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
  3480. if (arg == 0 || arg == 2)
  3481. lvalue = true;
  3482. break;
  3483. case glslang::EOpTensorReadARM:
  3484. if (arg == 2)
  3485. lvalue = true;
  3486. break;
  3487. default:
  3488. break;
  3489. }
  3490. builder.clearAccessChain();
  3491. if (invertedType != spv::NoType && arg == 0)
  3492. glslangOperands[0]->getAsBinaryNode()->getLeft()->traverse(this);
  3493. else
  3494. glslangOperands[arg]->traverse(this);
  3495. bool isCoopMat = node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  3496. node->getOp() == glslang::EOpCooperativeMatrixStore ||
  3497. node->getOp() == glslang::EOpCooperativeMatrixLoadNV ||
  3498. node->getOp() == glslang::EOpCooperativeMatrixStoreNV ||
  3499. node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV ||
  3500. node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV;
  3501. bool isCoopVec = node->getOp() == glslang::EOpCooperativeVectorLoadNV ||
  3502. node->getOp() == glslang::EOpCooperativeVectorStoreNV;
  3503. if (isCoopMat || isCoopVec) {
  3504. if (arg == 1) {
  3505. spv::Builder::AccessChain::CoherentFlags coherentFlags {};
  3506. unsigned int alignment {};
  3507. if (isCoopMat) {
  3508. // fold "element" parameter into the access chain
  3509. spv::Builder::AccessChain save = builder.getAccessChain();
  3510. builder.clearAccessChain();
  3511. glslangOperands[2]->traverse(this);
  3512. spv::Id elementId = accessChainLoad(glslangOperands[2]->getAsTyped()->getType());
  3513. builder.setAccessChain(save);
  3514. // Point to the first element of the array.
  3515. builder.accessChainPush(elementId,
  3516. TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType()),
  3517. glslangOperands[arg]->getAsTyped()->getType().getBufferReferenceAlignment());
  3518. coherentFlags = builder.getAccessChain().coherentFlags;
  3519. alignment = builder.getAccessChain().alignment;
  3520. } else {
  3521. coherentFlags = builder.getAccessChain().coherentFlags;
  3522. coherentFlags |= TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType());
  3523. alignment = 16;
  3524. }
  3525. spv::MemoryAccessMask memoryAccess = TranslateMemoryAccess(coherentFlags);
  3526. if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  3527. node->getOp() == glslang::EOpCooperativeMatrixLoadNV ||
  3528. node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV ||
  3529. node->getOp() == glslang::EOpCooperativeVectorLoadNV)
  3530. memoryAccess = (memoryAccess & ~spv::MemoryAccessMask::MakePointerAvailableKHR);
  3531. if (node->getOp() == glslang::EOpCooperativeMatrixStore ||
  3532. node->getOp() == glslang::EOpCooperativeMatrixStoreNV ||
  3533. node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV ||
  3534. node->getOp() == glslang::EOpCooperativeVectorStoreNV)
  3535. memoryAccess = (memoryAccess & ~spv::MemoryAccessMask::MakePointerVisibleKHR);
  3536. if (builder.getStorageClass(builder.getAccessChain().base) ==
  3537. spv::StorageClass::PhysicalStorageBufferEXT) {
  3538. memoryAccess = (spv::MemoryAccessMask)(memoryAccess | spv::MemoryAccessMask::Aligned);
  3539. }
  3540. memoryAccessOperands.push_back(spv::IdImmediate(false, memoryAccess));
  3541. if (anySet(memoryAccess, spv::MemoryAccessMask::Aligned)) {
  3542. memoryAccessOperands.push_back(spv::IdImmediate(false, alignment));
  3543. }
  3544. if (anySet(memoryAccess,
  3545. spv::MemoryAccessMask::MakePointerAvailableKHR | spv::MemoryAccessMask::MakePointerVisibleKHR)) {
  3546. memoryAccessOperands.push_back(spv::IdImmediate(true,
  3547. builder.makeUintConstant(TranslateMemoryScope(coherentFlags))));
  3548. }
  3549. } else if (isCoopMat && arg == 2) {
  3550. continue;
  3551. }
  3552. }
  3553. // for l-values, pass the address, for r-values, pass the value
  3554. if (lvalue) {
  3555. if (invertedType == spv::NoType && !builder.isSpvLvalue()) {
  3556. // SPIR-V cannot represent an l-value containing a swizzle that doesn't
  3557. // reduce to a simple access chain. So, we need a temporary vector to
  3558. // receive the result, and must later swizzle that into the original
  3559. // l-value.
  3560. complexLvalues.push_back(builder.getAccessChain());
  3561. temporaryLvalues.push_back(builder.createVariable(
  3562. spv::NoPrecision, spv::StorageClass::Function,
  3563. builder.accessChainGetInferredType(), "swizzleTemp"));
  3564. operands.push_back(temporaryLvalues.back());
  3565. } else {
  3566. operands.push_back(builder.accessChainGetLValue());
  3567. }
  3568. lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
  3569. lvalueCoherentFlags |= TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType());
  3570. } else {
  3571. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3572. glslang::TOperator glslangOp = node->getOp();
  3573. if (arg == 1 &&
  3574. (glslangOp == glslang::EOpRayQueryGetIntersectionType ||
  3575. glslangOp == glslang::EOpRayQueryGetIntersectionT ||
  3576. glslangOp == glslang::EOpRayQueryGetIntersectionInstanceCustomIndex ||
  3577. glslangOp == glslang::EOpRayQueryGetIntersectionInstanceId ||
  3578. glslangOp == glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset ||
  3579. glslangOp == glslang::EOpRayQueryGetIntersectionGeometryIndex ||
  3580. glslangOp == glslang::EOpRayQueryGetIntersectionPrimitiveIndex ||
  3581. glslangOp == glslang::EOpRayQueryGetIntersectionBarycentrics ||
  3582. glslangOp == glslang::EOpRayQueryGetIntersectionFrontFace ||
  3583. glslangOp == glslang::EOpRayQueryGetIntersectionObjectRayDirection ||
  3584. glslangOp == glslang::EOpRayQueryGetIntersectionObjectRayOrigin ||
  3585. glslangOp == glslang::EOpRayQueryGetIntersectionObjectToWorld ||
  3586. glslangOp == glslang::EOpRayQueryGetIntersectionWorldToObject ||
  3587. glslangOp == glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT ||
  3588. glslangOp == glslang::EOpRayQueryGetIntersectionClusterIdNV ||
  3589. glslangOp == glslang::EOpRayQueryGetIntersectionSpherePositionNV ||
  3590. glslangOp == glslang::EOpRayQueryGetIntersectionSphereRadiusNV ||
  3591. glslangOp == glslang::EOpRayQueryGetIntersectionLSSHitValueNV ||
  3592. glslangOp == glslang::EOpRayQueryGetIntersectionLSSPositionsNV ||
  3593. glslangOp == glslang::EOpRayQueryGetIntersectionLSSRadiiNV ||
  3594. glslangOp == glslang::EOpRayQueryIsLSSHitNV ||
  3595. glslangOp == glslang::EOpRayQueryIsSphereHitNV
  3596. )) {
  3597. bool cond = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getBConst();
  3598. operands.push_back(builder.makeIntConstant(cond ? 1 : 0));
  3599. } else if ((arg == 10 && glslangOp == glslang::EOpTraceKHR) ||
  3600. (arg == 11 && glslangOp == glslang::EOpTraceRayMotionNV) ||
  3601. (arg == 1 && glslangOp == glslang::EOpExecuteCallableKHR) ||
  3602. (arg == 1 && glslangOp == glslang::EOpHitObjectExecuteShaderNV) ||
  3603. (arg == 11 && glslangOp == glslang::EOpHitObjectTraceRayNV) ||
  3604. (arg == 12 && glslangOp == glslang::EOpHitObjectTraceRayMotionNV)) {
  3605. const int set = glslangOp == glslang::EOpExecuteCallableKHR ? 1 : 0;
  3606. const int location = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getUConst();
  3607. auto itNode = locationToSymbol[set].find(location);
  3608. visitSymbol(itNode->second);
  3609. spv::Id symId = getSymbolId(itNode->second);
  3610. operands.push_back(symId);
  3611. } else if ((arg == 12 && glslangOp == glslang::EOpHitObjectRecordHitNV) ||
  3612. (arg == 13 && glslangOp == glslang::EOpHitObjectRecordHitMotionNV) ||
  3613. (arg == 11 && glslangOp == glslang::EOpHitObjectRecordHitWithIndexNV) ||
  3614. (arg == 12 && glslangOp == glslang::EOpHitObjectRecordHitWithIndexMotionNV) ||
  3615. (arg == 1 && glslangOp == glslang::EOpHitObjectGetAttributesNV)) {
  3616. const int location = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getUConst();
  3617. const int set = 2;
  3618. auto itNode = locationToSymbol[set].find(location);
  3619. visitSymbol(itNode->second);
  3620. spv::Id symId = getSymbolId(itNode->second);
  3621. operands.push_back(symId);
  3622. } else if (glslangOperands[arg]->getAsTyped()->getQualifier().isSpirvLiteral()) {
  3623. // Will be translated to a literal value, make a placeholder here
  3624. operands.push_back(spv::NoResult);
  3625. } else if (glslangOperands[arg]->getAsTyped()->getBasicType() == glslang::EbtFunction) {
  3626. spv::Function* function = functionMap[glslangOperands[arg]->getAsSymbolNode()->getMangledName().c_str()];
  3627. assert(function);
  3628. operands.push_back(function->getId());
  3629. } else {
  3630. operands.push_back(accessChainLoad(glslangOperands[arg]->getAsTyped()->getType()));
  3631. }
  3632. }
  3633. }
  3634. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3635. if (node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV) {
  3636. std::vector<spv::IdImmediate> idImmOps;
  3637. builder.addCapability(spv::Capability::CooperativeMatrixTensorAddressingNV);
  3638. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3639. spv::Id object = builder.createLoad(operands[0], spv::NoPrecision);
  3640. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // Pointer
  3641. idImmOps.push_back(spv::IdImmediate(true, object)); // Object
  3642. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // tensorLayout
  3643. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end()); // memoryaccess
  3644. // initialize tensor operands to zero, then OR in flags based on the operands
  3645. size_t tensorOpIdx = idImmOps.size();
  3646. idImmOps.push_back(spv::IdImmediate(false, 0));
  3647. for (uint32_t i = 3; i < operands.size(); ++i) {
  3648. if (builder.isTensorView(operands[i])) {
  3649. addMask(idImmOps[tensorOpIdx].word, spv::TensorAddressingOperandsMask::TensorView);
  3650. } else {
  3651. // must be the decode func
  3652. addMask(idImmOps[tensorOpIdx].word, spv::TensorAddressingOperandsMask::DecodeFunc);
  3653. builder.addCapability(spv::Capability::CooperativeMatrixBlockLoadsNV);
  3654. }
  3655. idImmOps.push_back(spv::IdImmediate(true, operands[i])); // tensorView or decodeFunc
  3656. }
  3657. // get the pointee type
  3658. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3659. assert(builder.isCooperativeMatrixType(typeId));
  3660. // do the op
  3661. spv::Id result = builder.createOp(spv::Op::OpCooperativeMatrixLoadTensorNV, typeId, idImmOps);
  3662. // store the result to the pointer (out param 'm')
  3663. builder.createStore(result, operands[0]);
  3664. result = 0;
  3665. } else if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  3666. node->getOp() == glslang::EOpCooperativeMatrixLoadNV) {
  3667. std::vector<spv::IdImmediate> idImmOps;
  3668. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3669. if (node->getOp() == glslang::EOpCooperativeMatrixLoad) {
  3670. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // matrixLayout
  3671. auto layout = (spv::CooperativeMatrixLayout)builder.getConstantScalar(operands[3]);
  3672. if (layout == spv::CooperativeMatrixLayout::RowBlockedInterleavedARM ||
  3673. layout == spv::CooperativeMatrixLayout::ColumnBlockedInterleavedARM) {
  3674. builder.addExtension(spv::E_SPV_ARM_cooperative_matrix_layouts);
  3675. builder.addCapability(spv::Capability::CooperativeMatrixLayoutsARM);
  3676. }
  3677. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3678. } else {
  3679. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3680. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor
  3681. }
  3682. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  3683. // get the pointee type
  3684. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3685. assert(builder.isCooperativeMatrixType(typeId));
  3686. // do the op
  3687. spv::Id result = node->getOp() == glslang::EOpCooperativeMatrixLoad
  3688. ? builder.createOp(spv::Op::OpCooperativeMatrixLoadKHR, typeId, idImmOps)
  3689. : builder.createOp(spv::Op::OpCooperativeMatrixLoadNV, typeId, idImmOps);
  3690. // store the result to the pointer (out param 'm')
  3691. builder.createStore(result, operands[0]);
  3692. result = 0;
  3693. } else if (node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV) {
  3694. std::vector<spv::IdImmediate> idImmOps;
  3695. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3696. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  3697. builder.addCapability(spv::Capability::CooperativeMatrixTensorAddressingNV);
  3698. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3699. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // tensorLayout
  3700. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end()); // memoryaccess
  3701. if (operands.size() > 3) {
  3702. idImmOps.push_back(spv::IdImmediate(false, spv::TensorAddressingOperandsMask::TensorView));
  3703. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // tensorView
  3704. } else {
  3705. idImmOps.push_back(spv::IdImmediate(false, 0));
  3706. }
  3707. builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreTensorNV, idImmOps);
  3708. result = 0;
  3709. } else if (node->getOp() == glslang::EOpCooperativeMatrixStore ||
  3710. node->getOp() == glslang::EOpCooperativeMatrixStoreNV) {
  3711. std::vector<spv::IdImmediate> idImmOps;
  3712. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3713. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  3714. if (node->getOp() == glslang::EOpCooperativeMatrixStore) {
  3715. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // matrixLayout
  3716. auto layout = (spv::CooperativeMatrixLayout)builder.getConstantScalar(operands[3]);
  3717. if (layout == spv::CooperativeMatrixLayout::RowBlockedInterleavedARM ||
  3718. layout == spv::CooperativeMatrixLayout::ColumnBlockedInterleavedARM) {
  3719. builder.addExtension(spv::E_SPV_ARM_cooperative_matrix_layouts);
  3720. builder.addCapability(spv::Capability::CooperativeMatrixLayoutsARM);
  3721. }
  3722. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3723. } else {
  3724. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3725. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor
  3726. }
  3727. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  3728. if (node->getOp() == glslang::EOpCooperativeMatrixStore)
  3729. builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreKHR, idImmOps);
  3730. else
  3731. builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreNV, idImmOps);
  3732. result = 0;
  3733. } else if (node->getOp() == glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT) {
  3734. std::vector<spv::IdImmediate> idImmOps;
  3735. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
  3736. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
  3737. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  3738. builder.makeUintConstant(3), 0);
  3739. // do the op
  3740. spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionTriangleVertexPositionsKHR;
  3741. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3742. // store the result to the pointer (out param 'm')
  3743. builder.createStore(result, operands[2]);
  3744. result = 0;
  3745. } else if (node->getOp() == glslang::EOpRayQueryGetIntersectionLSSPositionsNV) {
  3746. std::vector<spv::IdImmediate> idImmOps;
  3747. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
  3748. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
  3749. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  3750. builder.makeUintConstant(2), 0);
  3751. // do the op
  3752. spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionLSSPositionsNV;
  3753. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3754. // store the result to the pointer (out param 'm')
  3755. builder.createStore(result, operands[2]);
  3756. result = 0;
  3757. } else if (node->getOp() == glslang::EOpRayQueryGetIntersectionLSSRadiiNV) {
  3758. std::vector<spv::IdImmediate> idImmOps;
  3759. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
  3760. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
  3761. spv::Id typeId = builder.makeArrayType(builder.makeFloatType(32),
  3762. builder.makeUintConstant(2), 0);
  3763. // do the op
  3764. spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionLSSRadiiNV;
  3765. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3766. // store the result to the pointer (out param 'm')
  3767. builder.createStore(result, operands[2]);
  3768. result = 0;
  3769. } else if (node->getOp() == glslang::EOpHitObjectGetLSSPositionsNV) {
  3770. std::vector<spv::IdImmediate> idImmOps;
  3771. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
  3772. spv::Op spvOp = spv::Op::OpHitObjectGetLSSPositionsNV;
  3773. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  3774. builder.makeUintConstant(2), 0);
  3775. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3776. // store the result to the pointer (out param 'm')
  3777. builder.createStore(result, operands[1]);
  3778. result = 0;
  3779. } else if (node->getOp() == glslang::EOpHitObjectGetLSSRadiiNV) {
  3780. std::vector<spv::IdImmediate> idImmOps;
  3781. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
  3782. spv::Op spvOp = spv::Op::OpHitObjectGetLSSRadiiNV;
  3783. spv::Id typeId = builder.makeArrayType(builder.makeFloatType(32),
  3784. builder.makeUintConstant(2), 0);
  3785. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3786. // store the result to the pointer (out param 'm')
  3787. builder.createStore(result, operands[1]);
  3788. result = 0;
  3789. } else if (node->getOp() == glslang::EOpCooperativeMatrixMulAdd) {
  3790. auto matrixOperands = spv::CooperativeMatrixOperandsMask::MaskNone;
  3791. // If the optional operand is present, initialize matrixOperands to that value.
  3792. if (glslangOperands.size() == 4 && glslangOperands[3]->getAsConstantUnion()) {
  3793. matrixOperands = (spv::CooperativeMatrixOperandsMask)glslangOperands[3]->getAsConstantUnion()->getConstArray()[0].getIConst();
  3794. }
  3795. // Determine Cooperative Matrix Operands bits from the signedness of the types.
  3796. if (isTypeSignedInt(glslangOperands[0]->getAsTyped()->getBasicType()))
  3797. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixASignedComponentsKHR);
  3798. if (isTypeSignedInt(glslangOperands[1]->getAsTyped()->getBasicType()))
  3799. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixBSignedComponentsKHR);
  3800. if (isTypeSignedInt(glslangOperands[2]->getAsTyped()->getBasicType()))
  3801. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixCSignedComponentsKHR);
  3802. if (isTypeSignedInt(node->getBasicType()))
  3803. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixResultSignedComponentsKHR);
  3804. std::vector<spv::IdImmediate> idImmOps;
  3805. idImmOps.push_back(spv::IdImmediate(true, operands[0]));
  3806. idImmOps.push_back(spv::IdImmediate(true, operands[1]));
  3807. idImmOps.push_back(spv::IdImmediate(true, operands[2]));
  3808. if (matrixOperands != spv::CooperativeMatrixOperandsMask::MaskNone)
  3809. idImmOps.push_back(spv::IdImmediate(false, matrixOperands));
  3810. result = builder.createOp(spv::Op::OpCooperativeMatrixMulAddKHR, resultType(), idImmOps);
  3811. } else if (node->getOp() == glslang::EOpCooperativeMatrixReduceNV) {
  3812. builder.addCapability(spv::Capability::CooperativeMatrixReductionsNV);
  3813. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3814. spv::Op opcode = spv::Op::OpCooperativeMatrixReduceNV;
  3815. unsigned mask = glslangOperands[2]->getAsConstantUnion()->getConstArray()[0].getUConst();
  3816. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3817. assert(builder.isCooperativeMatrixType(typeId));
  3818. result = builder.createCooperativeMatrixReduce(opcode, typeId, operands[1], mask, operands[3]);
  3819. // store the result to the pointer (out param 'm')
  3820. builder.createStore(result, operands[0]);
  3821. result = 0;
  3822. } else if (node->getOp() == glslang::EOpCooperativeMatrixPerElementOpNV) {
  3823. builder.addCapability(spv::Capability::CooperativeMatrixPerElementOperationsNV);
  3824. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3825. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3826. assert(builder.isCooperativeMatrixType(typeId));
  3827. result = builder.createCooperativeMatrixPerElementOp(typeId, operands);
  3828. // store the result to the pointer
  3829. builder.createStore(result, operands[0]);
  3830. result = 0;
  3831. } else if (node->getOp() == glslang::EOpCooperativeMatrixTransposeNV) {
  3832. builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
  3833. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3834. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3835. assert(builder.isCooperativeMatrixType(typeId));
  3836. result = builder.createUnaryOp(spv::Op::OpCooperativeMatrixTransposeNV, typeId, operands[1]);
  3837. // store the result to the pointer
  3838. builder.createStore(result, operands[0]);
  3839. result = 0;
  3840. } else if (node->getOp() == glslang::EOpCooperativeVectorMatMulNV ||
  3841. node->getOp() == glslang::EOpCooperativeVectorMatMulAddNV) {
  3842. auto matrixOperands = spv::CooperativeMatrixOperandsMask::MaskNone;
  3843. bool isMulAdd = node->getOp() == glslang::EOpCooperativeVectorMatMulAddNV;
  3844. // Determine Cooperative Matrix Operands bits from the signedness of the types.
  3845. if (isTypeSignedInt(glslangOperands[1]->getAsTyped()->getBasicType()))
  3846. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixBSignedComponentsKHR);
  3847. if (isTypeSignedInt(glslangOperands[0]->getAsTyped()->getBasicType()))
  3848. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixResultSignedComponentsKHR);
  3849. uint32_t opIdx = 1;
  3850. std::vector<spv::IdImmediate> idImmOps;
  3851. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Input
  3852. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // InputInterpretation
  3853. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Matrix
  3854. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixOffset
  3855. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixInterpretation
  3856. if (isMulAdd) {
  3857. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Bias
  3858. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // BiasOffset
  3859. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // BiasInterpretation
  3860. }
  3861. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // M
  3862. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // K
  3863. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MemoryLayout
  3864. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Transpose
  3865. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixStride
  3866. if (matrixOperands != spv::CooperativeMatrixOperandsMask::MaskNone)
  3867. idImmOps.push_back(spv::IdImmediate(false, matrixOperands)); // Cooperative Matrix Operands
  3868. // get the pointee type
  3869. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3870. assert(builder.isCooperativeVectorType(typeId));
  3871. // do the op
  3872. spv::Id result = builder.createOp(isMulAdd ? spv::Op::OpCooperativeVectorMatrixMulAddNV : spv::Op::OpCooperativeVectorMatrixMulNV, typeId, idImmOps);
  3873. // store the result to the pointer (out param 'res')
  3874. builder.createStore(result, operands[0]);
  3875. result = 0;
  3876. } else if (node->getOp() == glslang::EOpCooperativeVectorLoadNV) {
  3877. std::vector<spv::IdImmediate> idImmOps;
  3878. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3879. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // offset
  3880. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  3881. // get the pointee type
  3882. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3883. assert(builder.isCooperativeVectorType(typeId));
  3884. // do the op
  3885. spv::Id result = builder.createOp(spv::Op::OpCooperativeVectorLoadNV, typeId, idImmOps);
  3886. // store the result to the pointer (out param 'v')
  3887. builder.createStore(result, operands[0]);
  3888. result = 0;
  3889. } else if (node->getOp() == glslang::EOpCooperativeVectorStoreNV) {
  3890. std::vector<spv::IdImmediate> idImmOps;
  3891. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3892. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // offset
  3893. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  3894. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  3895. builder.createNoResultOp(spv::Op::OpCooperativeVectorStoreNV, idImmOps);
  3896. result = 0;
  3897. } else if (node->getOp() == glslang::EOpCooperativeVectorOuterProductAccumulateNV) {
  3898. builder.addCapability(spv::Capability::CooperativeVectorTrainingNV);
  3899. builder.addExtension(spv::E_SPV_NV_cooperative_vector);
  3900. std::vector<spv::IdImmediate> idImmOps;
  3901. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // Matrix
  3902. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // Offset
  3903. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // A
  3904. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // B
  3905. idImmOps.push_back(spv::IdImmediate(true, operands[5])); // MemoryLayout
  3906. idImmOps.push_back(spv::IdImmediate(true, operands[6])); // MatrixInterpretation
  3907. idImmOps.push_back(spv::IdImmediate(true, operands[4])); // Stride
  3908. builder.createNoResultOp(spv::Op::OpCooperativeVectorOuterProductAccumulateNV, idImmOps);
  3909. result = 0;
  3910. } else if (node->getOp() == glslang::EOpCooperativeVectorReduceSumAccumulateNV) {
  3911. builder.addCapability(spv::Capability::CooperativeVectorTrainingNV);
  3912. builder.addExtension(spv::E_SPV_NV_cooperative_vector);
  3913. std::vector<spv::IdImmediate> idImmOps;
  3914. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // Buf
  3915. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // Offset
  3916. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // A
  3917. builder.createNoResultOp(spv::Op::OpCooperativeVectorReduceSumAccumulateNV, idImmOps);
  3918. result = 0;
  3919. } else if (node->getOp() == glslang::EOpTensorReadARM ||
  3920. node->getOp() == glslang::EOpTensorWriteARM) {
  3921. const bool isWrite = node->getOp() == glslang::EOpTensorWriteARM;
  3922. const unsigned int tensorMinOperandCount = 3;
  3923. assert(operands.size() >= tensorMinOperandCount);
  3924. std::vector<spv::IdImmediate> idImmOps;
  3925. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // tensor
  3926. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // coords
  3927. if (isWrite) {
  3928. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // value
  3929. }
  3930. // Analyze the tensor operands
  3931. spv::IdImmediate tensorOperands = { false, uint32_t(spv::TensorOperandsMask::MaskNone) };
  3932. bool pushExtraArg = false;
  3933. if (operands.size() > tensorMinOperandCount) {
  3934. auto enumVal = builder.getConstantScalar(operands[tensorMinOperandCount]);
  3935. if (enumVal & uint32_t(spv::TensorOperandsMask::NontemporalARM)) {
  3936. tensorOperands.word |= uint32_t(spv::TensorOperandsMask::NontemporalARM);
  3937. }
  3938. if (enumVal & uint32_t(spv::TensorOperandsMask::OutOfBoundsValueARM)) {
  3939. tensorOperands.word |= uint32_t(spv::TensorOperandsMask::OutOfBoundsValueARM);
  3940. assert(operands.size() >= tensorMinOperandCount + 2 &&
  3941. "TensorOperandsOutOfBoundsValueMask requires an additional value");
  3942. pushExtraArg = true;
  3943. }
  3944. }
  3945. // Append optional tensor operands if the mask was non-zero.
  3946. if (tensorOperands.word) {
  3947. idImmOps.push_back(tensorOperands);
  3948. if (pushExtraArg)
  3949. idImmOps.push_back(spv::IdImmediate(true, operands[tensorMinOperandCount + 1]));
  3950. }
  3951. if (isWrite) {
  3952. builder.createNoResultOp(spv::Op::OpTensorWriteARM, idImmOps);
  3953. result = 0;
  3954. } else {
  3955. // Use the result argument type as the OpTensorReadARM result type.
  3956. const glslang::TType &resArgType = glslangOperands[2]->getAsTyped()->getType();
  3957. spv::Id retType = convertGlslangToSpvType(resArgType);
  3958. result = builder.createOp(spv::Op::OpTensorReadARM, retType, idImmOps);
  3959. // Store the result to the result argument.
  3960. builder.createStore(result, operands[2]);
  3961. }
  3962. } else if (node->getOp() == glslang::EOpTensorSizeARM) {
  3963. // Expected operands are (tensor, dimension)
  3964. assert(operands.size() == 2);
  3965. spv::Id tensorOp = operands[0];
  3966. spv::Id dimOp = operands[1];
  3967. assert(builder.isTensorTypeARM(builder.getTypeId(tensorOp)) && "operand #0 must be a tensor");
  3968. std::vector<spv::IdImmediate> idImmOps;
  3969. idImmOps.push_back(spv::IdImmediate(true, tensorOp));
  3970. idImmOps.push_back(spv::IdImmediate(true, dimOp));
  3971. result = builder.createOp(spv::Op::OpTensorQuerySizeARM, resultType(), idImmOps);
  3972. } else if (atomic) {
  3973. // Handle all atomics
  3974. glslang::TBasicType typeProxy = (node->getOp() == glslang::EOpAtomicStore)
  3975. ? node->getSequence()[0]->getAsTyped()->getBasicType() : node->getBasicType();
  3976. result = createAtomicOperation(node->getOp(), precision, resultType(), operands, typeProxy,
  3977. lvalueCoherentFlags, node->getType());
  3978. } else if (node->getOp() == glslang::EOpSpirvInst) {
  3979. const auto& spirvInst = node->getSpirvInstruction();
  3980. if (spirvInst.set == "") {
  3981. std::vector<spv::IdImmediate> idImmOps;
  3982. for (unsigned int i = 0; i < glslangOperands.size(); ++i) {
  3983. if (glslangOperands[i]->getAsTyped()->getQualifier().isSpirvLiteral()) {
  3984. // Translate the constant to a literal value
  3985. std::vector<unsigned> literals;
  3986. glslang::TVector<const glslang::TIntermConstantUnion*> constants;
  3987. constants.push_back(glslangOperands[i]->getAsConstantUnion());
  3988. TranslateLiterals(constants, literals);
  3989. idImmOps.push_back({false, literals[0]});
  3990. } else
  3991. idImmOps.push_back({true, operands[i]});
  3992. }
  3993. if (node->getBasicType() == glslang::EbtVoid)
  3994. builder.createNoResultOp(static_cast<spv::Op>(spirvInst.id), idImmOps);
  3995. else
  3996. result = builder.createOp(static_cast<spv::Op>(spirvInst.id), resultType(), idImmOps);
  3997. } else {
  3998. result = builder.createBuiltinCall(
  3999. resultType(), spirvInst.set == "GLSL.std.450" ? stdBuiltins : getExtBuiltins(spirvInst.set.c_str()),
  4000. spirvInst.id, operands);
  4001. }
  4002. noReturnValue = node->getBasicType() == glslang::EbtVoid;
  4003. } else if (node->getOp() == glslang::EOpDebugPrintf) {
  4004. if (!nonSemanticDebugPrintf) {
  4005. nonSemanticDebugPrintf = builder.import("NonSemantic.DebugPrintf");
  4006. }
  4007. result = builder.createBuiltinCall(builder.makeVoidType(), nonSemanticDebugPrintf, spv::NonSemanticDebugPrintfDebugPrintf, operands);
  4008. builder.addExtension(spv::E_SPV_KHR_non_semantic_info);
  4009. } else {
  4010. // Pass through to generic operations.
  4011. switch (glslangOperands.size()) {
  4012. case 0:
  4013. result = createNoArgOperation(node->getOp(), precision, resultType());
  4014. break;
  4015. case 1:
  4016. {
  4017. OpDecorations decorations = { precision,
  4018. TranslateNoContractionDecoration(node->getType().getQualifier()),
  4019. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  4020. result = createUnaryOperation(
  4021. node->getOp(), decorations,
  4022. resultType(), operands.front(),
  4023. glslangOperands[0]->getAsTyped()->getBasicType(), lvalueCoherentFlags, node->getType());
  4024. }
  4025. break;
  4026. default:
  4027. result = createMiscOperation(node->getOp(), precision, resultType(), operands, node->getBasicType());
  4028. break;
  4029. }
  4030. if (invertedType != spv::NoResult)
  4031. result = createInvertedSwizzle(precision, *glslangOperands[0]->getAsBinaryNode(), result);
  4032. for (unsigned int i = 0; i < temporaryLvalues.size(); ++i) {
  4033. builder.setAccessChain(complexLvalues[i]);
  4034. builder.accessChainStore(builder.createLoad(temporaryLvalues[i], spv::NoPrecision),
  4035. TranslateNonUniformDecoration(complexLvalues[i].coherentFlags));
  4036. }
  4037. }
  4038. if (noReturnValue)
  4039. return false;
  4040. if (! result) {
  4041. logger->missingFunctionality("unknown glslang aggregate");
  4042. return true; // pick up a child as a placeholder operand
  4043. } else {
  4044. builder.clearAccessChain();
  4045. builder.setAccessChainRValue(result);
  4046. return false;
  4047. }
  4048. }
  4049. // This path handles both if-then-else and ?:
  4050. // The if-then-else has a node type of void, while
  4051. // ?: has either a void or a non-void node type
  4052. //
  4053. // Leaving the result, when not void:
  4054. // GLSL only has r-values as the result of a ?:, but
  4055. // if we have an l-value, that can be more efficient if it will
  4056. // become the base of a complex r-value expression, because the
  4057. // next layer copies r-values into memory to use the access-chain mechanism
  4058. bool TGlslangToSpvTraverser::visitSelection(glslang::TVisit /* visit */, glslang::TIntermSelection* node)
  4059. {
  4060. // see if OpSelect can handle it
  4061. const auto isOpSelectable = [&]() {
  4062. if (node->getBasicType() == glslang::EbtVoid)
  4063. return false;
  4064. // OpSelect can do all other types starting with SPV 1.4
  4065. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_4) {
  4066. // pre-1.4, only scalars and vectors can be handled
  4067. if ((!node->getType().isScalar() && !node->getType().isVector()))
  4068. return false;
  4069. }
  4070. return true;
  4071. };
  4072. // See if it simple and safe, or required, to execute both sides.
  4073. // Crucially, side effects must be either semantically required or avoided,
  4074. // and there are performance trade-offs.
  4075. // Return true if required or a good idea (and safe) to execute both sides,
  4076. // false otherwise.
  4077. const auto bothSidesPolicy = [&]() -> bool {
  4078. // do we have both sides?
  4079. if (node->getTrueBlock() == nullptr ||
  4080. node->getFalseBlock() == nullptr)
  4081. return false;
  4082. // required? (unless we write additional code to look for side effects
  4083. // and make performance trade-offs if none are present)
  4084. if (!node->getShortCircuit())
  4085. return true;
  4086. // if not required to execute both, decide based on performance/practicality...
  4087. if (!isOpSelectable())
  4088. return false;
  4089. assert(node->getType() == node->getTrueBlock() ->getAsTyped()->getType() &&
  4090. node->getType() == node->getFalseBlock()->getAsTyped()->getType());
  4091. // return true if a single operand to ? : is okay for OpSelect
  4092. const auto operandOkay = [](glslang::TIntermTyped* node) {
  4093. return node->getAsSymbolNode() || node->getType().getQualifier().isConstant();
  4094. };
  4095. return operandOkay(node->getTrueBlock() ->getAsTyped()) &&
  4096. operandOkay(node->getFalseBlock()->getAsTyped());
  4097. };
  4098. spv::Id result = spv::NoResult; // upcoming result selecting between trueValue and falseValue
  4099. // emit the condition before doing anything with selection
  4100. node->getCondition()->traverse(this);
  4101. spv::Id condition = accessChainLoad(node->getCondition()->getType());
  4102. // Find a way of executing both sides and selecting the right result.
  4103. const auto executeBothSides = [&]() -> void {
  4104. // execute both sides
  4105. spv::Id resultType = convertGlslangToSpvType(node->getType());
  4106. node->getTrueBlock()->traverse(this);
  4107. spv::Id trueValue = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
  4108. node->getFalseBlock()->traverse(this);
  4109. spv::Id falseValue = accessChainLoad(node->getFalseBlock()->getAsTyped()->getType());
  4110. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4111. // done if void
  4112. if (node->getBasicType() == glslang::EbtVoid)
  4113. return;
  4114. // emit code to select between trueValue and falseValue
  4115. // see if OpSelect can handle the result type, and that the SPIR-V types
  4116. // of the inputs match the result type.
  4117. if (isOpSelectable()) {
  4118. // Emit OpSelect for this selection.
  4119. // smear condition to vector, if necessary (AST is always scalar)
  4120. // Before 1.4, smear like for mix(), starting with 1.4, keep it scalar
  4121. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_4 && builder.isVector(trueValue)) {
  4122. condition = builder.smearScalar(spv::NoPrecision, condition,
  4123. builder.makeVectorType(builder.makeBoolType(),
  4124. builder.getNumComponents(trueValue)));
  4125. }
  4126. // If the types do not match, it is because of mismatched decorations on aggregates.
  4127. // Since isOpSelectable only lets us get here for SPIR-V >= 1.4, we can use OpCopyObject
  4128. // to get matching types.
  4129. if (builder.getTypeId(trueValue) != resultType) {
  4130. trueValue = builder.createUnaryOp(spv::Op::OpCopyLogical, resultType, trueValue);
  4131. }
  4132. if (builder.getTypeId(falseValue) != resultType) {
  4133. falseValue = builder.createUnaryOp(spv::Op::OpCopyLogical, resultType, falseValue);
  4134. }
  4135. // OpSelect
  4136. result = builder.createTriOp(spv::Op::OpSelect, resultType, condition, trueValue, falseValue);
  4137. builder.clearAccessChain();
  4138. builder.setAccessChainRValue(result);
  4139. } else {
  4140. // We need control flow to select the result.
  4141. // TODO: Once SPIR-V OpSelect allows arbitrary types, eliminate this path.
  4142. result = builder.createVariable(TranslatePrecisionDecoration(node->getType()),
  4143. spv::StorageClass::Function, resultType);
  4144. // Selection control:
  4145. const spv::SelectionControlMask control = TranslateSelectionControl(*node);
  4146. // make an "if" based on the value created by the condition
  4147. spv::Builder::If ifBuilder(condition, control, builder);
  4148. // emit the "then" statement
  4149. builder.clearAccessChain();
  4150. builder.setAccessChainLValue(result);
  4151. multiTypeStore(node->getType(), trueValue);
  4152. ifBuilder.makeBeginElse();
  4153. // emit the "else" statement
  4154. builder.clearAccessChain();
  4155. builder.setAccessChainLValue(result);
  4156. multiTypeStore(node->getType(), falseValue);
  4157. // finish off the control flow
  4158. ifBuilder.makeEndIf();
  4159. builder.clearAccessChain();
  4160. builder.setAccessChainLValue(result);
  4161. }
  4162. };
  4163. // Execute the one side needed, as per the condition
  4164. const auto executeOneSide = [&]() {
  4165. // Always emit control flow.
  4166. if (node->getBasicType() != glslang::EbtVoid) {
  4167. result = builder.createVariable(TranslatePrecisionDecoration(node->getType()), spv::StorageClass::Function,
  4168. convertGlslangToSpvType(node->getType()));
  4169. }
  4170. // Selection control:
  4171. const spv::SelectionControlMask control = TranslateSelectionControl(*node);
  4172. // make an "if" based on the value created by the condition
  4173. spv::Builder::If ifBuilder(condition, control, builder);
  4174. // emit the "then" statement
  4175. if (node->getTrueBlock() != nullptr) {
  4176. node->getTrueBlock()->traverse(this);
  4177. if (result != spv::NoResult) {
  4178. spv::Id load = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
  4179. builder.clearAccessChain();
  4180. builder.setAccessChainLValue(result);
  4181. multiTypeStore(node->getType(), load);
  4182. }
  4183. }
  4184. if (node->getFalseBlock() != nullptr) {
  4185. ifBuilder.makeBeginElse();
  4186. // emit the "else" statement
  4187. node->getFalseBlock()->traverse(this);
  4188. if (result != spv::NoResult) {
  4189. spv::Id load = accessChainLoad(node->getFalseBlock()->getAsTyped()->getType());
  4190. builder.clearAccessChain();
  4191. builder.setAccessChainLValue(result);
  4192. multiTypeStore(node->getType(), load);
  4193. }
  4194. }
  4195. // finish off the control flow
  4196. ifBuilder.makeEndIf();
  4197. if (result != spv::NoResult) {
  4198. builder.clearAccessChain();
  4199. builder.setAccessChainLValue(result);
  4200. }
  4201. };
  4202. // Try for OpSelect (or a requirement to execute both sides)
  4203. if (bothSidesPolicy()) {
  4204. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  4205. if (node->getType().getQualifier().isSpecConstant())
  4206. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  4207. executeBothSides();
  4208. } else
  4209. executeOneSide();
  4210. return false;
  4211. }
  4212. bool TGlslangToSpvTraverser::visitSwitch(glslang::TVisit /* visit */, glslang::TIntermSwitch* node)
  4213. {
  4214. // emit and get the condition before doing anything with switch
  4215. node->getCondition()->traverse(this);
  4216. spv::Id selector = accessChainLoad(node->getCondition()->getAsTyped()->getType());
  4217. // Selection control:
  4218. const spv::SelectionControlMask control = TranslateSwitchControl(*node);
  4219. // browse the children to sort out code segments
  4220. int defaultSegment = -1;
  4221. std::vector<TIntermNode*> codeSegments;
  4222. glslang::TIntermSequence& sequence = node->getBody()->getSequence();
  4223. std::vector<int> caseValues;
  4224. std::vector<int> valueIndexToSegment(sequence.size()); // note: probably not all are used, it is an overestimate
  4225. for (glslang::TIntermSequence::iterator c = sequence.begin(); c != sequence.end(); ++c) {
  4226. TIntermNode* child = *c;
  4227. if (child->getAsBranchNode() && child->getAsBranchNode()->getFlowOp() == glslang::EOpDefault)
  4228. defaultSegment = (int)codeSegments.size();
  4229. else if (child->getAsBranchNode() && child->getAsBranchNode()->getFlowOp() == glslang::EOpCase) {
  4230. valueIndexToSegment[caseValues.size()] = (int)codeSegments.size();
  4231. caseValues.push_back(child->getAsBranchNode()->getExpression()->getAsConstantUnion()
  4232. ->getConstArray()[0].getIConst());
  4233. } else
  4234. codeSegments.push_back(child);
  4235. }
  4236. // handle the case where the last code segment is missing, due to no code
  4237. // statements between the last case and the end of the switch statement
  4238. if ((caseValues.size() && (int)codeSegments.size() == valueIndexToSegment[caseValues.size() - 1]) ||
  4239. (int)codeSegments.size() == defaultSegment)
  4240. codeSegments.push_back(nullptr);
  4241. // make the switch statement
  4242. std::vector<spv::Block*> segmentBlocks; // returned, as the blocks allocated in the call
  4243. builder.makeSwitch(selector, control, (int)codeSegments.size(), caseValues, valueIndexToSegment, defaultSegment,
  4244. segmentBlocks);
  4245. // emit all the code in the segments
  4246. breakForLoop.push(false);
  4247. for (unsigned int s = 0; s < codeSegments.size(); ++s) {
  4248. builder.nextSwitchSegment(segmentBlocks, s);
  4249. if (codeSegments[s])
  4250. codeSegments[s]->traverse(this);
  4251. else
  4252. builder.addSwitchBreak(true);
  4253. }
  4254. breakForLoop.pop();
  4255. builder.endSwitch(segmentBlocks);
  4256. return false;
  4257. }
  4258. void TGlslangToSpvTraverser::visitConstantUnion(glslang::TIntermConstantUnion* node)
  4259. {
  4260. if (node->getQualifier().isSpirvLiteral())
  4261. return; // Translated to a literal value, skip further processing
  4262. int nextConst = 0;
  4263. spv::Id constant = createSpvConstantFromConstUnionArray(node->getType(), node->getConstArray(), nextConst, false);
  4264. builder.clearAccessChain();
  4265. builder.setAccessChainRValue(constant);
  4266. }
  4267. bool TGlslangToSpvTraverser::visitLoop(glslang::TVisit /* visit */, glslang::TIntermLoop* node)
  4268. {
  4269. auto blocks = builder.makeNewLoop();
  4270. builder.createBranch(true, &blocks.head);
  4271. // Loop control:
  4272. std::vector<unsigned int> operands;
  4273. const spv::LoopControlMask control = TranslateLoopControl(*node, operands);
  4274. // Spec requires back edges to target header blocks, and every header block
  4275. // must dominate its merge block. Make a header block first to ensure these
  4276. // conditions are met. By definition, it will contain OpLoopMerge, followed
  4277. // by a block-ending branch. But we don't want to put any other body/test
  4278. // instructions in it, since the body/test may have arbitrary instructions,
  4279. // including merges of its own.
  4280. builder.setBuildPoint(&blocks.head);
  4281. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4282. builder.createLoopMerge(&blocks.merge, &blocks.continue_target, control, operands);
  4283. if (node->testFirst() && node->getTest()) {
  4284. spv::Block& test = builder.makeNewBlock();
  4285. builder.createBranch(true, &test);
  4286. builder.setBuildPoint(&test);
  4287. node->getTest()->traverse(this);
  4288. spv::Id condition = accessChainLoad(node->getTest()->getType());
  4289. builder.createConditionalBranch(condition, &blocks.body, &blocks.merge);
  4290. builder.setBuildPoint(&blocks.body);
  4291. breakForLoop.push(true);
  4292. if (node->getBody())
  4293. node->getBody()->traverse(this);
  4294. builder.createBranch(true, &blocks.continue_target);
  4295. breakForLoop.pop();
  4296. builder.setBuildPoint(&blocks.continue_target);
  4297. if (node->getTerminal())
  4298. node->getTerminal()->traverse(this);
  4299. builder.createBranch(true, &blocks.head);
  4300. } else {
  4301. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4302. builder.createBranch(true, &blocks.body);
  4303. breakForLoop.push(true);
  4304. builder.setBuildPoint(&blocks.body);
  4305. if (node->getBody())
  4306. node->getBody()->traverse(this);
  4307. builder.createBranch(true, &blocks.continue_target);
  4308. breakForLoop.pop();
  4309. builder.setBuildPoint(&blocks.continue_target);
  4310. if (node->getTerminal())
  4311. node->getTerminal()->traverse(this);
  4312. if (node->getTest()) {
  4313. node->getTest()->traverse(this);
  4314. spv::Id condition =
  4315. accessChainLoad(node->getTest()->getType());
  4316. builder.createConditionalBranch(condition, &blocks.head, &blocks.merge);
  4317. } else {
  4318. // TODO: unless there was a break/return/discard instruction
  4319. // somewhere in the body, this is an infinite loop, so we should
  4320. // issue a warning.
  4321. builder.createBranch(true, &blocks.head);
  4322. }
  4323. }
  4324. builder.setBuildPoint(&blocks.merge);
  4325. builder.closeLoop();
  4326. return false;
  4327. }
  4328. bool TGlslangToSpvTraverser::visitBranch(glslang::TVisit /* visit */, glslang::TIntermBranch* node)
  4329. {
  4330. if (node->getExpression())
  4331. node->getExpression()->traverse(this);
  4332. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4333. switch (node->getFlowOp()) {
  4334. case glslang::EOpKill:
  4335. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  4336. builder.addCapability(spv::Capability::DemoteToHelperInvocation);
  4337. builder.createNoResultOp(spv::Op::OpDemoteToHelperInvocationEXT);
  4338. } else {
  4339. builder.makeStatementTerminator(spv::Op::OpKill, "post-discard");
  4340. }
  4341. break;
  4342. case glslang::EOpTerminateInvocation:
  4343. builder.addExtension(spv::E_SPV_KHR_terminate_invocation);
  4344. builder.makeStatementTerminator(spv::Op::OpTerminateInvocation, "post-terminate-invocation");
  4345. break;
  4346. case glslang::EOpBreak:
  4347. if (breakForLoop.top())
  4348. builder.createLoopExit();
  4349. else
  4350. builder.addSwitchBreak(false);
  4351. break;
  4352. case glslang::EOpContinue:
  4353. builder.createLoopContinue();
  4354. break;
  4355. case glslang::EOpReturn:
  4356. if (node->getExpression() != nullptr) {
  4357. const glslang::TType& glslangReturnType = node->getExpression()->getType();
  4358. spv::Id returnId = accessChainLoad(glslangReturnType);
  4359. if (builder.getTypeId(returnId) != currentFunction->getReturnType() ||
  4360. TranslatePrecisionDecoration(glslangReturnType) != currentFunction->getReturnPrecision()) {
  4361. builder.clearAccessChain();
  4362. spv::Id copyId = builder.createVariable(currentFunction->getReturnPrecision(),
  4363. spv::StorageClass::Function, currentFunction->getReturnType());
  4364. builder.setAccessChainLValue(copyId);
  4365. multiTypeStore(glslangReturnType, returnId);
  4366. returnId = builder.createLoad(copyId, currentFunction->getReturnPrecision());
  4367. }
  4368. builder.makeReturn(false, returnId);
  4369. } else
  4370. builder.makeReturn(false);
  4371. builder.clearAccessChain();
  4372. break;
  4373. case glslang::EOpDemote:
  4374. builder.createNoResultOp(spv::Op::OpDemoteToHelperInvocationEXT);
  4375. builder.addExtension(spv::E_SPV_EXT_demote_to_helper_invocation);
  4376. builder.addCapability(spv::Capability::DemoteToHelperInvocationEXT);
  4377. break;
  4378. case glslang::EOpTerminateRayKHR:
  4379. builder.makeStatementTerminator(spv::Op::OpTerminateRayKHR, "post-terminateRayKHR");
  4380. break;
  4381. case glslang::EOpIgnoreIntersectionKHR:
  4382. builder.makeStatementTerminator(spv::Op::OpIgnoreIntersectionKHR, "post-ignoreIntersectionKHR");
  4383. break;
  4384. default:
  4385. assert(0);
  4386. break;
  4387. }
  4388. return false;
  4389. }
  4390. spv::Id TGlslangToSpvTraverser::createSpvVariable(const glslang::TIntermSymbol* node, spv::Id forcedType)
  4391. {
  4392. // First, steer off constants, which are not SPIR-V variables, but
  4393. // can still have a mapping to a SPIR-V Id.
  4394. // This includes specialization constants.
  4395. if (node->getQualifier().isConstant()) {
  4396. spv::Id result = createSpvConstant(*node);
  4397. if (result != spv::NoResult)
  4398. return result;
  4399. }
  4400. // Now, handle actual variables
  4401. spv::StorageClass storageClass = TranslateStorageClass(node->getType());
  4402. spv::Id spvType = forcedType == spv::NoType ? convertGlslangToSpvType(node->getType())
  4403. : forcedType;
  4404. const bool contains16BitType = node->getType().contains16BitFloat() ||
  4405. node->getType().contains16BitInt();
  4406. if (contains16BitType) {
  4407. switch (storageClass) {
  4408. case spv::StorageClass::Input:
  4409. case spv::StorageClass::Output:
  4410. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4411. builder.addCapability(spv::Capability::StorageInputOutput16);
  4412. break;
  4413. case spv::StorageClass::Uniform:
  4414. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4415. if (node->getType().getQualifier().storage == glslang::EvqBuffer)
  4416. builder.addCapability(spv::Capability::StorageUniformBufferBlock16);
  4417. else
  4418. builder.addCapability(spv::Capability::StorageUniform16);
  4419. break;
  4420. case spv::StorageClass::PushConstant:
  4421. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4422. builder.addCapability(spv::Capability::StoragePushConstant16);
  4423. break;
  4424. case spv::StorageClass::StorageBuffer:
  4425. case spv::StorageClass::PhysicalStorageBufferEXT:
  4426. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4427. builder.addCapability(spv::Capability::StorageUniformBufferBlock16);
  4428. break;
  4429. case spv::StorageClass::TileAttachmentQCOM:
  4430. builder.addCapability(spv::Capability::TileShadingQCOM);
  4431. break;
  4432. default:
  4433. if (storageClass == spv::StorageClass::Workgroup &&
  4434. node->getType().getBasicType() == glslang::EbtBlock) {
  4435. builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayout16BitAccessKHR);
  4436. break;
  4437. }
  4438. if (node->getType().contains16BitFloat())
  4439. builder.addCapability(spv::Capability::Float16);
  4440. if (node->getType().contains16BitInt())
  4441. builder.addCapability(spv::Capability::Int16);
  4442. break;
  4443. }
  4444. }
  4445. if (node->getType().contains8BitInt()) {
  4446. if (storageClass == spv::StorageClass::PushConstant) {
  4447. builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
  4448. builder.addCapability(spv::Capability::StoragePushConstant8);
  4449. } else if (storageClass == spv::StorageClass::Uniform) {
  4450. builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
  4451. builder.addCapability(spv::Capability::UniformAndStorageBuffer8BitAccess);
  4452. } else if (storageClass == spv::StorageClass::StorageBuffer) {
  4453. builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
  4454. builder.addCapability(spv::Capability::StorageBuffer8BitAccess);
  4455. } else if (storageClass == spv::StorageClass::Workgroup &&
  4456. node->getType().getBasicType() == glslang::EbtBlock) {
  4457. builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayout8BitAccessKHR);
  4458. } else {
  4459. builder.addCapability(spv::Capability::Int8);
  4460. }
  4461. }
  4462. const char* name = node->getName().c_str();
  4463. if (glslang::IsAnonymous(name))
  4464. name = "";
  4465. spv::Id initializer = spv::NoResult;
  4466. if (node->getType().getQualifier().storage == glslang::EvqUniform && !node->getConstArray().empty()) {
  4467. int nextConst = 0;
  4468. initializer = createSpvConstantFromConstUnionArray(node->getType(),
  4469. node->getConstArray(),
  4470. nextConst,
  4471. false /* specConst */);
  4472. } else if (node->getType().getQualifier().isNullInit()) {
  4473. initializer = builder.makeNullConstant(spvType);
  4474. }
  4475. spv::Id var = builder.createVariable(spv::NoPrecision, storageClass, spvType, name, initializer, false);
  4476. std::vector<spv::Decoration> topLevelDecorations;
  4477. glslang::TQualifier typeQualifier = node->getType().getQualifier();
  4478. TranslateMemoryDecoration(typeQualifier, topLevelDecorations, glslangIntermediate->usingVulkanMemoryModel());
  4479. for (auto deco : topLevelDecorations) {
  4480. builder.addDecoration(var, deco);
  4481. }
  4482. return var;
  4483. }
  4484. // Return type Id of the sampled type.
  4485. spv::Id TGlslangToSpvTraverser::getSampledType(const glslang::TSampler& sampler)
  4486. {
  4487. switch (sampler.type) {
  4488. case glslang::EbtInt: return builder.makeIntType(32);
  4489. case glslang::EbtUint: return builder.makeUintType(32);
  4490. case glslang::EbtFloat: return builder.makeFloatType(32);
  4491. case glslang::EbtFloat16:
  4492. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float_fetch);
  4493. builder.addCapability(spv::Capability::Float16ImageAMD);
  4494. return builder.makeFloatType(16);
  4495. case glslang::EbtInt64:
  4496. builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
  4497. builder.addCapability(spv::Capability::Int64ImageEXT);
  4498. return builder.makeIntType(64);
  4499. case glslang::EbtUint64:
  4500. builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
  4501. builder.addCapability(spv::Capability::Int64ImageEXT);
  4502. return builder.makeUintType(64);
  4503. default:
  4504. assert(0);
  4505. return builder.makeFloatType(32);
  4506. }
  4507. }
  4508. // If node is a swizzle operation, return the type that should be used if
  4509. // the swizzle base is first consumed by another operation, before the swizzle
  4510. // is applied.
  4511. spv::Id TGlslangToSpvTraverser::getInvertedSwizzleType(const glslang::TIntermTyped& node)
  4512. {
  4513. if (node.getAsOperator() &&
  4514. node.getAsOperator()->getOp() == glslang::EOpVectorSwizzle)
  4515. return convertGlslangToSpvType(node.getAsBinaryNode()->getLeft()->getType());
  4516. else
  4517. return spv::NoType;
  4518. }
  4519. // When inverting a swizzle with a parent op, this function
  4520. // will apply the swizzle operation to a completed parent operation.
  4521. spv::Id TGlslangToSpvTraverser::createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped& node,
  4522. spv::Id parentResult)
  4523. {
  4524. std::vector<unsigned> swizzle;
  4525. convertSwizzle(*node.getAsBinaryNode()->getRight()->getAsAggregate(), swizzle);
  4526. return builder.createRvalueSwizzle(precision, convertGlslangToSpvType(node.getType()), parentResult, swizzle);
  4527. }
  4528. // Convert a glslang AST swizzle node to a swizzle vector for building SPIR-V.
  4529. void TGlslangToSpvTraverser::convertSwizzle(const glslang::TIntermAggregate& node, std::vector<unsigned>& swizzle)
  4530. {
  4531. const glslang::TIntermSequence& swizzleSequence = node.getSequence();
  4532. for (int i = 0; i < (int)swizzleSequence.size(); ++i)
  4533. swizzle.push_back(swizzleSequence[i]->getAsConstantUnion()->getConstArray()[0].getIConst());
  4534. }
  4535. // Convert from a glslang type to an SPV type, by calling into a
  4536. // recursive version of this function. This establishes the inherited
  4537. // layout state rooted from the top-level type.
  4538. spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly)
  4539. {
  4540. return convertGlslangToSpvType(type, getExplicitLayout(type), type.getQualifier(), false, forwardReferenceOnly);
  4541. }
  4542. spv::LinkageType TGlslangToSpvTraverser::convertGlslangLinkageToSpv(glslang::TLinkType linkType)
  4543. {
  4544. switch (linkType) {
  4545. case glslang::ELinkExport:
  4546. return spv::LinkageType::Export;
  4547. default:
  4548. return spv::LinkageType::Max;
  4549. }
  4550. }
  4551. // Do full recursive conversion of an arbitrary glslang type to a SPIR-V Id.
  4552. // explicitLayout can be kept the same throughout the hierarchical recursive walk.
  4553. // Mutually recursive with convertGlslangStructToSpvType().
  4554. spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type,
  4555. glslang::TLayoutPacking explicitLayout, const glslang::TQualifier& qualifier,
  4556. bool lastBufferBlockMember, bool forwardReferenceOnly)
  4557. {
  4558. spv::Id spvType = spv::NoResult;
  4559. switch (type.getBasicType()) {
  4560. case glslang::EbtVoid:
  4561. spvType = builder.makeVoidType();
  4562. assert (! type.isArray());
  4563. break;
  4564. case glslang::EbtBool:
  4565. // "transparent" bool doesn't exist in SPIR-V. The GLSL convention is
  4566. // a 32-bit int where non-0 means true.
  4567. if (explicitLayout != glslang::ElpNone)
  4568. spvType = builder.makeUintType(32);
  4569. else
  4570. spvType = builder.makeBoolType();
  4571. break;
  4572. case glslang::EbtInt:
  4573. spvType = builder.makeIntType(32);
  4574. break;
  4575. case glslang::EbtUint:
  4576. spvType = builder.makeUintType(32);
  4577. break;
  4578. case glslang::EbtFloat:
  4579. spvType = builder.makeFloatType(32);
  4580. break;
  4581. case glslang::EbtDouble:
  4582. spvType = builder.makeFloatType(64);
  4583. break;
  4584. case glslang::EbtFloat16:
  4585. spvType = builder.makeFloatType(16);
  4586. break;
  4587. case glslang::EbtBFloat16:
  4588. spvType = builder.makeBFloat16Type();
  4589. break;
  4590. case glslang::EbtFloatE5M2:
  4591. spvType = builder.makeFloatE5M2Type();
  4592. break;
  4593. case glslang::EbtFloatE4M3:
  4594. spvType = builder.makeFloatE4M3Type();
  4595. break;
  4596. case glslang::EbtInt8:
  4597. spvType = builder.makeIntType(8);
  4598. break;
  4599. case glslang::EbtUint8:
  4600. spvType = builder.makeUintType(8);
  4601. break;
  4602. case glslang::EbtInt16:
  4603. spvType = builder.makeIntType(16);
  4604. break;
  4605. case glslang::EbtUint16:
  4606. spvType = builder.makeUintType(16);
  4607. break;
  4608. case glslang::EbtInt64:
  4609. spvType = builder.makeIntType(64);
  4610. break;
  4611. case glslang::EbtUint64:
  4612. spvType = builder.makeUintType(64);
  4613. break;
  4614. case glslang::EbtAtomicUint:
  4615. builder.addCapability(spv::Capability::AtomicStorage);
  4616. spvType = builder.makeUintType(32);
  4617. break;
  4618. case glslang::EbtAccStruct:
  4619. switch (glslangIntermediate->getStage()) {
  4620. case EShLangRayGen:
  4621. case EShLangIntersect:
  4622. case EShLangAnyHit:
  4623. case EShLangClosestHit:
  4624. case EShLangMiss:
  4625. case EShLangCallable:
  4626. // these all should have the RayTracingNV/KHR capability already
  4627. break;
  4628. default:
  4629. {
  4630. auto& extensions = glslangIntermediate->getRequestedExtensions();
  4631. if (extensions.find("GL_EXT_ray_query") != extensions.end()) {
  4632. builder.addExtension(spv::E_SPV_KHR_ray_query);
  4633. builder.addCapability(spv::Capability::RayQueryKHR);
  4634. }
  4635. }
  4636. break;
  4637. }
  4638. spvType = builder.makeAccelerationStructureType();
  4639. break;
  4640. case glslang::EbtRayQuery:
  4641. {
  4642. auto& extensions = glslangIntermediate->getRequestedExtensions();
  4643. if (extensions.find("GL_EXT_ray_query") != extensions.end()) {
  4644. builder.addExtension(spv::E_SPV_KHR_ray_query);
  4645. builder.addCapability(spv::Capability::RayQueryKHR);
  4646. }
  4647. spvType = builder.makeRayQueryType();
  4648. }
  4649. break;
  4650. case glslang::EbtReference:
  4651. {
  4652. // Make the forward pointer, then recurse to convert the structure type, then
  4653. // patch up the forward pointer with a real pointer type.
  4654. if (forwardPointers.find(type.getReferentType()) == forwardPointers.end()) {
  4655. spv::Id forwardId = builder.makeForwardPointer(spv::StorageClass::PhysicalStorageBufferEXT);
  4656. forwardPointers[type.getReferentType()] = forwardId;
  4657. }
  4658. spvType = forwardPointers[type.getReferentType()];
  4659. if (!forwardReferenceOnly) {
  4660. spv::Id referentType = convertGlslangToSpvType(*type.getReferentType());
  4661. builder.makePointerFromForwardPointer(spv::StorageClass::PhysicalStorageBufferEXT,
  4662. forwardPointers[type.getReferentType()],
  4663. referentType);
  4664. }
  4665. }
  4666. break;
  4667. case glslang::EbtSampler:
  4668. {
  4669. const glslang::TSampler& sampler = type.getSampler();
  4670. if (sampler.isPureSampler()) {
  4671. spvType = builder.makeSamplerType();
  4672. } else {
  4673. // an image is present, make its type
  4674. spvType = builder.makeImageType(getSampledType(sampler), TranslateDimensionality(sampler),
  4675. sampler.isShadow(), sampler.isArrayed(), sampler.isMultiSample(),
  4676. sampler.isImageClass() ? 2 : 1, TranslateImageFormat(type));
  4677. if (sampler.isCombined() &&
  4678. (!sampler.isBuffer() || glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_6)) {
  4679. // Already has both image and sampler, make the combined type. Only combine sampler to
  4680. // buffer if before SPIR-V 1.6.
  4681. spvType = builder.makeSampledImageType(spvType);
  4682. }
  4683. }
  4684. }
  4685. break;
  4686. case glslang::EbtStruct:
  4687. case glslang::EbtBlock:
  4688. {
  4689. // If we've seen this struct type, return it
  4690. const glslang::TTypeList* glslangMembers = type.getStruct();
  4691. // Try to share structs for different layouts, but not yet for other
  4692. // kinds of qualification (primarily not yet including interpolant qualification).
  4693. if (! HasNonLayoutQualifiers(type, qualifier))
  4694. spvType = structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers];
  4695. if (spvType != spv::NoResult)
  4696. break;
  4697. // else, we haven't seen it...
  4698. if (type.getBasicType() == glslang::EbtBlock)
  4699. memberRemapper[glslangTypeToIdMap[glslangMembers]].resize(glslangMembers->size());
  4700. spvType = convertGlslangStructToSpvType(type, glslangMembers, explicitLayout, qualifier);
  4701. }
  4702. break;
  4703. case glslang::EbtString:
  4704. // no type used for OpString
  4705. return 0;
  4706. case glslang::EbtHitObjectNV: {
  4707. builder.addExtension(spv::E_SPV_NV_shader_invocation_reorder);
  4708. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  4709. spvType = builder.makeHitObjectNVType();
  4710. }
  4711. break;
  4712. case glslang::EbtSpirvType: {
  4713. // GL_EXT_spirv_intrinsics
  4714. const auto& spirvType = type.getSpirvType();
  4715. const auto& spirvInst = spirvType.spirvInst;
  4716. std::vector<spv::IdImmediate> operands;
  4717. for (const auto& typeParam : spirvType.typeParams) {
  4718. if (typeParam.getAsConstant() != nullptr) {
  4719. // Constant expression
  4720. auto constant = typeParam.getAsConstant();
  4721. if (constant->isLiteral()) {
  4722. if (constant->getBasicType() == glslang::EbtFloat) {
  4723. float floatValue = static_cast<float>(constant->getConstArray()[0].getDConst());
  4724. unsigned literal;
  4725. static_assert(sizeof(literal) == sizeof(floatValue), "sizeof(unsigned) != sizeof(float)");
  4726. memcpy(&literal, &floatValue, sizeof(literal));
  4727. operands.push_back({false, literal});
  4728. } else if (constant->getBasicType() == glslang::EbtInt) {
  4729. unsigned literal = constant->getConstArray()[0].getIConst();
  4730. operands.push_back({false, literal});
  4731. } else if (constant->getBasicType() == glslang::EbtUint) {
  4732. unsigned literal = constant->getConstArray()[0].getUConst();
  4733. operands.push_back({false, literal});
  4734. } else if (constant->getBasicType() == glslang::EbtBool) {
  4735. unsigned literal = constant->getConstArray()[0].getBConst();
  4736. operands.push_back({false, literal});
  4737. } else if (constant->getBasicType() == glslang::EbtString) {
  4738. auto str = constant->getConstArray()[0].getSConst()->c_str();
  4739. unsigned literal = 0;
  4740. char* literalPtr = reinterpret_cast<char*>(&literal);
  4741. unsigned charCount = 0;
  4742. char ch = 0;
  4743. do {
  4744. ch = *(str++);
  4745. *(literalPtr++) = ch;
  4746. ++charCount;
  4747. if (charCount == 4) {
  4748. operands.push_back({false, literal});
  4749. literalPtr = reinterpret_cast<char*>(&literal);
  4750. charCount = 0;
  4751. }
  4752. } while (ch != 0);
  4753. // Partial literal is padded with 0
  4754. if (charCount > 0) {
  4755. for (; charCount < 4; ++charCount)
  4756. *(literalPtr++) = 0;
  4757. operands.push_back({false, literal});
  4758. }
  4759. } else
  4760. assert(0); // Unexpected type
  4761. } else
  4762. operands.push_back({true, createSpvConstant(*constant)});
  4763. } else {
  4764. // Type specifier
  4765. assert(typeParam.getAsType() != nullptr);
  4766. operands.push_back({true, convertGlslangToSpvType(*typeParam.getAsType())});
  4767. }
  4768. }
  4769. assert(spirvInst.set == ""); // Currently, couldn't be extended instructions.
  4770. spvType = builder.makeGenericType(static_cast<spv::Op>(spirvInst.id), operands);
  4771. break;
  4772. }
  4773. case glslang::EbtTensorLayoutNV:
  4774. {
  4775. builder.addCapability(spv::Capability::TensorAddressingNV);
  4776. builder.addExtension(spv::E_SPV_NV_tensor_addressing);
  4777. std::vector<spv::IdImmediate> operands;
  4778. for (uint32_t i = 0; i < 2; ++i) {
  4779. operands.push_back({true, makeArraySizeId(*type.getTypeParameters()->arraySizes, i, true)});
  4780. }
  4781. spvType = builder.makeGenericType(spv::Op::OpTypeTensorLayoutNV, operands);
  4782. break;
  4783. }
  4784. case glslang::EbtTensorViewNV:
  4785. {
  4786. builder.addCapability(spv::Capability::TensorAddressingNV);
  4787. builder.addExtension(spv::E_SPV_NV_tensor_addressing);
  4788. uint32_t dim = type.getTypeParameters()->arraySizes->getDimSize(0);
  4789. assert(dim >= 1 && dim <= 5);
  4790. std::vector<spv::IdImmediate> operands;
  4791. for (uint32_t i = 0; i < dim + 2; ++i) {
  4792. operands.push_back({true, makeArraySizeId(*type.getTypeParameters()->arraySizes, i, true, i==1)});
  4793. }
  4794. spvType = builder.makeGenericType(spv::Op::OpTypeTensorViewNV, operands);
  4795. break;
  4796. }
  4797. default:
  4798. assert(0);
  4799. break;
  4800. }
  4801. if (type.isMatrix())
  4802. spvType = builder.makeMatrixType(spvType, type.getMatrixCols(), type.getMatrixRows());
  4803. else {
  4804. // If this variable has a vector element count greater than 1, create a SPIR-V vector
  4805. if (type.getVectorSize() > 1)
  4806. spvType = builder.makeVectorType(spvType, type.getVectorSize());
  4807. }
  4808. if (type.isCoopMatNV()) {
  4809. builder.addCapability(spv::Capability::CooperativeMatrixNV);
  4810. builder.addExtension(spv::E_SPV_NV_cooperative_matrix);
  4811. if (type.getBasicType() == glslang::EbtFloat16)
  4812. builder.addCapability(spv::Capability::Float16);
  4813. if (type.getBasicType() == glslang::EbtUint8 ||
  4814. type.getBasicType() == glslang::EbtInt8) {
  4815. builder.addCapability(spv::Capability::Int8);
  4816. }
  4817. spv::Id scope = makeArraySizeId(*type.getTypeParameters()->arraySizes, 1);
  4818. spv::Id rows = makeArraySizeId(*type.getTypeParameters()->arraySizes, 2);
  4819. spv::Id cols = makeArraySizeId(*type.getTypeParameters()->arraySizes, 3);
  4820. spvType = builder.makeCooperativeMatrixTypeNV(spvType, scope, rows, cols);
  4821. }
  4822. if (type.isCoopMatKHR()) {
  4823. builder.addCapability(spv::Capability::CooperativeMatrixKHR);
  4824. builder.addExtension(spv::E_SPV_KHR_cooperative_matrix);
  4825. if (type.getBasicType() == glslang::EbtBFloat16) {
  4826. builder.addExtension(spv::E_SPV_KHR_bfloat16);
  4827. builder.addCapability(spv::Capability::BFloat16CooperativeMatrixKHR);
  4828. }
  4829. if (type.getBasicType() == glslang::EbtFloatE5M2 || type.getBasicType() == glslang::EbtFloatE4M3) {
  4830. builder.addExtension(spv::E_SPV_EXT_float8);
  4831. builder.addCapability(spv::Capability::Float8CooperativeMatrixEXT);
  4832. }
  4833. if (type.getBasicType() == glslang::EbtFloat16)
  4834. builder.addCapability(spv::Capability::Float16);
  4835. if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == glslang::EbtInt8) {
  4836. builder.addCapability(spv::Capability::Int8);
  4837. }
  4838. spv::Id scope = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  4839. spv::Id rows = makeArraySizeId(*type.getTypeParameters()->arraySizes, 1);
  4840. spv::Id cols = makeArraySizeId(*type.getTypeParameters()->arraySizes, 2);
  4841. spv::Id use = builder.makeUintConstant(type.getCoopMatKHRuse());
  4842. spvType = builder.makeCooperativeMatrixTypeKHR(spvType, scope, rows, cols, use);
  4843. }
  4844. else if (type.isTensorARM()) {
  4845. builder.addCapability(spv::Capability::TensorsARM);
  4846. builder.addExtension(spv::E_SPV_ARM_tensors);
  4847. if (type.getBasicType() == glslang::EbtInt8 || type.getBasicType() == glslang::EbtUint8) {
  4848. builder.addCapability(spv::Capability::Int8);
  4849. } else if (type.getBasicType() == glslang::EbtInt16 ||
  4850. type.getBasicType() == glslang::EbtUint16) {
  4851. builder.addCapability(spv::Capability::Int16);
  4852. } else if (type.getBasicType() == glslang::EbtInt64 ||
  4853. type.getBasicType() == glslang::EbtUint64) {
  4854. builder.addCapability(spv::Capability::Int64);
  4855. } else if (type.getBasicType() == glslang::EbtFloat16) {
  4856. builder.addCapability(spv::Capability::Float16);
  4857. }
  4858. spv::Id rank = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  4859. spvType = builder.makeTensorTypeARM(spvType, rank);
  4860. }
  4861. if (type.isCoopVecNV()) {
  4862. builder.addCapability(spv::Capability::CooperativeVectorNV);
  4863. builder.addExtension(spv::E_SPV_NV_cooperative_vector);
  4864. if (type.getBasicType() == glslang::EbtFloat16)
  4865. builder.addCapability(spv::Capability::Float16);
  4866. if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == glslang::EbtInt8) {
  4867. builder.addCapability(spv::Capability::Int8);
  4868. }
  4869. spv::Id components = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  4870. spvType = builder.makeCooperativeVectorTypeNV(spvType, components);
  4871. }
  4872. if (type.isArray()) {
  4873. int stride = 0; // keep this 0 unless doing an explicit layout; 0 will mean no decoration, no stride
  4874. // Do all but the outer dimension
  4875. if (type.getArraySizes()->getNumDims() > 1) {
  4876. // We need to decorate array strides for types needing explicit layout, except blocks.
  4877. if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock) {
  4878. // Use a dummy glslang type for querying internal strides of
  4879. // arrays of arrays, but using just a one-dimensional array.
  4880. glslang::TType simpleArrayType(type, 0); // deference type of the array
  4881. while (simpleArrayType.getArraySizes()->getNumDims() > 1)
  4882. simpleArrayType.getArraySizes()->dereference();
  4883. // Will compute the higher-order strides here, rather than making a whole
  4884. // pile of types and doing repetitive recursion on their contents.
  4885. stride = getArrayStride(simpleArrayType, explicitLayout, qualifier.layoutMatrix);
  4886. }
  4887. // make the arrays
  4888. for (int dim = type.getArraySizes()->getNumDims() - 1; dim > 0; --dim) {
  4889. spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), dim), stride);
  4890. if (stride > 0)
  4891. builder.addDecoration(spvType, spv::Decoration::ArrayStride, stride);
  4892. stride *= type.getArraySizes()->getDimSize(dim);
  4893. }
  4894. } else {
  4895. // single-dimensional array, and don't yet have stride
  4896. // We need to decorate array strides for types needing explicit layout, except blocks.
  4897. if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock)
  4898. stride = getArrayStride(type, explicitLayout, qualifier.layoutMatrix);
  4899. }
  4900. // Do the outer dimension, which might not be known for a runtime-sized array.
  4901. // (Unsized arrays that survive through linking will be runtime-sized arrays)
  4902. if (type.isSizedArray())
  4903. spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), 0), stride);
  4904. else {
  4905. if (!lastBufferBlockMember) {
  4906. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  4907. builder.addCapability(spv::Capability::RuntimeDescriptorArrayEXT);
  4908. }
  4909. spvType = builder.makeRuntimeArray(spvType);
  4910. }
  4911. if (stride > 0)
  4912. builder.addDecoration(spvType, spv::Decoration::ArrayStride, stride);
  4913. }
  4914. return spvType;
  4915. }
  4916. // Apply SPIR-V decorations to the SPIR-V object (provided by SPIR-V ID). If member index is provided, the
  4917. // decorations are applied to this member.
  4918. void TGlslangToSpvTraverser::applySpirvDecorate(const glslang::TType& type, spv::Id id, std::optional<int> member)
  4919. {
  4920. assert(type.getQualifier().hasSpirvDecorate());
  4921. const glslang::TSpirvDecorate& spirvDecorate = type.getQualifier().getSpirvDecorate();
  4922. // Add spirv_decorate
  4923. for (auto& decorate : spirvDecorate.decorates) {
  4924. if (!decorate.second.empty()) {
  4925. std::vector<unsigned> literals;
  4926. TranslateLiterals(decorate.second, literals);
  4927. if (member.has_value())
  4928. builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorate.first), literals);
  4929. else
  4930. builder.addDecoration(id, static_cast<spv::Decoration>(decorate.first), literals);
  4931. } else {
  4932. if (member.has_value())
  4933. builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorate.first));
  4934. else
  4935. builder.addDecoration(id, static_cast<spv::Decoration>(decorate.first));
  4936. }
  4937. }
  4938. // Add spirv_decorate_id
  4939. if (member.has_value()) {
  4940. // spirv_decorate_id not applied to members
  4941. assert(spirvDecorate.decorateIds.empty());
  4942. } else {
  4943. for (auto& decorateId : spirvDecorate.decorateIds) {
  4944. std::vector<spv::Id> operandIds;
  4945. assert(!decorateId.second.empty());
  4946. for (auto extraOperand : decorateId.second) {
  4947. if (extraOperand->getQualifier().isFrontEndConstant())
  4948. operandIds.push_back(createSpvConstant(*extraOperand));
  4949. else
  4950. operandIds.push_back(getSymbolId(extraOperand->getAsSymbolNode()));
  4951. }
  4952. builder.addDecorationId(id, static_cast<spv::Decoration>(decorateId.first), operandIds);
  4953. }
  4954. }
  4955. // Add spirv_decorate_string
  4956. for (auto& decorateString : spirvDecorate.decorateStrings) {
  4957. std::vector<const char*> strings;
  4958. assert(!decorateString.second.empty());
  4959. for (auto extraOperand : decorateString.second) {
  4960. const char* string = extraOperand->getConstArray()[0].getSConst()->c_str();
  4961. strings.push_back(string);
  4962. }
  4963. if (member.has_value())
  4964. builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorateString.first), strings);
  4965. else
  4966. builder.addDecoration(id, static_cast<spv::Decoration>(decorateString.first), strings);
  4967. }
  4968. }
  4969. // TODO: this functionality should exist at a higher level, in creating the AST
  4970. //
  4971. // Identify interface members that don't have their required extension turned on.
  4972. //
  4973. bool TGlslangToSpvTraverser::filterMember(const glslang::TType& member)
  4974. {
  4975. auto& extensions = glslangIntermediate->getRequestedExtensions();
  4976. if (member.getFieldName() == "gl_SecondaryViewportMaskNV" &&
  4977. extensions.find("GL_NV_stereo_view_rendering") == extensions.end())
  4978. return true;
  4979. if (member.getFieldName() == "gl_SecondaryPositionNV" &&
  4980. extensions.find("GL_NV_stereo_view_rendering") == extensions.end())
  4981. return true;
  4982. if (glslangIntermediate->getStage() == EShLangMesh) {
  4983. if (member.getFieldName() == "gl_PrimitiveShadingRateEXT" &&
  4984. extensions.find("GL_EXT_fragment_shading_rate") == extensions.end())
  4985. return true;
  4986. }
  4987. if (glslangIntermediate->getStage() != EShLangMesh) {
  4988. if (member.getFieldName() == "gl_ViewportMask" &&
  4989. extensions.find("GL_NV_viewport_array2") == extensions.end())
  4990. return true;
  4991. if (member.getFieldName() == "gl_PositionPerViewNV" &&
  4992. extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())
  4993. return true;
  4994. if (member.getFieldName() == "gl_ViewportMaskPerViewNV" &&
  4995. extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())
  4996. return true;
  4997. }
  4998. return false;
  4999. }
  5000. // Do full recursive conversion of a glslang structure (or block) type to a SPIR-V Id.
  5001. // explicitLayout can be kept the same throughout the hierarchical recursive walk.
  5002. // Mutually recursive with convertGlslangToSpvType().
  5003. spv::Id TGlslangToSpvTraverser::convertGlslangStructToSpvType(const glslang::TType& type,
  5004. const glslang::TTypeList* glslangMembers,
  5005. glslang::TLayoutPacking explicitLayout,
  5006. const glslang::TQualifier& qualifier)
  5007. {
  5008. // Create a vector of struct types for SPIR-V to consume
  5009. std::vector<spv::Id> spvMembers;
  5010. int memberDelta = 0; // how much the member's index changes from glslang to SPIR-V, normally 0,
  5011. // except sometimes for blocks
  5012. std::vector<std::pair<glslang::TType*, glslang::TQualifier> > deferredForwardPointers;
  5013. for (int i = 0; i < (int)glslangMembers->size(); i++) {
  5014. auto& glslangMember = (*glslangMembers)[i];
  5015. if (glslangMember.type->hiddenMember()) {
  5016. ++memberDelta;
  5017. if (type.getBasicType() == glslang::EbtBlock)
  5018. memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = -1;
  5019. } else {
  5020. if (type.getBasicType() == glslang::EbtBlock) {
  5021. if (filterMember(*glslangMember.type)) {
  5022. memberDelta++;
  5023. memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = -1;
  5024. continue;
  5025. }
  5026. memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = i - memberDelta;
  5027. }
  5028. // modify just this child's view of the qualifier
  5029. glslang::TQualifier memberQualifier = glslangMember.type->getQualifier();
  5030. InheritQualifiers(memberQualifier, qualifier);
  5031. // manually inherit location
  5032. if (! memberQualifier.hasLocation() && qualifier.hasLocation())
  5033. memberQualifier.layoutLocation = qualifier.layoutLocation;
  5034. // recurse
  5035. bool lastBufferBlockMember = qualifier.storage == glslang::EvqBuffer &&
  5036. i == (int)glslangMembers->size() - 1;
  5037. // Make forward pointers for any pointer members.
  5038. if (glslangMember.type->isReference() &&
  5039. forwardPointers.find(glslangMember.type->getReferentType()) == forwardPointers.end()) {
  5040. deferredForwardPointers.push_back(std::make_pair(glslangMember.type, memberQualifier));
  5041. }
  5042. // Create the member type.
  5043. auto const spvMember = convertGlslangToSpvType(*glslangMember.type, explicitLayout, memberQualifier, lastBufferBlockMember,
  5044. glslangMember.type->isReference());
  5045. spvMembers.push_back(spvMember);
  5046. // Update the builder with the type's location so that we can create debug types for the structure members.
  5047. // There doesn't exist a "clean" entry point for this information to be passed along to the builder so, for now,
  5048. // it is stored in the builder and consumed during the construction of composite debug types.
  5049. // TODO: This probably warrants further investigation. This approach was decided to be the least ugly of the
  5050. // quick and dirty approaches that were tried.
  5051. // Advantages of this approach:
  5052. // + Relatively clean. No direct calls into debug type system.
  5053. // + Handles nested recursive structures.
  5054. // Disadvantages of this approach:
  5055. // + Not as clean as desired. Traverser queries/sets persistent state. This is fragile.
  5056. // + Table lookup during creation of composite debug types. This really shouldn't be necessary.
  5057. if(options.emitNonSemanticShaderDebugInfo) {
  5058. builder.debugTypeLocs[spvMember].name = glslangMember.type->getFieldName().c_str();
  5059. builder.debugTypeLocs[spvMember].line = glslangMember.loc.line;
  5060. builder.debugTypeLocs[spvMember].column = glslangMember.loc.column;
  5061. }
  5062. }
  5063. }
  5064. // Make the SPIR-V type
  5065. spv::Id spvType = builder.makeStructType(spvMembers, type.getTypeName().c_str(), false);
  5066. if (! HasNonLayoutQualifiers(type, qualifier))
  5067. structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers] = spvType;
  5068. // Decorate it
  5069. decorateStructType(type, glslangMembers, explicitLayout, qualifier, spvType, spvMembers);
  5070. for (int i = 0; i < (int)deferredForwardPointers.size(); ++i) {
  5071. auto it = deferredForwardPointers[i];
  5072. convertGlslangToSpvType(*it.first, explicitLayout, it.second, false);
  5073. }
  5074. return spvType;
  5075. }
  5076. void TGlslangToSpvTraverser::decorateStructType(const glslang::TType& type,
  5077. const glslang::TTypeList* glslangMembers,
  5078. glslang::TLayoutPacking explicitLayout,
  5079. const glslang::TQualifier& qualifier,
  5080. spv::Id spvType,
  5081. const std::vector<spv::Id>& spvMembers)
  5082. {
  5083. // Name and decorate the non-hidden members
  5084. int offset = -1;
  5085. bool memberLocationInvalid = type.isArrayOfArrays() ||
  5086. (type.isArray() && (type.getQualifier().isArrayedIo(glslangIntermediate->getStage()) == false));
  5087. for (int i = 0; i < (int)glslangMembers->size(); i++) {
  5088. glslang::TType& glslangMember = *(*glslangMembers)[i].type;
  5089. int member = i;
  5090. if (type.getBasicType() == glslang::EbtBlock) {
  5091. member = memberRemapper[glslangTypeToIdMap[glslangMembers]][i];
  5092. if (filterMember(glslangMember))
  5093. continue;
  5094. }
  5095. // modify just this child's view of the qualifier
  5096. glslang::TQualifier memberQualifier = glslangMember.getQualifier();
  5097. InheritQualifiers(memberQualifier, qualifier);
  5098. // using -1 above to indicate a hidden member
  5099. if (member < 0)
  5100. continue;
  5101. builder.addMemberName(spvType, member, glslangMember.getFieldName().c_str());
  5102. builder.addMemberDecoration(spvType, member,
  5103. TranslateLayoutDecoration(glslangMember, memberQualifier.layoutMatrix));
  5104. builder.addMemberDecoration(spvType, member, TranslatePrecisionDecoration(glslangMember));
  5105. // Add interpolation and auxiliary storage decorations only to
  5106. // top-level members of Input and Output storage classes
  5107. if (type.getQualifier().storage == glslang::EvqVaryingIn ||
  5108. type.getQualifier().storage == glslang::EvqVaryingOut) {
  5109. if (type.getBasicType() == glslang::EbtBlock ||
  5110. glslangIntermediate->getSource() == glslang::EShSourceHlsl) {
  5111. builder.addMemberDecoration(spvType, member, TranslateInterpolationDecoration(memberQualifier));
  5112. builder.addMemberDecoration(spvType, member, TranslateAuxiliaryStorageDecoration(memberQualifier));
  5113. addMeshNVDecoration(spvType, member, memberQualifier);
  5114. }
  5115. }
  5116. builder.addMemberDecoration(spvType, member, TranslateInvariantDecoration(memberQualifier));
  5117. if (type.getBasicType() == glslang::EbtBlock &&
  5118. qualifier.storage == glslang::EvqBuffer) {
  5119. // Add memory decorations only to top-level members of shader storage block
  5120. std::vector<spv::Decoration> memory;
  5121. TranslateMemoryDecoration(memberQualifier, memory, glslangIntermediate->usingVulkanMemoryModel());
  5122. for (unsigned int i = 0; i < memory.size(); ++i)
  5123. builder.addMemberDecoration(spvType, member, memory[i]);
  5124. }
  5125. // Location assignment was already completed correctly by the front end,
  5126. // just track whether a member needs to be decorated.
  5127. // Ignore member locations if the container is an array, as that's
  5128. // ill-specified and decisions have been made to not allow this.
  5129. if (!memberLocationInvalid && memberQualifier.hasLocation())
  5130. builder.addMemberDecoration(spvType, member, spv::Decoration::Location, memberQualifier.layoutLocation);
  5131. // component, XFB, others
  5132. if (glslangMember.getQualifier().hasComponent())
  5133. builder.addMemberDecoration(spvType, member, spv::Decoration::Component,
  5134. glslangMember.getQualifier().layoutComponent);
  5135. if (glslangMember.getQualifier().hasXfbOffset())
  5136. builder.addMemberDecoration(spvType, member, spv::Decoration::Offset,
  5137. glslangMember.getQualifier().layoutXfbOffset);
  5138. else if (explicitLayout != glslang::ElpNone) {
  5139. // figure out what to do with offset, which is accumulating
  5140. int nextOffset;
  5141. updateMemberOffset(type, glslangMember, offset, nextOffset, explicitLayout, memberQualifier.layoutMatrix);
  5142. if (offset >= 0)
  5143. builder.addMemberDecoration(spvType, member, spv::Decoration::Offset, offset);
  5144. offset = nextOffset;
  5145. }
  5146. if (glslangMember.isMatrix() && explicitLayout != glslang::ElpNone)
  5147. builder.addMemberDecoration(spvType, member, spv::Decoration::MatrixStride,
  5148. getMatrixStride(glslangMember, explicitLayout, memberQualifier.layoutMatrix));
  5149. // built-in variable decorations
  5150. spv::BuiltIn builtIn = TranslateBuiltInDecoration(glslangMember.getQualifier().builtIn, true);
  5151. if (builtIn != spv::BuiltIn::Max)
  5152. builder.addMemberDecoration(spvType, member, spv::Decoration::BuiltIn, (int)builtIn);
  5153. // nonuniform
  5154. builder.addMemberDecoration(spvType, member, TranslateNonUniformDecoration(glslangMember.getQualifier()));
  5155. if (glslangIntermediate->getHlslFunctionality1() && memberQualifier.semanticName != nullptr) {
  5156. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  5157. builder.addMemberDecoration(spvType, member, spv::Decoration::HlslSemanticGOOGLE,
  5158. memberQualifier.semanticName);
  5159. }
  5160. if (builtIn == spv::BuiltIn::Layer) {
  5161. // SPV_NV_viewport_array2 extension
  5162. if (glslangMember.getQualifier().layoutViewportRelative){
  5163. builder.addMemberDecoration(spvType, member, spv::Decoration::ViewportRelativeNV);
  5164. builder.addCapability(spv::Capability::ShaderViewportMaskNV);
  5165. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  5166. }
  5167. if (glslangMember.getQualifier().layoutSecondaryViewportRelativeOffset != -2048){
  5168. builder.addMemberDecoration(spvType, member,
  5169. spv::Decoration::SecondaryViewportRelativeNV,
  5170. glslangMember.getQualifier().layoutSecondaryViewportRelativeOffset);
  5171. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  5172. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  5173. }
  5174. }
  5175. if (glslangMember.getQualifier().layoutPassthrough) {
  5176. builder.addMemberDecoration(spvType, member, spv::Decoration::PassthroughNV);
  5177. builder.addCapability(spv::Capability::GeometryShaderPassthroughNV);
  5178. builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);
  5179. }
  5180. // Add SPIR-V decorations (GL_EXT_spirv_intrinsics)
  5181. if (glslangMember.getQualifier().hasSpirvDecorate())
  5182. applySpirvDecorate(glslangMember, spvType, member);
  5183. }
  5184. // Decorate the structure
  5185. builder.addDecoration(spvType, TranslateLayoutDecoration(type, qualifier.layoutMatrix));
  5186. const auto basicType = type.getBasicType();
  5187. const auto typeStorageQualifier = type.getQualifier().storage;
  5188. if (basicType == glslang::EbtBlock) {
  5189. builder.addDecoration(spvType, TranslateBlockDecoration(typeStorageQualifier, glslangIntermediate->usingStorageBuffer()));
  5190. } else if (basicType == glslang::EbtStruct && glslangIntermediate->getSpv().vulkan > 0) {
  5191. const auto hasRuntimeArray = !spvMembers.empty() && builder.getOpCode(spvMembers.back()) == spv::Op::OpTypeRuntimeArray;
  5192. if (hasRuntimeArray) {
  5193. builder.addDecoration(spvType, TranslateBlockDecoration(typeStorageQualifier, glslangIntermediate->usingStorageBuffer()));
  5194. }
  5195. }
  5196. if (qualifier.hasHitObjectShaderRecordNV())
  5197. builder.addDecoration(spvType, spv::Decoration::HitObjectShaderRecordBufferNV);
  5198. }
  5199. // Turn the expression forming the array size into an id.
  5200. // This is not quite trivial, because of specialization constants.
  5201. // Sometimes, a raw constant is turned into an Id, and sometimes
  5202. // a specialization constant expression is.
  5203. spv::Id TGlslangToSpvTraverser::makeArraySizeId(const glslang::TArraySizes& arraySizes, int dim, bool allowZero, bool boolType)
  5204. {
  5205. // First, see if this is sized with a node, meaning a specialization constant:
  5206. glslang::TIntermTyped* specNode = arraySizes.getDimNode(dim);
  5207. if (specNode != nullptr) {
  5208. builder.clearAccessChain();
  5209. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  5210. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  5211. specNode->traverse(this);
  5212. return accessChainLoad(specNode->getAsTyped()->getType());
  5213. }
  5214. // Otherwise, need a compile-time (front end) size, get it:
  5215. int size = arraySizes.getDimSize(dim);
  5216. if (!allowZero)
  5217. assert(size > 0);
  5218. if (boolType) {
  5219. return builder.makeBoolConstant(size);
  5220. } else {
  5221. return builder.makeUintConstant(size);
  5222. }
  5223. }
  5224. // Wrap the builder's accessChainLoad to:
  5225. // - localize handling of RelaxedPrecision
  5226. // - use the SPIR-V inferred type instead of another conversion of the glslang type
  5227. // (avoids unnecessary work and possible type punning for structures)
  5228. // - do conversion of concrete to abstract type
  5229. spv::Id TGlslangToSpvTraverser::accessChainLoad(const glslang::TType& type)
  5230. {
  5231. spv::Id nominalTypeId = builder.accessChainGetInferredType();
  5232. spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
  5233. coherentFlags |= TranslateCoherent(type);
  5234. spv::MemoryAccessMask accessMask = spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) & ~spv::MemoryAccessMask::MakePointerAvailableKHR);
  5235. // If the value being loaded is HelperInvocation, SPIR-V 1.6 is being generated (so that
  5236. // SPV_EXT_demote_to_helper_invocation is in core) and the memory model is in use, add
  5237. // the Volatile MemoryAccess semantic.
  5238. if (type.getQualifier().builtIn == glslang::EbvHelperInvocation &&
  5239. glslangIntermediate->usingVulkanMemoryModel() &&
  5240. glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  5241. accessMask = spv::MemoryAccessMask(accessMask | spv::MemoryAccessMask::Volatile);
  5242. }
  5243. unsigned int alignment = builder.getAccessChain().alignment;
  5244. alignment |= type.getBufferReferenceAlignment();
  5245. spv::Id loadedId = builder.accessChainLoad(TranslatePrecisionDecoration(type),
  5246. TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags),
  5247. TranslateNonUniformDecoration(type.getQualifier()),
  5248. nominalTypeId,
  5249. accessMask,
  5250. TranslateMemoryScope(coherentFlags),
  5251. alignment);
  5252. // Need to convert to abstract types when necessary
  5253. if (type.getBasicType() == glslang::EbtBool) {
  5254. loadedId = convertLoadedBoolInUniformToUint(type, nominalTypeId, loadedId);
  5255. }
  5256. return loadedId;
  5257. }
  5258. // Wrap the builder's accessChainStore to:
  5259. // - do conversion of concrete to abstract type
  5260. //
  5261. // Implicitly uses the existing builder.accessChain as the storage target.
  5262. void TGlslangToSpvTraverser::accessChainStore(const glslang::TType& type, spv::Id rvalue)
  5263. {
  5264. // Need to convert to abstract types when necessary
  5265. if (type.getBasicType() == glslang::EbtBool) {
  5266. spv::Id nominalTypeId = builder.accessChainGetInferredType();
  5267. if (builder.isScalarType(nominalTypeId)) {
  5268. // Conversion for bool
  5269. spv::Id boolType = builder.makeBoolType();
  5270. if (nominalTypeId != boolType) {
  5271. // keep these outside arguments, for determinant order-of-evaluation
  5272. spv::Id one = builder.makeUintConstant(1);
  5273. spv::Id zero = builder.makeUintConstant(0);
  5274. rvalue = builder.createTriOp(spv::Op::OpSelect, nominalTypeId, rvalue, one, zero);
  5275. } else if (builder.getTypeId(rvalue) != boolType)
  5276. rvalue = builder.createBinOp(spv::Op::OpINotEqual, boolType, rvalue, builder.makeUintConstant(0));
  5277. } else if (builder.isVectorType(nominalTypeId)) {
  5278. // Conversion for bvec
  5279. int vecSize = builder.getNumTypeComponents(nominalTypeId);
  5280. spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);
  5281. if (nominalTypeId != bvecType) {
  5282. // keep these outside arguments, for determinant order-of-evaluation
  5283. spv::Id one = makeSmearedConstant(builder.makeUintConstant(1), vecSize);
  5284. spv::Id zero = makeSmearedConstant(builder.makeUintConstant(0), vecSize);
  5285. rvalue = builder.createTriOp(spv::Op::OpSelect, nominalTypeId, rvalue, one, zero);
  5286. } else if (builder.getTypeId(rvalue) != bvecType)
  5287. rvalue = builder.createBinOp(spv::Op::OpINotEqual, bvecType, rvalue,
  5288. makeSmearedConstant(builder.makeUintConstant(0), vecSize));
  5289. }
  5290. }
  5291. spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
  5292. coherentFlags |= TranslateCoherent(type);
  5293. unsigned int alignment = builder.getAccessChain().alignment;
  5294. alignment |= type.getBufferReferenceAlignment();
  5295. builder.accessChainStore(rvalue, TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags),
  5296. spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) &
  5297. ~spv::MemoryAccessMask::MakePointerVisibleKHR),
  5298. TranslateMemoryScope(coherentFlags), alignment);
  5299. }
  5300. // For storing when types match at the glslang level, but not might match at the
  5301. // SPIR-V level.
  5302. //
  5303. // This especially happens when a single glslang type expands to multiple
  5304. // SPIR-V types, like a struct that is used in a member-undecorated way as well
  5305. // as in a member-decorated way.
  5306. //
  5307. // NOTE: This function can handle any store request; if it's not special it
  5308. // simplifies to a simple OpStore.
  5309. //
  5310. // Implicitly uses the existing builder.accessChain as the storage target.
  5311. void TGlslangToSpvTraverser::multiTypeStore(const glslang::TType& type, spv::Id rValue)
  5312. {
  5313. // we only do the complex path here if it's an aggregate
  5314. if (! type.isStruct() && ! type.isArray()) {
  5315. accessChainStore(type, rValue);
  5316. return;
  5317. }
  5318. // and, it has to be a case of type aliasing
  5319. spv::Id rType = builder.getTypeId(rValue);
  5320. spv::Id lValue = builder.accessChainGetLValue();
  5321. spv::Id lType = builder.getContainedTypeId(builder.getTypeId(lValue));
  5322. if (lType == rType) {
  5323. accessChainStore(type, rValue);
  5324. return;
  5325. }
  5326. // Recursively (as needed) copy an aggregate type to a different aggregate type,
  5327. // where the two types were the same type in GLSL. This requires member
  5328. // by member copy, recursively.
  5329. // SPIR-V 1.4 added an instruction to do help do this.
  5330. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  5331. // However, bool in uniform space is changed to int, so
  5332. // OpCopyLogical does not work for that.
  5333. // TODO: It would be more robust to do a full recursive verification of the types satisfying SPIR-V rules.
  5334. bool rBool = builder.containsType(builder.getTypeId(rValue), spv::Op::OpTypeBool, 0);
  5335. bool lBool = builder.containsType(lType, spv::Op::OpTypeBool, 0);
  5336. if (lBool == rBool) {
  5337. spv::Id logicalCopy = builder.createUnaryOp(spv::Op::OpCopyLogical, lType, rValue);
  5338. accessChainStore(type, logicalCopy);
  5339. return;
  5340. }
  5341. }
  5342. // If an array, copy element by element.
  5343. if (type.isArray()) {
  5344. glslang::TType glslangElementType(type, 0);
  5345. spv::Id elementRType = builder.getContainedTypeId(rType);
  5346. for (int index = 0; index < type.getOuterArraySize(); ++index) {
  5347. // get the source member
  5348. spv::Id elementRValue = builder.createCompositeExtract(rValue, elementRType, index);
  5349. // set up the target storage
  5350. builder.clearAccessChain();
  5351. builder.setAccessChainLValue(lValue);
  5352. builder.accessChainPush(builder.makeIntConstant(index), TranslateCoherent(type),
  5353. type.getBufferReferenceAlignment());
  5354. // store the member
  5355. multiTypeStore(glslangElementType, elementRValue);
  5356. }
  5357. } else {
  5358. assert(type.isStruct());
  5359. // loop over structure members
  5360. const glslang::TTypeList& members = *type.getStruct();
  5361. for (int m = 0; m < (int)members.size(); ++m) {
  5362. const glslang::TType& glslangMemberType = *members[m].type;
  5363. // get the source member
  5364. spv::Id memberRType = builder.getContainedTypeId(rType, m);
  5365. spv::Id memberRValue = builder.createCompositeExtract(rValue, memberRType, m);
  5366. // set up the target storage
  5367. builder.clearAccessChain();
  5368. builder.setAccessChainLValue(lValue);
  5369. builder.accessChainPush(builder.makeIntConstant(m), TranslateCoherent(type),
  5370. type.getBufferReferenceAlignment());
  5371. // store the member
  5372. multiTypeStore(glslangMemberType, memberRValue);
  5373. }
  5374. }
  5375. }
  5376. // Decide whether or not this type should be
  5377. // decorated with offsets and strides, and if so
  5378. // whether std140 or std430 rules should be applied.
  5379. glslang::TLayoutPacking TGlslangToSpvTraverser::getExplicitLayout(const glslang::TType& type) const
  5380. {
  5381. // has to be a block
  5382. if (type.getBasicType() != glslang::EbtBlock)
  5383. return glslang::ElpNone;
  5384. // has to be a uniform or buffer block or task in/out blocks
  5385. if (type.getQualifier().storage != glslang::EvqUniform &&
  5386. type.getQualifier().storage != glslang::EvqBuffer &&
  5387. type.getQualifier().storage != glslang::EvqShared &&
  5388. !type.getQualifier().isTaskMemory())
  5389. return glslang::ElpNone;
  5390. // return the layout to use
  5391. switch (type.getQualifier().layoutPacking) {
  5392. case glslang::ElpStd140:
  5393. case glslang::ElpStd430:
  5394. case glslang::ElpScalar:
  5395. return type.getQualifier().layoutPacking;
  5396. default:
  5397. return glslang::ElpNone;
  5398. }
  5399. }
  5400. // Given an array type, returns the integer stride required for that array
  5401. int TGlslangToSpvTraverser::getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking explicitLayout,
  5402. glslang::TLayoutMatrix matrixLayout)
  5403. {
  5404. int size;
  5405. int stride;
  5406. glslangIntermediate->getMemberAlignment(arrayType, size, stride, explicitLayout,
  5407. matrixLayout == glslang::ElmRowMajor);
  5408. return stride;
  5409. }
  5410. // Given a matrix type, or array (of array) of matrixes type, returns the integer stride required for that matrix
  5411. // when used as a member of an interface block
  5412. int TGlslangToSpvTraverser::getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking explicitLayout,
  5413. glslang::TLayoutMatrix matrixLayout)
  5414. {
  5415. glslang::TType elementType;
  5416. elementType.shallowCopy(matrixType);
  5417. elementType.clearArraySizes();
  5418. int size;
  5419. int stride;
  5420. glslangIntermediate->getMemberAlignment(elementType, size, stride, explicitLayout,
  5421. matrixLayout == glslang::ElmRowMajor);
  5422. return stride;
  5423. }
  5424. // Given a member type of a struct, realign the current offset for it, and compute
  5425. // the next (not yet aligned) offset for the next member, which will get aligned
  5426. // on the next call.
  5427. // 'currentOffset' should be passed in already initialized, ready to modify, and reflecting
  5428. // the migration of data from nextOffset -> currentOffset. It should be -1 on the first call.
  5429. // -1 means a non-forced member offset (no decoration needed).
  5430. void TGlslangToSpvTraverser::updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType,
  5431. int& currentOffset, int& nextOffset, glslang::TLayoutPacking explicitLayout, glslang::TLayoutMatrix matrixLayout)
  5432. {
  5433. // this will get a positive value when deemed necessary
  5434. nextOffset = -1;
  5435. // override anything in currentOffset with user-set offset
  5436. if (memberType.getQualifier().hasOffset())
  5437. currentOffset = memberType.getQualifier().layoutOffset;
  5438. // It could be that current linker usage in glslang updated all the layoutOffset,
  5439. // in which case the following code does not matter. But, that's not quite right
  5440. // once cross-compilation unit GLSL validation is done, as the original user
  5441. // settings are needed in layoutOffset, and then the following will come into play.
  5442. if (explicitLayout == glslang::ElpNone) {
  5443. if (! memberType.getQualifier().hasOffset())
  5444. currentOffset = -1;
  5445. return;
  5446. }
  5447. // Getting this far means we need explicit offsets
  5448. if (currentOffset < 0)
  5449. currentOffset = 0;
  5450. // Now, currentOffset is valid (either 0, or from a previous nextOffset),
  5451. // but possibly not yet correctly aligned.
  5452. int memberSize;
  5453. int dummyStride;
  5454. int memberAlignment = glslangIntermediate->getMemberAlignment(memberType, memberSize, dummyStride, explicitLayout,
  5455. matrixLayout == glslang::ElmRowMajor);
  5456. bool isVectorLike = memberType.isVector();
  5457. if (memberType.isMatrix()) {
  5458. if (matrixLayout == glslang::ElmRowMajor)
  5459. isVectorLike = memberType.getMatrixRows() == 1;
  5460. else
  5461. isVectorLike = memberType.getMatrixCols() == 1;
  5462. }
  5463. // Adjust alignment for HLSL rules
  5464. // TODO: make this consistent in early phases of code:
  5465. // adjusting this late means inconsistencies with earlier code, which for reflection is an issue
  5466. // Until reflection is brought in sync with these adjustments, don't apply to $Global,
  5467. // which is the most likely to rely on reflection, and least likely to rely implicit layouts
  5468. if (glslangIntermediate->usingHlslOffsets() &&
  5469. ! memberType.isStruct() && structType.getTypeName().compare("$Global") != 0) {
  5470. int componentSize;
  5471. int componentAlignment = glslangIntermediate->getBaseAlignmentScalar(memberType, componentSize);
  5472. if (! memberType.isArray() && isVectorLike && componentAlignment <= 4)
  5473. memberAlignment = componentAlignment;
  5474. // Don't add unnecessary padding after this member
  5475. // (undo std140 bumping size to a mutliple of vec4)
  5476. if (explicitLayout == glslang::ElpStd140) {
  5477. if (memberType.isMatrix()) {
  5478. if (matrixLayout == glslang::ElmRowMajor)
  5479. memberSize -= componentSize * (4 - memberType.getMatrixCols());
  5480. else
  5481. memberSize -= componentSize * (4 - memberType.getMatrixRows());
  5482. } else if (memberType.isArray())
  5483. memberSize -= componentSize * (4 - memberType.getVectorSize());
  5484. }
  5485. }
  5486. // Bump up to member alignment
  5487. glslang::RoundToPow2(currentOffset, memberAlignment);
  5488. // Bump up to vec4 if there is a bad straddle
  5489. if (explicitLayout != glslang::ElpScalar && glslangIntermediate->improperStraddle(memberType, memberSize,
  5490. currentOffset, isVectorLike))
  5491. glslang::RoundToPow2(currentOffset, 16);
  5492. nextOffset = currentOffset + memberSize;
  5493. }
  5494. void TGlslangToSpvTraverser::declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember)
  5495. {
  5496. const glslang::TBuiltInVariable glslangBuiltIn = members[glslangMember].type->getQualifier().builtIn;
  5497. switch (glslangBuiltIn)
  5498. {
  5499. case glslang::EbvPointSize:
  5500. case glslang::EbvClipDistance:
  5501. case glslang::EbvCullDistance:
  5502. case glslang::EbvViewportMaskNV:
  5503. case glslang::EbvSecondaryPositionNV:
  5504. case glslang::EbvSecondaryViewportMaskNV:
  5505. case glslang::EbvPositionPerViewNV:
  5506. case glslang::EbvViewportMaskPerViewNV:
  5507. case glslang::EbvTaskCountNV:
  5508. case glslang::EbvPrimitiveCountNV:
  5509. case glslang::EbvPrimitiveIndicesNV:
  5510. case glslang::EbvClipDistancePerViewNV:
  5511. case glslang::EbvCullDistancePerViewNV:
  5512. case glslang::EbvLayerPerViewNV:
  5513. case glslang::EbvMeshViewCountNV:
  5514. case glslang::EbvMeshViewIndicesNV:
  5515. // Generate the associated capability. Delegate to TranslateBuiltInDecoration.
  5516. // Alternately, we could just call this for any glslang built-in, since the
  5517. // capability already guards against duplicates.
  5518. TranslateBuiltInDecoration(glslangBuiltIn, false);
  5519. break;
  5520. default:
  5521. // Capabilities were already generated when the struct was declared.
  5522. break;
  5523. }
  5524. }
  5525. bool TGlslangToSpvTraverser::isShaderEntryPoint(const glslang::TIntermAggregate* node)
  5526. {
  5527. return node->getName().compare(glslangIntermediate->getEntryPointMangledName().c_str()) == 0;
  5528. }
  5529. // Does parameter need a place to keep writes, separate from the original?
  5530. // Assumes called after originalParam(), which filters out block/buffer/opaque-based
  5531. // qualifiers such that we should have only in/out/inout/constreadonly here.
  5532. bool TGlslangToSpvTraverser::writableParam(glslang::TStorageQualifier qualifier) const
  5533. {
  5534. assert(qualifier == glslang::EvqIn ||
  5535. qualifier == glslang::EvqOut ||
  5536. qualifier == glslang::EvqInOut ||
  5537. qualifier == glslang::EvqUniform ||
  5538. qualifier == glslang::EvqConstReadOnly);
  5539. return qualifier != glslang::EvqConstReadOnly &&
  5540. qualifier != glslang::EvqUniform;
  5541. }
  5542. // Is parameter pass-by-original?
  5543. bool TGlslangToSpvTraverser::originalParam(glslang::TStorageQualifier qualifier, const glslang::TType& paramType,
  5544. bool implicitThisParam)
  5545. {
  5546. if (implicitThisParam) // implicit this
  5547. return true;
  5548. if (glslangIntermediate->getSource() == glslang::EShSourceHlsl)
  5549. return paramType.getBasicType() == glslang::EbtBlock;
  5550. return (paramType.containsOpaque() && !glslangIntermediate->getBindlessMode()) || // sampler, etc.
  5551. paramType.getQualifier().isSpirvByReference() || // spirv_by_reference
  5552. (paramType.getBasicType() == glslang::EbtBlock && qualifier == glslang::EvqBuffer); // SSBO
  5553. }
  5554. // Make all the functions, skeletally, without actually visiting their bodies.
  5555. void TGlslangToSpvTraverser::makeFunctions(const glslang::TIntermSequence& glslFunctions)
  5556. {
  5557. const auto getParamDecorations = [&](std::vector<spv::Decoration>& decorations, const glslang::TType& type,
  5558. bool useVulkanMemoryModel) {
  5559. spv::Decoration paramPrecision = TranslatePrecisionDecoration(type);
  5560. if (paramPrecision != spv::NoPrecision)
  5561. decorations.push_back(paramPrecision);
  5562. TranslateMemoryDecoration(type.getQualifier(), decorations, useVulkanMemoryModel);
  5563. if (type.isReference()) {
  5564. // Original and non-writable params pass the pointer directly and
  5565. // use restrict/aliased, others are stored to a pointer in Function
  5566. // memory and use RestrictPointer/AliasedPointer.
  5567. if (originalParam(type.getQualifier().storage, type, false) ||
  5568. !writableParam(type.getQualifier().storage)) {
  5569. // TranslateMemoryDecoration added Restrict decoration already.
  5570. if (!type.getQualifier().isRestrict()) {
  5571. decorations.push_back(spv::Decoration::Aliased);
  5572. }
  5573. } else {
  5574. decorations.push_back(type.getQualifier().isRestrict() ? spv::Decoration::RestrictPointerEXT :
  5575. spv::Decoration::AliasedPointerEXT);
  5576. }
  5577. }
  5578. };
  5579. for (int f = 0; f < (int)glslFunctions.size(); ++f) {
  5580. glslang::TIntermAggregate* glslFunction = glslFunctions[f]->getAsAggregate();
  5581. if (! glslFunction || glslFunction->getOp() != glslang::EOpFunction)
  5582. continue;
  5583. builder.setDebugSourceLocation(glslFunction->getLoc().line, glslFunction->getLoc().getFilename());
  5584. if (isShaderEntryPoint(glslFunction)) {
  5585. // For HLSL, the entry function is actually a compiler generated function to resolve the difference of
  5586. // entry function signature between HLSL and SPIR-V. So we don't emit debug information for that.
  5587. if (glslangIntermediate->getSource() != glslang::EShSourceHlsl) {
  5588. builder.setupFunctionDebugInfo(shaderEntry, glslangIntermediate->getEntryPointMangledName().c_str(),
  5589. std::vector<spv::Id>(), // main function has no param
  5590. std::vector<char const*>());
  5591. }
  5592. continue;
  5593. }
  5594. // We're on a user function. Set up the basic interface for the function now,
  5595. // so that it's available to call. Translating the body will happen later.
  5596. //
  5597. // Typically (except for a "const in" parameter), an address will be passed to the
  5598. // function. What it is an address of varies:
  5599. //
  5600. // - "in" parameters not marked as "const" can be written to without modifying the calling
  5601. // argument so that write needs to be to a copy, hence the address of a copy works.
  5602. //
  5603. // - "const in" parameters can just be the r-value, as no writes need occur.
  5604. //
  5605. // - "out" and "inout" arguments can't be done as pointers to the calling argument, because
  5606. // GLSL has copy-in/copy-out semantics. They can be handled though with a pointer to a copy.
  5607. std::vector<spv::Id> paramTypes;
  5608. std::vector<char const*> paramNames;
  5609. std::vector<std::vector<spv::Decoration>> paramDecorations; // list of decorations per parameter
  5610. glslang::TIntermSequence& parameters = glslFunction->getSequence()[0]->getAsAggregate()->getSequence();
  5611. #ifdef ENABLE_HLSL
  5612. bool implicitThis = (int)parameters.size() > 0 && parameters[0]->getAsSymbolNode()->getName() ==
  5613. glslangIntermediate->implicitThisName;
  5614. #else
  5615. bool implicitThis = false;
  5616. #endif
  5617. paramDecorations.resize(parameters.size());
  5618. for (int p = 0; p < (int)parameters.size(); ++p) {
  5619. const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();
  5620. spv::Id typeId = convertGlslangToSpvType(paramType);
  5621. if (originalParam(paramType.getQualifier().storage, paramType, implicitThis && p == 0))
  5622. typeId = builder.makePointer(TranslateStorageClass(paramType), typeId);
  5623. else if (writableParam(paramType.getQualifier().storage))
  5624. typeId = builder.makePointer(spv::StorageClass::Function, typeId);
  5625. else
  5626. rValueParameters.insert(parameters[p]->getAsSymbolNode()->getId());
  5627. getParamDecorations(paramDecorations[p], paramType, glslangIntermediate->usingVulkanMemoryModel());
  5628. paramTypes.push_back(typeId);
  5629. }
  5630. for (auto const parameter:parameters) {
  5631. paramNames.push_back(parameter->getAsSymbolNode()->getName().c_str());
  5632. }
  5633. spv::Block* functionBlock;
  5634. spv::Function* function = builder.makeFunctionEntry(
  5635. TranslatePrecisionDecoration(glslFunction->getType()), convertGlslangToSpvType(glslFunction->getType()),
  5636. glslFunction->getName().c_str(), convertGlslangLinkageToSpv(glslFunction->getLinkType()), paramTypes,
  5637. paramDecorations, &functionBlock);
  5638. builder.setupFunctionDebugInfo(function, glslFunction->getName().c_str(), paramTypes, paramNames);
  5639. if (implicitThis)
  5640. function->setImplicitThis();
  5641. // Track function to emit/call later
  5642. functionMap[glslFunction->getName().c_str()] = function;
  5643. // Set the parameter id's
  5644. for (int p = 0; p < (int)parameters.size(); ++p) {
  5645. symbolValues[parameters[p]->getAsSymbolNode()->getId()] = function->getParamId(p);
  5646. // give a name too
  5647. builder.addName(function->getParamId(p), parameters[p]->getAsSymbolNode()->getName().c_str());
  5648. const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();
  5649. if (paramType.contains8BitInt())
  5650. builder.addCapability(spv::Capability::Int8);
  5651. if (paramType.contains16BitInt())
  5652. builder.addCapability(spv::Capability::Int16);
  5653. if (paramType.contains16BitFloat())
  5654. builder.addCapability(spv::Capability::Float16);
  5655. }
  5656. }
  5657. }
  5658. // Process all the initializers, while skipping the functions and link objects
  5659. void TGlslangToSpvTraverser::makeGlobalInitializers(const glslang::TIntermSequence& initializers)
  5660. {
  5661. builder.setBuildPoint(shaderEntry->getLastBlock());
  5662. for (int i = 0; i < (int)initializers.size(); ++i) {
  5663. glslang::TIntermAggregate* initializer = initializers[i]->getAsAggregate();
  5664. if (initializer && initializer->getOp() != glslang::EOpFunction && initializer->getOp() !=
  5665. glslang::EOpLinkerObjects) {
  5666. // We're on a top-level node that's not a function. Treat as an initializer, whose
  5667. // code goes into the beginning of the entry point.
  5668. initializer->traverse(this);
  5669. }
  5670. }
  5671. }
  5672. // Walk over all linker objects to create a map for payload and callable data linker objects
  5673. // and their location to be used during codegen for OpTraceKHR and OpExecuteCallableKHR
  5674. // This is done here since it is possible that these linker objects are not be referenced in the AST
  5675. void TGlslangToSpvTraverser::collectRayTracingLinkerObjects()
  5676. {
  5677. glslang::TIntermAggregate* linkerObjects = glslangIntermediate->findLinkerObjects();
  5678. for (auto& objSeq : linkerObjects->getSequence()) {
  5679. auto objNode = objSeq->getAsSymbolNode();
  5680. if (objNode != nullptr) {
  5681. if (objNode->getQualifier().hasLocation()) {
  5682. unsigned int location = objNode->getQualifier().layoutLocation;
  5683. auto st = objNode->getQualifier().storage;
  5684. int set;
  5685. switch (st)
  5686. {
  5687. case glslang::EvqPayload:
  5688. case glslang::EvqPayloadIn:
  5689. set = 0;
  5690. break;
  5691. case glslang::EvqCallableData:
  5692. case glslang::EvqCallableDataIn:
  5693. set = 1;
  5694. break;
  5695. case glslang::EvqHitObjectAttrNV:
  5696. set = 2;
  5697. break;
  5698. default:
  5699. set = -1;
  5700. }
  5701. if (set != -1)
  5702. locationToSymbol[set].insert(std::make_pair(location, objNode));
  5703. }
  5704. }
  5705. }
  5706. }
  5707. // Process all the functions, while skipping initializers.
  5708. void TGlslangToSpvTraverser::visitFunctions(const glslang::TIntermSequence& glslFunctions)
  5709. {
  5710. for (int f = 0; f < (int)glslFunctions.size(); ++f) {
  5711. glslang::TIntermAggregate* node = glslFunctions[f]->getAsAggregate();
  5712. if (node && (node->getOp() == glslang::EOpFunction || node->getOp() == glslang::EOpLinkerObjects))
  5713. node->traverse(this);
  5714. }
  5715. }
  5716. void TGlslangToSpvTraverser::handleFunctionEntry(const glslang::TIntermAggregate* node)
  5717. {
  5718. // SPIR-V functions should already be in the functionMap from the prepass
  5719. // that called makeFunctions().
  5720. currentFunction = functionMap[node->getName().c_str()];
  5721. spv::Block* functionBlock = currentFunction->getEntryBlock();
  5722. builder.setBuildPoint(functionBlock);
  5723. builder.enterFunction(currentFunction);
  5724. }
  5725. void TGlslangToSpvTraverser::translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments,
  5726. spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags)
  5727. {
  5728. const glslang::TIntermSequence& glslangArguments = node.getSequence();
  5729. glslang::TSampler sampler = {};
  5730. bool cubeCompare = false;
  5731. bool f16ShadowCompare = false;
  5732. if (node.isTexture() || node.isImage()) {
  5733. sampler = glslangArguments[0]->getAsTyped()->getType().getSampler();
  5734. cubeCompare = sampler.dim == glslang::EsdCube && sampler.arrayed && sampler.shadow;
  5735. f16ShadowCompare = sampler.shadow &&
  5736. glslangArguments[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16;
  5737. }
  5738. for (int i = 0; i < (int)glslangArguments.size(); ++i) {
  5739. builder.clearAccessChain();
  5740. glslangArguments[i]->traverse(this);
  5741. // Special case l-value operands
  5742. bool lvalue = false;
  5743. switch (node.getOp()) {
  5744. case glslang::EOpImageAtomicAdd:
  5745. case glslang::EOpImageAtomicMin:
  5746. case glslang::EOpImageAtomicMax:
  5747. case glslang::EOpImageAtomicAnd:
  5748. case glslang::EOpImageAtomicOr:
  5749. case glslang::EOpImageAtomicXor:
  5750. case glslang::EOpImageAtomicExchange:
  5751. case glslang::EOpImageAtomicCompSwap:
  5752. case glslang::EOpImageAtomicLoad:
  5753. case glslang::EOpImageAtomicStore:
  5754. if (i == 0)
  5755. lvalue = true;
  5756. break;
  5757. case glslang::EOpSparseImageLoad:
  5758. if ((sampler.ms && i == 3) || (! sampler.ms && i == 2))
  5759. lvalue = true;
  5760. break;
  5761. case glslang::EOpSparseTexture:
  5762. if (((cubeCompare || f16ShadowCompare) && i == 3) || (! (cubeCompare || f16ShadowCompare) && i == 2))
  5763. lvalue = true;
  5764. break;
  5765. case glslang::EOpSparseTextureClamp:
  5766. if (((cubeCompare || f16ShadowCompare) && i == 4) || (! (cubeCompare || f16ShadowCompare) && i == 3))
  5767. lvalue = true;
  5768. break;
  5769. case glslang::EOpSparseTextureLod:
  5770. case glslang::EOpSparseTextureOffset:
  5771. if ((f16ShadowCompare && i == 4) || (! f16ShadowCompare && i == 3))
  5772. lvalue = true;
  5773. break;
  5774. case glslang::EOpSparseTextureFetch:
  5775. if ((sampler.dim != glslang::EsdRect && i == 3) || (sampler.dim == glslang::EsdRect && i == 2))
  5776. lvalue = true;
  5777. break;
  5778. case glslang::EOpSparseTextureFetchOffset:
  5779. if ((sampler.dim != glslang::EsdRect && i == 4) || (sampler.dim == glslang::EsdRect && i == 3))
  5780. lvalue = true;
  5781. break;
  5782. case glslang::EOpSparseTextureLodOffset:
  5783. case glslang::EOpSparseTextureGrad:
  5784. case glslang::EOpSparseTextureOffsetClamp:
  5785. if ((f16ShadowCompare && i == 5) || (! f16ShadowCompare && i == 4))
  5786. lvalue = true;
  5787. break;
  5788. case glslang::EOpSparseTextureGradOffset:
  5789. case glslang::EOpSparseTextureGradClamp:
  5790. if ((f16ShadowCompare && i == 6) || (! f16ShadowCompare && i == 5))
  5791. lvalue = true;
  5792. break;
  5793. case glslang::EOpSparseTextureGradOffsetClamp:
  5794. if ((f16ShadowCompare && i == 7) || (! f16ShadowCompare && i == 6))
  5795. lvalue = true;
  5796. break;
  5797. case glslang::EOpSparseTextureGather:
  5798. if ((sampler.shadow && i == 3) || (! sampler.shadow && i == 2))
  5799. lvalue = true;
  5800. break;
  5801. case glslang::EOpSparseTextureGatherOffset:
  5802. case glslang::EOpSparseTextureGatherOffsets:
  5803. if ((sampler.shadow && i == 4) || (! sampler.shadow && i == 3))
  5804. lvalue = true;
  5805. break;
  5806. case glslang::EOpSparseTextureGatherLod:
  5807. if (i == 3)
  5808. lvalue = true;
  5809. break;
  5810. case glslang::EOpSparseTextureGatherLodOffset:
  5811. case glslang::EOpSparseTextureGatherLodOffsets:
  5812. if (i == 4)
  5813. lvalue = true;
  5814. break;
  5815. case glslang::EOpSparseImageLoadLod:
  5816. if (i == 3)
  5817. lvalue = true;
  5818. break;
  5819. case glslang::EOpImageSampleFootprintNV:
  5820. if (i == 4)
  5821. lvalue = true;
  5822. break;
  5823. case glslang::EOpImageSampleFootprintClampNV:
  5824. case glslang::EOpImageSampleFootprintLodNV:
  5825. if (i == 5)
  5826. lvalue = true;
  5827. break;
  5828. case glslang::EOpImageSampleFootprintGradNV:
  5829. if (i == 6)
  5830. lvalue = true;
  5831. break;
  5832. case glslang::EOpImageSampleFootprintGradClampNV:
  5833. if (i == 7)
  5834. lvalue = true;
  5835. break;
  5836. case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
  5837. case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
  5838. case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
  5839. if (i == 2)
  5840. lvalue = true;
  5841. break;
  5842. case glslang::EOpConstructSaturated:
  5843. if (i == 0)
  5844. lvalue = true;
  5845. break;
  5846. default:
  5847. break;
  5848. }
  5849. if (lvalue) {
  5850. spv::Id lvalue_id = builder.accessChainGetLValue();
  5851. arguments.push_back(lvalue_id);
  5852. lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
  5853. builder.addDecoration(lvalue_id, TranslateNonUniformDecoration(lvalueCoherentFlags));
  5854. lvalueCoherentFlags |= TranslateCoherent(glslangArguments[i]->getAsTyped()->getType());
  5855. } else {
  5856. if (i > 0 &&
  5857. glslangArguments[i]->getAsSymbolNode() && glslangArguments[i-1]->getAsSymbolNode() &&
  5858. glslangArguments[i]->getAsSymbolNode()->getId() == glslangArguments[i-1]->getAsSymbolNode()->getId()) {
  5859. // Reuse the id if possible
  5860. arguments.push_back(arguments[i-1]);
  5861. } else {
  5862. arguments.push_back(accessChainLoad(glslangArguments[i]->getAsTyped()->getType()));
  5863. }
  5864. }
  5865. }
  5866. }
  5867. void TGlslangToSpvTraverser::translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments)
  5868. {
  5869. builder.clearAccessChain();
  5870. node.getOperand()->traverse(this);
  5871. arguments.push_back(accessChainLoad(node.getOperand()->getType()));
  5872. }
  5873. spv::Id TGlslangToSpvTraverser::createImageTextureFunctionCall(glslang::TIntermOperator* node)
  5874. {
  5875. if (! node->isImage() && ! node->isTexture())
  5876. return spv::NoResult;
  5877. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  5878. // Process a GLSL texturing op (will be SPV image)
  5879. const glslang::TType &imageType = node->getAsAggregate()
  5880. ? node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType()
  5881. : node->getAsUnaryNode()->getOperand()->getAsTyped()->getType();
  5882. const glslang::TSampler sampler = imageType.getSampler();
  5883. bool f16ShadowCompare = (sampler.shadow && node->getAsAggregate())
  5884. ? node->getAsAggregate()->getSequence()[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16
  5885. : false;
  5886. const auto signExtensionMask = [&]() {
  5887. if (builder.getSpvVersion() >= spv::Spv_1_4) {
  5888. if (sampler.type == glslang::EbtUint)
  5889. return spv::ImageOperandsMask::ZeroExtend;
  5890. else if (sampler.type == glslang::EbtInt)
  5891. return spv::ImageOperandsMask::SignExtend;
  5892. }
  5893. return spv::ImageOperandsMask::MaskNone;
  5894. };
  5895. spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
  5896. std::vector<spv::Id> arguments;
  5897. if (node->getAsAggregate())
  5898. translateArguments(*node->getAsAggregate(), arguments, lvalueCoherentFlags);
  5899. else
  5900. translateArguments(*node->getAsUnaryNode(), arguments);
  5901. spv::Decoration precision = TranslatePrecisionDecoration(node->getType());
  5902. spv::Builder::TextureParameters params = { };
  5903. params.sampler = arguments[0];
  5904. glslang::TCrackedTextureOp cracked;
  5905. node->crackTexture(sampler, cracked);
  5906. const bool isUnsignedResult = node->getType().getBasicType() == glslang::EbtUint;
  5907. if (builder.isSampledImage(params.sampler) &&
  5908. ((cracked.query && node->getOp() != glslang::EOpTextureQueryLod) || cracked.fragMask || cracked.fetch)) {
  5909. params.sampler = builder.createUnaryOp(spv::Op::OpImage, builder.getImageType(params.sampler), params.sampler);
  5910. if (imageType.getQualifier().isNonUniform()) {
  5911. builder.addDecoration(params.sampler, spv::Decoration::NonUniformEXT);
  5912. }
  5913. }
  5914. // Check for queries
  5915. if (cracked.query) {
  5916. switch (node->getOp()) {
  5917. case glslang::EOpImageQuerySize:
  5918. case glslang::EOpTextureQuerySize:
  5919. if (arguments.size() > 1) {
  5920. params.lod = arguments[1];
  5921. return builder.createTextureQueryCall(spv::Op::OpImageQuerySizeLod, params, isUnsignedResult);
  5922. } else
  5923. return builder.createTextureQueryCall(spv::Op::OpImageQuerySize, params, isUnsignedResult);
  5924. case glslang::EOpImageQuerySamples:
  5925. case glslang::EOpTextureQuerySamples:
  5926. return builder.createTextureQueryCall(spv::Op::OpImageQuerySamples, params, isUnsignedResult);
  5927. case glslang::EOpTextureQueryLod:
  5928. params.coords = arguments[1];
  5929. return builder.createTextureQueryCall(spv::Op::OpImageQueryLod, params, isUnsignedResult);
  5930. case glslang::EOpTextureQueryLevels:
  5931. return builder.createTextureQueryCall(spv::Op::OpImageQueryLevels, params, isUnsignedResult);
  5932. case glslang::EOpSparseTexelsResident:
  5933. return builder.createUnaryOp(spv::Op::OpImageSparseTexelsResident, builder.makeBoolType(), arguments[0]);
  5934. default:
  5935. assert(0);
  5936. break;
  5937. }
  5938. }
  5939. int components = node->getType().getVectorSize();
  5940. if (node->getOp() == glslang::EOpImageLoad ||
  5941. node->getOp() == glslang::EOpImageLoadLod ||
  5942. node->getOp() == glslang::EOpTextureFetch ||
  5943. node->getOp() == glslang::EOpTextureFetchOffset) {
  5944. // These must produce 4 components, per SPIR-V spec. We'll add a conversion constructor if needed.
  5945. // This will only happen through the HLSL path for operator[], so we do not have to handle e.g.
  5946. // the EOpTexture/Proj/Lod/etc family. It would be harmless to do so, but would need more logic
  5947. // here around e.g. which ones return scalars or other types.
  5948. components = 4;
  5949. }
  5950. glslang::TType returnType(node->getType().getBasicType(), glslang::EvqTemporary, components);
  5951. auto resultType = [&returnType,this]{ return convertGlslangToSpvType(returnType); };
  5952. // Check for image functions other than queries
  5953. if (node->isImage()) {
  5954. std::vector<spv::IdImmediate> operands;
  5955. auto opIt = arguments.begin();
  5956. spv::IdImmediate image = { true, *(opIt++) };
  5957. operands.push_back(image);
  5958. // Handle subpass operations
  5959. // TODO: GLSL should change to have the "MS" only on the type rather than the
  5960. // built-in function.
  5961. if (cracked.subpass) {
  5962. // add on the (0,0) coordinate
  5963. spv::Id zero = builder.makeIntConstant(0);
  5964. std::vector<spv::Id> comps;
  5965. comps.push_back(zero);
  5966. comps.push_back(zero);
  5967. spv::IdImmediate coord = { true,
  5968. builder.makeCompositeConstant(builder.makeVectorType(builder.makeIntType(32), 2), comps) };
  5969. operands.push_back(coord);
  5970. spv::IdImmediate imageOperands = { false, spv::ImageOperandsMask::MaskNone };
  5971. imageOperands.word = imageOperands.word | (unsigned)signExtensionMask();
  5972. if (sampler.isMultiSample()) {
  5973. imageOperands.word = imageOperands.word | (unsigned)spv::ImageOperandsMask::Sample;
  5974. }
  5975. if (imageOperands.word != (unsigned)spv::ImageOperandsMask::MaskNone) {
  5976. operands.push_back(imageOperands);
  5977. if (sampler.isMultiSample()) {
  5978. spv::IdImmediate imageOperand = { true, *(opIt++) };
  5979. operands.push_back(imageOperand);
  5980. }
  5981. }
  5982. spv::Id result = builder.createOp(spv::Op::OpImageRead, resultType(), operands);
  5983. builder.setPrecision(result, precision);
  5984. return result;
  5985. }
  5986. if (cracked.attachmentEXT) {
  5987. if (opIt != arguments.end()) {
  5988. spv::IdImmediate sample = { true, *opIt };
  5989. operands.push_back(sample);
  5990. }
  5991. spv::Id result = builder.createOp(spv::Op::OpColorAttachmentReadEXT, resultType(), operands);
  5992. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  5993. builder.setPrecision(result, precision);
  5994. return result;
  5995. }
  5996. spv::IdImmediate coord = { true, *(opIt++) };
  5997. operands.push_back(coord);
  5998. if (node->getOp() == glslang::EOpImageLoad || node->getOp() == glslang::EOpImageLoadLod) {
  5999. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  6000. if (sampler.isMultiSample()) {
  6001. mask = mask | spv::ImageOperandsMask::Sample;
  6002. }
  6003. if (cracked.lod) {
  6004. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  6005. builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
  6006. mask = mask | spv::ImageOperandsMask::Lod;
  6007. }
  6008. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  6009. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelAvailableKHR);
  6010. mask = mask | signExtensionMask();
  6011. if (mask != spv::ImageOperandsMask::MaskNone) {
  6012. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  6013. operands.push_back(imageOperands);
  6014. }
  6015. if (anySet(mask, spv::ImageOperandsMask::Sample)) {
  6016. spv::IdImmediate imageOperand = { true, *opIt++ };
  6017. operands.push_back(imageOperand);
  6018. }
  6019. if (anySet(mask, spv::ImageOperandsMask::Lod)) {
  6020. spv::IdImmediate imageOperand = { true, *opIt++ };
  6021. operands.push_back(imageOperand);
  6022. }
  6023. if (anySet(mask, spv::ImageOperandsMask::MakeTexelVisibleKHR)) {
  6024. spv::IdImmediate imageOperand = { true,
  6025. builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
  6026. operands.push_back(imageOperand);
  6027. }
  6028. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
  6029. builder.addCapability(spv::Capability::StorageImageReadWithoutFormat);
  6030. std::vector<spv::Id> result(1, builder.createOp(spv::Op::OpImageRead, resultType(), operands));
  6031. builder.setPrecision(result[0], precision);
  6032. // If needed, add a conversion constructor to the proper size.
  6033. if (components != node->getType().getVectorSize())
  6034. result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));
  6035. return result[0];
  6036. } else if (node->getOp() == glslang::EOpImageStore || node->getOp() == glslang::EOpImageStoreLod) {
  6037. // Push the texel value before the operands
  6038. if (sampler.isMultiSample() || cracked.lod) {
  6039. spv::IdImmediate texel = { true, *(opIt + 1) };
  6040. operands.push_back(texel);
  6041. } else {
  6042. spv::IdImmediate texel = { true, *opIt };
  6043. operands.push_back(texel);
  6044. }
  6045. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  6046. if (sampler.isMultiSample()) {
  6047. mask = mask | spv::ImageOperandsMask::Sample;
  6048. }
  6049. if (cracked.lod) {
  6050. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  6051. builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
  6052. mask = mask | spv::ImageOperandsMask::Lod;
  6053. }
  6054. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  6055. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelVisibleKHR);
  6056. mask = mask | signExtensionMask();
  6057. if (mask != spv::ImageOperandsMask::MaskNone) {
  6058. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  6059. operands.push_back(imageOperands);
  6060. }
  6061. if (anySet(mask, spv::ImageOperandsMask::Sample)) {
  6062. spv::IdImmediate imageOperand = { true, *opIt++ };
  6063. operands.push_back(imageOperand);
  6064. }
  6065. if (anySet(mask, spv::ImageOperandsMask::Lod)) {
  6066. spv::IdImmediate imageOperand = { true, *opIt++ };
  6067. operands.push_back(imageOperand);
  6068. }
  6069. if (anySet(mask, spv::ImageOperandsMask::MakeTexelAvailableKHR)) {
  6070. spv::IdImmediate imageOperand = { true,
  6071. builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
  6072. operands.push_back(imageOperand);
  6073. }
  6074. builder.createNoResultOp(spv::Op::OpImageWrite, operands);
  6075. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
  6076. builder.addCapability(spv::Capability::StorageImageWriteWithoutFormat);
  6077. return spv::NoResult;
  6078. } else if (node->getOp() == glslang::EOpSparseImageLoad ||
  6079. node->getOp() == glslang::EOpSparseImageLoadLod) {
  6080. builder.addCapability(spv::Capability::SparseResidency);
  6081. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
  6082. builder.addCapability(spv::Capability::StorageImageReadWithoutFormat);
  6083. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  6084. if (sampler.isMultiSample()) {
  6085. mask = mask | spv::ImageOperandsMask::Sample;
  6086. }
  6087. if (cracked.lod) {
  6088. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  6089. builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
  6090. mask = mask | spv::ImageOperandsMask::Lod;
  6091. }
  6092. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  6093. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelAvailableKHR);
  6094. mask = mask | signExtensionMask();
  6095. if (mask != spv::ImageOperandsMask::MaskNone) {
  6096. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  6097. operands.push_back(imageOperands);
  6098. }
  6099. if (anySet(mask, spv::ImageOperandsMask::Sample)) {
  6100. spv::IdImmediate imageOperand = { true, *opIt++ };
  6101. operands.push_back(imageOperand);
  6102. }
  6103. if (anySet(mask, spv::ImageOperandsMask::Lod)) {
  6104. spv::IdImmediate imageOperand = { true, *opIt++ };
  6105. operands.push_back(imageOperand);
  6106. }
  6107. if (anySet(mask, spv::ImageOperandsMask::MakeTexelVisibleKHR)) {
  6108. spv::IdImmediate imageOperand = { true, builder.makeUintConstant(TranslateMemoryScope(
  6109. TranslateCoherent(imageType))) };
  6110. operands.push_back(imageOperand);
  6111. }
  6112. // Create the return type that was a special structure
  6113. spv::Id texelOut = *opIt;
  6114. spv::Id typeId0 = resultType();
  6115. spv::Id typeId1 = builder.getDerefTypeId(texelOut);
  6116. spv::Id resultTypeId = builder.makeStructResultType(typeId0, typeId1);
  6117. spv::Id resultId = builder.createOp(spv::Op::OpImageSparseRead, resultTypeId, operands);
  6118. // Decode the return type
  6119. builder.createStore(builder.createCompositeExtract(resultId, typeId1, 1), texelOut);
  6120. return builder.createCompositeExtract(resultId, typeId0, 0);
  6121. } else {
  6122. // Process image atomic operations
  6123. // GLSL "IMAGE_PARAMS" will involve in constructing an image texel pointer and this pointer,
  6124. // as the first source operand, is required by SPIR-V atomic operations.
  6125. // For non-MS, the sample value should be 0
  6126. spv::IdImmediate sample = { true, sampler.isMultiSample() ? *(opIt++) : builder.makeUintConstant(0) };
  6127. operands.push_back(sample);
  6128. spv::Id resultTypeId;
  6129. glslang::TBasicType typeProxy = node->getBasicType();
  6130. // imageAtomicStore has a void return type so base the pointer type on
  6131. // the type of the value operand.
  6132. if (node->getOp() == glslang::EOpImageAtomicStore) {
  6133. resultTypeId = builder.makePointer(spv::StorageClass::Image, builder.getTypeId(*opIt));
  6134. typeProxy = node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType().getSampler().type;
  6135. } else {
  6136. resultTypeId = builder.makePointer(spv::StorageClass::Image, resultType());
  6137. }
  6138. spv::Id pointer = builder.createOp(spv::Op::OpImageTexelPointer, resultTypeId, operands);
  6139. if (imageType.getQualifier().nonUniform) {
  6140. builder.addDecoration(pointer, spv::Decoration::NonUniformEXT);
  6141. }
  6142. std::vector<spv::Id> operands;
  6143. operands.push_back(pointer);
  6144. for (; opIt != arguments.end(); ++opIt)
  6145. operands.push_back(*opIt);
  6146. return createAtomicOperation(node->getOp(), precision, resultType(), operands, typeProxy,
  6147. lvalueCoherentFlags, node->getType());
  6148. }
  6149. }
  6150. // Check for fragment mask functions other than queries
  6151. if (cracked.fragMask) {
  6152. assert(sampler.ms);
  6153. auto opIt = arguments.begin();
  6154. std::vector<spv::Id> operands;
  6155. operands.push_back(params.sampler);
  6156. ++opIt;
  6157. if (sampler.isSubpass()) {
  6158. // add on the (0,0) coordinate
  6159. spv::Id zero = builder.makeIntConstant(0);
  6160. std::vector<spv::Id> comps;
  6161. comps.push_back(zero);
  6162. comps.push_back(zero);
  6163. operands.push_back(builder.makeCompositeConstant(
  6164. builder.makeVectorType(builder.makeIntType(32), 2), comps));
  6165. }
  6166. for (; opIt != arguments.end(); ++opIt)
  6167. operands.push_back(*opIt);
  6168. spv::Op fragMaskOp = spv::Op::OpNop;
  6169. if (node->getOp() == glslang::EOpFragmentMaskFetch)
  6170. fragMaskOp = spv::Op::OpFragmentMaskFetchAMD;
  6171. else if (node->getOp() == glslang::EOpFragmentFetch)
  6172. fragMaskOp = spv::Op::OpFragmentFetchAMD;
  6173. builder.addExtension(spv::E_SPV_AMD_shader_fragment_mask);
  6174. builder.addCapability(spv::Capability::FragmentMaskAMD);
  6175. return builder.createOp(fragMaskOp, resultType(), operands);
  6176. }
  6177. // Check for texture functions other than queries
  6178. bool sparse = node->isSparseTexture();
  6179. bool imageFootprint = node->isImageFootprint();
  6180. bool cubeCompare = sampler.dim == glslang::EsdCube && sampler.isArrayed() && sampler.isShadow();
  6181. // check for bias argument
  6182. bool bias = false;
  6183. if (! cracked.lod && ! cracked.grad && ! cracked.fetch && ! cubeCompare) {
  6184. int nonBiasArgCount = 2;
  6185. if (cracked.gather)
  6186. ++nonBiasArgCount; // comp argument should be present when bias argument is present
  6187. if (f16ShadowCompare)
  6188. ++nonBiasArgCount;
  6189. if (cracked.offset)
  6190. ++nonBiasArgCount;
  6191. else if (cracked.offsets)
  6192. ++nonBiasArgCount;
  6193. if (cracked.grad)
  6194. nonBiasArgCount += 2;
  6195. if (cracked.lodClamp)
  6196. ++nonBiasArgCount;
  6197. if (sparse)
  6198. ++nonBiasArgCount;
  6199. if (imageFootprint)
  6200. //Following three extra arguments
  6201. // int granularity, bool coarse, out gl_TextureFootprint2DNV footprint
  6202. nonBiasArgCount += 3;
  6203. if ((int)arguments.size() > nonBiasArgCount)
  6204. bias = true;
  6205. }
  6206. if (cracked.gather) {
  6207. const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();
  6208. if (bias || cracked.lod ||
  6209. sourceExtensions.find(glslang::E_GL_AMD_texture_gather_bias_lod) != sourceExtensions.end()) {
  6210. builder.addExtension(spv::E_SPV_AMD_texture_gather_bias_lod);
  6211. builder.addCapability(spv::Capability::ImageGatherBiasLodAMD);
  6212. }
  6213. }
  6214. // set the rest of the arguments
  6215. params.coords = arguments[1];
  6216. int extraArgs = 0;
  6217. bool noImplicitLod = false;
  6218. // sort out where Dref is coming from
  6219. if (cubeCompare || f16ShadowCompare) {
  6220. params.Dref = arguments[2];
  6221. ++extraArgs;
  6222. } else if (sampler.shadow && cracked.gather) {
  6223. params.Dref = arguments[2];
  6224. ++extraArgs;
  6225. } else if (sampler.shadow) {
  6226. std::vector<spv::Id> indexes;
  6227. int dRefComp;
  6228. if (cracked.proj)
  6229. dRefComp = 2; // "The resulting 3rd component of P in the shadow forms is used as Dref"
  6230. else
  6231. dRefComp = builder.getNumComponents(params.coords) - 1;
  6232. indexes.push_back(dRefComp);
  6233. params.Dref = builder.createCompositeExtract(params.coords,
  6234. builder.getScalarTypeId(builder.getTypeId(params.coords)), indexes);
  6235. }
  6236. // lod
  6237. if (cracked.lod) {
  6238. params.lod = arguments[2 + extraArgs];
  6239. ++extraArgs;
  6240. } else if (glslangIntermediate->getStage() != EShLangFragment &&
  6241. !(glslangIntermediate->getStage() == EShLangCompute &&
  6242. glslangIntermediate->hasLayoutDerivativeModeNone())) {
  6243. // we need to invent the default lod for an explicit lod instruction for a non-fragment stage
  6244. noImplicitLod = true;
  6245. }
  6246. // multisample
  6247. if (sampler.isMultiSample()) {
  6248. params.sample = arguments[2 + extraArgs]; // For MS, "sample" should be specified
  6249. ++extraArgs;
  6250. }
  6251. // gradient
  6252. if (cracked.grad) {
  6253. params.gradX = arguments[2 + extraArgs];
  6254. params.gradY = arguments[3 + extraArgs];
  6255. extraArgs += 2;
  6256. }
  6257. // offset and offsets
  6258. if (cracked.offset) {
  6259. params.offset = arguments[2 + extraArgs];
  6260. ++extraArgs;
  6261. } else if (cracked.offsets) {
  6262. params.offsets = arguments[2 + extraArgs];
  6263. ++extraArgs;
  6264. }
  6265. // lod clamp
  6266. if (cracked.lodClamp) {
  6267. params.lodClamp = arguments[2 + extraArgs];
  6268. ++extraArgs;
  6269. }
  6270. // sparse
  6271. if (sparse) {
  6272. params.texelOut = arguments[2 + extraArgs];
  6273. ++extraArgs;
  6274. }
  6275. // gather component
  6276. if (cracked.gather && ! sampler.shadow) {
  6277. // default component is 0, if missing, otherwise an argument
  6278. if (2 + extraArgs < (int)arguments.size()) {
  6279. params.component = arguments[2 + extraArgs];
  6280. ++extraArgs;
  6281. } else
  6282. params.component = builder.makeIntConstant(0);
  6283. }
  6284. spv::Id resultStruct = spv::NoResult;
  6285. if (imageFootprint) {
  6286. //Following three extra arguments
  6287. // int granularity, bool coarse, out gl_TextureFootprint2DNV footprint
  6288. params.granularity = arguments[2 + extraArgs];
  6289. params.coarse = arguments[3 + extraArgs];
  6290. resultStruct = arguments[4 + extraArgs];
  6291. extraArgs += 3;
  6292. }
  6293. // bias
  6294. if (bias) {
  6295. params.bias = arguments[2 + extraArgs];
  6296. ++extraArgs;
  6297. }
  6298. if (imageFootprint) {
  6299. builder.addExtension(spv::E_SPV_NV_shader_image_footprint);
  6300. builder.addCapability(spv::Capability::ImageFootprintNV);
  6301. //resultStructType(OpenGL type) contains 5 elements:
  6302. //struct gl_TextureFootprint2DNV {
  6303. // uvec2 anchor;
  6304. // uvec2 offset;
  6305. // uvec2 mask;
  6306. // uint lod;
  6307. // uint granularity;
  6308. //};
  6309. //or
  6310. //struct gl_TextureFootprint3DNV {
  6311. // uvec3 anchor;
  6312. // uvec3 offset;
  6313. // uvec2 mask;
  6314. // uint lod;
  6315. // uint granularity;
  6316. //};
  6317. spv::Id resultStructType = builder.getContainedTypeId(builder.getTypeId(resultStruct));
  6318. assert(builder.isStructType(resultStructType));
  6319. //resType (SPIR-V type) contains 6 elements:
  6320. //Member 0 must be a Boolean type scalar(LOD),
  6321. //Member 1 must be a vector of integer type, whose Signedness operand is 0(anchor),
  6322. //Member 2 must be a vector of integer type, whose Signedness operand is 0(offset),
  6323. //Member 3 must be a vector of integer type, whose Signedness operand is 0(mask),
  6324. //Member 4 must be a scalar of integer type, whose Signedness operand is 0(lod),
  6325. //Member 5 must be a scalar of integer type, whose Signedness operand is 0(granularity).
  6326. std::vector<spv::Id> members;
  6327. members.push_back(resultType());
  6328. for (int i = 0; i < 5; i++) {
  6329. members.push_back(builder.getContainedTypeId(resultStructType, i));
  6330. }
  6331. spv::Id resType = builder.makeStructType(members, "ResType");
  6332. //call ImageFootprintNV
  6333. spv::Id res = builder.createTextureCall(precision, resType, sparse, cracked.fetch, cracked.proj,
  6334. cracked.gather, noImplicitLod, params, signExtensionMask());
  6335. //copy resType (SPIR-V type) to resultStructType(OpenGL type)
  6336. for (int i = 0; i < 5; i++) {
  6337. builder.clearAccessChain();
  6338. builder.setAccessChainLValue(resultStruct);
  6339. //Accessing to a struct we created, no coherent flag is set
  6340. spv::Builder::AccessChain::CoherentFlags flags;
  6341. flags.clear();
  6342. builder.accessChainPush(builder.makeIntConstant(i), flags, 0);
  6343. builder.accessChainStore(builder.createCompositeExtract(res, builder.getContainedTypeId(resType, i+1),
  6344. i+1), TranslateNonUniformDecoration(imageType.getQualifier()));
  6345. }
  6346. return builder.createCompositeExtract(res, resultType(), 0);
  6347. }
  6348. // projective component (might not need to move)
  6349. // GLSL: "The texture coordinates consumed from P, not including the last component of P,
  6350. // are divided by the last component of P."
  6351. // SPIR-V: "... (u [, v] [, w], q)... It may be a vector larger than needed, but all
  6352. // unused components will appear after all used components."
  6353. if (cracked.proj) {
  6354. int projSourceComp = builder.getNumComponents(params.coords) - 1;
  6355. int projTargetComp;
  6356. switch (sampler.dim) {
  6357. case glslang::Esd1D: projTargetComp = 1; break;
  6358. case glslang::Esd2D: projTargetComp = 2; break;
  6359. case glslang::EsdRect: projTargetComp = 2; break;
  6360. default: projTargetComp = projSourceComp; break;
  6361. }
  6362. // copy the projective coordinate if we have to
  6363. if (projTargetComp != projSourceComp) {
  6364. spv::Id projComp = builder.createCompositeExtract(params.coords,
  6365. builder.getScalarTypeId(builder.getTypeId(params.coords)), projSourceComp);
  6366. params.coords = builder.createCompositeInsert(projComp, params.coords,
  6367. builder.getTypeId(params.coords), projTargetComp);
  6368. }
  6369. }
  6370. // nonprivate
  6371. if (imageType.getQualifier().nonprivate) {
  6372. params.nonprivate = true;
  6373. }
  6374. // volatile
  6375. if (imageType.getQualifier().volatil) {
  6376. params.volatil = true;
  6377. }
  6378. if (imageType.getQualifier().nontemporal) {
  6379. params.nontemporal = true;
  6380. }
  6381. std::vector<spv::Id> result( 1,
  6382. builder.createTextureCall(precision, resultType(), sparse, cracked.fetch, cracked.proj, cracked.gather,
  6383. noImplicitLod, params, signExtensionMask())
  6384. );
  6385. if (components != node->getType().getVectorSize())
  6386. result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));
  6387. return result[0];
  6388. }
  6389. spv::Id TGlslangToSpvTraverser::handleUserFunctionCall(const glslang::TIntermAggregate* node)
  6390. {
  6391. // Grab the function's pointer from the previously created function
  6392. spv::Function* function = functionMap[node->getName().c_str()];
  6393. if (! function)
  6394. return 0;
  6395. const glslang::TIntermSequence& glslangArgs = node->getSequence();
  6396. const glslang::TQualifierList& qualifiers = node->getQualifierList();
  6397. // See comments in makeFunctions() for details about the semantics for parameter passing.
  6398. //
  6399. // These imply we need a four step process:
  6400. // 1. Evaluate the arguments
  6401. // 2. Allocate and make copies of in, out, and inout arguments
  6402. // 3. Make the call
  6403. // 4. Copy back the results
  6404. // 1. Evaluate the arguments and their types
  6405. std::vector<spv::Builder::AccessChain> lValues;
  6406. std::vector<spv::Id> rValues;
  6407. std::vector<const glslang::TType*> argTypes;
  6408. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  6409. argTypes.push_back(&glslangArgs[a]->getAsTyped()->getType());
  6410. // build l-value
  6411. builder.clearAccessChain();
  6412. glslangArgs[a]->traverse(this);
  6413. // keep outputs and pass-by-originals as l-values, evaluate others as r-values
  6414. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0) ||
  6415. writableParam(qualifiers[a])) {
  6416. // save l-value
  6417. lValues.push_back(builder.getAccessChain());
  6418. } else {
  6419. // process r-value
  6420. rValues.push_back(accessChainLoad(*argTypes.back()));
  6421. }
  6422. }
  6423. // Reset source location to the function call location after argument evaluation
  6424. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  6425. // 2. Allocate space for anything needing a copy, and if it's "in" or "inout"
  6426. // copy the original into that space.
  6427. //
  6428. // Also, build up the list of actual arguments to pass in for the call
  6429. int lValueCount = 0;
  6430. int rValueCount = 0;
  6431. std::vector<spv::Id> spvArgs;
  6432. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  6433. spv::Id arg;
  6434. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0)) {
  6435. builder.setAccessChain(lValues[lValueCount]);
  6436. arg = builder.accessChainGetLValue();
  6437. ++lValueCount;
  6438. } else if (writableParam(qualifiers[a])) {
  6439. // need space to hold the copy
  6440. arg = builder.createVariable(function->getParamPrecision(a), spv::StorageClass::Function,
  6441. builder.getContainedTypeId(function->getParamType(a)), "param");
  6442. if (qualifiers[a] == glslang::EvqIn || qualifiers[a] == glslang::EvqInOut) {
  6443. // need to copy the input into output space
  6444. builder.setAccessChain(lValues[lValueCount]);
  6445. spv::Id copy = accessChainLoad(*argTypes[a]);
  6446. builder.clearAccessChain();
  6447. builder.setAccessChainLValue(arg);
  6448. multiTypeStore(*argTypes[a], copy);
  6449. }
  6450. ++lValueCount;
  6451. } else {
  6452. // process r-value, which involves a copy for a type mismatch
  6453. if (function->getParamType(a) != builder.getTypeId(rValues[rValueCount]) ||
  6454. TranslatePrecisionDecoration(*argTypes[a]) != function->getParamPrecision(a))
  6455. {
  6456. spv::Id argCopy = builder.createVariable(function->getParamPrecision(a), spv::StorageClass::Function, function->getParamType(a), "arg");
  6457. builder.clearAccessChain();
  6458. builder.setAccessChainLValue(argCopy);
  6459. multiTypeStore(*argTypes[a], rValues[rValueCount]);
  6460. arg = builder.createLoad(argCopy, function->getParamPrecision(a));
  6461. } else
  6462. arg = rValues[rValueCount];
  6463. ++rValueCount;
  6464. }
  6465. spvArgs.push_back(arg);
  6466. }
  6467. // 3. Make the call.
  6468. spv::Id result = builder.createFunctionCall(function, spvArgs);
  6469. builder.setPrecision(result, TranslatePrecisionDecoration(node->getType()));
  6470. builder.addDecoration(result, TranslateNonUniformDecoration(node->getType().getQualifier()));
  6471. // 4. Copy back out an "out" arguments.
  6472. lValueCount = 0;
  6473. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  6474. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0))
  6475. ++lValueCount;
  6476. else if (writableParam(qualifiers[a])) {
  6477. if (qualifiers[a] == glslang::EvqOut || qualifiers[a] == glslang::EvqInOut) {
  6478. spv::Id copy = builder.createLoad(spvArgs[a], spv::NoPrecision);
  6479. builder.addDecoration(copy, TranslateNonUniformDecoration(argTypes[a]->getQualifier()));
  6480. builder.setAccessChain(lValues[lValueCount]);
  6481. multiTypeStore(*argTypes[a], copy);
  6482. }
  6483. ++lValueCount;
  6484. }
  6485. }
  6486. return result;
  6487. }
  6488. // Translate AST operation to SPV operation, already having SPV-based operands/types.
  6489. spv::Id TGlslangToSpvTraverser::createBinaryOperation(glslang::TOperator op, OpDecorations& decorations,
  6490. spv::Id typeId, spv::Id left, spv::Id right,
  6491. glslang::TBasicType typeProxy, bool reduceComparison)
  6492. {
  6493. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  6494. bool isFloat = isTypeFloat(typeProxy);
  6495. bool isBool = typeProxy == glslang::EbtBool;
  6496. spv::Op binOp = spv::Op::OpNop;
  6497. bool needMatchingVectors = true; // for non-matrix ops, would a scalar need to smear to match a vector?
  6498. bool comparison = false;
  6499. switch (op) {
  6500. case glslang::EOpAdd:
  6501. case glslang::EOpAddAssign:
  6502. if (isFloat)
  6503. binOp = spv::Op::OpFAdd;
  6504. else
  6505. binOp = spv::Op::OpIAdd;
  6506. break;
  6507. case glslang::EOpSub:
  6508. case glslang::EOpSubAssign:
  6509. if (isFloat)
  6510. binOp = spv::Op::OpFSub;
  6511. else
  6512. binOp = spv::Op::OpISub;
  6513. break;
  6514. case glslang::EOpMul:
  6515. case glslang::EOpMulAssign:
  6516. if (isFloat)
  6517. binOp = spv::Op::OpFMul;
  6518. else
  6519. binOp = spv::Op::OpIMul;
  6520. break;
  6521. case glslang::EOpVectorTimesScalar:
  6522. case glslang::EOpVectorTimesScalarAssign:
  6523. if (isFloat && (builder.isVector(left) || builder.isVector(right) || builder.isCooperativeVector(left) || builder.isCooperativeVector(right))) {
  6524. if (builder.isVector(right) || builder.isCooperativeVector(right))
  6525. std::swap(left, right);
  6526. assert(builder.isScalar(right));
  6527. needMatchingVectors = false;
  6528. binOp = spv::Op::OpVectorTimesScalar;
  6529. } else if (isFloat) {
  6530. binOp = spv::Op::OpFMul;
  6531. } else if (builder.isCooperativeVector(left) || builder.isCooperativeVector(right)) {
  6532. if (builder.isCooperativeVector(right))
  6533. std::swap(left, right);
  6534. assert(builder.isScalar(right));
  6535. // Construct a cooperative vector from the scalar
  6536. right = builder.createCompositeConstruct(builder.getTypeId(left), { right });
  6537. binOp = spv::Op::OpIMul;
  6538. } else {
  6539. binOp = spv::Op::OpIMul;
  6540. }
  6541. break;
  6542. case glslang::EOpVectorTimesMatrix:
  6543. case glslang::EOpVectorTimesMatrixAssign:
  6544. binOp = spv::Op::OpVectorTimesMatrix;
  6545. break;
  6546. case glslang::EOpMatrixTimesVector:
  6547. binOp = spv::Op::OpMatrixTimesVector;
  6548. break;
  6549. case glslang::EOpMatrixTimesScalar:
  6550. case glslang::EOpMatrixTimesScalarAssign:
  6551. binOp = spv::Op::OpMatrixTimesScalar;
  6552. break;
  6553. case glslang::EOpMatrixTimesMatrix:
  6554. case glslang::EOpMatrixTimesMatrixAssign:
  6555. binOp = spv::Op::OpMatrixTimesMatrix;
  6556. break;
  6557. case glslang::EOpOuterProduct:
  6558. binOp = spv::Op::OpOuterProduct;
  6559. needMatchingVectors = false;
  6560. break;
  6561. case glslang::EOpDiv:
  6562. case glslang::EOpDivAssign:
  6563. if (isFloat)
  6564. binOp = spv::Op::OpFDiv;
  6565. else if (isUnsigned)
  6566. binOp = spv::Op::OpUDiv;
  6567. else
  6568. binOp = spv::Op::OpSDiv;
  6569. break;
  6570. case glslang::EOpMod:
  6571. case glslang::EOpModAssign:
  6572. if (isFloat)
  6573. binOp = spv::Op::OpFMod;
  6574. else if (isUnsigned)
  6575. binOp = spv::Op::OpUMod;
  6576. else
  6577. binOp = spv::Op::OpSMod;
  6578. break;
  6579. case glslang::EOpRightShift:
  6580. case glslang::EOpRightShiftAssign:
  6581. if (isUnsigned)
  6582. binOp = spv::Op::OpShiftRightLogical;
  6583. else
  6584. binOp = spv::Op::OpShiftRightArithmetic;
  6585. break;
  6586. case glslang::EOpLeftShift:
  6587. case glslang::EOpLeftShiftAssign:
  6588. binOp = spv::Op::OpShiftLeftLogical;
  6589. break;
  6590. case glslang::EOpAnd:
  6591. case glslang::EOpAndAssign:
  6592. binOp = spv::Op::OpBitwiseAnd;
  6593. break;
  6594. case glslang::EOpLogicalAnd:
  6595. needMatchingVectors = false;
  6596. binOp = spv::Op::OpLogicalAnd;
  6597. break;
  6598. case glslang::EOpInclusiveOr:
  6599. case glslang::EOpInclusiveOrAssign:
  6600. binOp = spv::Op::OpBitwiseOr;
  6601. break;
  6602. case glslang::EOpLogicalOr:
  6603. needMatchingVectors = false;
  6604. binOp = spv::Op::OpLogicalOr;
  6605. break;
  6606. case glslang::EOpExclusiveOr:
  6607. case glslang::EOpExclusiveOrAssign:
  6608. binOp = spv::Op::OpBitwiseXor;
  6609. break;
  6610. case glslang::EOpLogicalXor:
  6611. needMatchingVectors = false;
  6612. binOp = spv::Op::OpLogicalNotEqual;
  6613. break;
  6614. case glslang::EOpAbsDifference:
  6615. binOp = isUnsigned ? spv::Op::OpAbsUSubINTEL : spv::Op::OpAbsISubINTEL;
  6616. break;
  6617. case glslang::EOpAddSaturate:
  6618. binOp = isUnsigned ? spv::Op::OpUAddSatINTEL : spv::Op::OpIAddSatINTEL;
  6619. break;
  6620. case glslang::EOpSubSaturate:
  6621. binOp = isUnsigned ? spv::Op::OpUSubSatINTEL : spv::Op::OpISubSatINTEL;
  6622. break;
  6623. case glslang::EOpAverage:
  6624. binOp = isUnsigned ? spv::Op::OpUAverageINTEL : spv::Op::OpIAverageINTEL;
  6625. break;
  6626. case glslang::EOpAverageRounded:
  6627. binOp = isUnsigned ? spv::Op::OpUAverageRoundedINTEL : spv::Op::OpIAverageRoundedINTEL;
  6628. break;
  6629. case glslang::EOpMul32x16:
  6630. binOp = isUnsigned ? spv::Op::OpUMul32x16INTEL : spv::Op::OpIMul32x16INTEL;
  6631. break;
  6632. case glslang::EOpExpectEXT:
  6633. binOp = spv::Op::OpExpectKHR;
  6634. break;
  6635. case glslang::EOpLessThan:
  6636. case glslang::EOpGreaterThan:
  6637. case glslang::EOpLessThanEqual:
  6638. case glslang::EOpGreaterThanEqual:
  6639. case glslang::EOpEqual:
  6640. case glslang::EOpNotEqual:
  6641. case glslang::EOpVectorEqual:
  6642. case glslang::EOpVectorNotEqual:
  6643. comparison = true;
  6644. break;
  6645. default:
  6646. break;
  6647. }
  6648. // handle mapped binary operations (should be non-comparison)
  6649. if (binOp != spv::Op::OpNop) {
  6650. assert(comparison == false);
  6651. if (builder.isMatrix(left) || builder.isMatrix(right) ||
  6652. builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))
  6653. return createBinaryMatrixOperation(binOp, decorations, typeId, left, right);
  6654. // No matrix involved; make both operands be the same number of components, if needed
  6655. if (needMatchingVectors)
  6656. builder.promoteScalar(decorations.precision, left, right);
  6657. spv::Id result = builder.createBinOp(binOp, typeId, left, right);
  6658. decorations.addNoContraction(builder, result);
  6659. decorations.addNonUniform(builder, result);
  6660. return builder.setPrecision(result, decorations.precision);
  6661. }
  6662. if (! comparison)
  6663. return 0;
  6664. // Handle comparison instructions
  6665. if (reduceComparison && (op == glslang::EOpEqual || op == glslang::EOpNotEqual)
  6666. && (builder.isVector(left) || builder.isMatrix(left) || builder.isAggregate(left))) {
  6667. spv::Id result = builder.createCompositeCompare(decorations.precision, left, right, op == glslang::EOpEqual);
  6668. decorations.addNonUniform(builder, result);
  6669. return result;
  6670. }
  6671. switch (op) {
  6672. case glslang::EOpLessThan:
  6673. if (isFloat)
  6674. binOp = spv::Op::OpFOrdLessThan;
  6675. else if (isUnsigned)
  6676. binOp = spv::Op::OpULessThan;
  6677. else
  6678. binOp = spv::Op::OpSLessThan;
  6679. break;
  6680. case glslang::EOpGreaterThan:
  6681. if (isFloat)
  6682. binOp = spv::Op::OpFOrdGreaterThan;
  6683. else if (isUnsigned)
  6684. binOp = spv::Op::OpUGreaterThan;
  6685. else
  6686. binOp = spv::Op::OpSGreaterThan;
  6687. break;
  6688. case glslang::EOpLessThanEqual:
  6689. if (isFloat)
  6690. binOp = spv::Op::OpFOrdLessThanEqual;
  6691. else if (isUnsigned)
  6692. binOp = spv::Op::OpULessThanEqual;
  6693. else
  6694. binOp = spv::Op::OpSLessThanEqual;
  6695. break;
  6696. case glslang::EOpGreaterThanEqual:
  6697. if (isFloat)
  6698. binOp = spv::Op::OpFOrdGreaterThanEqual;
  6699. else if (isUnsigned)
  6700. binOp = spv::Op::OpUGreaterThanEqual;
  6701. else
  6702. binOp = spv::Op::OpSGreaterThanEqual;
  6703. break;
  6704. case glslang::EOpEqual:
  6705. case glslang::EOpVectorEqual:
  6706. if (isFloat)
  6707. binOp = spv::Op::OpFOrdEqual;
  6708. else if (isBool)
  6709. binOp = spv::Op::OpLogicalEqual;
  6710. else
  6711. binOp = spv::Op::OpIEqual;
  6712. break;
  6713. case glslang::EOpNotEqual:
  6714. case glslang::EOpVectorNotEqual:
  6715. if (isFloat)
  6716. binOp = spv::Op::OpFUnordNotEqual;
  6717. else if (isBool)
  6718. binOp = spv::Op::OpLogicalNotEqual;
  6719. else
  6720. binOp = spv::Op::OpINotEqual;
  6721. break;
  6722. default:
  6723. break;
  6724. }
  6725. if (binOp != spv::Op::OpNop) {
  6726. spv::Id result = builder.createBinOp(binOp, typeId, left, right);
  6727. decorations.addNoContraction(builder, result);
  6728. decorations.addNonUniform(builder, result);
  6729. return builder.setPrecision(result, decorations.precision);
  6730. }
  6731. return 0;
  6732. }
  6733. //
  6734. // Translate AST matrix operation to SPV operation, already having SPV-based operands/types.
  6735. // These can be any of:
  6736. //
  6737. // matrix * scalar
  6738. // scalar * matrix
  6739. // matrix * matrix linear algebraic
  6740. // matrix * vector
  6741. // vector * matrix
  6742. // matrix * matrix componentwise
  6743. // matrix op matrix op in {+, -, /}
  6744. // matrix op scalar op in {+, -, /}
  6745. // scalar op matrix op in {+, -, /}
  6746. //
  6747. spv::Id TGlslangToSpvTraverser::createBinaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,
  6748. spv::Id left, spv::Id right)
  6749. {
  6750. bool firstClass = true;
  6751. // First, handle first-class matrix operations (* and matrix/scalar)
  6752. switch (op) {
  6753. case spv::Op::OpFDiv:
  6754. if (builder.isMatrix(left) && builder.isScalar(right)) {
  6755. // turn matrix / scalar into a multiply...
  6756. spv::Id resultType = builder.getTypeId(right);
  6757. right = builder.createBinOp(spv::Op::OpFDiv, resultType, builder.makeFpConstant(resultType, 1.0), right);
  6758. op = spv::Op::OpMatrixTimesScalar;
  6759. } else
  6760. firstClass = false;
  6761. break;
  6762. case spv::Op::OpMatrixTimesScalar:
  6763. if (builder.isMatrix(right) || builder.isCooperativeMatrix(right))
  6764. std::swap(left, right);
  6765. assert(builder.isScalar(right));
  6766. break;
  6767. case spv::Op::OpVectorTimesMatrix:
  6768. assert(builder.isVector(left));
  6769. assert(builder.isMatrix(right));
  6770. break;
  6771. case spv::Op::OpMatrixTimesVector:
  6772. assert(builder.isMatrix(left));
  6773. assert(builder.isVector(right));
  6774. break;
  6775. case spv::Op::OpMatrixTimesMatrix:
  6776. assert(builder.isMatrix(left));
  6777. assert(builder.isMatrix(right));
  6778. break;
  6779. default:
  6780. firstClass = false;
  6781. break;
  6782. }
  6783. if (builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))
  6784. firstClass = true;
  6785. if (firstClass) {
  6786. spv::Id result = builder.createBinOp(op, typeId, left, right);
  6787. decorations.addNoContraction(builder, result);
  6788. decorations.addNonUniform(builder, result);
  6789. return builder.setPrecision(result, decorations.precision);
  6790. }
  6791. // Handle component-wise +, -, *, %, and / for all combinations of type.
  6792. // The result type of all of them is the same type as the (a) matrix operand.
  6793. // The algorithm is to:
  6794. // - break the matrix(es) into vectors
  6795. // - smear any scalar to a vector
  6796. // - do vector operations
  6797. // - make a matrix out the vector results
  6798. switch (op) {
  6799. case spv::Op::OpFAdd:
  6800. case spv::Op::OpFSub:
  6801. case spv::Op::OpFDiv:
  6802. case spv::Op::OpFMod:
  6803. case spv::Op::OpFMul:
  6804. {
  6805. // one time set up...
  6806. bool leftMat = builder.isMatrix(left);
  6807. bool rightMat = builder.isMatrix(right);
  6808. unsigned int numCols = leftMat ? builder.getNumColumns(left) : builder.getNumColumns(right);
  6809. int numRows = leftMat ? builder.getNumRows(left) : builder.getNumRows(right);
  6810. spv::Id scalarType = builder.getScalarTypeId(typeId);
  6811. spv::Id vecType = builder.makeVectorType(scalarType, numRows);
  6812. std::vector<spv::Id> results;
  6813. spv::Id smearVec = spv::NoResult;
  6814. if (builder.isScalar(left))
  6815. smearVec = builder.smearScalar(decorations.precision, left, vecType);
  6816. else if (builder.isScalar(right))
  6817. smearVec = builder.smearScalar(decorations.precision, right, vecType);
  6818. // do each vector op
  6819. for (unsigned int c = 0; c < numCols; ++c) {
  6820. std::vector<unsigned int> indexes;
  6821. indexes.push_back(c);
  6822. spv::Id leftVec = leftMat ? builder.createCompositeExtract( left, vecType, indexes) : smearVec;
  6823. spv::Id rightVec = rightMat ? builder.createCompositeExtract(right, vecType, indexes) : smearVec;
  6824. spv::Id result = builder.createBinOp(op, vecType, leftVec, rightVec);
  6825. decorations.addNoContraction(builder, result);
  6826. decorations.addNonUniform(builder, result);
  6827. results.push_back(builder.setPrecision(result, decorations.precision));
  6828. }
  6829. // put the pieces together
  6830. spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);
  6831. decorations.addNonUniform(builder, result);
  6832. return result;
  6833. }
  6834. default:
  6835. assert(0);
  6836. return spv::NoResult;
  6837. }
  6838. }
  6839. spv::Id TGlslangToSpvTraverser::createUnaryOperation(glslang::TOperator op, OpDecorations& decorations, spv::Id typeId,
  6840. spv::Id operand, glslang::TBasicType typeProxy, const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
  6841. const glslang::TType &opType)
  6842. {
  6843. spv::Op unaryOp = spv::Op::OpNop;
  6844. int extBuiltins = -1;
  6845. int libCall = -1;
  6846. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  6847. bool isFloat = isTypeFloat(typeProxy);
  6848. switch (op) {
  6849. case glslang::EOpNegative:
  6850. if (isFloat) {
  6851. unaryOp = spv::Op::OpFNegate;
  6852. if (builder.isMatrixType(typeId))
  6853. return createUnaryMatrixOperation(unaryOp, decorations, typeId, operand, typeProxy);
  6854. } else
  6855. unaryOp = spv::Op::OpSNegate;
  6856. break;
  6857. case glslang::EOpLogicalNot:
  6858. case glslang::EOpVectorLogicalNot:
  6859. unaryOp = spv::Op::OpLogicalNot;
  6860. break;
  6861. case glslang::EOpBitwiseNot:
  6862. unaryOp = spv::Op::OpNot;
  6863. break;
  6864. case glslang::EOpDeterminant:
  6865. libCall = spv::GLSLstd450Determinant;
  6866. break;
  6867. case glslang::EOpMatrixInverse:
  6868. libCall = spv::GLSLstd450MatrixInverse;
  6869. break;
  6870. case glslang::EOpTranspose:
  6871. unaryOp = spv::Op::OpTranspose;
  6872. break;
  6873. case glslang::EOpRadians:
  6874. libCall = spv::GLSLstd450Radians;
  6875. break;
  6876. case glslang::EOpDegrees:
  6877. libCall = spv::GLSLstd450Degrees;
  6878. break;
  6879. case glslang::EOpSin:
  6880. libCall = spv::GLSLstd450Sin;
  6881. break;
  6882. case glslang::EOpCos:
  6883. libCall = spv::GLSLstd450Cos;
  6884. break;
  6885. case glslang::EOpTan:
  6886. libCall = spv::GLSLstd450Tan;
  6887. break;
  6888. case glslang::EOpAcos:
  6889. libCall = spv::GLSLstd450Acos;
  6890. break;
  6891. case glslang::EOpAsin:
  6892. libCall = spv::GLSLstd450Asin;
  6893. break;
  6894. case glslang::EOpAtan:
  6895. libCall = spv::GLSLstd450Atan;
  6896. break;
  6897. case glslang::EOpAcosh:
  6898. libCall = spv::GLSLstd450Acosh;
  6899. break;
  6900. case glslang::EOpAsinh:
  6901. libCall = spv::GLSLstd450Asinh;
  6902. break;
  6903. case glslang::EOpAtanh:
  6904. libCall = spv::GLSLstd450Atanh;
  6905. break;
  6906. case glslang::EOpTanh:
  6907. libCall = spv::GLSLstd450Tanh;
  6908. break;
  6909. case glslang::EOpCosh:
  6910. libCall = spv::GLSLstd450Cosh;
  6911. break;
  6912. case glslang::EOpSinh:
  6913. libCall = spv::GLSLstd450Sinh;
  6914. break;
  6915. case glslang::EOpLength:
  6916. libCall = spv::GLSLstd450Length;
  6917. break;
  6918. case glslang::EOpNormalize:
  6919. libCall = spv::GLSLstd450Normalize;
  6920. break;
  6921. case glslang::EOpExp:
  6922. libCall = spv::GLSLstd450Exp;
  6923. break;
  6924. case glslang::EOpLog:
  6925. libCall = spv::GLSLstd450Log;
  6926. break;
  6927. case glslang::EOpExp2:
  6928. libCall = spv::GLSLstd450Exp2;
  6929. break;
  6930. case glslang::EOpLog2:
  6931. libCall = spv::GLSLstd450Log2;
  6932. break;
  6933. case glslang::EOpSqrt:
  6934. libCall = spv::GLSLstd450Sqrt;
  6935. break;
  6936. case glslang::EOpInverseSqrt:
  6937. libCall = spv::GLSLstd450InverseSqrt;
  6938. break;
  6939. case glslang::EOpFloor:
  6940. libCall = spv::GLSLstd450Floor;
  6941. break;
  6942. case glslang::EOpTrunc:
  6943. libCall = spv::GLSLstd450Trunc;
  6944. break;
  6945. case glslang::EOpRound:
  6946. libCall = spv::GLSLstd450Round;
  6947. break;
  6948. case glslang::EOpRoundEven:
  6949. libCall = spv::GLSLstd450RoundEven;
  6950. break;
  6951. case glslang::EOpCeil:
  6952. libCall = spv::GLSLstd450Ceil;
  6953. break;
  6954. case glslang::EOpFract:
  6955. libCall = spv::GLSLstd450Fract;
  6956. break;
  6957. case glslang::EOpIsNan:
  6958. unaryOp = spv::Op::OpIsNan;
  6959. break;
  6960. case glslang::EOpIsInf:
  6961. unaryOp = spv::Op::OpIsInf;
  6962. break;
  6963. case glslang::EOpIsFinite:
  6964. unaryOp = spv::Op::OpIsFinite;
  6965. break;
  6966. case glslang::EOpFloatBitsToInt:
  6967. case glslang::EOpFloatBitsToUint:
  6968. case glslang::EOpIntBitsToFloat:
  6969. case glslang::EOpUintBitsToFloat:
  6970. case glslang::EOpDoubleBitsToInt64:
  6971. case glslang::EOpDoubleBitsToUint64:
  6972. case glslang::EOpInt64BitsToDouble:
  6973. case glslang::EOpUint64BitsToDouble:
  6974. case glslang::EOpFloat16BitsToInt16:
  6975. case glslang::EOpFloat16BitsToUint16:
  6976. case glslang::EOpInt16BitsToFloat16:
  6977. case glslang::EOpUint16BitsToFloat16:
  6978. unaryOp = spv::Op::OpBitcast;
  6979. break;
  6980. case glslang::EOpPackSnorm2x16:
  6981. libCall = spv::GLSLstd450PackSnorm2x16;
  6982. break;
  6983. case glslang::EOpUnpackSnorm2x16:
  6984. libCall = spv::GLSLstd450UnpackSnorm2x16;
  6985. break;
  6986. case glslang::EOpPackUnorm2x16:
  6987. libCall = spv::GLSLstd450PackUnorm2x16;
  6988. break;
  6989. case glslang::EOpUnpackUnorm2x16:
  6990. libCall = spv::GLSLstd450UnpackUnorm2x16;
  6991. break;
  6992. case glslang::EOpPackHalf2x16:
  6993. libCall = spv::GLSLstd450PackHalf2x16;
  6994. break;
  6995. case glslang::EOpUnpackHalf2x16:
  6996. libCall = spv::GLSLstd450UnpackHalf2x16;
  6997. break;
  6998. case glslang::EOpPackSnorm4x8:
  6999. libCall = spv::GLSLstd450PackSnorm4x8;
  7000. break;
  7001. case glslang::EOpUnpackSnorm4x8:
  7002. libCall = spv::GLSLstd450UnpackSnorm4x8;
  7003. break;
  7004. case glslang::EOpPackUnorm4x8:
  7005. libCall = spv::GLSLstd450PackUnorm4x8;
  7006. break;
  7007. case glslang::EOpUnpackUnorm4x8:
  7008. libCall = spv::GLSLstd450UnpackUnorm4x8;
  7009. break;
  7010. case glslang::EOpPackDouble2x32:
  7011. libCall = spv::GLSLstd450PackDouble2x32;
  7012. break;
  7013. case glslang::EOpUnpackDouble2x32:
  7014. libCall = spv::GLSLstd450UnpackDouble2x32;
  7015. break;
  7016. case glslang::EOpPackInt2x32:
  7017. case glslang::EOpUnpackInt2x32:
  7018. case glslang::EOpPackUint2x32:
  7019. case glslang::EOpUnpackUint2x32:
  7020. case glslang::EOpPack16:
  7021. case glslang::EOpPack32:
  7022. case glslang::EOpPack64:
  7023. case glslang::EOpUnpack32:
  7024. case glslang::EOpUnpack16:
  7025. case glslang::EOpUnpack8:
  7026. case glslang::EOpPackInt2x16:
  7027. case glslang::EOpUnpackInt2x16:
  7028. case glslang::EOpPackUint2x16:
  7029. case glslang::EOpUnpackUint2x16:
  7030. case glslang::EOpPackInt4x16:
  7031. case glslang::EOpUnpackInt4x16:
  7032. case glslang::EOpPackUint4x16:
  7033. case glslang::EOpUnpackUint4x16:
  7034. case glslang::EOpPackFloat2x16:
  7035. case glslang::EOpUnpackFloat2x16:
  7036. unaryOp = spv::Op::OpBitcast;
  7037. break;
  7038. case glslang::EOpDPdx:
  7039. unaryOp = spv::Op::OpDPdx;
  7040. break;
  7041. case glslang::EOpDPdy:
  7042. unaryOp = spv::Op::OpDPdy;
  7043. break;
  7044. case glslang::EOpFwidth:
  7045. unaryOp = spv::Op::OpFwidth;
  7046. break;
  7047. case glslang::EOpAny:
  7048. unaryOp = spv::Op::OpAny;
  7049. break;
  7050. case glslang::EOpAll:
  7051. unaryOp = spv::Op::OpAll;
  7052. break;
  7053. case glslang::EOpAbs:
  7054. if (isFloat)
  7055. libCall = spv::GLSLstd450FAbs;
  7056. else
  7057. libCall = spv::GLSLstd450SAbs;
  7058. break;
  7059. case glslang::EOpSign:
  7060. if (isFloat)
  7061. libCall = spv::GLSLstd450FSign;
  7062. else
  7063. libCall = spv::GLSLstd450SSign;
  7064. break;
  7065. case glslang::EOpDPdxFine:
  7066. unaryOp = spv::Op::OpDPdxFine;
  7067. break;
  7068. case glslang::EOpDPdyFine:
  7069. unaryOp = spv::Op::OpDPdyFine;
  7070. break;
  7071. case glslang::EOpFwidthFine:
  7072. unaryOp = spv::Op::OpFwidthFine;
  7073. break;
  7074. case glslang::EOpDPdxCoarse:
  7075. unaryOp = spv::Op::OpDPdxCoarse;
  7076. break;
  7077. case glslang::EOpDPdyCoarse:
  7078. unaryOp = spv::Op::OpDPdyCoarse;
  7079. break;
  7080. case glslang::EOpFwidthCoarse:
  7081. unaryOp = spv::Op::OpFwidthCoarse;
  7082. break;
  7083. case glslang::EOpRayQueryProceed:
  7084. unaryOp = spv::Op::OpRayQueryProceedKHR;
  7085. break;
  7086. case glslang::EOpRayQueryGetRayTMin:
  7087. unaryOp = spv::Op::OpRayQueryGetRayTMinKHR;
  7088. break;
  7089. case glslang::EOpRayQueryGetRayFlags:
  7090. unaryOp = spv::Op::OpRayQueryGetRayFlagsKHR;
  7091. break;
  7092. case glslang::EOpRayQueryGetWorldRayOrigin:
  7093. unaryOp = spv::Op::OpRayQueryGetWorldRayOriginKHR;
  7094. break;
  7095. case glslang::EOpRayQueryGetWorldRayDirection:
  7096. unaryOp = spv::Op::OpRayQueryGetWorldRayDirectionKHR;
  7097. break;
  7098. case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
  7099. unaryOp = spv::Op::OpRayQueryGetIntersectionCandidateAABBOpaqueKHR;
  7100. break;
  7101. case glslang::EOpInterpolateAtCentroid:
  7102. if (typeProxy == glslang::EbtFloat16)
  7103. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  7104. libCall = spv::GLSLstd450InterpolateAtCentroid;
  7105. break;
  7106. case glslang::EOpAtomicCounterIncrement:
  7107. case glslang::EOpAtomicCounterDecrement:
  7108. case glslang::EOpAtomicCounter:
  7109. {
  7110. // Handle all of the atomics in one place, in createAtomicOperation()
  7111. std::vector<spv::Id> operands;
  7112. operands.push_back(operand);
  7113. return createAtomicOperation(op, decorations.precision, typeId, operands, typeProxy, lvalueCoherentFlags, opType);
  7114. }
  7115. case glslang::EOpBitFieldReverse:
  7116. unaryOp = spv::Op::OpBitReverse;
  7117. break;
  7118. case glslang::EOpBitCount:
  7119. unaryOp = spv::Op::OpBitCount;
  7120. break;
  7121. case glslang::EOpFindLSB:
  7122. libCall = spv::GLSLstd450FindILsb;
  7123. break;
  7124. case glslang::EOpFindMSB:
  7125. if (isUnsigned)
  7126. libCall = spv::GLSLstd450FindUMsb;
  7127. else
  7128. libCall = spv::GLSLstd450FindSMsb;
  7129. break;
  7130. case glslang::EOpCountLeadingZeros:
  7131. builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
  7132. builder.addExtension("SPV_INTEL_shader_integer_functions2");
  7133. unaryOp = spv::Op::OpUCountLeadingZerosINTEL;
  7134. break;
  7135. case glslang::EOpCountTrailingZeros:
  7136. builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
  7137. builder.addExtension("SPV_INTEL_shader_integer_functions2");
  7138. unaryOp = spv::Op::OpUCountTrailingZerosINTEL;
  7139. break;
  7140. case glslang::EOpBallot:
  7141. case glslang::EOpReadFirstInvocation:
  7142. case glslang::EOpAnyInvocation:
  7143. case glslang::EOpAllInvocations:
  7144. case glslang::EOpAllInvocationsEqual:
  7145. case glslang::EOpMinInvocations:
  7146. case glslang::EOpMaxInvocations:
  7147. case glslang::EOpAddInvocations:
  7148. case glslang::EOpMinInvocationsNonUniform:
  7149. case glslang::EOpMaxInvocationsNonUniform:
  7150. case glslang::EOpAddInvocationsNonUniform:
  7151. case glslang::EOpMinInvocationsInclusiveScan:
  7152. case glslang::EOpMaxInvocationsInclusiveScan:
  7153. case glslang::EOpAddInvocationsInclusiveScan:
  7154. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  7155. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  7156. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  7157. case glslang::EOpMinInvocationsExclusiveScan:
  7158. case glslang::EOpMaxInvocationsExclusiveScan:
  7159. case glslang::EOpAddInvocationsExclusiveScan:
  7160. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  7161. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  7162. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  7163. {
  7164. std::vector<spv::Id> operands;
  7165. operands.push_back(operand);
  7166. return createInvocationsOperation(op, typeId, operands, typeProxy);
  7167. }
  7168. case glslang::EOpSubgroupAll:
  7169. case glslang::EOpSubgroupAny:
  7170. case glslang::EOpSubgroupAllEqual:
  7171. case glslang::EOpSubgroupBroadcastFirst:
  7172. case glslang::EOpSubgroupBallot:
  7173. case glslang::EOpSubgroupInverseBallot:
  7174. case glslang::EOpSubgroupBallotBitCount:
  7175. case glslang::EOpSubgroupBallotInclusiveBitCount:
  7176. case glslang::EOpSubgroupBallotExclusiveBitCount:
  7177. case glslang::EOpSubgroupBallotFindLSB:
  7178. case glslang::EOpSubgroupBallotFindMSB:
  7179. case glslang::EOpSubgroupAdd:
  7180. case glslang::EOpSubgroupMul:
  7181. case glslang::EOpSubgroupMin:
  7182. case glslang::EOpSubgroupMax:
  7183. case glslang::EOpSubgroupAnd:
  7184. case glslang::EOpSubgroupOr:
  7185. case glslang::EOpSubgroupXor:
  7186. case glslang::EOpSubgroupInclusiveAdd:
  7187. case glslang::EOpSubgroupInclusiveMul:
  7188. case glslang::EOpSubgroupInclusiveMin:
  7189. case glslang::EOpSubgroupInclusiveMax:
  7190. case glslang::EOpSubgroupInclusiveAnd:
  7191. case glslang::EOpSubgroupInclusiveOr:
  7192. case glslang::EOpSubgroupInclusiveXor:
  7193. case glslang::EOpSubgroupExclusiveAdd:
  7194. case glslang::EOpSubgroupExclusiveMul:
  7195. case glslang::EOpSubgroupExclusiveMin:
  7196. case glslang::EOpSubgroupExclusiveMax:
  7197. case glslang::EOpSubgroupExclusiveAnd:
  7198. case glslang::EOpSubgroupExclusiveOr:
  7199. case glslang::EOpSubgroupExclusiveXor:
  7200. case glslang::EOpSubgroupQuadSwapHorizontal:
  7201. case glslang::EOpSubgroupQuadSwapVertical:
  7202. case glslang::EOpSubgroupQuadSwapDiagonal:
  7203. case glslang::EOpSubgroupQuadAll:
  7204. case glslang::EOpSubgroupQuadAny: {
  7205. std::vector<spv::Id> operands;
  7206. operands.push_back(operand);
  7207. return createSubgroupOperation(op, typeId, operands, typeProxy);
  7208. }
  7209. case glslang::EOpMbcnt:
  7210. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  7211. libCall = spv::MbcntAMD;
  7212. break;
  7213. case glslang::EOpCubeFaceIndex:
  7214. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);
  7215. libCall = spv::CubeFaceIndexAMD;
  7216. break;
  7217. case glslang::EOpCubeFaceCoord:
  7218. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);
  7219. libCall = spv::CubeFaceCoordAMD;
  7220. break;
  7221. case glslang::EOpSubgroupPartition:
  7222. unaryOp = spv::Op::OpGroupNonUniformPartitionNV;
  7223. break;
  7224. case glslang::EOpConstructReference:
  7225. unaryOp = spv::Op::OpBitcast;
  7226. break;
  7227. case glslang::EOpConvUint64ToAccStruct:
  7228. case glslang::EOpConvUvec2ToAccStruct:
  7229. unaryOp = spv::Op::OpConvertUToAccelerationStructureKHR;
  7230. break;
  7231. case glslang::EOpHitObjectIsEmptyNV:
  7232. unaryOp = spv::Op::OpHitObjectIsEmptyNV;
  7233. break;
  7234. case glslang::EOpHitObjectIsMissNV:
  7235. unaryOp = spv::Op::OpHitObjectIsMissNV;
  7236. break;
  7237. case glslang::EOpHitObjectIsHitNV:
  7238. unaryOp = spv::Op::OpHitObjectIsHitNV;
  7239. break;
  7240. case glslang::EOpHitObjectGetObjectRayOriginNV:
  7241. unaryOp = spv::Op::OpHitObjectGetObjectRayOriginNV;
  7242. break;
  7243. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  7244. unaryOp = spv::Op::OpHitObjectGetObjectRayDirectionNV;
  7245. break;
  7246. case glslang::EOpHitObjectGetWorldRayOriginNV:
  7247. unaryOp = spv::Op::OpHitObjectGetWorldRayOriginNV;
  7248. break;
  7249. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  7250. unaryOp = spv::Op::OpHitObjectGetWorldRayDirectionNV;
  7251. break;
  7252. case glslang::EOpHitObjectGetObjectToWorldNV:
  7253. unaryOp = spv::Op::OpHitObjectGetObjectToWorldNV;
  7254. break;
  7255. case glslang::EOpHitObjectGetWorldToObjectNV:
  7256. unaryOp = spv::Op::OpHitObjectGetWorldToObjectNV;
  7257. break;
  7258. case glslang::EOpHitObjectGetRayTMinNV:
  7259. unaryOp = spv::Op::OpHitObjectGetRayTMinNV;
  7260. break;
  7261. case glslang::EOpHitObjectGetRayTMaxNV:
  7262. unaryOp = spv::Op::OpHitObjectGetRayTMaxNV;
  7263. break;
  7264. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  7265. unaryOp = spv::Op::OpHitObjectGetPrimitiveIndexNV;
  7266. break;
  7267. case glslang::EOpHitObjectGetInstanceIdNV:
  7268. unaryOp = spv::Op::OpHitObjectGetInstanceIdNV;
  7269. break;
  7270. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  7271. unaryOp = spv::Op::OpHitObjectGetInstanceCustomIndexNV;
  7272. break;
  7273. case glslang::EOpHitObjectGetGeometryIndexNV:
  7274. unaryOp = spv::Op::OpHitObjectGetGeometryIndexNV;
  7275. break;
  7276. case glslang::EOpHitObjectGetHitKindNV:
  7277. unaryOp = spv::Op::OpHitObjectGetHitKindNV;
  7278. break;
  7279. case glslang::EOpHitObjectGetCurrentTimeNV:
  7280. unaryOp = spv::Op::OpHitObjectGetCurrentTimeNV;
  7281. break;
  7282. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  7283. unaryOp = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexNV;
  7284. break;
  7285. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  7286. unaryOp = spv::Op::OpHitObjectGetShaderRecordBufferHandleNV;
  7287. break;
  7288. case glslang::EOpHitObjectGetClusterIdNV:
  7289. unaryOp = spv::Op::OpHitObjectGetClusterIdNV;
  7290. builder.addExtension(spv::E_SPV_NV_cluster_acceleration_structure);
  7291. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7292. builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
  7293. break;
  7294. case glslang::EOpHitObjectGetSpherePositionNV:
  7295. unaryOp = spv::Op::OpHitObjectGetSpherePositionNV;
  7296. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7297. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7298. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  7299. break;
  7300. case glslang::EOpHitObjectGetSphereRadiusNV:
  7301. unaryOp = spv::Op::OpHitObjectGetSphereRadiusNV;
  7302. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7303. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7304. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  7305. break;
  7306. case glslang::EOpHitObjectIsSphereHitNV:
  7307. unaryOp = spv::Op::OpHitObjectIsSphereHitNV;
  7308. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7309. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7310. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  7311. break;
  7312. case glslang::EOpHitObjectIsLSSHitNV:
  7313. unaryOp = spv::Op::OpHitObjectIsLSSHitNV;
  7314. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7315. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7316. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  7317. break;
  7318. case glslang::EOpFetchMicroTriangleVertexPositionNV:
  7319. unaryOp = spv::Op::OpFetchMicroTriangleVertexPositionNV;
  7320. break;
  7321. case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
  7322. unaryOp = spv::Op::OpFetchMicroTriangleVertexBarycentricNV;
  7323. break;
  7324. case glslang::EOpCopyObject:
  7325. unaryOp = spv::Op::OpCopyObject;
  7326. break;
  7327. case glslang::EOpDepthAttachmentReadEXT:
  7328. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  7329. builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
  7330. unaryOp = spv::Op::OpDepthAttachmentReadEXT;
  7331. decorations.precision = spv::NoPrecision;
  7332. break;
  7333. case glslang::EOpStencilAttachmentReadEXT:
  7334. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  7335. builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
  7336. unaryOp = spv::Op::OpStencilAttachmentReadEXT;
  7337. decorations.precision = spv::Decoration::RelaxedPrecision;
  7338. break;
  7339. default:
  7340. return 0;
  7341. }
  7342. spv::Id id;
  7343. if (libCall >= 0) {
  7344. std::vector<spv::Id> args;
  7345. args.push_back(operand);
  7346. id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, args);
  7347. } else {
  7348. id = builder.createUnaryOp(unaryOp, typeId, operand);
  7349. }
  7350. decorations.addNoContraction(builder, id);
  7351. decorations.addNonUniform(builder, id);
  7352. return builder.setPrecision(id, decorations.precision);
  7353. }
  7354. // Create a unary operation on a matrix
  7355. spv::Id TGlslangToSpvTraverser::createUnaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,
  7356. spv::Id operand, glslang::TBasicType /* typeProxy */)
  7357. {
  7358. // Handle unary operations vector by vector.
  7359. // The result type is the same type as the original type.
  7360. // The algorithm is to:
  7361. // - break the matrix into vectors
  7362. // - apply the operation to each vector
  7363. // - make a matrix out the vector results
  7364. // get the types sorted out
  7365. int numCols = builder.getNumColumns(operand);
  7366. int numRows = builder.getNumRows(operand);
  7367. spv::Id srcVecType = builder.makeVectorType(builder.getScalarTypeId(builder.getTypeId(operand)), numRows);
  7368. spv::Id destVecType = builder.makeVectorType(builder.getScalarTypeId(typeId), numRows);
  7369. std::vector<spv::Id> results;
  7370. // do each vector op
  7371. for (int c = 0; c < numCols; ++c) {
  7372. std::vector<unsigned int> indexes;
  7373. indexes.push_back(c);
  7374. spv::Id srcVec = builder.createCompositeExtract(operand, srcVecType, indexes);
  7375. spv::Id destVec = builder.createUnaryOp(op, destVecType, srcVec);
  7376. decorations.addNoContraction(builder, destVec);
  7377. decorations.addNonUniform(builder, destVec);
  7378. results.push_back(builder.setPrecision(destVec, decorations.precision));
  7379. }
  7380. // put the pieces together
  7381. spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);
  7382. decorations.addNonUniform(builder, result);
  7383. return result;
  7384. }
  7385. // For converting integers where both the bitwidth and the signedness could
  7386. // change, but only do the width change here. The caller is still responsible
  7387. // for the signedness conversion.
  7388. // destType is the final type that will be converted to, but this function
  7389. // may only be doing part of that conversion.
  7390. spv::Id TGlslangToSpvTraverser::createIntWidthConversion(spv::Id operand, int vectorSize, spv::Id destType,
  7391. glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType)
  7392. {
  7393. // Get the result type width, based on the type to convert to.
  7394. int width = GetNumBits(resultBasicType);
  7395. // Get the conversion operation and result type,
  7396. // based on the target width, but the source type.
  7397. spv::Id type = spv::NoType;
  7398. spv::Op convOp = spv::Op::OpNop;
  7399. if (isTypeSignedInt(operandBasicType)) {
  7400. convOp = spv::Op::OpSConvert;
  7401. type = builder.makeIntType(width);
  7402. } else {
  7403. convOp = spv::Op::OpUConvert;
  7404. type = builder.makeUintType(width);
  7405. }
  7406. if (builder.getOpCode(destType) == spv::Op::OpTypeCooperativeVectorNV) {
  7407. type = builder.makeCooperativeVectorTypeNV(type, builder.getCooperativeVectorNumComponents(destType));
  7408. } else if (vectorSize > 0)
  7409. type = builder.makeVectorType(type, vectorSize);
  7410. else if (builder.getOpCode(destType) == spv::Op::OpTypeCooperativeMatrixKHR ||
  7411. builder.getOpCode(destType) == spv::Op::OpTypeCooperativeMatrixNV) {
  7412. type = builder.makeCooperativeMatrixTypeWithSameShape(type, destType);
  7413. }
  7414. return builder.createUnaryOp(convOp, type, operand);
  7415. }
  7416. spv::Id TGlslangToSpvTraverser::createConversion(glslang::TOperator op, OpDecorations& decorations, spv::Id destType,
  7417. spv::Id operand, glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType)
  7418. {
  7419. spv::Op convOp = spv::Op::OpNop;
  7420. spv::Id zero = 0;
  7421. spv::Id one = 0;
  7422. int vectorSize = builder.isVectorType(destType) ? builder.getNumTypeComponents(destType) : 0;
  7423. if (IsOpNumericConv(op) || op == glslang::EOpConstructSaturated) {
  7424. if (isTypeSignedInt(operandBasicType) && isTypeFloat(resultBasicType)) {
  7425. convOp = spv::Op::OpConvertSToF;
  7426. }
  7427. if (isTypeUnsignedInt(operandBasicType) && isTypeFloat(resultBasicType)) {
  7428. convOp = spv::Op::OpConvertUToF;
  7429. }
  7430. if (isTypeFloat(operandBasicType) && isTypeSignedInt(resultBasicType)) {
  7431. convOp = spv::Op::OpConvertFToS;
  7432. }
  7433. if (isTypeFloat(operandBasicType) && isTypeUnsignedInt(resultBasicType)) {
  7434. convOp = spv::Op::OpConvertFToU;
  7435. }
  7436. if (isTypeSignedInt(operandBasicType) && isTypeSignedInt(resultBasicType)) {
  7437. convOp = spv::Op::OpSConvert;
  7438. }
  7439. if (isTypeUnsignedInt(operandBasicType) && isTypeUnsignedInt(resultBasicType)) {
  7440. convOp = spv::Op::OpUConvert;
  7441. }
  7442. if (isTypeFloat(operandBasicType) && isTypeFloat(resultBasicType)) {
  7443. convOp = spv::Op::OpFConvert;
  7444. if (builder.isMatrixType(destType))
  7445. return createUnaryMatrixOperation(convOp, decorations, destType, operand, operandBasicType);
  7446. }
  7447. if (isTypeInt(operandBasicType) && isTypeInt(resultBasicType) &&
  7448. isTypeUnsignedInt(operandBasicType) != isTypeUnsignedInt(resultBasicType)) {
  7449. if (GetNumBits(operandBasicType) != GetNumBits(resultBasicType)) {
  7450. // OpSConvert/OpUConvert + OpBitCast
  7451. operand = createIntWidthConversion(operand, vectorSize, destType, resultBasicType, operandBasicType);
  7452. }
  7453. if (builder.isInSpecConstCodeGenMode()) {
  7454. uint32_t bits = GetNumBits(resultBasicType);
  7455. spv::Id zeroType = builder.makeUintType(bits);
  7456. if (bits == 64) {
  7457. zero = builder.makeInt64Constant(zeroType, 0, false);
  7458. } else {
  7459. zero = builder.makeIntConstant(zeroType, 0, false);
  7460. }
  7461. zero = makeSmearedConstant(zero, vectorSize);
  7462. // Use OpIAdd, instead of OpBitcast to do the conversion when
  7463. // generating for OpSpecConstantOp instruction.
  7464. return builder.createBinOp(spv::Op::OpIAdd, destType, operand, zero);
  7465. }
  7466. // For normal run-time conversion instruction, use OpBitcast.
  7467. convOp = spv::Op::OpBitcast;
  7468. }
  7469. if (resultBasicType == glslang::EbtBool) {
  7470. uint32_t bits = GetNumBits(operandBasicType);
  7471. if (isTypeInt(operandBasicType)) {
  7472. spv::Id zeroType = builder.makeUintType(bits);
  7473. if (bits == 64) {
  7474. zero = builder.makeInt64Constant(zeroType, 0, false);
  7475. } else {
  7476. zero = builder.makeIntConstant(zeroType, 0, false);
  7477. }
  7478. zero = makeSmearedConstant(zero, vectorSize);
  7479. return builder.createBinOp(spv::Op::OpINotEqual, destType, operand, zero);
  7480. } else {
  7481. assert(isTypeFloat(operandBasicType));
  7482. if (bits == 64) {
  7483. zero = builder.makeDoubleConstant(0.0);
  7484. } else if (bits == 32) {
  7485. zero = builder.makeFloatConstant(0.0);
  7486. } else {
  7487. assert(bits == 16);
  7488. zero = builder.makeFloat16Constant(0.0);
  7489. }
  7490. zero = makeSmearedConstant(zero, vectorSize);
  7491. return builder.createBinOp(spv::Op::OpFUnordNotEqual, destType, operand, zero);
  7492. }
  7493. }
  7494. if (operandBasicType == glslang::EbtBool) {
  7495. uint32_t bits = GetNumBits(resultBasicType);
  7496. convOp = spv::Op::OpSelect;
  7497. if (isTypeInt(resultBasicType)) {
  7498. spv::Id zeroType = isTypeSignedInt(resultBasicType) ? builder.makeIntType(bits) : builder.makeUintType(bits);
  7499. if (bits == 64) {
  7500. zero = builder.makeInt64Constant(zeroType, 0, false);
  7501. one = builder.makeInt64Constant(zeroType, 1, false);
  7502. } else {
  7503. zero = builder.makeIntConstant(zeroType, 0, false);
  7504. one = builder.makeIntConstant(zeroType, 1, false);
  7505. }
  7506. } else {
  7507. assert(isTypeFloat(resultBasicType));
  7508. if (bits == 64) {
  7509. zero = builder.makeDoubleConstant(0.0);
  7510. one = builder.makeDoubleConstant(1.0);
  7511. } else if (bits == 32) {
  7512. zero = builder.makeFloatConstant(0.0);
  7513. one = builder.makeFloatConstant(1.0);
  7514. } else {
  7515. assert(bits == 16);
  7516. zero = builder.makeFloat16Constant(0.0);
  7517. one = builder.makeFloat16Constant(1.0);
  7518. }
  7519. }
  7520. }
  7521. }
  7522. if (convOp == spv::Op::OpNop) {
  7523. switch (op) {
  7524. case glslang::EOpConvUint64ToPtr:
  7525. convOp = spv::Op::OpConvertUToPtr;
  7526. break;
  7527. case glslang::EOpConvPtrToUint64:
  7528. convOp = spv::Op::OpConvertPtrToU;
  7529. break;
  7530. case glslang::EOpConvPtrToUvec2:
  7531. case glslang::EOpConvUvec2ToPtr:
  7532. convOp = spv::Op::OpBitcast;
  7533. break;
  7534. default:
  7535. break;
  7536. }
  7537. }
  7538. spv::Id result = 0;
  7539. if (convOp == spv::Op::OpNop)
  7540. return result;
  7541. if (convOp == spv::Op::OpSelect) {
  7542. zero = makeSmearedConstant(zero, vectorSize);
  7543. one = makeSmearedConstant(one, vectorSize);
  7544. result = builder.createTriOp(convOp, destType, operand, one, zero);
  7545. } else
  7546. result = builder.createUnaryOp(convOp, destType, operand);
  7547. result = builder.setPrecision(result, decorations.precision);
  7548. decorations.addNonUniform(builder, result);
  7549. return result;
  7550. }
  7551. spv::Id TGlslangToSpvTraverser::makeSmearedConstant(spv::Id constant, int vectorSize)
  7552. {
  7553. if (vectorSize == 0)
  7554. return constant;
  7555. spv::Id vectorTypeId = builder.makeVectorType(builder.getTypeId(constant), vectorSize);
  7556. std::vector<spv::Id> components;
  7557. for (int c = 0; c < vectorSize; ++c)
  7558. components.push_back(constant);
  7559. return builder.makeCompositeConstant(vectorTypeId, components);
  7560. }
  7561. // For glslang ops that map to SPV atomic opCodes
  7562. spv::Id TGlslangToSpvTraverser::createAtomicOperation(glslang::TOperator op, spv::Decoration /*precision*/,
  7563. spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy,
  7564. const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags, const glslang::TType &opType)
  7565. {
  7566. spv::Op opCode = spv::Op::OpNop;
  7567. switch (op) {
  7568. case glslang::EOpAtomicAdd:
  7569. case glslang::EOpImageAtomicAdd:
  7570. case glslang::EOpAtomicCounterAdd:
  7571. opCode = spv::Op::OpAtomicIAdd;
  7572. if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
  7573. opCode = spv::Op::OpAtomicFAddEXT;
  7574. if (typeProxy == glslang::EbtFloat16 &&
  7575. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  7576. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  7577. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  7578. } else {
  7579. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_add);
  7580. if (typeProxy == glslang::EbtFloat16) {
  7581. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float16_add);
  7582. builder.addCapability(spv::Capability::AtomicFloat16AddEXT);
  7583. } else if (typeProxy == glslang::EbtFloat) {
  7584. builder.addCapability(spv::Capability::AtomicFloat32AddEXT);
  7585. } else {
  7586. builder.addCapability(spv::Capability::AtomicFloat64AddEXT);
  7587. }
  7588. }
  7589. }
  7590. break;
  7591. case glslang::EOpAtomicSubtract:
  7592. case glslang::EOpAtomicCounterSubtract:
  7593. opCode = spv::Op::OpAtomicISub;
  7594. break;
  7595. case glslang::EOpAtomicMin:
  7596. case glslang::EOpImageAtomicMin:
  7597. case glslang::EOpAtomicCounterMin:
  7598. if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
  7599. opCode = spv::Op::OpAtomicFMinEXT;
  7600. if (typeProxy == glslang::EbtFloat16 &&
  7601. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  7602. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  7603. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  7604. } else {
  7605. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_min_max);
  7606. if (typeProxy == glslang::EbtFloat16)
  7607. builder.addCapability(spv::Capability::AtomicFloat16MinMaxEXT);
  7608. else if (typeProxy == glslang::EbtFloat)
  7609. builder.addCapability(spv::Capability::AtomicFloat32MinMaxEXT);
  7610. else
  7611. builder.addCapability(spv::Capability::AtomicFloat64MinMaxEXT);
  7612. }
  7613. } else if (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) {
  7614. opCode = spv::Op::OpAtomicUMin;
  7615. } else {
  7616. opCode = spv::Op::OpAtomicSMin;
  7617. }
  7618. break;
  7619. case glslang::EOpAtomicMax:
  7620. case glslang::EOpImageAtomicMax:
  7621. case glslang::EOpAtomicCounterMax:
  7622. if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
  7623. opCode = spv::Op::OpAtomicFMaxEXT;
  7624. if (typeProxy == glslang::EbtFloat16 &&
  7625. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  7626. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  7627. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  7628. } else {
  7629. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_min_max);
  7630. if (typeProxy == glslang::EbtFloat16)
  7631. builder.addCapability(spv::Capability::AtomicFloat16MinMaxEXT);
  7632. else if (typeProxy == glslang::EbtFloat)
  7633. builder.addCapability(spv::Capability::AtomicFloat32MinMaxEXT);
  7634. else
  7635. builder.addCapability(spv::Capability::AtomicFloat64MinMaxEXT);
  7636. }
  7637. } else if (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) {
  7638. opCode = spv::Op::OpAtomicUMax;
  7639. } else {
  7640. opCode = spv::Op::OpAtomicSMax;
  7641. }
  7642. break;
  7643. case glslang::EOpAtomicAnd:
  7644. case glslang::EOpImageAtomicAnd:
  7645. case glslang::EOpAtomicCounterAnd:
  7646. opCode = spv::Op::OpAtomicAnd;
  7647. break;
  7648. case glslang::EOpAtomicOr:
  7649. case glslang::EOpImageAtomicOr:
  7650. case glslang::EOpAtomicCounterOr:
  7651. opCode = spv::Op::OpAtomicOr;
  7652. break;
  7653. case glslang::EOpAtomicXor:
  7654. case glslang::EOpImageAtomicXor:
  7655. case glslang::EOpAtomicCounterXor:
  7656. opCode = spv::Op::OpAtomicXor;
  7657. break;
  7658. case glslang::EOpAtomicExchange:
  7659. case glslang::EOpImageAtomicExchange:
  7660. case glslang::EOpAtomicCounterExchange:
  7661. if ((typeProxy == glslang::EbtFloat16) &&
  7662. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  7663. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  7664. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  7665. }
  7666. opCode = spv::Op::OpAtomicExchange;
  7667. break;
  7668. case glslang::EOpAtomicCompSwap:
  7669. case glslang::EOpImageAtomicCompSwap:
  7670. case glslang::EOpAtomicCounterCompSwap:
  7671. opCode = spv::Op::OpAtomicCompareExchange;
  7672. break;
  7673. case glslang::EOpAtomicCounterIncrement:
  7674. opCode = spv::Op::OpAtomicIIncrement;
  7675. break;
  7676. case glslang::EOpAtomicCounterDecrement:
  7677. opCode = spv::Op::OpAtomicIDecrement;
  7678. break;
  7679. case glslang::EOpAtomicCounter:
  7680. case glslang::EOpImageAtomicLoad:
  7681. case glslang::EOpAtomicLoad:
  7682. opCode = spv::Op::OpAtomicLoad;
  7683. break;
  7684. case glslang::EOpAtomicStore:
  7685. case glslang::EOpImageAtomicStore:
  7686. opCode = spv::Op::OpAtomicStore;
  7687. break;
  7688. default:
  7689. assert(0);
  7690. break;
  7691. }
  7692. if (typeProxy == glslang::EbtInt64 || typeProxy == glslang::EbtUint64)
  7693. builder.addCapability(spv::Capability::Int64Atomics);
  7694. // Sort out the operands
  7695. // - mapping from glslang -> SPV
  7696. // - there are extra SPV operands that are optional in glslang
  7697. // - compare-exchange swaps the value and comparator
  7698. // - compare-exchange has an extra memory semantics
  7699. // - EOpAtomicCounterDecrement needs a post decrement
  7700. spv::Id pointerId = 0, compareId = 0, valueId = 0;
  7701. // scope defaults to Device in the old model, QueueFamilyKHR in the new model
  7702. spv::Id scopeId;
  7703. if (glslangIntermediate->usingVulkanMemoryModel()) {
  7704. scopeId = builder.makeUintConstant(spv::Scope::QueueFamilyKHR);
  7705. } else {
  7706. scopeId = builder.makeUintConstant(spv::Scope::Device);
  7707. }
  7708. // semantics default to relaxed
  7709. spv::Id semanticsId = builder.makeUintConstant(lvalueCoherentFlags.isVolatile() &&
  7710. glslangIntermediate->usingVulkanMemoryModel() ?
  7711. spv::MemorySemanticsMask::Volatile :
  7712. spv::MemorySemanticsMask::MaskNone);
  7713. spv::Id semanticsId2 = semanticsId;
  7714. pointerId = operands[0];
  7715. if (opCode == spv::Op::OpAtomicIIncrement || opCode == spv::Op::OpAtomicIDecrement) {
  7716. // no additional operands
  7717. } else if (opCode == spv::Op::OpAtomicCompareExchange) {
  7718. compareId = operands[1];
  7719. valueId = operands[2];
  7720. if (operands.size() > 3) {
  7721. scopeId = operands[3];
  7722. semanticsId = builder.makeUintConstant(
  7723. builder.getConstantScalar(operands[4]) | builder.getConstantScalar(operands[5]));
  7724. semanticsId2 = builder.makeUintConstant(
  7725. builder.getConstantScalar(operands[6]) | builder.getConstantScalar(operands[7]));
  7726. }
  7727. } else if (opCode == spv::Op::OpAtomicLoad) {
  7728. if (operands.size() > 1) {
  7729. scopeId = operands[1];
  7730. semanticsId = builder.makeUintConstant(
  7731. builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));
  7732. }
  7733. } else {
  7734. // atomic store or RMW
  7735. valueId = operands[1];
  7736. if (operands.size() > 2) {
  7737. scopeId = operands[2];
  7738. semanticsId = builder.makeUintConstant
  7739. (builder.getConstantScalar(operands[3]) | builder.getConstantScalar(operands[4]));
  7740. }
  7741. }
  7742. // Check for capabilities
  7743. auto const semanticsImmediate = (spv::MemorySemanticsMask)(builder.getConstantScalar(semanticsId) | builder.getConstantScalar(semanticsId2));
  7744. if (anySet(semanticsImmediate, spv::MemorySemanticsMask::MakeAvailableKHR |
  7745. spv::MemorySemanticsMask::MakeVisibleKHR |
  7746. spv::MemorySemanticsMask::OutputMemoryKHR |
  7747. spv::MemorySemanticsMask::Volatile)) {
  7748. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  7749. }
  7750. auto const scope = (spv::Scope)builder.getConstantScalar(scopeId);
  7751. if (scope == spv::Scope::QueueFamily) {
  7752. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  7753. }
  7754. if (glslangIntermediate->usingVulkanMemoryModel() && scope == spv::Scope::Device) {
  7755. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  7756. }
  7757. std::vector<spv::Id> spvAtomicOperands; // hold the spv operands
  7758. spvAtomicOperands.reserve(6);
  7759. spvAtomicOperands.push_back(pointerId);
  7760. spvAtomicOperands.push_back(scopeId);
  7761. spvAtomicOperands.push_back(semanticsId);
  7762. if (opCode == spv::Op::OpAtomicCompareExchange) {
  7763. spvAtomicOperands.push_back(semanticsId2);
  7764. spvAtomicOperands.push_back(valueId);
  7765. spvAtomicOperands.push_back(compareId);
  7766. } else if (opCode != spv::Op::OpAtomicLoad && opCode != spv::Op::OpAtomicIIncrement && opCode != spv::Op::OpAtomicIDecrement) {
  7767. spvAtomicOperands.push_back(valueId);
  7768. }
  7769. if (opCode == spv::Op::OpAtomicStore) {
  7770. builder.createNoResultOp(opCode, spvAtomicOperands);
  7771. return 0;
  7772. } else {
  7773. spv::Id resultId = builder.createOp(opCode, typeId, spvAtomicOperands);
  7774. // GLSL and HLSL atomic-counter decrement return post-decrement value,
  7775. // while SPIR-V returns pre-decrement value. Translate between these semantics.
  7776. if (op == glslang::EOpAtomicCounterDecrement)
  7777. resultId = builder.createBinOp(spv::Op::OpISub, typeId, resultId, builder.makeIntConstant(1));
  7778. return resultId;
  7779. }
  7780. }
  7781. // Create group invocation operations.
  7782. spv::Id TGlslangToSpvTraverser::createInvocationsOperation(glslang::TOperator op, spv::Id typeId,
  7783. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  7784. {
  7785. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  7786. bool isFloat = isTypeFloat(typeProxy);
  7787. spv::Op opCode = spv::Op::OpNop;
  7788. std::vector<spv::IdImmediate> spvGroupOperands;
  7789. spv::GroupOperation groupOperation = spv::GroupOperation::Max;
  7790. if (op == glslang::EOpBallot || op == glslang::EOpReadFirstInvocation ||
  7791. op == glslang::EOpReadInvocation) {
  7792. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  7793. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  7794. } else if (op == glslang::EOpAnyInvocation ||
  7795. op == glslang::EOpAllInvocations ||
  7796. op == glslang::EOpAllInvocationsEqual) {
  7797. builder.addExtension(spv::E_SPV_KHR_subgroup_vote);
  7798. builder.addCapability(spv::Capability::SubgroupVoteKHR);
  7799. } else {
  7800. builder.addCapability(spv::Capability::Groups);
  7801. if (op == glslang::EOpMinInvocationsNonUniform ||
  7802. op == glslang::EOpMaxInvocationsNonUniform ||
  7803. op == glslang::EOpAddInvocationsNonUniform ||
  7804. op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||
  7805. op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||
  7806. op == glslang::EOpAddInvocationsInclusiveScanNonUniform ||
  7807. op == glslang::EOpMinInvocationsExclusiveScanNonUniform ||
  7808. op == glslang::EOpMaxInvocationsExclusiveScanNonUniform ||
  7809. op == glslang::EOpAddInvocationsExclusiveScanNonUniform)
  7810. builder.addExtension(spv::E_SPV_AMD_shader_ballot);
  7811. switch (op) {
  7812. case glslang::EOpMinInvocations:
  7813. case glslang::EOpMaxInvocations:
  7814. case glslang::EOpAddInvocations:
  7815. case glslang::EOpMinInvocationsNonUniform:
  7816. case glslang::EOpMaxInvocationsNonUniform:
  7817. case glslang::EOpAddInvocationsNonUniform:
  7818. groupOperation = spv::GroupOperation::Reduce;
  7819. break;
  7820. case glslang::EOpMinInvocationsInclusiveScan:
  7821. case glslang::EOpMaxInvocationsInclusiveScan:
  7822. case glslang::EOpAddInvocationsInclusiveScan:
  7823. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  7824. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  7825. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  7826. groupOperation = spv::GroupOperation::InclusiveScan;
  7827. break;
  7828. case glslang::EOpMinInvocationsExclusiveScan:
  7829. case glslang::EOpMaxInvocationsExclusiveScan:
  7830. case glslang::EOpAddInvocationsExclusiveScan:
  7831. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  7832. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  7833. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  7834. groupOperation = spv::GroupOperation::ExclusiveScan;
  7835. break;
  7836. default:
  7837. break;
  7838. }
  7839. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  7840. spvGroupOperands.push_back(scope);
  7841. if (groupOperation != spv::GroupOperation::Max) {
  7842. spv::IdImmediate groupOp = { false, (unsigned)groupOperation };
  7843. spvGroupOperands.push_back(groupOp);
  7844. }
  7845. }
  7846. for (auto opIt = operands.begin(); opIt != operands.end(); ++opIt) {
  7847. spv::IdImmediate op = { true, *opIt };
  7848. spvGroupOperands.push_back(op);
  7849. }
  7850. switch (op) {
  7851. case glslang::EOpAnyInvocation:
  7852. opCode = spv::Op::OpSubgroupAnyKHR;
  7853. break;
  7854. case glslang::EOpAllInvocations:
  7855. opCode = spv::Op::OpSubgroupAllKHR;
  7856. break;
  7857. case glslang::EOpAllInvocationsEqual:
  7858. opCode = spv::Op::OpSubgroupAllEqualKHR;
  7859. break;
  7860. case glslang::EOpReadInvocation:
  7861. opCode = spv::Op::OpSubgroupReadInvocationKHR;
  7862. if (builder.isVectorType(typeId))
  7863. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  7864. break;
  7865. case glslang::EOpReadFirstInvocation:
  7866. opCode = spv::Op::OpSubgroupFirstInvocationKHR;
  7867. if (builder.isVectorType(typeId))
  7868. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  7869. break;
  7870. case glslang::EOpBallot:
  7871. {
  7872. // NOTE: According to the spec, the result type of "OpSubgroupBallotKHR" must be a 4 component vector of 32
  7873. // bit integer types. The GLSL built-in function "ballotARB()" assumes the maximum number of invocations in
  7874. // a subgroup is 64. Thus, we have to convert uvec4.xy to uint64_t as follow:
  7875. //
  7876. // result = Bitcast(SubgroupBallotKHR(Predicate).xy)
  7877. //
  7878. spv::Id uintType = builder.makeUintType(32);
  7879. spv::Id uvec4Type = builder.makeVectorType(uintType, 4);
  7880. spv::Id result = builder.createOp(spv::Op::OpSubgroupBallotKHR, uvec4Type, spvGroupOperands);
  7881. std::vector<spv::Id> components;
  7882. components.push_back(builder.createCompositeExtract(result, uintType, 0));
  7883. components.push_back(builder.createCompositeExtract(result, uintType, 1));
  7884. spv::Id uvec2Type = builder.makeVectorType(uintType, 2);
  7885. return builder.createUnaryOp(spv::Op::OpBitcast, typeId,
  7886. builder.createCompositeConstruct(uvec2Type, components));
  7887. }
  7888. case glslang::EOpMinInvocations:
  7889. case glslang::EOpMaxInvocations:
  7890. case glslang::EOpAddInvocations:
  7891. case glslang::EOpMinInvocationsInclusiveScan:
  7892. case glslang::EOpMaxInvocationsInclusiveScan:
  7893. case glslang::EOpAddInvocationsInclusiveScan:
  7894. case glslang::EOpMinInvocationsExclusiveScan:
  7895. case glslang::EOpMaxInvocationsExclusiveScan:
  7896. case glslang::EOpAddInvocationsExclusiveScan:
  7897. if (op == glslang::EOpMinInvocations ||
  7898. op == glslang::EOpMinInvocationsInclusiveScan ||
  7899. op == glslang::EOpMinInvocationsExclusiveScan) {
  7900. if (isFloat)
  7901. opCode = spv::Op::OpGroupFMin;
  7902. else {
  7903. if (isUnsigned)
  7904. opCode = spv::Op::OpGroupUMin;
  7905. else
  7906. opCode = spv::Op::OpGroupSMin;
  7907. }
  7908. } else if (op == glslang::EOpMaxInvocations ||
  7909. op == glslang::EOpMaxInvocationsInclusiveScan ||
  7910. op == glslang::EOpMaxInvocationsExclusiveScan) {
  7911. if (isFloat)
  7912. opCode = spv::Op::OpGroupFMax;
  7913. else {
  7914. if (isUnsigned)
  7915. opCode = spv::Op::OpGroupUMax;
  7916. else
  7917. opCode = spv::Op::OpGroupSMax;
  7918. }
  7919. } else {
  7920. if (isFloat)
  7921. opCode = spv::Op::OpGroupFAdd;
  7922. else
  7923. opCode = spv::Op::OpGroupIAdd;
  7924. }
  7925. if (builder.isVectorType(typeId))
  7926. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  7927. break;
  7928. case glslang::EOpMinInvocationsNonUniform:
  7929. case glslang::EOpMaxInvocationsNonUniform:
  7930. case glslang::EOpAddInvocationsNonUniform:
  7931. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  7932. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  7933. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  7934. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  7935. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  7936. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  7937. if (op == glslang::EOpMinInvocationsNonUniform ||
  7938. op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||
  7939. op == glslang::EOpMinInvocationsExclusiveScanNonUniform) {
  7940. if (isFloat)
  7941. opCode = spv::Op::OpGroupFMinNonUniformAMD;
  7942. else {
  7943. if (isUnsigned)
  7944. opCode = spv::Op::OpGroupUMinNonUniformAMD;
  7945. else
  7946. opCode = spv::Op::OpGroupSMinNonUniformAMD;
  7947. }
  7948. }
  7949. else if (op == glslang::EOpMaxInvocationsNonUniform ||
  7950. op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||
  7951. op == glslang::EOpMaxInvocationsExclusiveScanNonUniform) {
  7952. if (isFloat)
  7953. opCode = spv::Op::OpGroupFMaxNonUniformAMD;
  7954. else {
  7955. if (isUnsigned)
  7956. opCode = spv::Op::OpGroupUMaxNonUniformAMD;
  7957. else
  7958. opCode = spv::Op::OpGroupSMaxNonUniformAMD;
  7959. }
  7960. }
  7961. else {
  7962. if (isFloat)
  7963. opCode = spv::Op::OpGroupFAddNonUniformAMD;
  7964. else
  7965. opCode = spv::Op::OpGroupIAddNonUniformAMD;
  7966. }
  7967. if (builder.isVectorType(typeId))
  7968. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  7969. break;
  7970. default:
  7971. logger->missingFunctionality("invocation operation");
  7972. return spv::NoResult;
  7973. }
  7974. assert(opCode != spv::Op::OpNop);
  7975. return builder.createOp(opCode, typeId, spvGroupOperands);
  7976. }
  7977. // Create group invocation operations on a vector
  7978. spv::Id TGlslangToSpvTraverser::CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,
  7979. spv::Id typeId, std::vector<spv::Id>& operands)
  7980. {
  7981. assert(op == spv::Op::OpGroupFMin || op == spv::Op::OpGroupUMin || op == spv::Op::OpGroupSMin ||
  7982. op == spv::Op::OpGroupFMax || op == spv::Op::OpGroupUMax || op == spv::Op::OpGroupSMax ||
  7983. op == spv::Op::OpGroupFAdd || op == spv::Op::OpGroupIAdd || op == spv::Op::OpGroupBroadcast ||
  7984. op == spv::Op::OpSubgroupReadInvocationKHR || op == spv::Op::OpSubgroupFirstInvocationKHR ||
  7985. op == spv::Op::OpGroupFMinNonUniformAMD || op == spv::Op::OpGroupUMinNonUniformAMD ||
  7986. op == spv::Op::OpGroupSMinNonUniformAMD ||
  7987. op == spv::Op::OpGroupFMaxNonUniformAMD || op == spv::Op::OpGroupUMaxNonUniformAMD ||
  7988. op == spv::Op::OpGroupSMaxNonUniformAMD ||
  7989. op == spv::Op::OpGroupFAddNonUniformAMD || op == spv::Op::OpGroupIAddNonUniformAMD);
  7990. // Handle group invocation operations scalar by scalar.
  7991. // The result type is the same type as the original type.
  7992. // The algorithm is to:
  7993. // - break the vector into scalars
  7994. // - apply the operation to each scalar
  7995. // - make a vector out the scalar results
  7996. // get the types sorted out
  7997. int numComponents = builder.getNumComponents(operands[0]);
  7998. spv::Id scalarType = builder.getScalarTypeId(builder.getTypeId(operands[0]));
  7999. std::vector<spv::Id> results;
  8000. // do each scalar op
  8001. for (int comp = 0; comp < numComponents; ++comp) {
  8002. std::vector<unsigned int> indexes;
  8003. indexes.push_back(comp);
  8004. spv::IdImmediate scalar = { true, builder.createCompositeExtract(operands[0], scalarType, indexes) };
  8005. std::vector<spv::IdImmediate> spvGroupOperands;
  8006. if (op == spv::Op::OpSubgroupReadInvocationKHR) {
  8007. spvGroupOperands.push_back(scalar);
  8008. spv::IdImmediate operand = { true, operands[1] };
  8009. spvGroupOperands.push_back(operand);
  8010. } else if (op == spv::Op::OpSubgroupFirstInvocationKHR) {
  8011. spvGroupOperands.push_back(scalar);
  8012. } else if (op == spv::Op::OpGroupBroadcast) {
  8013. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8014. spvGroupOperands.push_back(scope);
  8015. spvGroupOperands.push_back(scalar);
  8016. spv::IdImmediate operand = { true, operands[1] };
  8017. spvGroupOperands.push_back(operand);
  8018. } else {
  8019. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8020. spvGroupOperands.push_back(scope);
  8021. spv::IdImmediate groupOp = { false, (unsigned)groupOperation };
  8022. spvGroupOperands.push_back(groupOp);
  8023. spvGroupOperands.push_back(scalar);
  8024. }
  8025. results.push_back(builder.createOp(op, scalarType, spvGroupOperands));
  8026. }
  8027. // put the pieces together
  8028. return builder.createCompositeConstruct(typeId, results);
  8029. }
  8030. // Create subgroup invocation operations.
  8031. spv::Id TGlslangToSpvTraverser::createSubgroupOperation(glslang::TOperator op, spv::Id typeId,
  8032. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  8033. {
  8034. // Add the required capabilities.
  8035. switch (op) {
  8036. case glslang::EOpSubgroupElect:
  8037. builder.addCapability(spv::Capability::GroupNonUniform);
  8038. break;
  8039. case glslang::EOpSubgroupQuadAll:
  8040. case glslang::EOpSubgroupQuadAny:
  8041. builder.addExtension(spv::E_SPV_KHR_quad_control);
  8042. builder.addCapability(spv::Capability::QuadControlKHR);
  8043. [[fallthrough]];
  8044. case glslang::EOpSubgroupAll:
  8045. case glslang::EOpSubgroupAny:
  8046. case glslang::EOpSubgroupAllEqual:
  8047. builder.addCapability(spv::Capability::GroupNonUniform);
  8048. builder.addCapability(spv::Capability::GroupNonUniformVote);
  8049. break;
  8050. case glslang::EOpSubgroupBroadcast:
  8051. case glslang::EOpSubgroupBroadcastFirst:
  8052. case glslang::EOpSubgroupBallot:
  8053. case glslang::EOpSubgroupInverseBallot:
  8054. case glslang::EOpSubgroupBallotBitExtract:
  8055. case glslang::EOpSubgroupBallotBitCount:
  8056. case glslang::EOpSubgroupBallotInclusiveBitCount:
  8057. case glslang::EOpSubgroupBallotExclusiveBitCount:
  8058. case glslang::EOpSubgroupBallotFindLSB:
  8059. case glslang::EOpSubgroupBallotFindMSB:
  8060. builder.addCapability(spv::Capability::GroupNonUniform);
  8061. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  8062. break;
  8063. case glslang::EOpSubgroupRotate:
  8064. case glslang::EOpSubgroupClusteredRotate:
  8065. builder.addExtension(spv::E_SPV_KHR_subgroup_rotate);
  8066. builder.addCapability(spv::Capability::GroupNonUniformRotateKHR);
  8067. break;
  8068. case glslang::EOpSubgroupShuffle:
  8069. case glslang::EOpSubgroupShuffleXor:
  8070. builder.addCapability(spv::Capability::GroupNonUniform);
  8071. builder.addCapability(spv::Capability::GroupNonUniformShuffle);
  8072. break;
  8073. case glslang::EOpSubgroupShuffleUp:
  8074. case glslang::EOpSubgroupShuffleDown:
  8075. builder.addCapability(spv::Capability::GroupNonUniform);
  8076. builder.addCapability(spv::Capability::GroupNonUniformShuffleRelative);
  8077. break;
  8078. case glslang::EOpSubgroupAdd:
  8079. case glslang::EOpSubgroupMul:
  8080. case glslang::EOpSubgroupMin:
  8081. case glslang::EOpSubgroupMax:
  8082. case glslang::EOpSubgroupAnd:
  8083. case glslang::EOpSubgroupOr:
  8084. case glslang::EOpSubgroupXor:
  8085. case glslang::EOpSubgroupInclusiveAdd:
  8086. case glslang::EOpSubgroupInclusiveMul:
  8087. case glslang::EOpSubgroupInclusiveMin:
  8088. case glslang::EOpSubgroupInclusiveMax:
  8089. case glslang::EOpSubgroupInclusiveAnd:
  8090. case glslang::EOpSubgroupInclusiveOr:
  8091. case glslang::EOpSubgroupInclusiveXor:
  8092. case glslang::EOpSubgroupExclusiveAdd:
  8093. case glslang::EOpSubgroupExclusiveMul:
  8094. case glslang::EOpSubgroupExclusiveMin:
  8095. case glslang::EOpSubgroupExclusiveMax:
  8096. case glslang::EOpSubgroupExclusiveAnd:
  8097. case glslang::EOpSubgroupExclusiveOr:
  8098. case glslang::EOpSubgroupExclusiveXor:
  8099. builder.addCapability(spv::Capability::GroupNonUniform);
  8100. builder.addCapability(spv::Capability::GroupNonUniformArithmetic);
  8101. break;
  8102. case glslang::EOpSubgroupClusteredAdd:
  8103. case glslang::EOpSubgroupClusteredMul:
  8104. case glslang::EOpSubgroupClusteredMin:
  8105. case glslang::EOpSubgroupClusteredMax:
  8106. case glslang::EOpSubgroupClusteredAnd:
  8107. case glslang::EOpSubgroupClusteredOr:
  8108. case glslang::EOpSubgroupClusteredXor:
  8109. builder.addCapability(spv::Capability::GroupNonUniform);
  8110. builder.addCapability(spv::Capability::GroupNonUniformClustered);
  8111. break;
  8112. case glslang::EOpSubgroupQuadBroadcast:
  8113. case glslang::EOpSubgroupQuadSwapHorizontal:
  8114. case glslang::EOpSubgroupQuadSwapVertical:
  8115. case glslang::EOpSubgroupQuadSwapDiagonal:
  8116. builder.addCapability(spv::Capability::GroupNonUniform);
  8117. builder.addCapability(spv::Capability::GroupNonUniformQuad);
  8118. break;
  8119. case glslang::EOpSubgroupPartitionedAdd:
  8120. case glslang::EOpSubgroupPartitionedMul:
  8121. case glslang::EOpSubgroupPartitionedMin:
  8122. case glslang::EOpSubgroupPartitionedMax:
  8123. case glslang::EOpSubgroupPartitionedAnd:
  8124. case glslang::EOpSubgroupPartitionedOr:
  8125. case glslang::EOpSubgroupPartitionedXor:
  8126. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8127. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8128. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8129. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8130. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8131. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8132. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8133. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8134. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8135. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8136. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8137. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8138. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8139. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8140. builder.addExtension(spv::E_SPV_NV_shader_subgroup_partitioned);
  8141. builder.addCapability(spv::Capability::GroupNonUniformPartitionedNV);
  8142. break;
  8143. default: assert(0 && "Unhandled subgroup operation!");
  8144. }
  8145. const bool isUnsigned = isTypeUnsignedInt(typeProxy);
  8146. const bool isFloat = isTypeFloat(typeProxy);
  8147. const bool isBool = typeProxy == glslang::EbtBool;
  8148. spv::Op opCode = spv::Op::OpNop;
  8149. // Figure out which opcode to use.
  8150. switch (op) {
  8151. case glslang::EOpSubgroupElect: opCode = spv::Op::OpGroupNonUniformElect; break;
  8152. case glslang::EOpSubgroupQuadAll: opCode = spv::Op::OpGroupNonUniformQuadAllKHR; break;
  8153. case glslang::EOpSubgroupAll: opCode = spv::Op::OpGroupNonUniformAll; break;
  8154. case glslang::EOpSubgroupQuadAny: opCode = spv::Op::OpGroupNonUniformQuadAnyKHR; break;
  8155. case glslang::EOpSubgroupAny: opCode = spv::Op::OpGroupNonUniformAny; break;
  8156. case glslang::EOpSubgroupAllEqual: opCode = spv::Op::OpGroupNonUniformAllEqual; break;
  8157. case glslang::EOpSubgroupBroadcast: opCode = spv::Op::OpGroupNonUniformBroadcast; break;
  8158. case glslang::EOpSubgroupBroadcastFirst: opCode = spv::Op::OpGroupNonUniformBroadcastFirst; break;
  8159. case glslang::EOpSubgroupBallot: opCode = spv::Op::OpGroupNonUniformBallot; break;
  8160. case glslang::EOpSubgroupInverseBallot: opCode = spv::Op::OpGroupNonUniformInverseBallot; break;
  8161. case glslang::EOpSubgroupBallotBitExtract: opCode = spv::Op::OpGroupNonUniformBallotBitExtract; break;
  8162. case glslang::EOpSubgroupBallotBitCount:
  8163. case glslang::EOpSubgroupBallotInclusiveBitCount:
  8164. case glslang::EOpSubgroupBallotExclusiveBitCount: opCode = spv::Op::OpGroupNonUniformBallotBitCount; break;
  8165. case glslang::EOpSubgroupBallotFindLSB: opCode = spv::Op::OpGroupNonUniformBallotFindLSB; break;
  8166. case glslang::EOpSubgroupBallotFindMSB: opCode = spv::Op::OpGroupNonUniformBallotFindMSB; break;
  8167. case glslang::EOpSubgroupShuffle: opCode = spv::Op::OpGroupNonUniformShuffle; break;
  8168. case glslang::EOpSubgroupShuffleXor: opCode = spv::Op::OpGroupNonUniformShuffleXor; break;
  8169. case glslang::EOpSubgroupShuffleUp: opCode = spv::Op::OpGroupNonUniformShuffleUp; break;
  8170. case glslang::EOpSubgroupShuffleDown: opCode = spv::Op::OpGroupNonUniformShuffleDown; break;
  8171. case glslang::EOpSubgroupRotate:
  8172. case glslang::EOpSubgroupClusteredRotate: opCode = spv::Op::OpGroupNonUniformRotateKHR; break;
  8173. case glslang::EOpSubgroupAdd:
  8174. case glslang::EOpSubgroupInclusiveAdd:
  8175. case glslang::EOpSubgroupExclusiveAdd:
  8176. case glslang::EOpSubgroupClusteredAdd:
  8177. case glslang::EOpSubgroupPartitionedAdd:
  8178. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8179. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8180. if (isFloat) {
  8181. opCode = spv::Op::OpGroupNonUniformFAdd;
  8182. } else {
  8183. opCode = spv::Op::OpGroupNonUniformIAdd;
  8184. }
  8185. break;
  8186. case glslang::EOpSubgroupMul:
  8187. case glslang::EOpSubgroupInclusiveMul:
  8188. case glslang::EOpSubgroupExclusiveMul:
  8189. case glslang::EOpSubgroupClusteredMul:
  8190. case glslang::EOpSubgroupPartitionedMul:
  8191. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8192. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8193. if (isFloat) {
  8194. opCode = spv::Op::OpGroupNonUniformFMul;
  8195. } else {
  8196. opCode = spv::Op::OpGroupNonUniformIMul;
  8197. }
  8198. break;
  8199. case glslang::EOpSubgroupMin:
  8200. case glslang::EOpSubgroupInclusiveMin:
  8201. case glslang::EOpSubgroupExclusiveMin:
  8202. case glslang::EOpSubgroupClusteredMin:
  8203. case glslang::EOpSubgroupPartitionedMin:
  8204. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8205. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8206. if (isFloat) {
  8207. opCode = spv::Op::OpGroupNonUniformFMin;
  8208. } else if (isUnsigned) {
  8209. opCode = spv::Op::OpGroupNonUniformUMin;
  8210. } else {
  8211. opCode = spv::Op::OpGroupNonUniformSMin;
  8212. }
  8213. break;
  8214. case glslang::EOpSubgroupMax:
  8215. case glslang::EOpSubgroupInclusiveMax:
  8216. case glslang::EOpSubgroupExclusiveMax:
  8217. case glslang::EOpSubgroupClusteredMax:
  8218. case glslang::EOpSubgroupPartitionedMax:
  8219. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8220. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8221. if (isFloat) {
  8222. opCode = spv::Op::OpGroupNonUniformFMax;
  8223. } else if (isUnsigned) {
  8224. opCode = spv::Op::OpGroupNonUniformUMax;
  8225. } else {
  8226. opCode = spv::Op::OpGroupNonUniformSMax;
  8227. }
  8228. break;
  8229. case glslang::EOpSubgroupAnd:
  8230. case glslang::EOpSubgroupInclusiveAnd:
  8231. case glslang::EOpSubgroupExclusiveAnd:
  8232. case glslang::EOpSubgroupClusteredAnd:
  8233. case glslang::EOpSubgroupPartitionedAnd:
  8234. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8235. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8236. if (isBool) {
  8237. opCode = spv::Op::OpGroupNonUniformLogicalAnd;
  8238. } else {
  8239. opCode = spv::Op::OpGroupNonUniformBitwiseAnd;
  8240. }
  8241. break;
  8242. case glslang::EOpSubgroupOr:
  8243. case glslang::EOpSubgroupInclusiveOr:
  8244. case glslang::EOpSubgroupExclusiveOr:
  8245. case glslang::EOpSubgroupClusteredOr:
  8246. case glslang::EOpSubgroupPartitionedOr:
  8247. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8248. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8249. if (isBool) {
  8250. opCode = spv::Op::OpGroupNonUniformLogicalOr;
  8251. } else {
  8252. opCode = spv::Op::OpGroupNonUniformBitwiseOr;
  8253. }
  8254. break;
  8255. case glslang::EOpSubgroupXor:
  8256. case glslang::EOpSubgroupInclusiveXor:
  8257. case glslang::EOpSubgroupExclusiveXor:
  8258. case glslang::EOpSubgroupClusteredXor:
  8259. case glslang::EOpSubgroupPartitionedXor:
  8260. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8261. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8262. if (isBool) {
  8263. opCode = spv::Op::OpGroupNonUniformLogicalXor;
  8264. } else {
  8265. opCode = spv::Op::OpGroupNonUniformBitwiseXor;
  8266. }
  8267. break;
  8268. case glslang::EOpSubgroupQuadBroadcast: opCode = spv::Op::OpGroupNonUniformQuadBroadcast; break;
  8269. case glslang::EOpSubgroupQuadSwapHorizontal:
  8270. case glslang::EOpSubgroupQuadSwapVertical:
  8271. case glslang::EOpSubgroupQuadSwapDiagonal: opCode = spv::Op::OpGroupNonUniformQuadSwap; break;
  8272. default: assert(0 && "Unhandled subgroup operation!");
  8273. }
  8274. // get the right Group Operation
  8275. spv::GroupOperation groupOperation = spv::GroupOperation::Max;
  8276. switch (op) {
  8277. default:
  8278. break;
  8279. case glslang::EOpSubgroupBallotBitCount:
  8280. case glslang::EOpSubgroupAdd:
  8281. case glslang::EOpSubgroupMul:
  8282. case glslang::EOpSubgroupMin:
  8283. case glslang::EOpSubgroupMax:
  8284. case glslang::EOpSubgroupAnd:
  8285. case glslang::EOpSubgroupOr:
  8286. case glslang::EOpSubgroupXor:
  8287. groupOperation = spv::GroupOperation::Reduce;
  8288. break;
  8289. case glslang::EOpSubgroupBallotInclusiveBitCount:
  8290. case glslang::EOpSubgroupInclusiveAdd:
  8291. case glslang::EOpSubgroupInclusiveMul:
  8292. case glslang::EOpSubgroupInclusiveMin:
  8293. case glslang::EOpSubgroupInclusiveMax:
  8294. case glslang::EOpSubgroupInclusiveAnd:
  8295. case glslang::EOpSubgroupInclusiveOr:
  8296. case glslang::EOpSubgroupInclusiveXor:
  8297. groupOperation = spv::GroupOperation::InclusiveScan;
  8298. break;
  8299. case glslang::EOpSubgroupBallotExclusiveBitCount:
  8300. case glslang::EOpSubgroupExclusiveAdd:
  8301. case glslang::EOpSubgroupExclusiveMul:
  8302. case glslang::EOpSubgroupExclusiveMin:
  8303. case glslang::EOpSubgroupExclusiveMax:
  8304. case glslang::EOpSubgroupExclusiveAnd:
  8305. case glslang::EOpSubgroupExclusiveOr:
  8306. case glslang::EOpSubgroupExclusiveXor:
  8307. groupOperation = spv::GroupOperation::ExclusiveScan;
  8308. break;
  8309. case glslang::EOpSubgroupClusteredAdd:
  8310. case glslang::EOpSubgroupClusteredMul:
  8311. case glslang::EOpSubgroupClusteredMin:
  8312. case glslang::EOpSubgroupClusteredMax:
  8313. case glslang::EOpSubgroupClusteredAnd:
  8314. case glslang::EOpSubgroupClusteredOr:
  8315. case glslang::EOpSubgroupClusteredXor:
  8316. groupOperation = spv::GroupOperation::ClusteredReduce;
  8317. break;
  8318. case glslang::EOpSubgroupPartitionedAdd:
  8319. case glslang::EOpSubgroupPartitionedMul:
  8320. case glslang::EOpSubgroupPartitionedMin:
  8321. case glslang::EOpSubgroupPartitionedMax:
  8322. case glslang::EOpSubgroupPartitionedAnd:
  8323. case glslang::EOpSubgroupPartitionedOr:
  8324. case glslang::EOpSubgroupPartitionedXor:
  8325. groupOperation = spv::GroupOperation::PartitionedReduceNV;
  8326. break;
  8327. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8328. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8329. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8330. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8331. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8332. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8333. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8334. groupOperation = spv::GroupOperation::PartitionedInclusiveScanNV;
  8335. break;
  8336. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8337. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8338. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8339. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8340. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8341. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8342. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8343. groupOperation = spv::GroupOperation::PartitionedExclusiveScanNV;
  8344. break;
  8345. }
  8346. // build the instruction
  8347. std::vector<spv::IdImmediate> spvGroupOperands;
  8348. // The Execution Scope operand (Subgroup) comes first for every operation that takes one.
  8349. spv::IdImmediate executionScope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8350. // All other ops need the execution scope. Quad Control Ops don't need scope, it's always Quad.
  8351. if (opCode != spv::Op::OpGroupNonUniformQuadAllKHR && opCode != spv::Op::OpGroupNonUniformQuadAnyKHR) {
  8352. spvGroupOperands.push_back(executionScope);
  8353. }
  8354. // Next, for all operations that use a Group Operation, push that as an operand.
  8355. if (groupOperation != spv::GroupOperation::Max) {
  8356. spv::IdImmediate groupOperand = { false, (unsigned)groupOperation };
  8357. spvGroupOperands.push_back(groupOperand);
  8358. }
  8359. // Push back the operands next.
  8360. for (auto opIt = operands.cbegin(); opIt != operands.cend(); ++opIt) {
  8361. spv::IdImmediate operand = { true, *opIt };
  8362. spvGroupOperands.push_back(operand);
  8363. }
  8364. // Some opcodes have additional operands.
  8365. spv::Id directionId = spv::NoResult;
  8366. switch (op) {
  8367. default: break;
  8368. case glslang::EOpSubgroupQuadSwapHorizontal: directionId = builder.makeUintConstant(0); break;
  8369. case glslang::EOpSubgroupQuadSwapVertical: directionId = builder.makeUintConstant(1); break;
  8370. case glslang::EOpSubgroupQuadSwapDiagonal: directionId = builder.makeUintConstant(2); break;
  8371. }
  8372. if (directionId != spv::NoResult) {
  8373. spv::IdImmediate direction = { true, directionId };
  8374. spvGroupOperands.push_back(direction);
  8375. }
  8376. return builder.createOp(opCode, typeId, spvGroupOperands);
  8377. }
  8378. spv::Id TGlslangToSpvTraverser::createMiscOperation(glslang::TOperator op, spv::Decoration precision,
  8379. spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  8380. {
  8381. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  8382. bool isFloat = isTypeFloat(typeProxy);
  8383. spv::Op opCode = spv::Op::OpNop;
  8384. int extBuiltins = -1;
  8385. int libCall = -1;
  8386. size_t consumedOperands = operands.size();
  8387. spv::Id typeId0 = 0;
  8388. if (consumedOperands > 0)
  8389. typeId0 = builder.getTypeId(operands[0]);
  8390. spv::Id typeId1 = 0;
  8391. if (consumedOperands > 1)
  8392. typeId1 = builder.getTypeId(operands[1]);
  8393. spv::Id frexpIntType = 0;
  8394. switch (op) {
  8395. case glslang::EOpMin:
  8396. if (isFloat)
  8397. libCall = nanMinMaxClamp ? spv::GLSLstd450NMin : spv::GLSLstd450FMin;
  8398. else if (isUnsigned)
  8399. libCall = spv::GLSLstd450UMin;
  8400. else
  8401. libCall = spv::GLSLstd450SMin;
  8402. builder.promoteScalar(precision, operands.front(), operands.back());
  8403. break;
  8404. case glslang::EOpModf:
  8405. {
  8406. libCall = spv::GLSLstd450ModfStruct;
  8407. assert(builder.isFloatType(builder.getScalarTypeId(typeId0)));
  8408. // The returned struct has two members of the same type as the first argument
  8409. typeId = builder.makeStructResultType(typeId0, typeId0);
  8410. consumedOperands = 1;
  8411. }
  8412. break;
  8413. case glslang::EOpMax:
  8414. if (isFloat)
  8415. libCall = nanMinMaxClamp ? spv::GLSLstd450NMax : spv::GLSLstd450FMax;
  8416. else if (isUnsigned)
  8417. libCall = spv::GLSLstd450UMax;
  8418. else
  8419. libCall = spv::GLSLstd450SMax;
  8420. builder.promoteScalar(precision, operands.front(), operands.back());
  8421. break;
  8422. case glslang::EOpPow:
  8423. libCall = spv::GLSLstd450Pow;
  8424. break;
  8425. case glslang::EOpDot:
  8426. case glslang::EOpDotPackedEXT:
  8427. case glslang::EOpDotAccSatEXT:
  8428. case glslang::EOpDotPackedAccSatEXT:
  8429. {
  8430. if (builder.isFloatType(builder.getScalarTypeId(typeId0)) ||
  8431. // HLSL supports dot(int,int) which is just a multiply
  8432. glslangIntermediate->getSource() == glslang::EShSourceHlsl) {
  8433. if (typeProxy == glslang::EbtBFloat16) {
  8434. builder.addExtension(spv::E_SPV_KHR_bfloat16);
  8435. builder.addCapability(spv::Capability::BFloat16DotProductKHR);
  8436. }
  8437. opCode = spv::Op::OpDot;
  8438. } else {
  8439. builder.addExtension(spv::E_SPV_KHR_integer_dot_product);
  8440. builder.addCapability(spv::Capability::DotProductKHR);
  8441. const unsigned int vectorSize = builder.getNumComponents(operands[0]);
  8442. if (op == glslang::EOpDotPackedEXT || op == glslang::EOpDotPackedAccSatEXT) {
  8443. builder.addCapability(spv::Capability::DotProductInput4x8BitPackedKHR);
  8444. } else if (vectorSize == 4 && builder.getScalarTypeWidth(typeId0) == 8) {
  8445. builder.addCapability(spv::Capability::DotProductInput4x8BitKHR);
  8446. } else {
  8447. builder.addCapability(spv::Capability::DotProductInputAllKHR);
  8448. }
  8449. const bool type0isSigned = builder.isIntType(builder.getScalarTypeId(typeId0));
  8450. const bool type1isSigned = builder.isIntType(builder.getScalarTypeId(typeId1));
  8451. const bool accSat = (op == glslang::EOpDotAccSatEXT || op == glslang::EOpDotPackedAccSatEXT);
  8452. if (!type0isSigned && !type1isSigned) {
  8453. opCode = accSat ? spv::Op::OpUDotAccSatKHR : spv::Op::OpUDotKHR;
  8454. } else if (type0isSigned && type1isSigned) {
  8455. opCode = accSat ? spv::Op::OpSDotAccSatKHR : spv::Op::OpSDotKHR;
  8456. } else {
  8457. opCode = accSat ? spv::Op::OpSUDotAccSatKHR : spv::Op::OpSUDotKHR;
  8458. // the spir-v opcode assumes the operands to be "signed, unsigned" in that order, so swap if needed
  8459. if (type1isSigned) {
  8460. std::swap(operands[0], operands[1]);
  8461. }
  8462. }
  8463. std::vector<spv::IdImmediate> operands2;
  8464. for (auto &o : operands) {
  8465. operands2.push_back({true, o});
  8466. }
  8467. if (op == glslang::EOpDotPackedEXT || op == glslang::EOpDotPackedAccSatEXT) {
  8468. operands2.push_back({false, 0});
  8469. }
  8470. return builder.createOp(opCode, typeId, operands2);
  8471. }
  8472. }
  8473. break;
  8474. case glslang::EOpAtan:
  8475. libCall = spv::GLSLstd450Atan2;
  8476. break;
  8477. case glslang::EOpClamp:
  8478. if (isFloat)
  8479. libCall = nanMinMaxClamp ? spv::GLSLstd450NClamp : spv::GLSLstd450FClamp;
  8480. else if (isUnsigned)
  8481. libCall = spv::GLSLstd450UClamp;
  8482. else
  8483. libCall = spv::GLSLstd450SClamp;
  8484. builder.promoteScalar(precision, operands.front(), operands[1]);
  8485. builder.promoteScalar(precision, operands.front(), operands[2]);
  8486. break;
  8487. case glslang::EOpMix:
  8488. if (! builder.isBoolType(builder.getScalarTypeId(builder.getTypeId(operands.back())))) {
  8489. assert(isFloat);
  8490. libCall = spv::GLSLstd450FMix;
  8491. } else {
  8492. opCode = spv::Op::OpSelect;
  8493. std::swap(operands.front(), operands.back());
  8494. }
  8495. builder.promoteScalar(precision, operands.front(), operands.back());
  8496. break;
  8497. case glslang::EOpStep:
  8498. libCall = spv::GLSLstd450Step;
  8499. builder.promoteScalar(precision, operands.front(), operands.back());
  8500. break;
  8501. case glslang::EOpSmoothStep:
  8502. libCall = spv::GLSLstd450SmoothStep;
  8503. builder.promoteScalar(precision, operands[0], operands[2]);
  8504. builder.promoteScalar(precision, operands[1], operands[2]);
  8505. break;
  8506. case glslang::EOpDistance:
  8507. libCall = spv::GLSLstd450Distance;
  8508. break;
  8509. case glslang::EOpCross:
  8510. libCall = spv::GLSLstd450Cross;
  8511. break;
  8512. case glslang::EOpFaceForward:
  8513. libCall = spv::GLSLstd450FaceForward;
  8514. break;
  8515. case glslang::EOpReflect:
  8516. libCall = spv::GLSLstd450Reflect;
  8517. break;
  8518. case glslang::EOpRefract:
  8519. libCall = spv::GLSLstd450Refract;
  8520. break;
  8521. case glslang::EOpBarrier:
  8522. {
  8523. // This is for the extended controlBarrier function, with four operands.
  8524. // The unextended barrier() goes through createNoArgOperation.
  8525. assert(operands.size() == 4);
  8526. auto const executionScope = (spv::Scope)builder.getConstantScalar(operands[0]);
  8527. auto const memoryScope = (spv::Scope)builder.getConstantScalar(operands[1]);
  8528. auto const semantics = (spv::MemorySemanticsMask)(builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));
  8529. builder.createControlBarrier(executionScope, memoryScope,
  8530. semantics);
  8531. if (anySet(semantics, spv::MemorySemanticsMask::MakeAvailableKHR |
  8532. spv::MemorySemanticsMask::MakeVisibleKHR |
  8533. spv::MemorySemanticsMask::OutputMemoryKHR |
  8534. spv::MemorySemanticsMask::Volatile)) {
  8535. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  8536. }
  8537. if (glslangIntermediate->usingVulkanMemoryModel() && (executionScope == spv::Scope::Device ||
  8538. memoryScope == spv::Scope::Device)) {
  8539. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  8540. }
  8541. return 0;
  8542. }
  8543. break;
  8544. case glslang::EOpMemoryBarrier:
  8545. {
  8546. // This is for the extended memoryBarrier function, with three operands.
  8547. // The unextended memoryBarrier() goes through createNoArgOperation.
  8548. assert(operands.size() == 3);
  8549. auto const memoryScope = (spv::Scope)builder.getConstantScalar(operands[0]);
  8550. auto const semantics = (spv::MemorySemanticsMask)(builder.getConstantScalar(operands[1]) | builder.getConstantScalar(operands[2]));
  8551. builder.createMemoryBarrier(memoryScope, semantics);
  8552. if (anySet(semantics, spv::MemorySemanticsMask::MakeAvailableKHR |
  8553. spv::MemorySemanticsMask::MakeVisibleKHR |
  8554. spv::MemorySemanticsMask::OutputMemoryKHR |
  8555. spv::MemorySemanticsMask::Volatile)) {
  8556. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  8557. }
  8558. if (glslangIntermediate->usingVulkanMemoryModel() && memoryScope == spv::Scope::Device) {
  8559. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  8560. }
  8561. return 0;
  8562. }
  8563. break;
  8564. case glslang::EOpInterpolateAtSample:
  8565. if (typeProxy == glslang::EbtFloat16)
  8566. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  8567. libCall = spv::GLSLstd450InterpolateAtSample;
  8568. break;
  8569. case glslang::EOpInterpolateAtOffset:
  8570. if (typeProxy == glslang::EbtFloat16)
  8571. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  8572. libCall = spv::GLSLstd450InterpolateAtOffset;
  8573. break;
  8574. case glslang::EOpAddCarry:
  8575. opCode = spv::Op::OpIAddCarry;
  8576. typeId = builder.makeStructResultType(typeId0, typeId0);
  8577. consumedOperands = 2;
  8578. break;
  8579. case glslang::EOpSubBorrow:
  8580. opCode = spv::Op::OpISubBorrow;
  8581. typeId = builder.makeStructResultType(typeId0, typeId0);
  8582. consumedOperands = 2;
  8583. break;
  8584. case glslang::EOpUMulExtended:
  8585. opCode = spv::Op::OpUMulExtended;
  8586. typeId = builder.makeStructResultType(typeId0, typeId0);
  8587. consumedOperands = 2;
  8588. break;
  8589. case glslang::EOpIMulExtended:
  8590. opCode = spv::Op::OpSMulExtended;
  8591. typeId = builder.makeStructResultType(typeId0, typeId0);
  8592. consumedOperands = 2;
  8593. break;
  8594. case glslang::EOpBitfieldExtract:
  8595. if (isUnsigned)
  8596. opCode = spv::Op::OpBitFieldUExtract;
  8597. else
  8598. opCode = spv::Op::OpBitFieldSExtract;
  8599. break;
  8600. case glslang::EOpBitfieldInsert:
  8601. opCode = spv::Op::OpBitFieldInsert;
  8602. break;
  8603. case glslang::EOpFma:
  8604. libCall = spv::GLSLstd450Fma;
  8605. break;
  8606. case glslang::EOpFrexp:
  8607. {
  8608. libCall = spv::GLSLstd450FrexpStruct;
  8609. assert(builder.isPointerType(typeId1));
  8610. typeId1 = builder.getContainedTypeId(typeId1);
  8611. int width = builder.getScalarTypeWidth(typeId1);
  8612. if (width == 16)
  8613. // Using 16-bit exp operand, enable extension SPV_AMD_gpu_shader_int16
  8614. builder.addExtension(spv::E_SPV_AMD_gpu_shader_int16);
  8615. if (builder.getNumComponents(operands[0]) == 1)
  8616. frexpIntType = builder.makeIntegerType(width, true);
  8617. else
  8618. frexpIntType = builder.makeVectorType(builder.makeIntegerType(width, true),
  8619. builder.getNumComponents(operands[0]));
  8620. typeId = builder.makeStructResultType(typeId0, frexpIntType);
  8621. consumedOperands = 1;
  8622. }
  8623. break;
  8624. case glslang::EOpLdexp:
  8625. libCall = spv::GLSLstd450Ldexp;
  8626. break;
  8627. case glslang::EOpReadInvocation:
  8628. return createInvocationsOperation(op, typeId, operands, typeProxy);
  8629. case glslang::EOpSubgroupBroadcast:
  8630. case glslang::EOpSubgroupBallotBitExtract:
  8631. case glslang::EOpSubgroupShuffle:
  8632. case glslang::EOpSubgroupShuffleXor:
  8633. case glslang::EOpSubgroupShuffleUp:
  8634. case glslang::EOpSubgroupShuffleDown:
  8635. case glslang::EOpSubgroupRotate:
  8636. case glslang::EOpSubgroupClusteredRotate:
  8637. case glslang::EOpSubgroupClusteredAdd:
  8638. case glslang::EOpSubgroupClusteredMul:
  8639. case glslang::EOpSubgroupClusteredMin:
  8640. case glslang::EOpSubgroupClusteredMax:
  8641. case glslang::EOpSubgroupClusteredAnd:
  8642. case glslang::EOpSubgroupClusteredOr:
  8643. case glslang::EOpSubgroupClusteredXor:
  8644. case glslang::EOpSubgroupQuadBroadcast:
  8645. case glslang::EOpSubgroupPartitionedAdd:
  8646. case glslang::EOpSubgroupPartitionedMul:
  8647. case glslang::EOpSubgroupPartitionedMin:
  8648. case glslang::EOpSubgroupPartitionedMax:
  8649. case glslang::EOpSubgroupPartitionedAnd:
  8650. case glslang::EOpSubgroupPartitionedOr:
  8651. case glslang::EOpSubgroupPartitionedXor:
  8652. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8653. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8654. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8655. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8656. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8657. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8658. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8659. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8660. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8661. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8662. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8663. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8664. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8665. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8666. return createSubgroupOperation(op, typeId, operands, typeProxy);
  8667. case glslang::EOpSwizzleInvocations:
  8668. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  8669. libCall = spv::SwizzleInvocationsAMD;
  8670. break;
  8671. case glslang::EOpSwizzleInvocationsMasked:
  8672. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  8673. libCall = spv::SwizzleInvocationsMaskedAMD;
  8674. break;
  8675. case glslang::EOpWriteInvocation:
  8676. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  8677. libCall = spv::WriteInvocationAMD;
  8678. break;
  8679. case glslang::EOpMin3:
  8680. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  8681. if (isFloat)
  8682. libCall = spv::FMin3AMD;
  8683. else {
  8684. if (isUnsigned)
  8685. libCall = spv::UMin3AMD;
  8686. else
  8687. libCall = spv::SMin3AMD;
  8688. }
  8689. break;
  8690. case glslang::EOpMax3:
  8691. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  8692. if (isFloat)
  8693. libCall = spv::FMax3AMD;
  8694. else {
  8695. if (isUnsigned)
  8696. libCall = spv::UMax3AMD;
  8697. else
  8698. libCall = spv::SMax3AMD;
  8699. }
  8700. break;
  8701. case glslang::EOpMid3:
  8702. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  8703. if (isFloat)
  8704. libCall = spv::FMid3AMD;
  8705. else {
  8706. if (isUnsigned)
  8707. libCall = spv::UMid3AMD;
  8708. else
  8709. libCall = spv::SMid3AMD;
  8710. }
  8711. break;
  8712. case glslang::EOpInterpolateAtVertex:
  8713. if (typeProxy == glslang::EbtFloat16)
  8714. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  8715. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  8716. libCall = spv::InterpolateAtVertexAMD;
  8717. break;
  8718. case glslang::EOpReportIntersection:
  8719. typeId = builder.makeBoolType();
  8720. opCode = spv::Op::OpReportIntersectionKHR;
  8721. break;
  8722. case glslang::EOpTraceNV:
  8723. builder.createNoResultOp(spv::Op::OpTraceNV, operands);
  8724. return 0;
  8725. case glslang::EOpTraceRayMotionNV:
  8726. builder.addExtension(spv::E_SPV_NV_ray_tracing_motion_blur);
  8727. builder.addCapability(spv::Capability::RayTracingMotionBlurNV);
  8728. builder.createNoResultOp(spv::Op::OpTraceRayMotionNV, operands);
  8729. return 0;
  8730. case glslang::EOpTraceKHR:
  8731. builder.createNoResultOp(spv::Op::OpTraceRayKHR, operands);
  8732. return 0;
  8733. case glslang::EOpExecuteCallableNV:
  8734. builder.createNoResultOp(spv::Op::OpExecuteCallableNV, operands);
  8735. return 0;
  8736. case glslang::EOpExecuteCallableKHR:
  8737. builder.createNoResultOp(spv::Op::OpExecuteCallableKHR, operands);
  8738. return 0;
  8739. case glslang::EOpRayQueryInitialize:
  8740. builder.createNoResultOp(spv::Op::OpRayQueryInitializeKHR, operands);
  8741. return 0;
  8742. case glslang::EOpRayQueryTerminate:
  8743. builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR, operands);
  8744. return 0;
  8745. case glslang::EOpRayQueryGenerateIntersection:
  8746. builder.createNoResultOp(spv::Op::OpRayQueryGenerateIntersectionKHR, operands);
  8747. return 0;
  8748. case glslang::EOpRayQueryConfirmIntersection:
  8749. builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR, operands);
  8750. return 0;
  8751. case glslang::EOpRayQueryProceed:
  8752. typeId = builder.makeBoolType();
  8753. opCode = spv::Op::OpRayQueryProceedKHR;
  8754. break;
  8755. case glslang::EOpRayQueryGetIntersectionType:
  8756. typeId = builder.makeUintType(32);
  8757. opCode = spv::Op::OpRayQueryGetIntersectionTypeKHR;
  8758. break;
  8759. case glslang::EOpRayQueryGetRayTMin:
  8760. typeId = builder.makeFloatType(32);
  8761. opCode = spv::Op::OpRayQueryGetRayTMinKHR;
  8762. break;
  8763. case glslang::EOpRayQueryGetRayFlags:
  8764. typeId = builder.makeIntType(32);
  8765. opCode = spv::Op::OpRayQueryGetRayFlagsKHR;
  8766. break;
  8767. case glslang::EOpRayQueryGetIntersectionT:
  8768. typeId = builder.makeFloatType(32);
  8769. opCode = spv::Op::OpRayQueryGetIntersectionTKHR;
  8770. break;
  8771. case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
  8772. typeId = builder.makeIntType(32);
  8773. opCode = spv::Op::OpRayQueryGetIntersectionInstanceCustomIndexKHR;
  8774. break;
  8775. case glslang::EOpRayQueryGetIntersectionInstanceId:
  8776. typeId = builder.makeIntType(32);
  8777. opCode = spv::Op::OpRayQueryGetIntersectionInstanceIdKHR;
  8778. break;
  8779. case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
  8780. typeId = builder.makeUintType(32);
  8781. opCode = spv::Op::OpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffsetKHR;
  8782. break;
  8783. case glslang::EOpRayQueryGetIntersectionGeometryIndex:
  8784. typeId = builder.makeIntType(32);
  8785. opCode = spv::Op::OpRayQueryGetIntersectionGeometryIndexKHR;
  8786. break;
  8787. case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
  8788. typeId = builder.makeIntType(32);
  8789. opCode = spv::Op::OpRayQueryGetIntersectionPrimitiveIndexKHR;
  8790. break;
  8791. case glslang::EOpRayQueryGetIntersectionBarycentrics:
  8792. typeId = builder.makeVectorType(builder.makeFloatType(32), 2);
  8793. opCode = spv::Op::OpRayQueryGetIntersectionBarycentricsKHR;
  8794. break;
  8795. case glslang::EOpRayQueryGetIntersectionFrontFace:
  8796. typeId = builder.makeBoolType();
  8797. opCode = spv::Op::OpRayQueryGetIntersectionFrontFaceKHR;
  8798. break;
  8799. case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
  8800. typeId = builder.makeBoolType();
  8801. opCode = spv::Op::OpRayQueryGetIntersectionCandidateAABBOpaqueKHR;
  8802. break;
  8803. case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
  8804. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8805. opCode = spv::Op::OpRayQueryGetIntersectionObjectRayDirectionKHR;
  8806. break;
  8807. case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
  8808. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8809. opCode = spv::Op::OpRayQueryGetIntersectionObjectRayOriginKHR;
  8810. break;
  8811. case glslang::EOpRayQueryGetWorldRayDirection:
  8812. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8813. opCode = spv::Op::OpRayQueryGetWorldRayDirectionKHR;
  8814. break;
  8815. case glslang::EOpRayQueryGetWorldRayOrigin:
  8816. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8817. opCode = spv::Op::OpRayQueryGetWorldRayOriginKHR;
  8818. break;
  8819. case glslang::EOpRayQueryGetIntersectionObjectToWorld:
  8820. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  8821. opCode = spv::Op::OpRayQueryGetIntersectionObjectToWorldKHR;
  8822. break;
  8823. case glslang::EOpRayQueryGetIntersectionClusterIdNV:
  8824. typeId = builder.makeIntegerType(32, 1);
  8825. opCode = spv::Op::OpRayQueryGetClusterIdNV;
  8826. break;
  8827. case glslang::EOpRayQueryGetIntersectionWorldToObject:
  8828. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  8829. opCode = spv::Op::OpRayQueryGetIntersectionWorldToObjectKHR;
  8830. break;
  8831. case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
  8832. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8833. opCode = spv::Op::OpRayQueryGetIntersectionSpherePositionNV;
  8834. break;
  8835. case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
  8836. typeId = builder.makeFloatType(32);
  8837. opCode = spv::Op::OpRayQueryGetIntersectionSphereRadiusNV;
  8838. break;
  8839. case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
  8840. typeId = builder.makeFloatType(32);
  8841. opCode = spv::Op::OpRayQueryGetIntersectionLSSHitValueNV;
  8842. break;
  8843. case glslang::EOpRayQueryIsSphereHitNV:
  8844. typeId = builder.makeBoolType();
  8845. opCode = spv::Op::OpRayQueryIsSphereHitNV;
  8846. break;
  8847. case glslang::EOpRayQueryIsLSSHitNV:
  8848. typeId = builder.makeBoolType();
  8849. opCode = spv::Op::OpRayQueryIsLSSHitNV;
  8850. break;
  8851. case glslang::EOpWritePackedPrimitiveIndices4x8NV:
  8852. builder.createNoResultOp(spv::Op::OpWritePackedPrimitiveIndices4x8NV, operands);
  8853. return 0;
  8854. case glslang::EOpEmitMeshTasksEXT:
  8855. if (taskPayloadID)
  8856. operands.push_back(taskPayloadID);
  8857. // As per SPV_EXT_mesh_shader make it a terminating instruction in the current block
  8858. builder.makeStatementTerminator(spv::Op::OpEmitMeshTasksEXT, operands, "post-OpEmitMeshTasksEXT");
  8859. return 0;
  8860. case glslang::EOpSetMeshOutputsEXT:
  8861. builder.createNoResultOp(spv::Op::OpSetMeshOutputsEXT, operands);
  8862. return 0;
  8863. case glslang::EOpCooperativeMatrixMulAddNV:
  8864. opCode = spv::Op::OpCooperativeMatrixMulAddNV;
  8865. break;
  8866. case glslang::EOpHitObjectTraceRayNV:
  8867. builder.createNoResultOp(spv::Op::OpHitObjectTraceRayNV, operands);
  8868. return 0;
  8869. case glslang::EOpHitObjectTraceRayMotionNV:
  8870. builder.createNoResultOp(spv::Op::OpHitObjectTraceRayMotionNV, operands);
  8871. return 0;
  8872. case glslang::EOpHitObjectRecordHitNV:
  8873. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitNV, operands);
  8874. return 0;
  8875. case glslang::EOpHitObjectRecordHitMotionNV:
  8876. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitMotionNV, operands);
  8877. return 0;
  8878. case glslang::EOpHitObjectRecordHitWithIndexNV:
  8879. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitWithIndexNV, operands);
  8880. return 0;
  8881. case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
  8882. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitWithIndexMotionNV, operands);
  8883. return 0;
  8884. case glslang::EOpHitObjectRecordMissNV:
  8885. builder.createNoResultOp(spv::Op::OpHitObjectRecordMissNV, operands);
  8886. return 0;
  8887. case glslang::EOpHitObjectRecordMissMotionNV:
  8888. builder.createNoResultOp(spv::Op::OpHitObjectRecordMissMotionNV, operands);
  8889. return 0;
  8890. case glslang::EOpHitObjectExecuteShaderNV:
  8891. builder.createNoResultOp(spv::Op::OpHitObjectExecuteShaderNV, operands);
  8892. return 0;
  8893. case glslang::EOpHitObjectIsEmptyNV:
  8894. typeId = builder.makeBoolType();
  8895. opCode = spv::Op::OpHitObjectIsEmptyNV;
  8896. break;
  8897. case glslang::EOpHitObjectIsMissNV:
  8898. typeId = builder.makeBoolType();
  8899. opCode = spv::Op::OpHitObjectIsMissNV;
  8900. break;
  8901. case glslang::EOpHitObjectIsHitNV:
  8902. typeId = builder.makeBoolType();
  8903. opCode = spv::Op::OpHitObjectIsHitNV;
  8904. break;
  8905. case glslang::EOpHitObjectIsSphereHitNV:
  8906. typeId = builder.makeBoolType();
  8907. opCode = spv::Op::OpHitObjectIsSphereHitNV;
  8908. break;
  8909. case glslang::EOpHitObjectIsLSSHitNV:
  8910. typeId = builder.makeBoolType();
  8911. opCode = spv::Op::OpHitObjectIsLSSHitNV;
  8912. break;
  8913. case glslang::EOpHitObjectGetRayTMinNV:
  8914. typeId = builder.makeFloatType(32);
  8915. opCode = spv::Op::OpHitObjectGetRayTMinNV;
  8916. break;
  8917. case glslang::EOpHitObjectGetRayTMaxNV:
  8918. typeId = builder.makeFloatType(32);
  8919. opCode = spv::Op::OpHitObjectGetRayTMaxNV;
  8920. break;
  8921. case glslang::EOpHitObjectGetObjectRayOriginNV:
  8922. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8923. opCode = spv::Op::OpHitObjectGetObjectRayOriginNV;
  8924. break;
  8925. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  8926. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8927. opCode = spv::Op::OpHitObjectGetObjectRayDirectionNV;
  8928. break;
  8929. case glslang::EOpHitObjectGetWorldRayOriginNV:
  8930. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8931. opCode = spv::Op::OpHitObjectGetWorldRayOriginNV;
  8932. break;
  8933. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  8934. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  8935. opCode = spv::Op::OpHitObjectGetWorldRayDirectionNV;
  8936. break;
  8937. case glslang::EOpHitObjectGetWorldToObjectNV:
  8938. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  8939. opCode = spv::Op::OpHitObjectGetWorldToObjectNV;
  8940. break;
  8941. case glslang::EOpHitObjectGetObjectToWorldNV:
  8942. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  8943. opCode = spv::Op::OpHitObjectGetObjectToWorldNV;
  8944. break;
  8945. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  8946. typeId = builder.makeIntegerType(32, 1);
  8947. opCode = spv::Op::OpHitObjectGetInstanceCustomIndexNV;
  8948. break;
  8949. case glslang::EOpHitObjectGetInstanceIdNV:
  8950. typeId = builder.makeIntegerType(32, 1);
  8951. opCode = spv::Op::OpHitObjectGetInstanceIdNV;
  8952. break;
  8953. case glslang::EOpHitObjectGetGeometryIndexNV:
  8954. typeId = builder.makeIntegerType(32, 1);
  8955. opCode = spv::Op::OpHitObjectGetGeometryIndexNV;
  8956. break;
  8957. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  8958. typeId = builder.makeIntegerType(32, 1);
  8959. opCode = spv::Op::OpHitObjectGetPrimitiveIndexNV;
  8960. break;
  8961. case glslang::EOpHitObjectGetHitKindNV:
  8962. typeId = builder.makeIntegerType(32, 0);
  8963. opCode = spv::Op::OpHitObjectGetHitKindNV;
  8964. break;
  8965. case glslang::EOpHitObjectGetCurrentTimeNV:
  8966. typeId = builder.makeFloatType(32);
  8967. opCode = spv::Op::OpHitObjectGetCurrentTimeNV;
  8968. break;
  8969. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  8970. typeId = builder.makeIntegerType(32, 0);
  8971. opCode = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexNV;
  8972. return 0;
  8973. case glslang::EOpHitObjectGetAttributesNV:
  8974. builder.createNoResultOp(spv::Op::OpHitObjectGetAttributesNV, operands);
  8975. return 0;
  8976. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  8977. typeId = builder.makeVectorType(builder.makeUintType(32), 2);
  8978. opCode = spv::Op::OpHitObjectGetShaderRecordBufferHandleNV;
  8979. break;
  8980. case glslang::EOpHitObjectGetClusterIdNV:
  8981. typeId = builder.makeIntegerType(32, 1);
  8982. opCode = spv::Op::OpHitObjectGetClusterIdNV;
  8983. break;
  8984. case glslang::EOpReorderThreadNV: {
  8985. if (operands.size() == 2) {
  8986. builder.createNoResultOp(spv::Op::OpReorderThreadWithHintNV, operands);
  8987. } else {
  8988. builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectNV, operands);
  8989. }
  8990. return 0;
  8991. }
  8992. case glslang::EOpImageSampleWeightedQCOM:
  8993. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  8994. opCode = spv::Op::OpImageSampleWeightedQCOM;
  8995. addImageProcessingQCOMDecoration(operands[2], spv::Decoration::WeightTextureQCOM);
  8996. break;
  8997. case glslang::EOpImageBoxFilterQCOM:
  8998. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  8999. opCode = spv::Op::OpImageBoxFilterQCOM;
  9000. break;
  9001. case glslang::EOpImageBlockMatchSADQCOM:
  9002. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9003. opCode = spv::Op::OpImageBlockMatchSADQCOM;
  9004. addImageProcessingQCOMDecoration(operands[0], spv::Decoration::BlockMatchTextureQCOM);
  9005. addImageProcessingQCOMDecoration(operands[2], spv::Decoration::BlockMatchTextureQCOM);
  9006. break;
  9007. case glslang::EOpImageBlockMatchSSDQCOM:
  9008. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9009. opCode = spv::Op::OpImageBlockMatchSSDQCOM;
  9010. addImageProcessingQCOMDecoration(operands[0], spv::Decoration::BlockMatchTextureQCOM);
  9011. addImageProcessingQCOMDecoration(operands[2], spv::Decoration::BlockMatchTextureQCOM);
  9012. break;
  9013. case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
  9014. typeId = builder.makeVectorType(builder.makeFloatType(32), 2);
  9015. opCode = spv::Op::OpFetchMicroTriangleVertexBarycentricNV;
  9016. break;
  9017. case glslang::EOpFetchMicroTriangleVertexPositionNV:
  9018. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9019. opCode = spv::Op::OpFetchMicroTriangleVertexPositionNV;
  9020. break;
  9021. case glslang::EOpImageBlockMatchWindowSSDQCOM:
  9022. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9023. opCode = spv::Op::OpImageBlockMatchWindowSSDQCOM;
  9024. addImageProcessing2QCOMDecoration(operands[0], false);
  9025. addImageProcessing2QCOMDecoration(operands[2], false);
  9026. break;
  9027. case glslang::EOpImageBlockMatchWindowSADQCOM:
  9028. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9029. opCode = spv::Op::OpImageBlockMatchWindowSADQCOM;
  9030. addImageProcessing2QCOMDecoration(operands[0], false);
  9031. addImageProcessing2QCOMDecoration(operands[2], false);
  9032. break;
  9033. case glslang::EOpImageBlockMatchGatherSSDQCOM:
  9034. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9035. opCode = spv::Op::OpImageBlockMatchGatherSSDQCOM;
  9036. addImageProcessing2QCOMDecoration(operands[0], true);
  9037. addImageProcessing2QCOMDecoration(operands[2], true);
  9038. break;
  9039. case glslang::EOpImageBlockMatchGatherSADQCOM:
  9040. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9041. opCode = spv::Op::OpImageBlockMatchGatherSADQCOM;
  9042. addImageProcessing2QCOMDecoration(operands[0], true);
  9043. addImageProcessing2QCOMDecoration(operands[2], true);
  9044. break;
  9045. case glslang::EOpCreateTensorLayoutNV:
  9046. return builder.createOp(spv::Op::OpCreateTensorLayoutNV, typeId, std::vector<spv::Id>{});
  9047. case glslang::EOpCreateTensorViewNV:
  9048. return builder.createOp(spv::Op::OpCreateTensorViewNV, typeId, std::vector<spv::Id>{});
  9049. case glslang::EOpTensorLayoutSetBlockSizeNV:
  9050. opCode = spv::Op::OpTensorLayoutSetBlockSizeNV;
  9051. break;
  9052. case glslang::EOpTensorLayoutSetDimensionNV:
  9053. opCode = spv::Op::OpTensorLayoutSetDimensionNV;
  9054. break;
  9055. case glslang::EOpTensorLayoutSetStrideNV:
  9056. opCode = spv::Op::OpTensorLayoutSetStrideNV;
  9057. break;
  9058. case glslang::EOpTensorLayoutSliceNV:
  9059. opCode = spv::Op::OpTensorLayoutSliceNV;
  9060. break;
  9061. case glslang::EOpTensorLayoutSetClampValueNV:
  9062. opCode = spv::Op::OpTensorLayoutSetClampValueNV;
  9063. break;
  9064. case glslang::EOpTensorViewSetDimensionNV:
  9065. opCode = spv::Op::OpTensorViewSetDimensionNV;
  9066. break;
  9067. case glslang::EOpTensorViewSetStrideNV:
  9068. opCode = spv::Op::OpTensorViewSetStrideNV;
  9069. break;
  9070. case glslang::EOpTensorViewSetClipNV:
  9071. opCode = spv::Op::OpTensorViewSetClipNV;
  9072. break;
  9073. default:
  9074. return 0;
  9075. }
  9076. spv::Id id = 0;
  9077. if (libCall >= 0) {
  9078. // Use an extended instruction from the standard library.
  9079. // Construct the call arguments, without modifying the original operands vector.
  9080. // We might need the remaining arguments, e.g. in the EOpFrexp case.
  9081. std::vector<spv::Id> callArguments(operands.begin(), operands.begin() + consumedOperands);
  9082. id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, callArguments);
  9083. } else if (opCode == spv::Op::OpDot && !isFloat) {
  9084. // int dot(int, int)
  9085. // NOTE: never called for scalar/vector1, this is turned into simple mul before this can be reached
  9086. const int componentCount = builder.getNumComponents(operands[0]);
  9087. spv::Id mulOp = builder.createBinOp(spv::Op::OpIMul, builder.getTypeId(operands[0]), operands[0], operands[1]);
  9088. builder.setPrecision(mulOp, precision);
  9089. id = builder.createCompositeExtract(mulOp, typeId, 0);
  9090. for (int i = 1; i < componentCount; ++i) {
  9091. builder.setPrecision(id, precision);
  9092. id = builder.createBinOp(spv::Op::OpIAdd, typeId, id, builder.createCompositeExtract(mulOp, typeId, i));
  9093. }
  9094. } else {
  9095. switch (consumedOperands) {
  9096. case 0:
  9097. // should all be handled by visitAggregate and createNoArgOperation
  9098. assert(0);
  9099. return 0;
  9100. case 1:
  9101. // should all be handled by createUnaryOperation
  9102. assert(0);
  9103. return 0;
  9104. case 2:
  9105. id = builder.createBinOp(opCode, typeId, operands[0], operands[1]);
  9106. break;
  9107. default:
  9108. // anything 3 or over doesn't have l-value operands, so all should be consumed
  9109. assert(consumedOperands == operands.size());
  9110. id = builder.createOp(opCode, typeId, operands);
  9111. break;
  9112. }
  9113. }
  9114. // Decode the return types that were structures
  9115. switch (op) {
  9116. case glslang::EOpAddCarry:
  9117. case glslang::EOpSubBorrow:
  9118. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);
  9119. id = builder.createCompositeExtract(id, typeId0, 0);
  9120. break;
  9121. case glslang::EOpUMulExtended:
  9122. case glslang::EOpIMulExtended:
  9123. builder.createStore(builder.createCompositeExtract(id, typeId0, 0), operands[3]);
  9124. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);
  9125. break;
  9126. case glslang::EOpModf:
  9127. {
  9128. assert(operands.size() == 2);
  9129. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[1]);
  9130. id = builder.createCompositeExtract(id, typeId0, 0);
  9131. }
  9132. break;
  9133. case glslang::EOpFrexp:
  9134. {
  9135. assert(operands.size() == 2);
  9136. if (builder.isFloatType(builder.getScalarTypeId(typeId1))) {
  9137. // "exp" is floating-point type (from HLSL intrinsic)
  9138. spv::Id member1 = builder.createCompositeExtract(id, frexpIntType, 1);
  9139. member1 = builder.createUnaryOp(spv::Op::OpConvertSToF, typeId1, member1);
  9140. builder.createStore(member1, operands[1]);
  9141. } else
  9142. // "exp" is integer type (from GLSL built-in function)
  9143. builder.createStore(builder.createCompositeExtract(id, frexpIntType, 1), operands[1]);
  9144. id = builder.createCompositeExtract(id, typeId0, 0);
  9145. }
  9146. break;
  9147. default:
  9148. break;
  9149. }
  9150. return builder.setPrecision(id, precision);
  9151. }
  9152. // Intrinsics with no arguments (or no return value, and no precision).
  9153. spv::Id TGlslangToSpvTraverser::createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId)
  9154. {
  9155. // GLSL memory barriers use queuefamily scope in new model, device scope in old model
  9156. spv::Scope memoryBarrierScope = glslangIntermediate->usingVulkanMemoryModel() ?
  9157. spv::Scope::QueueFamilyKHR : spv::Scope::Device;
  9158. switch (op) {
  9159. case glslang::EOpBarrier:
  9160. if (glslangIntermediate->getStage() == EShLangTessControl) {
  9161. if (glslangIntermediate->usingVulkanMemoryModel()) {
  9162. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
  9163. spv::MemorySemanticsMask::OutputMemoryKHR |
  9164. spv::MemorySemanticsMask::AcquireRelease);
  9165. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  9166. } else {
  9167. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Invocation, spv::MemorySemanticsMask::MaskNone);
  9168. }
  9169. } else {
  9170. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
  9171. spv::MemorySemanticsMask::WorkgroupMemory |
  9172. spv::MemorySemanticsMask::AcquireRelease);
  9173. }
  9174. return 0;
  9175. case glslang::EOpMemoryBarrier:
  9176. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsAllMemory |
  9177. spv::MemorySemanticsMask::AcquireRelease);
  9178. return 0;
  9179. case glslang::EOpMemoryBarrierBuffer:
  9180. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::UniformMemory |
  9181. spv::MemorySemanticsMask::AcquireRelease);
  9182. return 0;
  9183. case glslang::EOpMemoryBarrierShared:
  9184. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::WorkgroupMemory |
  9185. spv::MemorySemanticsMask::AcquireRelease);
  9186. return 0;
  9187. case glslang::EOpGroupMemoryBarrier:
  9188. builder.createMemoryBarrier(spv::Scope::Workgroup, spv::MemorySemanticsAllMemory |
  9189. spv::MemorySemanticsMask::AcquireRelease);
  9190. return 0;
  9191. case glslang::EOpMemoryBarrierAtomicCounter:
  9192. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::AtomicCounterMemory |
  9193. spv::MemorySemanticsMask::AcquireRelease);
  9194. return 0;
  9195. case glslang::EOpMemoryBarrierImage:
  9196. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::ImageMemory |
  9197. spv::MemorySemanticsMask::AcquireRelease);
  9198. return 0;
  9199. case glslang::EOpAllMemoryBarrierWithGroupSync:
  9200. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Device,
  9201. spv::MemorySemanticsAllMemory |
  9202. spv::MemorySemanticsMask::AcquireRelease);
  9203. return 0;
  9204. case glslang::EOpDeviceMemoryBarrier:
  9205. builder.createMemoryBarrier(spv::Scope::Device, spv::MemorySemanticsMask::UniformMemory |
  9206. spv::MemorySemanticsMask::ImageMemory |
  9207. spv::MemorySemanticsMask::AcquireRelease);
  9208. return 0;
  9209. case glslang::EOpDeviceMemoryBarrierWithGroupSync:
  9210. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Device, spv::MemorySemanticsMask::UniformMemory |
  9211. spv::MemorySemanticsMask::ImageMemory |
  9212. spv::MemorySemanticsMask::AcquireRelease);
  9213. return 0;
  9214. case glslang::EOpWorkgroupMemoryBarrier:
  9215. builder.createMemoryBarrier(spv::Scope::Workgroup, spv::MemorySemanticsMask::WorkgroupMemory |
  9216. spv::MemorySemanticsMask::AcquireRelease);
  9217. return 0;
  9218. case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:
  9219. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
  9220. spv::MemorySemanticsMask::WorkgroupMemory |
  9221. spv::MemorySemanticsMask::AcquireRelease);
  9222. return 0;
  9223. case glslang::EOpSubgroupBarrier:
  9224. builder.createControlBarrier(spv::Scope::Subgroup, spv::Scope::Subgroup, spv::MemorySemanticsAllMemory |
  9225. spv::MemorySemanticsMask::AcquireRelease);
  9226. return spv::NoResult;
  9227. case glslang::EOpSubgroupMemoryBarrier:
  9228. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsAllMemory |
  9229. spv::MemorySemanticsMask::AcquireRelease);
  9230. return spv::NoResult;
  9231. case glslang::EOpSubgroupMemoryBarrierBuffer:
  9232. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::UniformMemory |
  9233. spv::MemorySemanticsMask::AcquireRelease);
  9234. return spv::NoResult;
  9235. case glslang::EOpSubgroupMemoryBarrierImage:
  9236. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::ImageMemory |
  9237. spv::MemorySemanticsMask::AcquireRelease);
  9238. return spv::NoResult;
  9239. case glslang::EOpSubgroupMemoryBarrierShared:
  9240. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::WorkgroupMemory |
  9241. spv::MemorySemanticsMask::AcquireRelease);
  9242. return spv::NoResult;
  9243. case glslang::EOpEmitVertex:
  9244. builder.createNoResultOp(spv::Op::OpEmitVertex);
  9245. return 0;
  9246. case glslang::EOpEndPrimitive:
  9247. builder.createNoResultOp(spv::Op::OpEndPrimitive);
  9248. return 0;
  9249. case glslang::EOpSubgroupElect: {
  9250. std::vector<spv::Id> operands;
  9251. return createSubgroupOperation(op, typeId, operands, glslang::EbtVoid);
  9252. }
  9253. case glslang::EOpTime:
  9254. {
  9255. std::vector<spv::Id> args; // Dummy arguments
  9256. spv::Id id = builder.createBuiltinCall(typeId, getExtBuiltins(spv::E_SPV_AMD_gcn_shader), spv::TimeAMD, args);
  9257. return builder.setPrecision(id, precision);
  9258. }
  9259. case glslang::EOpIgnoreIntersectionNV:
  9260. builder.createNoResultOp(spv::Op::OpIgnoreIntersectionNV);
  9261. return 0;
  9262. case glslang::EOpTerminateRayNV:
  9263. builder.createNoResultOp(spv::Op::OpTerminateRayNV);
  9264. return 0;
  9265. case glslang::EOpRayQueryInitialize:
  9266. builder.createNoResultOp(spv::Op::OpRayQueryInitializeKHR);
  9267. return 0;
  9268. case glslang::EOpRayQueryTerminate:
  9269. builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR);
  9270. return 0;
  9271. case glslang::EOpRayQueryGenerateIntersection:
  9272. builder.createNoResultOp(spv::Op::OpRayQueryGenerateIntersectionKHR);
  9273. return 0;
  9274. case glslang::EOpRayQueryConfirmIntersection:
  9275. builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR);
  9276. return 0;
  9277. case glslang::EOpBeginInvocationInterlock:
  9278. builder.createNoResultOp(spv::Op::OpBeginInvocationInterlockEXT);
  9279. return 0;
  9280. case glslang::EOpEndInvocationInterlock:
  9281. builder.createNoResultOp(spv::Op::OpEndInvocationInterlockEXT);
  9282. return 0;
  9283. case glslang::EOpIsHelperInvocation:
  9284. {
  9285. std::vector<spv::Id> args; // Dummy arguments
  9286. builder.addExtension(spv::E_SPV_EXT_demote_to_helper_invocation);
  9287. builder.addCapability(spv::Capability::DemoteToHelperInvocationEXT);
  9288. return builder.createOp(spv::Op::OpIsHelperInvocationEXT, typeId, args);
  9289. }
  9290. case glslang::EOpReadClockSubgroupKHR: {
  9291. std::vector<spv::Id> args;
  9292. args.push_back(builder.makeUintConstant(spv::Scope::Subgroup));
  9293. builder.addExtension(spv::E_SPV_KHR_shader_clock);
  9294. builder.addCapability(spv::Capability::ShaderClockKHR);
  9295. return builder.createOp(spv::Op::OpReadClockKHR, typeId, args);
  9296. }
  9297. case glslang::EOpReadClockDeviceKHR: {
  9298. std::vector<spv::Id> args;
  9299. args.push_back(builder.makeUintConstant(spv::Scope::Device));
  9300. builder.addExtension(spv::E_SPV_KHR_shader_clock);
  9301. builder.addCapability(spv::Capability::ShaderClockKHR);
  9302. return builder.createOp(spv::Op::OpReadClockKHR, typeId, args);
  9303. }
  9304. case glslang::EOpStencilAttachmentReadEXT:
  9305. case glslang::EOpDepthAttachmentReadEXT:
  9306. {
  9307. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  9308. spv::Decoration precision;
  9309. spv::Op spv_op;
  9310. if (op == glslang::EOpStencilAttachmentReadEXT)
  9311. {
  9312. precision = spv::Decoration::RelaxedPrecision;
  9313. spv_op = spv::Op::OpStencilAttachmentReadEXT;
  9314. builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
  9315. }
  9316. else
  9317. {
  9318. precision = spv::NoPrecision;
  9319. spv_op = spv::Op::OpDepthAttachmentReadEXT;
  9320. builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
  9321. }
  9322. std::vector<spv::Id> args; // Dummy args
  9323. spv::Id result = builder.createOp(spv_op, typeId, args);
  9324. return builder.setPrecision(result, precision);
  9325. }
  9326. default:
  9327. break;
  9328. }
  9329. logger->missingFunctionality("unknown operation with no arguments");
  9330. return 0;
  9331. }
  9332. spv::Id TGlslangToSpvTraverser::getSymbolId(const glslang::TIntermSymbol* symbol)
  9333. {
  9334. auto iter = symbolValues.find(symbol->getId());
  9335. spv::Id id;
  9336. if (symbolValues.end() != iter) {
  9337. id = iter->second;
  9338. return id;
  9339. }
  9340. // it was not found, create it
  9341. spv::BuiltIn builtIn = TranslateBuiltInDecoration(symbol->getQualifier().builtIn, false);
  9342. auto forcedType = getForcedType(symbol->getQualifier().builtIn, symbol->getType());
  9343. // There are pairs of symbols that map to the same SPIR-V built-in:
  9344. // gl_ObjectToWorldEXT and gl_ObjectToWorld3x4EXT, and gl_WorldToObjectEXT
  9345. // and gl_WorldToObject3x4EXT. SPIR-V forbids having two OpVariables
  9346. // with the same BuiltIn in the same storage class, so we must re-use one.
  9347. const bool mayNeedToReuseBuiltIn =
  9348. builtIn == spv::BuiltIn::ObjectToWorldKHR ||
  9349. builtIn == spv::BuiltIn::WorldToObjectKHR;
  9350. if (mayNeedToReuseBuiltIn) {
  9351. auto iter = builtInVariableIds.find(uint32_t(builtIn));
  9352. if (builtInVariableIds.end() != iter) {
  9353. id = iter->second;
  9354. symbolValues[symbol->getId()] = id;
  9355. if (forcedType.second != spv::NoType)
  9356. forceType[id] = forcedType.second;
  9357. return id;
  9358. }
  9359. }
  9360. if (symbol->getBasicType() == glslang::EbtFunction) {
  9361. return 0;
  9362. }
  9363. id = createSpvVariable(symbol, forcedType.first);
  9364. if (mayNeedToReuseBuiltIn) {
  9365. builtInVariableIds.insert({uint32_t(builtIn), id});
  9366. }
  9367. symbolValues[symbol->getId()] = id;
  9368. if (forcedType.second != spv::NoType)
  9369. forceType[id] = forcedType.second;
  9370. if (symbol->getBasicType() != glslang::EbtBlock) {
  9371. builder.addDecoration(id, TranslatePrecisionDecoration(symbol->getType()));
  9372. builder.addDecoration(id, TranslateInterpolationDecoration(symbol->getType().getQualifier()));
  9373. builder.addDecoration(id, TranslateAuxiliaryStorageDecoration(symbol->getType().getQualifier()));
  9374. addMeshNVDecoration(id, /*member*/ -1, symbol->getType().getQualifier());
  9375. if (symbol->getQualifier().hasComponent())
  9376. builder.addDecoration(id, spv::Decoration::Component, symbol->getQualifier().layoutComponent);
  9377. if (symbol->getQualifier().hasIndex())
  9378. builder.addDecoration(id, spv::Decoration::Index, symbol->getQualifier().layoutIndex);
  9379. if (symbol->getType().getQualifier().hasSpecConstantId())
  9380. builder.addDecoration(id, spv::Decoration::SpecId, symbol->getType().getQualifier().layoutSpecConstantId);
  9381. // atomic counters use this:
  9382. if (symbol->getQualifier().hasOffset())
  9383. builder.addDecoration(id, spv::Decoration::Offset, symbol->getQualifier().layoutOffset);
  9384. }
  9385. if (symbol->getQualifier().hasLocation()) {
  9386. if (!(glslangIntermediate->isRayTracingStage() &&
  9387. (glslangIntermediate->IsRequestedExtension(glslang::E_GL_EXT_ray_tracing) ||
  9388. glslangIntermediate->IsRequestedExtension(glslang::E_GL_NV_shader_invocation_reorder))
  9389. && (builder.getStorageClass(id) == spv::StorageClass::RayPayloadKHR ||
  9390. builder.getStorageClass(id) == spv::StorageClass::IncomingRayPayloadKHR ||
  9391. builder.getStorageClass(id) == spv::StorageClass::CallableDataKHR ||
  9392. builder.getStorageClass(id) == spv::StorageClass::IncomingCallableDataKHR ||
  9393. builder.getStorageClass(id) == spv::StorageClass::HitObjectAttributeNV))) {
  9394. // Location values are used to link TraceRayKHR/ExecuteCallableKHR/HitObjectGetAttributesNV
  9395. // to corresponding variables but are not valid in SPIRV since they are supported only
  9396. // for Input/Output Storage classes.
  9397. builder.addDecoration(id, spv::Decoration::Location, symbol->getQualifier().layoutLocation);
  9398. }
  9399. }
  9400. builder.addDecoration(id, TranslateInvariantDecoration(symbol->getType().getQualifier()));
  9401. if (symbol->getQualifier().hasStream() && glslangIntermediate->isMultiStream()) {
  9402. builder.addCapability(spv::Capability::GeometryStreams);
  9403. builder.addDecoration(id, spv::Decoration::Stream, symbol->getQualifier().layoutStream);
  9404. }
  9405. if (symbol->getQualifier().hasSet())
  9406. builder.addDecoration(id, spv::Decoration::DescriptorSet, symbol->getQualifier().layoutSet);
  9407. else if (IsDescriptorResource(symbol->getType())) {
  9408. // default to 0
  9409. builder.addDecoration(id, spv::Decoration::DescriptorSet, 0);
  9410. }
  9411. if (symbol->getQualifier().hasBinding())
  9412. builder.addDecoration(id, spv::Decoration::Binding, symbol->getQualifier().layoutBinding);
  9413. else if (IsDescriptorResource(symbol->getType())) {
  9414. // default to 0
  9415. builder.addDecoration(id, spv::Decoration::Binding, 0);
  9416. }
  9417. if (symbol->getQualifier().hasAttachment())
  9418. builder.addDecoration(id, spv::Decoration::InputAttachmentIndex, symbol->getQualifier().layoutAttachment);
  9419. if (glslangIntermediate->getXfbMode()) {
  9420. builder.addCapability(spv::Capability::TransformFeedback);
  9421. if (symbol->getQualifier().hasXfbBuffer()) {
  9422. builder.addDecoration(id, spv::Decoration::XfbBuffer, symbol->getQualifier().layoutXfbBuffer);
  9423. unsigned stride = glslangIntermediate->getXfbStride(symbol->getQualifier().layoutXfbBuffer);
  9424. if (stride != glslang::TQualifier::layoutXfbStrideEnd)
  9425. builder.addDecoration(id, spv::Decoration::XfbStride, stride);
  9426. }
  9427. if (symbol->getQualifier().hasXfbOffset())
  9428. builder.addDecoration(id, spv::Decoration::Offset, symbol->getQualifier().layoutXfbOffset);
  9429. }
  9430. // add built-in variable decoration
  9431. if (builtIn != spv::BuiltIn::Max) {
  9432. // WorkgroupSize deprecated in spirv1.6
  9433. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_6 ||
  9434. builtIn != spv::BuiltIn::WorkgroupSize)
  9435. builder.addDecoration(id, spv::Decoration::BuiltIn, (int)builtIn);
  9436. }
  9437. // Add volatile decoration to HelperInvocation for spirv1.6 and beyond
  9438. if (builtIn == spv::BuiltIn::HelperInvocation &&
  9439. !glslangIntermediate->usingVulkanMemoryModel() &&
  9440. glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  9441. builder.addDecoration(id, spv::Decoration::Volatile);
  9442. }
  9443. // Subgroup builtins which have input storage class are volatile for ray tracing stages.
  9444. if (symbol->getType().isImage() || symbol->getQualifier().isPipeInput()) {
  9445. std::vector<spv::Decoration> memory;
  9446. TranslateMemoryDecoration(symbol->getType().getQualifier(), memory,
  9447. glslangIntermediate->usingVulkanMemoryModel());
  9448. for (unsigned int i = 0; i < memory.size(); ++i)
  9449. builder.addDecoration(id, memory[i]);
  9450. }
  9451. if (builtIn == spv::BuiltIn::SampleMask) {
  9452. spv::Decoration decoration;
  9453. // GL_NV_sample_mask_override_coverage extension
  9454. if (glslangIntermediate->getLayoutOverrideCoverage())
  9455. decoration = spv::Decoration::OverrideCoverageNV;
  9456. else
  9457. decoration = spv::Decoration::Max;
  9458. builder.addDecoration(id, decoration);
  9459. if (decoration != spv::Decoration::Max) {
  9460. builder.addCapability(spv::Capability::SampleMaskOverrideCoverageNV);
  9461. builder.addExtension(spv::E_SPV_NV_sample_mask_override_coverage);
  9462. }
  9463. }
  9464. else if (builtIn == spv::BuiltIn::Layer) {
  9465. // SPV_NV_viewport_array2 extension
  9466. if (symbol->getQualifier().layoutViewportRelative) {
  9467. builder.addDecoration(id, spv::Decoration::ViewportRelativeNV);
  9468. builder.addCapability(spv::Capability::ShaderViewportMaskNV);
  9469. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  9470. }
  9471. if (symbol->getQualifier().layoutSecondaryViewportRelativeOffset != -2048) {
  9472. builder.addDecoration(id, spv::Decoration::SecondaryViewportRelativeNV,
  9473. symbol->getQualifier().layoutSecondaryViewportRelativeOffset);
  9474. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  9475. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  9476. }
  9477. }
  9478. if (symbol->getQualifier().layoutPassthrough) {
  9479. builder.addDecoration(id, spv::Decoration::PassthroughNV);
  9480. builder.addCapability(spv::Capability::GeometryShaderPassthroughNV);
  9481. builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);
  9482. }
  9483. if (symbol->getQualifier().pervertexNV) {
  9484. builder.addDecoration(id, spv::Decoration::PerVertexNV);
  9485. builder.addCapability(spv::Capability::FragmentBarycentricNV);
  9486. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  9487. }
  9488. if (symbol->getQualifier().pervertexEXT) {
  9489. builder.addDecoration(id, spv::Decoration::PerVertexKHR);
  9490. builder.addCapability(spv::Capability::FragmentBarycentricKHR);
  9491. builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
  9492. }
  9493. if (glslangIntermediate->getHlslFunctionality1() && symbol->getType().getQualifier().semanticName != nullptr) {
  9494. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  9495. builder.addDecoration(id, spv::Decoration::HlslSemanticGOOGLE,
  9496. symbol->getType().getQualifier().semanticName);
  9497. }
  9498. if (symbol->isReference()) {
  9499. builder.addDecoration(id, symbol->getType().getQualifier().restrict ?
  9500. spv::Decoration::RestrictPointerEXT : spv::Decoration::AliasedPointerEXT);
  9501. }
  9502. // Add SPIR-V decorations (GL_EXT_spirv_intrinsics)
  9503. if (symbol->getType().getQualifier().hasSpirvDecorate())
  9504. applySpirvDecorate(symbol->getType(), id, {});
  9505. return id;
  9506. }
  9507. // add per-primitive, per-view. per-task decorations to a struct member (member >= 0) or an object
  9508. void TGlslangToSpvTraverser::addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier& qualifier)
  9509. {
  9510. bool isMeshShaderExt = (glslangIntermediate->getRequestedExtensions().find(glslang::E_GL_EXT_mesh_shader) !=
  9511. glslangIntermediate->getRequestedExtensions().end());
  9512. if (member >= 0) {
  9513. if (qualifier.perPrimitiveNV) {
  9514. // Need to add capability/extension for fragment shader.
  9515. // Mesh shader already adds this by default.
  9516. if (glslangIntermediate->getStage() == EShLangFragment) {
  9517. if(isMeshShaderExt) {
  9518. builder.addCapability(spv::Capability::MeshShadingEXT);
  9519. builder.addExtension(spv::E_SPV_EXT_mesh_shader);
  9520. } else {
  9521. builder.addCapability(spv::Capability::MeshShadingNV);
  9522. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  9523. }
  9524. }
  9525. builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerPrimitiveNV);
  9526. }
  9527. if (qualifier.perViewNV)
  9528. builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerViewNV);
  9529. if (qualifier.perTaskNV)
  9530. builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerTaskNV);
  9531. } else {
  9532. if (qualifier.perPrimitiveNV) {
  9533. // Need to add capability/extension for fragment shader.
  9534. // Mesh shader already adds this by default.
  9535. if (glslangIntermediate->getStage() == EShLangFragment) {
  9536. if(isMeshShaderExt) {
  9537. builder.addCapability(spv::Capability::MeshShadingEXT);
  9538. builder.addExtension(spv::E_SPV_EXT_mesh_shader);
  9539. } else {
  9540. builder.addCapability(spv::Capability::MeshShadingNV);
  9541. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  9542. }
  9543. }
  9544. builder.addDecoration(id, spv::Decoration::PerPrimitiveNV);
  9545. }
  9546. if (qualifier.perViewNV)
  9547. builder.addDecoration(id, spv::Decoration::PerViewNV);
  9548. if (qualifier.perTaskNV)
  9549. builder.addDecoration(id, spv::Decoration::PerTaskNV);
  9550. }
  9551. }
  9552. bool TGlslangToSpvTraverser::hasQCOMImageProceessingDecoration(spv::Id id, spv::Decoration decor)
  9553. {
  9554. std::vector<spv::Decoration> &decoVec = idToQCOMDecorations[id];
  9555. for ( auto d : decoVec ) {
  9556. if ( d == decor )
  9557. return true;
  9558. }
  9559. return false;
  9560. }
  9561. void TGlslangToSpvTraverser::addImageProcessingQCOMDecoration(spv::Id id, spv::Decoration decor)
  9562. {
  9563. spv::Op opc = builder.getOpCode(id);
  9564. if (opc == spv::Op::OpSampledImage) {
  9565. id = builder.getIdOperand(id, 0);
  9566. opc = builder.getOpCode(id);
  9567. }
  9568. if (opc == spv::Op::OpLoad) {
  9569. spv::Id texid = builder.getIdOperand(id, 0);
  9570. if (!hasQCOMImageProceessingDecoration(texid, decor)) {//
  9571. builder.addDecoration(texid, decor);
  9572. idToQCOMDecorations[texid].push_back(decor);
  9573. }
  9574. }
  9575. }
  9576. void TGlslangToSpvTraverser::addImageProcessing2QCOMDecoration(spv::Id id, bool isForGather)
  9577. {
  9578. if (isForGather) {
  9579. return addImageProcessingQCOMDecoration(id, spv::Decoration::BlockMatchTextureQCOM);
  9580. }
  9581. auto addDecor =
  9582. [this](spv::Id id, spv::Decoration decor) {
  9583. spv::Op tsopc = this->builder.getOpCode(id);
  9584. if (tsopc == spv::Op::OpLoad) {
  9585. spv::Id tsid = this->builder.getIdOperand(id, 0);
  9586. if (this->glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  9587. assert(iOSet.count(tsid) > 0);
  9588. }
  9589. if (!hasQCOMImageProceessingDecoration(tsid, decor)) {
  9590. this->builder.addDecoration(tsid, decor);
  9591. idToQCOMDecorations[tsid].push_back(decor);
  9592. }
  9593. }
  9594. };
  9595. spv::Op opc = builder.getOpCode(id);
  9596. bool isInterfaceObject = (opc != spv::Op::OpSampledImage);
  9597. if (!isInterfaceObject) {
  9598. addDecor(builder.getIdOperand(id, 0), spv::Decoration::BlockMatchTextureQCOM);
  9599. addDecor(builder.getIdOperand(id, 1), spv::Decoration::BlockMatchSamplerQCOM);
  9600. } else {
  9601. addDecor(id, spv::Decoration::BlockMatchTextureQCOM);
  9602. addDecor(id, spv::Decoration::BlockMatchSamplerQCOM);
  9603. }
  9604. }
  9605. // Make a full tree of instructions to build a SPIR-V specialization constant,
  9606. // or regular constant if possible.
  9607. //
  9608. // TBD: this is not yet done, nor verified to be the best design, it does do the leaf symbols though
  9609. //
  9610. // Recursively walk the nodes. The nodes form a tree whose leaves are
  9611. // regular constants, which themselves are trees that createSpvConstant()
  9612. // recursively walks. So, this function walks the "top" of the tree:
  9613. // - emit specialization constant-building instructions for specConstant
  9614. // - when running into a non-spec-constant, switch to createSpvConstant()
  9615. spv::Id TGlslangToSpvTraverser::createSpvConstant(const glslang::TIntermTyped& node)
  9616. {
  9617. assert(node.getQualifier().isConstant());
  9618. // Handle front-end constants first (non-specialization constants).
  9619. if (! node.getQualifier().specConstant) {
  9620. // hand off to the non-spec-constant path
  9621. assert(node.getAsConstantUnion() != nullptr || node.getAsSymbolNode() != nullptr);
  9622. int nextConst = 0;
  9623. return createSpvConstantFromConstUnionArray(node.getType(), node.getAsConstantUnion() ?
  9624. node.getAsConstantUnion()->getConstArray() : node.getAsSymbolNode()->getConstArray(),
  9625. nextConst, false);
  9626. }
  9627. // We now know we have a specialization constant to build
  9628. // Extra capabilities may be needed.
  9629. if (node.getType().contains8BitInt())
  9630. builder.addCapability(spv::Capability::Int8);
  9631. if (node.getType().contains16BitFloat())
  9632. builder.addCapability(spv::Capability::Float16);
  9633. if (node.getType().contains16BitInt())
  9634. builder.addCapability(spv::Capability::Int16);
  9635. if (node.getType().contains64BitInt())
  9636. builder.addCapability(spv::Capability::Int64);
  9637. if (node.getType().containsDouble())
  9638. builder.addCapability(spv::Capability::Float64);
  9639. // gl_WorkGroupSize is a special case until the front-end handles hierarchical specialization constants,
  9640. // even then, it's specialization ids are handled by special case syntax in GLSL: layout(local_size_x = ...
  9641. if (node.getType().getQualifier().builtIn == glslang::EbvWorkGroupSize) {
  9642. std::vector<spv::Id> dimConstId;
  9643. for (int dim = 0; dim < 3; ++dim) {
  9644. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  9645. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  9646. if (specConst) {
  9647. builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
  9648. glslangIntermediate->getLocalSizeSpecId(dim));
  9649. }
  9650. }
  9651. return builder.makeCompositeConstant(builder.makeVectorType(builder.makeUintType(32), 3), dimConstId, true);
  9652. }
  9653. // An AST node labelled as specialization constant should be a symbol node.
  9654. // Its initializer should either be a sub tree with constant nodes, or a constant union array.
  9655. if (auto* sn = node.getAsSymbolNode()) {
  9656. spv::Id result;
  9657. if (auto* sub_tree = sn->getConstSubtree()) {
  9658. // Traverse the constant constructor sub tree like generating normal run-time instructions.
  9659. // During the AST traversal, if the node is marked as 'specConstant', SpecConstantOpModeGuard
  9660. // will set the builder into spec constant op instruction generating mode.
  9661. sub_tree->traverse(this);
  9662. result = accessChainLoad(sub_tree->getType());
  9663. } else if (auto* const_union_array = &sn->getConstArray()) {
  9664. int nextConst = 0;
  9665. result = createSpvConstantFromConstUnionArray(sn->getType(), *const_union_array, nextConst, true);
  9666. } else {
  9667. logger->missingFunctionality("Invalid initializer for spec onstant.");
  9668. return spv::NoResult;
  9669. }
  9670. builder.addName(result, sn->getName().c_str());
  9671. return result;
  9672. }
  9673. // Neither a front-end constant node, nor a specialization constant node with constant union array or
  9674. // constant sub tree as initializer.
  9675. logger->missingFunctionality("Neither a front-end constant nor a spec constant.");
  9676. return spv::NoResult;
  9677. }
  9678. // Use 'consts' as the flattened glslang source of scalar constants to recursively
  9679. // build the aggregate SPIR-V constant.
  9680. //
  9681. // If there are not enough elements present in 'consts', 0 will be substituted;
  9682. // an empty 'consts' can be used to create a fully zeroed SPIR-V constant.
  9683. //
  9684. spv::Id TGlslangToSpvTraverser::createSpvConstantFromConstUnionArray(const glslang::TType& glslangType,
  9685. const glslang::TConstUnionArray& consts, int& nextConst, bool specConstant)
  9686. {
  9687. // vector of constants for SPIR-V
  9688. std::vector<spv::Id> spvConsts;
  9689. // Type is used for struct and array constants
  9690. spv::Id typeId = convertGlslangToSpvType(glslangType);
  9691. if (glslangType.isArray()) {
  9692. glslang::TType elementType(glslangType, 0);
  9693. for (int i = 0; i < glslangType.getOuterArraySize(); ++i)
  9694. spvConsts.push_back(createSpvConstantFromConstUnionArray(elementType, consts, nextConst, false));
  9695. } else if (glslangType.isMatrix()) {
  9696. glslang::TType vectorType(glslangType, 0);
  9697. for (int col = 0; col < glslangType.getMatrixCols(); ++col)
  9698. spvConsts.push_back(createSpvConstantFromConstUnionArray(vectorType, consts, nextConst, false));
  9699. } else if (glslangType.isCoopMat()) {
  9700. glslang::TType componentType(glslangType.getBasicType());
  9701. spvConsts.push_back(createSpvConstantFromConstUnionArray(componentType, consts, nextConst, false));
  9702. } else if (glslangType.isStruct()) {
  9703. glslang::TVector<glslang::TTypeLoc>::const_iterator iter;
  9704. for (iter = glslangType.getStruct()->begin(); iter != glslangType.getStruct()->end(); ++iter)
  9705. spvConsts.push_back(createSpvConstantFromConstUnionArray(*iter->type, consts, nextConst, false));
  9706. } else if (glslangType.getVectorSize() > 1 || glslangType.isCoopVecNV()) {
  9707. unsigned int numComponents = glslangType.isCoopVecNV() ? glslangType.getTypeParameters()->arraySizes->getDimSize(0) : glslangType.getVectorSize();
  9708. for (unsigned int i = 0; i < numComponents; ++i) {
  9709. bool zero = nextConst >= consts.size();
  9710. switch (glslangType.getBasicType()) {
  9711. case glslang::EbtInt:
  9712. spvConsts.push_back(builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst()));
  9713. break;
  9714. case glslang::EbtUint:
  9715. spvConsts.push_back(builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst()));
  9716. break;
  9717. case glslang::EbtFloat:
  9718. spvConsts.push_back(builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  9719. break;
  9720. case glslang::EbtBool:
  9721. spvConsts.push_back(builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst()));
  9722. break;
  9723. case glslang::EbtInt8:
  9724. builder.addCapability(spv::Capability::Int8);
  9725. spvConsts.push_back(builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const()));
  9726. break;
  9727. case glslang::EbtUint8:
  9728. builder.addCapability(spv::Capability::Int8);
  9729. spvConsts.push_back(builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const()));
  9730. break;
  9731. case glslang::EbtInt16:
  9732. builder.addCapability(spv::Capability::Int16);
  9733. spvConsts.push_back(builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const()));
  9734. break;
  9735. case glslang::EbtUint16:
  9736. builder.addCapability(spv::Capability::Int16);
  9737. spvConsts.push_back(builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const()));
  9738. break;
  9739. case glslang::EbtInt64:
  9740. spvConsts.push_back(builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const()));
  9741. break;
  9742. case glslang::EbtUint64:
  9743. spvConsts.push_back(builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const()));
  9744. break;
  9745. case glslang::EbtDouble:
  9746. spvConsts.push_back(builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst()));
  9747. break;
  9748. case glslang::EbtFloat16:
  9749. builder.addCapability(spv::Capability::Float16);
  9750. spvConsts.push_back(builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  9751. break;
  9752. case glslang::EbtBFloat16:
  9753. spvConsts.push_back(builder.makeBFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  9754. break;
  9755. case glslang::EbtFloatE5M2:
  9756. spvConsts.push_back(builder.makeFloatE5M2Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  9757. break;
  9758. case glslang::EbtFloatE4M3:
  9759. spvConsts.push_back(builder.makeFloatE4M3Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  9760. break;
  9761. default:
  9762. assert(0);
  9763. break;
  9764. }
  9765. ++nextConst;
  9766. }
  9767. } else {
  9768. // we have a non-aggregate (scalar) constant
  9769. bool zero = nextConst >= consts.size();
  9770. spv::Id scalar = 0;
  9771. switch (glslangType.getBasicType()) {
  9772. case glslang::EbtInt:
  9773. scalar = builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst(), specConstant);
  9774. break;
  9775. case glslang::EbtUint:
  9776. scalar = builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst(), specConstant);
  9777. break;
  9778. case glslang::EbtFloat:
  9779. scalar = builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  9780. break;
  9781. case glslang::EbtBool:
  9782. scalar = builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst(), specConstant);
  9783. break;
  9784. case glslang::EbtInt8:
  9785. builder.addCapability(spv::Capability::Int8);
  9786. scalar = builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const(), specConstant);
  9787. break;
  9788. case glslang::EbtUint8:
  9789. builder.addCapability(spv::Capability::Int8);
  9790. scalar = builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const(), specConstant);
  9791. break;
  9792. case glslang::EbtInt16:
  9793. builder.addCapability(spv::Capability::Int16);
  9794. scalar = builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const(), specConstant);
  9795. break;
  9796. case glslang::EbtUint16:
  9797. builder.addCapability(spv::Capability::Int16);
  9798. scalar = builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const(), specConstant);
  9799. break;
  9800. case glslang::EbtInt64:
  9801. scalar = builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const(), specConstant);
  9802. break;
  9803. case glslang::EbtUint64:
  9804. scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);
  9805. break;
  9806. case glslang::EbtDouble:
  9807. scalar = builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst(), specConstant);
  9808. break;
  9809. case glslang::EbtFloat16:
  9810. builder.addCapability(spv::Capability::Float16);
  9811. scalar = builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  9812. break;
  9813. case glslang::EbtBFloat16:
  9814. scalar = builder.makeBFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  9815. break;
  9816. case glslang::EbtFloatE5M2:
  9817. scalar = builder.makeFloatE5M2Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  9818. break;
  9819. case glslang::EbtFloatE4M3:
  9820. scalar = builder.makeFloatE4M3Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  9821. break;
  9822. case glslang::EbtReference:
  9823. scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);
  9824. scalar = builder.createUnaryOp(spv::Op::OpBitcast, typeId, scalar);
  9825. break;
  9826. case glslang::EbtString:
  9827. scalar = builder.getStringId(consts[nextConst].getSConst()->c_str());
  9828. break;
  9829. default:
  9830. assert(0);
  9831. break;
  9832. }
  9833. ++nextConst;
  9834. return scalar;
  9835. }
  9836. return builder.makeCompositeConstant(typeId, spvConsts);
  9837. }
  9838. // Return true if the node is a constant or symbol whose reading has no
  9839. // non-trivial observable cost or effect.
  9840. bool TGlslangToSpvTraverser::isTrivialLeaf(const glslang::TIntermTyped* node)
  9841. {
  9842. // don't know what this is
  9843. if (node == nullptr)
  9844. return false;
  9845. // a constant is safe
  9846. if (node->getAsConstantUnion() != nullptr)
  9847. return true;
  9848. // not a symbol means non-trivial
  9849. if (node->getAsSymbolNode() == nullptr)
  9850. return false;
  9851. // a symbol, depends on what's being read
  9852. switch (node->getType().getQualifier().storage) {
  9853. case glslang::EvqTemporary:
  9854. case glslang::EvqGlobal:
  9855. case glslang::EvqIn:
  9856. case glslang::EvqInOut:
  9857. case glslang::EvqConst:
  9858. case glslang::EvqConstReadOnly:
  9859. case glslang::EvqUniform:
  9860. return true;
  9861. default:
  9862. return false;
  9863. }
  9864. }
  9865. // A node is trivial if it is a single operation with no side effects.
  9866. // HLSL (and/or vectors) are always trivial, as it does not short circuit.
  9867. // Otherwise, error on the side of saying non-trivial.
  9868. // Return true if trivial.
  9869. bool TGlslangToSpvTraverser::isTrivial(const glslang::TIntermTyped* node)
  9870. {
  9871. if (node == nullptr)
  9872. return false;
  9873. // count non scalars as trivial, as well as anything coming from HLSL
  9874. if (! node->getType().isScalarOrVec1() || glslangIntermediate->getSource() == glslang::EShSourceHlsl)
  9875. return true;
  9876. // symbols and constants are trivial
  9877. if (isTrivialLeaf(node))
  9878. return true;
  9879. // otherwise, it needs to be a simple operation or one or two leaf nodes
  9880. // not a simple operation
  9881. const glslang::TIntermBinary* binaryNode = node->getAsBinaryNode();
  9882. const glslang::TIntermUnary* unaryNode = node->getAsUnaryNode();
  9883. if (binaryNode == nullptr && unaryNode == nullptr)
  9884. return false;
  9885. // not on leaf nodes
  9886. if (binaryNode && (! isTrivialLeaf(binaryNode->getLeft()) || ! isTrivialLeaf(binaryNode->getRight())))
  9887. return false;
  9888. if (unaryNode && ! isTrivialLeaf(unaryNode->getOperand())) {
  9889. return false;
  9890. }
  9891. if (IsOpNumericConv(node->getAsOperator()->getOp()) &&
  9892. node->getType().getBasicType() == glslang::EbtBool) {
  9893. return true;
  9894. }
  9895. switch (node->getAsOperator()->getOp()) {
  9896. case glslang::EOpLogicalNot:
  9897. case glslang::EOpEqual:
  9898. case glslang::EOpNotEqual:
  9899. case glslang::EOpLessThan:
  9900. case glslang::EOpGreaterThan:
  9901. case glslang::EOpLessThanEqual:
  9902. case glslang::EOpGreaterThanEqual:
  9903. case glslang::EOpIndexDirect:
  9904. case glslang::EOpIndexDirectStruct:
  9905. case glslang::EOpLogicalXor:
  9906. case glslang::EOpAny:
  9907. case glslang::EOpAll:
  9908. return true;
  9909. default:
  9910. return false;
  9911. }
  9912. }
  9913. // Emit short-circuiting code, where 'right' is never evaluated unless
  9914. // the left side is true (for &&) or false (for ||).
  9915. spv::Id TGlslangToSpvTraverser::createShortCircuit(glslang::TOperator op, glslang::TIntermTyped& left,
  9916. glslang::TIntermTyped& right)
  9917. {
  9918. spv::Id boolTypeId = builder.makeBoolType();
  9919. // emit left operand
  9920. builder.clearAccessChain();
  9921. left.traverse(this);
  9922. spv::Id leftId = accessChainLoad(left.getType());
  9923. // Operands to accumulate OpPhi operands
  9924. std::vector<spv::Id> phiOperands;
  9925. phiOperands.reserve(4);
  9926. // accumulate left operand's phi information
  9927. phiOperands.push_back(leftId);
  9928. phiOperands.push_back(builder.getBuildPoint()->getId());
  9929. // Make the two kinds of operation symmetric with a "!"
  9930. // || => emit "if (! left) result = right"
  9931. // && => emit "if ( left) result = right"
  9932. //
  9933. // TODO: this runtime "not" for || could be avoided by adding functionality
  9934. // to 'builder' to have an "else" without an "then"
  9935. if (op == glslang::EOpLogicalOr)
  9936. leftId = builder.createUnaryOp(spv::Op::OpLogicalNot, boolTypeId, leftId);
  9937. // make an "if" based on the left value
  9938. spv::Builder::If ifBuilder(leftId, spv::SelectionControlMask::MaskNone, builder);
  9939. // emit right operand as the "then" part of the "if"
  9940. builder.clearAccessChain();
  9941. right.traverse(this);
  9942. spv::Id rightId = accessChainLoad(right.getType());
  9943. // accumulate left operand's phi information
  9944. phiOperands.push_back(rightId);
  9945. phiOperands.push_back(builder.getBuildPoint()->getId());
  9946. // finish the "if"
  9947. ifBuilder.makeEndIf();
  9948. // phi together the two results
  9949. return builder.createOp(spv::Op::OpPhi, boolTypeId, phiOperands);
  9950. }
  9951. // Return type Id of the imported set of extended instructions corresponds to the name.
  9952. // Import this set if it has not been imported yet.
  9953. spv::Id TGlslangToSpvTraverser::getExtBuiltins(const char* name)
  9954. {
  9955. if (extBuiltinMap.find(name) != extBuiltinMap.end())
  9956. return extBuiltinMap[name];
  9957. else {
  9958. spv::Id extBuiltins = builder.import(name);
  9959. extBuiltinMap[name] = extBuiltins;
  9960. return extBuiltins;
  9961. }
  9962. }
  9963. } // end anonymous namespace
  9964. namespace glslang {
  9965. void GetSpirvVersion(std::string& version)
  9966. {
  9967. const int bufSize = 100;
  9968. char buf[bufSize];
  9969. snprintf(buf, bufSize, "0x%08x, Revision %d", spv::Version, spv::Revision);
  9970. version = buf;
  9971. }
  9972. // For low-order part of the generator's magic number. Bump up
  9973. // when there is a change in the style (e.g., if SSA form changes,
  9974. // or a different instruction sequence to do something gets used).
  9975. int GetSpirvGeneratorVersion()
  9976. {
  9977. // return 1; // start
  9978. // return 2; // EOpAtomicCounterDecrement gets a post decrement, to map between GLSL -> SPIR-V
  9979. // return 3; // change/correct barrier-instruction operands, to match memory model group decisions
  9980. // return 4; // some deeper access chains: for dynamic vector component, and local Boolean component
  9981. // return 5; // make OpArrayLength result type be an int with signedness of 0
  9982. // return 6; // revert version 5 change, which makes a different (new) kind of incorrect code,
  9983. // versions 4 and 6 each generate OpArrayLength as it has long been done
  9984. // return 7; // GLSL volatile keyword maps to both SPIR-V decorations Volatile and Coherent
  9985. // return 8; // switch to new dead block eliminator; use OpUnreachable
  9986. // return 9; // don't include opaque function parameters in OpEntryPoint global's operand list
  9987. // return 10; // Generate OpFUnordNotEqual for != comparisons
  9988. return 11; // Make OpEmitMeshTasksEXT a terminal instruction
  9989. }
  9990. // Write SPIR-V out to a binary file
  9991. bool OutputSpvBin(const std::vector<unsigned int>& spirv, const char* baseName)
  9992. {
  9993. std::ofstream out;
  9994. out.open(baseName, std::ios::binary | std::ios::out);
  9995. if (out.fail()) {
  9996. printf("ERROR: Failed to open file: %s\n", baseName);
  9997. return false;
  9998. }
  9999. for (int i = 0; i < (int)spirv.size(); ++i) {
  10000. unsigned int word = spirv[i];
  10001. out.write((const char*)&word, 4);
  10002. }
  10003. out.close();
  10004. return true;
  10005. }
  10006. // Write SPIR-V out to a text file with 32-bit hexadecimal words
  10007. bool OutputSpvHex(const std::vector<unsigned int>& spirv, const char* baseName, const char* varName)
  10008. {
  10009. std::ofstream out;
  10010. out.open(baseName, std::ios::binary | std::ios::out);
  10011. if (out.fail()) {
  10012. printf("ERROR: Failed to open file: %s\n", baseName);
  10013. return false;
  10014. }
  10015. out << "\t// " <<
  10016. GetSpirvGeneratorVersion() <<
  10017. GLSLANG_VERSION_MAJOR << "." << GLSLANG_VERSION_MINOR << "." << GLSLANG_VERSION_PATCH <<
  10018. GLSLANG_VERSION_FLAVOR << std::endl;
  10019. if (varName != nullptr) {
  10020. out << "\t #pragma once" << std::endl;
  10021. out << "const uint32_t " << varName << "[] = {" << std::endl;
  10022. }
  10023. const int WORDS_PER_LINE = 8;
  10024. for (int i = 0; i < (int)spirv.size(); i += WORDS_PER_LINE) {
  10025. out << "\t";
  10026. for (int j = 0; j < WORDS_PER_LINE && i + j < (int)spirv.size(); ++j) {
  10027. const unsigned int word = spirv[i + j];
  10028. out << "0x" << std::hex << std::setw(8) << std::setfill('0') << word;
  10029. if (i + j + 1 < (int)spirv.size()) {
  10030. out << ",";
  10031. }
  10032. }
  10033. out << std::endl;
  10034. }
  10035. if (varName != nullptr) {
  10036. out << "};";
  10037. out << std::endl;
  10038. }
  10039. out.close();
  10040. return true;
  10041. }
  10042. //
  10043. // Set up the glslang traversal
  10044. //
  10045. void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv, SpvOptions* options)
  10046. {
  10047. spv::SpvBuildLogger logger;
  10048. GlslangToSpv(intermediate, spirv, &logger, options);
  10049. }
  10050. void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv,
  10051. spv::SpvBuildLogger* logger, SpvOptions* options)
  10052. {
  10053. TIntermNode* root = intermediate.getTreeRoot();
  10054. if (root == nullptr)
  10055. return;
  10056. SpvOptions defaultOptions;
  10057. if (options == nullptr)
  10058. options = &defaultOptions;
  10059. GetThreadPoolAllocator().push();
  10060. TGlslangToSpvTraverser it(intermediate.getSpv().spv, &intermediate, logger, *options);
  10061. root->traverse(&it);
  10062. it.finishSpv(options->compileOnly);
  10063. it.dumpSpv(spirv);
  10064. #if ENABLE_OPT
  10065. // If from HLSL, run spirv-opt to "legalize" the SPIR-V for Vulkan
  10066. // eg. forward and remove memory writes of opaque types.
  10067. bool prelegalization = intermediate.getSource() == EShSourceHlsl;
  10068. if ((prelegalization || options->optimizeSize) && !options->disableOptimizer) {
  10069. SpirvToolsTransform(intermediate, spirv, logger, options);
  10070. prelegalization = false;
  10071. }
  10072. else if (options->stripDebugInfo) {
  10073. // Strip debug info even if optimization is disabled.
  10074. SpirvToolsStripDebugInfo(intermediate, spirv, logger);
  10075. }
  10076. if (options->validate)
  10077. SpirvToolsValidate(intermediate, spirv, logger, prelegalization);
  10078. if (options->disassemble)
  10079. SpirvToolsDisassemble(std::cout, spirv);
  10080. #endif
  10081. GetThreadPoolAllocator().pop();
  10082. }
  10083. } // end namespace glslang