GlslangToSpv.cpp 535 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477
74778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527
75278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314531553165317531853195320532153225323532453255326532753285329533053315332533353345335533653375338533953405341534253435344534553465347534853495350535153525353535453555356535753585359536053615362536353645365536653675368536953705371537253735374537553765377537853795380538153825383538453855386538753885389539053915392539353945395539653975398539954005401540254035404540554065407540854095410541154125413541454155416541754185419542054215422542354245425542654275428542954305431543254335434543554365437543854395440544154425443544454455446544754485449545054515452545354545455545654575458545954605461546254635464546554665467546854695470547154725473547454755476547754785479548054815482548354845485548654875488548954905491549254935494549554965497549854995500550155025503550455055506550755085509551055115512551355145515551655175518551955205521552255235524552555265527552855295530553155325533553455355536553755385539554055415542554355445545554655475548554955505551555255535554555555565557555855595560556155625563556455655566556755685569557055715572557355745575557655775578557955805581558255835584558555865587558855895590559155925593559455955596559755985599560056015602560356045605560656075608560956105611561256135614561556165617561856195620562156225623562456255626562756285629563056315632563356345635563656375638563956405641564256435644564556465647564856495650565156525653565456555656565756585659566056615662566356645665566656675668566956705671567256735674567556765677567856795680568156825683568456855686568756885689569056915692569356945695569656975698569957005701570257035704570557065707570857095710571157125713571457155716571757185719572057215722572357245725572657275728572957305731573257335734573557365737573857395740574157425743574457455746574757485749575057515752575357545755575657575758575957605761576257635764576557665767576857695770577157725773577457755776577
75778577957805781578257835784578557865787578857895790579157925793579457955796579757985799580058015802580358045805580658075808580958105811581258135814581558165817581858195820582158225823582458255826582758285829583058315832583358345835583658375838583958405841584258435844584558465847584858495850585158525853585458555856585758585859586058615862586358645865586658675868586958705871587258735874587558765877587858795880588158825883588458855886588758885889589058915892589358945895589658975898589959005901590259035904590559065907590859095910591159125913591459155916591759185919592059215922592359245925592659275928592959305931593259335934593559365937593859395940594159425943594459455946594759485949595059515952595359545955595659575958595959605961596259635964596559665967596859695970597159725973597459755976597759785979598059815982598359845985598659875988598959905991599259935994599559965997599859996000600160026003600460056006600760086009601060116012601360146015601660176018601960206021602260236024602560266027602860296030603160326033603460356036603760386039604060416042604360446045604660476048604960506051605260536054605560566057605860596060606160626063606460656066606760686069607060716072607360746075607660776078607960806081608260836084608560866087608860896090609160926093609460956096609760986099610061016102610361046105610661076108610961106111611261136114611561166117611861196120612161226123612461256126612761286129613061316132613361346135613661376138613961406141614261436144614561466147614861496150615161526153615461556156615761586159616061616162616361646165616661676168616961706171617261736174617561766177617861796180618161826183618461856186618761886189619061916192619361946195619661976198619962006201620262036204620562066207620862096210621162126213621462156216621762186219622062216222622362246225622662276228622962306231623262336234623562366237623862396240624162426243624462456246624762486249625062516252625362546255625662576258625962606261626262636264626562666267626862696270627162726273627462756276627
76278627962806281628262836284628562866287628862896290629162926293629462956296629762986299630063016302630363046305630663076308630963106311631263136314631563166317631863196320632163226323632463256326632763286329633063316332633363346335633663376338633963406341634263436344634563466347634863496350635163526353635463556356635763586359636063616362636363646365636663676368636963706371637263736374637563766377637863796380638163826383638463856386638763886389639063916392639363946395639663976398639964006401640264036404640564066407640864096410641164126413641464156416641764186419642064216422642364246425642664276428642964306431643264336434643564366437643864396440644164426443644464456446644764486449645064516452645364546455645664576458645964606461646264636464646564666467646864696470647164726473647464756476647764786479648064816482648364846485648664876488648964906491649264936494649564966497649864996500650165026503650465056506650765086509651065116512651365146515651665176518651965206521652265236524652565266527652865296530653165326533653465356536653765386539654065416542654365446545654665476548654965506551655265536554655565566557655865596560656165626563656465656566656765686569657065716572657365746575657665776578657965806581658265836584658565866587658865896590659165926593659465956596659765986599660066016602660366046605660666076608660966106611661266136614661566166617661866196620662166226623662466256626662766286629663066316632663366346635663666376638663966406641664266436644664566466647664866496650665166526653665466556656665766586659666066616662666366646665666666676668666966706671667266736674667566766677667866796680668166826683668466856686668766886689669066916692669366946695669666976698669967006701670267036704670567066707670867096710671167126713671467156716671767186719672067216722672367246725672667276728672967306731673267336734673567366737673867396740674167426743674467456746674767486749675067516752675367546755675667576758675967606761676267636764676567666767676867696770677167726773677467756776677
76778677967806781678267836784678567866787678867896790679167926793679467956796679767986799680068016802680368046805680668076808680968106811681268136814681568166817681868196820682168226823682468256826682768286829683068316832683368346835683668376838683968406841684268436844684568466847684868496850685168526853685468556856685768586859686068616862686368646865686668676868686968706871687268736874687568766877687868796880688168826883688468856886688768886889689068916892689368946895689668976898689969006901690269036904690569066907690869096910691169126913691469156916691769186919692069216922692369246925692669276928692969306931693269336934693569366937693869396940694169426943694469456946694769486949695069516952695369546955695669576958695969606961696269636964696569666967696869696970697169726973697469756976697769786979698069816982698369846985698669876988698969906991699269936994699569966997699869997000700170027003700470057006700770087009701070117012701370147015701670177018701970207021702270237024702570267027702870297030703170327033703470357036703770387039704070417042704370447045704670477048704970507051705270537054705570567057705870597060706170627063706470657066706770687069707070717072707370747075707670777078707970807081708270837084708570867087708870897090709170927093709470957096709770987099710071017102710371047105710671077108710971107111711271137114711571167117711871197120712171227123712471257126712771287129713071317132713371347135713671377138713971407141714271437144714571467147714871497150715171527153715471557156715771587159716071617162716371647165716671677168716971707171717271737174717571767177717871797180718171827183718471857186718771887189719071917192719371947195719671977198719972007201720272037204720572067207720872097210721172127213721472157216721772187219722072217222722372247225722672277228722972307231723272337234723572367237723872397240724172427243724472457246724772487249725072517252725372547255725672577258725972607261726272637264726572667267726872697270727172727273727472757276727
77278727972807281728272837284728572867287728872897290729172927293729472957296729772987299730073017302730373047305730673077308730973107311731273137314731573167317731873197320732173227323732473257326732773287329733073317332733373347335733673377338733973407341734273437344734573467347734873497350735173527353735473557356735773587359736073617362736373647365736673677368736973707371737273737374737573767377737873797380738173827383738473857386738773887389739073917392739373947395739673977398739974007401740274037404740574067407740874097410741174127413741474157416741774187419742074217422742374247425742674277428742974307431743274337434743574367437743874397440744174427443744474457446744774487449745074517452745374547455745674577458745974607461746274637464746574667467746874697470747174727473747474757476747774787479748074817482748374847485748674877488748974907491749274937494749574967497749874997500750175027503750475057506750775087509751075117512751375147515751675177518751975207521752275237524752575267527752875297530753175327533753475357536753775387539754075417542754375447545754675477548754975507551755275537554755575567557755875597560756175627563756475657566756775687569757075717572757375747575757675777578757975807581758275837584758575867587758875897590759175927593759475957596759775987599760076017602760376047605760676077608760976107611761276137614761576167617761876197620762176227623762476257626762776287629763076317632763376347635763676377638763976407641764276437644764576467647764876497650765176527653765476557656765776587659766076617662766376647665766676677668766976707671767276737674767576767677767876797680768176827683768476857686768776887689769076917692769376947695769676977698769977007701770277037704770577067707770877097710771177127713771477157716771777187719772077217722772377247725772677277728772977307731773277337734773577367737773877397740774177427743774477457746774777487749775077517752775377547755775677577758775977607761776277637764776577667767776877697770777177727773777477757776777
77778777977807781778277837784778577867787778877897790779177927793779477957796779777987799780078017802780378047805780678077808780978107811781278137814781578167817781878197820782178227823782478257826782778287829783078317832783378347835783678377838783978407841784278437844784578467847784878497850785178527853785478557856785778587859786078617862786378647865786678677868786978707871787278737874787578767877787878797880788178827883788478857886788778887889789078917892789378947895789678977898789979007901790279037904790579067907790879097910791179127913791479157916791779187919792079217922792379247925792679277928792979307931793279337934793579367937793879397940794179427943794479457946794779487949795079517952795379547955795679577958795979607961796279637964796579667967796879697970797179727973797479757976797779787979798079817982798379847985798679877988798979907991799279937994799579967997799879998000800180028003800480058006800780088009801080118012801380148015801680178018801980208021802280238024802580268027802880298030803180328033803480358036803780388039804080418042804380448045804680478048804980508051805280538054805580568057805880598060806180628063806480658066806780688069807080718072807380748075807680778078807980808081808280838084808580868087808880898090809180928093809480958096809780988099810081018102810381048105810681078108810981108111811281138114811581168117811881198120812181228123812481258126812781288129813081318132813381348135813681378138813981408141814281438144814581468147814881498150815181528153815481558156815781588159816081618162816381648165816681678168816981708171817281738174817581768177817881798180818181828183818481858186818781888189819081918192819381948195819681978198819982008201820282038204820582068207820882098210821182128213821482158216821782188219822082218222822382248225822682278228822982308231823282338234823582368237823882398240824182428243824482458246824782488249825082518252825382548255825682578258825982608261826282638264826582668267826882698270827182728273827482758276827
78278827982808281828282838284828582868287828882898290829182928293829482958296829782988299830083018302830383048305830683078308830983108311831283138314831583168317831883198320832183228323832483258326832783288329833083318332833383348335833683378338833983408341834283438344834583468347834883498350835183528353835483558356835783588359836083618362836383648365836683678368836983708371837283738374837583768377837883798380838183828383838483858386838783888389839083918392839383948395839683978398839984008401840284038404840584068407840884098410841184128413841484158416841784188419842084218422842384248425842684278428842984308431843284338434843584368437843884398440844184428443844484458446844784488449845084518452845384548455845684578458845984608461846284638464846584668467846884698470847184728473847484758476847784788479848084818482848384848485848684878488848984908491849284938494849584968497849884998500850185028503850485058506850785088509851085118512851385148515851685178518851985208521852285238524852585268527852885298530853185328533853485358536853785388539854085418542854385448545854685478548854985508551855285538554855585568557855885598560856185628563856485658566856785688569857085718572857385748575857685778578857985808581858285838584858585868587858885898590859185928593859485958596859785988599860086018602860386048605860686078608860986108611861286138614861586168617861886198620862186228623862486258626862786288629863086318632863386348635863686378638863986408641864286438644864586468647864886498650865186528653865486558656865786588659866086618662866386648665866686678668866986708671867286738674867586768677867886798680868186828683868486858686868786888689869086918692869386948695869686978698869987008701870287038704870587068707870887098710871187128713871487158716871787188719872087218722872387248725872687278728872987308731873287338734873587368737873887398740874187428743874487458746874787488749875087518752875387548755875687578758875987608761876287638764876587668767876887698770877187728773877487758776877
78778877987808781878287838784878587868787878887898790879187928793879487958796879787988799880088018802880388048805880688078808880988108811881288138814881588168817881888198820882188228823882488258826882788288829883088318832883388348835883688378838883988408841884288438844884588468847884888498850885188528853885488558856885788588859886088618862886388648865886688678868886988708871887288738874887588768877887888798880888188828883888488858886888788888889889088918892889388948895889688978898889989008901890289038904890589068907890889098910891189128913891489158916891789188919892089218922892389248925892689278928892989308931893289338934893589368937893889398940894189428943894489458946894789488949895089518952895389548955895689578958895989608961896289638964896589668967896889698970897189728973897489758976897789788979898089818982898389848985898689878988898989908991899289938994899589968997899889999000900190029003900490059006900790089009901090119012901390149015901690179018901990209021902290239024902590269027902890299030903190329033903490359036903790389039904090419042904390449045904690479048904990509051905290539054905590569057905890599060906190629063906490659066906790689069907090719072907390749075907690779078907990809081908290839084908590869087908890899090909190929093909490959096909790989099910091019102910391049105910691079108910991109111911291139114911591169117911891199120912191229123912491259126912791289129913091319132913391349135913691379138913991409141914291439144914591469147914891499150915191529153915491559156915791589159916091619162916391649165916691679168916991709171917291739174917591769177917891799180918191829183918491859186918791889189919091919192919391949195919691979198919992009201920292039204920592069207920892099210921192129213921492159216921792189219922092219222922392249225922692279228922992309231923292339234923592369237923892399240924192429243924492459246924792489249925092519252925392549255925692579258925992609261926292639264926592669267926892699270927192729273927492759276927
79278927992809281928292839284928592869287928892899290929192929293929492959296929792989299930093019302930393049305930693079308930993109311931293139314931593169317931893199320932193229323932493259326932793289329933093319332933393349335933693379338933993409341934293439344934593469347934893499350935193529353935493559356935793589359936093619362936393649365936693679368936993709371937293739374937593769377937893799380938193829383938493859386938793889389939093919392939393949395939693979398939994009401940294039404940594069407940894099410941194129413941494159416941794189419942094219422942394249425942694279428942994309431943294339434943594369437943894399440944194429443944494459446944794489449945094519452945394549455945694579458945994609461946294639464946594669467946894699470947194729473947494759476947794789479948094819482948394849485948694879488948994909491949294939494949594969497949894999500950195029503950495059506950795089509951095119512951395149515951695179518951995209521952295239524952595269527952895299530953195329533953495359536953795389539954095419542954395449545954695479548954995509551955295539554955595569557955895599560956195629563956495659566956795689569957095719572957395749575957695779578957995809581958295839584958595869587958895899590959195929593959495959596959795989599960096019602960396049605960696079608960996109611961296139614961596169617961896199620962196229623962496259626962796289629963096319632963396349635963696379638963996409641964296439644964596469647964896499650965196529653965496559656965796589659966096619662966396649665966696679668966996709671967296739674967596769677967896799680968196829683968496859686968796889689969096919692969396949695969696979698969997009701970297039704970597069707970897099710971197129713971497159716971797189719972097219722972397249725972697279728972997309731973297339734973597369737973897399740974197429743974497459746974797489749975097519752975397549755975697579758975997609761976297639764976597669767976897699770977197729773977497759776977
79778977997809781978297839784978597869787978897899790979197929793979497959796979797989799980098019802980398049805980698079808980998109811981298139814981598169817981898199820982198229823982498259826982798289829983098319832983398349835983698379838983998409841984298439844984598469847984898499850985198529853985498559856985798589859986098619862986398649865986698679868986998709871987298739874987598769877987898799880988198829883988498859886988798889889989098919892989398949895989698979898989999009901990299039904990599069907990899099910991199129913991499159916991799189919992099219922992399249925992699279928992999309931993299339934993599369937993899399940994199429943994499459946994799489949995099519952995399549955995699579958995999609961996299639964996599669967996899699970997199729973997499759976997799789979998099819982998399849985998699879988998999909991999299939994999599969997999899991000010001100021000310004100051000610007100081000910010100111001210013100141001510016100171001810019100201002110022100231002410025100261002710028100291003010031100321003310034100351003610037100381003910040100411004210043100441004510046100471004810049100501005110052100531005410055100561005710058100591006010061100621006310064100651006610067100681006910070100711007210073100741007510076100771007810079100801008110082100831008410085100861008710088100891009010091100921009310094100951009610097100981009910100101011010210103101041010510106101071010810109101101011110112101131011410115101161011710118101191012010121101221012310124101251012610127101281012910130101311013210133101341013510136101371013810139101401014110142101431014410145101461014710148101491015010151101521015310154101551015610157101581015910160101611016210163101641016510166101671016810169101701017110172101731017410175101761017710178101791018010181101821018310184101851018610187101881018910190101911019210193101941019510196101971019810199102001020110202102031020410205102061020710208102091021010211102121021310214102151021610217102181021910220102211
02221022310224102251022610227102281022910230102311023210233102341023510236102371023810239102401024110242102431024410245102461024710248102491025010251102521025310254102551025610257102581025910260102611026210263102641026510266102671026810269102701027110272102731027410275102761027710278102791028010281102821028310284102851028610287102881028910290102911029210293102941029510296102971029810299103001030110302103031030410305103061030710308103091031010311103121031310314103151031610317103181031910320103211032210323103241032510326103271032810329103301033110332103331033410335103361033710338103391034010341103421034310344103451034610347103481034910350103511035210353103541035510356103571035810359103601036110362103631036410365103661036710368103691037010371103721037310374103751037610377103781037910380103811038210383103841038510386103871038810389103901039110392103931039410395103961039710398103991040010401104021040310404104051040610407104081040910410104111041210413104141041510416104171041810419104201042110422104231042410425104261042710428104291043010431104321043310434104351043610437104381043910440104411044210443104441044510446104471044810449104501045110452104531045410455104561045710458104591046010461104621046310464104651046610467104681046910470104711047210473104741047510476104771047810479104801048110482104831048410485104861048710488104891049010491104921049310494104951049610497104981049910500105011050210503105041050510506105071050810509105101051110512105131051410515105161051710518105191052010521105221052310524105251052610527105281052910530105311053210533105341053510536105371053810539105401054110542105431054410545105461054710548105491055010551105521055310554105551055610557105581055910560105611056210563105641056510566105671056810569105701057110572105731057410575105761057710578105791058010581105821058310584105851058610587105881058910590105911059210593105941059510596105971059810599106001060110602106031060410605106061060710608106091061010611106121061310614106151061610617106181061910620106211
06221062310624106251062610627106281062910630106311063210633106341063510636106371063810639106401064110642106431064410645106461064710648106491065010651106521065310654106551065610657106581065910660106611066210663106641066510666106671066810669106701067110672106731067410675106761067710678106791068010681106821068310684106851068610687106881068910690106911069210693106941069510696106971069810699107001070110702107031070410705107061070710708107091071010711107121071310714107151071610717107181071910720107211072210723107241072510726107271072810729107301073110732107331073410735107361073710738107391074010741107421074310744107451074610747107481074910750107511075210753107541075510756107571075810759107601076110762107631076410765107661076710768107691077010771107721077310774107751077610777107781077910780107811078210783107841078510786107871078810789107901079110792107931079410795107961079710798107991080010801108021080310804108051080610807108081080910810108111081210813108141081510816108171081810819108201082110822108231082410825108261082710828108291083010831108321083310834108351083610837108381083910840108411084210843108441084510846108471084810849108501085110852108531085410855108561085710858108591086010861108621086310864108651086610867108681086910870108711087210873108741087510876108771087810879108801088110882108831088410885108861088710888108891089010891108921089310894108951089610897108981089910900109011090210903109041090510906109071090810909109101091110912109131091410915109161091710918109191092010921109221092310924109251092610927109281092910930109311093210933109341093510936109371093810939109401094110942109431094410945109461094710948109491095010951109521095310954109551095610957109581095910960109611096210963109641096510966109671096810969109701097110972109731097410975109761097710978109791098010981109821098310984109851098610987109881098910990109911099210993109941099510996109971099810999110001100111002110031100411005110061100711008110091101011011110121101311014110151101611017110181101911020110211
10221102311024110251102611027110281102911030110311103211033110341103511036110371103811039110401104111042110431104411045110461104711048110491105011051110521105311054110551105611057110581105911060110611106211063110641106511066110671106811069110701107111072110731107411075110761107711078110791108011081110821108311084110851108611087110881108911090110911109211093110941109511096110971109811099111001110111102111031110411105111061110711108111091111011111111121111311114111151111611117111181111911120111211112211123111241112511126111271112811129111301113111132111331113411135111361113711138111391114011141111421114311144111451114611147111481114911150111511115211153111541115511156111571115811159111601116111162111631116411165111661116711168111691117011171111721117311174111751117611177111781117911180111811118211183111841118511186111871118811189111901119111192111931119411195111961119711198111991120011201112021120311204112051120611207112081120911210112111121211213112141121511216112171121811219112201122111222112231122411225112261122711228112291123011231112321123311234112351123611237112381123911240112411124211243112441124511246112471124811249112501125111252112531125411255112561125711258112591126011261112621126311264112651126611267112681126911270112711127211273112741127511276112771127811279112801128111282112831128411285112861128711288112891129011291112921129311294112951129611297112981129911300113011130211303113041130511306113071130811309113101131111312113131131411315113161131711318113191132011321113221132311324113251132611327113281132911330113311133211333113341133511336113371133811339113401134111342113431134411345113461134711348113491135011351113521135311354113551135611357113581135911360113611136211363113641136511366113671136811369113701137111372113731137411375113761137711378113791138011381113821138311384113851138611387113881138911390113911139211393113941139511396113971139811399114001140111402114031140411405114061140711408114091141011411114121141311414114151141611417114181141911420114211
14221142311424114251142611427114281142911430114311143211433114341143511436114371143811439114401144111442114431144411445114461144711448114491145011451114521145311454114551145611457114581145911460114611146211463114641146511466114671146811469114701147111472114731147411475114761147711478114791148011481114821148311484114851148611487114881148911490114911149211493114941149511496114971149811499115001150111502115031150411505115061150711508115091151011511115121151311514115151151611517115181151911520115211152211523115241152511526115271152811529115301153111532115331153411535115361153711538115391154011541115421154311544115451154611547115481154911550115511155211553115541155511556115571155811559115601156111562115631156411565115661156711568115691157011571115721157311574115751157611577115781157911580115811158211583115841158511586115871158811589115901159111592115931159411595115961159711598115991160011601116021160311604116051160611607116081160911610116111161211613116141161511616116171161811619116201162111622116231162411625116261162711628116291163011631116321163311634116351163611637116381163911640116411164211643116441164511646116471164811649116501165111652116531165411655116561165711658116591166011661116621166311664116651166611667116681166911670116711167211673116741167511676116771167811679116801168111682116831168411685116861168711688116891169011691116921169311694116951169611697116981169911700117011170211703117041170511706117071170811709117101171111712117131171411715117161171711718117191172011721117221172311724117251172611727117281172911730117311173211733117341173511736117371173811739117401174111742117431174411745117461174711748117491175011751117521175311754117551175611757117581175911760117611176211763117641176511766117671176811769117701177111772117731177411775117761177711778117791178011781117821178311784117851178611787117881178911790117911179211793117941179511796117971179811799118001180111802118031180411805118061180711808118091181011811118121181311814118151181611817118181181911820118211
1822118231182411825118261182711828118291183011831118321183311834118351183611837118381183911840118411184211843118441184511846118471184811849118501185111852118531185411855118561185711858118591186011861118621186311864118651186611867118681186911870118711187211873118741187511876118771187811879118801188111882118831188411885118861188711888118891189011891118921189311894118951189611897118981189911900
  1. //
  2. // Copyright (C) 2014-2016 LunarG, Inc.
  3. // Copyright (C) 2015-2020 Google, Inc.
  4. // Copyright (C) 2017, 2022-2025 Arm Limited.
  5. // Modifications Copyright (C) 2020 Advanced Micro Devices, Inc. All rights reserved.
  6. //
  7. // All rights reserved.
  8. //
  9. // Redistribution and use in source and binary forms, with or without
  10. // modification, are permitted provided that the following conditions
  11. // are met:
  12. //
  13. // Redistributions of source code must retain the above copyright
  14. // notice, this list of conditions and the following disclaimer.
  15. //
  16. // Redistributions in binary form must reproduce the above
  17. // copyright notice, this list of conditions and the following
  18. // disclaimer in the documentation and/or other materials provided
  19. // with the distribution.
  20. //
  21. // Neither the name of 3Dlabs Inc. Ltd. nor the names of its
  22. // contributors may be used to endorse or promote products derived
  23. // from this software without specific prior written permission.
  24. //
  25. // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  26. // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  27. // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
  28. // FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
  29. // COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
  30. // INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
  31. // BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  32. // LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  33. // CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  34. // LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
  35. // ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  36. // POSSIBILITY OF SUCH DAMAGE.
  37. //
  38. // Visit the nodes in the glslang intermediate tree representation to
  39. // translate them to SPIR-V.
  40. //
  41. #include "spirv.hpp11"
  42. #include "GlslangToSpv.h"
  43. #include "SpvBuilder.h"
  44. #include "SpvTools.h"
  45. #include "spvUtil.h"
  46. namespace spv {
  47. #include "GLSL.std.450.h"
  48. #include "GLSL.ext.KHR.h"
  49. #include "GLSL.ext.EXT.h"
  50. #include "GLSL.ext.AMD.h"
  51. #include "GLSL.ext.NV.h"
  52. #include "GLSL.ext.ARM.h"
  53. #include "GLSL.ext.QCOM.h"
  54. #include "NonSemanticDebugPrintf.h"
  55. }
  56. // Glslang includes
  57. #include "../glslang/MachineIndependent/localintermediate.h"
  58. #include "../glslang/MachineIndependent/SymbolTable.h"
  59. #include "../glslang/Include/Common.h"
  60. // Build-time generated includes
  61. #include "glslang/build_info.h"
  62. #include <fstream>
  63. #include <iomanip>
  64. #include <list>
  65. #include <map>
  66. #include <optional>
  67. #include <stack>
  68. #include <string>
  69. #include <vector>
  70. namespace {
  71. namespace {
  72. class SpecConstantOpModeGuard {
  73. public:
  74. SpecConstantOpModeGuard(spv::Builder* builder)
  75. : builder_(builder) {
  76. previous_flag_ = builder->isInSpecConstCodeGenMode();
  77. }
  78. ~SpecConstantOpModeGuard() {
  79. previous_flag_ ? builder_->setToSpecConstCodeGenMode()
  80. : builder_->setToNormalCodeGenMode();
  81. }
  82. void turnOnSpecConstantOpMode() {
  83. builder_->setToSpecConstCodeGenMode();
  84. }
  85. private:
  86. spv::Builder* builder_;
  87. bool previous_flag_;
  88. };
  89. struct OpDecorations {
  90. public:
  91. OpDecorations(spv::Decoration precision, spv::Decoration noContraction, spv::Decoration nonUniform) :
  92. precision(precision)
  93. ,
  94. noContraction(noContraction),
  95. nonUniform(nonUniform)
  96. { }
  97. spv::Decoration precision;
  98. void addNoContraction(spv::Builder& builder, spv::Id t) { builder.addDecoration(t, noContraction); }
  99. void addNonUniform(spv::Builder& builder, spv::Id t) { builder.addDecoration(t, nonUniform); }
  100. protected:
  101. spv::Decoration noContraction;
  102. spv::Decoration nonUniform;
  103. };
  104. } // namespace
  105. //
  106. // The main holder of information for translating glslang to SPIR-V.
  107. //
  108. // Derives from the AST walking base class.
  109. //
  110. class TGlslangToSpvTraverser : public glslang::TIntermTraverser {
  111. public:
  112. TGlslangToSpvTraverser(unsigned int spvVersion, const glslang::TIntermediate*, spv::SpvBuildLogger* logger,
  113. glslang::SpvOptions& options);
  114. virtual ~TGlslangToSpvTraverser() { }
  115. bool visitAggregate(glslang::TVisit, glslang::TIntermAggregate*) override;
  116. bool visitBinary(glslang::TVisit, glslang::TIntermBinary*) override;
  117. void visitConstantUnion(glslang::TIntermConstantUnion*) override;
  118. bool visitSelection(glslang::TVisit, glslang::TIntermSelection*) override;
  119. bool visitSwitch(glslang::TVisit, glslang::TIntermSwitch*) override;
  120. void visitSymbol(glslang::TIntermSymbol* symbol) override;
  121. bool visitUnary(glslang::TVisit, glslang::TIntermUnary*) override;
  122. bool visitLoop(glslang::TVisit, glslang::TIntermLoop*) override;
  123. bool visitBranch(glslang::TVisit visit, glslang::TIntermBranch*) override;
  124. bool visitVariableDecl(glslang::TVisit, glslang::TIntermVariableDecl*) override;
  125. void finishSpv(bool compileOnly);
  126. void dumpSpv(std::vector<unsigned int>& out);
  127. protected:
  128. TGlslangToSpvTraverser(TGlslangToSpvTraverser&);
  129. TGlslangToSpvTraverser& operator=(TGlslangToSpvTraverser&);
  130. spv::Decoration TranslateInterpolationDecoration(const glslang::TQualifier& qualifier);
  131. spv::Decoration TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier);
  132. spv::Decoration TranslateNonUniformDecoration(const glslang::TQualifier& qualifier);
  133. spv::Decoration TranslateNonUniformDecoration(const spv::Builder::AccessChain::CoherentFlags& coherentFlags);
  134. spv::Builder::AccessChain::CoherentFlags TranslateCoherent(const glslang::TType& type);
  135. spv::MemoryAccessMask TranslateMemoryAccess(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  136. spv::ImageOperandsMask TranslateImageOperands(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  137. spv::Scope TranslateMemoryScope(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  138. spv::BuiltIn TranslateBuiltInDecoration(glslang::TBuiltInVariable, bool memberDeclaration);
  139. spv::ImageFormat TranslateImageFormat(const glslang::TType& type);
  140. spv::SelectionControlMask TranslateSelectionControl(const glslang::TIntermSelection&) const;
  141. spv::SelectionControlMask TranslateSwitchControl(const glslang::TIntermSwitch&) const;
  142. spv::LoopControlMask TranslateLoopControl(const glslang::TIntermLoop&, std::vector<unsigned int>& operands) const;
  143. spv::StorageClass TranslateStorageClass(const glslang::TType&);
  144. void TranslateLiterals(const glslang::TVector<const glslang::TIntermConstantUnion*>&, std::vector<unsigned>&) const;
  145. void addIndirectionIndexCapabilities(const glslang::TType& baseType, const glslang::TType& indexType);
  146. spv::Id createSpvVariable(const glslang::TIntermSymbol*, spv::Id forcedType);
  147. spv::Id getSampledType(const glslang::TSampler&);
  148. spv::Id getInvertedSwizzleType(const glslang::TIntermTyped&);
  149. spv::Id createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped&, spv::Id parentResult);
  150. void convertSwizzle(const glslang::TIntermAggregate&, std::vector<unsigned>& swizzle);
  151. spv::Id convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly = false);
  152. spv::Id convertGlslangToSpvType(const glslang::TType& type, glslang::TLayoutPacking, const glslang::TQualifier&,
  153. bool lastBufferBlockMember, bool forwardReferenceOnly = false);
  154. void applySpirvDecorate(const glslang::TType& type, spv::Id id, std::optional<int> member);
  155. bool filterMember(const glslang::TType& member);
  156. spv::Id convertGlslangStructToSpvType(const glslang::TType&, const glslang::TTypeList* glslangStruct,
  157. glslang::TLayoutPacking, const glslang::TQualifier&);
  158. spv::LinkageType convertGlslangLinkageToSpv(glslang::TLinkType glslangLinkType);
  159. spv::Id decorateDescHeapType(const glslang::TType& type, spv::Id& memberBaseOffset, spv::Id& alignment,
  160. int& maxPlainDataAlignment);
  161. void decorateStructType(const glslang::TType&, const glslang::TTypeList* glslangStruct, glslang::TLayoutPacking,
  162. const glslang::TQualifier&, spv::Id, const std::vector<spv::Id>& spvMembers);
  163. spv::Id makeArraySizeId(const glslang::TArraySizes&, int dim, bool allowZero = false, bool boolType = false);
  164. spv::Id accessChainLoad(const glslang::TType& type);
  165. void accessChainStore(const glslang::TType& type, spv::Id rvalue);
  166. void multiTypeStore(const glslang::TType&, spv::Id rValue);
  167. spv::Id convertLoadedBoolInUniformToUint(const glslang::TType& type, spv::Id nominalTypeId, spv::Id loadedId);
  168. glslang::TLayoutPacking getExplicitLayout(const glslang::TType& type) const;
  169. int getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  170. int getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  171. void updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType, int& currentOffset,
  172. int& nextOffset, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  173. void declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember);
  174. bool isShaderEntryPoint(const glslang::TIntermAggregate* node);
  175. bool writableParam(glslang::TStorageQualifier) const;
  176. bool originalParam(glslang::TStorageQualifier, const glslang::TType&, bool implicitThisParam);
  177. void makeFunctions(const glslang::TIntermSequence&);
  178. void makeGlobalInitializers(const glslang::TIntermSequence&);
  179. void collectRayTracingLinkerObjects();
  180. void visitFunctions(const glslang::TIntermSequence&);
  181. void translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments,
  182. spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags);
  183. void translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments);
  184. spv::Id createImageTextureFunctionCall(glslang::TIntermOperator* node);
  185. spv::Id handleUserFunctionCall(const glslang::TIntermAggregate*);
  186. spv::Id createBinaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right,
  187. glslang::TBasicType typeProxy, bool reduceComparison = true);
  188. spv::Id createBinaryMatrixOperation(spv::Op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right);
  189. spv::Id createUnaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id operand,
  190. glslang::TBasicType typeProxy,
  191. const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
  192. const glslang::TType &opType);
  193. spv::Id createUnaryMatrixOperation(spv::Op op, OpDecorations&, spv::Id typeId, spv::Id operand,
  194. glslang::TBasicType typeProxy);
  195. spv::Id createConversion(glslang::TOperator op, OpDecorations&, spv::Id destTypeId, spv::Id operand,
  196. glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType);
  197. spv::Id createIntWidthConversion(spv::Id operand, int vectorSize, spv::Id destType,
  198. glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType);
  199. spv::Id makeSmearedConstant(spv::Id constant, int vectorSize);
  200. spv::Id createAtomicOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId,
  201. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy,
  202. const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
  203. const glslang::TType &opType);
  204. spv::Id createInvocationsOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands,
  205. glslang::TBasicType typeProxy);
  206. spv::Id CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,
  207. spv::Id typeId, std::vector<spv::Id>& operands);
  208. spv::Id createSubgroupOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands,
  209. glslang::TBasicType typeProxy);
  210. spv::Id createMiscOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId,
  211. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy);
  212. spv::Id createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId);
  213. spv::Id getSymbolId(const glslang::TIntermSymbol* node);
  214. void addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier & qualifier);
  215. bool hasQCOMImageProceessingDecoration(spv::Id id, spv::Decoration decor);
  216. void addImageProcessingQCOMDecoration(spv::Id id, spv::Decoration decor);
  217. void addImageProcessing2QCOMDecoration(spv::Id id, bool isForGather);
  218. spv::Id createSpvConstant(const glslang::TIntermTyped&);
  219. spv::Id createSpvConstantFromConstUnionArray(const glslang::TType& type, const glslang::TConstUnionArray&,
  220. int& nextConst, bool specConstant);
  221. bool isTrivialLeaf(const glslang::TIntermTyped* node);
  222. bool isTrivial(const glslang::TIntermTyped* node);
  223. spv::Id createShortCircuit(glslang::TOperator, glslang::TIntermTyped& left, glslang::TIntermTyped& right);
  224. spv::Id getExtBuiltins(const char* name);
  225. std::pair<spv::Id, spv::Id> getForcedType(glslang::TBuiltInVariable builtIn, const glslang::TType&);
  226. spv::Id translateForcedType(spv::Id object);
  227. spv::Id createCompositeConstruct(spv::Id typeId, std::vector<spv::Id> constituents);
  228. void recordDescHeapAccessChainInfo(glslang::TIntermBinary* node);
  229. glslang::SpvOptions& options;
  230. spv::Function* shaderEntry;
  231. spv::Function* currentFunction;
  232. spv::Instruction* entryPoint;
  233. int sequenceDepth;
  234. spv::SpvBuildLogger* logger;
  235. // There is a 1:1 mapping between a spv builder and a module; this is thread safe
  236. spv::Builder builder;
  237. bool inEntryPoint;
  238. bool entryPointTerminated;
  239. bool linkageOnly; // true when visiting the set of objects in the AST present only for
  240. // establishing interface, whether or not they were statically used
  241. std::set<spv::Id> iOSet; // all input/output variables from either static use or declaration of interface
  242. const glslang::TIntermediate* glslangIntermediate;
  243. bool nanMinMaxClamp; // true if use NMin/NMax/NClamp instead of FMin/FMax/FClamp
  244. spv::Id stdBuiltins;
  245. spv::Id nonSemanticDebugPrintf;
  246. std::unordered_map<std::string, spv::Id> extBuiltinMap;
  247. std::unordered_map<long long, spv::Id> symbolValues;
  248. std::unordered_map<uint32_t, spv::Id> builtInVariableIds;
  249. std::unordered_set<long long> rValueParameters; // set of formal function parameters passed as rValues,
  250. // rather than a pointer
  251. std::unordered_map<std::string, spv::Function*> functionMap;
  252. std::unordered_map<const glslang::TTypeList*, spv::Id> structMap[glslang::ElpCount][glslang::ElmCount];
  253. // for mapping glslang block indices to spv indices (e.g., due to hidden members):
  254. std::unordered_map<long long, std::vector<int>> memberRemapper;
  255. // for mapping glslang symbol struct to symbol Id
  256. std::unordered_map<const glslang::TTypeList*, long long> glslangTypeToIdMap;
  257. std::stack<bool> breakForLoop; // false means break for switch
  258. std::unordered_map<std::string, const glslang::TIntermSymbol*> counterOriginator;
  259. // Map pointee types for EbtReference to their forward pointers
  260. std::map<const glslang::TType *, spv::Id> forwardPointers;
  261. // Type forcing, for when SPIR-V wants a different type than the AST,
  262. // requiring local translation to and from SPIR-V type on every access.
  263. // Maps <builtin-variable-id -> AST-required-type-id>
  264. std::unordered_map<spv::Id, spv::Id> forceType;
  265. // Used by Task shader while generating operands for OpEmitMeshTasksEXT
  266. spv::Id taskPayloadID;
  267. // Used later for generating OpTraceKHR/OpExecuteCallableKHR/OpHitObjectRecordHit*/OpHitObjectGetShaderBindingTableData
  268. std::unordered_map<unsigned int, glslang::TIntermSymbol *> locationToSymbol[4];
  269. std::unordered_map<spv::Id, std::vector<spv::Decoration> > idToQCOMDecorations;
  270. // Alignment and offset records for nested or inner resource heap structures.
  271. typedef struct heapMetaData { // one record per glslang type; stored by value in heapStructureTypeMetaData
  272. spv::Id typeStride; // NOTE(review): held as an spv::Id, so presumably the id of a stride value rather than a literal - confirm at use sites
  273. spv::Id maxRsrcTypeAlignment; // NOTE(review): also an spv::Id; presumably the largest alignment among resource-typed members - confirm
  274. int maxPlainDataAlignment; // NOTE(review): plain int; presumably the largest alignment among non-resource members, units not visible here - confirm
  275. } HeapMetaData;
  276. std::unordered_map<const glslang::TType*, HeapMetaData> heapStructureTypeMetaData;
  277. std::unordered_map<spv::Id, spv::Id> heapStructureTypeSize;
  278. std::vector<spv::Id> heapStructureMemberOffsets;
  279. };
  280. //
  281. // Helper functions for translating glslang representations to SPIR-V enumerants.
  282. //
  283. // Translate glslang profile to SPIR-V source language.
  284. spv::SourceLanguage TranslateSourceLanguage(glslang::EShSource source, EProfile profile)
  285. {
  286. switch (source) {
  287. case glslang::EShSourceGlsl:
  288. switch (profile) {
  289. case ENoProfile:
  290. case ECoreProfile:
  291. case ECompatibilityProfile:
  292. return spv::SourceLanguage::GLSL;
  293. case EEsProfile:
  294. return spv::SourceLanguage::ESSL;
  295. default:
  296. return spv::SourceLanguage::Unknown;
  297. }
  298. case glslang::EShSourceHlsl:
  299. return spv::SourceLanguage::HLSL;
  300. default:
  301. return spv::SourceLanguage::Unknown;
  302. }
  303. }
  304. // Translate glslang language (stage) to SPIR-V execution model.
  305. spv::ExecutionModel TranslateExecutionModel(EShLanguage stage, bool isMeshShaderEXT = false)
  306. {
  307. switch (stage) {
  308. case EShLangVertex: return spv::ExecutionModel::Vertex;
  309. case EShLangFragment: return spv::ExecutionModel::Fragment;
  310. case EShLangCompute: return spv::ExecutionModel::GLCompute;
  311. case EShLangTessControl: return spv::ExecutionModel::TessellationControl;
  312. case EShLangTessEvaluation: return spv::ExecutionModel::TessellationEvaluation;
  313. case EShLangGeometry: return spv::ExecutionModel::Geometry;
  314. case EShLangRayGen: return spv::ExecutionModel::RayGenerationKHR;
  315. case EShLangIntersect: return spv::ExecutionModel::IntersectionKHR;
  316. case EShLangAnyHit: return spv::ExecutionModel::AnyHitKHR;
  317. case EShLangClosestHit: return spv::ExecutionModel::ClosestHitKHR;
  318. case EShLangMiss: return spv::ExecutionModel::MissKHR;
  319. case EShLangCallable: return spv::ExecutionModel::CallableKHR;
  320. case EShLangTask: return (isMeshShaderEXT)? spv::ExecutionModel::TaskEXT : spv::ExecutionModel::TaskNV;
  321. case EShLangMesh: return (isMeshShaderEXT)? spv::ExecutionModel::MeshEXT : spv::ExecutionModel::MeshNV;
  322. default:
  323. assert(0);
  324. return spv::ExecutionModel::Fragment;
  325. }
  326. }
  327. // Translate glslang sampler type to SPIR-V dimensionality.
  328. spv::Dim TranslateDimensionality(const glslang::TSampler& sampler)
  329. {
  330. switch (sampler.dim) {
  331. case glslang::Esd1D: return spv::Dim::Dim1D;
  332. case glslang::Esd2D: return spv::Dim::Dim2D;
  333. case glslang::Esd3D: return spv::Dim::Dim3D;
  334. case glslang::EsdCube: return spv::Dim::Cube;
  335. case glslang::EsdRect: return spv::Dim::Rect;
  336. case glslang::EsdBuffer: return spv::Dim::Buffer;
  337. case glslang::EsdSubpass: return spv::Dim::SubpassData;
  338. case glslang::EsdAttachmentEXT: return spv::Dim::TileImageDataEXT;
  339. default:
  340. assert(0);
  341. return spv::Dim::Dim2D;
  342. }
  343. }
  344. // Translate glslang precision to SPIR-V precision decorations.
  345. spv::Decoration TranslatePrecisionDecoration(glslang::TPrecisionQualifier glslangPrecision)
  346. {
  347. switch (glslangPrecision) {
  348. case glslang::EpqLow: return spv::Decoration::RelaxedPrecision;
  349. case glslang::EpqMedium: return spv::Decoration::RelaxedPrecision;
  350. default:
  351. return spv::NoPrecision;
  352. }
  353. }
  354. // Translate glslang type to SPIR-V precision decorations.
  355. spv::Decoration TranslatePrecisionDecoration(const glslang::TType& type)
  356. {
  357. return TranslatePrecisionDecoration(type.getQualifier().precision);
  358. }
  359. // Translate glslang type to SPIR-V block decorations.
  360. spv::Decoration TranslateBlockDecoration(const glslang::TStorageQualifier storage, bool useStorageBuffer)
  361. {
  362. switch (storage) {
  363. case glslang::EvqUniform: return spv::Decoration::Block;
  364. case glslang::EvqBuffer: return useStorageBuffer ? spv::Decoration::Block : spv::Decoration::BufferBlock;
  365. case glslang::EvqVaryingIn: return spv::Decoration::Block;
  366. case glslang::EvqVaryingOut: return spv::Decoration::Block;
  367. case glslang::EvqShared: return spv::Decoration::Block;
  368. case glslang::EvqPayload: return spv::Decoration::Block;
  369. case glslang::EvqPayloadIn: return spv::Decoration::Block;
  370. case glslang::EvqHitAttr: return spv::Decoration::Block;
  371. case glslang::EvqCallableData: return spv::Decoration::Block;
  372. case glslang::EvqCallableDataIn: return spv::Decoration::Block;
  373. case glslang::EvqHitObjectAttrNV: return spv::Decoration::Block;
  374. case glslang::EvqHitObjectAttrEXT: return spv::Decoration::Block;
  375. case glslang::EvqResourceHeap: return spv::Decoration::Block;
  376. case glslang::EvqSamplerHeap: return spv::Decoration::Block;
  377. default:
  378. assert(0);
  379. break;
  380. }
  381. return spv::Decoration::Max;
  382. }
  383. // Translate glslang type to SPIR-V memory decorations.
  384. void TranslateMemoryDecoration(const glslang::TQualifier& qualifier, std::vector<spv::Decoration>& memory,
  385. bool useVulkanMemoryModel)
  386. {
  387. if (!useVulkanMemoryModel) {
  388. if (qualifier.isVolatile()) {
  389. memory.push_back(spv::Decoration::Volatile);
  390. memory.push_back(spv::Decoration::Coherent);
  391. } else if (qualifier.isCoherent()) {
  392. memory.push_back(spv::Decoration::Coherent);
  393. }
  394. }
  395. if (qualifier.isRestrict())
  396. memory.push_back(spv::Decoration::Restrict);
  397. if (qualifier.isReadOnly())
  398. memory.push_back(spv::Decoration::NonWritable);
  399. if (qualifier.isWriteOnly())
  400. memory.push_back(spv::Decoration::NonReadable);
  401. }
  402. // Translate glslang type to SPIR-V layout decorations.
  403. spv::Decoration TranslateLayoutDecoration(const glslang::TType& type, glslang::TLayoutMatrix matrixLayout)
  404. {
  405. if (type.isMatrix()) {
  406. switch (matrixLayout) {
  407. case glslang::ElmRowMajor:
  408. return spv::Decoration::RowMajor;
  409. case glslang::ElmColumnMajor:
  410. return spv::Decoration::ColMajor;
  411. default:
  412. // opaque layouts don't need a majorness
  413. return spv::Decoration::Max;
  414. }
  415. } else {
  416. switch (type.getBasicType()) {
  417. default:
  418. return spv::Decoration::Max;
  419. break;
  420. case glslang::EbtBlock:
  421. switch (type.getQualifier().storage) {
  422. case glslang::EvqShared:
  423. case glslang::EvqUniform:
  424. case glslang::EvqBuffer:
  425. switch (type.getQualifier().layoutPacking) {
  426. case glslang::ElpShared: return spv::Decoration::GLSLShared;
  427. case glslang::ElpPacked: return spv::Decoration::GLSLPacked;
  428. default:
  429. return spv::Decoration::Max;
  430. }
  431. case glslang::EvqVaryingIn:
  432. case glslang::EvqVaryingOut:
  433. if (type.getQualifier().isTaskMemory()) {
  434. switch (type.getQualifier().layoutPacking) {
  435. case glslang::ElpShared: return spv::Decoration::GLSLShared;
  436. case glslang::ElpPacked: return spv::Decoration::GLSLPacked;
  437. default: break;
  438. }
  439. } else {
  440. assert(type.getQualifier().layoutPacking == glslang::ElpNone);
  441. }
  442. return spv::Decoration::Max;
  443. case glslang::EvqPayload:
  444. case glslang::EvqPayloadIn:
  445. case glslang::EvqHitAttr:
  446. case glslang::EvqCallableData:
  447. case glslang::EvqCallableDataIn:
  448. case glslang::EvqHitObjectAttrNV:
  449. case glslang::EvqHitObjectAttrEXT:
  450. case glslang::EvqResourceHeap:
  451. case glslang::EvqSamplerHeap:
  452. return spv::Decoration::Max;
  453. default:
  454. assert(0);
  455. return spv::Decoration::Max;
  456. }
  457. }
  458. }
  459. }
  460. // Translate glslang type to SPIR-V interpolation decorations.
  461. // Returns spv::Decoration::Max when no decoration
  462. // should be applied.
  463. spv::Decoration TGlslangToSpvTraverser::TranslateInterpolationDecoration(const glslang::TQualifier& qualifier)
  464. {
  465. if (qualifier.smooth)
  466. // Smooth decoration doesn't exist in SPIR-V 1.0
  467. return spv::Decoration::Max;
  468. else if (qualifier.isNonPerspective())
  469. return spv::Decoration::NoPerspective;
  470. else if (qualifier.flat)
  471. return spv::Decoration::Flat;
  472. else if (qualifier.isExplicitInterpolation()) {
  473. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  474. return spv::Decoration::ExplicitInterpAMD;
  475. }
  476. else
  477. return spv::Decoration::Max;
  478. }
  479. // Translate glslang type to SPIR-V auxiliary storage decorations.
  480. // Returns spv::Decoration::Max when no decoration
  481. // should be applied.
  482. spv::Decoration TGlslangToSpvTraverser::TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier)
  483. {
  484. if (qualifier.centroid)
  485. return spv::Decoration::Centroid;
  486. else if (qualifier.patch)
  487. return spv::Decoration::Patch;
  488. else if (qualifier.sample) {
  489. builder.addCapability(spv::Capability::SampleRateShading);
  490. return spv::Decoration::Sample;
  491. }
  492. return spv::Decoration::Max;
  493. }
  494. // If glslang type is invariant, return SPIR-V invariant decoration.
  495. spv::Decoration TranslateInvariantDecoration(const glslang::TQualifier& qualifier)
  496. {
  497. if (qualifier.invariant)
  498. return spv::Decoration::Invariant;
  499. else
  500. return spv::Decoration::Max;
  501. }
  502. // If glslang type is noContraction, return SPIR-V NoContraction decoration.
  503. spv::Decoration TranslateNoContractionDecoration(const glslang::TQualifier& qualifier)
  504. {
  505. if (qualifier.isNoContraction())
  506. return spv::Decoration::NoContraction;
  507. else
  508. return spv::Decoration::Max;
  509. }
  510. // If glslang type is nonUniform, return SPIR-V NonUniform decoration.
  511. spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(const glslang::TQualifier& qualifier)
  512. {
  513. if (qualifier.isNonUniform()) {
  514. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  515. builder.addCapability(spv::Capability::ShaderNonUniformEXT);
  516. return spv::Decoration::NonUniformEXT;
  517. } else
  518. return spv::Decoration::Max;
  519. }
  520. // If lvalue flags contains nonUniform, return SPIR-V NonUniform decoration.
  521. spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(
  522. const spv::Builder::AccessChain::CoherentFlags& coherentFlags)
  523. {
  524. if (coherentFlags.isNonUniform()) {
  525. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  526. builder.addCapability(spv::Capability::ShaderNonUniformEXT);
  527. return spv::Decoration::NonUniformEXT;
  528. } else
  529. return spv::Decoration::Max;
  530. }
  531. spv::MemoryAccessMask TGlslangToSpvTraverser::TranslateMemoryAccess(
  532. const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  533. {
  534. spv::MemoryAccessMask mask = spv::MemoryAccessMask::MaskNone;
  535. if (!glslangIntermediate->usingVulkanMemoryModel() || coherentFlags.isImage)
  536. return mask;
  537. if (coherentFlags.isVolatile() || coherentFlags.anyCoherent()) {
  538. mask = mask | spv::MemoryAccessMask::MakePointerAvailableKHR |
  539. spv::MemoryAccessMask::MakePointerVisibleKHR;
  540. }
  541. if (coherentFlags.nonprivate) {
  542. mask = mask | spv::MemoryAccessMask::NonPrivatePointerKHR;
  543. }
  544. if (coherentFlags.volatil) {
  545. mask = mask | spv::MemoryAccessMask::Volatile;
  546. }
  547. if (coherentFlags.nontemporal) {
  548. mask = mask | spv::MemoryAccessMask::Nontemporal;
  549. }
  550. if (mask != spv::MemoryAccessMask::MaskNone) {
  551. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  552. }
  553. return mask;
  554. }
  555. spv::ImageOperandsMask TGlslangToSpvTraverser::TranslateImageOperands(
  556. const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  557. {
  558. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  559. if (!glslangIntermediate->usingVulkanMemoryModel())
  560. return mask;
  561. if (coherentFlags.volatil ||
  562. coherentFlags.anyCoherent()) {
  563. mask = mask | spv::ImageOperandsMask::MakeTexelAvailableKHR |
  564. spv::ImageOperandsMask::MakeTexelVisibleKHR;
  565. }
  566. if (coherentFlags.nonprivate) {
  567. mask = mask | spv::ImageOperandsMask::NonPrivateTexelKHR;
  568. }
  569. if (coherentFlags.volatil) {
  570. mask = mask | spv::ImageOperandsMask::VolatileTexelKHR;
  571. }
  572. if (coherentFlags.nontemporal && builder.getSpvVersion() >= spv::Spv_1_6) {
  573. mask = mask | spv::ImageOperandsMask::Nontemporal;
  574. }
  575. if (mask != spv::ImageOperandsMask::MaskNone) {
  576. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  577. }
  578. return mask;
  579. }
  580. spv::Builder::AccessChain::CoherentFlags TGlslangToSpvTraverser::TranslateCoherent(const glslang::TType& type)
  581. {
  582. spv::Builder::AccessChain::CoherentFlags flags = {};
  583. flags.coherent = type.getQualifier().coherent;
  584. flags.devicecoherent = type.getQualifier().devicecoherent;
  585. flags.queuefamilycoherent = type.getQualifier().queuefamilycoherent;
  586. // shared variables are implicitly workgroupcoherent in GLSL.
  587. flags.workgroupcoherent = type.getQualifier().workgroupcoherent ||
  588. type.getQualifier().storage == glslang::EvqShared;
  589. flags.subgroupcoherent = type.getQualifier().subgroupcoherent;
  590. flags.shadercallcoherent = type.getQualifier().shadercallcoherent;
  591. flags.volatil = type.getQualifier().volatil;
  592. flags.nontemporal = type.getQualifier().nontemporal;
  593. // *coherent variables are implicitly nonprivate in GLSL
  594. flags.nonprivate = type.getQualifier().nonprivate ||
  595. flags.anyCoherent() ||
  596. flags.volatil;
  597. flags.isImage = type.getBasicType() == glslang::EbtSampler;
  598. flags.nonUniform = type.getQualifier().nonUniform;
  599. return flags;
  600. }
  601. spv::Scope TGlslangToSpvTraverser::TranslateMemoryScope(
  602. const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  603. {
  604. spv::Scope scope = spv::Scope::Max;
  605. if (coherentFlags.volatil || coherentFlags.coherent) {
  606. // coherent defaults to Device scope in the old model, QueueFamilyKHR scope in the new model
  607. scope = glslangIntermediate->usingVulkanMemoryModel() ? spv::Scope::QueueFamilyKHR : spv::Scope::Device;
  608. } else if (coherentFlags.devicecoherent) {
  609. scope = spv::Scope::Device;
  610. } else if (coherentFlags.queuefamilycoherent) {
  611. scope = spv::Scope::QueueFamilyKHR;
  612. } else if (coherentFlags.workgroupcoherent) {
  613. scope = spv::Scope::Workgroup;
  614. } else if (coherentFlags.subgroupcoherent) {
  615. scope = spv::Scope::Subgroup;
  616. } else if (coherentFlags.shadercallcoherent) {
  617. scope = spv::Scope::ShaderCallKHR;
  618. }
  619. if (glslangIntermediate->usingVulkanMemoryModel() && scope == spv::Scope::Device) {
  620. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  621. }
  622. return scope;
  623. }
  624. // Translate a glslang built-in variable to a SPIR-V built in decoration. Also generate
  625. // associated capabilities when required. For some built-in variables, a capability
  626. // is generated only when using the variable in an executable instruction, but not when
  627. // just declaring a struct member variable with it. This is true for PointSize,
  628. // ClipDistance, and CullDistance.
  629. spv::BuiltIn TGlslangToSpvTraverser::TranslateBuiltInDecoration(glslang::TBuiltInVariable builtIn,
  630. bool memberDeclaration)
  631. {
  632. switch (builtIn) {
  633. case glslang::EbvPointSize:
  634. // Defer adding the capability until the built-in is actually used.
  635. if (! memberDeclaration) {
  636. switch (glslangIntermediate->getStage()) {
  637. case EShLangGeometry:
  638. builder.addCapability(spv::Capability::GeometryPointSize);
  639. break;
  640. case EShLangTessControl:
  641. case EShLangTessEvaluation:
  642. builder.addCapability(spv::Capability::TessellationPointSize);
  643. break;
  644. default:
  645. break;
  646. }
  647. }
  648. return spv::BuiltIn::PointSize;
  649. case glslang::EbvPosition: return spv::BuiltIn::Position;
  650. case glslang::EbvVertexId: return spv::BuiltIn::VertexId;
  651. case glslang::EbvInstanceId: return spv::BuiltIn::InstanceId;
  652. case glslang::EbvVertexIndex: return spv::BuiltIn::VertexIndex;
  653. case glslang::EbvInstanceIndex: return spv::BuiltIn::InstanceIndex;
  654. case glslang::EbvFragCoord: return spv::BuiltIn::FragCoord;
  655. case glslang::EbvPointCoord: return spv::BuiltIn::PointCoord;
  656. case glslang::EbvFace: return spv::BuiltIn::FrontFacing;
  657. case glslang::EbvFragDepth: return spv::BuiltIn::FragDepth;
  658. case glslang::EbvNumWorkGroups: return spv::BuiltIn::NumWorkgroups;
  659. case glslang::EbvWorkGroupSize: return spv::BuiltIn::WorkgroupSize;
  660. case glslang::EbvWorkGroupId: return spv::BuiltIn::WorkgroupId;
  661. case glslang::EbvLocalInvocationId: return spv::BuiltIn::LocalInvocationId;
  662. case glslang::EbvLocalInvocationIndex: return spv::BuiltIn::LocalInvocationIndex;
  663. case glslang::EbvGlobalInvocationId: return spv::BuiltIn::GlobalInvocationId;
  664. // These *Distance capabilities logically belong here, but if the member is declared and
  665. // then never used, consumers of SPIR-V prefer the capability not be declared.
  666. // They are now generated when used, rather than here when declared.
  667. // Potentially, the specification should be more clear what the minimum
  668. // use needed is to trigger the capability.
  669. //
  670. case glslang::EbvClipDistance:
  671. if (!memberDeclaration)
  672. builder.addCapability(spv::Capability::ClipDistance);
  673. return spv::BuiltIn::ClipDistance;
  674. case glslang::EbvCullDistance:
  675. if (!memberDeclaration)
  676. builder.addCapability(spv::Capability::CullDistance);
  677. return spv::BuiltIn::CullDistance;
  678. case glslang::EbvViewportIndex:
  679. if (glslangIntermediate->getStage() == EShLangGeometry ||
  680. glslangIntermediate->getStage() == EShLangFragment) {
  681. builder.addCapability(spv::Capability::MultiViewport);
  682. }
  683. if (glslangIntermediate->getStage() == EShLangVertex ||
  684. glslangIntermediate->getStage() == EShLangTessControl ||
  685. glslangIntermediate->getStage() == EShLangTessEvaluation) {
  686. if (builder.getSpvVersion() < spv::Spv_1_5) {
  687. builder.addIncorporatedExtension(spv::E_SPV_EXT_shader_viewport_index_layer, spv::Spv_1_5);
  688. builder.addCapability(spv::Capability::ShaderViewportIndexLayerEXT);
  689. }
  690. else
  691. builder.addCapability(spv::Capability::ShaderViewportIndex);
  692. }
  693. return spv::BuiltIn::ViewportIndex;
  694. case glslang::EbvSampleId:
  695. builder.addCapability(spv::Capability::SampleRateShading);
  696. return spv::BuiltIn::SampleId;
  697. case glslang::EbvSamplePosition:
  698. builder.addCapability(spv::Capability::SampleRateShading);
  699. return spv::BuiltIn::SamplePosition;
  700. case glslang::EbvSampleMask:
  701. return spv::BuiltIn::SampleMask;
  702. case glslang::EbvLayer:
  703. if (glslangIntermediate->getStage() == EShLangMesh) {
  704. return spv::BuiltIn::Layer;
  705. }
  706. if (glslangIntermediate->getStage() == EShLangGeometry ||
  707. glslangIntermediate->getStage() == EShLangFragment) {
  708. builder.addCapability(spv::Capability::Geometry);
  709. }
  710. if (glslangIntermediate->getStage() == EShLangVertex ||
  711. glslangIntermediate->getStage() == EShLangTessControl ||
  712. glslangIntermediate->getStage() == EShLangTessEvaluation) {
  713. if (builder.getSpvVersion() < spv::Spv_1_5) {
  714. builder.addIncorporatedExtension(spv::E_SPV_EXT_shader_viewport_index_layer, spv::Spv_1_5);
  715. builder.addCapability(spv::Capability::ShaderViewportIndexLayerEXT);
  716. } else
  717. builder.addCapability(spv::Capability::ShaderLayer);
  718. }
  719. return spv::BuiltIn::Layer;
  720. case glslang::EbvBaseVertex:
  721. builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);
  722. builder.addCapability(spv::Capability::DrawParameters);
  723. return spv::BuiltIn::BaseVertex;
  724. case glslang::EbvBaseInstance:
  725. builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);
  726. builder.addCapability(spv::Capability::DrawParameters);
  727. return spv::BuiltIn::BaseInstance;
  728. case glslang::EbvDrawId:
  729. builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);
  730. builder.addCapability(spv::Capability::DrawParameters);
  731. return spv::BuiltIn::DrawIndex;
  732. case glslang::EbvPrimitiveId:
  733. if (glslangIntermediate->getStage() == EShLangFragment)
  734. builder.addCapability(spv::Capability::Geometry);
  735. return spv::BuiltIn::PrimitiveId;
  736. case glslang::EbvFragStencilRef:
  737. builder.addExtension(spv::E_SPV_EXT_shader_stencil_export);
  738. builder.addCapability(spv::Capability::StencilExportEXT);
  739. return spv::BuiltIn::FragStencilRefEXT;
  740. case glslang::EbvShadingRateKHR:
  741. builder.addExtension(spv::E_SPV_KHR_fragment_shading_rate);
  742. builder.addCapability(spv::Capability::FragmentShadingRateKHR);
  743. return spv::BuiltIn::ShadingRateKHR;
  744. case glslang::EbvPrimitiveShadingRateKHR:
  745. builder.addExtension(spv::E_SPV_KHR_fragment_shading_rate);
  746. builder.addCapability(spv::Capability::FragmentShadingRateKHR);
  747. return spv::BuiltIn::PrimitiveShadingRateKHR;
  748. case glslang::EbvInvocationId: return spv::BuiltIn::InvocationId;
  749. case glslang::EbvTessLevelInner: return spv::BuiltIn::TessLevelInner;
  750. case glslang::EbvTessLevelOuter: return spv::BuiltIn::TessLevelOuter;
  751. case glslang::EbvTessCoord: return spv::BuiltIn::TessCoord;
  752. case glslang::EbvPatchVertices: return spv::BuiltIn::PatchVertices;
  753. case glslang::EbvHelperInvocation: return spv::BuiltIn::HelperInvocation;
  754. case glslang::EbvSubGroupSize:
  755. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  756. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  757. return spv::BuiltIn::SubgroupSize;
  758. case glslang::EbvSubGroupInvocation:
  759. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  760. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  761. return spv::BuiltIn::SubgroupLocalInvocationId;
  762. case glslang::EbvSubGroupEqMask:
  763. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  764. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  765. return spv::BuiltIn::SubgroupEqMask;
  766. case glslang::EbvSubGroupGeMask:
  767. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  768. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  769. return spv::BuiltIn::SubgroupGeMask;
  770. case glslang::EbvSubGroupGtMask:
  771. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  772. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  773. return spv::BuiltIn::SubgroupGtMask;
  774. case glslang::EbvSubGroupLeMask:
  775. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  776. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  777. return spv::BuiltIn::SubgroupLeMask;
  778. case glslang::EbvSubGroupLtMask:
  779. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  780. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  781. return spv::BuiltIn::SubgroupLtMask;
  782. case glslang::EbvNumSubgroups:
  783. builder.addCapability(spv::Capability::GroupNonUniform);
  784. return spv::BuiltIn::NumSubgroups;
  785. case glslang::EbvSubgroupID:
  786. builder.addCapability(spv::Capability::GroupNonUniform);
  787. return spv::BuiltIn::SubgroupId;
  788. case glslang::EbvSubgroupSize2:
  789. builder.addCapability(spv::Capability::GroupNonUniform);
  790. return spv::BuiltIn::SubgroupSize;
  791. case glslang::EbvSubgroupInvocation2:
  792. builder.addCapability(spv::Capability::GroupNonUniform);
  793. return spv::BuiltIn::SubgroupLocalInvocationId;
  794. case glslang::EbvSubgroupEqMask2:
  795. builder.addCapability(spv::Capability::GroupNonUniform);
  796. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  797. return spv::BuiltIn::SubgroupEqMask;
  798. case glslang::EbvSubgroupGeMask2:
  799. builder.addCapability(spv::Capability::GroupNonUniform);
  800. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  801. return spv::BuiltIn::SubgroupGeMask;
  802. case glslang::EbvSubgroupGtMask2:
  803. builder.addCapability(spv::Capability::GroupNonUniform);
  804. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  805. return spv::BuiltIn::SubgroupGtMask;
  806. case glslang::EbvSubgroupLeMask2:
  807. builder.addCapability(spv::Capability::GroupNonUniform);
  808. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  809. return spv::BuiltIn::SubgroupLeMask;
  810. case glslang::EbvSubgroupLtMask2:
  811. builder.addCapability(spv::Capability::GroupNonUniform);
  812. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  813. return spv::BuiltIn::SubgroupLtMask;
  814. case glslang::EbvBaryCoordNoPersp:
  815. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  816. return spv::BuiltIn::BaryCoordNoPerspAMD;
  817. case glslang::EbvBaryCoordNoPerspCentroid:
  818. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  819. return spv::BuiltIn::BaryCoordNoPerspCentroidAMD;
  820. case glslang::EbvBaryCoordNoPerspSample:
  821. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  822. return spv::BuiltIn::BaryCoordNoPerspSampleAMD;
  823. case glslang::EbvBaryCoordSmooth:
  824. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  825. return spv::BuiltIn::BaryCoordSmoothAMD;
  826. case glslang::EbvBaryCoordSmoothCentroid:
  827. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  828. return spv::BuiltIn::BaryCoordSmoothCentroidAMD;
  829. case glslang::EbvBaryCoordSmoothSample:
  830. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  831. return spv::BuiltIn::BaryCoordSmoothSampleAMD;
  832. case glslang::EbvBaryCoordPullModel:
  833. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  834. return spv::BuiltIn::BaryCoordPullModelAMD;
  835. case glslang::EbvDeviceIndex:
  836. builder.addIncorporatedExtension(spv::E_SPV_KHR_device_group, spv::Spv_1_3);
  837. builder.addCapability(spv::Capability::DeviceGroup);
  838. return spv::BuiltIn::DeviceIndex;
  839. case glslang::EbvViewIndex:
  840. builder.addIncorporatedExtension(spv::E_SPV_KHR_multiview, spv::Spv_1_3);
  841. builder.addCapability(spv::Capability::MultiView);
  842. return spv::BuiltIn::ViewIndex;
  843. case glslang::EbvFragSizeEXT:
  844. builder.addExtension(spv::E_SPV_EXT_fragment_invocation_density);
  845. builder.addCapability(spv::Capability::FragmentDensityEXT);
  846. return spv::BuiltIn::FragSizeEXT;
  847. case glslang::EbvFragInvocationCountEXT:
  848. builder.addExtension(spv::E_SPV_EXT_fragment_invocation_density);
  849. builder.addCapability(spv::Capability::FragmentDensityEXT);
  850. return spv::BuiltIn::FragInvocationCountEXT;
  851. case glslang::EbvViewportMaskNV:
  852. if (!memberDeclaration) {
  853. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  854. builder.addCapability(spv::Capability::ShaderViewportMaskNV);
  855. }
  856. return spv::BuiltIn::ViewportMaskNV;
  857. case glslang::EbvSecondaryPositionNV:
  858. if (!memberDeclaration) {
  859. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  860. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  861. }
  862. return spv::BuiltIn::SecondaryPositionNV;
  863. case glslang::EbvSecondaryViewportMaskNV:
  864. if (!memberDeclaration) {
  865. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  866. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  867. }
  868. return spv::BuiltIn::SecondaryViewportMaskNV;
  869. case glslang::EbvPositionPerViewNV:
  870. if (!memberDeclaration) {
  871. builder.addExtension(spv::E_SPV_NVX_multiview_per_view_attributes);
  872. builder.addCapability(spv::Capability::PerViewAttributesNV);
  873. }
  874. return spv::BuiltIn::PositionPerViewNV;
  875. case glslang::EbvViewportMaskPerViewNV:
  876. if (!memberDeclaration) {
  877. builder.addExtension(spv::E_SPV_NVX_multiview_per_view_attributes);
  878. builder.addCapability(spv::Capability::PerViewAttributesNV);
  879. }
  880. return spv::BuiltIn::ViewportMaskPerViewNV;
  881. case glslang::EbvFragFullyCoveredNV:
  882. builder.addExtension(spv::E_SPV_EXT_fragment_fully_covered);
  883. builder.addCapability(spv::Capability::FragmentFullyCoveredEXT);
  884. return spv::BuiltIn::FullyCoveredEXT;
  885. case glslang::EbvFragmentSizeNV:
  886. builder.addExtension(spv::E_SPV_NV_shading_rate);
  887. builder.addCapability(spv::Capability::ShadingRateNV);
  888. return spv::BuiltIn::FragmentSizeNV;
  889. case glslang::EbvInvocationsPerPixelNV:
  890. builder.addExtension(spv::E_SPV_NV_shading_rate);
  891. builder.addCapability(spv::Capability::ShadingRateNV);
  892. return spv::BuiltIn::InvocationsPerPixelNV;
  893. // ray tracing
  894. case glslang::EbvLaunchId:
  895. return spv::BuiltIn::LaunchIdKHR;
  896. case glslang::EbvLaunchSize:
  897. return spv::BuiltIn::LaunchSizeKHR;
  898. case glslang::EbvWorldRayOrigin:
  899. return spv::BuiltIn::WorldRayOriginKHR;
  900. case glslang::EbvWorldRayDirection:
  901. return spv::BuiltIn::WorldRayDirectionKHR;
  902. case glslang::EbvObjectRayOrigin:
  903. return spv::BuiltIn::ObjectRayOriginKHR;
  904. case glslang::EbvObjectRayDirection:
  905. return spv::BuiltIn::ObjectRayDirectionKHR;
  906. case glslang::EbvRayTmin:
  907. return spv::BuiltIn::RayTminKHR;
  908. case glslang::EbvRayTmax:
  909. return spv::BuiltIn::RayTmaxKHR;
  910. case glslang::EbvCullMask:
  911. return spv::BuiltIn::CullMaskKHR;
  912. case glslang::EbvPositionFetch:
  913. return spv::BuiltIn::HitTriangleVertexPositionsKHR;
  914. case glslang::EbvInstanceCustomIndex:
  915. return spv::BuiltIn::InstanceCustomIndexKHR;
  916. case glslang::EbvHitKind:
  917. return spv::BuiltIn::HitKindKHR;
  918. case glslang::EbvObjectToWorld:
  919. case glslang::EbvObjectToWorld3x4:
  920. return spv::BuiltIn::ObjectToWorldKHR;
  921. case glslang::EbvWorldToObject:
  922. case glslang::EbvWorldToObject3x4:
  923. return spv::BuiltIn::WorldToObjectKHR;
  924. case glslang::EbvIncomingRayFlags:
  925. return spv::BuiltIn::IncomingRayFlagsKHR;
  926. case glslang::EbvGeometryIndex:
  927. return spv::BuiltIn::RayGeometryIndexKHR;
  928. case glslang::EbvCurrentRayTimeNV:
  929. builder.addExtension(spv::E_SPV_NV_ray_tracing_motion_blur);
  930. builder.addCapability(spv::Capability::RayTracingMotionBlurNV);
  931. return spv::BuiltIn::CurrentRayTimeNV;
  932. case glslang::EbvMicroTrianglePositionNV:
  933. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  934. builder.addExtension("SPV_NV_displacement_micromap");
  935. return spv::BuiltIn::HitMicroTriangleVertexPositionsNV;
  936. case glslang::EbvMicroTriangleBaryNV:
  937. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  938. builder.addExtension("SPV_NV_displacement_micromap");
  939. return spv::BuiltIn::HitMicroTriangleVertexBarycentricsNV;
  940. case glslang::EbvHitKindFrontFacingMicroTriangleNV:
  941. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  942. builder.addExtension("SPV_NV_displacement_micromap");
  943. return spv::BuiltIn::HitKindFrontFacingMicroTriangleNV;
  944. case glslang::EbvHitKindBackFacingMicroTriangleNV:
  945. builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);
  946. builder.addExtension("SPV_NV_displacement_micromap");
  947. return spv::BuiltIn::HitKindBackFacingMicroTriangleNV;
  948. case glslang::EbvClusterIDNV:
  949. builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
  950. builder.addExtension("SPV_NV_cluster_acceleration_structure");
  951. return spv::BuiltIn::ClusterIDNV;
  952. case glslang::EbvHitIsSphereNV:
  953. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  954. builder.addExtension("SPV_NV_linear_swept_spheres");
  955. return spv::BuiltIn::HitIsSphereNV;
  956. case glslang::EbvHitIsLSSNV:
  957. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  958. builder.addExtension("SPV_NV_linear_swept_spheres");
  959. return spv::BuiltIn::HitIsLSSNV;
  960. case glslang::EbvHitSpherePositionNV:
  961. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  962. builder.addExtension("SPV_NV_linear_swept_spheres");
  963. return spv::BuiltIn::HitSpherePositionNV;
  964. case glslang::EbvHitSphereRadiusNV:
  965. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  966. builder.addExtension("SPV_NV_linear_swept_spheres");
  967. return spv::BuiltIn::HitSphereRadiusNV;
  968. case glslang::EbvHitLSSPositionsNV:
  969. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  970. builder.addExtension("SPV_NV_linear_swept_spheres");
  971. return spv::BuiltIn::HitLSSPositionsNV;
  972. case glslang::EbvHitLSSRadiiNV:
  973. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  974. builder.addExtension("SPV_NV_linear_swept_spheres");
  975. return spv::BuiltIn::HitLSSRadiiNV;
  976. // barycentrics
  977. case glslang::EbvBaryCoordNV:
  978. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  979. builder.addCapability(spv::Capability::FragmentBarycentricNV);
  980. return spv::BuiltIn::BaryCoordNV;
  981. case glslang::EbvBaryCoordNoPerspNV:
  982. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  983. builder.addCapability(spv::Capability::FragmentBarycentricNV);
  984. return spv::BuiltIn::BaryCoordNoPerspNV;
  985. case glslang::EbvBaryCoordEXT:
  986. builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
  987. builder.addCapability(spv::Capability::FragmentBarycentricKHR);
  988. return spv::BuiltIn::BaryCoordKHR;
  989. case glslang::EbvBaryCoordNoPerspEXT:
  990. builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
  991. builder.addCapability(spv::Capability::FragmentBarycentricKHR);
  992. return spv::BuiltIn::BaryCoordNoPerspKHR;
  993. // mesh shaders
  994. case glslang::EbvTaskCountNV:
  995. return spv::BuiltIn::TaskCountNV;
  996. case glslang::EbvPrimitiveCountNV:
  997. return spv::BuiltIn::PrimitiveCountNV;
  998. case glslang::EbvPrimitiveIndicesNV:
  999. return spv::BuiltIn::PrimitiveIndicesNV;
  1000. case glslang::EbvClipDistancePerViewNV:
  1001. return spv::BuiltIn::ClipDistancePerViewNV;
  1002. case glslang::EbvCullDistancePerViewNV:
  1003. return spv::BuiltIn::CullDistancePerViewNV;
  1004. case glslang::EbvLayerPerViewNV:
  1005. return spv::BuiltIn::LayerPerViewNV;
  1006. case glslang::EbvMeshViewCountNV:
  1007. return spv::BuiltIn::MeshViewCountNV;
  1008. case glslang::EbvMeshViewIndicesNV:
  1009. return spv::BuiltIn::MeshViewIndicesNV;
  1010. // SPV_EXT_mesh_shader
  1011. case glslang::EbvPrimitivePointIndicesEXT:
  1012. return spv::BuiltIn::PrimitivePointIndicesEXT;
  1013. case glslang::EbvPrimitiveLineIndicesEXT:
  1014. return spv::BuiltIn::PrimitiveLineIndicesEXT;
  1015. case glslang::EbvPrimitiveTriangleIndicesEXT:
  1016. return spv::BuiltIn::PrimitiveTriangleIndicesEXT;
  1017. case glslang::EbvCullPrimitiveEXT:
  1018. return spv::BuiltIn::CullPrimitiveEXT;
  1019. // sm builtins
  1020. case glslang::EbvWarpsPerSM:
  1021. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1022. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1023. return spv::BuiltIn::WarpsPerSMNV;
  1024. case glslang::EbvSMCount:
  1025. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1026. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1027. return spv::BuiltIn::SMCountNV;
  1028. case glslang::EbvWarpID:
  1029. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1030. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1031. return spv::BuiltIn::WarpIDNV;
  1032. case glslang::EbvSMID:
  1033. builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);
  1034. builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);
  1035. return spv::BuiltIn::SMIDNV;
  1036. // ARM builtins
  1037. case glslang::EbvCoreCountARM:
  1038. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1039. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1040. return spv::BuiltIn::CoreCountARM;
  1041. case glslang::EbvCoreIDARM:
  1042. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1043. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1044. return spv::BuiltIn::CoreIDARM;
  1045. case glslang::EbvCoreMaxIDARM:
  1046. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1047. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1048. return spv::BuiltIn::CoreMaxIDARM;
  1049. case glslang::EbvWarpIDARM:
  1050. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1051. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1052. return spv::BuiltIn::WarpIDARM;
  1053. case glslang::EbvWarpMaxIDARM:
  1054. builder.addExtension(spv::E_SPV_ARM_core_builtins);
  1055. builder.addCapability(spv::Capability::CoreBuiltinsARM);
  1056. return spv::BuiltIn::WarpMaxIDARM;
  1057. // QCOM builtins
  1058. case glslang::EbvTileOffsetQCOM:
  1059. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1060. return spv::BuiltIn::TileOffsetQCOM;
  1061. case glslang::EbvTileDimensionQCOM:
  1062. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1063. return spv::BuiltIn::TileDimensionQCOM;
  1064. case glslang::EbvTileApronSizeQCOM:
  1065. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1066. return spv::BuiltIn::TileApronSizeQCOM;
  1067. // SPV_EXT_descriptor_heap
  1068. case glslang::EbvSamplerHeapEXT:
  1069. builder.addExtension(spv::E_SPV_EXT_descriptor_heap);
  1070. builder.addExtension(spv::E_SPV_KHR_untyped_pointers);
  1071. builder.addCapability(spv::Capability::DescriptorHeapEXT);
  1072. builder.addCapability(spv::Capability::UntypedPointersKHR);
  1073. // Add SamplerHeapEXT Symbol for spv level.
  1074. if (builtInVariableIds.find(uint32_t(spv::BuiltIn::SamplerHeapEXT)) == builtInVariableIds.end()) {
  1075. spv::Id samplerHeapEXT =
  1076. builder.createUntypedVariable(spv::NoPrecision, spv::StorageClass::UniformConstant, "sampler_heap");
  1077. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4)
  1078. entryPoint->addIdOperand(samplerHeapEXT);
  1079. builder.addDecoration(samplerHeapEXT, spv::Decoration::BuiltIn, (int)spv::BuiltIn::SamplerHeapEXT);
  1080. builtInVariableIds.insert({uint32_t(spv::BuiltIn::SamplerHeapEXT), samplerHeapEXT});
  1081. }
  1082. return spv::BuiltIn::SamplerHeapEXT;
  1083. case glslang::EbvResourceHeapEXT:
  1084. builder.addExtension(spv::E_SPV_EXT_descriptor_heap);
  1085. builder.addExtension(spv::E_SPV_KHR_untyped_pointers);
  1086. builder.addCapability(spv::Capability::DescriptorHeapEXT);
  1087. builder.addCapability(spv::Capability::UntypedPointersKHR);
  1088. // Add ResourceHeapEXT Symbol for spv level.
  1089. if (builtInVariableIds.find(uint32_t(spv::BuiltIn::ResourceHeapEXT)) == builtInVariableIds.end()) {
  1090. spv::Id resourceHeapEXT =
  1091. builder.createUntypedVariable(spv::NoPrecision, spv::StorageClass::UniformConstant, "resource_heap");
  1092. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4)
  1093. entryPoint->addIdOperand(resourceHeapEXT);
  1094. builder.addDecoration(resourceHeapEXT, spv::Decoration::BuiltIn, (int)spv::BuiltIn::ResourceHeapEXT);
  1095. builtInVariableIds.insert({uint32_t(spv::BuiltIn::ResourceHeapEXT), resourceHeapEXT});
  1096. }
  1097. return spv::BuiltIn::ResourceHeapEXT;
  1098. default:
  1099. return spv::BuiltIn::Max;
  1100. }
  1101. }
  1102. // Translate glslang image layout format to SPIR-V image format.
  1103. spv::ImageFormat TGlslangToSpvTraverser::TranslateImageFormat(const glslang::TType& type)
  1104. {
  1105. assert(type.getBasicType() == glslang::EbtSampler);
  1106. // Check for capabilities
  1107. switch (type.getQualifier().getFormat()) {
  1108. case glslang::ElfRg32f:
  1109. case glslang::ElfRg16f:
  1110. case glslang::ElfR11fG11fB10f:
  1111. case glslang::ElfR16f:
  1112. case glslang::ElfRgba16:
  1113. case glslang::ElfRgb10A2:
  1114. case glslang::ElfRg16:
  1115. case glslang::ElfRg8:
  1116. case glslang::ElfR16:
  1117. case glslang::ElfR8:
  1118. case glslang::ElfRgba16Snorm:
  1119. case glslang::ElfRg16Snorm:
  1120. case glslang::ElfRg8Snorm:
  1121. case glslang::ElfR16Snorm:
  1122. case glslang::ElfR8Snorm:
  1123. case glslang::ElfRg32i:
  1124. case glslang::ElfRg16i:
  1125. case glslang::ElfRg8i:
  1126. case glslang::ElfR16i:
  1127. case glslang::ElfR8i:
  1128. case glslang::ElfRgb10a2ui:
  1129. case glslang::ElfRg32ui:
  1130. case glslang::ElfRg16ui:
  1131. case glslang::ElfRg8ui:
  1132. case glslang::ElfR16ui:
  1133. case glslang::ElfR8ui:
  1134. builder.addCapability(spv::Capability::StorageImageExtendedFormats);
  1135. break;
  1136. case glslang::ElfR64ui:
  1137. case glslang::ElfR64i:
  1138. builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
  1139. builder.addCapability(spv::Capability::Int64ImageEXT);
  1140. break;
  1141. default:
  1142. break;
  1143. }
  1144. // do the translation
  1145. switch (type.getQualifier().getFormat()) {
  1146. case glslang::ElfNone: return spv::ImageFormat::Unknown;
  1147. case glslang::ElfRgba32f: return spv::ImageFormat::Rgba32f;
  1148. case glslang::ElfRgba16f: return spv::ImageFormat::Rgba16f;
  1149. case glslang::ElfR32f: return spv::ImageFormat::R32f;
  1150. case glslang::ElfRgba8: return spv::ImageFormat::Rgba8;
  1151. case glslang::ElfRgba8Snorm: return spv::ImageFormat::Rgba8Snorm;
  1152. case glslang::ElfRg32f: return spv::ImageFormat::Rg32f;
  1153. case glslang::ElfRg16f: return spv::ImageFormat::Rg16f;
  1154. case glslang::ElfR11fG11fB10f: return spv::ImageFormat::R11fG11fB10f;
  1155. case glslang::ElfR16f: return spv::ImageFormat::R16f;
  1156. case glslang::ElfRgba16: return spv::ImageFormat::Rgba16;
  1157. case glslang::ElfRgb10A2: return spv::ImageFormat::Rgb10A2;
  1158. case glslang::ElfRg16: return spv::ImageFormat::Rg16;
  1159. case glslang::ElfRg8: return spv::ImageFormat::Rg8;
  1160. case glslang::ElfR16: return spv::ImageFormat::R16;
  1161. case glslang::ElfR8: return spv::ImageFormat::R8;
  1162. case glslang::ElfRgba16Snorm: return spv::ImageFormat::Rgba16Snorm;
  1163. case glslang::ElfRg16Snorm: return spv::ImageFormat::Rg16Snorm;
  1164. case glslang::ElfRg8Snorm: return spv::ImageFormat::Rg8Snorm;
  1165. case glslang::ElfR16Snorm: return spv::ImageFormat::R16Snorm;
  1166. case glslang::ElfR8Snorm: return spv::ImageFormat::R8Snorm;
  1167. case glslang::ElfRgba32i: return spv::ImageFormat::Rgba32i;
  1168. case glslang::ElfRgba16i: return spv::ImageFormat::Rgba16i;
  1169. case glslang::ElfRgba8i: return spv::ImageFormat::Rgba8i;
  1170. case glslang::ElfR32i: return spv::ImageFormat::R32i;
  1171. case glslang::ElfRg32i: return spv::ImageFormat::Rg32i;
  1172. case glslang::ElfRg16i: return spv::ImageFormat::Rg16i;
  1173. case glslang::ElfRg8i: return spv::ImageFormat::Rg8i;
  1174. case glslang::ElfR16i: return spv::ImageFormat::R16i;
  1175. case glslang::ElfR8i: return spv::ImageFormat::R8i;
  1176. case glslang::ElfRgba32ui: return spv::ImageFormat::Rgba32ui;
  1177. case glslang::ElfRgba16ui: return spv::ImageFormat::Rgba16ui;
  1178. case glslang::ElfRgba8ui: return spv::ImageFormat::Rgba8ui;
  1179. case glslang::ElfR32ui: return spv::ImageFormat::R32ui;
  1180. case glslang::ElfRg32ui: return spv::ImageFormat::Rg32ui;
  1181. case glslang::ElfRg16ui: return spv::ImageFormat::Rg16ui;
  1182. case glslang::ElfRgb10a2ui: return spv::ImageFormat::Rgb10a2ui;
  1183. case glslang::ElfRg8ui: return spv::ImageFormat::Rg8ui;
  1184. case glslang::ElfR16ui: return spv::ImageFormat::R16ui;
  1185. case glslang::ElfR8ui: return spv::ImageFormat::R8ui;
  1186. case glslang::ElfR64ui: return spv::ImageFormat::R64ui;
  1187. case glslang::ElfR64i: return spv::ImageFormat::R64i;
  1188. default: return spv::ImageFormat::Max;
  1189. }
  1190. }
  1191. spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSelectionControl(
  1192. const glslang::TIntermSelection& selectionNode) const
  1193. {
  1194. if (selectionNode.getFlatten())
  1195. return spv::SelectionControlMask::Flatten;
  1196. if (selectionNode.getDontFlatten())
  1197. return spv::SelectionControlMask::DontFlatten;
  1198. return spv::SelectionControlMask::MaskNone;
  1199. }
  1200. spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSwitchControl(const glslang::TIntermSwitch& switchNode)
  1201. const
  1202. {
  1203. if (switchNode.getFlatten())
  1204. return spv::SelectionControlMask::Flatten;
  1205. if (switchNode.getDontFlatten())
  1206. return spv::SelectionControlMask::DontFlatten;
  1207. return spv::SelectionControlMask::MaskNone;
  1208. }
  1209. // return a non-0 dependency if the dependency argument must be set
  1210. spv::LoopControlMask TGlslangToSpvTraverser::TranslateLoopControl(const glslang::TIntermLoop& loopNode,
  1211. std::vector<unsigned int>& operands) const
  1212. {
  1213. spv::LoopControlMask control = spv::LoopControlMask::MaskNone;
  1214. if (loopNode.getDontUnroll())
  1215. control = control | spv::LoopControlMask::DontUnroll;
  1216. if (loopNode.getUnroll())
  1217. control = control | spv::LoopControlMask::Unroll;
  1218. if (unsigned(loopNode.getLoopDependency()) == glslang::TIntermLoop::dependencyInfinite)
  1219. control = control | spv::LoopControlMask::DependencyInfinite;
  1220. else if (loopNode.getLoopDependency() > 0) {
  1221. control = control | spv::LoopControlMask::DependencyLength;
  1222. operands.push_back((unsigned int)loopNode.getLoopDependency());
  1223. }
  1224. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  1225. if (loopNode.getMinIterations() > 0) {
  1226. control = control | spv::LoopControlMask::MinIterations;
  1227. operands.push_back(loopNode.getMinIterations());
  1228. }
  1229. if (loopNode.getMaxIterations() < glslang::TIntermLoop::iterationsInfinite) {
  1230. control = control | spv::LoopControlMask::MaxIterations;
  1231. operands.push_back(loopNode.getMaxIterations());
  1232. }
  1233. if (loopNode.getIterationMultiple() > 1) {
  1234. control = control | spv::LoopControlMask::IterationMultiple;
  1235. operands.push_back(loopNode.getIterationMultiple());
  1236. }
  1237. if (loopNode.getPeelCount() > 0) {
  1238. control = control | spv::LoopControlMask::PeelCount;
  1239. operands.push_back(loopNode.getPeelCount());
  1240. }
  1241. if (loopNode.getPartialCount() > 0) {
  1242. control = control | spv::LoopControlMask::PartialCount;
  1243. operands.push_back(loopNode.getPartialCount());
  1244. }
  1245. }
  1246. return control;
  1247. }
  1248. // Translate glslang type to SPIR-V storage class.
  1249. spv::StorageClass TGlslangToSpvTraverser::TranslateStorageClass(const glslang::TType& type)
  1250. {
  1251. if (type.getBasicType() == glslang::EbtRayQuery || type.getBasicType() == glslang::EbtHitObjectNV
  1252. || type.getBasicType() == glslang::EbtHitObjectEXT)
  1253. return spv::StorageClass::Private;
  1254. if (type.getQualifier().isSpirvByReference()) {
  1255. if (type.getQualifier().isParamInput() || type.getQualifier().isParamOutput())
  1256. return spv::StorageClass::Function;
  1257. }
  1258. if (type.getQualifier().isPipeInput())
  1259. return spv::StorageClass::Input;
  1260. if (type.getQualifier().isPipeOutput())
  1261. return spv::StorageClass::Output;
  1262. if (type.getQualifier().storage == glslang::EvqTileImageEXT || type.isAttachmentEXT()) {
  1263. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1264. builder.addCapability(spv::Capability::TileImageColorReadAccessEXT);
  1265. return spv::StorageClass::TileImageEXT;
  1266. }
  1267. if (type.getQualifier().isTileAttachmentQCOM()) {
  1268. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1269. builder.addCapability(spv::Capability::TileShadingQCOM);
  1270. return spv::StorageClass::TileAttachmentQCOM;
  1271. }
  1272. if (glslangIntermediate->getSource() != glslang::EShSourceHlsl ||
  1273. type.getQualifier().storage == glslang::EvqUniform) {
  1274. if (type.isAtomic())
  1275. return spv::StorageClass::AtomicCounter;
  1276. if (type.containsOpaque() && !glslangIntermediate->getBindlessMode()) {
  1277. if (type.getQualifier().storage == glslang::EvqResourceHeap ||
  1278. type.getQualifier().storage == glslang::EvqSamplerHeap)
  1279. return spv::StorageClass::Uniform;
  1280. else
  1281. return spv::StorageClass::UniformConstant;
  1282. }
  1283. }
  1284. if (type.getQualifier().isUniformOrBuffer() &&
  1285. type.getQualifier().isShaderRecord()) {
  1286. return spv::StorageClass::ShaderRecordBufferKHR;
  1287. }
  1288. if (glslangIntermediate->usingStorageBuffer() && type.getQualifier().storage == glslang::EvqBuffer) {
  1289. builder.addIncorporatedExtension(spv::E_SPV_KHR_storage_buffer_storage_class, spv::Spv_1_3);
  1290. return spv::StorageClass::StorageBuffer;
  1291. }
  1292. if (type.getQualifier().isUniformOrBuffer()) {
  1293. if (type.getQualifier().isPushConstant())
  1294. return spv::StorageClass::PushConstant;
  1295. if (type.getBasicType() == glslang::EbtBlock ||
  1296. type.getQualifier().layoutDescriptorHeap)
  1297. return spv::StorageClass::Uniform;
  1298. return spv::StorageClass::UniformConstant;
  1299. }
  1300. if (type.getQualifier().storage == glslang::EvqShared && type.getBasicType() == glslang::EbtBlock) {
  1301. builder.addExtension(spv::E_SPV_KHR_workgroup_memory_explicit_layout);
  1302. builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayoutKHR);
  1303. return spv::StorageClass::Workgroup;
  1304. }
  1305. switch (type.getQualifier().storage) {
  1306. case glslang::EvqGlobal: return spv::StorageClass::Private;
  1307. case glslang::EvqConstReadOnly: return spv::StorageClass::Function;
  1308. case glslang::EvqTemporary: return spv::StorageClass::Function;
  1309. case glslang::EvqShared: return spv::StorageClass::Workgroup;
  1310. case glslang::EvqPayload: return spv::StorageClass::RayPayloadKHR;
  1311. case glslang::EvqPayloadIn: return spv::StorageClass::IncomingRayPayloadKHR;
  1312. case glslang::EvqHitAttr: return spv::StorageClass::HitAttributeKHR;
  1313. case glslang::EvqCallableData: return spv::StorageClass::CallableDataKHR;
  1314. case glslang::EvqCallableDataIn: return spv::StorageClass::IncomingCallableDataKHR;
  1315. case glslang::EvqtaskPayloadSharedEXT : return spv::StorageClass::TaskPayloadWorkgroupEXT;
  1316. case glslang::EvqHitObjectAttrNV: return spv::StorageClass::HitObjectAttributeNV;
  1317. case glslang::EvqHitObjectAttrEXT: return spv::StorageClass::HitObjectAttributeEXT;
  1318. case glslang::EvqSpirvStorageClass: return static_cast<spv::StorageClass>(type.getQualifier().spirvStorageClass);
  1319. default:
  1320. assert(0);
  1321. break;
  1322. }
  1323. return spv::StorageClass::Function;
  1324. }
  1325. // Translate glslang constants to SPIR-V literals
  1326. void TGlslangToSpvTraverser::TranslateLiterals(const glslang::TVector<const glslang::TIntermConstantUnion*>& constants,
  1327. std::vector<unsigned>& literals) const
  1328. {
  1329. for (auto constant : constants) {
  1330. if (constant->getBasicType() == glslang::EbtFloat) {
  1331. float floatValue = static_cast<float>(constant->getConstArray()[0].getDConst());
  1332. unsigned literal;
  1333. static_assert(sizeof(literal) == sizeof(floatValue), "sizeof(unsigned) != sizeof(float)");
  1334. memcpy(&literal, &floatValue, sizeof(literal));
  1335. literals.push_back(literal);
  1336. } else if (constant->getBasicType() == glslang::EbtInt) {
  1337. unsigned literal = constant->getConstArray()[0].getIConst();
  1338. literals.push_back(literal);
  1339. } else if (constant->getBasicType() == glslang::EbtUint) {
  1340. unsigned literal = constant->getConstArray()[0].getUConst();
  1341. literals.push_back(literal);
  1342. } else if (constant->getBasicType() == glslang::EbtBool) {
  1343. unsigned literal = constant->getConstArray()[0].getBConst();
  1344. literals.push_back(literal);
  1345. } else if (constant->getBasicType() == glslang::EbtString) {
  1346. auto str = constant->getConstArray()[0].getSConst()->c_str();
  1347. unsigned literal = 0;
  1348. char* literalPtr = reinterpret_cast<char*>(&literal);
  1349. unsigned charCount = 0;
  1350. char ch = 0;
  1351. do {
  1352. ch = *(str++);
  1353. *(literalPtr++) = ch;
  1354. ++charCount;
  1355. if (charCount == 4) {
  1356. literals.push_back(literal);
  1357. literalPtr = reinterpret_cast<char*>(&literal);
  1358. charCount = 0;
  1359. }
  1360. } while (ch != 0);
  1361. // Partial literal is padded with 0
  1362. if (charCount > 0) {
  1363. for (; charCount < 4; ++charCount)
  1364. *(literalPtr++) = 0;
  1365. literals.push_back(literal);
  1366. }
  1367. } else
  1368. assert(0); // Unexpected type
  1369. }
  1370. }
  1371. // Add capabilities pertaining to how an array is indexed.
  1372. void TGlslangToSpvTraverser::addIndirectionIndexCapabilities(const glslang::TType& baseType,
  1373. const glslang::TType& indexType)
  1374. {
  1375. if (indexType.getQualifier().isNonUniform()) {
  1376. // deal with an asserted non-uniform index
  1377. // SPV_EXT_descriptor_indexing already added in TranslateNonUniformDecoration
  1378. if (baseType.getBasicType() == glslang::EbtSampler) {
  1379. if (baseType.getQualifier().hasAttachment())
  1380. builder.addCapability(spv::Capability::InputAttachmentArrayNonUniformIndexingEXT);
  1381. else if (baseType.isImage() && baseType.getSampler().isBuffer())
  1382. builder.addCapability(spv::Capability::StorageTexelBufferArrayNonUniformIndexingEXT);
  1383. else if (baseType.isTexture() && baseType.getSampler().isBuffer())
  1384. builder.addCapability(spv::Capability::UniformTexelBufferArrayNonUniformIndexingEXT);
  1385. else if (baseType.isImage())
  1386. builder.addCapability(spv::Capability::StorageImageArrayNonUniformIndexingEXT);
  1387. else if (baseType.isTexture())
  1388. builder.addCapability(spv::Capability::SampledImageArrayNonUniformIndexingEXT);
  1389. } else if (baseType.getBasicType() == glslang::EbtBlock) {
  1390. if (baseType.getQualifier().storage == glslang::EvqBuffer)
  1391. builder.addCapability(spv::Capability::StorageBufferArrayNonUniformIndexingEXT);
  1392. else if (baseType.getQualifier().storage == glslang::EvqUniform)
  1393. builder.addCapability(spv::Capability::UniformBufferArrayNonUniformIndexingEXT);
  1394. }
  1395. } else {
  1396. // assume a dynamically uniform index
  1397. if (baseType.getBasicType() == glslang::EbtSampler) {
  1398. if (baseType.getQualifier().hasAttachment()) {
  1399. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  1400. builder.addCapability(spv::Capability::InputAttachmentArrayDynamicIndexingEXT);
  1401. } else if (baseType.isImage() && baseType.getSampler().isBuffer()) {
  1402. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  1403. builder.addCapability(spv::Capability::StorageTexelBufferArrayDynamicIndexingEXT);
  1404. } else if (baseType.isTexture() && baseType.getSampler().isBuffer()) {
  1405. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  1406. builder.addCapability(spv::Capability::UniformTexelBufferArrayDynamicIndexingEXT);
  1407. }
  1408. }
  1409. }
  1410. }
  1411. // Return whether or not the given type is something that should be tied to a
  1412. // descriptor set.
  1413. bool IsDescriptorResource(const glslang::TType& type)
  1414. {
  1415. // uniform and buffer blocks are included, unless it is a push_constant
  1416. if (type.getBasicType() == glslang::EbtBlock)
  1417. return type.getQualifier().isUniformOrBuffer() &&
  1418. ! type.getQualifier().isShaderRecord() &&
  1419. ! type.getQualifier().isPushConstant();
  1420. // non block...
  1421. // basically samplerXXX/subpass/sampler/texture are all included
  1422. // if they are the global-scope-class, not the function parameter
  1423. // (or local, if they ever exist) class.
  1424. if (type.getBasicType() == glslang::EbtSampler ||
  1425. type.getBasicType() == glslang::EbtAccStruct)
  1426. return type.getQualifier().isUniformOrBuffer();
  1427. // Tensors are tied to a descriptor.
  1428. if (type.isTensorARM())
  1429. return true;
  1430. // None of the above.
  1431. return false;
  1432. }
  1433. void InheritQualifiers(glslang::TQualifier& child, const glslang::TQualifier& parent)
  1434. {
  1435. if (child.layoutMatrix == glslang::ElmNone)
  1436. child.layoutMatrix = parent.layoutMatrix;
  1437. if (parent.invariant)
  1438. child.invariant = true;
  1439. if (parent.flat)
  1440. child.flat = true;
  1441. if (parent.centroid)
  1442. child.centroid = true;
  1443. if (parent.nopersp)
  1444. child.nopersp = true;
  1445. if (parent.explicitInterp)
  1446. child.explicitInterp = true;
  1447. if (parent.perPrimitiveNV)
  1448. child.perPrimitiveNV = true;
  1449. if (parent.perViewNV)
  1450. child.perViewNV = true;
  1451. if (parent.perTaskNV)
  1452. child.perTaskNV = true;
  1453. if (parent.storage == glslang::EvqtaskPayloadSharedEXT)
  1454. child.storage = glslang::EvqtaskPayloadSharedEXT;
  1455. if (parent.patch)
  1456. child.patch = true;
  1457. if (parent.sample)
  1458. child.sample = true;
  1459. if (parent.coherent)
  1460. child.coherent = true;
  1461. if (parent.devicecoherent)
  1462. child.devicecoherent = true;
  1463. if (parent.queuefamilycoherent)
  1464. child.queuefamilycoherent = true;
  1465. if (parent.workgroupcoherent)
  1466. child.workgroupcoherent = true;
  1467. if (parent.subgroupcoherent)
  1468. child.subgroupcoherent = true;
  1469. if (parent.shadercallcoherent)
  1470. child.shadercallcoherent = true;
  1471. if (parent.nonprivate)
  1472. child.nonprivate = true;
  1473. if (parent.volatil)
  1474. child.volatil = true;
  1475. if (parent.nontemporal)
  1476. child.nontemporal = true;
  1477. if (parent.restrict)
  1478. child.restrict = true;
  1479. if (parent.readonly)
  1480. child.readonly = true;
  1481. if (parent.writeonly)
  1482. child.writeonly = true;
  1483. if (parent.nonUniform)
  1484. child.nonUniform = true;
  1485. }
  1486. bool HasNonLayoutQualifiers(const glslang::TType& type, const glslang::TQualifier& qualifier)
  1487. {
  1488. // This should list qualifiers that simultaneous satisfy:
  1489. // - struct members might inherit from a struct declaration
  1490. // (note that non-block structs don't explicitly inherit,
  1491. // only implicitly, meaning no decoration involved)
  1492. // - affect decorations on the struct members
  1493. // (note smooth does not, and expecting something like volatile
  1494. // to effect the whole object)
  1495. // - are not part of the offset/st430/etc or row/column-major layout
  1496. return qualifier.invariant || (qualifier.hasLocation() && type.getBasicType() == glslang::EbtBlock);
  1497. }
  1498. //
  1499. // Implement the TGlslangToSpvTraverser class.
  1500. //
  1501. TGlslangToSpvTraverser::TGlslangToSpvTraverser(unsigned int spvVersion,
  1502. const glslang::TIntermediate* glslangIntermediate,
  1503. spv::SpvBuildLogger* buildLogger, glslang::SpvOptions& options) :
  1504. TIntermTraverser(true, false, true),
  1505. options(options),
  1506. shaderEntry(nullptr), currentFunction(nullptr),
  1507. sequenceDepth(0), logger(buildLogger),
  1508. builder(spvVersion, (glslang::GetKhronosToolId() << 16) | glslang::GetSpirvGeneratorVersion(), logger),
  1509. inEntryPoint(false), entryPointTerminated(false), linkageOnly(false),
  1510. glslangIntermediate(glslangIntermediate),
  1511. nanMinMaxClamp(glslangIntermediate->getNanMinMaxClamp()),
  1512. nonSemanticDebugPrintf(0),
  1513. taskPayloadID(0)
  1514. {
  1515. bool isMeshShaderExt = (glslangIntermediate->getRequestedExtensions().find(glslang::E_GL_EXT_mesh_shader) !=
  1516. glslangIntermediate->getRequestedExtensions().end());
  1517. spv::ExecutionModel executionModel = TranslateExecutionModel(glslangIntermediate->getStage(), isMeshShaderExt);
  1518. builder.clearAccessChain();
  1519. builder.setSource(TranslateSourceLanguage(glslangIntermediate->getSource(), glslangIntermediate->getProfile()),
  1520. glslangIntermediate->getVersion());
  1521. if (options.emitNonSemanticShaderDebugSource)
  1522. this->options.emitNonSemanticShaderDebugInfo = true;
  1523. if (options.emitNonSemanticShaderDebugInfo)
  1524. this->options.generateDebugInfo = true;
  1525. if (this->options.generateDebugInfo) {
  1526. if (this->options.emitNonSemanticShaderDebugInfo) {
  1527. builder.setEmitNonSemanticShaderDebugInfo(this->options.emitNonSemanticShaderDebugSource);
  1528. }
  1529. else {
  1530. builder.setEmitSpirvDebugInfo();
  1531. }
  1532. builder.setDebugMainSourceFile(glslangIntermediate->getSourceFile());
  1533. // Set the source shader's text. If for SPV version 1.0, include
  1534. // a preamble in comments stating the OpModuleProcessed instructions.
  1535. // Otherwise, emit those as actual instructions.
  1536. std::string text;
  1537. const std::vector<std::string>& processes = glslangIntermediate->getProcesses();
  1538. for (int p = 0; p < (int)processes.size(); ++p) {
  1539. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1) {
  1540. text.append("// OpModuleProcessed ");
  1541. text.append(processes[p]);
  1542. text.append("\n");
  1543. } else
  1544. builder.addModuleProcessed(processes[p]);
  1545. }
  1546. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1 && (int)processes.size() > 0)
  1547. text.append("#line 1\n");
  1548. text.append(glslangIntermediate->getSourceText());
  1549. builder.setSourceText(text);
  1550. // Pass name and text for all included files
  1551. const std::map<std::string, std::string>& include_txt = glslangIntermediate->getIncludeText();
  1552. for (auto iItr = include_txt.begin(); iItr != include_txt.end(); ++iItr)
  1553. builder.addInclude(iItr->first, iItr->second);
  1554. }
  1555. builder.setUseReplicatedComposites(glslangIntermediate->usingReplicatedComposites());
  1556. stdBuiltins = builder.import("GLSL.std.450");
  1557. spv::AddressingModel addressingModel = spv::AddressingModel::Logical;
  1558. spv::MemoryModel memoryModel = spv::MemoryModel::GLSL450;
  1559. if (glslangIntermediate->usingPhysicalStorageBuffer()) {
  1560. addressingModel = spv::AddressingModel::PhysicalStorageBuffer64EXT;
  1561. builder.addIncorporatedExtension(spv::E_SPV_KHR_physical_storage_buffer, spv::Spv_1_5);
  1562. builder.addCapability(spv::Capability::PhysicalStorageBufferAddressesEXT);
  1563. }
  1564. if (glslangIntermediate->usingVulkanMemoryModel()) {
  1565. memoryModel = spv::MemoryModel::VulkanKHR;
  1566. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  1567. builder.addIncorporatedExtension(spv::E_SPV_KHR_vulkan_memory_model, spv::Spv_1_5);
  1568. }
  1569. builder.setMemoryModel(addressingModel, memoryModel);
  1570. if (glslangIntermediate->usingVariablePointers()) {
  1571. builder.addCapability(spv::Capability::VariablePointers);
  1572. }
  1573. // If not linking, there is no entry point
  1574. if (!options.compileOnly) {
  1575. shaderEntry = builder.makeEntryPoint(glslangIntermediate->getEntryPointName().c_str());
  1576. entryPoint =
  1577. builder.addEntryPoint(executionModel, shaderEntry, glslangIntermediate->getEntryPointName().c_str());
  1578. }
  1579. // Add the source extensions
  1580. const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();
  1581. for (auto it = sourceExtensions.begin(); it != sourceExtensions.end(); ++it)
  1582. builder.addSourceExtension(it->c_str());
  1583. // Add the top-level modes for this shader.
  1584. if (glslangIntermediate->getXfbMode()) {
  1585. builder.addCapability(spv::Capability::TransformFeedback);
  1586. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Xfb);
  1587. }
  1588. if (glslangIntermediate->getLayoutPrimitiveCulling()) {
  1589. builder.addCapability(spv::Capability::RayTraversalPrimitiveCullingKHR);
  1590. }
  1591. if (glslangIntermediate->getSubgroupUniformControlFlow()) {
  1592. builder.addExtension(spv::E_SPV_KHR_subgroup_uniform_control_flow);
  1593. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::SubgroupUniformControlFlowKHR);
  1594. }
  1595. if (glslangIntermediate->getMaximallyReconverges()) {
  1596. builder.addExtension(spv::E_SPV_KHR_maximal_reconvergence);
  1597. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::MaximallyReconvergesKHR);
  1598. }
  1599. if (glslangIntermediate->getQuadDerivMode())
  1600. {
  1601. builder.addCapability(spv::Capability::QuadControlKHR);
  1602. builder.addExtension(spv::E_SPV_KHR_quad_control);
  1603. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::QuadDerivativesKHR);
  1604. }
  1605. if (glslangIntermediate->getReqFullQuadsMode())
  1606. {
  1607. builder.addCapability(spv::Capability::QuadControlKHR);
  1608. builder.addExtension(spv::E_SPV_KHR_quad_control);
  1609. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::RequireFullQuadsKHR);
  1610. }
  1611. if (glslangIntermediate->usingShader64BitIndexing())
  1612. {
  1613. builder.addCapability(spv::Capability::Shader64BitIndexingEXT);
  1614. builder.addExtension(spv::E_SPV_EXT_shader_64bit_indexing);
  1615. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Shader64BitIndexingEXT);
  1616. }
  1617. spv::ExecutionMode mode;
  1618. switch (glslangIntermediate->getStage()) {
  1619. case EShLangVertex:
  1620. builder.addCapability(spv::Capability::Shader);
  1621. break;
  1622. case EShLangFragment:
  1623. builder.addCapability(spv::Capability::Shader);
  1624. if (glslangIntermediate->getPixelCenterInteger())
  1625. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PixelCenterInteger);
  1626. if (glslangIntermediate->getOriginUpperLeft())
  1627. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OriginUpperLeft);
  1628. else
  1629. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OriginLowerLeft);
  1630. if (glslangIntermediate->getEarlyFragmentTests())
  1631. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::EarlyFragmentTests);
  1632. if (glslangIntermediate->getEarlyAndLateFragmentTestsAMD())
  1633. {
  1634. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::EarlyAndLateFragmentTestsAMD);
  1635. builder.addExtension(spv::E_SPV_AMD_shader_early_and_late_fragment_tests);
  1636. }
  1637. if (glslangIntermediate->getPostDepthCoverage()) {
  1638. builder.addCapability(spv::Capability::SampleMaskPostDepthCoverage);
  1639. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PostDepthCoverage);
  1640. builder.addExtension(spv::E_SPV_KHR_post_depth_coverage);
  1641. }
  1642. if (glslangIntermediate->getNonCoherentColorAttachmentReadEXT()) {
  1643. builder.addCapability(spv::Capability::TileImageColorReadAccessEXT);
  1644. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentColorAttachmentReadEXT);
  1645. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1646. }
  1647. if (glslangIntermediate->getNonCoherentDepthAttachmentReadEXT()) {
  1648. builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
  1649. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentDepthAttachmentReadEXT);
  1650. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1651. }
  1652. if (glslangIntermediate->getNonCoherentStencilAttachmentReadEXT()) {
  1653. builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
  1654. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentStencilAttachmentReadEXT);
  1655. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  1656. }
  1657. if (glslangIntermediate->getNonCoherentTileAttachmentReadQCOM()) {
  1658. builder.addCapability(spv::Capability::TileShadingQCOM);
  1659. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentTileAttachmentReadQCOM);
  1660. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1661. }
  1662. if (glslangIntermediate->isDepthReplacing())
  1663. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DepthReplacing);
  1664. if (glslangIntermediate->isStencilReplacing())
  1665. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::StencilRefReplacingEXT);
  1666. switch(glslangIntermediate->getDepth()) {
  1667. case glslang::EldGreater: mode = spv::ExecutionMode::DepthGreater; break;
  1668. case glslang::EldLess: mode = spv::ExecutionMode::DepthLess; break;
  1669. case glslang::EldUnchanged: mode = spv::ExecutionMode::DepthUnchanged; break;
  1670. default: mode = spv::ExecutionMode::Max; break;
  1671. }
  1672. if (mode != spv::ExecutionMode::Max)
  1673. builder.addExecutionMode(shaderEntry, mode);
  1674. switch (glslangIntermediate->getStencil()) {
  1675. case glslang::ElsRefUnchangedFrontAMD: mode = spv::ExecutionMode::StencilRefUnchangedFrontAMD; break;
  1676. case glslang::ElsRefGreaterFrontAMD: mode = spv::ExecutionMode::StencilRefGreaterFrontAMD; break;
  1677. case glslang::ElsRefLessFrontAMD: mode = spv::ExecutionMode::StencilRefLessFrontAMD; break;
  1678. case glslang::ElsRefUnchangedBackAMD: mode = spv::ExecutionMode::StencilRefUnchangedBackAMD; break;
  1679. case glslang::ElsRefGreaterBackAMD: mode = spv::ExecutionMode::StencilRefGreaterBackAMD; break;
  1680. case glslang::ElsRefLessBackAMD: mode = spv::ExecutionMode::StencilRefLessBackAMD; break;
  1681. default: mode = spv::ExecutionMode::Max; break;
  1682. }
  1683. if (mode != spv::ExecutionMode::Max)
  1684. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1685. switch (glslangIntermediate->getInterlockOrdering()) {
  1686. case glslang::EioPixelInterlockOrdered: mode = spv::ExecutionMode::PixelInterlockOrderedEXT;
  1687. break;
  1688. case glslang::EioPixelInterlockUnordered: mode = spv::ExecutionMode::PixelInterlockUnorderedEXT;
  1689. break;
  1690. case glslang::EioSampleInterlockOrdered: mode = spv::ExecutionMode::SampleInterlockOrderedEXT;
  1691. break;
  1692. case glslang::EioSampleInterlockUnordered: mode = spv::ExecutionMode::SampleInterlockUnorderedEXT;
  1693. break;
  1694. case glslang::EioShadingRateInterlockOrdered: mode = spv::ExecutionMode::ShadingRateInterlockOrderedEXT;
  1695. break;
  1696. case glslang::EioShadingRateInterlockUnordered: mode = spv::ExecutionMode::ShadingRateInterlockUnorderedEXT;
  1697. break;
  1698. default: mode = spv::ExecutionMode::Max;
  1699. break;
  1700. }
  1701. if (mode != spv::ExecutionMode::Max) {
  1702. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1703. if (mode == spv::ExecutionMode::ShadingRateInterlockOrderedEXT ||
  1704. mode == spv::ExecutionMode::ShadingRateInterlockUnorderedEXT) {
  1705. builder.addCapability(spv::Capability::FragmentShaderShadingRateInterlockEXT);
  1706. } else if (mode == spv::ExecutionMode::PixelInterlockOrderedEXT ||
  1707. mode == spv::ExecutionMode::PixelInterlockUnorderedEXT) {
  1708. builder.addCapability(spv::Capability::FragmentShaderPixelInterlockEXT);
  1709. } else {
  1710. builder.addCapability(spv::Capability::FragmentShaderSampleInterlockEXT);
  1711. }
  1712. builder.addExtension(spv::E_SPV_EXT_fragment_shader_interlock);
  1713. }
  1714. break;
  1715. case EShLangCompute: {
  1716. builder.addCapability(spv::Capability::Shader);
  1717. bool needSizeId = false;
  1718. for (int dim = 0; dim < 3; ++dim) {
  1719. if ((glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet)) {
  1720. needSizeId = true;
  1721. break;
  1722. }
  1723. }
  1724. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6 && needSizeId) {
  1725. std::vector<spv::Id> dimConstId;
  1726. for (int dim = 0; dim < 3; ++dim) {
  1727. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  1728. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  1729. if (specConst) {
  1730. builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
  1731. glslangIntermediate->getLocalSizeSpecId(dim));
  1732. needSizeId = true;
  1733. }
  1734. }
  1735. builder.addExecutionModeId(shaderEntry, spv::ExecutionMode::LocalSizeId, dimConstId);
  1736. } else {
  1737. if (glslangIntermediate->getTileShadingRateQCOM(0) >= 1 || glslangIntermediate->getTileShadingRateQCOM(1) >= 1 || glslangIntermediate->getTileShadingRateQCOM(2) >= 1) {
  1738. auto rate_x = glslangIntermediate->getTileShadingRateQCOM(0);
  1739. auto rate_y = glslangIntermediate->getTileShadingRateQCOM(1);
  1740. auto rate_z = glslangIntermediate->getTileShadingRateQCOM(2);
  1741. rate_x = ( rate_x == 0 ? 1 : rate_x );
  1742. rate_y = ( rate_y == 0 ? 1 : rate_y );
  1743. rate_z = ( rate_z == 0 ? 1 : rate_z );
  1744. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::TileShadingRateQCOM, rate_x, rate_y, rate_z);
  1745. } else {
  1746. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::LocalSize, glslangIntermediate->getLocalSize(0),
  1747. glslangIntermediate->getLocalSize(1),
  1748. glslangIntermediate->getLocalSize(2));
  1749. }
  1750. }
  1751. if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupQuads) {
  1752. builder.addCapability(spv::Capability::ComputeDerivativeGroupQuadsNV);
  1753. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DerivativeGroupQuadsNV);
  1754. builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);
  1755. } else if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupLinear) {
  1756. builder.addCapability(spv::Capability::ComputeDerivativeGroupLinearNV);
  1757. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DerivativeGroupLinearNV);
  1758. builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);
  1759. }
  1760. if (glslangIntermediate->getNonCoherentTileAttachmentReadQCOM()) {
  1761. builder.addCapability(spv::Capability::TileShadingQCOM);
  1762. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentTileAttachmentReadQCOM);
  1763. builder.addExtension(spv::E_SPV_QCOM_tile_shading);
  1764. }
  1765. break;
  1766. }
  1767. case EShLangTessEvaluation:
  1768. case EShLangTessControl:
  1769. builder.addCapability(spv::Capability::Tessellation);
  1770. glslang::TLayoutGeometry primitive;
  1771. if (glslangIntermediate->getStage() == EShLangTessControl) {
  1772. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices,
  1773. glslangIntermediate->getVertices());
  1774. primitive = glslangIntermediate->getOutputPrimitive();
  1775. } else {
  1776. primitive = glslangIntermediate->getInputPrimitive();
  1777. }
  1778. switch (primitive) {
  1779. case glslang::ElgTriangles: mode = spv::ExecutionMode::Triangles; break;
  1780. case glslang::ElgQuads: mode = spv::ExecutionMode::Quads; break;
  1781. case glslang::ElgIsolines: mode = spv::ExecutionMode::Isolines; break;
  1782. default: mode = spv::ExecutionMode::Max; break;
  1783. }
  1784. if (mode != spv::ExecutionMode::Max)
  1785. builder.addExecutionMode(shaderEntry, mode);
  1786. switch (glslangIntermediate->getVertexSpacing()) {
  1787. case glslang::EvsEqual: mode = spv::ExecutionMode::SpacingEqual; break;
  1788. case glslang::EvsFractionalEven: mode = spv::ExecutionMode::SpacingFractionalEven; break;
  1789. case glslang::EvsFractionalOdd: mode = spv::ExecutionMode::SpacingFractionalOdd; break;
  1790. default: mode = spv::ExecutionMode::Max; break;
  1791. }
  1792. if (mode != spv::ExecutionMode::Max)
  1793. builder.addExecutionMode(shaderEntry, mode);
  1794. switch (glslangIntermediate->getVertexOrder()) {
  1795. case glslang::EvoCw: mode = spv::ExecutionMode::VertexOrderCw; break;
  1796. case glslang::EvoCcw: mode = spv::ExecutionMode::VertexOrderCcw; break;
  1797. default: mode = spv::ExecutionMode::Max; break;
  1798. }
  1799. if (mode != spv::ExecutionMode::Max)
  1800. builder.addExecutionMode(shaderEntry, mode);
  1801. if (glslangIntermediate->getPointMode())
  1802. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PointMode);
  1803. break;
  1804. case EShLangGeometry:
  1805. builder.addCapability(spv::Capability::Geometry);
  1806. switch (glslangIntermediate->getInputPrimitive()) {
  1807. case glslang::ElgPoints: mode = spv::ExecutionMode::InputPoints; break;
  1808. case glslang::ElgLines: mode = spv::ExecutionMode::InputLines; break;
  1809. case glslang::ElgLinesAdjacency: mode = spv::ExecutionMode::InputLinesAdjacency; break;
  1810. case glslang::ElgTriangles: mode = spv::ExecutionMode::Triangles; break;
  1811. case glslang::ElgTrianglesAdjacency: mode = spv::ExecutionMode::InputTrianglesAdjacency; break;
  1812. default: mode = spv::ExecutionMode::Max; break;
  1813. }
  1814. if (mode != spv::ExecutionMode::Max)
  1815. builder.addExecutionMode(shaderEntry, mode);
  1816. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Invocations, glslangIntermediate->getInvocations());
  1817. switch (glslangIntermediate->getOutputPrimitive()) {
  1818. case glslang::ElgPoints: mode = spv::ExecutionMode::OutputPoints; break;
  1819. case glslang::ElgLineStrip: mode = spv::ExecutionMode::OutputLineStrip; break;
  1820. case glslang::ElgTriangleStrip: mode = spv::ExecutionMode::OutputTriangleStrip; break;
  1821. default: mode = spv::ExecutionMode::Max; break;
  1822. }
  1823. if (mode != spv::ExecutionMode::Max)
  1824. builder.addExecutionMode(shaderEntry, mode);
  1825. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices, glslangIntermediate->getVertices());
  1826. break;
  1827. case EShLangRayGen:
  1828. case EShLangIntersect:
  1829. case EShLangAnyHit:
  1830. case EShLangClosestHit:
  1831. case EShLangMiss:
  1832. case EShLangCallable:
  1833. {
  1834. auto& extensions = glslangIntermediate->getRequestedExtensions();
  1835. if (extensions.find("GL_EXT_opacity_micromap") != extensions.end()) {
  1836. builder.addCapability(spv::Capability::RayTracingOpacityMicromapEXT);
  1837. builder.addExtension("SPV_EXT_opacity_micromap");
  1838. }
  1839. if (extensions.find("GL_NV_ray_tracing") == extensions.end()) {
  1840. builder.addCapability(spv::Capability::RayTracingKHR);
  1841. builder.addExtension("SPV_KHR_ray_tracing");
  1842. }
  1843. else {
  1844. builder.addCapability(spv::Capability::RayTracingNV);
  1845. builder.addExtension("SPV_NV_ray_tracing");
  1846. }
  1847. if (glslangIntermediate->getStage() != EShLangRayGen && glslangIntermediate->getStage() != EShLangCallable) {
  1848. if (extensions.find("GL_EXT_ray_cull_mask") != extensions.end()) {
  1849. builder.addCapability(spv::Capability::RayCullMaskKHR);
  1850. builder.addExtension("SPV_KHR_ray_cull_mask");
  1851. }
  1852. if (extensions.find("GL_EXT_ray_tracing_position_fetch") != extensions.end()) {
  1853. builder.addCapability(spv::Capability::RayTracingPositionFetchKHR);
  1854. builder.addExtension("SPV_KHR_ray_tracing_position_fetch");
  1855. }
  1856. }
  1857. break;
  1858. }
  1859. case EShLangTask:
  1860. case EShLangMesh:
  1861. if(isMeshShaderExt) {
  1862. builder.addCapability(spv::Capability::MeshShadingEXT);
  1863. builder.addExtension(spv::E_SPV_EXT_mesh_shader);
  1864. } else {
  1865. builder.addCapability(spv::Capability::MeshShadingNV);
  1866. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  1867. }
  1868. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  1869. std::vector<spv::Id> dimConstId;
  1870. for (int dim = 0; dim < 3; ++dim) {
  1871. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  1872. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  1873. if (specConst) {
  1874. builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
  1875. glslangIntermediate->getLocalSizeSpecId(dim));
  1876. }
  1877. }
  1878. builder.addExecutionModeId(shaderEntry, spv::ExecutionMode::LocalSizeId, dimConstId);
  1879. } else {
  1880. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::LocalSize, glslangIntermediate->getLocalSize(0),
  1881. glslangIntermediate->getLocalSize(1),
  1882. glslangIntermediate->getLocalSize(2));
  1883. }
  1884. if (glslangIntermediate->getStage() == EShLangMesh) {
  1885. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices,
  1886. glslangIntermediate->getVertices());
  1887. builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputPrimitivesNV,
  1888. glslangIntermediate->getPrimitives());
  1889. switch (glslangIntermediate->getOutputPrimitive()) {
  1890. case glslang::ElgPoints: mode = spv::ExecutionMode::OutputPoints; break;
  1891. case glslang::ElgLines: mode = spv::ExecutionMode::OutputLinesNV; break;
  1892. case glslang::ElgTriangles: mode = spv::ExecutionMode::OutputTrianglesNV; break;
  1893. default: mode = spv::ExecutionMode::Max; break;
  1894. }
  1895. if (mode != spv::ExecutionMode::Max)
  1896. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1897. }
  1898. break;
  1899. default:
  1900. break;
  1901. }
  1902. //
  1903. // Add SPIR-V requirements (GL_EXT_spirv_intrinsics)
  1904. //
  1905. if (glslangIntermediate->hasSpirvRequirement()) {
  1906. const glslang::TSpirvRequirement& spirvRequirement = glslangIntermediate->getSpirvRequirement();
  1907. // Add SPIR-V extension requirement
  1908. for (auto& extension : spirvRequirement.extensions)
  1909. builder.addExtension(extension.c_str());
  1910. // Add SPIR-V capability requirement
  1911. for (auto capability : spirvRequirement.capabilities)
  1912. builder.addCapability(static_cast<spv::Capability>(capability));
  1913. }
  1914. //
  1915. // Add SPIR-V execution mode qualifiers (GL_EXT_spirv_intrinsics)
  1916. //
  1917. if (glslangIntermediate->hasSpirvExecutionMode()) {
  1918. const glslang::TSpirvExecutionMode spirvExecutionMode = glslangIntermediate->getSpirvExecutionMode();
  1919. // Add spirv_execution_mode
  1920. for (auto& mode : spirvExecutionMode.modes) {
  1921. if (!mode.second.empty()) {
  1922. std::vector<unsigned> literals;
  1923. TranslateLiterals(mode.second, literals);
  1924. builder.addExecutionMode(shaderEntry, static_cast<spv::ExecutionMode>(mode.first), literals);
  1925. } else
  1926. builder.addExecutionMode(shaderEntry, static_cast<spv::ExecutionMode>(mode.first));
  1927. }
  1928. // Add spirv_execution_mode_id
  1929. for (auto& modeId : spirvExecutionMode.modeIds) {
  1930. std::vector<spv::Id> operandIds;
  1931. assert(!modeId.second.empty());
  1932. for (auto extraOperand : modeId.second) {
  1933. if (extraOperand->getType().getQualifier().isSpecConstant())
  1934. operandIds.push_back(getSymbolId(extraOperand->getAsSymbolNode()));
  1935. else
  1936. operandIds.push_back(createSpvConstant(*extraOperand));
  1937. }
  1938. builder.addExecutionModeId(shaderEntry, static_cast<spv::ExecutionMode>(modeId.first), operandIds);
  1939. }
  1940. }
  1941. }
  1942. // Finish creating SPV, after the traversal is complete.
  1943. void TGlslangToSpvTraverser::finishSpv(bool compileOnly)
  1944. {
  1945. // If not linking, an entry point is not expected
  1946. if (!compileOnly) {
  1947. // Finish the entry point function
  1948. if (!entryPointTerminated) {
  1949. builder.setBuildPoint(shaderEntry->getLastBlock());
  1950. builder.leaveFunction();
  1951. }
  1952. // finish off the entry-point SPV instruction by adding the Input/Output <id>
  1953. entryPoint->reserveOperands(iOSet.size());
  1954. for (auto id : iOSet)
  1955. entryPoint->addIdOperand(id);
  1956. }
  1957. // Add capabilities, extensions, remove unneeded decorations, etc.,
  1958. // based on the resulting SPIR-V.
  1959. // Note: WebGPU code generation must have the opportunity to aggressively
  1960. // prune unreachable merge blocks and continue targets.
  1961. builder.postProcess(compileOnly);
  1962. }
  1963. // Write the SPV into 'out'.
  1964. void TGlslangToSpvTraverser::dumpSpv(std::vector<unsigned int>& out)
  1965. {
  1966. builder.dump(out);
  1967. }
  1968. //
  1969. // Implement the traversal functions.
  1970. //
  1971. // Return true from interior nodes to have the external traversal
  1972. // continue on to children. Return false if children were
  1973. // already processed.
  1974. //
  1975. //
  1976. // Symbols can turn into
  1977. // - uniform/input reads
  1978. // - output writes
  1979. // - complex lvalue base setups: foo.bar[3].... , where we see foo and start up an access chain
  1980. // - something simple that degenerates into the last bullet
  1981. //
  1982. void TGlslangToSpvTraverser::visitSymbol(glslang::TIntermSymbol* symbol)
  1983. {
  1984. // We update the line information even though no code might be generated here
  1985. // This is helpful to yield correct lines for control flow instructions
  1986. if (!linkageOnly) {
  1987. builder.setDebugSourceLocation(symbol->getLoc().line, symbol->getLoc().getFilename());
  1988. }
  1989. if (symbol->getBasicType() == glslang::EbtFunction) {
  1990. return;
  1991. }
  1992. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  1993. if (symbol->getType().isStruct())
  1994. glslangTypeToIdMap[symbol->getType().getStruct()] = symbol->getId();
  1995. if (symbol->getType().getQualifier().isSpecConstant())
  1996. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  1997. #ifdef ENABLE_HLSL
  1998. // Skip symbol handling if it is string-typed
  1999. if (symbol->getBasicType() == glslang::EbtString)
  2000. return;
  2001. #endif
  2002. // getSymbolId() will set up all the IO decorations on the first call.
  2003. // Formal function parameters were mapped during makeFunctions().
  2004. spv::Id id = getSymbolId(symbol);
  2005. if (symbol->getType().getQualifier().isTaskPayload())
  2006. taskPayloadID = id; // cache the taskPayloadID to be used it as operand for OpEmitMeshTasksEXT
  2007. if (builder.isPointer(id)) {
  2008. if (!symbol->getType().getQualifier().isParamInput() &&
  2009. !symbol->getType().getQualifier().isParamOutput()) {
  2010. // Include all "static use" and "linkage only" interface variables on the OpEntryPoint instruction
  2011. // Consider adding to the OpEntryPoint interface list.
  2012. // Only looking at structures if they have at least one member.
  2013. if (!symbol->getType().isStruct() || symbol->getType().getStruct()->size() > 0) {
  2014. spv::StorageClass sc = builder.getStorageClass(id);
  2015. // Before SPIR-V 1.4, we only want to include Input and Output.
  2016. // Starting with SPIR-V 1.4, we want all globals.
  2017. if ((glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4 && builder.isGlobalVariable(id)) ||
  2018. (sc == spv::StorageClass::Input || sc == spv::StorageClass::Output)) {
  2019. iOSet.insert(id);
  2020. }
  2021. }
  2022. }
  2023. // If the SPIR-V type is required to be different than the AST type
  2024. // (for ex SubgroupMasks or 3x4 ObjectToWorld/WorldToObject matrices),
  2025. // translate now from the SPIR-V type to the AST type, for the consuming
  2026. // operation.
  2027. // Note this turns it from an l-value to an r-value.
  2028. // Currently, all symbols needing this are inputs; avoid the map lookup when non-input.
  2029. if (symbol->getType().getQualifier().storage == glslang::EvqVaryingIn)
  2030. id = translateForcedType(id);
  2031. }
  2032. // Only process non-linkage-only nodes for generating actual static uses
  2033. if (! linkageOnly || symbol->getQualifier().isSpecConstant()) {
  2034. // Prepare to generate code for the access
  2035. // L-value chains will be computed left to right. We're on the symbol now,
  2036. // which is the left-most part of the access chain, so now is "clear" time,
  2037. // followed by setting the base.
  2038. builder.clearAccessChain();
  2039. // For now, we consider all user variables as being in memory, so they are pointers,
  2040. // except for
  2041. // A) R-Value arguments to a function, which are an intermediate object.
  2042. // See comments in handleUserFunctionCall().
  2043. // B) Specialization constants (normal constants don't even come in as a variable),
  2044. // These are also pure R-values.
  2045. // C) R-Values from type translation, see above call to translateForcedType()
  2046. glslang::TQualifier qualifier = symbol->getQualifier();
  2047. if (qualifier.isSpecConstant() || rValueParameters.find(symbol->getId()) != rValueParameters.end() ||
  2048. (!builder.isPointerType(builder.getTypeId(id)) && !builder.isUntypedPointer(id)))
  2049. builder.setAccessChainRValue(id);
  2050. else
  2051. builder.setAccessChainLValue(id);
  2052. }
  2053. #ifdef ENABLE_HLSL
  2054. // Process linkage-only nodes for any special additional interface work.
  2055. if (linkageOnly) {
  2056. if (glslangIntermediate->getHlslFunctionality1()) {
  2057. // Map implicit counter buffers to their originating buffers, which should have been
  2058. // seen by now, given earlier pruning of unused counters, and preservation of order
  2059. // of declaration.
  2060. if (symbol->getType().getQualifier().isUniformOrBuffer()) {
  2061. if (!glslangIntermediate->hasCounterBufferName(symbol->getName())) {
  2062. // Save possible originating buffers for counter buffers, keyed by
  2063. // making the potential counter-buffer name.
  2064. std::string keyName = symbol->getName().c_str();
  2065. keyName = glslangIntermediate->addCounterBufferName(keyName);
  2066. counterOriginator[keyName] = symbol;
  2067. } else {
  2068. // Handle a counter buffer, by finding the saved originating buffer.
  2069. std::string keyName = symbol->getName().c_str();
  2070. auto it = counterOriginator.find(keyName);
  2071. if (it != counterOriginator.end()) {
  2072. id = getSymbolId(it->second);
  2073. if (id != spv::NoResult) {
  2074. spv::Id counterId = getSymbolId(symbol);
  2075. if (counterId != spv::NoResult) {
  2076. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  2077. builder.addDecorationId(id, spv::Decoration::HlslCounterBufferGOOGLE, counterId);
  2078. }
  2079. }
  2080. }
  2081. }
  2082. }
  2083. }
  2084. }
  2085. #endif
  2086. }
  2087. // Create new untyped access chain instruction to descriptor heap, based on EXT_descriptor_heap extension.
  2088. void TGlslangToSpvTraverser::recordDescHeapAccessChainInfo(glslang::TIntermBinary* node)
  2089. {
  2090. // EXT_descriptor_heap
  2091. glslang::TType* nodeTy = node->getWritableType().clone();
  2092. // For buffer/structure type, using its basic structure type:
  2093. // data ptr will be first loaded into a BufferPointerType before finally gets chained accessed.
  2094. if (node->getLeft()->getQualifier().isUniformOrBuffer())
  2095. nodeTy = node->getLeft()->getType().clone();
  2096. if (nodeTy->isArray())
  2097. nodeTy->clearArraySizes();
  2098. spv::BuiltIn bt = spv::BuiltIn::Max;
  2099. unsigned int firstArrIndex = 0;
  2100. auto rsrcOffsetIdx = builder.isStructureHeapMember(builder.getTypeId(builder.getAccessChain().base),
  2101. builder.getAccessChain().indexChain, 0, &bt, &firstArrIndex);
  2102. spv::Id remappedBuiltin = bt == spv::BuiltIn::Max ? 0 : builtInVariableIds[unsigned(bt)];
  2103. nodeTy->getQualifier().layoutDescriptorInnerBlock = false;
  2104. // Extra dimension is not needed when translate storage and type. Real loading type is based on orignal AST nodes.
  2105. builder.setAccessChainDescHeapInfo(TranslateStorageClass(*nodeTy), convertGlslangToSpvType(*nodeTy),
  2106. nodeTy->getQualifier().layoutDescriptorStride, rsrcOffsetIdx, remappedBuiltin, firstArrIndex);
  2107. }
  // Translate a binary AST node into SPIR-V through 'builder'.
  //
  // Assignments (plain and compound), constant and variable indexing, vector
  // swizzles, and short-circuiting logical operators are handled as special
  // cases in the switch below; each of those traverses its own children
  // explicitly. Everything else falls through to the generic path at the
  // bottom, which loads both operands and calls createBinaryOperation().
  //
  // Returns false when the node was handled here. Returns true after logging
  // missing functionality (matrix swizzle, or an operator that
  // createBinaryOperation() did not produce a result for).
  2108. bool TGlslangToSpvTraverser::visitBinary(glslang::TVisit /* visit */, glslang::TIntermBinary* node)
  2109. {
  2110. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  // Remember which symbol id each struct-typed symbol operand came from; the map is
  // consulted below (EOpIndexDirectStruct on a block) to find a member remapper.
  2111. if (node->getLeft()->getAsSymbolNode() != nullptr && node->getLeft()->getType().isStruct()) {
  2112. glslangTypeToIdMap[node->getLeft()->getType().getStruct()] = node->getLeft()->getAsSymbolNode()->getId();
  2113. }
  2114. if (node->getRight()->getAsSymbolNode() != nullptr && node->getRight()->getType().isStruct()) {
  2115. glslangTypeToIdMap[node->getRight()->getType().getStruct()] = node->getRight()->getAsSymbolNode()->getId();
  2116. }
  // Turn on spec-constant-op mode for nodes whose result is qualified as a specialization constant.
  2117. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2118. if (node->getType().getQualifier().isSpecConstant())
  2119. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2120. // First, handle special cases
  2121. switch (node->getOp()) {
  2122. case glslang::EOpAssign:
  2123. case glslang::EOpAddAssign:
  2124. case glslang::EOpSubAssign:
  2125. case glslang::EOpMulAssign:
  2126. case glslang::EOpVectorTimesMatrixAssign:
  2127. case glslang::EOpVectorTimesScalarAssign:
  2128. case glslang::EOpMatrixTimesScalarAssign:
  2129. case glslang::EOpMatrixTimesMatrixAssign:
  2130. case glslang::EOpDivAssign:
  2131. case glslang::EOpModAssign:
  2132. case glslang::EOpAndAssign:
  2133. case glslang::EOpInclusiveOrAssign:
  2134. case glslang::EOpExclusiveOrAssign:
  2135. case glslang::EOpLeftShiftAssign:
  2136. case glslang::EOpRightShiftAssign:
  2137. // A bin-op assign "a += b" means the same thing as "a = a + b"
  2138. // where a is evaluated before b. For a simple assignment, GLSL
  2139. // says to evaluate the left before the right. So, always, left
  2140. // node then right node.
  2141. {
  2142. // get the left l-value, save it away
  2143. builder.clearAccessChain();
  2144. node->getLeft()->traverse(this);
  2145. spv::Builder::AccessChain lValue = builder.getAccessChain();
  2146. // evaluate the right
  2147. builder.clearAccessChain();
  2148. node->getRight()->traverse(this);
  2149. spv::Id rValue = accessChainLoad(node->getRight()->getType());
  2150. // reset line number for assignment
  2151. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2152. if (node->getOp() != glslang::EOpAssign) {
  2153. // the left is also an r-value
  2154. builder.setAccessChain(lValue);
  2155. spv::Id leftRValue = accessChainLoad(node->getLeft()->getType());
  2156. // do the operation
  // The non-uniform decoration is derived from the combined flags of both operands.
  2157. spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(node->getLeft()->getType());
  2158. coherentFlags |= TranslateCoherent(node->getRight()->getType());
  2159. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2160. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2161. TranslateNonUniformDecoration(coherentFlags) };
  2162. rValue = createBinaryOperation(node->getOp(), decorations,
  2163. convertGlslangToSpvType(node->getType()), leftRValue, rValue,
  2164. node->getType().getBasicType());
  2165. // these all need their counterparts in createBinaryOperation()
  2166. assert(rValue != spv::NoResult);
  2167. }
  2168. // store the result
  2169. builder.setAccessChain(lValue);
  2170. multiTypeStore(node->getLeft()->getType(), rValue);
  2171. // assignments are expressions having an rValue after they are evaluated...
  2172. builder.clearAccessChain();
  2173. builder.setAccessChainRValue(rValue);
  2174. }
  2175. return false;
  2176. case glslang::EOpIndexDirect:
  2177. case glslang::EOpIndexDirectStruct:
  2178. {
  2179. // Structure, array, matrix, or vector indirection with statically known index.
  2180. // Get the left part of the access chain.
  2181. node->getLeft()->traverse(this);
  2182. // Add the next element in the chain
  2183. const int glslangIndex = node->getRight()->getAsConstantUnion()->getConstArray()[0].getIConst();
  2184. if (! node->getLeft()->getType().isArray() &&
  2185. node->getLeft()->getType().isVector() &&
  2186. node->getOp() == glslang::EOpIndexDirect) {
  2187. // Swizzle is uniform so propagate uniform into access chain
  2188. spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(node->getLeft()->getType());
  2189. coherentFlags.nonUniform = 0;
  2190. // This is essentially a hard-coded vector swizzle of size 1,
  2191. // so short circuit the access-chain stuff with a swizzle.
  2192. std::vector<unsigned> swizzle;
  2193. swizzle.push_back(glslangIndex);
  // Only the alignment returned by getBaseAlignmentScalar() is used; the size output is discarded.
  2194. int dummySize;
  2195. builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(node->getLeft()->getType()),
  2196. coherentFlags,
  2197. glslangIntermediate->getBaseAlignmentScalar(
  2198. node->getLeft()->getType(), dummySize));
  2199. } else {
  2200. // Load through a block reference is performed with a dot operator that
  2201. // is mapped to EOpIndexDirectStruct. When we get to the actual reference,
  2202. // do a load and reset the access chain.
  2203. if (node->getLeft()->isReference() &&
  2204. !node->getLeft()->getType().isArray() &&
  2205. node->getOp() == glslang::EOpIndexDirectStruct)
  2206. {
  2207. spv::Id left = accessChainLoad(node->getLeft()->getType());
  2208. builder.clearAccessChain();
  2209. builder.setAccessChainLValue(left);
  2210. }
  2211. int spvIndex = glslangIndex;
  2212. if (node->getLeft()->getBasicType() == glslang::EbtBlock &&
  2213. node->getOp() == glslang::EOpIndexDirectStruct)
  2214. {
  2215. // This may be, e.g., an anonymous block-member selection, which generally need
  2216. // index remapping due to hidden members in anonymous blocks.
  2217. long long glslangId = glslangTypeToIdMap[node->getLeft()->getType().getStruct()];
  2218. if (memberRemapper.find(glslangId) != memberRemapper.end()) {
  2219. std::vector<int>& remapper = memberRemapper[glslangId];
  // NOTE(review): only non-emptiness is asserted; glslangIndex itself is not range-checked here.
  2220. assert(remapper.size() > 0);
  2221. spvIndex = remapper[glslangIndex];
  2222. }
  2223. }
  2224. // Struct reference propagates uniform lvalue
  2225. spv::Builder::AccessChain::CoherentFlags coherentFlags =
  2226. TranslateCoherent(node->getLeft()->getType());
  2227. coherentFlags.nonUniform = 0;
  2228. // normal case for indexing array or structure or block
  // A 64-bit constant index is pushed when the index type contains a 64-bit int, or when it
  // is uint and uint32 index promotion is enabled. That path reads the constant directly
  // and does not use the remapped spvIndex.
  2229. if ((node->getRight()->getType().getBasicType() == glslang::EbtUint && glslangIntermediate->usingPromoteUint32Indices()) ||
  2230. node->getRight()->getType().contains64BitInt()) {
  2231. int64_t idx = node->getRight()->getType().contains64BitInt() ?
  2232. node->getRight()->getAsConstantUnion()->getConstArray()[0].getI64Const() :
  2233. node->getRight()->getAsConstantUnion()->getConstArray()[0].getUConst();
  2234. builder.accessChainPush(builder.makeInt64Constant(idx),
  2235. coherentFlags,
  2236. node->getLeft()->getType().getBufferReferenceAlignment());
  2237. } else {
  2238. builder.accessChainPush(builder.makeIntConstant(spvIndex),
  2239. coherentFlags,
  2240. node->getLeft()->getType().getBufferReferenceAlignment());
  2241. }
  2242. // Add capabilities here for accessing PointSize and clip/cull distance.
  2243. // We have deferred generation of associated capabilities until now.
  2244. if (node->getLeft()->getType().isStruct() && ! node->getLeft()->getType().isArray())
  2245. declareUseOfStructMember(*(node->getLeft()->getType().getStruct()), glslangIndex);
  2246. // EXT_descriptor_heap
  2247. // Record untyped descriptor heap access info.
  2248. if (node->getLeft()->getType().isBuiltIn() &&
  2249. (node->getLeft()->getQualifier().builtIn == glslang::EbvResourceHeapEXT ||
  2250. node->getLeft()->getQualifier().builtIn == glslang::EbvSamplerHeapEXT)) {
  2251. recordDescHeapAccessChainInfo(node);
  2252. }
  2253. }
  2254. }
  2255. return false;
  2256. case glslang::EOpIndexIndirect:
  2257. {
  2258. // Array, matrix, or vector indirection with variable index.
  2259. // Will use native SPIR-V access-chain for array indirection;
  2260. // matrices are arrays of vectors, so will also work for a matrix.
  2261. // Will use the access chain's 'component' for variable index into a vector.
  2262. // This adapter is building access chains left to right.
  2263. // Set up the access chain to the left.
  2264. node->getLeft()->traverse(this);
  2265. // save it so that computing the right side doesn't trash it
  2266. spv::Builder::AccessChain partial = builder.getAccessChain();
  2267. // compute the next index in the chain
  2268. builder.clearAccessChain();
  2269. node->getRight()->traverse(this);
  2270. spv::Id index = accessChainLoad(node->getRight()->getType());
  2271. // Zero-extend smaller unsigned integer types for array indexing.
  2272. // SPIR-V OpAccessChain treats indices as signed, so we need to zero-extend
  2273. // unsigned types to preserve their values (signed types are fine as-is).
  2274. spv::Id indexType = builder.getTypeId(index);
  2275. if (builder.isUintType(indexType) && builder.getScalarTypeWidth(indexType) < 32) {
  2276. // Zero-extend unsigned types to preserve their values
  2277. spv::Id uintType = builder.makeUintType(32);
  2278. index = builder.createUnaryOp(spv::Op::OpUConvert, uintType, index);
  2279. }
  2280. addIndirectionIndexCapabilities(node->getLeft()->getType(), node->getRight()->getType());
  2281. // restore the saved access chain
  2282. builder.setAccessChain(partial);
  2283. // Only if index is nonUniform should we propagate nonUniform into access chain
  2284. spv::Builder::AccessChain::CoherentFlags index_flags = TranslateCoherent(node->getRight()->getType());
  2285. spv::Builder::AccessChain::CoherentFlags coherent_flags = TranslateCoherent(node->getLeft()->getType());
  2286. coherent_flags.nonUniform = index_flags.nonUniform;
  2287. if (! node->getLeft()->getType().isArray() && node->getLeft()->getType().isVector()) {
  2288. int dummySize;
  2289. builder.accessChainPushComponent(
  2290. index, convertGlslangToSpvType(node->getLeft()->getType()), coherent_flags,
  2291. glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(),
  2292. dummySize));
  2293. } else {
  // With uint32 index promotion enabled, a uint index is converted to a 64-bit integer type before being pushed.
  2294. if (glslangIntermediate->usingPromoteUint32Indices() &&
  2295. node->getRight()->getType().getBasicType() == glslang::EbtUint) {
  2296. index = createIntWidthConversion(index, 0, builder.makeIntegerType(64, true), glslang::EbtInt64, node->getRight()->getType().getBasicType());
  2297. }
  2298. builder.accessChainPush(index, coherent_flags,
  2299. node->getLeft()->getType().getBufferReferenceAlignment());
  2300. }
  2301. // EXT_descriptor_heap
  2302. // Record untyped descriptor heap access info.
  2303. if (node->getLeft()->getType().isBuiltIn() &&
  2304. (node->getLeft()->getQualifier().builtIn == glslang::EbvResourceHeapEXT ||
  2305. node->getLeft()->getQualifier().builtIn == glslang::EbvSamplerHeapEXT)) {
  2306. recordDescHeapAccessChainInfo(node);
  2307. }
  2308. }
  2309. return false;
  2310. case glslang::EOpVectorSwizzle:
  2311. {
  // Extend the left operand's access chain with the swizzle described by the right aggregate.
  2312. node->getLeft()->traverse(this);
  2313. std::vector<unsigned> swizzle;
  2314. convertSwizzle(*node->getRight()->getAsAggregate(), swizzle);
  2315. int dummySize;
  2316. builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(node->getLeft()->getType()),
  2317. TranslateCoherent(node->getLeft()->getType()),
  2318. glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(),
  2319. dummySize));
  2320. }
  2321. return false;
  2322. case glslang::EOpMatrixSwizzle:
  2323. logger->missingFunctionality("matrix swizzle");
  2324. return true;
  2325. case glslang::EOpLogicalOr:
  2326. case glslang::EOpLogicalAnd:
  2327. {
  2328. // These may require short circuiting, but can sometimes be done as straight
  2329. // binary operations. The right operand must be short circuited if it has
  2330. // side effects, and should probably be if it is complex.
  2331. if (isTrivial(node->getRight()->getAsTyped()))
  2332. break; // handle below as a normal binary operation
  2333. // otherwise, we need to do dynamic short circuiting on the right operand
  2334. spv::Id result = createShortCircuit(node->getOp(), *node->getLeft()->getAsTyped(),
  2335. *node->getRight()->getAsTyped());
  2336. builder.clearAccessChain();
  2337. builder.setAccessChainRValue(result);
  2338. }
  2339. return false;
  2340. default:
  2341. break;
  2342. }
  2343. // Assume generic binary op...
  2344. // get left operand
  2345. builder.clearAccessChain();
  2346. node->getLeft()->traverse(this);
  2347. spv::Id left = accessChainLoad(node->getLeft()->getType());
  2348. // get right operand
  2349. builder.clearAccessChain();
  2350. node->getRight()->traverse(this);
  2351. spv::Id right = accessChainLoad(node->getRight()->getType());
  2352. // get result
  // Unlike the compound-assignment path above, the basic type passed to
  // createBinaryOperation() here is taken from the left operand rather than from the node.
  2353. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2354. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2355. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  2356. spv::Id result = createBinaryOperation(node->getOp(), decorations,
  2357. convertGlslangToSpvType(node->getType()), left, right,
  2358. node->getLeft()->getType().getBasicType());
  2359. builder.clearAccessChain();
  2360. if (! result) {
  2361. logger->missingFunctionality("unknown glslang binary operation");
  2362. return true; // pick up a child as the place-holder result
  2363. } else {
  2364. builder.setAccessChainRValue(result);
  2365. return false;
  2366. }
  2367. }
  2368. spv::Id TGlslangToSpvTraverser::convertLoadedBoolInUniformToUint(const glslang::TType& type,
  2369. spv::Id nominalTypeId,
  2370. spv::Id loadedId)
  2371. {
  2372. if (builder.isScalarType(nominalTypeId)) {
  2373. // Conversion for bool
  2374. spv::Id boolType = builder.makeBoolType();
  2375. if (nominalTypeId != boolType)
  2376. return builder.createBinOp(spv::Op::OpINotEqual, boolType, loadedId, builder.makeUintConstant(0));
  2377. } else if (builder.isVectorType(nominalTypeId)) {
  2378. // Conversion for bvec
  2379. int vecSize = builder.getNumTypeComponents(nominalTypeId);
  2380. spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);
  2381. if (nominalTypeId != bvecType)
  2382. loadedId = builder.createBinOp(spv::Op::OpINotEqual, bvecType, loadedId,
  2383. makeSmearedConstant(builder.makeUintConstant(0), vecSize));
  2384. } else if (builder.isArrayType(nominalTypeId)) {
  2385. // Conversion for bool array
  2386. spv::Id boolArrayTypeId = convertGlslangToSpvType(type);
  2387. if (nominalTypeId != boolArrayTypeId)
  2388. {
  2389. // Use OpCopyLogical from SPIR-V 1.4 if available.
  2390. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4)
  2391. return builder.createUnaryOp(spv::Op::OpCopyLogical, boolArrayTypeId, loadedId);
  2392. glslang::TType glslangElementType(type, 0);
  2393. spv::Id elementNominalTypeId = builder.getContainedTypeId(nominalTypeId);
  2394. std::vector<spv::Id> constituents;
  2395. for (int index = 0; index < type.getOuterArraySize(); ++index) {
  2396. // get the element
  2397. spv::Id elementValue = builder.createCompositeExtract(loadedId, elementNominalTypeId, index);
  2398. // recursively convert it
  2399. spv::Id elementConvertedValue = convertLoadedBoolInUniformToUint(glslangElementType, elementNominalTypeId, elementValue);
  2400. constituents.push_back(elementConvertedValue);
  2401. }
  2402. return builder.createCompositeConstruct(boolArrayTypeId, constituents);
  2403. }
  2404. }
  2405. return loadedId;
  2406. }
  2407. // Figure out what, if any, type changes are needed when accessing a specific built-in.
  2408. // Returns <the type SPIR-V requires for declarion, the type to translate to on use>.
  2409. // Also see comment for 'forceType', regarding tracking SPIR-V-required types.
  2410. std::pair<spv::Id, spv::Id> TGlslangToSpvTraverser::getForcedType(glslang::TBuiltInVariable glslangBuiltIn,
  2411. const glslang::TType& glslangType)
  2412. {
  2413. switch(glslangBuiltIn)
  2414. {
  2415. case glslang::EbvSubGroupEqMask:
  2416. case glslang::EbvSubGroupGeMask:
  2417. case glslang::EbvSubGroupGtMask:
  2418. case glslang::EbvSubGroupLeMask:
  2419. case glslang::EbvSubGroupLtMask: {
  2420. // these require changing a 64-bit scaler -> a vector of 32-bit components
  2421. if (glslangType.isVector())
  2422. break;
  2423. spv::Id ivec4_type = builder.makeVectorType(builder.makeUintType(32), 4);
  2424. spv::Id uint64_type = builder.makeUintType(64);
  2425. std::pair<spv::Id, spv::Id> ret(ivec4_type, uint64_type);
  2426. return ret;
  2427. }
  2428. // There are no SPIR-V builtins defined for these and map onto original non-transposed
  2429. // builtins. During visitBinary we insert a transpose
  2430. case glslang::EbvWorldToObject3x4:
  2431. case glslang::EbvObjectToWorld3x4: {
  2432. spv::Id mat43 = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  2433. spv::Id mat34 = builder.makeMatrixType(builder.makeFloatType(32), 3, 4);
  2434. std::pair<spv::Id, spv::Id> ret(mat43, mat34);
  2435. return ret;
  2436. }
  2437. default:
  2438. break;
  2439. }
  2440. std::pair<spv::Id, spv::Id> ret(spv::NoType, spv::NoType);
  2441. return ret;
  2442. }
  2443. // For an object previously identified (see getForcedType() and forceType)
  2444. // as needing type translations, do the translation needed for a load, turning
  2445. // an L-value into in R-value.
  2446. spv::Id TGlslangToSpvTraverser::translateForcedType(spv::Id object)
  2447. {
  2448. const auto forceIt = forceType.find(object);
  2449. if (forceIt == forceType.end())
  2450. return object;
  2451. spv::Id desiredTypeId = forceIt->second;
  2452. spv::Id objectTypeId = builder.getTypeId(object);
  2453. assert(builder.isPointerType(objectTypeId));
  2454. objectTypeId = builder.getContainedTypeId(objectTypeId);
  2455. if (builder.isVectorType(objectTypeId) &&
  2456. builder.getScalarTypeWidth(builder.getContainedTypeId(objectTypeId)) == 32) {
  2457. if (builder.getScalarTypeWidth(desiredTypeId) == 64) {
  2458. // handle 32-bit v.xy* -> 64-bit
  2459. builder.clearAccessChain();
  2460. builder.setAccessChainLValue(object);
  2461. object = builder.accessChainLoad(spv::NoPrecision, spv::Decoration::Max, spv::Decoration::Max, objectTypeId);
  2462. std::vector<spv::Id> components;
  2463. components.push_back(builder.createCompositeExtract(object, builder.getContainedTypeId(objectTypeId), 0));
  2464. components.push_back(builder.createCompositeExtract(object, builder.getContainedTypeId(objectTypeId), 1));
  2465. spv::Id vecType = builder.makeVectorType(builder.getContainedTypeId(objectTypeId), 2);
  2466. return builder.createUnaryOp(spv::Op::OpBitcast, desiredTypeId,
  2467. builder.createCompositeConstruct(vecType, components));
  2468. } else {
  2469. logger->missingFunctionality("forcing 32-bit vector type to non 64-bit scalar");
  2470. }
  2471. } else if (builder.isMatrixType(objectTypeId)) {
  2472. // There are no SPIR-V builtins defined for 3x4 variants of ObjectToWorld/WorldToObject
  2473. // and we insert a transpose after loading the original non-transposed builtins
  2474. builder.clearAccessChain();
  2475. builder.setAccessChainLValue(object);
  2476. object = builder.accessChainLoad(spv::NoPrecision, spv::Decoration::Max, spv::Decoration::Max, objectTypeId);
  2477. return builder.createUnaryOp(spv::Op::OpTranspose, desiredTypeId, object);
  2478. } else {
  2479. logger->missingFunctionality("forcing non 32-bit vector type");
  2480. }
  2481. return object;
  2482. }
  2483. bool TGlslangToSpvTraverser::visitUnary(glslang::TVisit /* visit */, glslang::TIntermUnary* node)
  2484. {
  2485. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2486. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2487. if (node->getType().getQualifier().isSpecConstant())
  2488. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2489. spv::Id result = spv::NoResult;
  2490. // try texturing first
  2491. result = createImageTextureFunctionCall(node);
  2492. if (result != spv::NoResult) {
  2493. builder.clearAccessChain();
  2494. builder.setAccessChainRValue(result);
  2495. return false; // done with this node
  2496. }
  2497. // Non-texturing.
  2498. if (node->getOp() == glslang::EOpArrayLength) {
  2499. // Quite special; won't want to evaluate the operand.
  2500. // Currently, the front-end does not allow .length() on an array until it is sized,
  2501. // except for the last block membeor of an SSBO.
  2502. // TODO: If this changes, link-time sized arrays might show up here, and need their
  2503. // size extracted.
  2504. // Normal .length() would have been constant folded by the front-end.
  2505. // So, this has to be block.lastMember.length().
  2506. // SPV wants "block" and member number as the operands, go get them.
  2507. uint32_t bits = node->getType().contains64BitInt() ? 64 : 32;
  2508. spv::Id length;
  2509. if (node->getOperand()->getType().isCoopMat()) {
  2510. spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());
  2511. assert(builder.isCooperativeMatrixType(typeId));
  2512. if (node->getOperand()->getType().isCoopMatKHR()) {
  2513. length = builder.createCooperativeMatrixLengthKHR(typeId);
  2514. } else {
  2515. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2516. length = builder.createCooperativeMatrixLengthNV(typeId);
  2517. }
  2518. } else if (node->getOperand()->getType().isCoopVecOrLongVector()) {
  2519. spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());
  2520. if (builder.isCooperativeVectorType(typeId)) {
  2521. length = builder.getCooperativeVectorNumComponents(typeId);
  2522. } else {
  2523. length = builder.makeIntConstant(builder.getNumTypeConstituents(typeId));
  2524. }
  2525. } else {
  2526. glslang::TIntermTyped* block = node->getOperand()->getAsBinaryNode()->getLeft();
  2527. block->traverse(this);
  2528. unsigned int member = node->getOperand()->getAsBinaryNode()->getRight()->getAsConstantUnion()
  2529. ->getConstArray()[0].getUConst();
  2530. length = builder.createArrayLength(builder.accessChainGetLValue(), member, bits);
  2531. }
  2532. // GLSL semantics say the result of .length() is an int, while SPIR-V says
  2533. // signedness must be 0. So, convert from SPIR-V unsigned back to GLSL's
  2534. // AST expectation of a signed result.
  2535. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
  2536. if (builder.isInSpecConstCodeGenMode()) {
  2537. length = builder.createBinOp(spv::Op::OpIAdd, builder.makeIntType(bits), length, builder.makeIntConstant(0));
  2538. } else {
  2539. length = builder.createUnaryOp(spv::Op::OpBitcast, builder.makeIntType(bits), length);
  2540. }
  2541. }
  2542. builder.clearAccessChain();
  2543. builder.setAccessChainRValue(length);
  2544. return false;
  2545. }
  2546. // Force variable declaration - Debug Mode Only
  2547. if (node->getOp() == glslang::EOpDeclare) {
  2548. builder.clearAccessChain();
  2549. node->getOperand()->traverse(this);
  2550. builder.clearAccessChain();
  2551. return false;
  2552. }
  2553. // Start by evaluating the operand
  2554. // Does it need a swizzle inversion? If so, evaluation is inverted;
  2555. // operate first on the swizzle base, then apply the swizzle.
  2556. spv::Id invertedType = spv::NoType;
  2557. auto resultType = [&invertedType, &node, this](){ return invertedType != spv::NoType ?
  2558. invertedType : convertGlslangToSpvType(node->getType()); };
  2559. if (node->getOp() == glslang::EOpInterpolateAtCentroid)
  2560. invertedType = getInvertedSwizzleType(*node->getOperand());
  2561. builder.clearAccessChain();
  2562. TIntermNode *operandNode;
  2563. if (invertedType != spv::NoType)
  2564. operandNode = node->getOperand()->getAsBinaryNode()->getLeft();
  2565. else
  2566. operandNode = node->getOperand();
  2567. operandNode->traverse(this);
  2568. spv::Id operand = spv::NoResult;
  2569. spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
  2570. const auto hitObjectOpsWithLvalue = [](glslang::TOperator op) {
  2571. switch(op) {
  2572. case glslang::EOpReorderThreadNV:
  2573. case glslang::EOpHitObjectGetCurrentTimeNV:
  2574. case glslang::EOpHitObjectGetHitKindNV:
  2575. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  2576. case glslang::EOpHitObjectGetGeometryIndexNV:
  2577. case glslang::EOpHitObjectGetInstanceIdNV:
  2578. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  2579. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  2580. case glslang::EOpHitObjectGetObjectRayOriginNV:
  2581. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  2582. case glslang::EOpHitObjectGetWorldRayOriginNV:
  2583. case glslang::EOpHitObjectGetWorldToObjectNV:
  2584. case glslang::EOpHitObjectGetObjectToWorldNV:
  2585. case glslang::EOpHitObjectGetRayTMaxNV:
  2586. case glslang::EOpHitObjectGetRayTMinNV:
  2587. case glslang::EOpHitObjectIsEmptyNV:
  2588. case glslang::EOpHitObjectIsHitNV:
  2589. case glslang::EOpHitObjectIsMissNV:
  2590. case glslang::EOpHitObjectRecordEmptyNV:
  2591. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  2592. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  2593. case glslang::EOpHitObjectGetClusterIdNV:
  2594. case glslang::EOpHitObjectGetSpherePositionNV:
  2595. case glslang::EOpHitObjectGetSphereRadiusNV:
  2596. case glslang::EOpHitObjectIsSphereHitNV:
  2597. case glslang::EOpHitObjectIsLSSHitNV:
  2598. case glslang::EOpReorderThreadEXT:
  2599. case glslang::EOpHitObjectGetCurrentTimeEXT:
  2600. case glslang::EOpHitObjectGetHitKindEXT:
  2601. case glslang::EOpHitObjectGetPrimitiveIndexEXT:
  2602. case glslang::EOpHitObjectGetGeometryIndexEXT:
  2603. case glslang::EOpHitObjectGetInstanceIdEXT:
  2604. case glslang::EOpHitObjectGetInstanceCustomIndexEXT:
  2605. case glslang::EOpHitObjectGetObjectRayDirectionEXT:
  2606. case glslang::EOpHitObjectGetObjectRayOriginEXT:
  2607. case glslang::EOpHitObjectGetWorldRayDirectionEXT:
  2608. case glslang::EOpHitObjectGetWorldRayOriginEXT:
  2609. case glslang::EOpHitObjectGetWorldToObjectEXT:
  2610. case glslang::EOpHitObjectGetObjectToWorldEXT:
  2611. case glslang::EOpHitObjectGetRayTMaxEXT:
  2612. case glslang::EOpHitObjectGetRayTMinEXT:
  2613. case glslang::EOpHitObjectGetRayFlagsEXT:
  2614. case glslang::EOpHitObjectIsEmptyEXT:
  2615. case glslang::EOpHitObjectIsHitEXT:
  2616. case glslang::EOpHitObjectIsMissEXT:
  2617. case glslang::EOpHitObjectRecordEmptyEXT:
  2618. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:
  2619. case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:
  2620. return true;
  2621. default:
  2622. return false;
  2623. }
  2624. };
  2625. if (node->getOp() == glslang::EOpAtomicCounterIncrement ||
  2626. node->getOp() == glslang::EOpAtomicCounterDecrement ||
  2627. node->getOp() == glslang::EOpAtomicCounter ||
  2628. (node->getOp() == glslang::EOpInterpolateAtCentroid &&
  2629. glslangIntermediate->getSource() != glslang::EShSourceHlsl) ||
  2630. node->getOp() == glslang::EOpRayQueryProceed ||
  2631. node->getOp() == glslang::EOpRayQueryGetRayTMin ||
  2632. node->getOp() == glslang::EOpRayQueryGetRayFlags ||
  2633. node->getOp() == glslang::EOpRayQueryGetWorldRayOrigin ||
  2634. node->getOp() == glslang::EOpRayQueryGetWorldRayDirection ||
  2635. node->getOp() == glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque ||
  2636. node->getOp() == glslang::EOpRayQueryTerminate ||
  2637. node->getOp() == glslang::EOpRayQueryConfirmIntersection ||
  2638. (node->getOp() == glslang::EOpSpirvInst && operandNode->getAsTyped()->getQualifier().isSpirvByReference()) ||
  2639. hitObjectOpsWithLvalue(node->getOp())) {
  2640. operand = builder.accessChainGetLValue(); // Special case l-value operands
  2641. lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
  2642. lvalueCoherentFlags |= TranslateCoherent(operandNode->getAsTyped()->getType());
  2643. } else if (operandNode->getAsTyped()->getQualifier().isSpirvLiteral()) {
  2644. // Will be translated to a literal value, make a placeholder here
  2645. operand = spv::NoResult;
  2646. } else {
  2647. operand = accessChainLoad(node->getOperand()->getType());
  2648. }
  2649. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  2650. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2651. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  2652. // it could be a conversion
  2653. if (! result) {
  2654. result = createConversion(node->getOp(), decorations, resultType(), operand,
  2655. node->getType().getBasicType(), node->getOperand()->getBasicType());
  2656. if (result) {
  2657. if (node->getType().isCoopMatKHR() && node->getOperand()->getAsTyped()->getType().isCoopMatKHR() &&
  2658. !node->getAsTyped()->getType().sameCoopMatUse(node->getOperand()->getAsTyped()->getType())) {
  2659. // Conversions that change use need CapabilityCooperativeMatrixConversionsNV
  2660. builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
  2661. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  2662. }
  2663. }
  2664. }
  2665. // if not, then possibly an operation
  2666. if (! result)
  2667. result = createUnaryOperation(node->getOp(), decorations, resultType(), operand,
  2668. node->getOperand()->getBasicType(), lvalueCoherentFlags, node->getType());
  2669. // it could be attached to a SPIR-V intruction
  2670. if (!result) {
  2671. if (node->getOp() == glslang::EOpSpirvInst) {
  2672. const auto& spirvInst = node->getSpirvInstruction();
  2673. if (spirvInst.set == "") {
  2674. spv::IdImmediate idImmOp = {true, operand};
  2675. if (operandNode->getAsTyped()->getQualifier().isSpirvLiteral()) {
  2676. // Translate the constant to a literal value
  2677. std::vector<unsigned> literals;
  2678. glslang::TVector<const glslang::TIntermConstantUnion*> constants;
  2679. constants.push_back(operandNode->getAsConstantUnion());
  2680. TranslateLiterals(constants, literals);
  2681. idImmOp = {false, literals[0]};
  2682. }
  2683. if (node->getBasicType() == glslang::EbtVoid)
  2684. builder.createNoResultOp(static_cast<spv::Op>(spirvInst.id), {idImmOp});
  2685. else
  2686. result = builder.createOp(static_cast<spv::Op>(spirvInst.id), resultType(), {idImmOp});
  2687. } else {
  2688. result = builder.createBuiltinCall(
  2689. resultType(), spirvInst.set == "GLSL.std.450" ? stdBuiltins : getExtBuiltins(spirvInst.set.c_str()),
  2690. spirvInst.id, {operand});
  2691. }
  2692. if (node->getBasicType() == glslang::EbtVoid)
  2693. return false; // done with this node
  2694. }
  2695. }
  2696. if (result) {
  2697. if (invertedType) {
  2698. result = createInvertedSwizzle(decorations.precision, *node->getOperand(), result);
  2699. decorations.addNonUniform(builder, result);
  2700. }
  2701. builder.clearAccessChain();
  2702. builder.setAccessChainRValue(result);
  2703. return false; // done with this node
  2704. }
  2705. // it must be a special case, check...
  2706. switch (node->getOp()) {
  2707. case glslang::EOpPostIncrement:
  2708. case glslang::EOpPostDecrement:
  2709. case glslang::EOpPreIncrement:
  2710. case glslang::EOpPreDecrement:
  2711. {
  2712. // we need the integer value "1" or the floating point "1.0" to add/subtract
  2713. spv::Id one = 0;
  2714. if (node->getBasicType() == glslang::EbtFloat)
  2715. one = builder.makeFloatConstant(1.0F);
  2716. else if (node->getBasicType() == glslang::EbtDouble)
  2717. one = builder.makeDoubleConstant(1.0);
  2718. else if (node->getBasicType() == glslang::EbtFloat16)
  2719. one = builder.makeFloat16Constant(1.0F);
  2720. else if (node->getBasicType() == glslang::EbtBFloat16)
  2721. one = builder.makeBFloat16Constant(1.0F);
  2722. else if (node->getBasicType() == glslang::EbtFloatE5M2)
  2723. one = builder.makeFloatE5M2Constant(1.0F);
  2724. else if (node->getBasicType() == glslang::EbtFloatE4M3)
  2725. one = builder.makeFloatE4M3Constant(1.0F);
  2726. else if (node->getBasicType() == glslang::EbtInt8 || node->getBasicType() == glslang::EbtUint8)
  2727. one = builder.makeInt8Constant(1);
  2728. else if (node->getBasicType() == glslang::EbtInt16 || node->getBasicType() == glslang::EbtUint16)
  2729. one = builder.makeInt16Constant(1);
  2730. else if (node->getBasicType() == glslang::EbtInt64 || node->getBasicType() == glslang::EbtUint64)
  2731. one = builder.makeInt64Constant(1);
  2732. else
  2733. one = builder.makeIntConstant(1);
  2734. glslang::TOperator op;
  2735. if (node->getOp() == glslang::EOpPreIncrement ||
  2736. node->getOp() == glslang::EOpPostIncrement)
  2737. op = glslang::EOpAdd;
  2738. else
  2739. op = glslang::EOpSub;
  2740. spv::Id result = createBinaryOperation(op, decorations,
  2741. convertGlslangToSpvType(node->getType()), operand, one,
  2742. node->getType().getBasicType());
  2743. assert(result != spv::NoResult);
  2744. // The result of operation is always stored, but conditionally the
  2745. // consumed result. The consumed result is always an r-value.
  2746. builder.accessChainStore(result,
  2747. TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags));
  2748. builder.clearAccessChain();
  2749. if (node->getOp() == glslang::EOpPreIncrement ||
  2750. node->getOp() == glslang::EOpPreDecrement)
  2751. builder.setAccessChainRValue(result);
  2752. else
  2753. builder.setAccessChainRValue(operand);
  2754. }
  2755. return false;
  2756. case glslang::EOpAssumeEXT:
  2757. builder.addCapability(spv::Capability::ExpectAssumeKHR);
  2758. builder.addExtension(spv::E_SPV_KHR_expect_assume);
  2759. builder.createNoResultOp(spv::Op::OpAssumeTrueKHR, operand);
  2760. return false;
  2761. case glslang::EOpEmitStreamVertex:
  2762. builder.createNoResultOp(spv::Op::OpEmitStreamVertex, operand);
  2763. return false;
  2764. case glslang::EOpEndStreamPrimitive:
  2765. builder.createNoResultOp(spv::Op::OpEndStreamPrimitive, operand);
  2766. return false;
  2767. case glslang::EOpRayQueryTerminate:
  2768. builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR, operand);
  2769. return false;
  2770. case glslang::EOpRayQueryConfirmIntersection:
  2771. builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR, operand);
  2772. return false;
  2773. case glslang::EOpReorderThreadNV:
  2774. builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectNV, operand);
  2775. return false;
  2776. case glslang::EOpReorderThreadEXT:
  2777. builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectEXT, operand);
  2778. return false;
  2779. case glslang::EOpHitObjectRecordEmptyNV:
  2780. builder.createNoResultOp(spv::Op::OpHitObjectRecordEmptyNV, operand);
  2781. return false;
  2782. case glslang::EOpHitObjectRecordEmptyEXT:
  2783. builder.createNoResultOp(spv::Op::OpHitObjectRecordEmptyEXT, operand);
  2784. return false;
  2785. case glslang::EOpCreateTensorLayoutNV:
  2786. result = builder.createOp(spv::Op::OpCreateTensorLayoutNV, resultType(), std::vector<spv::Id>{});
  2787. builder.clearAccessChain();
  2788. builder.setAccessChainRValue(result);
  2789. return false;
  2790. case glslang::EOpCreateTensorViewNV:
  2791. result = builder.createOp(spv::Op::OpCreateTensorViewNV, resultType(), std::vector<spv::Id>{});
  2792. builder.clearAccessChain();
  2793. builder.setAccessChainRValue(result);
  2794. return false;
  2795. default:
  2796. logger->missingFunctionality("unknown glslang unary");
  2797. return true; // pick up operand as placeholder result
  2798. }
  2799. }
  2800. // Construct a composite object, recursively copying members if their types don't match
  2801. spv::Id TGlslangToSpvTraverser::createCompositeConstruct(spv::Id resultTypeId, std::vector<spv::Id> constituents)
  2802. {
  2803. for (int c = 0; c < (int)constituents.size(); ++c) {
  2804. spv::Id& constituent = constituents[c];
  2805. spv::Id lType = builder.getContainedTypeId(resultTypeId, c);
  2806. spv::Id rType = builder.getTypeId(constituent);
  2807. if (lType != rType) {
  2808. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  2809. constituent = builder.createUnaryOp(spv::Op::OpCopyLogical, lType, constituent);
  2810. } else if (builder.isStructType(rType)) {
  2811. std::vector<spv::Id> rTypeConstituents;
  2812. int numrTypeConstituents = builder.getNumTypeConstituents(rType);
  2813. for (int i = 0; i < numrTypeConstituents; ++i) {
  2814. rTypeConstituents.push_back(builder.createCompositeExtract(constituent,
  2815. builder.getContainedTypeId(rType, i), i));
  2816. }
  2817. constituents[c] = createCompositeConstruct(lType, rTypeConstituents);
  2818. } else {
  2819. assert(builder.isArrayType(rType));
  2820. std::vector<spv::Id> rTypeConstituents;
  2821. int numrTypeConstituents = builder.getNumTypeConstituents(rType);
  2822. spv::Id elementRType = builder.getContainedTypeId(rType);
  2823. for (int i = 0; i < numrTypeConstituents; ++i) {
  2824. rTypeConstituents.push_back(builder.createCompositeExtract(constituent, elementRType, i));
  2825. }
  2826. constituents[c] = createCompositeConstruct(lType, rTypeConstituents);
  2827. }
  2828. }
  2829. }
  2830. return builder.createCompositeConstruct(resultTypeId, constituents);
  2831. }
  2832. bool TGlslangToSpvTraverser::visitAggregate(glslang::TVisit visit, glslang::TIntermAggregate* node)
  2833. {
  2834. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2835. if (node->getType().getQualifier().isSpecConstant())
  2836. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2837. spv::Id result = spv::NoResult;
  2838. spv::Id invertedType = spv::NoType; // to use to override the natural type of the node
  2839. std::vector<spv::Builder::AccessChain> complexLvalues; // for holding swizzling l-values too complex for
  2840. // SPIR-V, for an out parameter
  2841. std::vector<spv::Id> temporaryLvalues; // temporaries to pass, as proxies for complexLValues
  2842. auto resultType = [&invertedType, &node, this](){
  2843. if (invertedType != spv::NoType) {
  2844. return invertedType;
  2845. } else {
  2846. auto ret = convertGlslangToSpvType(node->getType());
  2847. // convertGlslangToSpvType may clobber the debug location, reset it
  2848. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2849. return ret;
  2850. }
  2851. };
  2852. // try texturing
  2853. result = createImageTextureFunctionCall(node);
  2854. if (result != spv::NoResult) {
  2855. builder.clearAccessChain();
  2856. builder.setAccessChainRValue(result);
  2857. return false;
  2858. } else if (node->getOp() == glslang::EOpImageStore ||
  2859. node->getOp() == glslang::EOpImageStoreLod ||
  2860. node->getOp() == glslang::EOpImageAtomicStore) {
  2861. // "imageStore" is a special case, which has no result
  2862. return false;
  2863. }
  2864. glslang::TOperator binOp = glslang::EOpNull;
  2865. bool reduceComparison = true;
  2866. bool isMatrix = false;
  2867. bool noReturnValue = false;
  2868. bool atomic = false;
  2869. spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
  2870. assert(node->getOp());
  2871. spv::Decoration precision = TranslatePrecisionDecoration(node->getOperationPrecision());
  2872. switch (node->getOp()) {
  2873. case glslang::EOpScope:
  2874. case glslang::EOpSequence:
  2875. {
  2876. if (visit == glslang::EvPreVisit) {
  2877. ++sequenceDepth;
  2878. if (sequenceDepth == 1) {
  2879. // If this is the parent node of all the functions, we want to see them
  2880. // early, so all call points have actual SPIR-V functions to reference.
  2881. // In all cases, still let the traverser visit the children for us.
  2882. makeFunctions(node->getAsAggregate()->getSequence());
  2883. // Global initializers is specific to the shader entry point, which does not exist in compile-only mode
  2884. if (!options.compileOnly) {
  2885. // Also, we want all globals initializers to go into the beginning of the entry point, before
  2886. // anything else gets there, so visit out of order, doing them all now.
  2887. makeGlobalInitializers(node->getAsAggregate()->getSequence());
  2888. }
  2889. //Pre process linker objects for ray tracing stages
  2890. if (glslangIntermediate->isRayTracingStage())
  2891. collectRayTracingLinkerObjects();
  2892. // Initializers are done, don't want to visit again, but functions and link objects need to be processed,
  2893. // so do them manually.
  2894. visitFunctions(node->getAsAggregate()->getSequence());
  2895. return false;
  2896. } else {
  2897. if (node->getOp() == glslang::EOpScope) {
  2898. auto loc = node->getLoc();
  2899. builder.enterLexicalBlock(loc.line, loc.column);
  2900. }
  2901. }
  2902. } else {
  2903. if (sequenceDepth > 1 && node->getOp() == glslang::EOpScope)
  2904. builder.leaveLexicalBlock();
  2905. --sequenceDepth;
  2906. }
  2907. return true;
  2908. }
  2909. case glslang::EOpLinkerObjects:
  2910. {
  2911. if (visit == glslang::EvPreVisit)
  2912. linkageOnly = true;
  2913. else
  2914. linkageOnly = false;
  2915. return true;
  2916. }
  2917. case glslang::EOpComma:
  2918. {
  2919. // processing from left to right naturally leaves the right-most
  2920. // lying around in the access chain
  2921. glslang::TIntermSequence& glslangOperands = node->getSequence();
  2922. for (int i = 0; i < (int)glslangOperands.size(); ++i)
  2923. glslangOperands[i]->traverse(this);
  2924. return false;
  2925. }
  2926. case glslang::EOpFunction:
  2927. if (visit == glslang::EvPreVisit) {
  2928. if (options.generateDebugInfo) {
  2929. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2930. }
  2931. if (isShaderEntryPoint(node)) {
  2932. inEntryPoint = true;
  2933. builder.setBuildPoint(shaderEntry->getLastBlock());
  2934. builder.enterFunction(shaderEntry);
  2935. currentFunction = shaderEntry;
  2936. } else {
  2937. // SPIR-V functions should already be in the functionMap from the prepass
  2938. // that called makeFunctions().
  2939. currentFunction = functionMap[node->getName().c_str()];
  2940. spv::Block* functionBlock = currentFunction->getEntryBlock();
  2941. builder.setBuildPoint(functionBlock);
  2942. builder.enterFunction(currentFunction);
  2943. }
  2944. if (options.generateDebugInfo && !options.emitNonSemanticShaderDebugInfo) {
  2945. const auto& loc = node->getLoc();
  2946. const char* sourceFileName = loc.getFilename();
  2947. spv::Id sourceFileId = sourceFileName ? builder.getStringId(sourceFileName) : builder.getMainFileId();
  2948. currentFunction->setDebugLineInfo(sourceFileId, loc.line, loc.column);
  2949. }
  2950. } else {
  2951. // Here we have finished visiting the function (post-visit). Finalize it.
  2952. if (options.generateDebugInfo) {
  2953. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl && node->getSequence().size() > 1) {
  2954. auto endLoc = node->getSequence()[1]->getAsAggregate()->getEndLoc();
  2955. builder.setDebugSourceLocation(endLoc.line, endLoc.getFilename());
  2956. }
  2957. }
  2958. if (inEntryPoint)
  2959. entryPointTerminated = true;
  2960. builder.leaveFunction();
  2961. inEntryPoint = false;
  2962. currentFunction = nullptr;
  2963. }
  2964. return true;
  2965. case glslang::EOpParameters:
  2966. // Parameters will have been consumed by EOpFunction processing, but not
  2967. // the body, so we still visited the function node's children, making this
  2968. // child redundant.
  2969. return false;
  2970. case glslang::EOpFunctionCall:
  2971. {
  2972. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  2973. if (node->isUserDefined())
  2974. result = handleUserFunctionCall(node);
  2975. if (result) {
  2976. builder.clearAccessChain();
  2977. builder.setAccessChainRValue(result);
  2978. } else
  2979. logger->missingFunctionality("missing user function; linker needs to catch that");
  2980. return false;
  2981. }
  2982. case glslang::EOpConstructMat2x2:
  2983. case glslang::EOpConstructMat2x3:
  2984. case glslang::EOpConstructMat2x4:
  2985. case glslang::EOpConstructMat3x2:
  2986. case glslang::EOpConstructMat3x3:
  2987. case glslang::EOpConstructMat3x4:
  2988. case glslang::EOpConstructMat4x2:
  2989. case glslang::EOpConstructMat4x3:
  2990. case glslang::EOpConstructMat4x4:
  2991. case glslang::EOpConstructDMat2x2:
  2992. case glslang::EOpConstructDMat2x3:
  2993. case glslang::EOpConstructDMat2x4:
  2994. case glslang::EOpConstructDMat3x2:
  2995. case glslang::EOpConstructDMat3x3:
  2996. case glslang::EOpConstructDMat3x4:
  2997. case glslang::EOpConstructDMat4x2:
  2998. case glslang::EOpConstructDMat4x3:
  2999. case glslang::EOpConstructDMat4x4:
  3000. case glslang::EOpConstructIMat2x2:
  3001. case glslang::EOpConstructIMat2x3:
  3002. case glslang::EOpConstructIMat2x4:
  3003. case glslang::EOpConstructIMat3x2:
  3004. case glslang::EOpConstructIMat3x3:
  3005. case glslang::EOpConstructIMat3x4:
  3006. case glslang::EOpConstructIMat4x2:
  3007. case glslang::EOpConstructIMat4x3:
  3008. case glslang::EOpConstructIMat4x4:
  3009. case glslang::EOpConstructUMat2x2:
  3010. case glslang::EOpConstructUMat2x3:
  3011. case glslang::EOpConstructUMat2x4:
  3012. case glslang::EOpConstructUMat3x2:
  3013. case glslang::EOpConstructUMat3x3:
  3014. case glslang::EOpConstructUMat3x4:
  3015. case glslang::EOpConstructUMat4x2:
  3016. case glslang::EOpConstructUMat4x3:
  3017. case glslang::EOpConstructUMat4x4:
  3018. case glslang::EOpConstructBMat2x2:
  3019. case glslang::EOpConstructBMat2x3:
  3020. case glslang::EOpConstructBMat2x4:
  3021. case glslang::EOpConstructBMat3x2:
  3022. case glslang::EOpConstructBMat3x3:
  3023. case glslang::EOpConstructBMat3x4:
  3024. case glslang::EOpConstructBMat4x2:
  3025. case glslang::EOpConstructBMat4x3:
  3026. case glslang::EOpConstructBMat4x4:
  3027. case glslang::EOpConstructF16Mat2x2:
  3028. case glslang::EOpConstructF16Mat2x3:
  3029. case glslang::EOpConstructF16Mat2x4:
  3030. case glslang::EOpConstructF16Mat3x2:
  3031. case glslang::EOpConstructF16Mat3x3:
  3032. case glslang::EOpConstructF16Mat3x4:
  3033. case glslang::EOpConstructF16Mat4x2:
  3034. case glslang::EOpConstructF16Mat4x3:
  3035. case glslang::EOpConstructF16Mat4x4:
  3036. isMatrix = true;
  3037. [[fallthrough]];
  3038. case glslang::EOpConstructFloat:
  3039. case glslang::EOpConstructVec2:
  3040. case glslang::EOpConstructVec3:
  3041. case glslang::EOpConstructVec4:
  3042. case glslang::EOpConstructDouble:
  3043. case glslang::EOpConstructDVec2:
  3044. case glslang::EOpConstructDVec3:
  3045. case glslang::EOpConstructDVec4:
  3046. case glslang::EOpConstructFloat16:
  3047. case glslang::EOpConstructF16Vec2:
  3048. case glslang::EOpConstructF16Vec3:
  3049. case glslang::EOpConstructF16Vec4:
  3050. case glslang::EOpConstructBFloat16:
  3051. case glslang::EOpConstructBF16Vec2:
  3052. case glslang::EOpConstructBF16Vec3:
  3053. case glslang::EOpConstructBF16Vec4:
  3054. case glslang::EOpConstructFloatE5M2:
  3055. case glslang::EOpConstructFloatE5M2Vec2:
  3056. case glslang::EOpConstructFloatE5M2Vec3:
  3057. case glslang::EOpConstructFloatE5M2Vec4:
  3058. case glslang::EOpConstructFloatE4M3:
  3059. case glslang::EOpConstructFloatE4M3Vec2:
  3060. case glslang::EOpConstructFloatE4M3Vec3:
  3061. case glslang::EOpConstructFloatE4M3Vec4:
  3062. case glslang::EOpConstructBool:
  3063. case glslang::EOpConstructBVec2:
  3064. case glslang::EOpConstructBVec3:
  3065. case glslang::EOpConstructBVec4:
  3066. case glslang::EOpConstructInt8:
  3067. case glslang::EOpConstructI8Vec2:
  3068. case glslang::EOpConstructI8Vec3:
  3069. case glslang::EOpConstructI8Vec4:
  3070. case glslang::EOpConstructUint8:
  3071. case glslang::EOpConstructU8Vec2:
  3072. case glslang::EOpConstructU8Vec3:
  3073. case glslang::EOpConstructU8Vec4:
  3074. case glslang::EOpConstructInt16:
  3075. case glslang::EOpConstructI16Vec2:
  3076. case glslang::EOpConstructI16Vec3:
  3077. case glslang::EOpConstructI16Vec4:
  3078. case glslang::EOpConstructUint16:
  3079. case glslang::EOpConstructU16Vec2:
  3080. case glslang::EOpConstructU16Vec3:
  3081. case glslang::EOpConstructU16Vec4:
  3082. case glslang::EOpConstructInt:
  3083. case glslang::EOpConstructIVec2:
  3084. case glslang::EOpConstructIVec3:
  3085. case glslang::EOpConstructIVec4:
  3086. case glslang::EOpConstructUint:
  3087. case glslang::EOpConstructUVec2:
  3088. case glslang::EOpConstructUVec3:
  3089. case glslang::EOpConstructUVec4:
  3090. case glslang::EOpConstructInt64:
  3091. case glslang::EOpConstructI64Vec2:
  3092. case glslang::EOpConstructI64Vec3:
  3093. case glslang::EOpConstructI64Vec4:
  3094. case glslang::EOpConstructUint64:
  3095. case glslang::EOpConstructU64Vec2:
  3096. case glslang::EOpConstructU64Vec3:
  3097. case glslang::EOpConstructU64Vec4:
  3098. case glslang::EOpConstructStruct:
  3099. case glslang::EOpConstructTextureSampler:
  3100. case glslang::EOpConstructReference:
  3101. case glslang::EOpConstructCooperativeMatrixNV:
  3102. case glslang::EOpConstructCooperativeMatrixKHR:
  3103. case glslang::EOpConstructCooperativeVectorNV:
  3104. case glslang::EOpConstructSaturated:
  3105. {
  3106. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3107. std::vector<spv::Id> arguments;
  3108. translateArguments(*node, arguments, lvalueCoherentFlags);
  3109. spv::Id constructed;
  3110. if (node->getOp() == glslang::EOpConstructTextureSampler) {
  3111. const glslang::TType& texType = node->getSequence()[0]->getAsTyped()->getType();
  3112. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6 &&
  3113. texType.getSampler().isBuffer()) {
  3114. // SamplerBuffer is not supported in spirv1.6 so
  3115. // `samplerBuffer(textureBuffer, sampler)` is a no-op
  3116. // and textureBuffer is the result going forward
  3117. constructed = arguments[0];
  3118. } else
  3119. constructed = builder.createOp(spv::Op::OpSampledImage, resultType(), arguments);
  3120. } else if (node->getOp() == glslang::EOpConstructCooperativeMatrixKHR &&
  3121. node->getType().isCoopMatKHR() && node->getSequence()[0]->getAsTyped()->getType().isCoopMatKHR()) {
  3122. builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
  3123. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3124. constructed = builder.createCooperativeMatrixConversion(resultType(), arguments[0]);
  3125. } else if (node->getType().isCoopVecOrLongVector() &&
  3126. arguments.size() == 1 &&
  3127. builder.getTypeId(arguments[0]) == resultType()) {
  3128. constructed = arguments[0];
  3129. } else if (node->getOp() == glslang::EOpConstructStruct ||
  3130. node->getOp() == glslang::EOpConstructCooperativeMatrixNV ||
  3131. node->getOp() == glslang::EOpConstructCooperativeMatrixKHR ||
  3132. node->getType().isArray() ||
  3133. // Handle constructing coopvec from one component here, to avoid the component
  3134. // getting smeared
  3135. (node->getType().hasSpecConstantVectorComponents() && arguments.size() == 1 && builder.isScalar(arguments[0]))) {
  3136. std::vector<spv::Id> constituents;
  3137. for (int c = 0; c < (int)arguments.size(); ++c)
  3138. constituents.push_back(arguments[c]);
  3139. constructed = createCompositeConstruct(resultType(), constituents);
  3140. } else if (isMatrix)
  3141. constructed = builder.createMatrixConstructor(precision, arguments, resultType());
  3142. else if (node->getOp() == glslang::EOpConstructSaturated) {
  3143. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  3144. TranslateNoContractionDecoration(node->getType().getQualifier()),
  3145. TranslateNonUniformDecoration(lvalueCoherentFlags) };
  3146. constructed = createConversion(node->getOp(), decorations, resultType(), arguments[1],
  3147. node->getType().getBasicType(), node->getSequence()[1]->getAsTyped()->getBasicType());
  3148. builder.addDecoration(constructed, spv::Decoration::SaturatedToLargestFloat8NormalConversionEXT);
  3149. builder.createStore(constructed, arguments[0]);
  3150. }
  3151. else
  3152. constructed = builder.createConstructor(precision, arguments, resultType());
  3153. if (node->getType().getQualifier().isNonUniform()) {
  3154. builder.addDecoration(constructed, spv::Decoration::NonUniformEXT);
  3155. }
  3156. builder.clearAccessChain();
  3157. builder.setAccessChainRValue(constructed);
  3158. return false;
  3159. }
  3160. // These six are component-wise compares with component-wise results.
  3161. // Forward on to createBinaryOperation(), requesting a vector result.
  3162. case glslang::EOpLessThan:
  3163. case glslang::EOpGreaterThan:
  3164. case glslang::EOpLessThanEqual:
  3165. case glslang::EOpGreaterThanEqual:
  3166. case glslang::EOpVectorEqual:
  3167. case glslang::EOpVectorNotEqual:
  3168. {
  3169. // Map the operation to a binary
  3170. binOp = node->getOp();
  3171. reduceComparison = false;
  3172. switch (node->getOp()) {
  3173. case glslang::EOpVectorEqual: binOp = glslang::EOpVectorEqual; break;
  3174. case glslang::EOpVectorNotEqual: binOp = glslang::EOpVectorNotEqual; break;
  3175. default: binOp = node->getOp(); break;
  3176. }
  3177. break;
  3178. }
  3179. case glslang::EOpMul:
  3180. // component-wise matrix multiply
  3181. binOp = glslang::EOpMul;
  3182. break;
  3183. case glslang::EOpOuterProduct:
  3184. // two vectors multiplied to make a matrix
  3185. binOp = glslang::EOpOuterProduct;
  3186. break;
  3187. case glslang::EOpDot:
  3188. {
  3189. // for scalar dot product, use multiply
  3190. glslang::TIntermSequence& glslangOperands = node->getSequence();
  3191. if (!glslangOperands[0]->getAsTyped()->getType().isLongVector() &&
  3192. glslangOperands[0]->getAsTyped()->getVectorSize() == 1)
  3193. binOp = glslang::EOpMul;
  3194. break;
  3195. }
  3196. case glslang::EOpMod:
  3197. // when an aggregate, this is the floating-point mod built-in function,
  3198. // which can be emitted by the one in createBinaryOperation()
  3199. binOp = glslang::EOpMod;
  3200. break;
  3201. case glslang::EOpEmitVertex:
  3202. case glslang::EOpEndPrimitive:
  3203. case glslang::EOpBarrier:
  3204. case glslang::EOpMemoryBarrier:
  3205. case glslang::EOpMemoryBarrierAtomicCounter:
  3206. case glslang::EOpMemoryBarrierBuffer:
  3207. case glslang::EOpMemoryBarrierImage:
  3208. case glslang::EOpMemoryBarrierShared:
  3209. case glslang::EOpGroupMemoryBarrier:
  3210. case glslang::EOpDeviceMemoryBarrier:
  3211. case glslang::EOpAllMemoryBarrierWithGroupSync:
  3212. case glslang::EOpDeviceMemoryBarrierWithGroupSync:
  3213. case glslang::EOpWorkgroupMemoryBarrier:
  3214. case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:
  3215. case glslang::EOpSubgroupBarrier:
  3216. case glslang::EOpSubgroupMemoryBarrier:
  3217. case glslang::EOpSubgroupMemoryBarrierBuffer:
  3218. case glslang::EOpSubgroupMemoryBarrierImage:
  3219. case glslang::EOpSubgroupMemoryBarrierShared:
  3220. noReturnValue = true;
  3221. // These all have 0 operands and will naturally finish up in the code below for 0 operands
  3222. break;
  3223. case glslang::EOpAtomicAdd:
  3224. case glslang::EOpAtomicSubtract:
  3225. case glslang::EOpAtomicMin:
  3226. case glslang::EOpAtomicMax:
  3227. case glslang::EOpAtomicAnd:
  3228. case glslang::EOpAtomicOr:
  3229. case glslang::EOpAtomicXor:
  3230. case glslang::EOpAtomicExchange:
  3231. case glslang::EOpAtomicCompSwap:
  3232. atomic = true;
  3233. break;
  3234. case glslang::EOpAtomicStore:
  3235. noReturnValue = true;
  3236. [[fallthrough]];
  3237. case glslang::EOpAtomicLoad:
  3238. atomic = true;
  3239. break;
  3240. case glslang::EOpAtomicCounterAdd:
  3241. case glslang::EOpAtomicCounterSubtract:
  3242. case glslang::EOpAtomicCounterMin:
  3243. case glslang::EOpAtomicCounterMax:
  3244. case glslang::EOpAtomicCounterAnd:
  3245. case glslang::EOpAtomicCounterOr:
  3246. case glslang::EOpAtomicCounterXor:
  3247. case glslang::EOpAtomicCounterExchange:
  3248. case glslang::EOpAtomicCounterCompSwap:
  3249. builder.addExtension("SPV_KHR_shader_atomic_counter_ops");
  3250. builder.addCapability(spv::Capability::AtomicStorageOps);
  3251. atomic = true;
  3252. break;
  3253. case glslang::EOpAbsDifference:
  3254. case glslang::EOpAddSaturate:
  3255. case glslang::EOpSubSaturate:
  3256. case glslang::EOpAverage:
  3257. case glslang::EOpAverageRounded:
  3258. case glslang::EOpMul32x16:
  3259. builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
  3260. builder.addExtension("SPV_INTEL_shader_integer_functions2");
  3261. binOp = node->getOp();
  3262. break;
  3263. case glslang::EOpExpectEXT:
  3264. builder.addCapability(spv::Capability::ExpectAssumeKHR);
  3265. builder.addExtension(spv::E_SPV_KHR_expect_assume);
  3266. binOp = node->getOp();
  3267. break;
  3268. case glslang::EOpIgnoreIntersectionNV:
  3269. case glslang::EOpTerminateRayNV:
  3270. case glslang::EOpTraceNV:
  3271. case glslang::EOpTraceRayMotionNV:
  3272. case glslang::EOpTraceKHR:
  3273. case glslang::EOpExecuteCallableNV:
  3274. case glslang::EOpExecuteCallableKHR:
  3275. case glslang::EOpWritePackedPrimitiveIndices4x8NV:
  3276. case glslang::EOpEmitMeshTasksEXT:
  3277. case glslang::EOpSetMeshOutputsEXT:
  3278. noReturnValue = true;
  3279. break;
  3280. case glslang::EOpRayQueryInitialize:
  3281. case glslang::EOpRayQueryTerminate:
  3282. case glslang::EOpRayQueryGenerateIntersection:
  3283. case glslang::EOpRayQueryConfirmIntersection:
  3284. builder.addExtension("SPV_KHR_ray_query");
  3285. builder.addCapability(spv::Capability::RayQueryKHR);
  3286. noReturnValue = true;
  3287. break;
  3288. case glslang::EOpRayQueryProceed:
  3289. case glslang::EOpRayQueryGetIntersectionType:
  3290. case glslang::EOpRayQueryGetRayTMin:
  3291. case glslang::EOpRayQueryGetRayFlags:
  3292. case glslang::EOpRayQueryGetIntersectionT:
  3293. case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
  3294. case glslang::EOpRayQueryGetIntersectionInstanceId:
  3295. case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
  3296. case glslang::EOpRayQueryGetIntersectionGeometryIndex:
  3297. case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
  3298. case glslang::EOpRayQueryGetIntersectionBarycentrics:
  3299. case glslang::EOpRayQueryGetIntersectionFrontFace:
  3300. case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
  3301. case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
  3302. case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
  3303. case glslang::EOpRayQueryGetWorldRayDirection:
  3304. case glslang::EOpRayQueryGetWorldRayOrigin:
  3305. case glslang::EOpRayQueryGetIntersectionObjectToWorld:
  3306. case glslang::EOpRayQueryGetIntersectionWorldToObject:
  3307. builder.addExtension("SPV_KHR_ray_query");
  3308. builder.addCapability(spv::Capability::RayQueryKHR);
  3309. break;
  3310. case glslang::EOpCooperativeMatrixLoad:
  3311. case glslang::EOpCooperativeMatrixStore:
  3312. case glslang::EOpCooperativeMatrixLoadNV:
  3313. case glslang::EOpCooperativeMatrixStoreNV:
  3314. case glslang::EOpCooperativeMatrixLoadTensorNV:
  3315. case glslang::EOpCooperativeMatrixStoreTensorNV:
  3316. case glslang::EOpCooperativeMatrixReduceNV:
  3317. case glslang::EOpCooperativeMatrixPerElementOpNV:
  3318. case glslang::EOpCooperativeMatrixTransposeNV:
  3319. case glslang::EOpCooperativeVectorMatMulNV:
  3320. case glslang::EOpCooperativeVectorMatMulAddNV:
  3321. case glslang::EOpCooperativeVectorLoadNV:
  3322. case glslang::EOpCooperativeVectorStoreNV:
  3323. case glslang::EOpCooperativeVectorOuterProductAccumulateNV:
  3324. case glslang::EOpCooperativeVectorReduceSumAccumulateNV:
  3325. noReturnValue = true;
  3326. break;
  3327. case glslang::EOpBeginInvocationInterlock:
  3328. case glslang::EOpEndInvocationInterlock:
  3329. builder.addExtension(spv::E_SPV_EXT_fragment_shader_interlock);
  3330. noReturnValue = true;
  3331. break;
  3332. case glslang::EOpHitObjectTraceRayNV:
  3333. case glslang::EOpHitObjectTraceRayMotionNV:
  3334. case glslang::EOpHitObjectGetAttributesNV:
  3335. case glslang::EOpHitObjectExecuteShaderNV:
  3336. case glslang::EOpHitObjectRecordEmptyNV:
  3337. case glslang::EOpHitObjectRecordMissNV:
  3338. case glslang::EOpHitObjectRecordMissMotionNV:
  3339. case glslang::EOpHitObjectRecordHitNV:
  3340. case glslang::EOpHitObjectRecordHitMotionNV:
  3341. case glslang::EOpHitObjectRecordHitWithIndexNV:
  3342. case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
  3343. case glslang::EOpReorderThreadNV:
  3344. noReturnValue = true;
  3345. [[fallthrough]];
  3346. case glslang::EOpHitObjectIsEmptyNV:
  3347. case glslang::EOpHitObjectIsMissNV:
  3348. case glslang::EOpHitObjectIsHitNV:
  3349. case glslang::EOpHitObjectGetRayTMinNV:
  3350. case glslang::EOpHitObjectGetRayTMaxNV:
  3351. case glslang::EOpHitObjectGetObjectRayOriginNV:
  3352. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  3353. case glslang::EOpHitObjectGetWorldRayOriginNV:
  3354. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  3355. case glslang::EOpHitObjectGetObjectToWorldNV:
  3356. case glslang::EOpHitObjectGetWorldToObjectNV:
  3357. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  3358. case glslang::EOpHitObjectGetInstanceIdNV:
  3359. case glslang::EOpHitObjectGetGeometryIndexNV:
  3360. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  3361. case glslang::EOpHitObjectGetHitKindNV:
  3362. case glslang::EOpHitObjectGetCurrentTimeNV:
  3363. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  3364. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  3365. builder.addExtension(spv::E_SPV_NV_shader_invocation_reorder);
  3366. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  3367. break;
  3368. case glslang::EOpHitObjectGetLSSPositionsNV:
  3369. case glslang::EOpHitObjectGetLSSRadiiNV:
  3370. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3371. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  3372. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3373. noReturnValue = true;
  3374. break;
  3375. case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
  3376. case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
  3377. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3378. builder.addCapability(spv::Capability::RayQueryKHR);
  3379. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3380. noReturnValue = true;
  3381. break;
  3382. case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
  3383. case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
  3384. case glslang::EOpRayQueryIsSphereHitNV:
  3385. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3386. builder.addCapability(spv::Capability::RayQueryKHR);
  3387. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  3388. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3389. break;
  3390. case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
  3391. case glslang::EOpRayQueryIsLSSHitNV:
  3392. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  3393. builder.addCapability(spv::Capability::RayQueryKHR);
  3394. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  3395. break;
  3396. case glslang::EOpHitObjectTraceRayEXT:
  3397. case glslang::EOpHitObjectTraceRayMotionEXT:
  3398. case glslang::EOpHitObjectGetAttributesEXT:
  3399. case glslang::EOpHitObjectExecuteShaderEXT:
  3400. case glslang::EOpHitObjectRecordEmptyEXT:
  3401. case glslang::EOpHitObjectRecordMissEXT:
  3402. case glslang::EOpHitObjectRecordMissMotionEXT:
  3403. case glslang::EOpReorderThreadEXT:
  3404. case glslang::EOpHitObjectSetShaderBindingTableRecordIndexEXT:
  3405. case glslang::EOpHitObjectReorderExecuteEXT:
  3406. case glslang::EOpHitObjectTraceReorderExecuteEXT:
  3407. case glslang::EOpHitObjectTraceMotionReorderExecuteEXT:
  3408. case glslang::EOpHitObjectRecordFromQueryEXT:
  3409. case glslang::EOpHitObjectGetIntersectionTriangleVertexPositionsEXT:
  3410. noReturnValue = true;
  3411. [[fallthrough]];
  3412. case glslang::EOpHitObjectIsEmptyEXT:
  3413. case glslang::EOpHitObjectIsMissEXT:
  3414. case glslang::EOpHitObjectIsHitEXT:
  3415. case glslang::EOpHitObjectGetRayTMinEXT:
  3416. case glslang::EOpHitObjectGetRayTMaxEXT:
  3417. case glslang::EOpHitObjectGetRayFlagsEXT:
  3418. case glslang::EOpHitObjectGetObjectRayOriginEXT:
  3419. case glslang::EOpHitObjectGetObjectRayDirectionEXT:
  3420. case glslang::EOpHitObjectGetWorldRayOriginEXT:
  3421. case glslang::EOpHitObjectGetWorldRayDirectionEXT:
  3422. case glslang::EOpHitObjectGetObjectToWorldEXT:
  3423. case glslang::EOpHitObjectGetWorldToObjectEXT:
  3424. case glslang::EOpHitObjectGetInstanceCustomIndexEXT:
  3425. case glslang::EOpHitObjectGetInstanceIdEXT:
  3426. case glslang::EOpHitObjectGetGeometryIndexEXT:
  3427. case glslang::EOpHitObjectGetPrimitiveIndexEXT:
  3428. case glslang::EOpHitObjectGetHitKindEXT:
  3429. case glslang::EOpHitObjectGetCurrentTimeEXT:
  3430. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:
  3431. case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:
  3432. builder.addExtension(spv::E_SPV_EXT_shader_invocation_reorder);
  3433. builder.addCapability(spv::Capability::ShaderInvocationReorderEXT);
  3434. break;
  3435. case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
  3436. builder.addExtension(spv::E_SPV_KHR_ray_tracing_position_fetch);
  3437. builder.addCapability(spv::Capability::RayQueryPositionFetchKHR);
  3438. noReturnValue = true;
  3439. break;
  3440. case glslang::EOpImageSampleWeightedQCOM:
  3441. builder.addCapability(spv::Capability::TextureSampleWeightedQCOM);
  3442. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3443. break;
  3444. case glslang::EOpImageBoxFilterQCOM:
  3445. builder.addCapability(spv::Capability::TextureBoxFilterQCOM);
  3446. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3447. break;
  3448. case glslang::EOpImageBlockMatchSADQCOM:
  3449. case glslang::EOpImageBlockMatchSSDQCOM:
  3450. builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
  3451. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3452. break;
  3453. case glslang::EOpTensorWriteARM:
  3454. noReturnValue = true;
  3455. break;
  3456. case glslang::EOpImageBlockMatchWindowSSDQCOM:
  3457. case glslang::EOpImageBlockMatchWindowSADQCOM:
  3458. builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
  3459. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3460. builder.addCapability(spv::Capability::TextureBlockMatch2QCOM);
  3461. builder.addExtension(spv::E_SPV_QCOM_image_processing2);
  3462. break;
  3463. case glslang::EOpImageBlockMatchGatherSSDQCOM:
  3464. case glslang::EOpImageBlockMatchGatherSADQCOM:
  3465. builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
  3466. builder.addExtension(spv::E_SPV_QCOM_image_processing);
  3467. builder.addCapability(spv::Capability::TextureBlockMatch2QCOM);
  3468. builder.addExtension(spv::E_SPV_QCOM_image_processing2);
  3469. break;
  3470. case glslang::EOpFetchMicroTriangleVertexPositionNV:
  3471. case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
  3472. builder.addExtension(spv::E_SPV_NV_displacement_micromap);
  3473. builder.addCapability(spv::Capability::DisplacementMicromapNV);
  3474. break;
  3475. case glslang::EOpRayQueryGetIntersectionClusterIdNV:
  3476. builder.addExtension(spv::E_SPV_NV_cluster_acceleration_structure);
  3477. builder.addCapability(spv::Capability::RayQueryKHR);
  3478. builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
  3479. break;
  3480. case glslang::EOpDebugPrintf:
  3481. noReturnValue = true;
  3482. break;
  3483. default:
  3484. break;
  3485. }
  3486. //
  3487. // See if it maps to a regular operation.
  3488. //
  3489. if (binOp != glslang::EOpNull) {
  3490. glslang::TIntermTyped* left = node->getSequence()[0]->getAsTyped();
  3491. glslang::TIntermTyped* right = node->getSequence()[1]->getAsTyped();
  3492. assert(left && right);
  3493. builder.clearAccessChain();
  3494. left->traverse(this);
  3495. spv::Id leftId = accessChainLoad(left->getType());
  3496. builder.clearAccessChain();
  3497. right->traverse(this);
  3498. spv::Id rightId = accessChainLoad(right->getType());
  3499. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3500. OpDecorations decorations = { precision,
  3501. TranslateNoContractionDecoration(node->getType().getQualifier()),
  3502. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  3503. result = createBinaryOperation(binOp, decorations,
  3504. resultType(), leftId, rightId,
  3505. left->getType().getBasicType(), reduceComparison);
  3506. // code above should only make binOp that exists in createBinaryOperation
  3507. assert(result != spv::NoResult);
  3508. builder.clearAccessChain();
  3509. builder.setAccessChainRValue(result);
  3510. return false;
  3511. }
  3512. //
  3513. // Create the list of operands.
  3514. //
  3515. glslang::TIntermSequence& glslangOperands = node->getSequence();
  3516. std::vector<spv::Id> operands;
  3517. std::vector<spv::IdImmediate> memoryAccessOperands;
  3518. for (int arg = 0; arg < (int)glslangOperands.size(); ++arg) {
  3519. // special case l-value operands; there are just a few
  3520. bool lvalue = false;
  3521. switch (node->getOp()) {
  3522. case glslang::EOpModf:
  3523. if (arg == 1)
  3524. lvalue = true;
  3525. break;
  3526. case glslang::EOpHitObjectRecordFromQueryEXT:
  3527. case glslang::EOpHitObjectGetIntersectionTriangleVertexPositionsEXT:
  3528. if (arg == 0 || arg == 1)
  3529. lvalue = true;
  3530. break;
  3531. case glslang::EOpHitObjectRecordHitNV:
  3532. case glslang::EOpHitObjectRecordHitMotionNV:
  3533. case glslang::EOpHitObjectRecordHitWithIndexNV:
  3534. case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
  3535. case glslang::EOpHitObjectTraceRayNV:
  3536. case glslang::EOpHitObjectTraceRayMotionNV:
  3537. case glslang::EOpHitObjectExecuteShaderNV:
  3538. case glslang::EOpHitObjectRecordMissNV:
  3539. case glslang::EOpHitObjectRecordMissMotionNV:
  3540. case glslang::EOpHitObjectGetAttributesNV:
  3541. case glslang::EOpHitObjectGetClusterIdNV:
  3542. case glslang::EOpHitObjectTraceRayEXT:
  3543. case glslang::EOpHitObjectTraceRayMotionEXT:
  3544. case glslang::EOpHitObjectExecuteShaderEXT:
  3545. case glslang::EOpHitObjectRecordMissEXT:
  3546. case glslang::EOpHitObjectRecordMissMotionEXT:
  3547. case glslang::EOpHitObjectGetAttributesEXT:
  3548. case glslang::EOpHitObjectSetShaderBindingTableRecordIndexEXT:
  3549. case glslang::EOpHitObjectReorderExecuteEXT:
  3550. case glslang::EOpHitObjectTraceReorderExecuteEXT:
  3551. case glslang::EOpHitObjectTraceMotionReorderExecuteEXT:
  3552. if (arg == 0)
  3553. lvalue = true;
  3554. break;
  3555. case glslang::EOpHitObjectGetLSSPositionsNV:
  3556. case glslang::EOpHitObjectGetLSSRadiiNV:
  3557. lvalue = true;
  3558. break;
  3559. case glslang::EOpRayQueryInitialize:
  3560. case glslang::EOpRayQueryTerminate:
  3561. case glslang::EOpRayQueryConfirmIntersection:
  3562. case glslang::EOpRayQueryProceed:
  3563. case glslang::EOpRayQueryGenerateIntersection:
  3564. case glslang::EOpRayQueryGetIntersectionType:
  3565. case glslang::EOpRayQueryGetIntersectionT:
  3566. case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
  3567. case glslang::EOpRayQueryGetIntersectionInstanceId:
  3568. case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
  3569. case glslang::EOpRayQueryGetIntersectionGeometryIndex:
  3570. case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
  3571. case glslang::EOpRayQueryGetIntersectionBarycentrics:
  3572. case glslang::EOpRayQueryGetIntersectionFrontFace:
  3573. case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
  3574. case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
  3575. case glslang::EOpRayQueryGetIntersectionObjectToWorld:
  3576. case glslang::EOpRayQueryGetIntersectionWorldToObject:
  3577. case glslang::EOpRayQueryGetIntersectionClusterIdNV:
  3578. case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
  3579. case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
  3580. case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
  3581. case glslang::EOpRayQueryIsSphereHitNV:
  3582. case glslang::EOpRayQueryIsLSSHitNV:
  3583. if (arg == 0)
  3584. lvalue = true;
  3585. break;
  3586. case glslang::EOpAtomicAdd:
  3587. case glslang::EOpAtomicSubtract:
  3588. case glslang::EOpAtomicMin:
  3589. case glslang::EOpAtomicMax:
  3590. case glslang::EOpAtomicAnd:
  3591. case glslang::EOpAtomicOr:
  3592. case glslang::EOpAtomicXor:
  3593. case glslang::EOpAtomicExchange:
  3594. case glslang::EOpAtomicCompSwap:
  3595. if (arg == 0)
  3596. lvalue = true;
  3597. break;
  3598. case glslang::EOpFrexp:
  3599. if (arg == 1)
  3600. lvalue = true;
  3601. break;
  3602. case glslang::EOpInterpolateAtSample:
  3603. case glslang::EOpInterpolateAtOffset:
  3604. case glslang::EOpInterpolateAtVertex:
  3605. if (arg == 0) {
  3606. // If GLSL, use the address of the interpolant argument.
  3607. // If HLSL, use an internal version of OpInterpolates that takes
  3608. // the rvalue of the interpolant. A fixup pass in spirv-opt
  3609. // legalization will remove the OpLoad and convert to an lvalue.
  3610. // Had to do this because legalization will only propagate a
  3611. // builtin into an rvalue.
  3612. lvalue = glslangIntermediate->getSource() != glslang::EShSourceHlsl;
  3613. // Does it need a swizzle inversion? If so, evaluation is inverted;
  3614. // operate first on the swizzle base, then apply the swizzle.
  3615. // That is, we transform
  3616. //
  3617. // interpolate(v.zy) -> interpolate(v).zy
  3618. //
  3619. if (glslangOperands[0]->getAsOperator() &&
  3620. glslangOperands[0]->getAsOperator()->getOp() == glslang::EOpVectorSwizzle)
  3621. invertedType = convertGlslangToSpvType(
  3622. glslangOperands[0]->getAsBinaryNode()->getLeft()->getType());
  3623. }
  3624. break;
  3625. case glslang::EOpAtomicLoad:
  3626. case glslang::EOpAtomicStore:
  3627. case glslang::EOpAtomicCounterAdd:
  3628. case glslang::EOpAtomicCounterSubtract:
  3629. case glslang::EOpAtomicCounterMin:
  3630. case glslang::EOpAtomicCounterMax:
  3631. case glslang::EOpAtomicCounterAnd:
  3632. case glslang::EOpAtomicCounterOr:
  3633. case glslang::EOpAtomicCounterXor:
  3634. case glslang::EOpAtomicCounterExchange:
  3635. case glslang::EOpAtomicCounterCompSwap:
  3636. if (arg == 0)
  3637. lvalue = true;
  3638. break;
  3639. case glslang::EOpAddCarry:
  3640. case glslang::EOpSubBorrow:
  3641. if (arg == 2)
  3642. lvalue = true;
  3643. break;
  3644. case glslang::EOpUMulExtended:
  3645. case glslang::EOpIMulExtended:
  3646. if (arg >= 2)
  3647. lvalue = true;
  3648. break;
  3649. case glslang::EOpCooperativeMatrixLoad:
  3650. case glslang::EOpCooperativeMatrixLoadNV:
  3651. case glslang::EOpCooperativeMatrixLoadTensorNV:
  3652. case glslang::EOpCooperativeVectorLoadNV:
  3653. if (arg == 0 || arg == 1)
  3654. lvalue = true;
  3655. break;
  3656. case glslang::EOpCooperativeMatrixStore:
  3657. case glslang::EOpCooperativeMatrixStoreNV:
  3658. case glslang::EOpCooperativeMatrixStoreTensorNV:
  3659. case glslang::EOpCooperativeVectorStoreNV:
  3660. if (arg == 1)
  3661. lvalue = true;
  3662. break;
  3663. case glslang::EOpCooperativeVectorMatMulNV:
  3664. if (arg == 0 || arg == 3)
  3665. lvalue = true;
  3666. break;
  3667. case glslang::EOpCooperativeVectorMatMulAddNV:
  3668. if (arg == 0 || arg == 3 || arg == 6)
  3669. lvalue = true;
  3670. break;
  3671. case glslang::EOpCooperativeVectorOuterProductAccumulateNV:
  3672. if (arg == 2)
  3673. lvalue = true;
  3674. break;
  3675. case glslang::EOpCooperativeVectorReduceSumAccumulateNV:
  3676. if (arg == 1)
  3677. lvalue = true;
  3678. break;
  3679. case glslang::EOpCooperativeMatrixReduceNV:
  3680. case glslang::EOpCooperativeMatrixPerElementOpNV:
  3681. case glslang::EOpCooperativeMatrixTransposeNV:
  3682. if (arg == 0)
  3683. lvalue = true;
  3684. break;
  3685. case glslang::EOpSpirvInst:
  3686. if (glslangOperands[arg]->getAsTyped()->getQualifier().isSpirvByReference())
  3687. lvalue = true;
  3688. break;
  3689. case glslang::EOpReorderThreadNV:
  3690. case glslang::EOpReorderThreadEXT:
  3691. //Three variants of reorderThreadNV, two of them use hitObjectNV
  3692. if (arg == 0 && glslangOperands.size() != 2)
  3693. lvalue = true;
  3694. break;
  3695. case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
  3696. case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
  3697. case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
  3698. if (arg == 0 || arg == 2)
  3699. lvalue = true;
  3700. break;
  3701. case glslang::EOpTensorReadARM:
  3702. if (arg == 2)
  3703. lvalue = true;
  3704. break;
  3705. default:
  3706. break;
  3707. }
  3708. builder.clearAccessChain();
  3709. if (invertedType != spv::NoType && arg == 0)
  3710. glslangOperands[0]->getAsBinaryNode()->getLeft()->traverse(this);
  3711. else
  3712. glslangOperands[arg]->traverse(this);
  3713. bool isCoopMat = node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  3714. node->getOp() == glslang::EOpCooperativeMatrixStore ||
  3715. node->getOp() == glslang::EOpCooperativeMatrixLoadNV ||
  3716. node->getOp() == glslang::EOpCooperativeMatrixStoreNV ||
  3717. node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV ||
  3718. node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV;
  3719. bool isCoopVec = node->getOp() == glslang::EOpCooperativeVectorLoadNV ||
  3720. node->getOp() == glslang::EOpCooperativeVectorStoreNV;
  3721. if (isCoopMat || isCoopVec) {
  3722. if (arg == 1) {
  3723. spv::Builder::AccessChain::CoherentFlags coherentFlags {};
  3724. unsigned int alignment {};
  3725. if (isCoopMat) {
  3726. // fold "element" parameter into the access chain
  3727. spv::Builder::AccessChain save = builder.getAccessChain();
  3728. builder.clearAccessChain();
  3729. glslangOperands[2]->traverse(this);
  3730. spv::Id elementId = accessChainLoad(glslangOperands[2]->getAsTyped()->getType());
  3731. builder.setAccessChain(save);
  3732. // Point to the first element of the array.
  3733. builder.accessChainPush(elementId,
  3734. TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType()),
  3735. glslangOperands[arg]->getAsTyped()->getType().getBufferReferenceAlignment());
  3736. coherentFlags = builder.getAccessChain().coherentFlags;
  3737. alignment = builder.getAccessChain().alignment;
  3738. } else {
  3739. coherentFlags = builder.getAccessChain().coherentFlags;
  3740. coherentFlags |= TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType());
  3741. alignment = 16;
  3742. }
  3743. spv::MemoryAccessMask memoryAccess = TranslateMemoryAccess(coherentFlags);
  3744. if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  3745. node->getOp() == glslang::EOpCooperativeMatrixLoadNV ||
  3746. node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV ||
  3747. node->getOp() == glslang::EOpCooperativeVectorLoadNV)
  3748. memoryAccess = (memoryAccess & ~spv::MemoryAccessMask::MakePointerAvailableKHR);
  3749. if (node->getOp() == glslang::EOpCooperativeMatrixStore ||
  3750. node->getOp() == glslang::EOpCooperativeMatrixStoreNV ||
  3751. node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV ||
  3752. node->getOp() == glslang::EOpCooperativeVectorStoreNV)
  3753. memoryAccess = (memoryAccess & ~spv::MemoryAccessMask::MakePointerVisibleKHR);
  3754. if (builder.getStorageClass(builder.getAccessChain().base) ==
  3755. spv::StorageClass::PhysicalStorageBufferEXT) {
  3756. memoryAccess = (spv::MemoryAccessMask)(memoryAccess | spv::MemoryAccessMask::Aligned);
  3757. }
  3758. memoryAccessOperands.push_back(spv::IdImmediate(false, memoryAccess));
  3759. if (anySet(memoryAccess, spv::MemoryAccessMask::Aligned)) {
  3760. memoryAccessOperands.push_back(spv::IdImmediate(false, alignment));
  3761. }
  3762. if (anySet(memoryAccess,
  3763. spv::MemoryAccessMask::MakePointerAvailableKHR | spv::MemoryAccessMask::MakePointerVisibleKHR)) {
  3764. memoryAccessOperands.push_back(spv::IdImmediate(true,
  3765. builder.makeUintConstant(TranslateMemoryScope(coherentFlags))));
  3766. }
  3767. } else if (isCoopMat && arg == 2) {
  3768. continue;
  3769. }
  3770. }
  3771. // for l-values, pass the address, for r-values, pass the value
  3772. if (lvalue) {
  3773. if (invertedType == spv::NoType && !builder.isSpvLvalue()) {
  3774. // SPIR-V cannot represent an l-value containing a swizzle that doesn't
  3775. // reduce to a simple access chain. So, we need a temporary vector to
  3776. // receive the result, and must later swizzle that into the original
  3777. // l-value.
  3778. complexLvalues.push_back(builder.getAccessChain());
  3779. temporaryLvalues.push_back(builder.createVariable(
  3780. spv::NoPrecision, spv::StorageClass::Function,
  3781. builder.accessChainGetInferredType(), "swizzleTemp"));
  3782. operands.push_back(temporaryLvalues.back());
  3783. } else {
  3784. operands.push_back(builder.accessChainGetLValue());
  3785. }
  3786. lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
  3787. lvalueCoherentFlags |= TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType());
  3788. } else {
  3789. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3790. glslang::TOperator glslangOp = node->getOp();
  3791. if (arg == 1 &&
  3792. (glslangOp == glslang::EOpRayQueryGetIntersectionType ||
  3793. glslangOp == glslang::EOpRayQueryGetIntersectionT ||
  3794. glslangOp == glslang::EOpRayQueryGetIntersectionInstanceCustomIndex ||
  3795. glslangOp == glslang::EOpRayQueryGetIntersectionInstanceId ||
  3796. glslangOp == glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset ||
  3797. glslangOp == glslang::EOpRayQueryGetIntersectionGeometryIndex ||
  3798. glslangOp == glslang::EOpRayQueryGetIntersectionPrimitiveIndex ||
  3799. glslangOp == glslang::EOpRayQueryGetIntersectionBarycentrics ||
  3800. glslangOp == glslang::EOpRayQueryGetIntersectionFrontFace ||
  3801. glslangOp == glslang::EOpRayQueryGetIntersectionObjectRayDirection ||
  3802. glslangOp == glslang::EOpRayQueryGetIntersectionObjectRayOrigin ||
  3803. glslangOp == glslang::EOpRayQueryGetIntersectionObjectToWorld ||
  3804. glslangOp == glslang::EOpRayQueryGetIntersectionWorldToObject ||
  3805. glslangOp == glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT ||
  3806. glslangOp == glslang::EOpRayQueryGetIntersectionClusterIdNV ||
  3807. glslangOp == glslang::EOpRayQueryGetIntersectionSpherePositionNV ||
  3808. glslangOp == glslang::EOpRayQueryGetIntersectionSphereRadiusNV ||
  3809. glslangOp == glslang::EOpRayQueryGetIntersectionLSSHitValueNV ||
  3810. glslangOp == glslang::EOpRayQueryGetIntersectionLSSPositionsNV ||
  3811. glslangOp == glslang::EOpRayQueryGetIntersectionLSSRadiiNV ||
  3812. glslangOp == glslang::EOpRayQueryIsLSSHitNV ||
  3813. glslangOp == glslang::EOpRayQueryIsSphereHitNV
  3814. )) {
  3815. bool cond = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getBConst();
  3816. operands.push_back(builder.makeIntConstant(cond ? 1 : 0));
  3817. } else if ((arg == 10 && glslangOp == glslang::EOpTraceKHR) ||
  3818. (arg == 11 && glslangOp == glslang::EOpTraceRayMotionNV) ||
  3819. (arg == 1 && glslangOp == glslang::EOpExecuteCallableKHR) ||
  3820. (arg == 1 && glslangOp == glslang::EOpHitObjectExecuteShaderNV) ||
  3821. (arg == 1 && glslangOp == glslang::EOpHitObjectExecuteShaderEXT) ||
  3822. (arg == 11 && glslangOp == glslang::EOpHitObjectTraceRayNV) ||
  3823. (arg == 11 && glslangOp == glslang::EOpHitObjectTraceRayEXT) ||
  3824. (arg == 12 && glslangOp == glslang::EOpHitObjectTraceRayMotionNV) ||
  3825. (arg == 12 && glslangOp == glslang::EOpHitObjectTraceRayMotionEXT) ||
  3826. (arg == 12 && glslangOp == glslang::EOpHitObjectTraceMotionReorderExecuteEXT && glslangOperands.size() == 13) ||
  3827. (arg == 14 && glslangOp == glslang::EOpHitObjectTraceMotionReorderExecuteEXT && glslangOperands.size() == 15) ||
  3828. (arg == 11 && glslangOp == glslang::EOpHitObjectTraceReorderExecuteEXT && glslangOperands.size() == 12) ||
  3829. (arg == 13 && glslangOp == glslang::EOpHitObjectTraceReorderExecuteEXT && glslangOperands.size() == 14) ||
  3830. (arg == 1 && glslangOp == glslang::EOpHitObjectReorderExecuteEXT && glslangOperands.size() == 2) ||
  3831. (arg == 3 && glslangOp == glslang::EOpHitObjectReorderExecuteEXT && glslangOperands.size() == 4)) {
  3832. const int set = glslangOp == glslang::EOpExecuteCallableKHR ? 1 : 0;
  3833. const int location = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getUConst();
  3834. auto itNode = locationToSymbol[set].find(location);
  3835. visitSymbol(itNode->second);
  3836. spv::Id symId = getSymbolId(itNode->second);
  3837. operands.push_back(symId);
  3838. } else if ((arg == 12 && glslangOp == glslang::EOpHitObjectRecordHitNV) ||
  3839. (arg == 13 && glslangOp == glslang::EOpHitObjectRecordHitMotionNV) ||
  3840. (arg == 11 && glslangOp == glslang::EOpHitObjectRecordHitWithIndexNV) ||
  3841. (arg == 12 && glslangOp == glslang::EOpHitObjectRecordHitWithIndexMotionNV) ||
  3842. (arg == 3 && glslangOp == glslang::EOpHitObjectRecordFromQueryEXT) ||
  3843. (arg == 1 && glslangOp == glslang::EOpHitObjectGetAttributesEXT) ||
  3844. (arg == 1 && glslangOp == glslang::EOpHitObjectGetAttributesNV)) {
  3845. const int location = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getUConst();
  3846. const int set = 2;
  3847. auto itNode = locationToSymbol[set].find(location);
  3848. visitSymbol(itNode->second);
  3849. spv::Id symId = getSymbolId(itNode->second);
  3850. operands.push_back(symId);
  3851. } else if (glslangOperands[arg]->getAsTyped()->getQualifier().isSpirvLiteral()) {
  3852. // Will be translated to a literal value, make a placeholder here
  3853. operands.push_back(spv::NoResult);
  3854. } else if (glslangOperands[arg]->getAsTyped()->getBasicType() == glslang::EbtFunction) {
  3855. spv::Function* function = functionMap[glslangOperands[arg]->getAsSymbolNode()->getMangledName().c_str()];
  3856. assert(function);
  3857. operands.push_back(function->getId());
  3858. } else {
  3859. operands.push_back(accessChainLoad(glslangOperands[arg]->getAsTyped()->getType()));
  3860. }
  3861. }
  3862. }
  3863. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  3864. if (node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV) {
  3865. std::vector<spv::IdImmediate> idImmOps;
  3866. builder.addCapability(spv::Capability::CooperativeMatrixTensorAddressingNV);
  3867. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3868. spv::Id object = builder.createLoad(operands[0], spv::NoPrecision);
  3869. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // Pointer
  3870. idImmOps.push_back(spv::IdImmediate(true, object)); // Object
  3871. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // tensorLayout
  3872. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end()); // memoryaccess
  3873. // initialize tensor operands to zero, then OR in flags based on the operands
  3874. size_t tensorOpIdx = idImmOps.size();
  3875. idImmOps.push_back(spv::IdImmediate(false, 0));
  3876. for (uint32_t i = 3; i < operands.size(); ++i) {
  3877. if (builder.isTensorView(operands[i])) {
  3878. addMask(idImmOps[tensorOpIdx].word, spv::TensorAddressingOperandsMask::TensorView);
  3879. } else {
  3880. // must be the decode func
  3881. addMask(idImmOps[tensorOpIdx].word, spv::TensorAddressingOperandsMask::DecodeFunc);
  3882. builder.addCapability(spv::Capability::CooperativeMatrixBlockLoadsNV);
  3883. }
  3884. idImmOps.push_back(spv::IdImmediate(true, operands[i])); // tensorView or decodeFunc
  3885. }
  3886. // get the pointee type
  3887. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3888. assert(builder.isCooperativeMatrixType(typeId));
  3889. // do the op
  3890. spv::Id result = builder.createOp(spv::Op::OpCooperativeMatrixLoadTensorNV, typeId, idImmOps);
  3891. // store the result to the pointer (out param 'm')
  3892. builder.createStore(result, operands[0]);
  3893. result = 0;
  3894. } else if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  3895. node->getOp() == glslang::EOpCooperativeMatrixLoadNV) {
  3896. std::vector<spv::IdImmediate> idImmOps;
  3897. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3898. if (node->getOp() == glslang::EOpCooperativeMatrixLoad) {
  3899. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // matrixLayout
  3900. auto layout = (spv::CooperativeMatrixLayout)builder.getConstantScalar(operands[3]);
  3901. if (layout == spv::CooperativeMatrixLayout::RowBlockedInterleavedARM ||
  3902. layout == spv::CooperativeMatrixLayout::ColumnBlockedInterleavedARM) {
  3903. builder.addExtension(spv::E_SPV_ARM_cooperative_matrix_layouts);
  3904. builder.addCapability(spv::Capability::CooperativeMatrixLayoutsARM);
  3905. }
  3906. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3907. } else {
  3908. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3909. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor
  3910. }
  3911. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  3912. // get the pointee type
  3913. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  3914. assert(builder.isCooperativeMatrixType(typeId));
  3915. // do the op
  3916. spv::Id result = node->getOp() == glslang::EOpCooperativeMatrixLoad
  3917. ? builder.createOp(spv::Op::OpCooperativeMatrixLoadKHR, typeId, idImmOps)
  3918. : builder.createOp(spv::Op::OpCooperativeMatrixLoadNV, typeId, idImmOps);
  3919. // store the result to the pointer (out param 'm')
  3920. builder.createStore(result, operands[0]);
  3921. result = 0;
  3922. } else if (node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV) {
  3923. std::vector<spv::IdImmediate> idImmOps;
  3924. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3925. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  3926. builder.addCapability(spv::Capability::CooperativeMatrixTensorAddressingNV);
  3927. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  3928. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // tensorLayout
  3929. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end()); // memoryaccess
  3930. if (operands.size() > 3) {
  3931. idImmOps.push_back(spv::IdImmediate(false, spv::TensorAddressingOperandsMask::TensorView));
  3932. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // tensorView
  3933. } else {
  3934. idImmOps.push_back(spv::IdImmediate(false, 0));
  3935. }
  3936. builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreTensorNV, idImmOps);
  3937. result = 0;
  3938. } else if (node->getOp() == glslang::EOpCooperativeMatrixStore ||
  3939. node->getOp() == glslang::EOpCooperativeMatrixStoreNV) {
  3940. std::vector<spv::IdImmediate> idImmOps;
  3941. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  3942. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  3943. if (node->getOp() == glslang::EOpCooperativeMatrixStore) {
  3944. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // matrixLayout
  3945. auto layout = (spv::CooperativeMatrixLayout)builder.getConstantScalar(operands[3]);
  3946. if (layout == spv::CooperativeMatrixLayout::RowBlockedInterleavedARM ||
  3947. layout == spv::CooperativeMatrixLayout::ColumnBlockedInterleavedARM) {
  3948. builder.addExtension(spv::E_SPV_ARM_cooperative_matrix_layouts);
  3949. builder.addCapability(spv::Capability::CooperativeMatrixLayoutsARM);
  3950. }
  3951. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3952. } else {
  3953. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  3954. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor
  3955. }
  3956. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  3957. if (node->getOp() == glslang::EOpCooperativeMatrixStore)
  3958. builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreKHR, idImmOps);
  3959. else
  3960. builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreNV, idImmOps);
  3961. result = 0;
  3962. } else if (node->getOp() == glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT) {
  3963. std::vector<spv::IdImmediate> idImmOps;
  3964. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
  3965. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
  3966. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  3967. builder.makeUintConstant(3), 0);
  3968. // do the op
  3969. spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionTriangleVertexPositionsKHR;
  3970. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3971. // store the result to the pointer (out param 'm')
  3972. builder.createStore(result, operands[2]);
  3973. result = 0;
  3974. } else if (node->getOp() == glslang::EOpRayQueryGetIntersectionLSSPositionsNV) {
  3975. std::vector<spv::IdImmediate> idImmOps;
  3976. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
  3977. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
  3978. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  3979. builder.makeUintConstant(2), 0);
  3980. // do the op
  3981. spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionLSSPositionsNV;
  3982. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3983. // store the result to the pointer (out param 'm')
  3984. builder.createStore(result, operands[2]);
  3985. result = 0;
  3986. } else if (node->getOp() == glslang::EOpRayQueryGetIntersectionLSSRadiiNV) {
  3987. std::vector<spv::IdImmediate> idImmOps;
  3988. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
  3989. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
  3990. spv::Id typeId = builder.makeArrayType(builder.makeFloatType(32),
  3991. builder.makeUintConstant(2), 0);
  3992. // do the op
  3993. spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionLSSRadiiNV;
  3994. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  3995. // store the result to the pointer (out param 'm')
  3996. builder.createStore(result, operands[2]);
  3997. result = 0;
  3998. } else if (node->getOp() == glslang::EOpHitObjectGetLSSPositionsNV) {
  3999. std::vector<spv::IdImmediate> idImmOps;
  4000. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
  4001. spv::Op spvOp = spv::Op::OpHitObjectGetLSSPositionsNV;
  4002. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  4003. builder.makeUintConstant(2), 0);
  4004. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  4005. // store the result to the pointer (out param 'm')
  4006. builder.createStore(result, operands[1]);
  4007. result = 0;
  4008. } else if (node->getOp() == glslang::EOpHitObjectGetLSSRadiiNV) {
  4009. std::vector<spv::IdImmediate> idImmOps;
  4010. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
  4011. spv::Op spvOp = spv::Op::OpHitObjectGetLSSRadiiNV;
  4012. spv::Id typeId = builder.makeArrayType(builder.makeFloatType(32),
  4013. builder.makeUintConstant(2), 0);
  4014. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  4015. // store the result to the pointer (out param 'm')
  4016. builder.createStore(result, operands[1]);
  4017. result = 0;
  4018. } else if (node->getOp() == glslang::EOpHitObjectGetIntersectionTriangleVertexPositionsEXT) {
  4019. std::vector<spv::IdImmediate> idImmOps;
  4020. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
  4021. spv::Op spvOp = spv::Op::OpHitObjectGetIntersectionTriangleVertexPositionsEXT;
  4022. spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
  4023. builder.makeUintConstant(3), 0);
  4024. spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
  4025. // store the result to the pointer (out param 'm')
  4026. builder.createStore(result, operands[1]);
  4027. result = 0;
  4028. } else if (node->getOp() == glslang::EOpCooperativeMatrixMulAdd) {
  4029. auto matrixOperands = spv::CooperativeMatrixOperandsMask::MaskNone;
  4030. // If the optional operand is present, initialize matrixOperands to that value.
  4031. if (glslangOperands.size() == 4 && glslangOperands[3]->getAsConstantUnion()) {
  4032. matrixOperands = (spv::CooperativeMatrixOperandsMask)glslangOperands[3]->getAsConstantUnion()->getConstArray()[0].getIConst();
  4033. }
  4034. // Determine Cooperative Matrix Operands bits from the signedness of the types.
  4035. if (isTypeSignedInt(glslangOperands[0]->getAsTyped()->getBasicType()))
  4036. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixASignedComponentsKHR);
  4037. if (isTypeSignedInt(glslangOperands[1]->getAsTyped()->getBasicType()))
  4038. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixBSignedComponentsKHR);
  4039. if (isTypeSignedInt(glslangOperands[2]->getAsTyped()->getBasicType()))
  4040. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixCSignedComponentsKHR);
  4041. if (isTypeSignedInt(node->getBasicType()))
  4042. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixResultSignedComponentsKHR);
  4043. std::vector<spv::IdImmediate> idImmOps;
  4044. idImmOps.push_back(spv::IdImmediate(true, operands[0]));
  4045. idImmOps.push_back(spv::IdImmediate(true, operands[1]));
  4046. idImmOps.push_back(spv::IdImmediate(true, operands[2]));
  4047. if (matrixOperands != spv::CooperativeMatrixOperandsMask::MaskNone)
  4048. idImmOps.push_back(spv::IdImmediate(false, matrixOperands));
  4049. result = builder.createOp(spv::Op::OpCooperativeMatrixMulAddKHR, resultType(), idImmOps);
  4050. } else if (node->getOp() == glslang::EOpCooperativeMatrixReduceNV) {
  4051. builder.addCapability(spv::Capability::CooperativeMatrixReductionsNV);
  4052. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  4053. spv::Op opcode = spv::Op::OpCooperativeMatrixReduceNV;
  4054. unsigned mask = glslangOperands[2]->getAsConstantUnion()->getConstArray()[0].getUConst();
  4055. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  4056. assert(builder.isCooperativeMatrixType(typeId));
  4057. result = builder.createCooperativeMatrixReduce(opcode, typeId, operands[1], mask, operands[3]);
  4058. // store the result to the pointer (out param 'm')
  4059. builder.createStore(result, operands[0]);
  4060. result = 0;
  4061. } else if (node->getOp() == glslang::EOpCooperativeMatrixPerElementOpNV) {
  4062. builder.addCapability(spv::Capability::CooperativeMatrixPerElementOperationsNV);
  4063. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  4064. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  4065. assert(builder.isCooperativeMatrixType(typeId));
  4066. result = builder.createCooperativeMatrixPerElementOp(typeId, operands);
  4067. // store the result to the pointer
  4068. builder.createStore(result, operands[0]);
  4069. result = 0;
  4070. } else if (node->getOp() == glslang::EOpCooperativeMatrixTransposeNV) {
  4071. builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
  4072. builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
  4073. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  4074. assert(builder.isCooperativeMatrixType(typeId));
  4075. result = builder.createUnaryOp(spv::Op::OpCooperativeMatrixTransposeNV, typeId, operands[1]);
  4076. // store the result to the pointer
  4077. builder.createStore(result, operands[0]);
  4078. result = 0;
  4079. } else if (node->getOp() == glslang::EOpBitCastArrayQCOM) {
  4080. builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
  4081. builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
  4082. result = builder.createUnaryOp(spv::Op::OpBitCastArrayQCOM, resultType(), operands[0]);
  4083. } else if (node->getOp() == glslang::EOpCompositeConstructCoopMatQCOM) {
  4084. builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
  4085. builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
  4086. result = builder.createUnaryOp(spv::Op::OpCompositeConstructCoopMatQCOM, resultType(), operands[0]);
  4087. } else if (node->getOp() == glslang::EOpCompositeExtractCoopMatQCOM) {
  4088. builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
  4089. builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
  4090. result = builder.createUnaryOp(spv::Op::OpCompositeExtractCoopMatQCOM, resultType(), operands[0]);
  4091. } else if (node->getOp() == glslang::EOpExtractSubArrayQCOM) {
  4092. builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
  4093. builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
  4094. std::vector<spv::Id> arguments { operands[0], operands[1] };;
  4095. result = builder.createOp(spv::Op::OpExtractSubArrayQCOM, resultType(), arguments);
  4096. } else if (node->getOp() == glslang::EOpCooperativeVectorMatMulNV ||
  4097. node->getOp() == glslang::EOpCooperativeVectorMatMulAddNV) {
  4098. auto matrixOperands = spv::CooperativeMatrixOperandsMask::MaskNone;
  4099. bool isMulAdd = node->getOp() == glslang::EOpCooperativeVectorMatMulAddNV;
  4100. // Determine Cooperative Matrix Operands bits from the signedness of the types.
  4101. if (isTypeSignedInt(glslangOperands[1]->getAsTyped()->getBasicType()))
  4102. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixBSignedComponentsKHR);
  4103. if (isTypeSignedInt(glslangOperands[0]->getAsTyped()->getBasicType()))
  4104. addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixResultSignedComponentsKHR);
  4105. uint32_t opIdx = 1;
  4106. std::vector<spv::IdImmediate> idImmOps;
  4107. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Input
  4108. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // InputInterpretation
  4109. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Matrix
  4110. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixOffset
  4111. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixInterpretation
  4112. if (isMulAdd) {
  4113. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Bias
  4114. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // BiasOffset
  4115. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // BiasInterpretation
  4116. }
  4117. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // M
  4118. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // K
  4119. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MemoryLayout
  4120. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Transpose
  4121. idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixStride
  4122. if (matrixOperands != spv::CooperativeMatrixOperandsMask::MaskNone)
  4123. idImmOps.push_back(spv::IdImmediate(false, matrixOperands)); // Cooperative Matrix Operands
  4124. // get the pointee type
  4125. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  4126. assert(builder.isCooperativeVectorType(typeId));
  4127. // do the op
  4128. spv::Id result = builder.createOp(isMulAdd ? spv::Op::OpCooperativeVectorMatrixMulAddNV : spv::Op::OpCooperativeVectorMatrixMulNV, typeId, idImmOps);
  4129. // store the result to the pointer (out param 'res')
  4130. builder.createStore(result, operands[0]);
  4131. result = 0;
  4132. } else if (node->getOp() == glslang::EOpCooperativeVectorLoadNV) {
  4133. std::vector<spv::IdImmediate> idImmOps;
  4134. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  4135. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // offset
  4136. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  4137. // get the pointee type
  4138. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  4139. assert(builder.isCooperativeVectorType(typeId));
  4140. // do the op
  4141. spv::Id result = builder.createOp(spv::Op::OpCooperativeVectorLoadNV, typeId, idImmOps);
  4142. // store the result to the pointer (out param 'v')
  4143. builder.createStore(result, operands[0]);
  4144. result = 0;
  4145. } else if (node->getOp() == glslang::EOpCooperativeVectorStoreNV) {
  4146. std::vector<spv::IdImmediate> idImmOps;
  4147. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  4148. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // offset
  4149. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  4150. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  4151. builder.createNoResultOp(spv::Op::OpCooperativeVectorStoreNV, idImmOps);
  4152. result = 0;
  4153. } else if (node->getOp() == glslang::EOpCooperativeVectorOuterProductAccumulateNV) {
  4154. builder.addCapability(spv::Capability::CooperativeVectorTrainingNV);
  4155. builder.addExtension(spv::E_SPV_NV_cooperative_vector);
  4156. std::vector<spv::IdImmediate> idImmOps;
  4157. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // Matrix
  4158. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // Offset
  4159. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // A
  4160. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // B
  4161. idImmOps.push_back(spv::IdImmediate(true, operands[5])); // MemoryLayout
  4162. idImmOps.push_back(spv::IdImmediate(true, operands[6])); // MatrixInterpretation
  4163. idImmOps.push_back(spv::IdImmediate(true, operands[4])); // Stride
  4164. builder.createNoResultOp(spv::Op::OpCooperativeVectorOuterProductAccumulateNV, idImmOps);
  4165. result = 0;
  4166. } else if (node->getOp() == glslang::EOpCooperativeVectorReduceSumAccumulateNV) {
  4167. builder.addCapability(spv::Capability::CooperativeVectorTrainingNV);
  4168. builder.addExtension(spv::E_SPV_NV_cooperative_vector);
  4169. std::vector<spv::IdImmediate> idImmOps;
  4170. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // Buf
  4171. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // Offset
  4172. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // A
  4173. builder.createNoResultOp(spv::Op::OpCooperativeVectorReduceSumAccumulateNV, idImmOps);
  4174. result = 0;
  4175. } else if (node->getOp() == glslang::EOpTensorReadARM ||
  4176. node->getOp() == glslang::EOpTensorWriteARM) {
  4177. const bool isWrite = node->getOp() == glslang::EOpTensorWriteARM;
  4178. const unsigned int tensorMinOperandCount = 3;
  4179. assert(operands.size() >= tensorMinOperandCount);
  4180. std::vector<spv::IdImmediate> idImmOps;
  4181. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // tensor
  4182. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // coords
  4183. if (isWrite) {
  4184. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // value
  4185. }
  4186. // Analyze the tensor operands
  4187. spv::IdImmediate tensorOperands = { false, uint32_t(spv::TensorOperandsMask::MaskNone) };
  4188. bool pushExtraArg = false;
  4189. if (operands.size() > tensorMinOperandCount) {
  4190. auto enumVal = builder.getConstantScalar(operands[tensorMinOperandCount]);
  4191. if (enumVal & uint32_t(spv::TensorOperandsMask::NontemporalARM)) {
  4192. tensorOperands.word |= uint32_t(spv::TensorOperandsMask::NontemporalARM);
  4193. }
  4194. if (enumVal & uint32_t(spv::TensorOperandsMask::OutOfBoundsValueARM)) {
  4195. tensorOperands.word |= uint32_t(spv::TensorOperandsMask::OutOfBoundsValueARM);
  4196. assert(operands.size() >= tensorMinOperandCount + 2 &&
  4197. "TensorOperandsOutOfBoundsValueMask requires an additional value");
  4198. pushExtraArg = true;
  4199. }
  4200. }
  4201. // Append optional tensor operands if the mask was non-zero.
  4202. if (tensorOperands.word) {
  4203. idImmOps.push_back(tensorOperands);
  4204. if (pushExtraArg)
  4205. idImmOps.push_back(spv::IdImmediate(true, operands[tensorMinOperandCount + 1]));
  4206. }
  4207. if (isWrite) {
  4208. builder.createNoResultOp(spv::Op::OpTensorWriteARM, idImmOps);
  4209. result = 0;
  4210. } else {
  4211. // Use the result argument type as the OpTensorReadARM result type.
  4212. const glslang::TType &resArgType = glslangOperands[2]->getAsTyped()->getType();
  4213. spv::Id retType = convertGlslangToSpvType(resArgType);
  4214. result = builder.createOp(spv::Op::OpTensorReadARM, retType, idImmOps);
  4215. // Store the result to the result argument.
  4216. builder.createStore(result, operands[2]);
  4217. }
  4218. } else if (node->getOp() == glslang::EOpTensorSizeARM) {
  4219. // Expected operands are (tensor, dimension)
  4220. assert(operands.size() == 2);
  4221. spv::Id tensorOp = operands[0];
  4222. spv::Id dimOp = operands[1];
  4223. assert(builder.isTensorTypeARM(builder.getTypeId(tensorOp)) && "operand #0 must be a tensor");
  4224. std::vector<spv::IdImmediate> idImmOps;
  4225. idImmOps.push_back(spv::IdImmediate(true, tensorOp));
  4226. idImmOps.push_back(spv::IdImmediate(true, dimOp));
  4227. result = builder.createOp(spv::Op::OpTensorQuerySizeARM, resultType(), idImmOps);
  4228. } else if (atomic) {
  4229. // Handle all atomics
  4230. glslang::TBasicType typeProxy = (node->getOp() == glslang::EOpAtomicStore)
  4231. ? node->getSequence()[0]->getAsTyped()->getBasicType() : node->getBasicType();
  4232. result = createAtomicOperation(node->getOp(), precision, resultType(), operands, typeProxy,
  4233. lvalueCoherentFlags, node->getType());
  4234. } else if (node->getOp() == glslang::EOpSpirvInst) {
  4235. const auto& spirvInst = node->getSpirvInstruction();
  4236. if (spirvInst.set == "") {
  4237. std::vector<spv::IdImmediate> idImmOps;
  4238. for (unsigned int i = 0; i < glslangOperands.size(); ++i) {
  4239. if (glslangOperands[i]->getAsTyped()->getQualifier().isSpirvLiteral()) {
  4240. // Translate the constant to a literal value
  4241. std::vector<unsigned> literals;
  4242. glslang::TVector<const glslang::TIntermConstantUnion*> constants;
  4243. constants.push_back(glslangOperands[i]->getAsConstantUnion());
  4244. TranslateLiterals(constants, literals);
  4245. idImmOps.push_back({false, literals[0]});
  4246. } else
  4247. idImmOps.push_back({true, operands[i]});
  4248. }
  4249. if (node->getBasicType() == glslang::EbtVoid)
  4250. builder.createNoResultOp(static_cast<spv::Op>(spirvInst.id), idImmOps);
  4251. else
  4252. result = builder.createOp(static_cast<spv::Op>(spirvInst.id), resultType(), idImmOps);
  4253. } else {
  4254. result = builder.createBuiltinCall(
  4255. resultType(), spirvInst.set == "GLSL.std.450" ? stdBuiltins : getExtBuiltins(spirvInst.set.c_str()),
  4256. spirvInst.id, operands);
  4257. }
  4258. noReturnValue = node->getBasicType() == glslang::EbtVoid;
  4259. } else if (node->getOp() == glslang::EOpDebugPrintf) {
  4260. if (!nonSemanticDebugPrintf) {
  4261. nonSemanticDebugPrintf = builder.import("NonSemantic.DebugPrintf");
  4262. }
  4263. result = builder.createBuiltinCall(builder.makeVoidType(), nonSemanticDebugPrintf, spv::NonSemanticDebugPrintfDebugPrintf, operands);
  4264. builder.addExtension(spv::E_SPV_KHR_non_semantic_info);
  4265. } else {
  4266. // Pass through to generic operations.
  4267. switch (glslangOperands.size()) {
  4268. case 0:
  4269. result = createNoArgOperation(node->getOp(), precision, resultType());
  4270. break;
  4271. case 1:
  4272. {
  4273. OpDecorations decorations = { precision,
  4274. TranslateNoContractionDecoration(node->getType().getQualifier()),
  4275. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  4276. result = createUnaryOperation(
  4277. node->getOp(), decorations,
  4278. resultType(), operands.front(),
  4279. glslangOperands[0]->getAsTyped()->getBasicType(), lvalueCoherentFlags, node->getType());
  4280. }
  4281. break;
  4282. default:
  4283. result = createMiscOperation(node->getOp(), precision, resultType(), operands, node->getBasicType());
  4284. break;
  4285. }
  4286. if (invertedType != spv::NoResult)
  4287. result = createInvertedSwizzle(precision, *glslangOperands[0]->getAsBinaryNode(), result);
  4288. for (unsigned int i = 0; i < temporaryLvalues.size(); ++i) {
  4289. builder.setAccessChain(complexLvalues[i]);
  4290. builder.accessChainStore(builder.createLoad(temporaryLvalues[i], spv::NoPrecision),
  4291. TranslateNonUniformDecoration(complexLvalues[i].coherentFlags));
  4292. }
  4293. }
  4294. if (noReturnValue)
  4295. return false;
  4296. if (! result) {
  4297. logger->missingFunctionality("unknown glslang aggregate");
  4298. return true; // pick up a child as a placeholder operand
  4299. } else {
  4300. builder.clearAccessChain();
  4301. builder.setAccessChainRValue(result);
  4302. return false;
  4303. }
  4304. }
  4305. // This path handles both if-then-else and ?:
  4306. // The if-then-else has a node type of void, while
  4307. // ?: has either a void or a non-void node type
  4308. //
  4309. // Leaving the result, when not void:
  4310. // GLSL only has r-values as the result of a :?, but
  4311. // if we have an l-value, that can be more efficient if it will
  4312. // become the base of a complex r-value expression, because the
  4313. // next layer copies r-values into memory to use the access-chain mechanism
  4314. bool TGlslangToSpvTraverser::visitSelection(glslang::TVisit /* visit */, glslang::TIntermSelection* node)
  4315. {
  4316. // see if OpSelect can handle it
  4317. const auto isOpSelectable = [&]() {
  4318. if (node->getBasicType() == glslang::EbtVoid)
  4319. return false;
  4320. // OpSelect can do all other types starting with SPV 1.4
  4321. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_4) {
  4322. // pre-1.4, only scalars and vectors can be handled
  4323. if ((!node->getType().isScalar() && !node->getType().isVector()))
  4324. return false;
  4325. }
  4326. return true;
  4327. };
  4328. // See if it simple and safe, or required, to execute both sides.
  4329. // Crucially, side effects must be either semantically required or avoided,
  4330. // and there are performance trade-offs.
  4331. // Return true if required or a good idea (and safe) to execute both sides,
  4332. // false otherwise.
  4333. const auto bothSidesPolicy = [&]() -> bool {
  4334. // do we have both sides?
  4335. if (node->getTrueBlock() == nullptr ||
  4336. node->getFalseBlock() == nullptr)
  4337. return false;
  4338. // required? (unless we write additional code to look for side effects
  4339. // and make performance trade-offs if none are present)
  4340. if (!node->getShortCircuit())
  4341. return true;
  4342. // if not required to execute both, decide based on performance/practicality...
  4343. if (!isOpSelectable())
  4344. return false;
  4345. assert(node->getType() == node->getTrueBlock() ->getAsTyped()->getType() &&
  4346. node->getType() == node->getFalseBlock()->getAsTyped()->getType());
  4347. // return true if a single operand to ? : is okay for OpSelect
  4348. const auto operandOkay = [](glslang::TIntermTyped* node) {
  4349. return node->getAsSymbolNode() || node->getType().getQualifier().isConstant();
  4350. };
  4351. return operandOkay(node->getTrueBlock() ->getAsTyped()) &&
  4352. operandOkay(node->getFalseBlock()->getAsTyped());
  4353. };
  4354. spv::Id result = spv::NoResult; // upcoming result selecting between trueValue and falseValue
  4355. // emit the condition before doing anything with selection
  4356. node->getCondition()->traverse(this);
  4357. spv::Id condition = accessChainLoad(node->getCondition()->getType());
  4358. // Find a way of executing both sides and selecting the right result.
  4359. const auto executeBothSides = [&]() -> void {
  4360. // execute both sides
  4361. spv::Id resultType = convertGlslangToSpvType(node->getType());
  4362. node->getTrueBlock()->traverse(this);
  4363. spv::Id trueValue = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
  4364. node->getFalseBlock()->traverse(this);
  4365. spv::Id falseValue = accessChainLoad(node->getFalseBlock()->getAsTyped()->getType());
  4366. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4367. // done if void
  4368. if (node->getBasicType() == glslang::EbtVoid)
  4369. return;
  4370. // emit code to select between trueValue and falseValue
  4371. // see if OpSelect can handle the result type, and that the SPIR-V types
  4372. // of the inputs match the result type.
  4373. if (isOpSelectable()) {
  4374. // Emit OpSelect for this selection.
  4375. // smear condition to vector, if necessary (AST is always scalar)
  4376. // Before 1.4, smear like for mix(), starting with 1.4, keep it scalar
  4377. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_4 && builder.isVector(trueValue)) {
  4378. condition = builder.smearScalar(spv::NoPrecision, condition,
  4379. builder.makeVectorType(builder.makeBoolType(),
  4380. builder.getNumComponents(trueValue)));
  4381. }
  4382. // If the types do not match, it is because of mismatched decorations on aggregates.
  4383. // Since isOpSelectable only lets us get here for SPIR-V >= 1.4, we can use OpCopyObject
  4384. // to get matching types.
  4385. if (builder.getTypeId(trueValue) != resultType) {
  4386. trueValue = builder.createUnaryOp(spv::Op::OpCopyLogical, resultType, trueValue);
  4387. }
  4388. if (builder.getTypeId(falseValue) != resultType) {
  4389. falseValue = builder.createUnaryOp(spv::Op::OpCopyLogical, resultType, falseValue);
  4390. }
  4391. // OpSelect
  4392. result = builder.createTriOp(spv::Op::OpSelect, resultType, condition, trueValue, falseValue);
  4393. builder.clearAccessChain();
  4394. builder.setAccessChainRValue(result);
  4395. } else {
  4396. // We need control flow to select the result.
  4397. // TODO: Once SPIR-V OpSelect allows arbitrary types, eliminate this path.
  4398. result = builder.createVariable(TranslatePrecisionDecoration(node->getType()),
  4399. spv::StorageClass::Function, resultType);
  4400. // Selection control:
  4401. const spv::SelectionControlMask control = TranslateSelectionControl(*node);
  4402. // make an "if" based on the value created by the condition
  4403. spv::Builder::If ifBuilder(condition, control, builder);
  4404. // emit the "then" statement
  4405. builder.clearAccessChain();
  4406. builder.setAccessChainLValue(result);
  4407. multiTypeStore(node->getType(), trueValue);
  4408. ifBuilder.makeBeginElse();
  4409. // emit the "else" statement
  4410. builder.clearAccessChain();
  4411. builder.setAccessChainLValue(result);
  4412. multiTypeStore(node->getType(), falseValue);
  4413. // finish off the control flow
  4414. ifBuilder.makeEndIf();
  4415. builder.clearAccessChain();
  4416. builder.setAccessChainLValue(result);
  4417. }
  4418. };
  4419. // Execute the one side needed, as per the condition
  4420. const auto executeOneSide = [&]() {
  4421. // Always emit control flow.
  4422. if (node->getBasicType() != glslang::EbtVoid) {
  4423. result = builder.createVariable(TranslatePrecisionDecoration(node->getType()), spv::StorageClass::Function,
  4424. convertGlslangToSpvType(node->getType()));
  4425. }
  4426. // Selection control:
  4427. const spv::SelectionControlMask control = TranslateSelectionControl(*node);
  4428. // make an "if" based on the value created by the condition
  4429. spv::Builder::If ifBuilder(condition, control, builder);
  4430. // emit the "then" statement
  4431. if (node->getTrueBlock() != nullptr) {
  4432. node->getTrueBlock()->traverse(this);
  4433. if (result != spv::NoResult) {
  4434. spv::Id load = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
  4435. builder.clearAccessChain();
  4436. builder.setAccessChainLValue(result);
  4437. multiTypeStore(node->getType(), load);
  4438. }
  4439. }
  4440. if (node->getFalseBlock() != nullptr) {
  4441. ifBuilder.makeBeginElse();
  4442. // emit the "else" statement
  4443. node->getFalseBlock()->traverse(this);
  4444. if (result != spv::NoResult) {
  4445. spv::Id load = accessChainLoad(node->getFalseBlock()->getAsTyped()->getType());
  4446. builder.clearAccessChain();
  4447. builder.setAccessChainLValue(result);
  4448. multiTypeStore(node->getType(), load);
  4449. }
  4450. }
  4451. // finish off the control flow
  4452. ifBuilder.makeEndIf();
  4453. if (result != spv::NoResult) {
  4454. builder.clearAccessChain();
  4455. builder.setAccessChainLValue(result);
  4456. }
  4457. };
  4458. // Try for OpSelect (or a requirement to execute both sides)
  4459. if (bothSidesPolicy()) {
  4460. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  4461. if (node->getType().getQualifier().isSpecConstant())
  4462. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  4463. executeBothSides();
  4464. } else
  4465. executeOneSide();
  4466. return false;
  4467. }
  4468. bool TGlslangToSpvTraverser::visitSwitch(glslang::TVisit /* visit */, glslang::TIntermSwitch* node)
  4469. {
  4470. // emit and get the condition before doing anything with switch
  4471. node->getCondition()->traverse(this);
  4472. spv::Id selector = accessChainLoad(node->getCondition()->getAsTyped()->getType());
  4473. // Selection control:
  4474. const spv::SelectionControlMask control = TranslateSwitchControl(*node);
  4475. // browse the children to sort out code segments
  4476. int defaultSegment = -1;
  4477. std::vector<TIntermNode*> codeSegments;
  4478. glslang::TIntermSequence& sequence = node->getBody()->getSequence();
  4479. std::vector<int> caseValues;
  4480. std::vector<int> valueIndexToSegment(sequence.size()); // note: probably not all are used, it is an overestimate
  4481. for (glslang::TIntermSequence::iterator c = sequence.begin(); c != sequence.end(); ++c) {
  4482. TIntermNode* child = *c;
  4483. if (child->getAsBranchNode() && child->getAsBranchNode()->getFlowOp() == glslang::EOpDefault)
  4484. defaultSegment = (int)codeSegments.size();
  4485. else if (child->getAsBranchNode() && child->getAsBranchNode()->getFlowOp() == glslang::EOpCase) {
  4486. valueIndexToSegment[caseValues.size()] = (int)codeSegments.size();
  4487. caseValues.push_back(child->getAsBranchNode()->getExpression()->getAsConstantUnion()
  4488. ->getConstArray()[0].getIConst());
  4489. } else
  4490. codeSegments.push_back(child);
  4491. }
  4492. // handle the case where the last code segment is missing, due to no code
  4493. // statements between the last case and the end of the switch statement
  4494. if ((caseValues.size() && (int)codeSegments.size() == valueIndexToSegment[caseValues.size() - 1]) ||
  4495. (int)codeSegments.size() == defaultSegment)
  4496. codeSegments.push_back(nullptr);
  4497. // make the switch statement
  4498. std::vector<spv::Block*> segmentBlocks; // returned, as the blocks allocated in the call
  4499. builder.makeSwitch(selector, control, (int)codeSegments.size(), caseValues, valueIndexToSegment, defaultSegment,
  4500. segmentBlocks);
  4501. // emit all the code in the segments
  4502. breakForLoop.push(false);
  4503. for (unsigned int s = 0; s < codeSegments.size(); ++s) {
  4504. builder.nextSwitchSegment(segmentBlocks, s);
  4505. if (codeSegments[s])
  4506. codeSegments[s]->traverse(this);
  4507. else
  4508. builder.addSwitchBreak(true);
  4509. }
  4510. breakForLoop.pop();
  4511. builder.endSwitch(segmentBlocks);
  4512. return false;
  4513. }
  4514. void TGlslangToSpvTraverser::visitConstantUnion(glslang::TIntermConstantUnion* node)
  4515. {
  4516. if (node->getQualifier().isSpirvLiteral())
  4517. return; // Translated to a literal value, skip further processing
  4518. int nextConst = 0;
  4519. spv::Id constant = createSpvConstantFromConstUnionArray(node->getType(), node->getConstArray(), nextConst, false);
  4520. builder.clearAccessChain();
  4521. builder.setAccessChainRValue(constant);
  4522. }
  4523. bool TGlslangToSpvTraverser::visitLoop(glslang::TVisit /* visit */, glslang::TIntermLoop* node)
  4524. {
  4525. auto blocks = builder.makeNewLoop();
  4526. builder.createBranch(true, &blocks.head);
  4527. // Loop control:
  4528. std::vector<unsigned int> operands;
  4529. const spv::LoopControlMask control = TranslateLoopControl(*node, operands);
  4530. // Spec requires back edges to target header blocks, and every header block
  4531. // must dominate its merge block. Make a header block first to ensure these
  4532. // conditions are met. By definition, it will contain OpLoopMerge, followed
  4533. // by a block-ending branch. But we don't want to put any other body/test
  4534. // instructions in it, since the body/test may have arbitrary instructions,
  4535. // including merges of its own.
  4536. builder.setBuildPoint(&blocks.head);
  4537. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4538. builder.createLoopMerge(&blocks.merge, &blocks.continue_target, control, operands);
  4539. if (node->testFirst() && node->getTest()) {
  4540. spv::Block& test = builder.makeNewBlock();
  4541. builder.createBranch(true, &test);
  4542. builder.setBuildPoint(&test);
  4543. node->getTest()->traverse(this);
  4544. spv::Id condition = accessChainLoad(node->getTestExpr()->getType());
  4545. builder.createConditionalBranch(condition, &blocks.body, &blocks.merge);
  4546. builder.setBuildPoint(&blocks.body);
  4547. breakForLoop.push(true);
  4548. if (node->getBody())
  4549. node->getBody()->traverse(this);
  4550. builder.createBranch(true, &blocks.continue_target);
  4551. breakForLoop.pop();
  4552. builder.setBuildPoint(&blocks.continue_target);
  4553. if (node->getTerminal())
  4554. node->getTerminal()->traverse(this);
  4555. builder.createBranch(true, &blocks.head);
  4556. } else {
  4557. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4558. builder.createBranch(true, &blocks.body);
  4559. breakForLoop.push(true);
  4560. builder.setBuildPoint(&blocks.body);
  4561. if (node->getBody())
  4562. node->getBody()->traverse(this);
  4563. builder.createBranch(true, &blocks.continue_target);
  4564. breakForLoop.pop();
  4565. builder.setBuildPoint(&blocks.continue_target);
  4566. if (node->getTerminal())
  4567. node->getTerminal()->traverse(this);
  4568. if (node->getTest()) {
  4569. node->getTest()->traverse(this);
  4570. spv::Id condition =
  4571. accessChainLoad(node->getTestExpr()->getType());
  4572. builder.createConditionalBranch(condition, &blocks.head, &blocks.merge);
  4573. } else {
  4574. // TODO: unless there was a break/return/discard instruction
  4575. // somewhere in the body, this is an infinite loop, so we should
  4576. // issue a warning.
  4577. builder.createBranch(true, &blocks.head);
  4578. }
  4579. }
  4580. builder.setBuildPoint(&blocks.merge);
  4581. builder.closeLoop();
  4582. return false;
  4583. }
  4584. bool TGlslangToSpvTraverser::visitBranch(glslang::TVisit /* visit */, glslang::TIntermBranch* node)
  4585. {
  4586. if (node->getExpression())
  4587. node->getExpression()->traverse(this);
  4588. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  4589. switch (node->getFlowOp()) {
  4590. case glslang::EOpKill:
  4591. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  4592. builder.addCapability(spv::Capability::DemoteToHelperInvocation);
  4593. builder.createNoResultOp(spv::Op::OpDemoteToHelperInvocationEXT);
  4594. } else {
  4595. builder.makeStatementTerminator(spv::Op::OpKill, "post-discard");
  4596. }
  4597. break;
  4598. case glslang::EOpTerminateInvocation:
  4599. builder.addExtension(spv::E_SPV_KHR_terminate_invocation);
  4600. builder.makeStatementTerminator(spv::Op::OpTerminateInvocation, "post-terminate-invocation");
  4601. break;
  4602. case glslang::EOpBreak:
  4603. if (breakForLoop.top())
  4604. builder.createLoopExit();
  4605. else
  4606. builder.addSwitchBreak(false);
  4607. break;
  4608. case glslang::EOpContinue:
  4609. builder.createLoopContinue();
  4610. break;
  4611. case glslang::EOpReturn:
  4612. if (node->getExpression() != nullptr) {
  4613. const glslang::TType& glslangReturnType = node->getExpression()->getType();
  4614. spv::Id returnId = accessChainLoad(glslangReturnType);
  4615. if (builder.getTypeId(returnId) != currentFunction->getReturnType() ||
  4616. TranslatePrecisionDecoration(glslangReturnType) != currentFunction->getReturnPrecision()) {
  4617. builder.clearAccessChain();
  4618. spv::Id copyId = builder.createVariable(currentFunction->getReturnPrecision(),
  4619. spv::StorageClass::Function, currentFunction->getReturnType());
  4620. builder.setAccessChainLValue(copyId);
  4621. multiTypeStore(glslangReturnType, returnId);
  4622. returnId = builder.createLoad(copyId, currentFunction->getReturnPrecision());
  4623. }
  4624. builder.makeReturn(false, returnId);
  4625. } else
  4626. builder.makeReturn(false);
  4627. builder.clearAccessChain();
  4628. break;
  4629. case glslang::EOpDemote:
  4630. builder.createNoResultOp(spv::Op::OpDemoteToHelperInvocationEXT);
  4631. builder.addExtension(spv::E_SPV_EXT_demote_to_helper_invocation);
  4632. builder.addCapability(spv::Capability::DemoteToHelperInvocationEXT);
  4633. break;
  4634. case glslang::EOpTerminateRayKHR:
  4635. builder.makeStatementTerminator(spv::Op::OpTerminateRayKHR, "post-terminateRayKHR");
  4636. break;
  4637. case glslang::EOpIgnoreIntersectionKHR:
  4638. builder.makeStatementTerminator(spv::Op::OpIgnoreIntersectionKHR, "post-ignoreIntersectionKHR");
  4639. break;
  4640. default:
  4641. assert(0);
  4642. break;
  4643. }
  4644. return false;
  4645. }
  4646. bool TGlslangToSpvTraverser::visitVariableDecl(glslang::TVisit visit, glslang::TIntermVariableDecl* node)
  4647. {
  4648. if (visit == glslang::EvPreVisit) {
  4649. builder.setDebugSourceLocation(node->getDeclSymbol()->getLoc().line, node->getDeclSymbol()->getLoc().getFilename());
  4650. // We touch the symbol once here to create the debug info.
  4651. getSymbolId(node->getDeclSymbol());
  4652. }
  4653. return true;
  4654. }
  4655. spv::Id TGlslangToSpvTraverser::createSpvVariable(const glslang::TIntermSymbol* node, spv::Id forcedType)
  4656. {
  4657. // First, steer off constants, which are not SPIR-V variables, but
  4658. // can still have a mapping to a SPIR-V Id.
  4659. // This includes specialization constants.
  4660. if (node->getQualifier().isConstant()) {
  4661. spv::Id result = createSpvConstant(*node);
  4662. if (result != spv::NoResult) {
  4663. auto name = node->getAsSymbolNode()->getAccessName().c_str();
  4664. auto typeId = convertGlslangToSpvType(node->getType());
  4665. builder.createConstVariable(typeId, name, result, currentFunction == nullptr);
  4666. return result;
  4667. }
  4668. }
  4669. // Now, handle actual variables
  4670. spv::StorageClass storageClass = TranslateStorageClass(node->getType());
  4671. spv::Id spvType = forcedType == spv::NoType ? convertGlslangToSpvType(node->getType())
  4672. : forcedType;
  4673. const bool contains16BitType = node->getType().contains16BitFloat() ||
  4674. node->getType().contains16BitInt();
  4675. if (contains16BitType) {
  4676. switch (storageClass) {
  4677. case spv::StorageClass::Input:
  4678. case spv::StorageClass::Output:
  4679. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4680. builder.addCapability(spv::Capability::StorageInputOutput16);
  4681. break;
  4682. case spv::StorageClass::Uniform:
  4683. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4684. if (node->getType().getQualifier().storage == glslang::EvqBuffer)
  4685. builder.addCapability(spv::Capability::StorageUniformBufferBlock16);
  4686. else
  4687. builder.addCapability(spv::Capability::StorageUniform16);
  4688. break;
  4689. case spv::StorageClass::PushConstant:
  4690. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4691. builder.addCapability(spv::Capability::StoragePushConstant16);
  4692. break;
  4693. case spv::StorageClass::StorageBuffer:
  4694. case spv::StorageClass::PhysicalStorageBufferEXT:
  4695. builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
  4696. builder.addCapability(spv::Capability::StorageUniformBufferBlock16);
  4697. break;
  4698. case spv::StorageClass::TileAttachmentQCOM:
  4699. builder.addCapability(spv::Capability::TileShadingQCOM);
  4700. break;
  4701. default:
  4702. if (storageClass == spv::StorageClass::Workgroup &&
  4703. node->getType().getBasicType() == glslang::EbtBlock) {
  4704. builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayout16BitAccessKHR);
  4705. break;
  4706. }
  4707. if (node->getType().contains16BitFloat())
  4708. builder.addCapability(spv::Capability::Float16);
  4709. if (node->getType().contains16BitInt())
  4710. builder.addCapability(spv::Capability::Int16);
  4711. break;
  4712. }
  4713. }
  4714. if (node->getType().contains8BitInt()) {
  4715. if (storageClass == spv::StorageClass::PushConstant) {
  4716. builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
  4717. builder.addCapability(spv::Capability::StoragePushConstant8);
  4718. } else if (storageClass == spv::StorageClass::Uniform) {
  4719. builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
  4720. builder.addCapability(spv::Capability::UniformAndStorageBuffer8BitAccess);
  4721. } else if (storageClass == spv::StorageClass::StorageBuffer) {
  4722. builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
  4723. builder.addCapability(spv::Capability::StorageBuffer8BitAccess);
  4724. } else if (storageClass == spv::StorageClass::Workgroup &&
  4725. node->getType().getBasicType() == glslang::EbtBlock) {
  4726. builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayout8BitAccessKHR);
  4727. } else {
  4728. builder.addCapability(spv::Capability::Int8);
  4729. }
  4730. }
  4731. const char* name = node->getName().c_str();
  4732. if (glslang::IsAnonymous(name))
  4733. name = "";
  4734. spv::Id initializer = spv::NoResult;
  4735. if (node->getType().getQualifier().storage == glslang::EvqUniform && !node->getConstArray().empty()) {
  4736. int nextConst = 0;
  4737. initializer = createSpvConstantFromConstUnionArray(node->getType(),
  4738. node->getConstArray(),
  4739. nextConst,
  4740. false /* specConst */);
  4741. } else if (node->getType().getQualifier().isNullInit()) {
  4742. initializer = builder.makeNullConstant(spvType);
  4743. }
  4744. spv::Id var = builder.createVariable(spv::NoPrecision, storageClass, spvType, name, initializer, false);
  4745. if (options.emitNonSemanticShaderDebugInfo && storageClass != spv::StorageClass::Function) {
  4746. // Create variable alias for retargeted symbols if any.
  4747. // Notably, this is only applicable to built-in variables so that it is okay to only use name as the key.
  4748. auto [itBegin, itEnd] = glslangIntermediate->getBuiltinAliasLookup().equal_range(name);
  4749. for (auto it = itBegin; it != itEnd; ++it) {
  4750. builder.createDebugGlobalVariable(builder.getDebugType(spvType), it->second.c_str(), var);
  4751. }
  4752. }
  4753. std::vector<spv::Decoration> topLevelDecorations;
  4754. glslang::TQualifier typeQualifier = node->getType().getQualifier();
  4755. TranslateMemoryDecoration(typeQualifier, topLevelDecorations, glslangIntermediate->usingVulkanMemoryModel());
  4756. for (auto deco : topLevelDecorations) {
  4757. builder.addDecoration(var, deco);
  4758. }
  4759. return var;
  4760. }
  4761. // Return type Id of the sampled type.
  4762. spv::Id TGlslangToSpvTraverser::getSampledType(const glslang::TSampler& sampler)
  4763. {
  4764. switch (sampler.type) {
  4765. case glslang::EbtInt: return builder.makeIntType(32);
  4766. case glslang::EbtUint: return builder.makeUintType(32);
  4767. case glslang::EbtFloat: return builder.makeFloatType(32);
  4768. case glslang::EbtFloat16:
  4769. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float_fetch);
  4770. builder.addCapability(spv::Capability::Float16ImageAMD);
  4771. return builder.makeFloatType(16);
  4772. case glslang::EbtInt64:
  4773. builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
  4774. builder.addCapability(spv::Capability::Int64ImageEXT);
  4775. return builder.makeIntType(64);
  4776. case glslang::EbtUint64:
  4777. builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
  4778. builder.addCapability(spv::Capability::Int64ImageEXT);
  4779. return builder.makeUintType(64);
  4780. default:
  4781. assert(0);
  4782. return builder.makeFloatType(32);
  4783. }
  4784. }
  4785. // If node is a swizzle operation, return the type that should be used if
  4786. // the swizzle base is first consumed by another operation, before the swizzle
  4787. // is applied.
  4788. spv::Id TGlslangToSpvTraverser::getInvertedSwizzleType(const glslang::TIntermTyped& node)
  4789. {
  4790. if (node.getAsOperator() &&
  4791. node.getAsOperator()->getOp() == glslang::EOpVectorSwizzle)
  4792. return convertGlslangToSpvType(node.getAsBinaryNode()->getLeft()->getType());
  4793. else
  4794. return spv::NoType;
  4795. }
  4796. // When inverting a swizzle with a parent op, this function
  4797. // will apply the swizzle operation to a completed parent operation.
  4798. spv::Id TGlslangToSpvTraverser::createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped& node,
  4799. spv::Id parentResult)
  4800. {
  4801. std::vector<unsigned> swizzle;
  4802. convertSwizzle(*node.getAsBinaryNode()->getRight()->getAsAggregate(), swizzle);
  4803. return builder.createRvalueSwizzle(precision, convertGlslangToSpvType(node.getType()), parentResult, swizzle);
  4804. }
  4805. // Convert a glslang AST swizzle node to a swizzle vector for building SPIR-V.
  4806. void TGlslangToSpvTraverser::convertSwizzle(const glslang::TIntermAggregate& node, std::vector<unsigned>& swizzle)
  4807. {
  4808. const glslang::TIntermSequence& swizzleSequence = node.getSequence();
  4809. for (int i = 0; i < (int)swizzleSequence.size(); ++i)
  4810. swizzle.push_back(swizzleSequence[i]->getAsConstantUnion()->getConstArray()[0].getIConst());
  4811. }
  4812. // Convert from a glslang type to an SPV type, by calling into a
  4813. // recursive version of this function. This establishes the inherited
  4814. // layout state rooted from the top-level type.
  4815. spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly)
  4816. {
  4817. return convertGlslangToSpvType(type, getExplicitLayout(type), type.getQualifier(), false, forwardReferenceOnly);
  4818. }
  4819. spv::LinkageType TGlslangToSpvTraverser::convertGlslangLinkageToSpv(glslang::TLinkType linkType)
  4820. {
  4821. switch (linkType) {
  4822. case glslang::ELinkExport:
  4823. return spv::LinkageType::Export;
  4824. default:
  4825. return spv::LinkageType::Max;
  4826. }
  4827. }
  4828. // Do full recursive conversion of an arbitrary glslang type to a SPIR-V Id.
  4829. // explicitLayout can be kept the same throughout the hierarchical recursive walk.
  4830. // Mutually recursive with convertGlslangStructToSpvType().
  4831. spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type,
  4832. glslang::TLayoutPacking explicitLayout, const glslang::TQualifier& qualifier,
  4833. bool lastBufferBlockMember, bool forwardReferenceOnly)
  4834. {
  4835. spv::Id spvType = spv::NoResult;
  4836. switch (type.getBasicType()) {
  4837. case glslang::EbtVoid:
  4838. spvType = builder.makeVoidType();
  4839. assert (! type.isArray());
  4840. break;
  4841. case glslang::EbtBool:
  4842. // "transparent" bool doesn't exist in SPIR-V. The GLSL convention is
  4843. // a 32-bit int where non-0 means true.
  4844. if (explicitLayout != glslang::ElpNone)
  4845. spvType = builder.makeUintType(32);
  4846. else
  4847. spvType = builder.makeBoolType();
  4848. break;
  4849. case glslang::EbtInt:
  4850. spvType = builder.makeIntType(32);
  4851. break;
  4852. case glslang::EbtUint:
  4853. spvType = builder.makeUintType(32);
  4854. break;
  4855. case glslang::EbtFloat:
  4856. spvType = builder.makeFloatType(32);
  4857. break;
  4858. case glslang::EbtDouble:
  4859. spvType = builder.makeFloatType(64);
  4860. break;
  4861. case glslang::EbtFloat16:
  4862. spvType = builder.makeFloatType(16);
  4863. break;
  4864. case glslang::EbtBFloat16:
  4865. spvType = builder.makeBFloat16Type();
  4866. break;
  4867. case glslang::EbtFloatE5M2:
  4868. spvType = builder.makeFloatE5M2Type();
  4869. break;
  4870. case glslang::EbtFloatE4M3:
  4871. spvType = builder.makeFloatE4M3Type();
  4872. break;
  4873. case glslang::EbtInt8:
  4874. spvType = builder.makeIntType(8);
  4875. break;
  4876. case glslang::EbtUint8:
  4877. spvType = builder.makeUintType(8);
  4878. break;
  4879. case glslang::EbtInt16:
  4880. spvType = builder.makeIntType(16);
  4881. break;
  4882. case glslang::EbtUint16:
  4883. spvType = builder.makeUintType(16);
  4884. break;
  4885. case glslang::EbtInt64:
  4886. spvType = builder.makeIntType(64);
  4887. break;
  4888. case glslang::EbtUint64:
  4889. spvType = builder.makeUintType(64);
  4890. break;
  4891. case glslang::EbtAtomicUint:
  4892. builder.addCapability(spv::Capability::AtomicStorage);
  4893. spvType = builder.makeUintType(32);
  4894. break;
  4895. case glslang::EbtAccStruct:
  4896. switch (glslangIntermediate->getStage()) {
  4897. case EShLangRayGen:
  4898. case EShLangIntersect:
  4899. case EShLangAnyHit:
  4900. case EShLangClosestHit:
  4901. case EShLangMiss:
  4902. case EShLangCallable:
  4903. // these all should have the RayTracingNV/KHR capability already
  4904. break;
  4905. default:
  4906. {
  4907. auto& extensions = glslangIntermediate->getRequestedExtensions();
  4908. if (extensions.find("GL_EXT_ray_query") != extensions.end()) {
  4909. builder.addExtension(spv::E_SPV_KHR_ray_query);
  4910. builder.addCapability(spv::Capability::RayQueryKHR);
  4911. }
  4912. }
  4913. break;
  4914. }
  4915. spvType = builder.makeAccelerationStructureType();
  4916. break;
  4917. case glslang::EbtRayQuery:
  4918. {
  4919. auto& extensions = glslangIntermediate->getRequestedExtensions();
  4920. if (extensions.find("GL_EXT_ray_query") != extensions.end()) {
  4921. builder.addExtension(spv::E_SPV_KHR_ray_query);
  4922. builder.addCapability(spv::Capability::RayQueryKHR);
  4923. }
  4924. spvType = builder.makeRayQueryType();
  4925. }
  4926. break;
  4927. case glslang::EbtReference:
  4928. {
  4929. // Make the forward pointer, then recurse to convert the structure type, then
  4930. // patch up the forward pointer with a real pointer type.
  4931. if (forwardPointers.find(type.getReferentType()) == forwardPointers.end()) {
  4932. spv::Id forwardId = builder.makeForwardPointer(spv::StorageClass::PhysicalStorageBufferEXT);
  4933. forwardPointers[type.getReferentType()] = forwardId;
  4934. }
  4935. spvType = forwardPointers[type.getReferentType()];
  4936. if (!forwardReferenceOnly) {
  4937. spv::Id referentType = convertGlslangToSpvType(*type.getReferentType());
  4938. builder.makePointerFromForwardPointer(spv::StorageClass::PhysicalStorageBufferEXT,
  4939. forwardPointers[type.getReferentType()],
  4940. referentType);
  4941. }
  4942. }
  4943. break;
  4944. case glslang::EbtSampler:
  4945. {
  4946. const glslang::TSampler& sampler = type.getSampler();
  4947. std::string debugName;
  4948. if (sampler.isPureSampler()) {
  4949. if (options.emitNonSemanticShaderDebugInfo) {
  4950. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
  4951. debugName = sampler.getString();
  4952. }
  4953. else {
  4954. debugName = "type.sampler";
  4955. }
  4956. }
  4957. spvType = builder.makeSamplerType(debugName.c_str());
  4958. } else {
  4959. // an image is present, make its type
  4960. if (options.emitNonSemanticShaderDebugInfo) {
  4961. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
  4962. debugName = sampler.removeCombined().getString();
  4963. }
  4964. else {
  4965. switch (sampler.dim) {
  4966. case glslang::Esd1D: debugName = "type.1d.image"; break;
  4967. case glslang::Esd2D: debugName = "type.2d.image"; break;
  4968. case glslang::Esd3D: debugName = "type.3d.image"; break;
  4969. case glslang::EsdCube: debugName = "type.cube.image"; break;
  4970. default: debugName = "type.image"; break;
  4971. }
  4972. }
  4973. }
  4974. spvType = builder.makeImageType(getSampledType(sampler), TranslateDimensionality(sampler),
  4975. sampler.isShadow(), sampler.isArrayed(), sampler.isMultiSample(),
  4976. sampler.isImageClass() ? 2 : 1, TranslateImageFormat(type), debugName.c_str());
  4977. if (sampler.isCombined() &&
  4978. (!sampler.isBuffer() || glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_6)) {
  4979. // Already has both image and sampler, make the combined type. Only combine sampler to
  4980. // buffer if before SPIR-V 1.6.
  4981. if (options.emitNonSemanticShaderDebugInfo) {
  4982. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
  4983. debugName = sampler.getString();
  4984. }
  4985. else {
  4986. debugName = "type.sampled.image";
  4987. }
  4988. }
  4989. spvType = builder.makeSampledImageType(spvType, debugName.c_str());
  4990. }
  4991. }
  4992. }
  4993. break;
  4994. case glslang::EbtStruct:
  4995. case glslang::EbtBlock:
  4996. {
  4997. // If it's an inner declared heap buffer or uniform block, using OpTypeBufferEXT
  4998. // to convert it to an untyped type.
  4999. if (type.getQualifier().isUniformOrBuffer() &&
  5000. type.getQualifier().layoutDescriptorHeap && type.getQualifier().layoutDescriptorInnerBlock) {
  5001. spvType = builder.makeUntypedPointer(TranslateStorageClass(type), true);
  5002. break;
  5003. }
  5004. // If we've seen this struct type, return it
  5005. const glslang::TTypeList* glslangMembers = type.getStruct();
  5006. // Try to share structs for different layouts, but not yet for other
  5007. // kinds of qualification (primarily not yet including interpolant qualification).
  5008. if (! HasNonLayoutQualifiers(type, qualifier))
  5009. spvType = structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers];
  5010. if (spvType != spv::NoResult)
  5011. break;
  5012. // else, we haven't seen it...
  5013. if (type.getBasicType() == glslang::EbtBlock)
  5014. memberRemapper[glslangTypeToIdMap[glslangMembers]].resize(glslangMembers->size());
  5015. spvType = convertGlslangStructToSpvType(type, glslangMembers, explicitLayout, qualifier);
  5016. }
  5017. break;
  5018. case glslang::EbtString:
  5019. // no type used for OpString
  5020. return 0;
  5021. case glslang::EbtHitObjectNV: {
  5022. builder.addExtension(spv::E_SPV_NV_shader_invocation_reorder);
  5023. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  5024. spvType = builder.makeHitObjectNVType();
  5025. }
  5026. break;
  5027. case glslang::EbtHitObjectEXT: {
  5028. builder.addExtension(spv::E_SPV_EXT_shader_invocation_reorder);
  5029. builder.addCapability(spv::Capability::ShaderInvocationReorderEXT);
  5030. spvType = builder.makeHitObjectEXTType();
  5031. }
  5032. break;
  5033. case glslang::EbtSpirvType: {
  5034. // GL_EXT_spirv_intrinsics
  5035. const auto& spirvType = type.getSpirvType();
  5036. const auto& spirvInst = spirvType.spirvInst;
  5037. std::vector<spv::IdImmediate> operands;
  5038. for (const auto& typeParam : spirvType.typeParams) {
  5039. if (typeParam.getAsConstant() != nullptr) {
  5040. // Constant expression
  5041. auto constant = typeParam.getAsConstant();
  5042. if (constant->isLiteral()) {
  5043. if (constant->getBasicType() == glslang::EbtFloat) {
  5044. float floatValue = static_cast<float>(constant->getConstArray()[0].getDConst());
  5045. unsigned literal;
  5046. static_assert(sizeof(literal) == sizeof(floatValue), "sizeof(unsigned) != sizeof(float)");
  5047. memcpy(&literal, &floatValue, sizeof(literal));
  5048. operands.push_back({false, literal});
  5049. } else if (constant->getBasicType() == glslang::EbtInt) {
  5050. unsigned literal = constant->getConstArray()[0].getIConst();
  5051. operands.push_back({false, literal});
  5052. } else if (constant->getBasicType() == glslang::EbtUint) {
  5053. unsigned literal = constant->getConstArray()[0].getUConst();
  5054. operands.push_back({false, literal});
  5055. } else if (constant->getBasicType() == glslang::EbtBool) {
  5056. unsigned literal = constant->getConstArray()[0].getBConst();
  5057. operands.push_back({false, literal});
  5058. } else if (constant->getBasicType() == glslang::EbtString) {
  5059. auto str = constant->getConstArray()[0].getSConst()->c_str();
  5060. unsigned literal = 0;
  5061. char* literalPtr = reinterpret_cast<char*>(&literal);
  5062. unsigned charCount = 0;
  5063. char ch = 0;
  5064. do {
  5065. ch = *(str++);
  5066. *(literalPtr++) = ch;
  5067. ++charCount;
  5068. if (charCount == 4) {
  5069. operands.push_back({false, literal});
  5070. literalPtr = reinterpret_cast<char*>(&literal);
  5071. charCount = 0;
  5072. }
  5073. } while (ch != 0);
  5074. // Partial literal is padded with 0
  5075. if (charCount > 0) {
  5076. for (; charCount < 4; ++charCount)
  5077. *(literalPtr++) = 0;
  5078. operands.push_back({false, literal});
  5079. }
  5080. } else
  5081. assert(0); // Unexpected type
  5082. } else
  5083. operands.push_back({true, createSpvConstant(*constant)});
  5084. } else {
  5085. // Type specifier
  5086. assert(typeParam.getAsType() != nullptr);
  5087. operands.push_back({true, convertGlslangToSpvType(*typeParam.getAsType())});
  5088. }
  5089. }
  5090. assert(spirvInst.set == ""); // Currently, couldn't be extended instructions.
  5091. spvType = builder.makeGenericType(static_cast<spv::Op>(spirvInst.id), operands);
  5092. break;
  5093. }
  5094. case glslang::EbtTensorLayoutNV:
  5095. {
  5096. builder.addCapability(spv::Capability::TensorAddressingNV);
  5097. builder.addExtension(spv::E_SPV_NV_tensor_addressing);
  5098. std::vector<spv::IdImmediate> operands;
  5099. for (uint32_t i = 0; i < 2; ++i) {
  5100. operands.push_back({true, makeArraySizeId(*type.getTypeParameters()->arraySizes, i, true)});
  5101. }
  5102. spvType = builder.makeGenericType(spv::Op::OpTypeTensorLayoutNV, operands);
  5103. break;
  5104. }
  5105. case glslang::EbtTensorViewNV:
  5106. {
  5107. builder.addCapability(spv::Capability::TensorAddressingNV);
  5108. builder.addExtension(spv::E_SPV_NV_tensor_addressing);
  5109. uint32_t dim = type.getTypeParameters()->arraySizes->getDimSize(0);
  5110. assert(dim >= 1 && dim <= 5);
  5111. std::vector<spv::IdImmediate> operands;
  5112. for (uint32_t i = 0; i < dim + 2; ++i) {
  5113. operands.push_back({true, makeArraySizeId(*type.getTypeParameters()->arraySizes, i, true, i==1)});
  5114. }
  5115. spvType = builder.makeGenericType(spv::Op::OpTypeTensorViewNV, operands);
  5116. break;
  5117. }
  5118. default:
  5119. assert(0);
  5120. break;
  5121. }
  5122. if (type.isMatrix())
  5123. spvType = builder.makeMatrixType(spvType, type.getMatrixCols(), type.getMatrixRows());
  5124. else {
  5125. // If this variable has a vector element count greater than 1, create a SPIR-V vector
  5126. if (type.getVectorSize() > 1)
  5127. spvType = builder.makeVectorType(spvType, type.getVectorSize());
  5128. }
  5129. if (type.isCoopMatNV()) {
  5130. builder.addCapability(spv::Capability::CooperativeMatrixNV);
  5131. builder.addExtension(spv::E_SPV_NV_cooperative_matrix);
  5132. if (type.getBasicType() == glslang::EbtFloat16)
  5133. builder.addCapability(spv::Capability::Float16);
  5134. if (type.getBasicType() == glslang::EbtUint8 ||
  5135. type.getBasicType() == glslang::EbtInt8) {
  5136. builder.addCapability(spv::Capability::Int8);
  5137. }
  5138. spv::Id scope = makeArraySizeId(*type.getTypeParameters()->arraySizes, 1);
  5139. spv::Id rows = makeArraySizeId(*type.getTypeParameters()->arraySizes, 2);
  5140. spv::Id cols = makeArraySizeId(*type.getTypeParameters()->arraySizes, 3);
  5141. spvType = builder.makeCooperativeMatrixTypeNV(spvType, scope, rows, cols);
  5142. }
  5143. if (type.isCoopMatKHR()) {
  5144. builder.addCapability(spv::Capability::CooperativeMatrixKHR);
  5145. builder.addExtension(spv::E_SPV_KHR_cooperative_matrix);
  5146. if (type.getBasicType() == glslang::EbtBFloat16) {
  5147. builder.addExtension(spv::E_SPV_KHR_bfloat16);
  5148. builder.addCapability(spv::Capability::BFloat16CooperativeMatrixKHR);
  5149. }
  5150. if (type.getBasicType() == glslang::EbtFloatE5M2 || type.getBasicType() == glslang::EbtFloatE4M3) {
  5151. builder.addExtension(spv::E_SPV_EXT_float8);
  5152. builder.addCapability(spv::Capability::Float8CooperativeMatrixEXT);
  5153. }
  5154. if (type.getBasicType() == glslang::EbtFloat16)
  5155. builder.addCapability(spv::Capability::Float16);
  5156. if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == glslang::EbtInt8) {
  5157. builder.addCapability(spv::Capability::Int8);
  5158. }
  5159. spv::Id scope = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  5160. spv::Id rows = makeArraySizeId(*type.getTypeParameters()->arraySizes, 1);
  5161. spv::Id cols = makeArraySizeId(*type.getTypeParameters()->arraySizes, 2);
  5162. spv::Id use = makeArraySizeId(*type.getTypeParameters()->arraySizes, 3, true);
  5163. spvType = builder.makeCooperativeMatrixTypeKHR(spvType, scope, rows, cols, use);
  5164. }
  5165. else if (type.isTensorARM()) {
  5166. builder.addCapability(spv::Capability::TensorsARM);
  5167. builder.addExtension(spv::E_SPV_ARM_tensors);
  5168. if (type.getBasicType() == glslang::EbtInt8 || type.getBasicType() == glslang::EbtUint8) {
  5169. builder.addCapability(spv::Capability::Int8);
  5170. } else if (type.getBasicType() == glslang::EbtInt16 ||
  5171. type.getBasicType() == glslang::EbtUint16) {
  5172. builder.addCapability(spv::Capability::Int16);
  5173. } else if (type.getBasicType() == glslang::EbtInt64 ||
  5174. type.getBasicType() == glslang::EbtUint64) {
  5175. builder.addCapability(spv::Capability::Int64);
  5176. } else if (type.getBasicType() == glslang::EbtFloat16) {
  5177. builder.addCapability(spv::Capability::Float16);
  5178. }
  5179. spv::Id rank = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  5180. spvType = builder.makeTensorTypeARM(spvType, rank);
  5181. }
  5182. if (type.isCoopVecNV()) {
  5183. builder.addCapability(spv::Capability::CooperativeVectorNV);
  5184. builder.addExtension(spv::E_SPV_NV_cooperative_vector);
  5185. if (type.getBasicType() == glslang::EbtFloat16)
  5186. builder.addCapability(spv::Capability::Float16);
  5187. if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == glslang::EbtInt8) {
  5188. builder.addCapability(spv::Capability::Int8);
  5189. }
  5190. spv::Id components = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  5191. spvType = builder.makeCooperativeVectorTypeNV(spvType, components);
  5192. }
  5193. if (type.isLongVector()) {
  5194. builder.addCapability(spv::Capability::LongVectorEXT);
  5195. builder.addExtension(spv::E_SPV_EXT_long_vector);
  5196. if (type.getBasicType() == glslang::EbtFloat16)
  5197. builder.addCapability(spv::Capability::Float16);
  5198. if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == glslang::EbtInt8) {
  5199. builder.addCapability(spv::Capability::Int8);
  5200. }
  5201. if (type.hasSpecConstantVectorComponents()) {
  5202. spv::Id components = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
  5203. spvType = builder.makeCooperativeVectorTypeNV(spvType, components);
  5204. } else {
  5205. spvType = builder.makeVectorType(spvType, type.getTypeParameters()->arraySizes->getDimSize(0));
  5206. }
  5207. }
  5208. if (type.isArray()) {
  5209. int stride = 0; // keep this 0 unless doing an explicit layout; 0 will mean no decoration, no stride
  5210. // Do all but the outer dimension
  5211. if (type.getArraySizes()->getNumDims() > 1) {
  5212. // We need to decorate array strides for types needing explicit layout, except blocks.
  5213. if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock) {
  5214. // Use a dummy glslang type for querying internal strides of
  5215. // arrays of arrays, but using just a one-dimensional array.
  5216. glslang::TType simpleArrayType(type, 0); // deference type of the array
  5217. while (simpleArrayType.getArraySizes()->getNumDims() > 1)
  5218. simpleArrayType.getArraySizes()->dereference();
  5219. // Will compute the higher-order strides here, rather than making a whole
  5220. // pile of types and doing repetitive recursion on their contents.
  5221. stride = getArrayStride(simpleArrayType, explicitLayout, qualifier.layoutMatrix);
  5222. }
  5223. // make the arrays
  5224. for (int dim = type.getArraySizes()->getNumDims() - 1; dim > 0; --dim) {
  5225. spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), dim), stride);
  5226. if (stride > 0)
  5227. builder.addDecoration(spvType, spv::Decoration::ArrayStride, stride);
  5228. stride *= type.getArraySizes()->getDimSize(dim);
  5229. }
  5230. } else {
  5231. // single-dimensional array, and don't yet have stride
  5232. // We need to decorate array strides for types needing explicit layout, except blocks.
  5233. if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock)
  5234. stride = getArrayStride(type, explicitLayout, qualifier.layoutMatrix);
  5235. }
  5236. if (type.getQualifier().storage == glslang::EvqResourceHeap ||
  5237. type.getQualifier().storage == glslang::EvqSamplerHeap) {
  5238. auto structSize = heapStructureTypeSize[spvType];
  5239. spvType = builder.makeRuntimeArray(spvType);
  5240. builder.addDecorationId(spvType, spv::Decoration::ArrayStrideIdEXT, structSize);
  5241. }
  5242. // Do the outer dimension, which might not be known for a runtime-sized array.
  5243. // (Unsized arrays that survive through linking will be runtime-sized arrays)
  5244. else if (type.isSizedArray())
  5245. spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), 0), stride);
  5246. else {
  5247. // If we see an runtime array in a buffer_reference, it is not a descriptor
  5248. if (!lastBufferBlockMember && type.getBasicType() != glslang::EbtReference) {
  5249. builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
  5250. builder.addCapability(spv::Capability::RuntimeDescriptorArrayEXT);
  5251. }
  5252. spvType = builder.makeRuntimeArray(spvType);
  5253. }
  5254. if (stride > 0)
  5255. builder.addDecoration(spvType, spv::Decoration::ArrayStride, stride);
  5256. }
  5257. return spvType;
  5258. }
  5259. // Apply SPIR-V decorations to the SPIR-V object (provided by SPIR-V ID). If member index is provided, the
  5260. // decorations are applied to this member.
  5261. void TGlslangToSpvTraverser::applySpirvDecorate(const glslang::TType& type, spv::Id id, std::optional<int> member)
  5262. {
  5263. assert(type.getQualifier().hasSpirvDecorate());
  5264. const glslang::TSpirvDecorate& spirvDecorate = type.getQualifier().getSpirvDecorate();
  5265. // Add spirv_decorate
  5266. for (auto& decorate : spirvDecorate.decorates) {
  5267. if (!decorate.second.empty()) {
  5268. std::vector<unsigned> literals;
  5269. TranslateLiterals(decorate.second, literals);
  5270. if (member.has_value())
  5271. builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorate.first), literals);
  5272. else
  5273. builder.addDecoration(id, static_cast<spv::Decoration>(decorate.first), literals);
  5274. } else {
  5275. if (member.has_value())
  5276. builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorate.first));
  5277. else
  5278. builder.addDecoration(id, static_cast<spv::Decoration>(decorate.first));
  5279. }
  5280. }
  5281. // Add spirv_decorate_id
  5282. if (member.has_value()) {
  5283. // spirv_decorate_id not applied to members
  5284. assert(spirvDecorate.decorateIds.empty());
  5285. } else {
  5286. for (auto& decorateId : spirvDecorate.decorateIds) {
  5287. std::vector<spv::Id> operandIds;
  5288. assert(!decorateId.second.empty());
  5289. for (auto extraOperand : decorateId.second) {
  5290. if (extraOperand->getQualifier().isFrontEndConstant())
  5291. operandIds.push_back(createSpvConstant(*extraOperand));
  5292. else
  5293. operandIds.push_back(getSymbolId(extraOperand->getAsSymbolNode()));
  5294. }
  5295. builder.addDecorationId(id, static_cast<spv::Decoration>(decorateId.first), operandIds);
  5296. }
  5297. }
  5298. // Add spirv_decorate_string
  5299. for (auto& decorateString : spirvDecorate.decorateStrings) {
  5300. std::vector<const char*> strings;
  5301. assert(!decorateString.second.empty());
  5302. for (auto extraOperand : decorateString.second) {
  5303. const char* string = extraOperand->getConstArray()[0].getSConst()->c_str();
  5304. strings.push_back(string);
  5305. }
  5306. if (member.has_value())
  5307. builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorateString.first), strings);
  5308. else
  5309. builder.addDecoration(id, static_cast<spv::Decoration>(decorateString.first), strings);
  5310. }
  5311. }
  5312. // TODO: this functionality should exist at a higher level, in creating the AST
  5313. //
  5314. // Identify interface members that don't have their required extension turned on.
  5315. //
  5316. bool TGlslangToSpvTraverser::filterMember(const glslang::TType& member)
  5317. {
  5318. auto& extensions = glslangIntermediate->getRequestedExtensions();
  5319. if (member.getFieldName() == "gl_SecondaryViewportMaskNV" &&
  5320. extensions.find("GL_NV_stereo_view_rendering") == extensions.end())
  5321. return true;
  5322. if (member.getFieldName() == "gl_SecondaryPositionNV" &&
  5323. extensions.find("GL_NV_stereo_view_rendering") == extensions.end())
  5324. return true;
  5325. if (glslangIntermediate->getStage() == EShLangMesh) {
  5326. if (member.getFieldName() == "gl_PrimitiveShadingRateEXT" &&
  5327. extensions.find("GL_EXT_fragment_shading_rate") == extensions.end())
  5328. return true;
  5329. }
  5330. if (glslangIntermediate->getStage() != EShLangMesh) {
  5331. if (member.getFieldName() == "gl_ViewportMask" &&
  5332. extensions.find("GL_NV_viewport_array2") == extensions.end())
  5333. return true;
  5334. if (member.getFieldName() == "gl_PositionPerViewNV" &&
  5335. extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())
  5336. return true;
  5337. if (member.getFieldName() == "gl_ViewportMaskPerViewNV" &&
  5338. extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())
  5339. return true;
  5340. }
  5341. return false;
  5342. }
  5343. // Do full recursive conversion of a glslang structure (or block) type to a SPIR-V Id.
  5344. // explicitLayout can be kept the same throughout the hierarchical recursive walk.
  5345. // Mutually recursive with convertGlslangToSpvType().
  5346. spv::Id TGlslangToSpvTraverser::convertGlslangStructToSpvType(const glslang::TType& type,
  5347. const glslang::TTypeList* glslangMembers,
  5348. glslang::TLayoutPacking explicitLayout,
  5349. const glslang::TQualifier& qualifier)
  5350. {
  5351. // Create a vector of struct types for SPIR-V to consume
  5352. std::vector<spv::Id> spvMembers;
  5353. int memberDelta = 0; // how much the member's index changes from glslang to SPIR-V, normally 0,
  5354. // except sometimes for blocks
  5355. std::vector<std::pair<glslang::TType*, glslang::TQualifier> > deferredForwardPointers;
  5356. std::vector<spv::StructMemberDebugInfo> memberDebugInfo;
  5357. for (int i = 0; i < (int)glslangMembers->size(); i++) {
  5358. auto& glslangMember = (*glslangMembers)[i];
  5359. if (glslangMember.type->hiddenMember()) {
  5360. ++memberDelta;
  5361. if (type.getBasicType() == glslang::EbtBlock)
  5362. memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = -1;
  5363. } else {
  5364. if (type.getBasicType() == glslang::EbtBlock) {
  5365. if (filterMember(*glslangMember.type)) {
  5366. memberDelta++;
  5367. memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = -1;
  5368. continue;
  5369. }
  5370. memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = i - memberDelta;
  5371. }
  5372. // modify just this child's view of the qualifier
  5373. glslang::TQualifier memberQualifier = glslangMember.type->getQualifier();
  5374. InheritQualifiers(memberQualifier, qualifier);
  5375. // manually inherit location
  5376. if (! memberQualifier.hasLocation() && qualifier.hasLocation())
  5377. memberQualifier.layoutLocation = qualifier.layoutLocation;
  5378. // recurse
  5379. bool lastBufferBlockMember = qualifier.storage == glslang::EvqBuffer &&
  5380. i == (int)glslangMembers->size() - 1;
  5381. // Make forward pointers for any pointer members.
  5382. if (glslangMember.type->isReference() &&
  5383. forwardPointers.find(glslangMember.type->getReferentType()) == forwardPointers.end()) {
  5384. deferredForwardPointers.push_back(std::make_pair(glslangMember.type, memberQualifier));
  5385. }
  5386. // Create the member type.
  5387. auto const spvMember = convertGlslangToSpvType(*glslangMember.type, explicitLayout, memberQualifier, lastBufferBlockMember,
  5388. glslangMember.type->isReference());
  5389. spvMembers.push_back(spvMember);
  5390. // Update the builder with the type's location so that we can create debug types for the structure members.
  5391. // There doesn't exist a "clean" entry point for this information to be passed along to the builder so, for now,
  5392. // it is stored in the builder and consumed during the construction of composite debug types.
  5393. // TODO: This probably warrants further investigation. This approach was decided to be the least ugly of the
  5394. // quick and dirty approaches that were tried.
  5395. // Advantages of this approach:
  5396. // + Relatively clean. No direct calls into debug type system.
  5397. // + Handles nested recursive structures.
  5398. // Disadvantages of this approach:
  5399. // + Not as clean as desired. Traverser queries/sets persistent state. This is fragile.
  5400. // + Table lookup during creation of composite debug types. This really shouldn't be necessary.
  5401. if(options.emitNonSemanticShaderDebugInfo) {
  5402. spv::StructMemberDebugInfo debugInfo{};
  5403. debugInfo.name = glslangMember.type->getFieldName();
  5404. debugInfo.line = glslangMember.loc.line;
  5405. debugInfo.column = glslangMember.loc.column;
  5406. // Per the GLSL spec, bool variables inside of a uniform or buffer block are generated as uint.
  5407. // But for debug info, we want to represent them as bool because that is the original type in
  5408. // the source code. The bool type can be nested within a vector or a multidimensional array,
  5409. // so we must construct the chain of types up from the scalar bool.
  5410. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl && explicitLayout != glslang::ElpNone &&
  5411. glslangMember.type->getBasicType() == glslang::EbtBool) {
  5412. auto typeId = builder.makeBoolType();
  5413. if (glslangMember.type->isVector()) {
  5414. typeId = builder.makeVectorType(typeId, glslangMember.type->getVectorSize());
  5415. }
  5416. if (glslangMember.type->isArray()) {
  5417. const auto* arraySizes = glslangMember.type->getArraySizes();
  5418. int dims = arraySizes->getNumDims();
  5419. for (int i = dims - 1; i >= 0; --i) {
  5420. spv::Id size = builder.makeIntConstant(arraySizes->getDimSize(i));
  5421. typeId = builder.makeArrayType(typeId, size, 0);
  5422. }
  5423. }
  5424. debugInfo.debugTypeOverride = builder.getDebugType(typeId);
  5425. }
  5426. memberDebugInfo.push_back(debugInfo);
  5427. }
  5428. }
  5429. }
  5430. // For those whose storage is ResourceHeap or SamplerHeap, we needs to recursively add
  5431. // member decorator for inner structure member declaration with spec Constant.
  5432. spv::Id heapStructSize = 0;
  5433. if (qualifier.storage == glslang::EvqResourceHeap || qualifier.storage == glslang::EvqSamplerHeap ||
  5434. qualifier.layoutDescriptorInnerBlock) {
  5435. auto memberBaseOffset = builder.makeUintConstant(0);
  5436. int maxPlainDataTypeAlignment = 0;
  5437. spv::Id descTypeMaxAlignment = 0;
  5438. auto structLastMemberSize =
  5439. decorateDescHeapType(type, memberBaseOffset, descTypeMaxAlignment, maxPlainDataTypeAlignment);
  5440. auto structureUnaligned = builder.createSpecConstantOp(
  5441. spv::Op::OpIAdd, builder.makeUintType(32), {memberBaseOffset, structLastMemberSize}, {});
  5442. auto structurePadding = builder.createSpecConstantOp(
  5443. spv::Op::OpUMod, builder.makeUintType(32), {descTypeMaxAlignment, structureUnaligned}, {});
  5444. heapStructSize = builder.createSpecConstantOp(
  5445. spv::Op::OpIAdd, builder.makeUintType(32), {structureUnaligned, structurePadding}, {});
  5446. HeapMetaData meta = {heapStructSize, descTypeMaxAlignment, maxPlainDataTypeAlignment};
  5447. heapStructureTypeMetaData[&type] = meta;
  5448. }
  5449. // Make the SPIR-V type
  5450. spv::Id spvType = builder.makeStructType(spvMembers, memberDebugInfo, type.getTypeName().c_str(), false);
  5451. if (! HasNonLayoutQualifiers(type, qualifier))
  5452. structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers] = spvType;
  5453. // Keep decoration data order after spv structure type.
  5454. if (qualifier.storage == glslang::EvqResourceHeap || qualifier.storage == glslang::EvqSamplerHeap ||
  5455. qualifier.layoutDescriptorInnerBlock) {
  5456. heapStructureTypeSize[spvType] = heapStructSize;
  5457. for (unsigned int i = 0; i < spvMembers.size(); i++) {
  5458. builder.addMemberDecorationIdEXT(spvType, i, spv::Decoration::OffsetIdEXT, {heapStructureMemberOffsets[i]});
  5459. }
  5460. heapStructureMemberOffsets.clear();
  5461. }
  5462. // Decorate it
  5463. decorateStructType(type, glslangMembers, explicitLayout, qualifier, spvType, spvMembers);
  5464. for (int i = 0; i < (int)deferredForwardPointers.size(); ++i) {
  5465. auto it = deferredForwardPointers[i];
  5466. convertGlslangToSpvType(*it.first, explicitLayout, it.second, false);
  5467. }
  5468. return spvType;
  5469. }
  5470. // Return not aligned size of current type.
  5471. spv::Id TGlslangToSpvTraverser::decorateDescHeapType(
  5472. const glslang::TType& type,
  5473. spv::Id &memberBaseOffset,
  5474. spv::Id &descTypeAlignment,
  5475. int& maxPlainDataAlignment)
  5476. {
  5477. glslang::TLayoutPacking explicitLayout = glslang::ElpScalar;
  5478. auto selectMaxRsrcTyAlign = [&](spv::Id typeSize) {
  5479. if (descTypeAlignment != 0) {
  5480. auto compareInst = builder.createSpecConstantOp(spv::Op::OpUGreaterThan, builder.makeBoolType(),
  5481. {descTypeAlignment, typeSize}, {});
  5482. auto selectMaxAlign = builder.createSpecConstantOp(spv::Op::OpSelect, builder.makeUintType(32),
  5483. {compareInst, descTypeAlignment, typeSize}, {});
  5484. descTypeAlignment = selectMaxAlign;
  5485. } else
  5486. descTypeAlignment = typeSize;
  5487. };
  5488. // Get or calculate following info ordered.
  5489. // Member Type | Type size | Type alignment within current structure | Type offset.
  5490. // PS. resource blocks declared within a structure will not be processed as a normal declaration before,
  5491. // and its' size is dependent on constantSizeOfEXT op, so we won't trigger it as a normal structure here.
  5492. bool isArray = type.isArray();
  5493. if (type.isStruct() && !type.getQualifier().layoutDescriptorInnerBlock) {
  5494. // 1. Structure type is processed from inner to higher level.
  5495. // If member is a sturcture, it will be processed earlier,
  5496. // parent structure could just load early results.
  5497. if (heapStructureTypeMetaData.find(&type) != heapStructureTypeMetaData.end()) {
  5498. auto metadata = heapStructureTypeMetaData[&type];
  5499. selectMaxRsrcTyAlign(metadata.maxRsrcTypeAlignment);
  5500. maxPlainDataAlignment = std::max(metadata.maxPlainDataAlignment, maxPlainDataAlignment);
  5501. return metadata.typeStride;
  5502. }
  5503. // For other nested structure, it would be declared before its parent,
  5504. // so it should be directly returned a result in above check.
  5505. const glslang::TTypeList* structTyList = type.getStruct();
  5506. spv::Id previousTypeSize = 0;
  5507. auto currentOffset = memberBaseOffset;
  5508. for (int i = 0; i < (int)structTyList->size(); i++) {
  5509. // Get offset :
  5510. // OffsetsBase = default ? 0 : OffsetInLayout;
  5511. // OffsetsBase = OffsetsBase + previousOffset + previousPadding.
  5512. const glslang::TType& memberTy = *(*structTyList)[i].type;
  5513. spv::Id typeSize = decorateDescHeapType(memberTy, currentOffset, descTypeAlignment, maxPlainDataAlignment);
  5514. // 2. Get each member's unaligned offset, padding and aligned offset.
  5515. // As this function is processed recursively, from bottom to upper, so in here,
  5516. // non-structure member's alignment should have been known.
  5517. if (i != 0) {
  5518. auto offsetNotAligned = builder.createSpecConstantOp(spv::Op::OpIAdd, builder.makeUintType(32),
  5519. {currentOffset, previousTypeSize}, {});
  5520. auto offsetPadding = builder.createSpecConstantOp(spv::Op::OpUMod, builder.makeUintType(32),
  5521. {typeSize, offsetNotAligned}, {});
  5522. currentOffset = builder.createSpecConstantOp(spv::Op::OpIAdd, builder.makeUintType(32),
  5523. {offsetNotAligned, offsetPadding}, {});
  5524. }
  5525. heapStructureMemberOffsets.push_back(currentOffset);
  5526. previousTypeSize = typeSize;
  5527. }
  5528. // 3. Structure level, get max resource type's alignment, max plain data alignment and final
  5529. // structure inner alignment.
  5530. // Get compared result for alignment within whole structure.
  5531. spv::Id maxPlainAlignmentSize = builder.makeIntConstant(maxPlainDataAlignment);
  5532. // Select biggest alignemnt size between desc types and plain old types.
  5533. selectMaxRsrcTyAlign(maxPlainAlignmentSize);
  5534. memberBaseOffset = currentOffset;
  5535. // Now, return generates size of the MaterialData type
  5536. // Get structure level unaligned offset, padding and final offset outside.
  5537. return previousTypeSize;
  5538. }
  5539. // Following are normal types, structures/blocks have been processed in above part.
  5540. // Normal type or member type within a structure.
  5541. bool useConstantSizeOf =
  5542. ((type.getQualifier().isUniformOrBuffer() && type.getQualifier().layoutDescriptorHeap) ||
  5543. type.isImage() || type.isTexture() || type.isTensorARM() || type.getBasicType() == glslang::EbtAccStruct);
  5544. // Get single type and layout info.
  5545. int elemCurrentOffset, elemAlignedSize;
  5546. int memberSize, dummyStride, typeAlignment;
  5547. spv::Id spvType = 0;
  5548. if (isArray) {
  5549. glslang::TType elemTy(type, 0);
  5550. elemTy.clearArraySizes();
  5551. if (!useConstantSizeOf) {
  5552. typeAlignment = glslangIntermediate->getMemberAlignment(
  5553. elemTy, memberSize, dummyStride, glslang::ElpScalar, elemTy.getQualifier().layoutMatrix == glslang::ElmRowMajor);
  5554. updateMemberOffset(elemTy, elemTy, elemCurrentOffset, elemAlignedSize, explicitLayout, elemTy.getQualifier().layoutMatrix);
  5555. elemAlignedSize *= type.getCumulativeArraySize();
  5556. }
  5557. spvType = convertGlslangToSpvType(elemTy);
  5558. } else {
  5559. if (!useConstantSizeOf) {
  5560. typeAlignment = glslangIntermediate->getMemberAlignment(
  5561. type, memberSize, dummyStride, glslang::ElpScalar, type.getQualifier().layoutMatrix == glslang::ElmRowMajor);
  5562. updateMemberOffset(type, type, elemCurrentOffset, elemAlignedSize, explicitLayout, type.getQualifier().layoutMatrix);
  5563. }
  5564. spvType = convertGlslangToSpvType(type);
  5565. }
  5566. // Get alignment and type size.
  5567. spv::Id typeSize = 0;
  5568. if (useConstantSizeOf) {
  5569. typeSize = builder.createConstantSizeOfEXT(spvType);
  5570. // For resource type, needs to check current's largest alignment to select.
  5571. // New parent structure's alignment is equal to:
  5572. // maxInnerAlignment = currentAlignment > maxInnerAlignment
  5573. // ? currentAlignment
  5574. // : maxInnerAlignment;
  5575. selectMaxRsrcTyAlign(typeSize);
  5576. } else {
  5577. typeSize = builder.makeIntConstant(elemAlignedSize);
  5578. maxPlainDataAlignment = std::max(typeAlignment, maxPlainDataAlignment);
  5579. }
  5580. return typeSize;
  5581. }
  5582. void TGlslangToSpvTraverser::decorateStructType(const glslang::TType& type,
  5583. const glslang::TTypeList* glslangMembers,
  5584. glslang::TLayoutPacking explicitLayout,
  5585. const glslang::TQualifier& qualifier,
  5586. spv::Id spvType,
  5587. const std::vector<spv::Id>& spvMembers)
  5588. {
  5589. // Name and decorate the non-hidden members
  5590. int offset = -1;
  5591. bool memberLocationInvalid = type.isArrayOfArrays() ||
  5592. (type.isArray() && (type.getQualifier().isArrayedIo(glslangIntermediate->getStage()) == false));
  5593. for (int i = 0; i < (int)glslangMembers->size(); i++) {
  5594. glslang::TType& glslangMember = *(*glslangMembers)[i].type;
  5595. int member = i;
  5596. if (type.getBasicType() == glslang::EbtBlock) {
  5597. member = memberRemapper[glslangTypeToIdMap[glslangMembers]][i];
  5598. if (filterMember(glslangMember))
  5599. continue;
  5600. }
  5601. // modify just this child's view of the qualifier
  5602. glslang::TQualifier memberQualifier = glslangMember.getQualifier();
  5603. InheritQualifiers(memberQualifier, qualifier);
  5604. // using -1 above to indicate a hidden member
  5605. if (member < 0)
  5606. continue;
  5607. builder.addMemberName(spvType, member, glslangMember.getFieldName().c_str());
  5608. builder.addMemberDecoration(spvType, member,
  5609. TranslateLayoutDecoration(glslangMember, memberQualifier.layoutMatrix));
  5610. builder.addMemberDecoration(spvType, member, TranslatePrecisionDecoration(glslangMember));
  5611. // Add interpolation and auxiliary storage decorations only to
  5612. // top-level members of Input and Output storage classes
  5613. if (type.getQualifier().storage == glslang::EvqVaryingIn ||
  5614. type.getQualifier().storage == glslang::EvqVaryingOut) {
  5615. if (type.getBasicType() == glslang::EbtBlock ||
  5616. glslangIntermediate->getSource() == glslang::EShSourceHlsl) {
  5617. builder.addMemberDecoration(spvType, member, TranslateInterpolationDecoration(memberQualifier));
  5618. builder.addMemberDecoration(spvType, member, TranslateAuxiliaryStorageDecoration(memberQualifier));
  5619. addMeshNVDecoration(spvType, member, memberQualifier);
  5620. }
  5621. }
  5622. builder.addMemberDecoration(spvType, member, TranslateInvariantDecoration(memberQualifier));
  5623. if (type.getBasicType() == glslang::EbtBlock &&
  5624. qualifier.storage == glslang::EvqBuffer) {
  5625. // Add memory decorations only to top-level members of shader storage block
  5626. std::vector<spv::Decoration> memory;
  5627. TranslateMemoryDecoration(memberQualifier, memory, glslangIntermediate->usingVulkanMemoryModel());
  5628. for (unsigned int i = 0; i < memory.size(); ++i)
  5629. builder.addMemberDecoration(spvType, member, memory[i]);
  5630. }
  5631. // Location assignment was already completed correctly by the front end,
  5632. // just track whether a member needs to be decorated.
  5633. // Ignore member locations if the container is an array, as that's
  5634. // ill-specified and decisions have been made to not allow this.
  5635. if (!memberLocationInvalid && memberQualifier.hasLocation())
  5636. builder.addMemberDecoration(spvType, member, spv::Decoration::Location, memberQualifier.layoutLocation);
  5637. // component, XFB, others
  5638. if (glslangMember.getQualifier().hasComponent())
  5639. builder.addMemberDecoration(spvType, member, spv::Decoration::Component,
  5640. glslangMember.getQualifier().layoutComponent);
  5641. if (glslangMember.getQualifier().hasXfbOffset())
  5642. builder.addMemberDecoration(spvType, member, spv::Decoration::Offset,
  5643. glslangMember.getQualifier().layoutXfbOffset);
  5644. else if (glslangMember.getQualifier().hasMemberOffset()) {
  5645. builder.addExtension(spv::E_SPV_NV_push_constant_bank);
  5646. builder.addCapability(spv::Capability::PushConstantBanksNV);
  5647. builder.addMemberDecoration(spvType, member, spv::Decoration::MemberOffsetNV,
  5648. glslangMember.getQualifier().layoutMemberOffset);
  5649. } else if (explicitLayout != glslang::ElpNone) {
  5650. // figure out what to do with offset, which is accumulating
  5651. int nextOffset;
  5652. updateMemberOffset(type, glslangMember, offset, nextOffset, explicitLayout, memberQualifier.layoutMatrix);
  5653. if (offset >= 0)
  5654. builder.addMemberDecoration(spvType, member, spv::Decoration::Offset, offset);
  5655. offset = nextOffset;
  5656. }
  5657. if (glslangMember.isMatrix() && explicitLayout != glslang::ElpNone)
  5658. builder.addMemberDecoration(spvType, member, spv::Decoration::MatrixStride,
  5659. getMatrixStride(glslangMember, explicitLayout, memberQualifier.layoutMatrix));
  5660. // built-in variable decorations
  5661. spv::BuiltIn builtIn = TranslateBuiltInDecoration(glslangMember.getQualifier().builtIn, true);
  5662. // built-in decoration is used to detect AST nodes, but won't be decorated on member variables.
  5663. if (builtIn != spv::BuiltIn::Max &&
  5664. builtIn != spv::BuiltIn::ResourceHeapEXT && builtIn != spv::BuiltIn::SamplerHeapEXT)
  5665. builder.addMemberDecoration(spvType, member, spv::Decoration::BuiltIn, (int)builtIn);
  5666. // nonuniform
  5667. builder.addMemberDecoration(spvType, member, TranslateNonUniformDecoration(glslangMember.getQualifier()));
  5668. if (glslangIntermediate->getHlslFunctionality1() && memberQualifier.semanticName != nullptr) {
  5669. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  5670. builder.addMemberDecoration(spvType, member, spv::Decoration::HlslSemanticGOOGLE,
  5671. memberQualifier.semanticName);
  5672. }
  5673. if (builtIn == spv::BuiltIn::Layer) {
  5674. // SPV_NV_viewport_array2 extension
  5675. if (glslangMember.getQualifier().layoutViewportRelative){
  5676. builder.addMemberDecoration(spvType, member, spv::Decoration::ViewportRelativeNV);
  5677. builder.addCapability(spv::Capability::ShaderViewportMaskNV);
  5678. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  5679. }
  5680. if (glslangMember.getQualifier().layoutSecondaryViewportRelativeOffset != -2048){
  5681. builder.addMemberDecoration(spvType, member,
  5682. spv::Decoration::SecondaryViewportRelativeNV,
  5683. glslangMember.getQualifier().layoutSecondaryViewportRelativeOffset);
  5684. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  5685. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  5686. }
  5687. }
  5688. if (glslangMember.getQualifier().layoutPassthrough) {
  5689. builder.addMemberDecoration(spvType, member, spv::Decoration::PassthroughNV);
  5690. builder.addCapability(spv::Capability::GeometryShaderPassthroughNV);
  5691. builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);
  5692. }
  5693. // Add SPIR-V decorations (GL_EXT_spirv_intrinsics)
  5694. if (glslangMember.getQualifier().hasSpirvDecorate())
  5695. applySpirvDecorate(glslangMember, spvType, member);
  5696. }
  5697. // Decorate the structure
  5698. builder.addDecoration(spvType, TranslateLayoutDecoration(type, qualifier.layoutMatrix));
  5699. const auto basicType = type.getBasicType();
  5700. const auto typeStorageQualifier = type.getQualifier().storage;
  5701. if (basicType == glslang::EbtBlock) {
  5702. builder.addDecoration(spvType, TranslateBlockDecoration(typeStorageQualifier, glslangIntermediate->usingStorageBuffer()));
  5703. } else if (basicType == glslang::EbtStruct && glslangIntermediate->getSpv().vulkan > 0) {
  5704. const auto hasRuntimeArray = !spvMembers.empty() && builder.getOpCode(spvMembers.back()) == spv::Op::OpTypeRuntimeArray;
  5705. if (hasRuntimeArray) {
  5706. builder.addDecoration(spvType, TranslateBlockDecoration(typeStorageQualifier, glslangIntermediate->usingStorageBuffer()));
  5707. }
  5708. }
  5709. if (qualifier.hasHitObjectShaderRecordNV())
  5710. builder.addDecoration(spvType, spv::Decoration::HitObjectShaderRecordBufferNV);
  5711. if (qualifier.hasBank()) {
  5712. builder.addExtension(spv::E_SPV_NV_push_constant_bank);
  5713. builder.addCapability(spv::Capability::PushConstantBanksNV);
  5714. builder.addDecoration(spvType, spv::Decoration::BankNV, qualifier.layoutBank);
  5715. }
  5716. if (qualifier.hasHitObjectShaderRecordEXT())
  5717. builder.addDecoration(spvType, spv::Decoration::HitObjectShaderRecordBufferEXT);
  5718. }
  5719. // Turn the expression forming the array size into an id.
  5720. // This is not quite trivial, because of specialization constants.
  5721. // Sometimes, a raw constant is turned into an Id, and sometimes
  5722. // a specialization constant expression is.
  5723. spv::Id TGlslangToSpvTraverser::makeArraySizeId(const glslang::TArraySizes& arraySizes, int dim, bool allowZero, bool boolType)
  5724. {
  5725. // First, see if this is sized with a node, meaning a specialization constant:
  5726. glslang::TIntermTyped* specNode = arraySizes.getDimNode(dim);
  5727. if (specNode != nullptr) {
  5728. builder.clearAccessChain();
  5729. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  5730. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  5731. specNode->traverse(this);
  5732. return accessChainLoad(specNode->getAsTyped()->getType());
  5733. }
  5734. // Otherwise, need a compile-time (front end) size, get it:
  5735. int size = arraySizes.getDimSize(dim);
  5736. if (!allowZero)
  5737. assert(size > 0);
  5738. if (boolType) {
  5739. return builder.makeBoolConstant(size);
  5740. } else {
  5741. return builder.makeUintConstant(size);
  5742. }
  5743. }
  5744. // Wrap the builder's accessChainLoad to:
  5745. // - localize handling of RelaxedPrecision
  5746. // - use the SPIR-V inferred type instead of another conversion of the glslang type
  5747. // (avoids unnecessary work and possible type punning for structures)
  5748. // - do conversion of concrete to abstract type
  5749. spv::Id TGlslangToSpvTraverser::accessChainLoad(const glslang::TType& type)
  5750. {
  5751. spv::Id nominalTypeId = builder.accessChainGetInferredType();
  5752. spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
  5753. coherentFlags |= TranslateCoherent(type);
  5754. spv::MemoryAccessMask accessMask = spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) & ~spv::MemoryAccessMask::MakePointerAvailableKHR);
  5755. // If the value being loaded is HelperInvocation, SPIR-V 1.6 is being generated (so that
  5756. // SPV_EXT_demote_to_helper_invocation is in core) and the memory model is in use, add
  5757. // the Volatile MemoryAccess semantic.
  5758. if (type.getQualifier().builtIn == glslang::EbvHelperInvocation &&
  5759. glslangIntermediate->usingVulkanMemoryModel() &&
  5760. glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  5761. accessMask = spv::MemoryAccessMask(accessMask | spv::MemoryAccessMask::Volatile);
  5762. }
  5763. unsigned int alignment = builder.getAccessChain().alignment;
  5764. alignment |= type.getBufferReferenceAlignment();
  5765. spv::Id loadedId = builder.accessChainLoad(TranslatePrecisionDecoration(type),
  5766. TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags),
  5767. TranslateNonUniformDecoration(type.getQualifier()),
  5768. nominalTypeId,
  5769. accessMask,
  5770. TranslateMemoryScope(coherentFlags),
  5771. alignment);
  5772. // Need to convert to abstract types when necessary
  5773. if (type.getBasicType() == glslang::EbtBool) {
  5774. loadedId = convertLoadedBoolInUniformToUint(type, nominalTypeId, loadedId);
  5775. }
  5776. if (!builder.getAccessChain().descHeapInfo.descHeapInstId.empty()) {
  5777. for (auto heapInst : builder.getAccessChain().descHeapInfo.descHeapInstId)
  5778. heapInst->setTypeId(convertGlslangToSpvType(type));
  5779. builder.clearAccessChain();
  5780. }
  5781. return loadedId;
  5782. }
  5783. // Wrap the builder's accessChainStore to:
  5784. // - do conversion of concrete to abstract type
  5785. //
  5786. // Implicitly uses the existing builder.accessChain as the storage target.
  5787. void TGlslangToSpvTraverser::accessChainStore(const glslang::TType& type, spv::Id rvalue)
  5788. {
  5789. // Need to convert to abstract types when necessary
  5790. if (type.getBasicType() == glslang::EbtBool) {
  5791. spv::Id nominalTypeId = builder.accessChainGetInferredType();
  5792. if (builder.isScalarType(nominalTypeId)) {
  5793. // Conversion for bool
  5794. spv::Id boolType = builder.makeBoolType();
  5795. if (nominalTypeId != boolType) {
  5796. // keep these outside arguments, for determinant order-of-evaluation
  5797. spv::Id one = builder.makeUintConstant(1);
  5798. spv::Id zero = builder.makeUintConstant(0);
  5799. rvalue = builder.createTriOp(spv::Op::OpSelect, nominalTypeId, rvalue, one, zero);
  5800. } else if (builder.getTypeId(rvalue) != boolType)
  5801. rvalue = builder.createBinOp(spv::Op::OpINotEqual, boolType, rvalue, builder.makeUintConstant(0));
  5802. } else if (builder.isVectorType(nominalTypeId)) {
  5803. // Conversion for bvec
  5804. int vecSize = builder.getNumTypeComponents(nominalTypeId);
  5805. spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);
  5806. if (nominalTypeId != bvecType) {
  5807. // keep these outside arguments, for determinant order-of-evaluation
  5808. spv::Id one = makeSmearedConstant(builder.makeUintConstant(1), vecSize);
  5809. spv::Id zero = makeSmearedConstant(builder.makeUintConstant(0), vecSize);
  5810. rvalue = builder.createTriOp(spv::Op::OpSelect, nominalTypeId, rvalue, one, zero);
  5811. } else if (builder.getTypeId(rvalue) != bvecType)
  5812. rvalue = builder.createBinOp(spv::Op::OpINotEqual, bvecType, rvalue,
  5813. makeSmearedConstant(builder.makeUintConstant(0), vecSize));
  5814. }
  5815. }
  5816. spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
  5817. coherentFlags |= TranslateCoherent(type);
  5818. unsigned int alignment = builder.getAccessChain().alignment;
  5819. alignment |= type.getBufferReferenceAlignment();
  5820. builder.accessChainStore(rvalue, TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags),
  5821. spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) &
  5822. ~spv::MemoryAccessMask::MakePointerVisibleKHR),
  5823. TranslateMemoryScope(coherentFlags), alignment);
  5824. }
  // For storing when types match at the glslang level, but might not match at the
  // SPIR-V level.
  5827. //
  5828. // This especially happens when a single glslang type expands to multiple
  5829. // SPIR-V types, like a struct that is used in a member-undecorated way as well
  5830. // as in a member-decorated way.
  5831. //
  5832. // NOTE: This function can handle any store request; if it's not special it
  5833. // simplifies to a simple OpStore.
  5834. //
  5835. // Implicitly uses the existing builder.accessChain as the storage target.
  5836. void TGlslangToSpvTraverser::multiTypeStore(const glslang::TType& type, spv::Id rValue)
  5837. {
  5838. // we only do the complex path here if it's an aggregate
  5839. if (! type.isStruct() && ! type.isArray()) {
  5840. accessChainStore(type, rValue);
  5841. return;
  5842. }
  5843. // and, it has to be a case of type aliasing
  5844. spv::Id rType = builder.getTypeId(rValue);
  5845. spv::Id lValue = builder.accessChainGetLValue();
  5846. spv::Id lType = builder.getContainedTypeId(builder.getTypeId(lValue));
  5847. if (lType == rType) {
  5848. accessChainStore(type, rValue);
  5849. return;
  5850. }
  5851. // Recursively (as needed) copy an aggregate type to a different aggregate type,
  5852. // where the two types were the same type in GLSL. This requires member
  5853. // by member copy, recursively.
  5854. // SPIR-V 1.4 added an instruction to do help do this.
  5855. if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  5856. // However, bool in uniform space is changed to int, so
  5857. // OpCopyLogical does not work for that.
  5858. // TODO: It would be more robust to do a full recursive verification of the types satisfying SPIR-V rules.
  5859. bool rBool = builder.containsType(builder.getTypeId(rValue), spv::Op::OpTypeBool, 0);
  5860. bool lBool = builder.containsType(lType, spv::Op::OpTypeBool, 0);
  5861. if (lBool == rBool) {
  5862. spv::Id logicalCopy = builder.createUnaryOp(spv::Op::OpCopyLogical, lType, rValue);
  5863. accessChainStore(type, logicalCopy);
  5864. return;
  5865. }
  5866. }
  5867. // If an array, copy element by element.
  5868. if (type.isArray()) {
  5869. glslang::TType glslangElementType(type, 0);
  5870. spv::Id elementRType = builder.getContainedTypeId(rType);
  5871. for (int index = 0; index < type.getOuterArraySize(); ++index) {
  5872. // get the source member
  5873. spv::Id elementRValue = builder.createCompositeExtract(rValue, elementRType, index);
  5874. // set up the target storage
  5875. builder.clearAccessChain();
  5876. builder.setAccessChainLValue(lValue);
  5877. builder.accessChainPush(builder.makeIntConstant(index), TranslateCoherent(type),
  5878. type.getBufferReferenceAlignment());
  5879. // store the member
  5880. multiTypeStore(glslangElementType, elementRValue);
  5881. }
  5882. } else {
  5883. assert(type.isStruct());
  5884. // loop over structure members
  5885. const glslang::TTypeList& members = *type.getStruct();
  5886. for (int m = 0; m < (int)members.size(); ++m) {
  5887. const glslang::TType& glslangMemberType = *members[m].type;
  5888. // get the source member
  5889. spv::Id memberRType = builder.getContainedTypeId(rType, m);
  5890. spv::Id memberRValue = builder.createCompositeExtract(rValue, memberRType, m);
  5891. // set up the target storage
  5892. builder.clearAccessChain();
  5893. builder.setAccessChainLValue(lValue);
  5894. builder.accessChainPush(builder.makeIntConstant(m), TranslateCoherent(type),
  5895. type.getBufferReferenceAlignment());
  5896. // store the member
  5897. multiTypeStore(glslangMemberType, memberRValue);
  5898. }
  5899. }
  5900. }
  5901. // Decide whether or not this type should be
  5902. // decorated with offsets and strides, and if so
  5903. // whether std140 or std430 rules should be applied.
  5904. glslang::TLayoutPacking TGlslangToSpvTraverser::getExplicitLayout(const glslang::TType& type) const
  5905. {
  5906. // has to be a block
  5907. if (type.getBasicType() != glslang::EbtBlock)
  5908. return glslang::ElpNone;
  5909. // has to be a uniform or buffer block or task in/out blocks
  5910. if (type.getQualifier().storage != glslang::EvqUniform &&
  5911. type.getQualifier().storage != glslang::EvqBuffer &&
  5912. type.getQualifier().storage != glslang::EvqShared &&
  5913. !type.getQualifier().isTaskMemory())
  5914. return glslang::ElpNone;
  5915. // return the layout to use
  5916. switch (type.getQualifier().layoutPacking) {
  5917. case glslang::ElpStd140:
  5918. case glslang::ElpStd430:
  5919. case glslang::ElpScalar:
  5920. return type.getQualifier().layoutPacking;
  5921. default:
  5922. return glslang::ElpNone;
  5923. }
  5924. }
  5925. // Given an array type, returns the integer stride required for that array
  5926. int TGlslangToSpvTraverser::getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking explicitLayout,
  5927. glslang::TLayoutMatrix matrixLayout)
  5928. {
  5929. int size;
  5930. int stride;
  5931. glslangIntermediate->getMemberAlignment(arrayType, size, stride, explicitLayout,
  5932. matrixLayout == glslang::ElmRowMajor);
  5933. return stride;
  5934. }
  5935. // Given a matrix type, or array (of array) of matrixes type, returns the integer stride required for that matrix
  5936. // when used as a member of an interface block
  5937. int TGlslangToSpvTraverser::getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking explicitLayout,
  5938. glslang::TLayoutMatrix matrixLayout)
  5939. {
  5940. glslang::TType elementType;
  5941. elementType.shallowCopy(matrixType);
  5942. elementType.clearArraySizes();
  5943. int size;
  5944. int stride;
  5945. glslangIntermediate->getMemberAlignment(elementType, size, stride, explicitLayout,
  5946. matrixLayout == glslang::ElmRowMajor);
  5947. return stride;
  5948. }
  5949. // Given a member type of a struct, realign the current offset for it, and compute
  5950. // the next (not yet aligned) offset for the next member, which will get aligned
  5951. // on the next call.
  5952. // 'currentOffset' should be passed in already initialized, ready to modify, and reflecting
  5953. // the migration of data from nextOffset -> currentOffset. It should be -1 on the first call.
  5954. // -1 means a non-forced member offset (no decoration needed).
  5955. void TGlslangToSpvTraverser::updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType,
  5956. int& currentOffset, int& nextOffset, glslang::TLayoutPacking explicitLayout, glslang::TLayoutMatrix matrixLayout)
  5957. {
  5958. // this will get a positive value when deemed necessary
  5959. nextOffset = -1;
  5960. // override anything in currentOffset with user-set offset
  5961. if (memberType.getQualifier().hasOffset())
  5962. currentOffset = memberType.getQualifier().layoutOffset;
  5963. // It could be that current linker usage in glslang updated all the layoutOffset,
  5964. // in which case the following code does not matter. But, that's not quite right
  5965. // once cross-compilation unit GLSL validation is done, as the original user
  5966. // settings are needed in layoutOffset, and then the following will come into play.
  5967. if (explicitLayout == glslang::ElpNone) {
  5968. if (! memberType.getQualifier().hasOffset())
  5969. currentOffset = -1;
  5970. return;
  5971. }
  5972. // Getting this far means we need explicit offsets
  5973. if (currentOffset < 0)
  5974. currentOffset = 0;
  5975. // Now, currentOffset is valid (either 0, or from a previous nextOffset),
  5976. // but possibly not yet correctly aligned.
  5977. int memberSize;
  5978. int dummyStride;
  5979. int memberAlignment = glslangIntermediate->getMemberAlignment(memberType, memberSize, dummyStride, explicitLayout,
  5980. matrixLayout == glslang::ElmRowMajor);
  5981. bool isVectorLike = memberType.isVector();
  5982. if (memberType.isMatrix()) {
  5983. if (matrixLayout == glslang::ElmRowMajor)
  5984. isVectorLike = memberType.getMatrixRows() == 1;
  5985. else
  5986. isVectorLike = memberType.getMatrixCols() == 1;
  5987. }
  5988. // Adjust alignment for HLSL rules
  5989. // TODO: make this consistent in early phases of code:
  5990. // adjusting this late means inconsistencies with earlier code, which for reflection is an issue
  5991. // Until reflection is brought in sync with these adjustments, don't apply to $Global,
  5992. // which is the most likely to rely on reflection, and least likely to rely implicit layouts
  5993. if (glslangIntermediate->usingHlslOffsets() &&
  5994. ! memberType.isStruct() && structType.getTypeName().compare("$Global") != 0) {
  5995. int componentSize;
  5996. int componentAlignment = glslangIntermediate->getBaseAlignmentScalar(memberType, componentSize);
  5997. if (! memberType.isArray() && isVectorLike && componentAlignment <= 4)
  5998. memberAlignment = componentAlignment;
  5999. // Don't add unnecessary padding after this member
  6000. // (undo std140 bumping size to a mutliple of vec4)
  6001. if (explicitLayout == glslang::ElpStd140) {
  6002. if (memberType.isMatrix()) {
  6003. if (matrixLayout == glslang::ElmRowMajor)
  6004. memberSize -= componentSize * (4 - memberType.getMatrixCols());
  6005. else
  6006. memberSize -= componentSize * (4 - memberType.getMatrixRows());
  6007. } else if (memberType.isArray())
  6008. memberSize -= componentSize * (4 - memberType.getVectorSize());
  6009. }
  6010. }
  6011. // Bump up to member alignment
  6012. glslang::RoundToPow2(currentOffset, memberAlignment);
  6013. // Bump up to vec4 if there is a bad straddle
  6014. if (explicitLayout != glslang::ElpScalar && glslangIntermediate->improperStraddle(memberType, memberSize,
  6015. currentOffset, isVectorLike))
  6016. glslang::RoundToPow2(currentOffset, 16);
  6017. nextOffset = currentOffset + memberSize;
  6018. }
  6019. void TGlslangToSpvTraverser::declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember)
  6020. {
  6021. const glslang::TBuiltInVariable glslangBuiltIn = members[glslangMember].type->getQualifier().builtIn;
  6022. switch (glslangBuiltIn)
  6023. {
  6024. case glslang::EbvPointSize:
  6025. case glslang::EbvClipDistance:
  6026. case glslang::EbvCullDistance:
  6027. case glslang::EbvViewportMaskNV:
  6028. case glslang::EbvSecondaryPositionNV:
  6029. case glslang::EbvSecondaryViewportMaskNV:
  6030. case glslang::EbvPositionPerViewNV:
  6031. case glslang::EbvViewportMaskPerViewNV:
  6032. case glslang::EbvTaskCountNV:
  6033. case glslang::EbvPrimitiveCountNV:
  6034. case glslang::EbvPrimitiveIndicesNV:
  6035. case glslang::EbvClipDistancePerViewNV:
  6036. case glslang::EbvCullDistancePerViewNV:
  6037. case glslang::EbvLayerPerViewNV:
  6038. case glslang::EbvMeshViewCountNV:
  6039. case glslang::EbvMeshViewIndicesNV:
  6040. // Generate the associated capability. Delegate to TranslateBuiltInDecoration.
  6041. // Alternately, we could just call this for any glslang built-in, since the
  6042. // capability already guards against duplicates.
  6043. TranslateBuiltInDecoration(glslangBuiltIn, false);
  6044. break;
  6045. default:
  6046. // Capabilities were already generated when the struct was declared.
  6047. break;
  6048. }
  6049. }
  6050. bool TGlslangToSpvTraverser::isShaderEntryPoint(const glslang::TIntermAggregate* node)
  6051. {
  6052. return node->getName().compare(glslangIntermediate->getEntryPointMangledName().c_str()) == 0;
  6053. }
  6054. // Does parameter need a place to keep writes, separate from the original?
  6055. // Assumes called after originalParam(), which filters out block/buffer/opaque-based
  6056. // qualifiers such that we should have only in/out/inout/constreadonly here.
  6057. bool TGlslangToSpvTraverser::writableParam(glslang::TStorageQualifier qualifier) const
  6058. {
  6059. assert(qualifier == glslang::EvqIn ||
  6060. qualifier == glslang::EvqOut ||
  6061. qualifier == glslang::EvqInOut ||
  6062. qualifier == glslang::EvqUniform ||
  6063. qualifier == glslang::EvqConstReadOnly);
  6064. return qualifier != glslang::EvqConstReadOnly &&
  6065. qualifier != glslang::EvqUniform;
  6066. }
  6067. // Is parameter pass-by-original?
  6068. bool TGlslangToSpvTraverser::originalParam(glslang::TStorageQualifier qualifier, const glslang::TType& paramType,
  6069. bool implicitThisParam)
  6070. {
  6071. if (implicitThisParam) // implicit this
  6072. return true;
  6073. if (glslangIntermediate->getSource() == glslang::EShSourceHlsl)
  6074. return paramType.getBasicType() == glslang::EbtBlock;
  6075. return (paramType.containsOpaque() && !glslangIntermediate->getBindlessMode()) || // sampler, etc.
  6076. paramType.getQualifier().isSpirvByReference() || // spirv_by_reference
  6077. (paramType.getBasicType() == glslang::EbtBlock && qualifier == glslang::EvqBuffer); // SSBO
  6078. }
  6079. // Make all the functions, skeletally, without actually visiting their bodies.
  6080. void TGlslangToSpvTraverser::makeFunctions(const glslang::TIntermSequence& glslFunctions)
  6081. {
  6082. const auto getParamDecorations = [&](std::vector<spv::Decoration>& decorations, const glslang::TType& type,
  6083. bool useVulkanMemoryModel) {
  6084. spv::Decoration paramPrecision = TranslatePrecisionDecoration(type);
  6085. if (paramPrecision != spv::NoPrecision)
  6086. decorations.push_back(paramPrecision);
  6087. TranslateMemoryDecoration(type.getQualifier(), decorations, useVulkanMemoryModel);
  6088. if (type.isReference()) {
  6089. // Original and non-writable params pass the pointer directly and
  6090. // use restrict/aliased, others are stored to a pointer in Function
  6091. // memory and use RestrictPointer/AliasedPointer.
  6092. if (originalParam(type.getQualifier().storage, type, false) ||
  6093. !writableParam(type.getQualifier().storage)) {
  6094. // TranslateMemoryDecoration added Restrict decoration already.
  6095. if (!type.getQualifier().isRestrict()) {
  6096. decorations.push_back(spv::Decoration::Aliased);
  6097. }
  6098. } else {
  6099. decorations.push_back(type.getQualifier().isRestrict() ? spv::Decoration::RestrictPointerEXT :
  6100. spv::Decoration::AliasedPointerEXT);
  6101. }
  6102. }
  6103. };
  6104. for (int f = 0; f < (int)glslFunctions.size(); ++f) {
  6105. glslang::TIntermAggregate* glslFunction = glslFunctions[f]->getAsAggregate();
  6106. if (! glslFunction || glslFunction->getOp() != glslang::EOpFunction)
  6107. continue;
  6108. builder.setDebugSourceLocation(glslFunction->getLoc().line, glslFunction->getLoc().getFilename());
  6109. if (isShaderEntryPoint(glslFunction)) {
  6110. // For HLSL, the entry function is actually a compiler generated function to resolve the difference of
  6111. // entry function signature between HLSL and SPIR-V. So we don't emit debug information for that.
  6112. if (glslangIntermediate->getSource() != glslang::EShSourceHlsl) {
  6113. builder.setupFunctionDebugInfo(shaderEntry, glslangIntermediate->getEntryPointMangledName().c_str(),
  6114. std::vector<spv::Id>(), // main function has no param
  6115. std::vector<char const*>());
  6116. }
  6117. continue;
  6118. }
  6119. // We're on a user function. Set up the basic interface for the function now,
  6120. // so that it's available to call. Translating the body will happen later.
  6121. //
  6122. // Typically (except for a "const in" parameter), an address will be passed to the
  6123. // function. What it is an address of varies:
  6124. //
  6125. // - "in" parameters not marked as "const" can be written to without modifying the calling
  6126. // argument so that write needs to be to a copy, hence the address of a copy works.
  6127. //
  6128. // - "const in" parameters can just be the r-value, as no writes need occur.
  6129. //
  6130. // - "out" and "inout" arguments can't be done as pointers to the calling argument, because
  6131. // GLSL has copy-in/copy-out semantics. They can be handled though with a pointer to a copy.
  6132. std::vector<spv::Id> paramTypes;
  6133. std::vector<char const*> paramNames;
  6134. std::vector<std::vector<spv::Decoration>> paramDecorations; // list of decorations per parameter
  6135. glslang::TIntermSequence& parameters = glslFunction->getSequence()[0]->getAsAggregate()->getSequence();
  6136. #ifdef ENABLE_HLSL
  6137. bool implicitThis = (int)parameters.size() > 0 && parameters[0]->getAsSymbolNode()->getName() ==
  6138. glslangIntermediate->implicitThisName;
  6139. #else
  6140. bool implicitThis = false;
  6141. #endif
  6142. paramDecorations.resize(parameters.size());
  6143. for (int p = 0; p < (int)parameters.size(); ++p) {
  6144. const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();
  6145. spv::Id typeId = convertGlslangToSpvType(paramType);
  6146. if (originalParam(paramType.getQualifier().storage, paramType, implicitThis && p == 0))
  6147. typeId = builder.makePointer(TranslateStorageClass(paramType), typeId);
  6148. else if (writableParam(paramType.getQualifier().storage))
  6149. typeId = builder.makePointer(spv::StorageClass::Function, typeId);
  6150. else
  6151. rValueParameters.insert(parameters[p]->getAsSymbolNode()->getId());
  6152. getParamDecorations(paramDecorations[p], paramType, glslangIntermediate->usingVulkanMemoryModel());
  6153. paramTypes.push_back(typeId);
  6154. }
  6155. for (auto const parameter:parameters) {
  6156. paramNames.push_back(parameter->getAsSymbolNode()->getName().c_str());
  6157. }
  6158. spv::Block* functionBlock;
  6159. spv::Function* function = builder.makeFunctionEntry(
  6160. TranslatePrecisionDecoration(glslFunction->getType()), convertGlslangToSpvType(glslFunction->getType()),
  6161. glslFunction->getName().c_str(), convertGlslangLinkageToSpv(glslFunction->getLinkType()), paramTypes,
  6162. paramDecorations, &functionBlock);
  6163. builder.setupFunctionDebugInfo(function, glslFunction->getName().c_str(), paramTypes, paramNames);
  6164. if (implicitThis)
  6165. function->setImplicitThis();
  6166. // Track function to emit/call later
  6167. functionMap[glslFunction->getName().c_str()] = function;
  6168. // Set the parameter id's
  6169. for (int p = 0; p < (int)parameters.size(); ++p) {
  6170. symbolValues[parameters[p]->getAsSymbolNode()->getId()] = function->getParamId(p);
  6171. // give a name too
  6172. builder.addName(function->getParamId(p), parameters[p]->getAsSymbolNode()->getName().c_str());
  6173. const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();
  6174. if (paramType.contains8BitInt())
  6175. builder.addCapability(spv::Capability::Int8);
  6176. if (paramType.contains16BitInt())
  6177. builder.addCapability(spv::Capability::Int16);
  6178. if (paramType.contains16BitFloat())
  6179. builder.addCapability(spv::Capability::Float16);
  6180. }
  6181. }
  6182. }
  6183. // Process all the initializers, while skipping the functions and link objects
  6184. void TGlslangToSpvTraverser::makeGlobalInitializers(const glslang::TIntermSequence& initializers)
  6185. {
  6186. builder.setBuildPoint(shaderEntry->getLastBlock());
  6187. for (int i = 0; i < (int)initializers.size(); ++i) {
  6188. glslang::TIntermAggregate* initializer = initializers[i]->getAsAggregate();
  6189. if (initializer && initializer->getOp() != glslang::EOpFunction && initializer->getOp() !=
  6190. glslang::EOpLinkerObjects) {
  6191. // We're on a top-level node that's not a function. Treat as an initializer, whose
  6192. // code goes into the beginning of the entry point.
  6193. initializer->traverse(this);
  6194. }
  6195. }
  6196. }
  6197. // Walk over all linker objects to create a map for payload and callable data linker objects
  6198. // and their location to be used during codegen for OpTraceKHR and OpExecuteCallableKHR
  6199. // This is done here since it is possible that these linker objects are not be referenced in the AST
  6200. void TGlslangToSpvTraverser::collectRayTracingLinkerObjects()
  6201. {
  6202. glslang::TIntermAggregate* linkerObjects = glslangIntermediate->findLinkerObjects();
  6203. for (auto& objSeq : linkerObjects->getSequence()) {
  6204. auto objNode = objSeq->getAsSymbolNode();
  6205. if (objNode != nullptr) {
  6206. if (objNode->getQualifier().hasLocation()) {
  6207. unsigned int location = objNode->getQualifier().layoutLocation;
  6208. auto st = objNode->getQualifier().storage;
  6209. int set;
  6210. switch (st)
  6211. {
  6212. case glslang::EvqPayload:
  6213. case glslang::EvqPayloadIn:
  6214. set = 0;
  6215. break;
  6216. case glslang::EvqCallableData:
  6217. case glslang::EvqCallableDataIn:
  6218. set = 1;
  6219. break;
  6220. case glslang::EvqHitObjectAttrNV:
  6221. case glslang::EvqHitObjectAttrEXT:
  6222. set = 2;
  6223. break;
  6224. default:
  6225. set = -1;
  6226. }
  6227. if (set != -1)
  6228. locationToSymbol[set].insert(std::make_pair(location, objNode));
  6229. }
  6230. }
  6231. }
  6232. }
  6233. // Process all the functions, while skipping initializers.
  6234. void TGlslangToSpvTraverser::visitFunctions(const glslang::TIntermSequence& glslFunctions)
  6235. {
  6236. for (int f = 0; f < (int)glslFunctions.size(); ++f) {
  6237. glslang::TIntermAggregate* node = glslFunctions[f]->getAsAggregate();
  6238. if (node && (node->getOp() == glslang::EOpFunction || node->getOp() == glslang::EOpLinkerObjects))
  6239. node->traverse(this);
  6240. }
  6241. }
  6242. void TGlslangToSpvTraverser::translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments,
  6243. spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags)
  6244. {
  6245. const glslang::TIntermSequence& glslangArguments = node.getSequence();
  6246. glslang::TSampler sampler = {};
  6247. bool cubeCompare = false;
  6248. bool f16ShadowCompare = false;
  6249. if (node.isTexture() || node.isImage()) {
  6250. sampler = glslangArguments[0]->getAsTyped()->getType().getSampler();
  6251. cubeCompare = sampler.dim == glslang::EsdCube && sampler.arrayed && sampler.shadow;
  6252. f16ShadowCompare = sampler.shadow &&
  6253. glslangArguments[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16;
  6254. }
  6255. for (int i = 0; i < (int)glslangArguments.size(); ++i) {
  6256. builder.clearAccessChain();
  6257. glslangArguments[i]->traverse(this);
  6258. // Special case l-value operands
  6259. bool lvalue = false;
  6260. switch (node.getOp()) {
  6261. case glslang::EOpImageAtomicAdd:
  6262. case glslang::EOpImageAtomicMin:
  6263. case glslang::EOpImageAtomicMax:
  6264. case glslang::EOpImageAtomicAnd:
  6265. case glslang::EOpImageAtomicOr:
  6266. case glslang::EOpImageAtomicXor:
  6267. case glslang::EOpImageAtomicExchange:
  6268. case glslang::EOpImageAtomicCompSwap:
  6269. case glslang::EOpImageAtomicLoad:
  6270. case glslang::EOpImageAtomicStore:
  6271. if (i == 0)
  6272. lvalue = true;
  6273. break;
  6274. case glslang::EOpSparseImageLoad:
  6275. if ((sampler.ms && i == 3) || (! sampler.ms && i == 2))
  6276. lvalue = true;
  6277. break;
  6278. case glslang::EOpSparseTexture:
  6279. if (((cubeCompare || f16ShadowCompare) && i == 3) || (! (cubeCompare || f16ShadowCompare) && i == 2))
  6280. lvalue = true;
  6281. break;
  6282. case glslang::EOpSparseTextureClamp:
  6283. if (((cubeCompare || f16ShadowCompare) && i == 4) || (! (cubeCompare || f16ShadowCompare) && i == 3))
  6284. lvalue = true;
  6285. break;
  6286. case glslang::EOpSparseTextureLod:
  6287. case glslang::EOpSparseTextureOffset:
  6288. if ((f16ShadowCompare && i == 4) || (! f16ShadowCompare && i == 3))
  6289. lvalue = true;
  6290. break;
  6291. case glslang::EOpSparseTextureFetch:
  6292. if ((sampler.dim != glslang::EsdRect && i == 3) || (sampler.dim == glslang::EsdRect && i == 2))
  6293. lvalue = true;
  6294. break;
  6295. case glslang::EOpSparseTextureFetchOffset:
  6296. if ((sampler.dim != glslang::EsdRect && i == 4) || (sampler.dim == glslang::EsdRect && i == 3))
  6297. lvalue = true;
  6298. break;
  6299. case glslang::EOpSparseTextureLodOffset:
  6300. case glslang::EOpSparseTextureGrad:
  6301. case glslang::EOpSparseTextureOffsetClamp:
  6302. if ((f16ShadowCompare && i == 5) || (! f16ShadowCompare && i == 4))
  6303. lvalue = true;
  6304. break;
  6305. case glslang::EOpSparseTextureGradOffset:
  6306. case glslang::EOpSparseTextureGradClamp:
  6307. if ((f16ShadowCompare && i == 6) || (! f16ShadowCompare && i == 5))
  6308. lvalue = true;
  6309. break;
  6310. case glslang::EOpSparseTextureGradOffsetClamp:
  6311. if ((f16ShadowCompare && i == 7) || (! f16ShadowCompare && i == 6))
  6312. lvalue = true;
  6313. break;
  6314. case glslang::EOpSparseTextureGather:
  6315. if ((sampler.shadow && i == 3) || (! sampler.shadow && i == 2))
  6316. lvalue = true;
  6317. break;
  6318. case glslang::EOpSparseTextureGatherOffset:
  6319. case glslang::EOpSparseTextureGatherOffsets:
  6320. if ((sampler.shadow && i == 4) || (! sampler.shadow && i == 3))
  6321. lvalue = true;
  6322. break;
  6323. case glslang::EOpSparseTextureGatherLod:
  6324. if (i == 3)
  6325. lvalue = true;
  6326. break;
  6327. case glslang::EOpSparseTextureGatherLodOffset:
  6328. case glslang::EOpSparseTextureGatherLodOffsets:
  6329. if (i == 4)
  6330. lvalue = true;
  6331. break;
  6332. case glslang::EOpSparseImageLoadLod:
  6333. if (i == 3)
  6334. lvalue = true;
  6335. break;
  6336. case glslang::EOpImageSampleFootprintNV:
  6337. if (i == 4)
  6338. lvalue = true;
  6339. break;
  6340. case glslang::EOpImageSampleFootprintClampNV:
  6341. case glslang::EOpImageSampleFootprintLodNV:
  6342. if (i == 5)
  6343. lvalue = true;
  6344. break;
  6345. case glslang::EOpImageSampleFootprintGradNV:
  6346. if (i == 6)
  6347. lvalue = true;
  6348. break;
  6349. case glslang::EOpImageSampleFootprintGradClampNV:
  6350. if (i == 7)
  6351. lvalue = true;
  6352. break;
  6353. case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
  6354. case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
  6355. case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
  6356. if (i == 2)
  6357. lvalue = true;
  6358. break;
  6359. case glslang::EOpConstructSaturated:
  6360. if (i == 0)
  6361. lvalue = true;
  6362. break;
  6363. default:
  6364. break;
  6365. }
  6366. if (lvalue) {
  6367. spv::Id lvalue_id = builder.accessChainGetLValue();
  6368. arguments.push_back(lvalue_id);
  6369. lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
  6370. builder.addDecoration(lvalue_id, TranslateNonUniformDecoration(lvalueCoherentFlags));
  6371. lvalueCoherentFlags |= TranslateCoherent(glslangArguments[i]->getAsTyped()->getType());
  6372. } else {
  6373. if (i > 0 &&
  6374. glslangArguments[i]->getAsSymbolNode() && glslangArguments[i-1]->getAsSymbolNode() &&
  6375. glslangArguments[i]->getAsSymbolNode()->getId() == glslangArguments[i-1]->getAsSymbolNode()->getId()) {
  6376. // Reuse the id if possible
  6377. arguments.push_back(arguments[i-1]);
  6378. } else {
  6379. arguments.push_back(accessChainLoad(glslangArguments[i]->getAsTyped()->getType()));
  6380. }
  6381. }
  6382. }
  6383. }
  6384. void TGlslangToSpvTraverser::translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments)
  6385. {
  6386. builder.clearAccessChain();
  6387. node.getOperand()->traverse(this);
  6388. arguments.push_back(accessChainLoad(node.getOperand()->getType()));
  6389. }
  6390. spv::Id TGlslangToSpvTraverser::createImageTextureFunctionCall(glslang::TIntermOperator* node)
  6391. {
  6392. if (! node->isImage() && ! node->isTexture())
  6393. return spv::NoResult;
  6394. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  6395. // Process a GLSL texturing op (will be SPV image)
  6396. const glslang::TType &imageType = node->getAsAggregate()
  6397. ? node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType()
  6398. : node->getAsUnaryNode()->getOperand()->getAsTyped()->getType();
  6399. const glslang::TSampler sampler = imageType.getSampler();
  6400. bool f16ShadowCompare = (sampler.shadow && node->getAsAggregate())
  6401. ? node->getAsAggregate()->getSequence()[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16
  6402. : false;
  6403. const auto signExtensionMask = [&]() {
  6404. if (builder.getSpvVersion() >= spv::Spv_1_4) {
  6405. if (sampler.type == glslang::EbtUint)
  6406. return spv::ImageOperandsMask::ZeroExtend;
  6407. else if (sampler.type == glslang::EbtInt)
  6408. return spv::ImageOperandsMask::SignExtend;
  6409. }
  6410. return spv::ImageOperandsMask::MaskNone;
  6411. };
  6412. spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
  6413. std::vector<spv::Id> arguments;
  6414. if (node->getAsAggregate())
  6415. translateArguments(*node->getAsAggregate(), arguments, lvalueCoherentFlags);
  6416. else
  6417. translateArguments(*node->getAsUnaryNode(), arguments);
  6418. spv::Decoration precision = TranslatePrecisionDecoration(node->getType());
  6419. spv::Builder::TextureParameters params = { };
  6420. params.sampler = arguments[0];
  6421. glslang::TCrackedTextureOp cracked;
  6422. node->crackTexture(sampler, cracked);
  6423. const bool isUnsignedResult = node->getType().getBasicType() == glslang::EbtUint;
  6424. if (builder.isSampledImage(params.sampler) &&
  6425. ((cracked.query && node->getOp() != glslang::EOpTextureQueryLod) || cracked.fragMask || cracked.fetch)) {
  6426. params.sampler = builder.createUnaryOp(spv::Op::OpImage, builder.getImageType(params.sampler), params.sampler);
  6427. if (imageType.getQualifier().isNonUniform()) {
  6428. builder.addDecoration(params.sampler, spv::Decoration::NonUniformEXT);
  6429. }
  6430. }
  6431. // Check for queries
  6432. if (cracked.query) {
  6433. switch (node->getOp()) {
  6434. case glslang::EOpImageQuerySize:
  6435. case glslang::EOpTextureQuerySize:
  6436. if (arguments.size() > 1) {
  6437. params.lod = arguments[1];
  6438. return builder.createTextureQueryCall(spv::Op::OpImageQuerySizeLod, params, isUnsignedResult);
  6439. } else
  6440. return builder.createTextureQueryCall(spv::Op::OpImageQuerySize, params, isUnsignedResult);
  6441. case glslang::EOpImageQuerySamples:
  6442. case glslang::EOpTextureQuerySamples:
  6443. return builder.createTextureQueryCall(spv::Op::OpImageQuerySamples, params, isUnsignedResult);
  6444. case glslang::EOpTextureQueryLod:
  6445. params.coords = arguments[1];
  6446. return builder.createTextureQueryCall(spv::Op::OpImageQueryLod, params, isUnsignedResult);
  6447. case glslang::EOpTextureQueryLevels:
  6448. return builder.createTextureQueryCall(spv::Op::OpImageQueryLevels, params, isUnsignedResult);
  6449. case glslang::EOpSparseTexelsResident:
  6450. return builder.createUnaryOp(spv::Op::OpImageSparseTexelsResident, builder.makeBoolType(), arguments[0]);
  6451. default:
  6452. assert(0);
  6453. break;
  6454. }
  6455. }
  6456. int components = node->getType().getVectorSize();
  6457. if (node->getOp() == glslang::EOpImageLoad ||
  6458. node->getOp() == glslang::EOpImageLoadLod ||
  6459. node->getOp() == glslang::EOpTextureFetch ||
  6460. node->getOp() == glslang::EOpTextureFetchOffset) {
  6461. // These must produce 4 components, per SPIR-V spec. We'll add a conversion constructor if needed.
  6462. // This will only happen through the HLSL path for operator[], so we do not have to handle e.g.
  6463. // the EOpTexture/Proj/Lod/etc family. It would be harmless to do so, but would need more logic
  6464. // here around e.g. which ones return scalars or other types.
  6465. components = 4;
  6466. }
  6467. glslang::TType returnType(node->getType().getBasicType(), glslang::EvqTemporary, components);
  6468. auto resultType = [&returnType,this]{ return convertGlslangToSpvType(returnType); };
  6469. // Check for image functions other than queries
  6470. if (node->isImage()) {
  6471. std::vector<spv::IdImmediate> operands;
  6472. auto opIt = arguments.begin();
  6473. spv::IdImmediate image = { true, *(opIt++) };
  6474. operands.push_back(image);
  6475. // Handle subpass operations
  6476. // TODO: GLSL should change to have the "MS" only on the type rather than the
  6477. // built-in function.
  6478. if (cracked.subpass) {
  6479. // add on the (0,0) coordinate
  6480. spv::Id zero = builder.makeIntConstant(0);
  6481. std::vector<spv::Id> comps;
  6482. comps.push_back(zero);
  6483. comps.push_back(zero);
  6484. spv::IdImmediate coord = { true,
  6485. builder.makeCompositeConstant(builder.makeVectorType(builder.makeIntType(32), 2), comps) };
  6486. operands.push_back(coord);
  6487. spv::IdImmediate imageOperands = { false, spv::ImageOperandsMask::MaskNone };
  6488. imageOperands.word = imageOperands.word | (unsigned)signExtensionMask();
  6489. if (sampler.isMultiSample()) {
  6490. imageOperands.word = imageOperands.word | (unsigned)spv::ImageOperandsMask::Sample;
  6491. }
  6492. if (imageOperands.word != (unsigned)spv::ImageOperandsMask::MaskNone) {
  6493. operands.push_back(imageOperands);
  6494. if (sampler.isMultiSample()) {
  6495. spv::IdImmediate imageOperand = { true, *(opIt++) };
  6496. operands.push_back(imageOperand);
  6497. }
  6498. }
  6499. spv::Id result = builder.createOp(spv::Op::OpImageRead, resultType(), operands);
  6500. builder.setPrecision(result, precision);
  6501. return result;
  6502. }
  6503. if (cracked.attachmentEXT) {
  6504. if (opIt != arguments.end()) {
  6505. spv::IdImmediate sample = { true, *opIt };
  6506. operands.push_back(sample);
  6507. }
  6508. spv::Id result = builder.createOp(spv::Op::OpColorAttachmentReadEXT, resultType(), operands);
  6509. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  6510. builder.setPrecision(result, precision);
  6511. return result;
  6512. }
  6513. spv::IdImmediate coord = { true, *(opIt++) };
  6514. operands.push_back(coord);
  6515. if (node->getOp() == glslang::EOpImageLoad || node->getOp() == glslang::EOpImageLoadLod) {
  6516. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  6517. if (sampler.isMultiSample()) {
  6518. mask = mask | spv::ImageOperandsMask::Sample;
  6519. }
  6520. if (cracked.lod) {
  6521. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  6522. builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
  6523. mask = mask | spv::ImageOperandsMask::Lod;
  6524. }
  6525. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  6526. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelAvailableKHR);
  6527. mask = mask | signExtensionMask();
  6528. if (mask != spv::ImageOperandsMask::MaskNone) {
  6529. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  6530. operands.push_back(imageOperands);
  6531. }
  6532. if (anySet(mask, spv::ImageOperandsMask::Sample)) {
  6533. spv::IdImmediate imageOperand = { true, *opIt++ };
  6534. operands.push_back(imageOperand);
  6535. }
  6536. if (anySet(mask, spv::ImageOperandsMask::Lod)) {
  6537. spv::IdImmediate imageOperand = { true, *opIt++ };
  6538. operands.push_back(imageOperand);
  6539. }
  6540. if (anySet(mask, spv::ImageOperandsMask::MakeTexelVisibleKHR)) {
  6541. spv::IdImmediate imageOperand = { true,
  6542. builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
  6543. operands.push_back(imageOperand);
  6544. }
  6545. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
  6546. builder.addCapability(spv::Capability::StorageImageReadWithoutFormat);
  6547. std::vector<spv::Id> result(1, builder.createOp(spv::Op::OpImageRead, resultType(), operands));
  6548. builder.setPrecision(result[0], precision);
  6549. // If needed, add a conversion constructor to the proper size.
  6550. if (components != node->getType().getVectorSize())
  6551. result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));
  6552. return result[0];
  6553. } else if (node->getOp() == glslang::EOpImageStore || node->getOp() == glslang::EOpImageStoreLod) {
  6554. // Push the texel value before the operands
  6555. if (sampler.isMultiSample() || cracked.lod) {
  6556. spv::IdImmediate texel = { true, *(opIt + 1) };
  6557. operands.push_back(texel);
  6558. } else {
  6559. spv::IdImmediate texel = { true, *opIt };
  6560. operands.push_back(texel);
  6561. }
  6562. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  6563. if (sampler.isMultiSample()) {
  6564. mask = mask | spv::ImageOperandsMask::Sample;
  6565. }
  6566. if (cracked.lod) {
  6567. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  6568. builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
  6569. mask = mask | spv::ImageOperandsMask::Lod;
  6570. }
  6571. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  6572. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelVisibleKHR);
  6573. mask = mask | signExtensionMask();
  6574. if (mask != spv::ImageOperandsMask::MaskNone) {
  6575. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  6576. operands.push_back(imageOperands);
  6577. }
  6578. if (anySet(mask, spv::ImageOperandsMask::Sample)) {
  6579. spv::IdImmediate imageOperand = { true, *opIt++ };
  6580. operands.push_back(imageOperand);
  6581. }
  6582. if (anySet(mask, spv::ImageOperandsMask::Lod)) {
  6583. spv::IdImmediate imageOperand = { true, *opIt++ };
  6584. operands.push_back(imageOperand);
  6585. }
  6586. if (anySet(mask, spv::ImageOperandsMask::MakeTexelAvailableKHR)) {
  6587. spv::IdImmediate imageOperand = { true,
  6588. builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
  6589. operands.push_back(imageOperand);
  6590. }
  6591. builder.createNoResultOp(spv::Op::OpImageWrite, operands);
  6592. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
  6593. builder.addCapability(spv::Capability::StorageImageWriteWithoutFormat);
  6594. return spv::NoResult;
  6595. } else if (node->getOp() == glslang::EOpSparseImageLoad ||
  6596. node->getOp() == glslang::EOpSparseImageLoadLod) {
  6597. builder.addCapability(spv::Capability::SparseResidency);
  6598. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
  6599. builder.addCapability(spv::Capability::StorageImageReadWithoutFormat);
  6600. spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
  6601. if (sampler.isMultiSample()) {
  6602. mask = mask | spv::ImageOperandsMask::Sample;
  6603. }
  6604. if (cracked.lod) {
  6605. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  6606. builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
  6607. mask = mask | spv::ImageOperandsMask::Lod;
  6608. }
  6609. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  6610. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelAvailableKHR);
  6611. mask = mask | signExtensionMask();
  6612. if (mask != spv::ImageOperandsMask::MaskNone) {
  6613. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  6614. operands.push_back(imageOperands);
  6615. }
  6616. if (anySet(mask, spv::ImageOperandsMask::Sample)) {
  6617. spv::IdImmediate imageOperand = { true, *opIt++ };
  6618. operands.push_back(imageOperand);
  6619. }
  6620. if (anySet(mask, spv::ImageOperandsMask::Lod)) {
  6621. spv::IdImmediate imageOperand = { true, *opIt++ };
  6622. operands.push_back(imageOperand);
  6623. }
  6624. if (anySet(mask, spv::ImageOperandsMask::MakeTexelVisibleKHR)) {
  6625. spv::IdImmediate imageOperand = { true, builder.makeUintConstant(TranslateMemoryScope(
  6626. TranslateCoherent(imageType))) };
  6627. operands.push_back(imageOperand);
  6628. }
  6629. // Create the return type that was a special structure
  6630. spv::Id texelOut = *opIt;
  6631. spv::Id typeId0 = resultType();
  6632. spv::Id typeId1 = builder.getDerefTypeId(texelOut);
  6633. spv::Id resultTypeId = builder.makeStructResultType(typeId0, typeId1);
  6634. spv::Id resultId = builder.createOp(spv::Op::OpImageSparseRead, resultTypeId, operands);
  6635. // Decode the return type
  6636. builder.createStore(builder.createCompositeExtract(resultId, typeId1, 1), texelOut);
  6637. return builder.createCompositeExtract(resultId, typeId0, 0);
  6638. } else {
  6639. // Process image atomic operations
  6640. // GLSL "IMAGE_PARAMS" will involve in constructing an image texel pointer and this pointer,
  6641. // as the first source operand, is required by SPIR-V atomic operations.
  6642. // For non-MS, the sample value should be 0
  6643. spv::IdImmediate sample = { true, sampler.isMultiSample() ? *(opIt++) : builder.makeUintConstant(0) };
  6644. operands.push_back(sample);
  6645. spv::Id resultTypeId;
  6646. glslang::TBasicType typeProxy = node->getBasicType();
  6647. // imageAtomicStore has a void return type so base the pointer type on
  6648. // the type of the value operand.
  6649. if (node->getOp() == glslang::EOpImageAtomicStore) {
  6650. resultTypeId = builder.makePointer(spv::StorageClass::Image, builder.getTypeId(*opIt));
  6651. typeProxy = node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType().getSampler().type;
  6652. } else {
  6653. resultTypeId = builder.makePointer(spv::StorageClass::Image, resultType());
  6654. }
  6655. // EXT_descriptor_heap
  6656. // For image atomic parameter, using untyped image texel pointer to carry on type metadata.
  6657. spv::Op imgTexelOp = spv::Op::OpImageTexelPointer;
  6658. if (node->getQualifier().isUsedByAtomic() &&
  6659. imageType.getQualifier().builtIn == glslang::EbvResourceHeapEXT) {
  6660. operands.insert(operands.begin(), {true, convertGlslangToSpvType(imageType)});
  6661. imgTexelOp = spv::Op::OpUntypedImageTexelPointerEXT;
  6662. resultTypeId = builder.makeUntypedPointer(spv::StorageClass::Image);
  6663. }
  6664. spv::Id pointer = builder.createOp(imgTexelOp, resultTypeId, operands);
  6665. if (imageType.getQualifier().nonUniform) {
  6666. builder.addDecoration(pointer, spv::Decoration::NonUniformEXT);
  6667. }
  6668. std::vector<spv::Id> operands;
  6669. operands.push_back(pointer);
  6670. for (; opIt != arguments.end(); ++opIt)
  6671. operands.push_back(*opIt);
  6672. return createAtomicOperation(node->getOp(), precision, resultType(), operands, typeProxy,
  6673. lvalueCoherentFlags, node->getType());
  6674. }
  6675. }
  6676. // Check for fragment mask functions other than queries
  6677. if (cracked.fragMask) {
  6678. assert(sampler.ms);
  6679. auto opIt = arguments.begin();
  6680. std::vector<spv::Id> operands;
  6681. operands.push_back(params.sampler);
  6682. ++opIt;
  6683. if (sampler.isSubpass()) {
  6684. // add on the (0,0) coordinate
  6685. spv::Id zero = builder.makeIntConstant(0);
  6686. std::vector<spv::Id> comps;
  6687. comps.push_back(zero);
  6688. comps.push_back(zero);
  6689. operands.push_back(builder.makeCompositeConstant(
  6690. builder.makeVectorType(builder.makeIntType(32), 2), comps));
  6691. }
  6692. for (; opIt != arguments.end(); ++opIt)
  6693. operands.push_back(*opIt);
  6694. spv::Op fragMaskOp = spv::Op::OpNop;
  6695. if (node->getOp() == glslang::EOpFragmentMaskFetch)
  6696. fragMaskOp = spv::Op::OpFragmentMaskFetchAMD;
  6697. else if (node->getOp() == glslang::EOpFragmentFetch)
  6698. fragMaskOp = spv::Op::OpFragmentFetchAMD;
  6699. builder.addExtension(spv::E_SPV_AMD_shader_fragment_mask);
  6700. builder.addCapability(spv::Capability::FragmentMaskAMD);
  6701. return builder.createOp(fragMaskOp, resultType(), operands);
  6702. }
  6703. // Check for texture functions other than queries
  6704. bool sparse = node->isSparseTexture();
  6705. bool imageFootprint = node->isImageFootprint();
  6706. bool cubeCompare = sampler.dim == glslang::EsdCube && sampler.isArrayed() && sampler.isShadow();
  6707. // check for bias argument
  6708. bool bias = false;
  6709. if (! cracked.lod && ! cracked.grad && ! cracked.fetch && ! cubeCompare) {
  6710. int nonBiasArgCount = 2;
  6711. if (cracked.gather)
  6712. ++nonBiasArgCount; // comp argument should be present when bias argument is present
  6713. if (f16ShadowCompare)
  6714. ++nonBiasArgCount;
  6715. if (cracked.offset)
  6716. ++nonBiasArgCount;
  6717. else if (cracked.offsets)
  6718. ++nonBiasArgCount;
  6719. if (cracked.grad)
  6720. nonBiasArgCount += 2;
  6721. if (cracked.lodClamp)
  6722. ++nonBiasArgCount;
  6723. if (sparse)
  6724. ++nonBiasArgCount;
  6725. if (imageFootprint)
  6726. //Following three extra arguments
  6727. // int granularity, bool coarse, out gl_TextureFootprint2DNV footprint
  6728. nonBiasArgCount += 3;
  6729. if ((int)arguments.size() > nonBiasArgCount)
  6730. bias = true;
  6731. }
  6732. if (cracked.gather) {
  6733. const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();
  6734. if (bias || cracked.lod ||
  6735. sourceExtensions.find(glslang::E_GL_AMD_texture_gather_bias_lod) != sourceExtensions.end()) {
  6736. builder.addExtension(spv::E_SPV_AMD_texture_gather_bias_lod);
  6737. builder.addCapability(spv::Capability::ImageGatherBiasLodAMD);
  6738. }
  6739. }
  6740. // set the rest of the arguments
  6741. params.coords = arguments[1];
  6742. int extraArgs = 0;
  6743. bool noImplicitLod = false;
  6744. // sort out where Dref is coming from
  6745. if (cubeCompare || f16ShadowCompare) {
  6746. params.Dref = arguments[2];
  6747. ++extraArgs;
  6748. } else if (sampler.shadow && cracked.gather) {
  6749. params.Dref = arguments[2];
  6750. ++extraArgs;
  6751. } else if (sampler.shadow) {
  6752. std::vector<spv::Id> indexes;
  6753. int dRefComp;
  6754. if (cracked.proj)
  6755. dRefComp = 2; // "The resulting 3rd component of P in the shadow forms is used as Dref"
  6756. else
  6757. dRefComp = builder.getNumComponents(params.coords) - 1;
  6758. indexes.push_back(dRefComp);
  6759. params.Dref = builder.createCompositeExtract(params.coords,
  6760. builder.getScalarTypeId(builder.getTypeId(params.coords)), indexes);
  6761. }
  6762. // lod
  6763. if (cracked.lod) {
  6764. params.lod = arguments[2 + extraArgs];
  6765. ++extraArgs;
  6766. } else if (glslangIntermediate->getStage() != EShLangFragment &&
  6767. !(glslangIntermediate->getStage() == EShLangCompute &&
  6768. glslangIntermediate->hasLayoutDerivativeModeNone())) {
  6769. // we need to invent the default lod for an explicit lod instruction for a non-fragment stage
  6770. noImplicitLod = true;
  6771. }
  6772. // multisample
  6773. if (sampler.isMultiSample()) {
  6774. params.sample = arguments[2 + extraArgs]; // For MS, "sample" should be specified
  6775. ++extraArgs;
  6776. }
  6777. // gradient
  6778. if (cracked.grad) {
  6779. params.gradX = arguments[2 + extraArgs];
  6780. params.gradY = arguments[3 + extraArgs];
  6781. extraArgs += 2;
  6782. }
  6783. // offset and offsets
  6784. if (cracked.offset) {
  6785. params.offset = arguments[2 + extraArgs];
  6786. ++extraArgs;
  6787. } else if (cracked.offsets) {
  6788. params.offsets = arguments[2 + extraArgs];
  6789. ++extraArgs;
  6790. }
  6791. // lod clamp
  6792. if (cracked.lodClamp) {
  6793. params.lodClamp = arguments[2 + extraArgs];
  6794. ++extraArgs;
  6795. }
  6796. // sparse
  6797. if (sparse) {
  6798. params.texelOut = arguments[2 + extraArgs];
  6799. ++extraArgs;
  6800. }
  6801. // gather component
  6802. if (cracked.gather && ! sampler.shadow) {
  6803. // default component is 0, if missing, otherwise an argument
  6804. if (2 + extraArgs < (int)arguments.size()) {
  6805. params.component = arguments[2 + extraArgs];
  6806. ++extraArgs;
  6807. } else
  6808. params.component = builder.makeIntConstant(0);
  6809. }
  6810. spv::Id resultStruct = spv::NoResult;
  6811. if (imageFootprint) {
  6812. //Following three extra arguments
  6813. // int granularity, bool coarse, out gl_TextureFootprint2DNV footprint
  6814. params.granularity = arguments[2 + extraArgs];
  6815. params.coarse = arguments[3 + extraArgs];
  6816. resultStruct = arguments[4 + extraArgs];
  6817. extraArgs += 3;
  6818. }
  6819. // bias
  6820. if (bias) {
  6821. params.bias = arguments[2 + extraArgs];
  6822. ++extraArgs;
  6823. }
  6824. if (imageFootprint) {
  6825. builder.addExtension(spv::E_SPV_NV_shader_image_footprint);
  6826. builder.addCapability(spv::Capability::ImageFootprintNV);
  6827. //resultStructType(OpenGL type) contains 5 elements:
  6828. //struct gl_TextureFootprint2DNV {
  6829. // uvec2 anchor;
  6830. // uvec2 offset;
  6831. // uvec2 mask;
  6832. // uint lod;
  6833. // uint granularity;
  6834. //};
  6835. //or
  6836. //struct gl_TextureFootprint3DNV {
  6837. // uvec3 anchor;
  6838. // uvec3 offset;
  6839. // uvec2 mask;
  6840. // uint lod;
  6841. // uint granularity;
  6842. //};
  6843. spv::Id resultStructType = builder.getContainedTypeId(builder.getTypeId(resultStruct));
  6844. assert(builder.isStructType(resultStructType));
  6845. //resType (SPIR-V type) contains 6 elements:
  6846. //Member 0 must be a Boolean type scalar(LOD),
  6847. //Member 1 must be a vector of integer type, whose Signedness operand is 0(anchor),
  6848. //Member 2 must be a vector of integer type, whose Signedness operand is 0(offset),
  6849. //Member 3 must be a vector of integer type, whose Signedness operand is 0(mask),
  6850. //Member 4 must be a scalar of integer type, whose Signedness operand is 0(lod),
  6851. //Member 5 must be a scalar of integer type, whose Signedness operand is 0(granularity).
  6852. std::vector<spv::Id> members;
  6853. members.push_back(resultType());
  6854. for (int i = 0; i < 5; i++) {
  6855. members.push_back(builder.getContainedTypeId(resultStructType, i));
  6856. }
  6857. spv::Id resType = builder.makeStructType(members, {}, "ResType");
  6858. //call ImageFootprintNV
  6859. spv::Id res = builder.createTextureCall(precision, resType, sparse, cracked.fetch, cracked.proj,
  6860. cracked.gather, noImplicitLod, params, signExtensionMask());
  6861. //copy resType (SPIR-V type) to resultStructType(OpenGL type)
  6862. for (int i = 0; i < 5; i++) {
  6863. builder.clearAccessChain();
  6864. builder.setAccessChainLValue(resultStruct);
  6865. //Accessing to a struct we created, no coherent flag is set
  6866. spv::Builder::AccessChain::CoherentFlags flags;
  6867. flags.clear();
  6868. builder.accessChainPush(builder.makeIntConstant(i), flags, 0);
  6869. builder.accessChainStore(builder.createCompositeExtract(res, builder.getContainedTypeId(resType, i+1),
  6870. i+1), TranslateNonUniformDecoration(imageType.getQualifier()));
  6871. }
  6872. return builder.createCompositeExtract(res, resultType(), 0);
  6873. }
  6874. // projective component (might not to move)
  6875. // GLSL: "The texture coordinates consumed from P, not including the last component of P,
  6876. // are divided by the last component of P."
  6877. // SPIR-V: "... (u [, v] [, w], q)... It may be a vector larger than needed, but all
  6878. // unused components will appear after all used components."
  6879. if (cracked.proj) {
  6880. int projSourceComp = builder.getNumComponents(params.coords) - 1;
  6881. int projTargetComp;
  6882. switch (sampler.dim) {
  6883. case glslang::Esd1D: projTargetComp = 1; break;
  6884. case glslang::Esd2D: projTargetComp = 2; break;
  6885. case glslang::EsdRect: projTargetComp = 2; break;
  6886. default: projTargetComp = projSourceComp; break;
  6887. }
  6888. // copy the projective coordinate if we have to
  6889. if (projTargetComp != projSourceComp) {
  6890. spv::Id projComp = builder.createCompositeExtract(params.coords,
  6891. builder.getScalarTypeId(builder.getTypeId(params.coords)), projSourceComp);
  6892. params.coords = builder.createCompositeInsert(projComp, params.coords,
  6893. builder.getTypeId(params.coords), projTargetComp);
  6894. }
  6895. }
  6896. // nonprivate
  6897. if (imageType.getQualifier().nonprivate) {
  6898. params.nonprivate = true;
  6899. }
  6900. // volatile
  6901. if (imageType.getQualifier().volatil) {
  6902. params.volatil = true;
  6903. }
  6904. if (imageType.getQualifier().nontemporal) {
  6905. params.nontemporal = true;
  6906. }
  6907. std::vector<spv::Id> result( 1,
  6908. builder.createTextureCall(precision, resultType(), sparse, cracked.fetch, cracked.proj, cracked.gather,
  6909. noImplicitLod, params, signExtensionMask())
  6910. );
  6911. if (components != node->getType().getVectorSize())
  6912. result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));
  6913. return result[0];
  6914. }
  6915. spv::Id TGlslangToSpvTraverser::handleUserFunctionCall(const glslang::TIntermAggregate* node)
  6916. {
  6917. // Grab the function's pointer from the previously created function
  6918. spv::Function* function = functionMap[node->getName().c_str()];
  6919. if (! function)
  6920. return 0;
  6921. const glslang::TIntermSequence& glslangArgs = node->getSequence();
  6922. const glslang::TQualifierList& qualifiers = node->getQualifierList();
  6923. // See comments in makeFunctions() for details about the semantics for parameter passing.
  6924. //
  6925. // These imply we need a four step process:
  6926. // 1. Evaluate the arguments
  6927. // 2. Allocate and make copies of in, out, and inout arguments
  6928. // 3. Make the call
  6929. // 4. Copy back the results
  6930. // 1. Evaluate the arguments and their types
  6931. std::vector<spv::Builder::AccessChain> lValues;
  6932. std::vector<spv::Id> rValues;
  6933. std::vector<const glslang::TType*> argTypes;
  6934. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  6935. argTypes.push_back(&glslangArgs[a]->getAsTyped()->getType());
  6936. // build l-value
  6937. builder.clearAccessChain();
  6938. glslangArgs[a]->traverse(this);
  6939. // keep outputs and pass-by-originals as l-values, evaluate others as r-values
  6940. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0) ||
  6941. writableParam(qualifiers[a])) {
  6942. // save l-value
  6943. lValues.push_back(builder.getAccessChain());
  6944. } else {
  6945. // process r-value
  6946. rValues.push_back(accessChainLoad(*argTypes.back()));
  6947. }
  6948. }
  6949. // Reset source location to the function call location after argument evaluation
  6950. builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
  6951. // 2. Allocate space for anything needing a copy, and if it's "in" or "inout"
  6952. // copy the original into that space.
  6953. //
  6954. // Also, build up the list of actual arguments to pass in for the call
  6955. int lValueCount = 0;
  6956. int rValueCount = 0;
  6957. std::vector<spv::Id> spvArgs;
  6958. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  6959. spv::Id arg;
  6960. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0)) {
  6961. builder.setAccessChain(lValues[lValueCount]);
  6962. arg = builder.accessChainGetLValue();
  6963. ++lValueCount;
  6964. } else if (writableParam(qualifiers[a])) {
  6965. // need space to hold the copy
  6966. arg = builder.createVariable(function->getParamPrecision(a), spv::StorageClass::Function,
  6967. builder.getContainedTypeId(function->getParamType(a)), "param");
  6968. if (qualifiers[a] == glslang::EvqIn || qualifiers[a] == glslang::EvqInOut) {
  6969. // need to copy the input into output space
  6970. builder.setAccessChain(lValues[lValueCount]);
  6971. spv::Id copy = accessChainLoad(*argTypes[a]);
  6972. builder.clearAccessChain();
  6973. builder.setAccessChainLValue(arg);
  6974. multiTypeStore(*argTypes[a], copy);
  6975. }
  6976. ++lValueCount;
  6977. } else {
  6978. // process r-value, which involves a copy for a type mismatch
  6979. if (function->getParamType(a) != builder.getTypeId(rValues[rValueCount]) ||
  6980. TranslatePrecisionDecoration(*argTypes[a]) != function->getParamPrecision(a))
  6981. {
  6982. spv::Id argCopy = builder.createVariable(function->getParamPrecision(a), spv::StorageClass::Function, function->getParamType(a), "arg");
  6983. builder.clearAccessChain();
  6984. builder.setAccessChainLValue(argCopy);
  6985. multiTypeStore(*argTypes[a], rValues[rValueCount]);
  6986. arg = builder.createLoad(argCopy, function->getParamPrecision(a));
  6987. } else
  6988. arg = rValues[rValueCount];
  6989. ++rValueCount;
  6990. }
  6991. spvArgs.push_back(arg);
  6992. }
  6993. // 3. Make the call.
  6994. spv::Id result = builder.createFunctionCall(function, spvArgs);
  6995. builder.setPrecision(result, TranslatePrecisionDecoration(node->getType()));
  6996. builder.addDecoration(result, TranslateNonUniformDecoration(node->getType().getQualifier()));
  6997. // 4. Copy back out an "out" arguments.
  6998. lValueCount = 0;
  6999. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  7000. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0))
  7001. ++lValueCount;
  7002. else if (writableParam(qualifiers[a])) {
  7003. if (qualifiers[a] == glslang::EvqOut || qualifiers[a] == glslang::EvqInOut) {
  7004. spv::Id copy = builder.createLoad(spvArgs[a], spv::NoPrecision);
  7005. builder.addDecoration(copy, TranslateNonUniformDecoration(argTypes[a]->getQualifier()));
  7006. builder.setAccessChain(lValues[lValueCount]);
  7007. multiTypeStore(*argTypes[a], copy);
  7008. }
  7009. ++lValueCount;
  7010. }
  7011. }
  7012. return result;
  7013. }
  7014. // Translate AST operation to SPV operation, already having SPV-based operands/types.
  7015. spv::Id TGlslangToSpvTraverser::createBinaryOperation(glslang::TOperator op, OpDecorations& decorations,
  7016. spv::Id typeId, spv::Id left, spv::Id right,
  7017. glslang::TBasicType typeProxy, bool reduceComparison)
  7018. {
  7019. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  7020. bool isFloat = isTypeFloat(typeProxy);
  7021. bool isBool = typeProxy == glslang::EbtBool;
  7022. spv::Op binOp = spv::Op::OpNop;
  7023. bool needMatchingVectors = true; // for non-matrix ops, would a scalar need to smear to match a vector?
  7024. bool comparison = false;
  7025. switch (op) {
  7026. case glslang::EOpAdd:
  7027. case glslang::EOpAddAssign:
  7028. if (isFloat)
  7029. binOp = spv::Op::OpFAdd;
  7030. else
  7031. binOp = spv::Op::OpIAdd;
  7032. break;
  7033. case glslang::EOpSub:
  7034. case glslang::EOpSubAssign:
  7035. if (isFloat)
  7036. binOp = spv::Op::OpFSub;
  7037. else
  7038. binOp = spv::Op::OpISub;
  7039. break;
  7040. case glslang::EOpMul:
  7041. case glslang::EOpMulAssign:
  7042. if (isFloat)
  7043. binOp = spv::Op::OpFMul;
  7044. else
  7045. binOp = spv::Op::OpIMul;
  7046. break;
  7047. case glslang::EOpVectorTimesScalar:
  7048. case glslang::EOpVectorTimesScalarAssign:
  7049. if (isFloat && (builder.isVector(left) || builder.isVector(right) || builder.isCooperativeVector(left) || builder.isCooperativeVector(right))) {
  7050. if (builder.isVector(right) || builder.isCooperativeVector(right))
  7051. std::swap(left, right);
  7052. assert(builder.isScalar(right));
  7053. needMatchingVectors = false;
  7054. binOp = spv::Op::OpVectorTimesScalar;
  7055. } else if (isFloat) {
  7056. binOp = spv::Op::OpFMul;
  7057. } else if (builder.isCooperativeVector(left) || builder.isCooperativeVector(right)) {
  7058. if (builder.isCooperativeVector(right))
  7059. std::swap(left, right);
  7060. assert(builder.isScalar(right));
  7061. // Construct a cooperative vector from the scalar
  7062. right = builder.createCompositeConstruct(builder.getTypeId(left), { right });
  7063. binOp = spv::Op::OpIMul;
  7064. } else {
  7065. binOp = spv::Op::OpIMul;
  7066. }
  7067. break;
  7068. case glslang::EOpVectorTimesMatrix:
  7069. case glslang::EOpVectorTimesMatrixAssign:
  7070. binOp = spv::Op::OpVectorTimesMatrix;
  7071. break;
  7072. case glslang::EOpMatrixTimesVector:
  7073. binOp = spv::Op::OpMatrixTimesVector;
  7074. break;
  7075. case glslang::EOpMatrixTimesScalar:
  7076. case glslang::EOpMatrixTimesScalarAssign:
  7077. binOp = spv::Op::OpMatrixTimesScalar;
  7078. break;
  7079. case glslang::EOpMatrixTimesMatrix:
  7080. case glslang::EOpMatrixTimesMatrixAssign:
  7081. binOp = spv::Op::OpMatrixTimesMatrix;
  7082. break;
  7083. case glslang::EOpOuterProduct:
  7084. binOp = spv::Op::OpOuterProduct;
  7085. needMatchingVectors = false;
  7086. break;
  7087. case glslang::EOpDiv:
  7088. case glslang::EOpDivAssign:
  7089. if (isFloat)
  7090. binOp = spv::Op::OpFDiv;
  7091. else if (isUnsigned)
  7092. binOp = spv::Op::OpUDiv;
  7093. else
  7094. binOp = spv::Op::OpSDiv;
  7095. break;
  7096. case glslang::EOpMod:
  7097. case glslang::EOpModAssign:
  7098. if (isFloat)
  7099. binOp = spv::Op::OpFMod;
  7100. else if (isUnsigned)
  7101. binOp = spv::Op::OpUMod;
  7102. else
  7103. binOp = spv::Op::OpSMod;
  7104. break;
  7105. case glslang::EOpRightShift:
  7106. case glslang::EOpRightShiftAssign:
  7107. if (isUnsigned)
  7108. binOp = spv::Op::OpShiftRightLogical;
  7109. else
  7110. binOp = spv::Op::OpShiftRightArithmetic;
  7111. break;
  7112. case glslang::EOpLeftShift:
  7113. case glslang::EOpLeftShiftAssign:
  7114. binOp = spv::Op::OpShiftLeftLogical;
  7115. break;
  7116. case glslang::EOpAnd:
  7117. case glslang::EOpAndAssign:
  7118. binOp = spv::Op::OpBitwiseAnd;
  7119. break;
  7120. case glslang::EOpLogicalAnd:
  7121. needMatchingVectors = false;
  7122. binOp = spv::Op::OpLogicalAnd;
  7123. break;
  7124. case glslang::EOpInclusiveOr:
  7125. case glslang::EOpInclusiveOrAssign:
  7126. binOp = spv::Op::OpBitwiseOr;
  7127. break;
  7128. case glslang::EOpLogicalOr:
  7129. needMatchingVectors = false;
  7130. binOp = spv::Op::OpLogicalOr;
  7131. break;
  7132. case glslang::EOpExclusiveOr:
  7133. case glslang::EOpExclusiveOrAssign:
  7134. binOp = spv::Op::OpBitwiseXor;
  7135. break;
  7136. case glslang::EOpLogicalXor:
  7137. needMatchingVectors = false;
  7138. binOp = spv::Op::OpLogicalNotEqual;
  7139. break;
  7140. case glslang::EOpAbsDifference:
  7141. binOp = isUnsigned ? spv::Op::OpAbsUSubINTEL : spv::Op::OpAbsISubINTEL;
  7142. break;
  7143. case glslang::EOpAddSaturate:
  7144. binOp = isUnsigned ? spv::Op::OpUAddSatINTEL : spv::Op::OpIAddSatINTEL;
  7145. break;
  7146. case glslang::EOpSubSaturate:
  7147. binOp = isUnsigned ? spv::Op::OpUSubSatINTEL : spv::Op::OpISubSatINTEL;
  7148. break;
  7149. case glslang::EOpAverage:
  7150. binOp = isUnsigned ? spv::Op::OpUAverageINTEL : spv::Op::OpIAverageINTEL;
  7151. break;
  7152. case glslang::EOpAverageRounded:
  7153. binOp = isUnsigned ? spv::Op::OpUAverageRoundedINTEL : spv::Op::OpIAverageRoundedINTEL;
  7154. break;
  7155. case glslang::EOpMul32x16:
  7156. binOp = isUnsigned ? spv::Op::OpUMul32x16INTEL : spv::Op::OpIMul32x16INTEL;
  7157. break;
  7158. case glslang::EOpExpectEXT:
  7159. binOp = spv::Op::OpExpectKHR;
  7160. break;
  7161. case glslang::EOpLessThan:
  7162. case glslang::EOpGreaterThan:
  7163. case glslang::EOpLessThanEqual:
  7164. case glslang::EOpGreaterThanEqual:
  7165. case glslang::EOpEqual:
  7166. case glslang::EOpNotEqual:
  7167. case glslang::EOpVectorEqual:
  7168. case glslang::EOpVectorNotEqual:
  7169. comparison = true;
  7170. break;
  7171. default:
  7172. break;
  7173. }
  7174. // handle mapped binary operations (should be non-comparison)
  7175. if (binOp != spv::Op::OpNop) {
  7176. assert(comparison == false);
  7177. if (builder.isMatrix(left) || builder.isMatrix(right) ||
  7178. builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))
  7179. return createBinaryMatrixOperation(binOp, decorations, typeId, left, right);
  7180. // No matrix involved; make both operands be the same number of components, if needed
  7181. if (needMatchingVectors)
  7182. builder.promoteScalar(decorations.precision, left, right);
  7183. spv::Id result = builder.createBinOp(binOp, typeId, left, right);
  7184. decorations.addNoContraction(builder, result);
  7185. decorations.addNonUniform(builder, result);
  7186. return builder.setPrecision(result, decorations.precision);
  7187. }
  7188. if (! comparison)
  7189. return 0;
  7190. // Handle comparison instructions
  7191. if (reduceComparison && (op == glslang::EOpEqual || op == glslang::EOpNotEqual)
  7192. && (builder.isVector(left) || builder.isMatrix(left) || builder.isAggregate(left))) {
  7193. spv::Id result = builder.createCompositeCompare(decorations.precision, left, right, op == glslang::EOpEqual);
  7194. decorations.addNonUniform(builder, result);
  7195. return result;
  7196. }
  7197. switch (op) {
  7198. case glslang::EOpLessThan:
  7199. if (isFloat)
  7200. binOp = spv::Op::OpFOrdLessThan;
  7201. else if (isUnsigned)
  7202. binOp = spv::Op::OpULessThan;
  7203. else
  7204. binOp = spv::Op::OpSLessThan;
  7205. break;
  7206. case glslang::EOpGreaterThan:
  7207. if (isFloat)
  7208. binOp = spv::Op::OpFOrdGreaterThan;
  7209. else if (isUnsigned)
  7210. binOp = spv::Op::OpUGreaterThan;
  7211. else
  7212. binOp = spv::Op::OpSGreaterThan;
  7213. break;
  7214. case glslang::EOpLessThanEqual:
  7215. if (isFloat)
  7216. binOp = spv::Op::OpFOrdLessThanEqual;
  7217. else if (isUnsigned)
  7218. binOp = spv::Op::OpULessThanEqual;
  7219. else
  7220. binOp = spv::Op::OpSLessThanEqual;
  7221. break;
  7222. case glslang::EOpGreaterThanEqual:
  7223. if (isFloat)
  7224. binOp = spv::Op::OpFOrdGreaterThanEqual;
  7225. else if (isUnsigned)
  7226. binOp = spv::Op::OpUGreaterThanEqual;
  7227. else
  7228. binOp = spv::Op::OpSGreaterThanEqual;
  7229. break;
  7230. case glslang::EOpEqual:
  7231. case glslang::EOpVectorEqual:
  7232. if (isFloat)
  7233. binOp = spv::Op::OpFOrdEqual;
  7234. else if (isBool)
  7235. binOp = spv::Op::OpLogicalEqual;
  7236. else
  7237. binOp = spv::Op::OpIEqual;
  7238. break;
  7239. case glslang::EOpNotEqual:
  7240. case glslang::EOpVectorNotEqual:
  7241. if (isFloat)
  7242. binOp = spv::Op::OpFUnordNotEqual;
  7243. else if (isBool)
  7244. binOp = spv::Op::OpLogicalNotEqual;
  7245. else
  7246. binOp = spv::Op::OpINotEqual;
  7247. break;
  7248. default:
  7249. break;
  7250. }
  7251. if (binOp != spv::Op::OpNop) {
  7252. spv::Id result = builder.createBinOp(binOp, typeId, left, right);
  7253. decorations.addNoContraction(builder, result);
  7254. decorations.addNonUniform(builder, result);
  7255. return builder.setPrecision(result, decorations.precision);
  7256. }
  7257. return 0;
  7258. }
  7259. //
  7260. // Translate AST matrix operation to SPV operation, already having SPV-based operands/types.
  7261. // These can be any of:
  7262. //
  7263. // matrix * scalar
  7264. // scalar * matrix
  7265. // matrix * matrix linear algebraic
  7266. // matrix * vector
  7267. // vector * matrix
  7268. // matrix * matrix componentwise
  7269. // matrix op matrix op in {+, -, /}
  7270. // matrix op scalar op in {+, -, /}
  7271. // scalar op matrix op in {+, -, /}
  7272. //
  7273. spv::Id TGlslangToSpvTraverser::createBinaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,
  7274. spv::Id left, spv::Id right)
  7275. {
  7276. bool firstClass = true;
  7277. // First, handle first-class matrix operations (* and matrix/scalar)
  7278. switch (op) {
  7279. case spv::Op::OpFDiv:
  7280. if (builder.isMatrix(left) && builder.isScalar(right)) {
  7281. // turn matrix / scalar into a multiply...
  7282. spv::Id resultType = builder.getTypeId(right);
  7283. right = builder.createBinOp(spv::Op::OpFDiv, resultType, builder.makeFpConstant(resultType, 1.0), right);
  7284. op = spv::Op::OpMatrixTimesScalar;
  7285. } else
  7286. firstClass = false;
  7287. break;
  7288. case spv::Op::OpMatrixTimesScalar:
  7289. if (builder.isMatrix(right) || builder.isCooperativeMatrix(right))
  7290. std::swap(left, right);
  7291. assert(builder.isScalar(right));
  7292. break;
  7293. case spv::Op::OpVectorTimesMatrix:
  7294. assert(builder.isVector(left));
  7295. assert(builder.isMatrix(right));
  7296. break;
  7297. case spv::Op::OpMatrixTimesVector:
  7298. assert(builder.isMatrix(left));
  7299. assert(builder.isVector(right));
  7300. break;
  7301. case spv::Op::OpMatrixTimesMatrix:
  7302. assert(builder.isMatrix(left));
  7303. assert(builder.isMatrix(right));
  7304. break;
  7305. default:
  7306. firstClass = false;
  7307. break;
  7308. }
  7309. if (builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))
  7310. firstClass = true;
  7311. if (firstClass) {
  7312. spv::Id result = builder.createBinOp(op, typeId, left, right);
  7313. decorations.addNoContraction(builder, result);
  7314. decorations.addNonUniform(builder, result);
  7315. return builder.setPrecision(result, decorations.precision);
  7316. }
  7317. // Handle component-wise +, -, *, %, and / for all combinations of type.
  7318. // The result type of all of them is the same type as the (a) matrix operand.
  7319. // The algorithm is to:
  7320. // - break the matrix(es) into vectors
  7321. // - smear any scalar to a vector
  7322. // - do vector operations
  7323. // - make a matrix out the vector results
  7324. switch (op) {
  7325. case spv::Op::OpFAdd:
  7326. case spv::Op::OpFSub:
  7327. case spv::Op::OpFDiv:
  7328. case spv::Op::OpFMod:
  7329. case spv::Op::OpFMul:
  7330. {
  7331. // one time set up...
  7332. bool leftMat = builder.isMatrix(left);
  7333. bool rightMat = builder.isMatrix(right);
  7334. unsigned int numCols = leftMat ? builder.getNumColumns(left) : builder.getNumColumns(right);
  7335. int numRows = leftMat ? builder.getNumRows(left) : builder.getNumRows(right);
  7336. spv::Id scalarType = builder.getScalarTypeId(typeId);
  7337. spv::Id vecType = builder.makeVectorType(scalarType, numRows);
  7338. std::vector<spv::Id> results;
  7339. spv::Id smearVec = spv::NoResult;
  7340. if (builder.isScalar(left))
  7341. smearVec = builder.smearScalar(decorations.precision, left, vecType);
  7342. else if (builder.isScalar(right))
  7343. smearVec = builder.smearScalar(decorations.precision, right, vecType);
  7344. // do each vector op
  7345. for (unsigned int c = 0; c < numCols; ++c) {
  7346. std::vector<unsigned int> indexes;
  7347. indexes.push_back(c);
  7348. spv::Id leftVec = leftMat ? builder.createCompositeExtract( left, vecType, indexes) : smearVec;
  7349. spv::Id rightVec = rightMat ? builder.createCompositeExtract(right, vecType, indexes) : smearVec;
  7350. spv::Id result = builder.createBinOp(op, vecType, leftVec, rightVec);
  7351. decorations.addNoContraction(builder, result);
  7352. decorations.addNonUniform(builder, result);
  7353. results.push_back(builder.setPrecision(result, decorations.precision));
  7354. }
  7355. // put the pieces together
  7356. spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);
  7357. decorations.addNonUniform(builder, result);
  7358. return result;
  7359. }
  7360. default:
  7361. assert(0);
  7362. return spv::NoResult;
  7363. }
  7364. }
  //
  // Translate an AST unary operation to SPIR-V, given an operand that is already a SPIR-V id.
  //
  // The switch below selects either a core opcode (unaryOp) or an entry of an
  // extended-instruction set (libCall); the instruction is emitted after the switch.
  // A few operator families never reach that point and return directly from the switch:
  //   - float negation with a matrix result type -> createUnaryMatrixOperation()
  //   - atomic-counter operations                -> createAtomicOperation()
  //   - the *Invocations* operators              -> createInvocationsOperation()
  //   - the Subgroup* operators                  -> createSubgroupOperation()
  //
  // op                  - AST operator to translate
  // decorations         - precision / NoContraction / NonUniform to apply to the result;
  //                       decorations.precision is overwritten for the tile-image
  //                       depth/stencil attachment reads
  // typeId              - SPIR-V result type
  // operand             - SPIR-V id of the single operand
  // typeProxy           - basic type used to choose float / signed / unsigned variants
  // lvalueCoherentFlags - only forwarded to createAtomicOperation()
  // opType              - only forwarded to createAtomicOperation()
  //
  // Returns the id of the decorated result, or 0 when 'op' is not handled here.
  //
  7365. spv::Id TGlslangToSpvTraverser::createUnaryOperation(glslang::TOperator op, OpDecorations& decorations, spv::Id typeId,
  7366. spv::Id operand, glslang::TBasicType typeProxy, const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
  7367. const glslang::TType &opType)
  7368. {
  // unaryOp: core opcode to emit when no extended instruction was selected
  7369. spv::Op unaryOp = spv::Op::OpNop;
  // extBuiltins: extended-instruction set to call into; -1 means use stdBuiltins
  7370. int extBuiltins = -1;
  // libCall: extended-instruction number; -1 means emit unaryOp instead
  7371. int libCall = -1;
  7372. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  7373. bool isFloat = isTypeFloat(typeProxy);
  7374. switch (op) {
  7375. case glslang::EOpNegative:
  7376. if (isFloat) {
  7377. unaryOp = spv::Op::OpFNegate;
  // a matrix result is handed off to createUnaryMatrixOperation()
  7378. if (builder.isMatrixType(typeId))
  7379. return createUnaryMatrixOperation(unaryOp, decorations, typeId, operand, typeProxy);
  7380. } else
  7381. unaryOp = spv::Op::OpSNegate;
  7382. break;
  7383. case glslang::EOpLogicalNot:
  7384. case glslang::EOpVectorLogicalNot:
  7385. unaryOp = spv::Op::OpLogicalNot;
  7386. break;
  7387. case glslang::EOpBitwiseNot:
  7388. unaryOp = spv::Op::OpNot;
  7389. break;
  7390. case glslang::EOpDeterminant:
  7391. libCall = spv::GLSLstd450Determinant;
  7392. break;
  7393. case glslang::EOpMatrixInverse:
  7394. libCall = spv::GLSLstd450MatrixInverse;
  7395. break;
  7396. case glslang::EOpTranspose:
  7397. unaryOp = spv::Op::OpTranspose;
  7398. break;
  7399. case glslang::EOpRadians:
  7400. libCall = spv::GLSLstd450Radians;
  7401. break;
  7402. case glslang::EOpDegrees:
  7403. libCall = spv::GLSLstd450Degrees;
  7404. break;
  7405. case glslang::EOpSin:
  7406. libCall = spv::GLSLstd450Sin;
  7407. break;
  7408. case glslang::EOpCos:
  7409. libCall = spv::GLSLstd450Cos;
  7410. break;
  7411. case glslang::EOpTan:
  7412. libCall = spv::GLSLstd450Tan;
  7413. break;
  7414. case glslang::EOpAcos:
  7415. libCall = spv::GLSLstd450Acos;
  7416. break;
  7417. case glslang::EOpAsin:
  7418. libCall = spv::GLSLstd450Asin;
  7419. break;
  7420. case glslang::EOpAtan:
  7421. libCall = spv::GLSLstd450Atan;
  7422. break;
  7423. case glslang::EOpAcosh:
  7424. libCall = spv::GLSLstd450Acosh;
  7425. break;
  7426. case glslang::EOpAsinh:
  7427. libCall = spv::GLSLstd450Asinh;
  7428. break;
  7429. case glslang::EOpAtanh:
  7430. libCall = spv::GLSLstd450Atanh;
  7431. break;
  7432. case glslang::EOpTanh:
  7433. libCall = spv::GLSLstd450Tanh;
  7434. break;
  7435. case glslang::EOpCosh:
  7436. libCall = spv::GLSLstd450Cosh;
  7437. break;
  7438. case glslang::EOpSinh:
  7439. libCall = spv::GLSLstd450Sinh;
  7440. break;
  7441. case glslang::EOpLength:
  7442. libCall = spv::GLSLstd450Length;
  7443. break;
  7444. case glslang::EOpNormalize:
  7445. libCall = spv::GLSLstd450Normalize;
  7446. break;
  7447. case glslang::EOpExp:
  7448. libCall = spv::GLSLstd450Exp;
  7449. break;
  7450. case glslang::EOpLog:
  7451. libCall = spv::GLSLstd450Log;
  7452. break;
  7453. case glslang::EOpExp2:
  7454. libCall = spv::GLSLstd450Exp2;
  7455. break;
  7456. case glslang::EOpLog2:
  7457. libCall = spv::GLSLstd450Log2;
  7458. break;
  7459. case glslang::EOpSqrt:
  7460. libCall = spv::GLSLstd450Sqrt;
  7461. break;
  7462. case glslang::EOpInverseSqrt:
  7463. libCall = spv::GLSLstd450InverseSqrt;
  7464. break;
  7465. case glslang::EOpFloor:
  7466. libCall = spv::GLSLstd450Floor;
  7467. break;
  7468. case glslang::EOpTrunc:
  7469. libCall = spv::GLSLstd450Trunc;
  7470. break;
  7471. case glslang::EOpRound:
  7472. libCall = spv::GLSLstd450Round;
  7473. break;
  7474. case glslang::EOpRoundEven:
  7475. libCall = spv::GLSLstd450RoundEven;
  7476. break;
  7477. case glslang::EOpCeil:
  7478. libCall = spv::GLSLstd450Ceil;
  7479. break;
  7480. case glslang::EOpFract:
  7481. libCall = spv::GLSLstd450Fract;
  7482. break;
  7483. case glslang::EOpIsNan:
  7484. unaryOp = spv::Op::OpIsNan;
  7485. break;
  7486. case glslang::EOpIsInf:
  7487. unaryOp = spv::Op::OpIsInf;
  7488. break;
  7489. case glslang::EOpIsFinite:
  7490. unaryOp = spv::Op::OpIsFinite;
  7491. break;
  // all of the *BitsTo* reinterpretations are emitted as OpBitcast
  7492. case glslang::EOpFloatBitsToInt:
  7493. case glslang::EOpFloatBitsToUint:
  7494. case glslang::EOpIntBitsToFloat:
  7495. case glslang::EOpUintBitsToFloat:
  7496. case glslang::EOpDoubleBitsToInt64:
  7497. case glslang::EOpDoubleBitsToUint64:
  7498. case glslang::EOpInt64BitsToDouble:
  7499. case glslang::EOpUint64BitsToDouble:
  7500. case glslang::EOpFloat16BitsToInt16:
  7501. case glslang::EOpFloat16BitsToUint16:
  7502. case glslang::EOpInt16BitsToFloat16:
  7503. case glslang::EOpUint16BitsToFloat16:
  7504. unaryOp = spv::Op::OpBitcast;
  7505. break;
  7506. case glslang::EOpPackSnorm2x16:
  7507. libCall = spv::GLSLstd450PackSnorm2x16;
  7508. break;
  7509. case glslang::EOpUnpackSnorm2x16:
  7510. libCall = spv::GLSLstd450UnpackSnorm2x16;
  7511. break;
  7512. case glslang::EOpPackUnorm2x16:
  7513. libCall = spv::GLSLstd450PackUnorm2x16;
  7514. break;
  7515. case glslang::EOpUnpackUnorm2x16:
  7516. libCall = spv::GLSLstd450UnpackUnorm2x16;
  7517. break;
  7518. case glslang::EOpPackHalf2x16:
  7519. libCall = spv::GLSLstd450PackHalf2x16;
  7520. break;
  7521. case glslang::EOpUnpackHalf2x16:
  7522. libCall = spv::GLSLstd450UnpackHalf2x16;
  7523. break;
  7524. case glslang::EOpPackSnorm4x8:
  7525. libCall = spv::GLSLstd450PackSnorm4x8;
  7526. break;
  7527. case glslang::EOpUnpackSnorm4x8:
  7528. libCall = spv::GLSLstd450UnpackSnorm4x8;
  7529. break;
  7530. case glslang::EOpPackUnorm4x8:
  7531. libCall = spv::GLSLstd450PackUnorm4x8;
  7532. break;
  7533. case glslang::EOpUnpackUnorm4x8:
  7534. libCall = spv::GLSLstd450UnpackUnorm4x8;
  7535. break;
  7536. case glslang::EOpPackDouble2x32:
  7537. libCall = spv::GLSLstd450PackDouble2x32;
  7538. break;
  7539. case glslang::EOpUnpackDouble2x32:
  7540. libCall = spv::GLSLstd450UnpackDouble2x32;
  7541. break;
  // the remaining pack/unpack operators are emitted as OpBitcast
  7542. case glslang::EOpPackInt2x32:
  7543. case glslang::EOpUnpackInt2x32:
  7544. case glslang::EOpPackUint2x32:
  7545. case glslang::EOpUnpackUint2x32:
  7546. case glslang::EOpPack16:
  7547. case glslang::EOpPack32:
  7548. case glslang::EOpPack64:
  7549. case glslang::EOpUnpack32:
  7550. case glslang::EOpUnpack16:
  7551. case glslang::EOpUnpack8:
  7552. case glslang::EOpPackInt2x16:
  7553. case glslang::EOpUnpackInt2x16:
  7554. case glslang::EOpPackUint2x16:
  7555. case glslang::EOpUnpackUint2x16:
  7556. case glslang::EOpPackInt4x16:
  7557. case glslang::EOpUnpackInt4x16:
  7558. case glslang::EOpPackUint4x16:
  7559. case glslang::EOpUnpackUint4x16:
  7560. case glslang::EOpPackFloat2x16:
  7561. case glslang::EOpUnpackFloat2x16:
  7562. unaryOp = spv::Op::OpBitcast;
  7563. break;
  7564. case glslang::EOpDPdx:
  7565. unaryOp = spv::Op::OpDPdx;
  7566. break;
  7567. case glslang::EOpDPdy:
  7568. unaryOp = spv::Op::OpDPdy;
  7569. break;
  7570. case glslang::EOpFwidth:
  7571. unaryOp = spv::Op::OpFwidth;
  7572. break;
  7573. case glslang::EOpAny:
  7574. unaryOp = spv::Op::OpAny;
  7575. break;
  7576. case glslang::EOpAll:
  7577. unaryOp = spv::Op::OpAll;
  7578. break;
  7579. case glslang::EOpAbs:
  7580. if (isFloat)
  7581. libCall = spv::GLSLstd450FAbs;
  7582. else
  7583. libCall = spv::GLSLstd450SAbs;
  7584. break;
  7585. case glslang::EOpSign:
  7586. if (isFloat)
  7587. libCall = spv::GLSLstd450FSign;
  7588. else
  7589. libCall = spv::GLSLstd450SSign;
  7590. break;
  7591. case glslang::EOpDPdxFine:
  7592. unaryOp = spv::Op::OpDPdxFine;
  7593. break;
  7594. case glslang::EOpDPdyFine:
  7595. unaryOp = spv::Op::OpDPdyFine;
  7596. break;
  7597. case glslang::EOpFwidthFine:
  7598. unaryOp = spv::Op::OpFwidthFine;
  7599. break;
  7600. case glslang::EOpDPdxCoarse:
  7601. unaryOp = spv::Op::OpDPdxCoarse;
  7602. break;
  7603. case glslang::EOpDPdyCoarse:
  7604. unaryOp = spv::Op::OpDPdyCoarse;
  7605. break;
  7606. case glslang::EOpFwidthCoarse:
  7607. unaryOp = spv::Op::OpFwidthCoarse;
  7608. break;
  7609. case glslang::EOpRayQueryProceed:
  7610. unaryOp = spv::Op::OpRayQueryProceedKHR;
  7611. break;
  7612. case glslang::EOpRayQueryGetRayTMin:
  7613. unaryOp = spv::Op::OpRayQueryGetRayTMinKHR;
  7614. break;
  7615. case glslang::EOpRayQueryGetRayFlags:
  7616. unaryOp = spv::Op::OpRayQueryGetRayFlagsKHR;
  7617. break;
  7618. case glslang::EOpRayQueryGetWorldRayOrigin:
  7619. unaryOp = spv::Op::OpRayQueryGetWorldRayOriginKHR;
  7620. break;
  7621. case glslang::EOpRayQueryGetWorldRayDirection:
  7622. unaryOp = spv::Op::OpRayQueryGetWorldRayDirectionKHR;
  7623. break;
  7624. case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
  7625. unaryOp = spv::Op::OpRayQueryGetIntersectionCandidateAABBOpaqueKHR;
  7626. break;
  7627. case glslang::EOpInterpolateAtCentroid:
  // a 16-bit float operand additionally declares the AMD half-float extension
  7628. if (typeProxy == glslang::EbtFloat16)
  7629. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  7630. libCall = spv::GLSLstd450InterpolateAtCentroid;
  7631. break;
  7632. case glslang::EOpAtomicCounterIncrement:
  7633. case glslang::EOpAtomicCounterDecrement:
  7634. case glslang::EOpAtomicCounter:
  7635. {
  7636. // Handle all of the atomics in one place, in createAtomicOperation()
  7637. std::vector<spv::Id> operands;
  7638. operands.push_back(operand);
  7639. return createAtomicOperation(op, decorations.precision, typeId, operands, typeProxy, lvalueCoherentFlags, opType);
  7640. }
  7641. case glslang::EOpBitFieldReverse:
  7642. unaryOp = spv::Op::OpBitReverse;
  7643. break;
  7644. case glslang::EOpBitCount:
  7645. unaryOp = spv::Op::OpBitCount;
  7646. break;
  7647. case glslang::EOpFindLSB:
  7648. libCall = spv::GLSLstd450FindILsb;
  7649. break;
  7650. case glslang::EOpFindMSB:
  7651. if (isUnsigned)
  7652. libCall = spv::GLSLstd450FindUMsb;
  7653. else
  7654. libCall = spv::GLSLstd450FindSMsb;
  7655. break;
  7656. case glslang::EOpCountLeadingZeros:
  7657. builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
  7658. builder.addExtension("SPV_INTEL_shader_integer_functions2");
  7659. unaryOp = spv::Op::OpUCountLeadingZerosINTEL;
  7660. break;
  7661. case glslang::EOpCountTrailingZeros:
  7662. builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
  7663. builder.addExtension("SPV_INTEL_shader_integer_functions2");
  7664. unaryOp = spv::Op::OpUCountTrailingZerosINTEL;
  7665. break;
  // the invocation-group operators are all forwarded to createInvocationsOperation()
  7666. case glslang::EOpBallot:
  7667. case glslang::EOpReadFirstInvocation:
  7668. case glslang::EOpAnyInvocation:
  7669. case glslang::EOpAllInvocations:
  7670. case glslang::EOpAllInvocationsEqual:
  7671. case glslang::EOpMinInvocations:
  7672. case glslang::EOpMaxInvocations:
  7673. case glslang::EOpAddInvocations:
  7674. case glslang::EOpMinInvocationsNonUniform:
  7675. case glslang::EOpMaxInvocationsNonUniform:
  7676. case glslang::EOpAddInvocationsNonUniform:
  7677. case glslang::EOpMinInvocationsInclusiveScan:
  7678. case glslang::EOpMaxInvocationsInclusiveScan:
  7679. case glslang::EOpAddInvocationsInclusiveScan:
  7680. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  7681. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  7682. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  7683. case glslang::EOpMinInvocationsExclusiveScan:
  7684. case glslang::EOpMaxInvocationsExclusiveScan:
  7685. case glslang::EOpAddInvocationsExclusiveScan:
  7686. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  7687. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  7688. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  7689. {
  7690. std::vector<spv::Id> operands;
  7691. operands.push_back(operand);
  7692. return createInvocationsOperation(op, typeId, operands, typeProxy);
  7693. }
  // the single-operand subgroup operators are all forwarded to createSubgroupOperation()
  7694. case glslang::EOpSubgroupAll:
  7695. case glslang::EOpSubgroupAny:
  7696. case glslang::EOpSubgroupAllEqual:
  7697. case glslang::EOpSubgroupBroadcastFirst:
  7698. case glslang::EOpSubgroupBallot:
  7699. case glslang::EOpSubgroupInverseBallot:
  7700. case glslang::EOpSubgroupBallotBitCount:
  7701. case glslang::EOpSubgroupBallotInclusiveBitCount:
  7702. case glslang::EOpSubgroupBallotExclusiveBitCount:
  7703. case glslang::EOpSubgroupBallotFindLSB:
  7704. case glslang::EOpSubgroupBallotFindMSB:
  7705. case glslang::EOpSubgroupAdd:
  7706. case glslang::EOpSubgroupMul:
  7707. case glslang::EOpSubgroupMin:
  7708. case glslang::EOpSubgroupMax:
  7709. case glslang::EOpSubgroupAnd:
  7710. case glslang::EOpSubgroupOr:
  7711. case glslang::EOpSubgroupXor:
  7712. case glslang::EOpSubgroupInclusiveAdd:
  7713. case glslang::EOpSubgroupInclusiveMul:
  7714. case glslang::EOpSubgroupInclusiveMin:
  7715. case glslang::EOpSubgroupInclusiveMax:
  7716. case glslang::EOpSubgroupInclusiveAnd:
  7717. case glslang::EOpSubgroupInclusiveOr:
  7718. case glslang::EOpSubgroupInclusiveXor:
  7719. case glslang::EOpSubgroupExclusiveAdd:
  7720. case glslang::EOpSubgroupExclusiveMul:
  7721. case glslang::EOpSubgroupExclusiveMin:
  7722. case glslang::EOpSubgroupExclusiveMax:
  7723. case glslang::EOpSubgroupExclusiveAnd:
  7724. case glslang::EOpSubgroupExclusiveOr:
  7725. case glslang::EOpSubgroupExclusiveXor:
  7726. case glslang::EOpSubgroupQuadSwapHorizontal:
  7727. case glslang::EOpSubgroupQuadSwapVertical:
  7728. case glslang::EOpSubgroupQuadSwapDiagonal:
  7729. case glslang::EOpSubgroupQuadAll:
  7730. case glslang::EOpSubgroupQuadAny: {
  7731. std::vector<spv::Id> operands;
  7732. operands.push_back(operand);
  7733. return createSubgroupOperation(op, typeId, operands, typeProxy);
  7734. }
  // the AMD operators below call into a non-default extended-instruction set (extBuiltins)
  7735. case glslang::EOpMbcnt:
  7736. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  7737. libCall = spv::MbcntAMD;
  7738. break;
  7739. case glslang::EOpCubeFaceIndex:
  7740. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);
  7741. libCall = spv::CubeFaceIndexAMD;
  7742. break;
  7743. case glslang::EOpCubeFaceCoord:
  7744. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);
  7745. libCall = spv::CubeFaceCoordAMD;
  7746. break;
  7747. case glslang::EOpSubgroupPartition:
  7748. unaryOp = spv::Op::OpGroupNonUniformPartitionNV;
  7749. break;
  7750. case glslang::EOpConstructReference:
  7751. unaryOp = spv::Op::OpBitcast;
  7752. break;
  7753. case glslang::EOpConvUint64ToAccStruct:
  7754. case glslang::EOpConvUvec2ToAccStruct:
  7755. unaryOp = spv::Op::OpConvertUToAccelerationStructureKHR;
  7756. break;
  // hit-object queries: each NV / EXT operator maps to the same-named SPIR-V opcode
  7757. case glslang::EOpHitObjectIsEmptyNV:
  7758. unaryOp = spv::Op::OpHitObjectIsEmptyNV;
  7759. break;
  7760. case glslang::EOpHitObjectIsEmptyEXT:
  7761. unaryOp = spv::Op::OpHitObjectIsEmptyEXT;
  7762. break;
  7763. case glslang::EOpHitObjectIsMissNV:
  7764. unaryOp = spv::Op::OpHitObjectIsMissNV;
  7765. break;
  7766. case glslang::EOpHitObjectIsMissEXT:
  7767. unaryOp = spv::Op::OpHitObjectIsMissEXT;
  7768. break;
  7769. case glslang::EOpHitObjectIsHitNV:
  7770. unaryOp = spv::Op::OpHitObjectIsHitNV;
  7771. break;
  7772. case glslang::EOpHitObjectIsHitEXT:
  7773. unaryOp = spv::Op::OpHitObjectIsHitEXT;
  7774. break;
  7775. case glslang::EOpHitObjectGetObjectRayOriginNV:
  7776. unaryOp = spv::Op::OpHitObjectGetObjectRayOriginNV;
  7777. break;
  7778. case glslang::EOpHitObjectGetObjectRayOriginEXT:
  7779. unaryOp = spv::Op::OpHitObjectGetObjectRayOriginEXT;
  7780. break;
  7781. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  7782. unaryOp = spv::Op::OpHitObjectGetObjectRayDirectionNV;
  7783. break;
  7784. case glslang::EOpHitObjectGetObjectRayDirectionEXT:
  7785. unaryOp = spv::Op::OpHitObjectGetObjectRayDirectionEXT;
  7786. break;
  7787. case glslang::EOpHitObjectGetWorldRayOriginNV:
  7788. unaryOp = spv::Op::OpHitObjectGetWorldRayOriginNV;
  7789. break;
  7790. case glslang::EOpHitObjectGetWorldRayOriginEXT:
  7791. unaryOp = spv::Op::OpHitObjectGetWorldRayOriginEXT;
  7792. break;
  7793. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  7794. unaryOp = spv::Op::OpHitObjectGetWorldRayDirectionNV;
  7795. break;
  7796. case glslang::EOpHitObjectGetWorldRayDirectionEXT:
  7797. unaryOp = spv::Op::OpHitObjectGetWorldRayDirectionEXT;
  7798. break;
  7799. case glslang::EOpHitObjectGetObjectToWorldNV:
  7800. unaryOp = spv::Op::OpHitObjectGetObjectToWorldNV;
  7801. break;
  7802. case glslang::EOpHitObjectGetObjectToWorldEXT:
  7803. unaryOp = spv::Op::OpHitObjectGetObjectToWorldEXT;
  7804. break;
  7805. case glslang::EOpHitObjectGetWorldToObjectNV:
  7806. unaryOp = spv::Op::OpHitObjectGetWorldToObjectNV;
  7807. break;
  7808. case glslang::EOpHitObjectGetWorldToObjectEXT:
  7809. unaryOp = spv::Op::OpHitObjectGetWorldToObjectEXT;
  7810. break;
  7811. case glslang::EOpHitObjectGetRayTMinNV:
  7812. unaryOp = spv::Op::OpHitObjectGetRayTMinNV;
  7813. break;
  7814. case glslang::EOpHitObjectGetRayTMinEXT:
  7815. unaryOp = spv::Op::OpHitObjectGetRayTMinEXT;
  7816. break;
  7817. case glslang::EOpHitObjectGetRayTMaxNV:
  7818. unaryOp = spv::Op::OpHitObjectGetRayTMaxNV;
  7819. break;
  7820. case glslang::EOpHitObjectGetRayTMaxEXT:
  7821. unaryOp = spv::Op::OpHitObjectGetRayTMaxEXT;
  7822. break;
  7823. case glslang::EOpHitObjectGetRayFlagsEXT:
  7824. unaryOp = spv::Op::OpHitObjectGetRayFlagsEXT;
  7825. break;
  7826. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  7827. unaryOp = spv::Op::OpHitObjectGetPrimitiveIndexNV;
  7828. break;
  7829. case glslang::EOpHitObjectGetPrimitiveIndexEXT:
  7830. unaryOp = spv::Op::OpHitObjectGetPrimitiveIndexEXT;
  7831. break;
  7832. case glslang::EOpHitObjectGetInstanceIdNV:
  7833. unaryOp = spv::Op::OpHitObjectGetInstanceIdNV;
  7834. break;
  7835. case glslang::EOpHitObjectGetInstanceIdEXT:
  7836. unaryOp = spv::Op::OpHitObjectGetInstanceIdEXT;
  7837. break;
  7838. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  7839. unaryOp = spv::Op::OpHitObjectGetInstanceCustomIndexNV;
  7840. break;
  7841. case glslang::EOpHitObjectGetInstanceCustomIndexEXT:
  7842. unaryOp = spv::Op::OpHitObjectGetInstanceCustomIndexEXT;
  7843. break;
  7844. case glslang::EOpHitObjectGetGeometryIndexNV:
  7845. unaryOp = spv::Op::OpHitObjectGetGeometryIndexNV;
  7846. break;
  7847. case glslang::EOpHitObjectGetGeometryIndexEXT:
  7848. unaryOp = spv::Op::OpHitObjectGetGeometryIndexEXT;
  7849. break;
  7850. case glslang::EOpHitObjectGetHitKindNV:
  7851. unaryOp = spv::Op::OpHitObjectGetHitKindNV;
  7852. break;
  7853. case glslang::EOpHitObjectGetHitKindEXT:
  7854. unaryOp = spv::Op::OpHitObjectGetHitKindEXT;
  7855. break;
  7856. case glslang::EOpHitObjectGetCurrentTimeNV:
  7857. unaryOp = spv::Op::OpHitObjectGetCurrentTimeNV;
  7858. break;
  7859. case glslang::EOpHitObjectGetCurrentTimeEXT:
  7860. unaryOp = spv::Op::OpHitObjectGetCurrentTimeEXT;
  7861. break;
  7862. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  7863. unaryOp = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexNV;
  7864. break;
  7865. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:
  7866. unaryOp = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexEXT;
  7867. break;
  7868. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  7869. unaryOp = spv::Op::OpHitObjectGetShaderRecordBufferHandleNV;
  7870. break;
  // the following NV hit-object queries also declare the extension and capabilities they require
  7871. case glslang::EOpHitObjectGetClusterIdNV:
  7872. unaryOp = spv::Op::OpHitObjectGetClusterIdNV;
  7873. builder.addExtension(spv::E_SPV_NV_cluster_acceleration_structure);
  7874. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7875. builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
  7876. break;
  7877. case glslang::EOpHitObjectGetSpherePositionNV:
  7878. unaryOp = spv::Op::OpHitObjectGetSpherePositionNV;
  7879. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7880. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7881. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  7882. break;
  7883. case glslang::EOpHitObjectGetSphereRadiusNV:
  7884. unaryOp = spv::Op::OpHitObjectGetSphereRadiusNV;
  7885. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7886. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7887. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  7888. break;
  7889. case glslang::EOpHitObjectIsSphereHitNV:
  7890. unaryOp = spv::Op::OpHitObjectIsSphereHitNV;
  7891. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7892. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7893. builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
  7894. break;
  7895. case glslang::EOpHitObjectIsLSSHitNV:
  7896. unaryOp = spv::Op::OpHitObjectIsLSSHitNV;
  7897. builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
  7898. builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
  7899. builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
  7900. break;
  7901. case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:
  7902. unaryOp = spv::Op::OpHitObjectGetShaderRecordBufferHandleEXT;
  7903. break;
  7904. case glslang::EOpFetchMicroTriangleVertexPositionNV:
  7905. unaryOp = spv::Op::OpFetchMicroTriangleVertexPositionNV;
  7906. break;
  7907. case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
  7908. unaryOp = spv::Op::OpFetchMicroTriangleVertexBarycentricNV;
  7909. break;
  7910. case glslang::EOpCopyObject:
  7911. unaryOp = spv::Op::OpCopyObject;
  7912. break;
  // tile-image attachment reads override the caller-supplied precision:
  // depth reads use no precision decoration, stencil reads use RelaxedPrecision
  7913. case glslang::EOpDepthAttachmentReadEXT:
  7914. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  7915. builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
  7916. unaryOp = spv::Op::OpDepthAttachmentReadEXT;
  7917. decorations.precision = spv::NoPrecision;
  7918. break;
  7919. case glslang::EOpStencilAttachmentReadEXT:
  7920. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  7921. builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
  7922. unaryOp = spv::Op::OpStencilAttachmentReadEXT;
  7923. decorations.precision = spv::Decoration::RelaxedPrecision;
  7924. break;
  // not a unary operator handled here: report that with a 0 id
  7925. default:
  7926. return 0;
  7927. }
  // emit either the extended-instruction call or the core instruction chosen above
  7928. spv::Id id;
  7929. if (libCall >= 0) {
  7930. std::vector<spv::Id> args;
  7931. args.push_back(operand);
  7932. id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, args);
  7933. } else {
  7934. id = builder.createUnaryOp(unaryOp, typeId, operand);
  7935. }
  // decorate the result and hand it back
  7936. decorations.addNoContraction(builder, id);
  7937. decorations.addNonUniform(builder, id);
  7938. return builder.setPrecision(id, decorations.precision);
  7939. }
  7940. // Create a unary operation on a matrix
  7941. spv::Id TGlslangToSpvTraverser::createUnaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,
  7942. spv::Id operand, glslang::TBasicType /* typeProxy */)
  7943. {
  7944. // Handle unary operations vector by vector.
  7945. // The result type is the same type as the original type.
  7946. // The algorithm is to:
  7947. // - break the matrix into vectors
  7948. // - apply the operation to each vector
  7949. // - make a matrix out the vector results
  7950. // get the types sorted out
  7951. int numCols = builder.getNumColumns(operand);
  7952. int numRows = builder.getNumRows(operand);
  7953. spv::Id srcVecType = builder.makeVectorType(builder.getScalarTypeId(builder.getTypeId(operand)), numRows);
  7954. spv::Id destVecType = builder.makeVectorType(builder.getScalarTypeId(typeId), numRows);
  7955. std::vector<spv::Id> results;
  7956. // do each vector op
  7957. for (int c = 0; c < numCols; ++c) {
  7958. std::vector<unsigned int> indexes;
  7959. indexes.push_back(c);
  7960. spv::Id srcVec = builder.createCompositeExtract(operand, srcVecType, indexes);
  7961. spv::Id destVec = builder.createUnaryOp(op, destVecType, srcVec);
  7962. decorations.addNoContraction(builder, destVec);
  7963. decorations.addNonUniform(builder, destVec);
  7964. results.push_back(builder.setPrecision(destVec, decorations.precision));
  7965. }
  7966. // put the pieces together
  7967. spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);
  7968. decorations.addNonUniform(builder, result);
  7969. return result;
  7970. }
  7971. // For converting integers where both the bitwidth and the signedness could
  7972. // change, but only do the width change here. The caller is still responsible
  7973. // for the signedness conversion.
  7974. // destType is the final type that will be converted to, but this function
  7975. // may only be doing part of that conversion.
  7976. spv::Id TGlslangToSpvTraverser::createIntWidthConversion(spv::Id operand, int vectorSize, spv::Id destType,
  7977. glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType)
  7978. {
  7979. // Get the result type width, based on the type to convert to.
  7980. int width = GetNumBits(resultBasicType);
  7981. // Get the conversion operation and result type,
  7982. // based on the target width, but the source type.
  7983. spv::Id type = spv::NoType;
  7984. spv::Op convOp = spv::Op::OpNop;
  7985. if (isTypeSignedInt(operandBasicType)) {
  7986. convOp = spv::Op::OpSConvert;
  7987. type = builder.makeIntType(width);
  7988. } else {
  7989. convOp = spv::Op::OpUConvert;
  7990. type = builder.makeUintType(width);
  7991. }
  7992. if (builder.getOpCode(destType) == spv::Op::OpTypeCooperativeVectorNV) {
  7993. type = builder.makeCooperativeVectorTypeNV(type, builder.getCooperativeVectorNumComponents(destType));
  7994. } else if (vectorSize > 0)
  7995. type = builder.makeVectorType(type, vectorSize);
  7996. else if (builder.getOpCode(destType) == spv::Op::OpTypeCooperativeMatrixKHR ||
  7997. builder.getOpCode(destType) == spv::Op::OpTypeCooperativeMatrixNV) {
  7998. type = builder.makeCooperativeMatrixTypeWithSameShape(type, destType);
  7999. }
  8000. return builder.createUnaryOp(convOp, type, operand);
  8001. }
  8002. spv::Id TGlslangToSpvTraverser::createConversion(glslang::TOperator op, OpDecorations& decorations, spv::Id destType,
  8003. spv::Id operand, glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType)
  8004. {
  8005. spv::Op convOp = spv::Op::OpNop;
  8006. spv::Id zero = 0;
  8007. spv::Id one = 0;
  8008. int vectorSize = builder.isVectorType(destType) ? builder.getNumTypeComponents(destType) : 0;
  8009. if (IsOpNumericConv(op) || op == glslang::EOpConstructSaturated) {
  8010. if (isTypeSignedInt(operandBasicType) && isTypeFloat(resultBasicType)) {
  8011. convOp = spv::Op::OpConvertSToF;
  8012. }
  8013. if (isTypeUnsignedInt(operandBasicType) && isTypeFloat(resultBasicType)) {
  8014. convOp = spv::Op::OpConvertUToF;
  8015. }
  8016. if (isTypeFloat(operandBasicType) && isTypeSignedInt(resultBasicType)) {
  8017. convOp = spv::Op::OpConvertFToS;
  8018. }
  8019. if (isTypeFloat(operandBasicType) && isTypeUnsignedInt(resultBasicType)) {
  8020. convOp = spv::Op::OpConvertFToU;
  8021. }
  8022. if (isTypeSignedInt(operandBasicType) && isTypeSignedInt(resultBasicType)) {
  8023. convOp = spv::Op::OpSConvert;
  8024. }
  8025. if (isTypeUnsignedInt(operandBasicType) && isTypeUnsignedInt(resultBasicType)) {
  8026. convOp = spv::Op::OpUConvert;
  8027. }
  8028. if (isTypeFloat(operandBasicType) && isTypeFloat(resultBasicType)) {
  8029. convOp = spv::Op::OpFConvert;
  8030. if (builder.isMatrixType(destType))
  8031. return createUnaryMatrixOperation(convOp, decorations, destType, operand, operandBasicType);
  8032. }
  8033. if (isTypeInt(operandBasicType) && isTypeInt(resultBasicType) &&
  8034. isTypeUnsignedInt(operandBasicType) != isTypeUnsignedInt(resultBasicType)) {
  8035. if (GetNumBits(operandBasicType) != GetNumBits(resultBasicType)) {
  8036. // OpSConvert/OpUConvert + OpBitCast
  8037. operand = createIntWidthConversion(operand, vectorSize, destType, resultBasicType, operandBasicType);
  8038. }
  8039. if (builder.isInSpecConstCodeGenMode()) {
  8040. uint32_t bits = GetNumBits(resultBasicType);
  8041. spv::Id zeroType = builder.makeUintType(bits);
  8042. if (bits == 64) {
  8043. zero = builder.makeInt64Constant(zeroType, 0, false);
  8044. } else {
  8045. zero = builder.makeIntConstant(zeroType, 0, false);
  8046. }
  8047. zero = makeSmearedConstant(zero, vectorSize);
  8048. // Use OpIAdd, instead of OpBitcast to do the conversion when
  8049. // generating for OpSpecConstantOp instruction.
  8050. return builder.createBinOp(spv::Op::OpIAdd, destType, operand, zero);
  8051. }
  8052. // For normal run-time conversion instruction, use OpBitcast.
  8053. convOp = spv::Op::OpBitcast;
  8054. }
  8055. if (resultBasicType == glslang::EbtBool) {
  8056. uint32_t bits = GetNumBits(operandBasicType);
  8057. if (isTypeInt(operandBasicType)) {
  8058. spv::Id zeroType = builder.makeUintType(bits);
  8059. if (bits == 64) {
  8060. zero = builder.makeInt64Constant(zeroType, 0, false);
  8061. } else {
  8062. zero = builder.makeIntConstant(zeroType, 0, false);
  8063. }
  8064. zero = makeSmearedConstant(zero, vectorSize);
  8065. return builder.createBinOp(spv::Op::OpINotEqual, destType, operand, zero);
  8066. } else {
  8067. assert(isTypeFloat(operandBasicType));
  8068. if (bits == 64) {
  8069. zero = builder.makeDoubleConstant(0.0);
  8070. } else if (bits == 32) {
  8071. zero = builder.makeFloatConstant(0.0);
  8072. } else {
  8073. assert(bits == 16);
  8074. zero = builder.makeFloat16Constant(0.0);
  8075. }
  8076. zero = makeSmearedConstant(zero, vectorSize);
  8077. return builder.createBinOp(spv::Op::OpFUnordNotEqual, destType, operand, zero);
  8078. }
  8079. }
  8080. if (operandBasicType == glslang::EbtBool) {
  8081. uint32_t bits = GetNumBits(resultBasicType);
  8082. convOp = spv::Op::OpSelect;
  8083. if (isTypeInt(resultBasicType)) {
  8084. spv::Id zeroType = isTypeSignedInt(resultBasicType) ? builder.makeIntType(bits) : builder.makeUintType(bits);
  8085. if (bits == 64) {
  8086. zero = builder.makeInt64Constant(zeroType, 0, false);
  8087. one = builder.makeInt64Constant(zeroType, 1, false);
  8088. } else {
  8089. zero = builder.makeIntConstant(zeroType, 0, false);
  8090. one = builder.makeIntConstant(zeroType, 1, false);
  8091. }
  8092. } else {
  8093. assert(isTypeFloat(resultBasicType));
  8094. if (bits == 64) {
  8095. zero = builder.makeDoubleConstant(0.0);
  8096. one = builder.makeDoubleConstant(1.0);
  8097. } else if (bits == 32) {
  8098. zero = builder.makeFloatConstant(0.0);
  8099. one = builder.makeFloatConstant(1.0);
  8100. } else {
  8101. assert(bits == 16);
  8102. zero = builder.makeFloat16Constant(0.0);
  8103. one = builder.makeFloat16Constant(1.0);
  8104. }
  8105. }
  8106. }
  8107. }
  8108. if (convOp == spv::Op::OpNop) {
  8109. switch (op) {
  8110. case glslang::EOpConvUint64ToPtr:
  8111. convOp = spv::Op::OpConvertUToPtr;
  8112. break;
  8113. case glslang::EOpConvPtrToUint64:
  8114. convOp = spv::Op::OpConvertPtrToU;
  8115. break;
  8116. case glslang::EOpConvPtrToUvec2:
  8117. case glslang::EOpConvUvec2ToPtr:
  8118. convOp = spv::Op::OpBitcast;
  8119. break;
  8120. default:
  8121. break;
  8122. }
  8123. }
  8124. spv::Id result = 0;
  8125. if (convOp == spv::Op::OpNop)
  8126. return result;
  8127. if (convOp == spv::Op::OpSelect) {
  8128. zero = makeSmearedConstant(zero, vectorSize);
  8129. one = makeSmearedConstant(one, vectorSize);
  8130. result = builder.createTriOp(convOp, destType, operand, one, zero);
  8131. } else
  8132. result = builder.createUnaryOp(convOp, destType, operand);
  8133. result = builder.setPrecision(result, decorations.precision);
  8134. decorations.addNonUniform(builder, result);
  8135. return result;
  8136. }
  8137. spv::Id TGlslangToSpvTraverser::makeSmearedConstant(spv::Id constant, int vectorSize)
  8138. {
  8139. if (vectorSize == 0)
  8140. return constant;
  8141. spv::Id vectorTypeId = builder.makeVectorType(builder.getTypeId(constant), vectorSize);
  8142. std::vector<spv::Id> components;
  8143. for (int c = 0; c < vectorSize; ++c)
  8144. components.push_back(constant);
  8145. return builder.makeCompositeConstant(vectorTypeId, components);
  8146. }
  8147. // For glslang ops that map to SPV atomic opCodes
  8148. spv::Id TGlslangToSpvTraverser::createAtomicOperation(glslang::TOperator op, spv::Decoration /*precision*/,
  8149. spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy,
  8150. const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags, const glslang::TType &opType)
  8151. {
  8152. spv::Op opCode = spv::Op::OpNop;
  8153. switch (op) {
  8154. case glslang::EOpAtomicAdd:
  8155. case glslang::EOpImageAtomicAdd:
  8156. case glslang::EOpAtomicCounterAdd:
  8157. opCode = spv::Op::OpAtomicIAdd;
  8158. if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
  8159. opCode = spv::Op::OpAtomicFAddEXT;
  8160. if (typeProxy == glslang::EbtFloat16 &&
  8161. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  8162. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  8163. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  8164. } else {
  8165. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_add);
  8166. if (typeProxy == glslang::EbtFloat16) {
  8167. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float16_add);
  8168. builder.addCapability(spv::Capability::AtomicFloat16AddEXT);
  8169. } else if (typeProxy == glslang::EbtFloat) {
  8170. builder.addCapability(spv::Capability::AtomicFloat32AddEXT);
  8171. } else {
  8172. builder.addCapability(spv::Capability::AtomicFloat64AddEXT);
  8173. }
  8174. }
  8175. }
  8176. break;
  8177. case glslang::EOpAtomicSubtract:
  8178. case glslang::EOpAtomicCounterSubtract:
  8179. opCode = spv::Op::OpAtomicISub;
  8180. break;
  8181. case glslang::EOpAtomicMin:
  8182. case glslang::EOpImageAtomicMin:
  8183. case glslang::EOpAtomicCounterMin:
  8184. if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
  8185. opCode = spv::Op::OpAtomicFMinEXT;
  8186. if (typeProxy == glslang::EbtFloat16 &&
  8187. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  8188. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  8189. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  8190. } else {
  8191. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_min_max);
  8192. if (typeProxy == glslang::EbtFloat16)
  8193. builder.addCapability(spv::Capability::AtomicFloat16MinMaxEXT);
  8194. else if (typeProxy == glslang::EbtFloat)
  8195. builder.addCapability(spv::Capability::AtomicFloat32MinMaxEXT);
  8196. else
  8197. builder.addCapability(spv::Capability::AtomicFloat64MinMaxEXT);
  8198. }
  8199. } else if (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) {
  8200. opCode = spv::Op::OpAtomicUMin;
  8201. } else {
  8202. opCode = spv::Op::OpAtomicSMin;
  8203. }
  8204. break;
  8205. case glslang::EOpAtomicMax:
  8206. case glslang::EOpImageAtomicMax:
  8207. case glslang::EOpAtomicCounterMax:
  8208. if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
  8209. opCode = spv::Op::OpAtomicFMaxEXT;
  8210. if (typeProxy == glslang::EbtFloat16 &&
  8211. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  8212. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  8213. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  8214. } else {
  8215. builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_min_max);
  8216. if (typeProxy == glslang::EbtFloat16)
  8217. builder.addCapability(spv::Capability::AtomicFloat16MinMaxEXT);
  8218. else if (typeProxy == glslang::EbtFloat)
  8219. builder.addCapability(spv::Capability::AtomicFloat32MinMaxEXT);
  8220. else
  8221. builder.addCapability(spv::Capability::AtomicFloat64MinMaxEXT);
  8222. }
  8223. } else if (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) {
  8224. opCode = spv::Op::OpAtomicUMax;
  8225. } else {
  8226. opCode = spv::Op::OpAtomicSMax;
  8227. }
  8228. break;
  8229. case glslang::EOpAtomicAnd:
  8230. case glslang::EOpImageAtomicAnd:
  8231. case glslang::EOpAtomicCounterAnd:
  8232. opCode = spv::Op::OpAtomicAnd;
  8233. break;
  8234. case glslang::EOpAtomicOr:
  8235. case glslang::EOpImageAtomicOr:
  8236. case glslang::EOpAtomicCounterOr:
  8237. opCode = spv::Op::OpAtomicOr;
  8238. break;
  8239. case glslang::EOpAtomicXor:
  8240. case glslang::EOpImageAtomicXor:
  8241. case glslang::EOpAtomicCounterXor:
  8242. opCode = spv::Op::OpAtomicXor;
  8243. break;
  8244. case glslang::EOpAtomicExchange:
  8245. case glslang::EOpImageAtomicExchange:
  8246. case glslang::EOpAtomicCounterExchange:
  8247. if ((typeProxy == glslang::EbtFloat16) &&
  8248. (opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
  8249. builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
  8250. builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
  8251. }
  8252. opCode = spv::Op::OpAtomicExchange;
  8253. break;
  8254. case glslang::EOpAtomicCompSwap:
  8255. case glslang::EOpImageAtomicCompSwap:
  8256. case glslang::EOpAtomicCounterCompSwap:
  8257. opCode = spv::Op::OpAtomicCompareExchange;
  8258. break;
  8259. case glslang::EOpAtomicCounterIncrement:
  8260. opCode = spv::Op::OpAtomicIIncrement;
  8261. break;
  8262. case glslang::EOpAtomicCounterDecrement:
  8263. opCode = spv::Op::OpAtomicIDecrement;
  8264. break;
  8265. case glslang::EOpAtomicCounter:
  8266. case glslang::EOpImageAtomicLoad:
  8267. case glslang::EOpAtomicLoad:
  8268. opCode = spv::Op::OpAtomicLoad;
  8269. break;
  8270. case glslang::EOpAtomicStore:
  8271. case glslang::EOpImageAtomicStore:
  8272. opCode = spv::Op::OpAtomicStore;
  8273. break;
  8274. default:
  8275. assert(0);
  8276. break;
  8277. }
  8278. if (typeProxy == glslang::EbtInt64 || typeProxy == glslang::EbtUint64)
  8279. builder.addCapability(spv::Capability::Int64Atomics);
  8280. // Sort out the operands
  8281. // - mapping from glslang -> SPV
  8282. // - there are extra SPV operands that are optional in glslang
  8283. // - compare-exchange swaps the value and comparator
  8284. // - compare-exchange has an extra memory semantics
  8285. // - EOpAtomicCounterDecrement needs a post decrement
  8286. spv::Id pointerId = 0, compareId = 0, valueId = 0;
  8287. // scope defaults to Device in the old model, QueueFamilyKHR in the new model
  8288. spv::Id scopeId;
  8289. if (glslangIntermediate->usingVulkanMemoryModel()) {
  8290. scopeId = builder.makeUintConstant(spv::Scope::QueueFamilyKHR);
  8291. } else {
  8292. scopeId = builder.makeUintConstant(spv::Scope::Device);
  8293. }
  8294. // semantics default to relaxed
  8295. spv::Id semanticsId = builder.makeUintConstant(lvalueCoherentFlags.isVolatile() &&
  8296. glslangIntermediate->usingVulkanMemoryModel() ?
  8297. spv::MemorySemanticsMask::Volatile :
  8298. spv::MemorySemanticsMask::MaskNone);
  8299. spv::Id semanticsId2 = semanticsId;
  8300. pointerId = operands[0];
  8301. if (opCode == spv::Op::OpAtomicIIncrement || opCode == spv::Op::OpAtomicIDecrement) {
  8302. // no additional operands
  8303. } else if (opCode == spv::Op::OpAtomicCompareExchange) {
  8304. compareId = operands[1];
  8305. valueId = operands[2];
  8306. if (operands.size() > 3) {
  8307. scopeId = operands[3];
  8308. semanticsId = builder.makeUintConstant(
  8309. builder.getConstantScalar(operands[4]) | builder.getConstantScalar(operands[5]));
  8310. semanticsId2 = builder.makeUintConstant(
  8311. builder.getConstantScalar(operands[6]) | builder.getConstantScalar(operands[7]));
  8312. }
  8313. } else if (opCode == spv::Op::OpAtomicLoad) {
  8314. if (operands.size() > 1) {
  8315. scopeId = operands[1];
  8316. semanticsId = builder.makeUintConstant(
  8317. builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));
  8318. }
  8319. } else {
  8320. // atomic store or RMW
  8321. valueId = operands[1];
  8322. if (operands.size() > 2) {
  8323. scopeId = operands[2];
  8324. semanticsId = builder.makeUintConstant
  8325. (builder.getConstantScalar(operands[3]) | builder.getConstantScalar(operands[4]));
  8326. }
  8327. }
  8328. // Check for capabilities
  8329. auto const semanticsImmediate = (spv::MemorySemanticsMask)(builder.getConstantScalar(semanticsId) | builder.getConstantScalar(semanticsId2));
  8330. if (anySet(semanticsImmediate, spv::MemorySemanticsMask::MakeAvailableKHR |
  8331. spv::MemorySemanticsMask::MakeVisibleKHR |
  8332. spv::MemorySemanticsMask::OutputMemoryKHR |
  8333. spv::MemorySemanticsMask::Volatile)) {
  8334. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  8335. }
  8336. auto const scope = (spv::Scope)builder.getConstantScalar(scopeId);
  8337. if (scope == spv::Scope::QueueFamily) {
  8338. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  8339. }
  8340. if (glslangIntermediate->usingVulkanMemoryModel() && scope == spv::Scope::Device) {
  8341. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  8342. }
  8343. std::vector<spv::Id> spvAtomicOperands; // hold the spv operands
  8344. spvAtomicOperands.reserve(6);
  8345. spvAtomicOperands.push_back(pointerId);
  8346. spvAtomicOperands.push_back(scopeId);
  8347. spvAtomicOperands.push_back(semanticsId);
  8348. if (opCode == spv::Op::OpAtomicCompareExchange) {
  8349. spvAtomicOperands.push_back(semanticsId2);
  8350. spvAtomicOperands.push_back(valueId);
  8351. spvAtomicOperands.push_back(compareId);
  8352. } else if (opCode != spv::Op::OpAtomicLoad && opCode != spv::Op::OpAtomicIIncrement && opCode != spv::Op::OpAtomicIDecrement) {
  8353. spvAtomicOperands.push_back(valueId);
  8354. }
  8355. if (opCode == spv::Op::OpAtomicStore) {
  8356. builder.createNoResultOp(opCode, spvAtomicOperands);
  8357. return 0;
  8358. } else {
  8359. spv::Id resultId = builder.createOp(opCode, typeId, spvAtomicOperands);
  8360. // GLSL and HLSL atomic-counter decrement return post-decrement value,
  8361. // while SPIR-V returns pre-decrement value. Translate between these semantics.
  8362. if (op == glslang::EOpAtomicCounterDecrement)
  8363. resultId = builder.createBinOp(spv::Op::OpISub, typeId, resultId, builder.makeIntConstant(1));
  8364. return resultId;
  8365. }
  8366. }
  8367. // Create group invocation operations.
  8368. spv::Id TGlslangToSpvTraverser::createInvocationsOperation(glslang::TOperator op, spv::Id typeId,
  8369. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  8370. {
  8371. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  8372. bool isFloat = isTypeFloat(typeProxy);
  8373. spv::Op opCode = spv::Op::OpNop;
  8374. std::vector<spv::IdImmediate> spvGroupOperands;
  8375. spv::GroupOperation groupOperation = spv::GroupOperation::Max;
  8376. if (op == glslang::EOpBallot || op == glslang::EOpReadFirstInvocation ||
  8377. op == glslang::EOpReadInvocation) {
  8378. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  8379. builder.addCapability(spv::Capability::SubgroupBallotKHR);
  8380. } else if (op == glslang::EOpAnyInvocation ||
  8381. op == glslang::EOpAllInvocations ||
  8382. op == glslang::EOpAllInvocationsEqual) {
  8383. builder.addExtension(spv::E_SPV_KHR_subgroup_vote);
  8384. builder.addCapability(spv::Capability::SubgroupVoteKHR);
  8385. } else {
  8386. builder.addCapability(spv::Capability::Groups);
  8387. if (op == glslang::EOpMinInvocationsNonUniform ||
  8388. op == glslang::EOpMaxInvocationsNonUniform ||
  8389. op == glslang::EOpAddInvocationsNonUniform ||
  8390. op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||
  8391. op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||
  8392. op == glslang::EOpAddInvocationsInclusiveScanNonUniform ||
  8393. op == glslang::EOpMinInvocationsExclusiveScanNonUniform ||
  8394. op == glslang::EOpMaxInvocationsExclusiveScanNonUniform ||
  8395. op == glslang::EOpAddInvocationsExclusiveScanNonUniform)
  8396. builder.addExtension(spv::E_SPV_AMD_shader_ballot);
  8397. switch (op) {
  8398. case glslang::EOpMinInvocations:
  8399. case glslang::EOpMaxInvocations:
  8400. case glslang::EOpAddInvocations:
  8401. case glslang::EOpMinInvocationsNonUniform:
  8402. case glslang::EOpMaxInvocationsNonUniform:
  8403. case glslang::EOpAddInvocationsNonUniform:
  8404. groupOperation = spv::GroupOperation::Reduce;
  8405. break;
  8406. case glslang::EOpMinInvocationsInclusiveScan:
  8407. case glslang::EOpMaxInvocationsInclusiveScan:
  8408. case glslang::EOpAddInvocationsInclusiveScan:
  8409. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  8410. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  8411. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  8412. groupOperation = spv::GroupOperation::InclusiveScan;
  8413. break;
  8414. case glslang::EOpMinInvocationsExclusiveScan:
  8415. case glslang::EOpMaxInvocationsExclusiveScan:
  8416. case glslang::EOpAddInvocationsExclusiveScan:
  8417. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  8418. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  8419. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  8420. groupOperation = spv::GroupOperation::ExclusiveScan;
  8421. break;
  8422. default:
  8423. break;
  8424. }
  8425. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8426. spvGroupOperands.push_back(scope);
  8427. if (groupOperation != spv::GroupOperation::Max) {
  8428. spv::IdImmediate groupOp = { false, (unsigned)groupOperation };
  8429. spvGroupOperands.push_back(groupOp);
  8430. }
  8431. }
  8432. for (auto opIt = operands.begin(); opIt != operands.end(); ++opIt) {
  8433. spv::IdImmediate op = { true, *opIt };
  8434. spvGroupOperands.push_back(op);
  8435. }
  8436. switch (op) {
  8437. case glslang::EOpAnyInvocation:
  8438. opCode = spv::Op::OpSubgroupAnyKHR;
  8439. break;
  8440. case glslang::EOpAllInvocations:
  8441. opCode = spv::Op::OpSubgroupAllKHR;
  8442. break;
  8443. case glslang::EOpAllInvocationsEqual:
  8444. opCode = spv::Op::OpSubgroupAllEqualKHR;
  8445. break;
  8446. case glslang::EOpReadInvocation:
  8447. opCode = spv::Op::OpSubgroupReadInvocationKHR;
  8448. if (builder.isVectorType(typeId))
  8449. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  8450. break;
  8451. case glslang::EOpReadFirstInvocation:
  8452. opCode = spv::Op::OpSubgroupFirstInvocationKHR;
  8453. if (builder.isVectorType(typeId))
  8454. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  8455. break;
  8456. case glslang::EOpBallot:
  8457. {
  8458. // NOTE: According to the spec, the result type of "OpSubgroupBallotKHR" must be a 4 component vector of 32
  8459. // bit integer types. The GLSL built-in function "ballotARB()" assumes the maximum number of invocations in
  8460. // a subgroup is 64. Thus, we have to convert uvec4.xy to uint64_t as follow:
  8461. //
  8462. // result = Bitcast(SubgroupBallotKHR(Predicate).xy)
  8463. //
  8464. spv::Id uintType = builder.makeUintType(32);
  8465. spv::Id uvec4Type = builder.makeVectorType(uintType, 4);
  8466. spv::Id result = builder.createOp(spv::Op::OpSubgroupBallotKHR, uvec4Type, spvGroupOperands);
  8467. std::vector<spv::Id> components;
  8468. components.push_back(builder.createCompositeExtract(result, uintType, 0));
  8469. components.push_back(builder.createCompositeExtract(result, uintType, 1));
  8470. spv::Id uvec2Type = builder.makeVectorType(uintType, 2);
  8471. return builder.createUnaryOp(spv::Op::OpBitcast, typeId,
  8472. builder.createCompositeConstruct(uvec2Type, components));
  8473. }
  8474. case glslang::EOpMinInvocations:
  8475. case glslang::EOpMaxInvocations:
  8476. case glslang::EOpAddInvocations:
  8477. case glslang::EOpMinInvocationsInclusiveScan:
  8478. case glslang::EOpMaxInvocationsInclusiveScan:
  8479. case glslang::EOpAddInvocationsInclusiveScan:
  8480. case glslang::EOpMinInvocationsExclusiveScan:
  8481. case glslang::EOpMaxInvocationsExclusiveScan:
  8482. case glslang::EOpAddInvocationsExclusiveScan:
  8483. if (op == glslang::EOpMinInvocations ||
  8484. op == glslang::EOpMinInvocationsInclusiveScan ||
  8485. op == glslang::EOpMinInvocationsExclusiveScan) {
  8486. if (isFloat)
  8487. opCode = spv::Op::OpGroupFMin;
  8488. else {
  8489. if (isUnsigned)
  8490. opCode = spv::Op::OpGroupUMin;
  8491. else
  8492. opCode = spv::Op::OpGroupSMin;
  8493. }
  8494. } else if (op == glslang::EOpMaxInvocations ||
  8495. op == glslang::EOpMaxInvocationsInclusiveScan ||
  8496. op == glslang::EOpMaxInvocationsExclusiveScan) {
  8497. if (isFloat)
  8498. opCode = spv::Op::OpGroupFMax;
  8499. else {
  8500. if (isUnsigned)
  8501. opCode = spv::Op::OpGroupUMax;
  8502. else
  8503. opCode = spv::Op::OpGroupSMax;
  8504. }
  8505. } else {
  8506. if (isFloat)
  8507. opCode = spv::Op::OpGroupFAdd;
  8508. else
  8509. opCode = spv::Op::OpGroupIAdd;
  8510. }
  8511. if (builder.isVectorType(typeId))
  8512. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  8513. break;
  8514. case glslang::EOpMinInvocationsNonUniform:
  8515. case glslang::EOpMaxInvocationsNonUniform:
  8516. case glslang::EOpAddInvocationsNonUniform:
  8517. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  8518. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  8519. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  8520. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  8521. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  8522. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  8523. if (op == glslang::EOpMinInvocationsNonUniform ||
  8524. op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||
  8525. op == glslang::EOpMinInvocationsExclusiveScanNonUniform) {
  8526. if (isFloat)
  8527. opCode = spv::Op::OpGroupFMinNonUniformAMD;
  8528. else {
  8529. if (isUnsigned)
  8530. opCode = spv::Op::OpGroupUMinNonUniformAMD;
  8531. else
  8532. opCode = spv::Op::OpGroupSMinNonUniformAMD;
  8533. }
  8534. }
  8535. else if (op == glslang::EOpMaxInvocationsNonUniform ||
  8536. op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||
  8537. op == glslang::EOpMaxInvocationsExclusiveScanNonUniform) {
  8538. if (isFloat)
  8539. opCode = spv::Op::OpGroupFMaxNonUniformAMD;
  8540. else {
  8541. if (isUnsigned)
  8542. opCode = spv::Op::OpGroupUMaxNonUniformAMD;
  8543. else
  8544. opCode = spv::Op::OpGroupSMaxNonUniformAMD;
  8545. }
  8546. }
  8547. else {
  8548. if (isFloat)
  8549. opCode = spv::Op::OpGroupFAddNonUniformAMD;
  8550. else
  8551. opCode = spv::Op::OpGroupIAddNonUniformAMD;
  8552. }
  8553. if (builder.isVectorType(typeId))
  8554. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  8555. break;
  8556. default:
  8557. logger->missingFunctionality("invocation operation");
  8558. return spv::NoResult;
  8559. }
  8560. assert(opCode != spv::Op::OpNop);
  8561. return builder.createOp(opCode, typeId, spvGroupOperands);
  8562. }
  8563. // Create group invocation operations on a vector
  8564. spv::Id TGlslangToSpvTraverser::CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,
  8565. spv::Id typeId, std::vector<spv::Id>& operands)
  8566. {
  8567. assert(op == spv::Op::OpGroupFMin || op == spv::Op::OpGroupUMin || op == spv::Op::OpGroupSMin ||
  8568. op == spv::Op::OpGroupFMax || op == spv::Op::OpGroupUMax || op == spv::Op::OpGroupSMax ||
  8569. op == spv::Op::OpGroupFAdd || op == spv::Op::OpGroupIAdd || op == spv::Op::OpGroupBroadcast ||
  8570. op == spv::Op::OpSubgroupReadInvocationKHR || op == spv::Op::OpSubgroupFirstInvocationKHR ||
  8571. op == spv::Op::OpGroupFMinNonUniformAMD || op == spv::Op::OpGroupUMinNonUniformAMD ||
  8572. op == spv::Op::OpGroupSMinNonUniformAMD ||
  8573. op == spv::Op::OpGroupFMaxNonUniformAMD || op == spv::Op::OpGroupUMaxNonUniformAMD ||
  8574. op == spv::Op::OpGroupSMaxNonUniformAMD ||
  8575. op == spv::Op::OpGroupFAddNonUniformAMD || op == spv::Op::OpGroupIAddNonUniformAMD);
  8576. // Handle group invocation operations scalar by scalar.
  8577. // The result type is the same type as the original type.
  8578. // The algorithm is to:
  8579. // - break the vector into scalars
  8580. // - apply the operation to each scalar
  8581. // - make a vector out the scalar results
  8582. // get the types sorted out
  8583. int numComponents = builder.getNumComponents(operands[0]);
  8584. spv::Id scalarType = builder.getScalarTypeId(builder.getTypeId(operands[0]));
  8585. std::vector<spv::Id> results;
  8586. // do each scalar op
  8587. for (int comp = 0; comp < numComponents; ++comp) {
  8588. std::vector<unsigned int> indexes;
  8589. indexes.push_back(comp);
  8590. spv::IdImmediate scalar = { true, builder.createCompositeExtract(operands[0], scalarType, indexes) };
  8591. std::vector<spv::IdImmediate> spvGroupOperands;
  8592. if (op == spv::Op::OpSubgroupReadInvocationKHR) {
  8593. spvGroupOperands.push_back(scalar);
  8594. spv::IdImmediate operand = { true, operands[1] };
  8595. spvGroupOperands.push_back(operand);
  8596. } else if (op == spv::Op::OpSubgroupFirstInvocationKHR) {
  8597. spvGroupOperands.push_back(scalar);
  8598. } else if (op == spv::Op::OpGroupBroadcast) {
  8599. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8600. spvGroupOperands.push_back(scope);
  8601. spvGroupOperands.push_back(scalar);
  8602. spv::IdImmediate operand = { true, operands[1] };
  8603. spvGroupOperands.push_back(operand);
  8604. } else {
  8605. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8606. spvGroupOperands.push_back(scope);
  8607. spv::IdImmediate groupOp = { false, (unsigned)groupOperation };
  8608. spvGroupOperands.push_back(groupOp);
  8609. spvGroupOperands.push_back(scalar);
  8610. }
  8611. results.push_back(builder.createOp(op, scalarType, spvGroupOperands));
  8612. }
  8613. // put the pieces together
  8614. return builder.createCompositeConstruct(typeId, results);
  8615. }
  8616. // Create subgroup invocation operations.
  8617. spv::Id TGlslangToSpvTraverser::createSubgroupOperation(glslang::TOperator op, spv::Id typeId,
  8618. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  8619. {
  8620. // Add the required capabilities.
  8621. switch (op) {
  8622. case glslang::EOpSubgroupElect:
  8623. builder.addCapability(spv::Capability::GroupNonUniform);
  8624. break;
  8625. case glslang::EOpSubgroupQuadAll:
  8626. case glslang::EOpSubgroupQuadAny:
  8627. builder.addExtension(spv::E_SPV_KHR_quad_control);
  8628. builder.addCapability(spv::Capability::QuadControlKHR);
  8629. [[fallthrough]];
  8630. case glslang::EOpSubgroupAll:
  8631. case glslang::EOpSubgroupAny:
  8632. case glslang::EOpSubgroupAllEqual:
  8633. builder.addCapability(spv::Capability::GroupNonUniform);
  8634. builder.addCapability(spv::Capability::GroupNonUniformVote);
  8635. break;
  8636. case glslang::EOpSubgroupBroadcast:
  8637. case glslang::EOpSubgroupBroadcastFirst:
  8638. case glslang::EOpSubgroupBallot:
  8639. case glslang::EOpSubgroupInverseBallot:
  8640. case glslang::EOpSubgroupBallotBitExtract:
  8641. case glslang::EOpSubgroupBallotBitCount:
  8642. case glslang::EOpSubgroupBallotInclusiveBitCount:
  8643. case glslang::EOpSubgroupBallotExclusiveBitCount:
  8644. case glslang::EOpSubgroupBallotFindLSB:
  8645. case glslang::EOpSubgroupBallotFindMSB:
  8646. builder.addCapability(spv::Capability::GroupNonUniform);
  8647. builder.addCapability(spv::Capability::GroupNonUniformBallot);
  8648. break;
  8649. case glslang::EOpSubgroupRotate:
  8650. case glslang::EOpSubgroupClusteredRotate:
  8651. builder.addExtension(spv::E_SPV_KHR_subgroup_rotate);
  8652. builder.addCapability(spv::Capability::GroupNonUniformRotateKHR);
  8653. break;
  8654. case glslang::EOpSubgroupShuffle:
  8655. case glslang::EOpSubgroupShuffleXor:
  8656. builder.addCapability(spv::Capability::GroupNonUniform);
  8657. builder.addCapability(spv::Capability::GroupNonUniformShuffle);
  8658. break;
  8659. case glslang::EOpSubgroupShuffleUp:
  8660. case glslang::EOpSubgroupShuffleDown:
  8661. builder.addCapability(spv::Capability::GroupNonUniform);
  8662. builder.addCapability(spv::Capability::GroupNonUniformShuffleRelative);
  8663. break;
  8664. case glslang::EOpSubgroupAdd:
  8665. case glslang::EOpSubgroupMul:
  8666. case glslang::EOpSubgroupMin:
  8667. case glslang::EOpSubgroupMax:
  8668. case glslang::EOpSubgroupAnd:
  8669. case glslang::EOpSubgroupOr:
  8670. case glslang::EOpSubgroupXor:
  8671. case glslang::EOpSubgroupInclusiveAdd:
  8672. case glslang::EOpSubgroupInclusiveMul:
  8673. case glslang::EOpSubgroupInclusiveMin:
  8674. case glslang::EOpSubgroupInclusiveMax:
  8675. case glslang::EOpSubgroupInclusiveAnd:
  8676. case glslang::EOpSubgroupInclusiveOr:
  8677. case glslang::EOpSubgroupInclusiveXor:
  8678. case glslang::EOpSubgroupExclusiveAdd:
  8679. case glslang::EOpSubgroupExclusiveMul:
  8680. case glslang::EOpSubgroupExclusiveMin:
  8681. case glslang::EOpSubgroupExclusiveMax:
  8682. case glslang::EOpSubgroupExclusiveAnd:
  8683. case glslang::EOpSubgroupExclusiveOr:
  8684. case glslang::EOpSubgroupExclusiveXor:
  8685. builder.addCapability(spv::Capability::GroupNonUniform);
  8686. builder.addCapability(spv::Capability::GroupNonUniformArithmetic);
  8687. break;
  8688. case glslang::EOpSubgroupClusteredAdd:
  8689. case glslang::EOpSubgroupClusteredMul:
  8690. case glslang::EOpSubgroupClusteredMin:
  8691. case glslang::EOpSubgroupClusteredMax:
  8692. case glslang::EOpSubgroupClusteredAnd:
  8693. case glslang::EOpSubgroupClusteredOr:
  8694. case glslang::EOpSubgroupClusteredXor:
  8695. builder.addCapability(spv::Capability::GroupNonUniform);
  8696. builder.addCapability(spv::Capability::GroupNonUniformClustered);
  8697. break;
  8698. case glslang::EOpSubgroupQuadBroadcast:
  8699. case glslang::EOpSubgroupQuadSwapHorizontal:
  8700. case glslang::EOpSubgroupQuadSwapVertical:
  8701. case glslang::EOpSubgroupQuadSwapDiagonal:
  8702. builder.addCapability(spv::Capability::GroupNonUniform);
  8703. builder.addCapability(spv::Capability::GroupNonUniformQuad);
  8704. break;
  8705. case glslang::EOpSubgroupPartitionedAdd:
  8706. case glslang::EOpSubgroupPartitionedMul:
  8707. case glslang::EOpSubgroupPartitionedMin:
  8708. case glslang::EOpSubgroupPartitionedMax:
  8709. case glslang::EOpSubgroupPartitionedAnd:
  8710. case glslang::EOpSubgroupPartitionedOr:
  8711. case glslang::EOpSubgroupPartitionedXor:
  8712. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8713. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8714. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8715. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8716. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8717. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8718. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8719. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8720. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8721. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8722. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8723. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8724. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8725. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8726. builder.addExtension(spv::E_SPV_NV_shader_subgroup_partitioned);
  8727. builder.addCapability(spv::Capability::GroupNonUniformPartitionedNV);
  8728. break;
  8729. default: assert(0 && "Unhandled subgroup operation!");
  8730. }
  8731. const bool isUnsigned = isTypeUnsignedInt(typeProxy);
  8732. const bool isFloat = isTypeFloat(typeProxy);
  8733. const bool isBool = typeProxy == glslang::EbtBool;
  8734. spv::Op opCode = spv::Op::OpNop;
  8735. // Figure out which opcode to use.
  8736. switch (op) {
  8737. case glslang::EOpSubgroupElect: opCode = spv::Op::OpGroupNonUniformElect; break;
  8738. case glslang::EOpSubgroupQuadAll: opCode = spv::Op::OpGroupNonUniformQuadAllKHR; break;
  8739. case glslang::EOpSubgroupAll: opCode = spv::Op::OpGroupNonUniformAll; break;
  8740. case glslang::EOpSubgroupQuadAny: opCode = spv::Op::OpGroupNonUniformQuadAnyKHR; break;
  8741. case glslang::EOpSubgroupAny: opCode = spv::Op::OpGroupNonUniformAny; break;
  8742. case glslang::EOpSubgroupAllEqual: opCode = spv::Op::OpGroupNonUniformAllEqual; break;
  8743. case glslang::EOpSubgroupBroadcast: opCode = spv::Op::OpGroupNonUniformBroadcast; break;
  8744. case glslang::EOpSubgroupBroadcastFirst: opCode = spv::Op::OpGroupNonUniformBroadcastFirst; break;
  8745. case glslang::EOpSubgroupBallot: opCode = spv::Op::OpGroupNonUniformBallot; break;
  8746. case glslang::EOpSubgroupInverseBallot: opCode = spv::Op::OpGroupNonUniformInverseBallot; break;
  8747. case glslang::EOpSubgroupBallotBitExtract: opCode = spv::Op::OpGroupNonUniformBallotBitExtract; break;
  8748. case glslang::EOpSubgroupBallotBitCount:
  8749. case glslang::EOpSubgroupBallotInclusiveBitCount:
  8750. case glslang::EOpSubgroupBallotExclusiveBitCount: opCode = spv::Op::OpGroupNonUniformBallotBitCount; break;
  8751. case glslang::EOpSubgroupBallotFindLSB: opCode = spv::Op::OpGroupNonUniformBallotFindLSB; break;
  8752. case glslang::EOpSubgroupBallotFindMSB: opCode = spv::Op::OpGroupNonUniformBallotFindMSB; break;
  8753. case glslang::EOpSubgroupShuffle: opCode = spv::Op::OpGroupNonUniformShuffle; break;
  8754. case glslang::EOpSubgroupShuffleXor: opCode = spv::Op::OpGroupNonUniformShuffleXor; break;
  8755. case glslang::EOpSubgroupShuffleUp: opCode = spv::Op::OpGroupNonUniformShuffleUp; break;
  8756. case glslang::EOpSubgroupShuffleDown: opCode = spv::Op::OpGroupNonUniformShuffleDown; break;
  8757. case glslang::EOpSubgroupRotate:
  8758. case glslang::EOpSubgroupClusteredRotate: opCode = spv::Op::OpGroupNonUniformRotateKHR; break;
  8759. case glslang::EOpSubgroupAdd:
  8760. case glslang::EOpSubgroupInclusiveAdd:
  8761. case glslang::EOpSubgroupExclusiveAdd:
  8762. case glslang::EOpSubgroupClusteredAdd:
  8763. case glslang::EOpSubgroupPartitionedAdd:
  8764. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8765. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8766. if (isFloat) {
  8767. opCode = spv::Op::OpGroupNonUniformFAdd;
  8768. } else {
  8769. opCode = spv::Op::OpGroupNonUniformIAdd;
  8770. }
  8771. break;
  8772. case glslang::EOpSubgroupMul:
  8773. case glslang::EOpSubgroupInclusiveMul:
  8774. case glslang::EOpSubgroupExclusiveMul:
  8775. case glslang::EOpSubgroupClusteredMul:
  8776. case glslang::EOpSubgroupPartitionedMul:
  8777. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8778. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8779. if (isFloat) {
  8780. opCode = spv::Op::OpGroupNonUniformFMul;
  8781. } else {
  8782. opCode = spv::Op::OpGroupNonUniformIMul;
  8783. }
  8784. break;
  8785. case glslang::EOpSubgroupMin:
  8786. case glslang::EOpSubgroupInclusiveMin:
  8787. case glslang::EOpSubgroupExclusiveMin:
  8788. case glslang::EOpSubgroupClusteredMin:
  8789. case glslang::EOpSubgroupPartitionedMin:
  8790. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8791. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8792. if (isFloat) {
  8793. opCode = spv::Op::OpGroupNonUniformFMin;
  8794. } else if (isUnsigned) {
  8795. opCode = spv::Op::OpGroupNonUniformUMin;
  8796. } else {
  8797. opCode = spv::Op::OpGroupNonUniformSMin;
  8798. }
  8799. break;
  8800. case glslang::EOpSubgroupMax:
  8801. case glslang::EOpSubgroupInclusiveMax:
  8802. case glslang::EOpSubgroupExclusiveMax:
  8803. case glslang::EOpSubgroupClusteredMax:
  8804. case glslang::EOpSubgroupPartitionedMax:
  8805. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8806. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8807. if (isFloat) {
  8808. opCode = spv::Op::OpGroupNonUniformFMax;
  8809. } else if (isUnsigned) {
  8810. opCode = spv::Op::OpGroupNonUniformUMax;
  8811. } else {
  8812. opCode = spv::Op::OpGroupNonUniformSMax;
  8813. }
  8814. break;
  8815. case glslang::EOpSubgroupAnd:
  8816. case glslang::EOpSubgroupInclusiveAnd:
  8817. case glslang::EOpSubgroupExclusiveAnd:
  8818. case glslang::EOpSubgroupClusteredAnd:
  8819. case glslang::EOpSubgroupPartitionedAnd:
  8820. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8821. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8822. if (isBool) {
  8823. opCode = spv::Op::OpGroupNonUniformLogicalAnd;
  8824. } else {
  8825. opCode = spv::Op::OpGroupNonUniformBitwiseAnd;
  8826. }
  8827. break;
  8828. case glslang::EOpSubgroupOr:
  8829. case glslang::EOpSubgroupInclusiveOr:
  8830. case glslang::EOpSubgroupExclusiveOr:
  8831. case glslang::EOpSubgroupClusteredOr:
  8832. case glslang::EOpSubgroupPartitionedOr:
  8833. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8834. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8835. if (isBool) {
  8836. opCode = spv::Op::OpGroupNonUniformLogicalOr;
  8837. } else {
  8838. opCode = spv::Op::OpGroupNonUniformBitwiseOr;
  8839. }
  8840. break;
  8841. case glslang::EOpSubgroupXor:
  8842. case glslang::EOpSubgroupInclusiveXor:
  8843. case glslang::EOpSubgroupExclusiveXor:
  8844. case glslang::EOpSubgroupClusteredXor:
  8845. case glslang::EOpSubgroupPartitionedXor:
  8846. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8847. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8848. if (isBool) {
  8849. opCode = spv::Op::OpGroupNonUniformLogicalXor;
  8850. } else {
  8851. opCode = spv::Op::OpGroupNonUniformBitwiseXor;
  8852. }
  8853. break;
  8854. case glslang::EOpSubgroupQuadBroadcast: opCode = spv::Op::OpGroupNonUniformQuadBroadcast; break;
  8855. case glslang::EOpSubgroupQuadSwapHorizontal:
  8856. case glslang::EOpSubgroupQuadSwapVertical:
  8857. case glslang::EOpSubgroupQuadSwapDiagonal: opCode = spv::Op::OpGroupNonUniformQuadSwap; break;
  8858. default: assert(0 && "Unhandled subgroup operation!");
  8859. }
  8860. // get the right Group Operation
  8861. spv::GroupOperation groupOperation = spv::GroupOperation::Max;
  8862. switch (op) {
  8863. default:
  8864. break;
  8865. case glslang::EOpSubgroupBallotBitCount:
  8866. case glslang::EOpSubgroupAdd:
  8867. case glslang::EOpSubgroupMul:
  8868. case glslang::EOpSubgroupMin:
  8869. case glslang::EOpSubgroupMax:
  8870. case glslang::EOpSubgroupAnd:
  8871. case glslang::EOpSubgroupOr:
  8872. case glslang::EOpSubgroupXor:
  8873. groupOperation = spv::GroupOperation::Reduce;
  8874. break;
  8875. case glslang::EOpSubgroupBallotInclusiveBitCount:
  8876. case glslang::EOpSubgroupInclusiveAdd:
  8877. case glslang::EOpSubgroupInclusiveMul:
  8878. case glslang::EOpSubgroupInclusiveMin:
  8879. case glslang::EOpSubgroupInclusiveMax:
  8880. case glslang::EOpSubgroupInclusiveAnd:
  8881. case glslang::EOpSubgroupInclusiveOr:
  8882. case glslang::EOpSubgroupInclusiveXor:
  8883. groupOperation = spv::GroupOperation::InclusiveScan;
  8884. break;
  8885. case glslang::EOpSubgroupBallotExclusiveBitCount:
  8886. case glslang::EOpSubgroupExclusiveAdd:
  8887. case glslang::EOpSubgroupExclusiveMul:
  8888. case glslang::EOpSubgroupExclusiveMin:
  8889. case glslang::EOpSubgroupExclusiveMax:
  8890. case glslang::EOpSubgroupExclusiveAnd:
  8891. case glslang::EOpSubgroupExclusiveOr:
  8892. case glslang::EOpSubgroupExclusiveXor:
  8893. groupOperation = spv::GroupOperation::ExclusiveScan;
  8894. break;
  8895. case glslang::EOpSubgroupClusteredAdd:
  8896. case glslang::EOpSubgroupClusteredMul:
  8897. case glslang::EOpSubgroupClusteredMin:
  8898. case glslang::EOpSubgroupClusteredMax:
  8899. case glslang::EOpSubgroupClusteredAnd:
  8900. case glslang::EOpSubgroupClusteredOr:
  8901. case glslang::EOpSubgroupClusteredXor:
  8902. groupOperation = spv::GroupOperation::ClusteredReduce;
  8903. break;
  8904. case glslang::EOpSubgroupPartitionedAdd:
  8905. case glslang::EOpSubgroupPartitionedMul:
  8906. case glslang::EOpSubgroupPartitionedMin:
  8907. case glslang::EOpSubgroupPartitionedMax:
  8908. case glslang::EOpSubgroupPartitionedAnd:
  8909. case glslang::EOpSubgroupPartitionedOr:
  8910. case glslang::EOpSubgroupPartitionedXor:
  8911. groupOperation = spv::GroupOperation::PartitionedReduceNV;
  8912. break;
  8913. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  8914. case glslang::EOpSubgroupPartitionedInclusiveMul:
  8915. case glslang::EOpSubgroupPartitionedInclusiveMin:
  8916. case glslang::EOpSubgroupPartitionedInclusiveMax:
  8917. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  8918. case glslang::EOpSubgroupPartitionedInclusiveOr:
  8919. case glslang::EOpSubgroupPartitionedInclusiveXor:
  8920. groupOperation = spv::GroupOperation::PartitionedInclusiveScanNV;
  8921. break;
  8922. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  8923. case glslang::EOpSubgroupPartitionedExclusiveMul:
  8924. case glslang::EOpSubgroupPartitionedExclusiveMin:
  8925. case glslang::EOpSubgroupPartitionedExclusiveMax:
  8926. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  8927. case glslang::EOpSubgroupPartitionedExclusiveOr:
  8928. case glslang::EOpSubgroupPartitionedExclusiveXor:
  8929. groupOperation = spv::GroupOperation::PartitionedExclusiveScanNV;
  8930. break;
  8931. }
  8932. // build the instruction
  8933. std::vector<spv::IdImmediate> spvGroupOperands;
  8934. // Every operation begins with the Execution Scope operand.
  8935. spv::IdImmediate executionScope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
  8936. // All other ops need the execution scope. Quad Control Ops don't need scope, it's always Quad.
  8937. if (opCode != spv::Op::OpGroupNonUniformQuadAllKHR && opCode != spv::Op::OpGroupNonUniformQuadAnyKHR) {
  8938. spvGroupOperands.push_back(executionScope);
  8939. }
  8940. // Next, for all operations that use a Group Operation, push that as an operand.
  8941. if (groupOperation != spv::GroupOperation::Max) {
  8942. spv::IdImmediate groupOperand = { false, (unsigned)groupOperation };
  8943. spvGroupOperands.push_back(groupOperand);
  8944. }
  8945. // Push back the operands next.
  8946. for (auto opIt = operands.cbegin(); opIt != operands.cend(); ++opIt) {
  8947. spv::IdImmediate operand = { true, *opIt };
  8948. spvGroupOperands.push_back(operand);
  8949. }
  8950. // Some opcodes have additional operands.
  8951. spv::Id directionId = spv::NoResult;
  8952. switch (op) {
  8953. default: break;
  8954. case glslang::EOpSubgroupQuadSwapHorizontal: directionId = builder.makeUintConstant(0); break;
  8955. case glslang::EOpSubgroupQuadSwapVertical: directionId = builder.makeUintConstant(1); break;
  8956. case glslang::EOpSubgroupQuadSwapDiagonal: directionId = builder.makeUintConstant(2); break;
  8957. }
  8958. if (directionId != spv::NoResult) {
  8959. spv::IdImmediate direction = { true, directionId };
  8960. spvGroupOperands.push_back(direction);
  8961. }
  8962. return builder.createOp(opCode, typeId, spvGroupOperands);
  8963. }
  8964. spv::Id TGlslangToSpvTraverser::createMiscOperation(glslang::TOperator op, spv::Decoration precision,
  8965. spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  8966. {
  8967. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  8968. bool isFloat = isTypeFloat(typeProxy);
  8969. spv::Op opCode = spv::Op::OpNop;
  8970. int extBuiltins = -1;
  8971. int libCall = -1;
  8972. size_t consumedOperands = operands.size();
  8973. spv::Id typeId0 = 0;
  8974. if (consumedOperands > 0)
  8975. typeId0 = builder.getTypeId(operands[0]);
  8976. spv::Id typeId1 = 0;
  8977. if (consumedOperands > 1)
  8978. typeId1 = builder.getTypeId(operands[1]);
  8979. spv::Id frexpIntType = 0;
  8980. switch (op) {
  8981. case glslang::EOpMin:
  8982. if (isFloat)
  8983. libCall = nanMinMaxClamp ? spv::GLSLstd450NMin : spv::GLSLstd450FMin;
  8984. else if (isUnsigned)
  8985. libCall = spv::GLSLstd450UMin;
  8986. else
  8987. libCall = spv::GLSLstd450SMin;
  8988. builder.promoteScalar(precision, operands.front(), operands.back());
  8989. break;
  8990. case glslang::EOpModf:
  8991. {
  8992. libCall = spv::GLSLstd450ModfStruct;
  8993. assert(builder.isFloatType(builder.getScalarTypeId(typeId0)));
  8994. // The returned struct has two members of the same type as the first argument
  8995. typeId = builder.makeStructResultType(typeId0, typeId0);
  8996. consumedOperands = 1;
  8997. }
  8998. break;
  8999. case glslang::EOpMax:
  9000. if (isFloat)
  9001. libCall = nanMinMaxClamp ? spv::GLSLstd450NMax : spv::GLSLstd450FMax;
  9002. else if (isUnsigned)
  9003. libCall = spv::GLSLstd450UMax;
  9004. else
  9005. libCall = spv::GLSLstd450SMax;
  9006. builder.promoteScalar(precision, operands.front(), operands.back());
  9007. break;
  9008. case glslang::EOpPow:
  9009. libCall = spv::GLSLstd450Pow;
  9010. break;
  9011. case glslang::EOpDot:
  9012. case glslang::EOpDotPackedEXT:
  9013. case glslang::EOpDotAccSatEXT:
  9014. case glslang::EOpDotPackedAccSatEXT:
  9015. {
  9016. if (builder.isFloatType(builder.getScalarTypeId(typeId0)) ||
  9017. // HLSL supports dot(int,int) which is just a multiply
  9018. glslangIntermediate->getSource() == glslang::EShSourceHlsl) {
  9019. if (typeProxy == glslang::EbtBFloat16) {
  9020. builder.addExtension(spv::E_SPV_KHR_bfloat16);
  9021. builder.addCapability(spv::Capability::BFloat16DotProductKHR);
  9022. }
  9023. opCode = spv::Op::OpDot;
  9024. } else {
  9025. builder.addExtension(spv::E_SPV_KHR_integer_dot_product);
  9026. builder.addCapability(spv::Capability::DotProductKHR);
  9027. const unsigned int vectorSize = builder.getNumComponents(operands[0]);
  9028. if (op == glslang::EOpDotPackedEXT || op == glslang::EOpDotPackedAccSatEXT) {
  9029. builder.addCapability(spv::Capability::DotProductInput4x8BitPackedKHR);
  9030. } else if (vectorSize == 4 && builder.getScalarTypeWidth(typeId0) == 8) {
  9031. builder.addCapability(spv::Capability::DotProductInput4x8BitKHR);
  9032. } else {
  9033. builder.addCapability(spv::Capability::DotProductInputAllKHR);
  9034. }
  9035. const bool type0isSigned = builder.isIntType(builder.getScalarTypeId(typeId0));
  9036. const bool type1isSigned = builder.isIntType(builder.getScalarTypeId(typeId1));
  9037. const bool accSat = (op == glslang::EOpDotAccSatEXT || op == glslang::EOpDotPackedAccSatEXT);
  9038. if (!type0isSigned && !type1isSigned) {
  9039. opCode = accSat ? spv::Op::OpUDotAccSatKHR : spv::Op::OpUDotKHR;
  9040. } else if (type0isSigned && type1isSigned) {
  9041. opCode = accSat ? spv::Op::OpSDotAccSatKHR : spv::Op::OpSDotKHR;
  9042. } else {
  9043. opCode = accSat ? spv::Op::OpSUDotAccSatKHR : spv::Op::OpSUDotKHR;
  9044. // the spir-v opcode assumes the operands to be "signed, unsigned" in that order, so swap if needed
  9045. if (type1isSigned) {
  9046. std::swap(operands[0], operands[1]);
  9047. }
  9048. }
  9049. std::vector<spv::IdImmediate> operands2;
  9050. for (auto &o : operands) {
  9051. operands2.push_back({true, o});
  9052. }
  9053. if (op == glslang::EOpDotPackedEXT || op == glslang::EOpDotPackedAccSatEXT) {
  9054. operands2.push_back({false, 0});
  9055. }
  9056. return builder.createOp(opCode, typeId, operands2);
  9057. }
  9058. }
  9059. break;
  9060. case glslang::EOpAtan:
  9061. libCall = spv::GLSLstd450Atan2;
  9062. break;
  9063. case glslang::EOpClamp:
  9064. if (isFloat)
  9065. libCall = nanMinMaxClamp ? spv::GLSLstd450NClamp : spv::GLSLstd450FClamp;
  9066. else if (isUnsigned)
  9067. libCall = spv::GLSLstd450UClamp;
  9068. else
  9069. libCall = spv::GLSLstd450SClamp;
  9070. builder.promoteScalar(precision, operands.front(), operands[1]);
  9071. builder.promoteScalar(precision, operands.front(), operands[2]);
  9072. break;
  9073. case glslang::EOpMix:
  9074. if (! builder.isBoolType(builder.getScalarTypeId(builder.getTypeId(operands.back())))) {
  9075. assert(isFloat);
  9076. libCall = spv::GLSLstd450FMix;
  9077. } else {
  9078. opCode = spv::Op::OpSelect;
  9079. std::swap(operands.front(), operands.back());
  9080. }
  9081. builder.promoteScalar(precision, operands.front(), operands.back());
  9082. break;
  9083. case glslang::EOpStep:
  9084. libCall = spv::GLSLstd450Step;
  9085. builder.promoteScalar(precision, operands.front(), operands.back());
  9086. break;
  9087. case glslang::EOpSmoothStep:
  9088. libCall = spv::GLSLstd450SmoothStep;
  9089. builder.promoteScalar(precision, operands[0], operands[2]);
  9090. builder.promoteScalar(precision, operands[1], operands[2]);
  9091. break;
  9092. case glslang::EOpDistance:
  9093. libCall = spv::GLSLstd450Distance;
  9094. break;
  9095. case glslang::EOpCross:
  9096. libCall = spv::GLSLstd450Cross;
  9097. break;
  9098. case glslang::EOpFaceForward:
  9099. libCall = spv::GLSLstd450FaceForward;
  9100. break;
  9101. case glslang::EOpReflect:
  9102. libCall = spv::GLSLstd450Reflect;
  9103. break;
  9104. case glslang::EOpRefract:
  9105. libCall = spv::GLSLstd450Refract;
  9106. break;
  9107. case glslang::EOpBarrier:
  9108. {
  9109. // This is for the extended controlBarrier function, with four operands.
  9110. // The unextended barrier() goes through createNoArgOperation.
  9111. assert(operands.size() == 4);
  9112. auto const executionScope = (spv::Scope)builder.getConstantScalar(operands[0]);
  9113. auto const memoryScope = (spv::Scope)builder.getConstantScalar(operands[1]);
  9114. auto const semantics = (spv::MemorySemanticsMask)(builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));
  9115. builder.createControlBarrier(executionScope, memoryScope,
  9116. semantics);
  9117. if (anySet(semantics, spv::MemorySemanticsMask::MakeAvailableKHR |
  9118. spv::MemorySemanticsMask::MakeVisibleKHR |
  9119. spv::MemorySemanticsMask::OutputMemoryKHR |
  9120. spv::MemorySemanticsMask::Volatile)) {
  9121. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  9122. }
  9123. if (glslangIntermediate->usingVulkanMemoryModel() && (executionScope == spv::Scope::Device ||
  9124. memoryScope == spv::Scope::Device)) {
  9125. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  9126. }
  9127. return 0;
  9128. }
  9129. break;
  9130. case glslang::EOpMemoryBarrier:
  9131. {
  9132. // This is for the extended memoryBarrier function, with three operands.
  9133. // The unextended memoryBarrier() goes through createNoArgOperation.
  9134. assert(operands.size() == 3);
  9135. auto const memoryScope = (spv::Scope)builder.getConstantScalar(operands[0]);
  9136. auto const semantics = (spv::MemorySemanticsMask)(builder.getConstantScalar(operands[1]) | builder.getConstantScalar(operands[2]));
  9137. builder.createMemoryBarrier(memoryScope, semantics);
  9138. if (anySet(semantics, spv::MemorySemanticsMask::MakeAvailableKHR |
  9139. spv::MemorySemanticsMask::MakeVisibleKHR |
  9140. spv::MemorySemanticsMask::OutputMemoryKHR |
  9141. spv::MemorySemanticsMask::Volatile)) {
  9142. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  9143. }
  9144. if (glslangIntermediate->usingVulkanMemoryModel() && memoryScope == spv::Scope::Device) {
  9145. builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
  9146. }
  9147. return 0;
  9148. }
  9149. break;
  9150. case glslang::EOpInterpolateAtSample:
  9151. if (typeProxy == glslang::EbtFloat16)
  9152. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  9153. libCall = spv::GLSLstd450InterpolateAtSample;
  9154. break;
  9155. case glslang::EOpInterpolateAtOffset:
  9156. if (typeProxy == glslang::EbtFloat16)
  9157. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  9158. libCall = spv::GLSLstd450InterpolateAtOffset;
  9159. break;
  9160. case glslang::EOpAddCarry:
  9161. opCode = spv::Op::OpIAddCarry;
  9162. typeId = builder.makeStructResultType(typeId0, typeId0);
  9163. consumedOperands = 2;
  9164. break;
  9165. case glslang::EOpSubBorrow:
  9166. opCode = spv::Op::OpISubBorrow;
  9167. typeId = builder.makeStructResultType(typeId0, typeId0);
  9168. consumedOperands = 2;
  9169. break;
  9170. case glslang::EOpUMulExtended:
  9171. opCode = spv::Op::OpUMulExtended;
  9172. typeId = builder.makeStructResultType(typeId0, typeId0);
  9173. consumedOperands = 2;
  9174. break;
  9175. case glslang::EOpIMulExtended:
  9176. opCode = spv::Op::OpSMulExtended;
  9177. typeId = builder.makeStructResultType(typeId0, typeId0);
  9178. consumedOperands = 2;
  9179. break;
  9180. case glslang::EOpBitfieldExtract:
  9181. if (isUnsigned)
  9182. opCode = spv::Op::OpBitFieldUExtract;
  9183. else
  9184. opCode = spv::Op::OpBitFieldSExtract;
  9185. break;
  9186. case glslang::EOpBitfieldInsert:
  9187. opCode = spv::Op::OpBitFieldInsert;
  9188. break;
  9189. case glslang::EOpFma:
  9190. libCall = spv::GLSLstd450Fma;
  9191. break;
  9192. case glslang::EOpFrexp:
  9193. {
  9194. libCall = spv::GLSLstd450FrexpStruct;
  9195. assert(builder.isPointerType(typeId1));
  9196. typeId1 = builder.getContainedTypeId(typeId1);
  9197. int width = builder.getScalarTypeWidth(typeId1);
  9198. if (width == 16)
  9199. // Using 16-bit exp operand, enable extension SPV_AMD_gpu_shader_int16
  9200. builder.addExtension(spv::E_SPV_AMD_gpu_shader_int16);
  9201. if (builder.getNumComponents(operands[0]) == 1)
  9202. frexpIntType = builder.makeIntegerType(width, true);
  9203. else if (builder.isCooperativeVector(operands[0]))
  9204. frexpIntType = builder.makeCooperativeVectorTypeNV(builder.makeIntegerType(width, true),
  9205. builder.getCooperativeVectorNumComponents(builder.getTypeId(operands[0])));
  9206. else
  9207. frexpIntType = builder.makeVectorType(builder.makeIntegerType(width, true),
  9208. builder.getNumComponents(operands[0]));
  9209. typeId = builder.makeStructResultType(typeId0, frexpIntType);
  9210. consumedOperands = 1;
  9211. }
  9212. break;
  9213. case glslang::EOpLdexp:
  9214. libCall = spv::GLSLstd450Ldexp;
  9215. break;
  9216. case glslang::EOpReadInvocation:
  9217. return createInvocationsOperation(op, typeId, operands, typeProxy);
  9218. case glslang::EOpSubgroupBroadcast:
  9219. case glslang::EOpSubgroupBallotBitExtract:
  9220. case glslang::EOpSubgroupShuffle:
  9221. case glslang::EOpSubgroupShuffleXor:
  9222. case glslang::EOpSubgroupShuffleUp:
  9223. case glslang::EOpSubgroupShuffleDown:
  9224. case glslang::EOpSubgroupRotate:
  9225. case glslang::EOpSubgroupClusteredRotate:
  9226. case glslang::EOpSubgroupClusteredAdd:
  9227. case glslang::EOpSubgroupClusteredMul:
  9228. case glslang::EOpSubgroupClusteredMin:
  9229. case glslang::EOpSubgroupClusteredMax:
  9230. case glslang::EOpSubgroupClusteredAnd:
  9231. case glslang::EOpSubgroupClusteredOr:
  9232. case glslang::EOpSubgroupClusteredXor:
  9233. case glslang::EOpSubgroupQuadBroadcast:
  9234. case glslang::EOpSubgroupPartitionedAdd:
  9235. case glslang::EOpSubgroupPartitionedMul:
  9236. case glslang::EOpSubgroupPartitionedMin:
  9237. case glslang::EOpSubgroupPartitionedMax:
  9238. case glslang::EOpSubgroupPartitionedAnd:
  9239. case glslang::EOpSubgroupPartitionedOr:
  9240. case glslang::EOpSubgroupPartitionedXor:
  9241. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  9242. case glslang::EOpSubgroupPartitionedInclusiveMul:
  9243. case glslang::EOpSubgroupPartitionedInclusiveMin:
  9244. case glslang::EOpSubgroupPartitionedInclusiveMax:
  9245. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  9246. case glslang::EOpSubgroupPartitionedInclusiveOr:
  9247. case glslang::EOpSubgroupPartitionedInclusiveXor:
  9248. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  9249. case glslang::EOpSubgroupPartitionedExclusiveMul:
  9250. case glslang::EOpSubgroupPartitionedExclusiveMin:
  9251. case glslang::EOpSubgroupPartitionedExclusiveMax:
  9252. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  9253. case glslang::EOpSubgroupPartitionedExclusiveOr:
  9254. case glslang::EOpSubgroupPartitionedExclusiveXor:
  9255. return createSubgroupOperation(op, typeId, operands, typeProxy);
  9256. case glslang::EOpSwizzleInvocations:
  9257. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  9258. libCall = spv::SwizzleInvocationsAMD;
  9259. break;
  9260. case glslang::EOpSwizzleInvocationsMasked:
  9261. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  9262. libCall = spv::SwizzleInvocationsMaskedAMD;
  9263. break;
  9264. case glslang::EOpWriteInvocation:
  9265. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  9266. libCall = spv::WriteInvocationAMD;
  9267. break;
  9268. case glslang::EOpMin3:
  9269. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  9270. if (isFloat)
  9271. libCall = spv::FMin3AMD;
  9272. else {
  9273. if (isUnsigned)
  9274. libCall = spv::UMin3AMD;
  9275. else
  9276. libCall = spv::SMin3AMD;
  9277. }
  9278. break;
  9279. case glslang::EOpMax3:
  9280. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  9281. if (isFloat)
  9282. libCall = spv::FMax3AMD;
  9283. else {
  9284. if (isUnsigned)
  9285. libCall = spv::UMax3AMD;
  9286. else
  9287. libCall = spv::SMax3AMD;
  9288. }
  9289. break;
  9290. case glslang::EOpMid3:
  9291. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  9292. if (isFloat)
  9293. libCall = spv::FMid3AMD;
  9294. else {
  9295. if (isUnsigned)
  9296. libCall = spv::UMid3AMD;
  9297. else
  9298. libCall = spv::SMid3AMD;
  9299. }
  9300. break;
  9301. case glslang::EOpInterpolateAtVertex:
  9302. if (typeProxy == glslang::EbtFloat16)
  9303. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  9304. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  9305. libCall = spv::InterpolateAtVertexAMD;
  9306. break;
  9307. case glslang::EOpReportIntersection:
  9308. typeId = builder.makeBoolType();
  9309. opCode = spv::Op::OpReportIntersectionKHR;
  9310. break;
  9311. case glslang::EOpTraceNV:
  9312. builder.createNoResultOp(spv::Op::OpTraceNV, operands);
  9313. return 0;
  9314. case glslang::EOpTraceRayMotionNV:
  9315. builder.addExtension(spv::E_SPV_NV_ray_tracing_motion_blur);
  9316. builder.addCapability(spv::Capability::RayTracingMotionBlurNV);
  9317. builder.createNoResultOp(spv::Op::OpTraceRayMotionNV, operands);
  9318. return 0;
  9319. case glslang::EOpTraceKHR:
  9320. builder.createNoResultOp(spv::Op::OpTraceRayKHR, operands);
  9321. return 0;
  9322. case glslang::EOpExecuteCallableNV:
  9323. builder.createNoResultOp(spv::Op::OpExecuteCallableNV, operands);
  9324. return 0;
  9325. case glslang::EOpExecuteCallableKHR:
  9326. builder.createNoResultOp(spv::Op::OpExecuteCallableKHR, operands);
  9327. return 0;
  9328. case glslang::EOpRayQueryInitialize:
  9329. builder.createNoResultOp(spv::Op::OpRayQueryInitializeKHR, operands);
  9330. return 0;
  9331. case glslang::EOpRayQueryTerminate:
  9332. builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR, operands);
  9333. return 0;
  9334. case glslang::EOpRayQueryGenerateIntersection:
  9335. builder.createNoResultOp(spv::Op::OpRayQueryGenerateIntersectionKHR, operands);
  9336. return 0;
  9337. case glslang::EOpRayQueryConfirmIntersection:
  9338. builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR, operands);
  9339. return 0;
  9340. case glslang::EOpRayQueryProceed:
  9341. typeId = builder.makeBoolType();
  9342. opCode = spv::Op::OpRayQueryProceedKHR;
  9343. break;
  9344. case glslang::EOpRayQueryGetIntersectionType:
  9345. typeId = builder.makeUintType(32);
  9346. opCode = spv::Op::OpRayQueryGetIntersectionTypeKHR;
  9347. break;
  9348. case glslang::EOpRayQueryGetRayTMin:
  9349. typeId = builder.makeFloatType(32);
  9350. opCode = spv::Op::OpRayQueryGetRayTMinKHR;
  9351. break;
  9352. case glslang::EOpRayQueryGetRayFlags:
  9353. typeId = builder.makeIntType(32);
  9354. opCode = spv::Op::OpRayQueryGetRayFlagsKHR;
  9355. break;
  9356. case glslang::EOpRayQueryGetIntersectionT:
  9357. typeId = builder.makeFloatType(32);
  9358. opCode = spv::Op::OpRayQueryGetIntersectionTKHR;
  9359. break;
  9360. case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
  9361. typeId = builder.makeIntType(32);
  9362. opCode = spv::Op::OpRayQueryGetIntersectionInstanceCustomIndexKHR;
  9363. break;
  9364. case glslang::EOpRayQueryGetIntersectionInstanceId:
  9365. typeId = builder.makeIntType(32);
  9366. opCode = spv::Op::OpRayQueryGetIntersectionInstanceIdKHR;
  9367. break;
  9368. case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
  9369. typeId = builder.makeUintType(32);
  9370. opCode = spv::Op::OpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffsetKHR;
  9371. break;
  9372. case glslang::EOpRayQueryGetIntersectionGeometryIndex:
  9373. typeId = builder.makeIntType(32);
  9374. opCode = spv::Op::OpRayQueryGetIntersectionGeometryIndexKHR;
  9375. break;
  9376. case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
  9377. typeId = builder.makeIntType(32);
  9378. opCode = spv::Op::OpRayQueryGetIntersectionPrimitiveIndexKHR;
  9379. break;
  9380. case glslang::EOpRayQueryGetIntersectionBarycentrics:
  9381. typeId = builder.makeVectorType(builder.makeFloatType(32), 2);
  9382. opCode = spv::Op::OpRayQueryGetIntersectionBarycentricsKHR;
  9383. break;
  9384. case glslang::EOpRayQueryGetIntersectionFrontFace:
  9385. typeId = builder.makeBoolType();
  9386. opCode = spv::Op::OpRayQueryGetIntersectionFrontFaceKHR;
  9387. break;
  9388. case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
  9389. typeId = builder.makeBoolType();
  9390. opCode = spv::Op::OpRayQueryGetIntersectionCandidateAABBOpaqueKHR;
  9391. break;
  9392. case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
  9393. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9394. opCode = spv::Op::OpRayQueryGetIntersectionObjectRayDirectionKHR;
  9395. break;
  9396. case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
  9397. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9398. opCode = spv::Op::OpRayQueryGetIntersectionObjectRayOriginKHR;
  9399. break;
  9400. case glslang::EOpRayQueryGetWorldRayDirection:
  9401. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9402. opCode = spv::Op::OpRayQueryGetWorldRayDirectionKHR;
  9403. break;
  9404. case glslang::EOpRayQueryGetWorldRayOrigin:
  9405. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9406. opCode = spv::Op::OpRayQueryGetWorldRayOriginKHR;
  9407. break;
  9408. case glslang::EOpRayQueryGetIntersectionObjectToWorld:
  9409. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  9410. opCode = spv::Op::OpRayQueryGetIntersectionObjectToWorldKHR;
  9411. break;
  9412. case glslang::EOpRayQueryGetIntersectionClusterIdNV:
  9413. typeId = builder.makeIntegerType(32, 1);
  9414. opCode = spv::Op::OpRayQueryGetClusterIdNV;
  9415. break;
  9416. case glslang::EOpRayQueryGetIntersectionWorldToObject:
  9417. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  9418. opCode = spv::Op::OpRayQueryGetIntersectionWorldToObjectKHR;
  9419. break;
  9420. case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
  9421. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9422. opCode = spv::Op::OpRayQueryGetIntersectionSpherePositionNV;
  9423. break;
  9424. case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
  9425. typeId = builder.makeFloatType(32);
  9426. opCode = spv::Op::OpRayQueryGetIntersectionSphereRadiusNV;
  9427. break;
  9428. case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
  9429. typeId = builder.makeFloatType(32);
  9430. opCode = spv::Op::OpRayQueryGetIntersectionLSSHitValueNV;
  9431. break;
  9432. case glslang::EOpRayQueryIsSphereHitNV:
  9433. typeId = builder.makeBoolType();
  9434. opCode = spv::Op::OpRayQueryIsSphereHitNV;
  9435. break;
  9436. case glslang::EOpRayQueryIsLSSHitNV:
  9437. typeId = builder.makeBoolType();
  9438. opCode = spv::Op::OpRayQueryIsLSSHitNV;
  9439. break;
  9440. case glslang::EOpWritePackedPrimitiveIndices4x8NV:
  9441. builder.createNoResultOp(spv::Op::OpWritePackedPrimitiveIndices4x8NV, operands);
  9442. return 0;
  9443. case glslang::EOpEmitMeshTasksEXT:
  9444. if (taskPayloadID)
  9445. operands.push_back(taskPayloadID);
  9446. // As per SPV_EXT_mesh_shader make it a terminating instruction in the current block
  9447. builder.makeStatementTerminator(spv::Op::OpEmitMeshTasksEXT, operands, "post-OpEmitMeshTasksEXT");
  9448. return 0;
  9449. case glslang::EOpSetMeshOutputsEXT:
  9450. builder.createNoResultOp(spv::Op::OpSetMeshOutputsEXT, operands);
  9451. return 0;
  9452. case glslang::EOpCooperativeMatrixMulAddNV:
  9453. opCode = spv::Op::OpCooperativeMatrixMulAddNV;
  9454. break;
  9455. case glslang::EOpHitObjectTraceRayNV:
  9456. builder.createNoResultOp(spv::Op::OpHitObjectTraceRayNV, operands);
  9457. return 0;
  9458. case glslang::EOpHitObjectTraceRayEXT:
  9459. builder.createNoResultOp(spv::Op::OpHitObjectTraceRayEXT, operands);
  9460. return 0;
  9461. case glslang::EOpHitObjectTraceRayMotionNV:
  9462. builder.createNoResultOp(spv::Op::OpHitObjectTraceRayMotionNV, operands);
  9463. return 0;
  9464. case glslang::EOpHitObjectTraceRayMotionEXT:
  9465. builder.createNoResultOp(spv::Op::OpHitObjectTraceRayMotionEXT, operands);
  9466. return 0;
  9467. case glslang::EOpHitObjectRecordHitNV:
  9468. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitNV, operands);
  9469. return 0;
  9470. case glslang::EOpHitObjectRecordHitMotionNV:
  9471. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitMotionNV, operands);
  9472. return 0;
  9473. case glslang::EOpHitObjectRecordHitWithIndexNV:
  9474. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitWithIndexNV, operands);
  9475. return 0;
  9476. case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
  9477. builder.createNoResultOp(spv::Op::OpHitObjectRecordHitWithIndexMotionNV, operands);
  9478. return 0;
  9479. case glslang::EOpHitObjectRecordMissNV:
  9480. builder.createNoResultOp(spv::Op::OpHitObjectRecordMissNV, operands);
  9481. return 0;
  9482. case glslang::EOpHitObjectRecordMissEXT:
  9483. builder.createNoResultOp(spv::Op::OpHitObjectRecordMissEXT, operands);
  9484. return 0;
  9485. case glslang::EOpHitObjectRecordMissMotionNV:
  9486. builder.createNoResultOp(spv::Op::OpHitObjectRecordMissMotionNV, operands);
  9487. return 0;
  9488. case glslang::EOpHitObjectRecordMissMotionEXT:
  9489. builder.createNoResultOp(spv::Op::OpHitObjectRecordMissMotionEXT, operands);
  9490. return 0;
  9491. case glslang::EOpHitObjectExecuteShaderNV:
  9492. builder.createNoResultOp(spv::Op::OpHitObjectExecuteShaderNV, operands);
  9493. return 0;
  9494. case glslang::EOpHitObjectExecuteShaderEXT:
  9495. builder.createNoResultOp(spv::Op::OpHitObjectExecuteShaderEXT, operands);
  9496. return 0;
  9497. case glslang::EOpHitObjectIsEmptyNV:
  9498. typeId = builder.makeBoolType();
  9499. opCode = spv::Op::OpHitObjectIsEmptyNV;
  9500. break;
  9501. case glslang::EOpHitObjectIsEmptyEXT:
  9502. typeId = builder.makeBoolType();
  9503. opCode = spv::Op::OpHitObjectIsEmptyEXT;
  9504. break;
  9505. case glslang::EOpHitObjectIsMissNV:
  9506. typeId = builder.makeBoolType();
  9507. opCode = spv::Op::OpHitObjectIsMissNV;
  9508. break;
  9509. case glslang::EOpHitObjectIsMissEXT:
  9510. typeId = builder.makeBoolType();
  9511. opCode = spv::Op::OpHitObjectIsMissEXT;
  9512. break;
  9513. case glslang::EOpHitObjectIsHitNV:
  9514. typeId = builder.makeBoolType();
  9515. opCode = spv::Op::OpHitObjectIsHitNV;
  9516. break;
  9517. case glslang::EOpHitObjectIsSphereHitNV:
  9518. typeId = builder.makeBoolType();
  9519. opCode = spv::Op::OpHitObjectIsSphereHitNV;
  9520. break;
  9521. case glslang::EOpHitObjectIsLSSHitNV:
  9522. typeId = builder.makeBoolType();
  9523. opCode = spv::Op::OpHitObjectIsLSSHitNV;
  9524. break;
  9525. case glslang::EOpHitObjectIsHitEXT:
  9526. typeId = builder.makeBoolType();
  9527. opCode = spv::Op::OpHitObjectIsHitEXT;
  9528. break;
  9529. case glslang::EOpHitObjectGetRayTMinNV:
  9530. typeId = builder.makeFloatType(32);
  9531. opCode = spv::Op::OpHitObjectGetRayTMinNV;
  9532. break;
  9533. case glslang::EOpHitObjectGetRayTMinEXT:
  9534. typeId = builder.makeFloatType(32);
  9535. opCode = spv::Op::OpHitObjectGetRayTMinEXT;
  9536. break;
  9537. case glslang::EOpHitObjectGetRayTMaxNV:
  9538. typeId = builder.makeFloatType(32);
  9539. opCode = spv::Op::OpHitObjectGetRayTMaxNV;
  9540. break;
  9541. case glslang::EOpHitObjectGetRayTMaxEXT:
  9542. typeId = builder.makeFloatType(32);
  9543. opCode = spv::Op::OpHitObjectGetRayTMaxEXT;
  9544. break;
  9545. case glslang::EOpHitObjectGetRayFlagsEXT:
  9546. typeId = builder.makeIntegerType(32, 0);
  9547. opCode = spv::Op::OpHitObjectGetRayFlagsEXT;
  9548. break;
  9549. case glslang::EOpHitObjectGetObjectRayOriginNV:
  9550. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9551. opCode = spv::Op::OpHitObjectGetObjectRayOriginNV;
  9552. break;
  9553. case glslang::EOpHitObjectGetObjectRayOriginEXT:
  9554. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9555. opCode = spv::Op::OpHitObjectGetObjectRayOriginEXT;
  9556. break;
  9557. case glslang::EOpHitObjectGetObjectRayDirectionNV:
  9558. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9559. opCode = spv::Op::OpHitObjectGetObjectRayDirectionNV;
  9560. break;
  9561. case glslang::EOpHitObjectGetObjectRayDirectionEXT:
  9562. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9563. opCode = spv::Op::OpHitObjectGetObjectRayDirectionEXT;
  9564. break;
  9565. case glslang::EOpHitObjectGetWorldRayOriginNV:
  9566. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9567. opCode = spv::Op::OpHitObjectGetWorldRayOriginNV;
  9568. break;
  9569. case glslang::EOpHitObjectGetWorldRayOriginEXT:
  9570. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9571. opCode = spv::Op::OpHitObjectGetWorldRayOriginEXT;
  9572. break;
  9573. case glslang::EOpHitObjectGetWorldRayDirectionNV:
  9574. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9575. opCode = spv::Op::OpHitObjectGetWorldRayDirectionNV;
  9576. break;
  9577. case glslang::EOpHitObjectGetWorldRayDirectionEXT:
  9578. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9579. opCode = spv::Op::OpHitObjectGetWorldRayDirectionEXT;
  9580. break;
  9581. case glslang::EOpHitObjectGetWorldToObjectNV:
  9582. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  9583. opCode = spv::Op::OpHitObjectGetWorldToObjectNV;
  9584. break;
  9585. case glslang::EOpHitObjectGetWorldToObjectEXT:
  9586. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  9587. opCode = spv::Op::OpHitObjectGetWorldToObjectEXT;
  9588. break;
  9589. case glslang::EOpHitObjectGetObjectToWorldNV:
  9590. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  9591. opCode = spv::Op::OpHitObjectGetObjectToWorldNV;
  9592. break;
  9593. case glslang::EOpHitObjectGetObjectToWorldEXT:
  9594. typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
  9595. opCode = spv::Op::OpHitObjectGetObjectToWorldEXT;
  9596. break;
  9597. case glslang::EOpHitObjectGetInstanceCustomIndexNV:
  9598. typeId = builder.makeIntegerType(32, 1);
  9599. opCode = spv::Op::OpHitObjectGetInstanceCustomIndexNV;
  9600. break;
  9601. case glslang::EOpHitObjectGetInstanceCustomIndexEXT:
  9602. typeId = builder.makeIntegerType(32, 1);
  9603. opCode = spv::Op::OpHitObjectGetInstanceCustomIndexEXT;
  9604. break;
  9605. case glslang::EOpHitObjectGetInstanceIdNV:
  9606. typeId = builder.makeIntegerType(32, 1);
  9607. opCode = spv::Op::OpHitObjectGetInstanceIdNV;
  9608. break;
  9609. case glslang::EOpHitObjectGetInstanceIdEXT:
  9610. typeId = builder.makeIntegerType(32, 1);
  9611. opCode = spv::Op::OpHitObjectGetInstanceIdEXT;
  9612. break;
  9613. case glslang::EOpHitObjectGetGeometryIndexNV:
  9614. typeId = builder.makeIntegerType(32, 1);
  9615. opCode = spv::Op::OpHitObjectGetGeometryIndexNV;
  9616. break;
  9617. case glslang::EOpHitObjectGetGeometryIndexEXT:
  9618. typeId = builder.makeIntegerType(32, 1);
  9619. opCode = spv::Op::OpHitObjectGetGeometryIndexEXT;
  9620. break;
  9621. case glslang::EOpHitObjectGetPrimitiveIndexNV:
  9622. typeId = builder.makeIntegerType(32, 1);
  9623. opCode = spv::Op::OpHitObjectGetPrimitiveIndexNV;
  9624. break;
  9625. case glslang::EOpHitObjectGetPrimitiveIndexEXT:
  9626. typeId = builder.makeIntegerType(32, 1);
  9627. opCode = spv::Op::OpHitObjectGetPrimitiveIndexEXT;
  9628. break;
  9629. case glslang::EOpHitObjectGetHitKindNV:
  9630. typeId = builder.makeIntegerType(32, 0);
  9631. opCode = spv::Op::OpHitObjectGetHitKindNV;
  9632. break;
  9633. case glslang::EOpHitObjectGetHitKindEXT:
  9634. typeId = builder.makeIntegerType(32, 0);
  9635. opCode = spv::Op::OpHitObjectGetHitKindEXT;
  9636. break;
  9637. case glslang::EOpHitObjectGetCurrentTimeNV:
  9638. typeId = builder.makeFloatType(32);
  9639. opCode = spv::Op::OpHitObjectGetCurrentTimeNV;
  9640. break;
  9641. case glslang::EOpHitObjectGetCurrentTimeEXT:
  9642. typeId = builder.makeFloatType(32);
  9643. opCode = spv::Op::OpHitObjectGetCurrentTimeEXT;
  9644. break;
  9645. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
  9646. typeId = builder.makeIntegerType(32, 0);
  9647. opCode = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexNV;
  9648. return 0;
  9649. case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:
  9650. typeId = builder.makeIntegerType(32, 0);
  9651. opCode = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexEXT;
  9652. return 0;
  9653. case glslang::EOpHitObjectGetAttributesNV:
  9654. builder.createNoResultOp(spv::Op::OpHitObjectGetAttributesNV, operands);
  9655. return 0;
  9656. case glslang::EOpHitObjectGetAttributesEXT:
  9657. builder.createNoResultOp(spv::Op::OpHitObjectGetAttributesEXT, operands);
  9658. return 0;
  9659. case glslang::EOpHitObjectRecordFromQueryEXT:
  9660. builder.createNoResultOp(spv::Op::OpHitObjectRecordFromQueryEXT, operands);
  9661. return 0;
  9662. case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
  9663. typeId = builder.makeVectorType(builder.makeUintType(32), 2);
  9664. opCode = spv::Op::OpHitObjectGetShaderRecordBufferHandleNV;
  9665. break;
  9666. case glslang::EOpHitObjectGetClusterIdNV:
  9667. typeId = builder.makeIntegerType(32, 1);
  9668. opCode = spv::Op::OpHitObjectGetClusterIdNV;
  9669. break;
  9670. case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:
  9671. typeId = builder.makeVectorType(builder.makeUintType(32), 2);
  9672. opCode = spv::Op::OpHitObjectGetShaderRecordBufferHandleEXT;
  9673. break;
  9674. case glslang::EOpHitObjectSetShaderBindingTableRecordIndexEXT:
  9675. builder.createNoResultOp(spv::Op::OpHitObjectSetShaderBindingTableRecordIndexEXT, operands);
  9676. return 0;
  9677. case glslang::EOpReorderThreadNV: {
  9678. if (operands.size() == 2) {
  9679. builder.createNoResultOp(spv::Op::OpReorderThreadWithHintNV, operands);
  9680. } else {
  9681. builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectNV, operands);
  9682. }
  9683. return 0;
  9684. }
  9685. case glslang::EOpReorderThreadEXT: {
  9686. if (operands.size() == 2) {
  9687. builder.createNoResultOp(spv::Op::OpReorderThreadWithHintEXT, operands);
  9688. } else {
  9689. builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectEXT, operands);
  9690. }
  9691. return 0;
  9692. }
  9693. case glslang::EOpHitObjectReorderExecuteEXT: {
  9694. if (operands.size() == 2) {
  9695. builder.createNoResultOp(spv::Op::OpHitObjectReorderExecuteShaderEXT, operands);
  9696. } else {
  9697. // GLSL intrinsic is
  9698. // hitObjectReorderExecuteEXT(hitObjectEXT hitObject, uint hint, uint bits,int payload) while
  9699. // SPIRV is hitObject id , payload id, optional hint id, optional bits id hence reorder operands
  9700. builder.createNoResultOp(spv::Op::OpHitObjectReorderExecuteShaderEXT, {operands[0], operands[3], operands[1], operands[2]});
  9701. }
  9702. return 0;
  9703. }
  9704. case glslang::EOpHitObjectTraceReorderExecuteEXT: {
  9705. if (operands.size() == 12) {
  9706. builder.createNoResultOp(spv::Op::OpHitObjectTraceReorderExecuteEXT, operands);
  9707. } else {
  9708. std::vector<spv::Id> argOperands;
  9709. std::copy(operands.begin(), operands.begin() + 11, std::back_inserter(argOperands));
  9710. argOperands.push_back(operands[13]);
  9711. argOperands.push_back(operands[11]);
  9712. argOperands.push_back(operands[12]);
  9713. builder.createNoResultOp(spv::Op::OpHitObjectTraceReorderExecuteEXT, argOperands);
  9714. }
  9715. return 0;
  9716. }
  9717. case glslang::EOpHitObjectTraceMotionReorderExecuteEXT: {
  9718. if (operands.size() == 13) {
  9719. builder.createNoResultOp(spv::Op::OpHitObjectTraceMotionReorderExecuteEXT, operands);
  9720. } else {
  9721. std::vector<spv::Id> argOperands;
  9722. std::copy(operands.begin(), operands.begin() + 12, std::back_inserter(argOperands));
  9723. argOperands.push_back(operands[14]);
  9724. argOperands.push_back(operands[12]);
  9725. argOperands.push_back(operands[13]);
  9726. builder.createNoResultOp(spv::Op::OpHitObjectTraceMotionReorderExecuteEXT, argOperands);
  9727. }
  9728. return 0;
  9729. }
  9730. case glslang::EOpImageSampleWeightedQCOM:
  9731. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9732. opCode = spv::Op::OpImageSampleWeightedQCOM;
  9733. addImageProcessingQCOMDecoration(operands[2], spv::Decoration::WeightTextureQCOM);
  9734. break;
  9735. case glslang::EOpImageBoxFilterQCOM:
  9736. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9737. opCode = spv::Op::OpImageBoxFilterQCOM;
  9738. break;
  9739. case glslang::EOpImageBlockMatchSADQCOM:
  9740. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9741. opCode = spv::Op::OpImageBlockMatchSADQCOM;
  9742. addImageProcessingQCOMDecoration(operands[0], spv::Decoration::BlockMatchTextureQCOM);
  9743. addImageProcessingQCOMDecoration(operands[2], spv::Decoration::BlockMatchTextureQCOM);
  9744. break;
  9745. case glslang::EOpImageBlockMatchSSDQCOM:
  9746. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9747. opCode = spv::Op::OpImageBlockMatchSSDQCOM;
  9748. addImageProcessingQCOMDecoration(operands[0], spv::Decoration::BlockMatchTextureQCOM);
  9749. addImageProcessingQCOMDecoration(operands[2], spv::Decoration::BlockMatchTextureQCOM);
  9750. break;
  9751. case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
  9752. typeId = builder.makeVectorType(builder.makeFloatType(32), 2);
  9753. opCode = spv::Op::OpFetchMicroTriangleVertexBarycentricNV;
  9754. break;
  9755. case glslang::EOpFetchMicroTriangleVertexPositionNV:
  9756. typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
  9757. opCode = spv::Op::OpFetchMicroTriangleVertexPositionNV;
  9758. break;
  9759. case glslang::EOpImageBlockMatchWindowSSDQCOM:
  9760. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9761. opCode = spv::Op::OpImageBlockMatchWindowSSDQCOM;
  9762. addImageProcessing2QCOMDecoration(operands[0], false);
  9763. addImageProcessing2QCOMDecoration(operands[2], false);
  9764. break;
  9765. case glslang::EOpImageBlockMatchWindowSADQCOM:
  9766. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9767. opCode = spv::Op::OpImageBlockMatchWindowSADQCOM;
  9768. addImageProcessing2QCOMDecoration(operands[0], false);
  9769. addImageProcessing2QCOMDecoration(operands[2], false);
  9770. break;
  9771. case glslang::EOpImageBlockMatchGatherSSDQCOM:
  9772. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9773. opCode = spv::Op::OpImageBlockMatchGatherSSDQCOM;
  9774. addImageProcessing2QCOMDecoration(operands[0], true);
  9775. addImageProcessing2QCOMDecoration(operands[2], true);
  9776. break;
  9777. case glslang::EOpImageBlockMatchGatherSADQCOM:
  9778. typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
  9779. opCode = spv::Op::OpImageBlockMatchGatherSADQCOM;
  9780. addImageProcessing2QCOMDecoration(operands[0], true);
  9781. addImageProcessing2QCOMDecoration(operands[2], true);
  9782. break;
  9783. case glslang::EOpCreateTensorLayoutNV:
  9784. return builder.createOp(spv::Op::OpCreateTensorLayoutNV, typeId, std::vector<spv::Id>{});
  9785. case glslang::EOpCreateTensorViewNV:
  9786. return builder.createOp(spv::Op::OpCreateTensorViewNV, typeId, std::vector<spv::Id>{});
  9787. case glslang::EOpTensorLayoutSetBlockSizeNV:
  9788. opCode = spv::Op::OpTensorLayoutSetBlockSizeNV;
  9789. break;
  9790. case glslang::EOpTensorLayoutSetDimensionNV:
  9791. opCode = spv::Op::OpTensorLayoutSetDimensionNV;
  9792. break;
  9793. case glslang::EOpTensorLayoutSetStrideNV:
  9794. opCode = spv::Op::OpTensorLayoutSetStrideNV;
  9795. break;
  9796. case glslang::EOpTensorLayoutSliceNV:
  9797. opCode = spv::Op::OpTensorLayoutSliceNV;
  9798. break;
  9799. case glslang::EOpTensorLayoutSetClampValueNV:
  9800. opCode = spv::Op::OpTensorLayoutSetClampValueNV;
  9801. break;
  9802. case glslang::EOpTensorViewSetDimensionNV:
  9803. opCode = spv::Op::OpTensorViewSetDimensionNV;
  9804. break;
  9805. case glslang::EOpTensorViewSetStrideNV:
  9806. opCode = spv::Op::OpTensorViewSetStrideNV;
  9807. break;
  9808. case glslang::EOpTensorViewSetClipNV:
  9809. opCode = spv::Op::OpTensorViewSetClipNV;
  9810. break;
  9811. default:
  9812. return 0;
  9813. }
  9814. spv::Id id = 0;
  9815. if (libCall >= 0) {
  9816. // Use an extended instruction from the standard library.
  9817. // Construct the call arguments, without modifying the original operands vector.
  9818. // We might need the remaining arguments, e.g. in the EOpFrexp case.
  9819. std::vector<spv::Id> callArguments(operands.begin(), operands.begin() + consumedOperands);
  9820. id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, callArguments);
  9821. } else if (opCode == spv::Op::OpDot && !isFloat) {
  9822. // int dot(int, int)
  9823. // NOTE: never called for scalar/vector1, this is turned into simple mul before this can be reached
  9824. const int componentCount = builder.getNumComponents(operands[0]);
  9825. spv::Id mulOp = builder.createBinOp(spv::Op::OpIMul, builder.getTypeId(operands[0]), operands[0], operands[1]);
  9826. builder.setPrecision(mulOp, precision);
  9827. id = builder.createCompositeExtract(mulOp, typeId, 0);
  9828. for (int i = 1; i < componentCount; ++i) {
  9829. builder.setPrecision(id, precision);
  9830. id = builder.createBinOp(spv::Op::OpIAdd, typeId, id, builder.createCompositeExtract(mulOp, typeId, i));
  9831. }
  9832. } else {
  9833. switch (consumedOperands) {
  9834. case 0:
  9835. // should all be handled by visitAggregate and createNoArgOperation
  9836. assert(0);
  9837. return 0;
  9838. case 1:
  9839. // should all be handled by createUnaryOperation
  9840. assert(0);
  9841. return 0;
  9842. case 2:
  9843. id = builder.createBinOp(opCode, typeId, operands[0], operands[1]);
  9844. break;
  9845. default:
  9846. // anything 3 or over doesn't have l-value operands, so all should be consumed
  9847. assert(consumedOperands == operands.size());
  9848. id = builder.createOp(opCode, typeId, operands);
  9849. break;
  9850. }
  9851. }
  9852. // Decode the return types that were structures
  9853. switch (op) {
  9854. case glslang::EOpAddCarry:
  9855. case glslang::EOpSubBorrow:
  9856. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);
  9857. id = builder.createCompositeExtract(id, typeId0, 0);
  9858. break;
  9859. case glslang::EOpUMulExtended:
  9860. case glslang::EOpIMulExtended:
  9861. builder.createStore(builder.createCompositeExtract(id, typeId0, 0), operands[3]);
  9862. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);
  9863. break;
  9864. case glslang::EOpModf:
  9865. {
  9866. assert(operands.size() == 2);
  9867. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[1]);
  9868. id = builder.createCompositeExtract(id, typeId0, 0);
  9869. }
  9870. break;
  9871. case glslang::EOpFrexp:
  9872. {
  9873. assert(operands.size() == 2);
  9874. if (builder.isFloatType(builder.getScalarTypeId(typeId1))) {
  9875. // "exp" is floating-point type (from HLSL intrinsic)
  9876. spv::Id member1 = builder.createCompositeExtract(id, frexpIntType, 1);
  9877. member1 = builder.createUnaryOp(spv::Op::OpConvertSToF, typeId1, member1);
  9878. builder.createStore(member1, operands[1]);
  9879. } else
  9880. // "exp" is integer type (from GLSL built-in function)
  9881. builder.createStore(builder.createCompositeExtract(id, frexpIntType, 1), operands[1]);
  9882. id = builder.createCompositeExtract(id, typeId0, 0);
  9883. }
  9884. break;
  9885. default:
  9886. break;
  9887. }
  9888. return builder.setPrecision(id, precision);
  9889. }
  9890. // Intrinsics with no arguments (or no return value, and no precision).
  9891. spv::Id TGlslangToSpvTraverser::createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId)
  9892. {
  9893. // GLSL memory barriers use queuefamily scope in new model, device scope in old model
  9894. spv::Scope memoryBarrierScope = glslangIntermediate->usingVulkanMemoryModel() ?
  9895. spv::Scope::QueueFamilyKHR : spv::Scope::Device;
  9896. switch (op) {
  9897. case glslang::EOpBarrier:
  9898. if (glslangIntermediate->getStage() == EShLangTessControl) {
  9899. if (glslangIntermediate->usingVulkanMemoryModel()) {
  9900. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
  9901. spv::MemorySemanticsMask::OutputMemoryKHR |
  9902. spv::MemorySemanticsMask::AcquireRelease);
  9903. builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
  9904. } else {
  9905. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Invocation, spv::MemorySemanticsMask::MaskNone);
  9906. }
  9907. } else {
  9908. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
  9909. spv::MemorySemanticsMask::WorkgroupMemory |
  9910. spv::MemorySemanticsMask::AcquireRelease);
  9911. }
  9912. return 0;
  9913. case glslang::EOpMemoryBarrier:
  9914. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsAllMemory |
  9915. spv::MemorySemanticsMask::AcquireRelease);
  9916. return 0;
  9917. case glslang::EOpMemoryBarrierBuffer:
  9918. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::UniformMemory |
  9919. spv::MemorySemanticsMask::AcquireRelease);
  9920. return 0;
  9921. case glslang::EOpMemoryBarrierShared:
  9922. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::WorkgroupMemory |
  9923. spv::MemorySemanticsMask::AcquireRelease);
  9924. return 0;
  9925. case glslang::EOpGroupMemoryBarrier:
  9926. builder.createMemoryBarrier(spv::Scope::Workgroup, spv::MemorySemanticsAllMemory |
  9927. spv::MemorySemanticsMask::AcquireRelease);
  9928. return 0;
  9929. case glslang::EOpMemoryBarrierAtomicCounter:
  9930. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::AtomicCounterMemory |
  9931. spv::MemorySemanticsMask::AcquireRelease);
  9932. return 0;
  9933. case glslang::EOpMemoryBarrierImage:
  9934. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::ImageMemory |
  9935. spv::MemorySemanticsMask::AcquireRelease);
  9936. return 0;
  9937. case glslang::EOpAllMemoryBarrierWithGroupSync:
  9938. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Device,
  9939. spv::MemorySemanticsAllMemory |
  9940. spv::MemorySemanticsMask::AcquireRelease);
  9941. return 0;
  9942. case glslang::EOpDeviceMemoryBarrier:
  9943. builder.createMemoryBarrier(spv::Scope::Device, spv::MemorySemanticsMask::UniformMemory |
  9944. spv::MemorySemanticsMask::ImageMemory |
  9945. spv::MemorySemanticsMask::AcquireRelease);
  9946. return 0;
  9947. case glslang::EOpDeviceMemoryBarrierWithGroupSync:
  9948. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Device, spv::MemorySemanticsMask::UniformMemory |
  9949. spv::MemorySemanticsMask::ImageMemory |
  9950. spv::MemorySemanticsMask::AcquireRelease);
  9951. return 0;
  9952. case glslang::EOpWorkgroupMemoryBarrier:
  9953. builder.createMemoryBarrier(spv::Scope::Workgroup, spv::MemorySemanticsMask::WorkgroupMemory |
  9954. spv::MemorySemanticsMask::AcquireRelease);
  9955. return 0;
  9956. case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:
  9957. builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
  9958. spv::MemorySemanticsMask::WorkgroupMemory |
  9959. spv::MemorySemanticsMask::AcquireRelease);
  9960. return 0;
  9961. case glslang::EOpSubgroupBarrier:
  9962. builder.createControlBarrier(spv::Scope::Subgroup, spv::Scope::Subgroup, spv::MemorySemanticsAllMemory |
  9963. spv::MemorySemanticsMask::AcquireRelease);
  9964. return spv::NoResult;
  9965. case glslang::EOpSubgroupMemoryBarrier:
  9966. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsAllMemory |
  9967. spv::MemorySemanticsMask::AcquireRelease);
  9968. return spv::NoResult;
  9969. case glslang::EOpSubgroupMemoryBarrierBuffer:
  9970. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::UniformMemory |
  9971. spv::MemorySemanticsMask::AcquireRelease);
  9972. return spv::NoResult;
  9973. case glslang::EOpSubgroupMemoryBarrierImage:
  9974. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::ImageMemory |
  9975. spv::MemorySemanticsMask::AcquireRelease);
  9976. return spv::NoResult;
  9977. case glslang::EOpSubgroupMemoryBarrierShared:
  9978. builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::WorkgroupMemory |
  9979. spv::MemorySemanticsMask::AcquireRelease);
  9980. return spv::NoResult;
  9981. case glslang::EOpEmitVertex:
  9982. builder.createNoResultOp(spv::Op::OpEmitVertex);
  9983. return 0;
  9984. case glslang::EOpEndPrimitive:
  9985. builder.createNoResultOp(spv::Op::OpEndPrimitive);
  9986. return 0;
  9987. case glslang::EOpSubgroupElect: {
  9988. std::vector<spv::Id> operands;
  9989. return createSubgroupOperation(op, typeId, operands, glslang::EbtVoid);
  9990. }
  9991. case glslang::EOpTime:
  9992. {
  9993. std::vector<spv::Id> args; // Dummy arguments
  9994. spv::Id id = builder.createBuiltinCall(typeId, getExtBuiltins(spv::E_SPV_AMD_gcn_shader), spv::TimeAMD, args);
  9995. return builder.setPrecision(id, precision);
  9996. }
  9997. case glslang::EOpIgnoreIntersectionNV:
  9998. builder.createNoResultOp(spv::Op::OpIgnoreIntersectionNV);
  9999. return 0;
  10000. case glslang::EOpTerminateRayNV:
  10001. builder.createNoResultOp(spv::Op::OpTerminateRayNV);
  10002. return 0;
  10003. case glslang::EOpRayQueryInitialize:
  10004. builder.createNoResultOp(spv::Op::OpRayQueryInitializeKHR);
  10005. return 0;
  10006. case glslang::EOpRayQueryTerminate:
  10007. builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR);
  10008. return 0;
  10009. case glslang::EOpRayQueryGenerateIntersection:
  10010. builder.createNoResultOp(spv::Op::OpRayQueryGenerateIntersectionKHR);
  10011. return 0;
  10012. case glslang::EOpRayQueryConfirmIntersection:
  10013. builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR);
  10014. return 0;
  10015. case glslang::EOpBeginInvocationInterlock:
  10016. builder.createNoResultOp(spv::Op::OpBeginInvocationInterlockEXT);
  10017. return 0;
  10018. case glslang::EOpEndInvocationInterlock:
  10019. builder.createNoResultOp(spv::Op::OpEndInvocationInterlockEXT);
  10020. return 0;
  10021. case glslang::EOpIsHelperInvocation:
  10022. {
  10023. std::vector<spv::Id> args; // Dummy arguments
  10024. builder.addExtension(spv::E_SPV_EXT_demote_to_helper_invocation);
  10025. builder.addCapability(spv::Capability::DemoteToHelperInvocationEXT);
  10026. return builder.createOp(spv::Op::OpIsHelperInvocationEXT, typeId, args);
  10027. }
  10028. case glslang::EOpReadClockSubgroupKHR: {
  10029. std::vector<spv::Id> args;
  10030. args.push_back(builder.makeUintConstant(spv::Scope::Subgroup));
  10031. builder.addExtension(spv::E_SPV_KHR_shader_clock);
  10032. builder.addCapability(spv::Capability::ShaderClockKHR);
  10033. return builder.createOp(spv::Op::OpReadClockKHR, typeId, args);
  10034. }
  10035. case glslang::EOpReadClockDeviceKHR: {
  10036. std::vector<spv::Id> args;
  10037. args.push_back(builder.makeUintConstant(spv::Scope::Device));
  10038. builder.addExtension(spv::E_SPV_KHR_shader_clock);
  10039. builder.addCapability(spv::Capability::ShaderClockKHR);
  10040. return builder.createOp(spv::Op::OpReadClockKHR, typeId, args);
  10041. }
  10042. case glslang::EOpStencilAttachmentReadEXT:
  10043. case glslang::EOpDepthAttachmentReadEXT:
  10044. {
  10045. builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
  10046. spv::Decoration precision;
  10047. spv::Op spv_op;
  10048. if (op == glslang::EOpStencilAttachmentReadEXT)
  10049. {
  10050. precision = spv::Decoration::RelaxedPrecision;
  10051. spv_op = spv::Op::OpStencilAttachmentReadEXT;
  10052. builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
  10053. }
  10054. else
  10055. {
  10056. precision = spv::NoPrecision;
  10057. spv_op = spv::Op::OpDepthAttachmentReadEXT;
  10058. builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
  10059. }
  10060. std::vector<spv::Id> args; // Dummy args
  10061. spv::Id result = builder.createOp(spv_op, typeId, args);
  10062. return builder.setPrecision(result, precision);
  10063. }
  10064. default:
  10065. break;
  10066. }
  10067. logger->missingFunctionality("unknown operation with no arguments");
  10068. return 0;
  10069. }
  10070. spv::Id TGlslangToSpvTraverser::getSymbolId(const glslang::TIntermSymbol* symbol)
  10071. {
  10072. auto iter = symbolValues.find(symbol->getId());
  10073. spv::Id id;
  10074. if (symbolValues.end() != iter) {
  10075. id = iter->second;
  10076. return id;
  10077. }
  10078. // it was not found, create it
  10079. spv::BuiltIn builtIn = TranslateBuiltInDecoration(symbol->getQualifier().builtIn, false);
  10080. auto forcedType = getForcedType(symbol->getQualifier().builtIn, symbol->getType());
  10081. // There are pairs of symbols that map to the same SPIR-V built-in:
  10082. // gl_ObjectToWorldEXT and gl_ObjectToWorld3x4EXT, and gl_WorldToObjectEXT
  10083. // and gl_WorldToObject3x4EXT. SPIR-V forbids having two OpVariables
  10084. // with the same BuiltIn in the same storage class, so we must re-use one.
  10085. const bool mayNeedToReuseBuiltIn =
  10086. builtIn == spv::BuiltIn::ObjectToWorldKHR ||
  10087. builtIn == spv::BuiltIn::WorldToObjectKHR;
  10088. // EXT_descriptor_heap
  10089. const bool needToRemapDescHeap =
  10090. builtIn == spv::BuiltIn::ResourceHeapEXT || builtIn == spv::BuiltIn::SamplerHeapEXT;
  10091. if (mayNeedToReuseBuiltIn || needToRemapDescHeap) {
  10092. auto iter = builtInVariableIds.find(uint32_t(builtIn));
  10093. if (builtInVariableIds.end() != iter) {
  10094. id = iter->second;
  10095. symbolValues[symbol->getId()] = id;
  10096. if (forcedType.second != spv::NoType)
  10097. forceType[id] = forcedType.second;
  10098. return id;
  10099. }
  10100. }
  10101. if (symbol->getBasicType() == glslang::EbtFunction) {
  10102. return 0;
  10103. }
  10104. id = createSpvVariable(symbol, forcedType.first);
  10105. if (mayNeedToReuseBuiltIn) {
  10106. builtInVariableIds.insert({uint32_t(builtIn), id});
  10107. }
  10108. symbolValues[symbol->getId()] = id;
  10109. if (forcedType.second != spv::NoType)
  10110. forceType[id] = forcedType.second;
  10111. if (symbol->getBasicType() != glslang::EbtBlock) {
  10112. builder.addDecoration(id, TranslatePrecisionDecoration(symbol->getType()));
  10113. builder.addDecoration(id, TranslateInterpolationDecoration(symbol->getType().getQualifier()));
  10114. builder.addDecoration(id, TranslateAuxiliaryStorageDecoration(symbol->getType().getQualifier()));
  10115. addMeshNVDecoration(id, /*member*/ -1, symbol->getType().getQualifier());
  10116. if (symbol->getQualifier().hasComponent())
  10117. builder.addDecoration(id, spv::Decoration::Component, symbol->getQualifier().layoutComponent);
  10118. if (symbol->getQualifier().hasIndex())
  10119. builder.addDecoration(id, spv::Decoration::Index, symbol->getQualifier().layoutIndex);
  10120. if (symbol->getType().getQualifier().hasSpecConstantId())
  10121. builder.addDecoration(id, spv::Decoration::SpecId, symbol->getType().getQualifier().layoutSpecConstantId);
  10122. // atomic counters use this:
  10123. if (symbol->getQualifier().hasOffset())
  10124. builder.addDecoration(id, spv::Decoration::Offset, symbol->getQualifier().layoutOffset);
  10125. }
  10126. if (symbol->getQualifier().hasLocation()) {
  10127. if (!(glslangIntermediate->isRayTracingStage() &&
  10128. (glslangIntermediate->IsRequestedExtension(glslang::E_GL_EXT_ray_tracing) ||
  10129. glslangIntermediate->IsRequestedExtension(glslang::E_GL_NV_shader_invocation_reorder) ||
  10130. glslangIntermediate->IsRequestedExtension(glslang::E_GL_EXT_shader_invocation_reorder))
  10131. && (builder.getStorageClass(id) == spv::StorageClass::RayPayloadKHR ||
  10132. builder.getStorageClass(id) == spv::StorageClass::IncomingRayPayloadKHR ||
  10133. builder.getStorageClass(id) == spv::StorageClass::CallableDataKHR ||
  10134. builder.getStorageClass(id) == spv::StorageClass::IncomingCallableDataKHR ||
  10135. builder.getStorageClass(id) == spv::StorageClass::HitObjectAttributeEXT ||
  10136. builder.getStorageClass(id) == spv::StorageClass::HitObjectAttributeNV))) {
  10137. // Location values are used to link TraceRayKHR/ExecuteCallableKHR/HitObjectGetAttributesNV
  10138. // to corresponding variables but are not valid in SPIRV since they are supported only
  10139. // for Input/Output Storage classes.
  10140. builder.addDecoration(id, spv::Decoration::Location, symbol->getQualifier().layoutLocation);
  10141. }
  10142. }
  10143. builder.addDecoration(id, TranslateInvariantDecoration(symbol->getType().getQualifier()));
  10144. if (symbol->getQualifier().hasStream() && glslangIntermediate->isMultiStream()) {
  10145. builder.addCapability(spv::Capability::GeometryStreams);
  10146. builder.addDecoration(id, spv::Decoration::Stream, symbol->getQualifier().layoutStream);
  10147. }
  10148. if (symbol->getQualifier().hasSet())
  10149. builder.addDecoration(id, spv::Decoration::DescriptorSet, symbol->getQualifier().layoutSet);
  10150. else if (IsDescriptorResource(symbol->getType())) {
  10151. // default to 0
  10152. builder.addDecoration(id, spv::Decoration::DescriptorSet, 0);
  10153. }
  10154. if (symbol->getQualifier().hasBinding())
  10155. builder.addDecoration(id, spv::Decoration::Binding, symbol->getQualifier().layoutBinding);
  10156. else if (IsDescriptorResource(symbol->getType())) {
  10157. // default to 0
  10158. builder.addDecoration(id, spv::Decoration::Binding, 0);
  10159. }
  10160. if (symbol->getQualifier().hasAttachment())
  10161. builder.addDecoration(id, spv::Decoration::InputAttachmentIndex, symbol->getQualifier().layoutAttachment);
  10162. if (glslangIntermediate->getXfbMode()) {
  10163. builder.addCapability(spv::Capability::TransformFeedback);
  10164. if (symbol->getQualifier().hasXfbBuffer()) {
  10165. builder.addDecoration(id, spv::Decoration::XfbBuffer, symbol->getQualifier().layoutXfbBuffer);
  10166. unsigned stride = glslangIntermediate->getXfbStride(symbol->getQualifier().layoutXfbBuffer);
  10167. if (stride != glslang::TQualifier::layoutXfbStrideEnd)
  10168. builder.addDecoration(id, spv::Decoration::XfbStride, stride);
  10169. }
  10170. if (symbol->getQualifier().hasXfbOffset())
  10171. builder.addDecoration(id, spv::Decoration::Offset, symbol->getQualifier().layoutXfbOffset);
  10172. }
  10173. // add built-in variable decoration
  10174. if (builtIn != spv::BuiltIn::Max) {
  10175. // WorkgroupSize deprecated in spirv1.6
  10176. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_6 ||
  10177. builtIn != spv::BuiltIn::WorkgroupSize)
  10178. builder.addDecoration(id, spv::Decoration::BuiltIn, (int)builtIn);
  10179. }
  10180. // Add volatile decoration to HelperInvocation for spirv1.6 and beyond
  10181. if (builtIn == spv::BuiltIn::HelperInvocation &&
  10182. !glslangIntermediate->usingVulkanMemoryModel() &&
  10183. glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
  10184. builder.addDecoration(id, spv::Decoration::Volatile);
  10185. }
  10186. // Subgroup builtins which have input storage class are volatile for ray tracing stages.
  10187. if (symbol->getType().isImage() || symbol->getQualifier().isPipeInput()) {
  10188. std::vector<spv::Decoration> memory;
  10189. TranslateMemoryDecoration(symbol->getType().getQualifier(), memory,
  10190. glslangIntermediate->usingVulkanMemoryModel());
  10191. for (unsigned int i = 0; i < memory.size(); ++i)
  10192. builder.addDecoration(id, memory[i]);
  10193. }
  10194. if (builtIn == spv::BuiltIn::SampleMask) {
  10195. spv::Decoration decoration;
  10196. // GL_NV_sample_mask_override_coverage extension
  10197. if (glslangIntermediate->getLayoutOverrideCoverage())
  10198. decoration = spv::Decoration::OverrideCoverageNV;
  10199. else
  10200. decoration = spv::Decoration::Max;
  10201. builder.addDecoration(id, decoration);
  10202. if (decoration != spv::Decoration::Max) {
  10203. builder.addCapability(spv::Capability::SampleMaskOverrideCoverageNV);
  10204. builder.addExtension(spv::E_SPV_NV_sample_mask_override_coverage);
  10205. }
  10206. }
  10207. else if (builtIn == spv::BuiltIn::Layer) {
  10208. // SPV_NV_viewport_array2 extension
  10209. if (symbol->getQualifier().layoutViewportRelative) {
  10210. builder.addDecoration(id, spv::Decoration::ViewportRelativeNV);
  10211. builder.addCapability(spv::Capability::ShaderViewportMaskNV);
  10212. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  10213. }
  10214. if (symbol->getQualifier().layoutSecondaryViewportRelativeOffset != -2048) {
  10215. builder.addDecoration(id, spv::Decoration::SecondaryViewportRelativeNV,
  10216. symbol->getQualifier().layoutSecondaryViewportRelativeOffset);
  10217. builder.addCapability(spv::Capability::ShaderStereoViewNV);
  10218. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  10219. }
  10220. }
  10221. if (symbol->getQualifier().layoutPassthrough) {
  10222. builder.addDecoration(id, spv::Decoration::PassthroughNV);
  10223. builder.addCapability(spv::Capability::GeometryShaderPassthroughNV);
  10224. builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);
  10225. }
  10226. if (symbol->getQualifier().pervertexNV) {
  10227. builder.addDecoration(id, spv::Decoration::PerVertexNV);
  10228. builder.addCapability(spv::Capability::FragmentBarycentricNV);
  10229. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  10230. }
  10231. if (symbol->getQualifier().pervertexEXT) {
  10232. builder.addDecoration(id, spv::Decoration::PerVertexKHR);
  10233. builder.addCapability(spv::Capability::FragmentBarycentricKHR);
  10234. builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
  10235. }
  10236. if (glslangIntermediate->getHlslFunctionality1() && symbol->getType().getQualifier().semanticName != nullptr) {
  10237. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  10238. builder.addDecoration(id, spv::Decoration::HlslSemanticGOOGLE,
  10239. symbol->getType().getQualifier().semanticName);
  10240. }
  10241. if (symbol->isReference()) {
  10242. builder.addDecoration(id, symbol->getType().getQualifier().restrict ?
  10243. spv::Decoration::RestrictPointerEXT : spv::Decoration::AliasedPointerEXT);
  10244. }
  10245. // Add SPIR-V decorations (GL_EXT_spirv_intrinsics)
  10246. if (symbol->getType().getQualifier().hasSpirvDecorate())
  10247. applySpirvDecorate(symbol->getType(), id, {});
  10248. if (symbol->getQualifier().hasBank()) {
  10249. builder.addExtension(spv::E_SPV_NV_push_constant_bank);
  10250. builder.addCapability(spv::Capability::PushConstantBanksNV);
  10251. builder.addDecoration(id, spv::Decoration::BankNV, symbol->getQualifier().layoutBank);
  10252. }
  10253. if (symbol->getQualifier().hasMemberOffset()) {
  10254. builder.addExtension(spv::E_SPV_NV_push_constant_bank);
  10255. builder.addCapability(spv::Capability::PushConstantBanksNV);
  10256. builder.addDecoration(id, spv::Decoration::MemberOffsetNV, symbol->getQualifier().layoutMemberOffset);
  10257. }
  10258. return id;
  10259. }
  10260. // add per-primitive, per-view. per-task decorations to a struct member (member >= 0) or an object
  10261. void TGlslangToSpvTraverser::addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier& qualifier)
  10262. {
  10263. bool isMeshShaderExt = (glslangIntermediate->getRequestedExtensions().find(glslang::E_GL_EXT_mesh_shader) !=
  10264. glslangIntermediate->getRequestedExtensions().end());
  10265. if (member >= 0) {
  10266. if (qualifier.perPrimitiveNV) {
  10267. // Need to add capability/extension for fragment shader.
  10268. // Mesh shader already adds this by default.
  10269. if (glslangIntermediate->getStage() == EShLangFragment) {
  10270. if(isMeshShaderExt) {
  10271. builder.addCapability(spv::Capability::MeshShadingEXT);
  10272. builder.addExtension(spv::E_SPV_EXT_mesh_shader);
  10273. } else {
  10274. builder.addCapability(spv::Capability::MeshShadingNV);
  10275. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  10276. }
  10277. }
  10278. builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerPrimitiveNV);
  10279. }
  10280. if (qualifier.perViewNV)
  10281. builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerViewNV);
  10282. if (qualifier.perTaskNV)
  10283. builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerTaskNV);
  10284. } else {
  10285. if (qualifier.perPrimitiveNV) {
  10286. // Need to add capability/extension for fragment shader.
  10287. // Mesh shader already adds this by default.
  10288. if (glslangIntermediate->getStage() == EShLangFragment) {
  10289. if(isMeshShaderExt) {
  10290. builder.addCapability(spv::Capability::MeshShadingEXT);
  10291. builder.addExtension(spv::E_SPV_EXT_mesh_shader);
  10292. } else {
  10293. builder.addCapability(spv::Capability::MeshShadingNV);
  10294. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  10295. }
  10296. }
  10297. builder.addDecoration(id, spv::Decoration::PerPrimitiveNV);
  10298. }
  10299. if (qualifier.perViewNV)
  10300. builder.addDecoration(id, spv::Decoration::PerViewNV);
  10301. if (qualifier.perTaskNV)
  10302. builder.addDecoration(id, spv::Decoration::PerTaskNV);
  10303. }
  10304. }
  10305. bool TGlslangToSpvTraverser::hasQCOMImageProceessingDecoration(spv::Id id, spv::Decoration decor)
  10306. {
  10307. std::vector<spv::Decoration> &decoVec = idToQCOMDecorations[id];
  10308. for ( auto d : decoVec ) {
  10309. if ( d == decor )
  10310. return true;
  10311. }
  10312. return false;
  10313. }
  10314. void TGlslangToSpvTraverser::addImageProcessingQCOMDecoration(spv::Id id, spv::Decoration decor)
  10315. {
  10316. spv::Op opc = builder.getOpCode(id);
  10317. if (opc == spv::Op::OpSampledImage) {
  10318. id = builder.getIdOperand(id, 0);
  10319. opc = builder.getOpCode(id);
  10320. }
  10321. if (opc == spv::Op::OpLoad) {
  10322. spv::Id texid = builder.getIdOperand(id, 0);
  10323. if (!hasQCOMImageProceessingDecoration(texid, decor)) {//
  10324. builder.addDecoration(texid, decor);
  10325. idToQCOMDecorations[texid].push_back(decor);
  10326. }
  10327. }
  10328. }
  10329. void TGlslangToSpvTraverser::addImageProcessing2QCOMDecoration(spv::Id id, bool isForGather)
  10330. {
  10331. if (isForGather) {
  10332. return addImageProcessingQCOMDecoration(id, spv::Decoration::BlockMatchTextureQCOM);
  10333. }
  10334. auto addDecor =
  10335. [this](spv::Id id, spv::Decoration decor) {
  10336. spv::Op tsopc = this->builder.getOpCode(id);
  10337. if (tsopc == spv::Op::OpLoad) {
  10338. spv::Id tsid = this->builder.getIdOperand(id, 0);
  10339. if (this->glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
  10340. assert(iOSet.count(tsid) > 0);
  10341. }
  10342. if (!hasQCOMImageProceessingDecoration(tsid, decor)) {
  10343. this->builder.addDecoration(tsid, decor);
  10344. idToQCOMDecorations[tsid].push_back(decor);
  10345. }
  10346. }
  10347. };
  10348. spv::Op opc = builder.getOpCode(id);
  10349. bool isInterfaceObject = (opc != spv::Op::OpSampledImage);
  10350. if (!isInterfaceObject) {
  10351. addDecor(builder.getIdOperand(id, 0), spv::Decoration::BlockMatchTextureQCOM);
  10352. addDecor(builder.getIdOperand(id, 1), spv::Decoration::BlockMatchSamplerQCOM);
  10353. } else {
  10354. addDecor(id, spv::Decoration::BlockMatchTextureQCOM);
  10355. addDecor(id, spv::Decoration::BlockMatchSamplerQCOM);
  10356. }
  10357. }
  10358. // Make a full tree of instructions to build a SPIR-V specialization constant,
  10359. // or regular constant if possible.
  10360. //
  10361. // TBD: this is not yet done, nor verified to be the best design, it does do the leaf symbols though
  10362. //
  10363. // Recursively walk the nodes. The nodes form a tree whose leaves are
  10364. // regular constants, which themselves are trees that createSpvConstant()
  10365. // recursively walks. So, this function walks the "top" of the tree:
  10366. // - emit specialization constant-building instructions for specConstant
  10367. // - when running into a non-spec-constant, switch to createSpvConstant()
  10368. spv::Id TGlslangToSpvTraverser::createSpvConstant(const glslang::TIntermTyped& node)
  10369. {
  10370. assert(node.getQualifier().isConstant());
  10371. // Handle front-end constants first (non-specialization constants).
  10372. if (! node.getQualifier().specConstant) {
  10373. // hand off to the non-spec-constant path
  10374. assert(node.getAsConstantUnion() != nullptr || node.getAsSymbolNode() != nullptr);
  10375. int nextConst = 0;
  10376. return createSpvConstantFromConstUnionArray(node.getType(), node.getAsConstantUnion() ?
  10377. node.getAsConstantUnion()->getConstArray() : node.getAsSymbolNode()->getConstArray(),
  10378. nextConst, false);
  10379. }
  10380. // We now know we have a specialization constant to build
  10381. // Extra capabilities may be needed.
  10382. if (node.getType().contains8BitInt())
  10383. builder.addCapability(spv::Capability::Int8);
  10384. if (node.getType().contains16BitFloat())
  10385. builder.addCapability(spv::Capability::Float16);
  10386. if (node.getType().contains16BitInt())
  10387. builder.addCapability(spv::Capability::Int16);
  10388. if (node.getType().contains64BitInt())
  10389. builder.addCapability(spv::Capability::Int64);
  10390. if (node.getType().containsDouble())
  10391. builder.addCapability(spv::Capability::Float64);
  10392. // gl_WorkGroupSize is a special case until the front-end handles hierarchical specialization constants,
  10393. // even then, it's specialization ids are handled by special case syntax in GLSL: layout(local_size_x = ...
  10394. if (node.getType().getQualifier().builtIn == glslang::EbvWorkGroupSize) {
  10395. std::vector<spv::Id> dimConstId;
  10396. for (int dim = 0; dim < 3; ++dim) {
  10397. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  10398. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  10399. if (specConst) {
  10400. builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
  10401. glslangIntermediate->getLocalSizeSpecId(dim));
  10402. }
  10403. }
  10404. return builder.makeCompositeConstant(builder.makeVectorType(builder.makeUintType(32), 3), dimConstId, true);
  10405. }
  10406. // An AST node labelled as specialization constant should be a symbol node.
  10407. // Its initializer should either be a sub tree with constant nodes, or a constant union array.
  10408. if (auto* sn = node.getAsSymbolNode()) {
  10409. spv::Id result;
  10410. if (auto* sub_tree = sn->getConstSubtree()) {
  10411. // Traverse the constant constructor sub tree like generating normal run-time instructions.
  10412. // During the AST traversal, if the node is marked as 'specConstant', SpecConstantOpModeGuard
  10413. // will set the builder into spec constant op instruction generating mode.
  10414. sub_tree->traverse(this);
  10415. result = accessChainLoad(sub_tree->getType());
  10416. } else if (auto* const_union_array = &sn->getConstArray()) {
  10417. int nextConst = 0;
  10418. result = createSpvConstantFromConstUnionArray(sn->getType(), *const_union_array, nextConst, true);
  10419. } else {
  10420. logger->missingFunctionality("Invalid initializer for spec constant.");
  10421. return spv::NoResult;
  10422. }
  10423. builder.addName(result, sn->getName().c_str());
  10424. return result;
  10425. }
  10426. // Neither a front-end constant node, nor a specialization constant node with constant union array or
  10427. // constant sub tree as initializer.
  10428. logger->missingFunctionality("Neither a front-end constant nor a spec constant.");
  10429. return spv::NoResult;
  10430. }
  10431. // Use 'consts' as the flattened glslang source of scalar constants to recursively
  10432. // build the aggregate SPIR-V constant.
  10433. //
  10434. // If there are not enough elements present in 'consts', 0 will be substituted;
  10435. // an empty 'consts' can be used to create a fully zeroed SPIR-V constant.
  10436. //
  10437. spv::Id TGlslangToSpvTraverser::createSpvConstantFromConstUnionArray(const glslang::TType& glslangType,
  10438. const glslang::TConstUnionArray& consts, int& nextConst, bool specConstant)
  10439. {
  10440. // vector of constants for SPIR-V
  10441. std::vector<spv::Id> spvConsts;
  10442. // Type is used for struct and array constants
  10443. spv::Id typeId = convertGlslangToSpvType(glslangType);
  10444. if (glslangType.isArray()) {
  10445. glslang::TType elementType(glslangType, 0);
  10446. for (int i = 0; i < glslangType.getOuterArraySize(); ++i)
  10447. spvConsts.push_back(createSpvConstantFromConstUnionArray(elementType, consts, nextConst, false));
  10448. } else if (glslangType.isMatrix()) {
  10449. glslang::TType vectorType(glslangType, 0);
  10450. for (int col = 0; col < glslangType.getMatrixCols(); ++col)
  10451. spvConsts.push_back(createSpvConstantFromConstUnionArray(vectorType, consts, nextConst, false));
  10452. } else if (glslangType.isCoopMat()) {
  10453. glslang::TType componentType(glslangType.getBasicType());
  10454. spvConsts.push_back(createSpvConstantFromConstUnionArray(componentType, consts, nextConst, false));
  10455. } else if (glslangType.isStruct()) {
  10456. glslang::TVector<glslang::TTypeLoc>::const_iterator iter;
  10457. for (iter = glslangType.getStruct()->begin(); iter != glslangType.getStruct()->end(); ++iter)
  10458. spvConsts.push_back(createSpvConstantFromConstUnionArray(*iter->type, consts, nextConst, false));
  10459. } else if (glslangType.getVectorSize() > 1 || glslangType.isCoopVecOrLongVector()) {
  10460. unsigned int numComponents = glslangType.isCoopVecOrLongVector() ? glslangType.getTypeParameters()->arraySizes->getDimSize(0) : glslangType.getVectorSize();
  10461. for (unsigned int i = 0; i < numComponents; ++i) {
  10462. bool zero = nextConst >= consts.size();
  10463. switch (glslangType.getBasicType()) {
  10464. case glslang::EbtInt:
  10465. spvConsts.push_back(builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst()));
  10466. break;
  10467. case glslang::EbtUint:
  10468. spvConsts.push_back(builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst()));
  10469. break;
  10470. case glslang::EbtFloat:
  10471. spvConsts.push_back(builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  10472. break;
  10473. case glslang::EbtBool:
  10474. spvConsts.push_back(builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst()));
  10475. break;
  10476. case glslang::EbtInt8:
  10477. builder.addCapability(spv::Capability::Int8);
  10478. spvConsts.push_back(builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const()));
  10479. break;
  10480. case glslang::EbtUint8:
  10481. builder.addCapability(spv::Capability::Int8);
  10482. spvConsts.push_back(builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const()));
  10483. break;
  10484. case glslang::EbtInt16:
  10485. builder.addCapability(spv::Capability::Int16);
  10486. spvConsts.push_back(builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const()));
  10487. break;
  10488. case glslang::EbtUint16:
  10489. builder.addCapability(spv::Capability::Int16);
  10490. spvConsts.push_back(builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const()));
  10491. break;
  10492. case glslang::EbtInt64:
  10493. spvConsts.push_back(builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const()));
  10494. break;
  10495. case glslang::EbtUint64:
  10496. spvConsts.push_back(builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const()));
  10497. break;
  10498. case glslang::EbtDouble:
  10499. spvConsts.push_back(builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst()));
  10500. break;
  10501. case glslang::EbtFloat16:
  10502. builder.addCapability(spv::Capability::Float16);
  10503. spvConsts.push_back(builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  10504. break;
  10505. case glslang::EbtBFloat16:
  10506. spvConsts.push_back(builder.makeBFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  10507. break;
  10508. case glslang::EbtFloatE5M2:
  10509. spvConsts.push_back(builder.makeFloatE5M2Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  10510. break;
  10511. case glslang::EbtFloatE4M3:
  10512. spvConsts.push_back(builder.makeFloatE4M3Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  10513. break;
  10514. default:
  10515. assert(0);
  10516. break;
  10517. }
  10518. ++nextConst;
  10519. }
  10520. } else {
  10521. // we have a non-aggregate (scalar) constant
  10522. bool zero = nextConst >= consts.size();
  10523. spv::Id scalar = 0;
  10524. switch (glslangType.getBasicType()) {
  10525. case glslang::EbtInt:
  10526. scalar = builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst(), specConstant);
  10527. break;
  10528. case glslang::EbtUint:
  10529. scalar = builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst(), specConstant);
  10530. break;
  10531. case glslang::EbtFloat:
  10532. scalar = builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  10533. break;
  10534. case glslang::EbtBool:
  10535. scalar = builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst(), specConstant);
  10536. break;
  10537. case glslang::EbtInt8:
  10538. builder.addCapability(spv::Capability::Int8);
  10539. scalar = builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const(), specConstant);
  10540. break;
  10541. case glslang::EbtUint8:
  10542. builder.addCapability(spv::Capability::Int8);
  10543. scalar = builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const(), specConstant);
  10544. break;
  10545. case glslang::EbtInt16:
  10546. builder.addCapability(spv::Capability::Int16);
  10547. scalar = builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const(), specConstant);
  10548. break;
  10549. case glslang::EbtUint16:
  10550. builder.addCapability(spv::Capability::Int16);
  10551. scalar = builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const(), specConstant);
  10552. break;
  10553. case glslang::EbtInt64:
  10554. scalar = builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const(), specConstant);
  10555. break;
  10556. case glslang::EbtUint64:
  10557. scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);
  10558. break;
  10559. case glslang::EbtDouble:
  10560. scalar = builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst(), specConstant);
  10561. break;
  10562. case glslang::EbtFloat16:
  10563. builder.addCapability(spv::Capability::Float16);
  10564. scalar = builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  10565. break;
  10566. case glslang::EbtBFloat16:
  10567. scalar = builder.makeBFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  10568. break;
  10569. case glslang::EbtFloatE5M2:
  10570. scalar = builder.makeFloatE5M2Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  10571. break;
  10572. case glslang::EbtFloatE4M3:
  10573. scalar = builder.makeFloatE4M3Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  10574. break;
  10575. case glslang::EbtReference:
  10576. scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);
  10577. scalar = builder.createUnaryOp(spv::Op::OpBitcast, typeId, scalar);
  10578. break;
  10579. case glslang::EbtString:
  10580. scalar = builder.getStringId(consts[nextConst].getSConst()->c_str());
  10581. break;
  10582. default:
  10583. assert(0);
  10584. break;
  10585. }
  10586. ++nextConst;
  10587. return scalar;
  10588. }
  10589. return builder.makeCompositeConstant(typeId, spvConsts);
  10590. }
  10591. // Return true if the node is a constant or symbol whose reading has no
  10592. // non-trivial observable cost or effect.
  10593. bool TGlslangToSpvTraverser::isTrivialLeaf(const glslang::TIntermTyped* node)
  10594. {
  10595. // don't know what this is
  10596. if (node == nullptr)
  10597. return false;
  10598. // a constant is safe
  10599. if (node->getAsConstantUnion() != nullptr)
  10600. return true;
  10601. // not a symbol means non-trivial
  10602. if (node->getAsSymbolNode() == nullptr)
  10603. return false;
  10604. // a symbol, depends on what's being read
  10605. switch (node->getType().getQualifier().storage) {
  10606. case glslang::EvqTemporary:
  10607. case glslang::EvqGlobal:
  10608. case glslang::EvqIn:
  10609. case glslang::EvqInOut:
  10610. case glslang::EvqConst:
  10611. case glslang::EvqConstReadOnly:
  10612. case glslang::EvqUniform:
  10613. return true;
  10614. default:
  10615. return false;
  10616. }
  10617. }
  10618. // A node is trivial if it is a single operation with no side effects.
  10619. // HLSL (and/or vectors) are always trivial, as it does not short circuit.
  10620. // Otherwise, error on the side of saying non-trivial.
  10621. // Return true if trivial.
  10622. bool TGlslangToSpvTraverser::isTrivial(const glslang::TIntermTyped* node)
  10623. {
  10624. if (node == nullptr)
  10625. return false;
  10626. // count non scalars as trivial, as well as anything coming from HLSL
  10627. if (! node->getType().isScalarOrVec1() || glslangIntermediate->getSource() == glslang::EShSourceHlsl)
  10628. return true;
  10629. // symbols and constants are trivial
  10630. if (isTrivialLeaf(node))
  10631. return true;
  10632. // otherwise, it needs to be a simple operation or one or two leaf nodes
  10633. // not a simple operation
  10634. const glslang::TIntermBinary* binaryNode = node->getAsBinaryNode();
  10635. const glslang::TIntermUnary* unaryNode = node->getAsUnaryNode();
  10636. if (binaryNode == nullptr && unaryNode == nullptr)
  10637. return false;
  10638. // not on leaf nodes
  10639. if (binaryNode && (! isTrivialLeaf(binaryNode->getLeft()) || ! isTrivialLeaf(binaryNode->getRight())))
  10640. return false;
  10641. if (unaryNode && ! isTrivialLeaf(unaryNode->getOperand())) {
  10642. return false;
  10643. }
  10644. if (IsOpNumericConv(node->getAsOperator()->getOp()) &&
  10645. node->getType().getBasicType() == glslang::EbtBool) {
  10646. return true;
  10647. }
  10648. switch (node->getAsOperator()->getOp()) {
  10649. case glslang::EOpLogicalNot:
  10650. case glslang::EOpEqual:
  10651. case glslang::EOpNotEqual:
  10652. case glslang::EOpLessThan:
  10653. case glslang::EOpGreaterThan:
  10654. case glslang::EOpLessThanEqual:
  10655. case glslang::EOpGreaterThanEqual:
  10656. case glslang::EOpIndexDirect:
  10657. case glslang::EOpIndexDirectStruct:
  10658. case glslang::EOpLogicalXor:
  10659. case glslang::EOpAny:
  10660. case glslang::EOpAll:
  10661. return true;
  10662. default:
  10663. return false;
  10664. }
  10665. }
  10666. // Emit short-circuiting code, where 'right' is never evaluated unless
  10667. // the left side is true (for &&) or false (for ||).
  10668. spv::Id TGlslangToSpvTraverser::createShortCircuit(glslang::TOperator op, glslang::TIntermTyped& left,
  10669. glslang::TIntermTyped& right)
  10670. {
  10671. spv::Id boolTypeId = builder.makeBoolType();
  10672. // emit left operand
  10673. builder.clearAccessChain();
  10674. left.traverse(this);
  10675. spv::Id leftId = accessChainLoad(left.getType());
  10676. // Operands to accumulate OpPhi operands
  10677. std::vector<spv::Id> phiOperands;
  10678. phiOperands.reserve(4);
  10679. // accumulate left operand's phi information
  10680. phiOperands.push_back(leftId);
  10681. phiOperands.push_back(builder.getBuildPoint()->getId());
  10682. // Make the two kinds of operation symmetric with a "!"
  10683. // || => emit "if (! left) result = right"
  10684. // && => emit "if ( left) result = right"
  10685. //
  10686. // TODO: this runtime "not" for || could be avoided by adding functionality
  10687. // to 'builder' to have an "else" without an "then"
  10688. if (op == glslang::EOpLogicalOr)
  10689. leftId = builder.createUnaryOp(spv::Op::OpLogicalNot, boolTypeId, leftId);
  10690. // make an "if" based on the left value
  10691. spv::Builder::If ifBuilder(leftId, spv::SelectionControlMask::MaskNone, builder);
  10692. // emit right operand as the "then" part of the "if"
  10693. builder.clearAccessChain();
  10694. right.traverse(this);
  10695. spv::Id rightId = accessChainLoad(right.getType());
  10696. // accumulate left operand's phi information
  10697. phiOperands.push_back(rightId);
  10698. phiOperands.push_back(builder.getBuildPoint()->getId());
  10699. // finish the "if"
  10700. ifBuilder.makeEndIf();
  10701. // phi together the two results
  10702. return builder.createOp(spv::Op::OpPhi, boolTypeId, phiOperands);
  10703. }
  10704. // Return type Id of the imported set of extended instructions corresponds to the name.
  10705. // Import this set if it has not been imported yet.
  10706. spv::Id TGlslangToSpvTraverser::getExtBuiltins(const char* name)
  10707. {
  10708. if (extBuiltinMap.find(name) != extBuiltinMap.end())
  10709. return extBuiltinMap[name];
  10710. else {
  10711. spv::Id extBuiltins = builder.import(name);
  10712. extBuiltinMap[name] = extBuiltins;
  10713. return extBuiltins;
  10714. }
  10715. }
  10716. } // end anonymous namespace
  10717. namespace glslang {
  10718. void GetSpirvVersion(std::string& version)
  10719. {
  10720. const int bufSize = 100;
  10721. char buf[bufSize];
  10722. snprintf(buf, bufSize, "0x%08x, Revision %d", spv::Version, spv::Revision);
  10723. version = buf;
  10724. }
  // For the low-order part of the generator's magic number. Bump up
  // when there is a change in the style (e.g., if SSA form changes,
  // or a different instruction sequence to do something gets used).
  //
  // History of values:
  //    1: start
  //    2: EOpAtomicCounterDecrement gets a post decrement, to map between GLSL -> SPIR-V
  //    3: change/correct barrier-instruction operands, to match memory model group decisions
  //    4: some deeper access chains: for dynamic vector component, and local Boolean component
  //    5: make OpArrayLength result type be an int with signedness of 0
  //    6: revert version 5 change, which makes a different (new) kind of incorrect code,
  //       versions 4 and 6 each generate OpArrayLength as it has long been done
  //    7: GLSL volatile keyword maps to both SPIR-V decorations Volatile and Coherent
  //    8: switch to new dead block eliminator; use OpUnreachable
  //    9: don't include opaque function parameters in OpEntryPoint global's operand list
  //   10: Generate OpFUnordNotEqual for != comparisons
  //   11: Make OpEmitMeshTasksEXT a terminal instruction
  int GetSpirvGeneratorVersion()
  {
      const int currentGeneratorVersion = 11;
      return currentGeneratorVersion;
  }
  // Write SPIR-V out to a binary file.
  //
  // 'spirv' is the sequence of words to write; each word is written as 4 bytes
  // in the host's native byte order. 'baseName' is the path of the file to
  // create (any existing content is replaced).
  //
  // Returns true only if the file was opened and every word was written;
  // on any failure an error is printed to stdout and false is returned.
  bool OutputSpvBin(const std::vector<unsigned int>& spirv, const char* baseName)
  {
      // The file format is a stream of 4-byte words, written straight from memory.
      static_assert(sizeof(unsigned int) == 4, "SPIR-V words must be 4 bytes wide");

      // A null path can neither be opened nor printed with %s.
      if (baseName == nullptr) {
          printf("ERROR: Failed to open file: (null)\n");
          return false;
      }

      std::ofstream out;
      out.open(baseName, std::ios::binary | std::ios::out);
      if (out.fail()) {
          printf("ERROR: Failed to open file: %s\n", baseName);
          return false;
      }

      // The words are contiguous, so a single write covers the whole module.
      if (! spirv.empty()) {
          out.write(reinterpret_cast<const char*>(spirv.data()),
                    static_cast<std::streamsize>(spirv.size() * sizeof(unsigned int)));
      }

      // close() flushes buffered data; a failed write or flush (e.g. disk full)
      // leaves the stream in a failed state, which must not be reported as success.
      out.close();
      if (out.fail()) {
          printf("ERROR: Failed to write file: %s\n", baseName);
          return false;
      }

      return true;
  }
  10759. // Write SPIR-V out to a text file with 32-bit hexadecimal words
  10760. bool OutputSpvHex(const std::vector<unsigned int>& spirv, const char* baseName, const char* varName)
  10761. {
  10762. std::ofstream out;
  10763. out.open(baseName, std::ios::binary | std::ios::out);
  10764. if (out.fail()) {
  10765. printf("ERROR: Failed to open file: %s\n", baseName);
  10766. return false;
  10767. }
  10768. out << "\t// " <<
  10769. GetSpirvGeneratorVersion() <<
  10770. GLSLANG_VERSION_MAJOR << "." << GLSLANG_VERSION_MINOR << "." << GLSLANG_VERSION_PATCH <<
  10771. GLSLANG_VERSION_FLAVOR << std::endl;
  10772. if (varName != nullptr) {
  10773. out << "\t #pragma once" << std::endl;
  10774. out << "const uint32_t " << varName << "[] = {" << std::endl;
  10775. }
  10776. const int WORDS_PER_LINE = 8;
  10777. for (int i = 0; i < (int)spirv.size(); i += WORDS_PER_LINE) {
  10778. out << "\t";
  10779. for (int j = 0; j < WORDS_PER_LINE && i + j < (int)spirv.size(); ++j) {
  10780. const unsigned int word = spirv[i + j];
  10781. out << "0x" << std::hex << std::setw(8) << std::setfill('0') << word;
  10782. if (i + j + 1 < (int)spirv.size()) {
  10783. out << ",";
  10784. }
  10785. }
  10786. out << std::endl;
  10787. }
  10788. if (varName != nullptr) {
  10789. out << "};";
  10790. out << std::endl;
  10791. }
  10792. out.close();
  10793. return true;
  10794. }
  10795. //
  10796. // Set up the glslang traversal
  10797. //
  10798. void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv, SpvOptions* options)
  10799. {
  10800. spv::SpvBuildLogger logger;
  10801. GlslangToSpv(intermediate, spirv, &logger, options);
  10802. }
  10803. void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv,
  10804. spv::SpvBuildLogger* logger, SpvOptions* options)
  10805. {
  10806. TIntermNode* root = intermediate.getTreeRoot();
  10807. if (root == nullptr)
  10808. return;
  10809. SpvOptions defaultOptions;
  10810. if (options == nullptr)
  10811. options = &defaultOptions;
  10812. GetThreadPoolAllocator().push();
  10813. TGlslangToSpvTraverser it(intermediate.getSpv().spv, &intermediate, logger, *options);
  10814. root->traverse(&it);
  10815. it.finishSpv(options->compileOnly);
  10816. it.dumpSpv(spirv);
  10817. #if ENABLE_OPT
  10818. // If from HLSL, run spirv-opt to "legalize" the SPIR-V for Vulkan
  10819. // eg. forward and remove memory writes of opaque types.
  10820. bool prelegalization = intermediate.getSource() == EShSourceHlsl;
  10821. if ((prelegalization || options->optimizeSize) && !options->disableOptimizer) {
  10822. SpirvToolsTransform(intermediate, spirv, logger, options);
  10823. prelegalization = false;
  10824. }
  10825. else if (options->stripDebugInfo) {
  10826. // Strip debug info even if optimization is disabled.
  10827. SpirvToolsStripDebugInfo(intermediate, spirv, logger);
  10828. }
  10829. if (options->validate)
  10830. SpirvToolsValidate(intermediate, spirv, logger, prelegalization);
  10831. if (options->disassemble)
  10832. SpirvToolsDisassemble(std::cout, spirv);
  10833. #endif
  10834. GetThreadPoolAllocator().pop();
  10835. }
  10836. } // end namespace glslang