GlslangToSpv.cpp 331 KB
  1. //
  2. // Copyright (C) 2014-2016 LunarG, Inc.
  3. // Copyright (C) 2015-2018 Google, Inc.
  4. // Copyright (C) 2017 ARM Limited.
  5. //
  6. // All rights reserved.
  7. //
  8. // Redistribution and use in source and binary forms, with or without
  9. // modification, are permitted provided that the following conditions
  10. // are met:
  11. //
  12. // Redistributions of source code must retain the above copyright
  13. // notice, this list of conditions and the following disclaimer.
  14. //
  15. // Redistributions in binary form must reproduce the above
  16. // copyright notice, this list of conditions and the following
  17. // disclaimer in the documentation and/or other materials provided
  18. // with the distribution.
  19. //
  20. // Neither the name of 3Dlabs Inc. Ltd. nor the names of its
  21. // contributors may be used to endorse or promote products derived
  22. // from this software without specific prior written permission.
  23. //
  24. // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  25. // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  26. // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
  27. // FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
  28. // COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
  29. // INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
  30. // BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  31. // LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  32. // CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  33. // LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
  34. // ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  35. // POSSIBILITY OF SUCH DAMAGE.
  36. //
  37. // Visit the nodes in the glslang intermediate tree representation to
  38. // translate them to SPIR-V.
  39. //
  40. #include "spirv.hpp"
  41. #include "GlslangToSpv.h"
  42. #include "SpvBuilder.h"
  43. namespace spv {
  44. #include "GLSL.std.450.h"
  45. #include "GLSL.ext.KHR.h"
  46. #include "GLSL.ext.EXT.h"
  47. #ifdef AMD_EXTENSIONS
  48. #include "GLSL.ext.AMD.h"
  49. #endif
  50. #include "GLSL.ext.NV.h"
  51. }
  52. // Glslang includes
  53. #include "../glslang/MachineIndependent/localintermediate.h"
  54. #include "../glslang/MachineIndependent/SymbolTable.h"
  55. #include "../glslang/Include/Common.h"
  56. #include "../glslang/Include/revision.h"
  57. #include <fstream>
  58. #include <iomanip>
  59. #include <list>
  60. #include <map>
  61. #include <stack>
  62. #include <string>
  63. #include <vector>
  64. namespace {
  65. namespace {
  66. class SpecConstantOpModeGuard {
  67. public:
  68. SpecConstantOpModeGuard(spv::Builder* builder)
  69. : builder_(builder) {
  70. previous_flag_ = builder->isInSpecConstCodeGenMode();
  71. }
  72. ~SpecConstantOpModeGuard() {
  73. previous_flag_ ? builder_->setToSpecConstCodeGenMode()
  74. : builder_->setToNormalCodeGenMode();
  75. }
  76. void turnOnSpecConstantOpMode() {
  77. builder_->setToSpecConstCodeGenMode();
  78. }
  79. private:
  80. spv::Builder* builder_;
  81. bool previous_flag_;
  82. };
  // Plain bundle of three SPIR-V decoration values. The create*Operation()
  // members of TGlslangToSpvTraverser take it by reference (OpDecorations&).
  // NOTE(review): the fields presumably hold the results of the
  // TranslatePrecisionDecoration / TranslateNoContractionDecoration /
  // TranslateNonUniformDecoration helpers -- confirm at the call sites.
  // Field order is part of the interface if callers use aggregate initialization.
  83. struct OpDecorations {
  84. spv::Decoration precision;
  85. spv::Decoration noContraction;
  86. spv::Decoration nonUniform;
  87. };
  88. } // namespace
  89. //
  90. // The main holder of information for translating glslang to SPIR-V.
  91. //
  92. // Derives from the AST walking base class.
  93. //
  94. class TGlslangToSpvTraverser : public glslang::TIntermTraverser {
  95. public:
  96. TGlslangToSpvTraverser(unsigned int spvVersion, const glslang::TIntermediate*, spv::SpvBuildLogger* logger,
  97. glslang::SpvOptions& options);
  98. virtual ~TGlslangToSpvTraverser() { }
  99. bool visitAggregate(glslang::TVisit, glslang::TIntermAggregate*);
  100. bool visitBinary(glslang::TVisit, glslang::TIntermBinary*);
  101. void visitConstantUnion(glslang::TIntermConstantUnion*);
  102. bool visitSelection(glslang::TVisit, glslang::TIntermSelection*);
  103. bool visitSwitch(glslang::TVisit, glslang::TIntermSwitch*);
  104. void visitSymbol(glslang::TIntermSymbol* symbol);
  105. bool visitUnary(glslang::TVisit, glslang::TIntermUnary*);
  106. bool visitLoop(glslang::TVisit, glslang::TIntermLoop*);
  107. bool visitBranch(glslang::TVisit visit, glslang::TIntermBranch*);
  108. void finishSpv();
  109. void dumpSpv(std::vector<unsigned int>& out);
  110. protected:
  111. TGlslangToSpvTraverser(TGlslangToSpvTraverser&);
  112. TGlslangToSpvTraverser& operator=(TGlslangToSpvTraverser&);
  113. spv::Decoration TranslateInterpolationDecoration(const glslang::TQualifier& qualifier);
  114. spv::Decoration TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier);
  115. spv::Decoration TranslateNonUniformDecoration(const glslang::TQualifier& qualifier);
  116. spv::Builder::AccessChain::CoherentFlags TranslateCoherent(const glslang::TType& type);
  117. spv::MemoryAccessMask TranslateMemoryAccess(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  118. spv::ImageOperandsMask TranslateImageOperands(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  119. spv::Scope TranslateMemoryScope(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
  120. spv::BuiltIn TranslateBuiltInDecoration(glslang::TBuiltInVariable, bool memberDeclaration);
  121. spv::ImageFormat TranslateImageFormat(const glslang::TType& type);
  122. spv::SelectionControlMask TranslateSelectionControl(const glslang::TIntermSelection&) const;
  123. spv::SelectionControlMask TranslateSwitchControl(const glslang::TIntermSwitch&) const;
  124. spv::LoopControlMask TranslateLoopControl(const glslang::TIntermLoop&, unsigned int& dependencyLength) const;
  125. spv::StorageClass TranslateStorageClass(const glslang::TType&);
  126. void addIndirectionIndexCapabilities(const glslang::TType& baseType, const glslang::TType& indexType);
  127. spv::Id createSpvVariable(const glslang::TIntermSymbol*);
  128. spv::Id getSampledType(const glslang::TSampler&);
  129. spv::Id getInvertedSwizzleType(const glslang::TIntermTyped&);
  130. spv::Id createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped&, spv::Id parentResult);
  131. void convertSwizzle(const glslang::TIntermAggregate&, std::vector<unsigned>& swizzle);
  132. spv::Id convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly = false);
  133. spv::Id convertGlslangToSpvType(const glslang::TType& type, glslang::TLayoutPacking, const glslang::TQualifier&,
  134. bool lastBufferBlockMember, bool forwardReferenceOnly = false);
  135. bool filterMember(const glslang::TType& member);
  136. spv::Id convertGlslangStructToSpvType(const glslang::TType&, const glslang::TTypeList* glslangStruct,
  137. glslang::TLayoutPacking, const glslang::TQualifier&);
  138. void decorateStructType(const glslang::TType&, const glslang::TTypeList* glslangStruct, glslang::TLayoutPacking,
  139. const glslang::TQualifier&, spv::Id);
  140. spv::Id makeArraySizeId(const glslang::TArraySizes&, int dim);
  141. spv::Id accessChainLoad(const glslang::TType& type);
  142. void accessChainStore(const glslang::TType& type, spv::Id rvalue);
  143. void multiTypeStore(const glslang::TType&, spv::Id rValue);
  144. glslang::TLayoutPacking getExplicitLayout(const glslang::TType& type) const;
  145. int getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  146. int getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  147. void updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType, int& currentOffset,
  148. int& nextOffset, glslang::TLayoutPacking, glslang::TLayoutMatrix);
  149. void declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember);
  150. bool isShaderEntryPoint(const glslang::TIntermAggregate* node);
  151. bool writableParam(glslang::TStorageQualifier) const;
  152. bool originalParam(glslang::TStorageQualifier, const glslang::TType&, bool implicitThisParam);
  153. void makeFunctions(const glslang::TIntermSequence&);
  154. void makeGlobalInitializers(const glslang::TIntermSequence&);
  155. void visitFunctions(const glslang::TIntermSequence&);
  156. void handleFunctionEntry(const glslang::TIntermAggregate* node);
  157. void translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments);
  158. void translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments);
  159. spv::Id createImageTextureFunctionCall(glslang::TIntermOperator* node);
  160. spv::Id handleUserFunctionCall(const glslang::TIntermAggregate*);
  161. spv::Id createBinaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right,
  162. glslang::TBasicType typeProxy, bool reduceComparison = true);
  163. spv::Id createBinaryMatrixOperation(spv::Op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right);
  164. spv::Id createUnaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id operand,
  165. glslang::TBasicType typeProxy);
  166. spv::Id createUnaryMatrixOperation(spv::Op op, OpDecorations&, spv::Id typeId, spv::Id operand,
  167. glslang::TBasicType typeProxy);
  168. spv::Id createConversion(glslang::TOperator op, OpDecorations&, spv::Id destTypeId, spv::Id operand,
  169. glslang::TBasicType typeProxy);
  170. spv::Id createIntWidthConversion(glslang::TOperator op, spv::Id operand, int vectorSize);
  171. spv::Id makeSmearedConstant(spv::Id constant, int vectorSize);
  172. spv::Id createAtomicOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy);
  173. spv::Id createInvocationsOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy);
  174. spv::Id CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation, spv::Id typeId, std::vector<spv::Id>& operands);
  175. spv::Id createSubgroupOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy);
  176. spv::Id createMiscOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy);
  177. spv::Id createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId);
  178. spv::Id getSymbolId(const glslang::TIntermSymbol* node);
  179. #ifdef NV_EXTENSIONS
  180. void addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier & qualifier);
  181. #endif
  182. spv::Id createSpvConstant(const glslang::TIntermTyped&);
  183. spv::Id createSpvConstantFromConstUnionArray(const glslang::TType& type, const glslang::TConstUnionArray&, int& nextConst, bool specConstant);
  184. bool isTrivialLeaf(const glslang::TIntermTyped* node);
  185. bool isTrivial(const glslang::TIntermTyped* node);
  186. spv::Id createShortCircuit(glslang::TOperator, glslang::TIntermTyped& left, glslang::TIntermTyped& right);
  187. #ifdef AMD_EXTENSIONS
  188. spv::Id getExtBuiltins(const char* name);
  189. #endif
  190. void addPre13Extension(const char* ext)
  191. {
  192. if (builder.getSpvVersion() < glslang::EShTargetSpv_1_3)
  193. builder.addExtension(ext);
  194. }
  195. glslang::SpvOptions& options;
  196. spv::Function* shaderEntry;
  197. spv::Function* currentFunction;
  198. spv::Instruction* entryPoint;
  199. int sequenceDepth;
  200. spv::SpvBuildLogger* logger;
  201. // There is a 1:1 mapping between a spv builder and a module; this is thread safe
  202. spv::Builder builder;
  203. bool inEntryPoint;
  204. bool entryPointTerminated;
  205. bool linkageOnly; // true when visiting the set of objects in the AST present only for establishing interface, whether or not they were statically used
  206. std::set<spv::Id> iOSet; // all input/output variables from either static use or declaration of interface
  207. const glslang::TIntermediate* glslangIntermediate;
  208. spv::Id stdBuiltins;
  209. std::unordered_map<const char*, spv::Id> extBuiltinMap;
  210. std::unordered_map<int, spv::Id> symbolValues;
  211. std::unordered_set<int> rValueParameters; // set of formal function parameters passed as rValues, rather than a pointer
  212. std::unordered_map<std::string, spv::Function*> functionMap;
  213. std::unordered_map<const glslang::TTypeList*, spv::Id> structMap[glslang::ElpCount][glslang::ElmCount];
  214. // for mapping glslang block indices to spv indices (e.g., due to hidden members):
  215. std::unordered_map<const glslang::TTypeList*, std::vector<int> > memberRemapper;
  216. std::stack<bool> breakForLoop; // false means break for switch
  217. std::unordered_map<std::string, const glslang::TIntermSymbol*> counterOriginator;
  218. // Map pointee types for EbtReference to their forward pointers
  219. std::map<const glslang::TType *, spv::Id> forwardPointers;
  220. };
  221. //
  222. // Helper functions for translating glslang representations to SPIR-V enumerants.
  223. //
  224. // Translate glslang profile to SPIR-V source language.
  225. spv::SourceLanguage TranslateSourceLanguage(glslang::EShSource source, EProfile profile)
  226. {
  227. switch (source) {
  228. case glslang::EShSourceGlsl:
  229. switch (profile) {
  230. case ENoProfile:
  231. case ECoreProfile:
  232. case ECompatibilityProfile:
  233. return spv::SourceLanguageGLSL;
  234. case EEsProfile:
  235. return spv::SourceLanguageESSL;
  236. default:
  237. return spv::SourceLanguageUnknown;
  238. }
  239. case glslang::EShSourceHlsl:
  240. return spv::SourceLanguageHLSL;
  241. default:
  242. return spv::SourceLanguageUnknown;
  243. }
  244. }
  245. // Translate glslang language (stage) to SPIR-V execution model.
  246. spv::ExecutionModel TranslateExecutionModel(EShLanguage stage)
  247. {
  248. switch (stage) {
  249. case EShLangVertex: return spv::ExecutionModelVertex;
  250. case EShLangTessControl: return spv::ExecutionModelTessellationControl;
  251. case EShLangTessEvaluation: return spv::ExecutionModelTessellationEvaluation;
  252. case EShLangGeometry: return spv::ExecutionModelGeometry;
  253. case EShLangFragment: return spv::ExecutionModelFragment;
  254. case EShLangCompute: return spv::ExecutionModelGLCompute;
  255. #ifdef NV_EXTENSIONS
  256. case EShLangRayGenNV: return spv::ExecutionModelRayGenerationNV;
  257. case EShLangIntersectNV: return spv::ExecutionModelIntersectionNV;
  258. case EShLangAnyHitNV: return spv::ExecutionModelAnyHitNV;
  259. case EShLangClosestHitNV: return spv::ExecutionModelClosestHitNV;
  260. case EShLangMissNV: return spv::ExecutionModelMissNV;
  261. case EShLangCallableNV: return spv::ExecutionModelCallableNV;
  262. case EShLangTaskNV: return spv::ExecutionModelTaskNV;
  263. case EShLangMeshNV: return spv::ExecutionModelMeshNV;
  264. #endif
  265. default:
  266. assert(0);
  267. return spv::ExecutionModelFragment;
  268. }
  269. }
  270. // Translate glslang sampler type to SPIR-V dimensionality.
  271. spv::Dim TranslateDimensionality(const glslang::TSampler& sampler)
  272. {
  273. switch (sampler.dim) {
  274. case glslang::Esd1D: return spv::Dim1D;
  275. case glslang::Esd2D: return spv::Dim2D;
  276. case glslang::Esd3D: return spv::Dim3D;
  277. case glslang::EsdCube: return spv::DimCube;
  278. case glslang::EsdRect: return spv::DimRect;
  279. case glslang::EsdBuffer: return spv::DimBuffer;
  280. case glslang::EsdSubpass: return spv::DimSubpassData;
  281. default:
  282. assert(0);
  283. return spv::Dim2D;
  284. }
  285. }
  286. // Translate glslang precision to SPIR-V precision decorations.
  287. spv::Decoration TranslatePrecisionDecoration(glslang::TPrecisionQualifier glslangPrecision)
  288. {
  289. switch (glslangPrecision) {
  290. case glslang::EpqLow: return spv::DecorationRelaxedPrecision;
  291. case glslang::EpqMedium: return spv::DecorationRelaxedPrecision;
  292. default:
  293. return spv::NoPrecision;
  294. }
  295. }
  296. // Translate glslang type to SPIR-V precision decorations.
  297. spv::Decoration TranslatePrecisionDecoration(const glslang::TType& type)
  298. {
  299. return TranslatePrecisionDecoration(type.getQualifier().precision);
  300. }
  301. // Translate glslang type to SPIR-V block decorations.
  302. spv::Decoration TranslateBlockDecoration(const glslang::TType& type, bool useStorageBuffer)
  303. {
  304. if (type.getBasicType() == glslang::EbtBlock) {
  305. switch (type.getQualifier().storage) {
  306. case glslang::EvqUniform: return spv::DecorationBlock;
  307. case glslang::EvqBuffer: return useStorageBuffer ? spv::DecorationBlock : spv::DecorationBufferBlock;
  308. case glslang::EvqVaryingIn: return spv::DecorationBlock;
  309. case glslang::EvqVaryingOut: return spv::DecorationBlock;
  310. #ifdef NV_EXTENSIONS
  311. case glslang::EvqPayloadNV: return spv::DecorationBlock;
  312. case glslang::EvqPayloadInNV: return spv::DecorationBlock;
  313. case glslang::EvqHitAttrNV: return spv::DecorationBlock;
  314. case glslang::EvqCallableDataNV: return spv::DecorationBlock;
  315. case glslang::EvqCallableDataInNV: return spv::DecorationBlock;
  316. #endif
  317. default:
  318. assert(0);
  319. break;
  320. }
  321. }
  322. return spv::DecorationMax;
  323. }
  324. // Translate glslang type to SPIR-V memory decorations.
  325. void TranslateMemoryDecoration(const glslang::TQualifier& qualifier, std::vector<spv::Decoration>& memory, bool useVulkanMemoryModel)
  326. {
  327. if (!useVulkanMemoryModel) {
  328. if (qualifier.coherent)
  329. memory.push_back(spv::DecorationCoherent);
  330. if (qualifier.volatil) {
  331. memory.push_back(spv::DecorationVolatile);
  332. memory.push_back(spv::DecorationCoherent);
  333. }
  334. }
  335. if (qualifier.restrict)
  336. memory.push_back(spv::DecorationRestrict);
  337. if (qualifier.readonly)
  338. memory.push_back(spv::DecorationNonWritable);
  339. if (qualifier.writeonly)
  340. memory.push_back(spv::DecorationNonReadable);
  341. }
  342. // Translate glslang type to SPIR-V layout decorations.
  343. spv::Decoration TranslateLayoutDecoration(const glslang::TType& type, glslang::TLayoutMatrix matrixLayout)
  344. {
  345. if (type.isMatrix()) {
  346. switch (matrixLayout) {
  347. case glslang::ElmRowMajor:
  348. return spv::DecorationRowMajor;
  349. case glslang::ElmColumnMajor:
  350. return spv::DecorationColMajor;
  351. default:
  352. // opaque layouts don't need a majorness
  353. return spv::DecorationMax;
  354. }
  355. } else {
  356. switch (type.getBasicType()) {
  357. default:
  358. return spv::DecorationMax;
  359. break;
  360. case glslang::EbtBlock:
  361. switch (type.getQualifier().storage) {
  362. case glslang::EvqUniform:
  363. case glslang::EvqBuffer:
  364. switch (type.getQualifier().layoutPacking) {
  365. case glslang::ElpShared: return spv::DecorationGLSLShared;
  366. case glslang::ElpPacked: return spv::DecorationGLSLPacked;
  367. default:
  368. return spv::DecorationMax;
  369. }
  370. case glslang::EvqVaryingIn:
  371. case glslang::EvqVaryingOut:
  372. if (type.getQualifier().isTaskMemory()) {
  373. switch (type.getQualifier().layoutPacking) {
  374. case glslang::ElpShared: return spv::DecorationGLSLShared;
  375. case glslang::ElpPacked: return spv::DecorationGLSLPacked;
  376. default: break;
  377. }
  378. } else {
  379. assert(type.getQualifier().layoutPacking == glslang::ElpNone);
  380. }
  381. return spv::DecorationMax;
  382. #ifdef NV_EXTENSIONS
  383. case glslang::EvqPayloadNV:
  384. case glslang::EvqPayloadInNV:
  385. case glslang::EvqHitAttrNV:
  386. case glslang::EvqCallableDataNV:
  387. case glslang::EvqCallableDataInNV:
  388. return spv::DecorationMax;
  389. #endif
  390. default:
  391. assert(0);
  392. return spv::DecorationMax;
  393. }
  394. }
  395. }
  396. }
  397. // Translate glslang type to SPIR-V interpolation decorations.
  398. // Returns spv::DecorationMax when no decoration
  399. // should be applied.
  400. spv::Decoration TGlslangToSpvTraverser::TranslateInterpolationDecoration(const glslang::TQualifier& qualifier)
  401. {
  402. if (qualifier.smooth)
  403. // Smooth decoration doesn't exist in SPIR-V 1.0
  404. return spv::DecorationMax;
  405. else if (qualifier.nopersp)
  406. return spv::DecorationNoPerspective;
  407. else if (qualifier.flat)
  408. return spv::DecorationFlat;
  409. #ifdef AMD_EXTENSIONS
  410. else if (qualifier.explicitInterp) {
  411. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  412. return spv::DecorationExplicitInterpAMD;
  413. }
  414. #endif
  415. else
  416. return spv::DecorationMax;
  417. }
  418. // Translate glslang type to SPIR-V auxiliary storage decorations.
  419. // Returns spv::DecorationMax when no decoration
  420. // should be applied.
  421. spv::Decoration TGlslangToSpvTraverser::TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier)
  422. {
  423. if (qualifier.patch)
  424. return spv::DecorationPatch;
  425. else if (qualifier.centroid)
  426. return spv::DecorationCentroid;
  427. else if (qualifier.sample) {
  428. builder.addCapability(spv::CapabilitySampleRateShading);
  429. return spv::DecorationSample;
  430. } else
  431. return spv::DecorationMax;
  432. }
  433. // If glslang type is invariant, return SPIR-V invariant decoration.
  434. spv::Decoration TranslateInvariantDecoration(const glslang::TQualifier& qualifier)
  435. {
  436. if (qualifier.invariant)
  437. return spv::DecorationInvariant;
  438. else
  439. return spv::DecorationMax;
  440. }
  441. // If glslang type is noContraction, return SPIR-V NoContraction decoration.
  442. spv::Decoration TranslateNoContractionDecoration(const glslang::TQualifier& qualifier)
  443. {
  444. if (qualifier.noContraction)
  445. return spv::DecorationNoContraction;
  446. else
  447. return spv::DecorationMax;
  448. }
  449. // If glslang type is nonUniform, return SPIR-V NonUniform decoration.
  450. spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(const glslang::TQualifier& qualifier)
  451. {
  452. if (qualifier.isNonUniform()) {
  453. builder.addExtension("SPV_EXT_descriptor_indexing");
  454. builder.addCapability(spv::CapabilityShaderNonUniformEXT);
  455. return spv::DecorationNonUniformEXT;
  456. } else
  457. return spv::DecorationMax;
  458. }
  459. spv::MemoryAccessMask TGlslangToSpvTraverser::TranslateMemoryAccess(const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  460. {
  461. if (!glslangIntermediate->usingVulkanMemoryModel() || coherentFlags.isImage) {
  462. return spv::MemoryAccessMaskNone;
  463. }
  464. spv::MemoryAccessMask mask = spv::MemoryAccessMaskNone;
  465. if (coherentFlags.volatil ||
  466. coherentFlags.coherent ||
  467. coherentFlags.devicecoherent ||
  468. coherentFlags.queuefamilycoherent ||
  469. coherentFlags.workgroupcoherent ||
  470. coherentFlags.subgroupcoherent) {
  471. mask = mask | spv::MemoryAccessMakePointerAvailableKHRMask |
  472. spv::MemoryAccessMakePointerVisibleKHRMask;
  473. }
  474. if (coherentFlags.nonprivate) {
  475. mask = mask | spv::MemoryAccessNonPrivatePointerKHRMask;
  476. }
  477. if (coherentFlags.volatil) {
  478. mask = mask | spv::MemoryAccessVolatileMask;
  479. }
  480. if (mask != spv::MemoryAccessMaskNone) {
  481. builder.addCapability(spv::CapabilityVulkanMemoryModelKHR);
  482. }
  483. return mask;
  484. }
  485. spv::ImageOperandsMask TGlslangToSpvTraverser::TranslateImageOperands(const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  486. {
  487. if (!glslangIntermediate->usingVulkanMemoryModel()) {
  488. return spv::ImageOperandsMaskNone;
  489. }
  490. spv::ImageOperandsMask mask = spv::ImageOperandsMaskNone;
  491. if (coherentFlags.volatil ||
  492. coherentFlags.coherent ||
  493. coherentFlags.devicecoherent ||
  494. coherentFlags.queuefamilycoherent ||
  495. coherentFlags.workgroupcoherent ||
  496. coherentFlags.subgroupcoherent) {
  497. mask = mask | spv::ImageOperandsMakeTexelAvailableKHRMask |
  498. spv::ImageOperandsMakeTexelVisibleKHRMask;
  499. }
  500. if (coherentFlags.nonprivate) {
  501. mask = mask | spv::ImageOperandsNonPrivateTexelKHRMask;
  502. }
  503. if (coherentFlags.volatil) {
  504. mask = mask | spv::ImageOperandsVolatileTexelKHRMask;
  505. }
  506. if (mask != spv::ImageOperandsMaskNone) {
  507. builder.addCapability(spv::CapabilityVulkanMemoryModelKHR);
  508. }
  509. return mask;
  510. }
  511. spv::Builder::AccessChain::CoherentFlags TGlslangToSpvTraverser::TranslateCoherent(const glslang::TType& type)
  512. {
  513. spv::Builder::AccessChain::CoherentFlags flags;
  514. flags.coherent = type.getQualifier().coherent;
  515. flags.devicecoherent = type.getQualifier().devicecoherent;
  516. flags.queuefamilycoherent = type.getQualifier().queuefamilycoherent;
  517. // shared variables are implicitly workgroupcoherent in GLSL.
  518. flags.workgroupcoherent = type.getQualifier().workgroupcoherent ||
  519. type.getQualifier().storage == glslang::EvqShared;
  520. flags.subgroupcoherent = type.getQualifier().subgroupcoherent;
  521. flags.volatil = type.getQualifier().volatil;
  522. // *coherent variables are implicitly nonprivate in GLSL
  523. flags.nonprivate = type.getQualifier().nonprivate ||
  524. flags.subgroupcoherent ||
  525. flags.workgroupcoherent ||
  526. flags.queuefamilycoherent ||
  527. flags.devicecoherent ||
  528. flags.coherent ||
  529. flags.volatil;
  530. flags.isImage = type.getBasicType() == glslang::EbtSampler;
  531. return flags;
  532. }
  533. spv::Scope TGlslangToSpvTraverser::TranslateMemoryScope(const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
  534. {
  535. spv::Scope scope;
  536. if (coherentFlags.volatil || coherentFlags.coherent) {
  537. // coherent defaults to Device scope in the old model, QueueFamilyKHR scope in the new model
  538. scope = glslangIntermediate->usingVulkanMemoryModel() ? spv::ScopeQueueFamilyKHR : spv::ScopeDevice;
  539. } else if (coherentFlags.devicecoherent) {
  540. scope = spv::ScopeDevice;
  541. } else if (coherentFlags.queuefamilycoherent) {
  542. scope = spv::ScopeQueueFamilyKHR;
  543. } else if (coherentFlags.workgroupcoherent) {
  544. scope = spv::ScopeWorkgroup;
  545. } else if (coherentFlags.subgroupcoherent) {
  546. scope = spv::ScopeSubgroup;
  547. } else {
  548. scope = spv::ScopeMax;
  549. }
  550. if (glslangIntermediate->usingVulkanMemoryModel() && scope == spv::ScopeDevice) {
  551. builder.addCapability(spv::CapabilityVulkanMemoryModelDeviceScopeKHR);
  552. }
  553. return scope;
  554. }
  555. // Translate a glslang built-in variable to a SPIR-V built in decoration. Also generate
  556. // associated capabilities when required. For some built-in variables, a capability
  557. // is generated only when using the variable in an executable instruction, but not when
  558. // just declaring a struct member variable with it. This is true for PointSize,
  559. // ClipDistance, and CullDistance.
  560. spv::BuiltIn TGlslangToSpvTraverser::TranslateBuiltInDecoration(glslang::TBuiltInVariable builtIn, bool memberDeclaration)
  561. {
  562. switch (builtIn) {
  563. case glslang::EbvPointSize:
  564. // Defer adding the capability until the built-in is actually used.
  565. if (! memberDeclaration) {
  566. switch (glslangIntermediate->getStage()) {
  567. case EShLangGeometry:
  568. builder.addCapability(spv::CapabilityGeometryPointSize);
  569. break;
  570. case EShLangTessControl:
  571. case EShLangTessEvaluation:
  572. builder.addCapability(spv::CapabilityTessellationPointSize);
  573. break;
  574. default:
  575. break;
  576. }
  577. }
  578. return spv::BuiltInPointSize;
  579. // These *Distance capabilities logically belong here, but if the member is declared and
  580. // then never used, consumers of SPIR-V prefer the capability not be declared.
  581. // They are now generated when used, rather than here when declared.
  582. // Potentially, the specification should be more clear what the minimum
  583. // use needed is to trigger the capability.
  584. //
  585. case glslang::EbvClipDistance:
  586. if (!memberDeclaration)
  587. builder.addCapability(spv::CapabilityClipDistance);
  588. return spv::BuiltInClipDistance;
  589. case glslang::EbvCullDistance:
  590. if (!memberDeclaration)
  591. builder.addCapability(spv::CapabilityCullDistance);
  592. return spv::BuiltInCullDistance;
  593. case glslang::EbvViewportIndex:
  594. builder.addCapability(spv::CapabilityMultiViewport);
  595. if (glslangIntermediate->getStage() == EShLangVertex ||
  596. glslangIntermediate->getStage() == EShLangTessControl ||
  597. glslangIntermediate->getStage() == EShLangTessEvaluation) {
  598. builder.addExtension(spv::E_SPV_EXT_shader_viewport_index_layer);
  599. builder.addCapability(spv::CapabilityShaderViewportIndexLayerEXT);
  600. }
  601. return spv::BuiltInViewportIndex;
  602. case glslang::EbvSampleId:
  603. builder.addCapability(spv::CapabilitySampleRateShading);
  604. return spv::BuiltInSampleId;
  605. case glslang::EbvSamplePosition:
  606. builder.addCapability(spv::CapabilitySampleRateShading);
  607. return spv::BuiltInSamplePosition;
  608. case glslang::EbvSampleMask:
  609. return spv::BuiltInSampleMask;
  610. case glslang::EbvLayer:
  611. #ifdef NV_EXTENSIONS
  612. if (glslangIntermediate->getStage() == EShLangMeshNV) {
  613. return spv::BuiltInLayer;
  614. }
  615. #endif
  616. builder.addCapability(spv::CapabilityGeometry);
  617. if (glslangIntermediate->getStage() == EShLangVertex ||
  618. glslangIntermediate->getStage() == EShLangTessControl ||
  619. glslangIntermediate->getStage() == EShLangTessEvaluation) {
  620. builder.addExtension(spv::E_SPV_EXT_shader_viewport_index_layer);
  621. builder.addCapability(spv::CapabilityShaderViewportIndexLayerEXT);
  622. }
  623. return spv::BuiltInLayer;
  624. case glslang::EbvPosition: return spv::BuiltInPosition;
  625. case glslang::EbvVertexId: return spv::BuiltInVertexId;
  626. case glslang::EbvInstanceId: return spv::BuiltInInstanceId;
  627. case glslang::EbvVertexIndex: return spv::BuiltInVertexIndex;
  628. case glslang::EbvInstanceIndex: return spv::BuiltInInstanceIndex;
  629. case glslang::EbvBaseVertex:
  630. addPre13Extension(spv::E_SPV_KHR_shader_draw_parameters);
  631. builder.addCapability(spv::CapabilityDrawParameters);
  632. return spv::BuiltInBaseVertex;
  633. case glslang::EbvBaseInstance:
  634. addPre13Extension(spv::E_SPV_KHR_shader_draw_parameters);
  635. builder.addCapability(spv::CapabilityDrawParameters);
  636. return spv::BuiltInBaseInstance;
  637. case glslang::EbvDrawId:
  638. addPre13Extension(spv::E_SPV_KHR_shader_draw_parameters);
  639. builder.addCapability(spv::CapabilityDrawParameters);
  640. return spv::BuiltInDrawIndex;
  641. case glslang::EbvPrimitiveId:
  642. if (glslangIntermediate->getStage() == EShLangFragment)
  643. builder.addCapability(spv::CapabilityGeometry);
  644. return spv::BuiltInPrimitiveId;
  645. case glslang::EbvFragStencilRef:
  646. builder.addExtension(spv::E_SPV_EXT_shader_stencil_export);
  647. builder.addCapability(spv::CapabilityStencilExportEXT);
  648. return spv::BuiltInFragStencilRefEXT;
  649. case glslang::EbvInvocationId: return spv::BuiltInInvocationId;
  650. case glslang::EbvTessLevelInner: return spv::BuiltInTessLevelInner;
  651. case glslang::EbvTessLevelOuter: return spv::BuiltInTessLevelOuter;
  652. case glslang::EbvTessCoord: return spv::BuiltInTessCoord;
  653. case glslang::EbvPatchVertices: return spv::BuiltInPatchVertices;
  654. case glslang::EbvFragCoord: return spv::BuiltInFragCoord;
  655. case glslang::EbvPointCoord: return spv::BuiltInPointCoord;
  656. case glslang::EbvFace: return spv::BuiltInFrontFacing;
  657. case glslang::EbvFragDepth: return spv::BuiltInFragDepth;
  658. case glslang::EbvHelperInvocation: return spv::BuiltInHelperInvocation;
  659. case glslang::EbvNumWorkGroups: return spv::BuiltInNumWorkgroups;
  660. case glslang::EbvWorkGroupSize: return spv::BuiltInWorkgroupSize;
  661. case glslang::EbvWorkGroupId: return spv::BuiltInWorkgroupId;
  662. case glslang::EbvLocalInvocationId: return spv::BuiltInLocalInvocationId;
  663. case glslang::EbvLocalInvocationIndex: return spv::BuiltInLocalInvocationIndex;
  664. case glslang::EbvGlobalInvocationId: return spv::BuiltInGlobalInvocationId;
  665. case glslang::EbvSubGroupSize:
  666. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  667. builder.addCapability(spv::CapabilitySubgroupBallotKHR);
  668. return spv::BuiltInSubgroupSize;
  669. case glslang::EbvSubGroupInvocation:
  670. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  671. builder.addCapability(spv::CapabilitySubgroupBallotKHR);
  672. return spv::BuiltInSubgroupLocalInvocationId;
  673. case glslang::EbvSubGroupEqMask:
  674. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  675. builder.addCapability(spv::CapabilitySubgroupBallotKHR);
  676. return spv::BuiltInSubgroupEqMaskKHR;
  677. case glslang::EbvSubGroupGeMask:
  678. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  679. builder.addCapability(spv::CapabilitySubgroupBallotKHR);
  680. return spv::BuiltInSubgroupGeMaskKHR;
  681. case glslang::EbvSubGroupGtMask:
  682. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  683. builder.addCapability(spv::CapabilitySubgroupBallotKHR);
  684. return spv::BuiltInSubgroupGtMaskKHR;
  685. case glslang::EbvSubGroupLeMask:
  686. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  687. builder.addCapability(spv::CapabilitySubgroupBallotKHR);
  688. return spv::BuiltInSubgroupLeMaskKHR;
  689. case glslang::EbvSubGroupLtMask:
  690. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  691. builder.addCapability(spv::CapabilitySubgroupBallotKHR);
  692. return spv::BuiltInSubgroupLtMaskKHR;
  693. case glslang::EbvNumSubgroups:
  694. builder.addCapability(spv::CapabilityGroupNonUniform);
  695. return spv::BuiltInNumSubgroups;
  696. case glslang::EbvSubgroupID:
  697. builder.addCapability(spv::CapabilityGroupNonUniform);
  698. return spv::BuiltInSubgroupId;
  699. case glslang::EbvSubgroupSize2:
  700. builder.addCapability(spv::CapabilityGroupNonUniform);
  701. return spv::BuiltInSubgroupSize;
  702. case glslang::EbvSubgroupInvocation2:
  703. builder.addCapability(spv::CapabilityGroupNonUniform);
  704. return spv::BuiltInSubgroupLocalInvocationId;
  705. case glslang::EbvSubgroupEqMask2:
  706. builder.addCapability(spv::CapabilityGroupNonUniform);
  707. builder.addCapability(spv::CapabilityGroupNonUniformBallot);
  708. return spv::BuiltInSubgroupEqMask;
  709. case glslang::EbvSubgroupGeMask2:
  710. builder.addCapability(spv::CapabilityGroupNonUniform);
  711. builder.addCapability(spv::CapabilityGroupNonUniformBallot);
  712. return spv::BuiltInSubgroupGeMask;
  713. case glslang::EbvSubgroupGtMask2:
  714. builder.addCapability(spv::CapabilityGroupNonUniform);
  715. builder.addCapability(spv::CapabilityGroupNonUniformBallot);
  716. return spv::BuiltInSubgroupGtMask;
  717. case glslang::EbvSubgroupLeMask2:
  718. builder.addCapability(spv::CapabilityGroupNonUniform);
  719. builder.addCapability(spv::CapabilityGroupNonUniformBallot);
  720. return spv::BuiltInSubgroupLeMask;
  721. case glslang::EbvSubgroupLtMask2:
  722. builder.addCapability(spv::CapabilityGroupNonUniform);
  723. builder.addCapability(spv::CapabilityGroupNonUniformBallot);
  724. return spv::BuiltInSubgroupLtMask;
  725. #ifdef AMD_EXTENSIONS
  726. case glslang::EbvBaryCoordNoPersp:
  727. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  728. return spv::BuiltInBaryCoordNoPerspAMD;
  729. case glslang::EbvBaryCoordNoPerspCentroid:
  730. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  731. return spv::BuiltInBaryCoordNoPerspCentroidAMD;
  732. case glslang::EbvBaryCoordNoPerspSample:
  733. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  734. return spv::BuiltInBaryCoordNoPerspSampleAMD;
  735. case glslang::EbvBaryCoordSmooth:
  736. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  737. return spv::BuiltInBaryCoordSmoothAMD;
  738. case glslang::EbvBaryCoordSmoothCentroid:
  739. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  740. return spv::BuiltInBaryCoordSmoothCentroidAMD;
  741. case glslang::EbvBaryCoordSmoothSample:
  742. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  743. return spv::BuiltInBaryCoordSmoothSampleAMD;
  744. case glslang::EbvBaryCoordPullModel:
  745. builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  746. return spv::BuiltInBaryCoordPullModelAMD;
  747. #endif
  748. case glslang::EbvDeviceIndex:
  749. addPre13Extension(spv::E_SPV_KHR_device_group);
  750. builder.addCapability(spv::CapabilityDeviceGroup);
  751. return spv::BuiltInDeviceIndex;
  752. case glslang::EbvViewIndex:
  753. addPre13Extension(spv::E_SPV_KHR_multiview);
  754. builder.addCapability(spv::CapabilityMultiView);
  755. return spv::BuiltInViewIndex;
  756. case glslang::EbvFragSizeEXT:
  757. builder.addExtension(spv::E_SPV_EXT_fragment_invocation_density);
  758. builder.addCapability(spv::CapabilityFragmentDensityEXT);
  759. return spv::BuiltInFragSizeEXT;
  760. case glslang::EbvFragInvocationCountEXT:
  761. builder.addExtension(spv::E_SPV_EXT_fragment_invocation_density);
  762. builder.addCapability(spv::CapabilityFragmentDensityEXT);
  763. return spv::BuiltInFragInvocationCountEXT;
  764. #ifdef NV_EXTENSIONS
  765. case glslang::EbvViewportMaskNV:
  766. if (!memberDeclaration) {
  767. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  768. builder.addCapability(spv::CapabilityShaderViewportMaskNV);
  769. }
  770. return spv::BuiltInViewportMaskNV;
  771. case glslang::EbvSecondaryPositionNV:
  772. if (!memberDeclaration) {
  773. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  774. builder.addCapability(spv::CapabilityShaderStereoViewNV);
  775. }
  776. return spv::BuiltInSecondaryPositionNV;
  777. case glslang::EbvSecondaryViewportMaskNV:
  778. if (!memberDeclaration) {
  779. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  780. builder.addCapability(spv::CapabilityShaderStereoViewNV);
  781. }
  782. return spv::BuiltInSecondaryViewportMaskNV;
  783. case glslang::EbvPositionPerViewNV:
  784. if (!memberDeclaration) {
  785. builder.addExtension(spv::E_SPV_NVX_multiview_per_view_attributes);
  786. builder.addCapability(spv::CapabilityPerViewAttributesNV);
  787. }
  788. return spv::BuiltInPositionPerViewNV;
  789. case glslang::EbvViewportMaskPerViewNV:
  790. if (!memberDeclaration) {
  791. builder.addExtension(spv::E_SPV_NVX_multiview_per_view_attributes);
  792. builder.addCapability(spv::CapabilityPerViewAttributesNV);
  793. }
  794. return spv::BuiltInViewportMaskPerViewNV;
  795. case glslang::EbvFragFullyCoveredNV:
  796. builder.addExtension(spv::E_SPV_EXT_fragment_fully_covered);
  797. builder.addCapability(spv::CapabilityFragmentFullyCoveredEXT);
  798. return spv::BuiltInFullyCoveredEXT;
  799. case glslang::EbvFragmentSizeNV:
  800. builder.addExtension(spv::E_SPV_NV_shading_rate);
  801. builder.addCapability(spv::CapabilityShadingRateNV);
  802. return spv::BuiltInFragmentSizeNV;
  803. case glslang::EbvInvocationsPerPixelNV:
  804. builder.addExtension(spv::E_SPV_NV_shading_rate);
  805. builder.addCapability(spv::CapabilityShadingRateNV);
  806. return spv::BuiltInInvocationsPerPixelNV;
  807. // raytracing
  808. case glslang::EbvLaunchIdNV:
  809. return spv::BuiltInLaunchIdNV;
  810. case glslang::EbvLaunchSizeNV:
  811. return spv::BuiltInLaunchSizeNV;
  812. case glslang::EbvWorldRayOriginNV:
  813. return spv::BuiltInWorldRayOriginNV;
  814. case glslang::EbvWorldRayDirectionNV:
  815. return spv::BuiltInWorldRayDirectionNV;
  816. case glslang::EbvObjectRayOriginNV:
  817. return spv::BuiltInObjectRayOriginNV;
  818. case glslang::EbvObjectRayDirectionNV:
  819. return spv::BuiltInObjectRayDirectionNV;
  820. case glslang::EbvRayTminNV:
  821. return spv::BuiltInRayTminNV;
  822. case glslang::EbvRayTmaxNV:
  823. return spv::BuiltInRayTmaxNV;
  824. case glslang::EbvInstanceCustomIndexNV:
  825. return spv::BuiltInInstanceCustomIndexNV;
  826. case glslang::EbvHitTNV:
  827. return spv::BuiltInHitTNV;
  828. case glslang::EbvHitKindNV:
  829. return spv::BuiltInHitKindNV;
  830. case glslang::EbvObjectToWorldNV:
  831. return spv::BuiltInObjectToWorldNV;
  832. case glslang::EbvWorldToObjectNV:
  833. return spv::BuiltInWorldToObjectNV;
  834. case glslang::EbvIncomingRayFlagsNV:
  835. return spv::BuiltInIncomingRayFlagsNV;
  836. case glslang::EbvBaryCoordNV:
  837. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  838. builder.addCapability(spv::CapabilityFragmentBarycentricNV);
  839. return spv::BuiltInBaryCoordNV;
  840. case glslang::EbvBaryCoordNoPerspNV:
  841. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  842. builder.addCapability(spv::CapabilityFragmentBarycentricNV);
  843. return spv::BuiltInBaryCoordNoPerspNV;
  844. case glslang::EbvTaskCountNV:
  845. return spv::BuiltInTaskCountNV;
  846. case glslang::EbvPrimitiveCountNV:
  847. return spv::BuiltInPrimitiveCountNV;
  848. case glslang::EbvPrimitiveIndicesNV:
  849. return spv::BuiltInPrimitiveIndicesNV;
  850. case glslang::EbvClipDistancePerViewNV:
  851. return spv::BuiltInClipDistancePerViewNV;
  852. case glslang::EbvCullDistancePerViewNV:
  853. return spv::BuiltInCullDistancePerViewNV;
  854. case glslang::EbvLayerPerViewNV:
  855. return spv::BuiltInLayerPerViewNV;
  856. case glslang::EbvMeshViewCountNV:
  857. return spv::BuiltInMeshViewCountNV;
  858. case glslang::EbvMeshViewIndicesNV:
  859. return spv::BuiltInMeshViewIndicesNV;
  860. #endif
  861. default:
  862. return spv::BuiltInMax;
  863. }
  864. }
  865. // Translate glslang image layout format to SPIR-V image format.
  866. spv::ImageFormat TGlslangToSpvTraverser::TranslateImageFormat(const glslang::TType& type)
  867. {
  868. assert(type.getBasicType() == glslang::EbtSampler);
  869. // Check for capabilities
  870. switch (type.getQualifier().layoutFormat) {
  871. case glslang::ElfRg32f:
  872. case glslang::ElfRg16f:
  873. case glslang::ElfR11fG11fB10f:
  874. case glslang::ElfR16f:
  875. case glslang::ElfRgba16:
  876. case glslang::ElfRgb10A2:
  877. case glslang::ElfRg16:
  878. case glslang::ElfRg8:
  879. case glslang::ElfR16:
  880. case glslang::ElfR8:
  881. case glslang::ElfRgba16Snorm:
  882. case glslang::ElfRg16Snorm:
  883. case glslang::ElfRg8Snorm:
  884. case glslang::ElfR16Snorm:
  885. case glslang::ElfR8Snorm:
  886. case glslang::ElfRg32i:
  887. case glslang::ElfRg16i:
  888. case glslang::ElfRg8i:
  889. case glslang::ElfR16i:
  890. case glslang::ElfR8i:
  891. case glslang::ElfRgb10a2ui:
  892. case glslang::ElfRg32ui:
  893. case glslang::ElfRg16ui:
  894. case glslang::ElfRg8ui:
  895. case glslang::ElfR16ui:
  896. case glslang::ElfR8ui:
  897. builder.addCapability(spv::CapabilityStorageImageExtendedFormats);
  898. break;
  899. default:
  900. break;
  901. }
  902. // do the translation
  903. switch (type.getQualifier().layoutFormat) {
  904. case glslang::ElfNone: return spv::ImageFormatUnknown;
  905. case glslang::ElfRgba32f: return spv::ImageFormatRgba32f;
  906. case glslang::ElfRgba16f: return spv::ImageFormatRgba16f;
  907. case glslang::ElfR32f: return spv::ImageFormatR32f;
  908. case glslang::ElfRgba8: return spv::ImageFormatRgba8;
  909. case glslang::ElfRgba8Snorm: return spv::ImageFormatRgba8Snorm;
  910. case glslang::ElfRg32f: return spv::ImageFormatRg32f;
  911. case glslang::ElfRg16f: return spv::ImageFormatRg16f;
  912. case glslang::ElfR11fG11fB10f: return spv::ImageFormatR11fG11fB10f;
  913. case glslang::ElfR16f: return spv::ImageFormatR16f;
  914. case glslang::ElfRgba16: return spv::ImageFormatRgba16;
  915. case glslang::ElfRgb10A2: return spv::ImageFormatRgb10A2;
  916. case glslang::ElfRg16: return spv::ImageFormatRg16;
  917. case glslang::ElfRg8: return spv::ImageFormatRg8;
  918. case glslang::ElfR16: return spv::ImageFormatR16;
  919. case glslang::ElfR8: return spv::ImageFormatR8;
  920. case glslang::ElfRgba16Snorm: return spv::ImageFormatRgba16Snorm;
  921. case glslang::ElfRg16Snorm: return spv::ImageFormatRg16Snorm;
  922. case glslang::ElfRg8Snorm: return spv::ImageFormatRg8Snorm;
  923. case glslang::ElfR16Snorm: return spv::ImageFormatR16Snorm;
  924. case glslang::ElfR8Snorm: return spv::ImageFormatR8Snorm;
  925. case glslang::ElfRgba32i: return spv::ImageFormatRgba32i;
  926. case glslang::ElfRgba16i: return spv::ImageFormatRgba16i;
  927. case glslang::ElfRgba8i: return spv::ImageFormatRgba8i;
  928. case glslang::ElfR32i: return spv::ImageFormatR32i;
  929. case glslang::ElfRg32i: return spv::ImageFormatRg32i;
  930. case glslang::ElfRg16i: return spv::ImageFormatRg16i;
  931. case glslang::ElfRg8i: return spv::ImageFormatRg8i;
  932. case glslang::ElfR16i: return spv::ImageFormatR16i;
  933. case glslang::ElfR8i: return spv::ImageFormatR8i;
  934. case glslang::ElfRgba32ui: return spv::ImageFormatRgba32ui;
  935. case glslang::ElfRgba16ui: return spv::ImageFormatRgba16ui;
  936. case glslang::ElfRgba8ui: return spv::ImageFormatRgba8ui;
  937. case glslang::ElfR32ui: return spv::ImageFormatR32ui;
  938. case glslang::ElfRg32ui: return spv::ImageFormatRg32ui;
  939. case glslang::ElfRg16ui: return spv::ImageFormatRg16ui;
  940. case glslang::ElfRgb10a2ui: return spv::ImageFormatRgb10a2ui;
  941. case glslang::ElfRg8ui: return spv::ImageFormatRg8ui;
  942. case glslang::ElfR16ui: return spv::ImageFormatR16ui;
  943. case glslang::ElfR8ui: return spv::ImageFormatR8ui;
  944. default: return spv::ImageFormatMax;
  945. }
  946. }
  947. spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSelectionControl(const glslang::TIntermSelection& selectionNode) const
  948. {
  949. if (selectionNode.getFlatten())
  950. return spv::SelectionControlFlattenMask;
  951. if (selectionNode.getDontFlatten())
  952. return spv::SelectionControlDontFlattenMask;
  953. return spv::SelectionControlMaskNone;
  954. }
  955. spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSwitchControl(const glslang::TIntermSwitch& switchNode) const
  956. {
  957. if (switchNode.getFlatten())
  958. return spv::SelectionControlFlattenMask;
  959. if (switchNode.getDontFlatten())
  960. return spv::SelectionControlDontFlattenMask;
  961. return spv::SelectionControlMaskNone;
  962. }
  963. // return a non-0 dependency if the dependency argument must be set
  964. spv::LoopControlMask TGlslangToSpvTraverser::TranslateLoopControl(const glslang::TIntermLoop& loopNode,
  965. unsigned int& dependencyLength) const
  966. {
  967. spv::LoopControlMask control = spv::LoopControlMaskNone;
  968. if (loopNode.getDontUnroll())
  969. control = control | spv::LoopControlDontUnrollMask;
  970. if (loopNode.getUnroll())
  971. control = control | spv::LoopControlUnrollMask;
  972. if (unsigned(loopNode.getLoopDependency()) == glslang::TIntermLoop::dependencyInfinite)
  973. control = control | spv::LoopControlDependencyInfiniteMask;
  974. else if (loopNode.getLoopDependency() > 0) {
  975. control = control | spv::LoopControlDependencyLengthMask;
  976. dependencyLength = loopNode.getLoopDependency();
  977. }
  978. return control;
  979. }
  980. // Translate glslang type to SPIR-V storage class.
  981. spv::StorageClass TGlslangToSpvTraverser::TranslateStorageClass(const glslang::TType& type)
  982. {
  983. if (type.getQualifier().isPipeInput())
  984. return spv::StorageClassInput;
  985. if (type.getQualifier().isPipeOutput())
  986. return spv::StorageClassOutput;
  987. if (glslangIntermediate->getSource() != glslang::EShSourceHlsl ||
  988. type.getQualifier().storage == glslang::EvqUniform) {
  989. if (type.getBasicType() == glslang::EbtAtomicUint)
  990. return spv::StorageClassAtomicCounter;
  991. if (type.containsOpaque())
  992. return spv::StorageClassUniformConstant;
  993. }
  994. #ifdef NV_EXTENSIONS
  995. if (type.getQualifier().isUniformOrBuffer() &&
  996. type.getQualifier().layoutShaderRecordNV) {
  997. return spv::StorageClassShaderRecordBufferNV;
  998. }
  999. #endif
  1000. if (glslangIntermediate->usingStorageBuffer() && type.getQualifier().storage == glslang::EvqBuffer) {
  1001. addPre13Extension(spv::E_SPV_KHR_storage_buffer_storage_class);
  1002. return spv::StorageClassStorageBuffer;
  1003. }
  1004. if (type.getQualifier().isUniformOrBuffer()) {
  1005. if (type.getQualifier().layoutPushConstant)
  1006. return spv::StorageClassPushConstant;
  1007. if (type.getBasicType() == glslang::EbtBlock)
  1008. return spv::StorageClassUniform;
  1009. return spv::StorageClassUniformConstant;
  1010. }
  1011. switch (type.getQualifier().storage) {
  1012. case glslang::EvqShared: return spv::StorageClassWorkgroup;
  1013. case glslang::EvqGlobal: return spv::StorageClassPrivate;
  1014. case glslang::EvqConstReadOnly: return spv::StorageClassFunction;
  1015. case glslang::EvqTemporary: return spv::StorageClassFunction;
  1016. #ifdef NV_EXTENSIONS
  1017. case glslang::EvqPayloadNV: return spv::StorageClassRayPayloadNV;
  1018. case glslang::EvqPayloadInNV: return spv::StorageClassIncomingRayPayloadNV;
  1019. case glslang::EvqHitAttrNV: return spv::StorageClassHitAttributeNV;
  1020. case glslang::EvqCallableDataNV: return spv::StorageClassCallableDataNV;
  1021. case glslang::EvqCallableDataInNV: return spv::StorageClassIncomingCallableDataNV;
  1022. #endif
  1023. default:
  1024. assert(0);
  1025. break;
  1026. }
  1027. return spv::StorageClassFunction;
  1028. }
  1029. // Add capabilities pertaining to how an array is indexed.
  1030. void TGlslangToSpvTraverser::addIndirectionIndexCapabilities(const glslang::TType& baseType,
  1031. const glslang::TType& indexType)
  1032. {
  1033. if (indexType.getQualifier().isNonUniform()) {
  1034. // deal with an asserted non-uniform index
  1035. // SPV_EXT_descriptor_indexing already added in TranslateNonUniformDecoration
  1036. if (baseType.getBasicType() == glslang::EbtSampler) {
  1037. if (baseType.getQualifier().hasAttachment())
  1038. builder.addCapability(spv::CapabilityInputAttachmentArrayNonUniformIndexingEXT);
  1039. else if (baseType.isImage() && baseType.getSampler().dim == glslang::EsdBuffer)
  1040. builder.addCapability(spv::CapabilityStorageTexelBufferArrayNonUniformIndexingEXT);
  1041. else if (baseType.isTexture() && baseType.getSampler().dim == glslang::EsdBuffer)
  1042. builder.addCapability(spv::CapabilityUniformTexelBufferArrayNonUniformIndexingEXT);
  1043. else if (baseType.isImage())
  1044. builder.addCapability(spv::CapabilityStorageImageArrayNonUniformIndexingEXT);
  1045. else if (baseType.isTexture())
  1046. builder.addCapability(spv::CapabilitySampledImageArrayNonUniformIndexingEXT);
  1047. } else if (baseType.getBasicType() == glslang::EbtBlock) {
  1048. if (baseType.getQualifier().storage == glslang::EvqBuffer)
  1049. builder.addCapability(spv::CapabilityStorageBufferArrayNonUniformIndexingEXT);
  1050. else if (baseType.getQualifier().storage == glslang::EvqUniform)
  1051. builder.addCapability(spv::CapabilityUniformBufferArrayNonUniformIndexingEXT);
  1052. }
  1053. } else {
  1054. // assume a dynamically uniform index
  1055. if (baseType.getBasicType() == glslang::EbtSampler) {
  1056. if (baseType.getQualifier().hasAttachment()) {
  1057. builder.addExtension("SPV_EXT_descriptor_indexing");
  1058. builder.addCapability(spv::CapabilityInputAttachmentArrayDynamicIndexingEXT);
  1059. } else if (baseType.isImage() && baseType.getSampler().dim == glslang::EsdBuffer) {
  1060. builder.addExtension("SPV_EXT_descriptor_indexing");
  1061. builder.addCapability(spv::CapabilityStorageTexelBufferArrayDynamicIndexingEXT);
  1062. } else if (baseType.isTexture() && baseType.getSampler().dim == glslang::EsdBuffer) {
  1063. builder.addExtension("SPV_EXT_descriptor_indexing");
  1064. builder.addCapability(spv::CapabilityUniformTexelBufferArrayDynamicIndexingEXT);
  1065. }
  1066. }
  1067. }
  1068. }
  1069. // Return whether or not the given type is something that should be tied to a
  1070. // descriptor set.
  1071. bool IsDescriptorResource(const glslang::TType& type)
  1072. {
  1073. // uniform and buffer blocks are included, unless it is a push_constant
  1074. if (type.getBasicType() == glslang::EbtBlock)
  1075. return type.getQualifier().isUniformOrBuffer() &&
  1076. #ifdef NV_EXTENSIONS
  1077. ! type.getQualifier().layoutShaderRecordNV &&
  1078. #endif
  1079. ! type.getQualifier().layoutPushConstant;
  1080. // non block...
  1081. // basically samplerXXX/subpass/sampler/texture are all included
  1082. // if they are the global-scope-class, not the function parameter
  1083. // (or local, if they ever exist) class.
  1084. if (type.getBasicType() == glslang::EbtSampler)
  1085. return type.getQualifier().isUniformOrBuffer();
  1086. // None of the above.
  1087. return false;
  1088. }
  1089. void InheritQualifiers(glslang::TQualifier& child, const glslang::TQualifier& parent)
  1090. {
  1091. if (child.layoutMatrix == glslang::ElmNone)
  1092. child.layoutMatrix = parent.layoutMatrix;
  1093. if (parent.invariant)
  1094. child.invariant = true;
  1095. if (parent.nopersp)
  1096. child.nopersp = true;
  1097. #ifdef AMD_EXTENSIONS
  1098. if (parent.explicitInterp)
  1099. child.explicitInterp = true;
  1100. #endif
  1101. if (parent.flat)
  1102. child.flat = true;
  1103. if (parent.centroid)
  1104. child.centroid = true;
  1105. if (parent.patch)
  1106. child.patch = true;
  1107. if (parent.sample)
  1108. child.sample = true;
  1109. if (parent.coherent)
  1110. child.coherent = true;
  1111. if (parent.devicecoherent)
  1112. child.devicecoherent = true;
  1113. if (parent.queuefamilycoherent)
  1114. child.queuefamilycoherent = true;
  1115. if (parent.workgroupcoherent)
  1116. child.workgroupcoherent = true;
  1117. if (parent.subgroupcoherent)
  1118. child.subgroupcoherent = true;
  1119. if (parent.nonprivate)
  1120. child.nonprivate = true;
  1121. if (parent.volatil)
  1122. child.volatil = true;
  1123. if (parent.restrict)
  1124. child.restrict = true;
  1125. if (parent.readonly)
  1126. child.readonly = true;
  1127. if (parent.writeonly)
  1128. child.writeonly = true;
  1129. #ifdef NV_EXTENSIONS
  1130. if (parent.perPrimitiveNV)
  1131. child.perPrimitiveNV = true;
  1132. if (parent.perViewNV)
  1133. child.perViewNV = true;
  1134. if (parent.perTaskNV)
  1135. child.perTaskNV = true;
  1136. #endif
  1137. }
  1138. bool HasNonLayoutQualifiers(const glslang::TType& type, const glslang::TQualifier& qualifier)
  1139. {
  1140. // This should list qualifiers that simultaneous satisfy:
  1141. // - struct members might inherit from a struct declaration
  1142. // (note that non-block structs don't explicitly inherit,
  1143. // only implicitly, meaning no decoration involved)
  1144. // - affect decorations on the struct members
  1145. // (note smooth does not, and expecting something like volatile
  1146. // to effect the whole object)
  1147. // - are not part of the offset/st430/etc or row/column-major layout
  1148. return qualifier.invariant || (qualifier.hasLocation() && type.getBasicType() == glslang::EbtBlock);
  1149. }
  1150. //
  1151. // Implement the TGlslangToSpvTraverser class.
  1152. //
  1153. TGlslangToSpvTraverser::TGlslangToSpvTraverser(unsigned int spvVersion, const glslang::TIntermediate* glslangIntermediate,
  1154. spv::SpvBuildLogger* buildLogger, glslang::SpvOptions& options)
  1155. : TIntermTraverser(true, false, true),
  1156. options(options),
  1157. shaderEntry(nullptr), currentFunction(nullptr),
  1158. sequenceDepth(0), logger(buildLogger),
  1159. builder(spvVersion, (glslang::GetKhronosToolId() << 16) | glslang::GetSpirvGeneratorVersion(), logger),
  1160. inEntryPoint(false), entryPointTerminated(false), linkageOnly(false),
  1161. glslangIntermediate(glslangIntermediate)
  1162. {
  1163. spv::ExecutionModel executionModel = TranslateExecutionModel(glslangIntermediate->getStage());
  1164. builder.clearAccessChain();
  1165. builder.setSource(TranslateSourceLanguage(glslangIntermediate->getSource(), glslangIntermediate->getProfile()),
  1166. glslangIntermediate->getVersion());
  1167. if (options.generateDebugInfo) {
  1168. builder.setEmitOpLines();
  1169. builder.setSourceFile(glslangIntermediate->getSourceFile());
  1170. // Set the source shader's text. If for SPV version 1.0, include
  1171. // a preamble in comments stating the OpModuleProcessed instructions.
  1172. // Otherwise, emit those as actual instructions.
  1173. std::string text;
  1174. const std::vector<std::string>& processes = glslangIntermediate->getProcesses();
  1175. for (int p = 0; p < (int)processes.size(); ++p) {
  1176. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1) {
  1177. text.append("// OpModuleProcessed ");
  1178. text.append(processes[p]);
  1179. text.append("\n");
  1180. } else
  1181. builder.addModuleProcessed(processes[p]);
  1182. }
  1183. if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1 && (int)processes.size() > 0)
  1184. text.append("#line 1\n");
  1185. text.append(glslangIntermediate->getSourceText());
  1186. builder.setSourceText(text);
  1187. // Pass name and text for all included files
  1188. const std::map<std::string, std::string>& include_txt = glslangIntermediate->getIncludeText();
  1189. for (auto iItr = include_txt.begin(); iItr != include_txt.end(); ++iItr)
  1190. builder.addInclude(iItr->first, iItr->second);
  1191. }
  1192. stdBuiltins = builder.import("GLSL.std.450");
  1193. spv::AddressingModel addressingModel = spv::AddressingModelLogical;
  1194. spv::MemoryModel memoryModel = spv::MemoryModelGLSL450;
  1195. if (glslangIntermediate->usingPhysicalStorageBuffer()) {
  1196. addressingModel = spv::AddressingModelPhysicalStorageBuffer64EXT;
  1197. builder.addExtension(spv::E_SPV_EXT_physical_storage_buffer);
  1198. builder.addCapability(spv::CapabilityPhysicalStorageBufferAddressesEXT);
  1199. };
  1200. if (glslangIntermediate->usingVulkanMemoryModel()) {
  1201. memoryModel = spv::MemoryModelVulkanKHR;
  1202. builder.addCapability(spv::CapabilityVulkanMemoryModelKHR);
  1203. builder.addExtension(spv::E_SPV_KHR_vulkan_memory_model);
  1204. }
  1205. builder.setMemoryModel(addressingModel, memoryModel);
  1206. if (glslangIntermediate->usingVariablePointers()) {
  1207. builder.addCapability(spv::CapabilityVariablePointers);
  1208. }
  1209. shaderEntry = builder.makeEntryPoint(glslangIntermediate->getEntryPointName().c_str());
  1210. entryPoint = builder.addEntryPoint(executionModel, shaderEntry, glslangIntermediate->getEntryPointName().c_str());
  1211. // Add the source extensions
  1212. const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();
  1213. for (auto it = sourceExtensions.begin(); it != sourceExtensions.end(); ++it)
  1214. builder.addSourceExtension(it->c_str());
  1215. // Add the top-level modes for this shader.
  1216. if (glslangIntermediate->getXfbMode()) {
  1217. builder.addCapability(spv::CapabilityTransformFeedback);
  1218. builder.addExecutionMode(shaderEntry, spv::ExecutionModeXfb);
  1219. }
  1220. unsigned int mode;
  1221. switch (glslangIntermediate->getStage()) {
  1222. case EShLangVertex:
  1223. builder.addCapability(spv::CapabilityShader);
  1224. break;
  1225. case EShLangTessEvaluation:
  1226. case EShLangTessControl:
  1227. builder.addCapability(spv::CapabilityTessellation);
  1228. glslang::TLayoutGeometry primitive;
  1229. if (glslangIntermediate->getStage() == EShLangTessControl) {
  1230. builder.addExecutionMode(shaderEntry, spv::ExecutionModeOutputVertices, glslangIntermediate->getVertices());
  1231. primitive = glslangIntermediate->getOutputPrimitive();
  1232. } else {
  1233. primitive = glslangIntermediate->getInputPrimitive();
  1234. }
  1235. switch (primitive) {
  1236. case glslang::ElgTriangles: mode = spv::ExecutionModeTriangles; break;
  1237. case glslang::ElgQuads: mode = spv::ExecutionModeQuads; break;
  1238. case glslang::ElgIsolines: mode = spv::ExecutionModeIsolines; break;
  1239. default: mode = spv::ExecutionModeMax; break;
  1240. }
  1241. if (mode != spv::ExecutionModeMax)
  1242. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1243. switch (glslangIntermediate->getVertexSpacing()) {
  1244. case glslang::EvsEqual: mode = spv::ExecutionModeSpacingEqual; break;
  1245. case glslang::EvsFractionalEven: mode = spv::ExecutionModeSpacingFractionalEven; break;
  1246. case glslang::EvsFractionalOdd: mode = spv::ExecutionModeSpacingFractionalOdd; break;
  1247. default: mode = spv::ExecutionModeMax; break;
  1248. }
  1249. if (mode != spv::ExecutionModeMax)
  1250. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1251. switch (glslangIntermediate->getVertexOrder()) {
  1252. case glslang::EvoCw: mode = spv::ExecutionModeVertexOrderCw; break;
  1253. case glslang::EvoCcw: mode = spv::ExecutionModeVertexOrderCcw; break;
  1254. default: mode = spv::ExecutionModeMax; break;
  1255. }
  1256. if (mode != spv::ExecutionModeMax)
  1257. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1258. if (glslangIntermediate->getPointMode())
  1259. builder.addExecutionMode(shaderEntry, spv::ExecutionModePointMode);
  1260. break;
  1261. case EShLangGeometry:
  1262. builder.addCapability(spv::CapabilityGeometry);
  1263. switch (glslangIntermediate->getInputPrimitive()) {
  1264. case glslang::ElgPoints: mode = spv::ExecutionModeInputPoints; break;
  1265. case glslang::ElgLines: mode = spv::ExecutionModeInputLines; break;
  1266. case glslang::ElgLinesAdjacency: mode = spv::ExecutionModeInputLinesAdjacency; break;
  1267. case glslang::ElgTriangles: mode = spv::ExecutionModeTriangles; break;
  1268. case glslang::ElgTrianglesAdjacency: mode = spv::ExecutionModeInputTrianglesAdjacency; break;
  1269. default: mode = spv::ExecutionModeMax; break;
  1270. }
  1271. if (mode != spv::ExecutionModeMax)
  1272. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1273. builder.addExecutionMode(shaderEntry, spv::ExecutionModeInvocations, glslangIntermediate->getInvocations());
  1274. switch (glslangIntermediate->getOutputPrimitive()) {
  1275. case glslang::ElgPoints: mode = spv::ExecutionModeOutputPoints; break;
  1276. case glslang::ElgLineStrip: mode = spv::ExecutionModeOutputLineStrip; break;
  1277. case glslang::ElgTriangleStrip: mode = spv::ExecutionModeOutputTriangleStrip; break;
  1278. default: mode = spv::ExecutionModeMax; break;
  1279. }
  1280. if (mode != spv::ExecutionModeMax)
  1281. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1282. builder.addExecutionMode(shaderEntry, spv::ExecutionModeOutputVertices, glslangIntermediate->getVertices());
  1283. break;
  1284. case EShLangFragment:
  1285. builder.addCapability(spv::CapabilityShader);
  1286. if (glslangIntermediate->getPixelCenterInteger())
  1287. builder.addExecutionMode(shaderEntry, spv::ExecutionModePixelCenterInteger);
  1288. if (glslangIntermediate->getOriginUpperLeft())
  1289. builder.addExecutionMode(shaderEntry, spv::ExecutionModeOriginUpperLeft);
  1290. else
  1291. builder.addExecutionMode(shaderEntry, spv::ExecutionModeOriginLowerLeft);
  1292. if (glslangIntermediate->getEarlyFragmentTests())
  1293. builder.addExecutionMode(shaderEntry, spv::ExecutionModeEarlyFragmentTests);
  1294. if (glslangIntermediate->getPostDepthCoverage()) {
  1295. builder.addCapability(spv::CapabilitySampleMaskPostDepthCoverage);
  1296. builder.addExecutionMode(shaderEntry, spv::ExecutionModePostDepthCoverage);
  1297. builder.addExtension(spv::E_SPV_KHR_post_depth_coverage);
  1298. }
  1299. switch(glslangIntermediate->getDepth()) {
  1300. case glslang::EldGreater: mode = spv::ExecutionModeDepthGreater; break;
  1301. case glslang::EldLess: mode = spv::ExecutionModeDepthLess; break;
  1302. default: mode = spv::ExecutionModeMax; break;
  1303. }
  1304. if (mode != spv::ExecutionModeMax)
  1305. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1306. if (glslangIntermediate->getDepth() != glslang::EldUnchanged && glslangIntermediate->isDepthReplacing())
  1307. builder.addExecutionMode(shaderEntry, spv::ExecutionModeDepthReplacing);
  1308. break;
  1309. case EShLangCompute:
  1310. builder.addCapability(spv::CapabilityShader);
  1311. builder.addExecutionMode(shaderEntry, spv::ExecutionModeLocalSize, glslangIntermediate->getLocalSize(0),
  1312. glslangIntermediate->getLocalSize(1),
  1313. glslangIntermediate->getLocalSize(2));
  1314. #ifdef NV_EXTENSIONS
  1315. if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupQuads) {
  1316. builder.addCapability(spv::CapabilityComputeDerivativeGroupQuadsNV);
  1317. builder.addExecutionMode(shaderEntry, spv::ExecutionModeDerivativeGroupQuadsNV);
  1318. builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);
  1319. } else if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupLinear) {
  1320. builder.addCapability(spv::CapabilityComputeDerivativeGroupLinearNV);
  1321. builder.addExecutionMode(shaderEntry, spv::ExecutionModeDerivativeGroupLinearNV);
  1322. builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);
  1323. }
  1324. #endif
  1325. break;
  1326. #ifdef NV_EXTENSIONS
  1327. case EShLangRayGenNV:
  1328. case EShLangIntersectNV:
  1329. case EShLangAnyHitNV:
  1330. case EShLangClosestHitNV:
  1331. case EShLangMissNV:
  1332. case EShLangCallableNV:
  1333. builder.addCapability(spv::CapabilityRayTracingNV);
  1334. builder.addExtension("SPV_NV_ray_tracing");
  1335. break;
  1336. case EShLangTaskNV:
  1337. case EShLangMeshNV:
  1338. builder.addCapability(spv::CapabilityMeshShadingNV);
  1339. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  1340. builder.addExecutionMode(shaderEntry, spv::ExecutionModeLocalSize, glslangIntermediate->getLocalSize(0),
  1341. glslangIntermediate->getLocalSize(1),
  1342. glslangIntermediate->getLocalSize(2));
  1343. if (glslangIntermediate->getStage() == EShLangMeshNV) {
  1344. builder.addExecutionMode(shaderEntry, spv::ExecutionModeOutputVertices, glslangIntermediate->getVertices());
  1345. builder.addExecutionMode(shaderEntry, spv::ExecutionModeOutputPrimitivesNV, glslangIntermediate->getPrimitives());
  1346. switch (glslangIntermediate->getOutputPrimitive()) {
  1347. case glslang::ElgPoints: mode = spv::ExecutionModeOutputPoints; break;
  1348. case glslang::ElgLines: mode = spv::ExecutionModeOutputLinesNV; break;
  1349. case glslang::ElgTriangles: mode = spv::ExecutionModeOutputTrianglesNV; break;
  1350. default: mode = spv::ExecutionModeMax; break;
  1351. }
  1352. if (mode != spv::ExecutionModeMax)
  1353. builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);
  1354. }
  1355. break;
  1356. #endif
  1357. default:
  1358. break;
  1359. }
  1360. }
  1361. // Finish creating SPV, after the traversal is complete.
  1362. void TGlslangToSpvTraverser::finishSpv()
  1363. {
  1364. // Finish the entry point function
  1365. if (! entryPointTerminated) {
  1366. builder.setBuildPoint(shaderEntry->getLastBlock());
  1367. builder.leaveFunction();
  1368. }
  1369. // finish off the entry-point SPV instruction by adding the Input/Output <id>
  1370. for (auto it = iOSet.cbegin(); it != iOSet.cend(); ++it)
  1371. entryPoint->addIdOperand(*it);
  1372. // Add capabilities, extensions, remove unneeded decorations, etc.,
  1373. // based on the resulting SPIR-V.
  1374. builder.postProcess();
  1375. }
  1376. // Write the SPV into 'out'.
  1377. void TGlslangToSpvTraverser::dumpSpv(std::vector<unsigned int>& out)
  1378. {
  1379. builder.dump(out);
  1380. }
  1381. //
  1382. // Implement the traversal functions.
  1383. //
  1384. // Return true from interior nodes to have the external traversal
  1385. // continue on to children. Return false if children were
  1386. // already processed.
  1387. //
  1388. //
  1389. // Symbols can turn into
  1390. // - uniform/input reads
  1391. // - output writes
  1392. // - complex lvalue base setups: foo.bar[3].... , where we see foo and start up an access chain
  1393. // - something simple that degenerates into the last bullet
  1394. //
  1395. void TGlslangToSpvTraverser::visitSymbol(glslang::TIntermSymbol* symbol)
  1396. {
  1397. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  1398. if (symbol->getType().getQualifier().isSpecConstant())
  1399. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  1400. // getSymbolId() will set up all the IO decorations on the first call.
  1401. // Formal function parameters were mapped during makeFunctions().
  1402. spv::Id id = getSymbolId(symbol);
  1403. // Include all "static use" and "linkage only" interface variables on the OpEntryPoint instruction
  1404. if (builder.isPointer(id)) {
  1405. spv::StorageClass sc = builder.getStorageClass(id);
  1406. if (sc == spv::StorageClassInput || sc == spv::StorageClassOutput) {
  1407. if (!symbol->getType().isStruct() || symbol->getType().getStruct()->size() > 0)
  1408. iOSet.insert(id);
  1409. }
  1410. }
  1411. // Only process non-linkage-only nodes for generating actual static uses
  1412. if (! linkageOnly || symbol->getQualifier().isSpecConstant()) {
  1413. // Prepare to generate code for the access
  1414. // L-value chains will be computed left to right. We're on the symbol now,
  1415. // which is the left-most part of the access chain, so now is "clear" time,
  1416. // followed by setting the base.
  1417. builder.clearAccessChain();
  1418. // For now, we consider all user variables as being in memory, so they are pointers,
  1419. // except for
  1420. // A) R-Value arguments to a function, which are an intermediate object.
  1421. // See comments in handleUserFunctionCall().
  1422. // B) Specialization constants (normal constants don't even come in as a variable),
  1423. // These are also pure R-values.
  1424. glslang::TQualifier qualifier = symbol->getQualifier();
  1425. if (qualifier.isSpecConstant() || rValueParameters.find(symbol->getId()) != rValueParameters.end())
  1426. builder.setAccessChainRValue(id);
  1427. else
  1428. builder.setAccessChainLValue(id);
  1429. }
  1430. // Process linkage-only nodes for any special additional interface work.
  1431. if (linkageOnly) {
  1432. if (glslangIntermediate->getHlslFunctionality1()) {
  1433. // Map implicit counter buffers to their originating buffers, which should have been
  1434. // seen by now, given earlier pruning of unused counters, and preservation of order
  1435. // of declaration.
  1436. if (symbol->getType().getQualifier().isUniformOrBuffer()) {
  1437. if (!glslangIntermediate->hasCounterBufferName(symbol->getName())) {
  1438. // Save possible originating buffers for counter buffers, keyed by
  1439. // making the potential counter-buffer name.
  1440. std::string keyName = symbol->getName().c_str();
  1441. keyName = glslangIntermediate->addCounterBufferName(keyName);
  1442. counterOriginator[keyName] = symbol;
  1443. } else {
  1444. // Handle a counter buffer, by finding the saved originating buffer.
  1445. std::string keyName = symbol->getName().c_str();
  1446. auto it = counterOriginator.find(keyName);
  1447. if (it != counterOriginator.end()) {
  1448. id = getSymbolId(it->second);
  1449. if (id != spv::NoResult) {
  1450. spv::Id counterId = getSymbolId(symbol);
  1451. if (counterId != spv::NoResult) {
  1452. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  1453. builder.addDecorationId(id, spv::DecorationHlslCounterBufferGOOGLE, counterId);
  1454. }
  1455. }
  1456. }
  1457. }
  1458. }
  1459. }
  1460. }
  1461. }
  1462. bool TGlslangToSpvTraverser::visitBinary(glslang::TVisit /* visit */, glslang::TIntermBinary* node)
  1463. {
  1464. builder.setLine(node->getLoc().line, node->getLoc().getFilename());
  1465. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  1466. if (node->getType().getQualifier().isSpecConstant())
  1467. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  1468. // First, handle special cases
  1469. switch (node->getOp()) {
  1470. case glslang::EOpAssign:
  1471. case glslang::EOpAddAssign:
  1472. case glslang::EOpSubAssign:
  1473. case glslang::EOpMulAssign:
  1474. case glslang::EOpVectorTimesMatrixAssign:
  1475. case glslang::EOpVectorTimesScalarAssign:
  1476. case glslang::EOpMatrixTimesScalarAssign:
  1477. case glslang::EOpMatrixTimesMatrixAssign:
  1478. case glslang::EOpDivAssign:
  1479. case glslang::EOpModAssign:
  1480. case glslang::EOpAndAssign:
  1481. case glslang::EOpInclusiveOrAssign:
  1482. case glslang::EOpExclusiveOrAssign:
  1483. case glslang::EOpLeftShiftAssign:
  1484. case glslang::EOpRightShiftAssign:
  1485. // A bin-op assign "a += b" means the same thing as "a = a + b"
  1486. // where a is evaluated before b. For a simple assignment, GLSL
  1487. // says to evaluate the left before the right. So, always, left
  1488. // node then right node.
  1489. {
  1490. // get the left l-value, save it away
  1491. builder.clearAccessChain();
  1492. node->getLeft()->traverse(this);
  1493. spv::Builder::AccessChain lValue = builder.getAccessChain();
  1494. // evaluate the right
  1495. builder.clearAccessChain();
  1496. node->getRight()->traverse(this);
  1497. spv::Id rValue = accessChainLoad(node->getRight()->getType());
  1498. if (node->getOp() != glslang::EOpAssign) {
  1499. // the left is also an r-value
  1500. builder.setAccessChain(lValue);
  1501. spv::Id leftRValue = accessChainLoad(node->getLeft()->getType());
  1502. // do the operation
  1503. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  1504. TranslateNoContractionDecoration(node->getType().getQualifier()),
  1505. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  1506. rValue = createBinaryOperation(node->getOp(), decorations,
  1507. convertGlslangToSpvType(node->getType()), leftRValue, rValue,
  1508. node->getType().getBasicType());
  1509. // these all need their counterparts in createBinaryOperation()
  1510. assert(rValue != spv::NoResult);
  1511. }
  1512. // store the result
  1513. builder.setAccessChain(lValue);
  1514. multiTypeStore(node->getLeft()->getType(), rValue);
  1515. // assignments are expressions having an rValue after they are evaluated...
  1516. builder.clearAccessChain();
  1517. builder.setAccessChainRValue(rValue);
  1518. }
  1519. return false;
  1520. case glslang::EOpIndexDirect:
  1521. case glslang::EOpIndexDirectStruct:
  1522. {
  1523. // Get the left part of the access chain.
  1524. node->getLeft()->traverse(this);
  1525. // Add the next element in the chain
  1526. const int glslangIndex = node->getRight()->getAsConstantUnion()->getConstArray()[0].getIConst();
  1527. if (! node->getLeft()->getType().isArray() &&
  1528. node->getLeft()->getType().isVector() &&
  1529. node->getOp() == glslang::EOpIndexDirect) {
  1530. // This is essentially a hard-coded vector swizzle of size 1,
  1531. // so short circuit the access-chain stuff with a swizzle.
  1532. std::vector<unsigned> swizzle;
  1533. swizzle.push_back(glslangIndex);
  1534. int dummySize;
  1535. builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(node->getLeft()->getType()),
  1536. TranslateCoherent(node->getLeft()->getType()),
  1537. glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(), dummySize));
  1538. } else {
  1539. // Load through a block reference is performed with a dot operator that
  1540. // is mapped to EOpIndexDirectStruct. When we get to the actual reference,
  1541. // do a load and reset the access chain.
  1542. if (node->getLeft()->getBasicType() == glslang::EbtReference &&
  1543. !node->getLeft()->getType().isArray() &&
  1544. node->getOp() == glslang::EOpIndexDirectStruct)
  1545. {
  1546. spv::Id left = accessChainLoad(node->getLeft()->getType());
  1547. builder.clearAccessChain();
  1548. builder.setAccessChainLValue(left);
  1549. }
  1550. int spvIndex = glslangIndex;
  1551. if (node->getLeft()->getBasicType() == glslang::EbtBlock &&
  1552. node->getOp() == glslang::EOpIndexDirectStruct)
  1553. {
  1554. // This may be, e.g., an anonymous block-member selection, which generally need
  1555. // index remapping due to hidden members in anonymous blocks.
  1556. std::vector<int>& remapper = memberRemapper[node->getLeft()->getType().getStruct()];
  1557. assert(remapper.size() > 0);
  1558. spvIndex = remapper[glslangIndex];
  1559. }
  1560. // normal case for indexing array or structure or block
  1561. builder.accessChainPush(builder.makeIntConstant(spvIndex), TranslateCoherent(node->getLeft()->getType()), node->getLeft()->getType().getBufferReferenceAlignment());
  1562. // Add capabilities here for accessing PointSize and clip/cull distance.
  1563. // We have deferred generation of associated capabilities until now.
  1564. if (node->getLeft()->getType().isStruct() && ! node->getLeft()->getType().isArray())
  1565. declareUseOfStructMember(*(node->getLeft()->getType().getStruct()), glslangIndex);
  1566. }
  1567. }
  1568. return false;
  1569. case glslang::EOpIndexIndirect:
  1570. {
  1571. // Structure or array or vector indirection.
  1572. // Will use native SPIR-V access-chain for struct and array indirection;
  1573. // matrices are arrays of vectors, so will also work for a matrix.
  1574. // Will use the access chain's 'component' for variable index into a vector.
  1575. // This adapter is building access chains left to right.
  1576. // Set up the access chain to the left.
  1577. node->getLeft()->traverse(this);
  1578. // save it so that computing the right side doesn't trash it
  1579. spv::Builder::AccessChain partial = builder.getAccessChain();
  1580. // compute the next index in the chain
  1581. builder.clearAccessChain();
  1582. node->getRight()->traverse(this);
  1583. spv::Id index = accessChainLoad(node->getRight()->getType());
  1584. addIndirectionIndexCapabilities(node->getLeft()->getType(), node->getRight()->getType());
  1585. // restore the saved access chain
  1586. builder.setAccessChain(partial);
  1587. if (! node->getLeft()->getType().isArray() && node->getLeft()->getType().isVector()) {
  1588. int dummySize;
  1589. builder.accessChainPushComponent(index, convertGlslangToSpvType(node->getLeft()->getType()),
  1590. TranslateCoherent(node->getLeft()->getType()),
  1591. glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(), dummySize));
  1592. } else
  1593. builder.accessChainPush(index, TranslateCoherent(node->getLeft()->getType()), node->getLeft()->getType().getBufferReferenceAlignment());
  1594. }
  1595. return false;
  1596. case glslang::EOpVectorSwizzle:
  1597. {
  1598. node->getLeft()->traverse(this);
  1599. std::vector<unsigned> swizzle;
  1600. convertSwizzle(*node->getRight()->getAsAggregate(), swizzle);
  1601. int dummySize;
  1602. builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(node->getLeft()->getType()),
  1603. TranslateCoherent(node->getLeft()->getType()),
  1604. glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(), dummySize));
  1605. }
  1606. return false;
  1607. case glslang::EOpMatrixSwizzle:
  1608. logger->missingFunctionality("matrix swizzle");
  1609. return true;
  1610. case glslang::EOpLogicalOr:
  1611. case glslang::EOpLogicalAnd:
  1612. {
  1613. // These may require short circuiting, but can sometimes be done as straight
  1614. // binary operations. The right operand must be short circuited if it has
  1615. // side effects, and should probably be if it is complex.
  1616. if (isTrivial(node->getRight()->getAsTyped()))
  1617. break; // handle below as a normal binary operation
  1618. // otherwise, we need to do dynamic short circuiting on the right operand
  1619. spv::Id result = createShortCircuit(node->getOp(), *node->getLeft()->getAsTyped(), *node->getRight()->getAsTyped());
  1620. builder.clearAccessChain();
  1621. builder.setAccessChainRValue(result);
  1622. }
  1623. return false;
  1624. default:
  1625. break;
  1626. }
  1627. // Assume generic binary op...
  1628. // get right operand
  1629. builder.clearAccessChain();
  1630. node->getLeft()->traverse(this);
  1631. spv::Id left = accessChainLoad(node->getLeft()->getType());
  1632. // get left operand
  1633. builder.clearAccessChain();
  1634. node->getRight()->traverse(this);
  1635. spv::Id right = accessChainLoad(node->getRight()->getType());
  1636. // get result
  1637. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  1638. TranslateNoContractionDecoration(node->getType().getQualifier()),
  1639. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  1640. spv::Id result = createBinaryOperation(node->getOp(), decorations,
  1641. convertGlslangToSpvType(node->getType()), left, right,
  1642. node->getLeft()->getType().getBasicType());
  1643. builder.clearAccessChain();
  1644. if (! result) {
  1645. logger->missingFunctionality("unknown glslang binary operation");
  1646. return true; // pick up a child as the place-holder result
  1647. } else {
  1648. builder.setAccessChainRValue(result);
  1649. return false;
  1650. }
  1651. }
  1652. bool TGlslangToSpvTraverser::visitUnary(glslang::TVisit /* visit */, glslang::TIntermUnary* node)
  1653. {
  1654. builder.setLine(node->getLoc().line, node->getLoc().getFilename());
  1655. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  1656. if (node->getType().getQualifier().isSpecConstant())
  1657. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  1658. spv::Id result = spv::NoResult;
  1659. // try texturing first
  1660. result = createImageTextureFunctionCall(node);
  1661. if (result != spv::NoResult) {
  1662. builder.clearAccessChain();
  1663. builder.setAccessChainRValue(result);
  1664. return false; // done with this node
  1665. }
  1666. // Non-texturing.
  1667. if (node->getOp() == glslang::EOpArrayLength) {
  1668. // Quite special; won't want to evaluate the operand.
  1669. // Currently, the front-end does not allow .length() on an array until it is sized,
  1670. // except for the last block membeor of an SSBO.
  1671. // TODO: If this changes, link-time sized arrays might show up here, and need their
  1672. // size extracted.
  1673. // Normal .length() would have been constant folded by the front-end.
  1674. // So, this has to be block.lastMember.length().
  1675. // SPV wants "block" and member number as the operands, go get them.
  1676. spv::Id length;
  1677. if (node->getOperand()->getType().isCoopMat()) {
  1678. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  1679. spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());
  1680. assert(builder.isCooperativeMatrixType(typeId));
  1681. length = builder.createCooperativeMatrixLength(typeId);
  1682. } else {
  1683. glslang::TIntermTyped* block = node->getOperand()->getAsBinaryNode()->getLeft();
  1684. block->traverse(this);
  1685. unsigned int member = node->getOperand()->getAsBinaryNode()->getRight()->getAsConstantUnion()->getConstArray()[0].getUConst();
  1686. length = builder.createArrayLength(builder.accessChainGetLValue(), member);
  1687. }
  1688. // GLSL semantics say the result of .length() is an int, while SPIR-V says
  1689. // signedness must be 0. So, convert from SPIR-V unsigned back to GLSL's
  1690. // AST expectation of a signed result.
  1691. if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
  1692. if (builder.isInSpecConstCodeGenMode()) {
  1693. length = builder.createBinOp(spv::OpIAdd, builder.makeIntType(32), length, builder.makeIntConstant(0));
  1694. } else {
  1695. length = builder.createUnaryOp(spv::OpBitcast, builder.makeIntType(32), length);
  1696. }
  1697. }
  1698. builder.clearAccessChain();
  1699. builder.setAccessChainRValue(length);
  1700. return false;
  1701. }
  1702. // Start by evaluating the operand
  1703. // Does it need a swizzle inversion? If so, evaluation is inverted;
  1704. // operate first on the swizzle base, then apply the swizzle.
  1705. spv::Id invertedType = spv::NoType;
  1706. auto resultType = [&invertedType, &node, this](){ return invertedType != spv::NoType ? invertedType : convertGlslangToSpvType(node->getType()); };
  1707. if (node->getOp() == glslang::EOpInterpolateAtCentroid)
  1708. invertedType = getInvertedSwizzleType(*node->getOperand());
  1709. builder.clearAccessChain();
  1710. if (invertedType != spv::NoType)
  1711. node->getOperand()->getAsBinaryNode()->getLeft()->traverse(this);
  1712. else
  1713. node->getOperand()->traverse(this);
  1714. spv::Id operand = spv::NoResult;
  1715. if (node->getOp() == glslang::EOpAtomicCounterIncrement ||
  1716. node->getOp() == glslang::EOpAtomicCounterDecrement ||
  1717. node->getOp() == glslang::EOpAtomicCounter ||
  1718. node->getOp() == glslang::EOpInterpolateAtCentroid)
  1719. operand = builder.accessChainGetLValue(); // Special case l-value operands
  1720. else
  1721. operand = accessChainLoad(node->getOperand()->getType());
  1722. OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
  1723. TranslateNoContractionDecoration(node->getType().getQualifier()),
  1724. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  1725. // it could be a conversion
  1726. if (! result)
  1727. result = createConversion(node->getOp(), decorations, resultType(), operand, node->getOperand()->getBasicType());
  1728. // if not, then possibly an operation
  1729. if (! result)
  1730. result = createUnaryOperation(node->getOp(), decorations, resultType(), operand, node->getOperand()->getBasicType());
  1731. if (result) {
  1732. if (invertedType) {
  1733. result = createInvertedSwizzle(decorations.precision, *node->getOperand(), result);
  1734. builder.addDecoration(result, decorations.nonUniform);
  1735. }
  1736. builder.clearAccessChain();
  1737. builder.setAccessChainRValue(result);
  1738. return false; // done with this node
  1739. }
  1740. // it must be a special case, check...
  1741. switch (node->getOp()) {
  1742. case glslang::EOpPostIncrement:
  1743. case glslang::EOpPostDecrement:
  1744. case glslang::EOpPreIncrement:
  1745. case glslang::EOpPreDecrement:
  1746. {
  1747. // we need the integer value "1" or the floating point "1.0" to add/subtract
  1748. spv::Id one = 0;
  1749. if (node->getBasicType() == glslang::EbtFloat)
  1750. one = builder.makeFloatConstant(1.0F);
  1751. else if (node->getBasicType() == glslang::EbtDouble)
  1752. one = builder.makeDoubleConstant(1.0);
  1753. else if (node->getBasicType() == glslang::EbtFloat16)
  1754. one = builder.makeFloat16Constant(1.0F);
  1755. else if (node->getBasicType() == glslang::EbtInt8 || node->getBasicType() == glslang::EbtUint8)
  1756. one = builder.makeInt8Constant(1);
  1757. else if (node->getBasicType() == glslang::EbtInt16 || node->getBasicType() == glslang::EbtUint16)
  1758. one = builder.makeInt16Constant(1);
  1759. else if (node->getBasicType() == glslang::EbtInt64 || node->getBasicType() == glslang::EbtUint64)
  1760. one = builder.makeInt64Constant(1);
  1761. else
  1762. one = builder.makeIntConstant(1);
  1763. glslang::TOperator op;
  1764. if (node->getOp() == glslang::EOpPreIncrement ||
  1765. node->getOp() == glslang::EOpPostIncrement)
  1766. op = glslang::EOpAdd;
  1767. else
  1768. op = glslang::EOpSub;
  1769. spv::Id result = createBinaryOperation(op, decorations,
  1770. convertGlslangToSpvType(node->getType()), operand, one,
  1771. node->getType().getBasicType());
  1772. assert(result != spv::NoResult);
  1773. // The result of operation is always stored, but conditionally the
  1774. // consumed result. The consumed result is always an r-value.
  1775. builder.accessChainStore(result);
  1776. builder.clearAccessChain();
  1777. if (node->getOp() == glslang::EOpPreIncrement ||
  1778. node->getOp() == glslang::EOpPreDecrement)
  1779. builder.setAccessChainRValue(result);
  1780. else
  1781. builder.setAccessChainRValue(operand);
  1782. }
  1783. return false;
  1784. case glslang::EOpEmitStreamVertex:
  1785. builder.createNoResultOp(spv::OpEmitStreamVertex, operand);
  1786. return false;
  1787. case glslang::EOpEndStreamPrimitive:
  1788. builder.createNoResultOp(spv::OpEndStreamPrimitive, operand);
  1789. return false;
  1790. default:
  1791. logger->missingFunctionality("unknown glslang unary");
  1792. return true; // pick up operand as placeholder result
  1793. }
  1794. }
  1795. bool TGlslangToSpvTraverser::visitAggregate(glslang::TVisit visit, glslang::TIntermAggregate* node)
  1796. {
  1797. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  1798. if (node->getType().getQualifier().isSpecConstant())
  1799. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  1800. spv::Id result = spv::NoResult;
  1801. spv::Id invertedType = spv::NoType; // to use to override the natural type of the node
  1802. auto resultType = [&invertedType, &node, this](){ return invertedType != spv::NoType ? invertedType : convertGlslangToSpvType(node->getType()); };
  1803. // try texturing
  1804. result = createImageTextureFunctionCall(node);
  1805. if (result != spv::NoResult) {
  1806. builder.clearAccessChain();
  1807. builder.setAccessChainRValue(result);
  1808. return false;
  1809. } else if (node->getOp() == glslang::EOpImageStore ||
  1810. #ifdef AMD_EXTENSIONS
  1811. node->getOp() == glslang::EOpImageStoreLod ||
  1812. #endif
  1813. node->getOp() == glslang::EOpImageAtomicStore) {
  1814. // "imageStore" is a special case, which has no result
  1815. return false;
  1816. }
  1817. glslang::TOperator binOp = glslang::EOpNull;
  1818. bool reduceComparison = true;
  1819. bool isMatrix = false;
  1820. bool noReturnValue = false;
  1821. bool atomic = false;
  1822. assert(node->getOp());
  1823. spv::Decoration precision = TranslatePrecisionDecoration(node->getOperationPrecision());
  1824. switch (node->getOp()) {
  1825. case glslang::EOpSequence:
  1826. {
  1827. if (preVisit)
  1828. ++sequenceDepth;
  1829. else
  1830. --sequenceDepth;
  1831. if (sequenceDepth == 1) {
  1832. // If this is the parent node of all the functions, we want to see them
  1833. // early, so all call points have actual SPIR-V functions to reference.
  1834. // In all cases, still let the traverser visit the children for us.
  1835. makeFunctions(node->getAsAggregate()->getSequence());
  1836. // Also, we want all globals initializers to go into the beginning of the entry point, before
  1837. // anything else gets there, so visit out of order, doing them all now.
  1838. makeGlobalInitializers(node->getAsAggregate()->getSequence());
  1839. // Initializers are done, don't want to visit again, but functions and link objects need to be processed,
  1840. // so do them manually.
  1841. visitFunctions(node->getAsAggregate()->getSequence());
  1842. return false;
  1843. }
  1844. return true;
  1845. }
  1846. case glslang::EOpLinkerObjects:
  1847. {
  1848. if (visit == glslang::EvPreVisit)
  1849. linkageOnly = true;
  1850. else
  1851. linkageOnly = false;
  1852. return true;
  1853. }
  1854. case glslang::EOpComma:
  1855. {
  1856. // processing from left to right naturally leaves the right-most
  1857. // lying around in the access chain
  1858. glslang::TIntermSequence& glslangOperands = node->getSequence();
  1859. for (int i = 0; i < (int)glslangOperands.size(); ++i)
  1860. glslangOperands[i]->traverse(this);
  1861. return false;
  1862. }
  1863. case glslang::EOpFunction:
  1864. if (visit == glslang::EvPreVisit) {
  1865. if (isShaderEntryPoint(node)) {
  1866. inEntryPoint = true;
  1867. builder.setBuildPoint(shaderEntry->getLastBlock());
  1868. currentFunction = shaderEntry;
  1869. } else {
  1870. handleFunctionEntry(node);
  1871. }
  1872. } else {
  1873. if (inEntryPoint)
  1874. entryPointTerminated = true;
  1875. builder.leaveFunction();
  1876. inEntryPoint = false;
  1877. }
  1878. return true;
  1879. case glslang::EOpParameters:
  1880. // Parameters will have been consumed by EOpFunction processing, but not
  1881. // the body, so we still visited the function node's children, making this
  1882. // child redundant.
  1883. return false;
  1884. case glslang::EOpFunctionCall:
  1885. {
  1886. builder.setLine(node->getLoc().line, node->getLoc().getFilename());
  1887. if (node->isUserDefined())
  1888. result = handleUserFunctionCall(node);
  1889. // assert(result); // this can happen for bad shaders because the call graph completeness checking is not yet done
  1890. if (result) {
  1891. builder.clearAccessChain();
  1892. builder.setAccessChainRValue(result);
  1893. } else
  1894. logger->missingFunctionality("missing user function; linker needs to catch that");
  1895. return false;
  1896. }
  1897. case glslang::EOpConstructMat2x2:
  1898. case glslang::EOpConstructMat2x3:
  1899. case glslang::EOpConstructMat2x4:
  1900. case glslang::EOpConstructMat3x2:
  1901. case glslang::EOpConstructMat3x3:
  1902. case glslang::EOpConstructMat3x4:
  1903. case glslang::EOpConstructMat4x2:
  1904. case glslang::EOpConstructMat4x3:
  1905. case glslang::EOpConstructMat4x4:
  1906. case glslang::EOpConstructDMat2x2:
  1907. case glslang::EOpConstructDMat2x3:
  1908. case glslang::EOpConstructDMat2x4:
  1909. case glslang::EOpConstructDMat3x2:
  1910. case glslang::EOpConstructDMat3x3:
  1911. case glslang::EOpConstructDMat3x4:
  1912. case glslang::EOpConstructDMat4x2:
  1913. case glslang::EOpConstructDMat4x3:
  1914. case glslang::EOpConstructDMat4x4:
  1915. case glslang::EOpConstructIMat2x2:
  1916. case glslang::EOpConstructIMat2x3:
  1917. case glslang::EOpConstructIMat2x4:
  1918. case glslang::EOpConstructIMat3x2:
  1919. case glslang::EOpConstructIMat3x3:
  1920. case glslang::EOpConstructIMat3x4:
  1921. case glslang::EOpConstructIMat4x2:
  1922. case glslang::EOpConstructIMat4x3:
  1923. case glslang::EOpConstructIMat4x4:
  1924. case glslang::EOpConstructUMat2x2:
  1925. case glslang::EOpConstructUMat2x3:
  1926. case glslang::EOpConstructUMat2x4:
  1927. case glslang::EOpConstructUMat3x2:
  1928. case glslang::EOpConstructUMat3x3:
  1929. case glslang::EOpConstructUMat3x4:
  1930. case glslang::EOpConstructUMat4x2:
  1931. case glslang::EOpConstructUMat4x3:
  1932. case glslang::EOpConstructUMat4x4:
  1933. case glslang::EOpConstructBMat2x2:
  1934. case glslang::EOpConstructBMat2x3:
  1935. case glslang::EOpConstructBMat2x4:
  1936. case glslang::EOpConstructBMat3x2:
  1937. case glslang::EOpConstructBMat3x3:
  1938. case glslang::EOpConstructBMat3x4:
  1939. case glslang::EOpConstructBMat4x2:
  1940. case glslang::EOpConstructBMat4x3:
  1941. case glslang::EOpConstructBMat4x4:
  1942. case glslang::EOpConstructF16Mat2x2:
  1943. case glslang::EOpConstructF16Mat2x3:
  1944. case glslang::EOpConstructF16Mat2x4:
  1945. case glslang::EOpConstructF16Mat3x2:
  1946. case glslang::EOpConstructF16Mat3x3:
  1947. case glslang::EOpConstructF16Mat3x4:
  1948. case glslang::EOpConstructF16Mat4x2:
  1949. case glslang::EOpConstructF16Mat4x3:
  1950. case glslang::EOpConstructF16Mat4x4:
  1951. isMatrix = true;
  1952. // fall through
  1953. case glslang::EOpConstructFloat:
  1954. case glslang::EOpConstructVec2:
  1955. case glslang::EOpConstructVec3:
  1956. case glslang::EOpConstructVec4:
  1957. case glslang::EOpConstructDouble:
  1958. case glslang::EOpConstructDVec2:
  1959. case glslang::EOpConstructDVec3:
  1960. case glslang::EOpConstructDVec4:
  1961. case glslang::EOpConstructFloat16:
  1962. case glslang::EOpConstructF16Vec2:
  1963. case glslang::EOpConstructF16Vec3:
  1964. case glslang::EOpConstructF16Vec4:
  1965. case glslang::EOpConstructBool:
  1966. case glslang::EOpConstructBVec2:
  1967. case glslang::EOpConstructBVec3:
  1968. case glslang::EOpConstructBVec4:
  1969. case glslang::EOpConstructInt8:
  1970. case glslang::EOpConstructI8Vec2:
  1971. case glslang::EOpConstructI8Vec3:
  1972. case glslang::EOpConstructI8Vec4:
  1973. case glslang::EOpConstructUint8:
  1974. case glslang::EOpConstructU8Vec2:
  1975. case glslang::EOpConstructU8Vec3:
  1976. case glslang::EOpConstructU8Vec4:
  1977. case glslang::EOpConstructInt16:
  1978. case glslang::EOpConstructI16Vec2:
  1979. case glslang::EOpConstructI16Vec3:
  1980. case glslang::EOpConstructI16Vec4:
  1981. case glslang::EOpConstructUint16:
  1982. case glslang::EOpConstructU16Vec2:
  1983. case glslang::EOpConstructU16Vec3:
  1984. case glslang::EOpConstructU16Vec4:
  1985. case glslang::EOpConstructInt:
  1986. case glslang::EOpConstructIVec2:
  1987. case glslang::EOpConstructIVec3:
  1988. case glslang::EOpConstructIVec4:
  1989. case glslang::EOpConstructUint:
  1990. case glslang::EOpConstructUVec2:
  1991. case glslang::EOpConstructUVec3:
  1992. case glslang::EOpConstructUVec4:
  1993. case glslang::EOpConstructInt64:
  1994. case glslang::EOpConstructI64Vec2:
  1995. case glslang::EOpConstructI64Vec3:
  1996. case glslang::EOpConstructI64Vec4:
  1997. case glslang::EOpConstructUint64:
  1998. case glslang::EOpConstructU64Vec2:
  1999. case glslang::EOpConstructU64Vec3:
  2000. case glslang::EOpConstructU64Vec4:
  2001. case glslang::EOpConstructStruct:
  2002. case glslang::EOpConstructTextureSampler:
  2003. case glslang::EOpConstructReference:
  2004. case glslang::EOpConstructCooperativeMatrix:
  2005. {
  2006. builder.setLine(node->getLoc().line, node->getLoc().getFilename());
  2007. std::vector<spv::Id> arguments;
  2008. translateArguments(*node, arguments);
  2009. spv::Id constructed;
  2010. if (node->getOp() == glslang::EOpConstructTextureSampler)
  2011. constructed = builder.createOp(spv::OpSampledImage, resultType(), arguments);
  2012. else if (node->getOp() == glslang::EOpConstructStruct ||
  2013. node->getOp() == glslang::EOpConstructCooperativeMatrix ||
  2014. node->getType().isArray()) {
  2015. std::vector<spv::Id> constituents;
  2016. for (int c = 0; c < (int)arguments.size(); ++c)
  2017. constituents.push_back(arguments[c]);
  2018. constructed = builder.createCompositeConstruct(resultType(), constituents);
  2019. } else if (isMatrix)
  2020. constructed = builder.createMatrixConstructor(precision, arguments, resultType());
  2021. else
  2022. constructed = builder.createConstructor(precision, arguments, resultType());
  2023. builder.clearAccessChain();
  2024. builder.setAccessChainRValue(constructed);
  2025. return false;
  2026. }
  2027. // These six are component-wise compares with component-wise results.
  2028. // Forward on to createBinaryOperation(), requesting a vector result.
  2029. case glslang::EOpLessThan:
  2030. case glslang::EOpGreaterThan:
  2031. case glslang::EOpLessThanEqual:
  2032. case glslang::EOpGreaterThanEqual:
  2033. case glslang::EOpVectorEqual:
  2034. case glslang::EOpVectorNotEqual:
  2035. {
  2036. // Map the operation to a binary
  2037. binOp = node->getOp();
  2038. reduceComparison = false;
  2039. switch (node->getOp()) {
  2040. case glslang::EOpVectorEqual: binOp = glslang::EOpVectorEqual; break;
  2041. case glslang::EOpVectorNotEqual: binOp = glslang::EOpVectorNotEqual; break;
  2042. default: binOp = node->getOp(); break;
  2043. }
  2044. break;
  2045. }
  2046. case glslang::EOpMul:
  2047. // component-wise matrix multiply
  2048. binOp = glslang::EOpMul;
  2049. break;
  2050. case glslang::EOpOuterProduct:
  2051. // two vectors multiplied to make a matrix
  2052. binOp = glslang::EOpOuterProduct;
  2053. break;
  2054. case glslang::EOpDot:
  2055. {
  2056. // for scalar dot product, use multiply
  2057. glslang::TIntermSequence& glslangOperands = node->getSequence();
  2058. if (glslangOperands[0]->getAsTyped()->getVectorSize() == 1)
  2059. binOp = glslang::EOpMul;
  2060. break;
  2061. }
  2062. case glslang::EOpMod:
  2063. // when an aggregate, this is the floating-point mod built-in function,
  2064. // which can be emitted by the one in createBinaryOperation()
  2065. binOp = glslang::EOpMod;
  2066. break;
  2067. case glslang::EOpEmitVertex:
  2068. case glslang::EOpEndPrimitive:
  2069. case glslang::EOpBarrier:
  2070. case glslang::EOpMemoryBarrier:
  2071. case glslang::EOpMemoryBarrierAtomicCounter:
  2072. case glslang::EOpMemoryBarrierBuffer:
  2073. case glslang::EOpMemoryBarrierImage:
  2074. case glslang::EOpMemoryBarrierShared:
  2075. case glslang::EOpGroupMemoryBarrier:
  2076. case glslang::EOpDeviceMemoryBarrier:
  2077. case glslang::EOpAllMemoryBarrierWithGroupSync:
  2078. case glslang::EOpDeviceMemoryBarrierWithGroupSync:
  2079. case glslang::EOpWorkgroupMemoryBarrier:
  2080. case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:
  2081. case glslang::EOpSubgroupBarrier:
  2082. case glslang::EOpSubgroupMemoryBarrier:
  2083. case glslang::EOpSubgroupMemoryBarrierBuffer:
  2084. case glslang::EOpSubgroupMemoryBarrierImage:
  2085. case glslang::EOpSubgroupMemoryBarrierShared:
  2086. noReturnValue = true;
  2087. // These all have 0 operands and will naturally finish up in the code below for 0 operands
  2088. break;
  2089. case glslang::EOpAtomicStore:
  2090. noReturnValue = true;
  2091. // fallthrough
  2092. case glslang::EOpAtomicLoad:
  2093. case glslang::EOpAtomicAdd:
  2094. case glslang::EOpAtomicMin:
  2095. case glslang::EOpAtomicMax:
  2096. case glslang::EOpAtomicAnd:
  2097. case glslang::EOpAtomicOr:
  2098. case glslang::EOpAtomicXor:
  2099. case glslang::EOpAtomicExchange:
  2100. case glslang::EOpAtomicCompSwap:
  2101. atomic = true;
  2102. break;
  2103. case glslang::EOpAtomicCounterAdd:
  2104. case glslang::EOpAtomicCounterSubtract:
  2105. case glslang::EOpAtomicCounterMin:
  2106. case glslang::EOpAtomicCounterMax:
  2107. case glslang::EOpAtomicCounterAnd:
  2108. case glslang::EOpAtomicCounterOr:
  2109. case glslang::EOpAtomicCounterXor:
  2110. case glslang::EOpAtomicCounterExchange:
  2111. case glslang::EOpAtomicCounterCompSwap:
  2112. builder.addExtension("SPV_KHR_shader_atomic_counter_ops");
  2113. builder.addCapability(spv::CapabilityAtomicStorageOps);
  2114. atomic = true;
  2115. break;
  2116. #ifdef NV_EXTENSIONS
  2117. case glslang::EOpIgnoreIntersectionNV:
  2118. case glslang::EOpTerminateRayNV:
  2119. case glslang::EOpTraceNV:
  2120. case glslang::EOpExecuteCallableNV:
  2121. case glslang::EOpWritePackedPrimitiveIndices4x8NV:
  2122. noReturnValue = true;
  2123. break;
  2124. #endif
  2125. case glslang::EOpCooperativeMatrixLoad:
  2126. case glslang::EOpCooperativeMatrixStore:
  2127. noReturnValue = true;
  2128. break;
  2129. default:
  2130. break;
  2131. }
  2132. //
  2133. // See if it maps to a regular operation.
  2134. //
  2135. if (binOp != glslang::EOpNull) {
  2136. glslang::TIntermTyped* left = node->getSequence()[0]->getAsTyped();
  2137. glslang::TIntermTyped* right = node->getSequence()[1]->getAsTyped();
  2138. assert(left && right);
  2139. builder.clearAccessChain();
  2140. left->traverse(this);
  2141. spv::Id leftId = accessChainLoad(left->getType());
  2142. builder.clearAccessChain();
  2143. right->traverse(this);
  2144. spv::Id rightId = accessChainLoad(right->getType());
  2145. builder.setLine(node->getLoc().line, node->getLoc().getFilename());
  2146. OpDecorations decorations = { precision,
  2147. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2148. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  2149. result = createBinaryOperation(binOp, decorations,
  2150. resultType(), leftId, rightId,
  2151. left->getType().getBasicType(), reduceComparison);
  2152. // code above should only make binOp that exists in createBinaryOperation
  2153. assert(result != spv::NoResult);
  2154. builder.clearAccessChain();
  2155. builder.setAccessChainRValue(result);
  2156. return false;
  2157. }
  2158. //
  2159. // Create the list of operands.
  2160. //
  2161. glslang::TIntermSequence& glslangOperands = node->getSequence();
  2162. std::vector<spv::Id> operands;
  2163. std::vector<spv::IdImmediate> memoryAccessOperands;
  2164. for (int arg = 0; arg < (int)glslangOperands.size(); ++arg) {
  2165. // special case l-value operands; there are just a few
  2166. bool lvalue = false;
  2167. switch (node->getOp()) {
  2168. case glslang::EOpFrexp:
  2169. case glslang::EOpModf:
  2170. if (arg == 1)
  2171. lvalue = true;
  2172. break;
  2173. case glslang::EOpInterpolateAtSample:
  2174. case glslang::EOpInterpolateAtOffset:
  2175. #ifdef AMD_EXTENSIONS
  2176. case glslang::EOpInterpolateAtVertex:
  2177. #endif
  2178. if (arg == 0) {
  2179. lvalue = true;
  2180. // Does it need a swizzle inversion? If so, evaluation is inverted;
  2181. // operate first on the swizzle base, then apply the swizzle.
  2182. if (glslangOperands[0]->getAsOperator() &&
  2183. glslangOperands[0]->getAsOperator()->getOp() == glslang::EOpVectorSwizzle)
  2184. invertedType = convertGlslangToSpvType(glslangOperands[0]->getAsBinaryNode()->getLeft()->getType());
  2185. }
  2186. break;
  2187. case glslang::EOpAtomicAdd:
  2188. case glslang::EOpAtomicMin:
  2189. case glslang::EOpAtomicMax:
  2190. case glslang::EOpAtomicAnd:
  2191. case glslang::EOpAtomicOr:
  2192. case glslang::EOpAtomicXor:
  2193. case glslang::EOpAtomicExchange:
  2194. case glslang::EOpAtomicCompSwap:
  2195. case glslang::EOpAtomicLoad:
  2196. case glslang::EOpAtomicStore:
  2197. case glslang::EOpAtomicCounterAdd:
  2198. case glslang::EOpAtomicCounterSubtract:
  2199. case glslang::EOpAtomicCounterMin:
  2200. case glslang::EOpAtomicCounterMax:
  2201. case glslang::EOpAtomicCounterAnd:
  2202. case glslang::EOpAtomicCounterOr:
  2203. case glslang::EOpAtomicCounterXor:
  2204. case glslang::EOpAtomicCounterExchange:
  2205. case glslang::EOpAtomicCounterCompSwap:
  2206. if (arg == 0)
  2207. lvalue = true;
  2208. break;
  2209. case glslang::EOpAddCarry:
  2210. case glslang::EOpSubBorrow:
  2211. if (arg == 2)
  2212. lvalue = true;
  2213. break;
  2214. case glslang::EOpUMulExtended:
  2215. case glslang::EOpIMulExtended:
  2216. if (arg >= 2)
  2217. lvalue = true;
  2218. break;
  2219. case glslang::EOpCooperativeMatrixLoad:
  2220. if (arg == 0 || arg == 1)
  2221. lvalue = true;
  2222. break;
  2223. case glslang::EOpCooperativeMatrixStore:
  2224. if (arg == 1)
  2225. lvalue = true;
  2226. break;
  2227. default:
  2228. break;
  2229. }
  2230. builder.clearAccessChain();
  2231. if (invertedType != spv::NoType && arg == 0)
  2232. glslangOperands[0]->getAsBinaryNode()->getLeft()->traverse(this);
  2233. else
  2234. glslangOperands[arg]->traverse(this);
  2235. if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||
  2236. node->getOp() == glslang::EOpCooperativeMatrixStore) {
  2237. if (arg == 1) {
  2238. // fold "element" parameter into the access chain
  2239. spv::Builder::AccessChain save = builder.getAccessChain();
  2240. builder.clearAccessChain();
  2241. glslangOperands[2]->traverse(this);
  2242. spv::Id elementId = accessChainLoad(glslangOperands[2]->getAsTyped()->getType());
  2243. builder.setAccessChain(save);
  2244. // Point to the first element of the array.
  2245. builder.accessChainPush(elementId, TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType()),
  2246. glslangOperands[arg]->getAsTyped()->getType().getBufferReferenceAlignment());
  2247. spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
  2248. unsigned int alignment = builder.getAccessChain().alignment;
  2249. int memoryAccess = TranslateMemoryAccess(coherentFlags);
  2250. if (node->getOp() == glslang::EOpCooperativeMatrixLoad)
  2251. memoryAccess &= ~spv::MemoryAccessMakePointerAvailableKHRMask;
  2252. if (node->getOp() == glslang::EOpCooperativeMatrixStore)
  2253. memoryAccess &= ~spv::MemoryAccessMakePointerVisibleKHRMask;
  2254. if (builder.getStorageClass(builder.getAccessChain().base) == spv::StorageClassPhysicalStorageBufferEXT) {
  2255. memoryAccess = (spv::MemoryAccessMask)(memoryAccess | spv::MemoryAccessAlignedMask);
  2256. }
  2257. memoryAccessOperands.push_back(spv::IdImmediate(false, memoryAccess));
  2258. if (memoryAccess & spv::MemoryAccessAlignedMask) {
  2259. memoryAccessOperands.push_back(spv::IdImmediate(false, alignment));
  2260. }
  2261. if (memoryAccess & (spv::MemoryAccessMakePointerAvailableKHRMask | spv::MemoryAccessMakePointerVisibleKHRMask)) {
  2262. memoryAccessOperands.push_back(spv::IdImmediate(true, builder.makeUintConstant(TranslateMemoryScope(coherentFlags))));
  2263. }
  2264. } else if (arg == 2) {
  2265. continue;
  2266. }
  2267. }
  2268. if (lvalue)
  2269. operands.push_back(builder.accessChainGetLValue());
  2270. else {
  2271. builder.setLine(node->getLoc().line, node->getLoc().getFilename());
  2272. operands.push_back(accessChainLoad(glslangOperands[arg]->getAsTyped()->getType()));
  2273. }
  2274. }
  2275. builder.setLine(node->getLoc().line, node->getLoc().getFilename());
  2276. if (node->getOp() == glslang::EOpCooperativeMatrixLoad) {
  2277. std::vector<spv::IdImmediate> idImmOps;
  2278. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  2279. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  2280. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor
  2281. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  2282. // get the pointee type
  2283. spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
  2284. assert(builder.isCooperativeMatrixType(typeId));
  2285. // do the op
  2286. spv::Id result = builder.createOp(spv::OpCooperativeMatrixLoadNV, typeId, idImmOps);
  2287. // store the result to the pointer (out param 'm')
  2288. builder.createStore(result, operands[0]);
  2289. result = 0;
  2290. } else if (node->getOp() == glslang::EOpCooperativeMatrixStore) {
  2291. std::vector<spv::IdImmediate> idImmOps;
  2292. idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
  2293. idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
  2294. idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
  2295. idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor
  2296. idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
  2297. builder.createNoResultOp(spv::OpCooperativeMatrixStoreNV, idImmOps);
  2298. result = 0;
  2299. } else if (atomic) {
  2300. // Handle all atomics
  2301. result = createAtomicOperation(node->getOp(), precision, resultType(), operands, node->getBasicType());
  2302. } else {
  2303. // Pass through to generic operations.
  2304. switch (glslangOperands.size()) {
  2305. case 0:
  2306. result = createNoArgOperation(node->getOp(), precision, resultType());
  2307. break;
  2308. case 1:
  2309. {
  2310. OpDecorations decorations = { precision,
  2311. TranslateNoContractionDecoration(node->getType().getQualifier()),
  2312. TranslateNonUniformDecoration(node->getType().getQualifier()) };
  2313. result = createUnaryOperation(
  2314. node->getOp(), decorations,
  2315. resultType(), operands.front(),
  2316. glslangOperands[0]->getAsTyped()->getBasicType());
  2317. }
  2318. break;
  2319. default:
  2320. result = createMiscOperation(node->getOp(), precision, resultType(), operands, node->getBasicType());
  2321. break;
  2322. }
  2323. if (invertedType)
  2324. result = createInvertedSwizzle(precision, *glslangOperands[0]->getAsBinaryNode(), result);
  2325. }
  2326. if (noReturnValue)
  2327. return false;
  2328. if (! result) {
  2329. logger->missingFunctionality("unknown glslang aggregate");
  2330. return true; // pick up a child as a placeholder operand
  2331. } else {
  2332. builder.clearAccessChain();
  2333. builder.setAccessChainRValue(result);
  2334. return false;
  2335. }
  2336. }
  2337. // This path handles both if-then-else and ?:
  2338. // The if-then-else has a node type of void, while
  2339. // ?: has either a void or a non-void node type
  2340. //
  2341. // Leaving the result, when not void:
  2342. // GLSL only has r-values as the result of a :?, but
  2343. // if we have an l-value, that can be more efficient if it will
  2344. // become the base of a complex r-value expression, because the
  2345. // next layer copies r-values into memory to use the access-chain mechanism
  2346. bool TGlslangToSpvTraverser::visitSelection(glslang::TVisit /* visit */, glslang::TIntermSelection* node)
  2347. {
  2348. // See if it simple and safe, or required, to execute both sides.
  2349. // Crucially, side effects must be either semantically required or avoided,
  2350. // and there are performance trade-offs.
  2351. // Return true if required or a good idea (and safe) to execute both sides,
  2352. // false otherwise.
  2353. const auto bothSidesPolicy = [&]() -> bool {
  2354. // do we have both sides?
  2355. if (node->getTrueBlock() == nullptr ||
  2356. node->getFalseBlock() == nullptr)
  2357. return false;
  2358. // required? (unless we write additional code to look for side effects
  2359. // and make performance trade-offs if none are present)
  2360. if (!node->getShortCircuit())
  2361. return true;
  2362. // if not required to execute both, decide based on performance/practicality...
  2363. // see if OpSelect can handle it
  2364. if ((!node->getType().isScalar() && !node->getType().isVector()) ||
  2365. node->getBasicType() == glslang::EbtVoid)
  2366. return false;
  2367. assert(node->getType() == node->getTrueBlock() ->getAsTyped()->getType() &&
  2368. node->getType() == node->getFalseBlock()->getAsTyped()->getType());
  2369. // return true if a single operand to ? : is okay for OpSelect
  2370. const auto operandOkay = [](glslang::TIntermTyped* node) {
  2371. return node->getAsSymbolNode() || node->getType().getQualifier().isConstant();
  2372. };
  2373. return operandOkay(node->getTrueBlock() ->getAsTyped()) &&
  2374. operandOkay(node->getFalseBlock()->getAsTyped());
  2375. };
  2376. spv::Id result = spv::NoResult; // upcoming result selecting between trueValue and falseValue
  2377. // emit the condition before doing anything with selection
  2378. node->getCondition()->traverse(this);
  2379. spv::Id condition = accessChainLoad(node->getCondition()->getType());
  2380. // Find a way of executing both sides and selecting the right result.
  2381. const auto executeBothSides = [&]() -> void {
  2382. // execute both sides
  2383. node->getTrueBlock()->traverse(this);
  2384. spv::Id trueValue = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
  2385. node->getFalseBlock()->traverse(this);
  2386. spv::Id falseValue = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
  2387. builder.setLine(node->getLoc().line, node->getLoc().getFilename());
  2388. // done if void
  2389. if (node->getBasicType() == glslang::EbtVoid)
  2390. return;
  2391. // emit code to select between trueValue and falseValue
  2392. // see if OpSelect can handle it
  2393. if (node->getType().isScalar() || node->getType().isVector()) {
  2394. // Emit OpSelect for this selection.
  2395. // smear condition to vector, if necessary (AST is always scalar)
  2396. if (builder.isVector(trueValue))
  2397. condition = builder.smearScalar(spv::NoPrecision, condition,
  2398. builder.makeVectorType(builder.makeBoolType(),
  2399. builder.getNumComponents(trueValue)));
  2400. // OpSelect
  2401. result = builder.createTriOp(spv::OpSelect,
  2402. convertGlslangToSpvType(node->getType()), condition,
  2403. trueValue, falseValue);
  2404. builder.clearAccessChain();
  2405. builder.setAccessChainRValue(result);
  2406. } else {
  2407. // We need control flow to select the result.
  2408. // TODO: Once SPIR-V OpSelect allows arbitrary types, eliminate this path.
  2409. result = builder.createVariable(spv::StorageClassFunction, convertGlslangToSpvType(node->getType()));
  2410. // Selection control:
  2411. const spv::SelectionControlMask control = TranslateSelectionControl(*node);
  2412. // make an "if" based on the value created by the condition
  2413. spv::Builder::If ifBuilder(condition, control, builder);
  2414. // emit the "then" statement
  2415. builder.createStore(trueValue, result);
  2416. ifBuilder.makeBeginElse();
  2417. // emit the "else" statement
  2418. builder.createStore(falseValue, result);
  2419. // finish off the control flow
  2420. ifBuilder.makeEndIf();
  2421. builder.clearAccessChain();
  2422. builder.setAccessChainLValue(result);
  2423. }
  2424. };
  2425. // Execute the one side needed, as per the condition
  2426. const auto executeOneSide = [&]() {
  2427. // Always emit control flow.
  2428. if (node->getBasicType() != glslang::EbtVoid)
  2429. result = builder.createVariable(spv::StorageClassFunction, convertGlslangToSpvType(node->getType()));
  2430. // Selection control:
  2431. const spv::SelectionControlMask control = TranslateSelectionControl(*node);
  2432. // make an "if" based on the value created by the condition
  2433. spv::Builder::If ifBuilder(condition, control, builder);
  2434. // emit the "then" statement
  2435. if (node->getTrueBlock() != nullptr) {
  2436. node->getTrueBlock()->traverse(this);
  2437. if (result != spv::NoResult)
  2438. builder.createStore(accessChainLoad(node->getTrueBlock()->getAsTyped()->getType()), result);
  2439. }
  2440. if (node->getFalseBlock() != nullptr) {
  2441. ifBuilder.makeBeginElse();
  2442. // emit the "else" statement
  2443. node->getFalseBlock()->traverse(this);
  2444. if (result != spv::NoResult)
  2445. builder.createStore(accessChainLoad(node->getFalseBlock()->getAsTyped()->getType()), result);
  2446. }
  2447. // finish off the control flow
  2448. ifBuilder.makeEndIf();
  2449. if (result != spv::NoResult) {
  2450. builder.clearAccessChain();
  2451. builder.setAccessChainLValue(result);
  2452. }
  2453. };
  2454. // Try for OpSelect (or a requirement to execute both sides)
  2455. if (bothSidesPolicy()) {
  2456. SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
  2457. if (node->getType().getQualifier().isSpecConstant())
  2458. spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
  2459. executeBothSides();
  2460. } else
  2461. executeOneSide();
  2462. return false;
  2463. }
  2464. bool TGlslangToSpvTraverser::visitSwitch(glslang::TVisit /* visit */, glslang::TIntermSwitch* node)
  2465. {
  2466. // emit and get the condition before doing anything with switch
  2467. node->getCondition()->traverse(this);
  2468. spv::Id selector = accessChainLoad(node->getCondition()->getAsTyped()->getType());
  2469. // Selection control:
  2470. const spv::SelectionControlMask control = TranslateSwitchControl(*node);
  2471. // browse the children to sort out code segments
  2472. int defaultSegment = -1;
  2473. std::vector<TIntermNode*> codeSegments;
  2474. glslang::TIntermSequence& sequence = node->getBody()->getSequence();
  2475. std::vector<int> caseValues;
  2476. std::vector<int> valueIndexToSegment(sequence.size()); // note: probably not all are used, it is an overestimate
  2477. for (glslang::TIntermSequence::iterator c = sequence.begin(); c != sequence.end(); ++c) {
  2478. TIntermNode* child = *c;
  2479. if (child->getAsBranchNode() && child->getAsBranchNode()->getFlowOp() == glslang::EOpDefault)
  2480. defaultSegment = (int)codeSegments.size();
  2481. else if (child->getAsBranchNode() && child->getAsBranchNode()->getFlowOp() == glslang::EOpCase) {
  2482. valueIndexToSegment[caseValues.size()] = (int)codeSegments.size();
  2483. caseValues.push_back(child->getAsBranchNode()->getExpression()->getAsConstantUnion()->getConstArray()[0].getIConst());
  2484. } else
  2485. codeSegments.push_back(child);
  2486. }
  2487. // handle the case where the last code segment is missing, due to no code
  2488. // statements between the last case and the end of the switch statement
  2489. if ((caseValues.size() && (int)codeSegments.size() == valueIndexToSegment[caseValues.size() - 1]) ||
  2490. (int)codeSegments.size() == defaultSegment)
  2491. codeSegments.push_back(nullptr);
  2492. // make the switch statement
  2493. std::vector<spv::Block*> segmentBlocks; // returned, as the blocks allocated in the call
  2494. builder.makeSwitch(selector, control, (int)codeSegments.size(), caseValues, valueIndexToSegment, defaultSegment, segmentBlocks);
  2495. // emit all the code in the segments
  2496. breakForLoop.push(false);
  2497. for (unsigned int s = 0; s < codeSegments.size(); ++s) {
  2498. builder.nextSwitchSegment(segmentBlocks, s);
  2499. if (codeSegments[s])
  2500. codeSegments[s]->traverse(this);
  2501. else
  2502. builder.addSwitchBreak();
  2503. }
  2504. breakForLoop.pop();
  2505. builder.endSwitch(segmentBlocks);
  2506. return false;
  2507. }
  2508. void TGlslangToSpvTraverser::visitConstantUnion(glslang::TIntermConstantUnion* node)
  2509. {
  2510. int nextConst = 0;
  2511. spv::Id constant = createSpvConstantFromConstUnionArray(node->getType(), node->getConstArray(), nextConst, false);
  2512. builder.clearAccessChain();
  2513. builder.setAccessChainRValue(constant);
  2514. }
  2515. bool TGlslangToSpvTraverser::visitLoop(glslang::TVisit /* visit */, glslang::TIntermLoop* node)
  2516. {
  2517. auto blocks = builder.makeNewLoop();
  2518. builder.createBranch(&blocks.head);
  2519. // Loop control:
  2520. unsigned int dependencyLength = glslang::TIntermLoop::dependencyInfinite;
  2521. const spv::LoopControlMask control = TranslateLoopControl(*node, dependencyLength);
  2522. // Spec requires back edges to target header blocks, and every header block
  2523. // must dominate its merge block. Make a header block first to ensure these
  2524. // conditions are met. By definition, it will contain OpLoopMerge, followed
  2525. // by a block-ending branch. But we don't want to put any other body/test
  2526. // instructions in it, since the body/test may have arbitrary instructions,
  2527. // including merges of its own.
  2528. builder.setLine(node->getLoc().line, node->getLoc().getFilename());
  2529. builder.setBuildPoint(&blocks.head);
  2530. builder.createLoopMerge(&blocks.merge, &blocks.continue_target, control, dependencyLength);
  2531. if (node->testFirst() && node->getTest()) {
  2532. spv::Block& test = builder.makeNewBlock();
  2533. builder.createBranch(&test);
  2534. builder.setBuildPoint(&test);
  2535. node->getTest()->traverse(this);
  2536. spv::Id condition = accessChainLoad(node->getTest()->getType());
  2537. builder.createConditionalBranch(condition, &blocks.body, &blocks.merge);
  2538. builder.setBuildPoint(&blocks.body);
  2539. breakForLoop.push(true);
  2540. if (node->getBody())
  2541. node->getBody()->traverse(this);
  2542. builder.createBranch(&blocks.continue_target);
  2543. breakForLoop.pop();
  2544. builder.setBuildPoint(&blocks.continue_target);
  2545. if (node->getTerminal())
  2546. node->getTerminal()->traverse(this);
  2547. builder.createBranch(&blocks.head);
  2548. } else {
  2549. builder.setLine(node->getLoc().line, node->getLoc().getFilename());
  2550. builder.createBranch(&blocks.body);
  2551. breakForLoop.push(true);
  2552. builder.setBuildPoint(&blocks.body);
  2553. if (node->getBody())
  2554. node->getBody()->traverse(this);
  2555. builder.createBranch(&blocks.continue_target);
  2556. breakForLoop.pop();
  2557. builder.setBuildPoint(&blocks.continue_target);
  2558. if (node->getTerminal())
  2559. node->getTerminal()->traverse(this);
  2560. if (node->getTest()) {
  2561. node->getTest()->traverse(this);
  2562. spv::Id condition =
  2563. accessChainLoad(node->getTest()->getType());
  2564. builder.createConditionalBranch(condition, &blocks.head, &blocks.merge);
  2565. } else {
  2566. // TODO: unless there was a break/return/discard instruction
  2567. // somewhere in the body, this is an infinite loop, so we should
  2568. // issue a warning.
  2569. builder.createBranch(&blocks.head);
  2570. }
  2571. }
  2572. builder.setBuildPoint(&blocks.merge);
  2573. builder.closeLoop();
  2574. return false;
  2575. }
  2576. bool TGlslangToSpvTraverser::visitBranch(glslang::TVisit /* visit */, glslang::TIntermBranch* node)
  2577. {
  2578. if (node->getExpression())
  2579. node->getExpression()->traverse(this);
  2580. builder.setLine(node->getLoc().line, node->getLoc().getFilename());
  2581. switch (node->getFlowOp()) {
  2582. case glslang::EOpKill:
  2583. builder.makeDiscard();
  2584. break;
  2585. case glslang::EOpBreak:
  2586. if (breakForLoop.top())
  2587. builder.createLoopExit();
  2588. else
  2589. builder.addSwitchBreak();
  2590. break;
  2591. case glslang::EOpContinue:
  2592. builder.createLoopContinue();
  2593. break;
  2594. case glslang::EOpReturn:
  2595. if (node->getExpression()) {
  2596. const glslang::TType& glslangReturnType = node->getExpression()->getType();
  2597. spv::Id returnId = accessChainLoad(glslangReturnType);
  2598. if (builder.getTypeId(returnId) != currentFunction->getReturnType()) {
  2599. builder.clearAccessChain();
  2600. spv::Id copyId = builder.createVariable(spv::StorageClassFunction, currentFunction->getReturnType());
  2601. builder.setAccessChainLValue(copyId);
  2602. multiTypeStore(glslangReturnType, returnId);
  2603. returnId = builder.createLoad(copyId);
  2604. }
  2605. builder.makeReturn(false, returnId);
  2606. } else
  2607. builder.makeReturn(false);
  2608. builder.clearAccessChain();
  2609. break;
  2610. default:
  2611. assert(0);
  2612. break;
  2613. }
  2614. return false;
  2615. }
  2616. spv::Id TGlslangToSpvTraverser::createSpvVariable(const glslang::TIntermSymbol* node)
  2617. {
  2618. // First, steer off constants, which are not SPIR-V variables, but
  2619. // can still have a mapping to a SPIR-V Id.
  2620. // This includes specialization constants.
  2621. if (node->getQualifier().isConstant()) {
  2622. spv::Id result = createSpvConstant(*node);
  2623. if (result != spv::NoResult)
  2624. return result;
  2625. }
  2626. // Now, handle actual variables
  2627. spv::StorageClass storageClass = TranslateStorageClass(node->getType());
  2628. spv::Id spvType = convertGlslangToSpvType(node->getType());
  2629. const bool contains16BitType = node->getType().containsBasicType(glslang::EbtFloat16) ||
  2630. node->getType().containsBasicType(glslang::EbtInt16) ||
  2631. node->getType().containsBasicType(glslang::EbtUint16);
  2632. if (contains16BitType) {
  2633. switch (storageClass) {
  2634. case spv::StorageClassInput:
  2635. case spv::StorageClassOutput:
  2636. addPre13Extension(spv::E_SPV_KHR_16bit_storage);
  2637. builder.addCapability(spv::CapabilityStorageInputOutput16);
  2638. break;
  2639. case spv::StorageClassPushConstant:
  2640. addPre13Extension(spv::E_SPV_KHR_16bit_storage);
  2641. builder.addCapability(spv::CapabilityStoragePushConstant16);
  2642. break;
  2643. case spv::StorageClassUniform:
  2644. addPre13Extension(spv::E_SPV_KHR_16bit_storage);
  2645. if (node->getType().getQualifier().storage == glslang::EvqBuffer)
  2646. builder.addCapability(spv::CapabilityStorageUniformBufferBlock16);
  2647. else
  2648. builder.addCapability(spv::CapabilityStorageUniform16);
  2649. break;
  2650. case spv::StorageClassStorageBuffer:
  2651. case spv::StorageClassPhysicalStorageBufferEXT:
  2652. addPre13Extension(spv::E_SPV_KHR_16bit_storage);
  2653. builder.addCapability(spv::CapabilityStorageUniformBufferBlock16);
  2654. break;
  2655. default:
  2656. break;
  2657. }
  2658. }
  2659. const bool contains8BitType = node->getType().containsBasicType(glslang::EbtInt8) ||
  2660. node->getType().containsBasicType(glslang::EbtUint8);
  2661. if (contains8BitType) {
  2662. if (storageClass == spv::StorageClassPushConstant) {
  2663. builder.addExtension(spv::E_SPV_KHR_8bit_storage);
  2664. builder.addCapability(spv::CapabilityStoragePushConstant8);
  2665. } else if (storageClass == spv::StorageClassUniform) {
  2666. builder.addExtension(spv::E_SPV_KHR_8bit_storage);
  2667. builder.addCapability(spv::CapabilityUniformAndStorageBuffer8BitAccess);
  2668. } else if (storageClass == spv::StorageClassStorageBuffer) {
  2669. builder.addExtension(spv::E_SPV_KHR_8bit_storage);
  2670. builder.addCapability(spv::CapabilityStorageBuffer8BitAccess);
  2671. }
  2672. }
  2673. const char* name = node->getName().c_str();
  2674. if (glslang::IsAnonymous(name))
  2675. name = "";
  2676. return builder.createVariable(storageClass, spvType, name);
  2677. }
  2678. // Return type Id of the sampled type.
  2679. spv::Id TGlslangToSpvTraverser::getSampledType(const glslang::TSampler& sampler)
  2680. {
  2681. switch (sampler.type) {
  2682. case glslang::EbtFloat: return builder.makeFloatType(32);
  2683. #ifdef AMD_EXTENSIONS
  2684. case glslang::EbtFloat16:
  2685. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float_fetch);
  2686. builder.addCapability(spv::CapabilityFloat16ImageAMD);
  2687. return builder.makeFloatType(16);
  2688. #endif
  2689. case glslang::EbtInt: return builder.makeIntType(32);
  2690. case glslang::EbtUint: return builder.makeUintType(32);
  2691. default:
  2692. assert(0);
  2693. return builder.makeFloatType(32);
  2694. }
  2695. }
  2696. // If node is a swizzle operation, return the type that should be used if
  2697. // the swizzle base is first consumed by another operation, before the swizzle
  2698. // is applied.
  2699. spv::Id TGlslangToSpvTraverser::getInvertedSwizzleType(const glslang::TIntermTyped& node)
  2700. {
  2701. if (node.getAsOperator() &&
  2702. node.getAsOperator()->getOp() == glslang::EOpVectorSwizzle)
  2703. return convertGlslangToSpvType(node.getAsBinaryNode()->getLeft()->getType());
  2704. else
  2705. return spv::NoType;
  2706. }
  2707. // When inverting a swizzle with a parent op, this function
  2708. // will apply the swizzle operation to a completed parent operation.
  2709. spv::Id TGlslangToSpvTraverser::createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped& node, spv::Id parentResult)
  2710. {
  2711. std::vector<unsigned> swizzle;
  2712. convertSwizzle(*node.getAsBinaryNode()->getRight()->getAsAggregate(), swizzle);
  2713. return builder.createRvalueSwizzle(precision, convertGlslangToSpvType(node.getType()), parentResult, swizzle);
  2714. }
  2715. // Convert a glslang AST swizzle node to a swizzle vector for building SPIR-V.
  2716. void TGlslangToSpvTraverser::convertSwizzle(const glslang::TIntermAggregate& node, std::vector<unsigned>& swizzle)
  2717. {
  2718. const glslang::TIntermSequence& swizzleSequence = node.getSequence();
  2719. for (int i = 0; i < (int)swizzleSequence.size(); ++i)
  2720. swizzle.push_back(swizzleSequence[i]->getAsConstantUnion()->getConstArray()[0].getIConst());
  2721. }
  2722. // Convert from a glslang type to an SPV type, by calling into a
  2723. // recursive version of this function. This establishes the inherited
  2724. // layout state rooted from the top-level type.
  2725. spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly)
  2726. {
  2727. return convertGlslangToSpvType(type, getExplicitLayout(type), type.getQualifier(), false, forwardReferenceOnly);
  2728. }
  2729. // Do full recursive conversion of an arbitrary glslang type to a SPIR-V Id.
  2730. // explicitLayout can be kept the same throughout the hierarchical recursive walk.
  2731. // Mutually recursive with convertGlslangStructToSpvType().
  //
  // Parameters:
  //   type                  - the glslang type to convert
  //   explicitLayout        - packing inherited from the root type; anything other than
  //                           ElpNone makes bools 32-bit uints and arrays stride-decorated
  //   qualifier             - the (inherited) qualifier view to use for this type
  //   lastBufferBlockMember - when true, a runtime-sized array here does not request the
  //                           descriptor-indexing extension/capability
  //   forwardReferenceOnly  - for reference types, return just the forward pointer and
  //                           do not convert the referent type
  //
  // Returns the Id of the SPIR-V type. The scalar/aggregate "base" type is made first,
  // then wrapped, in this order: matrix or vector, cooperative matrix, array.
  2732. spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type,
  2733. glslang::TLayoutPacking explicitLayout, const glslang::TQualifier& qualifier,
  2734. bool lastBufferBlockMember, bool forwardReferenceOnly)
  2735. {
  2736. spv::Id spvType = spv::NoResult;
  // Step 1: make the base (component or aggregate) type from the basic type.
  2737. switch (type.getBasicType()) {
  2738. case glslang::EbtVoid:
  2739. spvType = builder.makeVoidType();
  2740. assert (! type.isArray());
  2741. break;
  2742. case glslang::EbtFloat:
  2743. spvType = builder.makeFloatType(32);
  2744. break;
  2745. case glslang::EbtDouble:
  2746. spvType = builder.makeFloatType(64);
  2747. break;
  2748. case glslang::EbtFloat16:
  2749. spvType = builder.makeFloatType(16);
  2750. break;
  2751. case glslang::EbtBool:
  2752. // "transparent" bool doesn't exist in SPIR-V. The GLSL convention is
  2753. // a 32-bit int where non-0 means true.
  2754. if (explicitLayout != glslang::ElpNone)
  2755. spvType = builder.makeUintType(32);
  2756. else
  2757. spvType = builder.makeBoolType();
  2758. break;
  2759. case glslang::EbtInt8:
  2760. spvType = builder.makeIntType(8);
  2761. break;
  2762. case glslang::EbtUint8:
  2763. spvType = builder.makeUintType(8);
  2764. break;
  2765. case glslang::EbtInt16:
  2766. spvType = builder.makeIntType(16);
  2767. break;
  2768. case glslang::EbtUint16:
  2769. spvType = builder.makeUintType(16);
  2770. break;
  2771. case glslang::EbtInt:
  2772. spvType = builder.makeIntType(32);
  2773. break;
  2774. case glslang::EbtUint:
  2775. spvType = builder.makeUintType(32);
  2776. break;
  2777. case glslang::EbtInt64:
  2778. spvType = builder.makeIntType(64);
  2779. break;
  2780. case glslang::EbtUint64:
  2781. spvType = builder.makeUintType(64);
  2782. break;
  2783. case glslang::EbtAtomicUint:
  // atomic counters are represented as 32-bit uints and need the AtomicStorage capability
  2784. builder.addCapability(spv::CapabilityAtomicStorage);
  2785. spvType = builder.makeUintType(32);
  2786. break;
  2787. #ifdef NV_EXTENSIONS
  2788. case glslang::EbtAccStructNV:
  2789. spvType = builder.makeAccelerationStructureNVType();
  2790. break;
  2791. #endif
  2792. case glslang::EbtSampler:
  2793. {
  2794. const glslang::TSampler& sampler = type.getSampler();
  2795. if (sampler.sampler) {
  2796. // pure sampler
  2797. spvType = builder.makeSamplerType();
  2798. } else {
  2799. // an image is present, make its type
  2800. spvType = builder.makeImageType(getSampledType(sampler), TranslateDimensionality(sampler), sampler.shadow, sampler.arrayed, sampler.ms,
  2801. sampler.image ? 2 : 1, TranslateImageFormat(type));
  2802. if (sampler.combined) {
  2803. // already has both image and sampler, make the combined type
  2804. spvType = builder.makeSampledImageType(spvType);
  2805. }
  2806. }
  2807. }
  2808. break;
  2809. case glslang::EbtStruct:
  2810. case glslang::EbtBlock:
  2811. {
  2812. // If we've seen this struct type, return it
  2813. const glslang::TTypeList* glslangMembers = type.getStruct();
  2814. // Try to share structs for different layouts, but not yet for other
  2815. // kinds of qualification (primarily not yet including interpolant qualification).
  // The cache is keyed by explicit layout, matrix layout, and the member list.
  2816. if (! HasNonLayoutQualifiers(type, qualifier))
  2817. spvType = structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers];
  2818. if (spvType != spv::NoResult)
  2819. break;
  2820. // else, we haven't seen it...
  // blocks get a remapping table with one entry per glslang member
  2821. if (type.getBasicType() == glslang::EbtBlock)
  2822. memberRemapper[glslangMembers].resize(glslangMembers->size());
  2823. spvType = convertGlslangStructToSpvType(type, glslangMembers, explicitLayout, qualifier);
  2824. }
  2825. break;
  2826. case glslang::EbtReference:
  2827. {
  2828. // Make the forward pointer, then recurse to convert the structure type, then
  2829. // patch up the forward pointer with a real pointer type.
  // One forward pointer is kept per referent type, in forwardPointers.
  2830. if (forwardPointers.find(type.getReferentType()) == forwardPointers.end()) {
  2831. spv::Id forwardId = builder.makeForwardPointer(spv::StorageClassPhysicalStorageBufferEXT);
  2832. forwardPointers[type.getReferentType()] = forwardId;
  2833. }
  2834. spvType = forwardPointers[type.getReferentType()];
  // when only the forward reference is wanted, the referent is not converted here
  2835. if (!forwardReferenceOnly) {
  2836. spv::Id referentType = convertGlslangToSpvType(*type.getReferentType());
  2837. builder.makePointerFromForwardPointer(spv::StorageClassPhysicalStorageBufferEXT,
  2838. forwardPointers[type.getReferentType()],
  2839. referentType);
  2840. }
  2841. }
  2842. break;
  2843. default:
  2844. assert(0);
  2845. break;
  2846. }
  // Step 2: wrap the base type as a matrix or a vector, when applicable.
  2847. if (type.isMatrix())
  2848. spvType = builder.makeMatrixType(spvType, type.getMatrixCols(), type.getMatrixRows());
  2849. else {
  2850. // If this variable has a vector element count greater than 1, create a SPIR-V vector
  2851. if (type.getVectorSize() > 1)
  2852. spvType = builder.makeVectorType(spvType, type.getVectorSize());
  2853. }
  // Step 3: cooperative matrices; scope, rows and columns come from type parameters 1, 2 and 3.
  2854. if (type.isCoopMat()) {
  2855. builder.addCapability(spv::CapabilityCooperativeMatrixNV);
  2856. builder.addExtension(spv::E_SPV_NV_cooperative_matrix);
  2857. if (type.getBasicType() == glslang::EbtFloat16)
  2858. builder.addCapability(spv::CapabilityFloat16);
  2859. spv::Id scope = makeArraySizeId(*type.getTypeParameters(), 1);
  2860. spv::Id rows = makeArraySizeId(*type.getTypeParameters(), 2);
  2861. spv::Id cols = makeArraySizeId(*type.getTypeParameters(), 3);
  2862. spvType = builder.makeCooperativeMatrixType(spvType, scope, rows, cols);
  2863. }
  // Step 4: arrays; inner dimensions are made first, the outer dimension last.
  2864. if (type.isArray()) {
  2865. int stride = 0; // keep this 0 unless doing an explicit layout; 0 will mean no decoration, no stride
  2866. // Do all but the outer dimension
  2867. if (type.getArraySizes()->getNumDims() > 1) {
  2868. // We need to decorate array strides for types needing explicit layout, except blocks.
  2869. if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock) {
  2870. // Use a dummy glslang type for querying internal strides of
  2871. // arrays of arrays, but using just a one-dimensional array.
  2872. glslang::TType simpleArrayType(type, 0); // dereference type of the array
  2873. while (simpleArrayType.getArraySizes()->getNumDims() > 1)
  2874. simpleArrayType.getArraySizes()->dereference();
  2875. // Will compute the higher-order strides here, rather than making a whole
  2876. // pile of types and doing repetitive recursion on their contents.
  2877. stride = getArrayStride(simpleArrayType, explicitLayout, qualifier.layoutMatrix);
  2878. }
  2879. // make the arrays
  // walk from the innermost dimension outward; each level's stride is the
  // previous stride multiplied by that dimension's size
  2880. for (int dim = type.getArraySizes()->getNumDims() - 1; dim > 0; --dim) {
  2881. spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), dim), stride);
  2882. if (stride > 0)
  2883. builder.addDecoration(spvType, spv::DecorationArrayStride, stride);
  2884. stride *= type.getArraySizes()->getDimSize(dim);
  2885. }
  2886. } else {
  2887. // single-dimensional array, and don't yet have stride
  2888. // We need to decorate array strides for types needing explicit layout, except blocks.
  2889. if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock)
  2890. stride = getArrayStride(type, explicitLayout, qualifier.layoutMatrix);
  2891. }
  2892. // Do the outer dimension, which might not be known for a runtime-sized array.
  2893. // (Unsized arrays that survive through linking will be runtime-sized arrays)
  2894. if (type.isSizedArray())
  2895. spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), 0), stride);
  2896. else {
  // a runtime array that is not the last member of a buffer block requests
  // the descriptor-indexing extension and capability
  2897. if (!lastBufferBlockMember) {
  2898. builder.addExtension("SPV_EXT_descriptor_indexing");
  2899. builder.addCapability(spv::CapabilityRuntimeDescriptorArrayEXT);
  2900. }
  2901. spvType = builder.makeRuntimeArray(spvType);
  2902. }
  2903. if (stride > 0)
  2904. builder.addDecoration(spvType, spv::DecorationArrayStride, stride);
  2905. }
  2906. return spvType;
  2907. }
  2908. // TODO: this functionality should exist at a higher level, in creating the AST
  2909. //
  2910. // Identify interface members that don't have their required extension turned on.
  2911. //
  2912. bool TGlslangToSpvTraverser::filterMember(const glslang::TType& member)
  2913. {
  2914. #ifdef NV_EXTENSIONS
  2915. auto& extensions = glslangIntermediate->getRequestedExtensions();
  2916. if (member.getFieldName() == "gl_SecondaryViewportMaskNV" &&
  2917. extensions.find("GL_NV_stereo_view_rendering") == extensions.end())
  2918. return true;
  2919. if (member.getFieldName() == "gl_SecondaryPositionNV" &&
  2920. extensions.find("GL_NV_stereo_view_rendering") == extensions.end())
  2921. return true;
  2922. if (glslangIntermediate->getStage() != EShLangMeshNV) {
  2923. if (member.getFieldName() == "gl_ViewportMask" &&
  2924. extensions.find("GL_NV_viewport_array2") == extensions.end())
  2925. return true;
  2926. if (member.getFieldName() == "gl_PositionPerViewNV" &&
  2927. extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())
  2928. return true;
  2929. if (member.getFieldName() == "gl_ViewportMaskPerViewNV" &&
  2930. extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())
  2931. return true;
  2932. }
  2933. #endif
  2934. return false;
  2935. };
  2936. // Do full recursive conversion of a glslang structure (or block) type to a SPIR-V Id.
  2937. // explicitLayout can be kept the same throughout the hierarchical recursive walk.
  2938. // Mutually recursive with convertGlslangToSpvType().
  2939. spv::Id TGlslangToSpvTraverser::convertGlslangStructToSpvType(const glslang::TType& type,
  2940. const glslang::TTypeList* glslangMembers,
  2941. glslang::TLayoutPacking explicitLayout,
  2942. const glslang::TQualifier& qualifier)
  2943. {
  2944. // Create a vector of struct types for SPIR-V to consume
  2945. std::vector<spv::Id> spvMembers;
  2946. int memberDelta = 0; // how much the member's index changes from glslang to SPIR-V, normally 0, except sometimes for blocks
  2947. std::vector<std::pair<glslang::TType*, glslang::TQualifier> > deferredForwardPointers;
  2948. for (int i = 0; i < (int)glslangMembers->size(); i++) {
  2949. glslang::TType& glslangMember = *(*glslangMembers)[i].type;
  2950. if (glslangMember.hiddenMember()) {
  2951. ++memberDelta;
  2952. if (type.getBasicType() == glslang::EbtBlock)
  2953. memberRemapper[glslangMembers][i] = -1;
  2954. } else {
  2955. if (type.getBasicType() == glslang::EbtBlock) {
  2956. memberRemapper[glslangMembers][i] = i - memberDelta;
  2957. if (filterMember(glslangMember))
  2958. continue;
  2959. }
  2960. // modify just this child's view of the qualifier
  2961. glslang::TQualifier memberQualifier = glslangMember.getQualifier();
  2962. InheritQualifiers(memberQualifier, qualifier);
  2963. // manually inherit location
  2964. if (! memberQualifier.hasLocation() && qualifier.hasLocation())
  2965. memberQualifier.layoutLocation = qualifier.layoutLocation;
  2966. // recurse
  2967. bool lastBufferBlockMember = qualifier.storage == glslang::EvqBuffer &&
  2968. i == (int)glslangMembers->size() - 1;
  2969. // Make forward pointers for any pointer members, and create a list of members to
  2970. // convert to spirv types after creating the struct.
  2971. if (glslangMember.getBasicType() == glslang::EbtReference) {
  2972. if (forwardPointers.find(glslangMember.getReferentType()) == forwardPointers.end()) {
  2973. deferredForwardPointers.push_back(std::make_pair(&glslangMember, memberQualifier));
  2974. }
  2975. spvMembers.push_back(
  2976. convertGlslangToSpvType(glslangMember, explicitLayout, memberQualifier, lastBufferBlockMember, true));
  2977. } else {
  2978. spvMembers.push_back(
  2979. convertGlslangToSpvType(glslangMember, explicitLayout, memberQualifier, lastBufferBlockMember, false));
  2980. }
  2981. }
  2982. }
  2983. // Make the SPIR-V type
  2984. spv::Id spvType = builder.makeStructType(spvMembers, type.getTypeName().c_str());
  2985. if (! HasNonLayoutQualifiers(type, qualifier))
  2986. structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers] = spvType;
  2987. // Decorate it
  2988. decorateStructType(type, glslangMembers, explicitLayout, qualifier, spvType);
  2989. for (int i = 0; i < (int)deferredForwardPointers.size(); ++i) {
  2990. auto it = deferredForwardPointers[i];
  2991. convertGlslangToSpvType(*it.first, explicitLayout, it.second, false);
  2992. }
  2993. return spvType;
  2994. }
  // Name and decorate the members of an already-created SPIR-V struct type, then
  // decorate the struct itself.
  //
  // Parameters:
  //   type           - the glslang struct or block type that 'spvType' was made from
  //   glslangMembers - the glslang member list of that type
  //   explicitLayout - packing in effect; when not ElpNone, offsets and matrix strides are emitted
  //   qualifier      - the (inherited) qualifier view of the struct
  //   spvType        - Id of the SPIR-V struct type to decorate
  //
  // For blocks, glslang member indexes are translated through memberRemapper, and
  // members rejected by filterMember() or remapped to a negative index are skipped.
  2995. void TGlslangToSpvTraverser::decorateStructType(const glslang::TType& type,
  2996. const glslang::TTypeList* glslangMembers,
  2997. glslang::TLayoutPacking explicitLayout,
  2998. const glslang::TQualifier& qualifier,
  2999. spv::Id spvType)
  3000. {
  3001. // Name and decorate the non-hidden members
  // 'offset' carries the running member offset between iterations; -1 means "none yet"
  3002. int offset = -1;
  // NOTE(review): locationOffset is accumulated below but never read in this function
  3003. int locationOffset = 0; // for use within the members of this struct
  3004. for (int i = 0; i < (int)glslangMembers->size(); i++) {
  3005. glslang::TType& glslangMember = *(*glslangMembers)[i].type;
  // 'member' is the SPIR-V member index; it differs from i only for blocks
  3006. int member = i;
  3007. if (type.getBasicType() == glslang::EbtBlock) {
  3008. member = memberRemapper[glslangMembers][i];
  3009. if (filterMember(glslangMember))
  3010. continue;
  3011. }
  3012. // modify just this child's view of the qualifier
  3013. glslang::TQualifier memberQualifier = glslangMember.getQualifier();
  3014. InheritQualifiers(memberQualifier, qualifier);
  3015. // using -1 above to indicate a hidden member
  3016. if (member < 0)
  3017. continue;
  3018. builder.addMemberName(spvType, member, glslangMember.getFieldName().c_str());
  3019. builder.addMemberDecoration(spvType, member,
  3020. TranslateLayoutDecoration(glslangMember, memberQualifier.layoutMatrix));
  3021. builder.addMemberDecoration(spvType, member, TranslatePrecisionDecoration(glslangMember));
  3022. // Add interpolation and auxiliary storage decorations only to
  3023. // top-level members of Input and Output storage classes
  3024. if (type.getQualifier().storage == glslang::EvqVaryingIn ||
  3025. type.getQualifier().storage == glslang::EvqVaryingOut) {
  3026. if (type.getBasicType() == glslang::EbtBlock ||
  3027. glslangIntermediate->getSource() == glslang::EShSourceHlsl) {
  3028. builder.addMemberDecoration(spvType, member, TranslateInterpolationDecoration(memberQualifier));
  3029. builder.addMemberDecoration(spvType, member, TranslateAuxiliaryStorageDecoration(memberQualifier));
  3030. #ifdef NV_EXTENSIONS
  3031. addMeshNVDecoration(spvType, member, memberQualifier);
  3032. #endif
  3033. }
  3034. }
  3035. builder.addMemberDecoration(spvType, member, TranslateInvariantDecoration(memberQualifier));
  3036. if (type.getBasicType() == glslang::EbtBlock &&
  3037. qualifier.storage == glslang::EvqBuffer) {
  3038. // Add memory decorations only to top-level members of shader storage block
  3039. std::vector<spv::Decoration> memory;
  3040. TranslateMemoryDecoration(memberQualifier, memory, glslangIntermediate->usingVulkanMemoryModel());
  // note: this loop's 'i' shadows the member-loop index for the duration of the loop
  3041. for (unsigned int i = 0; i < memory.size(); ++i)
  3042. builder.addMemberDecoration(spvType, member, memory[i]);
  3043. }
  3044. // Location assignment was already completed correctly by the front end,
  3045. // just track whether a member needs to be decorated.
  3046. // Ignore member locations if the container is an array, as that's
  3047. // ill-specified and decisions have been made to not allow this.
  3048. if (! type.isArray() && memberQualifier.hasLocation())
  3049. builder.addMemberDecoration(spvType, member, spv::DecorationLocation, memberQualifier.layoutLocation);
  3050. if (qualifier.hasLocation()) // track for upcoming inheritance
  3051. locationOffset += glslangIntermediate->computeTypeLocationSize(
  3052. glslangMember, glslangIntermediate->getStage());
  3053. // component, XFB, others
  3054. if (glslangMember.getQualifier().hasComponent())
  3055. builder.addMemberDecoration(spvType, member, spv::DecorationComponent,
  3056. glslangMember.getQualifier().layoutComponent);
  // an XFB offset takes the Offset decoration; otherwise an explicit layout computes one
  3057. if (glslangMember.getQualifier().hasXfbOffset())
  3058. builder.addMemberDecoration(spvType, member, spv::DecorationOffset,
  3059. glslangMember.getQualifier().layoutXfbOffset);
  3060. else if (explicitLayout != glslang::ElpNone) {
  3061. // figure out what to do with offset, which is accumulating
  3062. int nextOffset;
  3063. updateMemberOffset(type, glslangMember, offset, nextOffset, explicitLayout, memberQualifier.layoutMatrix);
  // a negative offset means no Offset decoration is emitted for this member
  3064. if (offset >= 0)
  3065. builder.addMemberDecoration(spvType, member, spv::DecorationOffset, offset);
  3066. offset = nextOffset;
  3067. }
  3068. if (glslangMember.isMatrix() && explicitLayout != glslang::ElpNone)
  3069. builder.addMemberDecoration(spvType, member, spv::DecorationMatrixStride,
  3070. getMatrixStride(glslangMember, explicitLayout, memberQualifier.layoutMatrix));
  3071. // built-in variable decorations
  3072. spv::BuiltIn builtIn = TranslateBuiltInDecoration(glslangMember.getQualifier().builtIn, true);
  // BuiltInMax is treated as "no built-in decoration"
  3073. if (builtIn != spv::BuiltInMax)
  3074. builder.addMemberDecoration(spvType, member, spv::DecorationBuiltIn, (int)builtIn);
  3075. // nonuniform
  3076. builder.addMemberDecoration(spvType, member, TranslateNonUniformDecoration(glslangMember.getQualifier()));
  // HLSL semantic names are emitted only when HLSL functionality1 is enabled
  3077. if (glslangIntermediate->getHlslFunctionality1() && memberQualifier.semanticName != nullptr) {
  3078. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  3079. builder.addMemberDecoration(spvType, member, (spv::Decoration)spv::DecorationHlslSemanticGOOGLE,
  3080. memberQualifier.semanticName);
  3081. }
  3082. #ifdef NV_EXTENSIONS
  3083. if (builtIn == spv::BuiltInLayer) {
  3084. // SPV_NV_viewport_array2 extension
  3085. if (glslangMember.getQualifier().layoutViewportRelative){
  3086. builder.addMemberDecoration(spvType, member, (spv::Decoration)spv::DecorationViewportRelativeNV);
  3087. builder.addCapability(spv::CapabilityShaderViewportMaskNV);
  3088. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  3089. }
  // NOTE(review): -2048 is presumably the "not set" value of this offset - confirm against TQualifier
  3090. if (glslangMember.getQualifier().layoutSecondaryViewportRelativeOffset != -2048){
  3091. builder.addMemberDecoration(spvType, member,
  3092. (spv::Decoration)spv::DecorationSecondaryViewportRelativeNV,
  3093. glslangMember.getQualifier().layoutSecondaryViewportRelativeOffset);
  3094. builder.addCapability(spv::CapabilityShaderStereoViewNV);
  3095. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  3096. }
  3097. }
  3098. if (glslangMember.getQualifier().layoutPassthrough) {
  3099. builder.addMemberDecoration(spvType, member, (spv::Decoration)spv::DecorationPassthroughNV);
  3100. builder.addCapability(spv::CapabilityGeometryShaderPassthroughNV);
  3101. builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);
  3102. }
  3103. #endif
  3104. }
  3105. // Decorate the structure
  3106. builder.addDecoration(spvType, TranslateLayoutDecoration(type, qualifier.layoutMatrix));
  3107. builder.addDecoration(spvType, TranslateBlockDecoration(type, glslangIntermediate->usingStorageBuffer()));
  3108. }
  3109. // Turn the expression forming the array size into an id.
  3110. // This is not quite trivial, because of specialization constants.
  3111. // Sometimes, a raw constant is turned into an Id, and sometimes
  3112. // a specialization constant expression is.
  3113. spv::Id TGlslangToSpvTraverser::makeArraySizeId(const glslang::TArraySizes& arraySizes, int dim)
  3114. {
  3115. // First, see if this is sized with a node, meaning a specialization constant:
  3116. glslang::TIntermTyped* specNode = arraySizes.getDimNode(dim);
  3117. if (specNode != nullptr) {
  3118. builder.clearAccessChain();
  3119. specNode->traverse(this);
  3120. return accessChainLoad(specNode->getAsTyped()->getType());
  3121. }
  3122. // Otherwise, need a compile-time (front end) size, get it:
  3123. int size = arraySizes.getDimSize(dim);
  3124. assert(size > 0);
  3125. return builder.makeUintConstant(size);
  3126. }
  3127. // Wrap the builder's accessChainLoad to:
  3128. // - localize handling of RelaxedPrecision
  3129. // - use the SPIR-V inferred type instead of another conversion of the glslang type
  3130. // (avoids unnecessary work and possible type punning for structures)
  3131. // - do conversion of concrete to abstract type
  3132. spv::Id TGlslangToSpvTraverser::accessChainLoad(const glslang::TType& type)
  3133. {
  3134. spv::Id nominalTypeId = builder.accessChainGetInferredType();
  3135. spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
  3136. coherentFlags |= TranslateCoherent(type);
  3137. unsigned int alignment = builder.getAccessChain().alignment;
  3138. alignment |= type.getBufferReferenceAlignment();
  3139. spv::Id loadedId = builder.accessChainLoad(TranslatePrecisionDecoration(type),
  3140. TranslateNonUniformDecoration(type.getQualifier()),
  3141. nominalTypeId,
  3142. spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) & ~spv::MemoryAccessMakePointerAvailableKHRMask),
  3143. TranslateMemoryScope(coherentFlags),
  3144. alignment);
  3145. // Need to convert to abstract types when necessary
  3146. if (type.getBasicType() == glslang::EbtBool) {
  3147. if (builder.isScalarType(nominalTypeId)) {
  3148. // Conversion for bool
  3149. spv::Id boolType = builder.makeBoolType();
  3150. if (nominalTypeId != boolType)
  3151. loadedId = builder.createBinOp(spv::OpINotEqual, boolType, loadedId, builder.makeUintConstant(0));
  3152. } else if (builder.isVectorType(nominalTypeId)) {
  3153. // Conversion for bvec
  3154. int vecSize = builder.getNumTypeComponents(nominalTypeId);
  3155. spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);
  3156. if (nominalTypeId != bvecType)
  3157. loadedId = builder.createBinOp(spv::OpINotEqual, bvecType, loadedId, makeSmearedConstant(builder.makeUintConstant(0), vecSize));
  3158. }
  3159. }
  3160. return loadedId;
  3161. }
  3162. // Wrap the builder's accessChainStore to:
  3163. // - do conversion of concrete to abstract type
  3164. //
  3165. // Implicitly uses the existing builder.accessChain as the storage target.
  3166. void TGlslangToSpvTraverser::accessChainStore(const glslang::TType& type, spv::Id rvalue)
  3167. {
  3168. // Need to convert to abstract types when necessary
  3169. if (type.getBasicType() == glslang::EbtBool) {
  3170. spv::Id nominalTypeId = builder.accessChainGetInferredType();
  3171. if (builder.isScalarType(nominalTypeId)) {
  3172. // Conversion for bool
  3173. spv::Id boolType = builder.makeBoolType();
  3174. if (nominalTypeId != boolType) {
  3175. // keep these outside arguments, for determinant order-of-evaluation
  3176. spv::Id one = builder.makeUintConstant(1);
  3177. spv::Id zero = builder.makeUintConstant(0);
  3178. rvalue = builder.createTriOp(spv::OpSelect, nominalTypeId, rvalue, one, zero);
  3179. } else if (builder.getTypeId(rvalue) != boolType)
  3180. rvalue = builder.createBinOp(spv::OpINotEqual, boolType, rvalue, builder.makeUintConstant(0));
  3181. } else if (builder.isVectorType(nominalTypeId)) {
  3182. // Conversion for bvec
  3183. int vecSize = builder.getNumTypeComponents(nominalTypeId);
  3184. spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);
  3185. if (nominalTypeId != bvecType) {
  3186. // keep these outside arguments, for determinant order-of-evaluation
  3187. spv::Id one = makeSmearedConstant(builder.makeUintConstant(1), vecSize);
  3188. spv::Id zero = makeSmearedConstant(builder.makeUintConstant(0), vecSize);
  3189. rvalue = builder.createTriOp(spv::OpSelect, nominalTypeId, rvalue, one, zero);
  3190. } else if (builder.getTypeId(rvalue) != bvecType)
  3191. rvalue = builder.createBinOp(spv::OpINotEqual, bvecType, rvalue,
  3192. makeSmearedConstant(builder.makeUintConstant(0), vecSize));
  3193. }
  3194. }
  3195. spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
  3196. coherentFlags |= TranslateCoherent(type);
  3197. unsigned int alignment = builder.getAccessChain().alignment;
  3198. alignment |= type.getBufferReferenceAlignment();
  3199. builder.accessChainStore(rvalue,
  3200. spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) & ~spv::MemoryAccessMakePointerVisibleKHRMask),
  3201. TranslateMemoryScope(coherentFlags), alignment);
  3202. }
  3203. // For storing when types match at the glslang level, but not might match at the
  3204. // SPIR-V level.
  3205. //
  3206. // This especially happens when a single glslang type expands to multiple
  3207. // SPIR-V types, like a struct that is used in a member-undecorated way as well
  3208. // as in a member-decorated way.
  3209. //
  3210. // NOTE: This function can handle any store request; if it's not special it
  3211. // simplifies to a simple OpStore.
  3212. //
  3213. // Implicitly uses the existing builder.accessChain as the storage target.
  3214. void TGlslangToSpvTraverser::multiTypeStore(const glslang::TType& type, spv::Id rValue)
  3215. {
  3216. // we only do the complex path here if it's an aggregate
  3217. if (! type.isStruct() && ! type.isArray()) {
  3218. accessChainStore(type, rValue);
  3219. return;
  3220. }
  3221. // and, it has to be a case of type aliasing
  3222. spv::Id rType = builder.getTypeId(rValue);
  3223. spv::Id lValue = builder.accessChainGetLValue();
  3224. spv::Id lType = builder.getContainedTypeId(builder.getTypeId(lValue));
  3225. if (lType == rType) {
  3226. accessChainStore(type, rValue);
  3227. return;
  3228. }
  3229. // Recursively (as needed) copy an aggregate type to a different aggregate type,
  3230. // where the two types were the same type in GLSL. This requires member
  3231. // by member copy, recursively.
  3232. // If an array, copy element by element.
  3233. if (type.isArray()) {
  3234. glslang::TType glslangElementType(type, 0);
  3235. spv::Id elementRType = builder.getContainedTypeId(rType);
  3236. for (int index = 0; index < type.getOuterArraySize(); ++index) {
  3237. // get the source member
  3238. spv::Id elementRValue = builder.createCompositeExtract(rValue, elementRType, index);
  3239. // set up the target storage
  3240. builder.clearAccessChain();
  3241. builder.setAccessChainLValue(lValue);
  3242. builder.accessChainPush(builder.makeIntConstant(index), TranslateCoherent(type), type.getBufferReferenceAlignment());
  3243. // store the member
  3244. multiTypeStore(glslangElementType, elementRValue);
  3245. }
  3246. } else {
  3247. assert(type.isStruct());
  3248. // loop over structure members
  3249. const glslang::TTypeList& members = *type.getStruct();
  3250. for (int m = 0; m < (int)members.size(); ++m) {
  3251. const glslang::TType& glslangMemberType = *members[m].type;
  3252. // get the source member
  3253. spv::Id memberRType = builder.getContainedTypeId(rType, m);
  3254. spv::Id memberRValue = builder.createCompositeExtract(rValue, memberRType, m);
  3255. // set up the target storage
  3256. builder.clearAccessChain();
  3257. builder.setAccessChainLValue(lValue);
  3258. builder.accessChainPush(builder.makeIntConstant(m), TranslateCoherent(type), type.getBufferReferenceAlignment());
  3259. // store the member
  3260. multiTypeStore(glslangMemberType, memberRValue);
  3261. }
  3262. }
  3263. }
  3264. // Decide whether or not this type should be
  3265. // decorated with offsets and strides, and if so
  3266. // whether std140 or std430 rules should be applied.
  3267. glslang::TLayoutPacking TGlslangToSpvTraverser::getExplicitLayout(const glslang::TType& type) const
  3268. {
  3269. // has to be a block
  3270. if (type.getBasicType() != glslang::EbtBlock)
  3271. return glslang::ElpNone;
  3272. // has to be a uniform or buffer block or task in/out blocks
  3273. if (type.getQualifier().storage != glslang::EvqUniform &&
  3274. type.getQualifier().storage != glslang::EvqBuffer &&
  3275. !type.getQualifier().isTaskMemory())
  3276. return glslang::ElpNone;
  3277. // return the layout to use
  3278. switch (type.getQualifier().layoutPacking) {
  3279. case glslang::ElpStd140:
  3280. case glslang::ElpStd430:
  3281. case glslang::ElpScalar:
  3282. return type.getQualifier().layoutPacking;
  3283. default:
  3284. return glslang::ElpNone;
  3285. }
  3286. }
  3287. // Given an array type, returns the integer stride required for that array
  3288. int TGlslangToSpvTraverser::getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking explicitLayout, glslang::TLayoutMatrix matrixLayout)
  3289. {
  3290. int size;
  3291. int stride;
  3292. glslangIntermediate->getMemberAlignment(arrayType, size, stride, explicitLayout, matrixLayout == glslang::ElmRowMajor);
  3293. return stride;
  3294. }
  3295. // Given a matrix type, or array (of array) of matrixes type, returns the integer stride required for that matrix
  3296. // when used as a member of an interface block
  3297. int TGlslangToSpvTraverser::getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking explicitLayout, glslang::TLayoutMatrix matrixLayout)
  3298. {
  3299. glslang::TType elementType;
  3300. elementType.shallowCopy(matrixType);
  3301. elementType.clearArraySizes();
  3302. int size;
  3303. int stride;
  3304. glslangIntermediate->getMemberAlignment(elementType, size, stride, explicitLayout, matrixLayout == glslang::ElmRowMajor);
  3305. return stride;
  3306. }
  3307. // Given a member type of a struct, realign the current offset for it, and compute
  3308. // the next (not yet aligned) offset for the next member, which will get aligned
  3309. // on the next call.
  3310. // 'currentOffset' should be passed in already initialized, ready to modify, and reflecting
  3311. // the migration of data from nextOffset -> currentOffset. It should be -1 on the first call.
  3312. // -1 means a non-forced member offset (no decoration needed).
  3313. void TGlslangToSpvTraverser::updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType, int& currentOffset, int& nextOffset,
  3314. glslang::TLayoutPacking explicitLayout, glslang::TLayoutMatrix matrixLayout)
  3315. {
  3316. // this will get a positive value when deemed necessary
  3317. nextOffset = -1;
  3318. // override anything in currentOffset with user-set offset
  3319. if (memberType.getQualifier().hasOffset())
  3320. currentOffset = memberType.getQualifier().layoutOffset;
  3321. // It could be that current linker usage in glslang updated all the layoutOffset,
  3322. // in which case the following code does not matter. But, that's not quite right
  3323. // once cross-compilation unit GLSL validation is done, as the original user
  3324. // settings are needed in layoutOffset, and then the following will come into play.
  3325. if (explicitLayout == glslang::ElpNone) {
  3326. if (! memberType.getQualifier().hasOffset())
  3327. currentOffset = -1;
  3328. return;
  3329. }
  3330. // Getting this far means we need explicit offsets
  3331. if (currentOffset < 0)
  3332. currentOffset = 0;
  3333. // Now, currentOffset is valid (either 0, or from a previous nextOffset),
  3334. // but possibly not yet correctly aligned.
  3335. int memberSize;
  3336. int dummyStride;
  3337. int memberAlignment = glslangIntermediate->getMemberAlignment(memberType, memberSize, dummyStride, explicitLayout, matrixLayout == glslang::ElmRowMajor);
  3338. // Adjust alignment for HLSL rules
  3339. // TODO: make this consistent in early phases of code:
  3340. // adjusting this late means inconsistencies with earlier code, which for reflection is an issue
  3341. // Until reflection is brought in sync with these adjustments, don't apply to $Global,
  3342. // which is the most likely to rely on reflection, and least likely to rely implicit layouts
  3343. if (glslangIntermediate->usingHlslOffsets() &&
  3344. ! memberType.isArray() && memberType.isVector() && structType.getTypeName().compare("$Global") != 0) {
  3345. int dummySize;
  3346. int componentAlignment = glslangIntermediate->getBaseAlignmentScalar(memberType, dummySize);
  3347. if (componentAlignment <= 4)
  3348. memberAlignment = componentAlignment;
  3349. }
  3350. // Bump up to member alignment
  3351. glslang::RoundToPow2(currentOffset, memberAlignment);
  3352. // Bump up to vec4 if there is a bad straddle
  3353. if (explicitLayout != glslang::ElpScalar && glslangIntermediate->improperStraddle(memberType, memberSize, currentOffset))
  3354. glslang::RoundToPow2(currentOffset, 16);
  3355. nextOffset = currentOffset + memberSize;
  3356. }
  3357. void TGlslangToSpvTraverser::declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember)
  3358. {
  3359. const glslang::TBuiltInVariable glslangBuiltIn = members[glslangMember].type->getQualifier().builtIn;
  3360. switch (glslangBuiltIn)
  3361. {
  3362. case glslang::EbvClipDistance:
  3363. case glslang::EbvCullDistance:
  3364. case glslang::EbvPointSize:
  3365. #ifdef NV_EXTENSIONS
  3366. case glslang::EbvViewportMaskNV:
  3367. case glslang::EbvSecondaryPositionNV:
  3368. case glslang::EbvSecondaryViewportMaskNV:
  3369. case glslang::EbvPositionPerViewNV:
  3370. case glslang::EbvViewportMaskPerViewNV:
  3371. case glslang::EbvTaskCountNV:
  3372. case glslang::EbvPrimitiveCountNV:
  3373. case glslang::EbvPrimitiveIndicesNV:
  3374. case glslang::EbvClipDistancePerViewNV:
  3375. case glslang::EbvCullDistancePerViewNV:
  3376. case glslang::EbvLayerPerViewNV:
  3377. case glslang::EbvMeshViewCountNV:
  3378. case glslang::EbvMeshViewIndicesNV:
  3379. #endif
  3380. // Generate the associated capability. Delegate to TranslateBuiltInDecoration.
  3381. // Alternately, we could just call this for any glslang built-in, since the
  3382. // capability already guards against duplicates.
  3383. TranslateBuiltInDecoration(glslangBuiltIn, false);
  3384. break;
  3385. default:
  3386. // Capabilities were already generated when the struct was declared.
  3387. break;
  3388. }
  3389. }
  3390. bool TGlslangToSpvTraverser::isShaderEntryPoint(const glslang::TIntermAggregate* node)
  3391. {
  3392. return node->getName().compare(glslangIntermediate->getEntryPointMangledName().c_str()) == 0;
  3393. }
  3394. // Does parameter need a place to keep writes, separate from the original?
  3395. // Assumes called after originalParam(), which filters out block/buffer/opaque-based
  3396. // qualifiers such that we should have only in/out/inout/constreadonly here.
  3397. bool TGlslangToSpvTraverser::writableParam(glslang::TStorageQualifier qualifier) const
  3398. {
  3399. assert(qualifier == glslang::EvqIn ||
  3400. qualifier == glslang::EvqOut ||
  3401. qualifier == glslang::EvqInOut ||
  3402. qualifier == glslang::EvqConstReadOnly);
  3403. return qualifier != glslang::EvqConstReadOnly;
  3404. }
  3405. // Is parameter pass-by-original?
  3406. bool TGlslangToSpvTraverser::originalParam(glslang::TStorageQualifier qualifier, const glslang::TType& paramType,
  3407. bool implicitThisParam)
  3408. {
  3409. if (implicitThisParam) // implicit this
  3410. return true;
  3411. if (glslangIntermediate->getSource() == glslang::EShSourceHlsl)
  3412. return paramType.getBasicType() == glslang::EbtBlock;
  3413. return paramType.containsOpaque() || // sampler, etc.
  3414. (paramType.getBasicType() == glslang::EbtBlock && qualifier == glslang::EvqBuffer); // SSBO
  3415. }
  3416. // Make all the functions, skeletally, without actually visiting their bodies.
  3417. void TGlslangToSpvTraverser::makeFunctions(const glslang::TIntermSequence& glslFunctions)
  3418. {
  3419. const auto getParamDecorations = [&](std::vector<spv::Decoration>& decorations, const glslang::TType& type, bool useVulkanMemoryModel) {
  3420. spv::Decoration paramPrecision = TranslatePrecisionDecoration(type);
  3421. if (paramPrecision != spv::NoPrecision)
  3422. decorations.push_back(paramPrecision);
  3423. TranslateMemoryDecoration(type.getQualifier(), decorations, useVulkanMemoryModel);
  3424. if (type.getBasicType() == glslang::EbtReference) {
  3425. // Original and non-writable params pass the pointer directly and
  3426. // use restrict/aliased, others are stored to a pointer in Function
  3427. // memory and use RestrictPointer/AliasedPointer.
  3428. if (originalParam(type.getQualifier().storage, type, false) ||
  3429. !writableParam(type.getQualifier().storage)) {
  3430. decorations.push_back(type.getQualifier().restrict ? spv::DecorationRestrict : spv::DecorationAliased);
  3431. } else {
  3432. decorations.push_back(type.getQualifier().restrict ? spv::DecorationRestrictPointerEXT : spv::DecorationAliasedPointerEXT);
  3433. }
  3434. }
  3435. };
  3436. for (int f = 0; f < (int)glslFunctions.size(); ++f) {
  3437. glslang::TIntermAggregate* glslFunction = glslFunctions[f]->getAsAggregate();
  3438. if (! glslFunction || glslFunction->getOp() != glslang::EOpFunction || isShaderEntryPoint(glslFunction))
  3439. continue;
  3440. // We're on a user function. Set up the basic interface for the function now,
  3441. // so that it's available to call. Translating the body will happen later.
  3442. //
  3443. // Typically (except for a "const in" parameter), an address will be passed to the
  3444. // function. What it is an address of varies:
  3445. //
  3446. // - "in" parameters not marked as "const" can be written to without modifying the calling
  3447. // argument so that write needs to be to a copy, hence the address of a copy works.
  3448. //
  3449. // - "const in" parameters can just be the r-value, as no writes need occur.
  3450. //
  3451. // - "out" and "inout" arguments can't be done as pointers to the calling argument, because
  3452. // GLSL has copy-in/copy-out semantics. They can be handled though with a pointer to a copy.
  3453. std::vector<spv::Id> paramTypes;
  3454. std::vector<std::vector<spv::Decoration>> paramDecorations; // list of decorations per parameter
  3455. glslang::TIntermSequence& parameters = glslFunction->getSequence()[0]->getAsAggregate()->getSequence();
  3456. bool implicitThis = (int)parameters.size() > 0 && parameters[0]->getAsSymbolNode()->getName() ==
  3457. glslangIntermediate->implicitThisName;
  3458. paramDecorations.resize(parameters.size());
  3459. for (int p = 0; p < (int)parameters.size(); ++p) {
  3460. const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();
  3461. spv::Id typeId = convertGlslangToSpvType(paramType);
  3462. if (originalParam(paramType.getQualifier().storage, paramType, implicitThis && p == 0))
  3463. typeId = builder.makePointer(TranslateStorageClass(paramType), typeId);
  3464. else if (writableParam(paramType.getQualifier().storage))
  3465. typeId = builder.makePointer(spv::StorageClassFunction, typeId);
  3466. else
  3467. rValueParameters.insert(parameters[p]->getAsSymbolNode()->getId());
  3468. getParamDecorations(paramDecorations[p], paramType, glslangIntermediate->usingVulkanMemoryModel());
  3469. paramTypes.push_back(typeId);
  3470. }
  3471. spv::Block* functionBlock;
  3472. spv::Function *function = builder.makeFunctionEntry(TranslatePrecisionDecoration(glslFunction->getType()),
  3473. convertGlslangToSpvType(glslFunction->getType()),
  3474. glslFunction->getName().c_str(), paramTypes,
  3475. paramDecorations, &functionBlock);
  3476. if (implicitThis)
  3477. function->setImplicitThis();
  3478. // Track function to emit/call later
  3479. functionMap[glslFunction->getName().c_str()] = function;
  3480. // Set the parameter id's
  3481. for (int p = 0; p < (int)parameters.size(); ++p) {
  3482. symbolValues[parameters[p]->getAsSymbolNode()->getId()] = function->getParamId(p);
  3483. // give a name too
  3484. builder.addName(function->getParamId(p), parameters[p]->getAsSymbolNode()->getName().c_str());
  3485. }
  3486. }
  3487. }
  3488. // Process all the initializers, while skipping the functions and link objects
  3489. void TGlslangToSpvTraverser::makeGlobalInitializers(const glslang::TIntermSequence& initializers)
  3490. {
  3491. builder.setBuildPoint(shaderEntry->getLastBlock());
  3492. for (int i = 0; i < (int)initializers.size(); ++i) {
  3493. glslang::TIntermAggregate* initializer = initializers[i]->getAsAggregate();
  3494. if (initializer && initializer->getOp() != glslang::EOpFunction && initializer->getOp() != glslang::EOpLinkerObjects) {
  3495. // We're on a top-level node that's not a function. Treat as an initializer, whose
  3496. // code goes into the beginning of the entry point.
  3497. initializer->traverse(this);
  3498. }
  3499. }
  3500. }
  3501. // Process all the functions, while skipping initializers.
  3502. void TGlslangToSpvTraverser::visitFunctions(const glslang::TIntermSequence& glslFunctions)
  3503. {
  3504. for (int f = 0; f < (int)glslFunctions.size(); ++f) {
  3505. glslang::TIntermAggregate* node = glslFunctions[f]->getAsAggregate();
  3506. if (node && (node->getOp() == glslang::EOpFunction || node->getOp() == glslang::EOpLinkerObjects))
  3507. node->traverse(this);
  3508. }
  3509. }
  3510. void TGlslangToSpvTraverser::handleFunctionEntry(const glslang::TIntermAggregate* node)
  3511. {
  3512. // SPIR-V functions should already be in the functionMap from the prepass
  3513. // that called makeFunctions().
  3514. currentFunction = functionMap[node->getName().c_str()];
  3515. spv::Block* functionBlock = currentFunction->getEntryBlock();
  3516. builder.setBuildPoint(functionBlock);
  3517. }
  3518. void TGlslangToSpvTraverser::translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments)
  3519. {
  3520. const glslang::TIntermSequence& glslangArguments = node.getSequence();
  3521. glslang::TSampler sampler = {};
  3522. bool cubeCompare = false;
  3523. #ifdef AMD_EXTENSIONS
  3524. bool f16ShadowCompare = false;
  3525. #endif
  3526. if (node.isTexture() || node.isImage()) {
  3527. sampler = glslangArguments[0]->getAsTyped()->getType().getSampler();
  3528. cubeCompare = sampler.dim == glslang::EsdCube && sampler.arrayed && sampler.shadow;
  3529. #ifdef AMD_EXTENSIONS
  3530. f16ShadowCompare = sampler.shadow && glslangArguments[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16;
  3531. #endif
  3532. }
  3533. for (int i = 0; i < (int)glslangArguments.size(); ++i) {
  3534. builder.clearAccessChain();
  3535. glslangArguments[i]->traverse(this);
  3536. // Special case l-value operands
  3537. bool lvalue = false;
  3538. switch (node.getOp()) {
  3539. case glslang::EOpImageAtomicAdd:
  3540. case glslang::EOpImageAtomicMin:
  3541. case glslang::EOpImageAtomicMax:
  3542. case glslang::EOpImageAtomicAnd:
  3543. case glslang::EOpImageAtomicOr:
  3544. case glslang::EOpImageAtomicXor:
  3545. case glslang::EOpImageAtomicExchange:
  3546. case glslang::EOpImageAtomicCompSwap:
  3547. case glslang::EOpImageAtomicLoad:
  3548. case glslang::EOpImageAtomicStore:
  3549. if (i == 0)
  3550. lvalue = true;
  3551. break;
  3552. case glslang::EOpSparseImageLoad:
  3553. if ((sampler.ms && i == 3) || (! sampler.ms && i == 2))
  3554. lvalue = true;
  3555. break;
  3556. #ifdef AMD_EXTENSIONS
  3557. case glslang::EOpSparseTexture:
  3558. if (((cubeCompare || f16ShadowCompare) && i == 3) || (! (cubeCompare || f16ShadowCompare) && i == 2))
  3559. lvalue = true;
  3560. break;
  3561. case glslang::EOpSparseTextureClamp:
  3562. if (((cubeCompare || f16ShadowCompare) && i == 4) || (! (cubeCompare || f16ShadowCompare) && i == 3))
  3563. lvalue = true;
  3564. break;
  3565. case glslang::EOpSparseTextureLod:
  3566. case glslang::EOpSparseTextureOffset:
  3567. if ((f16ShadowCompare && i == 4) || (! f16ShadowCompare && i == 3))
  3568. lvalue = true;
  3569. break;
  3570. #else
  3571. case glslang::EOpSparseTexture:
  3572. if ((cubeCompare && i == 3) || (! cubeCompare && i == 2))
  3573. lvalue = true;
  3574. break;
  3575. case glslang::EOpSparseTextureClamp:
  3576. if ((cubeCompare && i == 4) || (! cubeCompare && i == 3))
  3577. lvalue = true;
  3578. break;
  3579. case glslang::EOpSparseTextureLod:
  3580. case glslang::EOpSparseTextureOffset:
  3581. if (i == 3)
  3582. lvalue = true;
  3583. break;
  3584. #endif
  3585. case glslang::EOpSparseTextureFetch:
  3586. if ((sampler.dim != glslang::EsdRect && i == 3) || (sampler.dim == glslang::EsdRect && i == 2))
  3587. lvalue = true;
  3588. break;
  3589. case glslang::EOpSparseTextureFetchOffset:
  3590. if ((sampler.dim != glslang::EsdRect && i == 4) || (sampler.dim == glslang::EsdRect && i == 3))
  3591. lvalue = true;
  3592. break;
  3593. #ifdef AMD_EXTENSIONS
  3594. case glslang::EOpSparseTextureLodOffset:
  3595. case glslang::EOpSparseTextureGrad:
  3596. case glslang::EOpSparseTextureOffsetClamp:
  3597. if ((f16ShadowCompare && i == 5) || (! f16ShadowCompare && i == 4))
  3598. lvalue = true;
  3599. break;
  3600. case glslang::EOpSparseTextureGradOffset:
  3601. case glslang::EOpSparseTextureGradClamp:
  3602. if ((f16ShadowCompare && i == 6) || (! f16ShadowCompare && i == 5))
  3603. lvalue = true;
  3604. break;
  3605. case glslang::EOpSparseTextureGradOffsetClamp:
  3606. if ((f16ShadowCompare && i == 7) || (! f16ShadowCompare && i == 6))
  3607. lvalue = true;
  3608. break;
  3609. #else
  3610. case glslang::EOpSparseTextureLodOffset:
  3611. case glslang::EOpSparseTextureGrad:
  3612. case glslang::EOpSparseTextureOffsetClamp:
  3613. if (i == 4)
  3614. lvalue = true;
  3615. break;
  3616. case glslang::EOpSparseTextureGradOffset:
  3617. case glslang::EOpSparseTextureGradClamp:
  3618. if (i == 5)
  3619. lvalue = true;
  3620. break;
  3621. case glslang::EOpSparseTextureGradOffsetClamp:
  3622. if (i == 6)
  3623. lvalue = true;
  3624. break;
  3625. #endif
  3626. case glslang::EOpSparseTextureGather:
  3627. if ((sampler.shadow && i == 3) || (! sampler.shadow && i == 2))
  3628. lvalue = true;
  3629. break;
  3630. case glslang::EOpSparseTextureGatherOffset:
  3631. case glslang::EOpSparseTextureGatherOffsets:
  3632. if ((sampler.shadow && i == 4) || (! sampler.shadow && i == 3))
  3633. lvalue = true;
  3634. break;
  3635. #ifdef AMD_EXTENSIONS
  3636. case glslang::EOpSparseTextureGatherLod:
  3637. if (i == 3)
  3638. lvalue = true;
  3639. break;
  3640. case glslang::EOpSparseTextureGatherLodOffset:
  3641. case glslang::EOpSparseTextureGatherLodOffsets:
  3642. if (i == 4)
  3643. lvalue = true;
  3644. break;
  3645. case glslang::EOpSparseImageLoadLod:
  3646. if (i == 3)
  3647. lvalue = true;
  3648. break;
  3649. #endif
  3650. #ifdef NV_EXTENSIONS
  3651. case glslang::EOpImageSampleFootprintNV:
  3652. if (i == 4)
  3653. lvalue = true;
  3654. break;
  3655. case glslang::EOpImageSampleFootprintClampNV:
  3656. case glslang::EOpImageSampleFootprintLodNV:
  3657. if (i == 5)
  3658. lvalue = true;
  3659. break;
  3660. case glslang::EOpImageSampleFootprintGradNV:
  3661. if (i == 6)
  3662. lvalue = true;
  3663. break;
  3664. case glslang::EOpImageSampleFootprintGradClampNV:
  3665. if (i == 7)
  3666. lvalue = true;
  3667. break;
  3668. #endif
  3669. default:
  3670. break;
  3671. }
  3672. if (lvalue)
  3673. arguments.push_back(builder.accessChainGetLValue());
  3674. else
  3675. arguments.push_back(accessChainLoad(glslangArguments[i]->getAsTyped()->getType()));
  3676. }
  3677. }
  3678. void TGlslangToSpvTraverser::translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments)
  3679. {
  3680. builder.clearAccessChain();
  3681. node.getOperand()->traverse(this);
  3682. arguments.push_back(accessChainLoad(node.getOperand()->getType()));
  3683. }
  3684. spv::Id TGlslangToSpvTraverser::createImageTextureFunctionCall(glslang::TIntermOperator* node)
  3685. {
  3686. if (! node->isImage() && ! node->isTexture())
  3687. return spv::NoResult;
  3688. builder.setLine(node->getLoc().line, node->getLoc().getFilename());
  3689. // Process a GLSL texturing op (will be SPV image)
  3690. const glslang::TType &imageType = node->getAsAggregate() ? node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType()
  3691. : node->getAsUnaryNode()->getOperand()->getAsTyped()->getType();
  3692. const glslang::TSampler sampler = imageType.getSampler();
  3693. #ifdef AMD_EXTENSIONS
  3694. bool f16ShadowCompare = (sampler.shadow && node->getAsAggregate())
  3695. ? node->getAsAggregate()->getSequence()[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16
  3696. : false;
  3697. #endif
  3698. std::vector<spv::Id> arguments;
  3699. if (node->getAsAggregate())
  3700. translateArguments(*node->getAsAggregate(), arguments);
  3701. else
  3702. translateArguments(*node->getAsUnaryNode(), arguments);
  3703. spv::Decoration precision = TranslatePrecisionDecoration(node->getOperationPrecision());
  3704. spv::Builder::TextureParameters params = { };
  3705. params.sampler = arguments[0];
  3706. glslang::TCrackedTextureOp cracked;
  3707. node->crackTexture(sampler, cracked);
  3708. const bool isUnsignedResult = node->getType().getBasicType() == glslang::EbtUint;
  3709. // Check for queries
  3710. if (cracked.query) {
  3711. // OpImageQueryLod works on a sampled image, for other queries the image has to be extracted first
  3712. if (node->getOp() != glslang::EOpTextureQueryLod && builder.isSampledImage(params.sampler))
  3713. params.sampler = builder.createUnaryOp(spv::OpImage, builder.getImageType(params.sampler), params.sampler);
  3714. switch (node->getOp()) {
  3715. case glslang::EOpImageQuerySize:
  3716. case glslang::EOpTextureQuerySize:
  3717. if (arguments.size() > 1) {
  3718. params.lod = arguments[1];
  3719. return builder.createTextureQueryCall(spv::OpImageQuerySizeLod, params, isUnsignedResult);
  3720. } else
  3721. return builder.createTextureQueryCall(spv::OpImageQuerySize, params, isUnsignedResult);
  3722. case glslang::EOpImageQuerySamples:
  3723. case glslang::EOpTextureQuerySamples:
  3724. return builder.createTextureQueryCall(spv::OpImageQuerySamples, params, isUnsignedResult);
  3725. case glslang::EOpTextureQueryLod:
  3726. params.coords = arguments[1];
  3727. return builder.createTextureQueryCall(spv::OpImageQueryLod, params, isUnsignedResult);
  3728. case glslang::EOpTextureQueryLevels:
  3729. return builder.createTextureQueryCall(spv::OpImageQueryLevels, params, isUnsignedResult);
  3730. case glslang::EOpSparseTexelsResident:
  3731. return builder.createUnaryOp(spv::OpImageSparseTexelsResident, builder.makeBoolType(), arguments[0]);
  3732. default:
  3733. assert(0);
  3734. break;
  3735. }
  3736. }
  3737. int components = node->getType().getVectorSize();
  3738. if (node->getOp() == glslang::EOpTextureFetch) {
  3739. // These must produce 4 components, per SPIR-V spec. We'll add a conversion constructor if needed.
  3740. // This will only happen through the HLSL path for operator[], so we do not have to handle e.g.
  3741. // the EOpTexture/Proj/Lod/etc family. It would be harmless to do so, but would need more logic
  3742. // here around e.g. which ones return scalars or other types.
  3743. components = 4;
  3744. }
  3745. glslang::TType returnType(node->getType().getBasicType(), glslang::EvqTemporary, components);
  3746. auto resultType = [&returnType,this]{ return convertGlslangToSpvType(returnType); };
  3747. // Check for image functions other than queries
  3748. if (node->isImage()) {
  3749. std::vector<spv::IdImmediate> operands;
  3750. auto opIt = arguments.begin();
  3751. spv::IdImmediate image = { true, *(opIt++) };
  3752. operands.push_back(image);
  3753. // Handle subpass operations
  3754. // TODO: GLSL should change to have the "MS" only on the type rather than the
  3755. // built-in function.
  3756. if (cracked.subpass) {
  3757. // add on the (0,0) coordinate
  3758. spv::Id zero = builder.makeIntConstant(0);
  3759. std::vector<spv::Id> comps;
  3760. comps.push_back(zero);
  3761. comps.push_back(zero);
  3762. spv::IdImmediate coord = { true,
  3763. builder.makeCompositeConstant(builder.makeVectorType(builder.makeIntType(32), 2), comps) };
  3764. operands.push_back(coord);
  3765. if (sampler.ms) {
  3766. spv::IdImmediate imageOperands = { false, spv::ImageOperandsSampleMask };
  3767. operands.push_back(imageOperands);
  3768. spv::IdImmediate imageOperand = { true, *(opIt++) };
  3769. operands.push_back(imageOperand);
  3770. }
  3771. spv::Id result = builder.createOp(spv::OpImageRead, resultType(), operands);
  3772. builder.setPrecision(result, precision);
  3773. return result;
  3774. }
  3775. spv::IdImmediate coord = { true, *(opIt++) };
  3776. operands.push_back(coord);
  3777. #ifdef AMD_EXTENSIONS
  3778. if (node->getOp() == glslang::EOpImageLoad || node->getOp() == glslang::EOpImageLoadLod) {
  3779. #else
  3780. if (node->getOp() == glslang::EOpImageLoad) {
  3781. #endif
  3782. spv::ImageOperandsMask mask = spv::ImageOperandsMaskNone;
  3783. if (sampler.ms) {
  3784. mask = mask | spv::ImageOperandsSampleMask;
  3785. }
  3786. #ifdef AMD_EXTENSIONS
  3787. if (cracked.lod) {
  3788. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  3789. builder.addCapability(spv::CapabilityImageReadWriteLodAMD);
  3790. mask = mask | spv::ImageOperandsLodMask;
  3791. }
  3792. #endif
  3793. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  3794. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMakeTexelAvailableKHRMask);
  3795. if (mask) {
  3796. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  3797. operands.push_back(imageOperands);
  3798. }
  3799. if (mask & spv::ImageOperandsSampleMask) {
  3800. spv::IdImmediate imageOperand = { true, *opIt++ };
  3801. operands.push_back(imageOperand);
  3802. }
  3803. #ifdef AMD_EXTENSIONS
  3804. if (mask & spv::ImageOperandsLodMask) {
  3805. spv::IdImmediate imageOperand = { true, *opIt++ };
  3806. operands.push_back(imageOperand);
  3807. }
  3808. #endif
  3809. if (mask & spv::ImageOperandsMakeTexelVisibleKHRMask) {
  3810. spv::IdImmediate imageOperand = { true, builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
  3811. operands.push_back(imageOperand);
  3812. }
  3813. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormatUnknown)
  3814. builder.addCapability(spv::CapabilityStorageImageReadWithoutFormat);
  3815. std::vector<spv::Id> result(1, builder.createOp(spv::OpImageRead, resultType(), operands));
  3816. builder.setPrecision(result[0], precision);
  3817. // If needed, add a conversion constructor to the proper size.
  3818. if (components != node->getType().getVectorSize())
  3819. result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));
  3820. return result[0];
  3821. #ifdef AMD_EXTENSIONS
  3822. } else if (node->getOp() == glslang::EOpImageStore || node->getOp() == glslang::EOpImageStoreLod) {
  3823. #else
  3824. } else if (node->getOp() == glslang::EOpImageStore) {
  3825. #endif
  3826. // Push the texel value before the operands
  3827. #ifdef AMD_EXTENSIONS
  3828. if (sampler.ms || cracked.lod) {
  3829. #else
  3830. if (sampler.ms) {
  3831. #endif
  3832. spv::IdImmediate texel = { true, *(opIt + 1) };
  3833. operands.push_back(texel);
  3834. } else {
  3835. spv::IdImmediate texel = { true, *opIt };
  3836. operands.push_back(texel);
  3837. }
  3838. spv::ImageOperandsMask mask = spv::ImageOperandsMaskNone;
  3839. if (sampler.ms) {
  3840. mask = mask | spv::ImageOperandsSampleMask;
  3841. }
  3842. #ifdef AMD_EXTENSIONS
  3843. if (cracked.lod) {
  3844. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  3845. builder.addCapability(spv::CapabilityImageReadWriteLodAMD);
  3846. mask = mask | spv::ImageOperandsLodMask;
  3847. }
  3848. #endif
  3849. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  3850. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMakeTexelVisibleKHRMask);
  3851. if (mask) {
  3852. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  3853. operands.push_back(imageOperands);
  3854. }
  3855. if (mask & spv::ImageOperandsSampleMask) {
  3856. spv::IdImmediate imageOperand = { true, *opIt++ };
  3857. operands.push_back(imageOperand);
  3858. }
  3859. #ifdef AMD_EXTENSIONS
  3860. if (mask & spv::ImageOperandsLodMask) {
  3861. spv::IdImmediate imageOperand = { true, *opIt++ };
  3862. operands.push_back(imageOperand);
  3863. }
  3864. #endif
  3865. if (mask & spv::ImageOperandsMakeTexelAvailableKHRMask) {
  3866. spv::IdImmediate imageOperand = { true, builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
  3867. operands.push_back(imageOperand);
  3868. }
  3869. builder.createNoResultOp(spv::OpImageWrite, operands);
  3870. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormatUnknown)
  3871. builder.addCapability(spv::CapabilityStorageImageWriteWithoutFormat);
  3872. return spv::NoResult;
  3873. #ifdef AMD_EXTENSIONS
  3874. } else if (node->getOp() == glslang::EOpSparseImageLoad || node->getOp() == glslang::EOpSparseImageLoadLod) {
  3875. #else
  3876. } else if (node->getOp() == glslang::EOpSparseImageLoad) {
  3877. #endif
  3878. builder.addCapability(spv::CapabilitySparseResidency);
  3879. if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormatUnknown)
  3880. builder.addCapability(spv::CapabilityStorageImageReadWithoutFormat);
  3881. spv::ImageOperandsMask mask = spv::ImageOperandsMaskNone;
  3882. if (sampler.ms) {
  3883. mask = mask | spv::ImageOperandsSampleMask;
  3884. }
  3885. #ifdef AMD_EXTENSIONS
  3886. if (cracked.lod) {
  3887. builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
  3888. builder.addCapability(spv::CapabilityImageReadWriteLodAMD);
  3889. mask = mask | spv::ImageOperandsLodMask;
  3890. }
  3891. #endif
  3892. mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
  3893. mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMakeTexelAvailableKHRMask);
  3894. if (mask) {
  3895. spv::IdImmediate imageOperands = { false, (unsigned int)mask };
  3896. operands.push_back(imageOperands);
  3897. }
  3898. if (mask & spv::ImageOperandsSampleMask) {
  3899. spv::IdImmediate imageOperand = { true, *opIt++ };
  3900. operands.push_back(imageOperand);
  3901. }
  3902. #ifdef AMD_EXTENSIONS
  3903. if (mask & spv::ImageOperandsLodMask) {
  3904. spv::IdImmediate imageOperand = { true, *opIt++ };
  3905. operands.push_back(imageOperand);
  3906. }
  3907. #endif
  3908. if (mask & spv::ImageOperandsMakeTexelVisibleKHRMask) {
  3909. spv::IdImmediate imageOperand = { true, builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
  3910. operands.push_back(imageOperand);
  3911. }
  3912. // Create the return type that was a special structure
  3913. spv::Id texelOut = *opIt;
  3914. spv::Id typeId0 = resultType();
  3915. spv::Id typeId1 = builder.getDerefTypeId(texelOut);
  3916. spv::Id resultTypeId = builder.makeStructResultType(typeId0, typeId1);
  3917. spv::Id resultId = builder.createOp(spv::OpImageSparseRead, resultTypeId, operands);
  3918. // Decode the return type
  3919. builder.createStore(builder.createCompositeExtract(resultId, typeId1, 1), texelOut);
  3920. return builder.createCompositeExtract(resultId, typeId0, 0);
  3921. } else {
  3922. // Process image atomic operations
  3923. // GLSL "IMAGE_PARAMS" will involve in constructing an image texel pointer and this pointer,
  3924. // as the first source operand, is required by SPIR-V atomic operations.
  3925. // For non-MS, the sample value should be 0
  3926. spv::IdImmediate sample = { true, sampler.ms ? *(opIt++) : builder.makeUintConstant(0) };
  3927. operands.push_back(sample);
  3928. spv::Id resultTypeId;
  3929. // imageAtomicStore has a void return type so base the pointer type on
  3930. // the type of the value operand.
  3931. if (node->getOp() == glslang::EOpImageAtomicStore) {
  3932. resultTypeId = builder.makePointer(spv::StorageClassImage, builder.getTypeId(operands[2].word));
  3933. } else {
  3934. resultTypeId = builder.makePointer(spv::StorageClassImage, resultType());
  3935. }
  3936. spv::Id pointer = builder.createOp(spv::OpImageTexelPointer, resultTypeId, operands);
  3937. std::vector<spv::Id> operands;
  3938. operands.push_back(pointer);
  3939. for (; opIt != arguments.end(); ++opIt)
  3940. operands.push_back(*opIt);
  3941. return createAtomicOperation(node->getOp(), precision, resultType(), operands, node->getBasicType());
  3942. }
  3943. }
  3944. #ifdef AMD_EXTENSIONS
  3945. // Check for fragment mask functions other than queries
  3946. if (cracked.fragMask) {
  3947. assert(sampler.ms);
  3948. auto opIt = arguments.begin();
  3949. std::vector<spv::Id> operands;
  3950. // Extract the image if necessary
  3951. if (builder.isSampledImage(params.sampler))
  3952. params.sampler = builder.createUnaryOp(spv::OpImage, builder.getImageType(params.sampler), params.sampler);
  3953. operands.push_back(params.sampler);
  3954. ++opIt;
  3955. if (sampler.isSubpass()) {
  3956. // add on the (0,0) coordinate
  3957. spv::Id zero = builder.makeIntConstant(0);
  3958. std::vector<spv::Id> comps;
  3959. comps.push_back(zero);
  3960. comps.push_back(zero);
  3961. operands.push_back(builder.makeCompositeConstant(builder.makeVectorType(builder.makeIntType(32), 2), comps));
  3962. }
  3963. for (; opIt != arguments.end(); ++opIt)
  3964. operands.push_back(*opIt);
  3965. spv::Op fragMaskOp = spv::OpNop;
  3966. if (node->getOp() == glslang::EOpFragmentMaskFetch)
  3967. fragMaskOp = spv::OpFragmentMaskFetchAMD;
  3968. else if (node->getOp() == glslang::EOpFragmentFetch)
  3969. fragMaskOp = spv::OpFragmentFetchAMD;
  3970. builder.addExtension(spv::E_SPV_AMD_shader_fragment_mask);
  3971. builder.addCapability(spv::CapabilityFragmentMaskAMD);
  3972. return builder.createOp(fragMaskOp, resultType(), operands);
  3973. }
  3974. #endif
  3975. // Check for texture functions other than queries
  3976. bool sparse = node->isSparseTexture();
  3977. #ifdef NV_EXTENSIONS
  3978. bool imageFootprint = node->isImageFootprint();
  3979. #endif
  3980. bool cubeCompare = sampler.dim == glslang::EsdCube && sampler.arrayed && sampler.shadow;
  3981. // check for bias argument
  3982. bool bias = false;
  3983. #ifdef AMD_EXTENSIONS
  3984. if (! cracked.lod && ! cracked.grad && ! cracked.fetch && ! cubeCompare) {
  3985. #else
  3986. if (! cracked.lod && ! cracked.gather && ! cracked.grad && ! cracked.fetch && ! cubeCompare) {
  3987. #endif
  3988. int nonBiasArgCount = 2;
  3989. #ifdef AMD_EXTENSIONS
  3990. if (cracked.gather)
  3991. ++nonBiasArgCount; // comp argument should be present when bias argument is present
  3992. if (f16ShadowCompare)
  3993. ++nonBiasArgCount;
  3994. #endif
  3995. if (cracked.offset)
  3996. ++nonBiasArgCount;
  3997. #ifdef AMD_EXTENSIONS
  3998. else if (cracked.offsets)
  3999. ++nonBiasArgCount;
  4000. #endif
  4001. if (cracked.grad)
  4002. nonBiasArgCount += 2;
  4003. if (cracked.lodClamp)
  4004. ++nonBiasArgCount;
  4005. if (sparse)
  4006. ++nonBiasArgCount;
  4007. #ifdef NV_EXTENSIONS
  4008. if (imageFootprint)
  4009. //Following three extra arguments
  4010. // int granularity, bool coarse, out gl_TextureFootprint2DNV footprint
  4011. nonBiasArgCount += 3;
  4012. #endif
  4013. if ((int)arguments.size() > nonBiasArgCount)
  4014. bias = true;
  4015. }
  4016. // See if the sampler param should really be just the SPV image part
  4017. if (cracked.fetch) {
  4018. // a fetch needs to have the image extracted first
  4019. if (builder.isSampledImage(params.sampler))
  4020. params.sampler = builder.createUnaryOp(spv::OpImage, builder.getImageType(params.sampler), params.sampler);
  4021. }
  4022. #ifdef AMD_EXTENSIONS
  4023. if (cracked.gather) {
  4024. const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();
  4025. if (bias || cracked.lod ||
  4026. sourceExtensions.find(glslang::E_GL_AMD_texture_gather_bias_lod) != sourceExtensions.end()) {
  4027. builder.addExtension(spv::E_SPV_AMD_texture_gather_bias_lod);
  4028. builder.addCapability(spv::CapabilityImageGatherBiasLodAMD);
  4029. }
  4030. }
  4031. #endif
  4032. // set the rest of the arguments
  4033. params.coords = arguments[1];
  4034. int extraArgs = 0;
  4035. bool noImplicitLod = false;
  4036. // sort out where Dref is coming from
  4037. #ifdef AMD_EXTENSIONS
  4038. if (cubeCompare || f16ShadowCompare) {
  4039. #else
  4040. if (cubeCompare) {
  4041. #endif
  4042. params.Dref = arguments[2];
  4043. ++extraArgs;
  4044. } else if (sampler.shadow && cracked.gather) {
  4045. params.Dref = arguments[2];
  4046. ++extraArgs;
  4047. } else if (sampler.shadow) {
  4048. std::vector<spv::Id> indexes;
  4049. int dRefComp;
  4050. if (cracked.proj)
  4051. dRefComp = 2; // "The resulting 3rd component of P in the shadow forms is used as Dref"
  4052. else
  4053. dRefComp = builder.getNumComponents(params.coords) - 1;
  4054. indexes.push_back(dRefComp);
  4055. params.Dref = builder.createCompositeExtract(params.coords, builder.getScalarTypeId(builder.getTypeId(params.coords)), indexes);
  4056. }
  4057. // lod
  4058. if (cracked.lod) {
  4059. params.lod = arguments[2 + extraArgs];
  4060. ++extraArgs;
  4061. } else if (glslangIntermediate->getStage() != EShLangFragment
  4062. #ifdef NV_EXTENSIONS
  4063. // NV_compute_shader_derivatives layout qualifiers allow for implicit LODs
  4064. && !(glslangIntermediate->getStage() == EShLangCompute &&
  4065. (glslangIntermediate->getLayoutDerivativeModeNone() != glslang::LayoutDerivativeNone))
  4066. #endif
  4067. ) {
  4068. // we need to invent the default lod for an explicit lod instruction for a non-fragment stage
  4069. noImplicitLod = true;
  4070. }
  4071. // multisample
  4072. if (sampler.ms) {
  4073. params.sample = arguments[2 + extraArgs]; // For MS, "sample" should be specified
  4074. ++extraArgs;
  4075. }
  4076. // gradient
  4077. if (cracked.grad) {
  4078. params.gradX = arguments[2 + extraArgs];
  4079. params.gradY = arguments[3 + extraArgs];
  4080. extraArgs += 2;
  4081. }
  4082. // offset and offsets
  4083. if (cracked.offset) {
  4084. params.offset = arguments[2 + extraArgs];
  4085. ++extraArgs;
  4086. } else if (cracked.offsets) {
  4087. params.offsets = arguments[2 + extraArgs];
  4088. ++extraArgs;
  4089. }
  4090. // lod clamp
  4091. if (cracked.lodClamp) {
  4092. params.lodClamp = arguments[2 + extraArgs];
  4093. ++extraArgs;
  4094. }
  4095. // sparse
  4096. if (sparse) {
  4097. params.texelOut = arguments[2 + extraArgs];
  4098. ++extraArgs;
  4099. }
  4100. // gather component
  4101. if (cracked.gather && ! sampler.shadow) {
  4102. // default component is 0, if missing, otherwise an argument
  4103. if (2 + extraArgs < (int)arguments.size()) {
  4104. params.component = arguments[2 + extraArgs];
  4105. ++extraArgs;
  4106. } else
  4107. params.component = builder.makeIntConstant(0);
  4108. }
  4109. #ifdef NV_EXTENSIONS
  4110. spv::Id resultStruct = spv::NoResult;
  4111. if (imageFootprint) {
  4112. //Following three extra arguments
  4113. // int granularity, bool coarse, out gl_TextureFootprint2DNV footprint
  4114. params.granularity = arguments[2 + extraArgs];
  4115. params.coarse = arguments[3 + extraArgs];
  4116. resultStruct = arguments[4 + extraArgs];
  4117. extraArgs += 3;
  4118. }
  4119. #endif
  4120. // bias
  4121. if (bias) {
  4122. params.bias = arguments[2 + extraArgs];
  4123. ++extraArgs;
  4124. }
  4125. #ifdef NV_EXTENSIONS
  4126. if (imageFootprint) {
  4127. builder.addExtension(spv::E_SPV_NV_shader_image_footprint);
  4128. builder.addCapability(spv::CapabilityImageFootprintNV);
  4129. //resultStructType(OpenGL type) contains 5 elements:
  4130. //struct gl_TextureFootprint2DNV {
  4131. // uvec2 anchor;
  4132. // uvec2 offset;
  4133. // uvec2 mask;
  4134. // uint lod;
  4135. // uint granularity;
  4136. //};
  4137. //or
  4138. //struct gl_TextureFootprint3DNV {
  4139. // uvec3 anchor;
  4140. // uvec3 offset;
  4141. // uvec2 mask;
  4142. // uint lod;
  4143. // uint granularity;
  4144. //};
  4145. spv::Id resultStructType = builder.getContainedTypeId(builder.getTypeId(resultStruct));
  4146. assert(builder.isStructType(resultStructType));
  4147. //resType (SPIR-V type) contains 6 elements:
  4148. //Member 0 must be a Boolean type scalar(LOD),
  4149. //Member 1 must be a vector of integer type, whose Signedness operand is 0(anchor),
  4150. //Member 2 must be a vector of integer type, whose Signedness operand is 0(offset),
  4151. //Member 3 must be a vector of integer type, whose Signedness operand is 0(mask),
  4152. //Member 4 must be a scalar of integer type, whose Signedness operand is 0(lod),
  4153. //Member 5 must be a scalar of integer type, whose Signedness operand is 0(granularity).
  4154. std::vector<spv::Id> members;
  4155. members.push_back(resultType());
  4156. for (int i = 0; i < 5; i++) {
  4157. members.push_back(builder.getContainedTypeId(resultStructType, i));
  4158. }
  4159. spv::Id resType = builder.makeStructType(members, "ResType");
  4160. //call ImageFootprintNV
  4161. spv::Id res = builder.createTextureCall(precision, resType, sparse, cracked.fetch, cracked.proj, cracked.gather, noImplicitLod, params);
  4162. //copy resType (SPIR-V type) to resultStructType(OpenGL type)
  4163. for (int i = 0; i < 5; i++) {
  4164. builder.clearAccessChain();
  4165. builder.setAccessChainLValue(resultStruct);
  4166. //Accessing to a struct we created, no coherent flag is set
  4167. spv::Builder::AccessChain::CoherentFlags flags;
  4168. flags.clear();
  4169. builder.accessChainPush(builder.makeIntConstant(i), flags, 0);
  4170. builder.accessChainStore(builder.createCompositeExtract(res, builder.getContainedTypeId(resType, i+1), i+1));
  4171. }
  4172. return builder.createCompositeExtract(res, resultType(), 0);
  4173. }
  4174. #endif
  4175. // projective component (might not to move)
  4176. // GLSL: "The texture coordinates consumed from P, not including the last component of P,
  4177. // are divided by the last component of P."
  4178. // SPIR-V: "... (u [, v] [, w], q)... It may be a vector larger than needed, but all
  4179. // unused components will appear after all used components."
  4180. if (cracked.proj) {
  4181. int projSourceComp = builder.getNumComponents(params.coords) - 1;
  4182. int projTargetComp;
  4183. switch (sampler.dim) {
  4184. case glslang::Esd1D: projTargetComp = 1; break;
  4185. case glslang::Esd2D: projTargetComp = 2; break;
  4186. case glslang::EsdRect: projTargetComp = 2; break;
  4187. default: projTargetComp = projSourceComp; break;
  4188. }
  4189. // copy the projective coordinate if we have to
  4190. if (projTargetComp != projSourceComp) {
  4191. spv::Id projComp = builder.createCompositeExtract(params.coords,
  4192. builder.getScalarTypeId(builder.getTypeId(params.coords)),
  4193. projSourceComp);
  4194. params.coords = builder.createCompositeInsert(projComp, params.coords,
  4195. builder.getTypeId(params.coords), projTargetComp);
  4196. }
  4197. }
  4198. // nonprivate
  4199. if (imageType.getQualifier().nonprivate) {
  4200. params.nonprivate = true;
  4201. }
  4202. // volatile
  4203. if (imageType.getQualifier().volatil) {
  4204. params.volatil = true;
  4205. }
  4206. std::vector<spv::Id> result( 1,
  4207. builder.createTextureCall(precision, resultType(), sparse, cracked.fetch, cracked.proj, cracked.gather, noImplicitLod, params)
  4208. );
  4209. if (components != node->getType().getVectorSize())
  4210. result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));
  4211. return result[0];
  4212. }
  4213. spv::Id TGlslangToSpvTraverser::handleUserFunctionCall(const glslang::TIntermAggregate* node)
  4214. {
  4215. // Grab the function's pointer from the previously created function
  4216. spv::Function* function = functionMap[node->getName().c_str()];
  4217. if (! function)
  4218. return 0;
  4219. const glslang::TIntermSequence& glslangArgs = node->getSequence();
  4220. const glslang::TQualifierList& qualifiers = node->getQualifierList();
  4221. // See comments in makeFunctions() for details about the semantics for parameter passing.
  4222. //
  4223. // These imply we need a four step process:
  4224. // 1. Evaluate the arguments
  4225. // 2. Allocate and make copies of in, out, and inout arguments
  4226. // 3. Make the call
  4227. // 4. Copy back the results
  4228. // 1. Evaluate the arguments and their types
  4229. std::vector<spv::Builder::AccessChain> lValues;
  4230. std::vector<spv::Id> rValues;
  4231. std::vector<const glslang::TType*> argTypes;
  4232. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  4233. argTypes.push_back(&glslangArgs[a]->getAsTyped()->getType());
  4234. // build l-value
  4235. builder.clearAccessChain();
  4236. glslangArgs[a]->traverse(this);
  4237. // keep outputs and pass-by-originals as l-values, evaluate others as r-values
  4238. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0) ||
  4239. writableParam(qualifiers[a])) {
  4240. // save l-value
  4241. lValues.push_back(builder.getAccessChain());
  4242. } else {
  4243. // process r-value
  4244. rValues.push_back(accessChainLoad(*argTypes.back()));
  4245. }
  4246. }
  4247. // 2. Allocate space for anything needing a copy, and if it's "in" or "inout"
  4248. // copy the original into that space.
  4249. //
  4250. // Also, build up the list of actual arguments to pass in for the call
  4251. int lValueCount = 0;
  4252. int rValueCount = 0;
  4253. std::vector<spv::Id> spvArgs;
  4254. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  4255. spv::Id arg;
  4256. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0)) {
  4257. builder.setAccessChain(lValues[lValueCount]);
  4258. arg = builder.accessChainGetLValue();
  4259. ++lValueCount;
  4260. } else if (writableParam(qualifiers[a])) {
  4261. // need space to hold the copy
  4262. arg = builder.createVariable(spv::StorageClassFunction, builder.getContainedTypeId(function->getParamType(a)), "param");
  4263. if (qualifiers[a] == glslang::EvqIn || qualifiers[a] == glslang::EvqInOut) {
  4264. // need to copy the input into output space
  4265. builder.setAccessChain(lValues[lValueCount]);
  4266. spv::Id copy = accessChainLoad(*argTypes[a]);
  4267. builder.clearAccessChain();
  4268. builder.setAccessChainLValue(arg);
  4269. multiTypeStore(*argTypes[a], copy);
  4270. }
  4271. ++lValueCount;
  4272. } else {
  4273. // process r-value, which involves a copy for a type mismatch
  4274. if (function->getParamType(a) != convertGlslangToSpvType(*argTypes[a])) {
  4275. spv::Id argCopy = builder.createVariable(spv::StorageClassFunction, function->getParamType(a), "arg");
  4276. builder.clearAccessChain();
  4277. builder.setAccessChainLValue(argCopy);
  4278. multiTypeStore(*argTypes[a], rValues[rValueCount]);
  4279. arg = builder.createLoad(argCopy);
  4280. } else
  4281. arg = rValues[rValueCount];
  4282. ++rValueCount;
  4283. }
  4284. spvArgs.push_back(arg);
  4285. }
  4286. // 3. Make the call.
  4287. spv::Id result = builder.createFunctionCall(function, spvArgs);
  4288. builder.setPrecision(result, TranslatePrecisionDecoration(node->getType()));
  4289. // 4. Copy back out an "out" arguments.
  4290. lValueCount = 0;
  4291. for (int a = 0; a < (int)glslangArgs.size(); ++a) {
  4292. if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0))
  4293. ++lValueCount;
  4294. else if (writableParam(qualifiers[a])) {
  4295. if (qualifiers[a] == glslang::EvqOut || qualifiers[a] == glslang::EvqInOut) {
  4296. spv::Id copy = builder.createLoad(spvArgs[a]);
  4297. builder.setAccessChain(lValues[lValueCount]);
  4298. multiTypeStore(*argTypes[a], copy);
  4299. }
  4300. ++lValueCount;
  4301. }
  4302. }
  4303. return result;
  4304. }
  4305. // Translate AST operation to SPV operation, already having SPV-based operands/types.
  4306. spv::Id TGlslangToSpvTraverser::createBinaryOperation(glslang::TOperator op, OpDecorations& decorations,
  4307. spv::Id typeId, spv::Id left, spv::Id right,
  4308. glslang::TBasicType typeProxy, bool reduceComparison)
  4309. {
  4310. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  4311. bool isFloat = isTypeFloat(typeProxy);
  4312. bool isBool = typeProxy == glslang::EbtBool;
  4313. spv::Op binOp = spv::OpNop;
  4314. bool needMatchingVectors = true; // for non-matrix ops, would a scalar need to smear to match a vector?
  4315. bool comparison = false;
  4316. switch (op) {
  4317. case glslang::EOpAdd:
  4318. case glslang::EOpAddAssign:
  4319. if (isFloat)
  4320. binOp = spv::OpFAdd;
  4321. else
  4322. binOp = spv::OpIAdd;
  4323. break;
  4324. case glslang::EOpSub:
  4325. case glslang::EOpSubAssign:
  4326. if (isFloat)
  4327. binOp = spv::OpFSub;
  4328. else
  4329. binOp = spv::OpISub;
  4330. break;
  4331. case glslang::EOpMul:
  4332. case glslang::EOpMulAssign:
  4333. if (isFloat)
  4334. binOp = spv::OpFMul;
  4335. else
  4336. binOp = spv::OpIMul;
  4337. break;
  4338. case glslang::EOpVectorTimesScalar:
  4339. case glslang::EOpVectorTimesScalarAssign:
  4340. if (isFloat && (builder.isVector(left) || builder.isVector(right))) {
  4341. if (builder.isVector(right))
  4342. std::swap(left, right);
  4343. assert(builder.isScalar(right));
  4344. needMatchingVectors = false;
  4345. binOp = spv::OpVectorTimesScalar;
  4346. } else if (isFloat)
  4347. binOp = spv::OpFMul;
  4348. else
  4349. binOp = spv::OpIMul;
  4350. break;
  4351. case glslang::EOpVectorTimesMatrix:
  4352. case glslang::EOpVectorTimesMatrixAssign:
  4353. binOp = spv::OpVectorTimesMatrix;
  4354. break;
  4355. case glslang::EOpMatrixTimesVector:
  4356. binOp = spv::OpMatrixTimesVector;
  4357. break;
  4358. case glslang::EOpMatrixTimesScalar:
  4359. case glslang::EOpMatrixTimesScalarAssign:
  4360. binOp = spv::OpMatrixTimesScalar;
  4361. break;
  4362. case glslang::EOpMatrixTimesMatrix:
  4363. case glslang::EOpMatrixTimesMatrixAssign:
  4364. binOp = spv::OpMatrixTimesMatrix;
  4365. break;
  4366. case glslang::EOpOuterProduct:
  4367. binOp = spv::OpOuterProduct;
  4368. needMatchingVectors = false;
  4369. break;
  4370. case glslang::EOpDiv:
  4371. case glslang::EOpDivAssign:
  4372. if (isFloat)
  4373. binOp = spv::OpFDiv;
  4374. else if (isUnsigned)
  4375. binOp = spv::OpUDiv;
  4376. else
  4377. binOp = spv::OpSDiv;
  4378. break;
  4379. case glslang::EOpMod:
  4380. case glslang::EOpModAssign:
  4381. if (isFloat)
  4382. binOp = spv::OpFMod;
  4383. else if (isUnsigned)
  4384. binOp = spv::OpUMod;
  4385. else
  4386. binOp = spv::OpSMod;
  4387. break;
  4388. case glslang::EOpRightShift:
  4389. case glslang::EOpRightShiftAssign:
  4390. if (isUnsigned)
  4391. binOp = spv::OpShiftRightLogical;
  4392. else
  4393. binOp = spv::OpShiftRightArithmetic;
  4394. break;
  4395. case glslang::EOpLeftShift:
  4396. case glslang::EOpLeftShiftAssign:
  4397. binOp = spv::OpShiftLeftLogical;
  4398. break;
  4399. case glslang::EOpAnd:
  4400. case glslang::EOpAndAssign:
  4401. binOp = spv::OpBitwiseAnd;
  4402. break;
  4403. case glslang::EOpLogicalAnd:
  4404. needMatchingVectors = false;
  4405. binOp = spv::OpLogicalAnd;
  4406. break;
  4407. case glslang::EOpInclusiveOr:
  4408. case glslang::EOpInclusiveOrAssign:
  4409. binOp = spv::OpBitwiseOr;
  4410. break;
  4411. case glslang::EOpLogicalOr:
  4412. needMatchingVectors = false;
  4413. binOp = spv::OpLogicalOr;
  4414. break;
  4415. case glslang::EOpExclusiveOr:
  4416. case glslang::EOpExclusiveOrAssign:
  4417. binOp = spv::OpBitwiseXor;
  4418. break;
  4419. case glslang::EOpLogicalXor:
  4420. needMatchingVectors = false;
  4421. binOp = spv::OpLogicalNotEqual;
  4422. break;
  4423. case glslang::EOpLessThan:
  4424. case glslang::EOpGreaterThan:
  4425. case glslang::EOpLessThanEqual:
  4426. case glslang::EOpGreaterThanEqual:
  4427. case glslang::EOpEqual:
  4428. case glslang::EOpNotEqual:
  4429. case glslang::EOpVectorEqual:
  4430. case glslang::EOpVectorNotEqual:
  4431. comparison = true;
  4432. break;
  4433. default:
  4434. break;
  4435. }
  4436. // handle mapped binary operations (should be non-comparison)
  4437. if (binOp != spv::OpNop) {
  4438. assert(comparison == false);
  4439. if (builder.isMatrix(left) || builder.isMatrix(right) ||
  4440. builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))
  4441. return createBinaryMatrixOperation(binOp, decorations, typeId, left, right);
  4442. // No matrix involved; make both operands be the same number of components, if needed
  4443. if (needMatchingVectors)
  4444. builder.promoteScalar(decorations.precision, left, right);
  4445. spv::Id result = builder.createBinOp(binOp, typeId, left, right);
  4446. builder.addDecoration(result, decorations.noContraction);
  4447. builder.addDecoration(result, decorations.nonUniform);
  4448. return builder.setPrecision(result, decorations.precision);
  4449. }
  4450. if (! comparison)
  4451. return 0;
  4452. // Handle comparison instructions
  4453. if (reduceComparison && (op == glslang::EOpEqual || op == glslang::EOpNotEqual)
  4454. && (builder.isVector(left) || builder.isMatrix(left) || builder.isAggregate(left))) {
  4455. spv::Id result = builder.createCompositeCompare(decorations.precision, left, right, op == glslang::EOpEqual);
  4456. builder.addDecoration(result, decorations.nonUniform);
  4457. return result;
  4458. }
  4459. switch (op) {
  4460. case glslang::EOpLessThan:
  4461. if (isFloat)
  4462. binOp = spv::OpFOrdLessThan;
  4463. else if (isUnsigned)
  4464. binOp = spv::OpULessThan;
  4465. else
  4466. binOp = spv::OpSLessThan;
  4467. break;
  4468. case glslang::EOpGreaterThan:
  4469. if (isFloat)
  4470. binOp = spv::OpFOrdGreaterThan;
  4471. else if (isUnsigned)
  4472. binOp = spv::OpUGreaterThan;
  4473. else
  4474. binOp = spv::OpSGreaterThan;
  4475. break;
  4476. case glslang::EOpLessThanEqual:
  4477. if (isFloat)
  4478. binOp = spv::OpFOrdLessThanEqual;
  4479. else if (isUnsigned)
  4480. binOp = spv::OpULessThanEqual;
  4481. else
  4482. binOp = spv::OpSLessThanEqual;
  4483. break;
  4484. case glslang::EOpGreaterThanEqual:
  4485. if (isFloat)
  4486. binOp = spv::OpFOrdGreaterThanEqual;
  4487. else if (isUnsigned)
  4488. binOp = spv::OpUGreaterThanEqual;
  4489. else
  4490. binOp = spv::OpSGreaterThanEqual;
  4491. break;
  4492. case glslang::EOpEqual:
  4493. case glslang::EOpVectorEqual:
  4494. if (isFloat)
  4495. binOp = spv::OpFOrdEqual;
  4496. else if (isBool)
  4497. binOp = spv::OpLogicalEqual;
  4498. else
  4499. binOp = spv::OpIEqual;
  4500. break;
  4501. case glslang::EOpNotEqual:
  4502. case glslang::EOpVectorNotEqual:
  4503. if (isFloat)
  4504. binOp = spv::OpFOrdNotEqual;
  4505. else if (isBool)
  4506. binOp = spv::OpLogicalNotEqual;
  4507. else
  4508. binOp = spv::OpINotEqual;
  4509. break;
  4510. default:
  4511. break;
  4512. }
  4513. if (binOp != spv::OpNop) {
  4514. spv::Id result = builder.createBinOp(binOp, typeId, left, right);
  4515. builder.addDecoration(result, decorations.noContraction);
  4516. builder.addDecoration(result, decorations.nonUniform);
  4517. return builder.setPrecision(result, decorations.precision);
  4518. }
  4519. return 0;
  4520. }
  4521. //
  4522. // Translate AST matrix operation to SPV operation, already having SPV-based operands/types.
  4523. // These can be any of:
  4524. //
  4525. // matrix * scalar
  4526. // scalar * matrix
  4527. // matrix * matrix linear algebraic
  4528. // matrix * vector
  4529. // vector * matrix
  4530. // matrix * matrix componentwise
  4531. // matrix op matrix op in {+, -, /}
  4532. // matrix op scalar op in {+, -, /}
  4533. // scalar op matrix op in {+, -, /}
  4534. //
  4535. spv::Id TGlslangToSpvTraverser::createBinaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,
  4536. spv::Id left, spv::Id right)
  4537. {
  4538. bool firstClass = true;
  4539. // First, handle first-class matrix operations (* and matrix/scalar)
  4540. switch (op) {
  4541. case spv::OpFDiv:
  4542. if (builder.isMatrix(left) && builder.isScalar(right)) {
  4543. // turn matrix / scalar into a multiply...
  4544. spv::Id resultType = builder.getTypeId(right);
  4545. right = builder.createBinOp(spv::OpFDiv, resultType, builder.makeFpConstant(resultType, 1.0), right);
  4546. op = spv::OpMatrixTimesScalar;
  4547. } else
  4548. firstClass = false;
  4549. break;
  4550. case spv::OpMatrixTimesScalar:
  4551. if (builder.isMatrix(right) || builder.isCooperativeMatrix(right))
  4552. std::swap(left, right);
  4553. assert(builder.isScalar(right));
  4554. break;
  4555. case spv::OpVectorTimesMatrix:
  4556. assert(builder.isVector(left));
  4557. assert(builder.isMatrix(right));
  4558. break;
  4559. case spv::OpMatrixTimesVector:
  4560. assert(builder.isMatrix(left));
  4561. assert(builder.isVector(right));
  4562. break;
  4563. case spv::OpMatrixTimesMatrix:
  4564. assert(builder.isMatrix(left));
  4565. assert(builder.isMatrix(right));
  4566. break;
  4567. default:
  4568. firstClass = false;
  4569. break;
  4570. }
  4571. if (builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))
  4572. firstClass = true;
  4573. if (firstClass) {
  4574. spv::Id result = builder.createBinOp(op, typeId, left, right);
  4575. builder.addDecoration(result, decorations.noContraction);
  4576. builder.addDecoration(result, decorations.nonUniform);
  4577. return builder.setPrecision(result, decorations.precision);
  4578. }
  4579. // Handle component-wise +, -, *, %, and / for all combinations of type.
  4580. // The result type of all of them is the same type as the (a) matrix operand.
  4581. // The algorithm is to:
  4582. // - break the matrix(es) into vectors
  4583. // - smear any scalar to a vector
  4584. // - do vector operations
  4585. // - make a matrix out the vector results
  4586. switch (op) {
  4587. case spv::OpFAdd:
  4588. case spv::OpFSub:
  4589. case spv::OpFDiv:
  4590. case spv::OpFMod:
  4591. case spv::OpFMul:
  4592. {
  4593. // one time set up...
  4594. bool leftMat = builder.isMatrix(left);
  4595. bool rightMat = builder.isMatrix(right);
  4596. unsigned int numCols = leftMat ? builder.getNumColumns(left) : builder.getNumColumns(right);
  4597. int numRows = leftMat ? builder.getNumRows(left) : builder.getNumRows(right);
  4598. spv::Id scalarType = builder.getScalarTypeId(typeId);
  4599. spv::Id vecType = builder.makeVectorType(scalarType, numRows);
  4600. std::vector<spv::Id> results;
  4601. spv::Id smearVec = spv::NoResult;
  4602. if (builder.isScalar(left))
  4603. smearVec = builder.smearScalar(decorations.precision, left, vecType);
  4604. else if (builder.isScalar(right))
  4605. smearVec = builder.smearScalar(decorations.precision, right, vecType);
  4606. // do each vector op
  4607. for (unsigned int c = 0; c < numCols; ++c) {
  4608. std::vector<unsigned int> indexes;
  4609. indexes.push_back(c);
  4610. spv::Id leftVec = leftMat ? builder.createCompositeExtract( left, vecType, indexes) : smearVec;
  4611. spv::Id rightVec = rightMat ? builder.createCompositeExtract(right, vecType, indexes) : smearVec;
  4612. spv::Id result = builder.createBinOp(op, vecType, leftVec, rightVec);
  4613. builder.addDecoration(result, decorations.noContraction);
  4614. builder.addDecoration(result, decorations.nonUniform);
  4615. results.push_back(builder.setPrecision(result, decorations.precision));
  4616. }
  4617. // put the pieces together
  4618. spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);
  4619. builder.addDecoration(result, decorations.nonUniform);
  4620. return result;
  4621. }
  4622. default:
  4623. assert(0);
  4624. return spv::NoResult;
  4625. }
  4626. }
  4627. spv::Id TGlslangToSpvTraverser::createUnaryOperation(glslang::TOperator op, OpDecorations& decorations, spv::Id typeId,
  4628. spv::Id operand, glslang::TBasicType typeProxy)
  4629. {
  4630. spv::Op unaryOp = spv::OpNop;
  4631. int extBuiltins = -1;
  4632. int libCall = -1;
  4633. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  4634. bool isFloat = isTypeFloat(typeProxy);
  4635. switch (op) {
  4636. case glslang::EOpNegative:
  4637. if (isFloat) {
  4638. unaryOp = spv::OpFNegate;
  4639. if (builder.isMatrixType(typeId))
  4640. return createUnaryMatrixOperation(unaryOp, decorations, typeId, operand, typeProxy);
  4641. } else
  4642. unaryOp = spv::OpSNegate;
  4643. break;
  4644. case glslang::EOpLogicalNot:
  4645. case glslang::EOpVectorLogicalNot:
  4646. unaryOp = spv::OpLogicalNot;
  4647. break;
  4648. case glslang::EOpBitwiseNot:
  4649. unaryOp = spv::OpNot;
  4650. break;
  4651. case glslang::EOpDeterminant:
  4652. libCall = spv::GLSLstd450Determinant;
  4653. break;
  4654. case glslang::EOpMatrixInverse:
  4655. libCall = spv::GLSLstd450MatrixInverse;
  4656. break;
  4657. case glslang::EOpTranspose:
  4658. unaryOp = spv::OpTranspose;
  4659. break;
  4660. case glslang::EOpRadians:
  4661. libCall = spv::GLSLstd450Radians;
  4662. break;
  4663. case glslang::EOpDegrees:
  4664. libCall = spv::GLSLstd450Degrees;
  4665. break;
  4666. case glslang::EOpSin:
  4667. libCall = spv::GLSLstd450Sin;
  4668. break;
  4669. case glslang::EOpCos:
  4670. libCall = spv::GLSLstd450Cos;
  4671. break;
  4672. case glslang::EOpTan:
  4673. libCall = spv::GLSLstd450Tan;
  4674. break;
  4675. case glslang::EOpAcos:
  4676. libCall = spv::GLSLstd450Acos;
  4677. break;
  4678. case glslang::EOpAsin:
  4679. libCall = spv::GLSLstd450Asin;
  4680. break;
  4681. case glslang::EOpAtan:
  4682. libCall = spv::GLSLstd450Atan;
  4683. break;
  4684. case glslang::EOpAcosh:
  4685. libCall = spv::GLSLstd450Acosh;
  4686. break;
  4687. case glslang::EOpAsinh:
  4688. libCall = spv::GLSLstd450Asinh;
  4689. break;
  4690. case glslang::EOpAtanh:
  4691. libCall = spv::GLSLstd450Atanh;
  4692. break;
  4693. case glslang::EOpTanh:
  4694. libCall = spv::GLSLstd450Tanh;
  4695. break;
  4696. case glslang::EOpCosh:
  4697. libCall = spv::GLSLstd450Cosh;
  4698. break;
  4699. case glslang::EOpSinh:
  4700. libCall = spv::GLSLstd450Sinh;
  4701. break;
  4702. case glslang::EOpLength:
  4703. libCall = spv::GLSLstd450Length;
  4704. break;
  4705. case glslang::EOpNormalize:
  4706. libCall = spv::GLSLstd450Normalize;
  4707. break;
  4708. case glslang::EOpExp:
  4709. libCall = spv::GLSLstd450Exp;
  4710. break;
  4711. case glslang::EOpLog:
  4712. libCall = spv::GLSLstd450Log;
  4713. break;
  4714. case glslang::EOpExp2:
  4715. libCall = spv::GLSLstd450Exp2;
  4716. break;
  4717. case glslang::EOpLog2:
  4718. libCall = spv::GLSLstd450Log2;
  4719. break;
  4720. case glslang::EOpSqrt:
  4721. libCall = spv::GLSLstd450Sqrt;
  4722. break;
  4723. case glslang::EOpInverseSqrt:
  4724. libCall = spv::GLSLstd450InverseSqrt;
  4725. break;
  4726. case glslang::EOpFloor:
  4727. libCall = spv::GLSLstd450Floor;
  4728. break;
  4729. case glslang::EOpTrunc:
  4730. libCall = spv::GLSLstd450Trunc;
  4731. break;
  4732. case glslang::EOpRound:
  4733. libCall = spv::GLSLstd450Round;
  4734. break;
  4735. case glslang::EOpRoundEven:
  4736. libCall = spv::GLSLstd450RoundEven;
  4737. break;
  4738. case glslang::EOpCeil:
  4739. libCall = spv::GLSLstd450Ceil;
  4740. break;
  4741. case glslang::EOpFract:
  4742. libCall = spv::GLSLstd450Fract;
  4743. break;
  4744. case glslang::EOpIsNan:
  4745. unaryOp = spv::OpIsNan;
  4746. break;
  4747. case glslang::EOpIsInf:
  4748. unaryOp = spv::OpIsInf;
  4749. break;
  4750. case glslang::EOpIsFinite:
  4751. unaryOp = spv::OpIsFinite;
  4752. break;
  4753. case glslang::EOpFloatBitsToInt:
  4754. case glslang::EOpFloatBitsToUint:
  4755. case glslang::EOpIntBitsToFloat:
  4756. case glslang::EOpUintBitsToFloat:
  4757. case glslang::EOpDoubleBitsToInt64:
  4758. case glslang::EOpDoubleBitsToUint64:
  4759. case glslang::EOpInt64BitsToDouble:
  4760. case glslang::EOpUint64BitsToDouble:
  4761. case glslang::EOpFloat16BitsToInt16:
  4762. case glslang::EOpFloat16BitsToUint16:
  4763. case glslang::EOpInt16BitsToFloat16:
  4764. case glslang::EOpUint16BitsToFloat16:
  4765. unaryOp = spv::OpBitcast;
  4766. break;
  4767. case glslang::EOpPackSnorm2x16:
  4768. libCall = spv::GLSLstd450PackSnorm2x16;
  4769. break;
  4770. case glslang::EOpUnpackSnorm2x16:
  4771. libCall = spv::GLSLstd450UnpackSnorm2x16;
  4772. break;
  4773. case glslang::EOpPackUnorm2x16:
  4774. libCall = spv::GLSLstd450PackUnorm2x16;
  4775. break;
  4776. case glslang::EOpUnpackUnorm2x16:
  4777. libCall = spv::GLSLstd450UnpackUnorm2x16;
  4778. break;
  4779. case glslang::EOpPackHalf2x16:
  4780. libCall = spv::GLSLstd450PackHalf2x16;
  4781. break;
  4782. case glslang::EOpUnpackHalf2x16:
  4783. libCall = spv::GLSLstd450UnpackHalf2x16;
  4784. break;
  4785. case glslang::EOpPackSnorm4x8:
  4786. libCall = spv::GLSLstd450PackSnorm4x8;
  4787. break;
  4788. case glslang::EOpUnpackSnorm4x8:
  4789. libCall = spv::GLSLstd450UnpackSnorm4x8;
  4790. break;
  4791. case glslang::EOpPackUnorm4x8:
  4792. libCall = spv::GLSLstd450PackUnorm4x8;
  4793. break;
  4794. case glslang::EOpUnpackUnorm4x8:
  4795. libCall = spv::GLSLstd450UnpackUnorm4x8;
  4796. break;
  4797. case glslang::EOpPackDouble2x32:
  4798. libCall = spv::GLSLstd450PackDouble2x32;
  4799. break;
  4800. case glslang::EOpUnpackDouble2x32:
  4801. libCall = spv::GLSLstd450UnpackDouble2x32;
  4802. break;
  4803. case glslang::EOpPackInt2x32:
  4804. case glslang::EOpUnpackInt2x32:
  4805. case glslang::EOpPackUint2x32:
  4806. case glslang::EOpUnpackUint2x32:
  4807. case glslang::EOpPack16:
  4808. case glslang::EOpPack32:
  4809. case glslang::EOpPack64:
  4810. case glslang::EOpUnpack32:
  4811. case glslang::EOpUnpack16:
  4812. case glslang::EOpUnpack8:
  4813. case glslang::EOpPackInt2x16:
  4814. case glslang::EOpUnpackInt2x16:
  4815. case glslang::EOpPackUint2x16:
  4816. case glslang::EOpUnpackUint2x16:
  4817. case glslang::EOpPackInt4x16:
  4818. case glslang::EOpUnpackInt4x16:
  4819. case glslang::EOpPackUint4x16:
  4820. case glslang::EOpUnpackUint4x16:
  4821. case glslang::EOpPackFloat2x16:
  4822. case glslang::EOpUnpackFloat2x16:
  4823. unaryOp = spv::OpBitcast;
  4824. break;
  4825. case glslang::EOpDPdx:
  4826. unaryOp = spv::OpDPdx;
  4827. break;
  4828. case glslang::EOpDPdy:
  4829. unaryOp = spv::OpDPdy;
  4830. break;
  4831. case glslang::EOpFwidth:
  4832. unaryOp = spv::OpFwidth;
  4833. break;
  4834. case glslang::EOpDPdxFine:
  4835. unaryOp = spv::OpDPdxFine;
  4836. break;
  4837. case glslang::EOpDPdyFine:
  4838. unaryOp = spv::OpDPdyFine;
  4839. break;
  4840. case glslang::EOpFwidthFine:
  4841. unaryOp = spv::OpFwidthFine;
  4842. break;
  4843. case glslang::EOpDPdxCoarse:
  4844. unaryOp = spv::OpDPdxCoarse;
  4845. break;
  4846. case glslang::EOpDPdyCoarse:
  4847. unaryOp = spv::OpDPdyCoarse;
  4848. break;
  4849. case glslang::EOpFwidthCoarse:
  4850. unaryOp = spv::OpFwidthCoarse;
  4851. break;
  4852. case glslang::EOpInterpolateAtCentroid:
  4853. #ifdef AMD_EXTENSIONS
  4854. if (typeProxy == glslang::EbtFloat16)
  4855. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  4856. #endif
  4857. libCall = spv::GLSLstd450InterpolateAtCentroid;
  4858. break;
  4859. case glslang::EOpAny:
  4860. unaryOp = spv::OpAny;
  4861. break;
  4862. case glslang::EOpAll:
  4863. unaryOp = spv::OpAll;
  4864. break;
  4865. case glslang::EOpAbs:
  4866. if (isFloat)
  4867. libCall = spv::GLSLstd450FAbs;
  4868. else
  4869. libCall = spv::GLSLstd450SAbs;
  4870. break;
  4871. case glslang::EOpSign:
  4872. if (isFloat)
  4873. libCall = spv::GLSLstd450FSign;
  4874. else
  4875. libCall = spv::GLSLstd450SSign;
  4876. break;
  4877. case glslang::EOpAtomicCounterIncrement:
  4878. case glslang::EOpAtomicCounterDecrement:
  4879. case glslang::EOpAtomicCounter:
  4880. {
  4881. // Handle all of the atomics in one place, in createAtomicOperation()
  4882. std::vector<spv::Id> operands;
  4883. operands.push_back(operand);
  4884. return createAtomicOperation(op, decorations.precision, typeId, operands, typeProxy);
  4885. }
  4886. case glslang::EOpBitFieldReverse:
  4887. unaryOp = spv::OpBitReverse;
  4888. break;
  4889. case glslang::EOpBitCount:
  4890. unaryOp = spv::OpBitCount;
  4891. break;
  4892. case glslang::EOpFindLSB:
  4893. libCall = spv::GLSLstd450FindILsb;
  4894. break;
  4895. case glslang::EOpFindMSB:
  4896. if (isUnsigned)
  4897. libCall = spv::GLSLstd450FindUMsb;
  4898. else
  4899. libCall = spv::GLSLstd450FindSMsb;
  4900. break;
  4901. case glslang::EOpBallot:
  4902. case glslang::EOpReadFirstInvocation:
  4903. case glslang::EOpAnyInvocation:
  4904. case glslang::EOpAllInvocations:
  4905. case glslang::EOpAllInvocationsEqual:
  4906. #ifdef AMD_EXTENSIONS
  4907. case glslang::EOpMinInvocations:
  4908. case glslang::EOpMaxInvocations:
  4909. case glslang::EOpAddInvocations:
  4910. case glslang::EOpMinInvocationsNonUniform:
  4911. case glslang::EOpMaxInvocationsNonUniform:
  4912. case glslang::EOpAddInvocationsNonUniform:
  4913. case glslang::EOpMinInvocationsInclusiveScan:
  4914. case glslang::EOpMaxInvocationsInclusiveScan:
  4915. case glslang::EOpAddInvocationsInclusiveScan:
  4916. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  4917. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  4918. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  4919. case glslang::EOpMinInvocationsExclusiveScan:
  4920. case glslang::EOpMaxInvocationsExclusiveScan:
  4921. case glslang::EOpAddInvocationsExclusiveScan:
  4922. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  4923. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  4924. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  4925. #endif
  4926. {
  4927. std::vector<spv::Id> operands;
  4928. operands.push_back(operand);
  4929. return createInvocationsOperation(op, typeId, operands, typeProxy);
  4930. }
  4931. case glslang::EOpSubgroupAll:
  4932. case glslang::EOpSubgroupAny:
  4933. case glslang::EOpSubgroupAllEqual:
  4934. case glslang::EOpSubgroupBroadcastFirst:
  4935. case glslang::EOpSubgroupBallot:
  4936. case glslang::EOpSubgroupInverseBallot:
  4937. case glslang::EOpSubgroupBallotBitCount:
  4938. case glslang::EOpSubgroupBallotInclusiveBitCount:
  4939. case glslang::EOpSubgroupBallotExclusiveBitCount:
  4940. case glslang::EOpSubgroupBallotFindLSB:
  4941. case glslang::EOpSubgroupBallotFindMSB:
  4942. case glslang::EOpSubgroupAdd:
  4943. case glslang::EOpSubgroupMul:
  4944. case glslang::EOpSubgroupMin:
  4945. case glslang::EOpSubgroupMax:
  4946. case glslang::EOpSubgroupAnd:
  4947. case glslang::EOpSubgroupOr:
  4948. case glslang::EOpSubgroupXor:
  4949. case glslang::EOpSubgroupInclusiveAdd:
  4950. case glslang::EOpSubgroupInclusiveMul:
  4951. case glslang::EOpSubgroupInclusiveMin:
  4952. case glslang::EOpSubgroupInclusiveMax:
  4953. case glslang::EOpSubgroupInclusiveAnd:
  4954. case glslang::EOpSubgroupInclusiveOr:
  4955. case glslang::EOpSubgroupInclusiveXor:
  4956. case glslang::EOpSubgroupExclusiveAdd:
  4957. case glslang::EOpSubgroupExclusiveMul:
  4958. case glslang::EOpSubgroupExclusiveMin:
  4959. case glslang::EOpSubgroupExclusiveMax:
  4960. case glslang::EOpSubgroupExclusiveAnd:
  4961. case glslang::EOpSubgroupExclusiveOr:
  4962. case glslang::EOpSubgroupExclusiveXor:
  4963. case glslang::EOpSubgroupQuadSwapHorizontal:
  4964. case glslang::EOpSubgroupQuadSwapVertical:
  4965. case glslang::EOpSubgroupQuadSwapDiagonal: {
  4966. std::vector<spv::Id> operands;
  4967. operands.push_back(operand);
  4968. return createSubgroupOperation(op, typeId, operands, typeProxy);
  4969. }
  4970. #ifdef AMD_EXTENSIONS
  4971. case glslang::EOpMbcnt:
  4972. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  4973. libCall = spv::MbcntAMD;
  4974. break;
  4975. case glslang::EOpCubeFaceIndex:
  4976. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);
  4977. libCall = spv::CubeFaceIndexAMD;
  4978. break;
  4979. case glslang::EOpCubeFaceCoord:
  4980. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);
  4981. libCall = spv::CubeFaceCoordAMD;
  4982. break;
  4983. #endif
  4984. #ifdef NV_EXTENSIONS
  4985. case glslang::EOpSubgroupPartition:
  4986. unaryOp = spv::OpGroupNonUniformPartitionNV;
  4987. break;
  4988. #endif
  4989. case glslang::EOpConstructReference:
  4990. unaryOp = spv::OpBitcast;
  4991. break;
  4992. default:
  4993. return 0;
  4994. }
  4995. spv::Id id;
  4996. if (libCall >= 0) {
  4997. std::vector<spv::Id> args;
  4998. args.push_back(operand);
  4999. id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, args);
  5000. } else {
  5001. id = builder.createUnaryOp(unaryOp, typeId, operand);
  5002. }
  5003. builder.addDecoration(id, decorations.noContraction);
  5004. builder.addDecoration(id, decorations.nonUniform);
  5005. return builder.setPrecision(id, decorations.precision);
  5006. }
  5007. // Create a unary operation on a matrix
  5008. spv::Id TGlslangToSpvTraverser::createUnaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,
  5009. spv::Id operand, glslang::TBasicType /* typeProxy */)
  5010. {
  5011. // Handle unary operations vector by vector.
  5012. // The result type is the same type as the original type.
  5013. // The algorithm is to:
  5014. // - break the matrix into vectors
  5015. // - apply the operation to each vector
  5016. // - make a matrix out the vector results
  5017. // get the types sorted out
  5018. int numCols = builder.getNumColumns(operand);
  5019. int numRows = builder.getNumRows(operand);
  5020. spv::Id srcVecType = builder.makeVectorType(builder.getScalarTypeId(builder.getTypeId(operand)), numRows);
  5021. spv::Id destVecType = builder.makeVectorType(builder.getScalarTypeId(typeId), numRows);
  5022. std::vector<spv::Id> results;
  5023. // do each vector op
  5024. for (int c = 0; c < numCols; ++c) {
  5025. std::vector<unsigned int> indexes;
  5026. indexes.push_back(c);
  5027. spv::Id srcVec = builder.createCompositeExtract(operand, srcVecType, indexes);
  5028. spv::Id destVec = builder.createUnaryOp(op, destVecType, srcVec);
  5029. builder.addDecoration(destVec, decorations.noContraction);
  5030. builder.addDecoration(destVec, decorations.nonUniform);
  5031. results.push_back(builder.setPrecision(destVec, decorations.precision));
  5032. }
  5033. // put the pieces together
  5034. spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);
  5035. builder.addDecoration(result, decorations.nonUniform);
  5036. return result;
  5037. }
  5038. // For converting integers where both the bitwidth and the signedness could
  5039. // change, but only do the width change here. The caller is still responsible
  5040. // for the signedness conversion.
  5041. spv::Id TGlslangToSpvTraverser::createIntWidthConversion(glslang::TOperator op, spv::Id operand, int vectorSize)
  5042. {
  5043. // Get the result type width, based on the type to convert to.
  5044. int width = 32;
  5045. switch(op) {
  5046. case glslang::EOpConvInt16ToUint8:
  5047. case glslang::EOpConvIntToUint8:
  5048. case glslang::EOpConvInt64ToUint8:
  5049. case glslang::EOpConvUint16ToInt8:
  5050. case glslang::EOpConvUintToInt8:
  5051. case glslang::EOpConvUint64ToInt8:
  5052. width = 8;
  5053. break;
  5054. case glslang::EOpConvInt8ToUint16:
  5055. case glslang::EOpConvIntToUint16:
  5056. case glslang::EOpConvInt64ToUint16:
  5057. case glslang::EOpConvUint8ToInt16:
  5058. case glslang::EOpConvUintToInt16:
  5059. case glslang::EOpConvUint64ToInt16:
  5060. width = 16;
  5061. break;
  5062. case glslang::EOpConvInt8ToUint:
  5063. case glslang::EOpConvInt16ToUint:
  5064. case glslang::EOpConvInt64ToUint:
  5065. case glslang::EOpConvUint8ToInt:
  5066. case glslang::EOpConvUint16ToInt:
  5067. case glslang::EOpConvUint64ToInt:
  5068. width = 32;
  5069. break;
  5070. case glslang::EOpConvInt8ToUint64:
  5071. case glslang::EOpConvInt16ToUint64:
  5072. case glslang::EOpConvIntToUint64:
  5073. case glslang::EOpConvUint8ToInt64:
  5074. case glslang::EOpConvUint16ToInt64:
  5075. case glslang::EOpConvUintToInt64:
  5076. width = 64;
  5077. break;
  5078. default:
  5079. assert(false && "Default missing");
  5080. break;
  5081. }
  5082. // Get the conversion operation and result type,
  5083. // based on the target width, but the source type.
  5084. spv::Id type = spv::NoType;
  5085. spv::Op convOp = spv::OpNop;
  5086. switch(op) {
  5087. case glslang::EOpConvInt8ToUint16:
  5088. case glslang::EOpConvInt8ToUint:
  5089. case glslang::EOpConvInt8ToUint64:
  5090. case glslang::EOpConvInt16ToUint8:
  5091. case glslang::EOpConvInt16ToUint:
  5092. case glslang::EOpConvInt16ToUint64:
  5093. case glslang::EOpConvIntToUint8:
  5094. case glslang::EOpConvIntToUint16:
  5095. case glslang::EOpConvIntToUint64:
  5096. case glslang::EOpConvInt64ToUint8:
  5097. case glslang::EOpConvInt64ToUint16:
  5098. case glslang::EOpConvInt64ToUint:
  5099. convOp = spv::OpSConvert;
  5100. type = builder.makeIntType(width);
  5101. break;
  5102. default:
  5103. convOp = spv::OpUConvert;
  5104. type = builder.makeUintType(width);
  5105. break;
  5106. }
  5107. if (vectorSize > 0)
  5108. type = builder.makeVectorType(type, vectorSize);
  5109. return builder.createUnaryOp(convOp, type, operand);
  5110. }
  5111. spv::Id TGlslangToSpvTraverser::createConversion(glslang::TOperator op, OpDecorations& decorations, spv::Id destType,
  5112. spv::Id operand, glslang::TBasicType typeProxy)
  5113. {
  5114. spv::Op convOp = spv::OpNop;
  5115. spv::Id zero = 0;
  5116. spv::Id one = 0;
  5117. int vectorSize = builder.isVectorType(destType) ? builder.getNumTypeComponents(destType) : 0;
  5118. switch (op) {
  5119. case glslang::EOpConvInt8ToBool:
  5120. case glslang::EOpConvUint8ToBool:
  5121. zero = builder.makeUint8Constant(0);
  5122. zero = makeSmearedConstant(zero, vectorSize);
  5123. return builder.createBinOp(spv::OpINotEqual, destType, operand, zero);
  5124. case glslang::EOpConvInt16ToBool:
  5125. case glslang::EOpConvUint16ToBool:
  5126. zero = builder.makeUint16Constant(0);
  5127. zero = makeSmearedConstant(zero, vectorSize);
  5128. return builder.createBinOp(spv::OpINotEqual, destType, operand, zero);
  5129. case glslang::EOpConvIntToBool:
  5130. case glslang::EOpConvUintToBool:
  5131. zero = builder.makeUintConstant(0);
  5132. zero = makeSmearedConstant(zero, vectorSize);
  5133. return builder.createBinOp(spv::OpINotEqual, destType, operand, zero);
  5134. case glslang::EOpConvInt64ToBool:
  5135. case glslang::EOpConvUint64ToBool:
  5136. zero = builder.makeUint64Constant(0);
  5137. zero = makeSmearedConstant(zero, vectorSize);
  5138. return builder.createBinOp(spv::OpINotEqual, destType, operand, zero);
  5139. case glslang::EOpConvFloatToBool:
  5140. zero = builder.makeFloatConstant(0.0F);
  5141. zero = makeSmearedConstant(zero, vectorSize);
  5142. return builder.createBinOp(spv::OpFOrdNotEqual, destType, operand, zero);
  5143. case glslang::EOpConvDoubleToBool:
  5144. zero = builder.makeDoubleConstant(0.0);
  5145. zero = makeSmearedConstant(zero, vectorSize);
  5146. return builder.createBinOp(spv::OpFOrdNotEqual, destType, operand, zero);
  5147. case glslang::EOpConvFloat16ToBool:
  5148. zero = builder.makeFloat16Constant(0.0F);
  5149. zero = makeSmearedConstant(zero, vectorSize);
  5150. return builder.createBinOp(spv::OpFOrdNotEqual, destType, operand, zero);
  5151. case glslang::EOpConvBoolToFloat:
  5152. convOp = spv::OpSelect;
  5153. zero = builder.makeFloatConstant(0.0F);
  5154. one = builder.makeFloatConstant(1.0F);
  5155. break;
  5156. case glslang::EOpConvBoolToDouble:
  5157. convOp = spv::OpSelect;
  5158. zero = builder.makeDoubleConstant(0.0);
  5159. one = builder.makeDoubleConstant(1.0);
  5160. break;
  5161. case glslang::EOpConvBoolToFloat16:
  5162. convOp = spv::OpSelect;
  5163. zero = builder.makeFloat16Constant(0.0F);
  5164. one = builder.makeFloat16Constant(1.0F);
  5165. break;
  5166. case glslang::EOpConvBoolToInt8:
  5167. zero = builder.makeInt8Constant(0);
  5168. one = builder.makeInt8Constant(1);
  5169. convOp = spv::OpSelect;
  5170. break;
  5171. case glslang::EOpConvBoolToUint8:
  5172. zero = builder.makeUint8Constant(0);
  5173. one = builder.makeUint8Constant(1);
  5174. convOp = spv::OpSelect;
  5175. break;
  5176. case glslang::EOpConvBoolToInt16:
  5177. zero = builder.makeInt16Constant(0);
  5178. one = builder.makeInt16Constant(1);
  5179. convOp = spv::OpSelect;
  5180. break;
  5181. case glslang::EOpConvBoolToUint16:
  5182. zero = builder.makeUint16Constant(0);
  5183. one = builder.makeUint16Constant(1);
  5184. convOp = spv::OpSelect;
  5185. break;
  5186. case glslang::EOpConvBoolToInt:
  5187. case glslang::EOpConvBoolToInt64:
  5188. if (op == glslang::EOpConvBoolToInt64)
  5189. zero = builder.makeInt64Constant(0);
  5190. else
  5191. zero = builder.makeIntConstant(0);
  5192. if (op == glslang::EOpConvBoolToInt64)
  5193. one = builder.makeInt64Constant(1);
  5194. else
  5195. one = builder.makeIntConstant(1);
  5196. convOp = spv::OpSelect;
  5197. break;
  5198. case glslang::EOpConvBoolToUint:
  5199. case glslang::EOpConvBoolToUint64:
  5200. if (op == glslang::EOpConvBoolToUint64)
  5201. zero = builder.makeUint64Constant(0);
  5202. else
  5203. zero = builder.makeUintConstant(0);
  5204. if (op == glslang::EOpConvBoolToUint64)
  5205. one = builder.makeUint64Constant(1);
  5206. else
  5207. one = builder.makeUintConstant(1);
  5208. convOp = spv::OpSelect;
  5209. break;
  5210. case glslang::EOpConvInt8ToFloat16:
  5211. case glslang::EOpConvInt8ToFloat:
  5212. case glslang::EOpConvInt8ToDouble:
  5213. case glslang::EOpConvInt16ToFloat16:
  5214. case glslang::EOpConvInt16ToFloat:
  5215. case glslang::EOpConvInt16ToDouble:
  5216. case glslang::EOpConvIntToFloat16:
  5217. case glslang::EOpConvIntToFloat:
  5218. case glslang::EOpConvIntToDouble:
  5219. case glslang::EOpConvInt64ToFloat:
  5220. case glslang::EOpConvInt64ToDouble:
  5221. case glslang::EOpConvInt64ToFloat16:
  5222. convOp = spv::OpConvertSToF;
  5223. break;
  5224. case glslang::EOpConvUint8ToFloat16:
  5225. case glslang::EOpConvUint8ToFloat:
  5226. case glslang::EOpConvUint8ToDouble:
  5227. case glslang::EOpConvUint16ToFloat16:
  5228. case glslang::EOpConvUint16ToFloat:
  5229. case glslang::EOpConvUint16ToDouble:
  5230. case glslang::EOpConvUintToFloat16:
  5231. case glslang::EOpConvUintToFloat:
  5232. case glslang::EOpConvUintToDouble:
  5233. case glslang::EOpConvUint64ToFloat:
  5234. case glslang::EOpConvUint64ToDouble:
  5235. case glslang::EOpConvUint64ToFloat16:
  5236. convOp = spv::OpConvertUToF;
  5237. break;
  5238. case glslang::EOpConvDoubleToFloat:
  5239. case glslang::EOpConvFloatToDouble:
  5240. case glslang::EOpConvDoubleToFloat16:
  5241. case glslang::EOpConvFloat16ToDouble:
  5242. case glslang::EOpConvFloatToFloat16:
  5243. case glslang::EOpConvFloat16ToFloat:
  5244. convOp = spv::OpFConvert;
  5245. if (builder.isMatrixType(destType))
  5246. return createUnaryMatrixOperation(convOp, decorations, destType, operand, typeProxy);
  5247. break;
  5248. case glslang::EOpConvFloat16ToInt8:
  5249. case glslang::EOpConvFloatToInt8:
  5250. case glslang::EOpConvDoubleToInt8:
  5251. case glslang::EOpConvFloat16ToInt16:
  5252. case glslang::EOpConvFloatToInt16:
  5253. case glslang::EOpConvDoubleToInt16:
  5254. case glslang::EOpConvFloat16ToInt:
  5255. case glslang::EOpConvFloatToInt:
  5256. case glslang::EOpConvDoubleToInt:
  5257. case glslang::EOpConvFloat16ToInt64:
  5258. case glslang::EOpConvFloatToInt64:
  5259. case glslang::EOpConvDoubleToInt64:
  5260. convOp = spv::OpConvertFToS;
  5261. break;
  5262. case glslang::EOpConvUint8ToInt8:
  5263. case glslang::EOpConvInt8ToUint8:
  5264. case glslang::EOpConvUint16ToInt16:
  5265. case glslang::EOpConvInt16ToUint16:
  5266. case glslang::EOpConvUintToInt:
  5267. case glslang::EOpConvIntToUint:
  5268. case glslang::EOpConvUint64ToInt64:
  5269. case glslang::EOpConvInt64ToUint64:
  5270. if (builder.isInSpecConstCodeGenMode()) {
  5271. // Build zero scalar or vector for OpIAdd.
  5272. if(op == glslang::EOpConvUint8ToInt8 || op == glslang::EOpConvInt8ToUint8) {
  5273. zero = builder.makeUint8Constant(0);
  5274. } else if (op == glslang::EOpConvUint16ToInt16 || op == glslang::EOpConvInt16ToUint16) {
  5275. zero = builder.makeUint16Constant(0);
  5276. } else if (op == glslang::EOpConvUint64ToInt64 || op == glslang::EOpConvInt64ToUint64) {
  5277. zero = builder.makeUint64Constant(0);
  5278. } else {
  5279. zero = builder.makeUintConstant(0);
  5280. }
  5281. zero = makeSmearedConstant(zero, vectorSize);
  5282. // Use OpIAdd, instead of OpBitcast to do the conversion when
  5283. // generating for OpSpecConstantOp instruction.
  5284. return builder.createBinOp(spv::OpIAdd, destType, operand, zero);
  5285. }
  5286. // For normal run-time conversion instruction, use OpBitcast.
  5287. convOp = spv::OpBitcast;
  5288. break;
  5289. case glslang::EOpConvFloat16ToUint8:
  5290. case glslang::EOpConvFloatToUint8:
  5291. case glslang::EOpConvDoubleToUint8:
  5292. case glslang::EOpConvFloat16ToUint16:
  5293. case glslang::EOpConvFloatToUint16:
  5294. case glslang::EOpConvDoubleToUint16:
  5295. case glslang::EOpConvFloat16ToUint:
  5296. case glslang::EOpConvFloatToUint:
  5297. case glslang::EOpConvDoubleToUint:
  5298. case glslang::EOpConvFloatToUint64:
  5299. case glslang::EOpConvDoubleToUint64:
  5300. case glslang::EOpConvFloat16ToUint64:
  5301. convOp = spv::OpConvertFToU;
  5302. break;
  5303. case glslang::EOpConvInt8ToInt16:
  5304. case glslang::EOpConvInt8ToInt:
  5305. case glslang::EOpConvInt8ToInt64:
  5306. case glslang::EOpConvInt16ToInt8:
  5307. case glslang::EOpConvInt16ToInt:
  5308. case glslang::EOpConvInt16ToInt64:
  5309. case glslang::EOpConvIntToInt8:
  5310. case glslang::EOpConvIntToInt16:
  5311. case glslang::EOpConvIntToInt64:
  5312. case glslang::EOpConvInt64ToInt8:
  5313. case glslang::EOpConvInt64ToInt16:
  5314. case glslang::EOpConvInt64ToInt:
  5315. convOp = spv::OpSConvert;
  5316. break;
  5317. case glslang::EOpConvUint8ToUint16:
  5318. case glslang::EOpConvUint8ToUint:
  5319. case glslang::EOpConvUint8ToUint64:
  5320. case glslang::EOpConvUint16ToUint8:
  5321. case glslang::EOpConvUint16ToUint:
  5322. case glslang::EOpConvUint16ToUint64:
  5323. case glslang::EOpConvUintToUint8:
  5324. case glslang::EOpConvUintToUint16:
  5325. case glslang::EOpConvUintToUint64:
  5326. case glslang::EOpConvUint64ToUint8:
  5327. case glslang::EOpConvUint64ToUint16:
  5328. case glslang::EOpConvUint64ToUint:
  5329. convOp = spv::OpUConvert;
  5330. break;
  5331. case glslang::EOpConvInt8ToUint16:
  5332. case glslang::EOpConvInt8ToUint:
  5333. case glslang::EOpConvInt8ToUint64:
  5334. case glslang::EOpConvInt16ToUint8:
  5335. case glslang::EOpConvInt16ToUint:
  5336. case glslang::EOpConvInt16ToUint64:
  5337. case glslang::EOpConvIntToUint8:
  5338. case glslang::EOpConvIntToUint16:
  5339. case glslang::EOpConvIntToUint64:
  5340. case glslang::EOpConvInt64ToUint8:
  5341. case glslang::EOpConvInt64ToUint16:
  5342. case glslang::EOpConvInt64ToUint:
  5343. case glslang::EOpConvUint8ToInt16:
  5344. case glslang::EOpConvUint8ToInt:
  5345. case glslang::EOpConvUint8ToInt64:
  5346. case glslang::EOpConvUint16ToInt8:
  5347. case glslang::EOpConvUint16ToInt:
  5348. case glslang::EOpConvUint16ToInt64:
  5349. case glslang::EOpConvUintToInt8:
  5350. case glslang::EOpConvUintToInt16:
  5351. case glslang::EOpConvUintToInt64:
  5352. case glslang::EOpConvUint64ToInt8:
  5353. case glslang::EOpConvUint64ToInt16:
  5354. case glslang::EOpConvUint64ToInt:
  5355. // OpSConvert/OpUConvert + OpBitCast
  5356. operand = createIntWidthConversion(op, operand, vectorSize);
  5357. if (builder.isInSpecConstCodeGenMode()) {
  5358. // Build zero scalar or vector for OpIAdd.
  5359. switch(op) {
  5360. case glslang::EOpConvInt16ToUint8:
  5361. case glslang::EOpConvIntToUint8:
  5362. case glslang::EOpConvInt64ToUint8:
  5363. case glslang::EOpConvUint16ToInt8:
  5364. case glslang::EOpConvUintToInt8:
  5365. case glslang::EOpConvUint64ToInt8:
  5366. zero = builder.makeUint8Constant(0);
  5367. break;
  5368. case glslang::EOpConvInt8ToUint16:
  5369. case glslang::EOpConvIntToUint16:
  5370. case glslang::EOpConvInt64ToUint16:
  5371. case glslang::EOpConvUint8ToInt16:
  5372. case glslang::EOpConvUintToInt16:
  5373. case glslang::EOpConvUint64ToInt16:
  5374. zero = builder.makeUint16Constant(0);
  5375. break;
  5376. case glslang::EOpConvInt8ToUint:
  5377. case glslang::EOpConvInt16ToUint:
  5378. case glslang::EOpConvInt64ToUint:
  5379. case glslang::EOpConvUint8ToInt:
  5380. case glslang::EOpConvUint16ToInt:
  5381. case glslang::EOpConvUint64ToInt:
  5382. zero = builder.makeUintConstant(0);
  5383. break;
  5384. case glslang::EOpConvInt8ToUint64:
  5385. case glslang::EOpConvInt16ToUint64:
  5386. case glslang::EOpConvIntToUint64:
  5387. case glslang::EOpConvUint8ToInt64:
  5388. case glslang::EOpConvUint16ToInt64:
  5389. case glslang::EOpConvUintToInt64:
  5390. zero = builder.makeUint64Constant(0);
  5391. break;
  5392. default:
  5393. assert(false && "Default missing");
  5394. break;
  5395. }
  5396. zero = makeSmearedConstant(zero, vectorSize);
  5397. // Use OpIAdd, instead of OpBitcast to do the conversion when
  5398. // generating for OpSpecConstantOp instruction.
  5399. return builder.createBinOp(spv::OpIAdd, destType, operand, zero);
  5400. }
  5401. // For normal run-time conversion instruction, use OpBitcast.
  5402. convOp = spv::OpBitcast;
  5403. break;
  5404. case glslang::EOpConvUint64ToPtr:
  5405. convOp = spv::OpConvertUToPtr;
  5406. break;
  5407. case glslang::EOpConvPtrToUint64:
  5408. convOp = spv::OpConvertPtrToU;
  5409. break;
  5410. default:
  5411. break;
  5412. }
  5413. spv::Id result = 0;
  5414. if (convOp == spv::OpNop)
  5415. return result;
  5416. if (convOp == spv::OpSelect) {
  5417. zero = makeSmearedConstant(zero, vectorSize);
  5418. one = makeSmearedConstant(one, vectorSize);
  5419. result = builder.createTriOp(convOp, destType, operand, one, zero);
  5420. } else
  5421. result = builder.createUnaryOp(convOp, destType, operand);
  5422. result = builder.setPrecision(result, decorations.precision);
  5423. builder.addDecoration(result, decorations.nonUniform);
  5424. return result;
  5425. }
  5426. spv::Id TGlslangToSpvTraverser::makeSmearedConstant(spv::Id constant, int vectorSize)
  5427. {
  5428. if (vectorSize == 0)
  5429. return constant;
  5430. spv::Id vectorTypeId = builder.makeVectorType(builder.getTypeId(constant), vectorSize);
  5431. std::vector<spv::Id> components;
  5432. for (int c = 0; c < vectorSize; ++c)
  5433. components.push_back(constant);
  5434. return builder.makeCompositeConstant(vectorTypeId, components);
  5435. }
  5436. // For glslang ops that map to SPV atomic opCodes
  5437. spv::Id TGlslangToSpvTraverser::createAtomicOperation(glslang::TOperator op, spv::Decoration /*precision*/, spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  5438. {
  5439. spv::Op opCode = spv::OpNop;
  5440. switch (op) {
  5441. case glslang::EOpAtomicAdd:
  5442. case glslang::EOpImageAtomicAdd:
  5443. case glslang::EOpAtomicCounterAdd:
  5444. opCode = spv::OpAtomicIAdd;
  5445. break;
  5446. case glslang::EOpAtomicCounterSubtract:
  5447. opCode = spv::OpAtomicISub;
  5448. break;
  5449. case glslang::EOpAtomicMin:
  5450. case glslang::EOpImageAtomicMin:
  5451. case glslang::EOpAtomicCounterMin:
  5452. opCode = (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) ? spv::OpAtomicUMin : spv::OpAtomicSMin;
  5453. break;
  5454. case glslang::EOpAtomicMax:
  5455. case glslang::EOpImageAtomicMax:
  5456. case glslang::EOpAtomicCounterMax:
  5457. opCode = (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) ? spv::OpAtomicUMax : spv::OpAtomicSMax;
  5458. break;
  5459. case glslang::EOpAtomicAnd:
  5460. case glslang::EOpImageAtomicAnd:
  5461. case glslang::EOpAtomicCounterAnd:
  5462. opCode = spv::OpAtomicAnd;
  5463. break;
  5464. case glslang::EOpAtomicOr:
  5465. case glslang::EOpImageAtomicOr:
  5466. case glslang::EOpAtomicCounterOr:
  5467. opCode = spv::OpAtomicOr;
  5468. break;
  5469. case glslang::EOpAtomicXor:
  5470. case glslang::EOpImageAtomicXor:
  5471. case glslang::EOpAtomicCounterXor:
  5472. opCode = spv::OpAtomicXor;
  5473. break;
  5474. case glslang::EOpAtomicExchange:
  5475. case glslang::EOpImageAtomicExchange:
  5476. case glslang::EOpAtomicCounterExchange:
  5477. opCode = spv::OpAtomicExchange;
  5478. break;
  5479. case glslang::EOpAtomicCompSwap:
  5480. case glslang::EOpImageAtomicCompSwap:
  5481. case glslang::EOpAtomicCounterCompSwap:
  5482. opCode = spv::OpAtomicCompareExchange;
  5483. break;
  5484. case glslang::EOpAtomicCounterIncrement:
  5485. opCode = spv::OpAtomicIIncrement;
  5486. break;
  5487. case glslang::EOpAtomicCounterDecrement:
  5488. opCode = spv::OpAtomicIDecrement;
  5489. break;
  5490. case glslang::EOpAtomicCounter:
  5491. case glslang::EOpImageAtomicLoad:
  5492. case glslang::EOpAtomicLoad:
  5493. opCode = spv::OpAtomicLoad;
  5494. break;
  5495. case glslang::EOpAtomicStore:
  5496. case glslang::EOpImageAtomicStore:
  5497. opCode = spv::OpAtomicStore;
  5498. break;
  5499. default:
  5500. assert(0);
  5501. break;
  5502. }
  5503. if (typeProxy == glslang::EbtInt64 || typeProxy == glslang::EbtUint64)
  5504. builder.addCapability(spv::CapabilityInt64Atomics);
  5505. // Sort out the operands
  5506. // - mapping from glslang -> SPV
  5507. // - there are extra SPV operands that are optional in glslang
  5508. // - compare-exchange swaps the value and comparator
  5509. // - compare-exchange has an extra memory semantics
  5510. // - EOpAtomicCounterDecrement needs a post decrement
  5511. spv::Id pointerId = 0, compareId = 0, valueId = 0;
  5512. // scope defaults to Device in the old model, QueueFamilyKHR in the new model
  5513. spv::Id scopeId;
  5514. if (glslangIntermediate->usingVulkanMemoryModel()) {
  5515. scopeId = builder.makeUintConstant(spv::ScopeQueueFamilyKHR);
  5516. } else {
  5517. scopeId = builder.makeUintConstant(spv::ScopeDevice);
  5518. }
  5519. // semantics default to relaxed
  5520. spv::Id semanticsId = builder.makeUintConstant(spv::MemorySemanticsMaskNone);
  5521. spv::Id semanticsId2 = semanticsId;
  5522. pointerId = operands[0];
  5523. if (opCode == spv::OpAtomicIIncrement || opCode == spv::OpAtomicIDecrement) {
  5524. // no additional operands
  5525. } else if (opCode == spv::OpAtomicCompareExchange) {
  5526. compareId = operands[1];
  5527. valueId = operands[2];
  5528. if (operands.size() > 3) {
  5529. scopeId = operands[3];
  5530. semanticsId = builder.makeUintConstant(builder.getConstantScalar(operands[4]) | builder.getConstantScalar(operands[5]));
  5531. semanticsId2 = builder.makeUintConstant(builder.getConstantScalar(operands[6]) | builder.getConstantScalar(operands[7]));
  5532. }
  5533. } else if (opCode == spv::OpAtomicLoad) {
  5534. if (operands.size() > 1) {
  5535. scopeId = operands[1];
  5536. semanticsId = builder.makeUintConstant(builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));
  5537. }
  5538. } else {
  5539. // atomic store or RMW
  5540. valueId = operands[1];
  5541. if (operands.size() > 2) {
  5542. scopeId = operands[2];
  5543. semanticsId = builder.makeUintConstant(builder.getConstantScalar(operands[3]) | builder.getConstantScalar(operands[4]));
  5544. }
  5545. }
  5546. // Check for capabilities
  5547. unsigned semanticsImmediate = builder.getConstantScalar(semanticsId) | builder.getConstantScalar(semanticsId2);
  5548. if (semanticsImmediate & (spv::MemorySemanticsMakeAvailableKHRMask | spv::MemorySemanticsMakeVisibleKHRMask | spv::MemorySemanticsOutputMemoryKHRMask)) {
  5549. builder.addCapability(spv::CapabilityVulkanMemoryModelKHR);
  5550. }
  5551. if (glslangIntermediate->usingVulkanMemoryModel() && builder.getConstantScalar(scopeId) == spv::ScopeDevice) {
  5552. builder.addCapability(spv::CapabilityVulkanMemoryModelDeviceScopeKHR);
  5553. }
  5554. std::vector<spv::Id> spvAtomicOperands; // hold the spv operands
  5555. spvAtomicOperands.push_back(pointerId);
  5556. spvAtomicOperands.push_back(scopeId);
  5557. spvAtomicOperands.push_back(semanticsId);
  5558. if (opCode == spv::OpAtomicCompareExchange) {
  5559. spvAtomicOperands.push_back(semanticsId2);
  5560. spvAtomicOperands.push_back(valueId);
  5561. spvAtomicOperands.push_back(compareId);
  5562. } else if (opCode != spv::OpAtomicLoad && opCode != spv::OpAtomicIIncrement && opCode != spv::OpAtomicIDecrement) {
  5563. spvAtomicOperands.push_back(valueId);
  5564. }
  5565. if (opCode == spv::OpAtomicStore) {
  5566. builder.createNoResultOp(opCode, spvAtomicOperands);
  5567. return 0;
  5568. } else {
  5569. spv::Id resultId = builder.createOp(opCode, typeId, spvAtomicOperands);
  5570. // GLSL and HLSL atomic-counter decrement return post-decrement value,
  5571. // while SPIR-V returns pre-decrement value. Translate between these semantics.
  5572. if (op == glslang::EOpAtomicCounterDecrement)
  5573. resultId = builder.createBinOp(spv::OpISub, typeId, resultId, builder.makeIntConstant(1));
  5574. return resultId;
  5575. }
  5576. }
  5577. // Create group invocation operations.
  5578. spv::Id TGlslangToSpvTraverser::createInvocationsOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  5579. {
  5580. #ifdef AMD_EXTENSIONS
  5581. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  5582. bool isFloat = isTypeFloat(typeProxy);
  5583. #endif
  5584. spv::Op opCode = spv::OpNop;
  5585. std::vector<spv::IdImmediate> spvGroupOperands;
  5586. spv::GroupOperation groupOperation = spv::GroupOperationMax;
  5587. if (op == glslang::EOpBallot || op == glslang::EOpReadFirstInvocation ||
  5588. op == glslang::EOpReadInvocation) {
  5589. builder.addExtension(spv::E_SPV_KHR_shader_ballot);
  5590. builder.addCapability(spv::CapabilitySubgroupBallotKHR);
  5591. } else if (op == glslang::EOpAnyInvocation ||
  5592. op == glslang::EOpAllInvocations ||
  5593. op == glslang::EOpAllInvocationsEqual) {
  5594. builder.addExtension(spv::E_SPV_KHR_subgroup_vote);
  5595. builder.addCapability(spv::CapabilitySubgroupVoteKHR);
  5596. } else {
  5597. builder.addCapability(spv::CapabilityGroups);
  5598. #ifdef AMD_EXTENSIONS
  5599. if (op == glslang::EOpMinInvocationsNonUniform ||
  5600. op == glslang::EOpMaxInvocationsNonUniform ||
  5601. op == glslang::EOpAddInvocationsNonUniform ||
  5602. op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||
  5603. op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||
  5604. op == glslang::EOpAddInvocationsInclusiveScanNonUniform ||
  5605. op == glslang::EOpMinInvocationsExclusiveScanNonUniform ||
  5606. op == glslang::EOpMaxInvocationsExclusiveScanNonUniform ||
  5607. op == glslang::EOpAddInvocationsExclusiveScanNonUniform)
  5608. builder.addExtension(spv::E_SPV_AMD_shader_ballot);
  5609. #endif
  5610. #ifdef AMD_EXTENSIONS
  5611. switch (op) {
  5612. case glslang::EOpMinInvocations:
  5613. case glslang::EOpMaxInvocations:
  5614. case glslang::EOpAddInvocations:
  5615. case glslang::EOpMinInvocationsNonUniform:
  5616. case glslang::EOpMaxInvocationsNonUniform:
  5617. case glslang::EOpAddInvocationsNonUniform:
  5618. groupOperation = spv::GroupOperationReduce;
  5619. break;
  5620. case glslang::EOpMinInvocationsInclusiveScan:
  5621. case glslang::EOpMaxInvocationsInclusiveScan:
  5622. case glslang::EOpAddInvocationsInclusiveScan:
  5623. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  5624. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  5625. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  5626. groupOperation = spv::GroupOperationInclusiveScan;
  5627. break;
  5628. case glslang::EOpMinInvocationsExclusiveScan:
  5629. case glslang::EOpMaxInvocationsExclusiveScan:
  5630. case glslang::EOpAddInvocationsExclusiveScan:
  5631. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  5632. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  5633. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  5634. groupOperation = spv::GroupOperationExclusiveScan;
  5635. break;
  5636. default:
  5637. break;
  5638. }
  5639. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::ScopeSubgroup) };
  5640. spvGroupOperands.push_back(scope);
  5641. if (groupOperation != spv::GroupOperationMax) {
  5642. spv::IdImmediate groupOp = { false, (unsigned)groupOperation };
  5643. spvGroupOperands.push_back(groupOp);
  5644. }
  5645. #endif
  5646. }
  5647. for (auto opIt = operands.begin(); opIt != operands.end(); ++opIt) {
  5648. spv::IdImmediate op = { true, *opIt };
  5649. spvGroupOperands.push_back(op);
  5650. }
  5651. switch (op) {
  5652. case glslang::EOpAnyInvocation:
  5653. opCode = spv::OpSubgroupAnyKHR;
  5654. break;
  5655. case glslang::EOpAllInvocations:
  5656. opCode = spv::OpSubgroupAllKHR;
  5657. break;
  5658. case glslang::EOpAllInvocationsEqual:
  5659. opCode = spv::OpSubgroupAllEqualKHR;
  5660. break;
  5661. case glslang::EOpReadInvocation:
  5662. opCode = spv::OpSubgroupReadInvocationKHR;
  5663. if (builder.isVectorType(typeId))
  5664. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  5665. break;
  5666. case glslang::EOpReadFirstInvocation:
  5667. opCode = spv::OpSubgroupFirstInvocationKHR;
  5668. break;
  5669. case glslang::EOpBallot:
  5670. {
  5671. // NOTE: According to the spec, the result type of "OpSubgroupBallotKHR" must be a 4 component vector of 32
  5672. // bit integer types. The GLSL built-in function "ballotARB()" assumes the maximum number of invocations in
  5673. // a subgroup is 64. Thus, we have to convert uvec4.xy to uint64_t as follow:
  5674. //
  5675. // result = Bitcast(SubgroupBallotKHR(Predicate).xy)
  5676. //
  5677. spv::Id uintType = builder.makeUintType(32);
  5678. spv::Id uvec4Type = builder.makeVectorType(uintType, 4);
  5679. spv::Id result = builder.createOp(spv::OpSubgroupBallotKHR, uvec4Type, spvGroupOperands);
  5680. std::vector<spv::Id> components;
  5681. components.push_back(builder.createCompositeExtract(result, uintType, 0));
  5682. components.push_back(builder.createCompositeExtract(result, uintType, 1));
  5683. spv::Id uvec2Type = builder.makeVectorType(uintType, 2);
  5684. return builder.createUnaryOp(spv::OpBitcast, typeId,
  5685. builder.createCompositeConstruct(uvec2Type, components));
  5686. }
  5687. #ifdef AMD_EXTENSIONS
  5688. case glslang::EOpMinInvocations:
  5689. case glslang::EOpMaxInvocations:
  5690. case glslang::EOpAddInvocations:
  5691. case glslang::EOpMinInvocationsInclusiveScan:
  5692. case glslang::EOpMaxInvocationsInclusiveScan:
  5693. case glslang::EOpAddInvocationsInclusiveScan:
  5694. case glslang::EOpMinInvocationsExclusiveScan:
  5695. case glslang::EOpMaxInvocationsExclusiveScan:
  5696. case glslang::EOpAddInvocationsExclusiveScan:
  5697. if (op == glslang::EOpMinInvocations ||
  5698. op == glslang::EOpMinInvocationsInclusiveScan ||
  5699. op == glslang::EOpMinInvocationsExclusiveScan) {
  5700. if (isFloat)
  5701. opCode = spv::OpGroupFMin;
  5702. else {
  5703. if (isUnsigned)
  5704. opCode = spv::OpGroupUMin;
  5705. else
  5706. opCode = spv::OpGroupSMin;
  5707. }
  5708. } else if (op == glslang::EOpMaxInvocations ||
  5709. op == glslang::EOpMaxInvocationsInclusiveScan ||
  5710. op == glslang::EOpMaxInvocationsExclusiveScan) {
  5711. if (isFloat)
  5712. opCode = spv::OpGroupFMax;
  5713. else {
  5714. if (isUnsigned)
  5715. opCode = spv::OpGroupUMax;
  5716. else
  5717. opCode = spv::OpGroupSMax;
  5718. }
  5719. } else {
  5720. if (isFloat)
  5721. opCode = spv::OpGroupFAdd;
  5722. else
  5723. opCode = spv::OpGroupIAdd;
  5724. }
  5725. if (builder.isVectorType(typeId))
  5726. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  5727. break;
  5728. case glslang::EOpMinInvocationsNonUniform:
  5729. case glslang::EOpMaxInvocationsNonUniform:
  5730. case glslang::EOpAddInvocationsNonUniform:
  5731. case glslang::EOpMinInvocationsInclusiveScanNonUniform:
  5732. case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
  5733. case glslang::EOpAddInvocationsInclusiveScanNonUniform:
  5734. case glslang::EOpMinInvocationsExclusiveScanNonUniform:
  5735. case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
  5736. case glslang::EOpAddInvocationsExclusiveScanNonUniform:
  5737. if (op == glslang::EOpMinInvocationsNonUniform ||
  5738. op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||
  5739. op == glslang::EOpMinInvocationsExclusiveScanNonUniform) {
  5740. if (isFloat)
  5741. opCode = spv::OpGroupFMinNonUniformAMD;
  5742. else {
  5743. if (isUnsigned)
  5744. opCode = spv::OpGroupUMinNonUniformAMD;
  5745. else
  5746. opCode = spv::OpGroupSMinNonUniformAMD;
  5747. }
  5748. }
  5749. else if (op == glslang::EOpMaxInvocationsNonUniform ||
  5750. op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||
  5751. op == glslang::EOpMaxInvocationsExclusiveScanNonUniform) {
  5752. if (isFloat)
  5753. opCode = spv::OpGroupFMaxNonUniformAMD;
  5754. else {
  5755. if (isUnsigned)
  5756. opCode = spv::OpGroupUMaxNonUniformAMD;
  5757. else
  5758. opCode = spv::OpGroupSMaxNonUniformAMD;
  5759. }
  5760. }
  5761. else {
  5762. if (isFloat)
  5763. opCode = spv::OpGroupFAddNonUniformAMD;
  5764. else
  5765. opCode = spv::OpGroupIAddNonUniformAMD;
  5766. }
  5767. if (builder.isVectorType(typeId))
  5768. return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
  5769. break;
  5770. #endif
  5771. default:
  5772. logger->missingFunctionality("invocation operation");
  5773. return spv::NoResult;
  5774. }
  5775. assert(opCode != spv::OpNop);
  5776. return builder.createOp(opCode, typeId, spvGroupOperands);
  5777. }
  5778. // Create group invocation operations on a vector
  5779. spv::Id TGlslangToSpvTraverser::CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,
  5780. spv::Id typeId, std::vector<spv::Id>& operands)
  5781. {
  5782. #ifdef AMD_EXTENSIONS
  5783. assert(op == spv::OpGroupFMin || op == spv::OpGroupUMin || op == spv::OpGroupSMin ||
  5784. op == spv::OpGroupFMax || op == spv::OpGroupUMax || op == spv::OpGroupSMax ||
  5785. op == spv::OpGroupFAdd || op == spv::OpGroupIAdd || op == spv::OpGroupBroadcast ||
  5786. op == spv::OpSubgroupReadInvocationKHR ||
  5787. op == spv::OpGroupFMinNonUniformAMD || op == spv::OpGroupUMinNonUniformAMD || op == spv::OpGroupSMinNonUniformAMD ||
  5788. op == spv::OpGroupFMaxNonUniformAMD || op == spv::OpGroupUMaxNonUniformAMD || op == spv::OpGroupSMaxNonUniformAMD ||
  5789. op == spv::OpGroupFAddNonUniformAMD || op == spv::OpGroupIAddNonUniformAMD);
  5790. #else
  5791. assert(op == spv::OpGroupFMin || op == spv::OpGroupUMin || op == spv::OpGroupSMin ||
  5792. op == spv::OpGroupFMax || op == spv::OpGroupUMax || op == spv::OpGroupSMax ||
  5793. op == spv::OpGroupFAdd || op == spv::OpGroupIAdd || op == spv::OpGroupBroadcast ||
  5794. op == spv::OpSubgroupReadInvocationKHR);
  5795. #endif
  5796. // Handle group invocation operations scalar by scalar.
  5797. // The result type is the same type as the original type.
  5798. // The algorithm is to:
  5799. // - break the vector into scalars
  5800. // - apply the operation to each scalar
  5801. // - make a vector out the scalar results
  5802. // get the types sorted out
  5803. int numComponents = builder.getNumComponents(operands[0]);
  5804. spv::Id scalarType = builder.getScalarTypeId(builder.getTypeId(operands[0]));
  5805. std::vector<spv::Id> results;
  5806. // do each scalar op
  5807. for (int comp = 0; comp < numComponents; ++comp) {
  5808. std::vector<unsigned int> indexes;
  5809. indexes.push_back(comp);
  5810. spv::IdImmediate scalar = { true, builder.createCompositeExtract(operands[0], scalarType, indexes) };
  5811. std::vector<spv::IdImmediate> spvGroupOperands;
  5812. if (op == spv::OpSubgroupReadInvocationKHR) {
  5813. spvGroupOperands.push_back(scalar);
  5814. spv::IdImmediate operand = { true, operands[1] };
  5815. spvGroupOperands.push_back(operand);
  5816. } else if (op == spv::OpGroupBroadcast) {
  5817. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::ScopeSubgroup) };
  5818. spvGroupOperands.push_back(scope);
  5819. spvGroupOperands.push_back(scalar);
  5820. spv::IdImmediate operand = { true, operands[1] };
  5821. spvGroupOperands.push_back(operand);
  5822. } else {
  5823. spv::IdImmediate scope = { true, builder.makeUintConstant(spv::ScopeSubgroup) };
  5824. spvGroupOperands.push_back(scope);
  5825. spv::IdImmediate groupOp = { false, (unsigned)groupOperation };
  5826. spvGroupOperands.push_back(groupOp);
  5827. spvGroupOperands.push_back(scalar);
  5828. }
  5829. results.push_back(builder.createOp(op, scalarType, spvGroupOperands));
  5830. }
  5831. // put the pieces together
  5832. return builder.createCompositeConstruct(typeId, results);
  5833. }
  5834. // Create subgroup invocation operations.
  5835. spv::Id TGlslangToSpvTraverser::createSubgroupOperation(glslang::TOperator op, spv::Id typeId,
  5836. std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  5837. {
  5838. // Add the required capabilities.
  5839. switch (op) {
  5840. case glslang::EOpSubgroupElect:
  5841. builder.addCapability(spv::CapabilityGroupNonUniform);
  5842. break;
  5843. case glslang::EOpSubgroupAll:
  5844. case glslang::EOpSubgroupAny:
  5845. case glslang::EOpSubgroupAllEqual:
  5846. builder.addCapability(spv::CapabilityGroupNonUniform);
  5847. builder.addCapability(spv::CapabilityGroupNonUniformVote);
  5848. break;
  5849. case glslang::EOpSubgroupBroadcast:
  5850. case glslang::EOpSubgroupBroadcastFirst:
  5851. case glslang::EOpSubgroupBallot:
  5852. case glslang::EOpSubgroupInverseBallot:
  5853. case glslang::EOpSubgroupBallotBitExtract:
  5854. case glslang::EOpSubgroupBallotBitCount:
  5855. case glslang::EOpSubgroupBallotInclusiveBitCount:
  5856. case glslang::EOpSubgroupBallotExclusiveBitCount:
  5857. case glslang::EOpSubgroupBallotFindLSB:
  5858. case glslang::EOpSubgroupBallotFindMSB:
  5859. builder.addCapability(spv::CapabilityGroupNonUniform);
  5860. builder.addCapability(spv::CapabilityGroupNonUniformBallot);
  5861. break;
  5862. case glslang::EOpSubgroupShuffle:
  5863. case glslang::EOpSubgroupShuffleXor:
  5864. builder.addCapability(spv::CapabilityGroupNonUniform);
  5865. builder.addCapability(spv::CapabilityGroupNonUniformShuffle);
  5866. break;
  5867. case glslang::EOpSubgroupShuffleUp:
  5868. case glslang::EOpSubgroupShuffleDown:
  5869. builder.addCapability(spv::CapabilityGroupNonUniform);
  5870. builder.addCapability(spv::CapabilityGroupNonUniformShuffleRelative);
  5871. break;
  5872. case glslang::EOpSubgroupAdd:
  5873. case glslang::EOpSubgroupMul:
  5874. case glslang::EOpSubgroupMin:
  5875. case glslang::EOpSubgroupMax:
  5876. case glslang::EOpSubgroupAnd:
  5877. case glslang::EOpSubgroupOr:
  5878. case glslang::EOpSubgroupXor:
  5879. case glslang::EOpSubgroupInclusiveAdd:
  5880. case glslang::EOpSubgroupInclusiveMul:
  5881. case glslang::EOpSubgroupInclusiveMin:
  5882. case glslang::EOpSubgroupInclusiveMax:
  5883. case glslang::EOpSubgroupInclusiveAnd:
  5884. case glslang::EOpSubgroupInclusiveOr:
  5885. case glslang::EOpSubgroupInclusiveXor:
  5886. case glslang::EOpSubgroupExclusiveAdd:
  5887. case glslang::EOpSubgroupExclusiveMul:
  5888. case glslang::EOpSubgroupExclusiveMin:
  5889. case glslang::EOpSubgroupExclusiveMax:
  5890. case glslang::EOpSubgroupExclusiveAnd:
  5891. case glslang::EOpSubgroupExclusiveOr:
  5892. case glslang::EOpSubgroupExclusiveXor:
  5893. builder.addCapability(spv::CapabilityGroupNonUniform);
  5894. builder.addCapability(spv::CapabilityGroupNonUniformArithmetic);
  5895. break;
  5896. case glslang::EOpSubgroupClusteredAdd:
  5897. case glslang::EOpSubgroupClusteredMul:
  5898. case glslang::EOpSubgroupClusteredMin:
  5899. case glslang::EOpSubgroupClusteredMax:
  5900. case glslang::EOpSubgroupClusteredAnd:
  5901. case glslang::EOpSubgroupClusteredOr:
  5902. case glslang::EOpSubgroupClusteredXor:
  5903. builder.addCapability(spv::CapabilityGroupNonUniform);
  5904. builder.addCapability(spv::CapabilityGroupNonUniformClustered);
  5905. break;
  5906. case glslang::EOpSubgroupQuadBroadcast:
  5907. case glslang::EOpSubgroupQuadSwapHorizontal:
  5908. case glslang::EOpSubgroupQuadSwapVertical:
  5909. case glslang::EOpSubgroupQuadSwapDiagonal:
  5910. builder.addCapability(spv::CapabilityGroupNonUniform);
  5911. builder.addCapability(spv::CapabilityGroupNonUniformQuad);
  5912. break;
  5913. #ifdef NV_EXTENSIONS
  5914. case glslang::EOpSubgroupPartitionedAdd:
  5915. case glslang::EOpSubgroupPartitionedMul:
  5916. case glslang::EOpSubgroupPartitionedMin:
  5917. case glslang::EOpSubgroupPartitionedMax:
  5918. case glslang::EOpSubgroupPartitionedAnd:
  5919. case glslang::EOpSubgroupPartitionedOr:
  5920. case glslang::EOpSubgroupPartitionedXor:
  5921. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  5922. case glslang::EOpSubgroupPartitionedInclusiveMul:
  5923. case glslang::EOpSubgroupPartitionedInclusiveMin:
  5924. case glslang::EOpSubgroupPartitionedInclusiveMax:
  5925. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  5926. case glslang::EOpSubgroupPartitionedInclusiveOr:
  5927. case glslang::EOpSubgroupPartitionedInclusiveXor:
  5928. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  5929. case glslang::EOpSubgroupPartitionedExclusiveMul:
  5930. case glslang::EOpSubgroupPartitionedExclusiveMin:
  5931. case glslang::EOpSubgroupPartitionedExclusiveMax:
  5932. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  5933. case glslang::EOpSubgroupPartitionedExclusiveOr:
  5934. case glslang::EOpSubgroupPartitionedExclusiveXor:
  5935. builder.addExtension(spv::E_SPV_NV_shader_subgroup_partitioned);
  5936. builder.addCapability(spv::CapabilityGroupNonUniformPartitionedNV);
  5937. break;
  5938. #endif
  5939. default: assert(0 && "Unhandled subgroup operation!");
  5940. }
  5941. const bool isUnsigned = typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64;
  5942. const bool isFloat = typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble;
  5943. const bool isBool = typeProxy == glslang::EbtBool;
  5944. spv::Op opCode = spv::OpNop;
  5945. // Figure out which opcode to use.
  5946. switch (op) {
  5947. case glslang::EOpSubgroupElect: opCode = spv::OpGroupNonUniformElect; break;
  5948. case glslang::EOpSubgroupAll: opCode = spv::OpGroupNonUniformAll; break;
  5949. case glslang::EOpSubgroupAny: opCode = spv::OpGroupNonUniformAny; break;
  5950. case glslang::EOpSubgroupAllEqual: opCode = spv::OpGroupNonUniformAllEqual; break;
  5951. case glslang::EOpSubgroupBroadcast: opCode = spv::OpGroupNonUniformBroadcast; break;
  5952. case glslang::EOpSubgroupBroadcastFirst: opCode = spv::OpGroupNonUniformBroadcastFirst; break;
  5953. case glslang::EOpSubgroupBallot: opCode = spv::OpGroupNonUniformBallot; break;
  5954. case glslang::EOpSubgroupInverseBallot: opCode = spv::OpGroupNonUniformInverseBallot; break;
  5955. case glslang::EOpSubgroupBallotBitExtract: opCode = spv::OpGroupNonUniformBallotBitExtract; break;
  5956. case glslang::EOpSubgroupBallotBitCount:
  5957. case glslang::EOpSubgroupBallotInclusiveBitCount:
  5958. case glslang::EOpSubgroupBallotExclusiveBitCount: opCode = spv::OpGroupNonUniformBallotBitCount; break;
  5959. case glslang::EOpSubgroupBallotFindLSB: opCode = spv::OpGroupNonUniformBallotFindLSB; break;
  5960. case glslang::EOpSubgroupBallotFindMSB: opCode = spv::OpGroupNonUniformBallotFindMSB; break;
  5961. case glslang::EOpSubgroupShuffle: opCode = spv::OpGroupNonUniformShuffle; break;
  5962. case glslang::EOpSubgroupShuffleXor: opCode = spv::OpGroupNonUniformShuffleXor; break;
  5963. case glslang::EOpSubgroupShuffleUp: opCode = spv::OpGroupNonUniformShuffleUp; break;
  5964. case glslang::EOpSubgroupShuffleDown: opCode = spv::OpGroupNonUniformShuffleDown; break;
  5965. case glslang::EOpSubgroupAdd:
  5966. case glslang::EOpSubgroupInclusiveAdd:
  5967. case glslang::EOpSubgroupExclusiveAdd:
  5968. case glslang::EOpSubgroupClusteredAdd:
  5969. #ifdef NV_EXTENSIONS
  5970. case glslang::EOpSubgroupPartitionedAdd:
  5971. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  5972. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  5973. #endif
  5974. if (isFloat) {
  5975. opCode = spv::OpGroupNonUniformFAdd;
  5976. } else {
  5977. opCode = spv::OpGroupNonUniformIAdd;
  5978. }
  5979. break;
  5980. case glslang::EOpSubgroupMul:
  5981. case glslang::EOpSubgroupInclusiveMul:
  5982. case glslang::EOpSubgroupExclusiveMul:
  5983. case glslang::EOpSubgroupClusteredMul:
  5984. #ifdef NV_EXTENSIONS
  5985. case glslang::EOpSubgroupPartitionedMul:
  5986. case glslang::EOpSubgroupPartitionedInclusiveMul:
  5987. case glslang::EOpSubgroupPartitionedExclusiveMul:
  5988. #endif
  5989. if (isFloat) {
  5990. opCode = spv::OpGroupNonUniformFMul;
  5991. } else {
  5992. opCode = spv::OpGroupNonUniformIMul;
  5993. }
  5994. break;
  5995. case glslang::EOpSubgroupMin:
  5996. case glslang::EOpSubgroupInclusiveMin:
  5997. case glslang::EOpSubgroupExclusiveMin:
  5998. case glslang::EOpSubgroupClusteredMin:
  5999. #ifdef NV_EXTENSIONS
  6000. case glslang::EOpSubgroupPartitionedMin:
  6001. case glslang::EOpSubgroupPartitionedInclusiveMin:
  6002. case glslang::EOpSubgroupPartitionedExclusiveMin:
  6003. #endif
  6004. if (isFloat) {
  6005. opCode = spv::OpGroupNonUniformFMin;
  6006. } else if (isUnsigned) {
  6007. opCode = spv::OpGroupNonUniformUMin;
  6008. } else {
  6009. opCode = spv::OpGroupNonUniformSMin;
  6010. }
  6011. break;
  6012. case glslang::EOpSubgroupMax:
  6013. case glslang::EOpSubgroupInclusiveMax:
  6014. case glslang::EOpSubgroupExclusiveMax:
  6015. case glslang::EOpSubgroupClusteredMax:
  6016. #ifdef NV_EXTENSIONS
  6017. case glslang::EOpSubgroupPartitionedMax:
  6018. case glslang::EOpSubgroupPartitionedInclusiveMax:
  6019. case glslang::EOpSubgroupPartitionedExclusiveMax:
  6020. #endif
  6021. if (isFloat) {
  6022. opCode = spv::OpGroupNonUniformFMax;
  6023. } else if (isUnsigned) {
  6024. opCode = spv::OpGroupNonUniformUMax;
  6025. } else {
  6026. opCode = spv::OpGroupNonUniformSMax;
  6027. }
  6028. break;
  6029. case glslang::EOpSubgroupAnd:
  6030. case glslang::EOpSubgroupInclusiveAnd:
  6031. case glslang::EOpSubgroupExclusiveAnd:
  6032. case glslang::EOpSubgroupClusteredAnd:
  6033. #ifdef NV_EXTENSIONS
  6034. case glslang::EOpSubgroupPartitionedAnd:
  6035. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  6036. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  6037. #endif
  6038. if (isBool) {
  6039. opCode = spv::OpGroupNonUniformLogicalAnd;
  6040. } else {
  6041. opCode = spv::OpGroupNonUniformBitwiseAnd;
  6042. }
  6043. break;
  6044. case glslang::EOpSubgroupOr:
  6045. case glslang::EOpSubgroupInclusiveOr:
  6046. case glslang::EOpSubgroupExclusiveOr:
  6047. case glslang::EOpSubgroupClusteredOr:
  6048. #ifdef NV_EXTENSIONS
  6049. case glslang::EOpSubgroupPartitionedOr:
  6050. case glslang::EOpSubgroupPartitionedInclusiveOr:
  6051. case glslang::EOpSubgroupPartitionedExclusiveOr:
  6052. #endif
  6053. if (isBool) {
  6054. opCode = spv::OpGroupNonUniformLogicalOr;
  6055. } else {
  6056. opCode = spv::OpGroupNonUniformBitwiseOr;
  6057. }
  6058. break;
  6059. case glslang::EOpSubgroupXor:
  6060. case glslang::EOpSubgroupInclusiveXor:
  6061. case glslang::EOpSubgroupExclusiveXor:
  6062. case glslang::EOpSubgroupClusteredXor:
  6063. #ifdef NV_EXTENSIONS
  6064. case glslang::EOpSubgroupPartitionedXor:
  6065. case glslang::EOpSubgroupPartitionedInclusiveXor:
  6066. case glslang::EOpSubgroupPartitionedExclusiveXor:
  6067. #endif
  6068. if (isBool) {
  6069. opCode = spv::OpGroupNonUniformLogicalXor;
  6070. } else {
  6071. opCode = spv::OpGroupNonUniformBitwiseXor;
  6072. }
  6073. break;
  6074. case glslang::EOpSubgroupQuadBroadcast: opCode = spv::OpGroupNonUniformQuadBroadcast; break;
  6075. case glslang::EOpSubgroupQuadSwapHorizontal:
  6076. case glslang::EOpSubgroupQuadSwapVertical:
  6077. case glslang::EOpSubgroupQuadSwapDiagonal: opCode = spv::OpGroupNonUniformQuadSwap; break;
  6078. default: assert(0 && "Unhandled subgroup operation!");
  6079. }
  6080. // get the right Group Operation
  6081. spv::GroupOperation groupOperation = spv::GroupOperationMax;
  6082. switch (op) {
  6083. default:
  6084. break;
  6085. case glslang::EOpSubgroupBallotBitCount:
  6086. case glslang::EOpSubgroupAdd:
  6087. case glslang::EOpSubgroupMul:
  6088. case glslang::EOpSubgroupMin:
  6089. case glslang::EOpSubgroupMax:
  6090. case glslang::EOpSubgroupAnd:
  6091. case glslang::EOpSubgroupOr:
  6092. case glslang::EOpSubgroupXor:
  6093. groupOperation = spv::GroupOperationReduce;
  6094. break;
  6095. case glslang::EOpSubgroupBallotInclusiveBitCount:
  6096. case glslang::EOpSubgroupInclusiveAdd:
  6097. case glslang::EOpSubgroupInclusiveMul:
  6098. case glslang::EOpSubgroupInclusiveMin:
  6099. case glslang::EOpSubgroupInclusiveMax:
  6100. case glslang::EOpSubgroupInclusiveAnd:
  6101. case glslang::EOpSubgroupInclusiveOr:
  6102. case glslang::EOpSubgroupInclusiveXor:
  6103. groupOperation = spv::GroupOperationInclusiveScan;
  6104. break;
  6105. case glslang::EOpSubgroupBallotExclusiveBitCount:
  6106. case glslang::EOpSubgroupExclusiveAdd:
  6107. case glslang::EOpSubgroupExclusiveMul:
  6108. case glslang::EOpSubgroupExclusiveMin:
  6109. case glslang::EOpSubgroupExclusiveMax:
  6110. case glslang::EOpSubgroupExclusiveAnd:
  6111. case glslang::EOpSubgroupExclusiveOr:
  6112. case glslang::EOpSubgroupExclusiveXor:
  6113. groupOperation = spv::GroupOperationExclusiveScan;
  6114. break;
  6115. case glslang::EOpSubgroupClusteredAdd:
  6116. case glslang::EOpSubgroupClusteredMul:
  6117. case glslang::EOpSubgroupClusteredMin:
  6118. case glslang::EOpSubgroupClusteredMax:
  6119. case glslang::EOpSubgroupClusteredAnd:
  6120. case glslang::EOpSubgroupClusteredOr:
  6121. case glslang::EOpSubgroupClusteredXor:
  6122. groupOperation = spv::GroupOperationClusteredReduce;
  6123. break;
  6124. #ifdef NV_EXTENSIONS
  6125. case glslang::EOpSubgroupPartitionedAdd:
  6126. case glslang::EOpSubgroupPartitionedMul:
  6127. case glslang::EOpSubgroupPartitionedMin:
  6128. case glslang::EOpSubgroupPartitionedMax:
  6129. case glslang::EOpSubgroupPartitionedAnd:
  6130. case glslang::EOpSubgroupPartitionedOr:
  6131. case glslang::EOpSubgroupPartitionedXor:
  6132. groupOperation = spv::GroupOperationPartitionedReduceNV;
  6133. break;
  6134. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  6135. case glslang::EOpSubgroupPartitionedInclusiveMul:
  6136. case glslang::EOpSubgroupPartitionedInclusiveMin:
  6137. case glslang::EOpSubgroupPartitionedInclusiveMax:
  6138. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  6139. case glslang::EOpSubgroupPartitionedInclusiveOr:
  6140. case glslang::EOpSubgroupPartitionedInclusiveXor:
  6141. groupOperation = spv::GroupOperationPartitionedInclusiveScanNV;
  6142. break;
  6143. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  6144. case glslang::EOpSubgroupPartitionedExclusiveMul:
  6145. case glslang::EOpSubgroupPartitionedExclusiveMin:
  6146. case glslang::EOpSubgroupPartitionedExclusiveMax:
  6147. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  6148. case glslang::EOpSubgroupPartitionedExclusiveOr:
  6149. case glslang::EOpSubgroupPartitionedExclusiveXor:
  6150. groupOperation = spv::GroupOperationPartitionedExclusiveScanNV;
  6151. break;
  6152. #endif
  6153. }
  6154. // build the instruction
  6155. std::vector<spv::IdImmediate> spvGroupOperands;
  6156. // Every operation begins with the Execution Scope operand.
  6157. spv::IdImmediate executionScope = { true, builder.makeUintConstant(spv::ScopeSubgroup) };
  6158. spvGroupOperands.push_back(executionScope);
  6159. // Next, for all operations that use a Group Operation, push that as an operand.
  6160. if (groupOperation != spv::GroupOperationMax) {
  6161. spv::IdImmediate groupOperand = { false, (unsigned)groupOperation };
  6162. spvGroupOperands.push_back(groupOperand);
  6163. }
  6164. // Push back the operands next.
  6165. for (auto opIt = operands.cbegin(); opIt != operands.cend(); ++opIt) {
  6166. spv::IdImmediate operand = { true, *opIt };
  6167. spvGroupOperands.push_back(operand);
  6168. }
  6169. // Some opcodes have additional operands.
  6170. spv::Id directionId = spv::NoResult;
  6171. switch (op) {
  6172. default: break;
  6173. case glslang::EOpSubgroupQuadSwapHorizontal: directionId = builder.makeUintConstant(0); break;
  6174. case glslang::EOpSubgroupQuadSwapVertical: directionId = builder.makeUintConstant(1); break;
  6175. case glslang::EOpSubgroupQuadSwapDiagonal: directionId = builder.makeUintConstant(2); break;
  6176. }
  6177. if (directionId != spv::NoResult) {
  6178. spv::IdImmediate direction = { true, directionId };
  6179. spvGroupOperands.push_back(direction);
  6180. }
  6181. return builder.createOp(opCode, typeId, spvGroupOperands);
  6182. }
  6183. spv::Id TGlslangToSpvTraverser::createMiscOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
  6184. {
  6185. bool isUnsigned = isTypeUnsignedInt(typeProxy);
  6186. bool isFloat = isTypeFloat(typeProxy);
  6187. spv::Op opCode = spv::OpNop;
  6188. int extBuiltins = -1;
  6189. int libCall = -1;
  6190. size_t consumedOperands = operands.size();
  6191. spv::Id typeId0 = 0;
  6192. if (consumedOperands > 0)
  6193. typeId0 = builder.getTypeId(operands[0]);
  6194. spv::Id typeId1 = 0;
  6195. if (consumedOperands > 1)
  6196. typeId1 = builder.getTypeId(operands[1]);
  6197. spv::Id frexpIntType = 0;
  6198. switch (op) {
  6199. case glslang::EOpMin:
  6200. if (isFloat)
  6201. libCall = spv::GLSLstd450FMin;
  6202. else if (isUnsigned)
  6203. libCall = spv::GLSLstd450UMin;
  6204. else
  6205. libCall = spv::GLSLstd450SMin;
  6206. builder.promoteScalar(precision, operands.front(), operands.back());
  6207. break;
  6208. case glslang::EOpModf:
  6209. libCall = spv::GLSLstd450Modf;
  6210. break;
  6211. case glslang::EOpMax:
  6212. if (isFloat)
  6213. libCall = spv::GLSLstd450FMax;
  6214. else if (isUnsigned)
  6215. libCall = spv::GLSLstd450UMax;
  6216. else
  6217. libCall = spv::GLSLstd450SMax;
  6218. builder.promoteScalar(precision, operands.front(), operands.back());
  6219. break;
  6220. case glslang::EOpPow:
  6221. libCall = spv::GLSLstd450Pow;
  6222. break;
  6223. case glslang::EOpDot:
  6224. opCode = spv::OpDot;
  6225. break;
  6226. case glslang::EOpAtan:
  6227. libCall = spv::GLSLstd450Atan2;
  6228. break;
  6229. case glslang::EOpClamp:
  6230. if (isFloat)
  6231. libCall = spv::GLSLstd450FClamp;
  6232. else if (isUnsigned)
  6233. libCall = spv::GLSLstd450UClamp;
  6234. else
  6235. libCall = spv::GLSLstd450SClamp;
  6236. builder.promoteScalar(precision, operands.front(), operands[1]);
  6237. builder.promoteScalar(precision, operands.front(), operands[2]);
  6238. break;
  6239. case glslang::EOpMix:
  6240. if (! builder.isBoolType(builder.getScalarTypeId(builder.getTypeId(operands.back())))) {
  6241. assert(isFloat);
  6242. libCall = spv::GLSLstd450FMix;
  6243. } else {
  6244. opCode = spv::OpSelect;
  6245. std::swap(operands.front(), operands.back());
  6246. }
  6247. builder.promoteScalar(precision, operands.front(), operands.back());
  6248. break;
  6249. case glslang::EOpStep:
  6250. libCall = spv::GLSLstd450Step;
  6251. builder.promoteScalar(precision, operands.front(), operands.back());
  6252. break;
  6253. case glslang::EOpSmoothStep:
  6254. libCall = spv::GLSLstd450SmoothStep;
  6255. builder.promoteScalar(precision, operands[0], operands[2]);
  6256. builder.promoteScalar(precision, operands[1], operands[2]);
  6257. break;
  6258. case glslang::EOpDistance:
  6259. libCall = spv::GLSLstd450Distance;
  6260. break;
  6261. case glslang::EOpCross:
  6262. libCall = spv::GLSLstd450Cross;
  6263. break;
  6264. case glslang::EOpFaceForward:
  6265. libCall = spv::GLSLstd450FaceForward;
  6266. break;
  6267. case glslang::EOpReflect:
  6268. libCall = spv::GLSLstd450Reflect;
  6269. break;
  6270. case glslang::EOpRefract:
  6271. libCall = spv::GLSLstd450Refract;
  6272. break;
  6273. case glslang::EOpInterpolateAtSample:
  6274. #ifdef AMD_EXTENSIONS
  6275. if (typeProxy == glslang::EbtFloat16)
  6276. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  6277. #endif
  6278. libCall = spv::GLSLstd450InterpolateAtSample;
  6279. break;
  6280. case glslang::EOpInterpolateAtOffset:
  6281. #ifdef AMD_EXTENSIONS
  6282. if (typeProxy == glslang::EbtFloat16)
  6283. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  6284. #endif
  6285. libCall = spv::GLSLstd450InterpolateAtOffset;
  6286. break;
  6287. case glslang::EOpAddCarry:
  6288. opCode = spv::OpIAddCarry;
  6289. typeId = builder.makeStructResultType(typeId0, typeId0);
  6290. consumedOperands = 2;
  6291. break;
  6292. case glslang::EOpSubBorrow:
  6293. opCode = spv::OpISubBorrow;
  6294. typeId = builder.makeStructResultType(typeId0, typeId0);
  6295. consumedOperands = 2;
  6296. break;
  6297. case glslang::EOpUMulExtended:
  6298. opCode = spv::OpUMulExtended;
  6299. typeId = builder.makeStructResultType(typeId0, typeId0);
  6300. consumedOperands = 2;
  6301. break;
  6302. case glslang::EOpIMulExtended:
  6303. opCode = spv::OpSMulExtended;
  6304. typeId = builder.makeStructResultType(typeId0, typeId0);
  6305. consumedOperands = 2;
  6306. break;
  6307. case glslang::EOpBitfieldExtract:
  6308. if (isUnsigned)
  6309. opCode = spv::OpBitFieldUExtract;
  6310. else
  6311. opCode = spv::OpBitFieldSExtract;
  6312. break;
  6313. case glslang::EOpBitfieldInsert:
  6314. opCode = spv::OpBitFieldInsert;
  6315. break;
  6316. case glslang::EOpFma:
  6317. libCall = spv::GLSLstd450Fma;
  6318. break;
  6319. case glslang::EOpFrexp:
  6320. {
  6321. libCall = spv::GLSLstd450FrexpStruct;
  6322. assert(builder.isPointerType(typeId1));
  6323. typeId1 = builder.getContainedTypeId(typeId1);
  6324. int width = builder.getScalarTypeWidth(typeId1);
  6325. #ifdef AMD_EXTENSIONS
  6326. if (width == 16)
  6327. // Using 16-bit exp operand, enable extension SPV_AMD_gpu_shader_int16
  6328. builder.addExtension(spv::E_SPV_AMD_gpu_shader_int16);
  6329. #endif
  6330. if (builder.getNumComponents(operands[0]) == 1)
  6331. frexpIntType = builder.makeIntegerType(width, true);
  6332. else
  6333. frexpIntType = builder.makeVectorType(builder.makeIntegerType(width, true), builder.getNumComponents(operands[0]));
  6334. typeId = builder.makeStructResultType(typeId0, frexpIntType);
  6335. consumedOperands = 1;
  6336. }
  6337. break;
  6338. case glslang::EOpLdexp:
  6339. libCall = spv::GLSLstd450Ldexp;
  6340. break;
  6341. case glslang::EOpReadInvocation:
  6342. return createInvocationsOperation(op, typeId, operands, typeProxy);
  6343. case glslang::EOpSubgroupBroadcast:
  6344. case glslang::EOpSubgroupBallotBitExtract:
  6345. case glslang::EOpSubgroupShuffle:
  6346. case glslang::EOpSubgroupShuffleXor:
  6347. case glslang::EOpSubgroupShuffleUp:
  6348. case glslang::EOpSubgroupShuffleDown:
  6349. case glslang::EOpSubgroupClusteredAdd:
  6350. case glslang::EOpSubgroupClusteredMul:
  6351. case glslang::EOpSubgroupClusteredMin:
  6352. case glslang::EOpSubgroupClusteredMax:
  6353. case glslang::EOpSubgroupClusteredAnd:
  6354. case glslang::EOpSubgroupClusteredOr:
  6355. case glslang::EOpSubgroupClusteredXor:
  6356. case glslang::EOpSubgroupQuadBroadcast:
  6357. #ifdef NV_EXTENSIONS
  6358. case glslang::EOpSubgroupPartitionedAdd:
  6359. case glslang::EOpSubgroupPartitionedMul:
  6360. case glslang::EOpSubgroupPartitionedMin:
  6361. case glslang::EOpSubgroupPartitionedMax:
  6362. case glslang::EOpSubgroupPartitionedAnd:
  6363. case glslang::EOpSubgroupPartitionedOr:
  6364. case glslang::EOpSubgroupPartitionedXor:
  6365. case glslang::EOpSubgroupPartitionedInclusiveAdd:
  6366. case glslang::EOpSubgroupPartitionedInclusiveMul:
  6367. case glslang::EOpSubgroupPartitionedInclusiveMin:
  6368. case glslang::EOpSubgroupPartitionedInclusiveMax:
  6369. case glslang::EOpSubgroupPartitionedInclusiveAnd:
  6370. case glslang::EOpSubgroupPartitionedInclusiveOr:
  6371. case glslang::EOpSubgroupPartitionedInclusiveXor:
  6372. case glslang::EOpSubgroupPartitionedExclusiveAdd:
  6373. case glslang::EOpSubgroupPartitionedExclusiveMul:
  6374. case glslang::EOpSubgroupPartitionedExclusiveMin:
  6375. case glslang::EOpSubgroupPartitionedExclusiveMax:
  6376. case glslang::EOpSubgroupPartitionedExclusiveAnd:
  6377. case glslang::EOpSubgroupPartitionedExclusiveOr:
  6378. case glslang::EOpSubgroupPartitionedExclusiveXor:
  6379. #endif
  6380. return createSubgroupOperation(op, typeId, operands, typeProxy);
  6381. #ifdef AMD_EXTENSIONS
  6382. case glslang::EOpSwizzleInvocations:
  6383. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  6384. libCall = spv::SwizzleInvocationsAMD;
  6385. break;
  6386. case glslang::EOpSwizzleInvocationsMasked:
  6387. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  6388. libCall = spv::SwizzleInvocationsMaskedAMD;
  6389. break;
  6390. case glslang::EOpWriteInvocation:
  6391. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
  6392. libCall = spv::WriteInvocationAMD;
  6393. break;
  6394. case glslang::EOpMin3:
  6395. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  6396. if (isFloat)
  6397. libCall = spv::FMin3AMD;
  6398. else {
  6399. if (isUnsigned)
  6400. libCall = spv::UMin3AMD;
  6401. else
  6402. libCall = spv::SMin3AMD;
  6403. }
  6404. break;
  6405. case glslang::EOpMax3:
  6406. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  6407. if (isFloat)
  6408. libCall = spv::FMax3AMD;
  6409. else {
  6410. if (isUnsigned)
  6411. libCall = spv::UMax3AMD;
  6412. else
  6413. libCall = spv::SMax3AMD;
  6414. }
  6415. break;
  6416. case glslang::EOpMid3:
  6417. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
  6418. if (isFloat)
  6419. libCall = spv::FMid3AMD;
  6420. else {
  6421. if (isUnsigned)
  6422. libCall = spv::UMid3AMD;
  6423. else
  6424. libCall = spv::SMid3AMD;
  6425. }
  6426. break;
  6427. case glslang::EOpInterpolateAtVertex:
  6428. if (typeProxy == glslang::EbtFloat16)
  6429. builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
  6430. extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
  6431. libCall = spv::InterpolateAtVertexAMD;
  6432. break;
  6433. #endif
  6434. case glslang::EOpBarrier:
  6435. {
  6436. // This is for the extended controlBarrier function, with four operands.
  6437. // The unextended barrier() goes through createNoArgOperation.
  6438. assert(operands.size() == 4);
  6439. unsigned int executionScope = builder.getConstantScalar(operands[0]);
  6440. unsigned int memoryScope = builder.getConstantScalar(operands[1]);
  6441. unsigned int semantics = builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]);
  6442. builder.createControlBarrier((spv::Scope)executionScope, (spv::Scope)memoryScope, (spv::MemorySemanticsMask)semantics);
  6443. if (semantics & (spv::MemorySemanticsMakeAvailableKHRMask | spv::MemorySemanticsMakeVisibleKHRMask | spv::MemorySemanticsOutputMemoryKHRMask)) {
  6444. builder.addCapability(spv::CapabilityVulkanMemoryModelKHR);
  6445. }
  6446. if (glslangIntermediate->usingVulkanMemoryModel() && (executionScope == spv::ScopeDevice || memoryScope == spv::ScopeDevice)) {
  6447. builder.addCapability(spv::CapabilityVulkanMemoryModelDeviceScopeKHR);
  6448. }
  6449. return 0;
  6450. }
  6451. break;
  6452. case glslang::EOpMemoryBarrier:
  6453. {
  6454. // This is for the extended memoryBarrier function, with three operands.
  6455. // The unextended memoryBarrier() goes through createNoArgOperation.
  6456. assert(operands.size() == 3);
  6457. unsigned int memoryScope = builder.getConstantScalar(operands[0]);
  6458. unsigned int semantics = builder.getConstantScalar(operands[1]) | builder.getConstantScalar(operands[2]);
  6459. builder.createMemoryBarrier((spv::Scope)memoryScope, (spv::MemorySemanticsMask)semantics);
  6460. if (semantics & (spv::MemorySemanticsMakeAvailableKHRMask | spv::MemorySemanticsMakeVisibleKHRMask | spv::MemorySemanticsOutputMemoryKHRMask)) {
  6461. builder.addCapability(spv::CapabilityVulkanMemoryModelKHR);
  6462. }
  6463. if (glslangIntermediate->usingVulkanMemoryModel() && memoryScope == spv::ScopeDevice) {
  6464. builder.addCapability(spv::CapabilityVulkanMemoryModelDeviceScopeKHR);
  6465. }
  6466. return 0;
  6467. }
  6468. break;
  6469. #ifdef NV_EXTENSIONS
  6470. case glslang::EOpReportIntersectionNV:
  6471. {
  6472. typeId = builder.makeBoolType();
  6473. opCode = spv::OpReportIntersectionNV;
  6474. }
  6475. break;
  6476. case glslang::EOpTraceNV:
  6477. {
  6478. builder.createNoResultOp(spv::OpTraceNV, operands);
  6479. return 0;
  6480. }
  6481. break;
  6482. case glslang::EOpExecuteCallableNV:
  6483. {
  6484. builder.createNoResultOp(spv::OpExecuteCallableNV, operands);
  6485. return 0;
  6486. }
  6487. break;
  6488. case glslang::EOpWritePackedPrimitiveIndices4x8NV:
  6489. builder.createNoResultOp(spv::OpWritePackedPrimitiveIndices4x8NV, operands);
  6490. return 0;
  6491. #endif
  6492. case glslang::EOpCooperativeMatrixMulAdd:
  6493. opCode = spv::OpCooperativeMatrixMulAddNV;
  6494. break;
  6495. default:
  6496. return 0;
  6497. }
  6498. spv::Id id = 0;
  6499. if (libCall >= 0) {
  6500. // Use an extended instruction from the standard library.
  6501. // Construct the call arguments, without modifying the original operands vector.
  6502. // We might need the remaining arguments, e.g. in the EOpFrexp case.
  6503. std::vector<spv::Id> callArguments(operands.begin(), operands.begin() + consumedOperands);
  6504. id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, callArguments);
  6505. } else if (opCode == spv::OpDot && !isFloat) {
  6506. // int dot(int, int)
  6507. // NOTE: never called for scalar/vector1, this is turned into simple mul before this can be reached
  6508. const int componentCount = builder.getNumComponents(operands[0]);
  6509. spv::Id mulOp = builder.createBinOp(spv::OpIMul, builder.getTypeId(operands[0]), operands[0], operands[1]);
  6510. builder.setPrecision(mulOp, precision);
  6511. id = builder.createCompositeExtract(mulOp, typeId, 0);
  6512. for (int i = 1; i < componentCount; ++i) {
  6513. builder.setPrecision(id, precision);
  6514. id = builder.createBinOp(spv::OpIAdd, typeId, id, builder.createCompositeExtract(operands[0], typeId, i));
  6515. }
  6516. } else {
  6517. switch (consumedOperands) {
  6518. case 0:
  6519. // should all be handled by visitAggregate and createNoArgOperation
  6520. assert(0);
  6521. return 0;
  6522. case 1:
  6523. // should all be handled by createUnaryOperation
  6524. assert(0);
  6525. return 0;
  6526. case 2:
  6527. id = builder.createBinOp(opCode, typeId, operands[0], operands[1]);
  6528. break;
  6529. default:
  6530. // anything 3 or over doesn't have l-value operands, so all should be consumed
  6531. assert(consumedOperands == operands.size());
  6532. id = builder.createOp(opCode, typeId, operands);
  6533. break;
  6534. }
  6535. }
  6536. // Decode the return types that were structures
  6537. switch (op) {
  6538. case glslang::EOpAddCarry:
  6539. case glslang::EOpSubBorrow:
  6540. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);
  6541. id = builder.createCompositeExtract(id, typeId0, 0);
  6542. break;
  6543. case glslang::EOpUMulExtended:
  6544. case glslang::EOpIMulExtended:
  6545. builder.createStore(builder.createCompositeExtract(id, typeId0, 0), operands[3]);
  6546. builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);
  6547. break;
  6548. case glslang::EOpFrexp:
  6549. {
  6550. assert(operands.size() == 2);
  6551. if (builder.isFloatType(builder.getScalarTypeId(typeId1))) {
  6552. // "exp" is floating-point type (from HLSL intrinsic)
  6553. spv::Id member1 = builder.createCompositeExtract(id, frexpIntType, 1);
  6554. member1 = builder.createUnaryOp(spv::OpConvertSToF, typeId1, member1);
  6555. builder.createStore(member1, operands[1]);
  6556. } else
  6557. // "exp" is integer type (from GLSL built-in function)
  6558. builder.createStore(builder.createCompositeExtract(id, frexpIntType, 1), operands[1]);
  6559. id = builder.createCompositeExtract(id, typeId0, 0);
  6560. }
  6561. break;
  6562. default:
  6563. break;
  6564. }
  6565. return builder.setPrecision(id, precision);
  6566. }
  6567. // Intrinsics with no arguments (or no return value, and no precision).
  6568. spv::Id TGlslangToSpvTraverser::createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId)
  6569. {
  6570. // GLSL memory barriers use queuefamily scope in new model, device scope in old model
  6571. spv::Scope memoryBarrierScope = glslangIntermediate->usingVulkanMemoryModel() ? spv::ScopeQueueFamilyKHR : spv::ScopeDevice;
  6572. switch (op) {
  6573. case glslang::EOpEmitVertex:
  6574. builder.createNoResultOp(spv::OpEmitVertex);
  6575. return 0;
  6576. case glslang::EOpEndPrimitive:
  6577. builder.createNoResultOp(spv::OpEndPrimitive);
  6578. return 0;
  6579. case glslang::EOpBarrier:
  6580. if (glslangIntermediate->getStage() == EShLangTessControl) {
  6581. if (glslangIntermediate->usingVulkanMemoryModel()) {
  6582. builder.createControlBarrier(spv::ScopeWorkgroup, spv::ScopeWorkgroup,
  6583. spv::MemorySemanticsOutputMemoryKHRMask |
  6584. spv::MemorySemanticsAcquireReleaseMask);
  6585. builder.addCapability(spv::CapabilityVulkanMemoryModelKHR);
  6586. } else {
  6587. builder.createControlBarrier(spv::ScopeWorkgroup, spv::ScopeInvocation, spv::MemorySemanticsMaskNone);
  6588. }
  6589. } else {
  6590. builder.createControlBarrier(spv::ScopeWorkgroup, spv::ScopeWorkgroup,
  6591. spv::MemorySemanticsWorkgroupMemoryMask |
  6592. spv::MemorySemanticsAcquireReleaseMask);
  6593. }
  6594. return 0;
  6595. case glslang::EOpMemoryBarrier:
  6596. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsAllMemory |
  6597. spv::MemorySemanticsAcquireReleaseMask);
  6598. return 0;
  6599. case glslang::EOpMemoryBarrierAtomicCounter:
  6600. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsAtomicCounterMemoryMask |
  6601. spv::MemorySemanticsAcquireReleaseMask);
  6602. return 0;
  6603. case glslang::EOpMemoryBarrierBuffer:
  6604. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsUniformMemoryMask |
  6605. spv::MemorySemanticsAcquireReleaseMask);
  6606. return 0;
  6607. case glslang::EOpMemoryBarrierImage:
  6608. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsImageMemoryMask |
  6609. spv::MemorySemanticsAcquireReleaseMask);
  6610. return 0;
  6611. case glslang::EOpMemoryBarrierShared:
  6612. builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsWorkgroupMemoryMask |
  6613. spv::MemorySemanticsAcquireReleaseMask);
  6614. return 0;
  6615. case glslang::EOpGroupMemoryBarrier:
  6616. builder.createMemoryBarrier(spv::ScopeWorkgroup, spv::MemorySemanticsAllMemory |
  6617. spv::MemorySemanticsAcquireReleaseMask);
  6618. return 0;
  6619. case glslang::EOpAllMemoryBarrierWithGroupSync:
  6620. builder.createControlBarrier(spv::ScopeWorkgroup, spv::ScopeDevice,
  6621. spv::MemorySemanticsAllMemory |
  6622. spv::MemorySemanticsAcquireReleaseMask);
  6623. return 0;
  6624. case glslang::EOpDeviceMemoryBarrier:
  6625. builder.createMemoryBarrier(spv::ScopeDevice, spv::MemorySemanticsUniformMemoryMask |
  6626. spv::MemorySemanticsImageMemoryMask |
  6627. spv::MemorySemanticsAcquireReleaseMask);
  6628. return 0;
  6629. case glslang::EOpDeviceMemoryBarrierWithGroupSync:
  6630. builder.createControlBarrier(spv::ScopeWorkgroup, spv::ScopeDevice, spv::MemorySemanticsUniformMemoryMask |
  6631. spv::MemorySemanticsImageMemoryMask |
  6632. spv::MemorySemanticsAcquireReleaseMask);
  6633. return 0;
  6634. case glslang::EOpWorkgroupMemoryBarrier:
  6635. builder.createMemoryBarrier(spv::ScopeWorkgroup, spv::MemorySemanticsWorkgroupMemoryMask |
  6636. spv::MemorySemanticsAcquireReleaseMask);
  6637. return 0;
  6638. case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:
  6639. builder.createControlBarrier(spv::ScopeWorkgroup, spv::ScopeWorkgroup,
  6640. spv::MemorySemanticsWorkgroupMemoryMask |
  6641. spv::MemorySemanticsAcquireReleaseMask);
  6642. return 0;
  6643. case glslang::EOpSubgroupBarrier:
  6644. builder.createControlBarrier(spv::ScopeSubgroup, spv::ScopeSubgroup, spv::MemorySemanticsAllMemory |
  6645. spv::MemorySemanticsAcquireReleaseMask);
  6646. return spv::NoResult;
  6647. case glslang::EOpSubgroupMemoryBarrier:
  6648. builder.createMemoryBarrier(spv::ScopeSubgroup, spv::MemorySemanticsAllMemory |
  6649. spv::MemorySemanticsAcquireReleaseMask);
  6650. return spv::NoResult;
  6651. case glslang::EOpSubgroupMemoryBarrierBuffer:
  6652. builder.createMemoryBarrier(spv::ScopeSubgroup, spv::MemorySemanticsUniformMemoryMask |
  6653. spv::MemorySemanticsAcquireReleaseMask);
  6654. return spv::NoResult;
  6655. case glslang::EOpSubgroupMemoryBarrierImage:
  6656. builder.createMemoryBarrier(spv::ScopeSubgroup, spv::MemorySemanticsImageMemoryMask |
  6657. spv::MemorySemanticsAcquireReleaseMask);
  6658. return spv::NoResult;
  6659. case glslang::EOpSubgroupMemoryBarrierShared:
  6660. builder.createMemoryBarrier(spv::ScopeSubgroup, spv::MemorySemanticsWorkgroupMemoryMask |
  6661. spv::MemorySemanticsAcquireReleaseMask);
  6662. return spv::NoResult;
  6663. case glslang::EOpSubgroupElect: {
  6664. std::vector<spv::Id> operands;
  6665. return createSubgroupOperation(op, typeId, operands, glslang::EbtVoid);
  6666. }
  6667. #ifdef AMD_EXTENSIONS
  6668. case glslang::EOpTime:
  6669. {
  6670. std::vector<spv::Id> args; // Dummy arguments
  6671. spv::Id id = builder.createBuiltinCall(typeId, getExtBuiltins(spv::E_SPV_AMD_gcn_shader), spv::TimeAMD, args);
  6672. return builder.setPrecision(id, precision);
  6673. }
  6674. #endif
  6675. #ifdef NV_EXTENSIONS
  6676. case glslang::EOpIgnoreIntersectionNV:
  6677. builder.createNoResultOp(spv::OpIgnoreIntersectionNV);
  6678. return 0;
  6679. case glslang::EOpTerminateRayNV:
  6680. builder.createNoResultOp(spv::OpTerminateRayNV);
  6681. return 0;
  6682. #endif
  6683. default:
  6684. logger->missingFunctionality("unknown operation with no arguments");
  6685. return 0;
  6686. }
  6687. }
  6688. spv::Id TGlslangToSpvTraverser::getSymbolId(const glslang::TIntermSymbol* symbol)
  6689. {
  6690. auto iter = symbolValues.find(symbol->getId());
  6691. spv::Id id;
  6692. if (symbolValues.end() != iter) {
  6693. id = iter->second;
  6694. return id;
  6695. }
  6696. // it was not found, create it
  6697. id = createSpvVariable(symbol);
  6698. symbolValues[symbol->getId()] = id;
  6699. if (symbol->getBasicType() != glslang::EbtBlock) {
  6700. builder.addDecoration(id, TranslatePrecisionDecoration(symbol->getType()));
  6701. builder.addDecoration(id, TranslateInterpolationDecoration(symbol->getType().getQualifier()));
  6702. builder.addDecoration(id, TranslateAuxiliaryStorageDecoration(symbol->getType().getQualifier()));
  6703. #ifdef NV_EXTENSIONS
  6704. addMeshNVDecoration(id, /*member*/ -1, symbol->getType().getQualifier());
  6705. #endif
  6706. if (symbol->getType().getQualifier().hasSpecConstantId())
  6707. builder.addDecoration(id, spv::DecorationSpecId, symbol->getType().getQualifier().layoutSpecConstantId);
  6708. if (symbol->getQualifier().hasIndex())
  6709. builder.addDecoration(id, spv::DecorationIndex, symbol->getQualifier().layoutIndex);
  6710. if (symbol->getQualifier().hasComponent())
  6711. builder.addDecoration(id, spv::DecorationComponent, symbol->getQualifier().layoutComponent);
  6712. // atomic counters use this:
  6713. if (symbol->getQualifier().hasOffset())
  6714. builder.addDecoration(id, spv::DecorationOffset, symbol->getQualifier().layoutOffset);
  6715. }
  6716. if (symbol->getQualifier().hasLocation())
  6717. builder.addDecoration(id, spv::DecorationLocation, symbol->getQualifier().layoutLocation);
  6718. builder.addDecoration(id, TranslateInvariantDecoration(symbol->getType().getQualifier()));
  6719. if (symbol->getQualifier().hasStream() && glslangIntermediate->isMultiStream()) {
  6720. builder.addCapability(spv::CapabilityGeometryStreams);
  6721. builder.addDecoration(id, spv::DecorationStream, symbol->getQualifier().layoutStream);
  6722. }
  6723. if (symbol->getQualifier().hasSet())
  6724. builder.addDecoration(id, spv::DecorationDescriptorSet, symbol->getQualifier().layoutSet);
  6725. else if (IsDescriptorResource(symbol->getType())) {
  6726. // default to 0
  6727. builder.addDecoration(id, spv::DecorationDescriptorSet, 0);
  6728. }
  6729. if (symbol->getQualifier().hasBinding())
  6730. builder.addDecoration(id, spv::DecorationBinding, symbol->getQualifier().layoutBinding);
  6731. else if (IsDescriptorResource(symbol->getType())) {
  6732. // default to 0
  6733. builder.addDecoration(id, spv::DecorationBinding, 0);
  6734. }
  6735. if (symbol->getQualifier().hasAttachment())
  6736. builder.addDecoration(id, spv::DecorationInputAttachmentIndex, symbol->getQualifier().layoutAttachment);
  6737. if (glslangIntermediate->getXfbMode()) {
  6738. builder.addCapability(spv::CapabilityTransformFeedback);
  6739. if (symbol->getQualifier().hasXfbBuffer()) {
  6740. builder.addDecoration(id, spv::DecorationXfbBuffer, symbol->getQualifier().layoutXfbBuffer);
  6741. unsigned stride = glslangIntermediate->getXfbStride(symbol->getQualifier().layoutXfbBuffer);
  6742. if (stride != glslang::TQualifier::layoutXfbStrideEnd)
  6743. builder.addDecoration(id, spv::DecorationXfbStride, stride);
  6744. }
  6745. if (symbol->getQualifier().hasXfbOffset())
  6746. builder.addDecoration(id, spv::DecorationOffset, symbol->getQualifier().layoutXfbOffset);
  6747. }
  6748. if (symbol->getType().isImage()) {
  6749. std::vector<spv::Decoration> memory;
  6750. TranslateMemoryDecoration(symbol->getType().getQualifier(), memory, glslangIntermediate->usingVulkanMemoryModel());
  6751. for (unsigned int i = 0; i < memory.size(); ++i)
  6752. builder.addDecoration(id, memory[i]);
  6753. }
  6754. // built-in variable decorations
  6755. spv::BuiltIn builtIn = TranslateBuiltInDecoration(symbol->getQualifier().builtIn, false);
  6756. if (builtIn != spv::BuiltInMax)
  6757. builder.addDecoration(id, spv::DecorationBuiltIn, (int)builtIn);
  6758. // nonuniform
  6759. builder.addDecoration(id, TranslateNonUniformDecoration(symbol->getType().getQualifier()));
  6760. #ifdef NV_EXTENSIONS
  6761. if (builtIn == spv::BuiltInSampleMask) {
  6762. spv::Decoration decoration;
  6763. // GL_NV_sample_mask_override_coverage extension
  6764. if (glslangIntermediate->getLayoutOverrideCoverage())
  6765. decoration = (spv::Decoration)spv::DecorationOverrideCoverageNV;
  6766. else
  6767. decoration = (spv::Decoration)spv::DecorationMax;
  6768. builder.addDecoration(id, decoration);
  6769. if (decoration != spv::DecorationMax) {
  6770. builder.addExtension(spv::E_SPV_NV_sample_mask_override_coverage);
  6771. }
  6772. }
  6773. else if (builtIn == spv::BuiltInLayer) {
  6774. // SPV_NV_viewport_array2 extension
  6775. if (symbol->getQualifier().layoutViewportRelative) {
  6776. builder.addDecoration(id, (spv::Decoration)spv::DecorationViewportRelativeNV);
  6777. builder.addCapability(spv::CapabilityShaderViewportMaskNV);
  6778. builder.addExtension(spv::E_SPV_NV_viewport_array2);
  6779. }
  6780. if (symbol->getQualifier().layoutSecondaryViewportRelativeOffset != -2048) {
  6781. builder.addDecoration(id, (spv::Decoration)spv::DecorationSecondaryViewportRelativeNV,
  6782. symbol->getQualifier().layoutSecondaryViewportRelativeOffset);
  6783. builder.addCapability(spv::CapabilityShaderStereoViewNV);
  6784. builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
  6785. }
  6786. }
  6787. if (symbol->getQualifier().layoutPassthrough) {
  6788. builder.addDecoration(id, spv::DecorationPassthroughNV);
  6789. builder.addCapability(spv::CapabilityGeometryShaderPassthroughNV);
  6790. builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);
  6791. }
  6792. if (symbol->getQualifier().pervertexNV) {
  6793. builder.addDecoration(id, spv::DecorationPerVertexNV);
  6794. builder.addCapability(spv::CapabilityFragmentBarycentricNV);
  6795. builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
  6796. }
  6797. #endif
  6798. if (glslangIntermediate->getHlslFunctionality1() && symbol->getType().getQualifier().semanticName != nullptr) {
  6799. builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
  6800. builder.addDecoration(id, (spv::Decoration)spv::DecorationHlslSemanticGOOGLE,
  6801. symbol->getType().getQualifier().semanticName);
  6802. }
  6803. if (symbol->getBasicType() == glslang::EbtReference) {
  6804. builder.addDecoration(id, symbol->getType().getQualifier().restrict ? spv::DecorationRestrictPointerEXT : spv::DecorationAliasedPointerEXT);
  6805. }
  6806. return id;
  6807. }
  6808. #ifdef NV_EXTENSIONS
  6809. // add per-primitive, per-view. per-task decorations to a struct member (member >= 0) or an object
  6810. void TGlslangToSpvTraverser::addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier& qualifier)
  6811. {
  6812. if (member >= 0) {
  6813. if (qualifier.perPrimitiveNV) {
  6814. // Need to add capability/extension for fragment shader.
  6815. // Mesh shader already adds this by default.
  6816. if (glslangIntermediate->getStage() == EShLangFragment) {
  6817. builder.addCapability(spv::CapabilityMeshShadingNV);
  6818. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  6819. }
  6820. builder.addMemberDecoration(id, (unsigned)member, spv::DecorationPerPrimitiveNV);
  6821. }
  6822. if (qualifier.perViewNV)
  6823. builder.addMemberDecoration(id, (unsigned)member, spv::DecorationPerViewNV);
  6824. if (qualifier.perTaskNV)
  6825. builder.addMemberDecoration(id, (unsigned)member, spv::DecorationPerTaskNV);
  6826. } else {
  6827. if (qualifier.perPrimitiveNV) {
  6828. // Need to add capability/extension for fragment shader.
  6829. // Mesh shader already adds this by default.
  6830. if (glslangIntermediate->getStage() == EShLangFragment) {
  6831. builder.addCapability(spv::CapabilityMeshShadingNV);
  6832. builder.addExtension(spv::E_SPV_NV_mesh_shader);
  6833. }
  6834. builder.addDecoration(id, spv::DecorationPerPrimitiveNV);
  6835. }
  6836. if (qualifier.perViewNV)
  6837. builder.addDecoration(id, spv::DecorationPerViewNV);
  6838. if (qualifier.perTaskNV)
  6839. builder.addDecoration(id, spv::DecorationPerTaskNV);
  6840. }
  6841. }
  6842. #endif
  6843. // Make a full tree of instructions to build a SPIR-V specialization constant,
  6844. // or regular constant if possible.
  6845. //
  6846. // TBD: this is not yet done, nor verified to be the best design, it does do the leaf symbols though
  6847. //
  6848. // Recursively walk the nodes. The nodes form a tree whose leaves are
  6849. // regular constants, which themselves are trees that createSpvConstant()
  6850. // recursively walks. So, this function walks the "top" of the tree:
  6851. // - emit specialization constant-building instructions for specConstant
  6852. // - when running into a non-spec-constant, switch to createSpvConstant()
  6853. spv::Id TGlslangToSpvTraverser::createSpvConstant(const glslang::TIntermTyped& node)
  6854. {
  6855. assert(node.getQualifier().isConstant());
  6856. // Handle front-end constants first (non-specialization constants).
  6857. if (! node.getQualifier().specConstant) {
  6858. // hand off to the non-spec-constant path
  6859. assert(node.getAsConstantUnion() != nullptr || node.getAsSymbolNode() != nullptr);
  6860. int nextConst = 0;
  6861. return createSpvConstantFromConstUnionArray(node.getType(), node.getAsConstantUnion() ? node.getAsConstantUnion()->getConstArray() : node.getAsSymbolNode()->getConstArray(),
  6862. nextConst, false);
  6863. }
  6864. // We now know we have a specialization constant to build
  6865. // gl_WorkGroupSize is a special case until the front-end handles hierarchical specialization constants,
  6866. // even then, it's specialization ids are handled by special case syntax in GLSL: layout(local_size_x = ...
  6867. if (node.getType().getQualifier().builtIn == glslang::EbvWorkGroupSize) {
  6868. std::vector<spv::Id> dimConstId;
  6869. for (int dim = 0; dim < 3; ++dim) {
  6870. bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
  6871. dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
  6872. if (specConst) {
  6873. builder.addDecoration(dimConstId.back(), spv::DecorationSpecId,
  6874. glslangIntermediate->getLocalSizeSpecId(dim));
  6875. }
  6876. }
  6877. return builder.makeCompositeConstant(builder.makeVectorType(builder.makeUintType(32), 3), dimConstId, true);
  6878. }
  6879. // An AST node labelled as specialization constant should be a symbol node.
  6880. // Its initializer should either be a sub tree with constant nodes, or a constant union array.
  6881. if (auto* sn = node.getAsSymbolNode()) {
  6882. spv::Id result;
  6883. if (auto* sub_tree = sn->getConstSubtree()) {
  6884. // Traverse the constant constructor sub tree like generating normal run-time instructions.
  6885. // During the AST traversal, if the node is marked as 'specConstant', SpecConstantOpModeGuard
  6886. // will set the builder into spec constant op instruction generating mode.
  6887. sub_tree->traverse(this);
  6888. result = accessChainLoad(sub_tree->getType());
  6889. } else if (auto* const_union_array = &sn->getConstArray()) {
  6890. int nextConst = 0;
  6891. result = createSpvConstantFromConstUnionArray(sn->getType(), *const_union_array, nextConst, true);
  6892. } else {
  6893. logger->missingFunctionality("Invalid initializer for spec onstant.");
  6894. return spv::NoResult;
  6895. }
  6896. builder.addName(result, sn->getName().c_str());
  6897. return result;
  6898. }
  6899. // Neither a front-end constant node, nor a specialization constant node with constant union array or
  6900. // constant sub tree as initializer.
  6901. logger->missingFunctionality("Neither a front-end constant nor a spec constant.");
  6902. return spv::NoResult;
  6903. }
  6904. // Use 'consts' as the flattened glslang source of scalar constants to recursively
  6905. // build the aggregate SPIR-V constant.
  6906. //
  6907. // If there are not enough elements present in 'consts', 0 will be substituted;
  6908. // an empty 'consts' can be used to create a fully zeroed SPIR-V constant.
  6909. //
  6910. spv::Id TGlslangToSpvTraverser::createSpvConstantFromConstUnionArray(const glslang::TType& glslangType, const glslang::TConstUnionArray& consts, int& nextConst, bool specConstant)
  6911. {
  6912. // vector of constants for SPIR-V
  6913. std::vector<spv::Id> spvConsts;
  6914. // Type is used for struct and array constants
  6915. spv::Id typeId = convertGlslangToSpvType(glslangType);
  6916. if (glslangType.isArray()) {
  6917. glslang::TType elementType(glslangType, 0);
  6918. for (int i = 0; i < glslangType.getOuterArraySize(); ++i)
  6919. spvConsts.push_back(createSpvConstantFromConstUnionArray(elementType, consts, nextConst, false));
  6920. } else if (glslangType.isMatrix()) {
  6921. glslang::TType vectorType(glslangType, 0);
  6922. for (int col = 0; col < glslangType.getMatrixCols(); ++col)
  6923. spvConsts.push_back(createSpvConstantFromConstUnionArray(vectorType, consts, nextConst, false));
  6924. } else if (glslangType.isCoopMat()) {
  6925. glslang::TType componentType(glslangType.getBasicType());
  6926. spvConsts.push_back(createSpvConstantFromConstUnionArray(componentType, consts, nextConst, false));
  6927. } else if (glslangType.isStruct()) {
  6928. glslang::TVector<glslang::TTypeLoc>::const_iterator iter;
  6929. for (iter = glslangType.getStruct()->begin(); iter != glslangType.getStruct()->end(); ++iter)
  6930. spvConsts.push_back(createSpvConstantFromConstUnionArray(*iter->type, consts, nextConst, false));
  6931. } else if (glslangType.getVectorSize() > 1) {
  6932. for (unsigned int i = 0; i < (unsigned int)glslangType.getVectorSize(); ++i) {
  6933. bool zero = nextConst >= consts.size();
  6934. switch (glslangType.getBasicType()) {
  6935. case glslang::EbtInt8:
  6936. spvConsts.push_back(builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const()));
  6937. break;
  6938. case glslang::EbtUint8:
  6939. spvConsts.push_back(builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const()));
  6940. break;
  6941. case glslang::EbtInt16:
  6942. spvConsts.push_back(builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const()));
  6943. break;
  6944. case glslang::EbtUint16:
  6945. spvConsts.push_back(builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const()));
  6946. break;
  6947. case glslang::EbtInt:
  6948. spvConsts.push_back(builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst()));
  6949. break;
  6950. case glslang::EbtUint:
  6951. spvConsts.push_back(builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst()));
  6952. break;
  6953. case glslang::EbtInt64:
  6954. spvConsts.push_back(builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const()));
  6955. break;
  6956. case glslang::EbtUint64:
  6957. spvConsts.push_back(builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const()));
  6958. break;
  6959. case glslang::EbtFloat:
  6960. spvConsts.push_back(builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  6961. break;
  6962. case glslang::EbtDouble:
  6963. spvConsts.push_back(builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst()));
  6964. break;
  6965. case glslang::EbtFloat16:
  6966. spvConsts.push_back(builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
  6967. break;
  6968. case glslang::EbtBool:
  6969. spvConsts.push_back(builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst()));
  6970. break;
  6971. default:
  6972. assert(0);
  6973. break;
  6974. }
  6975. ++nextConst;
  6976. }
  6977. } else {
  6978. // we have a non-aggregate (scalar) constant
  6979. bool zero = nextConst >= consts.size();
  6980. spv::Id scalar = 0;
  6981. switch (glslangType.getBasicType()) {
  6982. case glslang::EbtInt8:
  6983. scalar = builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const(), specConstant);
  6984. break;
  6985. case glslang::EbtUint8:
  6986. scalar = builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const(), specConstant);
  6987. break;
  6988. case glslang::EbtInt16:
  6989. scalar = builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const(), specConstant);
  6990. break;
  6991. case glslang::EbtUint16:
  6992. scalar = builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const(), specConstant);
  6993. break;
  6994. case glslang::EbtInt:
  6995. scalar = builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst(), specConstant);
  6996. break;
  6997. case glslang::EbtUint:
  6998. scalar = builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst(), specConstant);
  6999. break;
  7000. case glslang::EbtInt64:
  7001. scalar = builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const(), specConstant);
  7002. break;
  7003. case glslang::EbtUint64:
  7004. scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);
  7005. break;
  7006. case glslang::EbtFloat:
  7007. scalar = builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  7008. break;
  7009. case glslang::EbtDouble:
  7010. scalar = builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst(), specConstant);
  7011. break;
  7012. case glslang::EbtFloat16:
  7013. scalar = builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
  7014. break;
  7015. case glslang::EbtBool:
  7016. scalar = builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst(), specConstant);
  7017. break;
  7018. case glslang::EbtReference:
  7019. scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);
  7020. scalar = builder.createUnaryOp(spv::OpBitcast, typeId, scalar);
  7021. break;
  7022. default:
  7023. assert(0);
  7024. break;
  7025. }
  7026. ++nextConst;
  7027. return scalar;
  7028. }
  7029. return builder.makeCompositeConstant(typeId, spvConsts);
  7030. }
  7031. // Return true if the node is a constant or symbol whose reading has no
  7032. // non-trivial observable cost or effect.
  7033. bool TGlslangToSpvTraverser::isTrivialLeaf(const glslang::TIntermTyped* node)
  7034. {
  7035. // don't know what this is
  7036. if (node == nullptr)
  7037. return false;
  7038. // a constant is safe
  7039. if (node->getAsConstantUnion() != nullptr)
  7040. return true;
  7041. // not a symbol means non-trivial
  7042. if (node->getAsSymbolNode() == nullptr)
  7043. return false;
  7044. // a symbol, depends on what's being read
  7045. switch (node->getType().getQualifier().storage) {
  7046. case glslang::EvqTemporary:
  7047. case glslang::EvqGlobal:
  7048. case glslang::EvqIn:
  7049. case glslang::EvqInOut:
  7050. case glslang::EvqConst:
  7051. case glslang::EvqConstReadOnly:
  7052. case glslang::EvqUniform:
  7053. return true;
  7054. default:
  7055. return false;
  7056. }
  7057. }
  7058. // A node is trivial if it is a single operation with no side effects.
  7059. // HLSL (and/or vectors) are always trivial, as it does not short circuit.
  7060. // Otherwise, error on the side of saying non-trivial.
  7061. // Return true if trivial.
  7062. bool TGlslangToSpvTraverser::isTrivial(const glslang::TIntermTyped* node)
  7063. {
  7064. if (node == nullptr)
  7065. return false;
  7066. // count non scalars as trivial, as well as anything coming from HLSL
  7067. if (! node->getType().isScalarOrVec1() || glslangIntermediate->getSource() == glslang::EShSourceHlsl)
  7068. return true;
  7069. // symbols and constants are trivial
  7070. if (isTrivialLeaf(node))
  7071. return true;
  7072. // otherwise, it needs to be a simple operation or one or two leaf nodes
  7073. // not a simple operation
  7074. const glslang::TIntermBinary* binaryNode = node->getAsBinaryNode();
  7075. const glslang::TIntermUnary* unaryNode = node->getAsUnaryNode();
  7076. if (binaryNode == nullptr && unaryNode == nullptr)
  7077. return false;
  7078. // not on leaf nodes
  7079. if (binaryNode && (! isTrivialLeaf(binaryNode->getLeft()) || ! isTrivialLeaf(binaryNode->getRight())))
  7080. return false;
  7081. if (unaryNode && ! isTrivialLeaf(unaryNode->getOperand())) {
  7082. return false;
  7083. }
  7084. switch (node->getAsOperator()->getOp()) {
  7085. case glslang::EOpLogicalNot:
  7086. case glslang::EOpConvIntToBool:
  7087. case glslang::EOpConvUintToBool:
  7088. case glslang::EOpConvFloatToBool:
  7089. case glslang::EOpConvDoubleToBool:
  7090. case glslang::EOpEqual:
  7091. case glslang::EOpNotEqual:
  7092. case glslang::EOpLessThan:
  7093. case glslang::EOpGreaterThan:
  7094. case glslang::EOpLessThanEqual:
  7095. case glslang::EOpGreaterThanEqual:
  7096. case glslang::EOpIndexDirect:
  7097. case glslang::EOpIndexDirectStruct:
  7098. case glslang::EOpLogicalXor:
  7099. case glslang::EOpAny:
  7100. case glslang::EOpAll:
  7101. return true;
  7102. default:
  7103. return false;
  7104. }
  7105. }
  7106. // Emit short-circuiting code, where 'right' is never evaluated unless
  7107. // the left side is true (for &&) or false (for ||).
  7108. spv::Id TGlslangToSpvTraverser::createShortCircuit(glslang::TOperator op, glslang::TIntermTyped& left, glslang::TIntermTyped& right)
  7109. {
  7110. spv::Id boolTypeId = builder.makeBoolType();
  7111. // emit left operand
  7112. builder.clearAccessChain();
  7113. left.traverse(this);
  7114. spv::Id leftId = accessChainLoad(left.getType());
  7115. // Operands to accumulate OpPhi operands
  7116. std::vector<spv::Id> phiOperands;
  7117. // accumulate left operand's phi information
  7118. phiOperands.push_back(leftId);
  7119. phiOperands.push_back(builder.getBuildPoint()->getId());
  7120. // Make the two kinds of operation symmetric with a "!"
  7121. // || => emit "if (! left) result = right"
  7122. // && => emit "if ( left) result = right"
  7123. //
  7124. // TODO: this runtime "not" for || could be avoided by adding functionality
  7125. // to 'builder' to have an "else" without an "then"
  7126. if (op == glslang::EOpLogicalOr)
  7127. leftId = builder.createUnaryOp(spv::OpLogicalNot, boolTypeId, leftId);
  7128. // make an "if" based on the left value
  7129. spv::Builder::If ifBuilder(leftId, spv::SelectionControlMaskNone, builder);
  7130. // emit right operand as the "then" part of the "if"
  7131. builder.clearAccessChain();
  7132. right.traverse(this);
  7133. spv::Id rightId = accessChainLoad(right.getType());
  7134. // accumulate left operand's phi information
  7135. phiOperands.push_back(rightId);
  7136. phiOperands.push_back(builder.getBuildPoint()->getId());
  7137. // finish the "if"
  7138. ifBuilder.makeEndIf();
  7139. // phi together the two results
  7140. return builder.createOp(spv::OpPhi, boolTypeId, phiOperands);
  7141. }
  7142. #ifdef AMD_EXTENSIONS
  7143. // Return type Id of the imported set of extended instructions corresponds to the name.
  7144. // Import this set if it has not been imported yet.
  7145. spv::Id TGlslangToSpvTraverser::getExtBuiltins(const char* name)
  7146. {
  7147. if (extBuiltinMap.find(name) != extBuiltinMap.end())
  7148. return extBuiltinMap[name];
  7149. else {
  7150. builder.addExtension(name);
  7151. spv::Id extBuiltins = builder.import(name);
  7152. extBuiltinMap[name] = extBuiltins;
  7153. return extBuiltins;
  7154. }
  7155. }
  7156. #endif
  7157. }; // end anonymous namespace
  7158. namespace glslang {
  7159. void GetSpirvVersion(std::string& version)
  7160. {
  7161. const int bufSize = 100;
  7162. char buf[bufSize];
  7163. snprintf(buf, bufSize, "0x%08x, Revision %d", spv::Version, spv::Revision);
  7164. version = buf;
  7165. }
  // Return the generator version, used for the low-order part of the
  // generator's magic number. Bump it up whenever the style of the generated
  // code changes (e.g., if SSA form changes, or a different instruction
  // sequence to do something gets used).
  int GetSpirvGeneratorVersion()
  {
      // Version history:
      //   1: start
      //   2: EOpAtomicCounterDecrement gets a post decrement, to map between GLSL -> SPIR-V
      //   3: change/correct barrier-instruction operands, to match memory model group decisions
      //   4: some deeper access chains: for dynamic vector component, and local Boolean component
      //   5: make OpArrayLength result type be an int with signedness of 0
      //   6: revert version 5 change, which makes a different (new) kind of incorrect code,
      //      versions 4 and 6 each generate OpArrayLength as it has long been done
      //   7: GLSL volatile keyword maps to both SPIR-V decorations Volatile and Coherent
      const int currentVersion = 7;
      return currentVersion;
  }
  // Write SPIR-V out to a binary file.
  //
  // 'spirv' holds the module's words; the first 4 bytes of each word are
  // written to the file named 'baseName', in order and in host byte order.
  // If the file cannot be opened, an error is printed to stdout and nothing
  // is written.
  void OutputSpvBin(const std::vector<unsigned int>& spirv, const char* baseName)
  {
      std::ofstream out;
      out.open(baseName, std::ios::binary | std::ios::out);
      if (out.fail()) {
          printf("ERROR: Failed to open file: %s\n", baseName);
          // there is no stream to write to; do not run the write loop against it
          return;
      }

      for (const unsigned int word : spirv)
          out.write(reinterpret_cast<const char*>(&word), 4);

      out.close();
  }
  7193. // Write SPIR-V out to a text file with 32-bit hexadecimal words
  7194. void OutputSpvHex(const std::vector<unsigned int>& spirv, const char* baseName, const char* varName)
  7195. {
  7196. std::ofstream out;
  7197. out.open(baseName, std::ios::binary | std::ios::out);
  7198. if (out.fail())
  7199. printf("ERROR: Failed to open file: %s\n", baseName);
  7200. out << "\t// " <<
  7201. GetSpirvGeneratorVersion() << "." << GLSLANG_MINOR_VERSION << "." << GLSLANG_PATCH_LEVEL <<
  7202. std::endl;
  7203. if (varName != nullptr) {
  7204. out << "\t #pragma once" << std::endl;
  7205. out << "const uint32_t " << varName << "[] = {" << std::endl;
  7206. }
  7207. const int WORDS_PER_LINE = 8;
  7208. for (int i = 0; i < (int)spirv.size(); i += WORDS_PER_LINE) {
  7209. out << "\t";
  7210. for (int j = 0; j < WORDS_PER_LINE && i + j < (int)spirv.size(); ++j) {
  7211. const unsigned int word = spirv[i + j];
  7212. out << "0x" << std::hex << std::setw(8) << std::setfill('0') << word;
  7213. if (i + j + 1 < (int)spirv.size()) {
  7214. out << ",";
  7215. }
  7216. }
  7217. out << std::endl;
  7218. }
  7219. if (varName != nullptr) {
  7220. out << "};";
  7221. }
  7222. out.close();
  7223. }
  7224. //
  7225. // Set up the glslang traversal
  7226. //
  7227. void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv, SpvOptions* options)
  7228. {
  7229. spv::SpvBuildLogger logger;
  7230. GlslangToSpv(intermediate, spirv, &logger, options);
  7231. }
  7232. void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv,
  7233. spv::SpvBuildLogger* logger, SpvOptions* options)
  7234. {
  7235. TIntermNode* root = intermediate.getTreeRoot();
  7236. if (root == 0)
  7237. return;
  7238. SpvOptions defaultOptions;
  7239. if (options == nullptr)
  7240. options = &defaultOptions;
  7241. GetThreadPoolAllocator().push();
  7242. TGlslangToSpvTraverser it(intermediate.getSpv().spv, &intermediate, logger, *options);
  7243. root->traverse(&it);
  7244. it.finishSpv();
  7245. it.dumpSpv(spirv);
  7246. #if ENABLE_OPT
  7247. // If from HLSL, run spirv-opt to "legalize" the SPIR-V for Vulkan
  7248. // eg. forward and remove memory writes of opaque types.
  7249. if ((intermediate.getSource() == EShSourceHlsl || options->optimizeSize) && !options->disableOptimizer)
  7250. SpirvToolsLegalize(intermediate, spirv, logger, options);
  7251. if (options->validate)
  7252. SpirvToolsValidate(intermediate, spirv, logger);
  7253. if (options->disassemble)
  7254. SpirvToolsDisassemble(std::cout, spirv);
  7255. #endif
  7256. GetThreadPoolAllocator().pop();
  7257. }
  7258. }; // end namespace glslang