BeMCContext.cpp 475 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388238923902391239223932394239523962397239823992400240124022403240424052406240724082409241024112412241324142415241624172418241924202421242224232424242524262427242824292430243124322433243424352436243724382439244024412442244324442445244624472448244924502451245224532454245524562457245824592460246124622463246424652466246724682469247024712472247324742475247624772478247924802481248224832484248524862487248824892490249124922493249424952496249724982499250025012502250325042505250625072508250925102511251225132514251525162517251825192520252125222523252425252526252725282529253025312532253325342535253625372538253925402541254225432544254525462547254825492550255125522553255425552556255725582559256025612562256325642565256625672568256925702571257225732574257525762577257825792580258125822583258425852586258725882589259025912592259325942595259625972598259926002601260226032604260526062607260826092610261126122613261426152616261726182619262026212622262326242625262626272628262926302631263226332634263526362637263826392640264126422643264426452646264726482649265026512652265326542655265626572658265926602661266226632664266526662667266826692670267126722673267426752676267726782679268026812682268326842685268626872688268926902691269226932694269526962697269826992700270127022703270427052706270727082709271027112712271327142715271627172718271927202721272227232724272527262727272827292730273127322733273427352736273727382739274027412742274327442745274627472748274927502751275227532754275527562757275827592760276127622763276427652766276727682769277027712772277327742775277627772778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327732783279328032813282328332843285328632873288328932903291329232933294329532963297329832993300330133023303330433053306330733083309331033113312331333143315331633173318331933203321332233233324332533263327332833293330333133323333333433353336333733383339334033413342334333443345334633473348334933503351335233533354335533563357335833593360336133623363336433653366336733683369337033713372337333743375337633773378337933803381338233833384338533863387338833893390339133923393339433953396339733983399340034013402340334043405340634073408340934103411341234133414341534163417341834193420342134223423342434253426342734283429343034313432343334343435343634373438343934403441344234433444344534463447344834493450345134523453345434553456345734583459346034613462346334643465346634673468346934703471347234733474347534763477347834793480348134823483348434853486348734883489349034913492349334943495349634973498349935003501350235033504350535063507350835093510351135123513351435153516351735183519352035213522352335243525352635273528352935303531353235333534353535363537353835393540354135423543354435453546354735483549355035513552355335543555355635573558355935603561356235633564356535663567356835693570357135723573357435753576357735783579358035813582358335843585358635873588358935903591359235933594359535963597359835993600360136023603360436053606360736083609361036113612361336143615361636173618361936203621362236233624362536263627362836293630363136323633363436353636363736383639364036413642364336443645364636473648364936503651365236533654365536563657365836593660366136623663366436653666366736683669367036713672367336743675367636773678367936803681368236833684368536863687368836893690369136923693369436953696369736983699370037013702370337043705370637073708370937103711371237133714371537163717371837193720372137223723372437253726372737283729373037313732373337343735373637373738373937403741374237433744374537463747374837493750375137523753375437553756375737583759376037613762376337643765376637673768376937703771377237733774377537763777377837793780378137823783378437853786378737883789379037913792379337943795379637973798379938003801380238033804380538063807380838093810381138123813381438153816381738183819382038213822382338243825382638273828382938303831383238333834383538363837383838393840384138423843384438453846384738483849385038513852385338543855385638573858385938603861386238633864386538663867386838693870387138723873387438753876387738783879388038813882388338843885388638873888388938903891389238933894389538963897389838993900390139023903390439053906390739083909391039113912391339143915391639173918391939203921392239233924392539263927392839293930393139323933393439353936393739383939394039413942394339443945394639473948394939503951395239533954395539563957395839593960396139623963396439653966396739683969397039713972397339743975397639773978397939803981398239833984398539863987398839893990399139923993399439953996399739983999400040014002400340044005400640074008400940104011401240134014401540164017401840194020402140224023402440254026402740284029403040314032403340344035403640374038403940404041404240434044404540464047404840494050405140524053405440554056405740584059406040614062406340644065406640674068406940704071407240734074407540764077407840794080408140824083408440854086408740884089409040914092409340944095409640974098409941004101410241034104410541064107410841094110411141124113411441154116411741184119412041214122412341244125412641274128412941304131413241334134413541364137413841394140414141424143414441454146414741484149415041514152415341544155415641574158415941604161416241634164416541664167416841694170417141724173417441754176417741784179418041814182418341844185418641874188418941904191419241934194419541964197419841994200420142024203420442054206420742084209421042114212421342144215421642174218421942204221422242234224422542264227422842294230423142324233423442354236423742384239424042414242424342444245424642474248424942504251425242534254425542564257425842594260426142624263426442654266426742684269427042714272427342744275427642774278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477747784779478047814782478347844785478647874788478947904791479247934794479547964797479847994800480148024803480448054806480748084809481048114812481348144815481648174818481948204821482248234824482548264827482848294830483148324833483448354836483748384839484048414842484348444845484648474848484948504851485248534854485548564857485848594860486148624863486448654866486748684869487048714872487348744875487648774878487948804881488248834884488548864887488848894890489148924893489448954896489748984899490049014902490349044905490649074908490949104911491249134914491549164917491849194920492149224923492449254926492749284929493049314932493349344935493649374938493949404941494249434944494549464947494849494950495149524953495449554956495749584959496049614962496349644965496649674968496949704971497249734974497549764977497849794980498149824983498449854986498749884989499049914992499349944995499649974998499950005001500250035004500550065007500850095010501150125013501450155016501750185019502050215022502350245025502650275028502950305031503250335034503550365037503850395040504150425043504450455046504750485049505050515052505350545055505650575058505950605061506250635064506550665067506850695070507150725073507450755076507750785079508050815082508350845085508650875088508950905091509250935094509550965097509850995100510151025103510451055106510751085109511051115112511351145115511651175118511951205121512251235124512551265127512851295130513151325133513451355136513751385139514051415142514351445145514651475148514951505151515251535154515551565157515851595160516151625163516451655166516751685169517051715172517351745175517651775178517951805181518251835184518551865187518851895190519151925193519451955196519751985199520052015202520352045205520652075208520952105211521252135214521552165217521852195220522152225223522452255226522752285229523052315232523352345235523652375238523952405241524252435244524552465247524852495250525152525253525452555256525752585259526052615262526352645265526652675268526952705271527252735274527552765277527852795280528152825283528452855286528752885289529052915292529352945295529652975298529953005301530253035304530553065307530853095310531153125313531453155316531753185319532053215322532353245325532653275328532953305331533253335334533553365337533853395340534153425343534453455346534753485349535053515352535353545355535653575358535953605361536253635364536553665367536853695370537153725373537453755376537753785379538053815382538353845385538653875388538953905391539253935394539553965397539853995400540154025403540454055406540754085409541054115412541354145415541654175418541954205421542254235424542554265427542854295430543154325433543454355436543754385439544054415442544354445445544654475448544954505451545254535454545554565457545854595460546154625463546454655466546754685469547054715472547354745475547654775478547954805481548254835484548554865487548854895490549154925493549454955496549754985499550055015502550355045505550655075508550955105511551255135514551555165517551855195520552155225523552455255526552755285529553055315532553355345535553655375538553955405541554255435544554555465547554855495550555155525553555455555556555755585559556055615562556355645565556655675568556955705571557255735574557555765577557855795580558155825583558455855586558755885589559055915592559355945595559655975598559956005601560256035604560556065607560856095610561156125613561456155616561756185619562056215622562356245625562656275628562956305631563256335634563556365637563856395640564156425643564456455646564756485649565056515652565356545655565656575658565956605661566256635664566556665667566856695670567156725673567456755676567756785679568056815682568356845685568656875688568956905691569256935694569556965697569856995700570157025703570457055706570757085709571057115712571357145715571657175718571957205721572257235724572557265727572857295730573157325733573457355736573757385739574057415742574357445745574657475748574957505751575257535754575557565757575857595760576157625763576457655766576757685769577057715772577357745775577657775778577957805781578257835784578557865787578857895790579157925793579457955796579757985799580058015802580358045805580658075808580958105811581258135814581558165817581858195820582158225823582458255826582758285829583058315832583358345835583658375838583958405841584258435844584558465847584858495850585158525853585458555856585758585859586058615862586358645865586658675868586958705871587258735874587558765877587858795880588158825883588458855886588758885889589058915892589358945895589658975898589959005901590259035904590559065907590859095910591159125913591459155916591759185919592059215922592359245925592659275928592959305931593259335934593559365937593859395940594159425943594459455946594759485949595059515952595359545955595659575958595959605961596259635964596559665967596859695970597159725973597459755976597759785979598059815982598359845985598659875988598959905991599259935994599559965997599859996000600160026003600460056006600760086009601060116012601360146015601660176018601960206021602260236024602560266027602860296030603160326033603460356036603760386039604060416042604360446045604660476048604960506051605260536054605560566057605860596060606160626063606460656066606760686069607060716072607360746075607660776078607960806081608260836084608560866087608860896090609160926093609460956096609760986099610061016102610361046105610661076108610961106111611261136114611561166117611861196120612161226123612461256126612761286129613061316132613361346135613661376138613961406141614261436144614561466147614861496150615161526153615461556156615761586159616061616162616361646165616661676168616961706171617261736174617561766177617861796180618161826183618461856186618761886189619061916192619361946195619661976198619962006201620262036204620562066207620862096210621162126213621462156216621762186219622062216222622362246225622662276228622962306231623262336234623562366237623862396240624162426243624462456246624762486249625062516252625362546255625662576258625962606261626262636264626562666267626862696270627162726273627462756276627762786279628062816282628362846285628662876288628962906291629262936294629562966297629862996300630163026303630463056306630763086309631063116312631363146315631663176318631963206321632263236324632563266327632863296330633163326333633463356336633763386339634063416342634363446345634663476348634963506351635263536354635563566357635863596360636163626363636463656366636763686369637063716372637363746375637663776378637963806381638263836384638563866387638863896390639163926393639463956396639763986399640064016402640364046405640664076408640964106411641264136414641564166417641864196420642164226423642464256426642764286429643064316432643364346435643664376438643964406441644264436444644564466447644864496450645164526453645464556456645764586459646064616462646364646465646664676468646964706471647264736474647564766477647864796480648164826483648464856486648764886489649064916492649364946495649664976498649965006501650265036504650565066507650865096510651165126513651465156516651765186519652065216522652365246525652665276528652965306531653265336534653565366537653865396540654165426543654465456546654765486549655065516552655365546555655665576558655965606561656265636564656565666567656865696570657165726573657465756576657765786579658065816582658365846585658665876588658965906591659265936594659565966597659865996600660166026603660466056606660766086609661066116612661366146615661666176618661966206621662266236624662566266627662866296630663166326633663466356636663766386639664066416642664366446645664666476648664966506651665266536654665566566657665866596660666166626663666466656666666766686669667066716672667366746675667666776678667966806681668266836684668566866687668866896690669166926693669466956696669766986699670067016702670367046705670667076708670967106711671267136714671567166717671867196720672167226723672467256726672767286729673067316732673367346735673667376738673967406741674267436744674567466747674867496750675167526753675467556756675767586759676067616762676367646765676667676768676967706771677267736774677567766777677867796780678167826783678467856786678767886789679067916792679367946795679667976798679968006801680268036804680568066807680868096810681168126813681468156816681768186819682068216822682368246825682668276828682968306831683268336834683568366837683868396840684168426843684468456846684768486849685068516852685368546855685668576858685968606861686268636864686568666867686868696870687168726873687468756876687768786879688068816882688368846885688668876888688968906891689268936894689568966897689868996900690169026903690469056906690769086909691069116912691369146915691669176918691969206921692269236924692569266927692869296930693169326933693469356936693769386939694069416942694369446945694669476948694969506951695269536954695569566957695869596960696169626963696469656966696769686969697069716972697369746975697669776978697969806981698269836984698569866987698869896990699169926993699469956996699769986999700070017002700370047005700670077008700970107011701270137014701570167017701870197020702170227023702470257026702770287029703070317032703370347035703670377038703970407041704270437044704570467047704870497050705170527053705470557056705770587059706070617062706370647065706670677068706970707071707270737074707570767077707870797080708170827083708470857086708770887089709070917092709370947095709670977098709971007101710271037104710571067107710871097110711171127113711471157116711771187119712071217122712371247125712671277128712971307131713271337134713571367137713871397140714171427143714471457146714771487149715071517152715371547155715671577158715971607161716271637164716571667167716871697170717171727173717471757176717771787179718071817182718371847185718671877188718971907191719271937194719571967197719871997200720172027203720472057206720772087209721072117212721372147215721672177218721972207221722272237224722572267227722872297230723172327233723472357236723772387239724072417242724372447245724672477248724972507251725272537254725572567257725872597260726172627263726472657266726772687269727072717272727372747275727672777278727972807281728272837284728572867287728872897290729172927293729472957296729772987299730073017302730373047305730673077308730973107311731273137314731573167317731873197320732173227323732473257326732773287329733073317332733373347335733673377338733973407341734273437344734573467347734873497350735173527353735473557356735773587359736073617362736373647365736673677368736973707371737273737374737573767377737873797380738173827383738473857386738773887389739073917392739373947395739673977398739974007401740274037404740574067407740874097410741174127413741474157416741774187419742074217422742374247425742674277428742974307431743274337434743574367437743874397440744174427443744474457446744774487449745074517452745374547455745674577458745974607461746274637464746574667467746874697470747174727473747474757476747774787479748074817482748374847485748674877488748974907491749274937494749574967497749874997500750175027503750475057506750775087509751075117512751375147515751675177518751975207521752275237524752575267527752875297530753175327533753475357536753775387539754075417542754375447545754675477548754975507551755275537554755575567557755875597560756175627563756475657566756775687569757075717572757375747575757675777578757975807581758275837584758575867587758875897590759175927593759475957596759775987599760076017602760376047605760676077608760976107611761276137614761576167617761876197620762176227623762476257626762776287629763076317632763376347635763676377638763976407641764276437644764576467647764876497650765176527653765476557656765776587659766076617662766376647665766676677668766976707671767276737674767576767677767876797680768176827683768476857686768776887689769076917692769376947695769676977698769977007701770277037704770577067707770877097710771177127713771477157716771777187719772077217722772377247725772677277728772977307731773277337734773577367737773877397740774177427743774477457746774777487749775077517752775377547755775677577758775977607761776277637764776577667767776877697770777177727773777477757776777777787779778077817782778377847785778677877788778977907791779277937794779577967797779877997800780178027803780478057806780778087809781078117812781378147815781678177818781978207821782278237824782578267827782878297830783178327833783478357836783778387839784078417842784378447845784678477848784978507851785278537854785578567857785878597860786178627863786478657866786778687869787078717872787378747875787678777878787978807881788278837884788578867887788878897890789178927893789478957896789778987899790079017902790379047905790679077908790979107911791279137914791579167917791879197920792179227923792479257926792779287929793079317932793379347935793679377938793979407941794279437944794579467947794879497950795179527953795479557956795779587959796079617962796379647965796679677968796979707971797279737974797579767977797879797980798179827983798479857986798779887989799079917992799379947995799679977998799980008001800280038004800580068007800880098010801180128013801480158016801780188019802080218022802380248025802680278028802980308031803280338034803580368037803880398040804180428043804480458046804780488049805080518052805380548055805680578058805980608061806280638064806580668067806880698070807180728073807480758076807780788079808080818082808380848085808680878088808980908091809280938094809580968097809880998100810181028103810481058106810781088109811081118112811381148115811681178118811981208121812281238124812581268127812881298130813181328133813481358136813781388139814081418142814381448145814681478148814981508151815281538154815581568157815881598160816181628163816481658166816781688169817081718172817381748175817681778178817981808181818281838184818581868187818881898190819181928193819481958196819781988199820082018202820382048205820682078208820982108211821282138214821582168217821882198220822182228223822482258226822782288229823082318232823382348235823682378238823982408241824282438244824582468247824882498250825182528253825482558256825782588259826082618262826382648265826682678268826982708271827282738274827582768277827882798280828182828283828482858286828782888289829082918292829382948295829682978298829983008301830283038304830583068307830883098310831183128313831483158316831783188319832083218322832383248325832683278328832983308331833283338334833583368337833883398340834183428343834483458346834783488349835083518352835383548355835683578358835983608361836283638364836583668367836883698370837183728373837483758376837783788379838083818382838383848385838683878388838983908391839283938394839583968397839883998400840184028403840484058406840784088409841084118412841384148415841684178418841984208421842284238424842584268427842884298430843184328433843484358436843784388439844084418442844384448445844684478448844984508451845284538454845584568457845884598460846184628463846484658466846784688469847084718472847384748475847684778478847984808481848284838484848584868487848884898490849184928493849484958496849784988499850085018502850385048505850685078508850985108511851285138514851585168517851885198520852185228523852485258526852785288529853085318532853385348535853685378538853985408541854285438544854585468547854885498550855185528553855485558556855785588559856085618562856385648565856685678568856985708571857285738574857585768577857885798580858185828583858485858586858785888589859085918592859385948595859685978598859986008601860286038604860586068607860886098610861186128613861486158616861786188619862086218622862386248625862686278628862986308631863286338634863586368637863886398640864186428643864486458646864786488649865086518652865386548655865686578658865986608661866286638664866586668667866886698670867186728673867486758676867786788679868086818682868386848685868686878688868986908691869286938694869586968697869886998700870187028703870487058706870787088709871087118712871387148715871687178718871987208721872287238724872587268727872887298730873187328733873487358736873787388739874087418742874387448745874687478748874987508751875287538754875587568757875887598760876187628763876487658766876787688769877087718772877387748775877687778778877987808781878287838784878587868787878887898790879187928793879487958796879787988799880088018802880388048805880688078808880988108811881288138814881588168817881888198820882188228823882488258826882788288829883088318832883388348835883688378838883988408841884288438844884588468847884888498850885188528853885488558856885788588859886088618862886388648865886688678868886988708871887288738874887588768877887888798880888188828883888488858886888788888889889088918892889388948895889688978898889989008901890289038904890589068907890889098910891189128913891489158916891789188919892089218922892389248925892689278928892989308931893289338934893589368937893889398940894189428943894489458946894789488949895089518952895389548955895689578958895989608961896289638964896589668967896889698970897189728973897489758976897789788979898089818982898389848985898689878988898989908991899289938994899589968997899889999000900190029003900490059006900790089009901090119012901390149015901690179018901990209021902290239024902590269027902890299030903190329033903490359036903790389039904090419042904390449045904690479048904990509051905290539054905590569057905890599060906190629063906490659066906790689069907090719072907390749075907690779078907990809081908290839084908590869087908890899090909190929093909490959096909790989099910091019102910391049105910691079108910991109111911291139114911591169117911891199120912191229123912491259126912791289129913091319132913391349135913691379138913991409141914291439144914591469147914891499150915191529153915491559156915791589159916091619162916391649165916691679168916991709171917291739174917591769177917891799180918191829183918491859186918791889189919091919192919391949195919691979198919992009201920292039204920592069207920892099210921192129213921492159216921792189219922092219222922392249225922692279228922992309231923292339234923592369237923892399240924192429243924492459246924792489249925092519252925392549255925692579258925992609261926292639264926592669267926892699270927192729273927492759276927792789279928092819282928392849285928692879288928992909291929292939294929592969297929892999300930193029303930493059306930793089309931093119312931393149315931693179318931993209321932293239324932593269327932893299330933193329333933493359336933793389339934093419342934393449345934693479348934993509351935293539354935593569357935893599360936193629363936493659366936793689369937093719372937393749375937693779378937993809381938293839384938593869387938893899390939193929393939493959396939793989399940094019402940394049405940694079408940994109411941294139414941594169417941894199420942194229423942494259426942794289429943094319432943394349435943694379438943994409441944294439444944594469447944894499450945194529453945494559456945794589459946094619462946394649465946694679468946994709471947294739474947594769477947894799480948194829483948494859486948794889489949094919492949394949495949694979498949995009501950295039504950595069507950895099510951195129513951495159516951795189519952095219522952395249525952695279528952995309531953295339534953595369537953895399540954195429543954495459546954795489549955095519552955395549555955695579558955995609561956295639564956595669567956895699570957195729573957495759576957795789579958095819582958395849585958695879588958995909591959295939594959595969597959895999600960196029603960496059606960796089609961096119612961396149615961696179618961996209621962296239624962596269627962896299630963196329633963496359636963796389639964096419642964396449645964696479648964996509651965296539654965596569657965896599660966196629663966496659666966796689669967096719672967396749675967696779678967996809681968296839684968596869687968896899690969196929693969496959696969796989699970097019702970397049705970697079708970997109711971297139714971597169717971897199720972197229723972497259726972797289729973097319732973397349735973697379738973997409741974297439744974597469747974897499750975197529753975497559756975797589759976097619762976397649765976697679768976997709771977297739774977597769777977897799780978197829783978497859786978797889789979097919792979397949795979697979798979998009801980298039804980598069807980898099810981198129813981498159816981798189819982098219822982398249825982698279828982998309831983298339834983598369837983898399840984198429843984498459846984798489849985098519852985398549855985698579858985998609861986298639864986598669867986898699870987198729873987498759876987798789879988098819882988398849885988698879888988998909891989298939894989598969897989898999900990199029903990499059906990799089909991099119912991399149915991699179918991999209921992299239924992599269927992899299930993199329933993499359936993799389939994099419942994399449945994699479948994999509951995299539954995599569957995899599960996199629963996499659966996799689969997099719972997399749975997699779978997999809981998299839984998599869987998899899990999199929993999499959996999799989999100001000110002100031000410005100061000710008100091001010011100121001310014100151001610017100181001910020100211002210023100241002510026100271002810029100301003110032100331003410035100361003710038100391004010041100421004310044100451004610047100481004910050100511005210053100541005510056100571005810059100601006110062100631006410065100661006710068100691007010071100721007310074100751007610077100781007910080100811008210083100841008510086100871008810089100901009110092100931009410095100961009710098100991010010101101021010310104101051010610107101081010910110101111011210113101141011510116101171011810119101201012110122101231012410125101261012710128101291013010131101321013310134101351013610137101381013910140101411014210143101441014510146101471014810149101501015110152101531015410155101561015710158101591016010161101621016310164101651016610167101681016910170101711017210173101741017510176101771017810179101801018110182101831018410185101861018710188101891019010191101921019310194101951019610197101981019910200102011020210203102041020510206102071020810209102101021110212102131021410215102161021710218102191022010221102221022310224102251022610227102281022910230102311023210233102341023510236102371023810239102401024110242102431024410245102461024710248102491025010251102521025310254102551025610257102581025910260102611026210263102641026510266102671026810269102701027110272102731027410275102761027710278102791028010281102821028310284102851028610287102881028910290102911029210293102941029510296102971029810299103001030110302103031030410305103061030710308103091031010311103121031310314103151031610317103181031910320103211032210323103241032510326103271032810329103301033110332103331033410335103361033710338103391034010341103421034310344103451034610347103481034910350103511035210353103541035510356103571035810359103601036110362103631036410365103661036710368103691037010371103721037310374103751037610377103781037910380103811038210383103841038510386103871038810389103901039110392103931039410395103961039710398103991040010401104021040310404104051040610407104081040910410104111041210413104141041510416104171041810419104201042110422104231042410425104261042710428104291043010431104321043310434104351043610437104381043910440104411044210443104441044510446104471044810449104501045110452104531045410455104561045710458104591046010461104621046310464104651046610467104681046910470104711047210473104741047510476104771047810479104801048110482104831048410485104861048710488104891049010491104921049310494104951049610497104981049910500105011050210503105041050510506105071050810509105101051110512105131051410515105161051710518105191052010521105221052310524105251052610527105281052910530105311053210533105341053510536105371053810539105401054110542105431054410545105461054710548105491055010551105521055310554105551055610557105581055910560105611056210563105641056510566105671056810569105701057110572105731057410575105761057710578105791058010581105821058310584105851058610587105881058910590105911059210593105941059510596105971059810599106001060110602106031060410605106061060710608106091061010611106121061310614106151061610617106181061910620106211062210623106241062510626106271062810629106301063110632106331063410635106361063710638106391064010641106421064310644106451064610647106481064910650106511065210653106541065510656106571065810659106601066110662106631066410665106661066710668106691067010671106721067310674106751067610677106781067910680106811068210683106841068510686106871068810689106901069110692106931069410695106961069710698106991070010701107021070310704107051070610707107081070910710107111071210713107141071510716107171071810719107201072110722107231072410725107261072710728107291073010731107321073310734107351073610737107381073910740107411074210743107441074510746107471074810749107501075110752107531075410755107561075710758107591076010761107621076310764107651076610767107681076910770107711077210773107741077510776107771077810779107801078110782107831078410785107861078710788107891079010791107921079310794107951079610797107981079910800108011080210803108041080510806108071080810809108101081110812108131081410815108161081710818108191082010821108221082310824108251082610827108281082910830108311083210833108341083510836108371083810839108401084110842108431084410845108461084710848108491085010851108521085310854108551085610857108581085910860108611086210863108641086510866108671086810869108701087110872108731087410875108761087710878108791088010881108821088310884108851088610887108881088910890108911089210893108941089510896108971089810899109001090110902109031090410905109061090710908109091091010911109121091310914109151091610917109181091910920109211092210923109241092510926109271092810929109301093110932109331093410935109361093710938109391094010941109421094310944109451094610947109481094910950109511095210953109541095510956109571095810959109601096110962109631096410965109661096710968109691097010971109721097310974109751097610977109781097910980109811098210983109841098510986109871098810989109901099110992109931099410995109961099710998109991100011001110021100311004110051100611007110081100911010110111101211013110141101511016110171101811019110201102111022110231102411025110261102711028110291103011031110321103311034110351103611037110381103911040110411104211043110441104511046110471104811049110501105111052110531105411055110561105711058110591106011061110621106311064110651106611067110681106911070110711107211073110741107511076110771107811079110801108111082110831108411085110861108711088110891109011091110921109311094110951109611097110981109911100111011110211103111041110511106111071110811109111101111111112111131111411115111161111711118111191112011121111221112311124111251112611127111281112911130111311113211133111341113511136111371113811139111401114111142111431114411145111461114711148111491115011151111521115311154111551115611157111581115911160111611116211163111641116511166111671116811169111701117111172111731117411175111761117711178111791118011181111821118311184111851118611187111881118911190111911119211193111941119511196111971119811199112001120111202112031120411205112061120711208112091121011211112121121311214112151121611217112181121911220112211122211223112241122511226112271122811229112301123111232112331123411235112361123711238112391124011241112421124311244112451124611247112481124911250112511125211253112541125511256112571125811259112601126111262112631126411265112661126711268112691127011271112721127311274112751127611277112781127911280112811128211283112841128511286112871128811289112901129111292112931129411295112961129711298112991130011301113021130311304113051130611307113081130911310113111131211313113141131511316113171131811319113201132111322113231132411325113261132711328113291133011331113321133311334113351133611337113381133911340113411134211343113441134511346113471134811349113501135111352113531135411355113561135711358113591136011361113621136311364113651136611367113681136911370113711137211373113741137511376113771137811379113801138111382113831138411385113861138711388113891139011391113921139311394113951139611397113981139911400114011140211403114041140511406114071140811409114101141111412114131141411415114161141711418114191142011421114221142311424114251142611427114281142911430114311143211433114341143511436114371143811439114401144111442114431144411445114461144711448114491145011451114521145311454114551145611457114581145911460114611146211463114641146511466114671146811469114701147111472114731147411475114761147711478114791148011481114821148311484114851148611487114881148911490114911149211493114941149511496114971149811499115001150111502115031150411505115061150711508115091151011511115121151311514115151151611517115181151911520115211152211523115241152511526115271152811529115301153111532115331153411535115361153711538115391154011541115421154311544115451154611547115481154911550115511155211553115541155511556115571155811559115601156111562115631156411565115661156711568115691157011571115721157311574115751157611577115781157911580115811158211583115841158511586115871158811589115901159111592115931159411595115961159711598115991160011601116021160311604116051160611607116081160911610116111161211613116141161511616116171161811619116201162111622116231162411625116261162711628116291163011631116321163311634116351163611637116381163911640116411164211643116441164511646116471164811649116501165111652116531165411655116561165711658116591166011661116621166311664116651166611667116681166911670116711167211673116741167511676116771167811679116801168111682116831168411685116861168711688116891169011691116921169311694116951169611697116981169911700117011170211703117041170511706117071170811709117101171111712117131171411715117161171711718117191172011721117221172311724117251172611727117281172911730117311173211733117341173511736117371173811739117401174111742117431174411745117461174711748117491175011751117521175311754117551175611757117581175911760117611176211763117641176511766117671176811769117701177111772117731177411775117761177711778117791178011781117821178311784117851178611787117881178911790117911179211793117941179511796117971179811799118001180111802118031180411805118061180711808118091181011811118121181311814118151181611817118181181911820118211182211823118241182511826118271182811829118301183111832118331183411835118361183711838118391184011841118421184311844118451184611847118481184911850118511185211853118541185511856118571185811859118601186111862118631186411865118661186711868118691187011871118721187311874118751187611877118781187911880118811188211883118841188511886118871188811889118901189111892118931189411895118961189711898118991190011901119021190311904119051190611907119081190911910119111191211913119141191511916119171191811919119201192111922119231192411925119261192711928119291193011931119321193311934119351193611937119381193911940119411194211943119441194511946119471194811949119501195111952119531195411955119561195711958119591196011961119621196311964119651196611967119681196911970119711197211973119741197511976119771197811979119801198111982119831198411985119861198711988119891199011991119921199311994119951199611997119981199912000120011200212003120041200512006120071200812009120101201112012120131201412015120161201712018120191202012021120221202312024120251202612027120281202912030120311203212033120341203512036120371203812039120401204112042120431204412045120461204712048120491205012051120521205312054120551205612057120581205912060120611206212063120641206512066120671206812069120701207112072120731207412075120761207712078120791208012081120821208312084120851208612087120881208912090120911209212093120941209512096120971209812099121001210112102121031210412105121061210712108121091211012111121121211312114121151211612117121181211912120121211212212123121241212512126121271212812129121301213112132121331213412135121361213712138121391214012141121421214312144121451214612147121481214912150121511215212153121541215512156121571215812159121601216112162121631216412165121661216712168121691217012171121721217312174121751217612177121781217912180121811218212183121841218512186121871218812189121901219112192121931219412195121961219712198121991220012201122021220312204122051220612207122081220912210122111221212213122141221512216122171221812219122201222112222122231222412225122261222712228122291223012231122321223312234122351223612237122381223912240122411224212243122441224512246122471224812249122501225112252122531225412255122561225712258122591226012261122621226312264122651226612267122681226912270122711227212273122741227512276122771227812279122801228112282122831228412285122861228712288122891229012291122921229312294122951229612297122981229912300123011230212303123041230512306123071230812309123101231112312123131231412315123161231712318123191232012321123221232312324123251232612327123281232912330123311233212333123341233512336123371233812339123401234112342123431234412345123461234712348123491235012351123521235312354123551235612357123581235912360123611236212363123641236512366123671236812369123701237112372123731237412375123761237712378123791238012381123821238312384123851238612387123881238912390123911239212393123941239512396123971239812399124001240112402124031240412405124061240712408124091241012411124121241312414124151241612417124181241912420124211242212423124241242512426124271242812429124301243112432124331243412435124361243712438124391244012441124421244312444124451244612447124481244912450124511245212453124541245512456124571245812459124601246112462124631246412465124661246712468124691247012471124721247312474124751247612477124781247912480124811248212483124841248512486124871248812489124901249112492124931249412495124961249712498124991250012501125021250312504125051250612507125081250912510125111251212513125141251512516125171251812519125201252112522125231252412525125261252712528125291253012531125321253312534125351253612537125381253912540125411254212543125441254512546125471254812549125501255112552125531255412555125561255712558125591256012561125621256312564125651256612567125681256912570125711257212573125741257512576125771257812579125801258112582125831258412585125861258712588125891259012591125921259312594125951259612597125981259912600126011260212603126041260512606126071260812609126101261112612126131261412615126161261712618126191262012621126221262312624126251262612627126281262912630126311263212633126341263512636126371263812639126401264112642126431264412645126461264712648126491265012651126521265312654126551265612657126581265912660126611266212663126641266512666126671266812669126701267112672126731267412675126761267712678126791268012681126821268312684126851268612687126881268912690126911269212693126941269512696126971269812699127001270112702127031270412705127061270712708127091271012711127121271312714127151271612717127181271912720127211272212723127241272512726127271272812729127301273112732127331273412735127361273712738127391274012741127421274312744127451274612747127481274912750127511275212753127541275512756127571275812759127601276112762127631276412765127661276712768127691277012771127721277312774127751277612777127781277912780127811278212783127841278512786127871278812789127901279112792127931279412795127961279712798127991280012801128021280312804128051280612807128081280912810128111281212813128141281512816128171281812819128201282112822128231282412825128261282712828128291283012831128321283312834128351283612837128381283912840128411284212843128441284512846128471284812849128501285112852128531285412855128561285712858128591286012861128621286312864128651286612867128681286912870128711287212873128741287512876128771287812879128801288112882128831288412885128861288712888128891289012891128921289312894128951289612897128981289912900129011290212903129041290512906129071290812909129101291112912129131291412915129161291712918129191292012921129221292312924129251292612927129281292912930129311293212933129341293512936129371293812939129401294112942129431294412945129461294712948129491295012951129521295312954129551295612957129581295912960129611296212963129641296512966129671296812969129701297112972129731297412975129761297712978129791298012981129821298312984129851298612987129881298912990129911299212993129941299512996129971299812999130001300113002130031300413005130061300713008130091301013011130121301313014130151301613017130181301913020130211302213023130241302513026130271302813029130301303113032130331303413035130361303713038130391304013041130421304313044130451304613047130481304913050130511305213053130541305513056130571305813059130601306113062130631306413065130661306713068130691307013071130721307313074130751307613077130781307913080130811308213083130841308513086130871308813089130901309113092130931309413095130961309713098130991310013101131021310313104131051310613107131081310913110131111311213113131141311513116131171311813119131201312113122131231312413125131261312713128131291313013131131321313313134131351313613137131381313913140131411314213143131441314513146131471314813149131501315113152131531315413155131561315713158131591316013161131621316313164131651316613167131681316913170131711317213173131741317513176131771317813179131801318113182131831318413185131861318713188131891319013191131921319313194131951319613197131981319913200132011320213203132041320513206132071320813209132101321113212132131321413215132161321713218132191322013221132221322313224132251322613227132281322913230132311323213233132341323513236132371323813239132401324113242132431324413245132461324713248132491325013251132521325313254132551325613257132581325913260132611326213263132641326513266132671326813269132701327113272132731327413275132761327713278132791328013281132821328313284132851328613287132881328913290132911329213293132941329513296132971329813299133001330113302133031330413305133061330713308133091331013311133121331313314133151331613317133181331913320133211332213323133241332513326133271332813329133301333113332133331333413335133361333713338133391334013341133421334313344133451334613347133481334913350133511335213353133541335513356133571335813359133601336113362133631336413365133661336713368133691337013371133721337313374133751337613377133781337913380133811338213383133841338513386133871338813389133901339113392133931339413395133961339713398133991340013401134021340313404134051340613407134081340913410134111341213413134141341513416134171341813419134201342113422134231342413425134261342713428134291343013431134321343313434134351343613437134381343913440134411344213443134441344513446134471344813449134501345113452134531345413455134561345713458134591346013461134621346313464134651346613467134681346913470134711347213473134741347513476134771347813479134801348113482134831348413485134861348713488134891349013491134921349313494134951349613497134981349913500135011350213503135041350513506135071350813509135101351113512135131351413515135161351713518135191352013521135221352313524135251352613527135281352913530135311353213533135341353513536135371353813539135401354113542135431354413545135461354713548135491355013551135521355313554135551355613557135581355913560135611356213563135641356513566135671356813569135701357113572135731357413575135761357713578135791358013581135821358313584135851358613587135881358913590135911359213593135941359513596135971359813599136001360113602136031360413605136061360713608136091361013611136121361313614136151361613617136181361913620136211362213623136241362513626136271362813629136301363113632136331363413635136361363713638136391364013641136421364313644136451364613647136481364913650136511365213653136541365513656136571365813659136601366113662136631366413665136661366713668136691367013671136721367313674136751367613677136781367913680136811368213683136841368513686136871368813689136901369113692136931369413695136961369713698136991370013701137021370313704137051370613707137081370913710137111371213713137141371513716137171371813719137201372113722137231372413725137261372713728137291373013731137321373313734137351373613737137381373913740137411374213743137441374513746137471374813749137501375113752137531375413755137561375713758137591376013761137621376313764137651376613767137681376913770137711377213773137741377513776137771377813779137801378113782137831378413785137861378713788137891379013791137921379313794137951379613797137981379913800138011380213803138041380513806138071380813809138101381113812138131381413815138161381713818138191382013821138221382313824138251382613827138281382913830138311383213833138341383513836138371383813839138401384113842138431384413845138461384713848138491385013851138521385313854138551385613857138581385913860138611386213863138641386513866138671386813869138701387113872138731387413875138761387713878138791388013881138821388313884138851388613887138881388913890138911389213893138941389513896138971389813899139001390113902139031390413905139061390713908139091391013911139121391313914139151391613917139181391913920139211392213923139241392513926139271392813929139301393113932139331393413935139361393713938139391394013941139421394313944139451394613947139481394913950139511395213953139541395513956139571395813959139601396113962139631396413965139661396713968139691397013971139721397313974139751397613977139781397913980139811398213983139841398513986139871398813989139901399113992139931399413995139961399713998139991400014001140021400314004140051400614007140081400914010140111401214013140141401514016140171401814019140201402114022140231402414025140261402714028140291403014031140321403314034140351403614037140381403914040140411404214043140441404514046140471404814049140501405114052140531405414055140561405714058140591406014061140621406314064140651406614067140681406914070140711407214073140741407514076140771407814079140801408114082140831408414085140861408714088140891409014091140921409314094140951409614097140981409914100141011410214103141041410514106141071410814109141101411114112141131411414115141161411714118141191412014121141221412314124141251412614127141281412914130141311413214133141341413514136141371413814139141401414114142141431414414145141461414714148141491415014151141521415314154141551415614157141581415914160141611416214163141641416514166141671416814169141701417114172141731417414175141761417714178141791418014181141821418314184141851418614187141881418914190141911419214193141941419514196141971419814199142001420114202142031420414205142061420714208142091421014211142121421314214142151421614217142181421914220142211422214223142241422514226142271422814229142301423114232142331423414235142361423714238142391424014241142421424314244142451424614247142481424914250142511425214253142541425514256142571425814259142601426114262142631426414265142661426714268142691427014271142721427314274142751427614277142781427914280142811428214283142841428514286142871428814289142901429114292142931429414295142961429714298142991430014301143021430314304143051430614307143081430914310143111431214313143141431514316143171431814319143201432114322143231432414325143261432714328143291433014331143321433314334143351433614337143381433914340143411434214343143441434514346143471434814349143501435114352143531435414355143561435714358143591436014361143621436314364143651436614367143681436914370143711437214373143741437514376143771437814379143801438114382143831438414385143861438714388143891439014391143921439314394143951439614397143981439914400144011440214403144041440514406144071440814409144101441114412144131441414415144161441714418144191442014421144221442314424144251442614427144281442914430144311443214433144341443514436144371443814439144401444114442144431444414445144461444714448144491445014451144521445314454144551445614457144581445914460144611446214463144641446514466144671446814469144701447114472144731447414475144761447714478144791448014481144821448314484144851448614487144881448914490144911449214493144941449514496144971449814499145001450114502145031450414505145061450714508145091451014511145121451314514145151451614517145181451914520145211452214523145241452514526145271452814529145301453114532145331453414535145361453714538145391454014541145421454314544145451454614547145481454914550145511455214553145541455514556145571455814559145601456114562145631456414565145661456714568145691457014571145721457314574145751457614577145781457914580145811458214583145841458514586145871458814589145901459114592145931459414595145961459714598145991460014601146021460314604146051460614607146081460914610146111461214613146141461514616146171461814619146201462114622146231462414625146261462714628146291463014631146321463314634146351463614637146381463914640146411464214643146441464514646146471464814649146501465114652146531465414655146561465714658146591466014661146621466314664146651466614667146681466914670146711467214673146741467514676146771467814679146801468114682146831468414685146861468714688146891469014691146921469314694146951469614697146981469914700147011470214703147041470514706147071470814709147101471114712147131471414715147161471714718147191472014721147221472314724147251472614727147281472914730147311473214733147341473514736147371473814739147401474114742147431474414745147461474714748147491475014751147521475314754147551475614757147581475914760147611476214763147641476514766147671476814769147701477114772147731477414775147761477714778147791478014781147821478314784147851478614787147881478914790147911479214793147941479514796147971479814799148001480114802148031480414805148061480714808148091481014811148121481314814148151481614817148181481914820148211482214823148241482514826148271482814829148301483114832148331483414835148361483714838148391484014841148421484314844148451484614847148481484914850148511485214853148541485514856148571485814859148601486114862148631486414865148661486714868148691487014871148721487314874148751487614877148781487914880148811488214883148841488514886148871488814889148901489114892148931489414895148961489714898148991490014901149021490314904149051490614907149081490914910149111491214913149141491514916149171491814919149201492114922149231492414925149261492714928149291493014931149321493314934149351493614937149381493914940149411494214943149441494514946149471494814949149501495114952149531495414955149561495714958149591496014961149621496314964149651496614967149681496914970149711497214973149741497514976149771497814979149801498114982149831498414985149861498714988149891499014991149921499314994149951499614997149981499915000150011500215003150041500515006150071500815009150101501115012150131501415015150161501715018150191502015021150221502315024150251502615027150281502915030150311503215033150341503515036150371503815039150401504115042150431504415045150461504715048150491505015051150521505315054150551505615057150581505915060150611506215063150641506515066150671506815069150701507115072150731507415075150761507715078150791508015081150821508315084150851508615087150881508915090150911509215093150941509515096150971509815099151001510115102151031510415105151061510715108151091511015111151121511315114151151511615117151181511915120151211512215123151241512515126151271512815129151301513115132151331513415135151361513715138151391514015141151421514315144151451514615147151481514915150151511515215153151541515515156151571515815159151601516115162151631516415165151661516715168151691517015171151721517315174151751517615177151781517915180151811518215183151841518515186151871518815189151901519115192151931519415195151961519715198151991520015201152021520315204152051520615207152081520915210152111521215213152141521515216152171521815219152201522115222152231522415225152261522715228152291523015231152321523315234152351523615237152381523915240152411524215243152441524515246152471524815249152501525115252152531525415255152561525715258152591526015261152621526315264152651526615267152681526915270152711527215273152741527515276152771527815279152801528115282152831528415285152861528715288152891529015291152921529315294152951529615297152981529915300153011530215303153041530515306153071530815309153101531115312153131531415315153161531715318153191532015321153221532315324153251532615327153281532915330153311533215333153341533515336153371533815339153401534115342153431534415345153461534715348153491535015351153521535315354153551535615357153581535915360153611536215363153641536515366153671536815369153701537115372153731537415375153761537715378153791538015381153821538315384153851538615387153881538915390153911539215393153941539515396153971539815399154001540115402154031540415405154061540715408154091541015411154121541315414154151541615417154181541915420154211542215423154241542515426154271542815429154301543115432154331543415435154361543715438154391544015441154421544315444154451544615447154481544915450154511545215453154541545515456154571545815459154601546115462154631546415465154661546715468154691547015471154721547315474154751547615477154781547915480154811548215483154841548515486154871548815489154901549115492154931549415495154961549715498154991550015501155021550315504155051550615507155081550915510155111551215513155141551515516155171551815519155201552115522155231552415525155261552715528155291553015531155321553315534155351553615537155381553915540155411554215543155441554515546155471554815549155501555115552155531555415555155561555715558155591556015561155621556315564155651556615567155681556915570155711557215573155741557515576155771557815579155801558115582155831558415585155861558715588155891559015591155921559315594155951559615597155981559915600156011560215603156041560515606156071560815609156101561115612156131561415615156161561715618156191562015621156221562315624156251562615627156281562915630156311563215633156341563515636156371563815639156401564115642156431564415645156461564715648156491565015651156521565315654156551565615657156581565915660156611566215663156641566515666156671566815669156701567115672156731567415675156761567715678156791568015681156821568315684156851568615687156881568915690156911569215693156941569515696156971569815699157001570115702157031570415705157061570715708157091571015711157121571315714157151571615717157181571915720157211572215723157241572515726157271572815729157301573115732157331573415735157361573715738157391574015741157421574315744157451574615747157481574915750157511575215753157541575515756157571575815759157601576115762157631576415765157661576715768157691577015771157721577315774157751577615777157781577915780157811578215783157841578515786157871578815789157901579115792157931579415795157961579715798157991580015801158021580315804158051580615807158081580915810158111581215813158141581515816158171581815819158201582115822158231582415825158261582715828158291583015831158321583315834158351583615837158381583915840158411584215843158441584515846158471584815849158501585115852158531585415855158561585715858158591586015861158621586315864158651586615867158681586915870158711587215873158741587515876158771587815879158801588115882158831588415885158861588715888158891589015891158921589315894158951589615897158981589915900159011590215903159041590515906159071590815909159101591115912159131591415915159161591715918159191592015921159221592315924159251592615927159281592915930159311593215933159341593515936159371593815939159401594115942159431594415945159461594715948159491595015951159521595315954159551595615957159581595915960159611596215963159641596515966159671596815969159701597115972159731597415975159761597715978159791598015981159821598315984159851598615987159881598915990159911599215993159941599515996159971599815999160001600116002160031600416005160061600716008160091601016011160121601316014160151601616017160181601916020160211602216023160241602516026160271602816029160301603116032160331603416035160361603716038160391604016041160421604316044160451604616047160481604916050160511605216053160541605516056160571605816059160601606116062160631606416065160661606716068160691607016071160721607316074160751607616077160781607916080160811608216083160841608516086160871608816089160901609116092160931609416095160961609716098160991610016101161021610316104161051610616107161081610916110161111611216113161141611516116161171611816119161201612116122161231612416125161261612716128161291613016131161321613316134161351613616137161381613916140161411614216143161441614516146161471614816149161501615116152161531615416155161561615716158161591616016161161621616316164161651616616167161681616916170161711617216173161741617516176161771617816179161801618116182161831618416185161861618716188161891619016191161921619316194161951619616197161981619916200162011620216203162041620516206162071620816209162101621116212162131621416215162161621716218162191622016221162221622316224162251622616227162281622916230162311623216233162341623516236162371623816239162401624116242162431624416245162461624716248162491625016251162521625316254162551625616257162581625916260162611626216263162641626516266162671626816269162701627116272162731627416275162761627716278162791628016281162821628316284162851628616287162881628916290162911629216293162941629516296162971629816299163001630116302163031630416305163061630716308163091631016311163121631316314163151631616317163181631916320163211632216323163241632516326163271632816329163301633116332163331633416335163361633716338163391634016341163421634316344163451634616347163481634916350163511635216353163541635516356163571635816359163601636116362163631636416365163661636716368163691637016371163721637316374163751637616377163781637916380163811638216383163841638516386163871638816389163901639116392163931639416395163961639716398163991640016401164021640316404164051640616407164081640916410164111641216413164141641516416164171641816419164201642116422164231642416425164261642716428164291643016431164321643316434164351643616437164381643916440164411644216443164441644516446164471644816449164501645116452164531645416455164561645716458164591646016461164621646316464164651646616467164681646916470164711647216473164741647516476164771647816479164801648116482164831648416485164861648716488164891649016491164921649316494164951649616497164981649916500165011650216503165041650516506165071650816509165101651116512165131651416515165161651716518165191652016521165221652316524165251652616527165281652916530165311653216533165341653516536165371653816539165401654116542165431654416545165461654716548165491655016551165521655316554165551655616557165581655916560165611656216563165641656516566165671656816569165701657116572165731657416575165761657716578165791658016581165821658316584165851658616587165881658916590165911659216593
  1. //TODO: Temporary, to add asserts
  2. #define BF_DEBUG_ASSERTS
  3. #include <deque>
  4. #include "BeMCContext.h"
  5. #include "BeCOFFObject.h"
  6. #include "BeIRCodeGen.h"
  7. #include "BeefySysLib/util/BeefPerf.h"
  8. #include "BeefySysLib/util/AllocDebug.h"
  9. #pragma warning(disable:4146)
  10. USING_NS_BF;
  11. //////////////////////////////////////////////////////////////////////////
  12. #define IS_BIT_SET_32(bits, idx) (((bits)[(idx) / 32] & (1 << ((idx) % 32))) != 0)
  13. // Only use "rep stosb"/"rep movsb" if total size is at least this value. The drawback is requiring saving/restore of RAX, RDI, and RCX (and RSI for movsb)
  14. const int BF_REP_MOV_LIMIT = 128;
  15. static const X64CPURegister gVolatileRegs[] = { X64Reg_RAX, X64Reg_RCX, X64Reg_RDX, X64Reg_R8, X64Reg_R9, X64Reg_R10, X64Reg_R11,
  16. X64Reg_XMM0_f64, X64Reg_XMM1_f64, X64Reg_XMM2_f64, X64Reg_XMM3_f64, X64Reg_XMM4_f64, X64Reg_XMM5_f64};
  17. static const char* gOpName[] =
  18. {
  19. "None",
  20. "@Def",
  21. "@DefLoad",
  22. "@DefPhi",
  23. "@DbgDecl",
  24. "@DbgRangeStart",
  25. "@DbgRangeEnd",
  26. "@LifetimeExtend",
  27. "@LifetimeStart",
  28. "@LifetimeEnd",
  29. "@ValueScopeSoftEnd",
  30. "@ValueScopeHardEnd",
  31. "@Label",
  32. //"PhiValue",
  33. "CmpToBool",
  34. "MemSet",
  35. "MemCpy",
  36. "FastCheckStack",
  37. "TLSSetup",
  38. "PreserveVolatiles",
  39. "RestoreVolatiles",
  40. "Unwind_PushReg",
  41. "Unwind_SaveXMM",
  42. "Unwind_Alloc",
  43. "Unwind_SetBP",
  44. "Rem",
  45. "IRem",
  46. "Nop",
  47. "Unreachable",
  48. "EnsureCodeAt",
  49. "DbgBreak",
  50. "MFence",
  51. "Mov",
  52. "MovRaw",
  53. "MovSX",
  54. "XChg",
  55. "XAdd",
  56. "CmpXChg",
  57. "Load",
  58. "Store",
  59. "Push",
  60. "Pop",
  61. "Neg",
  62. "Not",
  63. "Add",
  64. "Sub",
  65. "Mul",
  66. "IMul",
  67. "Div",
  68. "IDiv",
  69. "Cmp",
  70. "And",
  71. "Or",
  72. "Xor",
  73. "Shl",
  74. "Shr",
  75. "Sar",
  76. "Test",
  77. "CondBr",
  78. "Br",
  79. "Ret",
  80. "Call",
  81. };
  82. static_assert(BF_ARRAY_COUNT(gOpName) == (int)BeMCInstKind_COUNT, "gOpName incorrect size");
  83. void PrintBoolVec(Array<bool>& boolVec)
  84. {
  85. String str;
  86. for (int i = 0; i < (int)boolVec.size(); i++)
  87. {
  88. str += StrFormat("%d: %s\n", i, boolVec[i] ? "true" : "false");
  89. }
  90. OutputDebugStr(str);
  91. }
  92. static bool IsPowerOfTwo(int64 val)
  93. {
  94. return (val != 0) && ((val & (val - 1)) == 0);
  95. }
  96. bool BeVTrackingBits::IsSet(int idx)
  97. {
  98. return IS_BIT_SET_32((uint32*)this, idx);
  99. }
  100. void BeVTrackingBits::Set(int idx)
  101. {
  102. uint32* bits = (uint32*)this;
  103. bits[(idx) / 32] |= (1 << (idx % 32));
  104. }
  105. void BeVTrackingBits::Clear(int idx)
  106. {
  107. uint32* bits = (uint32*)this;
  108. bits[(idx) / 32] &= ~(1 << (idx % 32));
  109. }
  110. BeVTrackingContext::BeVTrackingContext(BeMCContext* mcContext)
  111. {
  112. mMCContext = mcContext;
  113. mNumEntries = 0;
  114. mNumItems = 0;
  115. mNumBlocks = -1;
  116. mTrackKindCount = (int)BeTrackKind_COUNT;
  117. }
  118. void BeVTrackingContext::Init(int numItems)
  119. {
  120. mNumItems = numItems;
  121. mNumEntries = mNumItems * mTrackKindCount;
  122. mNumBlocks = (mNumEntries + 31) / 32;
  123. }
  124. void BeVTrackingContext::Clear()
  125. {
  126. mAlloc.Clear();
  127. mNumBlocks = -1;
  128. }
  129. int BeVTrackingContext::GetBitsBytes()
  130. {
  131. return mNumBlocks * 4;
  132. }
  133. int BeVTrackingContext::GetIdx(int baseIdx, BeTrackKind liveKind)
  134. {
  135. return baseIdx + mNumItems*(int)liveKind;
  136. }
  137. void BeVTrackingContext::Print(BeVTrackingList* list)
  138. {
  139. String str;
  140. for (int i : *list)
  141. str += StrFormat("%d ", i);
  142. if (list->mNumChanges > 0)
  143. {
  144. str += " |";
  145. for (int changeIdx = 0; changeIdx < list->mNumChanges; changeIdx++)
  146. {
  147. int change = list->GetChange(changeIdx);
  148. if (change >= 0)
  149. str += StrFormat(" +%d", change);
  150. else
  151. str += StrFormat(" -%d", -change - 1);
  152. }
  153. }
  154. str += "\n";
  155. OutputDebugStr(str);
  156. }
  157. BeVTrackingList* BeVTrackingContext::AllocEmptyList()
  158. {
  159. int allocBytes = sizeof(int) * (2);
  160. auto newList = (BeVTrackingList*)mAlloc.AllocBytes(allocBytes);
  161. mStats.mListBytes += allocBytes;
  162. newList->mSize = 0;
  163. newList->mNumChanges = 0;
  164. return newList;
  165. }
  166. BeVTrackingList* BeVTrackingContext::AddFiltered(BeVTrackingList* list, SizedArrayImpl<int>& filteredAdds, bool perserveChangeList)
  167. {
  168. int newSize = list->mSize + filteredAdds.size();
  169. int allocBytes = sizeof(int) * (2 + newSize);
  170. if (perserveChangeList)
  171. allocBytes += sizeof(int) * (int)(list->mNumChanges + filteredAdds.size());
  172. auto newList = (BeVTrackingList*)mAlloc.AllocBytes(allocBytes);
  173. mStats.mListBytes += allocBytes;
  174. {
  175. if (filteredAdds.size() > 1)
  176. std::sort(filteredAdds.begin(), filteredAdds.end());
  177. int addIdx = 0;
  178. int nextAdd;
  179. if (addIdx < (int)filteredAdds.size())
  180. nextAdd = filteredAdds[addIdx++];
  181. else
  182. nextAdd = 0x7FFFFFFF;
  183. int* outPtr = &newList->mEntries[0];
  184. for (auto idx : *list)
  185. {
  186. while (idx > nextAdd)
  187. {
  188. *(outPtr++) = nextAdd;
  189. if (addIdx < (int)filteredAdds.size())
  190. nextAdd = filteredAdds[addIdx++];
  191. else
  192. nextAdd = 0x7FFFFFFF;
  193. }
  194. *(outPtr++) = idx;
  195. }
  196. while (nextAdd != 0x7FFFFFFF)
  197. {
  198. *(outPtr++) = nextAdd;
  199. if (addIdx >= (int)filteredAdds.size())
  200. break;
  201. nextAdd = filteredAdds[addIdx++];
  202. }
  203. }
  204. newList->mSize = newSize;
  205. if (perserveChangeList)
  206. {
  207. for (int changeIdx = 0; changeIdx < list->mNumChanges; changeIdx++)
  208. {
  209. newList->mEntries[newSize + changeIdx] = list->GetChange(changeIdx);
  210. }
  211. for (int changeIdx = 0; changeIdx < (int)filteredAdds.size(); changeIdx++)
  212. {
  213. newList->mEntries[newSize + list->mNumChanges + changeIdx] = filteredAdds[changeIdx];
  214. }
  215. newList->mNumChanges = list->mNumChanges + (int)filteredAdds.size();
  216. }
  217. else
  218. newList->mNumChanges = 0;
  219. return newList;
  220. }
  221. BeVTrackingList* BeVTrackingContext::AddFiltered(BeVTrackingList* list, int idx, bool perserveChangeList)
  222. {
  223. int newSize = list->mSize + 1;
  224. int allocBytes = sizeof(int) * (2 + newSize);
  225. if (perserveChangeList)
  226. allocBytes += sizeof(int) * (int)(list->mNumChanges + 1);
  227. auto newList = (BeVTrackingList*)mAlloc.AllocBytes(allocBytes);
  228. mStats.mListBytes += allocBytes;
  229. {
  230. int addIdx = 0;
  231. int nextAdd;
  232. nextAdd = idx;
  233. int* outPtr = &newList->mEntries[0];
  234. for (auto idx : *list)
  235. {
  236. while (idx > nextAdd)
  237. {
  238. *(outPtr++) = nextAdd;
  239. nextAdd = 0x7FFFFFFF;
  240. }
  241. *(outPtr++) = idx;
  242. }
  243. while (nextAdd != 0x7FFFFFFF)
  244. {
  245. *(outPtr++) = nextAdd;
  246. break;
  247. }
  248. }
  249. newList->mSize = newSize;
  250. if (perserveChangeList)
  251. {
  252. for (int changeIdx = 0; changeIdx < list->mNumChanges; changeIdx++)
  253. {
  254. newList->mEntries[newSize + changeIdx] = list->GetChange(changeIdx);
  255. }
  256. newList->mEntries[newSize + list->mNumChanges] = idx;
  257. newList->mNumChanges = list->mNumChanges + (int)1;
  258. }
  259. else
  260. newList->mNumChanges = 0;
  261. return newList;
  262. }
  263. BeVTrackingList* BeVTrackingContext::Add(BeVTrackingList* list, const SizedArrayImpl<int>& indices, bool perserveChangeList)
  264. {
  265. SizedArray<int, 16> newIndices;
  266. for (int idx : indices)
  267. {
  268. if (!IsSet(list, idx))
  269. {
  270. newIndices.push_back(idx);
  271. }
  272. }
  273. if (newIndices.empty())
  274. return list;
  275. return AddFiltered(list, newIndices, perserveChangeList);
  276. }
  277. BeVTrackingList* BeVTrackingContext::Add(BeVTrackingList* list, int idx, bool perserveChangeList)
  278. {
  279. if (IsSet(list, idx))
  280. return list;
  281. return AddFiltered(list, idx, perserveChangeList);
  282. }
  283. // Performs an 'add' for items that were in prevDest
  284. BeVTrackingList* BeVTrackingContext::SetChanges(BeVTrackingList* prevDestEntry, BeVTrackingList* mergeFrom)
  285. {
  286. int removeCount = 0;
  287. int addCount = 0;
  288. int newSize = prevDestEntry->mSize;
  289. auto prevItr = prevDestEntry->begin();
  290. auto prevEnd = prevDestEntry->end();
  291. auto mergeFromItr = mergeFrom->begin();
  292. auto mergeFromEnd = mergeFrom->end();
  293. while ((prevItr != prevEnd) && (mergeFromItr != mergeFromEnd))
  294. {
  295. int prevIdx = *prevItr;
  296. int mergeIdx = *mergeFromItr;
  297. bool done = false;
  298. while (mergeIdx < prevIdx)
  299. {
  300. removeCount++;
  301. ++mergeFromItr;
  302. if (mergeFromItr == mergeFromEnd)
  303. {
  304. done = true;
  305. break;
  306. }
  307. mergeIdx = *mergeFromItr;
  308. }
  309. if (done)
  310. break;
  311. while (prevIdx < mergeIdx)
  312. {
  313. addCount++;
  314. ++prevItr;
  315. if (prevItr == prevEnd)
  316. {
  317. done = true;
  318. break;
  319. }
  320. prevIdx = *prevItr;
  321. }
  322. if (done)
  323. break;
  324. if (prevIdx == mergeIdx)
  325. {
  326. ++prevItr;
  327. ++mergeFromItr;
  328. }
  329. }
  330. while (prevItr != prevEnd)
  331. {
  332. addCount++;
  333. ++prevItr;
  334. }
  335. while (mergeFromItr != mergeFromEnd)
  336. {
  337. removeCount++;
  338. ++mergeFromItr;
  339. }
  340. int allocBytes = sizeof(int) * (2 + newSize + addCount + removeCount);
  341. auto newList = (BeVTrackingList*)mAlloc.AllocBytes(allocBytes);
  342. mStats.mListBytes += allocBytes;
  343. int* outPtr = &newList->mEntries[0];
  344. int* changePtr = &newList->mEntries[newSize];
  345. prevItr = prevDestEntry->begin();
  346. mergeFromItr = mergeFrom->begin();
  347. while ((prevItr != prevEnd) && (mergeFromItr != mergeFromEnd))
  348. {
  349. int prevIdx = *prevItr;
  350. int mergeIdx = *mergeFromItr;
  351. bool done = false;
  352. while (mergeIdx < prevIdx)
  353. {
  354. *(changePtr++) = ~mergeIdx;
  355. ++mergeFromItr;
  356. if (mergeFromItr == mergeFromEnd)
  357. {
  358. done = true;
  359. break;
  360. }
  361. mergeIdx = *mergeFromItr;
  362. }
  363. if (done)
  364. break;
  365. while (prevIdx < mergeIdx)
  366. {
  367. *(outPtr++) = prevIdx;
  368. *(changePtr++) = prevIdx;
  369. ++prevItr;
  370. if (prevItr == prevEnd)
  371. {
  372. done = true;
  373. break;
  374. }
  375. prevIdx = *prevItr;
  376. }
  377. if (done)
  378. break;
  379. if (prevIdx == mergeIdx)
  380. {
  381. *(outPtr++) = *prevItr;
  382. ++prevItr;
  383. ++mergeFromItr;
  384. }
  385. }
  386. while (prevItr != prevEnd)
  387. {
  388. int prevIdx = *prevItr;
  389. *(outPtr++) = *prevItr;
  390. *(changePtr++) = prevIdx;
  391. ++prevItr;
  392. }
  393. while (mergeFromItr != mergeFromEnd)
  394. {
  395. int mergeIdx = *mergeFromItr;
  396. *(changePtr++) = ~mergeIdx;
  397. ++mergeFromItr;
  398. }
  399. BF_ASSERT((outPtr - &newList->mEntries[0]) == newSize);
  400. BF_ASSERT((changePtr - &newList->mEntries[newSize]) == addCount + removeCount);
  401. newList->mSize = newSize;
  402. newList->mNumChanges = addCount + removeCount;
  403. return newList;
  404. }
  405. BeVTrackingList* BeVTrackingContext::ClearFiltered(BeVTrackingList* list, const SizedArrayImpl<int>& indices)
  406. {
  407. /*int newSize = list->mSize - indices.size();
  408. auto newList = (BeVTrackingList*)mAlloc.AllocBytes(sizeof(int) * (1 + newSize));
  409. if (indices.size() == 1)
  410. {
  411. int findIdx0 = indices[0];
  412. int* outPtr = 0;
  413. for (auto idx : indices)
  414. {
  415. if (idx != findIdx0)
  416. *(outPtr++) = idx;
  417. }
  418. BF_ASSERT(outPtr == &newList->mEntries[0] + indices.size());
  419. }
  420. else if (indices.size() == 2)
  421. {
  422. int findIdx0 = indices[0];
  423. int findIdx1 = indices[1];
  424. int* outPtr = 0;
  425. for (auto idx : indices)
  426. {
  427. if ((idx != findIdx0) && (idx != findIdx1))
  428. *(outPtr++) = idx;
  429. }
  430. BF_ASSERT(outPtr == &newList->mEntries[0] + indices.size());
  431. }
  432. else
  433. {
  434. int* outPtr = 0;
  435. for (auto idx : indices)
  436. {
  437. if (std::find(indices.begin(), indices.end(), idx) == indices.end())
  438. *(outPtr++) = idx;
  439. }
  440. BF_ASSERT(outPtr == &newList->mEntries[0] + indices.size());
  441. }
  442. newList->mSize = newSize;
  443. return newList;*/
  444. BF_FATAL("Broken");
  445. return NULL;
  446. }
  447. BeVTrackingList* BeVTrackingContext::Modify(BeVTrackingList* list, const SizedArrayImpl<int>& inAdds, const SizedArrayImpl<int>& inRemoves, SizedArrayImpl<int>& filteredAdds, SizedArrayImpl<int>& filteredRemoves)
  448. {
  449. for (int idx : inAdds)
  450. {
  451. if (!IsSet(list, idx))
  452. {
  453. filteredAdds.push_back(idx);
  454. }
  455. }
  456. for (int idx : inRemoves)
  457. {
  458. if (IsSet(list, idx))
  459. {
  460. filteredRemoves.push_back(idx);
  461. }
  462. }
  463. if ((filteredAdds.empty()) && (filteredRemoves.empty()))
  464. return list;
  465. int newSize = list->mSize - filteredRemoves.size() + filteredAdds.size();
  466. int changeSize = filteredRemoves.size() + filteredAdds.size();
  467. int allocBytes = sizeof(int) * (2 + newSize + changeSize);
  468. auto newList = (BeVTrackingList*)mAlloc.AllocBytes(allocBytes);
  469. mStats.mListBytes += allocBytes;
  470. /*if (filteredRemoves.size() == 0)
  471. {
  472. memcpy(newList->mEntries, unit.mList->mEntries, sizeof(int) * unit.mList->mSize);
  473. }
  474. else if (filteredRemoves.size() == 1)
  475. {
  476. int findIdx0 = filteredRemoves[0];
  477. int* outPtr = &newList->mEntries[0];
  478. for (auto idx : *unit.mList)
  479. {
  480. if (idx != findIdx0)
  481. *(outPtr++) = idx;
  482. }
  483. BF_ASSERT(outPtr == &newList->mEntries[0] + unit.mList->mSize - filteredRemoves.size());
  484. }
  485. else if (filteredRemoves.size() == 2)
  486. {
  487. int findIdx0 = filteredRemoves[0];
  488. int findIdx1 = filteredRemoves[1];
  489. int* outPtr = &newList->mEntries[0];
  490. for (auto idx : *unit.mList)
  491. {
  492. if ((idx != findIdx0) && (idx != findIdx1))
  493. *(outPtr++) = idx;
  494. }
  495. BF_ASSERT(outPtr == &newList->mEntries[0] + unit.mList->mSize - filteredRemoves.size());
  496. }
  497. else
  498. {
  499. int* outPtr = &newList->mEntries[0];
  500. for (auto idx : *unit.mList)
  501. {
  502. if (std::find(filteredRemoves.begin(), filteredRemoves.end(), idx) == filteredRemoves.end())
  503. *(outPtr++) = idx;
  504. }
  505. BF_ASSERT(outPtr == &newList->mEntries[0] + unit.mList->mSize - filteredRemoves.size());
  506. }*/
  507. {
  508. if (filteredAdds.size() > 1)
  509. std::sort(filteredAdds.begin(), filteredAdds.end());
  510. if (filteredRemoves.size() > 1)
  511. std::sort(filteredRemoves.begin(), filteredRemoves.end());
  512. int addIdx = 0;
  513. int nextAdd;
  514. if (addIdx < (int)filteredAdds.size())
  515. nextAdd = filteredAdds[addIdx++];
  516. else
  517. nextAdd = 0x7FFFFFFF;
  518. int removeIdx = 0;
  519. int nextRemove;
  520. if (removeIdx < (int)filteredRemoves.size())
  521. nextRemove = filteredRemoves[removeIdx++];
  522. else
  523. nextRemove = 0x7FFFFFFF;
  524. int* outPtr = &newList->mEntries[0];
  525. for (auto idx : *list)
  526. {
  527. if (idx == nextRemove)
  528. {
  529. if (removeIdx < (int)filteredRemoves.size())
  530. nextRemove = filteredRemoves[removeIdx++];
  531. else
  532. nextRemove = 0x7FFFFFFF;
  533. continue;
  534. }
  535. while (idx > nextAdd)
  536. {
  537. *(outPtr++) = nextAdd;
  538. if (addIdx < (int)filteredAdds.size())
  539. nextAdd = filteredAdds[addIdx++];
  540. else
  541. nextAdd = 0x7FFFFFFF;
  542. }
  543. *(outPtr++) = idx;
  544. }
  545. while (nextAdd != 0x7FFFFFFF)
  546. {
  547. *(outPtr++) = nextAdd;
  548. if (addIdx >= (int)filteredAdds.size())
  549. break;
  550. nextAdd = filteredAdds[addIdx++];
  551. }
  552. BF_ASSERT(outPtr == &newList->mEntries[0] + newSize);
  553. BF_ASSERT((nextAdd = 0x7FFFFFFF) && (nextRemove == 0x7FFFFFFF));
  554. }
  555. for (int i = 0; i < (int)filteredRemoves.size(); i++)
  556. {
  557. newList->mEntries[newSize + i] = -filteredRemoves[i] - 1;
  558. }
  559. for (int i = 0; i < (int)filteredAdds.size(); i++)
  560. {
  561. newList->mEntries[newSize + filteredRemoves.size() + i] = filteredAdds[i];
  562. }
  563. newList->mSize = newSize;
  564. newList->mNumChanges = changeSize;
  565. ///
  566. /*for (int i = 0; i < mNumEntries; i++)
  567. BF_ASSERT(IsSet(newList, i) == unit.mBits->IsSet(i));
  568. int prevIdx = -1;
  569. for (int idx : *newList)
  570. {
  571. BF_ASSERT(idx > prevIdx);
  572. prevIdx = idx;
  573. }
  574. OutputDebugStrF("Modify %d %@\n", modifyItrIdx, newList);*/
  575. ///
  576. return newList;
  577. }
  578. int BeVTrackingContext::FindIndex(BeVTrackingList* entry, int val)
  579. {
  580. int lo = 0;
  581. int hi = entry->mSize - 1;
  582. while (lo <= hi)
  583. {
  584. int i = (lo + hi) / 2;
  585. int midVal = entry->mEntries[i];
  586. int c = midVal - val;
  587. if (c == 0) return i;
  588. if (c < 0)
  589. lo = i + 1;
  590. else
  591. hi = i - 1;
  592. }
  593. return ~lo;
  594. }
  595. bool BeVTrackingContext::IsSet(BeVTrackingList* entry, int idx)
  596. {
  597. return FindIndex(entry, idx) >= 0;
  598. }
  599. bool BeVTrackingContext::IsSet(BeVTrackingList* entry, int idx, BeTrackKind trackKind)
  600. {
  601. return IsSet(entry, GetIdx(idx, trackKind));
  602. }
  603. BeVTrackingList* BeVTrackingContext::Clear(BeVTrackingList* list, const SizedArrayImpl<int>& indices)
  604. {
  605. SizedArray<int, 16> newIndices;
  606. for (int idx : indices)
  607. {
  608. if (IsSet(list, idx))
  609. {
  610. newIndices.push_back(idx);
  611. }
  612. }
  613. if (newIndices.empty())
  614. return list;
  615. return ClearFiltered(list, newIndices);
  616. }
  617. bool BeVTrackingContext::IsEmpty(BeVTrackingList* list)
  618. {
  619. return list->mSize == 0;
  620. }
  621. BeVTrackingList* BeVTrackingContext::Merge(BeVTrackingList* prevDestEntry, BeVTrackingList* mergeFrom)
  622. {
  623. if (prevDestEntry == NULL)
  624. return mergeFrom;
  625. if (mergeFrom->mSize == 0)
  626. return prevDestEntry;
  627. if (prevDestEntry->mSize == 0)
  628. return mergeFrom;
  629. int newSize = prevDestEntry->mSize;
  630. auto prevItr = prevDestEntry->begin();
  631. auto prevEnd = prevDestEntry->end();
  632. auto mergeFromItr = mergeFrom->begin();
  633. auto mergeFromEnd = mergeFrom->end();
  634. while ((prevItr != prevEnd) && (mergeFromItr != mergeFromEnd))
  635. {
  636. int prevIdx = *prevItr;
  637. int mergeIdx = *mergeFromItr;
  638. bool done = false;
  639. while (mergeIdx < prevIdx)
  640. {
  641. newSize++;
  642. ++mergeFromItr;
  643. if (mergeFromItr == mergeFromEnd)
  644. {
  645. done = true;
  646. break;
  647. }
  648. mergeIdx = *mergeFromItr;
  649. }
  650. if (done)
  651. break;
  652. while (prevIdx < mergeIdx)
  653. {
  654. ++prevItr;
  655. if (prevItr == prevEnd)
  656. {
  657. done = true;
  658. break;
  659. }
  660. prevIdx = *prevItr;
  661. }
  662. if (done)
  663. break;
  664. if (prevIdx == mergeIdx)
  665. {
  666. ++prevItr;
  667. ++mergeFromItr;
  668. }
  669. }
  670. while (mergeFromItr != mergeFromEnd)
  671. {
  672. newSize++;
  673. ++mergeFromItr;
  674. }
  675. if (newSize == prevDestEntry->mSize)
  676. return prevDestEntry;
  677. int allocBytes = sizeof(int) * (2 + newSize);
  678. auto newList = (BeVTrackingList*)mAlloc.AllocBytes(allocBytes);
  679. mStats.mListBytes += allocBytes;
  680. int* outPtr = &newList->mEntries[0];
  681. prevItr = prevDestEntry->begin();
  682. mergeFromItr = mergeFrom->begin();
  683. while ((prevItr != prevEnd) && (mergeFromItr != mergeFromEnd))
  684. {
  685. int prevIdx = *prevItr;
  686. int mergeIdx = *mergeFromItr;
  687. bool done = false;
  688. while (mergeIdx < prevIdx)
  689. {
  690. *(outPtr++) = mergeIdx;
  691. ++mergeFromItr;
  692. if (mergeFromItr == mergeFromEnd)
  693. {
  694. done = true;
  695. break;
  696. }
  697. mergeIdx = *mergeFromItr;
  698. }
  699. if (done)
  700. break;
  701. while (prevIdx < mergeIdx)
  702. {
  703. *(outPtr++) = prevIdx;
  704. ++prevItr;
  705. if (prevItr == prevEnd)
  706. {
  707. done = true;
  708. break;
  709. }
  710. prevIdx = *prevItr;
  711. }
  712. if (done)
  713. break;
  714. if (prevIdx == mergeIdx)
  715. {
  716. *(outPtr++) = *prevItr;
  717. ++prevItr;
  718. ++mergeFromItr;
  719. }
  720. }
  721. while (prevItr != prevEnd)
  722. {
  723. *(outPtr++) = *prevItr;
  724. ++prevItr;
  725. }
  726. while (mergeFromItr != mergeFromEnd)
  727. {
  728. *(outPtr++) = *mergeFromItr;
  729. ++mergeFromItr;
  730. }
  731. BF_ASSERT((outPtr - &newList->mEntries[0]) == newSize);
  732. newList->mSize = newSize;
  733. newList->mNumChanges = 0;
  734. return newList;
  735. }
  736. BeVTrackingList* BeVTrackingContext::MergeChanges(BeVTrackingList* prevDestEntry, BeVTrackingList* mergeFrom)
  737. {
  738. if (prevDestEntry == mergeFrom)
  739. return prevDestEntry;
  740. if (mergeFrom->mNumChanges == 0)
  741. return prevDestEntry;
  742. SizedArray<int, 2> changes;
  743. for (int changeIdx = 0; changeIdx < (int)prevDestEntry->mNumChanges; changeIdx++)
  744. changes.push_back(prevDestEntry->GetChange(changeIdx));
  745. for (int changeIdx = 0; changeIdx < (int)mergeFrom->mNumChanges; changeIdx++)
  746. {
  747. // If there isn't already a change (whether and add or a remove) that refers to this same vreg,
  748. // then we add this change as well
  749. int change = mergeFrom->GetChange(changeIdx);
  750. int negChange = -change - 1;
  751. /*if (((std::find(changes.begin(), changes.end(), change) == changes.end())) &&
  752. ((std::find(changes.begin(), changes.end(), negChange) == changes.end())))*/
  753. if ((!changes.Contains(change)) && (!changes.Contains(negChange)))
  754. {
  755. changes.push_back(change);
  756. }
  757. }
  758. int newSize = prevDestEntry->mSize;
  759. int allocBytes = (int)(sizeof(int) * (2 + newSize + changes.size()));
  760. auto newList = (BeVTrackingList*)mAlloc.AllocBytes(allocBytes);
  761. mStats.mListBytes += allocBytes;
  762. memcpy(&newList->mEntries[0], &prevDestEntry->mEntries[0], newSize * sizeof(int));
  763. for (int i = 0; i < (int)changes.size(); i++)
  764. {
  765. newList->mEntries[newSize + i] = changes[i];
  766. }
  767. newList->mSize = newSize;
  768. newList->mNumChanges = (int)changes.size();
  769. return newList;
  770. }
  771. BeVTrackingList * BeVTrackingContext::RemoveChange(BeVTrackingList* prevDestEntry, int idx)
  772. {
  773. int newSize = prevDestEntry->mSize;
  774. int allocBytes = (int)(sizeof(int) * (2 + newSize + prevDestEntry->mNumChanges - 1));
  775. auto newList = (BeVTrackingList*)mAlloc.AllocBytes(allocBytes);
  776. mStats.mListBytes += allocBytes;
  777. memcpy(&newList->mEntries[0], &prevDestEntry->mEntries[0], newSize * sizeof(int));
  778. bool found = false;
  779. int outIdx = newSize;
  780. for (int i = 0; i < (int)prevDestEntry->mNumChanges; i++)
  781. {
  782. int change = prevDestEntry->GetChange(i);
  783. if (change == idx)
  784. {
  785. found = true;
  786. continue;
  787. }
  788. newList->mEntries[outIdx++] = change;
  789. }
  790. BF_ASSERT(found);
  791. newList->mSize = newSize;
  792. newList->mNumChanges = prevDestEntry->mNumChanges - 1;
  793. return newList;
  794. }
  795. //////////////////////////////////////////////////////////////////////////
  796. BeMCColorizer::BeMCColorizer(BeMCContext* mcContext)
  797. {
  798. mContext = mcContext;
  799. mReserveParamRegs = false;
  800. }
  801. void BeMCColorizer::Prepare()
  802. {
  803. mReserveParamRegs = false;
  804. mNodes.Resize(mContext->mVRegInfo.size());
  805. if (mContext->mDebugging)
  806. {
  807. NOP;
  808. }
  809. for (int vregIdx = 0; vregIdx < (int)mNodes.size(); vregIdx++)
  810. {
  811. auto node = &mNodes[vregIdx];
  812. node->Prepare();
  813. //node->mActualVRegIdx = vregIdx;
  814. auto vregInfo = mContext->mVRegInfo[vregIdx];
  815. if ((vregInfo->mIsRetVal) && (mContext->mCompositeRetVRegIdx != -1) && (vregIdx != mContext->mCompositeRetVRegIdx))
  816. continue;
  817. if (vregInfo->mRelTo)
  818. {
  819. BF_ASSERT(vregInfo->mIsExpr);
  820. /*if ((vregInfo->IsDirectRelTo()) && (vregInfo->mRelTo.mKind == BeMCOperandKind_VReg))
  821. node->mActualVRegIdx = vregInfo->mRelTo.mVRegIdx; */
  822. //node->mWantsReg = false;
  823. //vregInfo->mReg = X64Reg_None;
  824. //continue;
  825. }
  826. if ((vregInfo->mRefCount > 0) || (vregInfo->mIsRetVal))
  827. {
  828. node->mWantsReg = ((vregInfo->mType->mSize > 0) && (!vregInfo->mRegNumPinned) && (!vregInfo->mSpilled) &&
  829. (!vregInfo->mIsExpr) && (!vregInfo->mForceMem) && (vregInfo->mFrameOffset == INT_MIN));
  830. }
  831. // if (vregInfo->mIsRetVal)
  832. // node->mWantsReg = true;
  833. if (!node->mWantsReg)
  834. vregInfo->mReg = X64Reg_None;
  835. vregInfo->mVRegAffinity = -1;
  836. /*if (vregInfo->mForceReg)
  837. {
  838. // We can't have reg restrictions when we have forceReg set
  839. BF_ASSERT(!vregInfo->mDisableR12);
  840. BF_ASSERT(!vregInfo->mDisableRDX);
  841. }*/
  842. if (vregInfo->mDisableR11)
  843. node->AdjustRegCost(X64Reg_R11, 0x0FFFFFFF);
  844. if (vregInfo->mDisableR12)
  845. node->AdjustRegCost(X64Reg_R12, 0x0FFFFFFF);
  846. if (vregInfo->mDisableR13)
  847. node->AdjustRegCost(X64Reg_R13, 0x0FFFFFFF);
  848. if (vregInfo->mDisableRAX)
  849. node->AdjustRegCost(X64Reg_RAX, 0x0FFFFFFF);
  850. if (vregInfo->mDisableRDX)
  851. node->AdjustRegCost(X64Reg_RDX, 0x0FFFFFFF);
  852. if (vregInfo->mDisableEx)
  853. {
  854. for (int i = X64Reg_RSI; i <= X64Reg_R15; i++)
  855. node->AdjustRegCost((X64CPURegister)i, 0x0FFFFFFF);
  856. }
  857. }
  858. }
  859. void BeMCColorizer::AddEdge(int vreg0, int vreg1)
  860. {
  861. int checkVRegIdx0 = mContext->GetUnderlyingVReg(vreg0);
  862. int checkVRegIdx1 = mContext->GetUnderlyingVReg(vreg1);
  863. if (checkVRegIdx0 == checkVRegIdx1)
  864. return;
  865. auto node0 = &mNodes[checkVRegIdx0];
  866. auto node1 = &mNodes[checkVRegIdx1];
  867. if ((node0->mWantsReg) && (node1->mWantsReg))
  868. {
  869. node0->mEdges.Add(checkVRegIdx1);
  870. node1->mEdges.Add(checkVRegIdx0);
  871. }
  872. }
  873. void BeMCColorizer::PropogateMemCost(const BeMCOperand & operand, int memCost)
  874. {
  875. if (operand.IsVRegAny())
  876. {
  877. auto vregInfo = mContext->mVRegInfo[operand.mVRegIdx];
  878. mNodes[operand.mVRegIdx].mMemCost += memCost;
  879. PropogateMemCost(vregInfo->mRelTo, memCost);
  880. PropogateMemCost(vregInfo->mRelOffset, memCost);
  881. }
  882. }
  883. void BeMCColorizer::GenerateRegCosts()
  884. {
  885. bool doRegCost = true;
  886. // Disallow param reg cross-refs
  887. {
  888. Array<X64CPURegister> paramRegsLeft = mContext->mParamsUsedRegs;
  889. Array<int> prevRegMovs;
  890. auto mcBlock = mContext->mBlocks[0];
  891. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  892. {
  893. auto inst = mcBlock->mInstructions[instIdx];
  894. if ((inst->IsMov()) && (inst->mArg1.IsNativeReg()) && (!inst->mArg0.IsNativeReg()))
  895. {
  896. BF_ASSERT(inst->mArg0.IsVReg());
  897. int vregIdx = mContext->GetUnderlyingVReg(inst->mArg0.mVRegIdx);
  898. auto reg = mContext->ResizeRegister(inst->mArg1.mReg, 8);
  899. // Don't allow any previous "direct reg movs" assign to a vreg that gets bound
  900. // to this reg. This is to avoid "cross-referencing" param vregs. IE:
  901. // Mov %vreg0<RDX>, RCX
  902. // Mov %vreg1<RCX>, RDX
  903. // Because the first MOV would destroy the incoming RDX
  904. for (auto prevVRegIdx : prevRegMovs)
  905. {
  906. auto node = &mNodes[prevVRegIdx];
  907. node->AdjustRegCost(reg, 0x0FFFFFFF);
  908. }
  909. /*auto itr = std::find(paramRegsLeft.begin(), paramRegsLeft.end(), reg);
  910. if (itr != paramRegsLeft.end())
  911. {
  912. paramRegsLeft.erase(itr);
  913. if (paramRegsLeft.size() == 0)
  914. break;
  915. prevRegMovs.push_back(vregIdx);
  916. }*/
  917. if (paramRegsLeft.Remove(reg))
  918. {
  919. if (paramRegsLeft.size() == 0)
  920. break;
  921. prevRegMovs.push_back(vregIdx);
  922. }
  923. }
  924. }
  925. BF_ASSERT(paramRegsLeft.size() == 0);
  926. }
  927. int preserveDepth = 0;
  928. for (auto mcBlock : mContext->mBlocks)
  929. {
  930. int costMult = mcBlock->mIsLooped ? 4 : 1;
  931. for (int instIdx = (int)mcBlock->mInstructions.size() - 1; instIdx >= 0; instIdx--)
  932. {
  933. auto inst = mcBlock->mInstructions[instIdx];
  934. // We could adjust register cost based on a possibility of cross-dependencies that won't allow us
  935. // to reorder the movs for param setup
  936. if (inst->mKind == BeMCInstKind_PreserveVolatiles)
  937. {
  938. preserveDepth++;
  939. int preserveCost = 8 * costMult;
  940. if (inst->mArg0.mKind == BeMCOperandKind_PreserveFlag)
  941. {
  942. // Just use a small cost for NoReturns, those are implied to be "unlikely" paths (ie: errors)
  943. // But at the least, the code is smaller if we don't need to save the regs so use a small cost
  944. if ((inst->mArg0.mPreserveFlag & BeMCPreserveFlag_NoRestore) != 0)
  945. preserveCost = 1;
  946. }
  947. auto restoreIdx = mContext->FindRestoreVolatiles(mcBlock, instIdx);
  948. if (restoreIdx == -1)
  949. restoreIdx = mcBlock->mInstructions.size() - 1; // 'Ret'
  950. auto restoreInst = mcBlock->mInstructions[restoreIdx];
  951. // Any vregs alive during this call will incur a cost of saving/restoring if we allocate onto a volatile register.
  952. // If the vreg is either input-only or output-only (short lived temporary) then we can map it directly to a volatile register
  953. for (int vregIdx : *inst->mLiveness)
  954. {
  955. if (vregIdx >= mContext->mLivenessContext.mNumItems)
  956. continue;
  957. auto checkVRegIdx = mContext->GetUnderlyingVReg(vregIdx);
  958. // Already handled the underlying vreg?
  959. if ((checkVRegIdx != vregIdx) && (mContext->mLivenessContext.IsSet(inst->mLiveness, checkVRegIdx)))
  960. continue;
  961. if (mContext->mLivenessContext.IsSet(restoreInst->mLiveness, vregIdx))
  962. {
  963. auto node = &mNodes[checkVRegIdx];
  964. if (inst->mArg0.IsNativeReg())
  965. {
  966. // Only one specific register used being preserved
  967. node->AdjustRegCost(inst->mArg0.mReg, preserveCost);
  968. }
  969. else
  970. {
  971. // All volatile registers preserved
  972. for (auto reg : gVolatileRegs)
  973. {
  974. node->AdjustRegCost(reg, preserveCost);
  975. }
  976. }
  977. }
  978. }
  979. }
  980. else if (inst->mKind == BeMCInstKind_RestoreVolatiles)
  981. {
  982. preserveDepth--;
  983. }
  984. if (inst->IsPsuedo())
  985. continue;
  986. // If both args are non-registers then we presume we may have to create a scratch register
  987. // so inflate the cost. Note that the first time through, this will presumably occur for all
  988. // operations but we can change our minds as instructions are legalized
  989. if ((inst->mArg0.IsVReg()) && (inst->mArg1.IsVReg()))
  990. {
  991. auto vregInfo0 = mContext->mVRegInfo[inst->mArg0.mVRegIdx];
  992. auto vregInfo1 = mContext->mVRegInfo[inst->mArg1.mVRegIdx];
  993. if ((vregInfo0->mReg == X64Reg_None) && (vregInfo1->mReg == X64Reg_None))
  994. {
  995. Node* node0 = &mNodes[inst->mArg1.mVRegIdx];
  996. Node* node1 = &mNodes[inst->mArg1.mVRegIdx];
  997. node0->mMemCost += 4 * costMult;
  998. node1->mMemCost += 4 * costMult;
  999. }
  1000. }
  1001. if ((inst->mKind == BeMCInstKind_Div) || (inst->mKind == BeMCInstKind_IDiv))
  1002. {
  1003. if (inst->mArg0.IsVReg())
  1004. {
  1005. Node* node = &mNodes[inst->mArg0.mVRegIdx];
  1006. int adjustCost = -4;
  1007. if (preserveDepth >= 2)
  1008. {
  1009. // This has to be large enough to counteract the 'PreserveVolatile RAX'
  1010. adjustCost -= 8;
  1011. }
  1012. node->AdjustRegCost(X64Reg_RAX, costMult * adjustCost);
  1013. continue;
  1014. }
  1015. }
  1016. if (inst->mKind == BeMCInstKind_MovSX)
  1017. {
  1018. // We can only perform MovSX on reg targets
  1019. if (inst->mArg0.IsVReg())
  1020. mNodes[inst->mArg0.mVRegIdx].mMemCost += 4 * costMult;
  1021. }
  1022. if (inst->mKind == BeMCInstKind_Mov)
  1023. {
  1024. if ((inst->mArg0.mKind == BeMCOperandKind_VReg) &&
  1025. (inst->mArg1.mKind == BeMCOperandKind_VReg))
  1026. {
  1027. int arg0Idx = mContext->GetUnderlyingVReg(inst->mArg0.mVRegIdx);
  1028. int arg1Idx = mContext->GetUnderlyingVReg(inst->mArg1.mVRegIdx);
  1029. auto vregInfo0 = mContext->mVRegInfo[arg0Idx];
  1030. auto vregInfo1 = mContext->mVRegInfo[arg1Idx];
  1031. if (vregInfo0->mVRegAffinity == -1)
  1032. vregInfo0->mVRegAffinity = arg1Idx;
  1033. if (vregInfo1->mVRegAffinity == -1)
  1034. vregInfo1->mVRegAffinity = arg0Idx;
  1035. }
  1036. }
  1037. if (inst->mKind == BeMCInstKind_Call)
  1038. {
  1039. if (inst->mArg0.IsVRegAny())
  1040. {
  1041. for (int checkInstIdx = instIdx - 1; checkInstIdx >= 0; checkInstIdx--)
  1042. {
  1043. auto checkInst = mcBlock->mInstructions[checkInstIdx];
  1044. if ((checkInst->mKind == BeMCInstKind_Mov) && (checkInst->mArg0.IsNativeReg()))
  1045. {
  1046. // This can save us from needing to mov the call addr to RAX before the call
  1047. mNodes[inst->mArg0.mVRegIdx].AdjustRegCost(checkInst->mArg0.mReg, 2 * costMult);
  1048. }
  1049. else
  1050. break;
  1051. }
  1052. }
  1053. }
  1054. if (inst->IsMov())
  1055. {
  1056. auto argTo = inst->mArg0;
  1057. auto vregInfo = mContext->GetVRegInfo(argTo);
  1058. if ((vregInfo != NULL) && (vregInfo->IsDirectRelTo()))
  1059. argTo = vregInfo->mRelTo;
  1060. auto argFrom = inst->mArg1;
  1061. vregInfo = mContext->GetVRegInfo(argFrom);
  1062. if ((vregInfo != NULL) && (vregInfo->IsDirectRelTo()))
  1063. argFrom = vregInfo->mRelTo;
  1064. if (argTo == argFrom)
  1065. continue;
  1066. }
  1067. auto operands = { &inst->mResult, &inst->mArg0, &inst->mArg1 };
  1068. for (auto operand : operands)
  1069. {
  1070. if (operand->IsVRegAny())
  1071. {
  1072. Node* node = &mNodes[operand->mVRegIdx];
  1073. auto vregInfo = mContext->mVRegInfo[operand->mVRegIdx];
  1074. if ((vregInfo->mIsRetVal) && (mContext->mCompositeRetVRegIdx != -1))
  1075. vregInfo = mContext->mVRegInfo[mContext->mCompositeRetVRegIdx];
  1076. if (operand->mKind == BeMCOperandKind_VRegLoad)
  1077. {
  1078. // We propagate this mem cost to RelTo/RelOffset layer
  1079. Node* node = &mNodes[operand->mVRegIdx];
  1080. node->mMemCost += 6 * costMult;
  1081. }
  1082. while (vregInfo->IsDirectRelTo())
  1083. {
  1084. node = &mNodes[vregInfo->mRelTo.mVRegIdx];
  1085. vregInfo = mContext->mVRegInfo[vregInfo->mRelTo.mVRegIdx];
  1086. }
  1087. node->mMemCost += 4 * costMult;
  1088. if (vregInfo->mRelTo.IsVRegAny())
  1089. mNodes[vregInfo->mRelTo.mVRegIdx].mMemCost += 4 * costMult;
  1090. if (vregInfo->mRelOffset.IsVRegAny()) // Higher cost, will definitely require a reg
  1091. mNodes[vregInfo->mRelOffset.mVRegIdx].mMemCost += 8 * costMult;
  1092. if (inst->IsMov())
  1093. {
  1094. if (operand != &inst->mResult)
  1095. {
  1096. auto otherReg = X64Reg_None;
  1097. if (operand == &inst->mArg0)
  1098. {
  1099. if (inst->mArg1.mKind == BeMCOperandKind_NativeReg)
  1100. otherReg = inst->mArg1.mReg;
  1101. if (inst->mArg1.IsImmediateFloat()) // Moving a float immediate into memory takes two instructions
  1102. node->mMemCost += 4 * costMult;
  1103. }
  1104. else
  1105. {
  1106. if (inst->mArg0.mKind == BeMCOperandKind_NativeReg)
  1107. otherReg = inst->mArg0.mReg;
  1108. }
  1109. // If we assigned ourselves to this reg then it would be a "mov reg, reg" which could
  1110. // be eliminated so the cost is negative. We could be tempted to more strongly favor this,
  1111. // but that could cause RAX to be used for __return when it would be less costly to use
  1112. // memory so we don't have to preserve/restore it across call boundaries
  1113. if (otherReg != X64Reg_None)
  1114. node->AdjustRegCost(mContext->ResizeRegister(otherReg, 8), -2 * costMult);
  1115. }
  1116. }
  1117. }
  1118. }
  1119. }
  1120. }
  1121. for (int nodeIdx = 0; nodeIdx < (int)mNodes.size(); nodeIdx++)
  1122. {
  1123. auto node = &mNodes[nodeIdx];
  1124. if (node->mMemCost > 0)
  1125. {
  1126. auto vregInfo = mContext->mVRegInfo[nodeIdx];
  1127. if (vregInfo->mIsExpr)
  1128. {
  1129. PropogateMemCost(vregInfo->mRelTo, node->mMemCost);
  1130. PropogateMemCost(vregInfo->mRelOffset, node->mMemCost);
  1131. }
  1132. }
  1133. }
  1134. BF_ASSERT(preserveDepth == 0);
  1135. }
  1136. void BeMCColorizer::AssignRegs(RegKind regKind)
  1137. {
  1138. if (mContext->mDebugging)
  1139. {
  1140. NOP;
  1141. }
  1142. X64CPURegister highestReg;
  1143. int totalRegs32 = 0;
  1144. int totalRegs16 = 0;
  1145. SizedArray<X64CPURegister, 32> validRegs;
  1146. if (regKind == BeMCColorizer::RegKind_Ints)
  1147. {
  1148. highestReg = X64Reg_R15;
  1149. validRegs = { X64Reg_RAX, X64Reg_RBX, X64Reg_RCX, X64Reg_RDX, X64Reg_RSI, X64Reg_RDI, X64Reg_R8,
  1150. X64Reg_R9, X64Reg_R10, X64Reg_R11, X64Reg_R12, X64Reg_R13, X64Reg_R14, X64Reg_R15 };
  1151. }
  1152. else
  1153. {
  1154. highestReg = X64Reg_XMM15_f64;
  1155. validRegs = {
  1156. X64Reg_XMM0_f64, X64Reg_XMM1_f64, X64Reg_XMM2_f64, X64Reg_XMM3_f64,
  1157. X64Reg_XMM4_f64, X64Reg_XMM5_f64, X64Reg_XMM6_f64, X64Reg_XMM7_f64,
  1158. X64Reg_XMM8_f64, X64Reg_XMM9_f64, X64Reg_XMM10_f64, X64Reg_XMM11_f64,
  1159. X64Reg_XMM12_f64, X64Reg_XMM13_f64, X64Reg_XMM14_f64, X64Reg_XMM15_f64 };
  1160. }
  1161. int totalRegs = (int)validRegs.size();
  1162. #define BF_DEQUE
  1163. #ifdef BF_DEQUE
  1164. std::deque<int> vregStack;
  1165. #else
  1166. std::vector<int> vregStack;
  1167. #endif
  1168. //vregStack.reserve(mNodes.size());
  1169. SizedArray<int, 32> vregHiPriStack;
  1170. vregHiPriStack.reserve(mNodes.size());
  1171. SizedArray<int, 32> vregGraph;
  1172. vregGraph.reserve(mNodes.size());
  1173. SizedArray<int, 32> orderedSpillList;
  1174. //
  1175. {
  1176. BP_ZONE("AssignRegs:vregGraph build");
  1177. for (int vregIdx = (int)mNodes.size() - 1; vregIdx >= 0; vregIdx--)
  1178. {
  1179. auto node = &mNodes[vregIdx];
  1180. if (node->mWantsReg)
  1181. {
  1182. auto vregInfo = mContext->mVRegInfo[vregIdx];
  1183. bool canBeReg = false;
  1184. if (regKind == RegKind_Ints)
  1185. {
  1186. if ((vregInfo->mType->IsInt()) || (vregInfo->mType->mTypeCode == BeTypeCode_Boolean) || (vregInfo->mType->mTypeCode == BeTypeCode_Pointer))
  1187. canBeReg = true;
  1188. }
  1189. else if (regKind == RegKind_Floats)
  1190. {
  1191. if (vregInfo->mType->IsFloat())
  1192. canBeReg = true;
  1193. }
  1194. if (canBeReg)
  1195. {
  1196. node->mInGraph = true;
  1197. node->mGraphEdgeCount = 0;
  1198. vregGraph.push_back(vregIdx);
  1199. }
  1200. else
  1201. {
  1202. node->mInGraph = false;
  1203. }
  1204. }
  1205. }
  1206. }
  1207. for (int vregIdx = (int)mNodes.size() - 1; vregIdx >= 0; vregIdx--)
  1208. {
  1209. auto node = &mNodes[vregIdx];
  1210. if (node->mInGraph)
  1211. {
  1212. for (auto connNodeIdx : node->mEdges)
  1213. {
  1214. Node* connNode = &mNodes[connNodeIdx];
  1215. if (connNode->mInGraph)
  1216. node->mGraphEdgeCount++;
  1217. }
  1218. }
  1219. }
  1220. //TODO: This sort was meaningless I think...
  1221. //int xorVal = 227;
  1222. // For vregs that have a 'preferred register', make sure we pop those off the stack first to help
  1223. // ensure they actually get that assignment
  1224. //std::stable_sort(vregGraph.begin(), vregGraph.end(), [&] (int lhs, int rhs)
  1225. // {
  1226. // auto lhsInfo = mContext->mVRegInfo[lhs];
  1227. // auto rhsInfo = mContext->mVRegInfo[rhs];
  1228. // if (lhsInfo->mForceReg != rhsInfo->mForceReg)
  1229. // return !lhsInfo->mForceReg;
  1230. // return mNodes[lhs].mLowestRegCost > mNodes[rhs].mLowestRegCost;
  1231. // //return (lhs ^ xorVal) < (rhs ^ xorVal);
  1232. // });
  1233. //
  1234. {
  1235. int graphSize = (int)vregGraph.size();
  1236. BP_ZONE("AssignRegs:buildStack");
  1237. while (graphSize > 0)
  1238. {
  1239. bool hadNewStackItem = false;
  1240. #ifdef _DEBUG
  1241. // for (int graphIdx = 0; graphIdx < (int)vregGraph.size(); graphIdx++)
  1242. // {
  1243. // int validatedCount = 0;
  1244. // int vregIdx = vregGraph[graphIdx];
  1245. // if (vregIdx == -1)
  1246. // continue;
  1247. // Node* node = &mNodes[vregIdx];
  1248. // for (auto connNodeIdx : node->mEdges)
  1249. // {
  1250. // Node* connNode = &mNodes[connNodeIdx];
  1251. // if (connNode->mInGraph)
  1252. // validatedCount++;
  1253. // }
  1254. // BF_ASSERT(validatedCount == node->mGraphEdgeCount);
  1255. // }
  1256. #endif
  1257. for (int graphIdx = 0; graphIdx < (int)vregGraph.size(); graphIdx++)
  1258. {
  1259. int vregIdx = vregGraph[graphIdx];
  1260. if (vregIdx == -1)
  1261. continue;
  1262. Node* node = &mNodes[vregIdx];
  1263. auto vregInfo = mContext->mVRegInfo[vregIdx];
  1264. int validRegCount = (int)validRegs.size();
  1265. BF_ASSERT(node->mGraphEdgeCount <= vregGraph.size() - 1);
  1266. if ((node->mSpilled) || (node->mGraphEdgeCount < validRegCount))
  1267. {
  1268. node->mInGraph = false;
  1269. for (auto connNodeIdx : node->mEdges)
  1270. {
  1271. Node* connNode = &mNodes[connNodeIdx];
  1272. connNode->mGraphEdgeCount--;
  1273. }
  1274. vregGraph[graphIdx] = -1;
  1275. graphSize--;
  1276. if (!node->mSpilled)
  1277. {
  1278. vregStack.push_back(vregIdx);
  1279. hadNewStackItem = true;
  1280. }
  1281. else
  1282. {
  1283. // We insert spills at the front so we can try to "optimistically" unspill them
  1284. // after all the definite coloring is done
  1285. #ifdef BF_DEQUE
  1286. vregStack.push_front(vregIdx);
  1287. #else
  1288. vregStack.insert(vregStack.begin(), vregIdx);
  1289. #endif
  1290. }
  1291. }
  1292. }
  1293. if (!hadNewStackItem)
  1294. {
  1295. BP_ZONE("Spill");
  1296. // We need to spill!
  1297. int bestSpillVReg = -1;
  1298. for (int regPassIdx = 0; regPassIdx < 2; regPassIdx++)
  1299. {
  1300. while (!orderedSpillList.empty())
  1301. {
  1302. int vregIdx = orderedSpillList.back();
  1303. orderedSpillList.pop_back();
  1304. if (mNodes[vregIdx].mInGraph)
  1305. {
  1306. bestSpillVReg = vregIdx;
  1307. break;
  1308. }
  1309. }
  1310. if (bestSpillVReg != -1)
  1311. break;
  1312. // Order by mem cost
  1313. orderedSpillList.reserve(vregGraph.size());
  1314. for (int graphIdx = 0; graphIdx < (int)vregGraph.size(); graphIdx++)
  1315. {
  1316. int vregIdx = vregGraph[graphIdx];
  1317. if (vregIdx == -1)
  1318. continue;
  1319. auto vregInfo = mContext->mVRegInfo[vregIdx];
  1320. if (vregInfo->mForceReg)
  1321. continue;
  1322. orderedSpillList.push_back(vregIdx);
  1323. }
  1324. std::sort(orderedSpillList.begin(), orderedSpillList.end(), [&](int lhs, int rhs)
  1325. {
  1326. return mNodes[lhs].mMemCost > mNodes[rhs].mMemCost;
  1327. });
  1328. }
  1329. /*int bestSpillVReg = -1;
  1330. int bestSpillCost = INT_MAX;
  1331. // We need to spill now! Try to spill something with the fewest references
  1332. for (int graphIdx = 0; graphIdx < (int)vregGraph.size(); graphIdx++)
  1333. {
  1334. int vregIdx = vregGraph[graphIdx];
  1335. auto vregInfo = mContext->mVRegInfo[vregIdx];
  1336. if (vregInfo->mForceReg)
  1337. continue;
  1338. if (vregInfo->mRefCount < bestSpillCost)
  1339. {
  1340. bestSpillCost = vregInfo->mRefCount;
  1341. bestSpillVReg = vregIdx;
  1342. }
  1343. }*/
  1344. if (bestSpillVReg != -1)
  1345. {
  1346. auto node = &mNodes[bestSpillVReg];
  1347. node->mSpilled = true;
  1348. auto spillVRegInfo = mContext->mVRegInfo[bestSpillVReg];
  1349. spillVRegInfo->mSpilled = true;
  1350. }
  1351. else
  1352. {
  1353. mContext->Fail("Unable to spill vreg");
  1354. }
  1355. }
  1356. }
  1357. }
  1358. SizedArray<bool, 32> globalRegUsedVec;
  1359. globalRegUsedVec.resize(highestReg + 1);
  1360. SizedArray<bool, 32> regUsedVec;
  1361. regUsedVec.resize(highestReg + 1);
  1362. /*String dbgStr;
  1363. if (mContext->mDebugging)
  1364. dbgStr += "AssignRegs ";*/
  1365. BP_ZONE("AssignRegs:assign");
  1366. while (vregStack.size() > 0)
  1367. {
  1368. int vregIdx = vregStack.back();
  1369. vregStack.pop_back();
  1370. /*if (mContext->mDebugging)
  1371. {
  1372. dbgStr += StrFormat("VReg %d ", vregIdx);
  1373. }*/
  1374. BeMCVRegInfo* vregInfo = mContext->mVRegInfo[vregIdx];
  1375. Node* node = &mNodes[vregIdx];
  1376. if (vregInfo->mVRegAffinity != -1)
  1377. {
  1378. auto affinityVRegInfo = mContext->mVRegInfo[vregInfo->mVRegAffinity];
  1379. if (affinityVRegInfo->mReg != X64Reg_None)
  1380. node->AdjustRegCost(affinityVRegInfo->mReg, -2);
  1381. }
  1382. for (int i = 0; i <= highestReg; i++)
  1383. regUsedVec[i] = false;
  1384. if (mReserveParamRegs)
  1385. {
  1386. // This is a fallback case for when the "streams get crossed" during initialization-
  1387. // IE: when arg0 gets assigned to RDX and arg1 gets assigned to RCX and we end up with:
  1388. // MOV arg0<RDX>, RCX
  1389. // MOV arg1<RCX>, RDX
  1390. // Which is bad.
  1391. for (auto reg : mContext->mParamsUsedRegs)
  1392. {
  1393. if (((int)reg < regUsedVec.size()) && (reg != vregInfo->mNaturalReg))
  1394. regUsedVec[(int)reg] = true;
  1395. }
  1396. }
  1397. for (auto connNodeIdx : node->mEdges)
  1398. {
  1399. Node* connNode = &mNodes[connNodeIdx];
  1400. if (connNode->mInGraph)
  1401. {
  1402. auto connVRegInfo = mContext->mVRegInfo[connNodeIdx];
  1403. auto usedReg = mContext->ResizeRegister(connVRegInfo->mReg, 8);
  1404. BF_ASSERT(usedReg != X64Reg_None);
  1405. regUsedVec[(int)usedReg] = true;
  1406. }
  1407. }
  1408. auto bestReg = X64Reg_None;
  1409. int bestRegCost = 0x07FFFFFF; // 0x0FFFFFFF is considered illegal for a reg, so set the mem cost to lower than that...;
  1410. // This is the cost of just leaving the vreg as a memory access. In cases where we bind to a volatile
  1411. // register, we need to consider the cost of preserving and restoring that register across calls, so
  1412. // it cases where we have just a few accesses to this vreg but it spans a lot of calls then we just
  1413. // leave it as memory
  1414. if (!vregInfo->mForceReg)
  1415. bestRegCost = node->mMemCost;
  1416. //for (auto validReg : validRegs)
  1417. int validRegCount = (int)validRegs.size();
  1418. for (int regIdx = 0; regIdx < validRegCount; regIdx++)
  1419. {
  1420. auto validReg = validRegs[regIdx];
  1421. if (!regUsedVec[(int)validReg])
  1422. {
  1423. int checkCost = node->mRegCost[(int)validReg];
  1424. // If this register is non-volatile then we'd have to save and restore it, which costs... unless
  1425. // some other vreg has already used this, then there's no additional cost
  1426. if ((!globalRegUsedVec[(int)validReg]) && (!mContext->IsVolatileReg(validReg)))
  1427. {
  1428. int costMult = 1;
  1429. if (regKind == BeMCColorizer::RegKind_Floats)
  1430. costMult = 2;
  1431. checkCost += 7 * costMult;
  1432. }
  1433. if (checkCost < bestRegCost)
  1434. {
  1435. // Try not to use registers that other params may want
  1436. for (auto argReg : mContext->mParamsUsedRegs)
  1437. {
  1438. if (validReg == argReg)
  1439. checkCost += 1;
  1440. }
  1441. }
  1442. /*if (mContext->mDebugging)
  1443. {
  1444. dbgStr += StrFormat("Cost %d:%d ", validReg, checkCost);
  1445. }*/
  1446. if (checkCost < bestRegCost)
  1447. {
  1448. bestReg = validReg;
  1449. bestRegCost = checkCost;
  1450. }
  1451. }
  1452. }
  1453. if (mContext->mDebugging)
  1454. {
  1455. //auto itr = mContext->mDbgPreferredRegs.find(vregIdx);
  1456. //if (itr != mContext->mDbgPreferredRegs.end())
  1457. X64CPURegister* regPtr = NULL;
  1458. if (mContext->mDbgPreferredRegs.TryGetValue(vregIdx, &regPtr))
  1459. {
  1460. auto reg = *regPtr;
  1461. if (reg == X64Reg_None)
  1462. {
  1463. if (!vregInfo->mForceReg)
  1464. bestReg = reg;
  1465. }
  1466. else
  1467. {
  1468. if (!regUsedVec[(int)reg])
  1469. bestReg = reg;
  1470. }
  1471. }
  1472. }
  1473. if (vregInfo->mSpilled)
  1474. {
  1475. if (bestReg != X64Reg_None)
  1476. {
  1477. // We managed to optimistically unspill
  1478. vregInfo->mSpilled = false;
  1479. }
  1480. }
  1481. else
  1482. {
  1483. if (vregInfo->mForceReg)
  1484. {
  1485. // We didn't end up with a usable reg -- steal a reg from one of our edges
  1486. if (bestReg == X64Reg_None)
  1487. {
  1488. int bestSpillVReg = -1;
  1489. int bestSpillCost = INT_MAX;
  1490. for (auto connNodeIdx : node->mEdges)
  1491. {
  1492. Node* connNode = &mNodes[connNodeIdx];
  1493. if (connNode->mInGraph)
  1494. {
  1495. auto connVRegInfo = mContext->mVRegInfo[connNodeIdx];
  1496. auto usedReg = mContext->ResizeRegister(connVRegInfo->mReg, 8);
  1497. if (connVRegInfo->mForceReg)
  1498. continue;
  1499. if (node->mRegCost[usedReg] < 0x07FFFFFFF)
  1500. {
  1501. if (connVRegInfo->mRefCount < bestSpillCost)
  1502. {
  1503. bestSpillCost = connVRegInfo->mRefCount;
  1504. bestSpillVReg = connNodeIdx;
  1505. }
  1506. }
  1507. }
  1508. }
  1509. if (bestSpillVReg != -1)
  1510. {
  1511. /*if (mContext->mDebugging)
  1512. {
  1513. dbgStr += StrFormat("StealingVReg %d ", bestSpillVReg);
  1514. }*/
  1515. auto connNode = &mNodes[bestSpillVReg];
  1516. auto connVRegInfo = mContext->mVRegInfo[bestSpillVReg];
  1517. bestReg = mContext->ResizeRegister(connVRegInfo->mReg, 8);
  1518. connVRegInfo->mReg = X64Reg_None;
  1519. connNode->mSpilled = true;
  1520. connVRegInfo->mSpilled = true;
  1521. connNode->mInGraph = false;
  1522. for (auto connNodeEdgeIdx : connNode->mEdges)
  1523. {
  1524. Node* connNodeEdge = &mNodes[connNodeEdgeIdx];
  1525. connNodeEdge->mGraphEdgeCount--;
  1526. }
  1527. // We insert spills at the front so we can try to "optimistically" unspill them
  1528. // after all the definite coloring is done
  1529. vregStack.insert(vregStack.begin(), bestSpillVReg);
  1530. }
  1531. }
  1532. // The only way we should have failed to allocate a register is if we spilled...
  1533. BF_ASSERT((bestReg != X64Reg_None) /*|| (mReserveParamRegs)*/);
  1534. }
  1535. }
  1536. vregInfo->mReg = mContext->ResizeRegister(bestReg, vregInfo->mType->mSize);
  1537. if (bestReg != X64Reg_None)
  1538. {
  1539. node->mInGraph = true;
  1540. globalRegUsedVec[(int)bestReg] = true;
  1541. for (auto connNodeIdx : node->mEdges)
  1542. {
  1543. Node* connNode = &mNodes[connNodeIdx];
  1544. connNode->mGraphEdgeCount++;
  1545. }
  1546. }
  1547. /*if (mContext->mDebugging)
  1548. {
  1549. dbgStr += StrFormat("Reg %d ", vregInfo->mReg);
  1550. }*/
  1551. }
  1552. /*if (!dbgStr.empty())
  1553. {
  1554. dbgStr += "\n\n";
  1555. OutputDebugStr(dbgStr);
  1556. }*/
  1557. /*bool dumpStats = true;
  1558. if (dumpStats)
  1559. {
  1560. String str;
  1561. str += "Register costs:\n";
  1562. str += " Mem ";
  1563. for (int regNum = 0; regNum <= X64Reg_EDI; regNum++)
  1564. {
  1565. str += StrFormat("%4s", X64CPURegisters::GetRegisterName((X64CPURegister)regNum));
  1566. }
  1567. str += "\n";
  1568. for (int liveVRregIdx = 0; liveVRregIdx < mContext->mVRegInfo.size(); liveVRregIdx++)
  1569. {
  1570. auto vregInfo = mContext->mVRegInfo[liveVRregIdx];
  1571. auto node = &mNodes[liveVRregIdx];
  1572. String name = mContext->ToString(BeMCOperand::FromVReg(liveVRregIdx));
  1573. str += StrFormat("%24s", name.c_str());
  1574. str += StrFormat(" %3d", node->mMemCost);
  1575. for (int regNum = 0; regNum <= X64Reg_EDI; regNum++)
  1576. {
  1577. str += StrFormat(" %3d", node->mRegCost[regNum]);
  1578. }
  1579. str += "\n";
  1580. }
  1581. OutputDebugStr(str);
  1582. }*/
  1583. }
  1584. bool BeMCColorizer::Validate()
  1585. {
  1586. #ifdef _DEBUG
  1587. auto paramsLeft = mContext->mParamsUsedRegs;
  1588. for (auto mcBlock : mContext->mBlocks)
  1589. {
  1590. for (auto inst : mcBlock->mInstructions)
  1591. {
  1592. if (paramsLeft.size() == 0)
  1593. break;
  1594. if (inst->IsMov())
  1595. {
  1596. if (inst->mArg1.IsNativeReg())
  1597. {
  1598. BF_ASSERT(inst->mArg0.IsVReg());
  1599. BF_ASSERT(mContext->ResizeRegister(inst->mArg1.mReg, 8) == paramsLeft[0]);
  1600. paramsLeft.erase(paramsLeft.begin());
  1601. auto vregInfo = mContext->mVRegInfo[inst->mArg0.mVRegIdx];
  1602. if (vregInfo->mReg != X64Reg_None)
  1603. {
  1604. auto checkReg = mContext->ResizeRegister(vregInfo->mReg, 8);
  1605. //auto itr = std::find(paramsLeft.begin(), paramsLeft.end(), checkReg);
  1606. //if (itr != paramsLeft.end())
  1607. if (paramsLeft.Contains(checkReg))
  1608. {
  1609. // This will happen if we have assigned a 'wrong' register to a parameter-
  1610. // a register that is not the 'natural' register (ie: rcx for param0),
  1611. // but it's a register that is already bound to another parameter which
  1612. // will be needed later. Given the 'natural' order of RCX, RDX, R8, R9,
  1613. // This is a valid order still: R10, RCX, R8, R9 since RCX will get written
  1614. // to R10 first so it won't get clobbered, but: RDX, R10, R8, R9 is not
  1615. // valid because RDX gets clobbered before it can be written to R10.
  1616. return false;
  1617. }
  1618. }
  1619. }
  1620. }
  1621. }
  1622. }
  1623. #endif
  1624. return true;
  1625. }
  1626. //////////////////////////////////////////////////////////////////////////
  1627. BeMCLoopDetector::BeMCLoopDetector(BeMCContext* context) : mTrackingContext(context)
  1628. {
  1629. mMCContext = context;
  1630. mTrackingContext.mTrackKindCount = 1;
  1631. mTrackingContext.Init((int)mMCContext->mMCBlockAlloc.size());
  1632. mNodes.Resize(mMCContext->mMCBlockAlloc.size());
  1633. }
  1634. void BeMCLoopDetector::DetectLoops(BeMCBlock* mcBlock, BeVTrackingList* predBlocksSeen)
  1635. {
  1636. mMCContext->mDetectLoopIdx++;
  1637. auto node = &mNodes[mcBlock->mBlockIdx];
  1638. auto blocksSeen = mTrackingContext.Merge(node->mPredBlocksSeen, predBlocksSeen);
  1639. if (blocksSeen == node->mPredBlocksSeen)
  1640. return;
  1641. node->mPredBlocksSeen = blocksSeen;
  1642. //SizedArray<int, 2> addVec = { mcBlock->mBlockIdx };
  1643. //auto newBlocksSeen = mTrackingContext.Add(blocksSeen, addVec, false);
  1644. auto newBlocksSeen = mTrackingContext.Add(blocksSeen, mcBlock->mBlockIdx, false);
  1645. if (newBlocksSeen == blocksSeen)
  1646. {
  1647. // Our ID was already set, so this is a re-entry and thus we are looped
  1648. mcBlock->mIsLooped = true;
  1649. }
  1650. blocksSeen = newBlocksSeen;
  1651. for (auto succ : mcBlock->mSuccs)
  1652. {
  1653. DetectLoops(succ, blocksSeen);
  1654. }
  1655. }
  1656. void BeMCLoopDetector::DetectLoops()
  1657. {
  1658. // auto blocksSeen = mTrackingContext.AllocEmptyList();
  1659. // DetectLoops(mMCContext->mBlocks[0], blocksSeen);
  1660. //
  1661. // HashSet<int> wasLooped;
  1662. // for (auto block : mMCContext->mBlocks)
  1663. // {
  1664. // if (block->mIsLooped)
  1665. // {
  1666. // wasLooped.Add(block->mBlockIdx);
  1667. // block->mIsLooped = false;
  1668. // }
  1669. // }
  1670. for (auto block : mMCContext->mBlocks)
  1671. {
  1672. for (auto succ : block->mSuccs)
  1673. {
  1674. if (succ->mBlockIdx < block->mBlockIdx)
  1675. {
  1676. auto prevBlock = mMCContext->mBlocks[block->mBlockIdx - 1];
  1677. //if ((!succ->mIsLooped) || (!prevBlock->mIsLooped))
  1678. {
  1679. for (int setBlockIdx = succ->mBlockIdx; setBlockIdx < block->mBlockIdx; setBlockIdx++)
  1680. mMCContext->mBlocks[setBlockIdx]->mIsLooped = true;
  1681. }
  1682. }
  1683. }
  1684. }
  1685. }
  1686. //////////////////////////////////////////////////////////////////////////
  1687. void BeMCBlock::AddPred(BeMCBlock* pred)
  1688. {
  1689. if (!mPreds.Contains(pred))
  1690. {
  1691. pred->mSuccs.push_back(this);
  1692. mPreds.push_back(pred);
  1693. }
  1694. }
  1695. int BeMCBlock::FindLabelInstIdx(int labelIdx)
  1696. {
  1697. for (int instIdx = 0; instIdx < (int)mInstructions.size(); instIdx++)
  1698. {
  1699. auto inst = mInstructions[instIdx];
  1700. if ((inst->mKind == BeMCInstKind_Label) && (inst->mArg0.mLabelIdx == labelIdx))
  1701. return instIdx;
  1702. }
  1703. return -1;
  1704. }
  1705. //////////////////////////////////////////////////////////////////////////
  1706. BeMCContext::BeMCContext(BeCOFFObject* coffObject) : mOut(coffObject->mTextSect.mData), mLivenessContext(this), mVRegInitializedContext(this), mColorizer(this)
  1707. {
  1708. mLivenessContext.mTrackKindCount = 1;
  1709. mCOFFObject = coffObject;
  1710. mModule = NULL;
  1711. mBeFunction = NULL;
  1712. mActiveBeBlock = NULL;
  1713. mActiveBlock = NULL;
  1714. mDbgFunction = NULL;
  1715. mCompositeRetVRegIdx = -1;
  1716. mTLSVRegIdx = -1;
  1717. mStackSize = 0;
  1718. mCurLabelIdx = 0;
  1719. mCurPhiIdx = 0;
  1720. mMaxCallParamCount = -1;
  1721. mCurDbgLoc = NULL;
  1722. mCurVRegsInit = NULL;
  1723. mCurVRegsLive = NULL;
  1724. mUseBP = false;
  1725. mInsertInstIdxRef = NULL;
  1726. mNativeIntType = mCOFFObject->mBeModule->mContext->GetPrimitiveType(BeTypeCode_Int64);
  1727. mDebugging = false;
  1728. mFailed = false;
  1729. mDetectLoopIdx = 0;
  1730. }
  1731. void BeMCContext::NotImpl()
  1732. {
  1733. Fail("Not implemented");
  1734. }
  1735. void BeMCContext::Fail(const StringImpl& str)
  1736. {
  1737. String errStr = StrFormat("Failure during codegen of %s in %s: %s", mBeFunction->mName.c_str(), mModule->mModuleName.c_str(), str.c_str());
  1738. BfpSystem_FatalError(errStr.c_str(), "FATAL ERROR");
  1739. }
  1740. void BeMCContext::SoftFail(const StringImpl& str, BeDbgLoc* dbgLoc)
  1741. {
  1742. if (mFailed)
  1743. return;
  1744. mFailed = true;
  1745. String errStr = StrFormat("Failure during codegen of %s: %s", mBeFunction->mName.c_str(), str.c_str());
  1746. if (dbgLoc != NULL)
  1747. {
  1748. auto dbgFile = dbgLoc->GetDbgFile();
  1749. if (dbgFile != NULL)
  1750. errStr += StrFormat(" at line %d:%d in %s/%s", dbgLoc->mLine + 1, dbgLoc->mColumn + 1, dbgFile->mDirectory.c_str(), dbgFile->mFileName.c_str());
  1751. }
  1752. mModule->mBeIRCodeGen->Fail(errStr);
  1753. }
  1754. String BeMCContext::ToString(const BeMCOperand& operand)
  1755. {
  1756. if (operand.mKind == BeMCOperandKind_NativeReg)
  1757. {
  1758. return String("%") + X64CPURegisters::GetRegisterName((int)operand.mReg);
  1759. }
  1760. if (operand.IsVRegAny())
  1761. {
  1762. auto vregInfo = GetVRegInfo(operand);
  1763. String str;
  1764. mModule->ToString(str, GetType(operand));
  1765. str += " ";
  1766. if (operand.IsVRegAny())
  1767. {
  1768. auto vregInfo = GetVRegInfo(operand);
  1769. if (operand.mKind == BeMCOperandKind_VRegAddr)
  1770. str += "&";
  1771. if (operand.mKind == BeMCOperandKind_VRegLoad)
  1772. str += "*";
  1773. if (vregInfo->mDbgVariable != NULL)
  1774. str += "#" + vregInfo->mDbgVariable->mName + StrFormat("/%d", operand.mVRegIdx);
  1775. else
  1776. str += StrFormat("%%vreg%d", operand.mVRegIdx);
  1777. }
  1778. if (vregInfo->mReg != X64Reg_None)
  1779. {
  1780. str += "<";
  1781. str += X64CPURegisters::GetRegisterName((int)vregInfo->mReg);
  1782. str += ">";
  1783. }
  1784. else if (vregInfo->mForceReg)
  1785. {
  1786. str += "<reg>";
  1787. }
  1788. if (vregInfo->mDisableR11)
  1789. {
  1790. str += "<NoR11>";
  1791. }
  1792. if (vregInfo->mDisableR12)
  1793. {
  1794. str += "<NoR12>";
  1795. }
  1796. if (vregInfo->mDisableR13)
  1797. {
  1798. str += "<NoR13>";
  1799. }
  1800. if (vregInfo->mDisableRAX)
  1801. {
  1802. str += "<NoRAX>";
  1803. }
  1804. if (vregInfo->mDisableRDX)
  1805. {
  1806. str += "<NoRDX>";
  1807. }
  1808. if (vregInfo->mDisableEx)
  1809. {
  1810. str += "<NoEx>";
  1811. }
  1812. if (vregInfo->mForceMem)
  1813. {
  1814. str += "<mem>";
  1815. }
  1816. if (vregInfo->mIsRetVal)
  1817. {
  1818. str += "<retval>";
  1819. }
  1820. if (vregInfo->mForceMerge)
  1821. {
  1822. str += "<canMerge>";
  1823. }
  1824. if (vregInfo->mRelTo)
  1825. {
  1826. str += "(";
  1827. str += ToString(vregInfo->mRelTo);
  1828. if (vregInfo->mRelOffset)
  1829. {
  1830. str += "+";
  1831. str += ToString(vregInfo->mRelOffset);
  1832. }
  1833. if (vregInfo->mRelOffsetScale != 1)
  1834. str += StrFormat("*%d", vregInfo->mRelOffsetScale);
  1835. str += ")";
  1836. }
  1837. return str;
  1838. }
  1839. if (operand.IsImmediate())
  1840. {
  1841. String str;
  1842. switch (operand.mKind)
  1843. {
  1844. case BeMCOperandKind_Immediate_i8: str += "i8 "; break;
  1845. case BeMCOperandKind_Immediate_i16: str += "i16 "; break;
  1846. case BeMCOperandKind_Immediate_i32: str += "i32 "; break;
  1847. case BeMCOperandKind_Immediate_i64: str += "i64 "; break;
  1848. case BeMCOperandKind_Immediate_Null:
  1849. if (operand.mType != NULL)
  1850. {
  1851. mModule->ToString(str, operand.mType);
  1852. str += " null";
  1853. }
  1854. else
  1855. str += "null";
  1856. return str;
  1857. case BeMCOperandKind_Immediate_f32: return StrFormat("f32 %f", operand.mImmFloat);
  1858. case BeMCOperandKind_Immediate_f32_Packed128: return StrFormat("f32_packed %f", operand.mImmFloat);
  1859. case BeMCOperandKind_Immediate_f64: return StrFormat("f64 %f", operand.mImmFloat);
  1860. case BeMCOperandKind_Immediate_f64_Packed128: return StrFormat("f64_packed %f", operand.mImmFloat);
  1861. }
  1862. //if (operand.mImmediate < 10)
  1863. str += StrFormat("%lld", operand.mImmediate);
  1864. /*else
  1865. str += StrFormat("0x%llX", operand.mImmediate);*/
  1866. return str;
  1867. }
  1868. if (operand.mKind == BeMCOperandKind_Block)
  1869. return "%" + operand.mBlock->mName;
  1870. if (operand.mKind == BeMCOperandKind_Label)
  1871. return StrFormat("%%label%d", operand.mLabelIdx);
  1872. if (operand.mKind == BeMCOperandKind_CmpKind)
  1873. return BeDumpContext::ToString(operand.mCmpKind);
  1874. if (operand.mKind == BeMCOperandKind_CmpResult)
  1875. {
  1876. String result = StrFormat("%%CmpResult%d", operand.mCmpResultIdx);
  1877. auto& cmpResult = mCmpResults[operand.mCmpResultIdx];
  1878. if (cmpResult.mResultVRegIdx != -1)
  1879. result += StrFormat("<vreg%d>", cmpResult.mResultVRegIdx);
  1880. result += " ";
  1881. result += BeDumpContext::ToString(cmpResult.mCmpKind);
  1882. return result;
  1883. }
  1884. if (operand.mKind == BeMCOperandKind_NotResult)
  1885. {
  1886. auto mcResult = GetOperand(operand.mNotResult->mValue, true, true);
  1887. String result = "NOT ";
  1888. result += ToString(mcResult);
  1889. return result;
  1890. }
  1891. if (operand.mKind == BeMCOperandKind_Symbol)
  1892. return mCOFFObject->mSymbols[operand.mSymbolIdx]->mName;
  1893. if (operand.mKind == BeMCOperandKind_SymbolAddr)
  1894. return "&" + mCOFFObject->mSymbols[operand.mSymbolIdx]->mName;
  1895. if (operand.mKind == BeMCOperandKind_MemSetInfo)
  1896. return StrFormat("size=%d val=%d align=%d", operand.mMemSetInfo.mSize, operand.mMemSetInfo.mValue, operand.mMemSetInfo.mAlign);
  1897. if (operand.mKind == BeMCOperandKind_MemCpyInfo)
  1898. return StrFormat("size=%d align=%d", operand.mMemCpyInfo.mSize, operand.mMemCpyInfo.mAlign);
  1899. if (operand.mKind == BeMCOperandKind_VRegPair)
  1900. {
  1901. String str = "(";
  1902. str += ToString(BeMCOperand::FromEncoded(operand.mVRegPair.mVRegIdx0));
  1903. str += ", ";
  1904. str += ToString(BeMCOperand::FromEncoded(operand.mVRegPair.mVRegIdx1));
  1905. str += ")";
  1906. return str;
  1907. }
  1908. if (operand.mKind == BeMCOperandKind_Phi)
  1909. return StrFormat("%%PHI%d", operand.mPhi->mIdx);
  1910. if (operand.mKind == BeMCOperandKind_PreserveFlag)
  1911. {
  1912. if (operand.mPreserveFlag == BeMCPreserveFlag_NoRestore)
  1913. return "PreserveFlag:NoReturn";
  1914. }
  1915. if (operand.mKind == BeMCOperandKind_ConstAgg)
  1916. {
  1917. BeDumpContext dumpContext;
  1918. dumpContext.mModule = mBeFunction->mModule;
  1919. String str = "const ";
  1920. str += dumpContext.ToString(operand.mConstant);
  1921. return str;
  1922. }
  1923. return "???";
  1924. }
  1925. BeMCOperand BeMCContext::GetOperand(BeValue* value, bool allowMetaResult, bool allowFail)
  1926. {
  1927. if (value == NULL)
  1928. return BeMCOperand();
  1929. switch (value->GetTypeId())
  1930. {
  1931. case BeGlobalVariable::TypeId:
  1932. {
  1933. auto globalVar = (BeGlobalVariable*)value;
  1934. if ((globalVar->mIsTLS) && (mTLSVRegIdx == -1))
  1935. {
  1936. auto tlsVReg = AllocVirtualReg(mNativeIntType);
  1937. auto vregInfo = GetVRegInfo(tlsVReg);
  1938. vregInfo->mMustExist = true;
  1939. vregInfo->mForceReg = true;
  1940. mTLSVRegIdx = tlsVReg.mVRegIdx;
  1941. }
  1942. auto sym = mCOFFObject->GetSymbol(globalVar);
  1943. if (sym != NULL)
  1944. {
  1945. BeMCOperand mcOperand;
  1946. mcOperand.mKind = BeMCOperandKind_SymbolAddr;
  1947. mcOperand.mSymbolIdx = sym->mIdx;
  1948. return mcOperand;
  1949. }
  1950. }
  1951. break;
  1952. case BeCastConstant::TypeId:
  1953. {
  1954. auto constant = (BeCastConstant*)value;
  1955. BeMCOperand mcOperand;
  1956. auto relTo = GetOperand(constant->mTarget);
  1957. if (relTo.mKind == BeMCOperandKind_Immediate_Null)
  1958. {
  1959. mcOperand.mKind = BeMCOperandKind_Immediate_Null;
  1960. mcOperand.mType = constant->mType;
  1961. return mcOperand;
  1962. }
  1963. mcOperand = AllocVirtualReg(constant->mType);
  1964. auto vregInfo = GetVRegInfo(mcOperand);
  1965. vregInfo->mDefOnFirstUse = true;
  1966. vregInfo->mRelTo = relTo;
  1967. vregInfo->mIsExpr = true;
  1968. return mcOperand;
  1969. }
  1970. break;
  1971. case BeConstant::TypeId:
  1972. {
  1973. auto constant = (BeConstant*)value;
  1974. BeMCOperand mcOperand;
  1975. switch (constant->mType->mTypeCode)
  1976. {
  1977. case BeTypeCode_Boolean:
  1978. case BeTypeCode_Int8: mcOperand.mKind = BeMCOperandKind_Immediate_i8; break;
  1979. case BeTypeCode_Int16: mcOperand.mKind = BeMCOperandKind_Immediate_i16; break;
  1980. case BeTypeCode_Int32: mcOperand.mKind = BeMCOperandKind_Immediate_i32; break;
  1981. case BeTypeCode_Int64: mcOperand.mKind = BeMCOperandKind_Immediate_i64; break;
  1982. case BeTypeCode_Float:
  1983. mcOperand.mImmFloat = constant->mDouble;
  1984. mcOperand.mKind = BeMCOperandKind_Immediate_f32;
  1985. return mcOperand;
  1986. case BeTypeCode_Double:
  1987. mcOperand.mImmFloat = constant->mDouble;
  1988. mcOperand.mKind = BeMCOperandKind_Immediate_f64;
  1989. return mcOperand;
  1990. case BeTypeCode_Pointer:
  1991. {
  1992. if (constant->mTarget == NULL)
  1993. {
  1994. mcOperand.mKind = BeMCOperandKind_Immediate_Null;
  1995. mcOperand.mType = constant->mType;
  1996. return mcOperand;
  1997. }
  1998. else
  1999. {
  2000. auto relTo = GetOperand(constant->mTarget);
  2001. if (relTo.mKind == BeMCOperandKind_Immediate_Null)
  2002. {
  2003. mcOperand.mKind = BeMCOperandKind_Immediate_Null;
  2004. mcOperand.mType = constant->mType;
  2005. return mcOperand;
  2006. }
  2007. mcOperand = AllocVirtualReg(constant->mType);
  2008. auto vregInfo = GetVRegInfo(mcOperand);
  2009. vregInfo->mDefOnFirstUse = true;
  2010. vregInfo->mRelTo = relTo;
  2011. vregInfo->mIsExpr = true;
  2012. return mcOperand;
  2013. }
  2014. }
  2015. break;
  2016. case BeTypeCode_Struct:
  2017. case BeTypeCode_SizedArray:
  2018. mcOperand.mImmediate = constant->mInt64;
  2019. mcOperand.mKind = BeMCOperandKind_Immediate_i64;
  2020. break;
  2021. default:
  2022. NotImpl();
  2023. }
  2024. mcOperand.mImmediate = constant->mInt64;
  2025. return mcOperand;
  2026. }
  2027. break;
  2028. case BeStructConstant::TypeId:
  2029. {
  2030. auto structConstant = (BeStructConstant*)value;
  2031. BeMCOperand mcOperand;
  2032. mcOperand.mKind = BeMCOperandKind_ConstAgg;
  2033. mcOperand.mConstant = structConstant;
  2034. return mcOperand;
  2035. }
  2036. case BeGEPConstant::TypeId:
  2037. {
  2038. auto gepConstant = (BeGEPConstant*)value;
  2039. auto mcVal = GetOperand(gepConstant->mTarget);
  2040. BePointerType* ptrType = (BePointerType*)GetType(mcVal);
  2041. BF_ASSERT(ptrType->mTypeCode == BeTypeCode_Pointer);
  2042. auto result = mcVal;
  2043. // We assume we never do both an idx0 and idx1 at once. Fix if we change that.
  2044. int byteOffset = 0;
  2045. BeType* elementType = NULL;
  2046. byteOffset += gepConstant->mIdx0 * ptrType->mElementType->mSize;
  2047. if (ptrType->mElementType->mTypeCode == BeTypeCode_Struct)
  2048. {
  2049. BeStructType* structType = (BeStructType*)ptrType->mElementType;
  2050. auto& structMember = structType->mMembers[gepConstant->mIdx1];
  2051. elementType = structMember.mType;
  2052. byteOffset = structMember.mByteOffset;
  2053. }
  2054. else
  2055. {
  2056. BF_ASSERT(ptrType->mElementType->mTypeCode == BeTypeCode_SizedArray);
  2057. auto arrayType = (BeSizedArrayType*)ptrType->mElementType;
  2058. elementType = arrayType->mElementType;
  2059. byteOffset = gepConstant->mIdx1 * elementType->mSize;
  2060. }
  2061. auto elementPtrType = mModule->mContext->GetPointerTo(elementType);
  2062. result = AllocRelativeVirtualReg(elementPtrType, result, GetImmediate(byteOffset), 1);
  2063. // The def is primary to create a single 'master location' for the GEP vreg to become legalized before use
  2064. auto vregInfo = GetVRegInfo(result);
  2065. vregInfo->mDefOnFirstUse = true;
  2066. result.mKind = BeMCOperandKind_VReg;
  2067. return result;
  2068. }
  2069. break;
  2070. case BeFunction::TypeId:
  2071. {
  2072. auto sym = mCOFFObject->GetSymbol(value);
  2073. BF_ASSERT(sym != NULL);
  2074. if (sym != NULL)
  2075. {
  2076. BeMCOperand mcOperand;
  2077. mcOperand.mKind = BeMCOperandKind_SymbolAddr;
  2078. mcOperand.mSymbolIdx = sym->mIdx;
  2079. return mcOperand;
  2080. }
  2081. }
  2082. break;
  2083. case BeCallInst::TypeId:
  2084. {
  2085. auto callInst = (BeCallInst*)value;
  2086. if (callInst->mInlineResult != NULL)
  2087. return GetOperand(callInst->mInlineResult);
  2088. }
  2089. break;
  2090. case BeDbgVariable::TypeId:
  2091. {
  2092. }
  2093. }
  2094. BeMCOperand* operandPtr = NULL;
  2095. mValueToOperand.TryGetValue(value, &operandPtr);
  2096. //auto itr = mValueToOperand.find(value);
  2097. if (!allowFail)
  2098. {
  2099. BF_ASSERT(operandPtr != NULL);
  2100. }
  2101. if (operandPtr == NULL)
  2102. {
  2103. if (allowFail)
  2104. return BeMCOperand();
  2105. BeMCOperand mcOperand;
  2106. mcOperand.mKind = BeMCOperandKind_Immediate_i64;
  2107. mcOperand.mImmediate = 0;
  2108. return mcOperand;
  2109. }
  2110. auto operand = *operandPtr;
  2111. if ((operand.mKind == BeMCOperandKind_Phi) && (!allowMetaResult))
  2112. {
  2113. auto phi = operand.mPhi;
  2114. int phiInstIdx = 0;
  2115. auto mcBlock = phi->mBlock;
  2116. for (auto instIdx = 0; instIdx < mcBlock->mInstructions.size(); instIdx++)
  2117. {
  2118. auto inst = mcBlock->mInstructions[instIdx];
  2119. if (inst->mKind == BeMCInstKind_DefPhi)
  2120. {
  2121. BF_ASSERT(inst->mArg0.mPhi == phi);
  2122. phiInstIdx = instIdx;
  2123. RemoveInst(mcBlock, phiInstIdx);
  2124. break;
  2125. }
  2126. }
  2127. SetAndRestoreValue<BeMCBlock*> prevBlock(mActiveBlock, mcBlock);
  2128. SetAndRestoreValue<int*> prevInstIdxRef(mInsertInstIdxRef, &phiInstIdx);
  2129. auto resultType = value->GetType();
  2130. auto result = AllocVirtualReg(resultType);
  2131. auto vregInfo = GetVRegInfo(result);
  2132. vregInfo->mHasDynLife = true; // No specific 'def' location
  2133. mValueToOperand[value] = result;
  2134. if (resultType->mTypeCode == BeTypeCode_Boolean)
  2135. {
  2136. CreateDefineVReg(result);
  2137. BeMCOperand falseLabel = BeMCOperand::FromLabel(mCurLabelIdx++);
  2138. BeMCOperand trueLabel = BeMCOperand::FromLabel(mCurLabelIdx++);
  2139. BeMCOperand endLabel = BeMCOperand::FromLabel(mCurLabelIdx++);
  2140. CreateCondBr(mActiveBlock, operand, trueLabel, falseLabel);
  2141. AllocInst(BeMCInstKind_Label, falseLabel);
  2142. AllocInst(BeMCInstKind_Mov, result, BeMCOperand::FromImmediate(0));
  2143. AllocInst(BeMCInstKind_Br, endLabel);
  2144. AllocInst(BeMCInstKind_Label, trueLabel);
  2145. AllocInst(BeMCInstKind_Mov, result, BeMCOperand::FromImmediate(1));
  2146. AllocInst(BeMCInstKind_Label, endLabel);
  2147. }
  2148. else
  2149. {
  2150. // Attempt to find common ancestor to insert a 'def' at
  2151. SizedArray<BeMCBlock*, 16> blockSearch;
  2152. blockSearch.reserve(phi->mValues.size());
  2153. BeMCBlock* lowestBlock = NULL;
  2154. for (auto& phiValue : phi->mValues)
  2155. {
  2156. if ((lowestBlock == NULL) || (phiValue.mBlockFrom->mBlockIdx < lowestBlock->mBlockIdx))
  2157. lowestBlock = phiValue.mBlockFrom;
  2158. blockSearch.push_back(phiValue.mBlockFrom);
  2159. }
  2160. while (true)
  2161. {
  2162. bool allMatched = true;
  2163. bool didWork = false;
  2164. for (int searchIdx = 0; searchIdx < (int)blockSearch.size(); searchIdx++)
  2165. {
  2166. auto& blockRef = blockSearch[searchIdx];
  2167. if (blockRef != lowestBlock)
  2168. {
  2169. allMatched = false;
  2170. for (auto& pred : blockRef->mPreds)
  2171. {
  2172. // Try find a block closer to start, but not below the current lowestBlock
  2173. if ((pred->mBlockIdx >= lowestBlock->mBlockIdx) && (pred->mBlockIdx < blockRef->mBlockIdx))
  2174. {
  2175. blockRef = pred;
  2176. didWork = true;
  2177. }
  2178. }
  2179. }
  2180. }
  2181. if (allMatched)
  2182. {
  2183. SetAndRestoreValue<BeMCBlock*> prevActiveBlock(mActiveBlock, lowestBlock);
  2184. SetAndRestoreValue<int*> prevInstIdxRef(mInsertInstIdxRef, NULL);
  2185. auto inst = CreateDefineVReg(result);
  2186. inst->mVRegsInitialized = NULL;
  2187. inst->mDbgLoc = NULL;
  2188. break;
  2189. }
  2190. if (!didWork)
  2191. {
  2192. BeMCBlock* nextLowestBlock = NULL;
  2193. // Find the next candidate block
  2194. for (auto& blockRef : blockSearch)
  2195. {
  2196. for (auto& pred : blockRef->mPreds)
  2197. {
  2198. if (pred->mBlockIdx < lowestBlock->mBlockIdx)
  2199. {
  2200. if ((nextLowestBlock == NULL) || (pred->mBlockIdx > nextLowestBlock->mBlockIdx))
  2201. nextLowestBlock = pred;
  2202. }
  2203. }
  2204. }
  2205. if (nextLowestBlock == NULL)
  2206. break;
  2207. lowestBlock = nextLowestBlock;
  2208. }
  2209. }
  2210. BeMCOperand doneLabel = BeMCOperand::FromLabel(mCurLabelIdx++);
  2211. CreatePhiAssign(mActiveBlock, operand, result, doneLabel);
  2212. // Don't use an explicit dbgLoc
  2213. SetAndRestoreValue<BeDbgLoc*> prevDbgLoc(mCurDbgLoc, NULL);
  2214. AllocInst(BeMCInstKind_Label, doneLabel);
  2215. }
  2216. return result;
  2217. }
  2218. if ((operand.mKind == BeMCOperandKind_CmpResult) && (!allowMetaResult))
  2219. {
  2220. auto& cmpResult = mCmpResults[operand.mCmpResultIdx];
  2221. if (cmpResult.mResultVRegIdx == -1)
  2222. {
  2223. // Create the vreg now, and insert the CmpToBool during legalization
  2224. BeType* boolType = mModule->mContext->GetPrimitiveType(BeTypeCode_Boolean);
  2225. operand = AllocVirtualReg(boolType);
  2226. cmpResult.mResultVRegIdx = operand.mVRegIdx;
  2227. auto vregInfo = GetVRegInfo(operand);
  2228. vregInfo->mDefOnFirstUse = true;
  2229. }
  2230. operand = BeMCOperand::FromVReg(cmpResult.mResultVRegIdx);
  2231. }
  2232. if ((operand.mKind == BeMCOperandKind_NotResult) && (!allowMetaResult))
  2233. {
  2234. auto mcValue = GetOperand(operand.mNotResult->mValue, false, allowFail);
  2235. operand = AllocVirtualReg(GetType(mcValue));
  2236. CreateDefineVReg(operand);
  2237. AllocInst(BeMCInstKind_Mov, operand, mcValue);
  2238. BeMCOperand xorVal;
  2239. xorVal.mKind = BeMCOperandKind_Immediate_i8;
  2240. xorVal.mImmediate = 0x1;
  2241. AllocInst(BeMCInstKind_Xor, operand, xorVal);
  2242. }
  2243. return operand;
  2244. }
  2245. BeType* BeMCContext::GetType(const BeMCOperand& operand)
  2246. {
  2247. if (operand.mKind == BeMCOperandKind_NativeReg)
  2248. {
  2249. if ((operand.mReg >= X64Reg_RAX) && (operand.mReg <= X64Reg_EFL))
  2250. return mModule->mContext->GetPrimitiveType(BeTypeCode_Int64);
  2251. if ((operand.mReg >= X64Reg_EAX) && (operand.mReg <= X64Reg_R15D))
  2252. return mModule->mContext->GetPrimitiveType(BeTypeCode_Int32);
  2253. if ((operand.mReg >= X64Reg_AX) && (operand.mReg <= X64Reg_R15W))
  2254. return mModule->mContext->GetPrimitiveType(BeTypeCode_Int16);
  2255. if ((operand.mReg >= X64Reg_AL) && (operand.mReg <= X64Reg_R15B))
  2256. return mModule->mContext->GetPrimitiveType(BeTypeCode_Int8);
  2257. if ((operand.mReg >= X64Reg_XMM0_f64) && (operand.mReg <= X64Reg_XMM15_f64))
  2258. return mModule->mContext->GetPrimitiveType(BeTypeCode_Double);
  2259. if ((operand.mReg >= X64Reg_XMM0_f32) && (operand.mReg <= X64Reg_XMM15_f32))
  2260. return mModule->mContext->GetPrimitiveType(BeTypeCode_Float);
  2261. }
  2262. if (operand.mKind == BeMCOperandKind_VReg)
  2263. return mVRegInfo[operand.mVRegIdx]->mType;
  2264. if (operand.mKind == BeMCOperandKind_VRegAddr)
  2265. return mModule->mContext->GetPointerTo(mVRegInfo[operand.mVRegIdx]->mType);
  2266. if (operand.mKind == BeMCOperandKind_VRegLoad)
  2267. {
  2268. auto type = mVRegInfo[operand.mVRegIdx]->mType;
  2269. BF_ASSERT(type->IsPointer());
  2270. return ((BePointerType*)type)->mElementType;
  2271. }
  2272. switch (operand.mKind)
  2273. {
  2274. case BeMCOperandKind_Immediate_i8: return mModule->mContext->GetPrimitiveType(BeTypeCode_Int8); break;
  2275. case BeMCOperandKind_Immediate_i16: return mModule->mContext->GetPrimitiveType(BeTypeCode_Int16); break;
  2276. case BeMCOperandKind_Immediate_i32: return mModule->mContext->GetPrimitiveType(BeTypeCode_Int32); break;
  2277. case BeMCOperandKind_Immediate_i64: return mModule->mContext->GetPrimitiveType(BeTypeCode_Int64); break;
  2278. case BeMCOperandKind_Immediate_Null: return operand.mType; break;
  2279. case BeMCOperandKind_Immediate_f32:
  2280. case BeMCOperandKind_Immediate_f32_Packed128: return mModule->mContext->GetPrimitiveType(BeTypeCode_Float); break;
  2281. case BeMCOperandKind_Immediate_f64:
  2282. case BeMCOperandKind_Immediate_f64_Packed128: return mModule->mContext->GetPrimitiveType(BeTypeCode_Double); break;
  2283. }
  2284. if (operand.mKind == BeMCOperandKind_SymbolAddr)
  2285. {
  2286. auto symbol = mCOFFObject->mSymbols[operand.mSymbolIdx];
  2287. if (symbol->mType == NULL)
  2288. return NULL;
  2289. return mModule->mContext->GetPointerTo(symbol->mType);
  2290. }
  2291. if (operand.mKind == BeMCOperandKind_Symbol)
  2292. {
  2293. auto symbol = mCOFFObject->mSymbols[operand.mSymbolIdx];
  2294. return symbol->mType;
  2295. }
  2296. if (operand.mKind == BeMCOperandKind_CmpResult)
  2297. {
  2298. return mModule->mContext->GetPrimitiveType(BeTypeCode_Boolean);
  2299. }
  2300. if (operand.mKind == BeMCOperandKind_ConstAgg)
  2301. {
  2302. return operand.mConstant->mType;
  2303. }
  2304. return NULL;
  2305. }
  2306. bool BeMCContext::AreTypesEquivalent(BeType* type0, BeType* type1)
  2307. {
  2308. if ((type0->IsFloat()) != (type1->IsFloat()))
  2309. return false;
  2310. return type0->mSize == type1->mSize;
  2311. }
  2312. void BeMCContext::AddRelRefs(BeMCOperand& operand, int refCount)
  2313. {
  2314. if (!operand.IsVRegAny())
  2315. return;
  2316. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  2317. vregInfo->mRefCount += refCount;
  2318. if (vregInfo->mRelTo)
  2319. AddRelRefs(vregInfo->mRelTo, vregInfo->mRefCount + refCount);
  2320. if (vregInfo->mRelOffset)
  2321. AddRelRefs(vregInfo->mRelOffset, vregInfo->mRefCount + refCount);
  2322. }
  2323. int BeMCContext::FindSafeInstInsertPos(int instIdx, bool forceSafeCheck)
  2324. {
  2325. auto inst = mActiveBlock->mInstructions[instIdx];
  2326. bool doSafeCheck = false;
  2327. if (forceSafeCheck)
  2328. doSafeCheck = true;
  2329. if ((inst->mKind == BeMCInstKind_Call) ||
  2330. (inst->mKind == BeMCInstKind_MemSet) ||
  2331. (inst->mKind == BeMCInstKind_MemCpy))
  2332. doSafeCheck = true;
  2333. if ((inst->IsMov()) && (inst->mArg0.IsNativeReg()))
  2334. doSafeCheck = true;
  2335. if (!doSafeCheck)
  2336. return instIdx;
  2337. // If we're in a CALL then move this Def before the param loads
  2338. int bestIdx = instIdx;
  2339. while (bestIdx > 0)
  2340. {
  2341. inst = mActiveBlock->mInstructions[bestIdx - 1];
  2342. bestIdx--;
  2343. if (inst->mKind == BeMCInstKind_PreserveVolatiles)
  2344. return bestIdx;
  2345. }
  2346. return bestIdx;
  2347. }
  2348. BeMCInst* BeMCContext::AllocInst(int insertIdx)
  2349. {
  2350. auto mcInst = mAlloc.Alloc<BeMCInst>();
  2351. mcInst->mKind = BeMCInstKind_None;
  2352. mcInst->mDbgLoc = mCurDbgLoc;
  2353. mcInst->mVRegsInitialized = mCurVRegsInit;
  2354. mcInst->mLiveness = mCurVRegsLive;
  2355. if ((insertIdx == -1) && (mInsertInstIdxRef != NULL))
  2356. insertIdx = (*mInsertInstIdxRef)++;
  2357. if (insertIdx == -1)
  2358. mActiveBlock->mInstructions.push_back(mcInst);
  2359. else
  2360. mActiveBlock->mInstructions.Insert(insertIdx, mcInst);
  2361. return mcInst;
  2362. }
  2363. BeMCInst* BeMCContext::AllocInst(BeMCInstKind instKind, int insertIdx)
  2364. {
  2365. auto mcInst = AllocInst(insertIdx);
  2366. mcInst->mKind = instKind;
  2367. return mcInst;
  2368. }
  2369. BeMCInst* BeMCContext::AllocInst(BeMCInstKind instKind, const BeMCOperand& arg0, int insertIdx)
  2370. {
  2371. auto mcInst = AllocInst(insertIdx);
  2372. mcInst->mKind = instKind;
  2373. mcInst->mArg0 = arg0;
  2374. return mcInst;
  2375. }
  2376. BeMCInst* BeMCContext::AllocInst(BeMCInstKind instKind, const BeMCOperand& arg0, const BeMCOperand& arg1, int insertIdx)
  2377. {
  2378. auto mcInst = AllocInst(insertIdx);
  2379. mcInst->mKind = instKind;
  2380. mcInst->mArg0 = arg0;
  2381. mcInst->mArg1 = arg1;
  2382. return mcInst;
  2383. }
  2384. void BeMCContext::RemoveInst(BeMCBlock* block, int instIdx, bool needChangesMerged)
  2385. {
  2386. // If neither the instruction before or after this one shares the vregsInitialized flags, then we need to
  2387. // merge down our Changes to the next instruction
  2388. auto inst = block->mInstructions[instIdx];
  2389. if (instIdx > 0)
  2390. {
  2391. auto prevInst = block->mInstructions[instIdx - 1];
  2392. if (prevInst->mVRegsInitialized == inst->mVRegsInitialized)
  2393. needChangesMerged = false;
  2394. }
  2395. if (needChangesMerged)
  2396. {
  2397. if (instIdx < (int)block->mInstructions.size() - 1)
  2398. {
  2399. auto nextInst = block->mInstructions[instIdx + 1];
  2400. if ((inst->mVRegsInitialized != NULL) && (nextInst->mVRegsInitialized != NULL))
  2401. {
  2402. nextInst->mVRegsInitialized = mVRegInitializedContext.MergeChanges(nextInst->mVRegsInitialized, inst->mVRegsInitialized);
  2403. }
  2404. }
  2405. }
  2406. block->mInstructions.RemoveAt(instIdx);
  2407. }
  2408. BeMCOperand BeMCContext::GetCallArgVReg(int argIdx, BeTypeCode typeCode)
  2409. {
  2410. int pIdx = argIdx;
  2411. BeMCNativeTypeCode vregType = BeMCNativeTypeCode_Int64;
  2412. switch (typeCode)
  2413. {
  2414. case BeTypeCode_Int8:
  2415. vregType = BeMCNativeTypeCode_Int8;
  2416. break;
  2417. case BeTypeCode_Int16:
  2418. vregType = BeMCNativeTypeCode_Int16;
  2419. break;
  2420. case BeTypeCode_Int32:
  2421. vregType = BeMCNativeTypeCode_Int32;
  2422. break;
  2423. case BeTypeCode_Int64:
  2424. vregType = BeMCNativeTypeCode_Int64;
  2425. break;
  2426. case BeTypeCode_Float:
  2427. vregType = BeMCNativeTypeCode_Float;
  2428. break;
  2429. case BeTypeCode_Double:
  2430. vregType = BeMCNativeTypeCode_Double;
  2431. break;
  2432. default:
  2433. typeCode = BeTypeCode_Int64;
  2434. vregType = BeMCNativeTypeCode_Int64;
  2435. break;
  2436. }
  2437. Array<int>& callArgVRegs = mCallArgVRegs[vregType];
  2438. while (pIdx >= (int)callArgVRegs.size())
  2439. callArgVRegs.push_back(-1);
  2440. if (callArgVRegs[pIdx] == -1)
  2441. {
  2442. auto nativeType = mModule->mContext->GetPrimitiveType(typeCode);
  2443. auto nativePtrType = mModule->mContext->GetPointerTo(nativeType);
  2444. auto mcArg = AllocVirtualReg(nativePtrType);
  2445. auto vregInfo = mVRegInfo[mcArg.mVRegIdx];
  2446. vregInfo->mMustExist = true;
  2447. vregInfo->mIsExpr = true;
  2448. vregInfo->mRelTo = BeMCOperand::FromReg(X64Reg_RSP);
  2449. vregInfo->mRelOffset = BeMCOperand::FromImmediate(argIdx * 8);
  2450. callArgVRegs[pIdx] = mcArg.mVRegIdx;
  2451. mcArg.mKind = BeMCOperandKind_VRegLoad;
  2452. return mcArg;
  2453. }
  2454. else
  2455. {
  2456. auto mcArg = BeMCOperand::FromVReg(callArgVRegs[pIdx]);
  2457. mcArg.mKind = BeMCOperandKind_VRegLoad;
  2458. return mcArg;
  2459. }
  2460. }
  2461. BeMCOperand BeMCContext::CreateCall(const BeMCOperand &func, const SizedArrayImpl<BeValue*>& args, BeType* retType, BfIRCallingConv callingConv, bool structRet, bool noReturn, bool isVarArg)
  2462. {
  2463. SizedArray<BeMCOperand, 4> opArgs;
  2464. for (auto itr = args.begin(); itr != args.end(); ++itr)
  2465. {
  2466. auto& arg = *itr;
  2467. opArgs.push_back(GetOperand(arg));
  2468. }
  2469. return CreateCall(func, opArgs, retType, callingConv, structRet, noReturn, isVarArg);
  2470. }
  2471. BeMCOperand BeMCContext::CreateLoad(const BeMCOperand& mcTarget)
  2472. {
  2473. BeMCOperand result;
  2474. auto loadedTarget = BeMCOperand::ToLoad(mcTarget);
  2475. auto targetType = GetType(loadedTarget);
  2476. result = AllocVirtualReg(targetType);
  2477. auto vregInfo = GetVRegInfo(result);
  2478. vregInfo->mIsExpr = true;
  2479. vregInfo->mRelTo = loadedTarget;
  2480. result.mKind = BeMCOperandKind_VReg;
  2481. AllocInst(BeMCInstKind_DefLoad, result);
  2482. return result;
  2483. }
  2484. void BeMCContext::CreateStore(BeMCInstKind instKind, const BeMCOperand& val, const BeMCOperand& ptr)
  2485. {
  2486. BeMCOperand mcVal = val;
  2487. BeMCOperand mcPtr = ptr;
  2488. if (mcVal.mKind == BeMCOperandKind_ConstAgg)
  2489. {
  2490. bool needsDecompose = false;
  2491. if (auto arrayConst = BeValueDynCast<BeStructConstant>(mcVal.mConstant))
  2492. {
  2493. for (auto& val : arrayConst->mMemberValues)
  2494. {
  2495. if (auto globalVar = BeValueDynCast<BeGlobalVariable>(val))
  2496. {
  2497. needsDecompose = true;
  2498. }
  2499. else if (auto castConst = BeValueDynCast<BeCastConstant>(val))
  2500. {
  2501. needsDecompose = true;
  2502. }
  2503. }
  2504. if (needsDecompose)
  2505. {
  2506. int offset = 0;
  2507. auto arrayType = arrayConst->GetType();
  2508. BF_ASSERT(arrayType->IsSizedArray());
  2509. auto sizedArrayType = (BeSizedArrayType*)arrayType;
  2510. for (auto& val : arrayConst->mMemberValues)
  2511. {
  2512. auto destOperand = AllocVirtualReg(mModule->mContext->GetPointerTo(sizedArrayType->mElementType));
  2513. auto vregInfo = GetVRegInfo(destOperand);
  2514. vregInfo->mDefOnFirstUse = true;
  2515. vregInfo->mRelTo = mcPtr;
  2516. vregInfo->mIsExpr = true;
  2517. vregInfo->mRelOffset = BeMCOperand::FromImmediate(offset);
  2518. destOperand.mKind = BeMCOperandKind_VRegLoad;
  2519. auto elementVal = GetOperand(val);
  2520. AllocInst(instKind, destOperand, elementVal);
  2521. offset += sizedArrayType->mElementType->mSize;
  2522. }
  2523. return;
  2524. }
  2525. }
  2526. }
  2527. // Addr mov infers something like a "int* intPtr = &intVal"
  2528. if (mcVal.mKind == BeMCOperandKind_VRegAddr)
  2529. {
  2530. auto vregInfo = GetVRegInfo(mcVal);
  2531. vregInfo->mForceMem = true;
  2532. CheckForce(vregInfo);
  2533. }
  2534. if (mcPtr.mKind == BeMCOperandKind_VRegAddr)
  2535. {
  2536. mcPtr.mKind = BeMCOperandKind_VReg;
  2537. AllocInst(instKind, mcPtr, mcVal);
  2538. }
  2539. else if (mcPtr.mKind == BeMCOperandKind_VReg)
  2540. {
  2541. mcPtr.mKind = BeMCOperandKind_VRegLoad;
  2542. AllocInst(instKind, mcPtr, mcVal);
  2543. }
  2544. else if (mcPtr.mKind == BeMCOperandKind_SymbolAddr)
  2545. {
  2546. mcPtr.mKind = BeMCOperandKind_Symbol;
  2547. AllocInst(instKind, mcPtr, mcVal);
  2548. }
  2549. else
  2550. {
  2551. mcPtr = CreateLoad(mcPtr);
  2552. AllocInst(instKind, mcPtr, mcVal);
  2553. }
  2554. }
  2555. BeMCOperand BeMCContext::CreateCall(const BeMCOperand& func, const SizedArrayImpl<BeMCOperand>& args, BeType* retType, BfIRCallingConv callingConv, bool structRet, bool noReturn, bool isVarArg)
  2556. {
  2557. BeMCOperand mcResult;
  2558. //TODO: Allow user to directly specify ret addr with "sret" attribute
  2559. int argOfs = 0;
  2560. X64CPURegister compositeRetReg = X64Reg_None;
  2561. bool flipFirstRegs = (structRet) && (callingConv == BfIRCallingConv_ThisCall);
  2562. if ((retType != NULL) && (retType->IsComposite()))
  2563. {
  2564. mcResult = AllocVirtualReg(retType);
  2565. auto vregInfo = GetVRegInfo(mcResult);
  2566. vregInfo->mMustExist = true;
  2567. CreateDefineVReg(mcResult);
  2568. // 'this' always goes in RCX, so push compositeRetReg out by one
  2569. compositeRetReg = (callingConv == BfIRCallingConv_ThisCall) ? X64Reg_RDX : X64Reg_RCX;
  2570. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(compositeRetReg), BeMCOperand::FromVRegAddr(mcResult.mVRegIdx));
  2571. argOfs = 1;
  2572. }
  2573. bool didPreserveRegs = false;
  2574. auto _AddPreserveRegs = [&] ()
  2575. {
  2576. if (noReturn)
  2577. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromPreserveFlag(BeMCPreserveFlag_NoRestore));
  2578. else
  2579. AllocInst(BeMCInstKind_PreserveVolatiles);
  2580. didPreserveRegs = true;
  2581. };
  2582. int argCount = (int)args.size() + argOfs;
  2583. int dynStackSize = 0;
  2584. // if (mUseBP)
  2585. // {
  2586. // dynStackSize = BF_MAX(4, argCount) * 8;
  2587. // dynStackSize = BF_ALIGN(dynStackSize, 16);
  2588. // }
  2589. if (dynStackSize > 0)
  2590. AllocInst(BeMCInstKind_Sub, BeMCOperand::FromReg(X64Reg_RSP), BeMCOperand::FromImmediate(dynStackSize));
  2591. struct _ShadowReg
  2592. {
  2593. X64CPURegister mFReg;
  2594. X64CPURegister mIReg;
  2595. };
  2596. SizedArray<_ShadowReg, 8> shadowRegs;
  2597. BF_ASSERT(mMaxCallParamCount >= argCount);
  2598. mMaxCallParamCount = BF_MAX(mMaxCallParamCount, argCount);
  2599. for (int argIdx = args.size() - 1; argIdx >= 0; argIdx--)
  2600. {
  2601. if ((argIdx == 0) && (compositeRetReg == X64Reg_RDX))
  2602. argOfs = 0;
  2603. auto mcValue = args[argIdx];
  2604. auto argType = GetType(mcValue);
  2605. X64CPURegister useReg = X64Reg_None;
  2606. int useArgIdx = argIdx + argOfs;
  2607. if (argType->IsFloat())
  2608. {
  2609. switch (useArgIdx)
  2610. {
  2611. case 0:
  2612. useReg = (argType->mTypeCode == BeTypeCode_Float) ? X64Reg_XMM0_f32 : X64Reg_XMM0_f64;
  2613. break;
  2614. case 1:
  2615. useReg = (argType->mTypeCode == BeTypeCode_Float) ? X64Reg_XMM1_f32 : X64Reg_XMM1_f64;
  2616. break;
  2617. case 2:
  2618. useReg = (argType->mTypeCode == BeTypeCode_Float) ? X64Reg_XMM2_f32 : X64Reg_XMM2_f64;
  2619. break;
  2620. case 3:
  2621. useReg = (argType->mTypeCode == BeTypeCode_Float) ? X64Reg_XMM3_f32 : X64Reg_XMM3_f64;
  2622. break;
  2623. }
  2624. if (isVarArg)
  2625. {
  2626. X64CPURegister shadowReg = X64Reg_None;
  2627. switch (useArgIdx)
  2628. {
  2629. case 0:
  2630. shadowReg = !flipFirstRegs ? X64Reg_RCX : X64Reg_RDX;
  2631. break;
  2632. case 1:
  2633. shadowReg = !flipFirstRegs ? X64Reg_RDX : X64Reg_RCX;
  2634. break;
  2635. case 2:
  2636. shadowReg = X64Reg_R8;
  2637. break;
  2638. case 3:
  2639. shadowReg = X64Reg_R9;
  2640. break;
  2641. }
  2642. if ((shadowReg != X64Reg_None) && (useReg != X64Reg_None))
  2643. {
  2644. shadowRegs.push_back(_ShadowReg { useReg, shadowReg} );
  2645. }
  2646. }
  2647. }
  2648. else
  2649. {
  2650. switch (useArgIdx)
  2651. {
  2652. case 0:
  2653. useReg = !flipFirstRegs ? X64Reg_RCX : X64Reg_RDX;
  2654. break;
  2655. case 1:
  2656. useReg = !flipFirstRegs ? X64Reg_RDX : X64Reg_RCX;
  2657. break;
  2658. case 2:
  2659. useReg = X64Reg_R8;
  2660. break;
  2661. case 3:
  2662. useReg = X64Reg_R9;
  2663. break;
  2664. }
  2665. }
  2666. if ((!argType->IsComposite()) && (!isVarArg)) // VarArg uses full 64 bits
  2667. useReg = ResizeRegister(useReg, argType->mSize);
  2668. if (mcValue.mKind == BeMCOperandKind_VRegAddr)
  2669. {
  2670. auto vregInfo = GetVRegInfo(mcValue);
  2671. vregInfo->mForceMem = true;
  2672. CheckForce(vregInfo);
  2673. }
  2674. if (useReg != X64Reg_None)
  2675. {
  2676. // We want to do the non-register params before the PreserveRegs call,
  2677. // because those may be a memory-to-memory mov, which will result in
  2678. // a temporary variable which will allocate a register which may
  2679. // conflict with our param regs
  2680. if (!didPreserveRegs)
  2681. _AddPreserveRegs();
  2682. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(useReg), mcValue);
  2683. }
  2684. else
  2685. {
  2686. auto useTypeCode = argType->mTypeCode;
  2687. if (isVarArg)
  2688. {
  2689. if (argType->IsFloat())
  2690. useTypeCode = BeTypeCode_Double;
  2691. else
  2692. useTypeCode = BeTypeCode_Int64;
  2693. }
  2694. auto callArgVReg = GetCallArgVReg(useArgIdx, useTypeCode);
  2695. // Do a 'def' for every usage, to clear out the 'init' at all paths
  2696. CreateDefineVReg(BeMCOperand::FromVReg(callArgVReg.mVRegIdx));
  2697. if (argType->IsComposite())
  2698. {
  2699. BF_ASSERT(mcValue.mKind == BeMCOperandKind_VReg);
  2700. AllocInst(BeMCInstKind_Mov, callArgVReg, BeMCOperand::FromVRegAddr(mcValue.mVRegIdx));
  2701. }
  2702. else
  2703. AllocInst(BeMCInstKind_Mov, callArgVReg, mcValue);
  2704. }
  2705. }
  2706. if (!didPreserveRegs)
  2707. _AddPreserveRegs();
  2708. auto mcFunc = func;
  2709. for (auto& shadowReg : shadowRegs ) // Do float shadowing
  2710. {
  2711. AllocInst(BeMCInstKind_MovRaw, BeMCOperand::FromReg(shadowReg.mIReg), BeMCOperand::FromReg(shadowReg.mFReg));
  2712. }
  2713. AllocInst(BeMCInstKind_Call, mcFunc);
  2714. if (dynStackSize > 0)
  2715. AllocInst(BeMCInstKind_Add, BeMCOperand::FromReg(X64Reg_RSP), BeMCOperand::FromImmediate(dynStackSize));
  2716. if ((!mcResult) && (retType != NULL) && (retType->mTypeCode != BeTypeCode_None))
  2717. {
  2718. mcResult = AllocVirtualReg(retType);
  2719. CreateDefineVReg(mcResult);
  2720. X64CPURegister resultReg;
  2721. if (retType->IsFloat())
  2722. {
  2723. resultReg = ResizeRegister(X64Reg_XMM0_f64, retType->mSize);
  2724. }
  2725. else
  2726. {
  2727. BF_ASSERT(retType->IsIntable());
  2728. resultReg = ResizeRegister(X64Reg_RAX, retType->mSize);
  2729. }
  2730. AllocInst(BeMCInstKind_Mov, mcResult, BeMCOperand::FromReg(resultReg));
  2731. }
  2732. if (noReturn)
  2733. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromPreserveFlag(BeMCPreserveFlag_NoRestore));
  2734. else
  2735. AllocInst(BeMCInstKind_RestoreVolatiles);
  2736. return mcResult;
  2737. }
  2738. void BeMCContext::CreateMemSet(const BeMCOperand& addr, uint8 val, int size, int align)
  2739. {
  2740. if ((size == 8) || (size == 4) || (size == 2) || (size == 1))
  2741. {
  2742. BeType* type = NULL;
  2743. BeMCOperand zeroVal;
  2744. zeroVal.mImmediate = 0;
  2745. switch (size)
  2746. {
  2747. case 8:
  2748. type = mModule->mContext->GetPrimitiveType(BeTypeCode_Int64);
  2749. zeroVal.mKind = BeMCOperandKind_Immediate_i64;
  2750. zeroVal.mImmediate = ((int64)val << 56) | ((int64)val << 48) | ((int64)val << 40) | ((int64)val << 32) |
  2751. (val << 24) | (val << 16) | (val << 8) | val;
  2752. break;
  2753. case 4:
  2754. type = mModule->mContext->GetPrimitiveType(BeTypeCode_Int32);
  2755. zeroVal.mKind = BeMCOperandKind_Immediate_i32;
  2756. zeroVal.mImmediate = (val << 24) | (val << 16) | (val << 8) | val;
  2757. break;
  2758. case 2:
  2759. type = mModule->mContext->GetPrimitiveType(BeTypeCode_Int16);
  2760. zeroVal.mKind = BeMCOperandKind_Immediate_i16;
  2761. zeroVal.mImmediate = (val << 8) | val;
  2762. break;
  2763. case 1:
  2764. type = mModule->mContext->GetPrimitiveType(BeTypeCode_Int8);
  2765. zeroVal.mKind = BeMCOperandKind_Immediate_i8;
  2766. zeroVal.mImmediate = val;
  2767. break;
  2768. }
  2769. auto ptrType = mModule->mContext->GetPointerTo(type);
  2770. auto result = AllocVirtualReg(ptrType);
  2771. CreateDefineVReg(result);
  2772. auto vregInfo = GetVRegInfo(result);
  2773. vregInfo->mRelTo = addr;
  2774. vregInfo->mIsExpr = true;
  2775. BeMCOperand dest;
  2776. dest.mKind = BeMCOperandKind_VRegLoad;
  2777. dest.mVRegIdx = result.mVRegIdx;
  2778. AllocInst(BeMCInstKind_Mov, dest, zeroVal);
  2779. return;
  2780. }
  2781. if (addr.IsVRegAny())
  2782. {
  2783. auto vregInfo = GetVRegInfo(addr);
  2784. if (!vregInfo->mIsRetVal)
  2785. vregInfo->mForceMem = true;
  2786. CheckForce(vregInfo);
  2787. }
  2788. if (size <= 256)
  2789. {
  2790. auto temp = addr;
  2791. BeMCOperand mcMemSetInfo;
  2792. mcMemSetInfo.mKind = BeMCOperandKind_MemSetInfo;
  2793. mcMemSetInfo.mMemSetInfo.mSize = size;
  2794. mcMemSetInfo.mMemSetInfo.mAlign = align;
  2795. mcMemSetInfo.mMemSetInfo.mValue = val;
  2796. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_R11));
  2797. AllocInst(BeMCInstKind_MemSet, mcMemSetInfo, temp);
  2798. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_R11));
  2799. return;
  2800. }
  2801. SizedArray<BeMCOperand, 3> args = { addr, BeMCOperand::FromImmediate(val), BeMCOperand::FromImmediate(size) };
  2802. auto mcFunc = BeMCOperand::FromSymbolAddr(mCOFFObject->GetSymbolRef("memset")->mIdx);
  2803. CreateCall(mcFunc, args);
  2804. }
  2805. void BeMCContext::CreateMemCpy(const BeMCOperand& dest, const BeMCOperand& src, int size, int align)
  2806. {
  2807. auto destVRegInfo = GetVRegInfo(dest);
  2808. auto srcVRegInfo = GetVRegInfo(src);
  2809. if ((destVRegInfo != NULL) && (srcVRegInfo != NULL) && (destVRegInfo->mIsRetVal) && (srcVRegInfo->mIsRetVal))
  2810. return;
  2811. if (size <= 256)
  2812. {
  2813. int destIdx = -1;
  2814. if (!GetEncodedOperand(dest, destIdx))
  2815. {
  2816. BeMCOperand tempDest = AllocVirtualReg(GetType(dest), 1);
  2817. CreateDefineVReg(tempDest);
  2818. AllocInst(BeMCInstKind_Mov, tempDest, dest);
  2819. auto vregInfo = mVRegInfo[tempDest.mVRegIdx];
  2820. vregInfo->mForceReg = true;
  2821. vregInfo->mDisableR11 = true;
  2822. destIdx = tempDest.mVRegIdx;
  2823. }
  2824. int srcIdx = -1;
  2825. if (!GetEncodedOperand(src, srcIdx))
  2826. {
  2827. BeMCOperand tempSrc = AllocVirtualReg(GetType(src), 1);
  2828. CreateDefineVReg(tempSrc);
  2829. AllocInst(BeMCInstKind_Mov, tempSrc, src);
  2830. auto vregInfo = mVRegInfo[tempSrc.mVRegIdx];
  2831. vregInfo->mForceReg = true;
  2832. vregInfo->mDisableR11 = true;
  2833. srcIdx = tempSrc.mVRegIdx;
  2834. }
  2835. BeMCOperand mcMemCpyInfo;
  2836. mcMemCpyInfo.mKind = BeMCOperandKind_MemCpyInfo;
  2837. mcMemCpyInfo.mMemCpyInfo.mSize = size;
  2838. mcMemCpyInfo.mMemCpyInfo.mAlign = align;
  2839. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_R11));
  2840. BeMCOperand mcVRegPair;
  2841. mcVRegPair.mKind = BeMCOperandKind_VRegPair;
  2842. mcVRegPair.mVRegPair.mVRegIdx0 = destIdx;
  2843. mcVRegPair.mVRegPair.mVRegIdx1 = srcIdx;
  2844. AllocInst(BeMCInstKind_MemCpy, mcMemCpyInfo, mcVRegPair);
  2845. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_R11));
  2846. return;
  2847. }
  2848. SizedArray<BeMCOperand, 3> args = { dest, src, BeMCOperand::FromImmediate(size) };
  2849. auto mcFunc = BeMCOperand::FromSymbolAddr(mCOFFObject->GetSymbolRef("memcpy")->mIdx);
  2850. CreateCall(mcFunc, args);
  2851. }
  2852. void BeMCContext::CreateTableSwitchSection(BeSwitchInst* switchInst, int startIdx, int endIdx)
  2853. {
  2854. auto& sect = mCOFFObject->mRDataSect;
  2855. auto defaultBlock = GetOperand(switchInst->mDefaultBlock);
  2856. auto int32Type = mModule->mContext->GetPrimitiveType(BeTypeCode_Int32);
  2857. auto int32PtrType = mModule->mContext->GetPointerTo(int32Type);
  2858. auto nativeType = mModule->mContext->GetPrimitiveType(BeTypeCode_Int64);
  2859. auto nativePtrType = mModule->mContext->GetPointerTo(nativeType);
  2860. int64 loVal = switchInst->mCases.front().mValue->mInt64;
  2861. int64 hiVal = switchInst->mCases.back().mValue->mInt64;
  2862. int numVals = switchInst->mCases.size();
  2863. BeMCSymbol* sym = mCOFFObject->mSymbols.Alloc();
  2864. sym->mType = int32Type;
  2865. sym->mName = StrFormat("@jumpTab%d", mCOFFObject->mCurJumpTableIdx++);
  2866. sym->mIsStatic = true;
  2867. sym->mSymKind = BeMCSymbolKind_External;
  2868. sym->mIdx = (int)mCOFFObject->mSymbols.size() - 1;
  2869. mCOFFObject->MarkSectionUsed(sect);
  2870. sym->mSectionNum = sect.mSectionIdx + 1;
  2871. sect.mData.Align(4);
  2872. sect.mAlign = BF_MAX(sect.mAlign, 4);
  2873. sym->mValue = sect.mData.GetSize();
  2874. auto mcValue = GetOperand(switchInst->mValue);
  2875. auto beType = GetType(mcValue);
  2876. auto mcOfsValue = AllocVirtualReg(nativeType);
  2877. CreateDefineVReg(mcOfsValue);
  2878. if (beType->mSize < 8)
  2879. AllocInst(BeMCInstKind_MovSX, mcOfsValue, mcValue);
  2880. else
  2881. AllocInst(BeMCInstKind_Mov, mcOfsValue, mcValue);
  2882. AllocInst(BeMCInstKind_Sub, mcOfsValue, BeMCOperand::FromImmediate(loVal));
  2883. AllocInst(BeMCInstKind_CondBr, defaultBlock, BeMCOperand::FromCmpKind(BeCmpKind_SLT));
  2884. AllocInst(BeMCInstKind_Cmp, mcOfsValue, BeMCOperand::FromImmediate(hiVal - loVal));
  2885. AllocInst(BeMCInstKind_CondBr, defaultBlock, BeMCOperand::FromCmpKind(BeCmpKind_SGT));
  2886. auto jumpVReg = AllocVirtualReg(nativeType);
  2887. CreateDefineVReg(jumpVReg);
  2888. AllocInst(BeMCInstKind_Mov, jumpVReg, BeMCOperand::FromSymbolAddr(sym->mIdx));
  2889. auto jumpRelVReg = AllocVirtualReg(int32PtrType);
  2890. CreateDefineVReg(jumpRelVReg);
  2891. auto vregInfo = mVRegInfo[jumpRelVReg.mVRegIdx];
  2892. vregInfo->mIsExpr = true;
  2893. vregInfo->mRelTo = jumpVReg;
  2894. vregInfo->mRelOffset = mcOfsValue;
  2895. vregInfo->mRelOffsetScale = 4;
  2896. jumpRelVReg.mKind = BeMCOperandKind_VRegLoad;
  2897. AllocInst(BeMCInstKind_Mov, jumpVReg, jumpRelVReg);
  2898. auto imageBaseSym = mCOFFObject->GetSymbolRef("__ImageBase");
  2899. imageBaseSym->mType = nativeType;
  2900. auto baseVReg = AllocVirtualReg(nativeType);
  2901. CreateDefineVReg(baseVReg);
  2902. AllocInst(BeMCInstKind_Mov, baseVReg, BeMCOperand::FromSymbolAddr(imageBaseSym->mIdx));
  2903. AllocInst(BeMCInstKind_Add, jumpVReg, baseVReg);
  2904. AllocInst(BeMCInstKind_Br, jumpVReg);
  2905. int64 lastVal = loVal - 1;
  2906. defaultBlock.mBlock->AddPred(mActiveBlock);
  2907. for (int caseIdx = 0; caseIdx < (int)switchInst->mCases.size(); caseIdx++)
  2908. {
  2909. auto& switchCase = switchInst->mCases[caseIdx];
  2910. int64 newVal = switchCase.mValue->mInt64;
  2911. for (int64 val = lastVal + 1; val <= newVal; val++)
  2912. {
  2913. BeMCSwitchEntry switchEntry;
  2914. switchEntry.mOfs = sect.mData.GetSize();
  2915. if (val == newVal)
  2916. {
  2917. auto switchBlock = GetOperand(switchCase.mBlock);
  2918. switchBlock.mBlock->AddPred(mActiveBlock);
  2919. switchEntry.mBlock = switchBlock.mBlock;
  2920. }
  2921. else
  2922. {
  2923. switchEntry.mBlock = defaultBlock.mBlock;
  2924. }
  2925. mSwitchEntries.push_back(switchEntry);
  2926. // Placeholder
  2927. sect.mData.Write((int32)0);
  2928. }
  2929. lastVal = newVal;
  2930. }
  2931. }
  2932. void BeMCContext::CreateBinarySwitchSection(BeSwitchInst* switchInst, int startIdx, int endIdx)
  2933. {
  2934. // This is an empirically determined binary switching limit
  2935. if (endIdx - startIdx >= 18)
  2936. {
  2937. int gteLabel = mCurLabelIdx++;
  2938. auto mcDefaultBlock = GetOperand(switchInst->mDefaultBlock);
  2939. int midIdx = startIdx + (endIdx - startIdx) / 2;
  2940. auto& switchCase = switchInst->mCases[midIdx];
  2941. auto switchBlock = GetOperand(switchCase.mBlock);
  2942. auto mcValue = GetOperand(switchInst->mValue);
  2943. auto valueType = GetType(mcValue);
  2944. AllocInst(BeMCInstKind_Cmp, mcValue, GetOperand(switchCase.mValue));
  2945. AllocInst(BeMCInstKind_CondBr, BeMCOperand::FromLabel(gteLabel), BeMCOperand::FromCmpKind(BeCmpKind_SGE));
  2946. switchBlock.mBlock->AddPred(mActiveBlock);
  2947. CreateBinarySwitchSection(switchInst, startIdx, midIdx);
  2948. AllocInst(BeMCInstKind_Br, mcDefaultBlock);
  2949. CreateLabel(-1, gteLabel);
  2950. CreateBinarySwitchSection(switchInst, midIdx, endIdx);
  2951. return;
  2952. }
  2953. for (int caseIdx = startIdx; caseIdx < endIdx; caseIdx++)
  2954. {
  2955. auto& switchCase = switchInst->mCases[caseIdx];
  2956. auto switchBlock = GetOperand(switchCase.mBlock);
  2957. auto mcValue = GetOperand(switchInst->mValue);
  2958. AllocInst(BeMCInstKind_Cmp, mcValue, GetOperand(switchCase.mValue));
  2959. AllocInst(BeMCInstKind_CondBr, switchBlock, BeMCOperand::FromCmpKind(BeCmpKind_EQ));
  2960. switchBlock.mBlock->AddPred(mActiveBlock);
  2961. }
  2962. }
  2963. void BeMCContext::CreateCondBr(BeMCBlock* mcBlock, BeMCOperand& testVal, const BeMCOperand& trueBlock, const BeMCOperand& falseBlock)
  2964. {
  2965. if (mDebugging)
  2966. {
  2967. NOP;
  2968. }
  2969. if (testVal.IsImmediate())
  2970. {
  2971. if (testVal.mImmediate != 0)
  2972. AllocInst(BeMCInstKind_Br, trueBlock);
  2973. else
  2974. AllocInst(BeMCInstKind_Br, falseBlock);
  2975. }
  2976. else if (testVal.mKind == BeMCOperandKind_CmpResult)
  2977. {
  2978. // Beef-specific: assuming CMP results aren't stomped
  2979. auto& cmpResult = mCmpResults[testVal.mCmpResultIdx];
  2980. AllocInst(BeMCInstKind_CondBr, trueBlock, BeMCOperand::FromCmpKind(cmpResult.mCmpKind));
  2981. AllocInst(BeMCInstKind_Br, falseBlock);
  2982. }
  2983. else if (testVal.mKind == BeMCOperandKind_Phi)
  2984. {
  2985. auto phi = testVal.mPhi;
  2986. auto phiBlock = phi->mBlock;
  2987. if ((phi->mBrTrue != NULL) && (phi->mBrFalse != NULL))
  2988. {
  2989. // Redirect branches
  2990. for (auto instIdx = 0; instIdx < phiBlock->mInstructions.size(); instIdx++)
  2991. {
  2992. auto inst = phiBlock->mInstructions[instIdx];
  2993. if (inst->mKind == BeMCInstKind_Br)
  2994. {
  2995. if (inst->mArg0 == phi->mBrTrue)
  2996. inst->mArg0 = trueBlock;
  2997. else if (inst->mArg0 == phi->mBrFalse)
  2998. inst->mArg0 = falseBlock;
  2999. }
  3000. }
  3001. phi->mBrTrue = trueBlock;
  3002. phi->mBrFalse = falseBlock;
  3003. return;
  3004. }
  3005. phi->mBrTrue = trueBlock;
  3006. phi->mBrFalse = falseBlock;
  3007. // Using a Phi for a CondBr in a different block is not supported
  3008. if (phiBlock != mcBlock)
  3009. {
  3010. // Special case if our using block directly leads into us
  3011. BF_ASSERT(mcBlock->mPreds.size() == 1);
  3012. BF_ASSERT(mcBlock->mPreds[0] == phiBlock);
  3013. }
  3014. for (auto instIdx = 0; instIdx < phiBlock->mInstructions.size(); instIdx++)
  3015. {
  3016. auto inst = phiBlock->mInstructions[instIdx];
  3017. if (inst->mKind == BeMCInstKind_DefPhi)
  3018. {
  3019. BF_ASSERT(inst->mArg0.mPhi == phi);
  3020. RemoveInst(phiBlock, instIdx);
  3021. break;
  3022. }
  3023. }
  3024. for (auto& phiVal : phi->mValues)
  3025. {
  3026. BeMCOperand landinglabel;
  3027. if (phiVal.mValue.mKind != BeMCOperandKind_Phi)
  3028. {
  3029. landinglabel = BeMCOperand::FromLabel(mCurLabelIdx++);
  3030. AllocInst(BeMCInstKind_Label, landinglabel);
  3031. }
  3032. int brInstIdx = -1;
  3033. bool isFalseCmpResult = false;
  3034. if (landinglabel)
  3035. {
  3036. bool found = false;
  3037. auto _CheckBlock = [&] (BeMCBlock* block)
  3038. {
  3039. for (int checkIdx = (int)block->mInstructions.size() - 1; checkIdx >= 0; checkIdx--)
  3040. {
  3041. auto checkInst = block->mInstructions[checkIdx];
  3042. if ((checkInst->mArg0.mKind == BeMCOperandKind_Block) &&
  3043. (checkInst->mArg0.mBlock == phi->mBlock))
  3044. {
  3045. brInstIdx = checkIdx;
  3046. checkInst->mArg0 = landinglabel;
  3047. found = true;
  3048. // Don't break, if we're are chained to another PHI then we need to modify all the labels
  3049. isFalseCmpResult = false;
  3050. if ((checkIdx >= 2) && (checkInst->mKind == BeMCInstKind_Br))
  3051. {
  3052. auto prevInst = block->mInstructions[checkIdx - 1];
  3053. auto prevPrevInst = block->mInstructions[checkIdx - 2];
  3054. if ((prevPrevInst->mKind == BeMCInstKind_Cmp) && (prevPrevInst->mResult == phiVal.mValue) &&
  3055. (prevInst->mKind == BeMCInstKind_CondBr) && (prevInst->mArg1.mCmpKind == BeCmpKind_EQ))
  3056. {
  3057. isFalseCmpResult = true;
  3058. }
  3059. }
  3060. }
  3061. }
  3062. };
  3063. _CheckBlock(phiVal.mBlockFrom);
  3064. BF_ASSERT(found);
  3065. }
  3066. if (isFalseCmpResult)
  3067. {
  3068. BF_ASSERT(phiVal.mValue.mKind == BeMCOperandKind_CmpResult);
  3069. AllocInst(BeMCInstKind_Br, falseBlock);
  3070. }
  3071. else if ((phiVal.mValue.IsImmediate()) ||
  3072. (phiVal.mValue.mKind == BeMCOperandKind_CmpResult) ||
  3073. (phiVal.mValue.mKind == BeMCOperandKind_Phi) ||
  3074. (phiVal.mValue.mKind == BeMCOperandKind_NotResult))
  3075. {
  3076. CreateCondBr(phiVal.mBlockFrom, phiVal.mValue, trueBlock, falseBlock);
  3077. }
  3078. else
  3079. {
  3080. // Do the 'test' in the preceding block. This is needed for liveness checking. Using a vreg in this
  3081. // block would require the def to be hoisted
  3082. SetAndRestoreValue<BeMCBlock*> prevActiveBlock(mActiveBlock, phiVal.mBlockFrom);
  3083. BeMCOperand testImm;
  3084. testImm.mKind = BeMCOperandKind_Immediate_i8;
  3085. testImm.mImmediate = 1;
  3086. auto mcInst = AllocInst(BeMCInstKind_Test, phiVal.mValue, testImm, brInstIdx);
  3087. prevActiveBlock.Restore();
  3088. mcInst = AllocInst(BeMCInstKind_CondBr, trueBlock, BeMCOperand::FromCmpKind(BeCmpKind_NE));
  3089. mcInst = AllocInst(BeMCInstKind_Br, falseBlock);
  3090. }
  3091. }
  3092. }
  3093. else if (testVal.mKind == BeMCOperandKind_NotResult)
  3094. {
  3095. // Just get the original block and swap the true/false blocks
  3096. auto invResult = GetOperand(testVal.mNotResult->mValue, true);
  3097. if (invResult)
  3098. {
  3099. CreateCondBr(mcBlock, invResult, falseBlock, trueBlock);
  3100. }
  3101. }
  3102. else
  3103. {
  3104. BeMCOperand testImm;
  3105. testImm.mKind = BeMCOperandKind_Immediate_i8;
  3106. testImm.mImmediate = 1;
  3107. auto mcInst = AllocInst(BeMCInstKind_Test, testVal, testImm);
  3108. mcInst = AllocInst(BeMCInstKind_CondBr, trueBlock, BeMCOperand::FromCmpKind(BeCmpKind_NE));
  3109. mcInst = AllocInst(BeMCInstKind_Br, falseBlock);
  3110. }
  3111. }
  3112. void BeMCContext::CreatePhiAssign(BeMCBlock* mcBlock, const BeMCOperand& testVal, const BeMCOperand& result, const BeMCOperand& doneLabel)
  3113. {
  3114. if (testVal.mKind == BeMCOperandKind_Phi)
  3115. {
  3116. auto phi = testVal.mPhi;
  3117. for (auto& phiVal : phi->mValues)
  3118. {
  3119. BeMCOperand landinglabel;
  3120. if (phiVal.mValue.mKind == BeMCOperandKind_Phi)
  3121. {
  3122. // Remove PhiDef
  3123. auto phi = phiVal.mValue.mPhi;
  3124. auto phiBlock = phi->mBlock;
  3125. for (auto instIdx = 0; instIdx < phiBlock->mInstructions.size(); instIdx++)
  3126. {
  3127. auto inst = phiBlock->mInstructions[instIdx];
  3128. if (inst->mKind == BeMCInstKind_DefPhi)
  3129. {
  3130. BF_ASSERT(inst->mArg0.mPhi == phi);
  3131. RemoveInst(phiBlock, instIdx);
  3132. break;
  3133. }
  3134. }
  3135. CreatePhiAssign(phiVal.mBlockFrom, phiVal.mValue, result, doneLabel);
  3136. }
  3137. else
  3138. {
  3139. bool found = false;
  3140. auto _CheckBlock = [&] (BeMCBlock* block)
  3141. {
  3142. SetAndRestoreValue<BeMCBlock*> prevActiveBlock(mActiveBlock, block);
  3143. for (int checkIdx = (int)block->mInstructions.size() - 1; checkIdx >= 0; checkIdx--)
  3144. {
  3145. auto checkInst = block->mInstructions[checkIdx];
  3146. if ((checkInst->mArg0.mKind == BeMCOperandKind_Block) &&
  3147. (checkInst->mArg0.mBlock == phi->mBlock))
  3148. {
  3149. // Don't use an explicit dbgLoc
  3150. SetAndRestoreValue<BeDbgLoc*> prevDbgLoc(mCurDbgLoc, NULL);
  3151. if (checkInst->mKind == BeMCInstKind_CondBr)
  3152. {
  3153. auto falseLabel = BeMCOperand::FromLabel(mCurLabelIdx++);
  3154. auto prevDest = checkInst->mArg0;
  3155. checkInst->mArg0 = falseLabel;
  3156. checkInst->mArg1.mCmpKind = BeModule::InvertCmp(checkInst->mArg1.mCmpKind);
  3157. AllocInst(BeMCInstKind_Mov, result, phiVal.mValue, checkIdx + 1);
  3158. AllocInst(BeMCInstKind_Br, prevDest, checkIdx + 2);
  3159. AllocInst(BeMCInstKind_Label, falseLabel, checkIdx + 3);
  3160. }
  3161. else
  3162. {
  3163. AllocInst(BeMCInstKind_Mov, result, phiVal.mValue, checkIdx);
  3164. }
  3165. found = true;
  3166. }
  3167. }
  3168. };
  3169. _CheckBlock(phiVal.mBlockFrom);
  3170. BF_ASSERT(found);
  3171. }
  3172. if (landinglabel)
  3173. {
  3174. AllocInst(BeMCInstKind_Br, doneLabel);
  3175. }
  3176. }
  3177. }
  3178. else
  3179. {
  3180. NotImpl();
  3181. }
  3182. }
  3183. BeMCOperand BeMCContext::GetImmediate(int64 val)
  3184. {
  3185. BeMCOperand operand;
  3186. operand.mKind = BeMCOperandKind_Immediate_i64;
  3187. operand.mImmediate = val;
  3188. return operand;
  3189. }
  3190. BeMCOperand BeMCContext::GetVReg(int regNum)
  3191. {
  3192. auto vregInfo = mVRegInfo[regNum];
  3193. if (vregInfo->mReg != X64Reg_None)
  3194. return BeMCOperand::FromReg(vregInfo->mReg);
  3195. BeMCOperand operand;
  3196. operand.mKind = BeMCOperandKind_VReg;
  3197. operand.mVRegIdx = regNum;
  3198. return operand;
  3199. }
  3200. BeMCOperand BeMCContext::AllocVirtualReg(BeType* type, int refCount, bool mustBeReg)
  3201. {
  3202. BF_ASSERT(type->mTypeCode != BeTypeCode_Function); // We can only have pointers to these
  3203. if (mustBeReg)
  3204. {
  3205. BF_ASSERT(!type->IsComposite());
  3206. BF_ASSERT(type->mSize != 0);
  3207. }
  3208. int vregIdx = (int)mVRegInfo.size();
  3209. BeMCVRegInfo* vregInfo = mAlloc.Alloc<BeMCVRegInfo>();
  3210. vregInfo->mType = type;
  3211. vregInfo->mAlign = type->mAlign;
  3212. vregInfo->mRefCount = refCount;
  3213. vregInfo->mForceReg = mustBeReg;
  3214. mVRegInfo.push_back(vregInfo);
  3215. BeMCOperand mcOperand;
  3216. mcOperand.mKind = BeMCOperandKind_VReg;
  3217. mcOperand.mVRegIdx = vregIdx++;
  3218. if (mDebugging)
  3219. {
  3220. if (mcOperand.mVRegIdx == 3)
  3221. {
  3222. NOP;
  3223. }
  3224. }
  3225. return mcOperand;
  3226. }
  3227. int BeMCContext::GetUnderlyingVReg(int vregIdx)
  3228. {
  3229. while (true)
  3230. {
  3231. auto vregInfo = mVRegInfo[vregIdx];
  3232. if (!vregInfo->mRelTo.IsVRegAny())
  3233. return vregIdx;
  3234. if (vregInfo->mRelOffset)
  3235. return vregIdx;
  3236. vregIdx = vregInfo->mRelTo.mVRegIdx;
  3237. }
  3238. }
  3239. bool BeMCContext::HasForceRegs(const BeMCOperand &operand)
  3240. {
  3241. if (!operand.IsVRegAny())
  3242. return false;
  3243. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  3244. if (vregInfo->mForceReg)
  3245. return true;
  3246. return HasForceRegs(vregInfo->mRelTo) || HasForceRegs(vregInfo->mRelOffset);
  3247. }
  3248. bool BeMCContext::OperandsEqual(const BeMCOperand& op0, const BeMCOperand& op1, bool exact)
  3249. {
  3250. bool isVReg0 = op0.mKind == BeMCOperandKind_VReg;
  3251. bool isVReg1 = op1.mKind == BeMCOperandKind_VReg;
  3252. if (!isVReg0 || !isVReg1)
  3253. {
  3254. return op0 == op1;
  3255. }
  3256. if (exact)
  3257. {
  3258. int vregIdx0 = op0.mVRegIdx;
  3259. int vregIdx1 = op1.mVRegIdx;
  3260. while (true)
  3261. {
  3262. auto vregInfo = mVRegInfo[vregIdx0];
  3263. if (!vregInfo->IsDirectRelTo())
  3264. break;
  3265. if (vregInfo->mRelTo.mKind != BeMCOperandKind_VReg)
  3266. return false;
  3267. vregIdx0 = vregInfo->mRelTo.mVRegIdx;
  3268. }
  3269. while (true)
  3270. {
  3271. auto vregInfo = mVRegInfo[vregIdx1];
  3272. if (!vregInfo->IsDirectRelTo())
  3273. break;
  3274. if (vregInfo->mRelTo.mKind != BeMCOperandKind_VReg)
  3275. return false;
  3276. vregIdx1 = vregInfo->mRelTo.mVRegIdx;
  3277. }
  3278. return vregIdx0 == vregIdx1;
  3279. }
  3280. int vregIdx0 = GetUnderlyingVReg(op0.mVRegIdx);
  3281. int vregIdx1 = GetUnderlyingVReg(op1.mVRegIdx);
  3282. return vregIdx0 == vregIdx1;
  3283. }
  3284. bool BeMCContext::ContainsNonOffsetRef(const BeMCOperand& checkOperand, const BeMCOperand& findOperand)
  3285. {
  3286. if (!checkOperand.IsVRegAny())
  3287. return false;
  3288. if (checkOperand == findOperand)
  3289. return true;
  3290. auto vregInfo = GetVRegInfo(checkOperand);
  3291. if (ContainsNonOffsetRef(vregInfo->mRelTo, findOperand))
  3292. return true;
  3293. return false;
  3294. }
  3295. // For all values that we are certain we will immediately use, we directly do a Def preceding its first use.
  3296. // For Allocas in the head, however, we may not use that memory for a long time so we imply the Def location
  3297. // in DoDefPass. That allows us to limit how long that vreg will hold onto a register, reducing register
  3298. // contention.
  3299. BeMCInst* BeMCContext::CreateDefineVReg(const BeMCOperand& vreg, int insertIdx)
  3300. {
  3301. auto mcInst = AllocInst(insertIdx);
  3302. mcInst->mKind = BeMCInstKind_Def;
  3303. mcInst->mArg0 = vreg;
  3304. return mcInst;
  3305. }
  3306. int BeMCContext::CreateLabel(int insertIdx, int labelIdx)
  3307. {
  3308. auto inst = AllocInst(insertIdx);
  3309. inst->mKind = BeMCInstKind_Label;
  3310. inst->mArg0.mKind = BeMCOperandKind_Label;
  3311. if (labelIdx != -1)
  3312. inst->mArg0.mLabelIdx = labelIdx;
  3313. else
  3314. inst->mArg0.mLabelIdx = mCurLabelIdx++;
  3315. return inst->mArg0.mLabelIdx;
  3316. }
  3317. bool BeMCContext::FindTarget(const BeMCOperand& loc, BeMCBlock*& outBlock, int& outInstIdx)
  3318. {
  3319. if (loc.mKind == BeMCOperandKind_Block)
  3320. {
  3321. outBlock = loc.mBlock;
  3322. outInstIdx = -1;
  3323. return true;
  3324. }
  3325. if (loc.mKind == BeMCOperandKind_Label)
  3326. {
  3327. // Linear search :-(
  3328. for (auto mcBlock : mBlocks)
  3329. {
  3330. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  3331. {
  3332. auto inst = mcBlock->mInstructions[instIdx];
  3333. if ((inst->mKind == BeMCInstKind_Label) && (inst->mArg0.mLabelIdx == loc.mLabelIdx))
  3334. {
  3335. outBlock = mcBlock;
  3336. outInstIdx = instIdx;
  3337. return true;
  3338. }
  3339. }
  3340. }
  3341. }
  3342. return false;
  3343. }
  3344. BeMCOperand BeMCContext::AllocRelativeVirtualReg(BeType* type, const BeMCOperand& relTo, const BeMCOperand& relOffset, int relScale)
  3345. {
  3346. if (!relTo.IsVRegAny())
  3347. {
  3348. auto relToType = GetType(relTo);
  3349. auto tempRelTo = AllocVirtualReg(relToType, 1);
  3350. CreateDefineVReg(tempRelTo);
  3351. AllocInst(BeMCInstKind_Mov, tempRelTo, relTo);
  3352. tempRelTo.mKind = BeMCOperandKind_VReg;
  3353. return AllocRelativeVirtualReg(type, tempRelTo, relOffset, relScale);
  3354. }
  3355. BF_ASSERT(relTo.IsVRegAny());
  3356. auto relToVRegInfo = GetVRegInfo(relTo);
  3357. if ((mDebugging) && (mVRegInfo.size() == 5))
  3358. {
  3359. NOP;
  3360. }
  3361. if ((relToVRegInfo->mRelTo) && (relToVRegInfo->mRelOffsetScale == 1) && (relToVRegInfo->mRelOffset.IsImmediate()) &&
  3362. (relOffset.IsImmediate()) && (relScale == 1))
  3363. {
  3364. if (relTo.mKind == BeMCOperandKind_VReg)
  3365. {
  3366. int offset = (int)relOffset.mImmediate;
  3367. if (relToVRegInfo->mRelOffset)
  3368. offset += relToVRegInfo->mRelOffset.mImmediate;
  3369. return AllocRelativeVirtualReg(type, relToVRegInfo->mRelTo, GetImmediate(offset), 1);
  3370. }
  3371. }
  3372. if ((relTo.mKind == BeMCOperandKind_VRegAddr) && (!relToVRegInfo->mRelOffset) && (relOffset.IsZero()) && (relScale == 1))
  3373. {
  3374. auto vregInfo = GetVRegInfo(relTo);
  3375. if (vregInfo->IsDirectRelToAny())
  3376. {
  3377. if (vregInfo->mRelTo.mKind == BeMCOperandKind_Symbol)
  3378. {
  3379. return AllocRelativeVirtualReg(type, BeMCOperand::FromSymbolAddr(vregInfo->mRelTo.mSymbolIdx), BeMCOperand(), 1);
  3380. }
  3381. }
  3382. }
  3383. auto mcVReg = AllocVirtualReg(type);
  3384. auto vregInfo = GetVRegInfo(mcVReg);
  3385. vregInfo->mIsExpr = true;
  3386. vregInfo->mRelTo = relTo;
  3387. if (!relOffset.IsZero())
  3388. vregInfo->mRelOffset = relOffset;
  3389. vregInfo->mRelOffsetScale = relScale;
  3390. mcVReg.mKind = BeMCOperandKind_VReg;
  3391. return mcVReg;
  3392. }
  3393. BeMCVRegInfo* BeMCContext::GetVRegInfo(const BeMCOperand& operand)
  3394. {
  3395. if (!operand.IsVRegAny())
  3396. return NULL;
  3397. return mVRegInfo[operand.mVRegIdx];
  3398. }
  3399. bool BeMCContext::HasSymbolAddr(const BeMCOperand& operand)
  3400. {
  3401. if (operand.mKind == BeMCOperandKind_SymbolAddr)
  3402. return true;
  3403. auto vregInfo = GetVRegInfo(operand);
  3404. if (vregInfo == NULL)
  3405. return false;
  3406. if ((vregInfo->mRelTo) && (HasSymbolAddr(vregInfo->mRelTo)))
  3407. return true;
  3408. if ((vregInfo->mRelOffset) && (HasSymbolAddr(vregInfo->mRelOffset)))
  3409. return true;
  3410. return false;
  3411. }
  3412. BeMCOperand BeMCContext::ReplaceWithNewVReg(BeMCOperand& operand, int& instIdx, bool isInput, bool mustBeReg)
  3413. {
  3414. BeMCOperand scratchReg = AllocVirtualReg(GetType(operand), 2, mustBeReg);
  3415. CreateDefineVReg(scratchReg, instIdx++);
  3416. if (isInput)
  3417. AllocInst(BeMCInstKind_Mov, scratchReg, operand, instIdx++);
  3418. else
  3419. AllocInst(BeMCInstKind_Mov, operand, scratchReg, instIdx++ + 1);
  3420. operand = scratchReg;
  3421. return scratchReg;
  3422. }
  3423. BeMCOperand BeMCContext::RemapOperand(BeMCOperand& operand, BeMCRemapper& regRemaps)
  3424. {
  3425. if (!operand.IsVRegAny())
  3426. return operand;
  3427. int regIdx = regRemaps.GetHead(operand.mVRegIdx);
  3428. if (regIdx < 0)
  3429. {
  3430. BeMCOperand newOperand;
  3431. newOperand.mKind = operand.mKind;
  3432. if (newOperand.mKind == BeMCOperandKind_VRegLoad)
  3433. newOperand.mKind = BeMCOperandKind_VReg;
  3434. else
  3435. NotImpl();
  3436. newOperand.mVRegIdx = -regIdx;
  3437. return newOperand;
  3438. }
  3439. else
  3440. {
  3441. BeMCOperand newOperand;
  3442. newOperand.mKind = operand.mKind;
  3443. newOperand.mVRegIdx = regIdx;
  3444. return newOperand;
  3445. }
  3446. }
  3447. bool BeMCContext::IsLive(BeVTrackingList* liveRegs, int origVRegIdx, BeMCRemapper& regRemaps)
  3448. {
  3449. // Check the whole remap chain to determine liveness
  3450. int vregIdx = regRemaps.GetHead(origVRegIdx);
  3451. while (vregIdx != -1)
  3452. {
  3453. if (mLivenessContext.IsSet(liveRegs, vregIdx))
  3454. return true;
  3455. vregIdx = regRemaps.GetNext(vregIdx);
  3456. }
  3457. return false;
  3458. }
  3459. void BeMCContext::AddRegRemap(int from, int to, BeMCRemapper& regRemaps, bool allowRemapToDbgVar)
  3460. {
  3461. auto vregInfoFrom = mVRegInfo[from];
  3462. auto vregInfoTo = mVRegInfo[to];
  3463. BF_ASSERT(vregInfoFrom->mDbgVariable == NULL);
  3464. if (vregInfoTo->mDbgVariable != NULL)
  3465. {
  3466. // We can't do a direct remap due to lifetime issues, so do an indirect one
  3467. vregInfoFrom->mIsExpr = true;
  3468. if (!vregInfoFrom->mIsRetVal)
  3469. vregInfoFrom->mForceReg = false;
  3470. vregInfoFrom->mRelTo = BeMCOperand::FromVReg(to);
  3471. vregInfoFrom->mRelOffset = BeMCOperand();
  3472. vregInfoFrom->mRelOffsetScale = 1;
  3473. return;
  3474. }
  3475. regRemaps.Add(from, to);
  3476. }
  3477. bool BeMCContext::GetEncodedOperand(const BeMCOperand& operand, int& encodedVal)
  3478. {
  3479. if (operand.mKind == BeMCOperandKind_VReg)
  3480. {
  3481. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  3482. encodedVal = operand.mVRegIdx;
  3483. return true;
  3484. }
  3485. if (operand.mKind != BeMCOperandKind_VRegAddr)
  3486. return false;
  3487. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  3488. if (vregInfo->IsDirectRelTo())
  3489. {
  3490. if (!GetEncodedOperand(vregInfo->mRelTo, encodedVal))
  3491. return false;
  3492. encodedVal |= BeMCOperand::EncodeFlag_Addr;
  3493. return true;
  3494. }
  3495. if (vregInfo->mIsExpr)
  3496. return false;
  3497. encodedVal = operand.mVRegIdx | BeMCOperand::EncodeFlag_Addr;
  3498. return true;
  3499. }
  3500. bool BeMCContext::HasPointerDeref(const BeMCOperand& operand)
  3501. {
  3502. if (operand.mKind == BeMCOperandKind_VRegLoad)
  3503. return true;
  3504. auto vregInfo = GetVRegInfo(operand);
  3505. if (vregInfo == NULL)
  3506. return false;
  3507. if (!vregInfo->mRelTo)
  3508. return false;
  3509. if ((vregInfo->mRelTo.mKind == BeMCOperandKind_VRegLoad) ||
  3510. (vregInfo->mRelTo.mKind == BeMCOperandKind_VReg))
  3511. return true;
  3512. return false;
  3513. }
  3514. bool BeMCContext::AreOperandsEquivalent(const BeMCOperand& origOp0, const BeMCOperand& origOp1, BeMCRemapper& regRemaps)
  3515. {
  3516. auto op0 = origOp0;
  3517. RemapOperand(op0, regRemaps);
  3518. auto op1 = origOp1;
  3519. RemapOperand(op1, regRemaps);
  3520. if (op0.mKind != op1.mKind)
  3521. return false;
  3522. if (op0.mKind == BeMCOperandKind_None)
  3523. return true;
  3524. if (op0.IsSymbol())
  3525. return op0.mSymbolIdx == op1.mSymbolIdx;
  3526. if (op0.IsImmediate())
  3527. return op0.mImmediate == op1.mImmediate;
  3528. if (op0.IsNativeReg())
  3529. return op0.mReg == op1.mReg;
  3530. if (op0.IsVRegAny())
  3531. {
  3532. if (op0.mVRegIdx == op1.mVRegIdx)
  3533. return true;
  3534. auto vregInfo0 = mVRegInfo[op0.mVRegIdx];
  3535. auto vregInfo1 = mVRegInfo[op1.mVRegIdx];
  3536. if (vregInfo0->mType != vregInfo1->mType)
  3537. return false;
  3538. if ((!vregInfo0->mIsExpr) || (!vregInfo1->mIsExpr))
  3539. return false;
  3540. return
  3541. (vregInfo0->mRelOffsetScale == vregInfo1->mRelOffsetScale) &&
  3542. (AreOperandsEquivalent(vregInfo0->mRelTo, vregInfo1->mRelTo, regRemaps)) &&
  3543. (AreOperandsEquivalent(vregInfo0->mRelOffset, vregInfo1->mRelOffset, regRemaps));
  3544. }
  3545. return false;
  3546. }
  3547. bool BeMCContext::CouldBeReg(const BeMCOperand& operand)
  3548. {
  3549. if (operand.mKind != BeMCOperandKind_VReg)
  3550. return false;
  3551. auto vregInfo = GetVRegInfo(operand);
  3552. if (vregInfo->mForceMem)
  3553. return false;
  3554. if (vregInfo->mIsExpr)
  3555. {
  3556. if (vregInfo->mRelOffset)
  3557. return false;
  3558. }
  3559. return true;
  3560. }
  3561. bool BeMCContext::CheckForce(BeMCVRegInfo * vregInfo)
  3562. {
  3563. if (!vregInfo->mIsRetVal)
  3564. {
  3565. if (vregInfo->mForceMem && vregInfo->mForceReg)
  3566. Fail("vreg forceMem/forceReg collision");
  3567. }
  3568. return false;
  3569. }
  3570. void BeMCContext::MarkLive(BeVTrackingList* liveRegs, SizedArrayImpl<int>& newRegs, BeVTrackingList* vregsInitialized, const BeMCOperand& operand)
  3571. {
  3572. int vregIdx = operand.mVRegIdx;
  3573. auto vregInfo = mVRegInfo[vregIdx];
  3574. if (mLivenessContext.IsSet(liveRegs, operand.mVRegIdx))
  3575. return;
  3576. for (auto newReg : newRegs)
  3577. if (newReg == operand.mVRegIdx)
  3578. return;
  3579. if (!mColorizer.mNodes.empty())
  3580. {
  3581. // Is new
  3582. for (int i = 0; i < liveRegs->mSize; i++)
  3583. {
  3584. int checkReg = liveRegs->mEntries[i];
  3585. if (checkReg >= mLivenessContext.mNumItems)
  3586. continue;
  3587. mColorizer.AddEdge(checkReg, operand.mVRegIdx);
  3588. }
  3589. for (auto checkReg : newRegs)
  3590. mColorizer.AddEdge(checkReg, operand.mVRegIdx);
  3591. }
  3592. if (vregInfo->mHasDynLife)
  3593. {
  3594. if (!mLivenessContext.IsSet(vregsInitialized, vregIdx))
  3595. {
  3596. // This indicates that this is a 'def' usage, meaning the value wasn't actually set yet
  3597. // so don't propagate this index upward
  3598. return;
  3599. }
  3600. }
  3601. if ((vregInfo->mRelTo) && (vregInfo->mRelTo.IsVRegAny()))
  3602. MarkLive(liveRegs, newRegs, vregsInitialized, vregInfo->mRelTo);
  3603. if ((vregInfo->mRelOffset) && (vregInfo->mRelOffset.IsVRegAny()))
  3604. MarkLive(liveRegs, newRegs, vregsInitialized, vregInfo->mRelOffset);
  3605. newRegs.push_back(operand.mVRegIdx);
  3606. }
  3607. BeVTrackingList* BeMCContext::MergeLiveRegs(BeVTrackingList* prevDestEntry, BeVTrackingList* mergeFrom)
  3608. {
  3609. int vregIdx = -1;
  3610. SizedArray<int, 16> newNodes;
  3611. SizedArray<int, 16> prevExclusiveNodes;
  3612. // Take nodes that were exclusive to the new set and add edges to nodes that were exclusive the old set
  3613. /*while (true)
  3614. {
  3615. vregIdx = mLivenessContext.GetNextDiffSetIdx(prevDestEntry.mBits, mergeFrom, vregIdx);
  3616. if (vregIdx == -1)
  3617. break;
  3618. newNodes.push_back(vregIdx);
  3619. if (!mColorizer.mNodes.empty())
  3620. {
  3621. int checkReg = -1;
  3622. while (true)
  3623. {
  3624. checkReg = mLivenessContext.GetNextDiffSetIdx(mergeFrom, prevDestEntry.mBits, checkReg);
  3625. if (checkReg == -1)
  3626. break;
  3627. mColorizer.AddEdge(checkReg, vregIdx);
  3628. }
  3629. }
  3630. }*/
  3631. auto prevItr = prevDestEntry->begin();
  3632. auto prevEnd = prevDestEntry->end();
  3633. auto mergeFromItr = mergeFrom->begin();
  3634. auto mergeFromEnd = mergeFrom->end();
  3635. while ((prevItr != prevEnd) && (mergeFromItr != mergeFromEnd))
  3636. {
  3637. int prevIdx = *prevItr;
  3638. int mergeIdx = *mergeFromItr;
  3639. bool done = false;
  3640. while (mergeIdx < prevIdx)
  3641. {
  3642. newNodes.push_back(mergeIdx);
  3643. ++mergeFromItr;
  3644. if (mergeFromItr == mergeFromEnd)
  3645. {
  3646. done = true;
  3647. break;
  3648. }
  3649. mergeIdx = *mergeFromItr;
  3650. }
  3651. if (done)
  3652. break;
  3653. while (prevIdx < mergeIdx)
  3654. {
  3655. prevExclusiveNodes.push_back(prevIdx);
  3656. ++prevItr;
  3657. if (prevItr == prevEnd)
  3658. {
  3659. done = true;
  3660. break;
  3661. }
  3662. prevIdx = *prevItr;
  3663. }
  3664. if (done)
  3665. break;
  3666. if (prevIdx == mergeIdx)
  3667. {
  3668. ++prevItr;
  3669. ++mergeFromItr;
  3670. }
  3671. }
  3672. while (prevItr != prevEnd)
  3673. {
  3674. prevExclusiveNodes.push_back(*prevItr);
  3675. ++prevItr;
  3676. }
  3677. while (mergeFromItr != mergeFromEnd)
  3678. {
  3679. newNodes.push_back(*mergeFromItr);
  3680. ++mergeFromItr;
  3681. }
  3682. if (!mColorizer.mNodes.empty())
  3683. {
  3684. for (int newIdx : newNodes)
  3685. {
  3686. for (int prevExclusiveIdx : prevExclusiveNodes)
  3687. {
  3688. mColorizer.AddEdge(newIdx, prevExclusiveIdx);
  3689. }
  3690. }
  3691. }
  3692. return mLivenessContext.Add(prevDestEntry, newNodes, false);
  3693. }
  3694. static void DedupPushBack(SizedArrayImpl<int>& vec, int val)
  3695. {
  3696. if (vec.Contains(val))
  3697. return;
  3698. vec.push_back(val);
  3699. }
  3700. static int genLivenessIdx = 0;
  3701. void BeMCContext::GenerateLiveness(BeMCBlock* block, BeVTrackingGenContext* genCtx, bool& modifiedBlockBefore, bool& modifiedBlockAfter)
  3702. {
  3703. genCtx->mBlocks[block->mBlockIdx].mGenerateCount++;
  3704. modifiedBlockBefore = false;
  3705. modifiedBlockAfter = false;
  3706. genCtx->mCalls++;
  3707. bool debugging = false;
  3708. //if (mDebugging) debugging = true;
  3709. //if (mBeFunction->mName == "?Draw@DarkEditWidgetContent@dark@theme@Beefy@@UEAAXPEAVGraphics@gfx@4@@Z")
  3710. //debugging = true;
  3711. //"?DrawEntry@DrawContext@PerfView@BeefPerf@@QEAAXPEAVGraphics@gfx@Beefy@@PEAVTrackNodeEntry@23@MM@Z")
  3712. //debugging &= mcColorizer != NULL;
  3713. if (debugging)
  3714. {
  3715. if (block->mBlockIdx == 220)
  3716. {
  3717. //BF_ASSERT(mLivenessContext.IsSet(succLiveRegs, 36));
  3718. }
  3719. }
  3720. if (debugging)
  3721. {
  3722. OutputDebugStrF("GenerateLiveness %s(%d)\n", ToString(BeMCOperand::FromBlock(block)).c_str(), block->mBlockIdx);
  3723. }
  3724. /*bool isFirstEntry = block->mSuccLiveness.mBits == NULL;
  3725. if (isFirstEntry)
  3726. {
  3727. mLivenessContext.mStats.mSuccBytes += mLivenessContext.GetBitsBytes() * 2;
  3728. block->mSuccLiveness.mBits = mLivenessContext.Duplicate(succLiveRegs.mBits);
  3729. block->mSuccLiveness.mList = succLiveRegs.mList;
  3730. block->mSuccVRegsInitialized.mBits = mLivenessContext.Duplicate(succInitRegs.mBits);
  3731. block->mSuccVRegsInitialized.mList = succInitRegs.mList;
  3732. }
  3733. else
  3734. {
  3735. if (debugging)
  3736. {
  3737. OutputDebugStrF(" New Succ Regs: ");
  3738. int vregIdx = -1;
  3739. while (true)
  3740. {
  3741. vregIdx = mLivenessContext.GetNextDiffSetIdx(block->mSuccLiveness.mBits, succLiveRegs.mBits, vregIdx);
  3742. if (vregIdx == -1)
  3743. break;
  3744. auto vregInfo = mVRegInfo[vregIdx];
  3745. if (vregInfo->mDbgVariable != NULL)
  3746. OutputDebugStrF("#%s/%d ", vregInfo->mDbgVariable->mName.c_str(), vregIdx);
  3747. else
  3748. OutputDebugStrF("%%vreg%d ", vregIdx);
  3749. }
  3750. OutputDebugStrF("\n");
  3751. }
  3752. if (mDebugging)
  3753. {
  3754. }
  3755. MergeLiveRegs(block->mSuccLiveness, succLiveRegs.mBits);
  3756. mVRegInitializedContext.MergeInplace(block->mSuccVRegsInitialized.mBits, succInitRegs.mBits);
  3757. }*/
  3758. genCtx->mHandledCalls++;
  3759. BeMDNode* curDbgScope = NULL;
  3760. // Don't use 'ref' here, it's important that mSuccLiveRegs actually means 'successor', otherwise
  3761. // we could miss a later-occurring liveness overlap on a different successor
  3762. BeVTrackingList* liveRegs = block->mSuccLiveness;
  3763. BeVTrackingList* vregsInitialized = block->mSuccVRegsInitialized;
  3764. // When we process our first vregsInitialized (at the bottom of the block), there won't be Change entries
  3765. // for us to use to determine the delta from mSuccVRegsInitialized to inst->mVRegsInitialized
  3766. bool needsManualVRegInitDiff = true;
  3767. for (int instIdx = (int)block->mInstructions.size() - 1; instIdx >= 0; instIdx--)
  3768. {
  3769. genLivenessIdx++;
  3770. auto inst = block->mInstructions[instIdx];
  3771. auto prevLiveness = inst->mLiveness;
  3772. genCtx->mInstructions++;
  3773. SizedArray<int, 16> removeVec;
  3774. SizedArray<int, 16> addVec;
  3775. SizedArray<int, 16> filteredRemoveVec;
  3776. SizedArray<int, 16> filteredAddVec;
  3777. inst->mLiveness = liveRegs;
  3778. if ((inst->mVRegsInitialized != NULL) && (inst->mVRegsInitialized != vregsInitialized))
  3779. {
  3780. /*int vregIdxEx = -1;
  3781. while (true)
  3782. {
  3783. vregIdxEx = mVRegInitializedContext.GetNextDiffSetIdx(vregsInitialized.mBits, inst->mVRegsInitialized, vregIdxEx, false, false);
  3784. if (vregIdxEx == -1)
  3785. break;*/
  3786. auto _VRegUninit = [&] (int vregIdxEx)
  3787. {
  3788. int vregIdx = vregIdxEx % mVRegInitializedContext.mNumItems;
  3789. auto vregInfo = mVRegInfo[vregIdx];
  3790. if (!vregInfo->mHasDynLife)
  3791. return;
  3792. bool doClear = false;
  3793. if (vregInfo->mDoConservativeLife)
  3794. {
  3795. // Only do liveness clear when both 'init' and 'non-init' is set
  3796. int otherVRegIdxEx = vregIdx;
  3797. if (vregIdxEx < mVRegInitializedContext.mNumItems)
  3798. otherVRegIdxEx += mVRegInitializedContext.mNumItems;
  3799. if (!mVRegInitializedContext.IsSet(inst->mVRegsInitialized, otherVRegIdxEx))
  3800. doClear = true;
  3801. }
  3802. else
  3803. {
  3804. // Only do liveness clear on 'init' clearing out
  3805. if (vregIdx < mVRegInitializedContext.mNumItems)
  3806. doClear = true;
  3807. }
  3808. if (doClear)
  3809. {
  3810. if (vregIdx >= mVRegInitializedContext.mNumItems)
  3811. DedupPushBack(removeVec, vregIdx);
  3812. else
  3813. removeVec.push_back(vregIdx);
  3814. }
  3815. };
  3816. if (needsManualVRegInitDiff)
  3817. {
  3818. BF_ASSERT(vregsInitialized == block->mSuccVRegsInitialized);
  3819. // Manually compare
  3820. auto vregsInit0 = vregsInitialized;
  3821. auto vregsInit1 = inst->mVRegsInitialized;
  3822. if (vregsInit0 != vregsInit1)
  3823. {
  3824. int idx0 = 0;
  3825. int idx1 = 0;
  3826. while ((idx0 != vregsInit0->mSize) && (idx1 != vregsInit1->mSize))
  3827. {
  3828. int val0 = vregsInit0->mEntries[idx0];
  3829. int val1 = vregsInit1->mEntries[idx1];
  3830. if (val0 == val1)
  3831. {
  3832. idx0++;
  3833. idx1++;
  3834. continue;
  3835. }
  3836. bool done = false;
  3837. while (val0 < val1)
  3838. {
  3839. _VRegUninit(val0);
  3840. idx0++;
  3841. if (idx0 >= vregsInit0->mSize)
  3842. {
  3843. done = true;
  3844. break;
  3845. }
  3846. val0 = vregsInit0->mEntries[idx0];
  3847. }
  3848. if (done)
  3849. break;
  3850. while (val1 < val0)
  3851. {
  3852. idx1++;
  3853. if (idx1 >= vregsInit1->mSize)
  3854. {
  3855. done = true;
  3856. break;
  3857. }
  3858. val1 = vregsInit1->mEntries[idx1];
  3859. }
  3860. if (done)
  3861. break;
  3862. }
  3863. while (idx0 < vregsInit0->mSize)
  3864. {
  3865. _VRegUninit(vregsInit0->mEntries[idx0++]);
  3866. }
  3867. }
  3868. }
  3869. else
  3870. {
  3871. for (int changeIdx = 0; changeIdx < vregsInitialized->mNumChanges; changeIdx++)
  3872. {
  3873. int vregIdxEx = vregsInitialized->GetChange(changeIdx);
  3874. if (vregIdxEx < 0)
  3875. continue;
  3876. // It's possible this vregsInitialized is equivalent to the one in 'inst', but also merged with another 'inst'
  3877. // during legalization. We need to avoid uninitializing vregs if that's the case.
  3878. // the entry above this
  3879. if (inst->mVRegsInitialized->ContainsChange(vregIdxEx))
  3880. continue;
  3881. _VRegUninit(vregIdxEx);
  3882. }
  3883. }
  3884. vregsInitialized = inst->mVRegsInitialized;
  3885. }
  3886. if (inst->mVRegsInitialized != NULL)
  3887. needsManualVRegInitDiff = false;
  3888. if (inst->mKind == BeMCInstKind_DbgDecl)
  3889. {
  3890. if (!mVRegInitializedContext.IsSet(inst->mVRegsInitialized, inst->mArg0.mVRegIdx))
  3891. {
  3892. // There are some rare cases with conditional branches where one branch will have a vreg marked as
  3893. // initialized, which causes the variable to be marked as live, which propagates upward into the block
  3894. // containing a variable declaration, before the actual def point
  3895. DedupPushBack(removeVec, inst->mArg0.mVRegIdx);
  3896. }
  3897. liveRegs = mLivenessContext.Modify(liveRegs, addVec, removeVec, filteredAddVec, filteredRemoveVec);
  3898. continue;
  3899. }
  3900. // This is used for clearing out things like usage of inline return values, which will be accessed after their
  3901. // lifetime end (the lifetime ends inside the inlined method but the value is used afterward, in the inlining
  3902. // function. This will emit as a load of a dbgVar, so we need to drill down into the relTo values
  3903. if (inst->mKind == BeMCInstKind_LifetimeStart)
  3904. {
  3905. BF_ASSERT(inst->mArg0.IsVRegAny());
  3906. int vregIdx = inst->mArg0.mVRegIdx;
  3907. while (true)
  3908. {
  3909. DedupPushBack(removeVec, vregIdx);
  3910. auto vregInfo = mVRegInfo[vregIdx];
  3911. if (!vregInfo->IsDirectRelTo())
  3912. break;
  3913. BF_ASSERT(vregInfo->mRelTo.IsVReg());
  3914. vregIdx = vregInfo->mRelTo.mVRegIdx;
  3915. }
  3916. liveRegs = mLivenessContext.Modify(liveRegs, addVec, removeVec, filteredAddVec, filteredRemoveVec);
  3917. continue;
  3918. }
  3919. if (inst->mKind == BeMCInstKind_LifetimeEnd)
  3920. {
  3921. auto vregInfo = GetVRegInfo(inst->mArg0);
  3922. if (vregInfo->mDbgVariable == NULL)
  3923. {
  3924. // Only extend lifetime down through LifetimeEnd when we have a debug variable we want to keep alive,
  3925. // otherwise constrict lifetime to actual usage
  3926. liveRegs = mLivenessContext.Modify(liveRegs, addVec, removeVec, filteredAddVec, filteredRemoveVec);
  3927. continue;
  3928. }
  3929. }
  3930. if (inst->IsDef())
  3931. {
  3932. DedupPushBack(removeVec, inst->mArg0.mVRegIdx);
  3933. liveRegs = mLivenessContext.Modify(liveRegs, addVec, removeVec, filteredAddVec, filteredRemoveVec);
  3934. continue;
  3935. }
  3936. auto operands = { &inst->mResult, &inst->mArg0, &inst->mArg1 };
  3937. for (auto operand : operands)
  3938. {
  3939. if (operand->IsSymbol())
  3940. {
  3941. auto sym = mCOFFObject->mSymbols[operand->mSymbolIdx];
  3942. if (sym->mIsTLS)
  3943. {
  3944. MarkLive(liveRegs, addVec, vregsInitialized, BeMCOperand::FromVReg(mTLSVRegIdx));
  3945. }
  3946. }
  3947. if (operand->mKind == BeMCOperandKind_VRegPair)
  3948. {
  3949. auto mcOperand = BeMCOperand::FromEncoded(operand->mVRegPair.mVRegIdx0);
  3950. if (mcOperand.IsVRegAny())
  3951. MarkLive(liveRegs, addVec, vregsInitialized, mcOperand);
  3952. mcOperand = BeMCOperand::FromEncoded(operand->mVRegPair.mVRegIdx1);
  3953. if (mcOperand.IsVRegAny())
  3954. MarkLive(liveRegs, addVec, vregsInitialized, mcOperand);
  3955. }
  3956. if (operand->IsVRegAny())
  3957. {
  3958. MarkLive(liveRegs, addVec, vregsInitialized, *operand);
  3959. }
  3960. }
  3961. liveRegs = mLivenessContext.Modify(liveRegs, addVec, removeVec, filteredAddVec, filteredRemoveVec);
  3962. /*if ((!isFirstEntry) && (liveRegs == prevLiveness))
  3963. {
  3964. // We've already been here before and nothing changed
  3965. return;
  3966. }*/
  3967. inst->mLiveness = liveRegs;
  3968. }
  3969. if (block == mBlocks[0])
  3970. {
  3971. BF_ASSERT(block->mBlockIdx == 0);
  3972. if (!mLivenessContext.IsEmpty(liveRegs))
  3973. {
  3974. for (int vregIdx = 0; vregIdx < mLivenessContext.mNumEntries; vregIdx++)
  3975. {
  3976. if (mLivenessContext.IsSet(liveRegs, vregIdx))
  3977. {
  3978. auto vregInfo = mVRegInfo[vregIdx];
  3979. // If we are still alive then the only valid reason is because we have mHasDynLife and our 'init' flag is still set
  3980. if (vregInfo->mHasDynLife)
  3981. {
  3982. if (!mVRegInitializedContext.IsSet(vregsInitialized, vregIdx))
  3983. {
  3984. if (vregInfo->mDoConservativeLife)
  3985. BF_ASSERT(mVRegInitializedContext.IsSet(vregsInitialized, vregIdx, BeTrackKind_Uninitialized));
  3986. else
  3987. Fail("VReg lifetime error");
  3988. }
  3989. }
  3990. else
  3991. {
  3992. Fail("VReg lifetime error");
  3993. }
  3994. }
  3995. }
  3996. }
  3997. }
  3998. for (auto pred : block->mPreds)
  3999. {
  4000. auto& entry = genCtx->mBlocks[pred->mBlockIdx];
  4001. BF_ASSERT(pred == mBlocks[pred->mBlockIdx]);
  4002. auto newSuccLiveness = MergeLiveRegs(pred->mSuccLiveness, liveRegs);
  4003. if (newSuccLiveness == pred->mSuccLiveness)
  4004. continue;
  4005. pred->mSuccLiveness = newSuccLiveness;
  4006. /*if (mVRegInitializedContext.HasExtraBitsSet(pred->mSuccVRegsInitialized.mBits, vregsInitialized.mBits))
  4007. {
  4008. mVRegInitializedContext.MergeInplace(pred->mSuccVRegsInitialized.mBits, vregsInitialized.mBits);
  4009. }*/
  4010. //if (mVRegInitializedContext.HasExtraEntries(pred->mSuccVRegsInitialized.mList, vregsInitialized.mList))
  4011. pred->mSuccVRegsInitialized = mVRegInitializedContext.Merge(pred->mSuccVRegsInitialized, vregsInitialized);
  4012. if (pred->mBlockIdx > block->mBlockIdx)
  4013. modifiedBlockAfter = true;
  4014. else
  4015. modifiedBlockBefore = true;
  4016. entry.mGenerateQueued = true;
  4017. //GenerateLiveness(pred, liveRegs, vregsInitialized, mcColorizer, livenessStats);
  4018. }
  4019. }
  4020. void BeMCContext::GenerateLiveness()
  4021. {
  4022. //GenerateLiveness_OLD(mcColorizer);
  4023. //return;
  4024. mLivenessContext.mStats = BeVTrackingContext::Stats();
  4025. #ifdef _DEBUG
  4026. // So we can Print() while generating liveness (the old values would have been unallocated)
  4027. for (auto mcBlock : mBlocks)
  4028. {
  4029. for (auto mcInst : mcBlock->mInstructions)
  4030. {
  4031. mcInst->mLiveness = NULL;
  4032. }
  4033. }
  4034. #endif
  4035. BP_ZONE("BeMCContext::GenerateLiveness");
  4036. mLivenessContext.Clear();
  4037. mLivenessContext.Init((int)mVRegInfo.size());
  4038. auto emptyList = mLivenessContext.AllocEmptyList();
  4039. BeVTrackingGenContext genCtx;
  4040. genCtx.mEmptyList = emptyList;
  4041. genCtx.mBlocks.Resize(mBlocks.size());
  4042. for (auto mcBlock : mBlocks)
  4043. {
  4044. mcBlock->mSuccLiveness = emptyList;
  4045. mcBlock->mSuccVRegsInitialized = emptyList;
  4046. if (mTLSVRegIdx != -1)
  4047. {
  4048. // Keep TLS alive
  4049. SizedArray<int, 1> vec = { mTLSVRegIdx };
  4050. mcBlock->mSuccLiveness = mLivenessContext.Add(mcBlock->mSuccLiveness, vec, false);
  4051. }
  4052. }
  4053. while (true)
  4054. {
  4055. bool didWork = false;
  4056. // Handle any outstanding pred entries
  4057. for (int blockIdx = (int)mBlocks.size() - 1; blockIdx >= 0; blockIdx--)
  4058. {
  4059. auto& entry = genCtx.mBlocks[blockIdx];
  4060. if (entry.mGenerateQueued)
  4061. {
  4062. entry.mGenerateQueued = false;
  4063. didWork = true;
  4064. auto block = mBlocks[blockIdx];
  4065. bool modifiedBlockBefore;
  4066. bool modifiedBlockAfter;
  4067. GenerateLiveness(block, &genCtx, modifiedBlockBefore, modifiedBlockAfter);
  4068. if (modifiedBlockAfter)
  4069. break;
  4070. }
  4071. }
  4072. // If no pred entries, find blocks that haven't been processed yet
  4073. if (!didWork)
  4074. {
  4075. for (int blockIdx = (int)mBlocks.size() - 1; blockIdx >= 0; blockIdx--)
  4076. {
  4077. auto& entry = genCtx.mBlocks[blockIdx];
  4078. if (entry.mGenerateCount == 0)
  4079. {
  4080. didWork = true;
  4081. auto block = mBlocks[blockIdx];
  4082. bool modifiedBlockBefore;
  4083. bool modifiedBlockAfter;
  4084. GenerateLiveness(block, &genCtx, modifiedBlockBefore, modifiedBlockAfter);
  4085. if (modifiedBlockBefore || modifiedBlockAfter)
  4086. break;
  4087. }
  4088. }
  4089. }
  4090. if (!didWork)
  4091. break;
  4092. }
  4093. int instCount = 0;
  4094. for (auto block : mBlocks)
  4095. instCount += (int)block->mInstructions.size();
  4096. BpEvent("GenerateLiveness Results",
  4097. StrFormat("Blocks: %d\nInstructions: %d\nVRegs: %d\nCalls: %d\nHandled Calls: %d\nProcessed Instructions: %d\nLiveness Bytes: %d\n"
  4098. "Temp Bytes: %d\nBits Bytes: %d\nList Bytes: %d\nSucc Bytes: %d",
  4099. mBlocks.size(), instCount, mVRegInfo.size(), genCtx.mCalls, genCtx.mHandledCalls, genCtx.mInstructions, mLivenessContext.mAlloc.GetAllocSize(),
  4100. genCtx.mAlloc.GetAllocSize(), mLivenessContext.mStats.mBitsBytes, mLivenessContext.mStats.mListBytes, mLivenessContext.mStats.mSuccBytes).c_str());
  4101. }
  4102. void BeMCContext::IntroduceVRegs(const BeMCOperand& newVReg, BeMCBlock* block, int startInstIdx, int lastInstIdx)
  4103. {
  4104. return;
  4105. /*BF_ASSERT((block->mInstructions[startInstIdx]->mKind == BeMCInstKind_Def) && (block->mInstructions[startInstIdx]->mArg0 == newVReg));
  4106. BF_ASSERT(mColorizer.mNodes.size() == newVReg.mVRegIdx);
  4107. mColorizer.mNodes.resize(mColorizer.mNodes.size() + 1);
  4108. BeVTrackingBits* lastLiveness = NULL;
  4109. for (int instIdx = startInstIdx + 1; instIdx <= lastInstIdx; instIdx++)
  4110. {
  4111. auto inst = block->mInstructions[instIdx];
  4112. if (lastLiveness == NULL)
  4113. {
  4114. for (int vregIdx : *inst->mLiveness)
  4115. {
  4116. if (vregIdx >= mLivenessContext.mNumItems)
  4117. continue;
  4118. mColorizer.AddEdge(newVReg.mVRegIdx, vregIdx);
  4119. }
  4120. }
  4121. else
  4122. {
  4123. int vregIdx = -1;
  4124. while (true)
  4125. {
  4126. vregIdx = mLivenessContext.GetNextDiffSetIdx(lastLiveness, inst->mLiveness, vregIdx);
  4127. if (vregIdx == -1)
  4128. break;
  4129. mColorizer.AddEdge(newVReg.mVRegIdx, vregIdx);
  4130. }
  4131. }
  4132. if (inst->mVRegsInitializedEx != NULL)
  4133. {
  4134. auto vregArray = (BeMCVRegArray*)mAlloc.AllocBytes(sizeof(int) * (inst->mVRegsInitializedEx->mSize + 1 + 1), sizeof(int));
  4135. vregArray->mSize = inst->mVRegsInitializedEx->mSize + 1;
  4136. for (int listIdx = 0; listIdx < inst->mVRegsInitializedEx->mSize; listIdx++)
  4137. {
  4138. mColorizer.AddEdge(newVReg.mVRegIdx, inst->mVRegsInitializedEx->mVRegIndices[listIdx]);
  4139. vregArray->mVRegIndices[listIdx] = inst->mVRegsInitializedEx->mVRegIndices[listIdx];
  4140. }
  4141. vregArray->mVRegIndices[vregArray->mSize - 1] = newVReg.mVRegIdx;
  4142. inst->mVRegsInitializedEx = vregArray;
  4143. }
  4144. else
  4145. {
  4146. auto vregArray = (BeMCVRegArray*)mAlloc.AllocBytes(sizeof(int) * 2, sizeof(int));
  4147. vregArray->mSize = 1;
  4148. vregArray->mVRegIndices[0] = newVReg.mVRegIdx;
  4149. inst->mVRegsInitializedEx = vregArray;
  4150. }
  4151. lastLiveness = inst->mLiveness;
  4152. }*/
  4153. }
  4154. bool BeMCContext::IsVolatileReg(X64CPURegister reg)
  4155. {
  4156. switch (ResizeRegister(reg, 8))
  4157. {
  4158. case X64Reg_RAX:
  4159. case X64Reg_RCX:
  4160. case X64Reg_RDX:
  4161. case X64Reg_R8:
  4162. case X64Reg_R9:
  4163. case X64Reg_R10:
  4164. case X64Reg_R11:
  4165. case X64Reg_XMM0_f64:
  4166. case X64Reg_XMM1_f64:
  4167. case X64Reg_XMM2_f64:
  4168. case X64Reg_XMM3_f64:
  4169. case X64Reg_XMM4_f64:
  4170. case X64Reg_XMM5_f64:
  4171. return true;
  4172. default:
  4173. return false;
  4174. }
  4175. }
  4176. bool BeMCContext::IsXMMReg(X64CPURegister reg)
  4177. {
  4178. return (reg >= X64Reg_XMM0_f64) && (reg <= X64Reg_XMM15_f32);
  4179. }
  4180. X64CPURegister BeMCContext::ResizeRegister(X64CPURegister reg, int numBytes)
  4181. {
  4182. if (numBytes == 8)
  4183. {
  4184. switch (reg)
  4185. {
  4186. case X64Reg_DIL:
  4187. case X64Reg_DI:
  4188. case X64Reg_EDI:
  4189. case X64Reg_RDI: return X64Reg_RDI;
  4190. case X64Reg_SIL:
  4191. case X64Reg_SI:
  4192. case X64Reg_ESI:
  4193. case X64Reg_RSI: return X64Reg_RSI;
  4194. case X64Reg_AL:
  4195. case X64Reg_AH:
  4196. case X64Reg_AX:
  4197. case X64Reg_EAX:
  4198. case X64Reg_RAX: return X64Reg_RAX;
  4199. case X64Reg_DL:
  4200. case X64Reg_DH:
  4201. case X64Reg_DX:
  4202. case X64Reg_EDX:
  4203. case X64Reg_RDX: return X64Reg_RDX;
  4204. case X64Reg_CL:
  4205. case X64Reg_CH:
  4206. case X64Reg_CX:
  4207. case X64Reg_ECX:
  4208. case X64Reg_RCX: return X64Reg_RCX;
  4209. case X64Reg_BL:
  4210. case X64Reg_BH:
  4211. case X64Reg_BX:
  4212. case X64Reg_EBX:
  4213. case X64Reg_RBX: return X64Reg_RBX;
  4214. case X64Reg_R8B:
  4215. case X64Reg_R8W:
  4216. case X64Reg_R8D:
  4217. case X64Reg_R8: return X64Reg_R8;
  4218. case X64Reg_R9B:
  4219. case X64Reg_R9W:
  4220. case X64Reg_R9D:
  4221. case X64Reg_R9: return X64Reg_R9;
  4222. case X64Reg_R10B:
  4223. case X64Reg_R10W:
  4224. case X64Reg_R10D:
  4225. case X64Reg_R10: return X64Reg_R10;
  4226. case X64Reg_R11B:
  4227. case X64Reg_R11W:
  4228. case X64Reg_R11D:
  4229. case X64Reg_R11: return X64Reg_R11;
  4230. case X64Reg_R12B:
  4231. case X64Reg_R12W:
  4232. case X64Reg_R12D:
  4233. case X64Reg_R12: return X64Reg_R12;
  4234. case X64Reg_R13B:
  4235. case X64Reg_R13W:
  4236. case X64Reg_R13D:
  4237. case X64Reg_R13: return X64Reg_R13;
  4238. case X64Reg_R14B:
  4239. case X64Reg_R14W:
  4240. case X64Reg_R14D:
  4241. case X64Reg_R14: return X64Reg_R14;
  4242. case X64Reg_R15B:
  4243. case X64Reg_R15W:
  4244. case X64Reg_R15D:
  4245. case X64Reg_R15: return X64Reg_R15;
  4246. case X64Reg_XMM0_f32:
  4247. case X64Reg_XMM0_f64: return X64Reg_XMM0_f64;
  4248. case X64Reg_XMM1_f32:
  4249. case X64Reg_XMM1_f64: return X64Reg_XMM1_f64;
  4250. case X64Reg_XMM2_f32:
  4251. case X64Reg_XMM2_f64: return X64Reg_XMM2_f64;
  4252. case X64Reg_XMM3_f32:
  4253. case X64Reg_XMM3_f64: return X64Reg_XMM3_f64;
  4254. case X64Reg_XMM4_f32:
  4255. case X64Reg_XMM4_f64: return X64Reg_XMM4_f64;
  4256. case X64Reg_XMM5_f32:
  4257. case X64Reg_XMM5_f64: return X64Reg_XMM5_f64;
  4258. case X64Reg_XMM6_f32:
  4259. case X64Reg_XMM6_f64: return X64Reg_XMM6_f64;
  4260. case X64Reg_XMM7_f32:
  4261. case X64Reg_XMM7_f64: return X64Reg_XMM7_f64;
  4262. case X64Reg_XMM8_f32:
  4263. case X64Reg_XMM8_f64: return X64Reg_XMM8_f64;
  4264. case X64Reg_XMM9_f32:
  4265. case X64Reg_XMM9_f64: return X64Reg_XMM9_f64;
  4266. case X64Reg_XMM10_f32:
  4267. case X64Reg_XMM10_f64: return X64Reg_XMM10_f64;
  4268. case X64Reg_XMM11_f32:
  4269. case X64Reg_XMM11_f64: return X64Reg_XMM11_f64;
  4270. case X64Reg_XMM12_f32:
  4271. case X64Reg_XMM12_f64: return X64Reg_XMM12_f64;
  4272. case X64Reg_XMM13_f32:
  4273. case X64Reg_XMM13_f64: return X64Reg_XMM13_f64;
  4274. case X64Reg_XMM14_f32:
  4275. case X64Reg_XMM14_f64: return X64Reg_XMM14_f64;
  4276. case X64Reg_XMM15_f32:
  4277. case X64Reg_XMM15_f64: return X64Reg_XMM15_f64;
  4278. }
  4279. return reg;
  4280. }
  4281. if (numBytes == 4)
  4282. {
  4283. switch (reg)
  4284. {
  4285. case X64Reg_DIL:
  4286. case X64Reg_DI:
  4287. case X64Reg_EDI:
  4288. case X64Reg_RDI: return X64Reg_EDI;
  4289. case X64Reg_SIL:
  4290. case X64Reg_SI:
  4291. case X64Reg_ESI:
  4292. case X64Reg_RSI: return X64Reg_ESI;
  4293. case X64Reg_AL:
  4294. case X64Reg_AH:
  4295. case X64Reg_AX:
  4296. case X64Reg_EAX:
  4297. case X64Reg_RAX: return X64Reg_EAX;
  4298. case X64Reg_DL:
  4299. case X64Reg_DH:
  4300. case X64Reg_DX:
  4301. case X64Reg_EDX:
  4302. case X64Reg_RDX: return X64Reg_EDX;
  4303. case X64Reg_CL:
  4304. case X64Reg_CH:
  4305. case X64Reg_CX:
  4306. case X64Reg_ECX:
  4307. case X64Reg_RCX: return X64Reg_ECX;
  4308. case X64Reg_BL:
  4309. case X64Reg_BH:
  4310. case X64Reg_BX:
  4311. case X64Reg_EBX:
  4312. case X64Reg_RBX: return X64Reg_EBX;
  4313. case X64Reg_R8B:
  4314. case X64Reg_R8W:
  4315. case X64Reg_R8D:
  4316. case X64Reg_R8: return X64Reg_R8D;
  4317. case X64Reg_R9B:
  4318. case X64Reg_R9W:
  4319. case X64Reg_R9D:
  4320. case X64Reg_R9: return X64Reg_R9D;
  4321. case X64Reg_R10B:
  4322. case X64Reg_R10W:
  4323. case X64Reg_R10D:
  4324. case X64Reg_R10: return X64Reg_R10D;
  4325. case X64Reg_R11B:
  4326. case X64Reg_R11W:
  4327. case X64Reg_R11D:
  4328. case X64Reg_R11: return X64Reg_R11D;
  4329. case X64Reg_R12B:
  4330. case X64Reg_R12W:
  4331. case X64Reg_R12D:
  4332. case X64Reg_R12: return X64Reg_R12D;
  4333. case X64Reg_R13B:
  4334. case X64Reg_R13W:
  4335. case X64Reg_R13D:
  4336. case X64Reg_R13: return X64Reg_R13D;
  4337. case X64Reg_R14B:
  4338. case X64Reg_R14W:
  4339. case X64Reg_R14D:
  4340. case X64Reg_R14: return X64Reg_R14D;
  4341. case X64Reg_R15B:
  4342. case X64Reg_R15W:
  4343. case X64Reg_R15D:
  4344. case X64Reg_R15: return X64Reg_R15D;
  4345. case X64Reg_XMM0_f32:
  4346. case X64Reg_XMM0_f64: return X64Reg_XMM0_f32;
  4347. case X64Reg_XMM1_f32:
  4348. case X64Reg_XMM1_f64: return X64Reg_XMM1_f32;
  4349. case X64Reg_XMM2_f32:
  4350. case X64Reg_XMM2_f64: return X64Reg_XMM2_f32;
  4351. case X64Reg_XMM3_f32:
  4352. case X64Reg_XMM3_f64: return X64Reg_XMM3_f32;
  4353. case X64Reg_XMM4_f32:
  4354. case X64Reg_XMM4_f64: return X64Reg_XMM4_f32;
  4355. case X64Reg_XMM5_f32:
  4356. case X64Reg_XMM5_f64: return X64Reg_XMM5_f32;
  4357. case X64Reg_XMM6_f32:
  4358. case X64Reg_XMM6_f64: return X64Reg_XMM6_f32;
  4359. case X64Reg_XMM7_f32:
  4360. case X64Reg_XMM7_f64: return X64Reg_XMM7_f32;
  4361. case X64Reg_XMM8_f32:
  4362. case X64Reg_XMM8_f64: return X64Reg_XMM8_f32;
  4363. case X64Reg_XMM9_f32:
  4364. case X64Reg_XMM9_f64: return X64Reg_XMM9_f32;
  4365. case X64Reg_XMM10_f32:
  4366. case X64Reg_XMM10_f64: return X64Reg_XMM10_f32;
  4367. case X64Reg_XMM11_f32:
  4368. case X64Reg_XMM11_f64: return X64Reg_XMM11_f32;
  4369. case X64Reg_XMM12_f32:
  4370. case X64Reg_XMM12_f64: return X64Reg_XMM12_f32;
  4371. case X64Reg_XMM13_f32:
  4372. case X64Reg_XMM13_f64: return X64Reg_XMM13_f32;
  4373. case X64Reg_XMM14_f32:
  4374. case X64Reg_XMM14_f64: return X64Reg_XMM14_f32;
  4375. case X64Reg_XMM15_f32:
  4376. case X64Reg_XMM15_f64: return X64Reg_XMM15_f32;
  4377. }
  4378. }
  4379. if (numBytes == 2)
  4380. {
  4381. switch (reg)
  4382. {
  4383. case X64Reg_DIL:
  4384. case X64Reg_DI:
  4385. case X64Reg_EDI:
  4386. case X64Reg_RDI: return X64Reg_DI;
  4387. case X64Reg_SIL:
  4388. case X64Reg_SI:
  4389. case X64Reg_ESI:
  4390. case X64Reg_RSI: return X64Reg_SI;
  4391. case X64Reg_AL:
  4392. case X64Reg_AH:
  4393. case X64Reg_AX:
  4394. case X64Reg_EAX:
  4395. case X64Reg_RAX: return X64Reg_AX;
  4396. case X64Reg_DL:
  4397. case X64Reg_DH:
  4398. case X64Reg_DX:
  4399. case X64Reg_EDX:
  4400. case X64Reg_RDX: return X64Reg_DX;
  4401. case X64Reg_CL:
  4402. case X64Reg_CH:
  4403. case X64Reg_CX:
  4404. case X64Reg_ECX:
  4405. case X64Reg_RCX: return X64Reg_CX;
  4406. case X64Reg_BL:
  4407. case X64Reg_BH:
  4408. case X64Reg_BX:
  4409. case X64Reg_EBX:
  4410. case X64Reg_RBX: return X64Reg_BX;
  4411. case X64Reg_R8B:
  4412. case X64Reg_R8W:
  4413. case X64Reg_R8D:
  4414. case X64Reg_R8: return X64Reg_R8W;
  4415. case X64Reg_R9B:
  4416. case X64Reg_R9W:
  4417. case X64Reg_R9D:
  4418. case X64Reg_R9: return X64Reg_R9W;
  4419. case X64Reg_R10B:
  4420. case X64Reg_R10W:
  4421. case X64Reg_R10D:
  4422. case X64Reg_R10: return X64Reg_R10W;
  4423. case X64Reg_R11B:
  4424. case X64Reg_R11W:
  4425. case X64Reg_R11D:
  4426. case X64Reg_R11: return X64Reg_R11W;
  4427. case X64Reg_R12B:
  4428. case X64Reg_R12W:
  4429. case X64Reg_R12D:
  4430. case X64Reg_R12: return X64Reg_R12W;
  4431. case X64Reg_R13B:
  4432. case X64Reg_R13W:
  4433. case X64Reg_R13D:
  4434. case X64Reg_R13: return X64Reg_R13W;
  4435. case X64Reg_R14B:
  4436. case X64Reg_R14W:
  4437. case X64Reg_R14D:
  4438. case X64Reg_R14: return X64Reg_R14W;
  4439. case X64Reg_R15B:
  4440. case X64Reg_R15W:
  4441. case X64Reg_R15D:
  4442. case X64Reg_R15: return X64Reg_R15W;
  4443. }
  4444. }
  4445. if (numBytes == 1)
  4446. {
  4447. switch (reg)
  4448. {
  4449. case X64Reg_DIL:
  4450. case X64Reg_DI:
  4451. case X64Reg_EDI:
  4452. case X64Reg_RDI: return X64Reg_DIL;
  4453. case X64Reg_SIL:
  4454. case X64Reg_SI:
  4455. case X64Reg_ESI:
  4456. case X64Reg_RSI: return X64Reg_SIL;
  4457. case X64Reg_AH: return X64Reg_AH;
  4458. case X64Reg_AL:
  4459. case X64Reg_AX:
  4460. case X64Reg_EAX:
  4461. case X64Reg_RAX: return X64Reg_AL;
  4462. case X64Reg_DH: return X64Reg_DH;
  4463. case X64Reg_DL:
  4464. case X64Reg_DX:
  4465. case X64Reg_EDX:
  4466. case X64Reg_RDX: return X64Reg_DL;
  4467. case X64Reg_CH: return X64Reg_CH;
  4468. case X64Reg_CL:
  4469. case X64Reg_CX:
  4470. case X64Reg_ECX:
  4471. case X64Reg_RCX: return X64Reg_CL;
  4472. case X64Reg_BH: return X64Reg_BH;
  4473. case X64Reg_BL:
  4474. case X64Reg_BX:
  4475. case X64Reg_EBX:
  4476. case X64Reg_RBX: return X64Reg_BL;
  4477. case X64Reg_R8B:
  4478. case X64Reg_R8W:
  4479. case X64Reg_R8D:
  4480. case X64Reg_R8: return X64Reg_R8B;
  4481. case X64Reg_R9B:
  4482. case X64Reg_R9W:
  4483. case X64Reg_R9D:
  4484. case X64Reg_R9: return X64Reg_R9B;
  4485. case X64Reg_R10B:
  4486. case X64Reg_R10W:
  4487. case X64Reg_R10D:
  4488. case X64Reg_R10: return X64Reg_R10B;
  4489. case X64Reg_R11B:
  4490. case X64Reg_R11W:
  4491. case X64Reg_R11D:
  4492. case X64Reg_R11: return X64Reg_R11B;
  4493. case X64Reg_R12B:
  4494. case X64Reg_R12W:
  4495. case X64Reg_R12D:
  4496. case X64Reg_R12: return X64Reg_R12B;
  4497. case X64Reg_R13B:
  4498. case X64Reg_R13W:
  4499. case X64Reg_R13D:
  4500. case X64Reg_R13: return X64Reg_R13B;
  4501. case X64Reg_R14B:
  4502. case X64Reg_R14W:
  4503. case X64Reg_R14D:
  4504. case X64Reg_R14: return X64Reg_R14B;
  4505. case X64Reg_R15B:
  4506. case X64Reg_R15W:
  4507. case X64Reg_R15D:
  4508. case X64Reg_R15: return X64Reg_R15B;
  4509. }
  4510. }
  4511. return X64Reg_None;
  4512. }
  4513. bool BeMCContext::IsAddress(BeMCOperand& operand)
  4514. {
  4515. if (operand.mKind == BeMCOperandKind_VRegAddr)
  4516. return true;
  4517. if (operand.mKind != BeMCOperandKind_VReg)
  4518. return false;
  4519. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  4520. return IsAddress(vregInfo->mRelTo);
  4521. }
  4522. bool BeMCContext::IsAddressable(BeMCOperand& operand)
  4523. {
  4524. if (operand.mKind == BeMCOperandKind_Symbol)
  4525. return true;
  4526. if (operand.mKind == BeMCOperandKind_NativeReg)
  4527. return true;
  4528. if (operand.mKind == BeMCOperandKind_VRegAddr)
  4529. return true;
  4530. if (operand.mKind != BeMCOperandKind_VReg)
  4531. return false;
  4532. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  4533. return IsAddressable(vregInfo->mRelTo);
  4534. }
  4535. bool BeMCContext::IsVRegExpr(BeMCOperand& operand)
  4536. {
  4537. if (!operand.IsVRegAny())
  4538. return false;
  4539. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  4540. return vregInfo->mIsExpr;
  4541. }
  4542. void BeMCContext::FixOperand(BeMCOperand& operand)
  4543. {
  4544. // We don't want to check for VRegLoad, that would erase the dereference
  4545. if ((operand.mKind != BeMCOperandKind_VReg) && (operand.mKind != BeMCOperandKind_VRegAddr))
  4546. return;
  4547. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  4548. if (vregInfo->mReg != X64Reg_None)
  4549. {
  4550. operand.mKind = BeMCOperandKind_NativeReg;
  4551. operand.mReg = vregInfo->mReg;
  4552. return;
  4553. }
  4554. if ((vregInfo->mIsRetVal) && (mCompositeRetVRegIdx != -1) && (mCompositeRetVRegIdx != operand.mVRegIdx))
  4555. {
  4556. BF_ASSERT(mCompositeRetVRegIdx != -1);
  4557. BeMCOperand origOperand = operand;
  4558. operand = BeMCOperand::FromVReg(mCompositeRetVRegIdx);
  4559. if ((origOperand.mKind == BeMCOperandKind_VReg) && (vregInfo->mType->IsComposite()))
  4560. operand.mKind = BeMCOperandKind_VRegLoad;
  4561. FixOperand(operand);
  4562. //auto retVRegInfo = mVRegInfo[mCompositeRetVRegIdx];
  4563. //operand = BeMCOperand::FromReg(retVRegInfo->mReg);
  4564. }
  4565. if (vregInfo->IsDirectRelToAny())
  4566. {
  4567. auto checkOperand = vregInfo->mRelTo;
  4568. if (checkOperand.IsVReg())
  4569. FixOperand(checkOperand);
  4570. if (checkOperand.IsNativeReg())
  4571. {
  4572. auto resizedReg = ResizeRegister(checkOperand.mReg, vregInfo->mType->mSize);
  4573. if (resizedReg != X64Reg_None)
  4574. operand = BeMCOperand::FromReg(resizedReg);
  4575. }
  4576. else if (checkOperand.mKind == BeMCOperandKind_Symbol)
  4577. {
  4578. auto symbol = mCOFFObject->mSymbols[checkOperand.mSymbolIdx];
  4579. if (AreTypesEquivalent(vregInfo->mType, symbol->mType))
  4580. {
  4581. if (checkOperand.mKind == BeMCOperandKind_VRegAddr)
  4582. {
  4583. operand = BeMCOperand::ToAddr(checkOperand);
  4584. }
  4585. else
  4586. operand = checkOperand;
  4587. }
  4588. }
  4589. else if (checkOperand.mKind == BeMCOperandKind_SymbolAddr)
  4590. {
  4591. operand = checkOperand;
  4592. }
  4593. }
  4594. }
  4595. BeMCOperand BeMCContext::GetFixedOperand(const BeMCOperand& operand)
  4596. {
  4597. BeMCOperand copyOp = operand;
  4598. FixOperand(copyOp);
  4599. return copyOp;
  4600. }
  4601. uint8 BeMCContext::GetREX(const BeMCOperand& r, const BeMCOperand& rm, bool is64Bit)
  4602. {
  4603. //bool is64Bit = false;
  4604. bool is64BitExR = false;
  4605. bool is64BitExRM = false;
  4606. bool forceRex = false;
  4607. if (r.mKind == BeMCOperandKind_NativeReg)
  4608. {
  4609. /*if ((r.mReg >= X64Reg_RAX) && (r.mReg <= X64Reg_EFL))
  4610. BF_ASSERT(is64Bit); */
  4611. switch (r.mReg)
  4612. {
  4613. case X64Reg_SIL:
  4614. case X64Reg_DIL:
  4615. forceRex = true;
  4616. break;
  4617. case X64Reg_R8: case X64Reg_R9: case X64Reg_R10: case X64Reg_R11: case X64Reg_R12: case X64Reg_R13: case X64Reg_R14: case X64Reg_R15:
  4618. case X64Reg_R8D: case X64Reg_R9D: case X64Reg_R10D: case X64Reg_R11D: case X64Reg_R12D: case X64Reg_R13D: case X64Reg_R14D: case X64Reg_R15D:
  4619. case X64Reg_R8W: case X64Reg_R9W: case X64Reg_R10W: case X64Reg_R11W: case X64Reg_R12W: case X64Reg_R13W: case X64Reg_R14W: case X64Reg_R15W:
  4620. case X64Reg_R8B: case X64Reg_R9B: case X64Reg_R10B: case X64Reg_R11B: case X64Reg_R12B: case X64Reg_R13B: case X64Reg_R14B: case X64Reg_R15B:
  4621. case X64Reg_XMM8_f64: case X64Reg_XMM9_f64: case X64Reg_XMM10_f64: case X64Reg_XMM11_f64:
  4622. case X64Reg_XMM12_f64: case X64Reg_XMM13_f64: case X64Reg_XMM14_f64: case X64Reg_XMM15_f64:
  4623. case X64Reg_XMM8_f32: case X64Reg_XMM9_f32: case X64Reg_XMM10_f32: case X64Reg_XMM11_f32:
  4624. case X64Reg_XMM12_f32: case X64Reg_XMM13_f32: case X64Reg_XMM14_f32: case X64Reg_XMM15_f32:
  4625. is64BitExR = true;
  4626. }
  4627. }
  4628. bool hasSibExRM = false;
  4629. if (rm.mKind == BeMCOperandKind_NativeReg)
  4630. {
  4631. switch (rm.mReg)
  4632. {
  4633. case X64Reg_SIL:
  4634. case X64Reg_DIL:
  4635. forceRex = true;
  4636. break;
  4637. case X64Reg_R8: case X64Reg_R9: case X64Reg_R10: case X64Reg_R11: case X64Reg_R12: case X64Reg_R13: case X64Reg_R14: case X64Reg_R15:
  4638. case X64Reg_R8D: case X64Reg_R9D: case X64Reg_R10D: case X64Reg_R11D: case X64Reg_R12D: case X64Reg_R13D: case X64Reg_R14D: case X64Reg_R15D:
  4639. case X64Reg_R8W: case X64Reg_R9W: case X64Reg_R10W: case X64Reg_R11W: case X64Reg_R12W: case X64Reg_R13W: case X64Reg_R14W: case X64Reg_R15W:
  4640. case X64Reg_R8B: case X64Reg_R9B: case X64Reg_R10B: case X64Reg_R11B: case X64Reg_R12B: case X64Reg_R13B: case X64Reg_R14B: case X64Reg_R15B:
  4641. case X64Reg_XMM8_f64: case X64Reg_XMM9_f64: case X64Reg_XMM10_f64: case X64Reg_XMM11_f64:
  4642. case X64Reg_XMM12_f64: case X64Reg_XMM13_f64: case X64Reg_XMM14_f64: case X64Reg_XMM15_f64:
  4643. case X64Reg_XMM8_f32: case X64Reg_XMM9_f32: case X64Reg_XMM10_f32: case X64Reg_XMM11_f32:
  4644. case X64Reg_XMM12_f32: case X64Reg_XMM13_f32: case X64Reg_XMM14_f32: case X64Reg_XMM15_f32:
  4645. is64BitExRM = true;
  4646. }
  4647. }
  4648. else if (rm.IsVRegAny())
  4649. {
  4650. auto vregInfo = mVRegInfo[rm.mVRegIdx];
  4651. if (vregInfo->IsDirectRelTo())
  4652. return GetREX(r, vregInfo->mRelTo, is64Bit);
  4653. X64CPURegister regA = X64Reg_None;
  4654. X64CPURegister regB = X64Reg_None;
  4655. int bScale = 1;
  4656. int disp = 0;
  4657. GetRMParams(rm, regA, regB, bScale, disp);
  4658. is64BitExRM |= ((regA >= X64Reg_R8) && (regA <= X64Reg_R15)) || ((regA >= X64Reg_R8D) && (regA <= X64Reg_R15D));
  4659. hasSibExRM |= ((regB >= X64Reg_R8) && (regB <= X64Reg_R15)) || ((regB >= X64Reg_R8D) && (regB <= X64Reg_R15D));
  4660. }
  4661. else if (rm.IsSymbol())
  4662. {
  4663. auto sym = mCOFFObject->mSymbols[rm.mSymbolIdx];
  4664. if (sym->mIsTLS)
  4665. {
  4666. auto tlsReg = mVRegInfo[mTLSVRegIdx]->mReg;
  4667. is64BitExRM |= (tlsReg >= X64Reg_R8) && (tlsReg <= X64Reg_R15);
  4668. }
  4669. }
  4670. uint8 flags = 0;
  4671. if (is64Bit)
  4672. flags |= 8;
  4673. if (is64BitExR)
  4674. flags |= 4;
  4675. if (hasSibExRM)
  4676. flags |= 2;
  4677. if (is64BitExRM)
  4678. flags |= 1;
  4679. if ((flags != 0) || (forceRex))
  4680. return (uint8)(0x40 | flags);
  4681. return 0;
  4682. }
  4683. void BeMCContext::EmitREX(const BeMCOperand& r, const BeMCOperand& rm, bool is64Bit)
  4684. {
  4685. uint8 rex = GetREX(r, rm, is64Bit);
  4686. if (rex != 0)
  4687. mOut.Write(rex);
  4688. }
  4689. uint8 BeMCContext::EncodeRegNum(X64CPURegister regNum)
  4690. {
  4691. switch (regNum)
  4692. {
  4693. case X64Reg_AL:
  4694. case X64Reg_AX:
  4695. case X64Reg_EAX:
  4696. case X64Reg_RAX:
  4697. case X64Reg_R8:
  4698. case X64Reg_R8D:
  4699. case X64Reg_R8W:
  4700. case X64Reg_R8B:
  4701. case X64Reg_MM0:
  4702. case X64Reg_XMM0_f32:
  4703. case X64Reg_XMM0_f64:
  4704. case X64Reg_XMM8_f32:
  4705. case X64Reg_XMM8_f64:
  4706. return 0;
  4707. case X64Reg_CL:
  4708. case X64Reg_CX:
  4709. case X64Reg_ECX:
  4710. case X64Reg_RCX:
  4711. case X64Reg_R9:
  4712. case X64Reg_R9D:
  4713. case X64Reg_R9W:
  4714. case X64Reg_R9B:
  4715. case X64Reg_MM1:
  4716. case X64Reg_XMM1_f32:
  4717. case X64Reg_XMM1_f64:
  4718. case X64Reg_XMM9_f32:
  4719. case X64Reg_XMM9_f64:
  4720. return 1;
  4721. case X64Reg_DL:
  4722. case X64Reg_DX:
  4723. case X64Reg_EDX:
  4724. case X64Reg_RDX:
  4725. case X64Reg_R10:
  4726. case X64Reg_R10D:
  4727. case X64Reg_R10W:
  4728. case X64Reg_R10B:
  4729. case X64Reg_MM2:
  4730. case X64Reg_XMM2_f32:
  4731. case X64Reg_XMM2_f64:
  4732. case X64Reg_XMM10_f32:
  4733. case X64Reg_XMM10_f64:
  4734. return 2;
  4735. case X64Reg_BL:
  4736. case X64Reg_BX:
  4737. case X64Reg_EBX:
  4738. case X64Reg_RBX:
  4739. case X64Reg_R11:
  4740. case X64Reg_R11D:
  4741. case X64Reg_R11W:
  4742. case X64Reg_R11B:
  4743. case X64Reg_MM3:
  4744. case X64Reg_XMM3_f32:
  4745. case X64Reg_XMM3_f64:
  4746. case X64Reg_XMM11_f32:
  4747. case X64Reg_XMM11_f64:
  4748. return 3;
  4749. case X64Reg_None: // Useful for SIB/RM addr encodings
  4750. case X64Reg_AH:
  4751. //case X64Reg_SP:
  4752. //case X64Reg_ESP:
  4753. case X64Reg_RSP:
  4754. case X64Reg_R12:
  4755. case X64Reg_R12D:
  4756. case X64Reg_R12W:
  4757. case X64Reg_R12B:
  4758. case X64Reg_MM4:
  4759. case X64Reg_XMM4_f32:
  4760. case X64Reg_XMM4_f64:
  4761. case X64Reg_XMM12_f32:
  4762. case X64Reg_XMM12_f64:
  4763. return 4;
  4764. case X64Reg_CH:
  4765. //case X64Reg_BP:
  4766. //case X64Reg_EBP:
  4767. case X64Reg_RBP:
  4768. case X64Reg_R13:
  4769. case X64Reg_R13D:
  4770. case X64Reg_R13W:
  4771. case X64Reg_R13B:
  4772. case X64Reg_MM5:
  4773. case X64Reg_XMM5_f32:
  4774. case X64Reg_XMM5_f64:
  4775. case X64Reg_XMM13_f32:
  4776. case X64Reg_XMM13_f64:
  4777. return 5;
  4778. case X64Reg_DH:
  4779. case X64Reg_SIL:
  4780. case X64Reg_SI:
  4781. case X64Reg_ESI:
  4782. case X64Reg_RSI:
  4783. case X64Reg_R14:
  4784. case X64Reg_R14D:
  4785. case X64Reg_R14W:
  4786. case X64Reg_R14B:
  4787. case X64Reg_MM6:
  4788. case X64Reg_XMM6_f32:
  4789. case X64Reg_XMM6_f64:
  4790. case X64Reg_XMM14_f32:
  4791. case X64Reg_XMM14_f64:
  4792. return 6;
  4793. case X64Reg_BH:
  4794. case X64Reg_DIL:
  4795. case X64Reg_DI:
  4796. case X64Reg_EDI:
  4797. case X64Reg_RDI:
  4798. case X64Reg_R15:
  4799. case X64Reg_R15D:
  4800. case X64Reg_R15W:
  4801. case X64Reg_R15B:
  4802. case X64Reg_MM7:
  4803. case X64Reg_XMM7_f32:
  4804. case X64Reg_XMM7_f64:
  4805. case X64Reg_XMM15_f32:
  4806. case X64Reg_XMM15_f64:
  4807. return 7;
  4808. }
  4809. Fail("Invalid reg");
  4810. return -1;
  4811. }
  4812. int BeMCContext::GetRegSize(int regNum)
  4813. {
  4814. if ((regNum >= X64Reg_EAX) && (regNum <= X64Reg_EDI))
  4815. return 4;
  4816. if ((regNum >= X64Reg_AX) && (regNum <= X64Reg_BX))
  4817. return 2;
  4818. if ((regNum >= X64Reg_AL) && (regNum <= X64Reg_BH))
  4819. return 1;
  4820. return 8;
  4821. }
  4822. BeMCRMMode BeMCContext::ValidateRMResult(const BeMCOperand& operand, X64CPURegister& regA, X64CPURegister& regB, int& bScale, int& disp, int* errorVReg, BeMCRMMode result, bool doValidate)
  4823. {
  4824. if (!doValidate)
  4825. return result;
  4826. //TODO: WTF- this previous version just seems to be wrong! Why did think this was true? the REX.X and REX.B flags fix these
  4827. // in a SIB, the base can't be R13 (which is RBP+REX), and the scaled index can't be R12 (which is RSP+REX)
  4828. //if ((regB != X64Reg_None) &&
  4829. // ((regA == X64Reg_R13) || (regB == X64Reg_R12)))
  4830. //{
  4831. // // We can't just swap the regs if we have a scale applied
  4832. // if (bScale != 1)
  4833. // {
  4834. // if (errorVReg != NULL)
  4835. // *errorVReg = -2; // Scale error
  4836. // return BeMCRMMode_Invalid;
  4837. // }
  4838. // BF_SWAP(regA, regB);
  4839. //}
  4840. // In a SIB, the base can't be RBP, and the scaled index can't be RSP
  4841. if ((regB != X64Reg_None) &&
  4842. ((regA == X64Reg_RBP) || (regB == X64Reg_RSP)))
  4843. {
  4844. // We can't just swap the regs if we have a scale applied
  4845. if (bScale != 1)
  4846. {
  4847. if (errorVReg != NULL)
  4848. *errorVReg = -2; // Scale error
  4849. return BeMCRMMode_Invalid;
  4850. }
  4851. BF_SWAP(regA, regB);
  4852. }
  4853. return result;
  4854. }
  4855. BeMCRMMode BeMCContext::GetRMParams(const BeMCOperand& operand, X64CPURegister& regA, X64CPURegister& regB, int& bScale, int& disp, int* errorVReg, bool doValidate)
  4856. {
  4857. BeMCRMMode rmMode = BeMCRMMode_Invalid;
  4858. if (operand.mKind == BeMCOperandKind_NativeReg)
  4859. {
  4860. if (regA == X64Reg_None)
  4861. regA = operand.mReg;
  4862. else if (regB == X64Reg_None)
  4863. regB = operand.mReg;
  4864. else
  4865. return BeMCRMMode_Invalid;
  4866. return ValidateRMResult(operand, regA, regB, bScale, disp, errorVReg, BeMCRMMode_Direct, doValidate);
  4867. }
  4868. else if (operand.IsImmediateInt())
  4869. {
  4870. disp += (int)operand.mImmediate;
  4871. return ValidateRMResult(operand, regA, regB, bScale, disp, errorVReg, BeMCRMMode_Direct, doValidate);
  4872. }
  4873. if (operand.mKind == BeMCOperandKind_VReg)
  4874. {
  4875. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  4876. if (!vregInfo->mIsExpr)
  4877. {
  4878. auto reg = vregInfo->mReg;
  4879. if (reg != X64Reg_None)
  4880. {
  4881. if (regA == X64Reg_None)
  4882. regA = reg;
  4883. else if (regB == X64Reg_None)
  4884. regB = reg;
  4885. else
  4886. return BeMCRMMode_Invalid;
  4887. return ValidateRMResult(operand, regA, regB, bScale, disp, errorVReg, BeMCRMMode_Direct, doValidate);
  4888. }
  4889. auto result = GetRMParams(BeMCOperand::ToAddr(operand), regA, regB, bScale, disp, errorVReg, doValidate);
  4890. if (result == BeMCRMMode_Invalid)
  4891. return BeMCRMMode_Invalid;
  4892. BF_ASSERT(result == BeMCRMMode_Direct);
  4893. return ValidateRMResult(BeMCOperand::ToAddr(operand), regA, regB, bScale, disp, errorVReg, BeMCRMMode_Deref, doValidate);
  4894. }
  4895. // Fall through
  4896. }
  4897. else if (operand.mKind == BeMCOperandKind_VRegAddr)
  4898. {
  4899. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  4900. if (vregInfo->mIsExpr)
  4901. {
  4902. if (vregInfo->IsDirectRelToAny())
  4903. {
  4904. if (vregInfo->mRelTo.mKind == BeMCOperandKind_VReg)
  4905. return GetRMParams(BeMCOperand::FromVRegAddr(vregInfo->mRelTo.mVRegIdx), regA, regB, bScale, disp, errorVReg, doValidate);
  4906. else if (vregInfo->mRelTo.mKind == BeMCOperandKind_VRegLoad)
  4907. return GetRMParams(BeMCOperand::FromVReg(vregInfo->mRelTo.mVRegIdx), regA, regB, bScale, disp, errorVReg, doValidate);
  4908. }
  4909. *errorVReg = operand.mVRegIdx;
  4910. return BeMCRMMode_Invalid;
  4911. }
  4912. BF_ASSERT(!vregInfo->mIsExpr);
  4913. BF_ASSERT(vregInfo->mReg == X64Reg_None);
  4914. X64CPURegister reg = X64Reg_None;
  4915. if ((vregInfo->mIsRetVal) && (mCompositeRetVRegIdx != -1) && (mCompositeRetVRegIdx != operand.mVRegIdx))
  4916. {
  4917. return GetRMParams(BeMCOperand::FromVReg(mCompositeRetVRegIdx), regA, regB, bScale, disp, errorVReg, doValidate);
  4918. }
  4919. reg = mUseBP ? X64Reg_RBP : X64Reg_RSP;
  4920. disp = mStackSize + vregInfo->mFrameOffset;
  4921. if (regA == X64Reg_None)
  4922. regA = reg;
  4923. else if (regB == X64Reg_None)
  4924. regB = reg;
  4925. return ValidateRMResult(operand, regA, regB, bScale, disp, errorVReg, BeMCRMMode_Direct, doValidate);
  4926. }
  4927. else if (operand.mKind == BeMCOperandKind_VRegLoad)
  4928. {
  4929. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  4930. if (!vregInfo->mIsExpr)
  4931. {
  4932. auto reg = vregInfo->mReg;
  4933. if (reg == X64Reg_None)
  4934. {
  4935. if (errorVReg != NULL)
  4936. *errorVReg = operand.mVRegIdx;
  4937. return BeMCRMMode_Invalid;
  4938. }
  4939. if (regA == X64Reg_None)
  4940. regA = reg;
  4941. else if (regB == X64Reg_None)
  4942. regB = reg;
  4943. return ValidateRMResult(operand, regA, regB, bScale, disp, errorVReg, BeMCRMMode_Deref, doValidate);
  4944. }
  4945. }
  4946. else
  4947. {
  4948. return BeMCRMMode_Invalid;
  4949. }
  4950. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  4951. BF_ASSERT(vregInfo->mIsExpr);
  4952. if (vregInfo->mRelTo)
  4953. {
  4954. auto oldRegA = regA;
  4955. auto result = GetRMParams(vregInfo->mRelTo, regA, regB, bScale, disp, errorVReg, false);
  4956. if (result == BeMCRMMode_Invalid)
  4957. {
  4958. if ((errorVReg != NULL) && (*errorVReg == -1))
  4959. {
  4960. *errorVReg = operand.mVRegIdx;
  4961. }
  4962. return BeMCRMMode_Invalid;
  4963. }
  4964. if (result == BeMCRMMode_Deref)
  4965. {
  4966. // A deref can only stand alone, and no double-derefs
  4967. if ((vregInfo->mRelOffset) || (vregInfo->mRelOffsetScale != 1) || (operand.mKind == BeMCOperandKind_VRegLoad))
  4968. {
  4969. if (errorVReg != NULL)
  4970. {
  4971. BF_ASSERT(vregInfo->mRelTo.IsVRegAny());
  4972. *errorVReg = vregInfo->mRelTo.mVRegIdx;
  4973. // For some reason we had changed this to:
  4974. //*errorVReg = operand.mVRegIdx;
  4975. // This doesn't work, it's the deref that we want to isolate, otherwise we just end up creating another invalid expression
  4976. }
  4977. return BeMCRMMode_Invalid;
  4978. }
  4979. if (operand.mKind == BeMCOperandKind_VRegAddr)
  4980. return ValidateRMResult(vregInfo->mRelTo, regA, regB, bScale, disp, errorVReg, BeMCRMMode_Direct, doValidate);
  4981. else if (operand.mKind == BeMCOperandKind_VReg)
  4982. return ValidateRMResult(vregInfo->mRelTo, regA, regB, bScale, disp, errorVReg, BeMCRMMode_Deref, doValidate);
  4983. else
  4984. NotImpl();
  4985. }
  4986. }
  4987. if (vregInfo->mRelOffset)
  4988. {
  4989. bool relToComplicated = (regB != X64Reg_None) || (bScale != 1);
  4990. auto result = GetRMParams(vregInfo->mRelOffset, regA, regB, bScale, disp, errorVReg, false);
  4991. if (result == BeMCRMMode_Invalid)
  4992. {
  4993. if (errorVReg != NULL)
  4994. {
  4995. // Pick the "most complicated" between relOffset and relTo?
  4996. if (relToComplicated)
  4997. {
  4998. BF_ASSERT(vregInfo->mRelTo.IsVRegAny());
  4999. *errorVReg = vregInfo->mRelTo.mVRegIdx;
  5000. }
  5001. else
  5002. {
  5003. BF_ASSERT(vregInfo->mRelOffset.IsVRegAny());
  5004. *errorVReg = vregInfo->mRelOffset.mVRegIdx;
  5005. }
  5006. }
  5007. return BeMCRMMode_Invalid;
  5008. }
  5009. if (result == BeMCRMMode_Deref) // Deref only allowed on relTo
  5010. {
  5011. if (errorVReg != NULL)
  5012. {
  5013. BF_ASSERT(vregInfo->mRelOffset.IsVRegAny());
  5014. *errorVReg = vregInfo->mRelOffset.mVRegIdx;
  5015. }
  5016. return BeMCRMMode_Invalid;
  5017. }
  5018. }
  5019. bool success = true;
  5020. if (vregInfo->mRelOffsetScale != 1)
  5021. {
  5022. if (bScale != 1)
  5023. success = false;
  5024. bScale = vregInfo->mRelOffsetScale;
  5025. if ((bScale != 2) && (bScale != 4) && (bScale != 8))
  5026. success = false;
  5027. if (regB == X64Reg_None)
  5028. {
  5029. regB = regA;
  5030. regA = X64Reg_None;
  5031. }
  5032. }
  5033. if (!success)
  5034. {
  5035. if ((errorVReg != NULL) && (*errorVReg == -1))
  5036. *errorVReg = operand.mVRegIdx;
  5037. }
  5038. if (success)
  5039. {
  5040. if (operand.mKind == BeMCOperandKind_VRegLoad)
  5041. return ValidateRMResult(vregInfo->mRelOffset, regA, regB, bScale, disp, errorVReg, BeMCRMMode_Deref, doValidate);
  5042. else
  5043. return ValidateRMResult(vregInfo->mRelOffset, regA, regB, bScale, disp, errorVReg, BeMCRMMode_Direct, doValidate);
  5044. }
  5045. else
  5046. return BeMCRMMode_Invalid;
  5047. }
  5048. void BeMCContext::DisableRegister(const BeMCOperand& operand, X64CPURegister reg)
  5049. {
  5050. auto vregInfo = GetVRegInfo(operand);
  5051. if (vregInfo == NULL)
  5052. return;
  5053. switch (reg)
  5054. {
  5055. case X64Reg_RAX:
  5056. vregInfo->mDisableRAX = true;
  5057. break;
  5058. case X64Reg_SIL:
  5059. vregInfo->mDisableEx = true;
  5060. break;
  5061. default:
  5062. NotImpl();
  5063. }
  5064. if (vregInfo->mRelTo)
  5065. DisableRegister(vregInfo->mRelTo, reg);
  5066. if (vregInfo->mRelOffset)
  5067. DisableRegister(vregInfo->mRelOffset, reg);
  5068. }
  5069. void BeMCContext::MarkInvalidRMRegs(const BeMCOperand& operand)
  5070. {
  5071. if (!operand.IsVRegAny())
  5072. return;
  5073. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  5074. if (vregInfo->mReg == X64Reg_R12) // Can't allow a scaled R12, it's illegal in ModRM
  5075. vregInfo->mDisableR12 = true;
  5076. if (vregInfo->mReg == X64Reg_R13) // Can't allow a base R13, it's illegal in ModRM
  5077. vregInfo->mDisableR13 = true;
  5078. MarkInvalidRMRegs(vregInfo->mRelTo);
  5079. MarkInvalidRMRegs(vregInfo->mRelOffset);
  5080. }
  5081. void BeMCContext::GetUsedRegs(const BeMCOperand& operand, X64CPURegister& regA, X64CPURegister& regB)
  5082. {
  5083. int scale = 1;
  5084. int offset = 0;
  5085. GetRMParams(operand, regA, regB, scale, offset, NULL);
  5086. if (regA != X64Reg_None)
  5087. regA = ResizeRegister(regA, 8);
  5088. if (regB != X64Reg_None)
  5089. regB = ResizeRegister(regB, 8);
  5090. }
  5091. BeMCRMMode BeMCContext::GetRMForm(const BeMCOperand& operand, bool& isMulti)
  5092. {
  5093. X64CPURegister regA = X64Reg_None;
  5094. X64CPURegister regB = X64Reg_None;
  5095. int bScale = 1;
  5096. int disp = 0;
  5097. auto result = GetRMParams(operand, regA, regB, bScale, disp);
  5098. isMulti = (regB != X64Reg_None) || (disp != 0);
  5099. return result;
  5100. }
  5101. void BeMCContext::GetValAddr(const BeMCOperand& operand, X64CPURegister& reg, int& offset)
  5102. {
  5103. if (operand.IsNativeReg())
  5104. {
  5105. reg = operand.mReg;
  5106. return;
  5107. }
  5108. BF_ASSERT(operand.IsVRegAny());
  5109. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  5110. if (operand.mKind == BeMCOperandKind_VReg)
  5111. {
  5112. if (vregInfo->mRelTo)
  5113. {
  5114. GetValAddr(vregInfo->mRelTo, reg, offset);
  5115. if (vregInfo->mRelOffset)
  5116. {
  5117. BF_ASSERT(vregInfo->mRelOffset.IsImmediateInt());
  5118. offset += vregInfo->mRelOffset.mImmediate;
  5119. }
  5120. return;
  5121. }
  5122. BF_ASSERT(vregInfo->mType->IsPointer());
  5123. BF_ASSERT(vregInfo->mReg != X64Reg_None);
  5124. reg = vregInfo->mReg;
  5125. return;
  5126. }
  5127. if ((vregInfo->mIsRetVal) && (mCompositeRetVRegIdx != -1) && (mCompositeRetVRegIdx != operand.mVRegIdx))
  5128. {
  5129. BF_ASSERT(mCompositeRetVRegIdx != -1);
  5130. GetValAddr(BeMCOperand::FromVRegAddr(mCompositeRetVRegIdx), reg, offset);
  5131. return;
  5132. }
  5133. while (vregInfo->IsDirectRelTo())
  5134. {
  5135. vregInfo = GetVRegInfo(vregInfo->mRelTo);
  5136. }
  5137. reg = mUseBP ? X64Reg_RBP : X64Reg_RSP;
  5138. offset = mStackSize + vregInfo->mFrameOffset;
  5139. }
  5140. int BeMCContext::GetHighestVRegRef(const BeMCOperand& operand)
  5141. {
  5142. if (!operand.IsVRegAny())
  5143. return -1;
  5144. int highestIdx = operand.mVRegIdx;
  5145. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  5146. if (vregInfo->mRelTo)
  5147. highestIdx = std::max(highestIdx, GetHighestVRegRef(vregInfo->mRelTo));
  5148. if (vregInfo->mRelOffset)
  5149. highestIdx = std::max(highestIdx, GetHighestVRegRef(vregInfo->mRelOffset));
  5150. return highestIdx;
  5151. }
  5152. uint8 BeMCContext::GetJumpOpCode(BeCmpKind cmpKind, bool isLong)
  5153. {
  5154. if (isLong)
  5155. {
  5156. switch (cmpKind)
  5157. {
  5158. case BeCmpKind_None: // JMP
  5159. return 0xE9;
  5160. case BeCmpKind_SLT: // JL
  5161. return 0x8C;
  5162. case BeCmpKind_ULT: // JB
  5163. return 0x82;
  5164. case BeCmpKind_SLE: // JLE
  5165. return 0x8E;
  5166. case BeCmpKind_ULE: // JBE
  5167. return 0x86;
  5168. case BeCmpKind_EQ: // JE
  5169. return 0x84;
  5170. case BeCmpKind_NE: // JNE
  5171. return 0x85;
  5172. case BeCmpKind_SGT: // JG
  5173. return 0x8F;
  5174. case BeCmpKind_UGT: // JA
  5175. return 0x87;
  5176. case BeCmpKind_SGE: // JGE
  5177. return 0x8D;
  5178. case BeCmpKind_UGE: // JAE
  5179. return 0x83;
  5180. }
  5181. }
  5182. else
  5183. {
  5184. switch (cmpKind)
  5185. {
  5186. case BeCmpKind_None: // JMP
  5187. return 0xEB;
  5188. case BeCmpKind_SLT: // JL
  5189. return 0x7C;
  5190. case BeCmpKind_ULT: // JB
  5191. return 0x72;
  5192. case BeCmpKind_SLE: // JLE
  5193. return 0x7E;
  5194. case BeCmpKind_ULE: // JBE
  5195. return 0x76;
  5196. case BeCmpKind_EQ: // JE
  5197. return 0x74;
  5198. case BeCmpKind_NE: // JNE
  5199. return 0x75;
  5200. case BeCmpKind_SGT: // JG
  5201. return 0x7F;
  5202. case BeCmpKind_UGT: // JA
  5203. return 0x77;
  5204. case BeCmpKind_SGE: // JGE
  5205. return 0x7D;
  5206. case BeCmpKind_UGE: // JAE
  5207. return 0x73;
  5208. }
  5209. }
  5210. return 0;
  5211. }
  5212. void BeMCContext::Emit(uint8 val)
  5213. {
  5214. mOut.Write(val);
  5215. }
  5216. void BeMCContext::EmitModRM(int mod, int reg, int rm)
  5217. {
  5218. mOut.Write((uint8)((mod << 6) | (reg << 3) | rm));
  5219. }
  5220. void BeMCContext::EmitModRMRel(int rx, X64CPURegister regA, X64CPURegister regB, int bScale, int relOffset)
  5221. {
  5222. if (regB != X64Reg_None)
  5223. {
  5224. // We can't encode regA as RBP in the SIB base
  5225. BF_ASSERT(regA != X64Reg_RBP);
  5226. // We can't encode RegB as RSP in the SIB index
  5227. BF_ASSERT(regB != X64Reg_RSP);
  5228. }
  5229. uint8 modRM = (rx << 3);
  5230. if ((regB == X64Reg_None) && (regA != X64Reg_RSP) && (regA != X64Reg_R12)) // RSP/R12 can't be encoded without a SIB
  5231. {
  5232. if ((relOffset == 0) && (regA != X64Reg_RBP) && (regA != X64Reg_R13)) // RBP/R13 can't be encoded with Mod0
  5233. {
  5234. modRM |= (0x0 << 6) | (EncodeRegNum(regA)); // [regA]
  5235. mOut.Write(modRM);
  5236. return;
  5237. }
  5238. else if ((relOffset >= -0x80) && (relOffset <= 0x7F))
  5239. {
  5240. modRM |= (0x1 << 6) | (EncodeRegNum(regA)); // [regA]+disp8
  5241. mOut.Write(modRM);
  5242. mOut.Write((uint8)relOffset);
  5243. return;
  5244. }
  5245. else
  5246. {
  5247. modRM |= (0x2 << 6) | (EncodeRegNum(regA)); // [regA]+disp32
  5248. mOut.Write(modRM);
  5249. mOut.Write((int32)relOffset);
  5250. return;
  5251. }
  5252. }
  5253. else if (regA == X64Reg_None) // The only option is disp32
  5254. {
  5255. modRM |= (0x0 << 6) | (0x4); // [--][--]+disp32
  5256. mOut.Write(modRM);
  5257. uint8 sib = ((bScale == 2) ? 1 : (bScale == 4) ? 2 : (bScale == 8) ? 3 : 0) << 6;
  5258. sib |= (EncodeRegNum(regB) << 3) | 5;
  5259. mOut.Write(sib);
  5260. mOut.Write((int32)relOffset);
  5261. return;
  5262. }
  5263. else
  5264. {
  5265. // Do no-offset version UNLESS we have a base of R13, which has its representation stolen by '[--][--]+disp32',
  5266. // so we must use the longer +disp8 version in that case
  5267. if ((relOffset == 0) && (regA != X64Reg_R13))
  5268. {
  5269. modRM |= (0x0 << 6) | (0x4); // [--][--]
  5270. mOut.Write(modRM);
  5271. uint8 sib = ((bScale == 2) ? 1 : (bScale == 4) ? 2 : (bScale == 8) ? 3 : 0) << 6;
  5272. sib |= (EncodeRegNum(regB) << 3) | EncodeRegNum(regA);
  5273. mOut.Write(sib);
  5274. return;
  5275. }
  5276. else if ((relOffset >= -0x80) && (relOffset <= 0x7F))
  5277. {
  5278. modRM |= (0x1 << 6) | (0x4); // [--][--]+disp8
  5279. mOut.Write(modRM);
  5280. uint8 sib = ((bScale == 2) ? 1 : (bScale == 4) ? 2 : (bScale == 8) ? 3 : 0) << 6;
  5281. sib |= (EncodeRegNum(regB) << 3) | EncodeRegNum(regA);
  5282. mOut.Write(sib);
  5283. mOut.Write((uint8)relOffset);
  5284. return;
  5285. }
  5286. else
  5287. {
  5288. modRM |= (0x2 << 6) | (0x4); // [--][--]+disp32
  5289. mOut.Write(modRM);
  5290. uint8 sib = ((bScale == 2) ? 1 : (bScale == 4) ? 2 : (bScale == 8) ? 3 : 0) << 6;
  5291. sib |= (EncodeRegNum(regB) << 3) | EncodeRegNum(regA);
  5292. mOut.Write(sib);
  5293. mOut.Write((int32)relOffset);
  5294. return;
  5295. }
  5296. }
  5297. }
  5298. void BeMCContext::EmitModRMRelStack(int rx, int regOffset, int scale)
  5299. {
  5300. EmitModRMRel(rx, mUseBP ? X64Reg_RBP : X64Reg_RSP, X64Reg_None, scale, regOffset);
  5301. }
  5302. void BeMCContext::EmitModRM(int rx, BeMCOperand rm, int relocOfs)
  5303. {
  5304. uint8 modRM = (rx << 3);
  5305. //int relocIdx = -1;
  5306. if (rm.IsImmediateFloat())
  5307. {
  5308. EmitModRM_XMM_IMM(rx, rm);
  5309. return;
  5310. }
  5311. else if ((rm.mKind == BeMCOperandKind_Symbol) || (rm.mKind == BeMCOperandKind_SymbolAddr))
  5312. {
  5313. BeMCRelocation reloc;
  5314. auto sym = mCOFFObject->mSymbols[rm.mSymbolIdx];
  5315. if (sym->mIsTLS)
  5316. {
  5317. auto vregInfo = mVRegInfo[mTLSVRegIdx];
  5318. modRM |= (2<<6) | EncodeRegNum(vregInfo->mReg);
  5319. reloc.mKind = BeMCRelocationKind_SECREL;
  5320. relocOfs = 0;
  5321. }
  5322. else
  5323. {
  5324. modRM |= 0x5; // RIP + <X>
  5325. reloc.mKind = BeMCRelocationKind_REL32;
  5326. }
  5327. Emit(modRM);
  5328. reloc.mOffset = mOut.GetPos();
  5329. reloc.mSymTableIdx = rm.mSymbolIdx;
  5330. mCOFFObject->mTextSect.mRelocs.push_back(reloc);
  5331. mTextRelocs.push_back((int)mCOFFObject->mTextSect.mRelocs.size() - 1);
  5332. //relocIdx = (int)mOut.GetSize();
  5333. mOut.Write((int32)relocOfs);
  5334. return;
  5335. }
  5336. else if (rm.mKind == BeMCOperandKind_NativeReg)
  5337. {
  5338. modRM |= (0x3 << 6) | (EncodeRegNum(rm.mReg));
  5339. }
  5340. else if (rm.IsVRegAny())
  5341. {
  5342. auto vregInfo = mVRegInfo[rm.mVRegIdx];
  5343. if ((vregInfo->mRelTo.mKind == BeMCOperandKind_SymbolAddr) &&
  5344. (vregInfo->mRelOffset.IsImmediateInt()) &&
  5345. (vregInfo->mRelOffsetScale == 1))
  5346. {
  5347. return EmitModRM(rx, vregInfo->mRelTo, relocOfs + vregInfo->mRelOffset.mImmediate);
  5348. }
  5349. if ((rm.IsVReg()) && (vregInfo->IsDirectRelToAny()))
  5350. return EmitModRM(rx, vregInfo->mRelTo, relocOfs);
  5351. X64CPURegister regA = X64Reg_None;
  5352. X64CPURegister regB = X64Reg_None;
  5353. int bScale = 1;
  5354. int disp = 0;
  5355. auto resultType = GetRMParams(rm, regA, regB, bScale, disp);
  5356. //BF_ASSERT(resultType != BeMCRMMode_Invalid);
  5357. BF_ASSERT(resultType == BeMCRMMode_Deref);
  5358. EmitModRMRel(rx, regA, regB, bScale, disp);
  5359. return;
  5360. }
  5361. else
  5362. {
  5363. Fail("Invalid rm");
  5364. }
  5365. mOut.Write(modRM);
  5366. }
  5367. void BeMCContext::EmitModRM(BeMCOperand r, BeMCOperand rm, int relocOfs)
  5368. {
  5369. uint8 modRM = 0;
  5370. BF_ASSERT(r.mKind == BeMCOperandKind_NativeReg);
  5371. EmitModRM(EncodeRegNum(r.mReg), rm, relocOfs);
  5372. }
  5373. void BeMCContext::EmitModRM_Addr(BeMCOperand r, BeMCOperand rm)
  5374. {
  5375. uint8 modRM = 0;
  5376. BF_ASSERT(r.mKind == BeMCOperandKind_NativeReg);
  5377. modRM = EncodeRegNum(r.mReg) << 3;
  5378. if (rm.mKind == BeMCOperandKind_NativeReg)
  5379. {
  5380. modRM |= (0x0 << 6) | (EncodeRegNum(rm.mReg));
  5381. }
  5382. else if ((rm.mKind == BeMCOperandKind_Symbol) || (rm.mKind == BeMCOperandKind_SymbolAddr))
  5383. {
  5384. EmitModRM(r, rm);
  5385. return;
  5386. }
  5387. else if (rm.mKind == BeMCOperandKind_VReg)
  5388. {
  5389. auto vregInfo = mVRegInfo[rm.mVRegIdx];
  5390. if (vregInfo->mIsExpr)
  5391. {
  5392. if (vregInfo->mRelOffsetScale == 1)
  5393. {
  5394. X64CPURegister relToReg = X64Reg_None;
  5395. int regOffset = 0;
  5396. if (vregInfo->mRelOffset)
  5397. {
  5398. BF_ASSERT(vregInfo->mRelOffset.IsImmediate());
  5399. regOffset = (int)vregInfo->mRelOffset.mImmediate;
  5400. }
  5401. if (vregInfo->mRelTo.IsNativeReg())
  5402. {
  5403. relToReg = vregInfo->mRelTo.mReg;
  5404. }
  5405. else if (vregInfo->mRelTo.IsVRegAny())
  5406. {
  5407. auto relVRegInfo = GetVRegInfo(vregInfo->mRelTo);
  5408. if (relVRegInfo->mRelTo)
  5409. {
  5410. X64CPURegister regA = X64Reg_None;
  5411. X64CPURegister regB = X64Reg_None;
  5412. int bScale = 1;
  5413. int disp = 0;
  5414. auto resultType = GetRMParams(rm, regA, regB, bScale, disp);
  5415. BF_ASSERT(resultType != BeMCRMMode_Invalid);
  5416. EmitModRMRel(EncodeRegNum(r.mReg), regA, regB, bScale, disp);
  5417. return;
  5418. }
  5419. else
  5420. NotImpl();
  5421. }
  5422. else
  5423. NotImpl();
  5424. EmitModRMRel(EncodeRegNum(r.mReg), relToReg, X64Reg_None, 1, regOffset);
  5425. return;
  5426. }
  5427. else
  5428. {
  5429. if (vregInfo->mRelOffset)
  5430. {
  5431. BF_ASSERT(vregInfo->mRelOffset.IsImmediate());
  5432. int regOffset = vregInfo->mRelOffset.mImmediate;
  5433. int scaleVal = 0;
  5434. if (vregInfo->mRelOffsetScale == 2)
  5435. scaleVal = 0x1;
  5436. else if (vregInfo->mRelOffsetScale == 4)
  5437. scaleVal = 0x2;
  5438. else if (vregInfo->mRelOffsetScale == 8)
  5439. scaleVal = 0x3;
  5440. modRM |= (0x0 << 6) | (0x4); // [--][--]
  5441. mOut.Write(modRM);
  5442. uint8 sib = (scaleVal << 6) | (EncodeRegNum(vregInfo->mRelTo.mReg) << 3) | (0x5); // [<reg>*<scale> + imm32]
  5443. mOut.Write(sib);
  5444. mOut.Write((int32)regOffset);
  5445. return;
  5446. }
  5447. }
  5448. }
  5449. else
  5450. {
  5451. Fail("Illegal");
  5452. }
  5453. }
  5454. else
  5455. {
  5456. Fail("Invalid rm");
  5457. }
  5458. mOut.Write(modRM);
  5459. }
  5460. void BeMCContext::EmitModRM_XMM_IMM(int rx, BeMCOperand & imm)
  5461. {
  5462. Emit((rx << 3) | (0x5)); // RIP + <X>
  5463. BeMCSymbol* sym = NULL;
  5464. if (imm.mKind == BeMCOperandKind_Immediate_f32)
  5465. {
  5466. float floatVal = (float)imm.mImmFloat;
  5467. String name = StrFormat("__real@%08x", *(int*)&floatVal);
  5468. sym = mCOFFObject->GetCOMDAT(name, &floatVal, 4, 4);
  5469. }
  5470. else if (imm.mKind == BeMCOperandKind_Immediate_f64)
  5471. {
  5472. double floatVal = imm.mImmFloat;
  5473. String name = StrFormat("__real@%016llx", *(int64*)&floatVal);
  5474. sym = mCOFFObject->GetCOMDAT(name, &floatVal, 8, 8);
  5475. }
  5476. else if (imm.mKind == BeMCOperandKind_Immediate_f32_Packed128)
  5477. {
  5478. float floatVal = (float)imm.mImmFloat;
  5479. String name = StrFormat("__real@%08x_packed", *(int*)&floatVal);
  5480. float data[4] = { floatVal, 0, 0, 0 };
  5481. sym = mCOFFObject->GetCOMDAT(name, data, 16, 16);
  5482. }
  5483. else if (imm.mKind == BeMCOperandKind_Immediate_f64_Packed128)
  5484. {
  5485. double floatVal = imm.mImmFloat;
  5486. String name = StrFormat("__real@%016llx_packed", *(int64*)&floatVal);
  5487. double data[2] = { floatVal, 0 };
  5488. sym = mCOFFObject->GetCOMDAT(name, data, 16, 16);
  5489. }
  5490. else
  5491. NotImpl();
  5492. BeMCRelocation reloc;
  5493. reloc.mKind = BeMCRelocationKind_REL32;
  5494. reloc.mOffset = mOut.GetPos();
  5495. reloc.mSymTableIdx = sym->mIdx;
  5496. mCOFFObject->mTextSect.mRelocs.push_back(reloc);
  5497. mTextRelocs.push_back((int)mCOFFObject->mTextSect.mRelocs.size() - 1);
  5498. mOut.Write((int32)0);
  5499. }
  5500. void BeMCContext::VRegSetInitialized(BeMCBlock* mcBlock, BeMCInst* inst, const BeMCOperand& operand, SizedArrayImpl<int>& addVec, SizedArrayImpl<int>& removeVec, bool deepSet, bool doSet)
  5501. {
  5502. if (operand.IsSymbol())
  5503. {
  5504. auto sym = mCOFFObject->mSymbols[operand.mSymbolIdx];
  5505. if (sym->mIsTLS)
  5506. {
  5507. VRegSetInitialized(mcBlock, inst, BeMCOperand::FromVReg(mTLSVRegIdx), addVec, removeVec, deepSet, doSet);
  5508. return;
  5509. }
  5510. }
  5511. if (operand.mKind == BeMCOperandKind_CmpResult)
  5512. {
  5513. auto& cmpResult = mCmpResults[operand.mCmpResultIdx];
  5514. if (cmpResult.mResultVRegIdx != -1)
  5515. VRegSetInitialized(mcBlock, inst, BeMCOperand::FromVReg(cmpResult.mResultVRegIdx), addVec, removeVec, deepSet, doSet);
  5516. return;
  5517. }
  5518. if (operand.mKind == BeMCOperandKind_VRegPair)
  5519. {
  5520. VRegSetInitialized(mcBlock, inst, BeMCOperand::FromVReg(operand.mVRegPair.mVRegIdx0), addVec, removeVec, deepSet, doSet);
  5521. VRegSetInitialized(mcBlock, inst, BeMCOperand::FromVReg(operand.mVRegPair.mVRegIdx1), addVec, removeVec, deepSet, doSet);
  5522. }
  5523. if (!operand.IsVRegAny())
  5524. return;
  5525. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  5526. if (vregInfo->mDefOnFirstUse)
  5527. {
  5528. int insertIdx = FindSafeInstInsertPos(*mInsertInstIdxRef);
  5529. AllocInst(BeMCInstKind_Def, operand, insertIdx);
  5530. vregInfo->mDefOnFirstUse = false;
  5531. }
  5532. if (vregInfo->mRelTo)
  5533. VRegSetInitialized(mcBlock, inst, vregInfo->mRelTo, addVec, removeVec, deepSet, doSet && deepSet);
  5534. if (vregInfo->mRelOffset)
  5535. VRegSetInitialized(mcBlock, inst, vregInfo->mRelOffset, addVec, removeVec, deepSet, doSet && deepSet);
  5536. if (doSet)
  5537. {
  5538. addVec.push_back(operand.mVRegIdx);
  5539. removeVec.push_back(mVRegInitializedContext.GetIdx(operand.mVRegIdx, BeTrackKind_Uninitialized));
  5540. //vregsInitialized = mVRegInitializedContext.SetAndClear(vregsInitialized, operand.mVRegIdx, mVRegInitializedContext.GetIdx(operand.mVRegIdx, BeTrackKind_Uninitialized));
  5541. }
  5542. }
  5543. BeMCInst* BeMCContext::FindSafePreBranchInst(BeMCBlock* mcBlock)
  5544. {
  5545. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  5546. {
  5547. auto inst = mcBlock->mInstructions[instIdx];
  5548. // We set the definition to just right before the first branch
  5549. if ((inst->mKind == BeMCInstKind_Br) || (inst->mKind == BeMCInstKind_CondBr))
  5550. {
  5551. // Don't separate out Def/Cmp/CmpToBool/Test calls
  5552. while (instIdx > 0)
  5553. {
  5554. auto checkInst = mcBlock->mInstructions[instIdx - 1];
  5555. if ((checkInst->mKind != BeMCInstKind_Def) &&
  5556. (checkInst->mKind != BeMCInstKind_DefLoad) &&
  5557. (checkInst->mKind != BeMCInstKind_Test) &&
  5558. (checkInst->mKind != BeMCInstKind_Cmp) &&
  5559. (checkInst->mKind != BeMCInstKind_CmpToBool))
  5560. return inst;
  5561. inst = checkInst;
  5562. instIdx--;
  5563. }
  5564. break;
  5565. }
  5566. }
  5567. return mcBlock->mInstructions[0];
  5568. }
  5569. void BeMCContext::InitializedPassHelper(BeMCBlock* mcBlock, BeVTrackingGenContext* genCtx, bool& modifiedBlockBefore, bool& modifiedBlockAfter)
  5570. {
  5571. modifiedBlockBefore = false;
  5572. modifiedBlockAfter = false;
  5573. genCtx->mBlocks[mcBlock->mBlockIdx].mGenerateCount++;
  5574. genCtx->mCalls++;
  5575. genCtx->mHandledCalls++;
  5576. BeMDNode* curDbgScope = NULL;
  5577. BeVTrackingList* vregsInitialized = mcBlock->mPredVRegsInitialized;
  5578. //OutputDebugStrF("InitializedPassHelper %@\n", vregsInitialized.mList);
  5579. mActiveBlock = mcBlock;
  5580. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  5581. {
  5582. genCtx->mInstructions++;
  5583. mInsertInstIdxRef = &instIdx;
  5584. auto inst = mcBlock->mInstructions[instIdx];
  5585. inst->mVRegsInitialized = vregsInitialized;
  5586. bool deepSet = false;
  5587. if (inst->mKind == BeMCInstKind_LifetimeStart)
  5588. continue;
  5589. SizedArray<int, 16> removeVec;
  5590. SizedArray<int, 16> addVec;
  5591. SizedArray<int, 16> filteredRemoveVec;
  5592. SizedArray<int, 16> filteredAddVec;
  5593. if ((inst->mKind == BeMCInstKind_ValueScopeSoftEnd) || (inst->mKind == BeMCInstKind_ValueScopeHardEnd))
  5594. {
  5595. bool isSoft = inst->mKind == BeMCInstKind_ValueScopeSoftEnd;
  5596. int startVRegIdx = (int)inst->mArg0.mImmediate;
  5597. int endVRegIdx = (int)inst->mArg1.mImmediate;
  5598. int listIdx = mVRegInitializedContext.FindIndex(vregsInitialized, startVRegIdx);
  5599. if (listIdx < 0)
  5600. listIdx = ~listIdx;
  5601. for ( ; listIdx < vregsInitialized->mSize; listIdx++)
  5602. {
  5603. int vregIdx = vregsInitialized->mEntries[listIdx];
  5604. if (vregIdx >= endVRegIdx)
  5605. break;
  5606. auto vregInfo = mVRegInfo[vregIdx];
  5607. if (isSoft)
  5608. {
  5609. if (vregInfo->mValueScopeRetainedKind >= BeMCValueScopeRetainKind_Soft)
  5610. continue;
  5611. }
  5612. else
  5613. {
  5614. if (vregInfo->mValueScopeRetainedKind >= BeMCValueScopeRetainKind_Hard)
  5615. continue;
  5616. }
  5617. filteredRemoveVec.push_back(vregIdx);
  5618. }
  5619. }
  5620. if ((inst->mResult) && (inst->mResult.mKind == BeMCOperandKind_CmpResult))
  5621. {
  5622. auto& cmpResult = mCmpResults[inst->mResult.mCmpResultIdx];
  5623. if (cmpResult.mResultVRegIdx != -1)
  5624. {
  5625. auto cmpToBoolInst = AllocInst(BeMCInstKind_CmpToBool, BeMCOperand::FromCmpKind(cmpResult.mCmpKind), BeMCOperand(), instIdx + 1);
  5626. cmpToBoolInst->mResult = BeMCOperand::FromVReg(cmpResult.mResultVRegIdx);
  5627. }
  5628. inst->mResult = BeMCOperand();
  5629. }
  5630. if (inst->mKind == BeMCInstKind_DbgDecl)
  5631. {
  5632. if (!mVRegInitializedContext.IsSet(vregsInitialized, inst->mArg0.mVRegIdx))
  5633. {
  5634. auto vregInfo = mVRegInfo[inst->mArg0.mVRegIdx];
  5635. if (vregInfo->mIsExpr) // For shadowed inlined params, set as initialized
  5636. addVec.push_back(inst->mArg0.mVRegIdx);
  5637. else
  5638. {
  5639. if ((vregInfo->mDbgVariable != NULL) && (vregInfo->mDbgVariable->mInitType == BfIRInitType_NotNeeded_AliveOnDecl))
  5640. addVec.push_back(inst->mArg0.mVRegIdx);
  5641. else
  5642. addVec.push_back(mVRegInitializedContext.GetIdx(inst->mArg0.mVRegIdx, BeTrackKind_Uninitialized));
  5643. }
  5644. }
  5645. vregsInitialized = mVRegInitializedContext.Modify(vregsInitialized, addVec, removeVec, filteredAddVec, filteredRemoveVec);
  5646. continue;
  5647. }
  5648. if (inst->mKind == BeMCInstKind_Def)
  5649. {
  5650. //deepSet = true;
  5651. // If we take a pointer to a local variable before initializing it, we need to consider it as being "ambiguously initialized"
  5652. auto vregInfo = GetVRegInfo(inst->mArg0);
  5653. if (vregInfo->mRelTo.mKind == BeMCOperandKind_VRegAddr)
  5654. {
  5655. auto relVRegInfo = GetVRegInfo(vregInfo->mRelTo);
  5656. if ((relVRegInfo->mDbgVariable != NULL) && (!mVRegInitializedContext.IsSet(vregsInitialized, vregInfo->mRelTo.mVRegIdx)))
  5657. relVRegInfo->mHasAmbiguousInitialization = true;
  5658. }
  5659. }
  5660. if (inst->mKind == BeMCInstKind_LifetimeEnd)
  5661. {
  5662. // In some cases we can have a dbg variable that actually points to a global variable (due to macros/inlining/etc), so this check is for that case:
  5663. if (inst->mArg0.IsVRegAny())
  5664. {
  5665. removeVec.push_back(inst->mArg0.mVRegIdx);
  5666. removeVec.push_back(mVRegInitializedContext.GetIdx(inst->mArg0.mVRegIdx, BeTrackKind_Uninitialized));
  5667. }
  5668. vregsInitialized= mVRegInitializedContext.Modify(vregsInitialized, addVec, removeVec, filteredAddVec, filteredRemoveVec);
  5669. continue;
  5670. }
  5671. if (inst->mKind == BeMCInstKind_DefLoad)
  5672. {
  5673. // This is also an address-taking operation, OR it's just a usage of an explicitly-undefined value
  5674. auto loadRegInfo = GetVRegInfo(inst->mArg0);
  5675. if (loadRegInfo->mRelTo.IsVRegAny())
  5676. {
  5677. auto relVRegInfo = GetVRegInfo(loadRegInfo->mRelTo);
  5678. if ((relVRegInfo->mDbgVariable != NULL) && (!mVRegInitializedContext.IsSet(vregsInitialized, loadRegInfo->mRelTo.mVRegIdx)))
  5679. relVRegInfo->mHasAmbiguousInitialization = true;
  5680. }
  5681. }
  5682. if (inst->IsMov())
  5683. {
  5684. // This is also an address-taking operation, OR it's just a usage of an explicitly-undefined value
  5685. if (inst->mArg1.IsVRegAny())
  5686. {
  5687. auto srcRegInfo = GetVRegInfo(inst->mArg1);
  5688. if ((srcRegInfo->mDbgVariable != NULL) && (!mVRegInitializedContext.IsSet(vregsInitialized, inst->mArg1.mVRegIdx)))
  5689. srcRegInfo->mHasAmbiguousInitialization = true;
  5690. }
  5691. }
  5692. int cpyDestVRegIdx = -1;
  5693. if ((inst->mKind == BeMCInstKind_MemCpy) || (inst->mKind == BeMCInstKind_MemSet))
  5694. {
  5695. cpyDestVRegIdx = inst->mArg1.mVRegPair.mVRegIdx0;
  5696. }
  5697. //deepSet = true;
  5698. auto destArg = inst->GetDest();
  5699. auto operands = { &inst->mResult, &inst->mArg0, &inst->mArg1 };
  5700. for (auto op : operands)
  5701. {
  5702. VRegSetInitialized(mcBlock, inst, *op, addVec, removeVec, deepSet || (op == destArg));
  5703. }
  5704. for (int removeIdx = 0; removeIdx < (int)filteredRemoveVec.size(); removeIdx++)
  5705. {
  5706. int vregIdx = filteredRemoveVec[removeIdx];
  5707. if (vregIdx >= mVRegInitializedContext.mNumItems)
  5708. continue;
  5709. auto vregInfo = mVRegInfo[vregIdx];
  5710. if (vregInfo->mChainLifetimeEnd)
  5711. {
  5712. auto mcCheck = vregInfo->mRelTo;
  5713. while (mcCheck.IsVRegAny())
  5714. {
  5715. auto checkInfo = mVRegInfo[mcCheck.mVRegIdx];
  5716. removeVec.push_back(mcCheck.mVRegIdx);
  5717. mcCheck = checkInfo->mRelTo;
  5718. }
  5719. }
  5720. }
  5721. vregsInitialized = mVRegInitializedContext.Modify(vregsInitialized, addVec, removeVec, filteredAddVec, filteredRemoveVec);
  5722. }
  5723. mInsertInstIdxRef = NULL;
  5724. mActiveBlock = NULL;
  5725. for (int succIdx = 0; succIdx < (int)mcBlock->mSuccs.size(); succIdx++)
  5726. {
  5727. BeMCBlock* succ = mcBlock->mSuccs[succIdx];
  5728. auto& entry = genCtx->mBlocks[succ->mBlockIdx];
  5729. bool forceRun = (entry.mGenerateCount == 0) && (!entry.mGenerateQueued);
  5730. //if ((!mVRegInitializedContext.HasExtraBitsSet(succ->mPredVRegsInitialized, vregsInitialized)) && (!forceRun))
  5731. //continue;
  5732. auto newPredVRegsInitialized = mVRegInitializedContext.Merge(succ->mPredVRegsInitialized, vregsInitialized);
  5733. if ((newPredVRegsInitialized == succ->mPredVRegsInitialized) && (!forceRun))
  5734. continue;
  5735. int vregIdx = -1;
  5736. /*SizedArray<int, 16> newNodes;
  5737. auto& prevDestEntry = succ->mPredVRegsInitialized;
  5738. auto& mergeFrom = vregsInitialized.mBits;
  5739. // Take nodes that were exclusive to the new set and add edges to nodes that were exclusive the old set
  5740. while (true)
  5741. {
  5742. vregIdx = mVRegInitializedContext.GetNextDiffSetIdx(prevDestEntry.mBits, mergeFrom, vregIdx);
  5743. if (vregIdx == -1)
  5744. break;
  5745. newNodes.push_back(vregIdx);
  5746. }
  5747. BF_ASSERT((!newNodes.empty()) || (forceRun));*/
  5748. /*if ((mDebugging) || (mBeFunction->mName == "?DrawEntry@DrawContext@PerfView@BeefPerf@@QEAAXPEAVGraphics@gfx@Beefy@@PEAVTrackNodeEntry@23@MM@Z"))
  5749. {
  5750. String str;
  5751. str += StrFormat("%s -> %s (Gen=%d) ", ToString(BeMCOperand::FromBlock(mcBlock)).c_str(), ToString(BeMCOperand::FromBlock(succ)).c_str(), genCtx->mBlocks[succ->mBlockIdx].mGenerateCount);
  5752. for (auto newNode : newNodes)
  5753. str += StrFormat(" %d", newNode);
  5754. str += "\r\n";
  5755. OutputDebugStringA(str.c_str());
  5756. }*/
  5757. succ->mPredVRegsInitialized = newPredVRegsInitialized;
  5758. //TODO: This was a bad comparison
  5759. // if (succ->mBlockIdx > succ->mBlockIdx)
  5760. // modifiedBlockAfter = true;
  5761. // else
  5762. // modifiedBlockBefore = true;
  5763. // What does this do?
  5764. if (succ->mBlockIdx > mcBlock->mBlockIdx)
  5765. modifiedBlockAfter = true;
  5766. else
  5767. modifiedBlockBefore = true;
  5768. entry.mGenerateQueued = true;
  5769. }
  5770. }
  5771. void BeMCContext::FixVRegInitFlags(BeMCInst* inst, const BeMCOperand& operand)
  5772. {
  5773. if (operand.IsVReg())
  5774. {
  5775. SizedArray<int, 1> addVec = { operand.mVRegIdx };
  5776. inst->mVRegsInitialized = mVRegInitializedContext.Add(inst->mVRegsInitialized, addVec, true);
  5777. }
  5778. }
  5779. void BeMCContext::SetVTrackingValue(BeMCOperand& operand, BeVTrackingValue& vTrackingValue)
  5780. {
  5781. if (!operand.IsVRegAny())
  5782. return;
  5783. vTrackingValue.mEntry->Set(operand.mVRegIdx);
  5784. auto vregInfo = mVRegInfo[operand.mVRegIdx];
  5785. SetVTrackingValue(vregInfo->mRelTo, vTrackingValue);
  5786. SetVTrackingValue(vregInfo->mRelOffset, vTrackingValue);
  5787. }
  5788. void BeMCContext::DoInitInjectionPass()
  5789. {
  5790. BP_ZONE("BeMCContext::DoInitInjectionPass");
  5791. for (auto mcBlock : mBlocks)
  5792. {
  5793. mActiveBlock = mcBlock;
  5794. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  5795. {
  5796. auto inst = mcBlock->mInstructions[instIdx];
  5797. BfIRInitType pendingInitKind = BfIRInitType_NotNeeded;
  5798. if (inst->mKind == BeMCInstKind_DbgDecl)
  5799. {
  5800. int vregIdx = inst->mArg0.mVRegIdx;
  5801. auto vregInfo = mVRegInfo[vregIdx];
  5802. auto dbgVar = vregInfo->mDbgVariable;
  5803. if (!mVRegInitializedContext.IsSet(inst->mVRegsInitialized, vregIdx))
  5804. {
  5805. if ((dbgVar->mPendingInitType != BfIRInitType_NotNeeded) && (dbgVar->mPendingInitType != BfIRInitType_NotNeeded_AliveOnDecl))
  5806. {
  5807. pendingInitKind = dbgVar->mPendingInitType;
  5808. // We don't need dynLife anymore since we're explicitly writing this
  5809. //vregInfo->mHasDynLife = false;
  5810. //AllocInst(BeMCInstKind_Def, inst->mArg0, instIdx);
  5811. }
  5812. }
  5813. }
  5814. if (pendingInitKind != BfIRInitType_NotNeeded)
  5815. {
  5816. int vregIdx = inst->mArg0.mVRegIdx;
  5817. auto dbgVar = mVRegInfo[vregIdx]->mDbgVariable;
  5818. auto varType = mVRegInfo[vregIdx]->mType;
  5819. auto initType = dbgVar->mPendingInitType;
  5820. if (varType->IsFloat())
  5821. {
  5822. BeMCOperand zeroVal;
  5823. if (varType->mTypeCode == BeTypeCode_Float)
  5824. zeroVal.mKind = BeMCOperandKind_Immediate_f32;
  5825. else
  5826. zeroVal.mKind = BeMCOperandKind_Immediate_f64;
  5827. if (initType == BfIRInitType_Uninitialized)
  5828. zeroVal.mImmFloat = NAN;
  5829. else
  5830. zeroVal.mImmFloat = 0;
  5831. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromVReg(vregIdx), zeroVal, instIdx + 1);
  5832. }
  5833. else if (varType->IsComposite())
  5834. {
  5835. SetAndRestoreValue<int*> insertPtr(mInsertInstIdxRef, &instIdx);
  5836. instIdx++;
  5837. uint8 val = (initType == BfIRInitType_Uninitialized) ? 0xCC : 0;
  5838. CreateMemSet(BeMCOperand::FromVRegAddr(vregIdx), val, varType->mSize, varType->mAlign);
  5839. instIdx--;
  5840. }
  5841. else
  5842. {
  5843. int64 val = (initType == BfIRInitType_Uninitialized) ? (int64)0xCCCCCCCCCCCCCCCCLL : 0;
  5844. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromVReg(vregIdx), BeMCOperand::FromImmediate(val), instIdx + 1);
  5845. }
  5846. dbgVar->mPendingInitType = BfIRInitType_NotNeeded;
  5847. }
  5848. }
  5849. mActiveBlock = NULL;
  5850. }
  5851. SetCurrentInst(NULL);
  5852. }
  5853. void BeMCContext::ReplaceVRegsInit(BeMCBlock* mcBlock, int startInstIdx, BeVTrackingList* prevList, BeVTrackingList* newList)
  5854. {
  5855. for (int instIdx = startInstIdx; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  5856. {
  5857. auto inst = mcBlock->mInstructions[instIdx];
  5858. if (inst->mVRegsInitialized != prevList)
  5859. return;
  5860. inst->mVRegsInitialized = newList;
  5861. }
  5862. }
  5863. void BeMCContext::GenerateVRegInitFlags(BeVTrackingGenContext& genCtx)
  5864. {
  5865. BP_ZONE("BeMCContext::GenerateVRegInitFlags");
  5866. mVRegInitializedContext.Clear();
  5867. mVRegInitializedContext.Init((int)mVRegInfo.size());
  5868. auto emptyList = mVRegInitializedContext.AllocEmptyList();
  5869. genCtx.mEmptyList = emptyList;
  5870. genCtx.mBlocks.Resize(mBlocks.size());
  5871. for (int blockIdx = 0; blockIdx < (int)mBlocks.size(); blockIdx++)
  5872. {
  5873. auto mcBlock = mBlocks[blockIdx];
  5874. mcBlock->mPredVRegsInitialized = emptyList;
  5875. }
  5876. bool modifiedBlockBefore;
  5877. bool modifiedBlockAfter;
  5878. InitializedPassHelper(mBlocks[0], &genCtx, modifiedBlockBefore, modifiedBlockAfter);
  5879. while (true)
  5880. {
  5881. bool didWork = false;
  5882. // Handle any outstanding pred entries
  5883. for (int blockIdx = 0; blockIdx < (int)mBlocks.size(); blockIdx++)
  5884. {
  5885. auto& entry = genCtx.mBlocks[blockIdx];
  5886. if (entry.mGenerateQueued)
  5887. {
  5888. entry.mGenerateQueued = false;
  5889. didWork = true;
  5890. auto block = mBlocks[blockIdx];
  5891. bool modifiedBlockBefore;
  5892. bool modifiedBlockAfter;
  5893. InitializedPassHelper(block, &genCtx, modifiedBlockBefore, modifiedBlockAfter);
  5894. if (modifiedBlockBefore)
  5895. break;
  5896. }
  5897. }
  5898. if (!didWork)
  5899. break;
  5900. }
  5901. // Fix up the vregsInit changes to represent changes from the last intruction in one block to the first instruction on the next blockfs
  5902. for (int blockIdx = 0; blockIdx < (int)mBlocks.size() - 1; blockIdx++)
  5903. {
  5904. auto fromBlock = mBlocks[blockIdx];
  5905. auto toBlock = mBlocks[blockIdx + 1];
  5906. if ((fromBlock->mInstructions.empty()) || (toBlock->mInstructions.empty()))
  5907. continue;
  5908. BeMCInst* fromInst = NULL;
  5909. // Last inst may not have vregsInit set
  5910. for (int instIdx = (int)fromBlock->mInstructions.size() - 1; instIdx >= 0; instIdx--)
  5911. {
  5912. fromInst = fromBlock->mInstructions[instIdx];
  5913. if (fromInst->mVRegsInitialized != NULL)
  5914. break;
  5915. }
  5916. auto toInst = toBlock->mInstructions.front();
  5917. if ((fromInst == NULL) || (fromInst->mVRegsInitialized == NULL) ||
  5918. (toInst == NULL) || (toInst->mVRegsInitialized == NULL))
  5919. continue;
  5920. auto prevVRegsInit = toInst->mVRegsInitialized;
  5921. auto newVRegsInit = mVRegInitializedContext.SetChanges(toInst->mVRegsInitialized, fromInst->mVRegsInitialized);;
  5922. for (int instIdx = 0; instIdx < (int)toBlock->mInstructions.size(); instIdx++)
  5923. {
  5924. auto inst = toBlock->mInstructions[instIdx];
  5925. if (inst->mVRegsInitialized != prevVRegsInit)
  5926. break;
  5927. inst->mVRegsInitialized = newVRegsInit;
  5928. }
  5929. }
  5930. int instCount = 0;
  5931. for (auto block : mBlocks)
  5932. instCount += (int)block->mInstructions.size();
  5933. BpEvent("GenerateVRegInitFlags Results",
  5934. StrFormat("Blocks: %d\nInstructions: %d\nVRegs: %d\nCalls: %d\nHandled Calls: %d\nProcessed Instructions: %d\nVRegInit Bytes: %d\nTemp Bytes: %d",
  5935. (int)mBlocks.size(), instCount, (int)mVRegInfo.size(), genCtx.mCalls, genCtx.mHandledCalls, genCtx.mInstructions, mVRegInitializedContext.mAlloc.GetAllocSize(), genCtx.mAlloc.GetAllocSize()).c_str());
  5936. }
  5937. bool BeMCContext::DoInitializedPass()
  5938. {
  5939. BP_ZONE("BeMCContext::DoInitializedPass");
  5940. BeVTrackingGenContext genCtx;
  5941. GenerateVRegInitFlags(genCtx);
  5942. // Search blocks for instances of ambiguous initialization
  5943. for (int blockIdx = 0; blockIdx < (int)mBlocks.size(); blockIdx++)
  5944. {
  5945. auto mcBlock = mBlocks[blockIdx];
  5946. // If mPredVRegsInitialized is NULL, this blocks is unreachable. It could still be in some other block's preds so we don't
  5947. // completely erase it, just empty it
  5948. if (genCtx.mBlocks[mcBlock->mBlockIdx].mGenerateCount == 0)
  5949. {
  5950. //BF_ASSERT((blockIdx != 0) && (mcBlock->mPreds.size() == 0));
  5951. mcBlock->mInstructions.Clear();
  5952. continue;
  5953. }
  5954. /*int vregIdx = -1;
  5955. while (true)
  5956. {
  5957. vregIdx = mVRegInitializedContext.GetNextSetIdx(mcBlock->mPredVRegsInitialized, vregIdx);
  5958. if (vregIdx == -1)
  5959. break;*/
  5960. for (int vregIdx : *mcBlock->mPredVRegsInitialized)
  5961. {
  5962. if (vregIdx >= mVRegInitializedContext.mNumItems)
  5963. continue;
  5964. if (mVRegInitializedContext.IsSet(mcBlock->mPredVRegsInitialized, vregIdx, BeTrackKind_Uninitialized))
  5965. {
  5966. // If a register has both the "initialized" and "uninitialized" flags set, that means that there will be debugging range
  5967. // where the variable could show an uninitialized value. We zero out the value at the def position to make
  5968. // variable viewing less confusing. This state does not affect actual program execution because we've already statically
  5969. // checked against usage of unassigned variables -- unless overridden with a "?" uninitialized expression, in which case
  5970. // one could argue that 0xCC would be a more useful value, but we go with the argument for the "less confusing" zero in this case.
  5971. auto vregInfo = mVRegInfo[vregIdx];
  5972. vregInfo->mHasAmbiguousInitialization = true;
  5973. }
  5974. }
  5975. //
  5976. }
  5977. bool needsReRun = false;
  5978. bool hasInits = false;
  5979. for (int vregIdx = 0; vregIdx < (int)mVRegInfo.size(); vregIdx++)
  5980. {
  5981. auto vregInfo = mVRegInfo[vregIdx];
  5982. if (vregInfo->mDbgVariable != NULL)
  5983. {
  5984. auto initType = vregInfo->mDbgVariable->mInitType;
  5985. if (initType == BfIRInitType_NotSet)
  5986. {
  5987. if (vregInfo->mHasAmbiguousInitialization)
  5988. initType = BfIRInitType_Zero;
  5989. else
  5990. initType = BfIRInitType_NotNeeded;
  5991. }
  5992. else if ((initType == BfIRInitType_Uninitialized) && (!vregInfo->mHasAmbiguousInitialization))
  5993. {
  5994. // If we have an explicitly-uninitialized variable but it doesn't have ambiguous initialization
  5995. // then we don't need to do the 0xCC, we can control visibility in the debugger through scope
  5996. initType = BfIRInitType_NotNeeded;
  5997. }
  5998. if (vregInfo->mDbgVariable->mPendingInitType == initType)
  5999. continue;
  6000. if ((initType != BfIRInitType_NotNeeded) ||
  6001. (vregInfo->mDbgVariable->mPendingInitType == BfIRInitType_NotSet))
  6002. {
  6003. vregInfo->mDbgVariable->mPendingInitType = initType;
  6004. }
  6005. if ((initType != BfIRInitType_NotNeeded) && (initType != BfIRInitType_NotNeeded_AliveOnDecl))
  6006. {
  6007. vregInfo->mDbgVariable->mPendingInitDef = true;
  6008. BF_ASSERT(vregInfo->mHasDynLife);
  6009. vregInfo->mDoConservativeLife = true;
  6010. hasInits = true;
  6011. }
  6012. }
  6013. }
  6014. if (hasInits)
  6015. {
  6016. DoInitInjectionPass();
  6017. // We need to re-execute the init flag generation
  6018. BeVTrackingGenContext genCtx;
  6019. GenerateVRegInitFlags(genCtx);
  6020. }
  6021. return !needsReRun;
  6022. }
  6023. void BeMCContext::DoTLSSetup()
  6024. {
  6025. // Perform at the end of the 'entry' block
  6026. if (mTLSVRegIdx == -1)
  6027. return;
  6028. auto mcBlock = mBlocks[0];
  6029. mActiveBlock = mcBlock;
  6030. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  6031. {
  6032. auto inst = mcBlock->mInstructions[instIdx];
  6033. // Skip past param setup
  6034. if (inst->mKind == BeMCInstKind_Def)
  6035. continue;
  6036. if ((inst->mKind == BeMCInstKind_Mov) && (inst->mArg1.IsNativeReg()))
  6037. continue;
  6038. auto int32Type = mModule->mContext->GetPrimitiveType(BeTypeCode_Int32);
  6039. auto intType = mModule->mContext->GetPrimitiveType(BeTypeCode_Int64);
  6040. auto intPtrType = mModule->mContext->GetPointerTo(intType);
  6041. auto mcTlsIndex = AllocVirtualReg(intType);
  6042. CreateDefineVReg(mcTlsIndex, instIdx++);
  6043. auto sym = mCOFFObject->GetSymbolRef("_tls_index");
  6044. if (sym->mType == NULL)
  6045. sym->mType = int32Type;
  6046. AllocInst(BeMCInstKind_Mov, mcTlsIndex, BeMCOperand::FromSymbol(sym->mIdx), instIdx++);
  6047. AllocInst(BeMCInstKind_Def, BeMCOperand::FromVReg(mTLSVRegIdx), instIdx++);
  6048. AllocInst(BeMCInstKind_TLSSetup, BeMCOperand::FromVReg(mTLSVRegIdx), BeMCOperand::FromImmediate(0), instIdx++);
  6049. auto mcTlsVal = AllocVirtualReg(intPtrType);
  6050. CreateDefineVReg(mcTlsVal, instIdx++);
  6051. auto tlsValInfo = GetVRegInfo(mcTlsVal);
  6052. tlsValInfo->mIsExpr = true;
  6053. tlsValInfo->mRelTo = BeMCOperand::FromVReg(mTLSVRegIdx);
  6054. tlsValInfo->mRelOffset = mcTlsIndex;
  6055. tlsValInfo->mRelOffsetScale = 8;
  6056. auto mcLoadVal = mcTlsVal;
  6057. mcLoadVal.mKind = BeMCOperandKind_VRegLoad;
  6058. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromVReg(mTLSVRegIdx), mcLoadVal, instIdx++);
  6059. break;
  6060. }
  6061. mActiveBlock = NULL;
  6062. }
  6063. void BeMCContext::DoChainedBlockMerge()
  6064. {
  6065. for (int blockIdx = 0; blockIdx < mBlocks.size() - 1; blockIdx++)
  6066. {
  6067. auto mcBlock = mBlocks[blockIdx];
  6068. auto nextMcBlock = mBlocks[blockIdx + 1];
  6069. // We only branch into one block, and the the next block only has current block as a predecessor?
  6070. if ((mcBlock->mSuccs.size() == 1) && (nextMcBlock->mPreds.size() == 1) && (nextMcBlock->mPreds[0] == mcBlock))
  6071. {
  6072. auto lastInst = mcBlock->mInstructions.back();
  6073. // Last instruction of current block is an unconditional branch to the next block
  6074. if ((lastInst->mKind == BeMCInstKind_Br) && (lastInst->mArg0.mBlock == nextMcBlock))
  6075. {
  6076. //auto itr = std::find(mcBlock->mSuccs.begin(), mcBlock->mSuccs.end(), nextMcBlock);
  6077. //mcBlock->mSuccs.erase(itr);
  6078. mcBlock->mSuccs.Remove(nextMcBlock);
  6079. for (auto succ : nextMcBlock->mSuccs)
  6080. {
  6081. //auto itr = std::find(mcBlock->mSuccs.begin(), mcBlock->mSuccs.end(), succ);
  6082. //if (itr == mcBlock->mSuccs.end())
  6083. if (!mcBlock->mSuccs.Contains(succ))
  6084. {
  6085. mcBlock->mSuccs.push_back(succ);
  6086. succ->mPreds.push_back(mcBlock);
  6087. }
  6088. /*itr = std::find(succ->mPreds.begin(), succ->mPreds.end(), nextMcBlock);
  6089. succ->mPreds.erase(itr);*/
  6090. succ->mPreds.Remove(nextMcBlock);
  6091. }
  6092. mcBlock->mMaxDeclBlockId = nextMcBlock->mMaxDeclBlockId;
  6093. mcBlock->mInstructions.pop_back();
  6094. for (auto inst : nextMcBlock->mInstructions)
  6095. mcBlock->mInstructions.push_back(inst);
  6096. mBlocks.RemoveAt(blockIdx + 1);
  6097. blockIdx--;
  6098. }
  6099. }
  6100. }
  6101. for (int blockIdx = 0; blockIdx < mBlocks.size(); blockIdx++)
  6102. mBlocks[blockIdx]->mBlockIdx = blockIdx;
  6103. }
  6104. void BeMCContext::DetectLoops()
  6105. {
  6106. BP_ZONE("BeMCContext::DetectLoops");
  6107. BeMCLoopDetector loopDetector(this);
  6108. loopDetector.DetectLoops();
  6109. }
  6110. void BeMCContext::RefreshRefCounts()
  6111. {
  6112. for (auto vregInfo : mVRegInfo)
  6113. {
  6114. if (vregInfo->mMustExist)
  6115. vregInfo->mRefCount = 1;
  6116. else
  6117. vregInfo->mRefCount = 0;
  6118. vregInfo->mAssignCount = 0;
  6119. }
  6120. for (auto mcBlock : mBlocks)
  6121. {
  6122. for (auto& inst : mcBlock->mInstructions)
  6123. {
  6124. if (inst->IsDef())
  6125. continue;
  6126. auto operands = { inst->mResult, inst->mArg0, inst->mArg1 };
  6127. for (auto op : operands)
  6128. {
  6129. if (op.IsVRegAny())
  6130. mVRegInfo[op.mVRegIdx]->mRefCount++;
  6131. if (op.mKind == BeMCOperandKind_VRegPair)
  6132. {
  6133. auto vreg0 = BeMCOperand::FromEncoded(op.mVRegPair.mVRegIdx0);
  6134. if (vreg0.IsVRegAny())
  6135. {
  6136. mVRegInfo[vreg0.mVRegIdx]->mRefCount++;
  6137. mVRegInfo[vreg0.mVRegIdx]->mAssignCount++;
  6138. }
  6139. auto vreg1 = BeMCOperand::FromEncoded(op.mVRegPair.mVRegIdx1);
  6140. if (vreg1.IsVRegAny())
  6141. mVRegInfo[vreg1.mVRegIdx]->mRefCount++;
  6142. }
  6143. }
  6144. if (inst->IsAssignment())
  6145. {
  6146. if (inst->mArg0.IsVRegAny())
  6147. mVRegInfo[inst->mArg0.mVRegIdx]->mAssignCount++;
  6148. }
  6149. if (inst->mResult)
  6150. {
  6151. if (inst->mResult.IsVRegAny())
  6152. mVRegInfo[inst->mResult.mVRegIdx]->mAssignCount++;
  6153. }
  6154. }
  6155. }
  6156. for (int vregIdx = 0; vregIdx < (int)mVRegInfo.size(); vregIdx++)
  6157. {
  6158. auto vregInfo = mVRegInfo[vregIdx];
  6159. if (vregInfo->mRefCount > 0)
  6160. AddRelRefs(BeMCOperand::FromVReg(vregIdx), 0);
  6161. }
  6162. }
  6163. bool BeMCContext::CheckVRegEqualityRange(BeMCBlock* mcBlock, int instIdx, const BeMCOperand& vreg0, const BeMCOperand& vreg1, BeMCRemapper& regRemaps, bool onlyCheckFirstLifetime)
  6164. {
  6165. // The algorithm here is that we check to see if either of these registers are ever written to
  6166. // up to the point that one of them dies. If not, we can map them to each other
  6167. bool foundSplitPoint = false;
  6168. bool hadPointerDeref = false;
  6169. for (int checkInstIdx = instIdx + 1; checkInstIdx < (int)mcBlock->mInstructions.size(); checkInstIdx++)
  6170. {
  6171. auto checkInst = mcBlock->mInstructions[checkInstIdx];
  6172. if ((!IsLive(checkInst->mLiveness, vreg0.mVRegIdx, regRemaps)) ||
  6173. ((!onlyCheckFirstLifetime) && (!IsLive(checkInst->mLiveness, vreg1.mVRegIdx, regRemaps))))
  6174. {
  6175. return true;
  6176. }
  6177. if ((checkInst->mKind == BeMCInstKind_LifetimeEnd) &&
  6178. ((checkInst->mArg0.mVRegIdx == vreg0.mVRegIdx) || (checkInst->mArg0.mVRegIdx == vreg1.mVRegIdx)))
  6179. {
  6180. if (checkInstIdx == (int)mcBlock->mInstructions.size() - 1)
  6181. {
  6182. // There are cases where this might be the last instruction in a block, so we won't see the mLiveness change
  6183. // so this catches that case
  6184. return true;
  6185. }
  6186. // We have cases like when have a "defer delete val;", val will get used by the dtor after the LifetimeEnd
  6187. return false;
  6188. }
  6189. if (hadPointerDeref)
  6190. {
  6191. // Pointer deref is okay as long as liveness ends one instruction afterwards
  6192. return false;
  6193. }
  6194. // Anything can happen during a call...
  6195. if (checkInst->mKind == BeMCInstKind_Call)
  6196. return false;
  6197. auto mcDest = checkInst->GetDest();
  6198. if ((mcDest != NULL) && (mcDest->mKind == BeMCOperandKind_VReg))
  6199. {
  6200. // Any assignment to either of these regs disqualifies them
  6201. if ((mcDest->mVRegIdx == vreg0.mVRegIdx) || (mcDest->mVRegIdx == vreg1.mVRegIdx))
  6202. return false;
  6203. // Any writing into memory could be aliased, so we don't replace across that boundary
  6204. if (HasPointerDeref(*mcDest))
  6205. {
  6206. // Delay the 'return false' until we determine if our liveness ends on the next instruction.
  6207. // If it does, then this is okay because it didn't affect the source of any operations
  6208. hadPointerDeref = true;
  6209. }
  6210. }
  6211. }
  6212. return false;
  6213. }
  6214. void BeMCContext::DoInstCombinePass()
  6215. {
  6216. BP_ZONE("BeMCContext::DoInstCombinePass");
  6217. BeMCRemapper regRemaps;
  6218. regRemaps.Init((int)mVRegInfo.size());
  6219. BeVTrackingValue vTrackingVal((int)mVRegInfo.size());
  6220. HashSet<int> wantUnwrapVRegs;
  6221. if (mDebugging)
  6222. {
  6223. NOP;
  6224. }
  6225. for (auto mcBlock : mBlocks)
  6226. {
  6227. BeDbgLoc* curDbgLoc = NULL;
  6228. int safeMergeLocStart = 0;
  6229. bool lastDefDidMerge = false;
  6230. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  6231. {
  6232. bool reprocessInst = false;
  6233. auto inst = mcBlock->mInstructions[instIdx];
  6234. BeMCInst* prevInst = NULL;
  6235. if (instIdx > 0)
  6236. prevInst = mcBlock->mInstructions[instIdx - 1];
  6237. if ((inst->mDbgLoc != curDbgLoc) && (inst->mDbgLoc != NULL))
  6238. {
  6239. safeMergeLocStart = instIdx;
  6240. curDbgLoc = inst->mDbgLoc;
  6241. }
  6242. if ((inst->mKind == BeMCInstKind_Call) || (inst->mKind == BeMCInstKind_MemCpy) || (inst->mKind == BeMCInstKind_MemSet))
  6243. {
  6244. // Don't merge anything across callsites or memory writes
  6245. safeMergeLocStart = instIdx;
  6246. }
  6247. auto instDest = inst->GetDest();
  6248. if ((instDest != NULL) && (HasPointerDeref(*instDest)))
  6249. {
  6250. // Memory aliasing may invalidate any accesses, don't merge expressions across here
  6251. safeMergeLocStart = instIdx + 1;
  6252. }
  6253. SetCurrentInst(inst);
  6254. //TODO: Remove
  6255. // if we've remapped other vregs onto this that aren't dead, then we can't end the value lifetime but we
  6256. // must end the lifetime of the visible debug variable
  6257. /*if (inst->mKind == BeMCInstKind_LifetimeEnd)
  6258. {
  6259. bool extendValue = false;
  6260. int vregIdx = inst->mArg0.mVRegIdx;
  6261. int checkIdx = regRemaps.GetHead(vregIdx);
  6262. while (checkIdx != -1)
  6263. {
  6264. if ((checkIdx != vregIdx) && (mLivenessContext.IsSet(inst->mLiveness, checkIdx)))
  6265. extendValue = true;
  6266. checkIdx = regRemaps.GetNext(checkIdx);
  6267. }
  6268. if (extendValue)
  6269. {
  6270. //Throw error
  6271. }
  6272. //inst->mKind = BeMCInstKind_LifetimeDbgEnd;
  6273. }*/
  6274. // Handle movs into .addrs
  6275. if (inst->mKind == BeMCInstKind_Mov)
  6276. {
  6277. auto vregInfoDest = GetVRegInfo(inst->mArg0);
  6278. if (vregInfoDest != NULL)
  6279. {
  6280. auto vregInfoSrc = GetVRegInfo(inst->mArg1);
  6281. if ((vregInfoSrc != NULL) && (vregInfoSrc->mForceMerge))
  6282. {
  6283. vregInfoSrc->mForceMerge = false;
  6284. if ((vregInfoDest->mDbgVariable != NULL) && (vregInfoSrc->CanEliminate()))
  6285. {
  6286. BF_ASSERT(!mVRegInitializedContext.IsSet(inst->mVRegsInitialized, inst->mArg0.mVRegIdx));
  6287. AddRegRemap(inst->mArg1.mVRegIdx, inst->mArg0.mVRegIdx, regRemaps);
  6288. // Remove any LifetimeStarts since our source may have been alive before us
  6289. //if (inst->mArg1.mVRegIdx < inst->mArg0.mVRegIdx)
  6290. //removeLifetimeStarts.insert(inst->mArg0.mVRegIdx);
  6291. }
  6292. }
  6293. }
  6294. }
  6295. // The following code only applies when we aren't on the last instruction
  6296. int nextIdx = instIdx + 1;
  6297. BeMCInst* nextInst = NULL;
  6298. while (true)
  6299. {
  6300. if (nextIdx >= (int)mcBlock->mInstructions.size())
  6301. break;
  6302. nextInst = mcBlock->mInstructions[nextIdx];
  6303. if (!nextInst->IsDef())
  6304. break;
  6305. nextIdx++;
  6306. }
  6307. if (nextInst == NULL)
  6308. continue;
  6309. // The following code only applies when we have at least 2 more instructions
  6310. // Find a non-Def instruction
  6311. int nextNextIdx = nextIdx + 1;
  6312. BeMCInst* nextNextInst = NULL;
  6313. while (true)
  6314. {
  6315. if (nextNextIdx >= (int)mcBlock->mInstructions.size())
  6316. break;
  6317. nextNextInst = mcBlock->mInstructions[nextNextIdx];
  6318. if (!nextNextInst->IsDef())
  6319. break;
  6320. nextNextIdx++;
  6321. }
  6322. auto result = RemapOperand(inst->mResult, regRemaps);
  6323. auto arg0 = RemapOperand(inst->mArg0, regRemaps);
  6324. auto arg1 = RemapOperand(inst->mArg1, regRemaps);
  6325. if (inst->IsDef())
  6326. {
  6327. auto vregInfo = mVRegInfo[inst->mArg0.mVRegIdx];
  6328. if (vregInfo->mIsExpr)
  6329. {
  6330. for (int checkInstIdx = safeMergeLocStart; checkInstIdx < instIdx; checkInstIdx++)
  6331. {
  6332. auto checkInst = mcBlock->mInstructions[checkInstIdx];
  6333. if (checkInst->IsDef())
  6334. {
  6335. auto checkArg0 = RemapOperand(checkInst->mArg0, regRemaps);
  6336. auto checkVRegInfo = mVRegInfo[checkArg0.mVRegIdx];
  6337. if (checkVRegInfo->mIsExpr)
  6338. {
  6339. // Remap to use the earlier definition of this expression
  6340. if (AreOperandsEquivalent(inst->mArg0, checkArg0, regRemaps))
  6341. {
  6342. vTrackingVal.Clear();
  6343. SetVTrackingValue(checkArg0, vTrackingVal);
  6344. // Check to make sure we didn't do any writes to any of the values used in the expression. This happens
  6345. // during "iVal++", for example.
  6346. bool hadBadWrite = false;
  6347. for (int verifyInstIdx = safeMergeLocStart; verifyInstIdx < instIdx; verifyInstIdx++)
  6348. {
  6349. auto verifyInst = mcBlock->mInstructions[verifyInstIdx];
  6350. auto verifyDest = verifyInst->GetDest();
  6351. if ((verifyDest != NULL) && (verifyDest->IsVRegAny()) && (vTrackingVal.mEntry->IsSet(verifyDest->mVRegIdx)))
  6352. {
  6353. hadBadWrite = true;
  6354. break;
  6355. }
  6356. }
  6357. if (!hadBadWrite)
  6358. {
  6359. auto vregInfoFrom = GetVRegInfo(inst->mArg0);
  6360. if (vregInfoFrom->mDbgVariable == NULL)
  6361. AddRegRemap(inst->mArg0.mVRegIdx, checkArg0.mVRegIdx, regRemaps, true);
  6362. }
  6363. break;
  6364. }
  6365. }
  6366. }
  6367. }
  6368. }
  6369. }
  6370. BeMCOperand origNextDestOperand;
  6371. if (nextInst->IsAssignment())
  6372. origNextDestOperand = nextInst->mArg0;
  6373. else if (nextInst->mResult)
  6374. origNextDestOperand = nextInst->mResult;
  6375. BeMCOperand nextDestOperand = RemapOperand(origNextDestOperand, regRemaps);
  6376. if (inst->mKind == BeMCInstKind_DefLoad)
  6377. {
  6378. auto vregInfoDest = GetVRegInfo(inst->mArg0);
  6379. auto mcLoaded = inst->mArg0;
  6380. auto mcAddr = vregInfoDest->mRelTo;
  6381. // We can only do a regRemap replace if we aren't the product of a pointer dereference
  6382. bool mapToDef = false;
  6383. if (mcAddr.mKind == BeMCOperandKind_VReg)
  6384. {
  6385. auto vregInfo = mVRegInfo[inst->mArg0.mVRegIdx];
  6386. // We do 'onlyCheckFirstLifetime' because we have cases like when have a "defer delete val;", because val will get used by the dtor after the LiftimeEnd
  6387. if ((vregInfo->IsDirectRelTo()) && (vregInfo->mDbgVariable == NULL) && (CheckVRegEqualityRange(mcBlock, instIdx, mcLoaded, mcAddr, regRemaps, true)))
  6388. {
  6389. // If the source value doesn't change in the lifetime of the loaded value then
  6390. // we can just map directly to the source - no copy needed.
  6391. inst->mKind = BeMCInstKind_Def;
  6392. AddRegRemap(inst->mArg0.mVRegIdx, vregInfoDest->mRelTo.mVRegIdx, regRemaps, true);
  6393. continue;
  6394. }
  6395. }
  6396. else if ((mcAddr.mKind == BeMCOperandKind_Symbol) || (mcAddr.mKind == BeMCOperandKind_SymbolAddr))
  6397. {
  6398. // No actual load needed - just keep it as a Direct reference
  6399. inst->mKind = BeMCInstKind_Def;
  6400. //wantUnwrapVRegs.Add(inst->mArg0.mVRegIdx);
  6401. continue;
  6402. }
  6403. bool hadPointerDeref = false;
  6404. for (int checkInstIdx = instIdx + 1; checkInstIdx < (int)mcBlock->mInstructions.size(); checkInstIdx++)
  6405. {
  6406. auto checkInst = mcBlock->mInstructions[checkInstIdx];
  6407. BF_ASSERT(mcLoaded.IsVRegAny());
  6408. if (!IsLive(checkInst->mLiveness, mcLoaded.mVRegIdx, regRemaps))
  6409. {
  6410. break;
  6411. }
  6412. if ((mcAddr.IsVRegAny()) && (!IsLive(checkInst->mLiveness, mcAddr.mVRegIdx, regRemaps)))
  6413. break;
  6414. if (hadPointerDeref)
  6415. {
  6416. // Pointer deref is okay as long as liveness ends one instruction afterwards
  6417. break;
  6418. }
  6419. auto mcDest = checkInst->GetDest();
  6420. if ((mcDest != NULL) &&
  6421. ((mcDest->mKind == BeMCOperandKind_VReg) || (mcDest->mKind == mcAddr.mKind)))
  6422. {
  6423. // Any assignment to either of these regs ends our remapping loop
  6424. if ((mcDest->mVRegIdx == mcLoaded.mVRegIdx) || (mcDest->mVRegIdx == mcAddr.mVRegIdx))
  6425. {
  6426. break;
  6427. }
  6428. // Any writing into memory could be aliased, so we don't replace across that boundary
  6429. if (HasPointerDeref(*mcDest))
  6430. {
  6431. // Delay the 'return false' until we determine if our liveness ends on the next instruction.
  6432. // If it does, then this is okay because it didn't affect the source of any operations
  6433. hadPointerDeref = true;
  6434. }
  6435. }
  6436. if (checkInst->IsInformational())
  6437. continue;
  6438. if (checkInst->mKind == BeMCInstKind_Call) // Anything can happen during a call
  6439. break;
  6440. if (checkInst->mDbgLoc != inst->mDbgLoc)
  6441. break;
  6442. auto operands = { &checkInst->mArg0, &checkInst->mArg1 };
  6443. for (auto& operand : operands)
  6444. {
  6445. // If we reference the loaded version during the range where the value hasn't changed,
  6446. // then just refer back to the original value. This is useful in cases like i++,
  6447. // where we want to be able to still do an INC on the source variable rather than
  6448. // "loadedI = i; i = loadedI + 1; ... use loadedI ..."
  6449. if ((operand->mKind == BeMCOperandKind_VReg) && (operand->mVRegIdx == mcLoaded.mVRegIdx))
  6450. {
  6451. *operand = mcAddr;
  6452. }
  6453. if ((operand->mKind == BeMCOperandKind_VRegLoad) && (operand->mVRegIdx == mcLoaded.mVRegIdx))
  6454. {
  6455. if (mcAddr.mKind == BeMCOperandKind_VReg)
  6456. {
  6457. operand->mVRegIdx = mcAddr.mVRegIdx;
  6458. }
  6459. }
  6460. }
  6461. }
  6462. }
  6463. // Check for the special case of a single move to a SRET dereference - if so, then make the source composite be the source value
  6464. if ((inst->mKind == BeMCInstKind_Mov) && (inst->mArg0.mKind == BeMCOperandKind_VRegLoad) && (inst->mArg1.mKind == BeMCOperandKind_VReg))
  6465. {
  6466. auto vregInfoDest = GetVRegInfo(inst->mArg0);
  6467. auto vregInfoSrc = GetVRegInfo(inst->mArg1);
  6468. if ((vregInfoDest->IsDirectRelTo()) && (vregInfoSrc->IsDirectRelTo()))
  6469. {
  6470. auto destRelTo = GetVRegInfo(vregInfoDest->mRelTo);
  6471. auto srcRelTo = GetVRegInfo(vregInfoSrc->mRelTo);
  6472. if ((destRelTo->mIsRetVal) && (vregInfoDest->mAssignCount == 1) &&
  6473. (!destRelTo->mIsExpr) && (!srcRelTo->mIsExpr))
  6474. {
  6475. mCompositeRetVRegIdx = vregInfoDest->mRelTo.mVRegIdx;
  6476. RemoveInst(mcBlock, instIdx);
  6477. srcRelTo->SetRetVal();
  6478. instIdx--;
  6479. continue;
  6480. }
  6481. }
  6482. }
  6483. // For the form:
  6484. // @Def %vreg0
  6485. // [%result] = <op> %vreg0, %vreg1
  6486. // Remap %vreg0 to %vreg1 if this is the only assignment, and thus an immutable definition, and vreg1 doesn't change
  6487. if ((nextDestOperand) &&
  6488. (((inst->mKind == BeMCInstKind_Def) && (arg0 == nextDestOperand)) ||
  6489. ((inst->mKind == BeMCInstKind_LifetimeStart) && (BeMCOperand::ToLoad(arg0) == nextDestOperand))))
  6490. {
  6491. lastDefDidMerge = false;
  6492. auto vregInfoDest = GetVRegInfo(nextDestOperand);
  6493. auto checkOperands = { &nextInst->mArg0, &nextInst->mArg1 };
  6494. bool checkArg1 = true;
  6495. if (nextInst->mResult)
  6496. {
  6497. if ((nextInst->mKind == BeMCInstKind_Add) || (nextInst->mKind == BeMCInstKind_Mul))
  6498. {
  6499. // These are commutative, so we can remap to either the LHS or RHS
  6500. checkArg1 = true;
  6501. }
  6502. else
  6503. {
  6504. // We can only remap to LHS
  6505. checkArg1 = false;
  6506. }
  6507. }
  6508. for (int argCheckIdx = (nextInst->mResult ? 0 : 1); argCheckIdx < (checkArg1 ? 2 : 1); argCheckIdx++)
  6509. {
  6510. BeMCOperand origCheckOperand;
  6511. if (argCheckIdx == 0)
  6512. origCheckOperand = nextInst->mArg0;
  6513. else
  6514. origCheckOperand = nextInst->mArg1;
  6515. auto checkOperand = RemapOperand(origCheckOperand, regRemaps);
  6516. if (checkOperand.mKind != BeMCOperandKind_VReg) // Loads/Addrs not applicable
  6517. continue;
  6518. auto vregInfoCheck = GetVRegInfo(checkOperand);
  6519. if (vregInfoCheck == NULL)
  6520. continue;
  6521. if ((vregInfoDest->mIsExpr) || (vregInfoCheck->mIsExpr))
  6522. continue;
  6523. if ((!vregInfoDest->mForceMerge) && (!vregInfoDest->mIsRetVal))
  6524. {
  6525. // If we merge to a vreg that has a pointer ref, that could be a deoptimization by not allowing
  6526. // either to bind to a register
  6527. if (vregInfoDest->mForceMem != vregInfoCheck->mForceMem)
  6528. {
  6529. if (!GetType(checkOperand)->IsComposite())
  6530. continue;
  6531. }
  6532. }
  6533. // We have a special retVal case where we can allow the __returnVal to share an address with the
  6534. // actual 'ret' param. This is most useful when returning structs by value, to avoid a copy.
  6535. // The only downside is that editing the return value in the debugger will also show the value
  6536. // of the ret param changing, which is normally not acceptable but in this case we allow it.
  6537. bool allowCoexist = ((vregInfoDest->mIsRetVal) ||
  6538. (vregInfoCheck->CanEliminate()) || (vregInfoDest->CanEliminate()));
  6539. // Only vregs of the same types can be merged
  6540. if (!AreTypesEquivalent(vregInfoCheck->mType, vregInfoDest->mType))
  6541. continue;
  6542. bool canMerge = false;
  6543. if ((nextInst->IsMov()) && (allowCoexist))
  6544. {
  6545. if ((vregInfoCheck->mForceMerge) || (vregInfoCheck->mIsRetVal))
  6546. canMerge = true; // This is to allow the incoming vregs to combine with the ".addr" debug variables
  6547. else // Always use orig operands for liveness checking
  6548. canMerge = CheckVRegEqualityRange(mcBlock, nextIdx, origCheckOperand, origNextDestOperand, regRemaps);
  6549. }
  6550. else
  6551. {
  6552. // If we're dealing with a non-Mov instruction, then the values of both of these vregs will
  6553. // be different after the instruction, so we can only map them if the incoming vreg will be dead
  6554. // afterwards. If both are dbgVariables then we can't allow them to coeexist because the user
  6555. // could edit one of the values in the debugger and we don't want the other one changing.
  6556. if ((nextNextInst != NULL) &&
  6557. (!IsLive(nextNextInst->mLiveness, origCheckOperand.mVRegIdx, regRemaps)) &&
  6558. (!IsLive(nextNextInst->mLiveness, checkOperand.mVRegIdx, regRemaps)))
  6559. canMerge = true;
  6560. }
  6561. if (canMerge)
  6562. {
  6563. if (vregInfoCheck->mForceMerge)
  6564. vregInfoCheck->mForceMerge = false; // Only allow one merge
  6565. lastDefDidMerge = true;
  6566. if (vregInfoDest->mIsRetVal)
  6567. {
  6568. // We don't do a remap for this return value optimization, because we want both vregs
  6569. // to still show in the debugger - even though they will point to the same address
  6570. // now (in the case of a struct return)
  6571. vregInfoCheck->SetRetVal();
  6572. //BF_ASSERT(mCompositeRetVRegIdx != -1);
  6573. //vregInfoCheck->mRelTo = BeMCOperand::FromVReg(mCompositeRetVRegIdx);
  6574. break;
  6575. }
  6576. if ((vregInfoCheck->mDbgVariable != NULL) && (vregInfoDest->mDbgVariable != NULL))
  6577. {
  6578. // We want separate vreg info so we can track the mDbgVariable separately, but we do want
  6579. // the same location
  6580. vregInfoDest->mIsExpr = true;
  6581. vregInfoDest->mRelTo.mKind = BeMCOperandKind_VReg;
  6582. vregInfoDest->mRelTo.mVRegIdx = checkOperand.mVRegIdx;
  6583. }
  6584. else
  6585. {
  6586. // Replace %vreg0 with %vreg1?
  6587. if (vregInfoDest->CanEliminate())
  6588. {
  6589. bool canReplace = true;
  6590. if (canReplace)
  6591. {
  6592. AddRegRemap(nextDestOperand.mVRegIdx, checkOperand.mVRegIdx, regRemaps);
  6593. break;
  6594. }
  6595. }
  6596. // Or go the other way, and make %vreg1 use our variable directly since we're just handing off anyway
  6597. if (vregInfoCheck->CanEliminate())
  6598. {
  6599. if (vregInfoCheck->mIsRetVal)
  6600. {
  6601. vregInfoDest->SetRetVal();
  6602. //BF_ASSERT(mCompositeRetVRegIdx != -1);
  6603. //vregInfoCheck->mRelTo = BeMCOperand::FromVReg(mCompositeRetVRegIdx);
  6604. }
  6605. AddRegRemap(checkOperand.mVRegIdx, nextDestOperand.mVRegIdx, regRemaps);
  6606. if (vregInfoDest->mNaturalReg == X64Reg_None)
  6607. vregInfoDest->mNaturalReg = vregInfoCheck->mNaturalReg;
  6608. break;
  6609. }
  6610. }
  6611. }
  6612. }
  6613. }
  6614. //if (mDebugging)
  6615. {
  6616. // For the form
  6617. // Def %vreg0
  6618. // Mov %vreg0, %vreg1
  6619. // <Op> <Arg>, %vreg0
  6620. // Where vreg0 has no other references, convert to
  6621. // <Op> <arg>, &vreg1
  6622. if ((inst->mKind == BeMCInstKind_Def) && (nextInst->mKind == BeMCInstKind_Mov) && (nextNextInst != NULL))
  6623. {
  6624. auto vregInfo = GetVRegInfo(inst->mArg0);
  6625. if ((vregInfo->mRefCount == 2) && (inst->mArg0 == nextInst->mArg0) && (!nextInst->mArg1.IsNativeReg()) &&
  6626. (nextNextInst->mArg0 != nextInst->mArg0) && (nextNextInst->mArg1 == nextInst->mArg0) &&
  6627. (AreTypesEquivalent(GetType(inst->mArg0), GetType(nextInst->mArg1))))
  6628. {
  6629. nextNextInst->mArg1 = nextInst->mArg1;
  6630. RemoveInst(mcBlock, instIdx);
  6631. RemoveInst(mcBlock, instIdx);
  6632. instIdx--;
  6633. continue;
  6634. }
  6635. }
  6636. }
  6637. // For the form
  6638. // <BinOp> %vreg0, %vreg1
  6639. // Test %vreg0, 1
  6640. // Remove test, because the BinOp will already set the correct flags
  6641. if ((nextInst->mKind == BeMCInstKind_Test) && (nextInst->mArg1.IsImmediateInt()) && (nextInst->mArg1.mImmediate == 1) &&
  6642. (nextInst->mArg0 == inst->mArg0))
  6643. {
  6644. if ((inst->mKind == BeMCInstKind_Xor) || (inst->mKind == BeMCInstKind_Or) || (inst->mKind == BeMCInstKind_And))
  6645. {
  6646. BF_ASSERT(!inst->mResult);
  6647. RemoveInst(mcBlock, instIdx + 1);
  6648. instIdx--;
  6649. continue;
  6650. }
  6651. }
  6652. if (inst->mResult)
  6653. {
  6654. auto nextArg0 = RemapOperand(nextInst->mArg0, regRemaps);
  6655. auto nextArg1 = RemapOperand(nextInst->mArg1, regRemaps);
  6656. // For the form:
  6657. // %vreg2 = <op> %vreg0, %vreg1
  6658. // Mov %vreg3, %vreg2
  6659. // If %vreg2 has no other references, combine into
  6660. // %vreg3 = <op> %vreg0, %vreg1
  6661. if ((nextInst->IsMov()) && (result == nextArg1))
  6662. {
  6663. // We purposely check inst->mResult here rather than 'result', because that ref count is our
  6664. // indication of whether the result was actually used again
  6665. auto vregInfo = GetVRegInfo(inst->mResult);
  6666. if ((vregInfo != NULL) && (vregInfo->mRefCount == 2) && (vregInfo->CanEliminate()))
  6667. {
  6668. // Make sure the MOV isn't a conversion
  6669. auto movArg0Type = GetType(nextInst->mArg0);
  6670. auto movArg1Type = GetType(nextInst->mArg1);
  6671. if (AreTypesEquivalent(movArg0Type, movArg1Type))
  6672. {
  6673. // We actually eliminate the current inst incase there was a Def between the two,
  6674. // otherwise the Def would occur AFTER the assignment which would be bad
  6675. nextInst->mResult = nextInst->mArg0;
  6676. nextInst->mKind = inst->mKind;
  6677. nextInst->mArg0 = inst->mArg0;
  6678. nextInst->mArg1 = inst->mArg1;
  6679. RemoveInst(mcBlock, instIdx);
  6680. instIdx--;
  6681. continue;
  6682. }
  6683. }
  6684. }
  6685. if (inst->IsCommutable())
  6686. {
  6687. if ((nextInst->IsMov()) && (arg1 == nextArg0) && (result == nextArg1))
  6688. {
  6689. break;
  6690. }
  6691. }
  6692. // For the form:
  6693. // %vreg2 = <op> %vreg0, %vreg1
  6694. // If %vreg0 ends its life on this instruction,
  6695. // Replace all instances of %vreg2 with %vreg0
  6696. if ((inst->mResult.mKind == BeMCOperandKind_VReg) && (inst->mArg0.mKind == BeMCOperandKind_VReg) &&
  6697. (inst->mResult != inst->mArg0))
  6698. {
  6699. // Check liveness against both the orig arg0 and the remap
  6700. //if ((!nextInst->mLiveness->IsSet(inst->mArg0.mVRegIdx)) && (!nextInst->mLiveness->IsSet(arg0.mVRegIdx)))
  6701. if (!IsLive(nextInst->mLiveness, inst->mArg0.mVRegIdx, regRemaps))
  6702. {
  6703. // Only do a full regRemap if this is the def initialization
  6704. if ((prevInst != NULL) && (prevInst->mKind == BeMCInstKind_Def) && (prevInst->mArg0.mVRegIdx == inst->mResult.mVRegIdx))
  6705. {
  6706. auto vregInfoResult = GetVRegInfo(result);
  6707. auto vregInfo0 = GetVRegInfo(arg0);
  6708. if ((vregInfoResult->CanEliminate()) && (!vregInfo0->mIsExpr))
  6709. {
  6710. AddRegRemap(inst->mResult.mVRegIdx, arg0.mVRegIdx, regRemaps);
  6711. }
  6712. }
  6713. }
  6714. }
  6715. }
  6716. if (inst->mKind == BeMCInstKind_RestoreVolatiles)
  6717. {
  6718. if (mcBlock == mBlocks.back())
  6719. {
  6720. bool hadInvalidInst = false;
  6721. for (int checkInstIdx = instIdx + 1; checkInstIdx < (int)mcBlock->mInstructions.size(); checkInstIdx++)
  6722. {
  6723. auto checkInst = mcBlock->mInstructions[checkInstIdx];
  6724. if ((checkInst->mKind != BeMCInstKind_DbgDecl) &&
  6725. (checkInst->mKind != BeMCInstKind_EnsureInstructionAt) &&
  6726. (checkInst->mKind != BeMCInstKind_Ret))
  6727. {
  6728. hadInvalidInst = true;
  6729. break;
  6730. }
  6731. }
  6732. if (!hadInvalidInst)
  6733. {
  6734. // We return after this, we don't need to restore volatiles
  6735. inst->mArg1 = BeMCOperand::FromPreserveFlag(BeMCPreserveFlag_NoRestore);
  6736. continue;
  6737. }
  6738. }
  6739. }
  6740. if (nextNextInst == NULL)
  6741. {
  6742. if (reprocessInst)
  6743. instIdx--;
  6744. continue;
  6745. }
  6746. // For the form
  6747. // Xor &vreg0, 1
  6748. // CondBr <label>, <op>
  6749. // If vreg0 dies at the end, convert to to:
  6750. // Test &veg0, 1
  6751. // CondBr <label>, ~<op>
  6752. // This is advantageous because Test is a non-modifying instruction so we can hopefully elide a copy
  6753. if ((inst->mKind == BeMCInstKind_Xor) &&
  6754. (nextInst->mKind == BeMCInstKind_CondBr))
  6755. {
  6756. auto vregInfo = GetVRegInfo(inst->mArg0);
  6757. if ((vregInfo != NULL) && (!IsLive(nextNextInst->mLiveness, inst->mArg0.mVRegIdx, regRemaps)))
  6758. {
  6759. inst->mKind = BeMCInstKind_Test;
  6760. BF_ASSERT(nextInst->mArg1.mKind == BeMCOperandKind_CmpKind);
  6761. nextInst->mArg1.mCmpKind = BeModule::InvertCmp(nextInst->mArg1.mCmpKind);
  6762. if ((instIdx >= 2) && (!lastDefDidMerge))
  6763. {
  6764. auto defInst = mcBlock->mInstructions[instIdx - 2];
  6765. if ((defInst->mKind == BeMCInstKind_Def) && (defInst->mArg0 == inst->mArg0))
  6766. {
  6767. // Go back and try to eliminate this vreg
  6768. instIdx -= 3;
  6769. continue;
  6770. }
  6771. }
  6772. }
  6773. }
  6774. // For the form:
  6775. // %vreg0 = CmpToBool <cmpType>
  6776. // Test %vreg0, %vreg0
  6777. // CondBr %label, eq
  6778. // If %vreg0 has no other references, convert to:
  6779. // CondBr %label, <cmpType>
  6780. if ((inst->mKind == BeMCInstKind_CmpToBool) &&
  6781. (nextInst->mKind == BeMCInstKind_Test) && (nextInst->mArg0 == nextInst->mArg1) &&
  6782. (nextNextInst->mKind == BeMCInstKind_CondBr) &&
  6783. (nextInst->mArg0 == inst->mResult))
  6784. {
  6785. auto vregInfo = GetVRegInfo(inst->mResult);
  6786. if ((vregInfo != NULL) && (vregInfo->mRefCount == 3))
  6787. {
  6788. BF_ASSERT(nextNextInst->mArg1.mKind == BeMCOperandKind_CmpKind);
  6789. nextNextInst->mArg1.mCmpKind = inst->mArg0.mCmpKind;
  6790. RemoveInst(mcBlock, nextIdx);
  6791. RemoveInst(mcBlock, instIdx);
  6792. instIdx--;
  6793. }
  6794. }
  6795. if (reprocessInst)
  6796. instIdx--;
  6797. }
  6798. }
  6799. SetCurrentInst(NULL);
  6800. Dictionary<int, int> regRemapMap;
  6801. for (int vregIdx = 0; vregIdx < (int)mVRegInfo.size(); vregIdx++)
  6802. {
  6803. int remapIdx = regRemaps.GetHead(vregIdx);
  6804. if (remapIdx != vregIdx)
  6805. regRemapMap[vregIdx] = remapIdx;
  6806. }
  6807. // We want to keep the earliest @Def and remap (in necessary) the later one
  6808. // For remaps, the liveVRregIdx will always indicate which @Def occurs earlier,
  6809. // unless there's a case I haven't considered
  6810. Dictionary<int, int> defMap;
  6811. for (auto& remapPair : regRemapMap)
  6812. {
  6813. int remapFrom = remapPair.mKey;
  6814. int remapTo = remapPair.mValue;
  6815. if (remapTo < 0)
  6816. continue;
  6817. auto vregInfoFrom = mVRegInfo[remapFrom];
  6818. auto vregInfoTo = mVRegInfo[remapTo];
  6819. int bestVRegIdx = (vregInfoFrom->mDefOrderIdx < vregInfoTo->mDefOrderIdx) ? remapFrom : remapTo;
  6820. //auto itr = defMap.find(remapTo);
  6821. //if (itr != defMap.end())
  6822. int* prevBestVRegIdxPtr = NULL;
  6823. if (defMap.TryGetValue(remapTo, &prevBestVRegIdxPtr))
  6824. {
  6825. auto prevBestVRegIdx = *prevBestVRegIdxPtr;
  6826. if (mVRegInfo[bestVRegIdx]->mDefOrderIdx < mVRegInfo[prevBestVRegIdx]->mDefOrderIdx)
  6827. defMap[remapTo] = bestVRegIdx;
  6828. }
  6829. else
  6830. defMap[remapTo] = bestVRegIdx;
  6831. }
  6832. // We have a many-to-one relation so we have to use both a
  6833. HashSet<int> keepDefs;
  6834. for (auto& defPair : defMap)
  6835. keepDefs.Add(defPair.mValue);
  6836. HashSet<int> removeDefs;
  6837. for (auto& remapPair : regRemapMap)
  6838. {
  6839. /*if (keepDefs.find(remapPair.first) == keepDefs.end())
  6840. removeDefs.insert(remapPair.first);*/
  6841. removeDefs.Add(remapPair.mKey);
  6842. /*if (keepDefs.find(remapPair.second) == keepDefs.end())
  6843. removeDefs.insert(remapPair.second);*/
  6844. keepDefs.Add(remapPair.mValue);
  6845. auto vregInfoFrom = mVRegInfo[remapPair.mKey];
  6846. auto vregInfoTo = mVRegInfo[remapPair.mValue];
  6847. if (vregInfoFrom->mHasDynLife)
  6848. vregInfoTo->mHasDynLife = true;
  6849. }
  6850. auto _RemapOperand = [&](BeMCOperand* operand)
  6851. {
  6852. if (operand->IsVRegAny())
  6853. {
  6854. int* regIdxPtr = NULL;
  6855. if (regRemapMap.TryGetValue(operand->mVRegIdx, &regIdxPtr))
  6856. {
  6857. int regIdx = *regIdxPtr;
  6858. if (regIdx < 0)
  6859. {
  6860. if (operand->mKind == BeMCOperandKind_VRegLoad)
  6861. operand->mKind = BeMCOperandKind_VReg;
  6862. else
  6863. NotImpl();
  6864. operand->mVRegIdx = -regIdx;
  6865. }
  6866. else
  6867. {
  6868. operand->mVRegIdx = regIdx;
  6869. }
  6870. }
  6871. }
  6872. if (operand->IsVRegAny())
  6873. {
  6874. if (wantUnwrapVRegs.Contains(operand->mVRegIdx))
  6875. {
  6876. // Replace any rel-to symbol info with direct references to those symbols
  6877. auto vregInfo = mVRegInfo[operand->mVRegIdx];
  6878. BF_ASSERT(vregInfo->IsDirectRelToAny());
  6879. if (operand->mKind == BeMCOperandKind_VReg)
  6880. *operand = vregInfo->mRelTo;
  6881. else if (operand->mKind == BeMCOperandKind_VRegAddr)
  6882. *operand = BeMCOperand::ToAddr(vregInfo->mRelTo);
  6883. }
  6884. }
  6885. };
  6886. if ((!regRemapMap.IsEmpty()) || (!wantUnwrapVRegs.IsEmpty()))
  6887. {
  6888. for (auto mcBlock : mBlocks)
  6889. {
  6890. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  6891. {
  6892. auto inst = mcBlock->mInstructions[instIdx];
  6893. if (inst->IsDef())
  6894. {
  6895. //auto itr = removeDefs.find(inst->mArg0.mVRegIdx);
  6896. //if (itr != removeDefs.end())
  6897. if ((removeDefs.Contains(inst->mArg0.mVRegIdx)) || (wantUnwrapVRegs.Contains(inst->mArg0.mVRegIdx)))
  6898. {
  6899. RemoveInst(mcBlock, instIdx);
  6900. instIdx--;
  6901. continue;
  6902. }
  6903. }
  6904. /*if (inst->mKind == BeMCInstKind_LifetimeStart)
  6905. {
  6906. if (removeLifetimeStarts.find(inst->mArg0.mVRegIdx) != removeLifetimeStarts.end())
  6907. {
  6908. RemoveInst(mcBlock, instIdx);
  6909. instIdx--;
  6910. continue;
  6911. }
  6912. }*/
  6913. auto operands = { &inst->mResult, &inst->mArg0, &inst->mArg1 };
  6914. for (auto& operand : operands)
  6915. {
  6916. _RemapOperand(operand);
  6917. }
  6918. }
  6919. }
  6920. for (auto vregInfo : mVRegInfo)
  6921. {
  6922. auto operands = { &vregInfo->mRelTo, &vregInfo->mRelOffset };
  6923. for (auto& operand : operands)
  6924. {
  6925. if (operand->IsVRegAny())
  6926. {
  6927. RemapOperand(*operand, regRemaps);
  6928. _RemapOperand(operand);
  6929. }
  6930. }
  6931. }
  6932. }
  6933. }
  6934. void BeMCContext::DoRegAssignPass()
  6935. {
  6936. BP_ZONE("BeMCContext::DoRegAssignPass");
  6937. bool generateLiveness = true;
  6938. //
  6939. if (generateLiveness)
  6940. {
  6941. for (auto& node : mColorizer.mNodes)
  6942. {
  6943. node.mEdges.Clear();
  6944. }
  6945. mColorizer.Prepare();
  6946. GenerateLiveness();
  6947. }
  6948. else
  6949. {
  6950. mColorizer.Prepare();
  6951. }
  6952. mColorizer.GenerateRegCosts();
  6953. //
  6954. {
  6955. BP_ZONE("BeMCContext::DoRegAssignPass:ints");
  6956. mColorizer.AssignRegs(BeMCColorizer::RegKind_Ints);
  6957. }
  6958. //
  6959. {
  6960. BP_ZONE("BeMCContext::DoRegAssignPass:float");
  6961. mColorizer.AssignRegs(BeMCColorizer::RegKind_Floats);
  6962. }
  6963. #ifdef _DEBUG
  6964. BF_ASSERT(mColorizer.Validate());
  6965. for (int vregIdx = 0; vregIdx < (int)mVRegInfo.size(); vregIdx++)
  6966. {
  6967. auto vregInfo = mVRegInfo[vregIdx];
  6968. if (vregInfo->mRefCount == 0)
  6969. continue;
  6970. if ((vregInfo->mIsRetVal) && (mCompositeRetVRegIdx != -1) && (vregIdx != mCompositeRetVRegIdx))
  6971. continue;
  6972. if ((vregInfo->mForceReg) && (!vregInfo->mRelTo) && (vregInfo->mReg == X64Reg_None))
  6973. {
  6974. Fail("Failed to assign register to ForceReg vreg");
  6975. }
  6976. if (vregInfo->mDisableRAX)
  6977. {
  6978. BF_ASSERT(ResizeRegister(vregInfo->mReg, 8) != X64Reg_RAX);
  6979. }
  6980. if (vregInfo->mDisableRDX)
  6981. {
  6982. BF_ASSERT(ResizeRegister(vregInfo->mReg, 8) != X64Reg_RDX);
  6983. }
  6984. if (vregInfo->mDisableR11)
  6985. {
  6986. BF_ASSERT(ResizeRegister(vregInfo->mReg, 8) != X64Reg_R11);
  6987. }
  6988. if (vregInfo->mDisableR12)
  6989. {
  6990. BF_ASSERT(ResizeRegister(vregInfo->mReg, 8) != X64Reg_R12);
  6991. }
  6992. if (vregInfo->mDisableR13)
  6993. {
  6994. BF_ASSERT(ResizeRegister(vregInfo->mReg, 8) != X64Reg_R13);
  6995. }
  6996. }
  6997. #endif
  6998. }
  6999. void BeMCContext::DoFrameObjPass()
  7000. {
  7001. BF_ASSERT(mBlocks.size() == 1);
  7002. SetCurrentInst(NULL);
  7003. // MS x64 ABI requires a "home address" of 4 intptrs when we call a function, plus whatever
  7004. // we need for calls with more than 4 params.
  7005. // If we're doing UseBP, we have to allocate these at call time
  7006. int homeSize = BF_ALIGN(BF_MAX(mMaxCallParamCount, 4) * 8, 16);
  7007. mStackSize = 0;
  7008. if (mUseBP)
  7009. mUsedRegs.Add(X64Reg_RBP);
  7010. int regStackOffset = 0;
  7011. int xmmRegStackSize = 0;
  7012. for (auto usedReg : mUsedRegs)
  7013. {
  7014. if (!IsVolatileReg(usedReg))
  7015. {
  7016. BF_ASSERT(usedReg != X64Reg_RSP);
  7017. if (IsXMMReg(usedReg))
  7018. xmmRegStackSize += 16;
  7019. else
  7020. regStackOffset += 8;
  7021. }
  7022. }
  7023. int xmmStackOffset = -1;
  7024. if (xmmRegStackSize > 0)
  7025. {
  7026. int align = 16;
  7027. int alignOffset = regStackOffset + 8;
  7028. int alignedPosition = (mStackSize + alignOffset + (align - 1)) & ~(align - 1);
  7029. mStackSize = alignedPosition - alignOffset;
  7030. mStackSize += xmmRegStackSize;
  7031. xmmStackOffset = -mStackSize - regStackOffset;
  7032. }
  7033. for (int vregIdx = 0; vregIdx < (int)mVRegInfo.size(); vregIdx++)
  7034. {
  7035. auto vregInfo = mVRegInfo[vregIdx];
  7036. if ((vregInfo->mIsRetVal) && (vregIdx != mCompositeRetVRegIdx))
  7037. continue;
  7038. if ((vregInfo->mRefCount > 0) && (!vregInfo->mIsExpr) && (vregInfo->mReg == X64Reg_None) && (vregInfo->mFrameOffset == INT_MIN))
  7039. {
  7040. BF_ASSERT(vregInfo->mAlign != -1);
  7041. int align = BF_MAX(vregInfo->mAlign, 1);
  7042. int alignOffset = regStackOffset + 8;
  7043. int alignedPosition = (mStackSize + alignOffset + (align - 1)) & ~(align - 1);
  7044. mStackSize = alignedPosition - alignOffset;
  7045. //vregInfo->mFrameOffset = -mStackSize - regStackOffset - 8;
  7046. mStackSize += BF_ALIGN(vregInfo->mType->mSize, vregInfo->mAlign);
  7047. vregInfo->mFrameOffset = -mStackSize - regStackOffset;
  7048. }
  7049. }
  7050. // If we have dynamic stack resizing then we have a stack frame and must be 16-byte aligned
  7051. // even if we're a leaf function
  7052. bool mHasFramePointer = false;
  7053. // Potentially pull off retaddr bytes if alignment allows --
  7054. // Stack must be aligned to 16 bytes and retaddr offsets us by 8,
  7055. // so we must always offset by 0x?8
  7056. int align = 8;
  7057. mStackSize = (mStackSize + (align - 1)) & ~(align - 1);
  7058. //if (!mUseBP)
  7059. {
  7060. // MS x64 ABI requires a "home address" of 4 intptrs when we call a function, plus whatever
  7061. // we need for calls with more than 4 params.
  7062. // If we're doing UseBP, we have to allocate these at call time
  7063. if (mMaxCallParamCount != -1)
  7064. {
  7065. mStackSize += homeSize;
  7066. // Even param counts, to align to 16 bytes.
  7067. // Minimum is space for 4 params
  7068. //int paramSpace = (std::max(mMaxCallParamCount, 4) + 1) & ~1;
  7069. //mStackSize += paramSpace * 8;
  7070. }
  7071. }
  7072. int stackAdjust = mStackSize;
  7073. mStackSize += regStackOffset;
  7074. if ((mStackSize != 0) && (mStackSize % 16 == 0))
  7075. {
  7076. mStackSize += 8;
  7077. stackAdjust += 8;
  7078. }
  7079. mActiveBlock = mBlocks[0];
  7080. if (mUseBP)
  7081. {
  7082. AllocInst(BeMCInstKind_Unwind_SetBP, 0);
  7083. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(X64Reg_RBP), BeMCOperand::FromReg(X64Reg_RSP), 0);
  7084. }
  7085. int xmmRegIdx = 0;
  7086. for (auto usedReg : mUsedRegs)
  7087. {
  7088. if ((!IsVolatileReg(usedReg)) && (IsXMMReg(usedReg)))
  7089. {
  7090. AllocInst(BeMCInstKind_Unwind_SaveXMM, BeMCOperand::FromReg(usedReg), BeMCOperand::FromImmediate(mStackSize + xmmStackOffset + xmmRegIdx * 16), 0);
  7091. AllocInst(BeMCInstKind_Push, BeMCOperand::FromReg(usedReg), BeMCOperand::FromImmediate(mStackSize + xmmStackOffset + xmmRegIdx * 16), 0);
  7092. xmmRegIdx++;
  7093. }
  7094. }
  7095. if (stackAdjust > 0)
  7096. {
  7097. AllocInst(BeMCInstKind_Unwind_Alloc, BeMCOperand::FromImmediate(stackAdjust), 0);
  7098. AllocInst(BeMCInstKind_Sub, BeMCOperand::FromReg(X64Reg_RSP), BeMCOperand::FromImmediate(stackAdjust), 0);
  7099. if (stackAdjust >= 4096)
  7100. {
  7101. BeMCOperand mcFunc;
  7102. mcFunc.mKind = BeMCOperandKind_SymbolAddr;
  7103. mcFunc.mSymbolIdx = mCOFFObject->GetSymbolRef("__chkstk")->mIdx;
  7104. AllocInst(BeMCInstKind_Call, mcFunc, 0);
  7105. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(X64Reg_RAX), BeMCOperand::FromImmediate(stackAdjust), 0);
  7106. }
  7107. }
  7108. for (auto usedReg : mUsedRegs)
  7109. {
  7110. if ((!IsVolatileReg(usedReg)) && (!IsXMMReg(usedReg)))
  7111. {
  7112. AllocInst(BeMCInstKind_Unwind_PushReg, BeMCOperand::FromReg(usedReg), 0);
  7113. AllocInst(BeMCInstKind_Push, BeMCOperand::FromReg(usedReg), 0);
  7114. }
  7115. }
  7116. BeMCOperand restoreBPVal;
  7117. if (mUseBP)
  7118. {
  7119. auto nativeType = mModule->mContext->GetPrimitiveType(BeTypeCode_Int64);
  7120. restoreBPVal = AllocVirtualReg(nativeType);
  7121. auto restoreBPVReg = mVRegInfo[restoreBPVal.mVRegIdx];
  7122. restoreBPVReg->mIsExpr = true;
  7123. restoreBPVReg->mRelTo = BeMCOperand::FromReg(X64Reg_RBP);
  7124. restoreBPVReg->mRelOffset = BeMCOperand::FromImmediate(stackAdjust);
  7125. restoreBPVal.mKind = BeMCOperandKind_VReg;
  7126. }
  7127. for (int instIdx = 0; instIdx < (int)mActiveBlock->mInstructions.size(); instIdx++)
  7128. {
  7129. auto checkInst = mActiveBlock->mInstructions[instIdx];
  7130. if (checkInst->mKind == BeMCInstKind_Ret)
  7131. {
  7132. mCurDbgLoc = checkInst->mDbgLoc;
  7133. int insertIdx = instIdx;
  7134. int xmmRegIdx = 0;
  7135. for (auto usedReg : mUsedRegs)
  7136. {
  7137. if ((!IsVolatileReg(usedReg)) && (IsXMMReg(usedReg)))
  7138. {
  7139. AllocInst(BeMCInstKind_Pop, BeMCOperand::FromReg(usedReg), BeMCOperand::FromImmediate(mStackSize + xmmStackOffset + xmmRegIdx * 16), insertIdx++);
  7140. xmmRegIdx++;
  7141. }
  7142. }
  7143. if (mUseBP)
  7144. {
  7145. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(X64Reg_RSP), restoreBPVal, insertIdx++);
  7146. }
  7147. else if (stackAdjust > 0)
  7148. {
  7149. AllocInst(BeMCInstKind_Add, BeMCOperand::FromReg(X64Reg_RSP), BeMCOperand::FromImmediate(stackAdjust), insertIdx++);
  7150. instIdx++;
  7151. }
  7152. for (auto usedReg : mUsedRegs)
  7153. {
  7154. if ((!IsVolatileReg(usedReg)) && (!IsXMMReg(usedReg)))
  7155. AllocInst(BeMCInstKind_Pop, BeMCOperand::FromReg(usedReg), insertIdx++);
  7156. }
  7157. instIdx = insertIdx;
  7158. }
  7159. }
  7160. }
  7161. static int gLegalizeIdx = 0;
  7162. void BeMCContext::DoActualization()
  7163. {
  7164. while (true)
  7165. {
  7166. bool hasMoreWork = false;
  7167. for (auto mcBlock : mBlocks)
  7168. {
  7169. mActiveBlock = mcBlock;
  7170. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  7171. {
  7172. auto inst = mcBlock->mInstructions[instIdx];
  7173. SetCurrentInst(inst);
  7174. if (inst->mKind == BeMCInstKind_DbgDecl)
  7175. {
  7176. auto vregInfo = GetVRegInfo(inst->mArg0);
  7177. if (vregInfo->mWantsExprActualize)
  7178. {
  7179. if (inst->mArg0.mKind == BeMCOperandKind_VReg)
  7180. {
  7181. if (vregInfo->mDbgVariable->mIsValue)
  7182. {
  7183. vregInfo->mDbgVariable->mIsValue = false;
  7184. inst->mArg0.mKind = BeMCOperandKind_VRegAddr;
  7185. }
  7186. else
  7187. {
  7188. inst->mArg0.mKind = BeMCOperandKind_VRegAddr;
  7189. vregInfo->mDbgVariable->mType = mModule->mDbgModule->CreateReferenceType(vregInfo->mDbgVariable->mType);
  7190. }
  7191. // if (auto ptrType = BeValueDynCast<BeDbgPointerType>(vregInfo->mDbgVariable->mType))
  7192. // vregInfo->mDbgVariable->mType = ptrType->mElement;
  7193. // if (vregInfo->mType->IsPointer())
  7194. // vregInfo->mType = ((BePointerType*)vregInfo->mType)->mElementType;
  7195. }
  7196. vregInfo->mWantsExprActualize = false;
  7197. }
  7198. }
  7199. if (inst->IsDef())
  7200. {
  7201. int vregIdx = inst->mArg0.mVRegIdx;
  7202. auto vregInfo = GetVRegInfo(inst->mArg0);
  7203. if (vregInfo->mWantsExprActualize)
  7204. {
  7205. if (vregInfo->mDbgVariable != NULL)
  7206. {
  7207. // Wait until dbgDecl so we can potentially set to VRegAddr
  7208. }
  7209. else
  7210. {
  7211. vregInfo->mWantsExprActualize = false;
  7212. }
  7213. BF_ASSERT((!vregInfo->IsDirectRelTo()) || (vregInfo->mDbgVariable != NULL));
  7214. if (vregInfo->mIsExpr)
  7215. {
  7216. // Create a new reg with the expression, and then load the value into the old non-expressionized reg
  7217. // This has the advantage of fixing any other references to this expr, too
  7218. auto scratchReg = AllocVirtualReg(vregInfo->mType, 2, false);
  7219. auto scratchVRegInfo = mVRegInfo[scratchReg.mVRegIdx];
  7220. scratchVRegInfo->mIsExpr = true;
  7221. scratchVRegInfo->mRelTo = vregInfo->mRelTo;
  7222. scratchVRegInfo->mRelOffset = vregInfo->mRelOffset;
  7223. scratchVRegInfo->mRelOffsetScale = vregInfo->mRelOffsetScale;
  7224. vregInfo->mIsExpr = false;
  7225. vregInfo->mRelTo = BeMCOperand();
  7226. vregInfo->mRelOffset = BeMCOperand();
  7227. vregInfo->mRelOffsetScale = 1;
  7228. CreateDefineVReg(scratchReg, instIdx++ + 1);
  7229. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromVReg(vregIdx), scratchReg, instIdx++ + 1);
  7230. }
  7231. }
  7232. }
  7233. }
  7234. }
  7235. if (!hasMoreWork)
  7236. break;
  7237. }
  7238. }
  7239. void BeMCContext::DoLoads()
  7240. {
  7241. for (auto mcBlock : mBlocks)
  7242. {
  7243. mActiveBlock = mcBlock;
  7244. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  7245. {
  7246. auto inst = mcBlock->mInstructions[instIdx];
  7247. SetCurrentInst(inst);
  7248. if (inst->mKind == BeMCInstKind_DefLoad)
  7249. {
  7250. // Almost all DefLoads should be eliminated during InstCombine, but for 'persistent loads', we need
  7251. // to actualize them now
  7252. inst->mKind = BeMCInstKind_Def;
  7253. auto vregInfo = mVRegInfo[inst->mArg0.mVRegIdx];
  7254. if (vregInfo->mRefCount == 0)
  7255. continue;
  7256. auto relLoaded = vregInfo->mRelTo;
  7257. auto loadTo = inst->mArg0;
  7258. BF_ASSERT(loadTo.mKind == BeMCOperandKind_VReg);
  7259. AllocInst(BeMCInstKind_Mov, loadTo, relLoaded, instIdx++ + 1);
  7260. vregInfo->mIsExpr = false;
  7261. vregInfo->mRelTo = BeMCOperand();
  7262. }
  7263. if (inst->mKind == BeMCInstKind_Def)
  7264. {
  7265. auto vregInfo = mVRegInfo[inst->mArg0.mVRegIdx];
  7266. if (vregInfo->mRefCount == 0)
  7267. continue;
  7268. if (vregInfo->mRelTo.mKind == BeMCOperandKind_VRegAddr)
  7269. {
  7270. auto vregRelInfo = mVRegInfo[vregInfo->mRelTo.mVRegIdx];
  7271. vregRelInfo->mForceMem = true;
  7272. CheckForce(vregInfo);
  7273. }
  7274. }
  7275. }
  7276. }
  7277. }
  7278. static int sLegalizationIdx = 0;
  7279. // Returning false means we generated some new vregs that need to be assigned to registers
  7280. bool BeMCContext::DoLegalization()
  7281. {
  7282. BP_ZONE("BeMCContext::DoLegalization");
  7283. bool debugging = false;
  7284. //if (mBeFunction->mName == "?DrawEntry@DrawContext@PerfView@BeefPerf@@QEAAXPEAVGraphics@gfx@Beefy@@PEAVTrackNodeEntry@23@MM@Z")
  7285. //debugging = true;
  7286. if (debugging)
  7287. OutputDebugStrF("DoLegalization\n");
  7288. bool isFinalRun = true;
  7289. int startingVRegCount = (int)mVRegInfo.size();
  7290. HashSet<int> vregExprChangeSet;
  7291. bool hasPendingActualizations = false;
  7292. SetCurrentInst(NULL);
  7293. int regPreserveDepth = 0;
  7294. for (auto mcBlock : mBlocks)
  7295. {
  7296. mActiveBlock = mcBlock;
  7297. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  7298. {
  7299. BfIRInitType pendingInitKind = BfIRInitType_NotNeeded;
  7300. gLegalizeIdx++;
  7301. auto inst = mcBlock->mInstructions[instIdx];
  7302. SetCurrentInst(inst);
  7303. if ((mDebugging) && (inst->mKind == BeMCInstKind_IMul))
  7304. {
  7305. NOP;
  7306. }
  7307. if (inst->mKind == BeMCInstKind_Mov)
  7308. {
  7309. // Useless mov, remove it
  7310. if (OperandsEqual(inst->mArg0, inst->mArg1, true))
  7311. {
  7312. // We leave the instructions alone here and remove them in DoRegFinalization.
  7313. // There are some cases with DirectRelTo vregs where we need to preserve liveness that a mov
  7314. // generates. We just want to keep from inserting any additional legalization instructions here (ie: movs to temps)
  7315. continue;
  7316. }
  7317. }
  7318. BeMCInst* nextInst = NULL;
  7319. if (instIdx < mcBlock->mInstructions.size() - 1)
  7320. {
  7321. // It's important that we do this at the top before any instructions might get split, so liveness of the next instruction can be analyzed
  7322. nextInst = mcBlock->mInstructions[instIdx + 1];
  7323. }
  7324. auto arg0 = GetFixedOperand(inst->mArg0);
  7325. auto arg1 = GetFixedOperand(inst->mArg1);
  7326. auto arg0Type = GetType(arg0);
  7327. auto arg1Type = GetType(arg1);
  7328. if ((arg0Type != NULL) && (arg0Type->mSize == 0) && (!inst->IsPsuedo()))
  7329. {
  7330. RemoveInst(mcBlock, instIdx);
  7331. instIdx--;
  7332. continue;
  7333. }
  7334. // Check operands
  7335. if ((!inst->IsPsuedo()) && (arg0Type != NULL) && (!arg0Type->IsComposite()))
  7336. {
  7337. bool replacedOpr = false;
  7338. for (int oprIdx = 0; oprIdx < 2; oprIdx++)
  7339. {
  7340. BeMCOperand& origOperand = (oprIdx == 0) ? inst->mArg0 : inst->mArg1;
  7341. BeMCOperand& remappedOperand = (oprIdx == 0) ? arg0 : arg1;
  7342. if (remappedOperand.IsVRegAny())
  7343. {
  7344. bool isMulti = false;
  7345. X64CPURegister regA = X64Reg_None;
  7346. X64CPURegister regB = X64Reg_None;
  7347. int bScale = 1;
  7348. int disp = 0;
  7349. int errorVReg = -1;
  7350. auto rmForm = GetRMParams(remappedOperand, regA, regB, bScale, disp, &errorVReg);
  7351. bool badOperand = false;
  7352. bool scratchForceReg = false;
  7353. if (rmForm == BeMCRMMode_Invalid)
  7354. {
  7355. badOperand = true;
  7356. scratchForceReg = true;
  7357. }
  7358. // We can only allow a "complex direct" expression such as (RAX+RBX) on the SRC side of
  7359. // a mov, where it can be emitted as a LEA. All other uses are invalid.
  7360. bool allowComplexDirect = (inst->mKind == BeMCInstKind_Mov) && (oprIdx == 1);
  7361. if (allowComplexDirect)
  7362. {
  7363. auto vregInfo = GetVRegInfo(remappedOperand);
  7364. if ((vregInfo->mRelTo.mKind == BeMCOperandKind_SymbolAddr) &&
  7365. (vregInfo->mRelOffset.IsImmediateInt()) &&
  7366. (vregInfo->mRelOffsetScale == 1))
  7367. {
  7368. badOperand = false;
  7369. }
  7370. }
  7371. else
  7372. {
  7373. if ((rmForm == BeMCRMMode_Direct) &&
  7374. ((regB != X64Reg_None) || (bScale != 1) || (disp != 0)))
  7375. {
  7376. badOperand = true;
  7377. }
  7378. // bool isSimple = (rmForm == BeMCRMMode_Direct) && (regB == X64Reg_None) && (bScale == 1) && (disp == 0);
  7379. // if ((!isSimple) && (oprIdx == 1) && (!arg0isSimple))
  7380. // {
  7381. // NOP;
  7382. // }
  7383. // if (oprIdx == 0)
  7384. // arg0isSimple = isSimple;
  7385. }
  7386. if (badOperand)
  7387. {
  7388. BeMCOperand checkOperand = remappedOperand;
  7389. while (checkOperand.mKind == BeMCOperandKind_VReg)
  7390. {
  7391. auto vregInfo = GetVRegInfo(checkOperand);
  7392. if (!vregInfo->IsDirectRelToAny())
  7393. break;
  7394. checkOperand = vregInfo->mRelTo;
  7395. }
  7396. if (inst->mKind == BeMCInstKind_Mov)
  7397. {
  7398. if ((checkOperand.mKind == BeMCOperandKind_Symbol) || (checkOperand.mKind == BeMCOperandKind_SymbolAddr))
  7399. {
  7400. // SymbolAddr can be emitted as an LEA
  7401. badOperand = false;
  7402. }
  7403. if (checkOperand.mKind == BeMCOperandKind_VRegAddr)
  7404. {
  7405. auto vregInfo = GetVRegInfo(checkOperand);
  7406. if ((vregInfo->IsDirectRelToAny()) && (vregInfo->mRelTo.mKind == BeMCOperandKind_Symbol))
  7407. {
  7408. badOperand = false;
  7409. }
  7410. }
  7411. }
  7412. }
  7413. if (badOperand)
  7414. {
  7415. //if (vregExprChangeSet.find(errorVReg) == vregExprChangeSet.end())
  7416. if (!vregExprChangeSet.Contains(errorVReg))
  7417. {
  7418. auto remappedVRegInfo = mVRegInfo[remappedOperand.mVRegIdx];
  7419. BeMCOperand savedOperand = BeMCOperand::FromVReg(remappedOperand.mVRegIdx);
  7420. BeMCOperand newOperand;
  7421. if (origOperand.mKind == BeMCOperandKind_VRegLoad)
  7422. {
  7423. // Loads keep their load-ness
  7424. savedOperand = BeMCOperand::FromVReg(remappedOperand.mVRegIdx);
  7425. newOperand = origOperand;
  7426. }
  7427. else
  7428. {
  7429. savedOperand = origOperand;
  7430. newOperand.mKind = BeMCOperandKind_VReg;
  7431. }
  7432. auto type = GetType(savedOperand);
  7433. //TODO: Are there circumstances when this needs to be forceReg?
  7434. BeMCOperand scratchReg = AllocVirtualReg(type, 2, scratchForceReg);
  7435. int insertPos = FindSafeInstInsertPos(instIdx);
  7436. CreateDefineVReg(scratchReg, insertPos);
  7437. AllocInst(BeMCInstKind_Mov, scratchReg, savedOperand, insertPos + 1);
  7438. newOperand.mVRegIdx = scratchReg.mVRegIdx;
  7439. IntroduceVRegs(scratchReg, mcBlock, insertPos, insertPos + 1);
  7440. if ((insertPos == instIdx) || (!scratchForceReg))
  7441. {
  7442. // Only allow short-lived forceRegs
  7443. instIdx += 2;
  7444. //origOperand.mVRegIdx = scratchReg.mVRegIdx;
  7445. origOperand = newOperand;
  7446. }
  7447. else
  7448. {
  7449. // .. otherwise we need yet another layer of indirection for the load
  7450. auto loadedType = GetType(inst->mArg0);
  7451. BeMCOperand loadedReg = AllocVirtualReg(loadedType, 2, false);
  7452. CreateDefineVReg(loadedReg, insertPos + 2);
  7453. AllocInst(BeMCInstKind_Mov, loadedReg, origOperand, insertPos + 3);
  7454. IntroduceVRegs(scratchReg, mcBlock, insertPos + 2, insertPos + 3);
  7455. instIdx += 4;
  7456. origOperand = loadedReg;
  7457. }
  7458. replacedOpr = true;
  7459. isFinalRun = false;
  7460. if (debugging)
  7461. OutputDebugStrF(" BadOperand %d\n", errorVReg);
  7462. }
  7463. }
  7464. }
  7465. }
  7466. if (replacedOpr)
  7467. {
  7468. //instIdx--;
  7469. continue;
  7470. }
  7471. }
  7472. if (!inst->IsPsuedo())
  7473. {
  7474. if ((HasSymbolAddr(inst->mArg0)) && (inst->mKind != BeMCInstKind_Call))
  7475. {
  7476. ReplaceWithNewVReg(inst->mArg0, instIdx, true, false);
  7477. isFinalRun = false;
  7478. // if (debugging)
  7479. // OutputDebugStrF(" SymbolAddr0\n");
  7480. }
  7481. // We can only allow symbol addresses on a MOV where they can be made into a LEA
  7482. if ((HasSymbolAddr(inst->mArg1)) && (inst->mKind != BeMCInstKind_Mov))
  7483. {
  7484. ReplaceWithNewVReg(inst->mArg1, instIdx, true, false);
  7485. isFinalRun = false;
  7486. // if (debugging)
  7487. // OutputDebugStrF(" SymbolAddr1\n");
  7488. }
  7489. }
  7490. if (!inst->IsPsuedo())
  7491. {
  7492. if ((arg0.IsImmediate()) && (arg1) && (inst->IsCommutable()))
  7493. {
  7494. // Always make the immediate be the second arg
  7495. BF_SWAP(inst->mArg0, inst->mArg1);
  7496. BF_SWAP(arg0, arg1);
  7497. }
  7498. bool isIntMul = (inst->IsMul()) && (arg0Type->IsInt());
  7499. bool isIntDiv = (((inst->mKind == BeMCInstKind_IDiv) || (inst->mKind == BeMCInstKind_Div))) && (arg0Type->IsInt());
  7500. bool isMov_R64_IMM64 = ((inst->mKind == BeMCInstKind_Mov) && (inst->mArg0.IsNativeReg()) && (inst->mArg1.IsImmediateInt()));
  7501. bool doStdCheck = true;
  7502. if (isMov_R64_IMM64)
  7503. doStdCheck = false;
  7504. bool is3FormMul = false;
  7505. if ((isIntMul) && (inst->mResult))
  7506. {
  7507. is3FormMul = true;
  7508. if (inst->mArg1.IsImmediateInt())
  7509. {
  7510. bool isLegal = true;
  7511. int64 immediateInt = inst->mArg1.GetImmediateInt();
  7512. if (inst->mKind == BeMCInstKind_Mul)
  7513. {
  7514. if (immediateInt > 0xFFFFFFFFLL)
  7515. isLegal = false;
  7516. }
  7517. else
  7518. {
  7519. if ((immediateInt < -0x80000000LL) || (immediateInt > 0x7FFFFFFF))
  7520. isLegal = false;
  7521. }
  7522. if (isLegal)
  7523. doStdCheck = false;
  7524. }
  7525. }
  7526. // Int 3-form mul does not follow these rules
  7527. if (doStdCheck)
  7528. {
  7529. bool isIncOrDec = false;
  7530. isIncOrDec = (((inst->mKind == BeMCInstKind_Add) || (inst->mKind == BeMCInstKind_Sub)) &&
  7531. (arg1.IsImmediateInt()) && (arg1.mImmediate == 1));
  7532. bool badOps = false;
  7533. if ((!isIncOrDec) && (!isIntMul) && (!isIntDiv))
  7534. {
  7535. if ((arg0.MayBeMemory()) && (arg1.MayBeMemory()))
  7536. {
  7537. if (arg0 == arg1)
  7538. {
  7539. if (inst->mKind != BeMCInstKind_Mov)
  7540. {
  7541. badOps = true;
  7542. }
  7543. }
  7544. else
  7545. badOps = true;
  7546. }
  7547. //TODO: For what instructions was this true? CMP, MOV, ADD, etc... seems to have it
  7548. if ((arg1Type != NULL) && (arg1Type->IsFloat()))
  7549. {
  7550. // MOV is allowed on '<r/m>, <imm>'
  7551. if ((inst->mKind != BeMCInstKind_Mov) && (arg0.MayBeMemory()) && (arg1.IsImmediate()))
  7552. badOps = true;
  7553. }
  7554. }
  7555. // "MOV <r>, <imm64>" is the only instruction that allows an IMM64 immediate
  7556. if (((inst->mKind != BeMCInstKind_Mov) || (!arg0.IsNativeReg())) &&
  7557. (arg1.mKind == BeMCOperandKind_Immediate_i64))
  7558. {
  7559. if ((arg1.mImmediate < -0x80000000LL) || (arg1.mImmediate > 0x7FFFFFFF))
  7560. badOps = true;
  7561. }
  7562. if (badOps)
  7563. {
  7564. // On X64 we can never have an instruction where both args are memory so we create a short-lived scratch vreg
  7565. // and run another reg pass to generate register access
  7566. // From: <op> a, b
  7567. // To: @Def scratch
  7568. // mov scratch, b
  7569. // <op> a, scratch
  7570. auto targetType = GetType(inst->mArg0);
  7571. if (!targetType->IsComposite())
  7572. {
  7573. auto scratchType = GetType(inst->mArg1);
  7574. BeMCOperand scratchReg = AllocVirtualReg(scratchType, 2, true);
  7575. CreateDefineVReg(scratchReg, instIdx);
  7576. AllocInst(BeMCInstKind_Mov, scratchReg, inst->mArg1, instIdx + 1);
  7577. inst->mArg1 = scratchReg;
  7578. IntroduceVRegs(scratchReg, mcBlock, instIdx, instIdx + 2);
  7579. // Don't process the changed instructions until after another reg pass
  7580. instIdx += 2;
  7581. isFinalRun = false;
  7582. if (debugging)
  7583. OutputDebugStrF(" BadOps\n");
  7584. continue;
  7585. }
  7586. }
  7587. if (inst->mResult)
  7588. {
  7589. if (inst->mResult == inst->mArg0)
  7590. {
  7591. inst->mResult = BeMCOperand();
  7592. }
  7593. else if ((arg0Type->IsFloat()) && (!CouldBeReg(inst->mResult)))
  7594. {
  7595. // We need a REG on the dest for sure, so just create a scratch here, otherwise we end up
  7596. // requiring additional scratch vregs later
  7597. // FROM:
  7598. // %vreg0 = op %vreg1, %vreg2
  7599. // To:
  7600. // Mov %scratch<reg>, %vreg1
  7601. // Op %scratch<reg>, %vreg2
  7602. // Mov %result, %scatch<reg>
  7603. ReplaceWithNewVReg(inst->mArg0, instIdx, true);
  7604. AllocInst(BeMCInstKind_Mov, inst->mResult, inst->mArg0, instIdx + 1);
  7605. IntroduceVRegs(inst->mArg0, mcBlock, instIdx, instIdx + 2);
  7606. inst->mResult = BeMCOperand();
  7607. isFinalRun = false;
  7608. if (debugging)
  7609. OutputDebugStrF(" Float RegOnDest\n");
  7610. instIdx++;
  7611. continue;
  7612. }
  7613. else if ((inst->mResult == inst->mArg1) &&
  7614. ((inst->mKind == BeMCInstKind_Add) || (inst->mKind == BeMCInstKind_Mul) || (inst->mKind == BeMCInstKind_IMul)))
  7615. {
  7616. BF_SWAP(inst->mArg0, inst->mArg1);
  7617. BF_SWAP(arg0, arg1);
  7618. inst->mResult = BeMCOperand();
  7619. }
  7620. else
  7621. {
  7622. bool addCanBeLEA =
  7623. ((inst->mKind == BeMCInstKind_Sub) || (inst->mKind == BeMCInstKind_Add)) &&
  7624. (arg0Type->mSize >= 2) && // Int8s don't have an LEA
  7625. (GetFixedOperand(inst->mResult).IsNativeReg()) && (arg0.IsNativeReg()) && (arg1.IsImmediateInt());
  7626. if (addCanBeLEA)
  7627. {
  7628. // LEA is add-only
  7629. if (inst->mKind == BeMCInstKind_Sub)
  7630. {
  7631. BF_ASSERT(inst->mArg1.IsImmediate());
  7632. inst->mKind = BeMCInstKind_Add;
  7633. inst->mArg1.mImmediate = -inst->mArg1.mImmediate;
  7634. }
  7635. }
  7636. else
  7637. {
  7638. bool handled = false;
  7639. if (OperandsEqual(inst->mResult, inst->mArg1))
  7640. {
  7641. if (inst->mKind == BeMCInstKind_Sub)
  7642. {
  7643. // From: b = Sub a, b
  7644. // To: Neg b
  7645. // Add b, a
  7646. AllocInst(BeMCInstKind_Add, inst->mResult, inst->mArg0, instIdx + 1);
  7647. inst->mKind = BeMCInstKind_Neg;
  7648. inst->mArg0 = inst->mResult;
  7649. inst->mArg1 = BeMCOperand();
  7650. inst->mResult = BeMCOperand();
  7651. handled = true;
  7652. instIdx--; // Rerun on the Neg
  7653. }
  7654. else
  7655. {
  7656. // We need a scratch reg for this
  7657. ReplaceWithNewVReg(inst->mArg1, instIdx, true);
  7658. IntroduceVRegs(inst->mArg1, mcBlock, instIdx, instIdx + 2);
  7659. }
  7660. }
  7661. if (!handled)
  7662. {
  7663. // From: result = <op> a, b
  7664. // To: mov result, a
  7665. // <op> result, b
  7666. AllocInst(BeMCInstKind_Mov, inst->mResult, inst->mArg0, instIdx++);
  7667. inst->mArg0 = inst->mResult;
  7668. inst->mResult = BeMCOperand();
  7669. FixVRegInitFlags(inst, inst->mArg0);
  7670. if (debugging)
  7671. OutputDebugStrF(" Result\n");
  7672. isFinalRun = false;
  7673. }
  7674. }
  7675. continue;
  7676. }
  7677. }
  7678. }
  7679. if ((inst->mKind != BeMCInstKind_Cmp) &&
  7680. (inst->mKind != BeMCInstKind_CmpToBool) &&
  7681. (inst->mKind != BeMCInstKind_Mov))
  7682. {
  7683. if ((arg0Type != NULL) && (arg0Type->IsFloat()))
  7684. {
  7685. // <r/m>, <xmm> is not valid, <xmm>, <r/m>
  7686. if (!arg0.IsNativeReg())
  7687. {
  7688. if ((arg1.IsNativeReg()) && (inst->mArg1.IsVReg()) && (nextInst != NULL) && (nextInst->mLiveness != NULL) && (inst->IsCommutable()))
  7689. {
  7690. int underlyingVRegIdx = GetUnderlyingVReg(inst->mArg1.mVRegIdx);
  7691. if (!mLivenessContext.IsSet(nextInst->mLiveness, underlyingVRegIdx))
  7692. {
  7693. // If Arg1 is a temporary vreg, then we can use that as our destination so we don't need
  7694. // to create another temporary vreg
  7695. BF_SWAP(inst->mArg0, inst->mArg1);
  7696. AllocInst(BeMCInstKind_Mov, inst->mArg1, inst->mArg0, instIdx + 1);
  7697. continue;
  7698. }
  7699. }
  7700. BeMCOperand prevDest;
  7701. auto prevDestPtr = inst->GetDest();
  7702. if (prevDestPtr != NULL)
  7703. prevDest = *prevDestPtr;
  7704. ReplaceWithNewVReg(inst->mArg0, instIdx, true);
  7705. isFinalRun = false;
  7706. if (debugging)
  7707. OutputDebugStrF(" Float Arg0\n");
  7708. if (prevDest)
  7709. {
  7710. // This is a modifying instruction so we need to store the result afterward
  7711. AllocInst(BeMCInstKind_Mov, prevDest, inst->mArg0, instIdx + 1);
  7712. IntroduceVRegs(inst->mArg0, mcBlock, instIdx, instIdx + 2);
  7713. instIdx++; // Skip this instruction until next pass
  7714. }
  7715. else
  7716. {
  7717. IntroduceVRegs(inst->mArg0, mcBlock, instIdx, instIdx + 1);
  7718. }
  7719. continue;
  7720. }
  7721. }
  7722. }
  7723. if ((!inst->IsMov()) && (arg0.IsVReg()) && (arg0Type->IsFloat()))
  7724. {
  7725. BF_ASSERT(!inst->mResult);
  7726. // XMM instructions (besides MOVs) require native register destinations
  7727. if ((inst->IsCommutable()) && (arg1.IsNativeReg()) && (inst->mArg1.IsVReg()))
  7728. {
  7729. auto nextInst = mcBlock->mInstructions[instIdx + 1];
  7730. int underlyingVRegIdx = GetUnderlyingVReg(inst->mArg1.mVRegIdx);
  7731. if (!mLivenessContext.IsSet(nextInst->mLiveness, underlyingVRegIdx))
  7732. {
  7733. // Convert a "Mul %vreg0, %vreg1<reg>"
  7734. // To
  7735. // Mul %reg1<reg>, %vreg0
  7736. // Mov %vreg0, %reg1<reg>
  7737. // This only works if %reg1 dies after this instruction and this is
  7738. // cheaper than the more general case below
  7739. AllocInst(BeMCInstKind_Mov, inst->mArg0, inst->mArg1, instIdx++ + 1);
  7740. BF_SWAP(inst->mArg0, inst->mArg1);
  7741. BF_SWAP(arg0, arg1);
  7742. continue;
  7743. }
  7744. }
  7745. // Convert from "<op> %reg0, %reg1"
  7746. // To
  7747. // Mov %vreg2<reg>, %vreg0
  7748. // <op> %vreg2<reg>, %vreg1
  7749. // Mov %vreg0, %vreg2<reg>
  7750. auto prevDest = inst->mArg0;
  7751. ReplaceWithNewVReg(inst->mArg0, instIdx, true);
  7752. AllocInst(BeMCInstKind_Mov, prevDest, inst->mArg0, instIdx + 1);
  7753. IntroduceVRegs(inst->mArg0, mcBlock, instIdx, instIdx + 2);
  7754. instIdx++;
  7755. isFinalRun = false;
  7756. if (debugging)
  7757. OutputDebugStrF(" Float reg dest\n");
  7758. continue;
  7759. }
  7760. }
  7761. if (inst->mKind == BeMCInstKind_Call)
  7762. {
  7763. // Convert from
  7764. // Mov %reg0, <x>
  7765. // ..
  7766. // Call %reg0
  7767. // To "Call <x>"
  7768. // This is a common case for virtual dispatch where complex address expressions get actualized
  7769. // but then we end up with an 'extra' vreg
  7770. if (inst->mArg0.IsVReg())
  7771. {
  7772. auto vregInfo = GetVRegInfo(inst->mArg0);
  7773. if (vregInfo->mRefCount == 1)
  7774. {
  7775. for (int checkInstIdx = instIdx - 1; checkInstIdx >= 0; checkInstIdx--)
  7776. {
  7777. auto checkInst = mcBlock->mInstructions[checkInstIdx];
  7778. if ((checkInst->mKind == BeMCInstKind_Mov) && (checkInst->mArg0 == inst->mArg0))
  7779. {
  7780. // We can't extend down any ForceRegs, those must be confined to very short intervals
  7781. if (!HasForceRegs(checkInst->mArg1))
  7782. {
  7783. inst->mArg0 = checkInst->mArg1;
  7784. RemoveInst(mcBlock, checkInstIdx);
  7785. instIdx--;
  7786. continue;
  7787. }
  7788. }
  7789. }
  7790. }
  7791. }
  7792. }
  7793. switch (inst->mKind)
  7794. {
  7795. case BeMCInstKind_PreserveVolatiles:
  7796. regPreserveDepth++;
  7797. break;
  7798. case BeMCInstKind_RestoreVolatiles:
  7799. regPreserveDepth--;
  7800. break;
  7801. case BeMCInstKind_DefLoad:
  7802. {
  7803. Fail("DefLoad- DoLoads should have removed these");
  7804. }
  7805. break;
  7806. case BeMCInstKind_Def:
  7807. {
  7808. auto vregInfo = mVRegInfo[inst->mArg0.mVRegIdx];
  7809. // Legalize vreg exprs
  7810. if ((vregInfo->mRefCount > 0) && (vregInfo->mRelTo) && (!vregInfo->IsDirectRelToAny()))
  7811. {
  7812. if (vregInfo->mRelTo.mKind == BeMCOperandKind_SymbolAddr)
  7813. continue; // Just leave it
  7814. if (vregInfo->mRelTo.mKind == BeMCOperandKind_Symbol)
  7815. {
  7816. continue;
  7817. }
  7818. if (vregInfo->IsDirectRelTo())
  7819. {
  7820. if (vregInfo->mRelTo.IsVRegAny())
  7821. {
  7822. // Propagate change to the directRel
  7823. //auto itr = vregExprChangeSet.find(vregInfo->mRelTo.mVRegIdx);
  7824. //if (itr != vregExprChangeSet.end())
  7825. if (vregExprChangeSet.Contains(vregInfo->mRelTo.mVRegIdx))
  7826. {
  7827. BF_ASSERT(!isFinalRun);
  7828. vregExprChangeSet.Add(inst->mArg0.mVRegIdx);
  7829. isFinalRun = false;
  7830. }
  7831. }
  7832. }
  7833. else
  7834. {
  7835. if (vregInfo->mRelOffset)
  7836. {
  7837. auto relOfsType = GetType(vregInfo->mRelOffset);
  7838. // We can only do offsets by int64s
  7839. if (relOfsType->mTypeCode != BeTypeCode_Int64)
  7840. {
  7841. bool didExtend = false;
  7842. if (vregInfo->mRelOffset.IsVReg())
  7843. {
  7844. // First we try to resize the original vreg, which we are allowed to do
  7845. // if there's only one mov and the vreg dies by the end of the block
  7846. int relVRegIdx = vregInfo->mRelOffset.mVRegIdx;
  7847. bool foundDef = false;
  7848. BeMCInst* setInst = NULL;
  7849. for (int checkIdx = 0; checkIdx < (int)mcBlock->mInstructions.size(); checkIdx++)
  7850. {
  7851. auto checkInst = mcBlock->mInstructions[checkIdx];
  7852. if ((checkInst->mKind == BeMCInstKind_Def) && (checkInst->mArg0.mVRegIdx == relVRegIdx))
  7853. foundDef = true;
  7854. if (foundDef)
  7855. {
  7856. if ((checkInst->mKind == BeMCInstKind_Mov) && (checkInst->mArg0 == vregInfo->mRelOffset))
  7857. {
  7858. if (setInst != NULL)
  7859. break; // Only one set is allowed
  7860. setInst = checkInst;
  7861. }
  7862. else
  7863. {
  7864. // If we also use this reg for a non-offset reason then we can't just extend the size
  7865. bool hasNonOffsetRef = false;
  7866. auto operands = { &checkInst->mResult, &checkInst->mArg0, &checkInst->mArg1 };
  7867. for (auto operand : operands)
  7868. if (ContainsNonOffsetRef(*operand, vregInfo->mRelOffset))
  7869. hasNonOffsetRef = true;
  7870. if (hasNonOffsetRef)
  7871. {
  7872. break;
  7873. }
  7874. }
  7875. if (!mLivenessContext.IsSet(checkInst->mLiveness, relVRegIdx))
  7876. {
  7877. if (setInst != NULL)
  7878. {
  7879. didExtend = true;
  7880. auto relVRegInfo = mVRegInfo[relVRegIdx];
  7881. setInst->mKind = BeMCInstKind_MovSX;
  7882. relVRegInfo->mType = mModule->mContext->GetPrimitiveType(BeTypeCode_Int64);
  7883. relVRegInfo->mAlign = relVRegInfo->mType->mAlign;
  7884. if (debugging)
  7885. OutputDebugStrF(" Def MovSX\n");
  7886. isFinalRun = false;
  7887. }
  7888. break;
  7889. }
  7890. }
  7891. }
  7892. }
  7893. if (!didExtend)
  7894. {
  7895. auto relOfs64 = AllocVirtualReg(mModule->mContext->GetPrimitiveType(BeTypeCode_Int64), 2);
  7896. CreateDefineVReg(relOfs64, instIdx);
  7897. AllocInst(BeMCInstKind_MovSX, relOfs64, vregInfo->mRelOffset, instIdx + 1);
  7898. IntroduceVRegs(inst->mArg0, mcBlock, instIdx, instIdx + 2);
  7899. instIdx += 2;
  7900. vregInfo->mRelOffset = relOfs64;
  7901. vregExprChangeSet.Add(relOfs64.mVRegIdx);
  7902. if (debugging)
  7903. OutputDebugStrF(" Def MovSX 2\n");
  7904. isFinalRun = false;
  7905. }
  7906. }
  7907. }
  7908. X64CPURegister regA = X64Reg_None;
  7909. X64CPURegister regB = X64Reg_None;
  7910. int bScale = 1;
  7911. int disp = 0;
  7912. int errorVRegIdx = -1;
  7913. bool isValid = GetRMParams(inst->mArg0, regA, regB, bScale, disp, &errorVRegIdx) != BeMCRMMode_Invalid;
  7914. if (!isValid)
  7915. {
  7916. if (errorVRegIdx == -1)
  7917. {
  7918. BF_ASSERT(!vregInfo->mRelOffset);
  7919. if (vregInfo->mType->IsPointer())
  7920. {
  7921. // This must be a cast like "(void*)gGlobalVar". We need to actualize the symbol address
  7922. // in a native register now.
  7923. vregExprChangeSet.Add(inst->mArg0.mVRegIdx);
  7924. AllocInst(BeMCInstKind_Mov, inst->mArg0, vregInfo->mRelTo, instIdx++ + 1);
  7925. vregInfo->mIsExpr = false;
  7926. vregInfo->mRelTo = BeMCOperand();
  7927. vregInfo->mForceReg = true;
  7928. CheckForce(vregInfo);
  7929. isFinalRun = false;
  7930. if (debugging)
  7931. OutputDebugStrF(" Symbol Addr\n");
  7932. break;
  7933. }
  7934. else
  7935. {
  7936. // This could be a special case like
  7937. // MOV (int64)floatVal, reg64
  7938. // For two-step loading of immediates into memory without using .rdata
  7939. continue;
  7940. }
  7941. }
  7942. else if (errorVRegIdx == -2)
  7943. {
  7944. vregExprChangeSet.Add(inst->mArg0.mVRegIdx);
  7945. MarkInvalidRMRegs(inst->mArg0);
  7946. if (debugging)
  7947. OutputDebugStrF(" GetRMParams invalid indices\n");
  7948. isFinalRun = false;
  7949. break;
  7950. }
  7951. //if (vregExprChangeSet.find(errorVRegIdx) != vregExprChangeSet.end())
  7952. if (vregExprChangeSet.Contains(errorVRegIdx))
  7953. {
  7954. // This means we have already modified some dependent vregs, so we may be legalized already.
  7955. // Wait till next iteration to determine that.
  7956. BF_ASSERT(!isFinalRun);
  7957. isValid = true; //
  7958. }
  7959. }
  7960. // The only valid form is [<reg>*<1/2/4/8>+<imm>]
  7961. // If we violate that then we have to break it up
  7962. //if ((vregInfo->mRelOffsetScale != 1) && (vregInfo->mRelOffsetScale != 2) && (vregInfo->mRelOffsetScale != 4) && (vregInfo->mRelOffsetScale != 8))
  7963. if ((!isValid) && (errorVRegIdx == inst->mArg0.mVRegIdx))
  7964. {
  7965. vregExprChangeSet.Add(errorVRegIdx);
  7966. if ((vregInfo->mRelOffsetScale != 1) && (vregInfo->mRelOffsetScale != 2) && (vregInfo->mRelOffsetScale != 4) && (vregInfo->mRelOffsetScale != 8))
  7967. {
  7968. auto relOffsetType = GetType(vregInfo->mRelOffset);
  7969. BeMCOperand scratchReg = AllocVirtualReg(relOffsetType, 2, true);
  7970. CreateDefineVReg(scratchReg, instIdx++);
  7971. auto newInst = AllocInst(BeMCInstKind_IMul, vregInfo->mRelOffset, BeMCOperand::FromImmediate(vregInfo->mRelOffsetScale), instIdx++);
  7972. newInst->mResult = scratchReg;
  7973. vregInfo->mRelOffset = scratchReg;
  7974. vregInfo->mRelOffsetScale = 1;
  7975. if (debugging)
  7976. OutputDebugStrF(" Invalid RM combo\n");
  7977. vregExprChangeSet.Add(scratchReg.mVRegIdx);
  7978. }
  7979. else if (!vregInfo->mRelTo.IsVRegAny())
  7980. {
  7981. vregInfo->mWantsExprActualize = true;
  7982. hasPendingActualizations = true;
  7983. }
  7984. isFinalRun = false;
  7985. }
  7986. else if (!isValid)
  7987. {
  7988. auto errorVRegInfo = mVRegInfo[errorVRegIdx];
  7989. if ((errorVRegInfo->mIsExpr) && (!errorVRegInfo->IsDirectRelTo()))
  7990. {
  7991. errorVRegInfo->mWantsExprActualize = true;
  7992. hasPendingActualizations = true;
  7993. vregExprChangeSet.Add(errorVRegIdx);
  7994. isFinalRun = false;
  7995. if (debugging)
  7996. OutputDebugStrF(" RM not valid, actualize\n");
  7997. }
  7998. else
  7999. {
  8000. // We don't want to have too many concurrent ForceReg vregs at once, since that causes too much register pressure and
  8001. // can cause register allocation to fail at the extreme end. The scratchReg adds another ForceReg for the lifetime
  8002. // of the def vreg, so if the def vreg doesn't immediately die and there are already too many ForceRegs active then
  8003. // we need to actualize ourselves
  8004. bool actualizeSelf = false;
  8005. if (instIdx < mcBlock->mInstructions.size() - 2)
  8006. {
  8007. auto checkInst = mcBlock->mInstructions[instIdx + 2];
  8008. if (mLivenessContext.IsSet(checkInst->mLiveness, inst->mArg0.mVRegIdx))
  8009. {
  8010. actualizeSelf = true;
  8011. }
  8012. }
  8013. else
  8014. {
  8015. actualizeSelf = true;
  8016. }
  8017. if (actualizeSelf)
  8018. {
  8019. auto vregInfo = mVRegInfo[inst->mArg0.mVRegIdx];
  8020. // DirectRel cannot actualize
  8021. if (vregInfo->IsDirectRelTo())
  8022. actualizeSelf = false;
  8023. }
  8024. if (actualizeSelf)
  8025. {
  8026. auto vregInfo = mVRegInfo[inst->mArg0.mVRegIdx];
  8027. vregInfo->mWantsExprActualize = true;
  8028. hasPendingActualizations = true;
  8029. }
  8030. else
  8031. {
  8032. // This may be a local variable that failed to be assigned to a reg, create a scratch local with a forced reg
  8033. auto scratchReg = AllocVirtualReg(errorVRegInfo->mType, 2, false);
  8034. auto scratchVRegInfo = mVRegInfo[scratchReg.mVRegIdx];
  8035. auto errorVReg = BeMCOperand::FromVReg(errorVRegIdx);
  8036. if ((vregInfo->mRelTo == errorVReg) || (vregInfo->mRelOffset == errorVReg))
  8037. {
  8038. CreateDefineVReg(scratchReg, instIdx++);
  8039. AllocInst(BeMCInstKind_Mov, scratchReg, errorVReg, instIdx++);
  8040. isFinalRun = false;
  8041. if (debugging)
  8042. OutputDebugStrF(" RM failed, scratch vreg\n");
  8043. vregExprChangeSet.Add(scratchReg.mVRegIdx);
  8044. if (vregInfo->mRelTo == errorVReg)
  8045. {
  8046. scratchVRegInfo->mForceReg = true;
  8047. CheckForce(scratchVRegInfo);
  8048. vregInfo->mRelTo.mVRegIdx = scratchReg.mVRegIdx;
  8049. }
  8050. else if (vregInfo->mRelOffset == errorVReg)
  8051. {
  8052. scratchVRegInfo->mForceReg = true;
  8053. CheckForce(scratchVRegInfo);
  8054. vregInfo->mRelOffset.mVRegIdx = scratchReg.mVRegIdx;
  8055. }
  8056. }
  8057. else
  8058. {
  8059. // This should be impossible - a previous def for an inner expr should have caught this case
  8060. if (vregExprChangeSet.IsEmpty())
  8061. {
  8062. Fail("Error");
  8063. }
  8064. }
  8065. }
  8066. }
  8067. }
  8068. }
  8069. }
  8070. if ((vregInfo->mDbgVariable != NULL) && (vregInfo->mDbgVariable->mPendingInitType != BfIRInitType_NotNeeded))
  8071. pendingInitKind = vregInfo->mDbgVariable->mPendingInitType;
  8072. }
  8073. break;
  8074. case BeMCInstKind_DbgDecl:
  8075. {
  8076. bool isInvalid = false;
  8077. int vregIdx = inst->mArg0.mVRegIdx;
  8078. auto vregInfo = mVRegInfo[vregIdx];
  8079. auto dbgVar = vregInfo->mDbgVariable;
  8080. X64CPURegister regA = X64Reg_None;
  8081. X64CPURegister regB = X64Reg_None;
  8082. int scale = 1;
  8083. int disp = 0;
  8084. BeMCRMMode mode;
  8085. if (dbgVar->mIsValue)
  8086. mode = GetRMParams(inst->mArg0, regA, regB, scale, disp);
  8087. else
  8088. {
  8089. if (inst->mArg0.mKind == BeMCOperandKind_VRegAddr)
  8090. mode = GetRMParams(BeMCOperand::ToLoad(inst->mArg0), regA, regB, scale, disp);
  8091. else
  8092. {
  8093. mode = GetRMParams(inst->mArg0, regA, regB, scale, disp);
  8094. if ((mode != BeMCRMMode_Direct) && (scale != 1) && (disp != 0))
  8095. isInvalid = true;
  8096. }
  8097. }
  8098. if (mode == BeMCRMMode_Invalid)
  8099. {
  8100. if (vregInfo->mType->mSize != 0)
  8101. {
  8102. isInvalid = true;
  8103. }
  8104. }
  8105. else if (mode == BeMCRMMode_Direct)
  8106. {
  8107. if ((regB != X64Reg_None) || (disp != 0) || (scale != 1))
  8108. {
  8109. isInvalid = true;
  8110. }
  8111. }
  8112. else if (mode == BeMCRMMode_Deref)
  8113. {
  8114. if ((regB != X64Reg_None) || (scale != 1))
  8115. {
  8116. isInvalid = true;
  8117. }
  8118. }
  8119. if (isInvalid)
  8120. {
  8121. isFinalRun = false;
  8122. /*ReplaceWithNewVReg(inst->mArg0, instIdx, true, false);
  8123. // The debug value is not representable, so copy it. This can only occur within mixins where we are pointing
  8124. // to composed values
  8125. BF_ASSERT(inst->mArg0.mKind == BeMCOperandKind_VReg);
  8126. inst->mArg0.mKind = BeMCOperandKind_VRegAddr;
  8127. dbgVar->mIsValue = false;
  8128. auto newVRegInfo = mVRegInfo[inst->mArg0.mVRegIdx];
  8129. vregInfo->mDbgVariable = NULL;
  8130. newVRegInfo->mDbgVariable = dbgVar;*/
  8131. // The debug value is not representable
  8132. inst->mArg0.mKind = BeMCOperandKind_VReg;
  8133. vregInfo->mWantsExprActualize = true;
  8134. hasPendingActualizations = true;
  8135. vregExprChangeSet.Add(inst->mArg0.mVRegIdx);
  8136. isFinalRun = false;
  8137. break;
  8138. }
  8139. if (!mVRegInitializedContext.IsSet(inst->mVRegsInitialized, vregIdx))
  8140. {
  8141. if ((dbgVar->mPendingInitType != BfIRInitType_NotNeeded) && (dbgVar->mPendingInitType != BfIRInitType_NotNeeded_AliveOnDecl))
  8142. {
  8143. Fail("Shouldn't happen here anymore");
  8144. /*pendingInitKind = dbgVar->mPendingInitType;
  8145. // We don't need dynLife anymore since we're explicitly writing this
  8146. vregInfo->mHasDynLife = false;
  8147. AllocInst(BeMCInstKind_Def, inst->mArg0, instIdx);
  8148. // We don't definitively need this, it's just to make sure this doesn't cause a liveness error
  8149. isFinalRun = false;*/
  8150. }
  8151. }
  8152. }
  8153. break;
  8154. case BeMCInstKind_MemCpy:
  8155. {
  8156. if (inst->mArg1)
  8157. {
  8158. BF_ASSERT(inst->mArg1.mKind == BeMCOperandKind_VRegPair);
  8159. int* vregIndices[] = { &inst->mArg1.mVRegPair.mVRegIdx0, &inst->mArg1.mVRegPair.mVRegIdx1 };
  8160. for (int* argIdxPtr : vregIndices)
  8161. {
  8162. auto mcArg = BeMCOperand::FromEncoded(*argIdxPtr);
  8163. X64CPURegister regA = X64Reg_None;
  8164. X64CPURegister regB = X64Reg_None;
  8165. int bScale = 1;
  8166. int disp = 0;
  8167. auto form = GetRMParams(mcArg, regA, regB, bScale, disp);
  8168. if ((form != BeMCRMMode_Direct) || (regB != X64Reg_None) || (regA == X64Reg_R11))
  8169. {
  8170. BeMCOperand scratchReg = AllocVirtualReg(GetType(mcArg), 2, true);
  8171. auto vregInfo = GetVRegInfo(scratchReg);
  8172. vregInfo->mDisableR11 = true;
  8173. int insertPos = FindSafeInstInsertPos(instIdx);
  8174. CreateDefineVReg(scratchReg, insertPos);
  8175. AllocInst(BeMCInstKind_Mov, scratchReg, mcArg, insertPos + 1);
  8176. *argIdxPtr = scratchReg.mVRegIdx;
  8177. instIdx += 2;
  8178. isFinalRun = false;
  8179. if (debugging)
  8180. OutputDebugStrF(" MemCpy\n");
  8181. }
  8182. }
  8183. }
  8184. }
  8185. break;
  8186. case BeMCInstKind_MemSet:
  8187. {
  8188. if (inst->mArg1)
  8189. {
  8190. X64CPURegister regA = X64Reg_None;
  8191. X64CPURegister regB = X64Reg_None;
  8192. int bScale = 1;
  8193. int disp = 0;
  8194. auto form = GetRMParams(inst->mArg1, regA, regB, bScale, disp);
  8195. if ((form != BeMCRMMode_Direct) || (regB != X64Reg_None) || (regA == X64Reg_R11) || (disp != 0))
  8196. {
  8197. BeMCOperand scratchReg = AllocVirtualReg(GetType(inst->mArg1), 2, true);
  8198. auto vregInfo = GetVRegInfo(scratchReg);
  8199. vregInfo->mDisableR11 = true;
  8200. int insertPos = FindSafeInstInsertPos(instIdx);
  8201. CreateDefineVReg(scratchReg, insertPos);
  8202. AllocInst(BeMCInstKind_Mov, scratchReg, inst->mArg1, insertPos + 1);
  8203. inst->mArg1 = scratchReg;
  8204. instIdx += 2;
  8205. isFinalRun = false;
  8206. if (debugging)
  8207. OutputDebugStrF(" MemSet\n");
  8208. }
  8209. }
  8210. }
  8211. break;
  8212. case BeMCInstKind_Neg:
  8213. {
  8214. if (arg0Type->IsFloat())
  8215. {
  8216. inst->mKind = BeMCInstKind_Xor;
  8217. if (arg0Type->mTypeCode == BeTypeCode_Float)
  8218. inst->mArg1.mKind = BeMCOperandKind_Immediate_f32_Packed128;
  8219. else
  8220. inst->mArg1.mKind = BeMCOperandKind_Immediate_f64_Packed128;
  8221. inst->mArg1.mImmFloat = -0.0;
  8222. }
  8223. }
  8224. break;
  8225. case BeMCInstKind_Div:
  8226. case BeMCInstKind_IDiv:
  8227. case BeMCInstKind_Rem:
  8228. case BeMCInstKind_IRem:
  8229. {
  8230. // Unsigned div and rem can be implemented with bitwise operations
  8231. // Negative values cannot (at least following C standards, because of rounding issues)
  8232. if ((inst->mKind == BeMCInstKind_Div) || (inst->mKind == BeMCInstKind_Rem))
  8233. {
  8234. if ((!inst->mResult) && (inst->mArg1.IsImmediateInt()) && (IsPowerOfTwo(inst->mArg1.mImmediate)))
  8235. {
  8236. if (inst->mKind == BeMCInstKind_Div)
  8237. {
  8238. int64 divVal = inst->mArg1.mImmediate;
  8239. int shiftCount = 0;
  8240. while (divVal > 1)
  8241. {
  8242. shiftCount++;
  8243. divVal >>= 1;
  8244. }
  8245. inst->mKind = BeMCInstKind_Shr;
  8246. inst->mArg1 = BeMCOperand::FromImmediate(shiftCount);
  8247. isFinalRun = false;
  8248. if (debugging)
  8249. OutputDebugStrF(" Div SHR\n");
  8250. break;
  8251. }
  8252. else if (inst->mKind == BeMCInstKind_Rem)
  8253. {
  8254. inst->mKind = BeMCInstKind_And;
  8255. inst->mArg1 = BeMCOperand::FromImmediate(inst->mArg1.mImmediate - 1);
  8256. isFinalRun = false;
  8257. if (debugging)
  8258. OutputDebugStrF(" Div REM\n");
  8259. break;
  8260. }
  8261. }
  8262. }
  8263. if (arg1.IsImmediate())
  8264. {
  8265. // Oops, must be 'rm'
  8266. ReplaceWithNewVReg(inst->mArg1, instIdx, true, false);
  8267. isFinalRun = false;
  8268. if (debugging)
  8269. OutputDebugStrF(" Div/Rem not RM\n");
  8270. }
  8271. auto arg0Type = GetType(arg0);
  8272. if (arg0Type->IsInt())
  8273. {
  8274. // DIV/IDIV can only operate on the RDX:RAX pair, except for i8 divide which just uses AX
  8275. bool isRegADividend = (arg0.mReg == X64Reg_RAX) || (arg0.mReg == X64Reg_EAX) || (arg0.mReg == X64Reg_AX) || (arg0.mReg == X64Reg_AL);
  8276. if ((!arg0.IsNativeReg()) || (!isRegADividend) ||
  8277. (inst->mKind == BeMCInstKind_Rem) || (inst->mKind == BeMCInstKind_IRem))
  8278. {
  8279. bool preserveRDX = (arg0Type->mSize != 1) && (regPreserveDepth == 0);
  8280. auto mcScratch = BeMCOperand::FromReg(ResizeRegister(X64Reg_RAX, arg0Type->mSize));
  8281. BF_ASSERT(!inst->mResult);
  8282. BeMCInst* preserveRAXInst = AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RAX), instIdx++);
  8283. BeMCInst* preserveRDXInst = NULL;
  8284. if (preserveRDX)
  8285. preserveRDXInst = AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RDX), instIdx++);
  8286. AllocInst(BeMCInstKind_Mov, mcScratch, inst->mArg0, instIdx++);
  8287. if ((inst->mKind == BeMCInstKind_Rem) || (inst->mKind == BeMCInstKind_IRem))
  8288. {
  8289. if (inst->mKind == BeMCInstKind_Rem)
  8290. inst->mKind = BeMCInstKind_Div;
  8291. else
  8292. inst->mKind = BeMCInstKind_IDiv;
  8293. BeMCOperand mcRemaindier;
  8294. if (arg0Type->mSize == 1)
  8295. {
  8296. mcRemaindier = BeMCOperand::FromReg(ResizeRegister(X64Reg_AH, arg0Type->mSize));
  8297. preserveRAXInst->mArg1 = inst->mArg0; // RAX preserve elision exception
  8298. DisableRegister(inst->mArg0, X64Reg_SIL); // Disable Hi8
  8299. }
  8300. else
  8301. {
  8302. mcRemaindier = BeMCOperand::FromReg(ResizeRegister(X64Reg_RDX, arg0Type->mSize));
  8303. preserveRDXInst->mArg1 = inst->mArg0; // RDX preserve elision exception
  8304. auto vregInfo = GetVRegInfo(inst->mArg0);
  8305. if (vregInfo != NULL)
  8306. {
  8307. // This is to avoid overlap with PreserveRAX
  8308. DisableRegister(inst->mArg0, X64Reg_RAX);
  8309. }
  8310. }
  8311. AllocInst(BeMCInstKind_Mov, inst->mArg0, mcRemaindier, instIdx++ + 1);
  8312. }
  8313. else
  8314. {
  8315. preserveRAXInst->mArg1 = inst->mArg0; // RAX preserve elision exception
  8316. AllocInst(BeMCInstKind_Mov, inst->mArg0, mcScratch, instIdx++ + 1);
  8317. }
  8318. inst->mArg0 = mcScratch;
  8319. if (preserveRDX)
  8320. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_RDX), instIdx++ + 1);
  8321. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_RAX), instIdx++ + 1);
  8322. isFinalRun = false;
  8323. if (debugging)
  8324. OutputDebugStrF(" Div/Rem Setup\n");
  8325. }
  8326. else
  8327. {
  8328. if (regPreserveDepth == 0)
  8329. {
  8330. if (arg0Type->mSize != 1)
  8331. {
  8332. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RDX), instIdx++);
  8333. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_RDX), instIdx++ + 1);
  8334. isFinalRun = false; // Reassign regs
  8335. if (debugging)
  8336. OutputDebugStrF(" Div/Rem Preserve\n");
  8337. }
  8338. }
  8339. }
  8340. // We can't allow division by RDX because we need RAX:RDX for the dividend
  8341. auto divisorReg = ResizeRegister(arg1.mReg, 8);
  8342. if ((arg1.IsNativeReg()) &&
  8343. ((divisorReg == X64Reg_RDX) || (divisorReg == X64Reg_RAX)))
  8344. {
  8345. BF_ASSERT(inst->mArg1.IsVRegAny());
  8346. int vregIdx = GetUnderlyingVReg(inst->mArg1.mVRegIdx);
  8347. auto vregInfo = mVRegInfo[vregIdx];
  8348. if (vregInfo != NULL)
  8349. {
  8350. vregInfo->mDisableRAX = true;
  8351. vregInfo->mDisableRDX = true;
  8352. isFinalRun = false;
  8353. if (debugging)
  8354. OutputDebugStrF(" Div/Rem invalid reg\n");
  8355. }
  8356. }
  8357. }
  8358. else if (inst->mKind == BeMCInstKind_IRem)
  8359. {
  8360. SetAndRestoreValue<int*> insertPtr(mInsertInstIdxRef, &instIdx);
  8361. SizedArray<BeMCOperand, 3> args = { inst->mArg0, inst->mArg1 };
  8362. auto mcFunc = BeMCOperand::FromSymbolAddr(mCOFFObject->GetSymbolRef((arg0Type->mTypeCode == BeTypeCode_Double) ? "fmod" : "fmodf")->mIdx);
  8363. auto fmodVal = CreateCall(mcFunc, args, arg0Type);
  8364. inst->mKind = BeMCInstKind_Mov;
  8365. inst->mResult = BeMCOperand();
  8366. inst->mArg1 = fmodVal;
  8367. isFinalRun = false;
  8368. if (debugging)
  8369. OutputDebugStrF(" FMod\n");
  8370. }
  8371. }
  8372. break;
  8373. case BeMCInstKind_Mul:
  8374. case BeMCInstKind_IMul:
  8375. {
  8376. if (arg0Type->mSize == 1)
  8377. {
  8378. if ((!arg0.IsNativeReg()) || (arg0.mReg != X64Reg_AL) || (inst->mResult))
  8379. {
  8380. BF_ASSERT(inst->mResult);
  8381. // Int8 multiplies can only be done on AL
  8382. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RAX), instIdx++);
  8383. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(X64Reg_AL), inst->mArg0, instIdx++);
  8384. AllocInst(BeMCInstKind_Mov, inst->mResult, BeMCOperand::FromReg(X64Reg_AL), instIdx++ + 1);
  8385. inst->mArg0 = BeMCOperand::FromReg(X64Reg_AL);
  8386. inst->mResult = BeMCOperand();
  8387. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_RAX), instIdx++ + 1);
  8388. isFinalRun = false;
  8389. if (debugging)
  8390. OutputDebugStrF(" Mul Size 1\n");
  8391. break;
  8392. }
  8393. if (inst->mArg1.IsImmediateInt())
  8394. {
  8395. ReplaceWithNewVReg(inst->mArg1, instIdx, true, false);
  8396. }
  8397. BF_ASSERT(!inst->mResult);
  8398. }
  8399. else
  8400. {
  8401. if (inst->mResult)
  8402. {
  8403. // The 3-op form of MUL must be in "reg, r/m64, imm" form
  8404. if (!inst->mArg1.IsImmediateInt())
  8405. {
  8406. Fail("Not supported");
  8407. //isFinalRun = false;
  8408. break;
  8409. }
  8410. }
  8411. // Convert from %vreg0 = mul %vreg1, %vreg2
  8412. // To: %scratch = mul %vreg1, %vreg2
  8413. // mov %reg0, %scratch
  8414. if (inst->mResult)
  8415. {
  8416. bool isLegal = true;
  8417. int64 immediateInt = inst->mArg1.GetImmediateInt();
  8418. // if (inst->mKind == BeMCInstKind_Mul)
  8419. // {
  8420. // if (immediateInt > 0xFFFFFFFFLL)
  8421. // isLegal = false;
  8422. // }
  8423. // else
  8424. // {
  8425. // if ((immediateInt < -0x80000000LL) || (immediateInt > 0x7FFFFFFF))
  8426. // isLegal = false;
  8427. // }
  8428. if (!GetFixedOperand(inst->mResult).IsNativeReg())
  8429. {
  8430. BeMCOperand scratchReg = AllocVirtualReg(GetType(inst->mResult), 2, true);
  8431. CreateDefineVReg(scratchReg, instIdx);
  8432. AllocInst(BeMCInstKind_Mov, inst->mResult, scratchReg, instIdx + 2);
  8433. inst->mResult = scratchReg;
  8434. if (debugging)
  8435. OutputDebugStrF(" Mul 3-form not reg\n");
  8436. isFinalRun = false;
  8437. instIdx += 2;
  8438. break;
  8439. }
  8440. }
  8441. else
  8442. {
  8443. if (!GetFixedOperand(inst->mArg0).IsNativeReg())
  8444. {
  8445. auto prevArg0 = inst->mArg0;
  8446. ReplaceWithNewVReg(inst->mArg0, instIdx, true);
  8447. AllocInst(BeMCInstKind_Mov, prevArg0, inst->mArg0, instIdx + 1);
  8448. isFinalRun = false;
  8449. if (debugging)
  8450. OutputDebugStrF(" Mul not reg\n");
  8451. instIdx++;
  8452. break;
  8453. }
  8454. }
  8455. }
  8456. }
  8457. // Fallthrough
  8458. case BeMCInstKind_Add:
  8459. case BeMCInstKind_Sub:
  8460. {
  8461. }
  8462. break;
  8463. case BeMCInstKind_Shl:
  8464. case BeMCInstKind_Shr:
  8465. case BeMCInstKind_Sar:
  8466. {
  8467. if ((!inst->mArg1.IsNativeReg()) && (!inst->mArg1.IsImmediateInt()))
  8468. {
  8469. auto mcShift = inst->mArg1;
  8470. auto shiftType = GetType(mcShift);
  8471. BF_ASSERT(shiftType->IsInt());
  8472. if (shiftType->mSize != 1)
  8473. {
  8474. auto mcShift8 = AllocVirtualReg(mModule->mContext->GetPrimitiveType(BeTypeCode_Int8), 2);
  8475. CreateDefineVReg(mcShift8, instIdx++);
  8476. auto vregInfo = GetVRegInfo(mcShift8);
  8477. vregInfo->mIsExpr = true;
  8478. vregInfo->mRelTo = mcShift;
  8479. mcShift = mcShift8;
  8480. }
  8481. // The only non-constant shift is by 'CL'
  8482. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RCX), instIdx++);
  8483. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(X64Reg_CL), mcShift, instIdx++);
  8484. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_RCX), instIdx++ + 1);
  8485. inst->mArg1 = BeMCOperand::FromReg(X64Reg_RCX);
  8486. isFinalRun = false;
  8487. if (debugging)
  8488. OutputDebugStrF(" Shift by CL\n");
  8489. continue;
  8490. }
  8491. if (inst->mArg1.IsNativeReg())
  8492. {
  8493. BF_ASSERT(inst->mArg1.mReg == X64Reg_RCX);
  8494. X64CPURegister regs[2] = { X64Reg_None, X64Reg_None };
  8495. GetUsedRegs(inst->mArg0, regs[0], regs[1]);
  8496. if ((regs[0] == X64Reg_RCX) || (regs[1] == X64Reg_RCX))
  8497. {
  8498. // Bad reg!
  8499. auto mcTarget = inst->mArg0;
  8500. int insertIdx = instIdx - 1;
  8501. ReplaceWithNewVReg(inst->mArg0, insertIdx, true);
  8502. BF_ASSERT(mcBlock->mInstructions[instIdx + 3]->mKind == BeMCInstKind_RestoreVolatiles);
  8503. AllocInst(BeMCInstKind_Mov, mcTarget, inst->mArg0, instIdx + 4);
  8504. }
  8505. }
  8506. }
  8507. break;
  8508. case BeMCInstKind_Cmp:
  8509. {
  8510. bool needSwap = false;
  8511. // Cmp <imm>, <r/m> is not legal, so we need to swap LHS/RHS, which means also modifying the instruction that uses the result of the cmp
  8512. if (inst->mArg0.IsImmediate())
  8513. needSwap = true;
  8514. if (arg0Type->IsFloat())
  8515. {
  8516. // Cmp <r/m>, <xmm> is not valid, only Cmp <xmm>, <r/m>
  8517. if ((!arg0.IsNativeReg()) && (arg1.IsNativeReg()))
  8518. {
  8519. needSwap = true;
  8520. }
  8521. else
  8522. {
  8523. if (!arg0.IsNativeReg())
  8524. {
  8525. Fail("xmm reg required");
  8526. }
  8527. }
  8528. }
  8529. if (needSwap)
  8530. {
  8531. bool hasConstResult = false;
  8532. int constResult = 0;
  8533. if (inst->mArg1.IsImmediate())
  8534. {
  8535. //constResult = inst->mArg0.mImmediate - inst->mArg1.mImmediate;
  8536. // Should have been handled in the frontend
  8537. ReplaceWithNewVReg(inst->mArg0, instIdx, true);
  8538. break;
  8539. }
  8540. int checkInstIdx = instIdx + 1;
  8541. auto checkBlock = mcBlock;
  8542. for ( ; checkInstIdx < (int)checkBlock->mInstructions.size(); checkInstIdx++)
  8543. {
  8544. auto checkInst = checkBlock->mInstructions[checkInstIdx];
  8545. if ((checkInst->mKind == BeMCInstKind_CondBr) || (checkInst->mKind == BeMCInstKind_CmpToBool))
  8546. {
  8547. if (constResult)
  8548. {
  8549. NotImpl();
  8550. //mcBlock->RemoveInst(instIdx);
  8551. //instIdx--;
  8552. }
  8553. else
  8554. {
  8555. BeMCOperand& cmpArg = (checkInst->mKind == BeMCInstKind_CondBr) ? checkInst->mArg1 : checkInst->mArg0;
  8556. BF_SWAP(inst->mArg0, inst->mArg1);
  8557. BF_ASSERT(cmpArg.mKind == BeMCOperandKind_CmpKind);
  8558. cmpArg.mCmpKind = BeModule::SwapCmpSides(cmpArg.mCmpKind);
  8559. }
  8560. break;
  8561. }
  8562. else if (checkInst->mKind == BeMCInstKind_Br)
  8563. {
  8564. // Sometimes the matching use is in another block
  8565. FindTarget(checkInst->mArg0, checkBlock, checkInstIdx);
  8566. }
  8567. else if ((checkInst->mKind != BeMCInstKind_Def) && (checkInst->mKind != BeMCInstKind_DbgDecl) &&
  8568. (checkInst->mKind != BeMCInstKind_ValueScopeSoftEnd) && (checkInst->mKind != BeMCInstKind_ValueScopeHardEnd))
  8569. {
  8570. Fail("Malformed");
  8571. }
  8572. }
  8573. break;
  8574. }
  8575. }
  8576. break;
  8577. case BeMCInstKind_CmpToBool:
  8578. {
  8579. if (inst->mResult.IsVRegAny())
  8580. {
  8581. if (!mVRegInitializedContext.IsSet(mCurVRegsInit, inst->mResult.mVRegIdx))
  8582. {
  8583. SizedArray<int, 1> addVec = { inst->mResult.mVRegIdx };
  8584. mCurVRegsInit = mVRegInitializedContext.Add(mCurVRegsInit, addVec, true);
  8585. BF_ASSERT(instIdx < (int)mcBlock->mInstructions.size() - 1);
  8586. if (instIdx < (int)mcBlock->mInstructions.size() - 1)
  8587. {
  8588. auto nextInst = mcBlock->mInstructions[instIdx + 1];
  8589. if (nextInst->mVRegsInitialized != NULL)
  8590. {
  8591. auto fixedVRegsInit = mVRegInitializedContext.RemoveChange(nextInst->mVRegsInitialized, inst->mResult.mVRegIdx);
  8592. ReplaceVRegsInit(mcBlock, instIdx + 1, nextInst->mVRegsInitialized, fixedVRegsInit);
  8593. }
  8594. }
  8595. }
  8596. }
  8597. // Do this with a CMOV instead?
  8598. auto result = inst->mResult;
  8599. inst->mResult.mKind = BeMCOperandKind_None;
  8600. inst->mKind = BeMCInstKind_CondBr;
  8601. inst->mArg1 = inst->mArg0; // Move cmpType
  8602. inst->mArg0 = BeMCOperand::FromLabel(mCurLabelIdx);
  8603. int insertInstIdx = instIdx + 1;
  8604. //auto mcInst = AllocInst(BeMCInstKind_CondBr, BeMCOperand::FromLabel(mCurLabelIdx), BeMCOperand::FromCmpKind(BeCmpKind_EQ), insertInstIdx++);
  8605. auto mcInst = AllocInst(BeMCInstKind_Mov, result, BeMCOperand::FromImmediate(0), insertInstIdx++);
  8606. mcInst = AllocInst(BeMCInstKind_Br, BeMCOperand::FromLabel(mCurLabelIdx + 1), insertInstIdx++);
  8607. CreateLabel(insertInstIdx++);
  8608. mcInst = AllocInst(BeMCInstKind_Mov, result, BeMCOperand::FromImmediate(1), insertInstIdx++);
  8609. CreateLabel(insertInstIdx++);
  8610. }
  8611. break;
  8612. case BeMCInstKind_MovSX:
  8613. case BeMCInstKind_Mov:
  8614. {
  8615. bool isSignedExt = inst->mKind == BeMCInstKind_MovSX;
  8616. auto arg0Type = GetType(inst->mArg0);
  8617. auto arg1Type = GetType(inst->mArg1);
  8618. if (inst->mArg1.mKind == BeMCOperandKind_VRegAddr)
  8619. {
  8620. auto vregInfo = mVRegInfo[inst->mArg1.mVRegIdx];
  8621. if ((!vregInfo->mIsExpr) && (!vregInfo->mForceMem))
  8622. {
  8623. Fail("VRegAddr used without ForceMem");
  8624. }
  8625. }
  8626. if (arg0Type->mSize == 0)
  8627. {
  8628. RemoveInst(mcBlock, instIdx);
  8629. instIdx--;
  8630. continue;
  8631. }
  8632. if (arg0Type->IsComposite())
  8633. {
  8634. if (arg1.mKind == BeMCOperandKind_Immediate_i64)
  8635. {
  8636. // This is just a "zero initializer" marker
  8637. BF_ASSERT(arg1.mImmediate == 0);
  8638. SetAndRestoreValue<int*> insertPtr(mInsertInstIdxRef, &instIdx);
  8639. RemoveInst(mcBlock, instIdx);
  8640. CreateMemSet(BeMCOperand::ToAddr(arg0), 0, arg0Type->mSize, arg0Type->mAlign);
  8641. instIdx--;
  8642. isFinalRun = false;
  8643. if (debugging)
  8644. OutputDebugStrF(" Zero init\n");
  8645. break;
  8646. }
  8647. else if (arg1.mKind == BeMCOperandKind_ConstAgg)
  8648. {
  8649. bool needsSaveRegs = true;
  8650. if (instIdx > 0)
  8651. {
  8652. auto prevInst = mcBlock->mInstructions[instIdx - 1];
  8653. if ((prevInst->mKind == BeMCInstKind_PreserveVolatiles) /*&& (prevInst->mArg0.mReg == X64Reg_R11)*/)
  8654. needsSaveRegs = false;
  8655. }
  8656. auto argType = GetType(arg1);
  8657. bool useRep = argType->mSize >= BF_REP_MOV_LIMIT;
  8658. int movInstIdx = instIdx;
  8659. if (needsSaveRegs)
  8660. {
  8661. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_R11), BeMCOperand(), instIdx);
  8662. instIdx += 1;
  8663. if (useRep)
  8664. {
  8665. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RAX), BeMCOperand(), instIdx);
  8666. instIdx += 1;
  8667. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RDI), BeMCOperand(), instIdx);
  8668. instIdx += 1;
  8669. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RCX), BeMCOperand(), instIdx);
  8670. instIdx += 1;
  8671. }
  8672. movInstIdx = instIdx;
  8673. if (useRep)
  8674. {
  8675. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_RCX), BeMCOperand(), instIdx + 1);
  8676. instIdx += 1;
  8677. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_RDI), BeMCOperand(), instIdx + 1);
  8678. instIdx += 1;
  8679. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_RAX), BeMCOperand(), instIdx + 1);
  8680. instIdx += 1;
  8681. }
  8682. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_R11), BeMCOperand(), instIdx + 1);
  8683. instIdx += 1;
  8684. isFinalRun = false;
  8685. }
  8686. X64CPURegister regA = X64Reg_None;
  8687. X64CPURegister regB = X64Reg_None;
  8688. int bScale = 1;
  8689. int disp = 0;
  8690. auto form = GetRMParams(inst->mArg0, regA, regB, bScale, disp);
  8691. if (form == BeMCRMMode_Invalid)
  8692. {
  8693. if (inst->mArg0.IsSymbol())
  8694. {
  8695. // Just make it an addr so we can replace it with a temporary
  8696. inst->mArg0.mKind = BeMCOperandKind_SymbolAddr;
  8697. }
  8698. ReplaceWithNewVReg(inst->mArg0, movInstIdx, true, false);
  8699. auto vregInfo = GetVRegInfo(inst->mArg0);
  8700. vregInfo->mDisableR11 = true;
  8701. instIdx += 2;
  8702. isFinalRun = false;
  8703. }
  8704. continue;
  8705. }
  8706. // Struct = Struct
  8707. else //if (arg1.mKind == BeMCOperandKind_VReg)
  8708. {
  8709. auto arg0Addr = BeMCOperand::ToAddr(arg0);
  8710. auto arg1Addr = BeMCOperand::ToAddr(arg1);
  8711. SetAndRestoreValue<int*> insertPtr(mInsertInstIdxRef, &instIdx);
  8712. RemoveInst(mcBlock, instIdx);
  8713. CreateMemCpy(arg0Addr, arg1Addr, BF_MIN(arg0Type->mSize, arg1Type->mSize), BF_MIN(arg0Type->mAlign, arg1Type->mAlign));
  8714. instIdx--;
  8715. isFinalRun = false;
  8716. if (debugging)
  8717. OutputDebugStrF(" Mov MemCpy\n");
  8718. break;
  8719. }
  8720. }
  8721. if ((arg0Type->IsFloat()) && (arg1Type->IsInt()))
  8722. {
  8723. if ((arg1Type->mTypeCode == BeTypeCode_Int64) && (!isSignedExt))
  8724. {
  8725. //uint64->float
  8726. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RAX), BeMCOperand(), instIdx);
  8727. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(X64Reg_RAX), inst->mArg1, instIdx + 1);
  8728. inst->mArg1 = BeMCOperand::FromReg(X64Reg_RAX);
  8729. inst->mKind = BeMCInstKind_MovSX;
  8730. int labelIdx = CreateLabel(instIdx + 3);
  8731. AllocInst(BeMCInstKind_Test, BeMCOperand::FromReg(X64Reg_RAX), BeMCOperand::FromReg(X64Reg_RAX), instIdx + 3);
  8732. AllocInst(BeMCInstKind_CondBr, BeMCOperand::FromLabel(labelIdx), BeMCOperand::FromCmpKind(BeCmpKind_SGE), instIdx + 4);
  8733. BeMCOperand mcOffset;
  8734. if (arg0Type->mSize == 8)
  8735. mcOffset.mKind = BeMCOperandKind_Immediate_f64;
  8736. else
  8737. mcOffset.mKind = BeMCOperandKind_Immediate_f32;
  8738. mcOffset.mImmFloat = 1.8446744073709552e+19;
  8739. AllocInst(BeMCInstKind_Add, inst->mArg0, mcOffset, instIdx + 5);
  8740. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_RAX), BeMCOperand(), instIdx + 7);
  8741. if (debugging)
  8742. OutputDebugStrF(" uint64->float\n");
  8743. isFinalRun = false;
  8744. instIdx--;
  8745. continue; // Rerun from PreserveVolatiles
  8746. }
  8747. else if ((!isSignedExt) || (arg1Type->mSize < 4))
  8748. {
  8749. // Int->Float conversions only work on 32 and 64-bit signed values, so we
  8750. // zero-extend into a larger scratch vreg and then we do the signed conversion on that.
  8751. // Convert from
  8752. // mov float, uint<bits>
  8753. // to
  8754. // mov scratch int<bits*2>, uint<bits>
  8755. // mov float, scratch int<bits*2>
  8756. if ((arg1.IsNativeReg()) && (arg1Type->mSize == 4))
  8757. {
  8758. // If we already have a 32-bit register, then we know that the upper 32-bits are zeroed
  8759. // so during emission we just use the 64-bit version of that register
  8760. }
  8761. else
  8762. {
  8763. auto mcScratch = AllocVirtualReg(mModule->mContext->GetPrimitiveType(BeTypeCode_Int64), 2, true);
  8764. CreateDefineVReg(mcScratch, instIdx++);
  8765. if ((isSignedExt) && (arg1Type->mSize < 8))
  8766. AllocInst(BeMCInstKind_MovSX, mcScratch, inst->mArg1, instIdx++);
  8767. else
  8768. AllocInst(BeMCInstKind_Mov, mcScratch, inst->mArg1, instIdx++);
  8769. inst->mKind = BeMCInstKind_MovSX;
  8770. inst->mArg1 = mcScratch;
  8771. isFinalRun = false;
  8772. if (debugging)
  8773. OutputDebugStrF(" MovSX\n");
  8774. }
  8775. }
  8776. }
  8777. if (!arg0.IsNativeReg())
  8778. {
  8779. // With f32s we can do a imm32 mov into memory, but there's no imm64 version of that
  8780. if ((arg0Type->mTypeCode == BeTypeCode_Double) && (arg1.IsImmediate()))
  8781. {
  8782. // One option would be to do a "movsd xmm, .rdata" to load up the immediate...
  8783. // and that would leave arg0 with the possibility of binding to a register
  8784. // in a subsequent reg pass, but we don't do that.
  8785. //ReplaceWithNewVReg(inst->mArg1, instIdx, true);
  8786. // We do an int64 load/store, so arg0 must never be allowed to be a register
  8787. if (arg0.IsVReg())
  8788. {
  8789. auto vregInfo = mVRegInfo[arg0.mVRegIdx];
  8790. vregInfo->mForceMem = true;
  8791. CheckForce(vregInfo);
  8792. }
  8793. BeMCOperand castedVReg = AllocVirtualReg(mModule->mContext->GetPrimitiveType(BeTypeCode_Int64), 2, false);
  8794. CreateDefineVReg(castedVReg, instIdx++);
  8795. auto castedVRegInfo = GetVRegInfo(castedVReg);
  8796. castedVRegInfo->mIsExpr = true;
  8797. castedVRegInfo->mRelTo = inst->mArg0;
  8798. BeMCOperand scratchReg = AllocVirtualReg(mModule->mContext->GetPrimitiveType(BeTypeCode_Int64), 2, true);
  8799. CreateDefineVReg(scratchReg, instIdx++);
  8800. AllocInst(BeMCInstKind_Mov, scratchReg, BeMCOperand::FromImmediate(arg1.mImmediate), instIdx++);
  8801. inst->mArg0 = castedVReg;
  8802. inst->mArg1 = scratchReg;
  8803. isFinalRun = false;
  8804. if (debugging)
  8805. OutputDebugStrF(" Movsd\n");
  8806. }
  8807. // Conversion types only work in "r, rm" format
  8808. auto arg0Type = GetType(inst->mArg0);
  8809. auto arg1Type = GetType(inst->mArg1);
  8810. bool isCompat = arg0Type->mSize == arg1Type->mSize;
  8811. if ((arg0Type->IsFloat()) != arg1Type->IsFloat())
  8812. isCompat = false;
  8813. if (!isCompat)
  8814. {
  8815. ReplaceWithNewVReg(inst->mArg0, instIdx, false);
  8816. isFinalRun = false;
  8817. if (debugging)
  8818. OutputDebugStrF(" Mov float rm\n");
  8819. }
  8820. }
  8821. }
  8822. break;
  8823. case BeMCInstKind_XAdd:
  8824. {
  8825. for (int oprIdx = 0; oprIdx < 2; oprIdx++)
  8826. {
  8827. BeMCOperand& origOperand = (oprIdx == 0) ? inst->mArg0 : inst->mArg1;
  8828. if (origOperand.IsVRegAny())
  8829. {
  8830. X64CPURegister regA = X64Reg_None;
  8831. X64CPURegister regB = X64Reg_None;
  8832. int bScale = 1;
  8833. int disp = 0;
  8834. int errorVReg = -1;
  8835. auto rmForm = GetRMParams(origOperand, regA, regB, bScale, disp, &errorVReg);
  8836. auto vregInfo = GetVRegInfo(origOperand);
  8837. bool isValid = true;
  8838. if (oprIdx == 1)
  8839. {
  8840. if (rmForm != BeMCRMMode_Direct)
  8841. {
  8842. auto newVReg = ReplaceWithNewVReg(origOperand, instIdx, true, true);
  8843. auto newVRegInfo = GetVRegInfo(newVReg);
  8844. newVRegInfo->mDisableRAX = true;
  8845. isFinalRun = false;
  8846. }
  8847. }
  8848. }
  8849. }
  8850. }
  8851. break;
  8852. case BeMCInstKind_CmpXChg:
  8853. {
  8854. for (int oprIdx = 0; oprIdx < 2; oprIdx++)
  8855. {
  8856. BeMCOperand& origOperand = (oprIdx == 0) ? inst->mArg0 : inst->mArg1;
  8857. if (origOperand.IsVRegAny())
  8858. {
  8859. X64CPURegister regA = X64Reg_None;
  8860. X64CPURegister regB = X64Reg_None;
  8861. int bScale = 1;
  8862. int disp = 0;
  8863. int errorVReg = -1;
  8864. auto rmForm = GetRMParams(origOperand, regA, regB, bScale, disp, &errorVReg);
  8865. auto vregInfo = GetVRegInfo(origOperand);
  8866. if ((ResizeRegister(regA, 8) == X64Reg_RAX) || (ResizeRegister(regB, 8) == X64Reg_RAX))
  8867. {
  8868. if (!vregInfo->mIsExpr)
  8869. {
  8870. isFinalRun = false;
  8871. vregInfo->mDisableRAX = true;
  8872. continue;
  8873. }
  8874. else
  8875. {
  8876. int safeIdx = FindSafeInstInsertPos(instIdx, true);
  8877. isFinalRun = false;
  8878. auto origType = GetType(origOperand);
  8879. BeMCOperand scratchReg = AllocVirtualReg(mModule->mContext->GetPointerTo(origType), 2, false);
  8880. CreateDefineVReg(scratchReg, safeIdx++);
  8881. AllocInst(BeMCInstKind_Mov, scratchReg, BeMCOperand::ToAddr(origOperand), safeIdx++);
  8882. auto newVRegInfo = GetVRegInfo(scratchReg);
  8883. newVRegInfo->mDisableRAX = true;
  8884. origOperand = scratchReg;
  8885. origOperand.mKind = BeMCOperandKind_VRegLoad;
  8886. continue;
  8887. }
  8888. }
  8889. bool isValid = true;
  8890. if (oprIdx == 1)
  8891. {
  8892. if (rmForm != BeMCRMMode_Direct)
  8893. {
  8894. int safeIdx = FindSafeInstInsertPos(instIdx, true);
  8895. auto newVReg = ReplaceWithNewVReg(origOperand, safeIdx, true, true);
  8896. auto newVRegInfo = GetVRegInfo(newVReg);
  8897. newVRegInfo->mDisableRAX = true;
  8898. isFinalRun = false;
  8899. }
  8900. }
  8901. }
  8902. }
  8903. }
  8904. break;
  8905. case BeMCInstKind_Load:
  8906. {
  8907. // And Load gets converted to a "Load %reg0, [%reg1]"
  8908. // So both mArg0 and mArg1 must be a register
  8909. if (!IsAddressable(arg1))
  8910. {
  8911. // Convert to
  8912. // Mov %scratch, %vreg1
  8913. // Load %vreg0, [%scratch]
  8914. ReplaceWithNewVReg(inst->mArg1, instIdx, true);
  8915. arg1 = GetFixedOperand(inst->mArg1);
  8916. isFinalRun = false;
  8917. if (debugging)
  8918. OutputDebugStrF(" Load\n");
  8919. }
  8920. // Do this one second since the 'insert after' makes instIdx no longer point to the Load inst
  8921. if (!arg0.IsNativeReg())
  8922. {
  8923. // Convert to
  8924. // Load %scratch, [%vreg1]
  8925. // Mov %vreg0, %scratch
  8926. ReplaceWithNewVReg(inst->mArg0, instIdx, false);
  8927. isFinalRun = false;
  8928. if (debugging)
  8929. OutputDebugStrF(" Load 2\n");
  8930. }
  8931. }
  8932. break;
  8933. case BeMCInstKind_Store:
  8934. {
  8935. // Store gets converted to a "Store [reg], reg"
  8936. if (!IsAddressable(arg0))
  8937. {
  8938. // Convert to
  8939. // Mov %scratch, %vreg0
  8940. // Store %scratch, [%vreg1]
  8941. ReplaceWithNewVReg(inst->mArg0, instIdx, true);
  8942. isFinalRun = false;
  8943. if (debugging)
  8944. OutputDebugStrF(" Store\n");
  8945. }
  8946. if (!arg1.IsNativeReg())
  8947. {
  8948. // Convert to
  8949. // Mov %scratch, %vreg1
  8950. // Store %vreg0, [%scratch]
  8951. ReplaceWithNewVReg(inst->mArg1, instIdx, true);
  8952. isFinalRun = false;
  8953. if (debugging)
  8954. OutputDebugStrF(" Store2\n");
  8955. }
  8956. }
  8957. break;
  8958. }
  8959. if ((pendingInitKind != BfIRInitType_NotNeeded) && (pendingInitKind != BfIRInitType_NotNeeded_AliveOnDecl))
  8960. {
  8961. Fail("Shouldn't happen here anymore");
  8962. /*int vregIdx = inst->mArg0.mVRegIdx;
  8963. auto dbgVar = mVRegInfo[vregIdx]->mDbgVariable;
  8964. auto varType = mVRegInfo[vregIdx]->mType;
  8965. auto initType = dbgVar->mPendingInitType;
  8966. if (varType->IsFloat())
  8967. {
  8968. BeMCOperand zeroVal;
  8969. if (varType->mTypeCode == BeTypeCode_Float)
  8970. zeroVal.mKind = BeMCOperandKind_Immediate_f32;
  8971. else
  8972. zeroVal.mKind = BeMCOperandKind_Immediate_f64;
  8973. if (initType == BfIRInitType_Uninitialized)
  8974. zeroVal.mImmFloat = NAN;
  8975. else
  8976. zeroVal.mImmFloat = 0;
  8977. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromVReg(vregIdx), zeroVal, instIdx + 1);
  8978. }
  8979. else if (varType->IsComposite())
  8980. {
  8981. SetAndRestoreValue<int*> insertPtr(mInsertInstIdxRef, &instIdx);
  8982. instIdx++;
  8983. uint8 val = (initType == BfIRInitType_Uninitialized) ? 0xCC : 0;
  8984. CreateMemSet(BeMCOperand::FromVRegAddr(vregIdx), val, varType->mSize, varType->mAlign);
  8985. instIdx--;
  8986. isFinalRun = false;
  8987. }
  8988. else
  8989. {
  8990. int64 val = (initType == BfIRInitType_Uninitialized) ? (int64)0xCCCCCCCCCCCCCCCCLL : 0;
  8991. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromVReg(vregIdx), BeMCOperand::FromImmediate(val), instIdx + 1);
  8992. }
  8993. dbgVar->mPendingInitType = BfIRInitType_NotNeeded;*/
  8994. }
  8995. }
  8996. }
  8997. BF_ASSERT(regPreserveDepth == 0);
  8998. SetCurrentInst(NULL);
  8999. if (hasPendingActualizations)
  9000. {
  9001. DoActualization();
  9002. isFinalRun = false;
  9003. if (debugging)
  9004. OutputDebugStrF(" DoActualizations\n");
  9005. }
  9006. return isFinalRun;
  9007. }
  9008. void BeMCContext::DoSanityChecking()
  9009. {
  9010. for (auto mcBlock : mBlocks)
  9011. {
  9012. mActiveBlock = mcBlock;
  9013. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size() - 1; instIdx++)
  9014. {
  9015. auto inst = mcBlock->mInstructions[instIdx];
  9016. auto nextInst = mcBlock->mInstructions[instIdx + 1];
  9017. auto dest = inst->GetDest();
  9018. if (dest == NULL)
  9019. continue;
  9020. auto vregInfo = GetVRegInfo(*dest);
  9021. if ((vregInfo != NULL) && (vregInfo->mHasDynLife))
  9022. {
  9023. if ((nextInst->mVRegsInitialized != NULL) && (!mVRegInitializedContext.IsSet(nextInst->mVRegsInitialized, dest->mVRegIdx)))
  9024. {
  9025. if (nextInst->mKind != BeMCInstKind_RestoreVolatiles)
  9026. {
  9027. // It's possible during legalization to extend the usage of a dynLife value 'upward', and we need
  9028. // to ensure we also extend the init flags up as well
  9029. Fail("Invalid liveness - from init flag not being set properly?");
  9030. }
  9031. }
  9032. }
  9033. }
  9034. }
  9035. }
  9036. void BeMCContext::DoBlockCombine()
  9037. {
  9038. auto masterBlock = mMCBlockAlloc.Alloc();
  9039. mActiveBlock = masterBlock;
  9040. for (auto mcBlock : mBlocks)
  9041. {
  9042. mcBlock->mLabelIdx = mCurLabelIdx++;
  9043. }
  9044. for (auto mcBlock : mBlocks)
  9045. {
  9046. auto inst = AllocInst();
  9047. inst->mKind = BeMCInstKind_Label;
  9048. inst->mArg0.mKind = BeMCOperandKind_Label;
  9049. inst->mArg0.mLabelIdx = mcBlock->mLabelIdx;
  9050. for (auto blockInst : mcBlock->mInstructions)
  9051. {
  9052. if (inst->mDbgLoc == NULL)
  9053. inst->mDbgLoc = blockInst->mDbgLoc;
  9054. auto operands = { &blockInst->mArg0, &blockInst->mArg1 };
  9055. for (auto op : operands)
  9056. {
  9057. if (op->mKind == BeMCOperandKind_Block)
  9058. {
  9059. op->mKind = BeMCOperandKind_Label;
  9060. op->mLabelIdx = op->mBlock->mLabelIdx;
  9061. }
  9062. }
  9063. masterBlock->mInstructions.push_back(blockInst);
  9064. }
  9065. }
  9066. mBlocks.Clear();
  9067. mBlocks.push_back(masterBlock);
  9068. }
  9069. bool BeMCContext::DoJumpRemovePass()
  9070. {
  9071. struct LabelStats
  9072. {
  9073. public:
  9074. bool mHasRefs;
  9075. bool mForceKeepLabel;
  9076. bool mFromMultipleDbgLocs;
  9077. // If all branches share the dbgLoc with the first inst then we can potentially do a remap
  9078. BeDbgLoc* mRefDbgLoc;
  9079. public:
  9080. LabelStats()
  9081. {
  9082. mHasRefs = false;
  9083. mForceKeepLabel = false;
  9084. mFromMultipleDbgLocs = false;
  9085. mRefDbgLoc = NULL;
  9086. }
  9087. };
  9088. bool didWork = false;
  9089. SizedArray<LabelStats, 32> labelStats;
  9090. labelStats.resize(mCurLabelIdx);
  9091. Dictionary<int, int> labelRemaps;
  9092. for (auto& switchEntry : mSwitchEntries)
  9093. {
  9094. labelStats[switchEntry.mBlock->mLabelIdx].mForceKeepLabel = true;
  9095. labelStats[switchEntry.mBlock->mLabelIdx].mHasRefs = true;
  9096. }
  9097. for (auto mcBlock : mBlocks)
  9098. {
  9099. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  9100. {
  9101. auto inst = mcBlock->mInstructions[instIdx];
  9102. if (inst->mKind == BeMCInstKind_Label)
  9103. {
  9104. if (instIdx < (int)mcBlock->mInstructions.size() - 2)
  9105. {
  9106. auto nextInst = mcBlock->mInstructions[instIdx + 1];
  9107. if (nextInst->mDbgLoc != NULL)
  9108. {
  9109. auto& stats = labelStats[inst->mArg0.mLabelIdx];
  9110. if ((stats.mRefDbgLoc != NULL) && (stats.mRefDbgLoc != nextInst->mDbgLoc))
  9111. stats.mFromMultipleDbgLocs = true;
  9112. else
  9113. stats.mRefDbgLoc = nextInst->mDbgLoc;
  9114. }
  9115. }
  9116. }
  9117. else
  9118. {
  9119. auto operands = { &inst->mArg0, &inst->mArg1 };
  9120. for (auto operand : operands)
  9121. {
  9122. if (operand->mKind == BeMCOperandKind_Label)
  9123. {
  9124. labelStats[operand->mLabelIdx].mHasRefs = true;
  9125. if (inst->mDbgLoc != NULL)
  9126. {
  9127. auto& stats = labelStats[operand->mLabelIdx];
  9128. if ((stats.mRefDbgLoc != NULL) && (stats.mRefDbgLoc != inst->mDbgLoc))
  9129. stats.mFromMultipleDbgLocs = true;
  9130. else
  9131. stats.mRefDbgLoc = inst->mDbgLoc;
  9132. }
  9133. }
  9134. }
  9135. }
  9136. }
  9137. }
  9138. for (auto mcBlock : mBlocks)
  9139. {
  9140. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  9141. {
  9142. auto inst = mcBlock->mInstructions[instIdx];
  9143. bool goBackToLastBranch = false;
  9144. bool removeInst = false;
  9145. // If we're just jumping to the next label, remove jump
  9146. // It's possible there are several labels in a row here, so check against all of them
  9147. if (inst->mKind == BeMCInstKind_Br)
  9148. {
  9149. if (inst->mArg0.mKind == BeMCOperandKind_Label)
  9150. {
  9151. for (int labelInstIdx = instIdx + 1; labelInstIdx < (int)mcBlock->mInstructions.size(); labelInstIdx++)
  9152. {
  9153. auto labelInst = mcBlock->mInstructions[labelInstIdx];
  9154. if (labelInst->mKind != BeMCInstKind_Label)
  9155. {
  9156. if (labelInst->IsPsuedo())
  9157. continue;
  9158. break;
  9159. }
  9160. if (inst->mArg0 == labelInst->mArg0)
  9161. {
  9162. didWork = true;
  9163. inst->mKind = inst->mArg1 ? BeMCInstKind_Nop : BeMCInstKind_EnsureInstructionAt;
  9164. inst->mArg0 = BeMCOperand();
  9165. inst->mArg1 = BeMCOperand();
  9166. goBackToLastBranch = true;
  9167. break;
  9168. }
  9169. }
  9170. }
  9171. }
  9172. if (removeInst)
  9173. {
  9174. mcBlock->mInstructions.RemoveAt(instIdx);
  9175. instIdx--;
  9176. continue;
  9177. }
  9178. // Do we have a label that immediately branches?
  9179. if (inst->mKind == BeMCInstKind_Label)
  9180. {
  9181. // We can only remap this if the contained instructions and all references share the same dbgLoc
  9182. if ((instIdx < (int)mcBlock->mInstructions.size() - 2) && (!labelStats[inst->mArg0.mLabelIdx].mFromMultipleDbgLocs))
  9183. {
  9184. bool allowRemove = true;
  9185. auto nextInst = mcBlock->mInstructions[instIdx + 1];
  9186. auto nextNextInst = mcBlock->mInstructions[instIdx + 2];
  9187. if ((nextInst->mKind == BeMCInstKind_Br) &&
  9188. ((inst->mDbgLoc == NULL) || (inst->mDbgLoc == nextNextInst->mDbgLoc)) &&
  9189. (!labelStats[inst->mArg0.mLabelIdx].mForceKeepLabel))
  9190. {
  9191. int checkIdx = instIdx - 1;
  9192. while (checkIdx >= 0)
  9193. {
  9194. auto prevInst = mcBlock->mInstructions[checkIdx];
  9195. if (prevInst->mKind == BeMCInstKind_Label)
  9196. {
  9197. // Keep looking
  9198. }
  9199. else if (prevInst->mKind == BeMCInstKind_Br)
  9200. {
  9201. break;
  9202. }
  9203. else
  9204. {
  9205. // We flowed into here, so we can't remove this branch
  9206. allowRemove = false;
  9207. break;
  9208. }
  9209. checkIdx--;
  9210. }
  9211. /*if (labelStats[inst->mArg0.mLabelIdx].mFromMultipleDbgLocs)
  9212. allowRemove = false;*/
  9213. didWork = true;
  9214. RemoveInst(mcBlock, instIdx); // Remove label
  9215. labelRemaps.TryAdd(inst->mArg0.mLabelIdx, nextInst->mArg0.mLabelIdx);
  9216. if (allowRemove)
  9217. {
  9218. RemoveInst(mcBlock, instIdx); // Remove branch
  9219. goBackToLastBranch = true;
  9220. }
  9221. }
  9222. }
  9223. }
  9224. if (goBackToLastBranch)
  9225. {
  9226. // We may be able to remove the previous branch now
  9227. int checkIdx = instIdx - 1;
  9228. while (checkIdx >= 0)
  9229. {
  9230. auto checkInst = mcBlock->mInstructions[checkIdx];
  9231. if (checkInst->mKind == BeMCInstKind_Br)
  9232. {
  9233. instIdx = checkIdx - 1;
  9234. break;
  9235. }
  9236. else if (checkInst->mKind != BeMCInstKind_Label)
  9237. break;
  9238. checkIdx--;
  9239. }
  9240. continue;
  9241. }
  9242. }
  9243. }
  9244. if (!labelRemaps.IsEmpty())
  9245. {
  9246. while (true)
  9247. {
  9248. bool didRemapMerge = false;
  9249. for (auto& remapPair : labelRemaps)
  9250. {
  9251. //auto itr = labelRemaps.find(remapPair.second);
  9252. //if (itr != labelRemaps.end())
  9253. int* valuePtr = NULL;
  9254. if (labelRemaps.TryGetValue(remapPair.mValue, &valuePtr))
  9255. {
  9256. //remapPair.second = itr->second;
  9257. remapPair.mValue = *valuePtr;
  9258. didRemapMerge = true;
  9259. }
  9260. }
  9261. if (!didRemapMerge)
  9262. break;
  9263. }
  9264. for (auto mcBlock : mBlocks)
  9265. {
  9266. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  9267. {
  9268. auto inst = mcBlock->mInstructions[instIdx];
  9269. auto operands = { &inst->mArg0, &inst->mArg1 };
  9270. for (auto operand : operands)
  9271. {
  9272. if (operand->mKind == BeMCOperandKind_Label)
  9273. {
  9274. //auto itr = labelRemaps.find(operand->mLabelIdx);
  9275. //if (itr != labelRemaps.end())
  9276. int* valuePtr = NULL;
  9277. if (labelRemaps.TryGetValue(operand->mLabelIdx, &valuePtr))
  9278. {
  9279. labelStats[operand->mLabelIdx].mHasRefs = false;
  9280. //operand->mLabelIdx = itr->second;
  9281. operand->mLabelIdx = *valuePtr;
  9282. labelStats[operand->mLabelIdx].mHasRefs = true;
  9283. }
  9284. }
  9285. }
  9286. }
  9287. }
  9288. }
  9289. for (auto mcBlock : mBlocks)
  9290. {
  9291. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  9292. {
  9293. auto inst = mcBlock->mInstructions[instIdx];
  9294. bool goBackToLastBranch = false;
  9295. }
  9296. }
  9297. // Remove unreferenced labels
  9298. for (auto mcBlock : mBlocks)
  9299. {
  9300. bool doMorePasses = false;
  9301. bool isUnreachable = false;
  9302. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  9303. {
  9304. auto inst = mcBlock->mInstructions[instIdx];
  9305. if (inst->mKind == BeMCInstKind_Label)
  9306. {
  9307. isUnreachable = false;
  9308. if (!labelStats[inst->mArg0.mLabelIdx].mHasRefs)
  9309. {
  9310. didWork = true;
  9311. mcBlock->mInstructions.RemoveAt(instIdx);
  9312. instIdx--;
  9313. }
  9314. }
  9315. if (inst->mKind == BeMCInstKind_CondBr)
  9316. doMorePasses = true;
  9317. if (inst->mKind == BeMCInstKind_Br)
  9318. {
  9319. if (isUnreachable)
  9320. {
  9321. // We can't possible reach this branch. This is an artifact of other br removals
  9322. didWork = true;
  9323. RemoveInst(mcBlock, instIdx);
  9324. instIdx--;
  9325. continue;
  9326. }
  9327. isUnreachable = true;
  9328. }
  9329. }
  9330. if (doMorePasses)
  9331. {
  9332. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  9333. {
  9334. auto inst = mcBlock->mInstructions[instIdx];
  9335. // For the form:
  9336. // CondBr %label0, eq
  9337. // Br %label1
  9338. // %label0:
  9339. // Invert condition and convert that to
  9340. // CondBr %label1, neq
  9341. // %label0:
  9342. // We perform this after the jump-removal process to ensure we compare against the correct
  9343. // final label positions, otherwise there are cases where we would incorrectly apply this
  9344. // transformation early and end up with worse results than just not doing it
  9345. if (inst->mKind == BeMCInstKind_CondBr)
  9346. {
  9347. if (instIdx < (int)mcBlock->mInstructions.size() - 2)
  9348. {
  9349. int nextIdx = instIdx + 1;
  9350. int nextNextIdx = instIdx + 2;
  9351. auto nextInst = mcBlock->mInstructions[nextIdx];
  9352. if (nextInst->mKind == BeMCInstKind_EnsureInstructionAt)
  9353. {
  9354. if (nextInst->mDbgLoc != inst->mDbgLoc)
  9355. continue;
  9356. nextIdx++;
  9357. nextNextIdx++;
  9358. nextInst = mcBlock->mInstructions[nextIdx];
  9359. }
  9360. auto nextNextInst = mcBlock->mInstructions[nextNextIdx];
  9361. if ((nextInst->mKind == BeMCInstKind_Br) &&
  9362. (nextNextInst->mKind == BeMCInstKind_Label) && (inst->mArg0 == nextNextInst->mArg0))
  9363. {
  9364. didWork = true;
  9365. inst->mArg0 = nextInst->mArg0;
  9366. BF_ASSERT(inst->mArg1.mKind == BeMCOperandKind_CmpKind);
  9367. inst->mArg1.mCmpKind = BeModule::InvertCmp(inst->mArg1.mCmpKind);
  9368. mcBlock->mInstructions.RemoveAt(nextIdx);
  9369. }
  9370. }
  9371. }
  9372. }
  9373. }
  9374. }
  9375. return didWork;
  9376. }
  9377. void BeMCContext::DoRegFinalization()
  9378. {
  9379. SizedArray<int, 32> savedVolatileVRegs;
  9380. mUsedRegs.Clear();
  9381. SetCurrentInst(NULL);
  9382. // Remove the Def instructions, replace vreg
  9383. for (auto mcBlock : mBlocks)
  9384. {
  9385. mActiveBlock = mcBlock;
  9386. for (int instIdx = 0; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  9387. {
  9388. auto inst = mcBlock->mInstructions[instIdx];
  9389. SetCurrentInst(inst);
  9390. if (inst->IsDef())
  9391. {
  9392. auto vregInfo = GetVRegInfo(inst->mArg0);
  9393. if (vregInfo->mDbgVariable != NULL)
  9394. vregInfo->mAwaitingDbgStart = true;
  9395. RemoveInst(mcBlock, instIdx);
  9396. instIdx--;
  9397. continue;
  9398. }
  9399. // This is similar to an optimization we have in DoLegalization, but it allows for directRelTo's to match
  9400. // We can't match those in DoLegalization because it would alter the liveness
  9401. if (inst->mKind == BeMCInstKind_Mov)
  9402. {
  9403. // Useless mov, remove it
  9404. if (OperandsEqual(inst->mArg0, inst->mArg1, false))
  9405. {
  9406. if (inst->mDbgLoc != NULL)
  9407. {
  9408. inst->mKind = BeMCInstKind_EnsureInstructionAt;
  9409. inst->mArg0 = BeMCOperand();
  9410. inst->mArg1 = BeMCOperand();
  9411. }
  9412. else
  9413. {
  9414. RemoveInst(mcBlock, instIdx);
  9415. instIdx--;
  9416. }
  9417. continue;
  9418. }
  9419. }
  9420. if ((inst->mKind >= BeMCInstKind_Def) && (inst->mKind <= BeMCInstKind_LifetimeEnd))
  9421. continue;
  9422. if (inst->mResult == inst->mArg0)
  9423. {
  9424. // Destination is implicitly arg0
  9425. inst->mResult.mKind = BeMCOperandKind_None;
  9426. }
  9427. // Unfortunate rule:
  9428. // if we end up with:
  9429. // PreserveVolatiles RAX
  9430. // Shl vreg0<RCX>, CL
  9431. // RestoreVolatiles RAXS
  9432. // Then convert that to
  9433. // PreserveVolatiles RAX
  9434. // Shl <SavedLoc>, RAX
  9435. // RestoreVolatiles RAX
  9436. /*if ((inst->mKind == BeMCInstKind_Shl) ||
  9437. (inst->mKind == BeMCInstKind_Shr) ||
  9438. (inst->mKind == BeMCInstKind_Sar))
  9439. {
  9440. if (inst->mArg1.IsNativeReg())
  9441. {
  9442. }
  9443. }*/
  9444. auto operands = { &inst->mResult, &inst->mArg0, &inst->mArg1 };
  9445. for (auto operand : operands)
  9446. {
  9447. BeMCOperand checkOperand = *operand;
  9448. while (true)
  9449. {
  9450. auto vregInfo = GetVRegInfo(checkOperand);
  9451. if (vregInfo == NULL)
  9452. break;
  9453. // We may think that range starts should always occur on a "mov <vreg>, <value>", but
  9454. // we have some cases like un-splatting into a composite, or using an uninitialized local
  9455. // variable where we want to start the range on ANY use, not just a direct assignment
  9456. if (vregInfo->mAwaitingDbgStart)
  9457. {
  9458. //AllocInst(BeMCInstKind_DbgRangeStart, checkOperand, instIdx + 1);
  9459. //vregInfo->mAwaitingDbgStart = false;
  9460. }
  9461. if (!vregInfo->mRelTo)
  9462. break;
  9463. checkOperand = vregInfo->mRelTo;
  9464. }
  9465. FixOperand(*operand);
  9466. if (operand->mKind == BeMCOperandKind_NativeReg)
  9467. {
  9468. auto nativeReg = ResizeRegister(operand->mReg, 8);
  9469. BF_ASSERT(nativeReg != X64Reg_None);
  9470. if (nativeReg != X64Reg_RSP) // This can happen from allocas
  9471. mUsedRegs.Add(nativeReg);
  9472. }
  9473. }
  9474. if (inst->IsMov())
  9475. {
  9476. bool removeInst = false;
  9477. if (inst->mArg0 == inst->mArg1)
  9478. {
  9479. removeInst = true;
  9480. }
  9481. if ((inst->mArg0.IsNativeReg()) && (inst->mArg1.IsNativeReg()))
  9482. {
  9483. // Removes size-reducing moves such as "mov eax, rax"
  9484. if (ResizeRegister(inst->mArg0.mReg, 8) == inst->mArg1.mReg)
  9485. {
  9486. removeInst = true;
  9487. }
  9488. }
  9489. if (removeInst)
  9490. {
  9491. inst->mKind = BeMCInstKind_EnsureInstructionAt;
  9492. inst->mResult = BeMCOperand();
  9493. inst->mArg0 = BeMCOperand();
  9494. inst->mArg1 = BeMCOperand();
  9495. }
  9496. }
  9497. switch (inst->mKind)
  9498. {
  9499. case BeMCInstKind_PreserveVolatiles:
  9500. {
  9501. if (mDebugging)
  9502. {
  9503. NOP;
  9504. }
  9505. int preserveIdx;
  9506. BeMCInst* preserveInst;
  9507. BeMCInst* restoreInst;
  9508. if (inst->mKind == BeMCInstKind_PreserveVolatiles)
  9509. {
  9510. preserveIdx = instIdx;
  9511. preserveInst = inst;
  9512. restoreInst = mcBlock->mInstructions[FindRestoreVolatiles(mcBlock, instIdx)];
  9513. }
  9514. else
  9515. {
  9516. preserveIdx = FindPreserveVolatiles(mcBlock, instIdx);
  9517. preserveInst = mcBlock->mInstructions[preserveIdx];
  9518. restoreInst = inst;
  9519. }
  9520. int insertIdx = instIdx;
  9521. if ((inst->mArg0.IsNativeReg()) && (inst->mArg1.IsNativeReg()))
  9522. {
  9523. // If our exception (IE: div target) is set to the desired preserve reg then
  9524. if (inst->mArg0.mReg == ResizeRegister(inst->mArg1.mReg, 8))
  9525. break;
  9526. }
  9527. // Save volatile registers
  9528. for (int liveVRegIdx : *inst->mLiveness)
  9529. {
  9530. if (liveVRegIdx >= mLivenessContext.mNumItems)
  9531. continue;
  9532. auto checkVRegIdx = GetUnderlyingVReg(liveVRegIdx);
  9533. // Already handled the underlying vreg?
  9534. if ((checkVRegIdx != liveVRegIdx) && (mLivenessContext.IsSet(preserveInst->mLiveness, checkVRegIdx)))
  9535. continue;
  9536. auto vregInfo = mVRegInfo[checkVRegIdx];
  9537. if (vregInfo->mReg != X64Reg_None)
  9538. {
  9539. // Do we specify a particular reg, or just all volatiles?
  9540. if ((inst->mArg0.IsNativeReg()) && (inst->mArg0.mReg != ResizeRegister(vregInfo->mReg, 8)))
  9541. continue;
  9542. if (!mLivenessContext.IsSet(restoreInst->mLiveness, liveVRegIdx))
  9543. {
  9544. // This vreg doesn't survive until the PreserveRegs -- it's probably used for params or the call addr
  9545. continue;
  9546. }
  9547. if (IsVolatileReg(vregInfo->mReg))
  9548. {
  9549. if (vregInfo->mVolatileVRegSave == -1)
  9550. {
  9551. BF_ASSERT(inst->mKind != BeMCInstKind_RestoreVolatiles); // Should have already been allocated
  9552. auto savedVReg = AllocVirtualReg(vregInfo->mType);
  9553. auto savedVRegInfo = mVRegInfo[savedVReg.mVRegIdx];
  9554. savedVRegInfo->mForceMem = true;
  9555. vregInfo->mVolatileVRegSave = savedVReg.mVRegIdx;
  9556. }
  9557. savedVolatileVRegs.push_back(checkVRegIdx);
  9558. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromVReg(vregInfo->mVolatileVRegSave), GetVReg(checkVRegIdx), insertIdx++);
  9559. instIdx++;
  9560. }
  9561. }
  9562. }
  9563. bool savingSpecificReg = false;
  9564. if (inst->mArg0)
  9565. {
  9566. if (inst->mArg0.IsNativeReg())
  9567. savingSpecificReg = true;
  9568. else
  9569. BF_ASSERT(inst->mArg0.mKind == BeMCOperandKind_PreserveFlag);
  9570. }
  9571. // Full PreserveRegs case:
  9572. // Check register crossover errors, ie:
  9573. // Mov RCX, reg0<RDX>
  9574. // Mov RDX, reg1<RCX>
  9575. if (!savingSpecificReg)
  9576. {
  9577. int preserveIdx = instIdx;
  9578. bool regsFailed = false;
  9579. for (int pass = 0; true; pass++)
  9580. {
  9581. bool regStomped[X64Reg_COUNT] = { false };
  9582. bool regFailed[X64Reg_COUNT] = { false };
  9583. regsFailed = false;
  9584. bool isFinalPass = pass == 4;
  9585. int instEndIdx = -1;
  9586. for (int instIdx = preserveIdx + 1; instIdx < (int)mcBlock->mInstructions.size(); instIdx++)
  9587. {
  9588. auto inst = mcBlock->mInstructions[instIdx];
  9589. if ((inst->mKind == BeMCInstKind_RestoreVolatiles) ||
  9590. (inst->mKind == BeMCInstKind_Call))
  9591. {
  9592. instEndIdx = instIdx;
  9593. if (inst->mKind == BeMCInstKind_Call)
  9594. {
  9595. X64CPURegister regA = X64Reg_None;
  9596. X64CPURegister regB = X64Reg_None;
  9597. int bScale = 1;
  9598. int disp = 0;
  9599. GetRMParams(inst->mArg0, regA, regB, bScale, disp);
  9600. if (((regA != X64Reg_None) && (regA != X64Reg_RAX) && (regStomped[regA])) ||
  9601. ((regB != X64Reg_None) && (regStomped[regB])))
  9602. {
  9603. BF_ASSERT(pass == 0);
  9604. // Target is stomped! Mov to RAX and then handle it along with the generalized reg setup
  9605. auto callTarget = BeMCOperand::FromReg(X64Reg_RAX);
  9606. AllocInst(BeMCInstKind_Mov, callTarget, inst->mArg0, preserveIdx + 1);
  9607. inst->mArg0 = callTarget;
  9608. regsFailed = true; // So we'll rerun taking into account the new RAX reg
  9609. instEndIdx++;
  9610. }
  9611. }
  9612. break;
  9613. }
  9614. if (inst->mKind == BeMCInstKind_Def)
  9615. {
  9616. // If we have a Def here, it's because of a legalization that introduced a variable in a non-safe position
  9617. Fail("Illegal def");
  9618. }
  9619. if (inst->mKind == BeMCInstKind_Mov)
  9620. {
  9621. X64CPURegister regs[2] = { X64Reg_None, X64Reg_None };
  9622. GetUsedRegs(inst->mArg1, regs[0], regs[1]);
  9623. bool isStomped = false;
  9624. for (auto reg : regs)
  9625. {
  9626. if (reg != X64Reg_None)
  9627. {
  9628. if (regStomped[reg])
  9629. {
  9630. regsFailed = true;
  9631. isStomped = true;
  9632. regFailed[reg] = true;
  9633. }
  9634. }
  9635. }
  9636. // Don't swap on the final pass, we need regsFailed to be accurate so this is just a
  9637. // verification pass
  9638. if ((isStomped) && (!isFinalPass))
  9639. {
  9640. // Bubble up, maybe a reordering will fix our issue
  9641. BF_SWAP(mcBlock->mInstructions[instIdx - 1], mcBlock->mInstructions[instIdx]);
  9642. }
  9643. if (inst->mArg0.IsNativeReg())
  9644. {
  9645. auto reg = ResizeRegister(inst->mArg0.mReg, 8);
  9646. regStomped[(int)reg] = true;
  9647. }
  9648. }
  9649. }
  9650. if (!regsFailed)
  9651. break;
  9652. if (isFinalPass)
  9653. {
  9654. // We've failed to reorder
  9655. int deferredIdx = 0;
  9656. for (int instIdx = preserveIdx + 1; instIdx < instEndIdx; instIdx++)
  9657. {
  9658. auto inst = mcBlock->mInstructions[instIdx];
  9659. if ((inst->mKind == BeMCInstKind_RestoreVolatiles) ||
  9660. (inst->mKind == BeMCInstKind_Call))
  9661. break;
  9662. if (inst->mKind == BeMCInstKind_Mov)
  9663. {
  9664. if (inst->mArg0.IsNativeReg())
  9665. {
  9666. auto reg = ResizeRegister(inst->mArg0.mReg, 8);
  9667. if (regFailed[(int)reg])
  9668. {
  9669. // Convert
  9670. // Mov <reg>, vreg0
  9671. // To
  9672. // Push vreg0
  9673. // ...
  9674. // Pop <reg>
  9675. auto mcPopReg = inst->mArg0;
  9676. auto popType = GetType(mcPopReg);
  9677. if (!popType->IsFloat())
  9678. mcPopReg.mReg = ResizeRegister(mcPopReg.mReg, 8);
  9679. auto pushType = GetType(inst->mArg1);
  9680. auto useTypeCode = pushType->IsFloat() ? pushType->mTypeCode : BeTypeCode_Int64;
  9681. BF_ASSERT(deferredIdx < 4);
  9682. auto mcDeferred = GetCallArgVReg(deferredIdx++, useTypeCode);
  9683. CreateDefineVReg(BeMCOperand::FromVReg(mcDeferred.mVRegIdx), instIdx++);
  9684. instEndIdx++;
  9685. auto popInst = AllocInst(BeMCInstKind_Mov, mcPopReg, mcDeferred, instEndIdx);
  9686. //auto popInst = AllocInst(BeMCInstKind_Pop, mcPopReg, instEndIdx);
  9687. auto arg1 = inst->mArg1;
  9688. FixOperand(arg1);
  9689. if (arg1.IsNativeReg())
  9690. {
  9691. inst->mKind = BeMCInstKind_Mov;
  9692. inst->mArg0 = mcDeferred;
  9693. if (!popType->IsFloat())
  9694. inst->mArg1 = BeMCOperand::FromReg(ResizeRegister(arg1.mReg, 8));
  9695. else
  9696. inst->mArg1 = BeMCOperand::FromReg(arg1.mReg);
  9697. }
  9698. else
  9699. {
  9700. // Use R11 or XMM5 as our temporary - they are the least likely volatiles to be
  9701. // allocated, so we may not need to restore them after using them
  9702. X64CPURegister scratchReg;
  9703. if (pushType->mTypeCode == BeTypeCode_Float)
  9704. scratchReg = X64Reg_XMM5_f32;
  9705. else if (pushType->mTypeCode == BeTypeCode_Double)
  9706. scratchReg = X64Reg_XMM5_f64;
  9707. else
  9708. scratchReg = X64Reg_R11;
  9709. int volatileVRegSave = -1;
  9710. for (auto vregIdx : savedVolatileVRegs)
  9711. {
  9712. auto vregInfo = mVRegInfo[vregIdx];
  9713. if (ResizeRegister(vregInfo->mReg, 8) == scratchReg)
  9714. {
  9715. volatileVRegSave = vregInfo->mVolatileVRegSave;
  9716. }
  9717. }
  9718. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(scratchReg), inst->mArg1, instIdx++);
  9719. instEndIdx++;
  9720. inst->mKind = BeMCInstKind_Mov;
  9721. inst->mArg0 = mcDeferred;
  9722. inst->mArg1 = BeMCOperand::FromReg(scratchReg);
  9723. if (volatileVRegSave != -1)
  9724. {
  9725. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(scratchReg), BeMCOperand::FromVReg(volatileVRegSave), ++instIdx);
  9726. instEndIdx++;
  9727. }
  9728. }
  9729. }
  9730. }
  9731. }
  9732. }
  9733. break;
  9734. }
  9735. }
  9736. }
  9737. }
  9738. break;
  9739. case BeMCInstKind_RestoreVolatiles:
  9740. {
  9741. bool doRestore = true;
  9742. if ((inst->mArg0.mKind == BeMCOperandKind_PreserveFlag) && ((inst->mArg0.mPreserveFlag & BeMCPreserveFlag_NoRestore) != 0))
  9743. {
  9744. // Don't bother restore registers for NoReturns
  9745. doRestore = false;
  9746. }
  9747. if (doRestore)
  9748. {
  9749. for (auto vregIdx : savedVolatileVRegs)
  9750. {
  9751. auto vregInfo = mVRegInfo[vregIdx];
  9752. AllocInst(BeMCInstKind_Mov, GetVReg(vregIdx), BeMCOperand::FromVReg(vregInfo->mVolatileVRegSave), instIdx++);
  9753. }
  9754. }
  9755. savedVolatileVRegs.clear();
  9756. }
  9757. break;
  9758. }
  9759. }
  9760. }
  9761. SetCurrentInst(NULL);
  9762. // Do this at the end so we can properly handle RangeStarts
  9763. for (int vregIdx = 0; vregIdx < (int)mVRegInfo.size(); vregIdx++)
  9764. {
  9765. auto vregInfo = mVRegInfo[vregIdx];
  9766. if (vregInfo->mRelTo)
  9767. {
  9768. FixOperand(vregInfo->mRelTo);
  9769. FixOperand(vregInfo->mRelOffset);
  9770. }
  9771. }
  9772. }
  9773. BeMCInstForm BeMCContext::GetInstForm(BeMCInst* inst)
  9774. {
  9775. if (!inst->mArg0)
  9776. return BeMCInstForm_Unknown;
  9777. if (!inst->mArg1)
  9778. {
  9779. if (inst->mArg0.mKind == BeMCOperandKind_Symbol)
  9780. return BeMCInstForm_Symbol;
  9781. if (inst->mArg0.mKind == BeMCOperandKind_SymbolAddr)
  9782. return BeMCInstForm_SymbolAddr;
  9783. auto arg0Type = GetType(inst->mArg0);
  9784. if (arg0Type == NULL)
  9785. return BeMCInstForm_Unknown;
  9786. if (inst->mArg0.IsImmediate())
  9787. {
  9788. if ((inst->mArg0.mImmediate >= -0x80000000LL) && (inst->mArg0.mImmediate <= 0x7FFFFFFF))
  9789. return BeMCInstForm_IMM32;
  9790. }
  9791. if (inst->mArg0.mKind == BeMCOperandKind_NativeReg)
  9792. {
  9793. if (arg0Type->mSize == 4)
  9794. return BeMCInstForm_R32;
  9795. if (arg0Type->mSize == 2)
  9796. return BeMCInstForm_R16;
  9797. if (arg0Type->mSize == 1)
  9798. return BeMCInstForm_R8;
  9799. return BeMCInstForm_R64;
  9800. }
  9801. if (arg0Type->mSize == 4)
  9802. return BeMCInstForm_RM32;
  9803. if (arg0Type->mSize == 2)
  9804. return BeMCInstForm_RM16;
  9805. if (arg0Type->mSize == 1)
  9806. return BeMCInstForm_RM8;
  9807. return BeMCInstForm_RM64;
  9808. }
  9809. auto arg0Type = GetType(inst->mArg0);
  9810. auto arg1Type = GetType(inst->mArg1);
  9811. if ((arg0Type != NULL) && (arg1Type != NULL) &&
  9812. ((arg0Type->IsFloat()) || (arg1Type->IsFloat())))
  9813. {
  9814. if (inst->mArg0.IsNativeReg())
  9815. {
  9816. if (arg0Type->mTypeCode == BeTypeCode_Double)
  9817. {
  9818. /*if (inst->mArg1.IsNativeReg())
  9819. {
  9820. if (arg1Type->mTypeCode == BeTypeCode_Double)
  9821. return BeMCInstForm_XMM64_XMM64;
  9822. else if (arg1Type->mTypeCode == BeTypeCode_Float)
  9823. return BeMCInstForm_XMM64_XMM32;
  9824. }*/
  9825. if (inst->mArg1.IsImmediate())
  9826. return BeMCInstForm_XMM64_IMM;
  9827. /*if (inst->mArg1.IsSymbol())
  9828. return BeMCInstForm_XMM64_FRM64;*/
  9829. switch (arg1Type->mTypeCode)
  9830. {
  9831. case BeTypeCode_Float: return BeMCInstForm_XMM64_FRM32;
  9832. case BeTypeCode_Double: return BeMCInstForm_XMM64_FRM64;
  9833. case BeTypeCode_Int32: return BeMCInstForm_XMM64_RM32;
  9834. case BeTypeCode_Int64: return BeMCInstForm_XMM64_RM64;
  9835. default: NotImpl();
  9836. }
  9837. }
  9838. else if (arg0Type->mTypeCode == BeTypeCode_Float)
  9839. {
  9840. /*if (inst->mArg1.IsNativeReg())
  9841. {
  9842. if (arg1Type->mTypeCode == BeTypeCode_Double)
  9843. return BeMCInstForm_XMM32_XMM64;
  9844. else if (arg1Type->mTypeCode == BeTypeCode_Float)
  9845. return BeMCInstForm_XMM32_XMM32;
  9846. }*/
  9847. if (inst->mArg1.IsImmediate())
  9848. return BeMCInstForm_XMM32_IMM;
  9849. /*if (inst->mArg1.IsSymbol())
  9850. return BeMCInstForm_XMM32_FRM32;*/
  9851. switch (arg1Type->mTypeCode)
  9852. {
  9853. case BeTypeCode_Float: return BeMCInstForm_XMM32_FRM32;
  9854. case BeTypeCode_Double: return BeMCInstForm_XMM32_FRM64;
  9855. case BeTypeCode_Int32: return BeMCInstForm_XMM32_RM32;
  9856. case BeTypeCode_Int64: return BeMCInstForm_XMM32_RM64;
  9857. default: NotImpl();
  9858. }
  9859. }
  9860. else if (arg1Type->mTypeCode == BeTypeCode_Double)
  9861. {
  9862. if (arg0Type->mSize == 4)
  9863. return BeMCInstForm_R32_F64;
  9864. else
  9865. return BeMCInstForm_R64_F64;
  9866. }
  9867. else if (arg1Type->mTypeCode == BeTypeCode_Float)
  9868. {
  9869. if (arg0Type->mSize == 4)
  9870. return BeMCInstForm_R32_F32;
  9871. else
  9872. return BeMCInstForm_R64_F32;
  9873. }
  9874. }
  9875. else
  9876. {
  9877. if (inst->mArg1.IsImmediate())
  9878. return BeMCInstForm_Unknown;
  9879. if (arg0Type->mTypeCode == BeTypeCode_Double)
  9880. {
  9881. //TODO: This used to INCORRECTLY say 'switch (arg0Type->mTypeCode)'
  9882. switch (arg1Type->mTypeCode)
  9883. {
  9884. case BeTypeCode_Float: return BeMCInstForm_FRM32_XMM64;
  9885. case BeTypeCode_Double: return BeMCInstForm_FRM64_XMM64;
  9886. default: NotImpl();
  9887. }
  9888. }
  9889. else if (arg0Type->mTypeCode == BeTypeCode_Float)
  9890. {
  9891. //TODO: This used to INCORRECTLY say 'switch (arg0Type->mTypeCode)'
  9892. switch (arg1Type->mTypeCode)
  9893. {
  9894. case BeTypeCode_Float: return BeMCInstForm_FRM32_XMM32;
  9895. case BeTypeCode_Double: return BeMCInstForm_FRM64_XMM32;
  9896. default: NotImpl();
  9897. }
  9898. }
  9899. else
  9900. NotImpl();
  9901. }
  9902. }
  9903. if ((inst->mArg1.IsImmediate()) && (arg0Type != NULL)) // MOV r/m64, imm32
  9904. {
  9905. int64 maxSize = 8;
  9906. if ((arg0Type->IsInt()) && (inst->mArg1.IsImmediateInt()))
  9907. maxSize = arg0Type->mSize;
  9908. if ((inst->mArg1.mKind == BeMCOperandKind_Immediate_Null) || (maxSize <= 1) ||
  9909. ((inst->mArg1.mImmediate >= -0x80) && (inst->mArg1.mImmediate <= 0x7F)))
  9910. {
  9911. switch (arg0Type->mSize)
  9912. {
  9913. case 8: return BeMCInstForm_RM64_IMM8;
  9914. case 4: return BeMCInstForm_RM32_IMM8;
  9915. case 2: return BeMCInstForm_RM16_IMM8;
  9916. case 1: return BeMCInstForm_RM8_IMM8;
  9917. }
  9918. }
  9919. else if ((maxSize <= 2) ||
  9920. ((inst->mArg1.mImmediate >= -0x8000) && (inst->mArg1.mImmediate <= 0x7FFF)))
  9921. {
  9922. switch (arg0Type->mSize)
  9923. {
  9924. case 8: return BeMCInstForm_RM64_IMM16;
  9925. case 4: return BeMCInstForm_RM32_IMM16;
  9926. case 2: return BeMCInstForm_RM16_IMM16;
  9927. case 1: return BeMCInstForm_RM8_IMM8;
  9928. }
  9929. }
  9930. else if ((maxSize <= 4) ||
  9931. ((inst->mArg1.mImmediate >= -0x80000000LL) && (inst->mArg1.mImmediate <= 0x7FFFFFFF)))
  9932. {
  9933. switch (arg0Type->mSize)
  9934. {
  9935. case 8: return BeMCInstForm_RM64_IMM32;
  9936. case 4: return BeMCInstForm_RM32_IMM32;
  9937. case 2: return BeMCInstForm_RM16_IMM16;
  9938. case 1: return BeMCInstForm_RM8_IMM8;
  9939. }
  9940. }
  9941. else
  9942. return BeMCInstForm_RM64_IMM64;
  9943. }
  9944. if ((arg0Type == NULL) || (arg1Type == NULL) || (arg0Type->mSize != arg1Type->mSize))
  9945. return BeMCInstForm_Unknown;
  9946. if (inst->mArg0.mKind == BeMCOperandKind_NativeReg)
  9947. {
  9948. switch (GetType(inst->mArg0)->mSize)
  9949. {
  9950. case 8: return BeMCInstForm_R64_RM64;
  9951. case 4: return BeMCInstForm_R32_RM32;
  9952. case 2: return BeMCInstForm_R16_RM16;
  9953. case 1: return BeMCInstForm_R8_RM8;
  9954. }
  9955. }
  9956. if (inst->mArg1.mKind == BeMCOperandKind_NativeReg)
  9957. {
  9958. switch (GetType(inst->mArg1)->mSize)
  9959. {
  9960. case 8: return BeMCInstForm_RM64_R64;
  9961. case 4: return BeMCInstForm_RM32_R32;
  9962. case 2: return BeMCInstForm_RM16_R16;
  9963. case 1: return BeMCInstForm_RM8_R8;
  9964. }
  9965. }
  9966. return BeMCInstForm_Unknown;
  9967. }
  9968. BeMCInstForm BeMCContext::ToIMM16(BeMCInstForm instForm)
  9969. {
  9970. switch (instForm)
  9971. {
  9972. case BeMCInstForm_RM16_IMM8: return BeMCInstForm_RM32_IMM16;
  9973. case BeMCInstForm_RM32_IMM8: return BeMCInstForm_RM32_IMM16;
  9974. case BeMCInstForm_RM64_IMM8: return BeMCInstForm_RM64_IMM16;
  9975. case BeMCInstForm_RM16_IMM16: return BeMCInstForm_RM32_IMM16;
  9976. case BeMCInstForm_RM32_IMM16: return BeMCInstForm_RM32_IMM16;
  9977. case BeMCInstForm_RM64_IMM16: return BeMCInstForm_RM64_IMM16;
  9978. }
  9979. NotImpl();
  9980. return instForm;
  9981. }
  9982. BeMCInstForm BeMCContext::ToIMM32OrSmaller(BeMCInstForm instForm)
  9983. {
  9984. switch (instForm)
  9985. {
  9986. case BeMCInstForm_RM8_IMM8: return BeMCInstForm_RM8_IMM8;
  9987. case BeMCInstForm_RM16_IMM8: return BeMCInstForm_RM16_IMM16;
  9988. case BeMCInstForm_RM32_IMM8: return BeMCInstForm_RM32_IMM32;
  9989. case BeMCInstForm_RM64_IMM8: return BeMCInstForm_RM64_IMM32;
  9990. case BeMCInstForm_RM16_IMM16: return BeMCInstForm_RM16_IMM16;
  9991. case BeMCInstForm_RM32_IMM16: return BeMCInstForm_RM32_IMM32;
  9992. case BeMCInstForm_RM64_IMM16: return BeMCInstForm_RM64_IMM32;
  9993. case BeMCInstForm_RM32_IMM32: return BeMCInstForm_RM32_IMM32;
  9994. case BeMCInstForm_RM64_IMM32: return BeMCInstForm_RM64_IMM32;
  9995. }
  9996. NotImpl();
  9997. return instForm;
  9998. }
  9999. void BeMCContext::SetCurrentInst(BeMCInst* inst)
  10000. {
  10001. if (inst == NULL)
  10002. {
  10003. mCurDbgLoc = NULL;
  10004. mCurVRegsInit = NULL;
  10005. mCurVRegsLive = NULL;
  10006. }
  10007. else
  10008. {
  10009. mCurDbgLoc = inst->mDbgLoc;
  10010. mCurVRegsInit = inst->mVRegsInitialized;
  10011. mCurVRegsLive = inst->mLiveness;
  10012. }
  10013. }
  10014. int BeMCContext::FindPreserveVolatiles(BeMCBlock* mcBlock, int instIdx)
  10015. {
  10016. for (int checkIdx = instIdx - 1; checkIdx >= 0; checkIdx--)
  10017. {
  10018. BeMCInst* checkInst = mcBlock->mInstructions[checkIdx];
  10019. if (checkInst->mKind == BeMCInstKind_PreserveVolatiles)
  10020. return checkIdx;
  10021. }
  10022. return -1;
  10023. }
  10024. int BeMCContext::FindRestoreVolatiles(BeMCBlock* mcBlock, int instIdx)
  10025. {
  10026. for (int checkIdx = instIdx + 1; checkIdx < (int)mcBlock->mInstructions.size(); checkIdx++)
  10027. {
  10028. BeMCInst* checkInst = mcBlock->mInstructions[checkIdx];
  10029. if (checkInst->mKind == BeMCInstKind_RestoreVolatiles)
  10030. return checkIdx;
  10031. }
  10032. return mcBlock->mInstructions.size() - 1; // Ret
  10033. }
  10034. void BeMCContext::EmitInstPrefix(BeMCInstForm instForm, BeMCInst* inst)
  10035. {
  10036. switch (instForm)
  10037. {
  10038. case BeMCInstForm_R16_RM16:
  10039. case BeMCInstForm_R16_RM64_ADDR:
  10040. case BeMCInstForm_RM16_R16:
  10041. case BeMCInstForm_RM16_IMM8:
  10042. case BeMCInstForm_RM16_IMM16:
  10043. case BeMCInstForm_RM64_R16_ADDR:
  10044. case BeMCInstForm_RM16:
  10045. case BeMCInstForm_R16:
  10046. Emit(0x66);
  10047. }
  10048. switch (instForm)
  10049. {
  10050. case BeMCInstForm_R64_RM64:
  10051. EmitREX(inst->mArg0, inst->mArg1, true);
  10052. break;
  10053. case BeMCInstForm_R8_RM8:
  10054. case BeMCInstForm_R16_RM16:
  10055. case BeMCInstForm_R32_RM32:
  10056. case BeMCInstForm_R8_RM64_ADDR:
  10057. case BeMCInstForm_R16_RM64_ADDR:
  10058. case BeMCInstForm_R32_RM64_ADDR:
  10059. EmitREX(inst->mArg0, inst->mArg1, false);
  10060. break;
  10061. case BeMCInstForm_R64_RM64_ADDR:
  10062. EmitREX(inst->mArg0, inst->mArg1, true);
  10063. break;
  10064. case BeMCInstForm_RM8_R8:
  10065. case BeMCInstForm_RM16_R16:
  10066. case BeMCInstForm_RM32_R32:
  10067. case BeMCInstForm_RM64_R8_ADDR:
  10068. case BeMCInstForm_RM64_R16_ADDR:
  10069. case BeMCInstForm_RM64_R32_ADDR:
  10070. EmitREX(inst->mArg1, inst->mArg0, false);
  10071. break;
  10072. case BeMCInstForm_RM64_R64:
  10073. case BeMCInstForm_RM64_R64_ADDR:
  10074. EmitREX(inst->mArg1, inst->mArg0, true);
  10075. break;
  10076. case BeMCInstForm_RM8_IMM8:
  10077. case BeMCInstForm_RM16_IMM8:
  10078. case BeMCInstForm_RM16_IMM16:
  10079. case BeMCInstForm_RM32_IMM8:
  10080. case BeMCInstForm_RM32_IMM16:
  10081. case BeMCInstForm_RM32_IMM32:
  10082. EmitREX(inst->mArg1, inst->mArg0, false);
  10083. break;
  10084. case BeMCInstForm_RM64_IMM8:
  10085. case BeMCInstForm_RM64_IMM16:
  10086. case BeMCInstForm_RM64_IMM32:
  10087. case BeMCInstForm_RM64_IMM64:
  10088. EmitREX(inst->mArg1, inst->mArg0, true);
  10089. break;
  10090. }
  10091. }
  10092. void BeMCContext::EmitInst(BeMCInstForm instForm, uint16 codeBytes, BeMCInst* inst)
  10093. {
  10094. EmitInstPrefix(instForm, inst);
  10095. if (codeBytes <= 0xFF)
  10096. mOut.Write((uint8)codeBytes);
  10097. else
  10098. mOut.Write((int16)codeBytes);
  10099. switch (instForm)
  10100. {
  10101. case BeMCInstForm_R8_RM8:
  10102. case BeMCInstForm_R16_RM16:
  10103. case BeMCInstForm_R32_RM32:
  10104. case BeMCInstForm_R64_RM64:
  10105. EmitModRM(inst->mArg0, inst->mArg1);
  10106. break;
  10107. case BeMCInstForm_R8_RM64_ADDR:
  10108. case BeMCInstForm_R16_RM64_ADDR:
  10109. case BeMCInstForm_R32_RM64_ADDR:
  10110. case BeMCInstForm_R64_RM64_ADDR:
  10111. EmitModRM_Addr(inst->mArg0, inst->mArg1);
  10112. break;
  10113. case BeMCInstForm_RM8_R8:
  10114. case BeMCInstForm_RM16_R16:
  10115. case BeMCInstForm_RM32_R32:
  10116. case BeMCInstForm_RM64_R64:
  10117. EmitModRM(inst->mArg1, inst->mArg0);
  10118. break;
  10119. case BeMCInstForm_RM64_R8_ADDR:
  10120. case BeMCInstForm_RM64_R16_ADDR:
  10121. case BeMCInstForm_RM64_R32_ADDR:
  10122. case BeMCInstForm_RM64_R64_ADDR:
  10123. EmitModRM_Addr(inst->mArg1, inst->mArg0);
  10124. break;
  10125. case BeMCInstForm_RM64_IMM32:
  10126. break;
  10127. default:
  10128. Fail("Notimpl EmitInst");
  10129. }
  10130. }
  10131. void BeMCContext::EmitInst(BeMCInstForm instForm, uint16 codeBytes, uint8 rx, BeMCInst* inst)
  10132. {
  10133. EmitInstPrefix(instForm, inst);
  10134. BF_ASSERT(codeBytes != 0);
  10135. if (codeBytes <= 0xFF)
  10136. mOut.Write((uint8)codeBytes);
  10137. else
  10138. mOut.Write((int16)codeBytes);
  10139. switch (instForm)
  10140. {
  10141. case BeMCInstForm_RM8_IMM8:
  10142. case BeMCInstForm_RM16_IMM8:
  10143. case BeMCInstForm_RM32_IMM8:
  10144. case BeMCInstForm_RM64_IMM8:
  10145. EmitModRM(rx, inst->mArg0, -1);
  10146. mOut.Write((int8)inst->mArg1.GetImmediateInt());
  10147. break;
  10148. case BeMCInstForm_RM16_IMM16:
  10149. case BeMCInstForm_RM32_IMM16:
  10150. case BeMCInstForm_RM64_IMM16:
  10151. EmitModRM(rx, inst->mArg0, -2);
  10152. mOut.Write((int16)inst->mArg1.GetImmediateInt());
  10153. break;
  10154. case BeMCInstForm_RM32_IMM32:
  10155. case BeMCInstForm_RM64_IMM32:
  10156. EmitModRM(rx, inst->mArg0, -4);
  10157. mOut.Write((int32)inst->mArg1.GetImmediateInt());
  10158. break;
  10159. case BeMCInstForm_RM64_IMM64:
  10160. EmitModRM(rx, inst->mArg0, -8);
  10161. mOut.Write((int64)inst->mArg1.GetImmediateInt());
  10162. break;
  10163. default:
  10164. Fail("Notimpl EmitInst");
  10165. }
  10166. }
  10167. void BeMCContext::EmitStdInst(BeMCInstForm instForm, BeMCInst* inst, uint8 opcode_rm_r, uint8 opcode_r_rm, uint8 opcode_rm_imm, uint8 opcode_rm_imm_rx)
  10168. {
  10169. switch (instForm)
  10170. {
  10171. case BeMCInstForm_R8_RM8: EmitInst(instForm, opcode_r_rm - 1, inst); break;
  10172. case BeMCInstForm_R16_RM16:
  10173. case BeMCInstForm_R32_RM32:
  10174. case BeMCInstForm_R64_RM64: EmitInst(instForm, opcode_r_rm, inst); break;
  10175. case BeMCInstForm_RM8_R8: EmitInst(instForm, opcode_rm_r - 1, inst); break;
  10176. case BeMCInstForm_RM16_R16:
  10177. case BeMCInstForm_RM32_R32:
  10178. case BeMCInstForm_RM64_R64: EmitInst(instForm, opcode_rm_r, inst); break;
  10179. // These immediate forms assume an expansion to imm32, OR the register size for 8 and 16 bit registers
  10180. case BeMCInstForm_RM8_IMM8: EmitInst(BeMCInstForm_RM8_IMM8, opcode_rm_imm - 1, opcode_rm_imm_rx, inst); break;
  10181. case BeMCInstForm_RM16_IMM8: EmitInst(BeMCInstForm_RM16_IMM16, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10182. case BeMCInstForm_RM32_IMM8: EmitInst(BeMCInstForm_RM32_IMM32, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10183. case BeMCInstForm_RM64_IMM8: EmitInst(BeMCInstForm_RM64_IMM32, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10184. case BeMCInstForm_RM32_IMM16: EmitInst(BeMCInstForm_RM32_IMM32, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10185. case BeMCInstForm_RM16_IMM16: EmitInst(BeMCInstForm_RM16_IMM16, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10186. case BeMCInstForm_RM64_IMM16: EmitInst(BeMCInstForm_RM64_IMM32, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10187. case BeMCInstForm_RM32_IMM32: EmitInst(BeMCInstForm_RM32_IMM32, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10188. case BeMCInstForm_RM64_IMM32: EmitInst(BeMCInstForm_RM64_IMM32, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10189. default:
  10190. Print();
  10191. NotImpl();
  10192. }
  10193. }
  10194. void BeMCContext::EmitStdInst(BeMCInstForm instForm, BeMCInst * inst, uint8 opcode_rm_r, uint8 opcode_r_rm, uint8 opcode_rm_imm, uint8 opcode_rm_imm_rx, uint8 opcode_rm_imm8, uint8 opcode_rm_imm8_rx)
  10195. {
  10196. switch (instForm)
  10197. {
  10198. case BeMCInstForm_R8_RM8: EmitInst(instForm, opcode_r_rm - 1, inst); break;
  10199. case BeMCInstForm_R16_RM16:
  10200. case BeMCInstForm_R32_RM32:
  10201. case BeMCInstForm_R64_RM64: EmitInst(instForm, opcode_r_rm, inst); break;
  10202. case BeMCInstForm_RM8_R8: EmitInst(instForm, opcode_rm_r - 1, inst); break;
  10203. case BeMCInstForm_RM16_R16:
  10204. case BeMCInstForm_RM32_R32:
  10205. case BeMCInstForm_RM64_R64: EmitInst(instForm, opcode_rm_r, inst); break;
  10206. case BeMCInstForm_RM8_IMM8: EmitInst(BeMCInstForm_RM8_IMM8, opcode_rm_imm - 1, opcode_rm_imm_rx, inst); break;
  10207. case BeMCInstForm_RM16_IMM8: EmitInst(BeMCInstForm_RM16_IMM8, opcode_rm_imm8, opcode_rm_imm8_rx, inst); break;
  10208. case BeMCInstForm_RM32_IMM8: EmitInst(BeMCInstForm_RM32_IMM8, opcode_rm_imm8, opcode_rm_imm8_rx, inst); break;
  10209. case BeMCInstForm_RM64_IMM8: EmitInst(BeMCInstForm_RM64_IMM8, opcode_rm_imm8, opcode_rm_imm8_rx, inst); break;
  10210. // These immediate forms assume an expansion to imm32, OR the register size for 8 and 16 bit registers
  10211. case BeMCInstForm_RM32_IMM16: EmitInst(BeMCInstForm_RM32_IMM32, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10212. case BeMCInstForm_RM16_IMM16: EmitInst(BeMCInstForm_RM16_IMM16, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10213. case BeMCInstForm_RM64_IMM16: EmitInst(BeMCInstForm_RM64_IMM32, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10214. case BeMCInstForm_RM32_IMM32: EmitInst(BeMCInstForm_RM32_IMM32, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10215. case BeMCInstForm_RM64_IMM32: EmitInst(BeMCInstForm_RM64_IMM32, opcode_rm_imm, opcode_rm_imm_rx, inst); break;
  10216. default:
  10217. NotImpl();
  10218. }
  10219. }
  10220. bool BeMCContext::EmitStdXMMInst(BeMCInstForm instForm, BeMCInst* inst, uint8 opcode)
  10221. {
  10222. bool is64Bit = false;
  10223. switch (instForm)
  10224. {
  10225. case BeMCInstForm_R64_F32:
  10226. case BeMCInstForm_XMM32_RM64:
  10227. is64Bit = true;
  10228. // Fallthrough
  10229. case BeMCInstForm_R32_F32:
  10230. case BeMCInstForm_XMM32_RM32:
  10231. case BeMCInstForm_XMM32_IMM:
  10232. case BeMCInstForm_XMM32_FRM32:
  10233. case BeMCInstForm_XMM64_FRM32: // CVTSS2SD
  10234. Emit(0xF3); EmitREX(inst->mArg0, inst->mArg1, is64Bit);
  10235. Emit(0x0F); Emit(opcode);
  10236. EmitModRM(inst->mArg0, inst->mArg1);
  10237. return true;
  10238. case BeMCInstForm_R64_F64:
  10239. case BeMCInstForm_XMM64_RM64:
  10240. is64Bit = true;
  10241. // Fallthrough
  10242. case BeMCInstForm_R32_F64:
  10243. case BeMCInstForm_XMM64_RM32:
  10244. case BeMCInstForm_XMM64_IMM:
  10245. case BeMCInstForm_XMM64_FRM64:
  10246. case BeMCInstForm_XMM32_FRM64: // CVTSD2SS
  10247. Emit(0xF2); EmitREX(inst->mArg0, inst->mArg1, is64Bit);
  10248. Emit(0x0F); Emit(opcode);
  10249. EmitModRM(inst->mArg0, inst->mArg1);
  10250. return true;
  10251. }
  10252. return false;
  10253. }
  10254. bool BeMCContext::EmitStdXMMInst(BeMCInstForm instForm, BeMCInst* inst, uint8 opcode, uint8 opcode_dest_frm)
  10255. {
  10256. bool is64Bit = false;
  10257. switch (instForm)
  10258. {
  10259. case BeMCInstForm_FRM32_XMM32:
  10260. Emit(0xF3); EmitREX(inst->mArg1, inst->mArg0, is64Bit);
  10261. Emit(0x0F); Emit(opcode_dest_frm);
  10262. EmitModRM(inst->mArg1, inst->mArg0);
  10263. return true;
  10264. case BeMCInstForm_FRM64_XMM64:
  10265. Emit(0xF2); EmitREX(inst->mArg1, inst->mArg0, is64Bit);
  10266. Emit(0x0F); Emit(opcode_dest_frm);
  10267. EmitModRM(inst->mArg1, inst->mArg0);
  10268. return true;
  10269. default:
  10270. return EmitStdXMMInst(instForm, inst, opcode);
  10271. }
  10272. return false;
  10273. }
  10274. bool BeMCContext::EmitPackedXMMInst(BeMCInstForm instForm, BeMCInst* inst, uint8 opcode)
  10275. {
  10276. bool is64Bit = false;
  10277. switch (instForm)
  10278. {
  10279. case BeMCInstForm_R64_F32:
  10280. case BeMCInstForm_XMM32_RM64:
  10281. is64Bit = true;
  10282. // Fallthrough
  10283. case BeMCInstForm_R32_F32:
  10284. case BeMCInstForm_XMM32_RM32:
  10285. case BeMCInstForm_XMM32_IMM:
  10286. case BeMCInstForm_XMM32_FRM32:
  10287. case BeMCInstForm_XMM64_FRM32: // CVTSS2SD
  10288. EmitREX(inst->mArg0, inst->mArg1, is64Bit);
  10289. Emit(0x0F); Emit(opcode);
  10290. EmitModRM(inst->mArg0, inst->mArg1);
  10291. return true;
  10292. case BeMCInstForm_R64_F64:
  10293. case BeMCInstForm_XMM64_RM64:
  10294. is64Bit = true;
  10295. // Fallthrough
  10296. case BeMCInstForm_R32_F64:
  10297. case BeMCInstForm_XMM64_RM32:
  10298. case BeMCInstForm_XMM64_IMM:
  10299. case BeMCInstForm_XMM64_FRM64:
  10300. case BeMCInstForm_XMM32_FRM64: // CVTSD2SS
  10301. EmitREX(inst->mArg0, inst->mArg1, is64Bit);
  10302. Emit(0x0F); Emit(opcode);
  10303. EmitModRM(inst->mArg0, inst->mArg1);
  10304. return true;
  10305. }
  10306. return false;
  10307. }
  10308. void BeMCContext::EmitAggMov(const BeMCOperand& dest, const BeMCOperand& src)
  10309. {
  10310. X64CPURegister regA = X64Reg_None;
  10311. X64CPURegister regB = X64Reg_None;
  10312. int bScale = 1;
  10313. int disp = 0;
  10314. auto form = GetRMParams(dest, regA, regB, bScale, disp);
  10315. BF_ASSERT(src.mKind == BeMCOperandKind_ConstAgg);
  10316. auto aggConstant = src.mConstant;
  10317. Array<uint8> dataVec;
  10318. aggConstant->GetData(dataVec);
  10319. int memSize = dataVec.size();
  10320. int curOfs = 0;
  10321. bool allowRep = dataVec.size() >= BF_REP_MOV_LIMIT;
  10322. if (mDebugging)
  10323. {
  10324. NOP;
  10325. }
  10326. union IntUnion
  10327. {
  10328. int64 mInt64;
  10329. int32 mInt32;
  10330. int16 mInt16;
  10331. int8 mInt8;
  10332. };
  10333. bool isValRegSet = false;
  10334. int64 curVal = 0;
  10335. auto _EmitMovR11 = [&](int64 val)
  10336. {
  10337. int64 prevVal = curVal;
  10338. bool wasValRegSet = isValRegSet;
  10339. isValRegSet = true;
  10340. curVal = val;
  10341. if ((wasValRegSet) && (val == prevVal))
  10342. return;
  10343. if (val == 0)
  10344. {
  10345. // xor r11, r11
  10346. Emit(0x4D); Emit(0x31); Emit(0xDB);
  10347. return;
  10348. }
  10349. if (wasValRegSet)
  10350. {
  10351. if ((val & ~0xFF) == (prevVal & ~0xFF))
  10352. {
  10353. // mov r11b, val8
  10354. Emit(0x41); Emit(0xB3);
  10355. Emit((int8)val);
  10356. return;
  10357. }
  10358. if ((val & ~0xFFFF) == (prevVal & ~0xFFFF))
  10359. {
  10360. // mov r11w, val16
  10361. Emit(0x66); Emit(0x41); Emit(0xBB);
  10362. mOut.Write((int16)val);
  10363. return;
  10364. }
  10365. }
  10366. if ((val >= 0) && (val <= 0x7FFFFFFF))
  10367. {
  10368. // mov r11d, val32
  10369. Emit(0x41); Emit(0xBB);
  10370. mOut.Write((int32)val);
  10371. }
  10372. else if ((val >= -0x80000000LL) && (val <= 0x7FFFFFFF))
  10373. {
  10374. // mov r11, val32 (sign extended)
  10375. Emit(0x49); Emit(0xC7); Emit(0xC3);
  10376. mOut.Write((int32)val);
  10377. }
  10378. else
  10379. {
  10380. // movabs r11, val32
  10381. Emit(0x49); Emit(0xBB);
  10382. mOut.Write((int64)val);
  10383. }
  10384. };
  10385. for (; curOfs <= memSize - 8; )
  10386. {
  10387. if (allowRep)
  10388. {
  10389. uint8 val = dataVec[curOfs];
  10390. int repSize = 0;
  10391. int checkOfs = curOfs;
  10392. while (checkOfs < (int)dataVec.size())
  10393. {
  10394. if (dataVec[checkOfs] != val)
  10395. break;
  10396. checkOfs++;
  10397. repSize++;
  10398. }
  10399. if (repSize >= 16)
  10400. {
  10401. bool regSaved = false;
  10402. if ((regA == X64Reg_RAX) ||
  10403. (regA == X64Reg_RCX) ||
  10404. (regA == X64Reg_RDI))
  10405. {
  10406. BF_ASSERT(regB == X64Reg_None);
  10407. // mov R11, regA
  10408. Emit(0x49); Emit(0x89);
  10409. EmitModRM(BeMCOperand::FromReg(regA), BeMCOperand::FromReg(X64Reg_R11));
  10410. regSaved = true;
  10411. }
  10412. // lea rdi, <dest+curOfs>
  10413. EmitREX(BeMCOperand::FromReg(X64Reg_RDI), dest, true);
  10414. Emit(0x8D);
  10415. EmitModRMRel(EncodeRegNum(X64Reg_RDI), regA, regB, 1, disp + curOfs);
  10416. // mov al, <val>
  10417. Emit(0xB0); Emit(val);
  10418. // mov edx, <repSize>
  10419. Emit(0xB9);
  10420. mOut.Write((int32)repSize);
  10421. // rep stosb
  10422. Emit(0xF3); Emit(0xAA);
  10423. if (regSaved)
  10424. {
  10425. // mov regA, R11
  10426. Emit(0x4C); Emit(0x89);
  10427. EmitModRM(BeMCOperand::FromReg(X64Reg_R11), BeMCOperand::FromReg(regA));
  10428. }
  10429. curOfs += repSize;
  10430. continue;
  10431. }
  10432. }
  10433. int64 newValReg = *((int64*)&dataVec[curOfs]);
  10434. _EmitMovR11(newValReg);
  10435. // mov <dest+curOfs>, R11
  10436. EmitREX(BeMCOperand::FromReg(X64Reg_R11), dest, true);
  10437. Emit(0x89);
  10438. EmitModRMRel(EncodeRegNum(X64Reg_R11), regA, regB, 1, disp + curOfs);
  10439. curOfs += 8;
  10440. }
  10441. for (; curOfs <= memSize - 4; curOfs += 4)
  10442. {
  10443. int64 newValReg = curVal;
  10444. *((int32*)&newValReg) = *((int32*)&dataVec[curOfs]);
  10445. _EmitMovR11(newValReg);
  10446. // mov <dest+curOfs>, R11d
  10447. EmitREX(BeMCOperand::FromReg(X64Reg_R11D), dest, false);
  10448. Emit(0x89);
  10449. EmitModRMRel(EncodeRegNum(X64Reg_R11D), regA, regB, 1, disp + curOfs);
  10450. }
  10451. for (; curOfs <= memSize - 2; curOfs += 2)
  10452. {
  10453. int64 newValReg = curVal;
  10454. *((int16*)&newValReg) = *((int16*)&dataVec[curOfs]);
  10455. _EmitMovR11(newValReg);
  10456. // mov <dest+curOfs>, R11w
  10457. Emit(0x66); EmitREX(BeMCOperand::FromReg(X64Reg_R11W), dest, false);
  10458. Emit(0x89);
  10459. EmitModRMRel(EncodeRegNum(X64Reg_R11W), regA, regB, 1, disp + curOfs);
  10460. }
  10461. for (; curOfs <= memSize - 1; curOfs += 1)
  10462. {
  10463. int64 newValReg = curVal;
  10464. *((int8*)&newValReg) = *((int8*)&dataVec[curOfs]);
  10465. _EmitMovR11(newValReg);
  10466. // mov <dest+curOfs>, R11b
  10467. EmitREX(BeMCOperand::FromReg(X64Reg_R11B), dest, false);
  10468. Emit(0x89 - 1);
  10469. EmitModRMRel(EncodeRegNum(X64Reg_R11B), regA, regB, 1, disp + curOfs);
  10470. }
  10471. }
  10472. void BeMCContext::DoCodeEmission()
  10473. {
  10474. BP_ZONE("BeMCContext::DoCodeEmission");
  10475. struct BeMCJump
  10476. {
  10477. public:
  10478. int mCodeOffset;
  10479. int mLabelIdx;
  10480. int mJumpKind; // 0 = rel8, 1 = rel16 (not valid in x64), 2 = rel32
  10481. BeCmpKind mCmpKind;
  10482. public:
  10483. BeMCJump()
  10484. {
  10485. mCmpKind = BeCmpKind_None;
  10486. mCodeOffset = -1;
  10487. mLabelIdx = -1;
  10488. mJumpKind = -1;
  10489. }
  10490. };
  10491. SizedArray<int, 64> labelPositions;
  10492. labelPositions.resize(mCurLabelIdx);
  10493. for (int labelIdx = 0; labelIdx < mCurLabelIdx; labelIdx++)
  10494. labelPositions[labelIdx] = -1;
  10495. SizedArray<BeMCJump, 64> deferredJumps;
  10496. auto& xdata = mCOFFObject->mXDataSect.mData;
  10497. int xdataStartPos = xdata.GetPos();
  10498. int textSectStartPos = mOut.GetPos();
  10499. int lastLabelIdx = -1;
  10500. bool hasPData = mStackSize != 0;
  10501. if (hasPData)
  10502. {
  10503. // xdata must be DWORD aligned
  10504. while ((xdataStartPos & 3) != 0)
  10505. {
  10506. xdata.Write((uint8)0);
  10507. xdataStartPos++;
  10508. }
  10509. // pdata starting loc
  10510. BeMCRelocation reloc;
  10511. reloc.mKind = BeMCRelocationKind_ADDR32NB;
  10512. reloc.mOffset = mCOFFObject->mPDataSect.mData.GetPos();
  10513. reloc.mSymTableIdx = mCOFFObject->GetSymbol(mBeFunction)->mIdx;
  10514. mCOFFObject->mPDataSect.mRelocs.push_back(reloc);
  10515. mCOFFObject->mPDataSect.mData.Write((int32)0);
  10516. xdata.Write((uint8)1); // version
  10517. xdata.Write((uint8)0); // prolog size (placeholder)
  10518. xdata.Write((uint8)0); // num unwind codes (placeholder)
  10519. if (mUseBP)
  10520. {
  10521. int frameReg = 5;
  10522. int offset = 0; // scaled by 16
  10523. xdata.Write((uint8)(frameReg + (offset<<4))); // frame register
  10524. }
  10525. else
  10526. xdata.Write((uint8)0); // frame register
  10527. }
  10528. struct BeMCDeferredUnwind
  10529. {
  10530. BeMCInst* mUnwindInst;
  10531. int mCodePos;
  10532. };
  10533. struct BeDbgInstPos
  10534. {
  10535. int mPos;
  10536. int mOrigPos;
  10537. BeMCInst* mInst;
  10538. };
  10539. SizedArray<BeDbgInstPos, 64> dbgInstPositions;
  10540. String dbgStr;
  10541. if (mDebugging)
  10542. {
  10543. dbgStr += "DoCodeEmission:\n";
  10544. }
  10545. SizedArray<BeMCDeferredUnwind, 64> deferredUnwinds;
  10546. mCurDbgLoc = NULL;
  10547. bool needsInstructionAtDbgLoc = false;
  10548. bool dbgExtendLifetime = false;
  10549. int hotJumpLen = 5;
  10550. int funcCodePos = 0;
  10551. BeVTrackingList* vregsLive = mLivenessContext.AllocEmptyList();
  10552. BeVTrackingList* vregsInitialized = mVRegInitializedContext.AllocEmptyList();
  10553. for (auto mcBlock : mBlocks)
  10554. {
  10555. for (auto inst : mcBlock->mInstructions)
  10556. {
  10557. if (mDebugging)
  10558. {
  10559. ToString(inst, dbgStr, true, true);
  10560. }
  10561. auto checkInst = inst;
  10562. int newFuncCodePos = mOut.GetPos() - textSectStartPos;
  10563. if (newFuncCodePos != funcCodePos)
  10564. {
  10565. funcCodePos = newFuncCodePos;
  10566. if (dbgExtendLifetime)
  10567. {
  10568. dbgExtendLifetime = false;
  10569. if (mDebugging)
  10570. {
  10571. //
  10572. }
  10573. }
  10574. }
  10575. if ((inst->mKind == BeMCInstKind_LifetimeEnd) || (inst->mKind == BeMCInstKind_LifetimeExtend))
  10576. {
  10577. if (needsInstructionAtDbgLoc)
  10578. {
  10579. // This 'dbgExtendLifetime' is useful in cases like
  10580. // repeat { int a = 123; } while (false);
  10581. // Otherwise 'a' wouldn't be viewable
  10582. dbgExtendLifetime = true;
  10583. }
  10584. }
  10585. switch (inst->mKind)
  10586. {
  10587. case BeMCInstKind_Label:
  10588. //Why did we set this FALSE here? Just because we have a label doesn't mean we've emitted any actual instructions....
  10589. // Leaving this out broke a test where we couldn't view a 'this' at the end of a particular method
  10590. //dbgExtendLifetime = false;
  10591. break;
  10592. }
  10593. if ((inst->mDbgLoc != NULL) && (mDbgFunction != NULL))
  10594. {
  10595. if (inst->mDbgLoc != mCurDbgLoc)
  10596. {
  10597. bool allowEmission = true;
  10598. if (inst->mKind == BeMCInstKind_DbgDecl)
  10599. {
  10600. // We need to separate out dbgDecls if we are attempting to extend a previous one,
  10601. // otherwise wait for a real instruction
  10602. if (dbgExtendLifetime)
  10603. {
  10604. mOut.Write((uint8)0x90);
  10605. funcCodePos++;
  10606. needsInstructionAtDbgLoc = false;
  10607. dbgExtendLifetime = false;
  10608. }
  10609. else
  10610. allowEmission = false;
  10611. }
  10612. else
  10613. {
  10614. mCurDbgLoc = inst->mDbgLoc;
  10615. if ((!mDbgFunction->mEmissions.empty()) && (mDbgFunction->mEmissions.back().mPos == funcCodePos))
  10616. {
  10617. bool hadEmission = false;
  10618. if (needsInstructionAtDbgLoc)
  10619. {
  10620. // We only need an instruction on this LINE, not necessarily the same column or lexical scope
  10621. auto prevDbgLoc = mDbgFunction->mEmissions.back().mDbgLoc;
  10622. if ((prevDbgLoc->mLine != mCurDbgLoc->mLine) ||
  10623. (prevDbgLoc->GetDbgFile() != mCurDbgLoc->GetDbgFile()) ||
  10624. ((prevDbgLoc->mColumn != -1) != (mCurDbgLoc->mColumn != -1)))
  10625. {
  10626. // We didn't emit anything so we need to put a NOP in
  10627. mOut.Write((uint8)0x90);
  10628. funcCodePos++;
  10629. needsInstructionAtDbgLoc = false;
  10630. hadEmission = true;
  10631. dbgExtendLifetime = false;
  10632. }
  10633. }
  10634. if (!hadEmission)
  10635. {
  10636. // No code emitted, take back the last codeEmission
  10637. mDbgFunction->mEmissions.pop_back();
  10638. }
  10639. }
  10640. }
  10641. if (allowEmission)
  10642. {
  10643. BeDbgCodeEmission codeEmission;
  10644. codeEmission.mDbgLoc = mCurDbgLoc;
  10645. codeEmission.mPos = funcCodePos;
  10646. mDbgFunction->mEmissions.push_back(codeEmission);
  10647. }
  10648. }
  10649. }
  10650. BeMCJump jump;
  10651. auto instForm = GetInstForm(inst);
  10652. // Generate gaps
  10653. if ((inst->mVRegsInitialized != NULL) && (vregsInitialized != inst->mVRegsInitialized))
  10654. {
  10655. for (int changeIdx = 0; changeIdx < inst->mVRegsInitialized->mNumChanges; changeIdx++)
  10656. {
  10657. int vregInitializedIdx = inst->mVRegsInitialized->GetChange(changeIdx);
  10658. if (vregInitializedIdx >= 0) // Added
  10659. {
  10660. if (vregInitializedIdx >= mVRegInitializedContext.mNumItems)
  10661. continue;
  10662. auto dbgVar = mVRegInfo[vregInitializedIdx]->mDbgVariable;
  10663. if ((dbgVar != NULL) && (!dbgVar->mDbgLifeEnded))
  10664. {
  10665. // Wasn't initialized, now it is
  10666. if (!dbgVar->mGaps.empty())
  10667. {
  10668. auto& range = dbgVar->mGaps.back();
  10669. if (dbgVar->mDeclLifetimeExtend)
  10670. {
  10671. range.mOffset++;
  10672. dbgVar->mDeclEnd = range.mOffset;
  10673. dbgVar->mDeclLifetimeExtend = false;
  10674. if (mDebugging)
  10675. {
  10676. dbgStr += StrFormat("#### Dbg Applied LifetimeExtend %s\n", dbgVar->mName.c_str());
  10677. }
  10678. }
  10679. // We have to check for this because it's possible we get multiple adds
  10680. if (range.mLength == -1)
  10681. {
  10682. range.mLength = funcCodePos - range.mOffset;
  10683. if (range.mLength <= 0)
  10684. {
  10685. dbgVar->mGaps.pop_back();
  10686. }
  10687. }
  10688. if (mDebugging)
  10689. {
  10690. dbgStr += StrFormat("#### Dbg End Gap %s\n", dbgVar->mName.c_str());
  10691. }
  10692. }
  10693. }
  10694. }
  10695. else // Removed
  10696. {
  10697. vregInitializedIdx = -vregInitializedIdx - 1;
  10698. if (vregInitializedIdx >= mVRegInitializedContext.mNumItems)
  10699. continue;
  10700. auto dbgVar = mVRegInfo[vregInitializedIdx]->mDbgVariable;
  10701. if ((dbgVar != NULL) && (!dbgVar->mDbgLifeEnded))
  10702. {
  10703. bool inGap = false;
  10704. if (!dbgVar->mGaps.empty())
  10705. inGap = dbgVar->mGaps.back().mLength == -1;
  10706. if (!inGap)
  10707. {
  10708. if (mDebugging)
  10709. {
  10710. dbgStr += StrFormat("#### Dbg Start Gap %s\n", dbgVar->mName.c_str());
  10711. }
  10712. // Starting a new gap
  10713. BeDbgVariableRange range;
  10714. range.mOffset = funcCodePos;
  10715. range.mLength = -1;
  10716. dbgVar->mGaps.push_back(range);
  10717. }
  10718. }
  10719. }
  10720. }
  10721. vregsInitialized = inst->mVRegsInitialized;
  10722. }
  10723. // Finish range for variables exiting liveness. Since liveness is built in end-to-start order,
  10724. // an "add" means that the NEXT instruction won't have this entry (if the next entry doesn't share
  10725. // the exact liveness value)
  10726. if ((inst->mLiveness != NULL) && (inst->mLiveness != vregsLive))
  10727. {
  10728. for (int changeIdx = 0; changeIdx < vregsLive->mNumChanges; changeIdx++)
  10729. {
  10730. int vregLiveIdx = vregsLive->GetChange(changeIdx);
  10731. if (vregLiveIdx < 0)
  10732. continue;
  10733. // Check for both the 'exists' flag changing and the 'in scope' flag changing
  10734. int vregIdx = vregLiveIdx % mLivenessContext.mNumItems;
  10735. auto dbgVar = mVRegInfo[vregIdx]->mDbgVariable;
  10736. if ((dbgVar != NULL) && (!dbgVar->mDbgLifeEnded))
  10737. {
  10738. //if (!mLivenessContext.IsSet(inst->mLiveness, vregIdx))
  10739. {
  10740. if (!dbgVar->mGaps.empty())
  10741. {
  10742. auto& lastGap = dbgVar->mGaps.back();
  10743. if (lastGap.mLength == -1)
  10744. {
  10745. // Unused gap
  10746. //dbgVar->mGaps.pop_back();
  10747. // Don't remove this 'unused gap' because the variable may come back alive
  10748. // This can happen in blocks after NoReturn calls
  10749. }
  10750. }
  10751. if (dbgVar->mDeclStart != -1)
  10752. {
  10753. dbgVar->mDeclEnd = funcCodePos;
  10754. if (mDebugging)
  10755. {
  10756. dbgStr += StrFormat("#### Dbg Setting DeclEnd %s\n", dbgVar->mName.c_str());
  10757. }
  10758. }
  10759. if ((mDebugging) && (dbgExtendLifetime))
  10760. {
  10761. dbgStr += StrFormat("#### Dbg Setting LifetimeExtend %s\n", dbgVar->mName.c_str());
  10762. }
  10763. dbgVar->mDeclLifetimeExtend = dbgExtendLifetime;
  10764. //if (dbgExtendLifetime)
  10765. //dbgVar->mDeclEnd++;
  10766. }
  10767. }
  10768. }
  10769. vregsLive = inst->mLiveness;
  10770. }
  10771. if (mDebugging)
  10772. {
  10773. BeDbgInstPos dbgInstPos = { funcCodePos, funcCodePos, inst };
  10774. dbgInstPositions.push_back(dbgInstPos);
  10775. }
  10776. switch (inst->mKind)
  10777. {
  10778. case BeMCInstKind_DbgDecl:
  10779. {
  10780. auto vregInfo = GetVRegInfo(inst->mArg0);
  10781. auto dbgVar = vregInfo->mDbgVariable;
  10782. dbgVar->mDeclStart = funcCodePos;
  10783. while (vregInfo->IsDirectRelTo())
  10784. {
  10785. if (vregInfo->mRelTo.IsNativeReg())
  10786. {
  10787. break;
  10788. }
  10789. else
  10790. vregInfo = GetVRegInfo(vregInfo->mRelTo);
  10791. }
  10792. BeMCOperand defArg = inst->mArg0;
  10793. if ((vregInfo->mIsRetVal) && (mCompositeRetVRegIdx != -1) && (mCompositeRetVRegIdx != inst->mArg0.mVRegIdx))
  10794. {
  10795. defArg = BeMCOperand::FromVReg(mCompositeRetVRegIdx);
  10796. if ((inst->mArg0.mKind == BeMCOperandKind_VReg) && (vregInfo->mType->IsComposite()))
  10797. defArg.mKind = BeMCOperandKind_VRegLoad;
  10798. vregInfo = mVRegInfo[mCompositeRetVRegIdx];
  10799. }
  10800. if (vregInfo->mReg != X64Reg_None)
  10801. {
  10802. if ((defArg.mKind == BeMCOperandKind_VRegAddr) || (dbgVar->mIsValue))
  10803. dbgVar->mPrimaryLoc.mKind = BeDbgVariableLoc::Kind_Reg;
  10804. else
  10805. dbgVar->mPrimaryLoc.mKind = BeDbgVariableLoc::Kind_Indexed;
  10806. dbgVar->mPrimaryLoc.mReg = vregInfo->mReg;
  10807. dbgVar->mPrimaryLoc.mOfs = 0;
  10808. }
  10809. else if (vregInfo->mRelTo.IsNativeReg())
  10810. {
  10811. if ((defArg.mKind == BeMCOperandKind_VRegAddr) || (dbgVar->mIsValue))
  10812. dbgVar->mPrimaryLoc.mKind = BeDbgVariableLoc::Kind_Reg;
  10813. else
  10814. dbgVar->mPrimaryLoc.mKind = BeDbgVariableLoc::Kind_Indexed;
  10815. dbgVar->mPrimaryLoc.mReg = vregInfo->mRelTo.mReg;
  10816. if (vregInfo->mRelOffset.IsImmediateInt())
  10817. {
  10818. dbgVar->mPrimaryLoc.mOfs = vregInfo->mRelOffset.mImmediate;
  10819. }
  10820. else
  10821. BF_ASSERT(!vregInfo->mRelOffset);
  10822. }
  10823. else if (vregInfo->mRelTo.mKind == BeMCOperandKind_SymbolAddr)
  10824. {
  10825. Fail("Not supported SymbolAddr");
  10826. //dbgVar->mPrimaryLoc.mKind = BeDbgVariableLoc::Kind_SymbolAddr;
  10827. //dbgVar->mPrimaryLoc.mOfs = vregInfo->mRelTo.mSymbolIdx;
  10828. }
  10829. if ((dbgVar->mPrimaryLoc.mKind == BeDbgVariableLoc::Kind_None) && (vregInfo->mType->mSize != 0))
  10830. {
  10831. dbgVar->mPrimaryLoc.mKind = BeDbgVariableLoc::Kind_Indexed;
  10832. GetValAddr(BeMCOperand::FromVRegAddr(inst->mArg0.mVRegIdx), dbgVar->mPrimaryLoc.mReg, dbgVar->mPrimaryLoc.mOfs);
  10833. }
  10834. if (!mVRegInitializedContext.IsSet(vregsInitialized, inst->mArg0.mVRegIdx))
  10835. {
  10836. bool inGap = false;
  10837. if (!dbgVar->mGaps.empty())
  10838. inGap = dbgVar->mGaps.back().mLength == -1;
  10839. if (!inGap)
  10840. {
  10841. if (mDebugging)
  10842. {
  10843. dbgStr += StrFormat(" Dbg Starting Gap %s\n", dbgVar->mName.c_str());
  10844. }
  10845. BeDbgVariableRange range;
  10846. range.mOffset = funcCodePos;
  10847. range.mLength = -1;
  10848. dbgVar->mGaps.push_back(range);
  10849. }
  10850. }
  10851. if (vregInfo->mVolatileVRegSave != -1)
  10852. {
  10853. auto savedVRegInfo = mVRegInfo[vregInfo->mVolatileVRegSave];
  10854. dbgVar->mSavedLoc.mKind = BeDbgVariableLoc::Kind_Indexed;
  10855. GetValAddr(BeMCOperand::FromVRegAddr(vregInfo->mVolatileVRegSave), dbgVar->mSavedLoc.mReg, dbgVar->mSavedLoc.mOfs);
  10856. }
  10857. }
  10858. break;
  10859. case BeMCInstKind_DbgRangeStart:
  10860. {
  10861. }
  10862. break;
  10863. case BeMCInstKind_DbgRangeEnd:
  10864. {
  10865. auto vregInfo = GetVRegInfo(inst->mArg0);
  10866. if (vregInfo->mDbgVariable != NULL)
  10867. {
  10868. auto dbgVar = vregInfo->mDbgVariable;
  10869. dbgVar->mDeclEnd = funcCodePos;
  10870. dbgVar->mDeclLifetimeExtend = false;
  10871. BF_ASSERT((uint)dbgVar->mDeclEnd >= (uint)dbgVar->mDeclStart);
  10872. }
  10873. }
  10874. break;
  10875. case BeMCInstKind_LifetimeExtend:
  10876. break;
  10877. case BeMCInstKind_LifetimeStart:
  10878. break;
  10879. case BeMCInstKind_LifetimeEnd:
  10880. break;
  10881. case BeMCInstKind_ValueScopeSoftEnd:
  10882. break;
  10883. case BeMCInstKind_ValueScopeHardEnd:
  10884. break;
  10885. case BeMCInstKind_MemSet:
  10886. {
  10887. // This doesn't currently attempt to align properly
  10888. int memSize = inst->mArg0.mMemSetInfo.mSize;
  10889. uint8 memValue = inst->mArg0.mMemSetInfo.mValue;
  10890. int curOfs = 0;
  10891. X64CPURegister destReg = X64Reg_R10;
  10892. int destOfs = 0;
  10893. if (inst->mArg1.IsNativeReg())
  10894. {
  10895. destReg = inst->mArg1.mReg;
  10896. }
  10897. else if (inst->mArg1)
  10898. {
  10899. //BF_ASSERT(inst->mArg1.mKind == BeMCOperandKind_VReg);
  10900. GetValAddr(inst->mArg1, destReg, destOfs);
  10901. }
  10902. if (memValue == 0)
  10903. {
  10904. // xor r11, r11
  10905. Emit(0x4D); Emit(0x31); Emit(0xDB);
  10906. }
  10907. else
  10908. {
  10909. // mov r11, memValue*8
  10910. Emit(0x49); Emit(0xBB);
  10911. for (int i = 0; i < 8; i++)
  10912. Emit(memValue);
  10913. }
  10914. for (; curOfs <= memSize - 8; curOfs += 8)
  10915. {
  10916. EmitREX(BeMCOperand::FromReg(X64Reg_R11), BeMCOperand::FromReg(destReg), true);
  10917. Emit(0x89);
  10918. EmitModRMRel(EncodeRegNum(X64Reg_R11), destReg, X64Reg_None, 1, curOfs + destOfs);
  10919. }
  10920. // If there's more that one 'small' write required then we just do another 64-bit move
  10921. // which overlaps partially into the previous 64-bit move
  10922. if ((memSize > 8) && (curOfs < memSize) && (memSize - curOfs != 4) &&
  10923. (memSize - curOfs != 2) && (memSize - curOfs != 1))
  10924. {
  10925. EmitREX(BeMCOperand::FromReg(X64Reg_R11), BeMCOperand::FromReg(destReg), true);
  10926. Emit(0x89);
  10927. EmitModRMRel(EncodeRegNum(X64Reg_R11), destReg, X64Reg_None, 1, (memSize - 8) + destOfs);
  10928. curOfs = memSize;
  10929. }
  10930. for (; curOfs <= memSize - 4; curOfs += 4)
  10931. {
  10932. EmitREX(BeMCOperand::FromReg(X64Reg_R11D), BeMCOperand::FromReg(destReg), false);
  10933. Emit(0x89);
  10934. EmitModRMRel(EncodeRegNum(X64Reg_R11D), destReg, X64Reg_None, 1, curOfs + destOfs);
  10935. }
  10936. for (; curOfs <= memSize - 2; curOfs += 2)
  10937. {
  10938. Emit(0x66); EmitREX(BeMCOperand::FromReg(X64Reg_R11W), BeMCOperand::FromReg(destReg), false);
  10939. Emit(0x89);
  10940. EmitModRMRel(EncodeRegNum(X64Reg_R11W), destReg, X64Reg_None, 1, curOfs + destOfs);
  10941. }
  10942. for (; curOfs <= memSize - 1; curOfs += 1)
  10943. {
  10944. EmitREX(BeMCOperand::FromReg(X64Reg_R11B), BeMCOperand::FromReg(destReg), false); //-V530
  10945. Emit(0x89 - 1);
  10946. EmitModRMRel(EncodeRegNum(X64Reg_R11B), destReg, X64Reg_None, 1, curOfs + destOfs);
  10947. }
  10948. }
  10949. break;
  10950. case BeMCInstKind_MemCpy:
  10951. {
  10952. // This doesn't currently attempt to align properly
  10953. int memSize = inst->mArg0.mMemCpyInfo.mSize;
  10954. int curOfs = 0;
  10955. X64CPURegister destReg = X64Reg_R10;
  10956. X64CPURegister srcReg = X64Reg_R11;
  10957. int destOfs = 0;
  10958. int srcOfs = 0;
  10959. if (inst->mArg1)
  10960. {
  10961. BF_ASSERT(inst->mArg1.mKind == BeMCOperandKind_VRegPair);
  10962. GetValAddr(BeMCOperand::FromEncoded(inst->mArg1.mVRegPair.mVRegIdx0), destReg, destOfs);
  10963. GetValAddr(BeMCOperand::FromEncoded(inst->mArg1.mVRegPair.mVRegIdx1), srcReg, srcOfs);
  10964. }
  10965. if ((srcReg == destReg) && (srcOfs == destOfs))
  10966. break;
  10967. for ( ; curOfs <= memSize - 8 ; curOfs += 8)
  10968. {
  10969. EmitREX(BeMCOperand::FromReg(X64Reg_R11), BeMCOperand::FromReg(srcReg), true);
  10970. Emit(0x8B);
  10971. EmitModRMRel(EncodeRegNum(X64Reg_R11), srcReg, X64Reg_None, 1, curOfs + srcOfs);
  10972. EmitREX(BeMCOperand::FromReg(X64Reg_R11), BeMCOperand::FromReg(destReg), true);
  10973. Emit(0x89);
  10974. EmitModRMRel(EncodeRegNum(X64Reg_R11), destReg, X64Reg_None, 1, curOfs + destOfs);
  10975. }
  10976. // If there's more that one 'small' write required then we just do another 64-bit move
  10977. // which overlaps partially into the previous 64-bit move
  10978. if ((memSize > 8) && (curOfs < memSize) && (memSize - curOfs != 4) &&
  10979. (memSize - curOfs != 2) && (memSize - curOfs != 1))
  10980. {
  10981. EmitREX(BeMCOperand::FromReg(X64Reg_R11), BeMCOperand::FromReg(srcReg), true);
  10982. Emit(0x8B);
  10983. EmitModRMRel(EncodeRegNum(X64Reg_R11), srcReg, X64Reg_None, 1, (memSize - 8) + srcOfs);
  10984. EmitREX(BeMCOperand::FromReg(X64Reg_R11), BeMCOperand::FromReg(destReg), true);
  10985. Emit(0x89);
  10986. EmitModRMRel(EncodeRegNum(X64Reg_R11), destReg, X64Reg_None, 1, (memSize - 8) + destOfs);
  10987. curOfs = memSize;
  10988. }
  10989. for ( ; curOfs <= memSize - 4; curOfs += 4)
  10990. {
  10991. EmitREX(BeMCOperand::FromReg(X64Reg_R11D), BeMCOperand::FromReg(srcReg), false);
  10992. Emit(0x8B);
  10993. EmitModRMRel(EncodeRegNum(X64Reg_R11D), srcReg, X64Reg_None, 1, curOfs + srcOfs);
  10994. EmitREX(BeMCOperand::FromReg(X64Reg_R11D), BeMCOperand::FromReg(destReg), false);
  10995. Emit(0x89);
  10996. EmitModRMRel(EncodeRegNum(X64Reg_R11D), destReg, X64Reg_None, 1, curOfs + destOfs);
  10997. }
  10998. for ( ; curOfs <= memSize - 2; curOfs += 2)
  10999. {
  11000. Emit(0x66); EmitREX(BeMCOperand::FromReg(X64Reg_R11W), BeMCOperand::FromReg(srcReg), false);
  11001. Emit(0x8B);
  11002. EmitModRMRel(EncodeRegNum(X64Reg_R11W), srcReg, X64Reg_None, 1, curOfs + srcOfs);
  11003. Emit(0x66); EmitREX(BeMCOperand::FromReg(X64Reg_R11W), BeMCOperand::FromReg(destReg), false);
  11004. Emit(0x89);
  11005. EmitModRMRel(EncodeRegNum(X64Reg_R11W), destReg, X64Reg_None, 1, curOfs + destOfs);
  11006. }
  11007. for ( ; curOfs <= memSize - 1; curOfs += 1)
  11008. {
  11009. EmitREX(BeMCOperand::FromReg(X64Reg_R11B), BeMCOperand::FromReg(srcReg), false);
  11010. Emit(0x8B - 1);
  11011. EmitModRMRel(EncodeRegNum(X64Reg_R11B), srcReg, X64Reg_None, 1, curOfs + srcOfs);
  11012. EmitREX(BeMCOperand::FromReg(X64Reg_R11B), BeMCOperand::FromReg(destReg), false);
  11013. Emit(0x89 - 1);
  11014. EmitModRMRel(EncodeRegNum(X64Reg_R11B), destReg, X64Reg_None, 1, curOfs + destOfs);
  11015. }
  11016. }
  11017. break;
  11018. case BeMCInstKind_FastCheckStack:
  11019. {
  11020. // CMP RSP, [RSP]
  11021. BF_ASSERT(inst->mArg0 == BeMCOperand::FromReg(X64Reg_RSP));
  11022. Emit(0x48);
  11023. Emit(0x3B);
  11024. Emit(0x24);
  11025. Emit(0x24);
  11026. }
  11027. break;
  11028. case BeMCInstKind_TLSSetup:
  11029. {
  11030. if (inst->mArg1) // Alt
  11031. {
  11032. BF_ASSERT(inst->mArg0.IsNativeReg());
  11033. // mov arg0, qword ptr gs:[0x58]
  11034. Emit(0x65);
  11035. EmitREX(inst->mArg0, BeMCOperand(), true);
  11036. Emit(0x8B); Emit(0x04 | (EncodeRegNum(inst->mArg0.mReg) << 3)); Emit(0x25);
  11037. mOut.Write((int32)0x58);
  11038. }
  11039. else
  11040. {
  11041. // mov eax, _tls_index
  11042. Emit(0x8B); Emit(0x05);
  11043. auto sym = mCOFFObject->GetSymbolRef("_tls_index");
  11044. BeMCRelocation reloc;
  11045. reloc.mKind = BeMCRelocationKind_REL32;
  11046. reloc.mOffset = mOut.GetPos();
  11047. reloc.mSymTableIdx = sym->mIdx;
  11048. mCOFFObject->mTextSect.mRelocs.push_back(reloc);
  11049. mTextRelocs.push_back((int)mCOFFObject->mTextSect.mRelocs.size() - 1);
  11050. mOut.Write((int32)0);
  11051. auto vregInfo = mVRegInfo[mTLSVRegIdx];
  11052. BF_ASSERT(vregInfo->mReg != X64Reg_None);
  11053. auto tlsOperand = BeMCOperand::FromReg(vregInfo->mReg);
  11054. // mov tlsReg, qword ptr gs:[0x58]
  11055. Emit(0x65);
  11056. EmitREX(tlsOperand, BeMCOperand(), true);
  11057. Emit(0x8B); Emit(0x04 | (EncodeRegNum(vregInfo->mReg) << 3)); Emit(0x25);
  11058. mOut.Write((int32)0x58);
  11059. // mov tlsReg, qword ptr [tlsReg + 8*rax]
  11060. EmitREX(tlsOperand, tlsOperand, true);
  11061. Emit(0x8B);
  11062. EmitModRMRel(EncodeRegNum(vregInfo->mReg), vregInfo->mReg, X64Reg_RAX, 8, 0);
  11063. }
  11064. }
  11065. break;
  11066. case BeMCInstKind_PreserveVolatiles:
  11067. {
  11068. for (int vregIdx : *inst->mLiveness)
  11069. {
  11070. if (vregIdx >= mLivenessContext.mNumItems)
  11071. continue;
  11072. auto vregInfo = mVRegInfo[vregIdx];
  11073. if ((inst->mArg0.IsNativeReg()) && (inst->mArg0.mReg != vregInfo->mReg))
  11074. continue;
  11075. if (vregInfo->mVolatileVRegSave != -1)
  11076. {
  11077. if (vregInfo->mDbgVariable != NULL)
  11078. {
  11079. BeDbgVariableRange range;
  11080. range.mOffset = funcCodePos;
  11081. range.mLength = -1;
  11082. vregInfo->mDbgVariable->mSavedRanges.push_back(range);
  11083. }
  11084. }
  11085. }
  11086. }
  11087. break;
  11088. case BeMCInstKind_RestoreVolatiles:
  11089. {
  11090. for (int vregIdx : *inst->mLiveness)
  11091. {
  11092. if (vregIdx >= mLivenessContext.mNumItems)
  11093. continue;
  11094. auto vregInfo = mVRegInfo[vregIdx];
  11095. if ((inst->mArg0.IsNativeReg()) && (inst->mArg0.mReg != vregInfo->mReg))
  11096. continue;
  11097. if (vregInfo->mVolatileVRegSave != -1)
  11098. {
  11099. if ((vregInfo->mDbgVariable != NULL) && (!vregInfo->mDbgVariable->mSavedRanges.empty()))
  11100. {
  11101. BeDbgVariableRange& range = vregInfo->mDbgVariable->mSavedRanges.back();
  11102. range.mLength = funcCodePos - range.mOffset;
  11103. bool handled = false;
  11104. if (!vregInfo->mDbgVariable->mGaps.empty())
  11105. {
  11106. auto& lastGap = vregInfo->mDbgVariable->mGaps.back();
  11107. if (lastGap.mLength == -1)
  11108. {
  11109. lastGap.mLength = funcCodePos - lastGap.mOffset;
  11110. handled = true;
  11111. }
  11112. }
  11113. if (!handled)
  11114. {
  11115. BeDbgVariableRange gapRange = range;
  11116. // gapRange.mOffset++;
  11117. // gapRange.mLength--;
  11118. vregInfo->mDbgVariable->mGaps.push_back(gapRange);
  11119. }
  11120. }
  11121. }
  11122. }
  11123. }
  11124. break;
  11125. case BeMCInstKind_None:
  11126. break;
  11127. case BeMCInstKind_Unwind_Alloc:
  11128. case BeMCInstKind_Unwind_PushReg:
  11129. case BeMCInstKind_Unwind_SaveXMM:
  11130. case BeMCInstKind_Unwind_SetBP:
  11131. {
  11132. BeMCDeferredUnwind deferredUnwind = { inst, funcCodePos };
  11133. deferredUnwinds.push_back(deferredUnwind);
  11134. }
  11135. break;
  11136. case BeMCInstKind_Label:
  11137. while (funcCodePos < hotJumpLen)
  11138. {
  11139. Emit(0x90);
  11140. funcCodePos++;
  11141. }
  11142. lastLabelIdx = inst->mArg0.mLabelIdx;
  11143. labelPositions[inst->mArg0.mLabelIdx] = funcCodePos;
  11144. // This ensures we can't jump back into the hot jump area
  11145. break;
  11146. case BeMCInstKind_Nop:
  11147. Emit(0x90);
  11148. break;
  11149. case BeMCInstKind_Unreachable:
  11150. // ud2
  11151. Emit(0x0F); Emit(0x0B);
  11152. break;
  11153. case BeMCInstKind_EnsureInstructionAt:
  11154. needsInstructionAtDbgLoc = true;
  11155. /*if (mDbgFunction != NULL)
  11156. {
  11157. // If this is true, this means that our instruction was the first one encountered at this mDbgPos,
  11158. // so we emit a NOP so we can step onto this line
  11159. if (mDbgFunction->mEmissions.back().mPos == funcCodePos)
  11160. {
  11161. mOut.Write((uint8)0x90);
  11162. }
  11163. }*/
  11164. break;
  11165. case BeMCInstKind_DbgBreak:
  11166. Emit(0xCC);
  11167. break;
  11168. case BeMCInstKind_MFence:
  11169. Emit(0x0F); Emit(0xAE); Emit(0xF0);
  11170. break;
  11171. case BeMCInstKind_Mov:
  11172. {
  11173. if (inst->mArg1.mKind == BeMCOperandKind_ConstAgg)
  11174. {
  11175. EmitAggMov(inst->mArg0, inst->mArg1);
  11176. break;
  11177. }
  11178. auto vregInfo = GetVRegInfo(inst->mArg1);
  11179. auto arg0Type = GetType(inst->mArg0);
  11180. auto arg1Type = GetType(inst->mArg1);
  11181. if (instForm == BeMCInstForm_Unknown)
  11182. {
  11183. if ((inst->mArg0.IsNativeReg()) && (inst->mArg1.IsNativeReg()))
  11184. {
  11185. if ((arg0Type->IsInt()) && (arg0Type->mSize < arg1Type->mSize))
  11186. {
  11187. // Reduce arg1 to arg0 size
  11188. BeMCOperand mcDest;
  11189. BeMCOperand mcSrc = BeMCOperand::FromReg(ResizeRegister(inst->mArg1.mReg, arg0Type->mSize));
  11190. BeTypeCode useTypeCode = BeTypeCode_None;
  11191. if (mcSrc.mReg != X64Reg_None)
  11192. {
  11193. // Reduction worked
  11194. mcDest = inst->mArg0;
  11195. useTypeCode = arg0Type->mTypeCode;
  11196. }
  11197. else
  11198. {
  11199. Fail("Error in Mov");
  11200. }
  11201. switch (useTypeCode)
  11202. {
  11203. case BeTypeCode_Int8:
  11204. EmitREX(mcDest, mcSrc, false);
  11205. Emit(0x8A); EmitModRM(mcDest, mcSrc);
  11206. break;
  11207. case BeTypeCode_Int16: Emit(0x66); // Fallthrough
  11208. case BeTypeCode_Int32:
  11209. case BeTypeCode_Int64:
  11210. EmitREX(mcDest, mcSrc, arg0Type->mTypeCode == BeTypeCode_Int64);
  11211. Emit(0x8B); EmitModRM(mcDest, mcSrc);
  11212. break;
  11213. default: NotImpl();
  11214. }
  11215. break;
  11216. }
  11217. }
  11218. if (inst->mArg0.IsNativeReg())
  11219. {
  11220. BF_ASSERT(arg0Type->IsIntable());
  11221. BF_ASSERT(arg1Type->IsIntable());
  11222. BF_ASSERT(arg0Type->mSize > arg1Type->mSize);
  11223. // Zero extend 'dest' to 'src', emit movzx
  11224. switch (arg0Type->mTypeCode)
  11225. {
  11226. case BeTypeCode_Int16:
  11227. BF_ASSERT(arg1Type->mTypeCode == BeTypeCode_Int8);
  11228. Emit(0x66);
  11229. EmitREX(inst->mArg0, inst->mArg1, false);
  11230. Emit(0x0F); Emit(0xB6); EmitModRM(inst->mArg0, inst->mArg1);
  11231. break;
  11232. case BeTypeCode_Int32:
  11233. switch (arg1Type->mTypeCode)
  11234. {
  11235. case BeTypeCode_Int8:
  11236. case BeTypeCode_Boolean:
  11237. EmitREX(inst->mArg0, inst->mArg1, false);
  11238. Emit(0x0F); Emit(0xB6); EmitModRM(inst->mArg0, inst->mArg1);
  11239. break;
  11240. case BeTypeCode_Int16:
  11241. EmitREX(inst->mArg0, inst->mArg1, false);
  11242. Emit(0x0F); Emit(0xB7); EmitModRM(inst->mArg0, inst->mArg1);
  11243. break;
  11244. default: NotImpl();
  11245. }
  11246. break;
  11247. case BeTypeCode_Int64:
  11248. switch (arg1Type->mTypeCode)
  11249. {
  11250. case BeTypeCode_Int8:
  11251. case BeTypeCode_Boolean:
  11252. EmitREX(inst->mArg0, inst->mArg1, true);
  11253. Emit(0x0F); Emit(0xB6); EmitModRM(inst->mArg0, inst->mArg1); break;
  11254. case BeTypeCode_Int16:
  11255. EmitREX(inst->mArg0, inst->mArg1, true);
  11256. Emit(0x0F); Emit(0xB7); EmitModRM(inst->mArg0, inst->mArg1); break;
  11257. case BeTypeCode_Int32:
  11258. {
  11259. // We convert from a "mov r64, r32" to a "mov r32, r32", which forces high 32 bits of original r64 to zero
  11260. BeMCOperand mcDest = BeMCOperand::FromReg(ResizeRegister(inst->mArg0.mReg, arg1Type->mSize));
  11261. EmitREX(mcDest, inst->mArg1, false);
  11262. Emit(0x8B); EmitModRM(mcDest, inst->mArg1);
  11263. }
  11264. break;
  11265. }
  11266. break;
  11267. default:
  11268. NotImpl();
  11269. }
  11270. break; // from inst switch
  11271. }
  11272. if (arg0Type->mTypeCode == BeTypeCode_Float)
  11273. {
  11274. if (inst->mArg1.IsImmediate())
  11275. {
  11276. // Emit as a int32 mov
  11277. EmitREX(BeMCOperand(), inst->mArg0, false);
  11278. Emit(0xC7);
  11279. EmitModRM(0, inst->mArg0, -4);
  11280. float val = inst->mArg1.mImmFloat;
  11281. mOut.Write(*(int32*)&val);
  11282. break;
  11283. }
  11284. }
  11285. }
  11286. if (inst->mArg1.mKind == BeMCOperandKind_CmpResult)
  11287. {
  11288. BF_ASSERT(instForm == BeMCInstForm_R8_RM8);
  11289. // SETcc
  11290. auto& cmpResult = mCmpResults[inst->mArg1.mCmpResultIdx];
  11291. uint8 opCode = GetJumpOpCode(cmpResult.mCmpKind, false) + 0x20;
  11292. EmitREX(BeMCOperand(), inst->mArg0, false);
  11293. Emit(0x0F);
  11294. Emit(opCode);
  11295. EmitModRM(0, inst->mArg0);
  11296. break;
  11297. }
  11298. bool isLEA = inst->mArg1.mKind == BeMCOperandKind_SymbolAddr;
  11299. if ((instForm == BeMCInstForm_R64_RM64) && (inst->mArg1.IsVRegAny()))
  11300. {
  11301. bool isMulti = false;
  11302. if (GetRMForm(inst->mArg1, isMulti) == BeMCRMMode_Direct)
  11303. {
  11304. // LEA
  11305. auto modInst = *inst;
  11306. BF_ASSERT(modInst.mArg1.IsVRegAny());
  11307. modInst.mArg1 = BeMCOperand::ToLoad(modInst.mArg1);
  11308. EmitInst(BeMCInstForm_R64_RM64, 0x8D, &modInst);
  11309. break;
  11310. }
  11311. else
  11312. {
  11313. auto vregInfo1 = GetVRegInfo(inst->mArg1);
  11314. if (vregInfo1->mRelTo.mKind == BeMCOperandKind_SymbolAddr)
  11315. isLEA = true;
  11316. }
  11317. }
  11318. if (inst->mArg1.mKind == BeMCOperandKind_VRegAddr)
  11319. {
  11320. NotImpl();
  11321. /*// LEA
  11322. switch (instForm)
  11323. {
  11324. case BeMCInstForm_R64_RM64: EmitInst(BeMCInstForm_R64_RM64, 0x8D, inst); break;
  11325. default:
  11326. NotImpl();
  11327. }*/
  11328. }
  11329. else if (isLEA)
  11330. {
  11331. // LEA
  11332. switch (instForm)
  11333. {
  11334. case BeMCInstForm_R64_RM64: EmitInst(BeMCInstForm_R64_RM64, 0x8D, inst); break;
  11335. default:
  11336. NotImpl();
  11337. }
  11338. }
  11339. // ??
  11340. /*else if ((vregInfo != NULL) && (vregInfo->mIsExpr))
  11341. {
  11342. // LEA
  11343. switch (instForm)
  11344. {
  11345. case BeMCInstForm_R64_RM64: EmitInst(BeMCInstForm_R64_RM64_ADDR, 0x8D, inst); break;
  11346. default:
  11347. NotImpl();
  11348. }
  11349. }*/
  11350. else if ((inst->mArg0.IsNativeReg()) && (inst->mArg1.IsZero()))
  11351. {
  11352. // Emit as XOR <arg0>, <arg0>
  11353. EmitREX(inst->mArg0, inst->mArg0, GetType(inst->mArg0)->mSize == 8);
  11354. mOut.Write((uint8)0x33); // r, r/m64
  11355. EmitModRM(inst->mArg0, inst->mArg0);
  11356. }
  11357. else
  11358. {
  11359. switch (instForm)
  11360. {
  11361. case BeMCInstForm_XMM32_RM32:
  11362. {
  11363. BF_ASSERT(inst->mArg1.IsNativeReg());
  11364. // CVTSI2SS - use zero-extended 64-bit register
  11365. EmitStdXMMInst(BeMCInstForm_XMM32_RM64, inst, 0x2A);
  11366. }
  11367. break;
  11368. case BeMCInstForm_XMM64_RM32:
  11369. {
  11370. BF_ASSERT(inst->mArg1.IsNativeReg());
  11371. // CVTSI2SD - use zero-extended 64-bit register
  11372. EmitStdXMMInst(BeMCInstForm_XMM64_RM64, inst, 0x2A);
  11373. }
  11374. break;
  11375. case BeMCInstForm_XMM64_RM64:
  11376. case BeMCInstForm_XMM32_RM64:
  11377. {
  11378. // uint64->xmm Not implemented
  11379. NotImpl();
  11380. }
  11381. break;
  11382. case BeMCInstForm_XMM64_FRM32:
  11383. case BeMCInstForm_XMM32_FRM64:
  11384. {
  11385. // CVTSS2SD / CVTSD2SS
  11386. EmitStdXMMInst(instForm, inst, 0x5A);
  11387. }
  11388. break;
  11389. case BeMCInstForm_R32_F32:
  11390. case BeMCInstForm_R32_F64:
  11391. case BeMCInstForm_R64_F32:
  11392. case BeMCInstForm_R64_F64:
  11393. {
  11394. // CVTTSS2SI
  11395. EmitStdXMMInst(instForm, inst, 0x2C);
  11396. }
  11397. break;
  11398. default:
  11399. {
  11400. // MOVSS/MOVSD
  11401. if (EmitStdXMMInst(instForm, inst, 0x10, 0x11))
  11402. break;
  11403. if ((inst->mArg0.IsNativeReg()) && (inst->mArg1.IsImmediateInt()))
  11404. {
  11405. auto arg0Type = GetType(inst->mArg0);
  11406. if (arg0Type->mTypeCode == BeTypeCode_Int16)
  11407. {
  11408. Emit(0x66);
  11409. EmitREX(BeMCOperand(), inst->mArg0, false);
  11410. Emit(0xB8 + EncodeRegNum(inst->mArg0.mReg));
  11411. mOut.Write((int16)inst->mArg1.mImmediate);
  11412. break;
  11413. }
  11414. else if ((arg0Type->mTypeCode == BeTypeCode_Int32) || (arg0Type->mTypeCode == BeTypeCode_Int64))
  11415. {
  11416. // For 64-bit writes, we would like to use 32-bit zero extension but we resort to the full
  11417. // 64-bits if necessary
  11418. auto arg0 = inst->mArg0;
  11419. if (arg0Type->mTypeCode == BeTypeCode_Int64)
  11420. {
  11421. auto resizedReg = ResizeRegister(arg0.mReg, 4);
  11422. if ((resizedReg != X64Reg_None) && (inst->mArg1.mImmediate < 0) && (inst->mArg1.mImmediate >= -0x80000000LL))
  11423. {
  11424. // Do sign-extend R32 mov
  11425. EmitREX(BeMCOperand(), inst->mArg0, true);
  11426. Emit(0xC7);
  11427. EmitModRM(0, inst->mArg0);
  11428. mOut.Write((int32)inst->mArg1.mImmediate);
  11429. break;
  11430. }
  11431. if ((resizedReg == X64Reg_None) || (inst->mArg1.mImmediate < 0) || (inst->mArg1.mImmediate >= 0x100000000LL))
  11432. {
  11433. EmitREX(BeMCOperand(), inst->mArg0, true);
  11434. Emit(0xB8 + EncodeRegNum(inst->mArg0.mReg));
  11435. mOut.Write((int64)inst->mArg1.mImmediate);
  11436. break;
  11437. }
  11438. else
  11439. arg0.mReg = resizedReg;
  11440. }
  11441. EmitREX(BeMCOperand(), arg0, false);
  11442. Emit(0xB8 + EncodeRegNum(arg0.mReg));
  11443. mOut.Write((int32)inst->mArg1.mImmediate);
  11444. break;
  11445. }
  11446. }
  11447. EmitStdInst(instForm, inst, 0x89, 0x8B, 0xC7, 0x0);
  11448. }
  11449. }
  11450. }
  11451. }
  11452. break;
  11453. case BeMCInstKind_MovRaw:
  11454. {
  11455. auto arg0Type = GetType(inst->mArg0);
  11456. auto arg1Type = GetType(inst->mArg1);
  11457. if ((arg0Type->mTypeCode == BeTypeCode_Int64) && (arg1Type->mTypeCode == BeTypeCode_Double))
  11458. {
  11459. Emit(0x66); EmitREX(inst->mArg1, inst->mArg0, true);
  11460. Emit(0x0F); Emit(0x7E);
  11461. EmitModRM(inst->mArg1, inst->mArg0);
  11462. }
  11463. else
  11464. {
  11465. NotImpl();
  11466. }
  11467. }
  11468. break;
  11469. case BeMCInstKind_MovSX:
  11470. {
  11471. auto arg0Type = GetType(inst->mArg0);
  11472. auto arg1Type = GetType(inst->mArg1);
  11473. switch (arg0Type->mTypeCode)
  11474. {
  11475. case BeTypeCode_Int16:
  11476. BF_ASSERT(arg1Type->mTypeCode == BeTypeCode_Int8);
  11477. Emit(0x66);
  11478. EmitREX(inst->mArg0, inst->mArg1, false);
  11479. Emit(0x0F); Emit(0xBE); EmitModRM(inst->mArg0, inst->mArg1);
  11480. break;
  11481. case BeTypeCode_Int32:
  11482. switch (arg1Type->mTypeCode)
  11483. {
  11484. case BeTypeCode_Int8:
  11485. EmitREX(inst->mArg0, inst->mArg1, false);
  11486. Emit(0x0F); Emit(0xBE); EmitModRM(inst->mArg0, inst->mArg1);
  11487. break;
  11488. case BeTypeCode_Int16:
  11489. EmitREX(inst->mArg0, inst->mArg1, false);
  11490. Emit(0x0F); Emit(0xBF); EmitModRM(inst->mArg0, inst->mArg1);
  11491. break;
  11492. case BeTypeCode_Float:
  11493. // CVTSS2SI
  11494. Emit(0xF3); EmitREX(inst->mArg0, inst->mArg1, false);
  11495. Emit(0x0F); Emit(0x2C);
  11496. EmitModRM(inst->mArg0, inst->mArg1);
  11497. break;
  11498. default: NotImpl();
  11499. }
  11500. break;
  11501. case BeTypeCode_Int64:
  11502. switch (arg1Type->mTypeCode)
  11503. {
  11504. case BeTypeCode_Int8:
  11505. EmitREX(inst->mArg0, inst->mArg1, true);
  11506. Emit(0x0F); Emit(0xBE); EmitModRM(inst->mArg0, inst->mArg1); break;
  11507. case BeTypeCode_Int16:
  11508. EmitREX(inst->mArg0, inst->mArg1, true);
  11509. Emit(0x0F); Emit(0xBF); EmitModRM(inst->mArg0, inst->mArg1); break;
  11510. case BeTypeCode_Int32:
  11511. EmitREX(inst->mArg0, inst->mArg1, true);
  11512. Emit(0x63); EmitModRM(inst->mArg0, inst->mArg1); break;
  11513. case BeTypeCode_Float:
  11514. // CVTSS2SI
  11515. Emit(0xF3); EmitREX(inst->mArg0, inst->mArg1, true);
  11516. Emit(0x0F); Emit(0x2C);
  11517. EmitModRM(inst->mArg0, inst->mArg1);
  11518. break;
  11519. default: NotImpl();
  11520. }
  11521. break;
  11522. case BeTypeCode_Float:
  11523. case BeTypeCode_Double:
  11524. {
  11525. if (arg1Type->IsInt())
  11526. {
  11527. // CVTSI2SS / CVTSI2SD
  11528. EmitStdXMMInst(instForm, inst, 0x2A);
  11529. }
  11530. else
  11531. NotImpl();
  11532. /*switch (arg1Type->mTypeCode)
  11533. {
  11534. case BeTypeCode_Double:
  11535. EmitStdXMMInst(BeMCInstForm_XMM32_RM64, inst, 0x5A);
  11536. break;
  11537. default:
  11538. NotImpl();
  11539. break;
  11540. }*/
  11541. }
  11542. break;
  11543. default: NotImpl();
  11544. }
  11545. }
  11546. break;
  11547. case BeMCInstKind_CmpXChg:
  11548. {
  11549. auto arg0Type = GetType(inst->mArg0);
  11550. if (inst->mArg1.IsNativeReg())
  11551. {
  11552. switch (instForm)
  11553. {
  11554. case BeMCInstForm_R8_RM8:
  11555. instForm = BeMCInstForm_RM8_R8;
  11556. break;
  11557. case BeMCInstForm_R16_RM16:
  11558. instForm = BeMCInstForm_RM16_R16;
  11559. break;
  11560. case BeMCInstForm_R32_RM32:
  11561. instForm = BeMCInstForm_RM32_R32;
  11562. break;
  11563. case BeMCInstForm_R64_RM64:
  11564. instForm = BeMCInstForm_RM64_R64;
  11565. break;
  11566. }
  11567. }
  11568. if (!inst->mArg0.IsNativeReg())
  11569. Emit(0xF0); // LOCK
  11570. switch (instForm)
  11571. {
  11572. case BeMCInstForm_RM8_R8:
  11573. EmitREX(inst->mArg1, inst->mArg0, false);
  11574. Emit(0x0F); Emit(0xB0); EmitModRM(inst->mArg1, inst->mArg0);
  11575. break;
  11576. case BeMCInstForm_RM16_R16:
  11577. EmitREX(inst->mArg1, inst->mArg0, false);
  11578. Emit(0x66); Emit(0x0F); Emit(0xB0); EmitModRM(inst->mArg1, inst->mArg0);
  11579. break;
  11580. case BeMCInstForm_RM32_R32:
  11581. EmitREX(inst->mArg1, inst->mArg0, false);
  11582. Emit(0x0F); Emit(0xB1); EmitModRM(inst->mArg1, inst->mArg0);
  11583. break;
  11584. case BeMCInstForm_RM64_R64:
  11585. EmitREX(inst->mArg1, inst->mArg0, true);
  11586. Emit(0x0F); Emit(0xB1); EmitModRM(inst->mArg1, inst->mArg0);
  11587. break;
  11588. default:
  11589. Fail("Invalid CmpXChg args");
  11590. }
  11591. }
  11592. break;
  11593. case BeMCInstKind_XAdd:
  11594. {
  11595. auto arg0Type = GetType(inst->mArg0);
  11596. switch (instForm)
  11597. {
  11598. case BeMCInstForm_R8_RM8:
  11599. if (inst->mArg1.IsNativeReg())
  11600. instForm = BeMCInstForm_RM8_R8;
  11601. break;
  11602. case BeMCInstForm_R16_RM16:
  11603. if (inst->mArg1.IsNativeReg())
  11604. instForm = BeMCInstForm_RM16_R16;
  11605. break;
  11606. case BeMCInstForm_R32_RM32:
  11607. if (inst->mArg1.IsNativeReg())
  11608. instForm = BeMCInstForm_RM32_R32;
  11609. break;
  11610. case BeMCInstForm_R64_RM64:
  11611. if (inst->mArg1.IsNativeReg())
  11612. instForm = BeMCInstForm_RM64_R64;
  11613. break;
  11614. }
  11615. if (!inst->mArg0.IsNativeReg())
  11616. Emit(0xF0); // LOCK
  11617. switch (instForm)
  11618. {
  11619. case BeMCInstForm_RM8_R8:
  11620. EmitREX(inst->mArg1, inst->mArg0, false);
  11621. Emit(0x0F); Emit(0xC0); EmitModRM(inst->mArg1, inst->mArg0);
  11622. break;
  11623. case BeMCInstForm_RM16_R16:
  11624. EmitREX(inst->mArg1, inst->mArg0, false);
  11625. Emit(0x66); Emit(0x0F); Emit(0xC0); EmitModRM(inst->mArg1, inst->mArg0);
  11626. break;
  11627. case BeMCInstForm_RM32_R32:
  11628. EmitREX(inst->mArg1, inst->mArg0, false);
  11629. Emit(0x0F); Emit(0xC1); EmitModRM(inst->mArg1, inst->mArg0);
  11630. break;
  11631. case BeMCInstForm_RM64_R64:
  11632. EmitREX(inst->mArg1, inst->mArg0, true);
  11633. Emit(0x0F); Emit(0xC1); EmitModRM(inst->mArg1, inst->mArg0);
  11634. break;
  11635. default:
  11636. Fail("Invalid XAdd args");
  11637. }
  11638. }
  11639. break;
  11640. case BeMCInstKind_XChg:
  11641. {
  11642. EmitStdInst(instForm, inst, 0x87, 0x87, 0x00, 0x0);
  11643. }
  11644. break;
  11645. case BeMCInstKind_Load:
  11646. {
  11647. if (inst->mArg1.IsSymbol())
  11648. {
  11649. BF_ASSERT(inst->mArg0.IsNativeReg());
  11650. }
  11651. switch (instForm)
  11652. {
  11653. case BeMCInstForm_XMM64_FRM64:
  11654. case BeMCInstForm_XMM32_FRM32:
  11655. // MOVSS/MOVSD
  11656. EmitStdXMMInst(instForm, inst, 0x10);
  11657. break;
  11658. case BeMCInstForm_R32_RM32:
  11659. EmitInst(BeMCInstForm_R32_RM64_ADDR, 0x8B, inst);
  11660. break;
  11661. case BeMCInstForm_R64_RM64:
  11662. EmitInst(BeMCInstForm_R64_RM64_ADDR, 0x8B, inst);
  11663. break;
  11664. case BeMCInstForm_XMM32_RM64:
  11665. case BeMCInstForm_XMM64_RM64:
  11666. // MOVSS / MOVSD
  11667. BF_ASSERT(inst->mArg0.IsNativeReg());
  11668. if (instForm == BeMCInstForm_XMM64_RM64)
  11669. Emit(0xF2);
  11670. else
  11671. Emit(0xF3);
  11672. EmitREX(inst->mArg0, inst->mArg1, false);
  11673. Emit(0x0F); Emit(0x10);
  11674. EmitModRM_Addr(inst->mArg0, inst->mArg1);
  11675. break;
  11676. default:
  11677. {
  11678. BF_ASSERT(inst->mArg0.IsNativeReg());
  11679. auto arg0Type = GetType(inst->mArg0);
  11680. auto arg1Type = GetType(inst->mArg1);
  11681. BF_ASSERT(arg1Type->mSize == 8);
  11682. switch (arg0Type->mSize)
  11683. {
  11684. case 1: EmitInst(BeMCInstForm_R8_RM64_ADDR, 0x8B, inst); break;
  11685. case 2: EmitInst(BeMCInstForm_R16_RM64_ADDR, 0x8B, inst); break;
  11686. case 4: EmitInst(BeMCInstForm_R32_RM64_ADDR, 0x8B, inst); break;
  11687. case 8: EmitInst(BeMCInstForm_R64_RM64_ADDR, 0x8B, inst); break;
  11688. }
  11689. }
  11690. }
  11691. /*BF_ASSERT(inst->mArg0.mKind == BeMCOperandKind_NativeReg);
  11692. BF_ASSERT(inst->mArg1.mKind == BeMCOperandKind_NativeReg);
  11693. EmitREX(inst->mArg0, inst->mArg1);
  11694. mOut.Write((uint8)0x8B);
  11695. uint8 modRM = (0x0 << 6) | (EncodeRegNum(inst->mArg1.mReg)) | (EncodeRegNum(inst->mArg0.mReg)); // <arg0>, [<arg1>]
  11696. mOut.Write(modRM);*/
  11697. }
  11698. break;
  11699. case BeMCInstKind_Store:
  11700. {
  11701. switch (instForm)
  11702. {
  11703. /*case BeMCInstForm_R64_RM64:
  11704. {
  11705. // Make sure its really R64, R64
  11706. BF_ASSERT(inst->mArg1.IsNativeReg());
  11707. EmitInst(BeMCInstForm_RM64_R64_ADDR, 0x89, inst);
  11708. }
  11709. break;*/
  11710. case BeMCInstForm_RM64_R64: EmitInst(BeMCInstForm_RM64_R64_ADDR, 0x89, inst); break;
  11711. case BeMCInstForm_FRM32_XMM32:
  11712. case BeMCInstForm_FRM64_XMM64:
  11713. // MOVSS/MOVSD
  11714. EmitStdXMMInst(instForm, inst, 0x10, 0x11);
  11715. break;
  11716. case BeMCInstForm_R64_F64:
  11717. case BeMCInstForm_R64_F32:
  11718. // MOVSS / MOVSD
  11719. BF_ASSERT(inst->mArg1.IsNativeReg());
  11720. if (instForm == BeMCInstForm_R64_F64)
  11721. Emit(0xF2);
  11722. else
  11723. Emit(0xF3);
  11724. EmitREX(inst->mArg1, inst->mArg0, false);
  11725. Emit(0x0F); Emit(0x11);
  11726. EmitModRM_Addr(inst->mArg1, inst->mArg0);
  11727. break;
  11728. default:
  11729. {
  11730. BF_ASSERT(inst->mArg0.IsNativeReg());
  11731. BF_ASSERT(inst->mArg1.IsNativeReg());
  11732. auto arg0Type = GetType(inst->mArg0);
  11733. auto arg1Type = GetType(inst->mArg1);
  11734. BF_ASSERT(arg0Type->mSize == 8);
  11735. switch (arg1Type->mSize)
  11736. {
  11737. case 1: EmitInst(BeMCInstForm_RM64_R8_ADDR, 0x89, inst); break;
  11738. case 2: EmitInst(BeMCInstForm_RM64_R16_ADDR, 0x89, inst); break;
  11739. case 4: EmitInst(BeMCInstForm_RM64_R32_ADDR, 0x89, inst); break;
  11740. case 8: EmitInst(BeMCInstForm_RM64_R64_ADDR, 0x89, inst); break;
  11741. }
  11742. }
  11743. }
  11744. }
  11745. break;
  11746. case BeMCInstKind_Push:
  11747. {
  11748. auto arg0Type = GetType(inst->mArg0);
  11749. if (inst->mArg1)
  11750. {
  11751. BF_ASSERT(IsXMMReg(inst->mArg0.mReg));
  11752. BF_ASSERT(inst->mArg1.IsImmediate());
  11753. // Is there a performance benefit to properly using MOVAPD vs MOVAPS if we only
  11754. // use this register for double storage?
  11755. // MOVAPS
  11756. EmitREX(inst->mArg0, BeMCOperand(), false);
  11757. Emit(0x0F); Emit(0x29);
  11758. EmitModRMRel(EncodeRegNum(inst->mArg0.mReg), X64Reg_RSP, X64Reg_None, 1, (int)inst->mArg1.mImmediate);
  11759. break;
  11760. }
  11761. if (arg0Type->IsFloat())
  11762. {
  11763. BF_ASSERT(IsXMMReg(inst->mArg0.mReg));
  11764. // sub rsp, sizeof(arg0)
  11765. Emit(0x48); Emit(0x83); Emit(0xEC); Emit(arg0Type->mSize);
  11766. Emit((arg0Type->mSize == 4) ? 0xF3 : 0xF2);
  11767. EmitREX(inst->mArg0, BeMCOperand(), false);
  11768. Emit(0x0F); Emit(0x11);
  11769. EmitModRMRel(EncodeRegNum(inst->mArg0.mReg), X64Reg_RSP, X64Reg_None, 1, 0);
  11770. break;
  11771. }
  11772. // This is used in combination with register pops, and we can't pop 32-bit registers
  11773. // so we need to make sure we're always pushing a full 64 bits
  11774. switch (instForm)
  11775. {
  11776. case BeMCInstForm_R8: // Always use full reg (always push 64 bits)
  11777. case BeMCInstForm_R16:
  11778. case BeMCInstForm_R32:
  11779. case BeMCInstForm_R64:
  11780. EmitREX(BeMCOperand(), inst->mArg0, true);
  11781. mOut.Write((uint8)(0x50 + EncodeRegNum(inst->mArg0.mReg)));
  11782. break;
  11783. case BeMCInstForm_RM64:
  11784. EmitREX(BeMCOperand(), inst->mArg0, true);
  11785. Emit(0xFF); EmitModRM(6, inst->mArg0);
  11786. break;
  11787. case BeMCInstForm_IMM32: // Always pad to 64 bits
  11788. {
  11789. Emit(0x68); mOut.Write((int32)inst->mArg0.mImmediate);
  11790. // Emit padded 0
  11791. Emit(0x68); mOut.Write((int32)0);
  11792. }
  11793. break;
  11794. default:
  11795. NotImpl();
  11796. }
  11797. }
  11798. break;
  11799. case BeMCInstKind_Pop:
  11800. {
  11801. auto arg0Type = GetType(inst->mArg0);
  11802. if (inst->mArg1)
  11803. {
  11804. BF_ASSERT(IsXMMReg(inst->mArg0.mReg));
  11805. BF_ASSERT(inst->mArg1.IsImmediate());
  11806. // Is there a performance benefit to properly using MOVAPD vs MOVAPS if we only
  11807. // use this register for double storage?
  11808. // MOVAPS
  11809. EmitREX(inst->mArg0, BeMCOperand(), false);
  11810. Emit(0x0F); Emit(0x28);
  11811. // Push always uses RSP (required for stack unwinding), but Pop uses RBP when applicable
  11812. // because it is still set up at that point
  11813. EmitModRMRelStack(EncodeRegNum(inst->mArg0.mReg), (int)inst->mArg1.mImmediate, 1);
  11814. break;
  11815. }
  11816. if (arg0Type->IsFloat())
  11817. {
  11818. BF_ASSERT(IsXMMReg(inst->mArg0.mReg));
  11819. Emit((arg0Type->mSize == 4) ? 0xF3 : 0xF2);
  11820. EmitREX(inst->mArg0, BeMCOperand(), false);
  11821. Emit(0x0F); Emit(0x10);
  11822. EmitModRMRel(EncodeRegNum(inst->mArg0.mReg), X64Reg_RSP, X64Reg_None, 1, 0);
  11823. // add rsp, sizeof(arg0)
  11824. Emit(0x48); Emit(0x83); Emit(0xC4); Emit(arg0Type->mSize);
  11825. break;
  11826. }
  11827. switch (instForm)
  11828. {
  11829. case BeMCInstForm_R64:
  11830. EmitREX(BeMCOperand(), inst->mArg0, true);
  11831. mOut.Write((uint8)(0x58 + EncodeRegNum(inst->mArg0.mReg)));
  11832. break;
  11833. case BeMCInstForm_RM64:
  11834. EmitREX(BeMCOperand(), inst->mArg0, true);
  11835. Emit(0x8F); EmitModRM(0, inst->mArg0);
  11836. default:
  11837. NotImpl();
  11838. }
  11839. }
  11840. break;
  11841. case BeMCInstKind_Neg:
  11842. {
  11843. auto typeCode = GetType(inst->mArg0)->mTypeCode;
  11844. switch (typeCode)
  11845. {
  11846. case BeTypeCode_Int8:
  11847. EmitREX(BeMCOperand(), inst->mArg0, false);
  11848. Emit(0xF6);
  11849. EmitModRM(3, inst->mArg0);
  11850. break;
  11851. case BeTypeCode_Int16: Emit(0x66); // Fallthrough
  11852. case BeTypeCode_Int32:
  11853. case BeTypeCode_Int64:
  11854. EmitREX(BeMCOperand(), inst->mArg0, typeCode == BeTypeCode_Int64);
  11855. Emit(0xF7); EmitModRM(3, inst->mArg0);
  11856. break;
  11857. default:
  11858. NotImpl();
  11859. }
  11860. }
  11861. break;
  11862. case BeMCInstKind_Not:
  11863. {
  11864. auto typeCode = GetType(inst->mArg0)->mTypeCode;
  11865. switch (typeCode)
  11866. {
  11867. case BeTypeCode_Int8:
  11868. EmitREX(BeMCOperand(), inst->mArg0, false);
  11869. Emit(0xF6);
  11870. EmitModRM(2, inst->mArg0);
  11871. break;
  11872. case BeTypeCode_Int16: Emit(0x66); // Fallthrough
  11873. case BeTypeCode_Int32:
  11874. case BeTypeCode_Int64:
  11875. EmitREX(BeMCOperand(), inst->mArg0, typeCode == BeTypeCode_Int64);
  11876. Emit(0xF7); EmitModRM(2, inst->mArg0);
  11877. break;
  11878. default:
  11879. NotImpl();
  11880. }
  11881. }
  11882. break;
  11883. case BeMCInstKind_Add:
  11884. {
  11885. if ((inst->mResult) && (inst->mResult != inst->mArg0))
  11886. {
  11887. BF_ASSERT(inst->mResult.IsNativeReg());
  11888. BF_ASSERT(inst->mArg0.IsNativeReg());
  11889. BF_ASSERT(inst->mArg1.IsImmediate());
  11890. // LEA form
  11891. auto resultType = GetType(inst->mArg0);
  11892. switch (resultType->mTypeCode)
  11893. {
  11894. case BeTypeCode_Int16:
  11895. Emit(0x66);
  11896. case BeTypeCode_Int32:
  11897. case BeTypeCode_Int64:
  11898. EmitREX(inst->mResult, inst->mArg0, resultType->mTypeCode == BeTypeCode_Int64);
  11899. Emit(0x8D); EmitModRMRel(EncodeRegNum(inst->mResult.mReg), ResizeRegister(inst->mArg0.mReg, 8), X64Reg_None, 1, (int)inst->mArg1.mImmediate);
  11900. break;
  11901. default:
  11902. NotImpl();
  11903. }
  11904. }
  11905. else if ((inst->mArg1.IsImmediateInt()) && (inst->mArg1.mImmediate == 1))
  11906. {
  11907. // Emit as INC <arg0>
  11908. auto typeCode = GetType(inst->mArg0)->mTypeCode;
  11909. switch (typeCode)
  11910. {
  11911. case BeTypeCode_Int8:
  11912. EmitREX(BeMCOperand(), inst->mArg0, false);
  11913. Emit(0xFE); EmitModRM(0, inst->mArg0);
  11914. break;
  11915. case BeTypeCode_Int16: Emit(0x66); // Fallthrough
  11916. case BeTypeCode_Int32:
  11917. case BeTypeCode_Int64:
  11918. EmitREX(BeMCOperand(), inst->mArg0, typeCode == BeTypeCode_Int64);
  11919. Emit(0xFF); EmitModRM(0, inst->mArg0);
  11920. break;
  11921. default:
  11922. NotImpl();
  11923. }
  11924. }
  11925. else if ((inst->mArg1.IsImmediateInt()) && (inst->mArg1.mImmediate == -1))
  11926. {
  11927. // Emit as DEC <arg0>
  11928. auto typeCode = GetType(inst->mArg0)->mTypeCode;
  11929. switch (typeCode)
  11930. {
  11931. case BeTypeCode_Int8:
  11932. EmitREX(BeMCOperand(), inst->mArg0, false);
  11933. Emit(0xFE); EmitModRM(1, inst->mArg0);
  11934. break;
  11935. case BeTypeCode_Int16: Emit(0x66); // Fallthrough
  11936. case BeTypeCode_Int32:
  11937. case BeTypeCode_Int64:
  11938. EmitREX(BeMCOperand(), inst->mArg0, typeCode == BeTypeCode_Int64);
  11939. Emit(0xFF); EmitModRM(1, inst->mArg0);
  11940. break;
  11941. default:
  11942. NotImpl();
  11943. }
  11944. }
  11945. else
  11946. {
  11947. if (((instForm == BeMCInstForm_RM64_IMM16) || (instForm == BeMCInstForm_RM64_IMM32)) &&
  11948. (inst->mArg0.mReg == X64Reg_RAX))
  11949. {
  11950. // Emit as ADD RAX, <imm32>
  11951. EmitREX(inst->mArg0, BeMCOperand(), true);
  11952. mOut.Write((uint8)0x05);
  11953. mOut.Write((int32)inst->mArg1.mImmediate);
  11954. break;
  11955. }
  11956. if (EmitStdXMMInst(instForm, inst, 0x58))
  11957. break;
  11958. EmitStdInst(instForm, inst, 0x01, 0x03, 0x81, 0x0, 0x83, 0x0);
  11959. }
  11960. }
  11961. break;
  11962. case BeMCInstKind_Sub:
  11963. {
  11964. if ((inst->mArg1.IsImmediateInt()) && (inst->mArg1.mImmediate == 1))
  11965. {
  11966. // Emit as DEC <arg0>
  11967. auto typeCode = GetType(inst->mArg0)->mTypeCode;
  11968. switch (typeCode)
  11969. {
  11970. case BeTypeCode_Int8:
  11971. EmitREX(BeMCOperand(), inst->mArg0, false);
  11972. Emit(0xFE); EmitModRM(1, inst->mArg0);
  11973. break;
  11974. case BeTypeCode_Int16: Emit(0x66); // Fallthrough
  11975. case BeTypeCode_Int32:
  11976. case BeTypeCode_Int64:
  11977. EmitREX(BeMCOperand(), inst->mArg0, typeCode == BeTypeCode_Int64);
  11978. Emit(0xFF); EmitModRM(1, inst->mArg0);
  11979. break;
  11980. default:
  11981. NotImpl();
  11982. }
  11983. }
  11984. else
  11985. {
  11986. if (((instForm == BeMCInstForm_RM64_IMM16) || (instForm == BeMCInstForm_RM64_IMM32)) &&
  11987. (inst->mArg0.mReg == X64Reg_RAX))
  11988. {
  11989. // Emit as SUB RAX, <imm32>
  11990. EmitREX(inst->mArg0, BeMCOperand(), true);
  11991. mOut.Write((uint8)0x2D);
  11992. mOut.Write((int32)inst->mArg1.mImmediate);
  11993. break;
  11994. }
  11995. if (EmitStdXMMInst(instForm, inst, 0x5C))
  11996. break;
  11997. EmitStdInst(instForm, inst, 0x29, 0x2B, 0x81, 0x5, 0x83, 0x5);
  11998. }
  11999. }
  12000. break;
  12001. case BeMCInstKind_IMul:
  12002. {
  12003. if (EmitStdXMMInst(instForm, inst, 0x59))
  12004. break;
  12005. BeMCOperand result = inst->mResult;
  12006. if ((!result) && (inst->mArg1.IsImmediate()))
  12007. result = inst->mArg0; // Do as 3-form anyway
  12008. if (result)
  12009. {
  12010. BF_ASSERT(inst->mArg1.IsImmediate());
  12011. if ((inst->mArg0.IsNativeReg()) &&
  12012. ((inst->mArg1.mImmediate == 2) || (inst->mArg1.mImmediate == 4) || (inst->mArg1.mImmediate == 8)))
  12013. {
  12014. // LEA form
  12015. auto resultType = GetType(inst->mArg0);
  12016. if (resultType->mTypeCode != BeTypeCode_Int8)
  12017. {
  12018. switch (resultType->mTypeCode)
  12019. {
  12020. case BeTypeCode_Int16:
  12021. Emit(0x66);
  12022. case BeTypeCode_Int32:
  12023. case BeTypeCode_Int64:
  12024. uint8 rex = GetREX(result, inst->mArg0, resultType->mTypeCode == BeTypeCode_Int64);
  12025. if (rex != 0)
  12026. {
  12027. if (rex & 1)
  12028. {
  12029. // Mov REX flag from RM to SiB
  12030. rex = (rex & ~1) | 2;
  12031. }
  12032. Emit(rex);
  12033. }
  12034. Emit(0x8D); EmitModRMRel(EncodeRegNum(result.mReg), X64Reg_None, inst->mArg0.mReg, (int)inst->mArg1.mImmediate, 0);
  12035. break;
  12036. }
  12037. break;
  12038. }
  12039. }
  12040. auto typeCode = GetType(inst->mArg0)->mTypeCode;
  12041. switch (typeCode)
  12042. {
  12043. case BeTypeCode_Int16:
  12044. Emit(0x66);
  12045. // Fall through
  12046. case BeTypeCode_Int32:
  12047. case BeTypeCode_Int64:
  12048. EmitREX(result, inst->mArg0, typeCode == BeTypeCode_Int64);
  12049. if ((inst->mArg1.mImmediate >= -0x80) && (inst->mArg1.mImmediate <= 0x7F))
  12050. {
  12051. Emit(0x6B);
  12052. EmitModRM(result, inst->mArg0, -1);
  12053. mOut.Write((int8)inst->mArg1.mImmediate);
  12054. }
  12055. else
  12056. {
  12057. Emit(0x69);
  12058. EmitModRM(result, inst->mArg0, (typeCode == BeTypeCode_Int16) ? -2 : -4);
  12059. if (typeCode == BeTypeCode_Int16)
  12060. mOut.Write((int16)inst->mArg1.mImmediate);
  12061. else
  12062. mOut.Write((int32)inst->mArg1.mImmediate);
  12063. }
  12064. break;
  12065. default:
  12066. NotImpl();
  12067. }
  12068. }
  12069. else
  12070. {
  12071. if (inst->mArg1.IsImmediate())
  12072. {
  12073. int64 multVal = inst->mArg1.mImmediate;
  12074. if (IsPowerOfTwo(multVal))
  12075. {
  12076. int shiftCount = 0;
  12077. while (multVal > 1)
  12078. {
  12079. shiftCount++;
  12080. multVal >>= 1;
  12081. }
  12082. auto arg0Type = GetType(inst->mArg0);
  12083. switch (arg0Type->mTypeCode)
  12084. {
  12085. case BeTypeCode_Int64:
  12086. EmitREX(inst->mArg0, BeMCOperand(), true);
  12087. // Fall through
  12088. case BeTypeCode_Int32:
  12089. Emit(0xC1); Emit((0x4 << 3) | (3 << 6) | (EncodeRegNum(inst->mArg0.mReg)));
  12090. Emit((uint8)shiftCount);
  12091. break;
  12092. default:
  12093. NotImpl();
  12094. }
  12095. break;
  12096. }
  12097. }
  12098. switch (instForm)
  12099. {
  12100. case BeMCInstForm_R8_RM8:
  12101. BF_ASSERT(inst->mArg0.mReg == X64Reg_AL);
  12102. Emit(0xF6);
  12103. EmitModRM(0x5, inst->mArg1);
  12104. break;
  12105. case BeMCInstForm_R16_RM16:
  12106. case BeMCInstForm_R32_RM32:
  12107. case BeMCInstForm_R64_RM64: EmitInst(instForm, 0xAF0F, inst); break;
  12108. default:
  12109. NotImpl();
  12110. }
  12111. }
  12112. }
  12113. break;
  12114. case BeMCInstKind_Div:
  12115. {
  12116. auto arg0Type = GetType(inst->mArg0);
  12117. switch (arg0Type->mTypeCode)
  12118. {
  12119. case BeTypeCode_Int8:
  12120. BF_ASSERT((inst->mArg0.IsNativeReg()) && (inst->mArg0.mReg == X64Reg_AL));
  12121. // XOR ah, ah
  12122. Emit(0x30); Emit(0xE4);
  12123. // IDIV rm
  12124. EmitREX(BeMCOperand::FromReg(X64Reg_AX), inst->mArg1, false);
  12125. Emit(0xF6); EmitModRM(0x6, inst->mArg1);
  12126. break;
  12127. case BeTypeCode_Int16:
  12128. BF_ASSERT((inst->mArg0.IsNativeReg()) && (inst->mArg0.mReg == X64Reg_AX));
  12129. // XOR eax, eax
  12130. Emit(0x31); Emit(0xC0);
  12131. // IDIV rm
  12132. Emit(0x66);
  12133. EmitREX(BeMCOperand::FromReg(X64Reg_AX), inst->mArg1, false);
  12134. Emit(0xF7); EmitModRM(0x6, inst->mArg1);
  12135. break;
  12136. case BeTypeCode_Int32:
  12137. BF_ASSERT((inst->mArg0.IsNativeReg()) && (inst->mArg0.mReg == X64Reg_EAX));
  12138. // XOR edx, edx
  12139. Emit(0x31); Emit(0xD2);
  12140. // IDIV rm
  12141. EmitREX(BeMCOperand::FromReg(X64Reg_EAX), inst->mArg1, false);
  12142. Emit(0xF7); EmitModRM(0x6, inst->mArg1);
  12143. break;
  12144. case BeTypeCode_Int64:
  12145. BF_ASSERT((inst->mArg0.IsNativeReg()) && (inst->mArg0.mReg == X64Reg_RAX));
  12146. // XOR rdx, rdx
  12147. Emit(0x48); Emit(0x31); Emit(0xD2);
  12148. EmitREX(BeMCOperand::FromReg(X64Reg_RAX), inst->mArg1, true);
  12149. // IDIV rm
  12150. EmitREX(BeMCOperand::FromReg(X64Reg_RAX), inst->mArg1, true);
  12151. Emit(0xF7); EmitModRM(0x6, inst->mArg1);
  12152. break;
  12153. }
  12154. }
  12155. break;
  12156. case BeMCInstKind_IDiv:
  12157. {
  12158. if (EmitStdXMMInst(instForm, inst, 0x5E))
  12159. break;
  12160. auto arg0Type = GetType(inst->mArg0);
  12161. switch (arg0Type->mTypeCode)
  12162. {
  12163. case BeTypeCode_Int8:
  12164. BF_ASSERT((inst->mArg0.IsNativeReg()) && (inst->mArg0.mReg == X64Reg_AL));
  12165. // CBW
  12166. Emit(0x66); Emit(0x98);
  12167. // IDIV rm
  12168. EmitREX(BeMCOperand::FromReg(X64Reg_AX), inst->mArg1, false);
  12169. Emit(0xF6); EmitModRM(0x7, inst->mArg1);
  12170. break;
  12171. case BeTypeCode_Int16:
  12172. BF_ASSERT((inst->mArg0.IsNativeReg()) && (inst->mArg0.mReg == X64Reg_AX));
  12173. // CWD
  12174. Emit(0x66); Emit(0x99);
  12175. // IDIV rm
  12176. Emit(0x66);
  12177. EmitREX(BeMCOperand::FromReg(X64Reg_AX), inst->mArg1, false);
  12178. Emit(0xF7); EmitModRM(0x7, inst->mArg1);
  12179. break;
  12180. case BeTypeCode_Int32:
  12181. BF_ASSERT((inst->mArg0.IsNativeReg()) && (inst->mArg0.mReg == X64Reg_EAX));
  12182. // CDQ
  12183. Emit(0x99);
  12184. // IDIV rm
  12185. EmitREX(BeMCOperand::FromReg(X64Reg_EAX), inst->mArg1, false);
  12186. Emit(0xF7); EmitModRM(0x7, inst->mArg1);
  12187. break;
  12188. case BeTypeCode_Int64:
  12189. BF_ASSERT((inst->mArg0.IsNativeReg()) && (inst->mArg0.mReg == X64Reg_RAX));
  12190. // CQO
  12191. Emit(0x48); Emit(0x99);
  12192. // IDIV rm
  12193. EmitREX(BeMCOperand::FromReg(X64Reg_RAX), inst->mArg1, true);
  12194. Emit(0xF7); EmitModRM(0x7, inst->mArg1);
  12195. break;
  12196. }
  12197. }
  12198. break;
  12199. case BeMCInstKind_IRem:
  12200. {
  12201. NotImpl();
  12202. //if (EmitStdXMMInst(instForm, inst, 0x5E))
  12203. //break;
  12204. }
  12205. break;
  12206. case BeMCInstKind_Cmp:
  12207. {
  12208. switch (instForm)
  12209. {
  12210. case BeMCInstForm_XMM32_FRM32:
  12211. case BeMCInstForm_XMM32_IMM:
  12212. // COMISS
  12213. EmitREX(inst->mArg0, inst->mArg1, false);
  12214. Emit(0x0F); Emit(0x2F);
  12215. EmitModRM(inst->mArg0, inst->mArg1);
  12216. break;
  12217. case BeMCInstForm_XMM64_FRM64:
  12218. case BeMCInstForm_XMM64_IMM:
  12219. // COMISD
  12220. Emit(0x66);
  12221. EmitREX(inst->mArg0, inst->mArg1, false);
  12222. Emit(0x0F); Emit(0x2F);
  12223. EmitModRM(inst->mArg0, inst->mArg1);
  12224. break;
  12225. default:
  12226. {
  12227. if (((inst->mArg0.IsNativeReg()) && (inst->mArg1.IsImmediateInt())) && (inst->mArg1.GetImmediateInt() == 0))
  12228. {
  12229. // Test
  12230. auto typeCode = GetType(inst->mArg0)->mTypeCode;
  12231. switch (typeCode)
  12232. {
  12233. case BeTypeCode_Int8:
  12234. EmitREX(inst->mArg0, inst->mArg0, false);
  12235. Emit(0x84);
  12236. EmitModRM(inst->mArg0, inst->mArg0);
  12237. break;
  12238. case BeTypeCode_Int16: Emit(0x66); // Fallthrough
  12239. case BeTypeCode_Int32:
  12240. case BeTypeCode_Int64:
  12241. EmitREX(inst->mArg0, inst->mArg0, typeCode == BeTypeCode_Int64);
  12242. Emit(0x85); EmitModRM(inst->mArg0, inst->mArg0);
  12243. break;
  12244. default:
  12245. NotImpl();
  12246. }
  12247. /*if (arg0Type->mSize == 2)
  12248. Emit(0x66);
  12249. // Emit as TEST <arg0>, <arg0>
  12250. EmitREX(inst->mArg0, inst->mArg0, GetType(inst->mArg0)->mSize == 8);
  12251. mOut.Write((uint8)0x85); // r/m64, r
  12252. EmitModRM(inst->mArg0, inst->mArg0);*/
  12253. }
  12254. else
  12255. {
  12256. EmitStdInst(instForm, inst, 0x39, 0x3B, 0x81, 0x7, 0x83, 0x7);
  12257. }
  12258. }
  12259. }
  12260. }
  12261. break;
  12262. case BeMCInstKind_And:
  12263. {
  12264. BeMCInst modInst = *inst;
  12265. bool isZeroing = false;
  12266. // Use a shorter form if the upper bytes are masked in
  12267. if ((instForm == BeMCInstForm_RM32_IMM32) || (instForm == BeMCInstForm_RM64_IMM32))
  12268. {
  12269. if ((modInst.mArg1.mImmediate & 0xFFFF0000) == 0xFFFF0000)
  12270. {
  12271. if (modInst.mArg0.IsNativeReg())
  12272. modInst.mArg0.mReg = ResizeRegister(modInst.mArg0.mReg, 2);
  12273. instForm = BeMCInstForm_RM16_IMM16;
  12274. if ((modInst.mArg1.mImmediate & 0xFFFF) == 0)
  12275. isZeroing = true;
  12276. }
  12277. else if (instForm == BeMCInstForm_RM32_IMM32)
  12278. {
  12279. if ((modInst.mArg1.mImmediate & 0xFFFFFFFF) == 0)
  12280. {
  12281. isZeroing = true;
  12282. }
  12283. }
  12284. }
  12285. if ((instForm == BeMCInstForm_RM16_IMM16) || (instForm == BeMCInstForm_RM32_IMM16) || (instForm == BeMCInstForm_RM64_IMM16))
  12286. {
  12287. if ((modInst.mArg1.mImmediate & 0xFFFFFF00) == 0xFFFFFF00)
  12288. {
  12289. if (modInst.mArg0.IsNativeReg())
  12290. modInst.mArg0.mReg = ResizeRegister(modInst.mArg0.mReg, 1);
  12291. instForm = BeMCInstForm_RM8_IMM8;
  12292. }
  12293. else if (instForm == BeMCInstForm_RM16_IMM16)
  12294. {
  12295. if ((modInst.mArg1.mImmediate & 0xFFFF) == 0)
  12296. {
  12297. isZeroing = true;
  12298. }
  12299. }
  12300. }
  12301. if (instForm == BeMCInstForm_RM8_IMM8)
  12302. {
  12303. // Are we really just zeroing out the lower byte?
  12304. if (((modInst.mArg1.mImmediate & 0xFF) == 0) && (modInst.mArg0.IsNativeReg()))
  12305. {
  12306. isZeroing = true;
  12307. }
  12308. }
  12309. if (isZeroing)
  12310. {
  12311. int size = 0;
  12312. switch (instForm)
  12313. {
  12314. case BeMCInstForm_RM32_IMM32:
  12315. instForm = BeMCInstForm_RM32_R32;
  12316. break;
  12317. case BeMCInstForm_RM16_IMM16:
  12318. instForm = BeMCInstForm_RM16_R16;
  12319. break;
  12320. case BeMCInstForm_RM8_IMM8:
  12321. instForm = BeMCInstForm_RM8_R8;
  12322. break;
  12323. default:
  12324. NotImpl();
  12325. }
  12326. //XOR arg0, arg0
  12327. modInst.mKind = BeMCInstKind_Xor;
  12328. modInst.mArg1 = modInst.mArg0;
  12329. EmitStdInst(instForm, &modInst, 0x31, 0x33, 0x81, 0x6, 0x83, 0x6);
  12330. break;
  12331. }
  12332. EmitStdInst(instForm, &modInst, 0x21, 0x23, 0x81, 0x4, 0x83, 0x4);
  12333. }
  12334. break;
  12335. case BeMCInstKind_Or:
  12336. {
  12337. EmitStdInst(instForm, inst, 0x09, 0x0B, 0x81, 0x1, 0x83, 0x1);
  12338. }
  12339. break;
  12340. case BeMCInstKind_Xor:
  12341. {
  12342. if (EmitPackedXMMInst(instForm, inst, 0x57))
  12343. break;
  12344. EmitStdInst(instForm, inst, 0x31, 0x33, 0x81, 0x6, 0x83, 0x6);
  12345. }
  12346. break;
  12347. case BeMCInstKind_Shl:
  12348. case BeMCInstKind_Shr:
  12349. case BeMCInstKind_Sar:
  12350. {
  12351. int rx = 0;
  12352. switch (inst->mKind)
  12353. {
  12354. case BeMCInstKind_Shl:
  12355. rx = 4;
  12356. break;
  12357. case BeMCInstKind_Shr:
  12358. rx = 5;
  12359. break;
  12360. case BeMCInstKind_Sar:
  12361. rx = 7;
  12362. break;
  12363. }
  12364. bool handled = false;
  12365. switch (instForm)
  12366. {
  12367. case BeMCInstForm_RM8_IMM8:
  12368. case BeMCInstForm_RM16_IMM8:
  12369. case BeMCInstForm_RM32_IMM8:
  12370. case BeMCInstForm_RM64_IMM8:
  12371. if (inst->mArg1.mImmediate == 1)
  12372. {
  12373. // Shift by one has a short form
  12374. if (instForm == BeMCInstForm_RM16_IMM8) Emit(0x66);
  12375. EmitREX(inst->mArg1, inst->mArg0, instForm == BeMCInstForm_RM64_IMM8);
  12376. if (instForm == BeMCInstForm_RM8_IMM8)
  12377. Emit(0xD0);
  12378. else
  12379. Emit(0xD1);
  12380. EmitModRM(rx, inst->mArg0);
  12381. handled = true;
  12382. }
  12383. else
  12384. {
  12385. if (instForm == BeMCInstForm_RM16_IMM8) Emit(0x66);
  12386. EmitREX(inst->mArg1, inst->mArg0, instForm == BeMCInstForm_RM64_IMM8);
  12387. if (instForm == BeMCInstForm_RM8_IMM8)
  12388. Emit(0xC0);
  12389. else
  12390. Emit(0xC1);
  12391. EmitModRM(rx, inst->mArg0);
  12392. Emit((uint8)inst->mArg1.mImmediate);
  12393. handled = true;
  12394. }
  12395. break;
  12396. default:
  12397. {
  12398. BF_ASSERT(inst->mArg1.IsNativeReg());
  12399. BF_ASSERT(inst->mArg1.mReg == X64Reg_RCX);
  12400. int destSize = GetType(inst->mArg0)->mSize;
  12401. if (destSize == 2) Emit(0x66);
  12402. EmitREX(BeMCOperand(), inst->mArg0, destSize == 8);
  12403. if (destSize == 1)
  12404. Emit(0xD2);
  12405. else
  12406. Emit(0xD3);
  12407. EmitModRM(rx, inst->mArg0);
  12408. handled = true;
  12409. }
  12410. break;
  12411. }
  12412. }
  12413. break;
  12414. case BeMCInstKind_Test:
  12415. {
  12416. if (instForm == BeMCInstForm_R64_RM64)
  12417. {
  12418. BF_SWAP(inst->mArg0, inst->mArg1);
  12419. instForm = BeMCInstForm_RM64_R64;
  12420. }
  12421. EmitStdInst(instForm, inst, 0x85, 0x00, 0xF7, 0x0);
  12422. }
  12423. break;
  12424. case BeMCInstKind_CondBr:
  12425. {
  12426. BF_ASSERT(inst->mArg0.mKind == BeMCOperandKind_Label);
  12427. BeMCJump jump;
  12428. jump.mCodeOffset = funcCodePos;
  12429. jump.mLabelIdx = inst->mArg0.mLabelIdx;
  12430. // Speculative make it a short jump
  12431. jump.mJumpKind = 0;
  12432. jump.mCmpKind = inst->mArg1.mCmpKind;
  12433. deferredJumps.push_back(jump);
  12434. mOut.Write(GetJumpOpCode(jump.mCmpKind, false));
  12435. mOut.Write((uint8)0);
  12436. }
  12437. break;
  12438. case BeMCInstKind_Br:
  12439. {
  12440. if (inst->mArg1.mKind == BeMCOperandKind_Immediate_i8)
  12441. {
  12442. if (inst->mArg1.mImmediate == 2) // Fake?
  12443. break;
  12444. }
  12445. if (inst->mArg0.mKind == BeMCOperandKind_Label)
  12446. {
  12447. BeMCJump jump;
  12448. jump.mCodeOffset = funcCodePos;
  12449. jump.mLabelIdx = inst->mArg0.mLabelIdx;
  12450. // Speculatively make it a short jump
  12451. jump.mJumpKind = 0;
  12452. jump.mCmpKind = BeCmpKind_None;
  12453. deferredJumps.push_back(jump);
  12454. mOut.Write((uint8)0xEB);
  12455. mOut.Write((uint8)0);
  12456. }
  12457. else
  12458. {
  12459. auto arg0Type = GetType(inst->mArg0);
  12460. BF_ASSERT(arg0Type->mTypeCode == BeTypeCode_Int64);
  12461. uint8 rex = GetREX(BeMCOperand(), inst->mArg0, true);
  12462. if (rex != 0x40)
  12463. Emit(rex);
  12464. Emit(0xFF);
  12465. EmitModRM(4, inst->mArg0);
  12466. }
  12467. }
  12468. break;
  12469. case BeMCInstKind_Ret:
  12470. mOut.Write((uint8)0xC3);
  12471. break;
  12472. case BeMCInstKind_Call:
  12473. {
  12474. switch (instForm)
  12475. {
  12476. case BeMCInstForm_Symbol:
  12477. {
  12478. // Call [rip+<X>]
  12479. mOut.Write((uint8)0xFF);
  12480. mOut.Write((uint8)0x15);
  12481. BeMCRelocation reloc;
  12482. reloc.mKind = BeMCRelocationKind_REL32;
  12483. reloc.mOffset = mOut.GetPos();
  12484. reloc.mSymTableIdx = inst->mArg0.mSymbolIdx;
  12485. mCOFFObject->mTextSect.mRelocs.push_back(reloc);
  12486. mTextRelocs.push_back((int)mCOFFObject->mTextSect.mRelocs.size() - 1);
  12487. mOut.Write((int32)0);
  12488. }
  12489. break;
  12490. case BeMCInstForm_SymbolAddr:
  12491. {
  12492. // Call <X>
  12493. mOut.Write((uint8)0xE8);
  12494. BeMCRelocation reloc;
  12495. reloc.mKind = BeMCRelocationKind_REL32;
  12496. reloc.mOffset = mOut.GetPos();
  12497. reloc.mSymTableIdx = inst->mArg0.mSymbolIdx;
  12498. mCOFFObject->mTextSect.mRelocs.push_back(reloc);
  12499. mTextRelocs.push_back((int)mCOFFObject->mTextSect.mRelocs.size() - 1);
  12500. mOut.Write((int32)0);
  12501. }
  12502. break;
  12503. default:
  12504. {
  12505. EmitREX(BeMCOperand(), inst->mArg0, true);
  12506. mOut.Write((uint8)0xFF);
  12507. EmitModRM(0x2, inst->mArg0);
  12508. }
  12509. break;
  12510. }
  12511. }
  12512. //mOut.Write((uint8)0xC3);
  12513. break;
  12514. default:
  12515. NotImpl();
  12516. }
  12517. }
  12518. }
  12519. if (mDebugging)
  12520. {
  12521. dbgStr += "\nEMISSIONS:\n";
  12522. }
  12523. // Finish range for all outstanding variables
  12524. for (int vregLiveIdx : *vregsLive)
  12525. {
  12526. if (vregLiveIdx >= mLivenessContext.mNumItems)
  12527. continue;
  12528. int vregIdx = vregLiveIdx % mLivenessContext.mNumItems;
  12529. auto dbgVar = mVRegInfo[vregIdx]->mDbgVariable;
  12530. if (dbgVar != NULL)
  12531. {
  12532. dbgVar->mDeclEnd = mOut.GetPos() - textSectStartPos;
  12533. dbgVar->mDeclLifetimeExtend = false;
  12534. BF_ASSERT(dbgVar->mDeclEnd >= dbgVar->mDeclStart);
  12535. if (!dbgVar->mSavedRanges.empty())
  12536. {
  12537. auto& savedRange = dbgVar->mSavedRanges.back();
  12538. if (savedRange.mLength == -1)
  12539. {
  12540. savedRange.mLength = dbgVar->mDeclEnd - savedRange.mOffset;
  12541. dbgVar->mGaps.push_back(savedRange);
  12542. }
  12543. }
  12544. }
  12545. }
  12546. auto& codeVec = mOut.mData;
  12547. for (int pass = 0; true; pass++)
  12548. {
  12549. bool didWidening = false;
  12550. for (auto& jump : deferredJumps)
  12551. {
  12552. int labelPos = labelPositions[jump.mLabelIdx];
  12553. int offsetRel = jump.mCodeOffset;
  12554. if (jump.mJumpKind == 0)
  12555. offsetRel += 2;
  12556. else if (jump.mJumpKind == 1)
  12557. offsetRel += 4;
  12558. else if (jump.mJumpKind == 2)
  12559. {
  12560. if (jump.mCmpKind == BeCmpKind_None)
  12561. offsetRel += 5;
  12562. else
  12563. offsetRel += 6;
  12564. }
  12565. int offset = labelPos - offsetRel;
  12566. //BF_ASSERT((offset >= -128) && (offset <= 127));
  12567. if ((jump.mJumpKind == 0) &&
  12568. ((offset < -0x80) || (offset > 0x7F)))
  12569. {
  12570. // Extend this guy into a rel32
  12571. int adjustFrom = jump.mCodeOffset + 2;
  12572. int adjustBytes = 3;
  12573. if (jump.mCmpKind != BeCmpKind_None)
  12574. adjustBytes++;
  12575. codeVec.Insert(jump.mCodeOffset + 1 + textSectStartPos, (uint8)0xCC, adjustBytes);
  12576. mOut.mPos += adjustBytes;
  12577. if (jump.mCmpKind == BeCmpKind_None)
  12578. {
  12579. codeVec[jump.mCodeOffset + textSectStartPos] = 0xE9;
  12580. }
  12581. else
  12582. {
  12583. codeVec[jump.mCodeOffset + textSectStartPos] = 0x0F;
  12584. codeVec[jump.mCodeOffset + 1 + textSectStartPos] = GetJumpOpCode(jump.mCmpKind, true);
  12585. }
  12586. #define CODE_OFFSET_ADJUST(val) if (val >= adjustFrom) val += adjustBytes
  12587. for (auto& labelPosition : labelPositions)
  12588. CODE_OFFSET_ADJUST(labelPosition);
  12589. for (auto& checkJump : deferredJumps)
  12590. CODE_OFFSET_ADJUST(checkJump.mCodeOffset);
  12591. if (mDbgFunction != NULL)
  12592. {
  12593. for (auto& codeEmission : mDbgFunction->mEmissions)
  12594. CODE_OFFSET_ADJUST(codeEmission.mPos);
  12595. for (auto dbgVar : mDbgFunction->mVariables)
  12596. {
  12597. if (dbgVar == NULL)
  12598. continue;
  12599. CODE_OFFSET_ADJUST(dbgVar->mDeclStart);
  12600. CODE_OFFSET_ADJUST(dbgVar->mDeclEnd);
  12601. for (auto& range : dbgVar->mSavedRanges)
  12602. CODE_OFFSET_ADJUST(range.mOffset);
  12603. for (auto& range : dbgVar->mGaps)
  12604. CODE_OFFSET_ADJUST(range.mOffset);
  12605. }
  12606. }
  12607. for (auto& deferredUnwind : deferredUnwinds)
  12608. CODE_OFFSET_ADJUST(deferredUnwind.mCodePos);
  12609. for (int textRelocIdx : mTextRelocs)
  12610. {
  12611. auto& reloc = mCOFFObject->mTextSect.mRelocs[textRelocIdx];
  12612. if (reloc.mOffset - textSectStartPos >= adjustFrom)
  12613. reloc.mOffset += adjustBytes;
  12614. }
  12615. for (auto& dbgInstPos : dbgInstPositions)
  12616. CODE_OFFSET_ADJUST(dbgInstPos.mPos);
  12617. #undef CODE_OFFSET_ADJUST
  12618. jump.mJumpKind = 2;
  12619. didWidening = true;
  12620. }
  12621. //TODO: Test extending into a long jump
  12622. if (jump.mJumpKind == 0)
  12623. codeVec[jump.mCodeOffset + 1 + textSectStartPos] = (uint8)offset;
  12624. else if (jump.mCmpKind == BeCmpKind_None)
  12625. *(int32*)(&codeVec[jump.mCodeOffset + 1 + textSectStartPos]) = (uint32)offset;
  12626. else
  12627. *(int32*)(&codeVec[jump.mCodeOffset + 2 + textSectStartPos]) = (uint32)offset;
  12628. }
  12629. if (!didWidening)
  12630. break;
  12631. }
  12632. if (!mSwitchEntries.empty())
  12633. {
  12634. auto thisFuncSym = mCOFFObject->GetSymbol(mBeFunction);
  12635. for (auto& switchEntry : mSwitchEntries)
  12636. {
  12637. auto& sect = mCOFFObject->mRDataSect;
  12638. int32* ofsPtr = (int32*)((uint8*)sect.mData.GetPtr() + switchEntry.mOfs);
  12639. *ofsPtr = labelPositions[switchEntry.mBlock->mLabelIdx];
  12640. BeMCRelocation reloc;
  12641. reloc.mKind = BeMCRelocationKind_ADDR32NB;
  12642. reloc.mOffset = switchEntry.mOfs;
  12643. reloc.mSymTableIdx = thisFuncSym->mIdx;
  12644. sect.mRelocs.push_back(reloc);
  12645. }
  12646. }
  12647. //for (auto& deferredUnwind : deferredUnwinds)
  12648. for (int deferredUnwindIdx = (int)deferredUnwinds.size() - 1; deferredUnwindIdx >= 0; deferredUnwindIdx--)
  12649. {
  12650. auto inst = deferredUnwinds[deferredUnwindIdx].mUnwindInst;
  12651. int codePos = deferredUnwinds[deferredUnwindIdx].mCodePos;
  12652. switch (inst->mKind)
  12653. {
  12654. case BeMCInstKind_Unwind_Alloc:
  12655. {
  12656. xdata.Write((uint8)(codePos));
  12657. int allocSize = (int)inst->mArg0.mImmediate;
  12658. if (allocSize <= 128)
  12659. {
  12660. // UWOP_ALLOC_SMALL
  12661. xdata.Write((uint8)((2) | ((allocSize / 8 - 1) << 4)));
  12662. }
  12663. else if ((allocSize <= 0x7FFF8) && ((allocSize & 7) == 0)) // up to 512k-8 bytes
  12664. {
  12665. // UWOP_ALLOC_LARGE
  12666. xdata.Write((uint8)((1) | ((0) << 4)));
  12667. xdata.Write((uint8)((allocSize / 8) & 0xFF));
  12668. xdata.Write((uint8)((allocSize / 8) >> 8));
  12669. }
  12670. else
  12671. {
  12672. // UWOP_ALLOC_LARGE+
  12673. xdata.Write((uint8)((1) | ((1) << 4)));
  12674. xdata.Write((int32)allocSize);
  12675. }
  12676. }
  12677. break;
  12678. case BeMCInstKind_Unwind_PushReg:
  12679. {
  12680. xdata.Write((uint8)(codePos));
  12681. int regNum = 0;
  12682. switch (inst->mArg0.mReg)
  12683. {
  12684. case X64Reg_RAX: regNum = 0; break;
  12685. case X64Reg_RCX: regNum = 1; break;
  12686. case X64Reg_RDX: regNum = 2; break;
  12687. case X64Reg_RBX: regNum = 3; break;
  12688. case X64Reg_RSP: regNum = 4; break;
  12689. case X64Reg_RBP: regNum = 5; break;
  12690. case X64Reg_RSI: regNum = 6; break;
  12691. case X64Reg_RDI: regNum = 7; break;
  12692. case X64Reg_R8: regNum = 8; break;
  12693. case X64Reg_R9: regNum = 9; break;
  12694. case X64Reg_R10: regNum = 10; break;
  12695. case X64Reg_R11: regNum = 11; break;
  12696. case X64Reg_R12: regNum = 12; break;
  12697. case X64Reg_R13: regNum = 13; break;
  12698. case X64Reg_R14: regNum = 14; break;
  12699. case X64Reg_R15: regNum = 15; break;
  12700. default: NotImpl();
  12701. }
  12702. // UWOP_PUSH_NONVOL
  12703. xdata.Write((uint8)((0) | (regNum << 4)));
  12704. }
  12705. break;
  12706. case BeMCInstKind_Unwind_SaveXMM:
  12707. {
  12708. xdata.Write((uint8)(codePos));
  12709. int regNum = 0;
  12710. switch (inst->mArg0.mReg)
  12711. {
  12712. case X64Reg_XMM0_f64: regNum = 0; break;
  12713. case X64Reg_XMM1_f64: regNum = 1; break;
  12714. case X64Reg_XMM2_f64: regNum = 2; break;
  12715. case X64Reg_XMM3_f64: regNum = 3; break;
  12716. case X64Reg_XMM4_f64: regNum = 4; break;
  12717. case X64Reg_XMM5_f64: regNum = 5; break;
  12718. case X64Reg_XMM6_f64: regNum = 6; break;
  12719. case X64Reg_XMM7_f64: regNum = 7; break;
  12720. case X64Reg_XMM8_f64: regNum = 8; break;
  12721. case X64Reg_XMM9_f64: regNum = 9; break;
  12722. case X64Reg_XMM10_f64: regNum = 10; break;
  12723. case X64Reg_XMM11_f64: regNum = 11; break;
  12724. case X64Reg_XMM12_f64: regNum = 12; break;
  12725. case X64Reg_XMM13_f64: regNum = 13; break;
  12726. case X64Reg_XMM14_f64: regNum = 14; break;
  12727. case X64Reg_XMM15_f64: regNum = 15; break;
  12728. default: NotImpl();
  12729. }
  12730. // UWOP_SAVE_XMM128
  12731. xdata.Write((uint8)((8) | (regNum << 4)));
  12732. xdata.Write((int16)(inst->mArg1.mImmediate / 16));
  12733. }
  12734. break;
  12735. case BeMCInstKind_Unwind_SetBP:
  12736. {
  12737. xdata.Write((uint8)(codePos));
  12738. // UWOP_SET_FPREG
  12739. xdata.Write((uint8)((3) | (0 << 4)));
  12740. }
  12741. break;
  12742. }
  12743. }
  12744. int codeLen = mOut.GetPos() - textSectStartPos;
  12745. int minCodeLen = hotJumpLen;
  12746. int addCodeLen = minCodeLen - codeLen;
  12747. for (int i = 0; i < addCodeLen; i++)
  12748. {
  12749. mOut.Write((uint8)0x90);
  12750. }
  12751. if (mDbgFunction != NULL)
  12752. {
  12753. mDbgFunction->mCodeLen = mOut.GetPos() - textSectStartPos;
  12754. }
  12755. if (hasPData)
  12756. {
  12757. int codeLen = mOut.GetPos() - textSectStartPos;
  12758. // PDATA end addr
  12759. BeMCRelocation reloc;
  12760. reloc.mKind = BeMCRelocationKind_ADDR32NB;
  12761. reloc.mOffset = mCOFFObject->mPDataSect.mData.GetPos();
  12762. reloc.mSymTableIdx = mCOFFObject->GetSymbol(mBeFunction)->mIdx;
  12763. mCOFFObject->mPDataSect.mRelocs.push_back(reloc);
  12764. mCOFFObject->mPDataSect.mData.Write((int32)codeLen);
  12765. // XDATA pos
  12766. reloc.mKind = BeMCRelocationKind_ADDR32NB;
  12767. reloc.mOffset = mCOFFObject->mPDataSect.mData.GetPos();
  12768. reloc.mSymTableIdx = mCOFFObject->mXDataSect.mSymbolIdx;
  12769. mCOFFObject->mPDataSect.mRelocs.push_back(reloc);
  12770. mCOFFObject->mPDataSect.mData.Write((int32)xdataStartPos);
  12771. int numCodes = (xdata.GetPos() - xdataStartPos - 4) / 2;
  12772. if (numCodes > 0)
  12773. {
  12774. xdata.mData[xdataStartPos + 1] = (uint8)(deferredUnwinds.back().mCodePos); // prolog size
  12775. xdata.mData[xdataStartPos + 2] = (uint8)numCodes;
  12776. }
  12777. }
  12778. for (auto& dbgInstPos : dbgInstPositions)
  12779. {
  12780. auto inst = dbgInstPos.mInst;
  12781. dbgStr += StrFormat("%d[%d]", dbgInstPos.mPos, dbgInstPos.mOrigPos);
  12782. if (inst->mDbgLoc != NULL)
  12783. dbgStr += StrFormat("@%d", inst->mDbgLoc->mIdx);
  12784. if (inst->mResult.mKind != BeMCOperandKind_None)
  12785. {
  12786. dbgStr += " ";
  12787. dbgStr += ToString(inst->mResult);
  12788. dbgStr += " = ";
  12789. }
  12790. dbgStr += " ";
  12791. dbgStr += gOpName[(int)inst->mKind];
  12792. if (inst->mArg0.mKind != BeMCOperandKind_None)
  12793. {
  12794. dbgStr += " ";
  12795. dbgStr += ToString(inst->mArg0);
  12796. }
  12797. if (inst->mArg1.mKind != BeMCOperandKind_None)
  12798. {
  12799. dbgStr += ", ";
  12800. dbgStr += ToString(inst->mArg1);
  12801. }
  12802. dbgStr += "\n";
  12803. }
  12804. if (mDebugging)
  12805. {
  12806. dbgStr += "\nDebug Variables:\n";
  12807. for (auto dbgVar : mDbgFunction->mVariables)
  12808. {
  12809. if (dbgVar == NULL)
  12810. continue;
  12811. dbgStr += StrFormat("%s %d to %d", dbgVar->mName.c_str(), dbgVar->mDeclStart, dbgVar->mDeclEnd);
  12812. if (dbgVar->mDeclLifetimeExtend)
  12813. dbgStr += " LifetimeExtend";
  12814. dbgStr += "\n";
  12815. for (auto& gap : dbgVar->mGaps)
  12816. {
  12817. if (gap.mLength == -1)
  12818. dbgStr += StrFormat(" Gap %d to <unterminated>\n", gap.mOffset);
  12819. else
  12820. dbgStr += StrFormat(" Gap %d to %d\n", gap.mOffset, gap.mOffset + gap.mLength);
  12821. }
  12822. for (auto& gap : dbgVar->mSavedRanges)
  12823. {
  12824. if (gap.mLength == -1)
  12825. dbgStr += StrFormat(" SavedRange %d to <unterminated>\n", gap.mOffset);
  12826. else
  12827. dbgStr += StrFormat(" SavedRange %d to %d\n", gap.mOffset, gap.mOffset + gap.mLength);
  12828. }
  12829. }
  12830. }
  12831. if (!dbgStr.empty())
  12832. {
  12833. dbgStr += "\n";
  12834. OutputDebugStr(dbgStr);
  12835. }
  12836. }
  12837. void BeMCContext::HandleParams()
  12838. {
  12839. auto beModule = mBeFunction->mModule;
  12840. int regIdxOfs = 0;
  12841. int paramOfs = 0;
  12842. auto retType = mBeFunction->GetFuncType()->mReturnType;
  12843. X64CPURegister compositeRetReg = X64Reg_None;
  12844. bool flipFirstRegs = false;
  12845. if (mBeFunction->HasStructRet())
  12846. {
  12847. flipFirstRegs = mBeFunction->mCallingConv == BfIRCallingConv_ThisCall;
  12848. //paramOfs = 1;
  12849. /*auto ptrType = (BePointerType*)mBeFunction->mFuncType->mParams[0].mType;
  12850. BF_ASSERT(ptrType->mTypeCode == BeTypeCode_Pointer);
  12851. retType = ptrType->mElementType;*/
  12852. //retType = mBeFunction->mFuncType->mParams[0].mType;
  12853. //flipFirstRegs = mBeFunction->mCallingConv == BfIRCallingConv_ThisCall;
  12854. /*
  12855. auto beArg = beModule->GetArgument(0);
  12856. compositeRetReg = (mBeFunction->mCallingConv == BfIRCallingConv_ThisCall) ? X64Reg_RDX : X64Reg_RCX;
  12857. mParamsUsedRegs.push_back(compositeRetReg);
  12858. BeMCOperand mcOperand;
  12859. mcOperand.mReg = compositeRetReg;
  12860. mcOperand.mKind = BeMCOperandKind_NativeReg;
  12861. auto ptrType = (BePointerType*)mBeFunction->mFuncType->mParams[0].mType;
  12862. BF_ASSERT(ptrType->mTypeCode == BeTypeCode_Pointer);
  12863. auto paramVReg = AllocVirtualReg(ptrType->mElementType);
  12864. auto paramVRegInfo = GetVRegInfo(paramVReg);
  12865. CreateDefineVReg(paramVReg);
  12866. paramVRegInfo->mNaturalReg = compositeRetReg;
  12867. AllocInst(BeMCInstKind_Mov, paramVReg, mcOperand);
  12868. mValueToOperand[beArg] = paramVReg;*/
  12869. }
  12870. else if (retType->IsComposite())
  12871. {
  12872. compositeRetReg = (mBeFunction->mCallingConv == BfIRCallingConv_ThisCall) ? X64Reg_RDX : X64Reg_RCX;
  12873. auto retVReg = AllocVirtualReg(mModule->mContext->GetPrimitiveType(BeTypeCode_Int64));
  12874. auto retVRegInfo = GetVRegInfo(retVReg);
  12875. retVRegInfo->mNaturalReg = compositeRetReg;
  12876. retVRegInfo->mForceReg = true;
  12877. retVRegInfo->mMustExist = true;
  12878. AllocInst(BeMCInstKind_Mov, retVReg, BeMCOperand::FromReg(compositeRetReg));
  12879. mCompositeRetVRegIdx = retVReg.mVRegIdx;
  12880. mParamsUsedRegs.push_back(compositeRetReg);
  12881. }
  12882. for (int paramIdx = 0; paramIdx < (int)mBeFunction->mParams.size() - paramOfs; paramIdx++)
  12883. {
  12884. if (((paramIdx == 0) && (compositeRetReg == X64Reg_RCX)) ||
  12885. ((paramIdx == 1) && (compositeRetReg == X64Reg_RDX)))
  12886. regIdxOfs = 1;
  12887. auto funcType = mBeFunction->GetFuncType();
  12888. auto& typeParam = funcType->mParams[paramIdx + paramOfs];
  12889. auto& param = mBeFunction->mParams[paramIdx + paramOfs];
  12890. auto beArg = beModule->GetArgument(paramIdx + paramOfs);
  12891. BeMCOperand mcOperand;
  12892. mcOperand.mReg = X64Reg_None;
  12893. mcOperand.mKind = BeMCOperandKind_NativeReg;
  12894. int regIdx = paramIdx + regIdxOfs;
  12895. if (typeParam.mType->IsFloat())
  12896. {
  12897. switch (regIdx)
  12898. {
  12899. case 0:
  12900. mcOperand.mReg = X64Reg_XMM0_f64;
  12901. break;
  12902. case 1:
  12903. mcOperand.mReg = X64Reg_XMM1_f64;
  12904. break;
  12905. case 2:
  12906. mcOperand.mReg = X64Reg_XMM2_f64;
  12907. break;
  12908. case 3:
  12909. mcOperand.mReg = X64Reg_XMM3_f64;
  12910. break;
  12911. }
  12912. }
  12913. else
  12914. {
  12915. switch (regIdx)
  12916. {
  12917. case 0:
  12918. mcOperand.mReg = !flipFirstRegs ? X64Reg_RCX : X64Reg_RDX;
  12919. break;
  12920. case 1:
  12921. mcOperand.mReg = !flipFirstRegs ? X64Reg_RDX : X64Reg_RCX;
  12922. break;
  12923. case 2:
  12924. mcOperand.mReg = X64Reg_R8;
  12925. break;
  12926. case 3:
  12927. mcOperand.mReg = X64Reg_R9;
  12928. break;
  12929. }
  12930. }
  12931. if (mcOperand.mReg != X64Reg_None)
  12932. {
  12933. mParamsUsedRegs.push_back(mcOperand.mReg);
  12934. mcOperand.mReg = ResizeRegister(mcOperand.mReg, typeParam.mType->mSize);
  12935. }
  12936. BeMCOperand paramVReg;
  12937. /*if ((paramIdx == 0) && (mBeFunction->mStructRet))
  12938. {
  12939. auto ptrType = (BePointerType*)typeParam.mType;
  12940. BF_ASSERT(ptrType->mTypeCode == BeTypeCode_Pointer);
  12941. paramVReg = AllocVirtualReg(ptrType->mElementType);
  12942. paramVReg.mKind = BeMCOperandKind_VRegAddr;
  12943. //paramVReg.mR
  12944. }
  12945. else*/
  12946. paramVReg = AllocVirtualReg(typeParam.mType);
  12947. auto paramVRegInfo = GetVRegInfo(paramVReg);
  12948. if ((mBeFunction->HasStructRet()) && (paramIdx == 0))
  12949. {
  12950. paramVRegInfo->SetRetVal();
  12951. }
  12952. else
  12953. paramVRegInfo->mForceMerge = true;
  12954. CreateDefineVReg(paramVReg);
  12955. if (mcOperand.mReg != X64Reg_None)
  12956. {
  12957. // This indirection allows us to NOT directly use a register for a parameter
  12958. // if the cost of saving/restoring this volatile reg is too great
  12959. paramVRegInfo->mNaturalReg = mcOperand.mReg;
  12960. AllocInst(BeMCInstKind_Mov, paramVReg, mcOperand);
  12961. }
  12962. else
  12963. {
  12964. paramVRegInfo->mMustExist = true;
  12965. paramVRegInfo->mForceMem = true;
  12966. paramVRegInfo->mFrameOffset = paramIdx * 8 + 8;
  12967. CreateDefineVReg(paramVReg);
  12968. }
  12969. //paramVRegInfo->mDbgVariable = mDbgFunction->mParams[paramIdx];
  12970. mValueToOperand[beArg] = paramVReg;
  12971. }
  12972. }
  12973. void BeMCContext::ToString(BeMCInst* inst, String& str, bool showVRegFlags, bool showVRegDetails)
  12974. {
  12975. if (inst->mKind == BeMCInstKind_Label)
  12976. {
  12977. str += ToString(inst->mArg0);
  12978. str += ":";
  12979. }
  12980. else
  12981. {
  12982. str += " ";
  12983. if (inst->mResult)
  12984. {
  12985. str += ToString(inst->mResult);
  12986. str += " = ";
  12987. }
  12988. str += gOpName[(int)inst->mKind];
  12989. if (inst->mKind == BeMCInstKind_DbgDecl)
  12990. {
  12991. auto vregInfo = GetVRegInfo(inst->mArg0);
  12992. if ((vregInfo != NULL) && (vregInfo->mDbgVariable != NULL))
  12993. {
  12994. if (vregInfo->mDbgVariable->mIsValue)
  12995. str += " <value>";
  12996. else
  12997. str += " <addr>";
  12998. }
  12999. }
  13000. if (inst->mKind == BeMCInstKind_DefPhi)
  13001. {
  13002. str += " ";
  13003. str += ToString(inst->mArg0);
  13004. for (auto& val : inst->mArg0.mPhi->mValues)
  13005. {
  13006. str += ", [";
  13007. str += ToString(BeMCOperand::FromBlock(val.mBlockFrom));
  13008. str += ", ";
  13009. str += ToString(val.mValue);
  13010. str += "]";
  13011. }
  13012. }
  13013. else if (inst->mKind == BeMCInstKind_Load)
  13014. {
  13015. str += " ";
  13016. str += ToString(inst->mArg0);
  13017. str += ", [";
  13018. str += ToString(inst->mArg1);
  13019. str += "]";
  13020. }
  13021. else if (inst->mKind == BeMCInstKind_Store)
  13022. {
  13023. str += " [";
  13024. str += ToString(inst->mArg0);
  13025. str += "], ";
  13026. str += ToString(inst->mArg1);
  13027. }
  13028. else if (inst->mArg0.mKind != BeMCOperandKind_None)
  13029. {
  13030. str += " ";
  13031. str += ToString(inst->mArg0);
  13032. if (inst->mArg1.mKind != BeMCOperandKind_None)
  13033. {
  13034. str += ", ";
  13035. str += ToString(inst->mArg1);
  13036. }
  13037. }
  13038. }
  13039. if (inst->IsDef())
  13040. {
  13041. auto vregInfo = mVRegInfo[inst->mArg0.mVRegIdx];
  13042. if (vregInfo->mRefCount != -1)
  13043. str += StrFormat(" : %d refs", vregInfo->mRefCount);
  13044. }
  13045. /*if (inst->mKind == BeMCInstKind_Def)
  13046. {
  13047. str += " ";
  13048. str += mModule->ToString(GetType(inst->mArg0));
  13049. }*/
  13050. bool hadSemi = false;
  13051. if (inst->mDbgLoc != NULL)
  13052. {
  13053. str += StrFormat(" ; @%d[%d:%d]", inst->mDbgLoc->mIdx, inst->mDbgLoc->mLine + 1, inst->mDbgLoc->mColumn + 1);
  13054. hadSemi = true;
  13055. }
  13056. bool showLiveness = showVRegFlags;
  13057. if ((showLiveness) && (inst->mLiveness != NULL))
  13058. {
  13059. if (!hadSemi)
  13060. {
  13061. str += " ;";
  13062. hadSemi = true;
  13063. }
  13064. bool isFirstInScope = true;
  13065. str += " live: ";
  13066. int vregIdx = -1;
  13067. for (int nextVRegIdx : *inst->mLiveness)
  13068. {
  13069. if (nextVRegIdx >= mLivenessContext.mNumItems)
  13070. {
  13071. vregIdx = nextVRegIdx;
  13072. int showVRegIdx = vregIdx - mLivenessContext.mNumItems;
  13073. if (!mLivenessContext.IsSet(inst->mLiveness, showVRegIdx))
  13074. str += StrFormat(", %d*", showVRegIdx);
  13075. continue;
  13076. }
  13077. if (vregIdx != -1)
  13078. str += ", ";
  13079. vregIdx = nextVRegIdx;
  13080. str += StrFormat("%d", vregIdx);
  13081. if (showVRegDetails)
  13082. {
  13083. auto vregInfo = mVRegInfo[vregIdx];
  13084. if (vregInfo->mForceReg)
  13085. str += "r";
  13086. if (vregInfo->mForceMem)
  13087. str += "m";
  13088. if (vregInfo->mSpilled)
  13089. str += "s";
  13090. }
  13091. }
  13092. if (inst->mLiveness->mNumChanges > 0)
  13093. {
  13094. str += " | ";
  13095. for (int changeIdx = 0; changeIdx < inst->mLiveness->mNumChanges; changeIdx++)
  13096. {
  13097. if (changeIdx != 0)
  13098. str += ", ";
  13099. int vregIdx = inst->mLiveness->GetChange(changeIdx);
  13100. if (vregIdx >= 0)
  13101. str += StrFormat("+%d", vregIdx);
  13102. else
  13103. str += StrFormat("-%d", -vregIdx - 1);
  13104. }
  13105. }
  13106. }
  13107. bool showInitialized = showVRegFlags;
  13108. if ((showInitialized) && (inst->mVRegsInitialized != NULL))
  13109. {
  13110. if (!hadSemi)
  13111. {
  13112. str += " ;";
  13113. hadSemi = true;
  13114. }
  13115. bool isFirstUninit = true;
  13116. str += " init: ";
  13117. int vregIdx = -1;
  13118. for (int nextVRegIdx : *inst->mVRegsInitialized)
  13119. {
  13120. if (nextVRegIdx >= mVRegInitializedContext.mNumItems)
  13121. {
  13122. if (isFirstUninit)
  13123. str += " uninit: ";
  13124. else
  13125. str += ", ";
  13126. isFirstUninit = false;
  13127. vregIdx = nextVRegIdx;
  13128. str += StrFormat("%d", vregIdx - mVRegInitializedContext.mNumItems);
  13129. }
  13130. else
  13131. {
  13132. if (vregIdx != -1)
  13133. str += ", ";
  13134. vregIdx = nextVRegIdx;
  13135. str += StrFormat("%d", vregIdx);
  13136. auto vregInfo = mVRegInfo[vregIdx];
  13137. if (vregInfo->mValueScopeRetainedKind == BeMCValueScopeRetainKind_Soft)
  13138. str += "r";
  13139. else if (vregInfo->mValueScopeRetainedKind == BeMCValueScopeRetainKind_Hard)
  13140. str += "rh";
  13141. }
  13142. }
  13143. if (inst->mVRegsInitialized->mNumChanges > 0)
  13144. {
  13145. str += " | ";
  13146. for (int changeIdx = 0; changeIdx < inst->mVRegsInitialized->mNumChanges; changeIdx++)
  13147. {
  13148. if (changeIdx != 0)
  13149. str += ", ";
  13150. int vregIdx = inst->mVRegsInitialized->GetChange(changeIdx);
  13151. if (vregIdx >= 0)
  13152. str += StrFormat("+%d", vregIdx);
  13153. else
  13154. str += StrFormat("-%d", -vregIdx - 1);
  13155. }
  13156. }
  13157. }
  13158. str += "\n";
  13159. }
  13160. String BeMCContext::ToString(bool showVRegFlags, bool showVRegDetails)
  13161. {
  13162. String str;
  13163. str += mBeFunction->mName;
  13164. str += "\n";
  13165. str += StrFormat("Stack Size: 0x%X\n", mStackSize);
  13166. str += "Frame Objects:\n";
  13167. for (int vregIdx = 0; vregIdx < (int)mVRegInfo.size(); vregIdx++)
  13168. {
  13169. int showVRegIdx = vregIdx;
  13170. auto vregInfo = mVRegInfo[showVRegIdx];
  13171. if ((vregInfo->mIsRetVal) && (mCompositeRetVRegIdx != -1))
  13172. {
  13173. showVRegIdx = mCompositeRetVRegIdx;
  13174. vregInfo = mVRegInfo[showVRegIdx];
  13175. }
  13176. if (vregInfo->mFrameOffset != INT_MIN)
  13177. {
  13178. str += " ";
  13179. str += ToString(BeMCOperand::FromVReg(vregIdx));
  13180. str += StrFormat(": size=%d, align=%d, at ", vregInfo->mType->mSize, vregInfo->mAlign);
  13181. X64CPURegister reg;
  13182. int offset;
  13183. GetValAddr(BeMCOperand::FromVRegAddr(showVRegIdx), reg, offset);
  13184. str += "[";
  13185. str += X64CPURegisters::GetRegisterName(reg);
  13186. if (offset != 0)
  13187. str += StrFormat(" + 0x%X", offset);
  13188. str += "]";
  13189. str += "\n";
  13190. }
  13191. }
  13192. str += "\n";
  13193. for (int blockIdx = 0; blockIdx < (int)mBlocks.size(); blockIdx++)
  13194. {
  13195. auto mcBlock = mBlocks[blockIdx];
  13196. if (blockIdx > 0)
  13197. str += "\n";
  13198. if (mBlocks.size() > 1)
  13199. {
  13200. str += mcBlock->mName;
  13201. str += ":";
  13202. if (mcBlock->mIsLooped)
  13203. str += " ; looped";
  13204. str += " ; preds = ";
  13205. for (int predIdx = 0; predIdx < (int)mcBlock->mPreds.size(); predIdx++)
  13206. {
  13207. if (predIdx != 0)
  13208. str += ", ";
  13209. str += "%";
  13210. str += mcBlock->mPreds[predIdx]->mName;
  13211. }
  13212. ///
  13213. str += " ; succs = ";
  13214. for (int succIdx = 0; succIdx < (int)mcBlock->mSuccs.size(); succIdx++)
  13215. {
  13216. if (succIdx != 0)
  13217. str += ", ";
  13218. str += "%";
  13219. str += mcBlock->mSuccs[succIdx]->mName;
  13220. }
  13221. //
  13222. str += "\n";
  13223. }
  13224. for (auto inst : mcBlock->mInstructions)
  13225. ToString(inst, str, showVRegFlags, showVRegDetails);
  13226. }
  13227. str += "\n";
  13228. return str;
  13229. }
  13230. void BeMCContext::Print()
  13231. {
  13232. OutputDebugStr(ToString(true, false));
  13233. }
  13234. void BeMCContext::Print(bool showVRegFlags, bool showVRegDetails)
  13235. {
  13236. OutputDebugStr(ToString(showVRegFlags, showVRegDetails));
  13237. }
  13238. BeMCOperand BeMCContext::AllocBinaryOp(BeMCInstKind instKind, const BeMCOperand& lhs, const BeMCOperand& rhs, BeMCBinIdentityKind identityKind)
  13239. {
  13240. if ((lhs.IsImmediate()) && (lhs.mKind == rhs.mKind))
  13241. {
  13242. if (instKind == BeMCInstKind_Add)
  13243. {
  13244. BeMCOperand result;
  13245. result.mKind = lhs.mKind;
  13246. switch (lhs.mKind)
  13247. {
  13248. case BeMCOperandKind_Immediate_i32:
  13249. result.mImmediate = lhs.mImmediate + rhs.mImmediate;
  13250. return result;
  13251. }
  13252. }
  13253. }
  13254. if (identityKind == BeMCBinIdentityKind_Any_IsOne)
  13255. {
  13256. if (((lhs.IsImmediateFloat()) && (lhs.mImmFloat == 1.0)) ||
  13257. ((lhs.IsImmediateInt()) && (lhs.mImmediate == 1)))
  13258. return rhs;
  13259. }
  13260. if (identityKind == BeMCBinIdentityKind_Right_IsOne_Result_Zero)
  13261. {
  13262. if (((rhs.IsImmediateFloat()) && (rhs.mImmFloat == 1.0)) ||
  13263. ((rhs.IsImmediateInt()) && (rhs.mImmediate == 1)))
  13264. {
  13265. BeMCOperand operand = rhs;
  13266. operand.mImmediate = 0;
  13267. return operand;
  13268. }
  13269. }
  13270. if ((identityKind == BeMCBinIdentityKind_Right_IsOne) || (identityKind == BeMCBinIdentityKind_Any_IsOne))
  13271. {
  13272. if (((rhs.IsImmediateFloat()) && (rhs.mImmFloat == 1.0)) ||
  13273. ((rhs.IsImmediateInt()) && (rhs.mImmediate == 1)))
  13274. return lhs;
  13275. }
  13276. if ((identityKind == BeMCBinIdentityKind_Right_IsZero) || (identityKind == BeMCBinIdentityKind_Any_IsZero))
  13277. {
  13278. if (((rhs.IsImmediateFloat()) && (rhs.mImmFloat == 0.0)) ||
  13279. ((rhs.IsImmediateInt()) && (rhs.mImmediate == 0)))
  13280. return lhs;
  13281. }
  13282. if (identityKind == BeMCBinIdentityKind_Any_IsZero)
  13283. {
  13284. if (((lhs.IsImmediateFloat()) && (lhs.mImmFloat == 0.0)) ||
  13285. ((lhs.IsImmediateInt()) && (lhs.mImmediate == 0)))
  13286. return rhs;
  13287. }
  13288. auto result = AllocVirtualReg(GetType(lhs));
  13289. AllocInst(BeMCInstKind_Def, result);
  13290. auto mcInst = AllocInst(instKind, lhs, rhs);
  13291. mcInst->mResult = result;
  13292. return result;
  13293. }
  13294. void BeMCContext::Generate(BeFunction* function)
  13295. {
  13296. BP_ZONE_F("BeMCContext::Generate %s", function->mName.c_str());
  13297. mBeFunction = function;
  13298. mDbgFunction = mBeFunction->mDbgFunction;
  13299. mModule = function->mModule;
  13300. //mDbgPreferredRegs[15] = X64Reg_RCX;
  13301. //mDbgPreferredRegs[7] = X64Reg_RCX;
  13302. /*mDbgPreferredRegs[14] = X64Reg_RAX;
  13303. mDbgPreferredRegs[15] = X64Reg_None;
  13304. mDbgPreferredRegs[19] = X64Reg_None;
  13305. mDbgPreferredRegs[31] = X64Reg_R8;
  13306. mDbgPreferredRegs[32] = X64Reg_R8;*/
  13307. //mDbgPreferredRegs[8] = X64Reg_RAX;
  13308. mDebugging = function->mName ==
  13309. //"?TestPrimitives@Nullable@Tests@bf@@SAXXZ"
  13310. "?TestAlloc@Blurg@bf@@SAXXZ";
  13311. //"?Main@Program@bf@@CAHPEAV?$Array1@PEAVString@System@bf@@@System@2@@Z";
  13312. //"?Hey@Blurg@bf@@SAXXZ";
  13313. //"?get__Value@?$Nullable@ULineAndColumn@EditWidgetContent@widgets@Beefy@bf@@@System@bf@@QEAAULineAndColumn@EditWidgetContent@widgets@Beefy@3@XZ";
  13314. //"?__BfCtor@StructA@bf@@QEAAXXZ";
  13315. if (mDebugging)
  13316. {
  13317. mModule->Print(mBeFunction);
  13318. }
  13319. for (auto beBlock : function->mBlocks)
  13320. {
  13321. int blockIdx = (int)mMCBlockAlloc.size();
  13322. auto mcBlock = mMCBlockAlloc.Alloc();
  13323. mcBlock->mName = beBlock->mName + StrFormat(":%d", blockIdx);
  13324. mcBlock->mBlockIdx = blockIdx;
  13325. mcBlock->mMaxDeclBlockId = blockIdx;
  13326. BeMCOperand mcOperand;
  13327. mcOperand.mKind = BeMCOperandKind_Block;
  13328. mcOperand.mBlock = mcBlock;
  13329. mValueToOperand[beBlock] = mcOperand;
  13330. mBlocks.push_back(mcBlock);
  13331. }
  13332. SizedArray<int, 64> dbgVarsAwaitingEnd;
  13333. BeMDNode* curDbgScope = NULL;
  13334. bool inHeadAlloca = true;
  13335. SizedArray<int, 64> stackSaveVRegs;
  13336. // Scan pass
  13337. mMaxCallParamCount = 4;
  13338. for (int blockIdx = 0; blockIdx < (int)function->mBlocks.size(); blockIdx++)
  13339. {
  13340. auto beBlock = function->mBlocks[blockIdx];
  13341. auto mcBlock = mBlocks[blockIdx];
  13342. for (int instIdx = 0; instIdx < (int)beBlock->mInstructions.size(); instIdx++)
  13343. {
  13344. auto inst = beBlock->mInstructions[instIdx];
  13345. int instType = inst->GetTypeId();
  13346. switch (instType)
  13347. {
  13348. case BeAllocaInst::TypeId:
  13349. {
  13350. auto castedInst = (BeAllocaInst*)inst;
  13351. if ((!inHeadAlloca) || (castedInst->mAlign > 16))
  13352. mUseBP = true;
  13353. }
  13354. break;
  13355. case BeNumericCastInst::TypeId:
  13356. case BeBitCastInst::TypeId:
  13357. break;
  13358. case BeStackSaveInst::TypeId:
  13359. {
  13360. auto stackVReg = AllocVirtualReg(mNativeIntType);
  13361. stackSaveVRegs.push_back(stackVReg.mVRegIdx);
  13362. }
  13363. break;
  13364. case BeCallInst::TypeId:
  13365. {
  13366. auto castedInst = (BeCallInst*)inst;
  13367. mMaxCallParamCount = BF_MAX(mMaxCallParamCount, (int)castedInst->mArgs.size());
  13368. }
  13369. break;
  13370. default:
  13371. inHeadAlloca = false;
  13372. break;
  13373. }
  13374. }
  13375. }
  13376. int retCount = 0;
  13377. bool isFirstBlock = true;
  13378. inHeadAlloca = true;
  13379. SizedArray<int, 64> valueScopeStack;
  13380. // Generate pass
  13381. for (int blockIdx = 0; blockIdx < (int)function->mBlocks.size(); blockIdx++)
  13382. {
  13383. auto beBlock = function->mBlocks[blockIdx];
  13384. auto mcBlock = mBlocks[blockIdx];
  13385. mActiveBeBlock = beBlock;
  13386. mActiveBlock = mcBlock;
  13387. if (isFirstBlock)
  13388. HandleParams();
  13389. for (int instIdx = 0; instIdx < (int)beBlock->mInstructions.size(); instIdx++)
  13390. {
  13391. auto inst = beBlock->mInstructions[instIdx];
  13392. BeMCOperand result;
  13393. mCurDbgLoc = inst->mDbgLoc;
  13394. int instType = inst->GetTypeId();
  13395. switch (instType)
  13396. {
  13397. case BeAllocaInst::TypeId:
  13398. case BeNumericCastInst::TypeId:
  13399. case BeBitCastInst::TypeId:
  13400. break;
  13401. default:
  13402. inHeadAlloca = false;
  13403. break;
  13404. }
  13405. switch (instType)
  13406. {
  13407. case BeNopInst::TypeId:
  13408. {
  13409. auto mcInst = AllocInst();
  13410. mcInst->mKind = BeMCInstKind_Nop;
  13411. }
  13412. break;
  13413. case BeUnreachableInst::TypeId:
  13414. {
  13415. auto mcInst = AllocInst();
  13416. mcInst->mKind = BeMCInstKind_Unreachable;
  13417. }
  13418. break;
  13419. case BeEnsureInstructionAtInst::TypeId:
  13420. {
  13421. auto mcInst = AllocInst();
  13422. mcInst->mKind = BeMCInstKind_EnsureInstructionAt;
  13423. }
  13424. break;
  13425. case BeUndefValueInst::TypeId:
  13426. {
  13427. auto castedInst = (BeUndefValueInst*)inst;
  13428. result = AllocVirtualReg(castedInst->mType);
  13429. CreateDefineVReg(result);
  13430. }
  13431. break;
  13432. case BeExtractValueInst::TypeId:
  13433. {
  13434. auto castedInst = (BeExtractValueInst*)inst;
  13435. BeConstant* constant = BeValueDynCast<BeConstant>(castedInst->mAggVal);
  13436. BeMCOperand mcAgg;
  13437. if (constant == NULL)
  13438. {
  13439. mcAgg = GetOperand(castedInst->mAggVal);
  13440. if (mcAgg.mKind == BeMCOperandKind_ConstAgg)
  13441. {
  13442. constant = mcAgg.mConstant;
  13443. }
  13444. }
  13445. if (constant != NULL)
  13446. {
  13447. result.mImmediate = 0;
  13448. BeType* wantDefaultType = NULL;
  13449. if (constant->mType->IsStruct())
  13450. {
  13451. BeStructType* structType = (BeStructType*)constant->mType;
  13452. auto& member = structType->mMembers[castedInst->mIdx];
  13453. wantDefaultType = member.mType;
  13454. }
  13455. else if (constant->mType->IsSizedArray())
  13456. {
  13457. BeSizedArrayType* arrayType = (BeSizedArrayType*)constant->mType;
  13458. wantDefaultType = arrayType->mElementType;
  13459. }
  13460. if (wantDefaultType != NULL)
  13461. {
  13462. switch (wantDefaultType->mTypeCode)
  13463. {
  13464. case BeTypeCode_Boolean:
  13465. case BeTypeCode_Int8:
  13466. result.mKind = BeMCOperandKind_Immediate_i8;
  13467. break;
  13468. case BeTypeCode_Int16:
  13469. result.mKind = BeMCOperandKind_Immediate_i16;
  13470. break;
  13471. case BeTypeCode_Int32:
  13472. result.mKind = BeMCOperandKind_Immediate_i32;
  13473. break;
  13474. case BeTypeCode_Int64:
  13475. result.mKind = BeMCOperandKind_Immediate_i64;
  13476. break;
  13477. case BeTypeCode_Float:
  13478. result.mKind = BeMCOperandKind_Immediate_f32;
  13479. break;
  13480. case BeTypeCode_Double:
  13481. result.mKind = BeMCOperandKind_Immediate_f64;
  13482. break;
  13483. case BeTypeCode_Pointer:
  13484. result.mKind = BeMCOperandKind_Immediate_Null;
  13485. result.mType = wantDefaultType;
  13486. break;
  13487. case BeTypeCode_Struct:
  13488. case BeTypeCode_SizedArray:
  13489. {
  13490. auto subConst = mAlloc.Alloc<BeConstant>();
  13491. subConst->mType = wantDefaultType;
  13492. result.mConstant = subConst;
  13493. result.mKind = BeMCOperandKind_ConstAgg;
  13494. }
  13495. break;
  13496. default:
  13497. NotImpl();
  13498. }
  13499. }
  13500. break;
  13501. }
  13502. auto aggType = GetType(mcAgg);
  13503. BF_ASSERT(aggType->IsStruct());
  13504. BeStructType* structType = (BeStructType*)aggType;
  13505. auto& structMember = structType->mMembers[castedInst->mIdx];
  13506. if (mcAgg.mKind == BeMCOperandKind_VReg)
  13507. mcAgg.mKind = BeMCOperandKind_VRegAddr;
  13508. else if (mcAgg.mKind == BeMCOperandKind_VRegLoad)
  13509. mcAgg.mKind = BeMCOperandKind_VReg;
  13510. else
  13511. NotImpl();
  13512. auto memberPtrType = mModule->mContext->GetPointerTo(structMember.mType);
  13513. result = AllocRelativeVirtualReg(memberPtrType, mcAgg, BeMCOperand::FromImmediate(structMember.mByteOffset), 1);
  13514. result.mKind = BeMCOperandKind_VRegLoad;
  13515. CreateDefineVReg(result);
  13516. }
  13517. break;
  13518. case BeInsertValueInst::TypeId:
  13519. {
  13520. auto castedInst = (BeInsertValueInst*)inst;
  13521. auto mcAgg = GetOperand(castedInst->mAggVal);
  13522. auto mcValue = GetOperand(castedInst->mMemberVal);
  13523. auto aggType = GetType(mcAgg);
  13524. BF_ASSERT(aggType->IsStruct());
  13525. BeStructType* structType = (BeStructType*)aggType;
  13526. auto& structMember = structType->mMembers[castedInst->mIdx];
  13527. BF_ASSERT(mcAgg.mKind = BeMCOperandKind_VReg);
  13528. auto mcAggRef = mcAgg;
  13529. mcAggRef.mKind = BeMCOperandKind_VRegAddr;
  13530. auto memberPtrType = mModule->mContext->GetPointerTo(structMember.mType);
  13531. auto mcMemberRef = AllocRelativeVirtualReg(memberPtrType, mcAggRef, BeMCOperand::FromImmediate(structMember.mByteOffset), 1);
  13532. CreateDefineVReg(mcMemberRef);
  13533. mcMemberRef.mKind = BeMCOperandKind_VRegLoad;
  13534. AllocInst(BeMCInstKind_Mov, mcMemberRef, mcValue);
  13535. // Our InsertValue always modifies the source aggregrate, it does not make a copy like LLVM's InsertValue would infer.
  13536. // This is okay because of Beef front end knowledge, but is not general purpose.
  13537. result = mcAgg;
  13538. }
  13539. break;
  13540. case BeNumericCastInst::TypeId:
  13541. {
  13542. auto castedInst = (BeNumericCastInst*)inst;
  13543. auto mcValue = GetOperand(castedInst->mValue);
  13544. auto fromType = GetType(mcValue);
  13545. if (fromType == castedInst->mToType)
  13546. {
  13547. // If it's just a sign change then leave it alone
  13548. result = mcValue;
  13549. }
  13550. else
  13551. {
  13552. auto toType = castedInst->mToType;
  13553. auto toValue = AllocVirtualReg(castedInst->mToType);
  13554. CreateDefineVReg(toValue);
  13555. if ((toType->IsInt()) && (fromType->IsInt()) && (toType->mSize < fromType->mSize))
  13556. {
  13557. // For truncating values, no actual instructions are needed, so we can just do a vreg relto ref
  13558. auto vregInfo = mVRegInfo[toValue.mVRegIdx];
  13559. vregInfo->mIsExpr = true;
  13560. vregInfo->mRelTo = mcValue;
  13561. }
  13562. else
  13563. {
  13564. bool doSignExtension = (toType->IsInt()) && (fromType->IsInt()) && (toType->mSize > fromType->mSize) && (castedInst->mToSigned) && (castedInst->mValSigned);
  13565. if ((toType->IsFloat()) && (fromType->IsInt()) && (castedInst->mValSigned))
  13566. doSignExtension = true;
  13567. if (doSignExtension)
  13568. {
  13569. AllocInst(BeMCInstKind_MovSX, toValue, mcValue);
  13570. }
  13571. else
  13572. AllocInst(BeMCInstKind_Mov, toValue, mcValue);
  13573. }
  13574. result = toValue;
  13575. }
  13576. }
  13577. break;
  13578. case BeNegInst::TypeId:
  13579. {
  13580. auto castedInst = (BeNumericCastInst*)inst;
  13581. auto mcValue = GetOperand(castedInst->mValue);
  13582. result = AllocVirtualReg(GetType(mcValue));
  13583. CreateDefineVReg(result);
  13584. AllocInst(BeMCInstKind_Mov, result, mcValue);
  13585. AllocInst(BeMCInstKind_Neg, result);
  13586. }
  13587. break;
  13588. case BeNotInst::TypeId:
  13589. {
  13590. auto castedInst = (BeNumericCastInst*)inst;
  13591. auto mcValue = GetOperand(castedInst->mValue, true);
  13592. // Phi's are easy - just make a new one with the true and false branches swapped
  13593. // if (mcValue.mKind == BeMCOperandKind_Phi)
  13594. // {
  13595. // BeMCPhi* origPhi = mcValue.mPhi;
  13596. // BeMCPhi* newPhi = mPhiAlloc.Alloc();
  13597. //
  13598. // *newPhi = *origPhi;
  13599. // BF_SWAP(newPhi->mBrTrue, newPhi->mBrFalse);
  13600. // result.mKind = BeMCOperandKind_Phi;
  13601. // result.mPhi = newPhi;
  13602. // break;
  13603. // }
  13604. //
  13605. // if (mcValue.mKind == BeMCOperandKind_CmpResult)
  13606. // {
  13607. // auto origCmpResult = mCmpResults[mcValue.mCmpResultIdx];
  13608. //
  13609. // auto cmpResultIdx = (int)mCmpResults.size();
  13610. // BeCmpResult cmpResult;
  13611. // cmpResult.mCmpKind = BeModule::InvertCmp(origCmpResult.mCmpKind);
  13612. // mCmpResults.push_back(cmpResult);
  13613. // result.mKind = BeMCOperandKind_CmpResult;
  13614. // result.mCmpResultIdx = cmpResultIdx;
  13615. // break;
  13616. // }
  13617. if (mcValue.mKind == BeMCOperandKind_NotResult)
  13618. {
  13619. // Double negative! Just unwrap the NotResult.
  13620. result = GetOperand(mcValue.mNotResult->mValue, true);
  13621. break;
  13622. }
  13623. else if ((mcValue.mKind == BeMCOperandKind_Phi) || (mcValue.mKind == BeMCOperandKind_CmpResult))
  13624. {
  13625. auto notResult = mAlloc.Alloc<BeNotResult>();
  13626. notResult->mValue = castedInst->mValue;
  13627. result.mKind = BeMCOperandKind_NotResult;
  13628. result.mNotResult = notResult;
  13629. break;
  13630. }
  13631. // LLVM does a weird thing for Not: val = (val ^ 0xFF) & 1
  13632. // Which turns a '2' into a '1' which is True to True - non-conformant to C standard?
  13633. // Visual Studio does an actual conditional branch. For Beef, bools are defined as 1 or 0.
  13634. /*result = AllocVirtualReg(GetType(mcValue));
  13635. CreateDefineVReg(result);
  13636. AllocInst(BeMCInstKind_Mov, result, mcValue);
  13637. BeMCOperand xorVal;
  13638. xorVal.mKind = BeMCOperandKind_Immediate_i8;
  13639. xorVal.mImmediate = 0xFF;
  13640. AllocInst(BeMCInstKind_Xor, result, xorVal);
  13641. BeMCOperand andVal;
  13642. andVal.mKind = BeMCOperandKind_Immediate_i8;
  13643. andVal.mImmediate = 0x1;
  13644. AllocInst(BeMCInstKind_And, result, andVal);*/
  13645. auto type = castedInst->mValue->GetType();
  13646. result = AllocVirtualReg(GetType(mcValue));
  13647. CreateDefineVReg(result);
  13648. AllocInst(BeMCInstKind_Mov, result, mcValue);
  13649. if (type->mTypeCode == BeTypeCode_Boolean)
  13650. {
  13651. BeMCOperand xorVal;
  13652. xorVal.mKind = BeMCOperandKind_Immediate_i8;
  13653. xorVal.mImmediate = 0x1;
  13654. AllocInst(BeMCInstKind_Xor, result, xorVal);
  13655. }
  13656. else
  13657. {
  13658. AllocInst(BeMCInstKind_Not, result);
  13659. }
  13660. }
  13661. break;
  13662. case BeBinaryOpInst::TypeId:
  13663. {
  13664. auto castedInst = (BeBinaryOpInst*)inst;
  13665. auto mcLHS = GetOperand(castedInst->mLHS);
  13666. auto mcRHS = GetOperand(castedInst->mRHS);
  13667. if (castedInst->mOpKind == BeBinaryOpKind_Subtract)
  13668. {
  13669. if (((mcLHS.IsImmediateFloat()) && (mcLHS.mImmFloat == 0.0)) ||
  13670. ((mcLHS.IsImmediateInt()) && (mcLHS.mImmediate == 0)))
  13671. {
  13672. auto castedInst = (BeNumericCastInst*)inst;
  13673. result = AllocVirtualReg(GetType(mcRHS));
  13674. CreateDefineVReg(result);
  13675. AllocInst(BeMCInstKind_Mov, result, mcRHS);
  13676. AllocInst(BeMCInstKind_Neg, result);
  13677. break;
  13678. }
  13679. }
  13680. switch (castedInst->mOpKind)
  13681. {
  13682. case BeBinaryOpKind_Add: result = AllocBinaryOp(BeMCInstKind_Add, mcLHS, mcRHS, BeMCBinIdentityKind_Any_IsZero); break;
  13683. case BeBinaryOpKind_Subtract: result = AllocBinaryOp(BeMCInstKind_Sub, mcLHS, mcRHS, BeMCBinIdentityKind_Right_IsZero); break;
  13684. case BeBinaryOpKind_Multiply: result = AllocBinaryOp(BeMCInstKind_IMul, mcLHS, mcRHS, BeMCBinIdentityKind_Any_IsOne); break;
  13685. case BeBinaryOpKind_SDivide: result = AllocBinaryOp(BeMCInstKind_IDiv, mcLHS, mcRHS, BeMCBinIdentityKind_Right_IsOne); break;
  13686. case BeBinaryOpKind_UDivide: result = AllocBinaryOp(BeMCInstKind_Div, mcLHS, mcRHS, BeMCBinIdentityKind_Right_IsOne); break;
  13687. case BeBinaryOpKind_SModulus: result = AllocBinaryOp(BeMCInstKind_IRem, mcLHS, mcRHS, BeMCBinIdentityKind_Right_IsOne_Result_Zero); break;
  13688. case BeBinaryOpKind_UModulus: result = AllocBinaryOp(BeMCInstKind_Rem, mcLHS, mcRHS, BeMCBinIdentityKind_Right_IsOne_Result_Zero); break;
  13689. case BeBinaryOpKind_BitwiseAnd: result = AllocBinaryOp(BeMCInstKind_And, mcLHS, mcRHS, BeMCBinIdentityKind_None); break;
  13690. case BeBinaryOpKind_BitwiseOr: result = AllocBinaryOp(BeMCInstKind_Or, mcLHS, mcRHS, BeMCBinIdentityKind_Any_IsZero); break;
  13691. case BeBinaryOpKind_ExclusiveOr: result = AllocBinaryOp(BeMCInstKind_Xor, mcLHS, mcRHS, BeMCBinIdentityKind_Any_IsZero); break;
  13692. case BeBinaryOpKind_LeftShift: result = AllocBinaryOp(BeMCInstKind_Shl, mcLHS, mcRHS, BeMCBinIdentityKind_Any_IsZero); break;
  13693. case BeBinaryOpKind_RightShift: result = AllocBinaryOp(BeMCInstKind_Shr, mcLHS, mcRHS, BeMCBinIdentityKind_Any_IsZero); break;
  13694. case BeBinaryOpKind_ARightShift: result = AllocBinaryOp(BeMCInstKind_Sar, mcLHS, mcRHS, BeMCBinIdentityKind_Any_IsZero); break;
  13695. }
  13696. }
  13697. break;
  13698. case BeBitCastInst::TypeId:
  13699. {
  13700. auto castedInst = (BeBitCastInst*)inst;
  13701. auto mcValue = GetOperand(castedInst->mValue);
  13702. if (castedInst->mToType->IsInt())
  13703. {
  13704. BF_ASSERT(castedInst->mToType->mSize == 8);
  13705. }
  13706. else
  13707. BF_ASSERT(castedInst->mToType->IsPointer());
  13708. auto toType = castedInst->mToType;
  13709. if (mcValue.IsImmediate())
  13710. {
  13711. if (mcValue.mImmediate == 0)
  13712. {
  13713. BeMCOperand newImmediate;
  13714. newImmediate.mKind = BeMCOperandKind_Immediate_Null;
  13715. newImmediate.mType = toType;
  13716. result = newImmediate;
  13717. }
  13718. else
  13719. {
  13720. // Non-zero constant. Weird case, just do an actual MOV
  13721. result = AllocVirtualReg(toType);
  13722. CreateDefineVReg(result);
  13723. auto vregInfo = GetVRegInfo(result);
  13724. AllocInst(BeMCInstKind_Mov, result, mcValue);
  13725. if (mcValue.mKind == BeMCOperandKind_VRegAddr)
  13726. {
  13727. auto srcVRegInfo = GetVRegInfo(mcValue);
  13728. srcVRegInfo->mForceMem = true;
  13729. CheckForce(srcVRegInfo);
  13730. }
  13731. }
  13732. }
  13733. else
  13734. {
  13735. result = AllocVirtualReg(toType);
  13736. CreateDefineVReg(result);
  13737. auto vregInfo = GetVRegInfo(result);
  13738. vregInfo->mRelTo = mcValue;
  13739. vregInfo->mIsExpr = true;
  13740. if (mcValue.mKind == BeMCOperandKind_VRegAddr)
  13741. {
  13742. auto srcVRegInfo = GetVRegInfo(mcValue);
  13743. srcVRegInfo->mForceMem = true;
  13744. CheckForce(srcVRegInfo);
  13745. }
  13746. }
  13747. }
  13748. break;
  13749. case BeCmpInst::TypeId:
  13750. {
  13751. auto castedInst = (BeCmpInst*)inst;
  13752. auto mcLHS = GetOperand(castedInst->mLHS);
  13753. auto mcRHS = GetOperand(castedInst->mRHS);
  13754. auto mcInst = AllocInst(BeMCInstKind_Cmp, mcLHS, mcRHS);
  13755. auto cmpResultIdx = (int)mCmpResults.size();
  13756. BeCmpResult cmpResult;
  13757. cmpResult.mCmpKind = castedInst->mCmpKind;
  13758. mCmpResults.push_back(cmpResult);
  13759. result.mKind = BeMCOperandKind_CmpResult;
  13760. result.mCmpResultIdx = cmpResultIdx;
  13761. mcInst->mResult = result;
  13762. }
  13763. break;
  13764. case BeObjectAccessCheckInst::TypeId:
  13765. {
  13766. auto castedInst = (BeObjectAccessCheckInst*)inst;
  13767. auto mcValue = GetOperand(castedInst->mValue);
  13768. auto int8Type = mModule->mContext->GetPrimitiveType(BeTypeCode_Int8);
  13769. auto int8PtrType = mModule->mContext->GetPointerTo(int8Type);
  13770. auto int8PtrVal = AllocVirtualReg(int8PtrType);
  13771. CreateDefineVReg(int8PtrVal);
  13772. auto vregInfo = GetVRegInfo(int8PtrVal);
  13773. vregInfo->mRelTo = mcValue;
  13774. vregInfo->mIsExpr = true;
  13775. int labelNum = mCurLabelIdx++;
  13776. BeMCOperand mcImm;
  13777. mcImm.mKind = BeMCOperandKind_Immediate_i8;
  13778. mcImm.mImmediate = -0x80;
  13779. BeMCOperand int8Val;
  13780. int8Val.mKind = BeMCOperandKind_VRegLoad;
  13781. int8Val.mVRegIdx = int8PtrVal.mVRegIdx;
  13782. AllocInst(BeMCInstKind_Cmp, int8Val, mcImm);
  13783. AllocInst(BeMCInstKind_CondBr, BeMCOperand::FromLabel(labelNum), BeMCOperand::FromCmpKind(BeCmpKind_ULT));
  13784. AllocInst(BeMCInstKind_DbgBreak);
  13785. AllocInst(BeMCInstKind_Label, BeMCOperand::FromLabel(labelNum));
  13786. }
  13787. break;
  13788. case BeAllocaInst::TypeId:
  13789. {
  13790. if (mDebugging)
  13791. {
  13792. NOP;
  13793. }
  13794. int homeSize = BF_ALIGN(BF_MAX(mMaxCallParamCount, 4) * 8, 16);
  13795. auto castedInst = (BeAllocaInst*)inst;
  13796. auto mcSize = BeMCOperand::FromImmediate(castedInst->mType->mSize);
  13797. bool isAligned16 = false;
  13798. int align = castedInst->mAlign;
  13799. BeType* allocType = castedInst->mType;
  13800. bool preservedVolatiles = false;
  13801. bool doPtrCast = false;
  13802. if (castedInst->mArraySize != NULL)
  13803. {
  13804. auto mcArraySize = GetOperand(castedInst->mArraySize);
  13805. if (mcArraySize.IsImmediate())
  13806. {
  13807. mcSize.mImmediate = mcSize.mImmediate * mcArraySize.mImmediate;
  13808. allocType = mModule->mContext->CreateSizedArrayType(castedInst->mType, mcArraySize.mImmediate);
  13809. doPtrCast = true;
  13810. }
  13811. else
  13812. {
  13813. preservedVolatiles = true;
  13814. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RAX));
  13815. inHeadAlloca = false;
  13816. if (mcSize.mImmediate == 1)
  13817. {
  13818. mcSize = mcArraySize;
  13819. }
  13820. else
  13821. {
  13822. auto mcInst = AllocInst(BeMCInstKind_IMul, mcArraySize, mcSize);
  13823. mcInst->mResult = BeMCOperand::FromReg(X64Reg_RAX);
  13824. mcSize = mcInst->mResult;
  13825. }
  13826. }
  13827. }
  13828. // The stack is 16-byte aligned on entry - we have to manually adjust for any alignment greater than that
  13829. if ((inHeadAlloca) && (align <= 16))
  13830. {
  13831. result = AllocVirtualReg(allocType);
  13832. auto vregInfo = mVRegInfo[result.mVRegIdx];
  13833. vregInfo->mAlign = castedInst->mAlign;
  13834. vregInfo->mHasDynLife = true;
  13835. if (castedInst->mForceMem)
  13836. vregInfo->mForceMem = true;
  13837. if (allocType->IsComposite())
  13838. vregInfo->mForceMem = true;
  13839. result.mKind = BeMCOperandKind_VRegAddr;
  13840. if (doPtrCast)
  13841. {
  13842. BF_ASSERT(allocType->IsSizedArray());
  13843. auto resultType = mModule->mContext->GetPointerTo(castedInst->mType);
  13844. auto ptrResult = AllocVirtualReg(resultType);
  13845. auto vregInfo = mVRegInfo[ptrResult.mVRegIdx];
  13846. vregInfo->mIsExpr = true;
  13847. vregInfo->mRelTo = result;
  13848. vregInfo->mType = resultType;
  13849. vregInfo->mAlign = resultType->mSize;
  13850. CreateDefineVReg(ptrResult);
  13851. result = ptrResult;
  13852. }
  13853. }
  13854. else
  13855. {
  13856. bool needsChkStk = !castedInst->mNoChkStk;
  13857. bool doFastChkStk = false;
  13858. if (instIdx < (int)beBlock->mInstructions.size() - 1)
  13859. {
  13860. if (auto memSetInstr = BeValueDynCast<BeMemSetInst>(beBlock->mInstructions[instIdx + 1]))
  13861. {
  13862. if (memSetInstr->mAddr == inst)
  13863. {
  13864. // If we're clearing out this memory immediately after allocation then we don't
  13865. // need to do stack probing - the memset will ensure stack pages are committed
  13866. needsChkStk = false;
  13867. }
  13868. }
  13869. }
  13870. int stackAlign = BF_MAX(align, 16);
  13871. BeMCOperand mcFunc;
  13872. mcFunc.mKind = BeMCOperandKind_SymbolAddr;
  13873. mcFunc.mSymbolIdx = mCOFFObject->GetSymbolRef("__chkstk")->mIdx;
  13874. if (mcSize.IsImmediate())
  13875. {
  13876. // Align to 16 bytes
  13877. mcSize.mImmediate = (mcSize.mImmediate + 0xF) & ~0xF;
  13878. }
  13879. if ((mcSize.IsImmediate()) && (!preservedVolatiles) && (!needsChkStk))
  13880. {
  13881. AllocInst(BeMCInstKind_Sub, BeMCOperand::FromReg(X64Reg_RSP), mcSize);
  13882. }
  13883. else
  13884. {
  13885. if (needsChkStk)
  13886. {
  13887. if ((mcSize.IsImmediate()) && (mcSize.mImmediate < 4096))
  13888. {
  13889. // We can do a fast __chkstk in this case since we have a max of one page to handle
  13890. doFastChkStk = true;
  13891. }
  13892. }
  13893. if (doFastChkStk)
  13894. {
  13895. AllocInst(BeMCInstKind_Sub, BeMCOperand::FromReg(X64Reg_RSP), mcSize);
  13896. AllocInst(BeMCInstKind_FastCheckStack, BeMCOperand::FromReg(X64Reg_RSP));
  13897. }
  13898. else
  13899. {
  13900. if (!preservedVolatiles)
  13901. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RAX));
  13902. if (mcSize.IsImmediate())
  13903. {
  13904. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(X64Reg_RAX), mcSize);
  13905. // It's tempting to not do a chkstk when we do an alloc less than 4k, but this isn't valid
  13906. // because we could break the system by doing three 2k allocs and access the third one first
  13907. // and BOOM. We rely on the front-end to tell us when we can omit it.
  13908. }
  13909. else if (!isAligned16)
  13910. {
  13911. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(X64Reg_RAX), mcSize);
  13912. AllocInst(BeMCInstKind_Add, BeMCOperand::FromReg(X64Reg_RAX), BeMCOperand::FromImmediate(0xF));
  13913. AllocInst(BeMCInstKind_And, BeMCOperand::FromReg(X64Reg_RAX), BeMCOperand::FromImmediate(~0xF));
  13914. }
  13915. if ((needsChkStk) && (!doFastChkStk))
  13916. {
  13917. AllocInst(BeMCInstKind_Call, mcFunc);
  13918. }
  13919. AllocInst(BeMCInstKind_Sub, BeMCOperand::FromReg(X64Reg_RSP), BeMCOperand::FromReg(X64Reg_RAX));
  13920. if (doFastChkStk)
  13921. {
  13922. AllocInst(BeMCInstKind_FastCheckStack, BeMCOperand::FromReg(X64Reg_RSP));
  13923. }
  13924. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_RAX));
  13925. }
  13926. }
  13927. auto resultType = mModule->mContext->GetPointerTo(castedInst->mType);
  13928. auto intType = mModule->mContext->GetPrimitiveType(BeTypeCode_Int64);
  13929. BeMCOperand ptrValue;
  13930. if (mUseBP)
  13931. {
  13932. ptrValue = AllocVirtualReg(intType);
  13933. auto vregInfo = mVRegInfo[ptrValue.mVRegIdx];
  13934. vregInfo->mIsExpr = true;
  13935. vregInfo->mRelTo = BeMCOperand::FromReg(X64Reg_RSP);
  13936. vregInfo->mRelOffset = BeMCOperand::FromImmediate(homeSize);
  13937. CreateDefineVReg(ptrValue);
  13938. }
  13939. else
  13940. {
  13941. ptrValue = BeMCOperand::FromReg(X64Reg_RSP);
  13942. }
  13943. result = AllocVirtualReg(resultType);
  13944. auto vregInfo = mVRegInfo[result.mVRegIdx];
  13945. vregInfo->mHasDynLife = true;
  13946. CreateDefineVReg(result);
  13947. AllocInst(BeMCInstKind_Mov, result, ptrValue);
  13948. if (stackAlign > 16)
  13949. {
  13950. // We have to align after everything - note that we always have to keep the 'homeSize' space available from RSP for calls,
  13951. // so the ANDing for alignment must be done here
  13952. AllocInst(BeMCInstKind_And, result, BeMCOperand::FromImmediate(~(stackAlign - 1)));
  13953. AllocInst(BeMCInstKind_Sub, BeMCOperand::FromReg(X64Reg_RSP), BeMCOperand::FromImmediate(stackAlign - 16));
  13954. }
  13955. BF_ASSERT(mUseBP);
  13956. }
  13957. }
  13958. break;
  13959. case BeAliasValueInst::TypeId:
  13960. {
  13961. auto castedInst = (BeAliasValueInst*)inst;
  13962. auto mcPtr = GetOperand(castedInst->mPtr, false, true);
  13963. result = AllocVirtualReg(GetType(mcPtr));
  13964. auto vregInfo = mVRegInfo[result.mVRegIdx];
  13965. vregInfo->mIsExpr = true;
  13966. vregInfo->mRelTo = mcPtr;
  13967. vregInfo->mHasDynLife = true;
  13968. CreateDefineVReg(result);
  13969. }
  13970. break;
  13971. case BeLifetimeStartInst::TypeId:
  13972. {
  13973. auto castedInst = (BeLifetimeEndInst*)inst;
  13974. auto mcPtr = GetOperand(castedInst->mPtr, false, true);
  13975. if (mcPtr)
  13976. AllocInst(BeMCInstKind_LifetimeStart, mcPtr);
  13977. }
  13978. break;
  13979. case BeLifetimeExtendInst::TypeId:
  13980. {
  13981. auto castedInst = (BeLifetimeEndInst*)inst;
  13982. auto mcPtr = GetOperand(castedInst->mPtr, false, true);
  13983. if (mcPtr)
  13984. AllocInst(BeMCInstKind_LifetimeExtend, mcPtr);
  13985. }
  13986. break;
  13987. case BeLifetimeEndInst::TypeId:
  13988. {
  13989. auto castedInst = (BeLifetimeEndInst*)inst;
  13990. auto mcPtr = GetOperand(castedInst->mPtr, false, true);
  13991. if (mcPtr.IsVRegAny())
  13992. {
  13993. AllocInst(BeMCInstKind_LifetimeEnd, mcPtr);
  13994. }
  13995. }
  13996. break;
  13997. case BeValueScopeStartInst::TypeId:
  13998. {
  13999. result = BeMCOperand::FromImmediate((int)mVRegInfo.size());
  14000. }
  14001. break;
  14002. case BeValueScopeRetainInst::TypeId:
  14003. {
  14004. auto castedInst = (BeValueScopeRetainInst*)inst;
  14005. auto mcValue = GetOperand(castedInst->mValue, false, true);
  14006. auto vregInfo = GetVRegInfo(mcValue);
  14007. vregInfo->mValueScopeRetainedKind = BeMCValueScopeRetainKind_Soft;
  14008. }
  14009. break;
  14010. case BeValueScopeEndInst::TypeId:
  14011. {
  14012. auto castedInst = (BeValueScopeEndInst*)inst;
  14013. BeMCOperand mcScopeStart = GetOperand(castedInst->mScopeStart, false, true);
  14014. // There are some recordering cases where we have a ValueScopeStart moved after a ValueScopeEnd
  14015. // Just ignore those. This is just an optimization anyway.
  14016. if (mcScopeStart)
  14017. AllocInst(castedInst->mIsSoft ? BeMCInstKind_ValueScopeSoftEnd : BeMCInstKind_ValueScopeHardEnd, mcScopeStart, BeMCOperand::FromImmediate((int)mVRegInfo.size()));
  14018. }
  14019. break;
  14020. case BeLifetimeFenceInst::TypeId:
  14021. {
  14022. auto castedInst = (BeLifetimeFenceInst*)inst;
  14023. auto mcPtr = GetOperand(castedInst->mPtr, false);
  14024. auto fenceBlock = GetOperand(castedInst->mFenceBlock);
  14025. auto vregInfo = GetVRegInfo(mcPtr);
  14026. vregInfo->mChainLifetimeEnd = true;
  14027. SetAndRestoreValue<BeMCBlock*> prevBlock(mActiveBlock, fenceBlock.mBlock);
  14028. auto lifetimeStart = AllocInst(BeMCInstKind_LifetimeStart, mcPtr);
  14029. lifetimeStart->mDbgLoc = NULL;
  14030. }
  14031. break;
  14032. case BeLoadInst::TypeId:
  14033. {
  14034. auto castedInst = (BeLoadInst*)inst;
  14035. auto mcTarget = GetOperand(castedInst->mTarget);
  14036. result = CreateLoad(mcTarget);
  14037. }
  14038. break;
  14039. case BeStoreInst::TypeId:
  14040. {
  14041. auto castedInst = (BeStoreInst*)inst;
  14042. auto mcVal = GetOperand(castedInst->mVal);
  14043. auto mcPtr = GetOperand(castedInst->mPtr);
  14044. bool handled = false;
  14045. CreateStore(BeMCInstKind_Mov, mcVal, mcPtr);
  14046. }
  14047. break;
  14048. case BeSetCanMergeInst::TypeId:
  14049. {
  14050. auto castedInst = (BeSetCanMergeInst*)inst;
  14051. auto mcVal = GetOperand(castedInst->mVal);
  14052. auto vregInfo = GetVRegInfo(mcVal);
  14053. vregInfo->mForceMerge = true;
  14054. }
  14055. break;
  14056. case BeMemSetInst::TypeId:
  14057. {
  14058. auto castedInst = (BeMemSetInst*)inst;
  14059. if (auto constVal = BeValueDynCast<BeConstant>(castedInst->mVal))
  14060. {
  14061. if (auto constSize = BeValueDynCast<BeConstant>(castedInst->mSize))
  14062. {
  14063. CreateMemSet(GetOperand(castedInst->mAddr), constVal->mUInt8, constSize->mInt64, castedInst->mAlignment);
  14064. break;
  14065. }
  14066. }
  14067. SizedArray<BeValue*, 3> args = { castedInst->mAddr, castedInst->mVal, castedInst->mSize };
  14068. auto mcFunc = BeMCOperand::FromSymbolAddr(mCOFFObject->GetSymbolRef("memset")->mIdx);
  14069. CreateCall(mcFunc, args);
  14070. }
  14071. break;
  14072. case BeFenceInst::TypeId:
  14073. {
  14074. AllocInst(BeMCInstKind_MFence);
  14075. }
  14076. break;
  14077. case BeStackSaveInst::TypeId:
  14078. {
  14079. auto stackVReg = BeMCOperand::FromVReg(stackSaveVRegs.back());
  14080. stackSaveVRegs.pop_back();
  14081. CreateDefineVReg(stackVReg);
  14082. AllocInst(BeMCInstKind_Mov, stackVReg, BeMCOperand::FromReg(X64Reg_RSP));
  14083. result = stackVReg;
  14084. }
  14085. break;
  14086. case BeStackRestoreInst::TypeId:
  14087. {
  14088. auto castedInst = (BeStackRestoreInst*)inst;
  14089. auto mcStackVal = GetOperand(castedInst->mStackVal);
  14090. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(X64Reg_RSP), mcStackVal);
  14091. }
  14092. break;
  14093. case BeGEPInst::TypeId:
  14094. {
  14095. auto castedInst = (BeGEPInst*)inst;
  14096. auto mcVal = GetOperand(castedInst->mPtr);
  14097. auto mcIdx0 = GetOperand(castedInst->mIdx0);
  14098. BePointerType* ptrType = (BePointerType*)GetType(mcVal);
  14099. BF_ASSERT(ptrType->mTypeCode == BeTypeCode_Pointer);
  14100. result = mcVal;
  14101. if (castedInst->mIdx1 != NULL)
  14102. {
  14103. // We assume we never do both an idx0 and idx1 at once. Fix if we change that.
  14104. BF_ASSERT(castedInst->mIdx0);
  14105. auto mcIdx1 = GetOperand(castedInst->mIdx1);
  14106. if (!mcIdx1.IsImmediate())
  14107. {
  14108. // This path is used when we have a const array that gets indexed by a non-const index value
  14109. if (ptrType->mElementType->mTypeCode == BeTypeCode_SizedArray)
  14110. {
  14111. auto arrayType = (BeSizedArrayType*)ptrType->mElementType;
  14112. auto elementPtrType = mModule->mContext->GetPointerTo(arrayType->mElementType);
  14113. auto ptrValue = AllocVirtualReg(elementPtrType);
  14114. auto ptrInfo = GetVRegInfo(ptrValue);
  14115. ptrInfo->mIsExpr = true;
  14116. ptrInfo->mRelTo = result;
  14117. CreateDefineVReg(ptrValue);
  14118. result = ptrValue;
  14119. BeMCOperand mcRelOffset;
  14120. int relScale = 1;
  14121. if (mcIdx1.IsImmediate())
  14122. {
  14123. mcRelOffset = BeMCOperand::FromImmediate(mcIdx1.mImmediate * arrayType->mElementType->mSize);
  14124. }
  14125. else
  14126. {
  14127. mcRelOffset = mcIdx1;
  14128. relScale = arrayType->mElementType->mSize;
  14129. }
  14130. result = AllocRelativeVirtualReg(elementPtrType, result, mcRelOffset, relScale);
  14131. // The def is primary to create a single 'master location' for the GEP vreg to become legalized before use
  14132. CreateDefineVReg(result);
  14133. //TODO: Always correct?
  14134. result.mKind = BeMCOperandKind_VReg;
  14135. }
  14136. else
  14137. Fail("Invalid GEP");
  14138. }
  14139. else
  14140. {
  14141. BF_ASSERT(mcIdx1.IsImmediate());
  14142. int byteOffset = 0;
  14143. BeType* elementType = NULL;
  14144. if (ptrType->mElementType->mTypeCode == BeTypeCode_Struct)
  14145. {
  14146. BeStructType* structType = (BeStructType*)ptrType->mElementType;
  14147. auto& structMember = structType->mMembers[mcIdx1.mImmediate];
  14148. elementType = structMember.mType;
  14149. byteOffset = structMember.mByteOffset;
  14150. }
  14151. else
  14152. {
  14153. BF_ASSERT(ptrType->mElementType->mTypeCode == BeTypeCode_SizedArray);
  14154. auto arrayType = (BeSizedArrayType*)ptrType->mElementType;
  14155. elementType = arrayType->mElementType;
  14156. byteOffset = mcIdx1.mImmediate * elementType->mSize;
  14157. }
  14158. auto elementPtrType = mModule->mContext->GetPointerTo(elementType);
  14159. result = AllocRelativeVirtualReg(elementPtrType, result, GetImmediate(byteOffset), 1);
  14160. // The def is primary to create a single 'master location' for the GEP vreg to become legalized before use
  14161. CreateDefineVReg(result);
  14162. result.mKind = BeMCOperandKind_VReg;
  14163. }
  14164. }
  14165. else
  14166. {
  14167. // It's temping to do a (IsNonZero) precondition, but if we make a reference to a VReg that is NOT in Addr form,
  14168. // then this will encode that so we will know we need to do a Load on that value at the Def during legalization
  14169. BeMCOperand mcRelOffset;
  14170. int relScale = 1;
  14171. if (mcIdx0.IsImmediate())
  14172. {
  14173. mcRelOffset = BeMCOperand::FromImmediate(mcIdx0.mImmediate * ptrType->mElementType->mSize);
  14174. }
  14175. else
  14176. {
  14177. mcRelOffset = mcIdx0;
  14178. relScale = ptrType->mElementType->mSize;
  14179. }
  14180. result = AllocRelativeVirtualReg(ptrType, result, mcRelOffset, relScale);
  14181. // The def is primary to create a single 'master location' for the GEP vreg to become legalized before use
  14182. CreateDefineVReg(result);
  14183. //TODO: Always correct?
  14184. result.mKind = BeMCOperandKind_VReg;
  14185. }
  14186. }
  14187. break;
  14188. case BeBrInst::TypeId:
  14189. {
  14190. auto castedInst = (BeBrInst*)inst;
  14191. auto mcInst = AllocInst();
  14192. mcInst->mKind = BeMCInstKind_Br;
  14193. mcInst->mArg0 = GetOperand(castedInst->mTargetBlock);
  14194. mcInst->mArg0.mBlock->AddPred(mcBlock);
  14195. if (castedInst->mNoCollapse)
  14196. {
  14197. mcInst->mArg1.mKind = BeMCOperandKind_Immediate_i8;
  14198. mcInst->mArg1.mImmediate = 1;
  14199. }
  14200. else if (castedInst->mIsFake)
  14201. {
  14202. mcInst->mArg1.mKind = BeMCOperandKind_Immediate_i8;
  14203. mcInst->mArg1.mImmediate = 2;
  14204. }
  14205. }
  14206. break;
  14207. case BeCondBrInst::TypeId:
  14208. {
  14209. if (mDebugging)
  14210. {
  14211. NOP;
  14212. }
  14213. auto castedInst = (BeCondBrInst*)inst;
  14214. auto testVal = GetOperand(castedInst->mCond, true);
  14215. auto trueBlock = GetOperand(castedInst->mTrueBlock);
  14216. auto falseBlock = GetOperand(castedInst->mFalseBlock);
  14217. trueBlock.mBlock->AddPred(mcBlock);
  14218. falseBlock.mBlock->AddPred(mcBlock);
  14219. CreateCondBr(mcBlock, testVal, trueBlock, falseBlock);
  14220. }
  14221. break;
  14222. case BePhiInst::TypeId:
  14223. {
  14224. auto castedInst = (BePhiInst*)inst;
  14225. BeMCPhi* mcPhi = mPhiAlloc.Alloc();
  14226. mcPhi->mBlock = mcBlock;
  14227. mcPhi->mIdx = mCurPhiIdx++;
  14228. //if (mDebugging)
  14229. {
  14230. for (auto phiIncoming : castedInst->mIncoming)
  14231. {
  14232. auto blockFrom = GetOperand(phiIncoming->mBlock).mBlock;;
  14233. int insertIdx = blockFrom->mInstructions.size() - 1;
  14234. SetAndRestoreValue<BeMCBlock*> prevActiveBlock(mActiveBlock, blockFrom);
  14235. SetAndRestoreValue<int*> prevInsertIdxPtr(mInsertInstIdxRef, &insertIdx);
  14236. BeMCPhiValue phiVal;
  14237. phiVal.mBlockFrom = blockFrom;
  14238. phiVal.mValue = GetOperand(phiIncoming->mValue, true);
  14239. if (phiVal.mValue.mKind == BeMCOperandKind_VRegAddr)
  14240. {
  14241. auto vregInfo = GetVRegInfo(phiVal.mValue);
  14242. if (!vregInfo->mIsExpr)
  14243. {
  14244. vregInfo->mForceMem = true;
  14245. CheckForce(vregInfo);
  14246. }
  14247. }
  14248. mcPhi->mValues.push_back(phiVal);
  14249. }
  14250. }
  14251. /*else
  14252. {
  14253. for (auto phiIncoming : castedInst->mIncoming)
  14254. {
  14255. BeMCPhiValue phiVal;
  14256. phiVal.mBlockFrom = GetOperand(phiIncoming->mBlock).mBlock;
  14257. phiVal.mValue = GetOperand(phiIncoming->mValue, true);
  14258. mcPhi->mValues.push_back(phiVal);
  14259. }
  14260. }*/
  14261. result.mKind = BeMCOperandKind_Phi;
  14262. result.mPhi = mcPhi;
  14263. // DefPhi is important because when we convert a CondBr of a PHI, because we will need to create jumps to the correct
  14264. // location when we create it as a value (specifically in the bool case)
  14265. AllocInst(BeMCInstKind_DefPhi, result);
  14266. }
  14267. break;
  14268. case BeSwitchInst::TypeId:
  14269. {
  14270. auto castedInst = (BeSwitchInst*)inst;
  14271. std::stable_sort(castedInst->mCases.begin(), castedInst->mCases.end(), [&](const BeSwitchCase& lhs, const BeSwitchCase& rhs)
  14272. {
  14273. return lhs.mValue->mInt64 < rhs.mValue->mInt64;
  14274. });
  14275. int numVals = castedInst->mCases.size();
  14276. if (numVals > 0)
  14277. {
  14278. int64 loVal = castedInst->mCases.front().mValue->mInt64;
  14279. int64 hiVal = castedInst->mCases.back().mValue->mInt64;
  14280. uint64 avgSpacing = (uint64)(hiVal - loVal) / numVals;
  14281. // Only use a table if we have a lot of values and the values are 'tight' enough
  14282. if ((numVals > 6) && (avgSpacing <= 8))
  14283. CreateTableSwitchSection(castedInst, 0, castedInst->mCases.size());
  14284. else
  14285. CreateBinarySwitchSection(castedInst, 0, castedInst->mCases.size());
  14286. }
  14287. auto mcDefaultBlock = GetOperand(castedInst->mDefaultBlock);
  14288. AllocInst(BeMCInstKind_Br, mcDefaultBlock);
  14289. mcDefaultBlock.mBlock->AddPred(mActiveBlock);
  14290. }
  14291. break;
  14292. case BeRetInst::TypeId:
  14293. {
  14294. auto castedInst = (BeRetInst*)inst;
  14295. if (castedInst->mRetValue != NULL)
  14296. {
  14297. auto retVal = GetOperand(castedInst->mRetValue);
  14298. auto retType = GetType(retVal);
  14299. if (retType->IsComposite())
  14300. {
  14301. BF_ASSERT(mCompositeRetVRegIdx != -1);
  14302. BF_ASSERT(retVal.IsVReg());
  14303. auto vregInfo = GetVRegInfo(retVal);
  14304. vregInfo->SetRetVal();
  14305. }
  14306. else
  14307. {
  14308. X64CPURegister reg = X64Reg_RAX;
  14309. if (retType->IsIntable())
  14310. {
  14311. if (retType->mSize == 4)
  14312. reg = X64Reg_EAX;
  14313. else if (retType->mSize == 2)
  14314. reg = X64Reg_AX;
  14315. else if (retType->mSize == 1)
  14316. reg = X64Reg_AL;
  14317. }
  14318. else if (retType->mTypeCode == BeTypeCode_Float)
  14319. reg = X64Reg_XMM0_f32;
  14320. else if (retType->mTypeCode == BeTypeCode_Double)
  14321. reg = X64Reg_XMM0_f64;
  14322. auto movInst = AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(reg), retVal);
  14323. }
  14324. }
  14325. auto mcInst = AllocInst();
  14326. mcInst->mKind = BeMCInstKind_Ret;
  14327. retCount++;
  14328. }
  14329. break;
  14330. case BeCallInst::TypeId:
  14331. {
  14332. auto castedInst = (BeCallInst*)inst;
  14333. BeMCOperand mcFunc;
  14334. BeType* returnType = NULL;
  14335. bool isVarArg = false;
  14336. bool useAltArgs = false;
  14337. SizedArray<BeValue*, 6> args;
  14338. if (auto intrin = BeValueDynCast<BeIntrinsic>(castedInst->mFunc))
  14339. {
  14340. switch (intrin->mKind)
  14341. {
  14342. case BfIRIntrinsic_AtomicAdd:
  14343. case BfIRIntrinsic_AtomicSub:
  14344. {
  14345. auto mcPtr = GetOperand(castedInst->mArgs[0].mValue);
  14346. auto mcVal = GetOperand(castedInst->mArgs[1].mValue);
  14347. auto valType = GetType(mcVal);
  14348. if (!valType->IsFloat())
  14349. {
  14350. auto mcMemKind = GetOperand(castedInst->mArgs[2].mValue);
  14351. if (!mcMemKind.IsImmediateInt())
  14352. {
  14353. SoftFail("Non-constant success ordering on AtomicLoad", castedInst->mDbgLoc);
  14354. break;
  14355. }
  14356. BeMCOperand scratchReg = AllocVirtualReg(valType);
  14357. auto vregInfo = GetVRegInfo(scratchReg);
  14358. vregInfo->mMustExist = true;
  14359. CreateDefineVReg(scratchReg);
  14360. if ((intrin->mKind == BfIRIntrinsic_AtomicSub) && (mcVal.IsImmediate()))
  14361. {
  14362. BeMCOperand mcNeg = mcVal;
  14363. if (mcVal.IsImmediateFloat())
  14364. mcNeg.mImmFloat = -mcNeg.mImmFloat;
  14365. else
  14366. mcNeg.mImmediate = -mcNeg.mImmediate;
  14367. AllocInst(BeMCInstKind_Mov, scratchReg, mcNeg);
  14368. }
  14369. else
  14370. {
  14371. AllocInst(BeMCInstKind_Mov, scratchReg, mcVal);
  14372. if (intrin->mKind == BfIRIntrinsic_AtomicSub)
  14373. AllocInst(BeMCInstKind_Neg, scratchReg);
  14374. }
  14375. CreateStore(BeMCInstKind_XAdd, scratchReg, mcPtr);
  14376. if ((mcMemKind.mImmediate & BfIRAtomicOrdering_ReturnModified) != 0)
  14377. {
  14378. if (intrin->mKind == BfIRIntrinsic_AtomicSub)
  14379. AllocInst(BeMCInstKind_Sub, scratchReg, mcVal);
  14380. else
  14381. AllocInst(BeMCInstKind_Add, scratchReg, mcVal);
  14382. }
  14383. result = scratchReg;
  14384. break;
  14385. }
  14386. }
  14387. case BfIRIntrinsic_AtomicAnd:
  14388. case BfIRIntrinsic_AtomicMax:
  14389. case BfIRIntrinsic_AtomicMin:
  14390. case BfIRIntrinsic_AtomicNAnd:
  14391. case BfIRIntrinsic_AtomicOr:
  14392. case BfIRIntrinsic_AtomicUMax:
  14393. case BfIRIntrinsic_AtomicUMin:
  14394. case BfIRIntrinsic_AtomicXor:
  14395. {
  14396. auto mcPtr = GetOperand(castedInst->mArgs[0].mValue);
  14397. auto mcVal = GetOperand(castedInst->mArgs[1].mValue);
  14398. auto mcMemKind = GetOperand(castedInst->mArgs[2].mValue);
  14399. if (!mcMemKind.IsImmediateInt())
  14400. {
  14401. SoftFail("Non-constant ordering on atomic instruction", castedInst->mDbgLoc);
  14402. break;
  14403. }
  14404. auto valType = GetType(mcVal);
  14405. auto origValType = valType;
  14406. bool isFloat = valType->IsFloat();
  14407. auto mcTarget = BeMCOperand::ToLoad(mcPtr);
  14408. auto useReg = ResizeRegister(X64Reg_RAX, valType->mSize);
  14409. auto origTarget = mcTarget;
  14410. if (isFloat)
  14411. {
  14412. if (valType->mSize == 4)
  14413. valType = mModule->mContext->GetPrimitiveType(BeTypeCode_Int32);
  14414. else
  14415. valType = mModule->mContext->GetPrimitiveType(BeTypeCode_Int64);
  14416. BeMCOperand castedTarget = AllocVirtualReg(valType);
  14417. auto vregInfo = GetVRegInfo(castedTarget);
  14418. vregInfo->mMustExist = true;
  14419. vregInfo->mType = valType;
  14420. vregInfo->mAlign = valType->mAlign;
  14421. vregInfo->mIsExpr = true;
  14422. vregInfo->mRelTo = mcTarget;
  14423. CreateDefineVReg(castedTarget);
  14424. mcTarget = castedTarget;
  14425. }
  14426. int labelIdx = CreateLabel();
  14427. BeMCOperand mcPrev = AllocVirtualReg(valType);
  14428. auto vregInfo = GetVRegInfo(mcPrev);
  14429. vregInfo->mMustExist = true;
  14430. CreateDefineVReg(mcPrev);
  14431. BeMCOperand mcNext = AllocVirtualReg(valType);
  14432. vregInfo = GetVRegInfo(mcNext);
  14433. vregInfo->mMustExist = true;
  14434. vregInfo->mForceMem = isFloat;
  14435. CreateDefineVReg(mcNext);
  14436. AllocInst(BeMCInstKind_Mov, mcPrev, mcTarget);
  14437. AllocInst(BeMCInstKind_Mov, mcNext, mcPrev);
  14438. if (isFloat)
  14439. {
  14440. BeMCOperand mcFNext = AllocVirtualReg(origValType);
  14441. vregInfo = GetVRegInfo(mcFNext);
  14442. vregInfo->mIsExpr = true;
  14443. vregInfo->mRelTo = mcNext;
  14444. CreateDefineVReg(mcFNext);
  14445. if (intrin->mKind == BfIRIntrinsic_AtomicAdd)
  14446. AllocInst(BeMCInstKind_Add, mcFNext, mcVal);
  14447. else
  14448. AllocInst(BeMCInstKind_Sub, mcFNext, mcVal);
  14449. }
  14450. else
  14451. {
  14452. switch (intrin->mKind)
  14453. {
  14454. case BfIRIntrinsic_AtomicAdd:
  14455. AllocInst(BeMCInstKind_Add, mcNext, mcVal);
  14456. break;
  14457. case BfIRIntrinsic_AtomicAnd:
  14458. AllocInst(BeMCInstKind_Or, mcNext, mcVal);
  14459. break;
  14460. case BfIRIntrinsic_AtomicMax:
  14461. case BfIRIntrinsic_AtomicMin:
  14462. case BfIRIntrinsic_AtomicUMax:
  14463. case BfIRIntrinsic_AtomicUMin:
  14464. {
  14465. int cmpLabelIdx = mCurLabelIdx++;
  14466. AllocInst(BeMCInstKind_Cmp, mcNext, mcVal);
  14467. BeCmpKind cmpKind = BeCmpKind_None;
  14468. switch (intrin->mKind)
  14469. {
  14470. case BfIRIntrinsic_AtomicMax:
  14471. cmpKind = BeCmpKind_SGE;
  14472. break;
  14473. case BfIRIntrinsic_AtomicMin:
  14474. cmpKind = BeCmpKind_SLE;
  14475. break;
  14476. case BfIRIntrinsic_AtomicUMax:
  14477. cmpKind = BeCmpKind_UGE;
  14478. break;
  14479. case BfIRIntrinsic_AtomicUMin:
  14480. cmpKind = BeCmpKind_ULE;
  14481. break;
  14482. }
  14483. AllocInst(BeMCInstKind_CondBr, BeMCOperand::FromLabel(cmpLabelIdx), BeMCOperand::FromCmpKind(cmpKind));
  14484. AllocInst(BeMCInstKind_Mov, mcNext, mcVal);
  14485. CreateLabel(-1, cmpLabelIdx);
  14486. }
  14487. break;
  14488. case BfIRIntrinsic_AtomicNAnd:
  14489. AllocInst(BeMCInstKind_And, mcNext, mcVal);
  14490. AllocInst(BeMCInstKind_Not, mcNext);
  14491. break;
  14492. case BfIRIntrinsic_AtomicOr:
  14493. AllocInst(BeMCInstKind_Or, mcNext, mcVal);
  14494. break;
  14495. case BfIRIntrinsic_AtomicSub:
  14496. AllocInst(BeMCInstKind_Sub, mcNext, mcVal);
  14497. break;
  14498. case BfIRIntrinsic_AtomicXor:
  14499. AllocInst(BeMCInstKind_Xor, mcNext, mcVal);
  14500. break;
  14501. }
  14502. }
  14503. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RAX));
  14504. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(useReg), mcPrev);
  14505. auto cmpXChgInst = AllocInst(BeMCInstKind_CmpXChg, mcTarget, mcNext);
  14506. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_RAX));
  14507. AllocInst(BeMCInstKind_CondBr, BeMCOperand::FromLabel(labelIdx), BeMCOperand::FromCmpKind(BeCmpKind_NE));
  14508. if ((mcMemKind.mImmediate & BfIRAtomicOrdering_ReturnModified) != 0)
  14509. result = mcNext;
  14510. else
  14511. result = mcPrev;
  14512. }
  14513. break;
  14514. case BfIRIntrinsic_AtomicCmpStore:
  14515. case BfIRIntrinsic_AtomicCmpStore_Weak:
  14516. case BfIRIntrinsic_AtomicCmpXChg:
  14517. {
  14518. auto mcPtr = GetOperand(castedInst->mArgs[0].mValue);
  14519. auto mcComparand = GetOperand(castedInst->mArgs[1].mValue);
  14520. auto mcVal = GetOperand(castedInst->mArgs[2].mValue);
  14521. auto mcMemKind = GetOperand(castedInst->mArgs[3].mValue);
  14522. if (!mcMemKind.IsImmediate())
  14523. {
  14524. SoftFail("Non-constant success ordering on atomic operation", castedInst->mDbgLoc);
  14525. break;
  14526. }
  14527. auto valType = GetType(mcVal);
  14528. auto useReg = ResizeRegister(X64Reg_RAX, valType->mSize);
  14529. BeMCOperand scratchReg = AllocVirtualReg(GetType(mcVal));
  14530. auto vregInfo = GetVRegInfo(scratchReg);
  14531. vregInfo->mMustExist = true;
  14532. CreateDefineVReg(scratchReg);
  14533. AllocInst(BeMCInstKind_Mov, scratchReg, mcVal);
  14534. AllocInst(BeMCInstKind_PreserveVolatiles, BeMCOperand::FromReg(X64Reg_RAX));
  14535. AllocInst(BeMCInstKind_Mov, BeMCOperand::FromReg(useReg), mcComparand);
  14536. auto cmpXChgInst = AllocInst(BeMCInstKind_CmpXChg, BeMCOperand::ToLoad(mcPtr), scratchReg);
  14537. if (intrin->mKind == BfIRIntrinsic_AtomicCmpXChg)
  14538. {
  14539. AllocInst(BeMCInstKind_Mov, scratchReg, BeMCOperand::FromReg(useReg));
  14540. result = scratchReg;
  14541. }
  14542. else
  14543. {
  14544. auto cmpResultIdx = (int)mCmpResults.size();
  14545. BeCmpResult cmpResult;
  14546. cmpResult.mCmpKind = BeCmpKind_EQ;
  14547. mCmpResults.push_back(cmpResult);
  14548. result.mKind = BeMCOperandKind_CmpResult;
  14549. result.mCmpResultIdx = cmpResultIdx;
  14550. cmpXChgInst->mResult = result;
  14551. }
  14552. AllocInst(BeMCInstKind_RestoreVolatiles, BeMCOperand::FromReg(X64Reg_RAX));
  14553. }
  14554. break;
  14555. case BfIRIntrinsic_AtomicLoad:
  14556. {
  14557. auto mcTarget = GetOperand(castedInst->mArgs[0].mValue);
  14558. result = CreateLoad(mcTarget);
  14559. }
  14560. break;
  14561. case BfIRIntrinsic_AtomicFence:
  14562. {
  14563. if (castedInst->mArgs.size() == 0)
  14564. {
  14565. // Compiler fence- do nothing.
  14566. break;
  14567. }
  14568. auto mcMemKind = GetOperand(castedInst->mArgs[0].mValue);
  14569. if (!mcMemKind.IsImmediateInt())
  14570. {
  14571. SoftFail("Non-constant success ordering on AtomicFence", castedInst->mDbgLoc);
  14572. break;
  14573. }
  14574. if (mcMemKind.mImmediate == BfIRAtomicOrdering_SeqCst)
  14575. AllocInst(BeMCInstKind_MFence);
  14576. }
  14577. break;
  14578. case BfIRIntrinsic_AtomicStore:
  14579. {
  14580. auto mcPtr = GetOperand(castedInst->mArgs[0].mValue);
  14581. auto mcVal = GetOperand(castedInst->mArgs[1].mValue);
  14582. auto mcMemKind = GetOperand(castedInst->mArgs[2].mValue);
  14583. if (!mcMemKind.IsImmediateInt())
  14584. {
  14585. SoftFail("Non-constant success ordering on AtomicLoad", castedInst->mDbgLoc);
  14586. break;
  14587. }
  14588. if (mcMemKind.mImmediate == BfIRAtomicOrdering_SeqCst)
  14589. {
  14590. BeMCOperand scratchReg = AllocVirtualReg(GetType(mcVal));
  14591. auto vregInfo = GetVRegInfo(scratchReg);
  14592. vregInfo->mMustExist = true;
  14593. CreateDefineVReg(scratchReg);
  14594. AllocInst(BeMCInstKind_Mov, scratchReg, mcVal);
  14595. CreateStore(BeMCInstKind_XChg, scratchReg, mcPtr);
  14596. }
  14597. else
  14598. {
  14599. CreateStore(BeMCInstKind_Mov, mcVal, mcPtr);
  14600. }
  14601. }
  14602. break;
  14603. case BfIRIntrinsic_AtomicXChg:
  14604. {
  14605. auto mcPtr = GetOperand(castedInst->mArgs[0].mValue);
  14606. auto mcVal = GetOperand(castedInst->mArgs[1].mValue);
  14607. auto mcMemKind = GetOperand(castedInst->mArgs[2].mValue);
  14608. if (!mcMemKind.IsImmediateInt())
  14609. {
  14610. SoftFail("Non-constant success ordering on AtomicXChg", castedInst->mDbgLoc);
  14611. break;
  14612. }
  14613. BeMCOperand scratchReg = AllocVirtualReg(GetType(mcVal));
  14614. auto vregInfo = GetVRegInfo(scratchReg);
  14615. vregInfo->mMustExist = true;
  14616. CreateDefineVReg(scratchReg);
  14617. AllocInst(BeMCInstKind_Mov, scratchReg, mcVal);
  14618. CreateStore(BeMCInstKind_XChg, scratchReg, mcPtr);
  14619. result = scratchReg;
  14620. }
  14621. break;
  14622. case BfIRIntrinsic_MemSet:
  14623. {
  14624. if (auto constVal = BeValueDynCast<BeConstant>(castedInst->mArgs[1].mValue))
  14625. {
  14626. if (auto constSize = BeValueDynCast<BeConstant>(castedInst->mArgs[2].mValue))
  14627. {
  14628. if (auto constAlign = BeValueDynCast<BeConstant>(castedInst->mArgs[3].mValue))
  14629. {
  14630. CreateMemSet(GetOperand(castedInst->mArgs[0].mValue), constVal->mUInt8, constSize->mInt64, constAlign->mInt32);
  14631. break;
  14632. }
  14633. }
  14634. }
  14635. mcFunc = BeMCOperand::FromSymbolAddr(mCOFFObject->GetSymbolRef("memset")->mIdx);
  14636. for (int i = 0; i < 3; i++)
  14637. args.Add(castedInst->mArgs[i].mValue);
  14638. useAltArgs = true;
  14639. }
  14640. break;
  14641. case BfIRIntrinsic_MemCpy:
  14642. {
  14643. if (auto constSize = BeValueDynCast<BeConstant>(castedInst->mArgs[2].mValue))
  14644. {
  14645. if (auto constAlign = BeValueDynCast<BeConstant>(castedInst->mArgs[3].mValue))
  14646. {
  14647. CreateMemCpy(GetOperand(castedInst->mArgs[0].mValue), GetOperand(castedInst->mArgs[1].mValue), constSize->mInt64, constAlign->mInt32);
  14648. break;
  14649. }
  14650. }
  14651. mcFunc = BeMCOperand::FromSymbolAddr(mCOFFObject->GetSymbolRef("memcpy")->mIdx);
  14652. //altArgs.insert(altArgs.begin(), castedInst->mArgs.begin(), castedInst->mArgs.begin() + 3);
  14653. for (int i = 0; i < 3; i++)
  14654. args.Add(castedInst->mArgs[i].mValue);
  14655. useAltArgs = true;
  14656. }
  14657. break;
  14658. case BfIRIntrinsic_MemMove:
  14659. {
  14660. mcFunc = BeMCOperand::FromSymbolAddr(mCOFFObject->GetSymbolRef("memmove")->mIdx);
  14661. //altArgs.insert(altArgs.begin(), castedInst->mArgs.begin(), castedInst->mArgs.begin() + 3);
  14662. for (int i = 0; i < 3; i++)
  14663. args.Add(castedInst->mArgs[i].mValue);
  14664. useAltArgs = true;
  14665. }
  14666. break;
  14667. default:
  14668. SoftFail("Intrinsic not handled", castedInst->mDbgLoc);
  14669. break;
  14670. }
  14671. }
  14672. else
  14673. {
  14674. if (auto func = BeValueDynCast<BeFunction>(castedInst->mFunc))
  14675. {
  14676. auto funcPtrType = func->mType;
  14677. if (funcPtrType->IsPointer())
  14678. {
  14679. auto elementType = ((BePointerType*)funcPtrType)->mElementType;
  14680. if (elementType->mTypeCode == BeTypeCode_Function)
  14681. {
  14682. isVarArg = ((BeFunctionType*)elementType)->mIsVarArg;
  14683. }
  14684. }
  14685. }
  14686. returnType = castedInst->GetType();
  14687. mcFunc = GetOperand(castedInst->mFunc);
  14688. }
  14689. if (mcFunc)
  14690. {
  14691. if (!useAltArgs)
  14692. {
  14693. BF_ASSERT(args.IsEmpty());
  14694. for (auto& arg : castedInst->mArgs)
  14695. args.Add(arg.mValue);
  14696. }
  14697. result = CreateCall(mcFunc, args, returnType, castedInst->mCallingConv, castedInst->HasStructRet(), castedInst->mNoReturn, isVarArg);
  14698. }
  14699. }
  14700. break;
  14701. case BeDbgDeclareInst::TypeId:
  14702. {
  14703. if (mDebugging)
  14704. {
  14705. NOP;
  14706. }
  14707. auto castedInst = (BeDbgDeclareInst*)inst;
  14708. auto dbgVar = castedInst->mDbgVar;
  14709. auto mcValue = GetOperand(castedInst->mValue);
  14710. auto mcVReg = mcValue;
  14711. auto vregInfo = GetVRegInfo(mcVReg);
  14712. if ((vregInfo != NULL) && (vregInfo->mDbgVariable != NULL))
  14713. {
  14714. auto shadowVReg = AllocVirtualReg(vregInfo->mType);
  14715. CreateDefineVReg(shadowVReg);
  14716. auto shadowVRegInfo = GetVRegInfo(shadowVReg);
  14717. shadowVRegInfo->mIsExpr = true;
  14718. shadowVRegInfo->mValueScopeRetainedKind = BeMCValueScopeRetainKind_Hard;
  14719. shadowVRegInfo->mRelTo = mcVReg;
  14720. shadowVRegInfo->mRelTo.mKind = BeMCOperandKind_VReg;
  14721. shadowVReg.mKind = mcVReg.mKind;
  14722. mcValue = shadowVReg;
  14723. mcVReg = shadowVReg;
  14724. vregInfo = shadowVRegInfo;
  14725. mValueToOperand[dbgVar] = shadowVReg;
  14726. }
  14727. else
  14728. {
  14729. mValueToOperand[dbgVar] = mcVReg;
  14730. }
  14731. dbgVar->mValue = castedInst->mValue;
  14732. dbgVar->mDeclDbgLoc = inst->mDbgLoc;
  14733. dbgVar->mIsValue = castedInst->mIsValue;
  14734. if (!mcVReg.IsVRegAny())
  14735. {
  14736. mcVReg = AllocVirtualReg(mModule->mContext->GetPrimitiveType(BeTypeCode_None));
  14737. vregInfo = GetVRegInfo(mcVReg);
  14738. // Allocate a vreg just to properly track the lifetime of this local constant
  14739. /*auto constType = GetType(mcVReg);
  14740. auto newVReg = AllocVirtualReg(constType);
  14741. vregInfo = GetVRegInfo(newVReg);
  14742. vregInfo->mIsExpr = true;
  14743. vregInfo->mRelTo = mcVReg;
  14744. mcVReg = newVReg;*/
  14745. }
  14746. vregInfo->mDbgVariable = dbgVar;
  14747. vregInfo->mMustExist = true;
  14748. dbgVar->mScope = mCurDbgLoc->mDbgScope;
  14749. dbgVar->mDeclMCBlockId = mcBlock->mBlockIdx;
  14750. AllocInst(BeMCInstKind_DbgDecl, mcVReg);
  14751. }
  14752. break;
  14753. default:
  14754. NotImpl();
  14755. break;
  14756. }
  14757. if (mFailed)
  14758. return;
  14759. if (result.mKind != BeMCOperandKind_None)
  14760. mValueToOperand[inst] = result;
  14761. }
  14762. inHeadAlloca = false;
  14763. isFirstBlock = false;
  14764. }
  14765. mCurDbgLoc = NULL;
  14766. BF_ASSERT(valueScopeStack.size() == 0);
  14767. BF_ASSERT(retCount == 1);
  14768. bool wantDebug = mDebugging;
  14769. //wantDebug |= function->mName == "?get__Yo@PoopBase@@UEAAUPloogB@@XZ";
  14770. //wantDebug |= function->mName == "?Testos@Fartso@@SAHPEA1@HH@Z";
  14771. //wantDebug |= function->mName == "?GetYoopA@Fartso@@QEAAUYoop@@XZ";
  14772. //"?TestVals@Fartso@@QEAATint@@XZ";
  14773. /*if (function->mName == "?TestVals@Fartso@@QEAATint@@PEA_J@Z")
  14774. {
  14775. //TODO: Temporary, force reg1 to spill
  14776. mVRegInfo[1]->mSpilled = true;
  14777. }*/
  14778. String str;
  14779. if (wantDebug)
  14780. {
  14781. str = "-------- Initial --------\n" + ToString();
  14782. OutputDebugStr(str.c_str());
  14783. } // Hi
  14784. DoTLSSetup();
  14785. DoChainedBlockMerge();
  14786. DetectLoops();
  14787. for (int pass = 0; pass < 3; pass++)
  14788. {
  14789. // Shouldn't have more than 2 passes
  14790. BF_ASSERT(pass != 2);
  14791. if (DoInitializedPass())
  14792. break;
  14793. }
  14794. if (wantDebug)
  14795. {
  14796. str = "-------- After DoDefPass --------\n" + ToString();
  14797. OutputDebugStr(str.c_str());
  14798. }
  14799. RefreshRefCounts();
  14800. GenerateLiveness();
  14801. if (wantDebug)
  14802. {
  14803. str = "--------After GenerateLiveness --------\n" + ToString();
  14804. OutputDebugStr(str.c_str());
  14805. }
  14806. DoInstCombinePass();
  14807. RefreshRefCounts();
  14808. if (wantDebug)
  14809. {
  14810. str = "--------After DoInstCombinePass--------\n" + ToString();
  14811. OutputDebugStr(str.c_str());
  14812. }
  14813. DoLoads();
  14814. for (int pass = 0; true; pass++)
  14815. {
  14816. DoRegAssignPass();
  14817. DoSanityChecking();
  14818. if (wantDebug)
  14819. {
  14820. str = "--------After RegAssignPass--------\n" + ToString();
  14821. OutputDebugStr(str.c_str());
  14822. }
  14823. bool regsDone = DoLegalization();
  14824. if (wantDebug)
  14825. {
  14826. str = "--------After Legalization--------\n" + ToString();
  14827. OutputDebugStr(str.c_str());
  14828. }
  14829. if (regsDone)
  14830. {
  14831. if (pass == 0)
  14832. {
  14833. if (wantDebug)
  14834. {
  14835. // The first pass may overestimate mem cost, so run another one
  14836. OutputDebugStr("Processing done on first pass, doing another register assign pass\n");
  14837. }
  14838. }
  14839. else
  14840. break;
  14841. }
  14842. //FOR TESTING
  14843. if (pass == 4)
  14844. {
  14845. NOP;
  14846. }
  14847. if (pass == 16)
  14848. {
  14849. Fail("Register assignment failed!");
  14850. }
  14851. // Reassign regs after legalization
  14852. //DoRegAssignPass();
  14853. }
  14854. DoRegFinalization();
  14855. if (wantDebug)
  14856. {
  14857. str = "--------After RegFinalization--------\n" + ToString();
  14858. OutputDebugStr(str);
  14859. }
  14860. DoBlockCombine();
  14861. if (wantDebug)
  14862. {
  14863. str = "--------After BlockCombine --------\n" + ToString();
  14864. OutputDebugStr(str);
  14865. }
  14866. while (true)
  14867. {
  14868. bool didWork = DoJumpRemovePass();
  14869. if (!didWork)
  14870. break;
  14871. RefreshRefCounts();
  14872. if (wantDebug)
  14873. {
  14874. str = "--------After DoJumpRemovePass --------\n" + ToString();
  14875. OutputDebugStr(str);
  14876. }
  14877. }
  14878. DoFrameObjPass(); // Must be (almost) last
  14879. if (wantDebug)
  14880. {
  14881. str = ToString();
  14882. OutputDebugStr(str.c_str());
  14883. }
  14884. DoCodeEmission();
  14885. }