llvm_backend_expr.cpp 171 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477
74778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527
752785279528052815282528352845285528652875288528952905291529252935294529552965297529852995300530153025303530453055306530753085309531053115312531353145315531653175318531953205321532253235324532553265327532853295330533153325333533453355336533753385339534053415342534353445345534653475348534953505351535253535354535553565357535853595360536153625363536453655366536753685369537053715372537353745375537653775378537953805381538253835384538553865387538853895390539153925393539453955396539753985399540054015402540354045405540654075408540954105411541254135414541554165417541854195420542154225423542454255426542754285429543054315432543354345435543654375438543954405441544254435444544554465447544854495450545154525453545454555456545754585459546054615462546354645465546654675468546954705471547254735474547554765477547854795480
  // Forward declaration of the matrix arithmetic emitter; its definition is not
  // in this part of the file. lb_emit_unary_arith below calls it to negate a
  // matrix as `0 - x` with component_wise set to true.
  1. gb_internal lbValue lb_emit_arith_matrix(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type, bool component_wise);
  2. gb_internal lbValue lb_emit_logical_binary_expr(lbProcedure *p, TokenKind op, Ast *left, Ast *right, Type *final_type) {
  3. lbModule *m = p->module;
  4. lbBlock *rhs = lb_create_block(p, "logical.cmp.rhs");
  5. lbBlock *done = lb_create_block(p, "logical.cmp.done");
  6. lbValue short_circuit = {};
  7. if (op == Token_CmpAnd) {
  8. lb_build_cond(p, left, rhs, done);
  9. short_circuit = lb_const_bool(m, t_llvm_bool, false);
  10. } else if (op == Token_CmpOr) {
  11. lb_build_cond(p, left, done, rhs);
  12. short_circuit = lb_const_bool(m, t_llvm_bool, true);
  13. }
  14. if (rhs->preds.count == 0) {
  15. lb_start_block(p, done);
  16. return short_circuit;
  17. }
  18. if (done->preds.count == 0) {
  19. lb_start_block(p, rhs);
  20. if (lb_is_expr_untyped_const(right)) {
  21. return lb_expr_untyped_const_to_typed(m, right, default_type(final_type));
  22. }
  23. return lb_build_expr(p, right);
  24. }
  25. Array<LLVMValueRef> incoming_values = {};
  26. Array<LLVMBasicBlockRef> incoming_blocks = {};
  27. array_init(&incoming_values, heap_allocator(), done->preds.count+1);
  28. array_init(&incoming_blocks, heap_allocator(), done->preds.count+1);
  29. for_array(i, done->preds) {
  30. incoming_values[i] = short_circuit.value;
  31. incoming_blocks[i] = done->preds[i]->block;
  32. }
  33. lb_start_block(p, rhs);
  34. lbValue edge = {};
  35. if (lb_is_expr_untyped_const(right)) {
  36. edge = lb_expr_untyped_const_to_typed(m, right, t_llvm_bool);
  37. } else {
  38. edge = lb_emit_conv(p, lb_build_expr(p, right), t_llvm_bool);
  39. }
  40. GB_ASSERT(edge.type == t_llvm_bool);
  41. incoming_values[done->preds.count] = edge.value;
  42. incoming_blocks[done->preds.count] = p->curr_block->block;
  43. lb_emit_jump(p, done);
  44. lb_start_block(p, done);
  45. LLVMTypeRef dst_type = lb_type(m, t_llvm_bool);
  46. LLVMValueRef phi = nullptr;
  47. GB_ASSERT(incoming_values.count == incoming_blocks.count);
  48. GB_ASSERT(incoming_values.count > 0);
  49. LLVMTypeRef phi_type = nullptr;
  50. for (LLVMValueRef incoming_value : incoming_values) {
  51. if (!LLVMIsConstant(incoming_value)) {
  52. phi_type = LLVMTypeOf(incoming_value);
  53. break;
  54. }
  55. }
  56. lbValue res = {};
  57. if (phi_type == nullptr) {
  58. phi = LLVMBuildPhi(p->builder, dst_type, "");
  59. LLVMAddIncoming(phi, incoming_values.data, incoming_blocks.data, cast(unsigned)incoming_values.count);
  60. res.value = phi;
  61. res.type = t_llvm_bool;
  62. } else {
  63. for_array(i, incoming_values) {
  64. LLVMValueRef incoming_value = incoming_values[i];
  65. LLVMTypeRef incoming_type = LLVMTypeOf(incoming_value);
  66. if (phi_type != incoming_type) {
  67. GB_ASSERT_MSG(LLVMIsConstant(incoming_value), "%s vs %s", LLVMPrintTypeToString(phi_type), LLVMPrintTypeToString(incoming_type));
  68. bool ok = !!LLVMConstIntGetZExtValue(incoming_value);
  69. incoming_values[i] = LLVMConstInt(phi_type, ok, false);
  70. }
  71. }
  72. // NOTE(bill): this now only uses i1 for the logic to prevent issues with corrupted booleans which are not of value 0 or 1 (e.g. 2)
  73. // Doing this may produce slightly worse code as a result but it will be correct behaviour
  74. phi = LLVMBuildPhi(p->builder, phi_type, "");
  75. LLVMAddIncoming(phi, incoming_values.data, incoming_blocks.data, cast(unsigned)incoming_values.count);
  76. res.value = phi;
  77. res.type = t_llvm_bool;
  78. }
  79. return lb_emit_conv(p, res, default_type(final_type));
  80. }
  81. gb_internal lbValue lb_emit_unary_arith(lbProcedure *p, TokenKind op, lbValue x, Type *type) {
  82. switch (op) {
  83. case Token_Add:
  84. return x;
  85. case Token_Not: // Boolean not
  86. case Token_Xor: // Bitwise not
  87. case Token_Sub: // Number negation
  88. break;
  89. case Token_Pointer:
  90. GB_PANIC("This should be handled elsewhere");
  91. break;
  92. }
  93. if (is_type_array_like(x.type)) {
  94. // IMPORTANT TODO(bill): This is very wasteful with regards to stack memory
  95. Type *tl = base_type(x.type);
  96. lbValue val = lb_address_from_load_or_generate_local(p, x);
  97. GB_ASSERT(is_type_array_like(type));
  98. Type *elem_type = base_array_type(type);
  99. // NOTE(bill): Doesn't need to be zero because it will be initialized in the loops
  100. lbAddr res_addr = lb_add_local(p, type, nullptr, false, true);
  101. lbValue res = lb_addr_get_ptr(p, res_addr);
  102. bool inline_array_arith = lb_can_try_to_inline_array_arith(type);
  103. i32 count = cast(i32)get_array_type_count(tl);
  104. LLVMTypeRef vector_type = nullptr;
  105. if (op != Token_Not && lb_try_vector_cast(p->module, val, &vector_type)) {
  106. LLVMValueRef vp = LLVMBuildPointerCast(p->builder, val.value, LLVMPointerType(vector_type, 0), "");
  107. LLVMValueRef v = LLVMBuildLoad2(p->builder, vector_type, vp, "");
  108. LLVMValueRef opv = nullptr;
  109. switch (op) {
  110. case Token_Xor:
  111. opv = LLVMBuildNot(p->builder, v, "");
  112. break;
  113. case Token_Sub:
  114. if (is_type_float(elem_type)) {
  115. opv = LLVMBuildFNeg(p->builder, v, "");
  116. } else {
  117. opv = LLVMBuildNeg(p->builder, v, "");
  118. }
  119. break;
  120. }
  121. if (opv != nullptr) {
  122. LLVMSetAlignment(res.value, cast(unsigned)lb_alignof(vector_type));
  123. LLVMValueRef res_ptr = LLVMBuildPointerCast(p->builder, res.value, LLVMPointerType(vector_type, 0), "");
  124. LLVMBuildStore(p->builder, opv, res_ptr);
  125. return lb_emit_conv(p, lb_emit_load(p, res), type);
  126. }
  127. }
  128. if (inline_array_arith) {
  129. // inline
  130. for (i32 i = 0; i < count; i++) {
  131. lbValue e = lb_emit_load(p, lb_emit_array_epi(p, val, i));
  132. lbValue z = lb_emit_unary_arith(p, op, e, elem_type);
  133. lb_emit_store(p, lb_emit_array_epi(p, res, i), z);
  134. }
  135. } else {
  136. auto loop_data = lb_loop_start(p, count, t_i32);
  137. lbValue e = lb_emit_load(p, lb_emit_array_ep(p, val, loop_data.idx));
  138. lbValue z = lb_emit_unary_arith(p, op, e, elem_type);
  139. lb_emit_store(p, lb_emit_array_ep(p, res, loop_data.idx), z);
  140. lb_loop_end(p, loop_data);
  141. }
  142. return lb_emit_load(p, res);
  143. }
  144. if (op == Token_Xor) {
  145. lbValue cmp = {};
  146. cmp.value = LLVMBuildNot(p->builder, x.value, "");
  147. cmp.type = x.type;
  148. return lb_emit_conv(p, cmp, type);
  149. }
  150. if (op == Token_Not) {
  151. lbValue cmp = {};
  152. LLVMValueRef zero = LLVMConstInt(lb_type(p->module, x.type), 0, false);
  153. cmp.value = LLVMBuildICmp(p->builder, LLVMIntEQ, x.value, zero, "");
  154. cmp.type = t_llvm_bool;
  155. return lb_emit_conv(p, cmp, type);
  156. }
  157. if (op == Token_Sub && is_type_integer(type) && is_type_different_to_arch_endianness(type)) {
  158. Type *platform_type = integer_endian_type_to_platform_type(type);
  159. lbValue v = lb_emit_byte_swap(p, x, platform_type);
  160. lbValue res = {};
  161. res.value = LLVMBuildNeg(p->builder, v.value, "");
  162. res.type = platform_type;
  163. return lb_emit_byte_swap(p, res, type);
  164. }
  165. if (op == Token_Sub && is_type_float(type) && is_type_different_to_arch_endianness(type)) {
  166. Type *platform_type = integer_endian_type_to_platform_type(type);
  167. lbValue v = lb_emit_byte_swap(p, x, platform_type);
  168. lbValue res = {};
  169. res.value = LLVMBuildFNeg(p->builder, v.value, "");
  170. res.type = platform_type;
  171. return lb_emit_byte_swap(p, res, type);
  172. }
  173. lbValue res = {};
  174. switch (op) {
  175. case Token_Not: // Boolean not
  176. case Token_Xor: // Bitwise not
  177. res.value = LLVMBuildNot(p->builder, x.value, "");
  178. res.type = x.type;
  179. return res;
  180. case Token_Sub: // Number negation
  181. if (is_type_integer(x.type)) {
  182. res.value = LLVMBuildNeg(p->builder, x.value, "");
  183. } else if (is_type_float(x.type)) {
  184. res.value = LLVMBuildFNeg(p->builder, x.value, "");
  185. } else if (is_type_complex(x.type)) {
  186. LLVMValueRef v0 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 0, ""), "");
  187. LLVMValueRef v1 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 1, ""), "");
  188. lbAddr addr = lb_add_local_generated(p, x.type, false);
  189. LLVMTypeRef type = llvm_addr_type(p->module, addr.addr);
  190. LLVMBuildStore(p->builder, v0, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 0, ""));
  191. LLVMBuildStore(p->builder, v1, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 1, ""));
  192. return lb_addr_load(p, addr);
  193. } else if (is_type_quaternion(x.type)) {
  194. LLVMValueRef v0 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 0, ""), "");
  195. LLVMValueRef v1 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 1, ""), "");
  196. LLVMValueRef v2 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 2, ""), "");
  197. LLVMValueRef v3 = LLVMBuildFNeg(p->builder, LLVMBuildExtractValue(p->builder, x.value, 3, ""), "");
  198. lbAddr addr = lb_add_local_generated(p, x.type, false);
  199. LLVMTypeRef type = llvm_addr_type(p->module, addr.addr);
  200. LLVMBuildStore(p->builder, v0, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 0, ""));
  201. LLVMBuildStore(p->builder, v1, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 1, ""));
  202. LLVMBuildStore(p->builder, v2, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 2, ""));
  203. LLVMBuildStore(p->builder, v3, LLVMBuildStructGEP2(p->builder, type, addr.addr.value, 3, ""));
  204. return lb_addr_load(p, addr);
  205. } else if (is_type_simd_vector(x.type)) {
  206. Type *elem = base_array_type(x.type);
  207. if (is_type_float(elem)) {
  208. res.value = LLVMBuildFNeg(p->builder, x.value, "");
  209. } else {
  210. res.value = LLVMBuildNeg(p->builder, x.value, "");
  211. }
  212. } else if (is_type_matrix(x.type)) {
  213. lbValue zero = {};
  214. zero.value = LLVMConstNull(lb_type(p->module, type));
  215. zero.type = type;
  216. return lb_emit_arith_matrix(p, Token_Sub, zero, x, type, true);
  217. } else {
  218. GB_PANIC("Unhandled type %s", type_to_string(x.type));
  219. }
  220. res.type = x.type;
  221. return res;
  222. }
  223. return res;
  224. }
  225. gb_internal bool lb_try_direct_vector_arith(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type, lbValue *res_) {
  226. GB_ASSERT(is_type_array_like(type));
  227. Type *elem_type = base_array_type(type);
  228. // NOTE(bill): Shift operations cannot be easily dealt with due to Odin's semantics
  229. if (op == Token_Shl || op == Token_Shr) {
  230. return false;
  231. }
  232. if (!LLVMIsALoadInst(lhs.value) || !LLVMIsALoadInst(rhs.value)) {
  233. return false;
  234. }
  235. lbValue lhs_ptr = {};
  236. lbValue rhs_ptr = {};
  237. lhs_ptr.value = LLVMGetOperand(lhs.value, 0);
  238. lhs_ptr.type = alloc_type_pointer(lhs.type);
  239. rhs_ptr.value = LLVMGetOperand(rhs.value, 0);
  240. rhs_ptr.type = alloc_type_pointer(rhs.type);
  241. LLVMTypeRef vector_type0 = nullptr;
  242. LLVMTypeRef vector_type1 = nullptr;
  243. if (lb_try_vector_cast(p->module, lhs_ptr, &vector_type0) &&
  244. lb_try_vector_cast(p->module, rhs_ptr, &vector_type1)) {
  245. GB_ASSERT(vector_type0 == vector_type1);
  246. LLVMTypeRef vector_type = vector_type0;
  247. Type *integral_type = base_type(elem_type);
  248. if (is_type_simd_vector(integral_type)) {
  249. integral_type = core_array_type(integral_type);
  250. }
  251. if (is_type_bit_set(integral_type)) {
  252. switch (op) {
  253. case Token_Add: op = Token_Or; break;
  254. case Token_Sub: op = Token_AndNot; break;
  255. }
  256. Type *u = bit_set_to_int(type);
  257. if (is_type_array(u)) {
  258. return false;
  259. }
  260. }
  261. LLVMValueRef lhs_vp = LLVMBuildPointerCast(p->builder, lhs_ptr.value, LLVMPointerType(vector_type, 0), "");
  262. LLVMValueRef rhs_vp = LLVMBuildPointerCast(p->builder, rhs_ptr.value, LLVMPointerType(vector_type, 0), "");
  263. LLVMValueRef x = LLVMBuildLoad2(p->builder, vector_type, lhs_vp, "");
  264. LLVMValueRef y = LLVMBuildLoad2(p->builder, vector_type, rhs_vp, "");
  265. LLVMValueRef z = nullptr;
  266. if (is_type_float(integral_type)) {
  267. switch (op) {
  268. case Token_Add:
  269. z = LLVMBuildFAdd(p->builder, x, y, "");
  270. break;
  271. case Token_Sub:
  272. z = LLVMBuildFSub(p->builder, x, y, "");
  273. break;
  274. case Token_Mul:
  275. z = LLVMBuildFMul(p->builder, x, y, "");
  276. break;
  277. case Token_Quo:
  278. z = LLVMBuildFDiv(p->builder, x, y, "");
  279. break;
  280. case Token_Mod:
  281. z = LLVMBuildFRem(p->builder, x, y, "");
  282. break;
  283. default:
  284. GB_PANIC("Unsupported vector operation %.*s", LIT(token_strings[op]));
  285. break;
  286. }
  287. } else {
  288. switch (op) {
  289. case Token_Add:
  290. z = LLVMBuildAdd(p->builder, x, y, "");
  291. break;
  292. case Token_Sub:
  293. z = LLVMBuildSub(p->builder, x, y, "");
  294. break;
  295. case Token_Mul:
  296. z = LLVMBuildMul(p->builder, x, y, "");
  297. break;
  298. case Token_Quo:
  299. if (is_type_unsigned(integral_type)) {
  300. z = LLVMBuildUDiv(p->builder, x, y, "");
  301. } else {
  302. z = LLVMBuildSDiv(p->builder, x, y, "");
  303. }
  304. break;
  305. case Token_Mod:
  306. if (is_type_unsigned(integral_type)) {
  307. z = LLVMBuildURem(p->builder, x, y, "");
  308. } else {
  309. z = LLVMBuildSRem(p->builder, x, y, "");
  310. }
  311. break;
  312. case Token_ModMod:
  313. if (is_type_unsigned(integral_type)) {
  314. z = LLVMBuildURem(p->builder, x, y, "");
  315. } else {
  316. LLVMValueRef a = LLVMBuildSRem(p->builder, x, y, "");
  317. LLVMValueRef b = LLVMBuildAdd(p->builder, a, y, "");
  318. z = LLVMBuildSRem(p->builder, b, y, "");
  319. }
  320. break;
  321. case Token_And:
  322. z = LLVMBuildAnd(p->builder, x, y, "");
  323. break;
  324. case Token_AndNot:
  325. z = LLVMBuildAnd(p->builder, x, LLVMBuildNot(p->builder, y, ""), "");
  326. break;
  327. case Token_Or:
  328. z = LLVMBuildOr(p->builder, x, y, "");
  329. break;
  330. case Token_Xor:
  331. z = LLVMBuildXor(p->builder, x, y, "");
  332. break;
  333. default:
  334. GB_PANIC("Unsupported vector operation");
  335. break;
  336. }
  337. }
  338. if (z != nullptr) {
  339. lbAddr res = lb_add_local_generated_temp(p, type, lb_alignof(vector_type));
  340. LLVMValueRef vp = LLVMBuildPointerCast(p->builder, res.addr.value, LLVMPointerType(vector_type, 0), "");
  341. LLVMBuildStore(p->builder, z, vp);
  342. lbValue v = lb_addr_load(p, res);
  343. if (res_) *res_ = v;
  344. return true;
  345. }
  346. }
  347. return false;
  348. }
  349. gb_internal lbValue lb_emit_arith_array(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type) {
  350. GB_ASSERT(is_type_array_like(lhs.type) || is_type_array_like(rhs.type));
  351. lhs = lb_emit_conv(p, lhs, type);
  352. rhs = lb_emit_conv(p, rhs, type);
  353. GB_ASSERT(is_type_array_like(type));
  354. Type *elem_type = base_array_type(type);
  355. i64 count = get_array_type_count(type);
  356. unsigned n = cast(unsigned)count;
  357. // NOTE(bill, 2021-06-12): Try to do a direct operation as a vector, if possible
  358. lbValue direct_vector_res = {};
  359. if (lb_try_direct_vector_arith(p, op, lhs, rhs, type, &direct_vector_res)) {
  360. return direct_vector_res;
  361. }
  362. bool inline_array_arith = lb_can_try_to_inline_array_arith(type);
  363. if (inline_array_arith) {
  364. auto dst_ptrs = slice_make<lbValue>(temporary_allocator(), n);
  365. auto a_loads = slice_make<lbValue>(temporary_allocator(), n);
  366. auto b_loads = slice_make<lbValue>(temporary_allocator(), n);
  367. auto c_ops = slice_make<lbValue>(temporary_allocator(), n);
  368. for (unsigned i = 0; i < n; i++) {
  369. a_loads[i].value = LLVMBuildExtractValue(p->builder, lhs.value, i, "");
  370. a_loads[i].type = elem_type;
  371. }
  372. for (unsigned i = 0; i < n; i++) {
  373. b_loads[i].value = LLVMBuildExtractValue(p->builder, rhs.value, i, "");
  374. b_loads[i].type = elem_type;
  375. }
  376. for (unsigned i = 0; i < n; i++) {
  377. c_ops[i] = lb_emit_arith(p, op, a_loads[i], b_loads[i], elem_type);
  378. }
  379. lbAddr res = lb_add_local_generated(p, type, false);
  380. for (unsigned i = 0; i < n; i++) {
  381. dst_ptrs[i] = lb_emit_array_epi(p, res.addr, i);
  382. }
  383. for (unsigned i = 0; i < n; i++) {
  384. lb_emit_store(p, dst_ptrs[i], c_ops[i]);
  385. }
  386. return lb_addr_load(p, res);
  387. } else {
  388. lbValue x = lb_address_from_load_or_generate_local(p, lhs);
  389. lbValue y = lb_address_from_load_or_generate_local(p, rhs);
  390. lbAddr res = lb_add_local_generated(p, type, false);
  391. auto loop_data = lb_loop_start(p, cast(isize)count, t_i32);
  392. lbValue a_ptr = lb_emit_array_ep(p, x, loop_data.idx);
  393. lbValue b_ptr = lb_emit_array_ep(p, y, loop_data.idx);
  394. lbValue dst_ptr = lb_emit_array_ep(p, res.addr, loop_data.idx);
  395. lbValue a = lb_emit_load(p, a_ptr);
  396. lbValue b = lb_emit_load(p, b_ptr);
  397. lbValue c = lb_emit_arith(p, op, a, b, elem_type);
  398. lb_emit_store(p, dst_ptr, c);
  399. lb_loop_end(p, loop_data);
  400. return lb_addr_load(p, res);
  401. }
  402. }
  403. gb_internal bool lb_is_matrix_simdable(Type *t) {
  404. Type *mt = base_type(t);
  405. GB_ASSERT(mt->kind == Type_Matrix);
  406. Type *elem = core_type(mt->Matrix.elem);
  407. if (is_type_complex(elem)) {
  408. return false;
  409. }
  410. if (is_type_different_to_arch_endianness(elem)) {
  411. return false;
  412. }
  413. switch (build_context.metrics.arch) {
  414. default:
  415. return false;
  416. case TargetArch_amd64:
  417. case TargetArch_arm64:
  418. break;
  419. }
  420. if (type_align_of(t) < 16) {
  421. // it's not aligned well enough to use the vector instructions
  422. return false;
  423. }
  424. if ((mt->Matrix.row_count & 1) ^ (mt->Matrix.column_count & 1)) {
  425. return false;
  426. }
  427. if (mt->Matrix.is_row_major) {
  428. // TODO(bill): make #row_major matrices work with SIMD
  429. return false;
  430. }
  431. if (elem->kind == Type_Basic) {
  432. switch (elem->Basic.kind) {
  433. case Basic_f16:
  434. case Basic_f16le:
  435. case Basic_f16be:
  436. switch (build_context.metrics.arch) {
  437. case TargetArch_amd64:
  438. return false;
  439. case TargetArch_arm64:
  440. // TODO(bill): determine when this is fine
  441. return true;
  442. case TargetArch_i386:
  443. case TargetArch_wasm32:
  444. case TargetArch_wasm64p32:
  445. return false;
  446. }
  447. }
  448. }
  449. return true;
  450. }
  451. gb_internal LLVMValueRef lb_matrix_to_vector(lbProcedure *p, lbValue matrix) {
  452. Type *mt = base_type(matrix.type);
  453. GB_ASSERT(mt->kind == Type_Matrix);
  454. LLVMTypeRef elem_type = lb_type(p->module, mt->Matrix.elem);
  455. unsigned total_count = cast(unsigned)matrix_type_total_internal_elems(mt);
  456. LLVMTypeRef total_matrix_type = LLVMVectorType(elem_type, total_count);
  457. #if 1
  458. LLVMValueRef ptr = lb_address_from_load_or_generate_local(p, matrix).value;
  459. LLVMValueRef matrix_vector_ptr = LLVMBuildPointerCast(p->builder, ptr, LLVMPointerType(total_matrix_type, 0), "");
  460. LLVMValueRef matrix_vector = LLVMBuildLoad2(p->builder, total_matrix_type, matrix_vector_ptr, "");
  461. LLVMSetAlignment(matrix_vector, cast(unsigned)type_align_of(mt));
  462. return matrix_vector;
  463. #else
  464. LLVMValueRef matrix_vector = LLVMBuildBitCast(p->builder, matrix.value, total_matrix_type, "");
  465. return matrix_vector;
  466. #endif
  467. }
  468. gb_internal LLVMValueRef lb_matrix_trimmed_vector_mask(lbProcedure *p, Type *mt) {
  469. mt = base_type(mt);
  470. GB_ASSERT(mt->kind == Type_Matrix);
  471. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  472. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  473. unsigned column_count = cast(unsigned)mt->Matrix.column_count;
  474. unsigned mask_elems_index = 0;
  475. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), row_count*column_count);
  476. for (unsigned j = 0; j < column_count; j++) {
  477. for (unsigned i = 0; i < row_count; i++) {
  478. unsigned offset = stride*j + i;
  479. mask_elems[mask_elems_index++] = lb_const_int(p->module, t_u32, offset).value;
  480. }
  481. }
  482. LLVMValueRef mask = LLVMConstVector(mask_elems.data, cast(unsigned)mask_elems.count);
  483. return mask;
  484. }
  485. gb_internal LLVMValueRef lb_matrix_to_trimmed_vector(lbProcedure *p, lbValue m) {
  486. LLVMValueRef vector = lb_matrix_to_vector(p, m);
  487. Type *mt = base_type(m.type);
  488. GB_ASSERT(mt->kind == Type_Matrix);
  489. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  490. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  491. if (stride == row_count) {
  492. return vector;
  493. }
  494. LLVMValueRef mask = lb_matrix_trimmed_vector_mask(p, mt);
  495. LLVMValueRef trimmed_vector = llvm_basic_shuffle(p, vector, mask);
  496. return trimmed_vector;
  497. }
  498. gb_internal lbValue lb_emit_matrix_tranpose(lbProcedure *p, lbValue m, Type *type) {
  499. if (is_type_array(m.type)) {
  500. i32 rank = type_math_rank(m.type);
  501. if (rank == 2) {
  502. lbAddr addr = lb_add_local_generated(p, type, false);
  503. lbValue dst = addr.addr;
  504. lbValue src = m;
  505. i32 n = cast(i32)get_array_type_count(m.type);
  506. i32 m = cast(i32)get_array_type_count(type);
  507. // m.type == [n][m]T
  508. // type == [m][n]T
  509. for (i32 j = 0; j < m; j++) {
  510. lbValue dst_col = lb_emit_struct_ep(p, dst, j);
  511. for (i32 i = 0; i < n; i++) {
  512. lbValue dst_row = lb_emit_struct_ep(p, dst_col, i);
  513. lbValue src_col = lb_emit_struct_ev(p, src, i);
  514. lbValue src_row = lb_emit_struct_ev(p, src_col, j);
  515. lb_emit_store(p, dst_row, src_row);
  516. }
  517. }
  518. return lb_addr_load(p, addr);
  519. }
  520. // no-op
  521. m.type = type;
  522. return m;
  523. }
  524. Type *mt = base_type(m.type);
  525. GB_ASSERT(mt->kind == Type_Matrix);
  526. if (lb_is_matrix_simdable(mt)) {
  527. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  528. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  529. unsigned column_count = cast(unsigned)mt->Matrix.column_count;
  530. auto rows = slice_make<LLVMValueRef>(permanent_allocator(), row_count);
  531. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  532. LLVMValueRef vector = lb_matrix_to_vector(p, m);
  533. for (unsigned i = 0; i < row_count; i++) {
  534. for (unsigned j = 0; j < column_count; j++) {
  535. unsigned offset = stride*j + i;
  536. mask_elems[j] = lb_const_int(p->module, t_u32, offset).value;
  537. }
  538. // transpose mask
  539. LLVMValueRef mask = LLVMConstVector(mask_elems.data, column_count);
  540. LLVMValueRef row = llvm_basic_shuffle(p, vector, mask);
  541. rows[i] = row;
  542. }
  543. lbAddr res = lb_add_local_generated(p, type, true);
  544. for_array(i, rows) {
  545. LLVMValueRef row = rows[i];
  546. lbValue dst_row_ptr = lb_emit_matrix_epi(p, res.addr, 0, i);
  547. LLVMValueRef ptr = dst_row_ptr.value;
  548. ptr = LLVMBuildPointerCast(p->builder, ptr, LLVMPointerType(LLVMTypeOf(row), 0), "");
  549. LLVMBuildStore(p->builder, row, ptr);
  550. }
  551. return lb_addr_load(p, res);
  552. }
  553. lbAddr res = lb_add_local_generated(p, type, true);
  554. i64 row_count = mt->Matrix.row_count;
  555. i64 column_count = mt->Matrix.column_count;
  556. for (i64 j = 0; j < column_count; j++) {
  557. for (i64 i = 0; i < row_count; i++) {
  558. lbValue src = lb_emit_matrix_ev(p, m, i, j);
  559. lbValue dst = lb_emit_matrix_epi(p, res.addr, j, i);
  560. lb_emit_store(p, dst, src);
  561. }
  562. }
  563. return lb_addr_load(p, res);
  564. }
  565. gb_internal lbValue lb_matrix_cast_vector_to_type(lbProcedure *p, LLVMValueRef vector, Type *type) {
  566. lbAddr res = lb_add_local_generated(p, type, true);
  567. LLVMValueRef res_ptr = res.addr.value;
  568. unsigned alignment = cast(unsigned)gb_max(type_align_of(type), lb_alignof(LLVMTypeOf(vector)));
  569. LLVMSetAlignment(res_ptr, alignment);
  570. res_ptr = LLVMBuildPointerCast(p->builder, res_ptr, LLVMPointerType(LLVMTypeOf(vector), 0), "");
  571. LLVMBuildStore(p->builder, vector, res_ptr);
  572. return lb_addr_load(p, res);
  573. }
  574. gb_internal lbValue lb_emit_matrix_flatten(lbProcedure *p, lbValue m, Type *type) {
  575. if (is_type_array(m.type)) {
  576. // no-op
  577. m.type = type;
  578. return m;
  579. }
  580. Type *mt = base_type(m.type);
  581. GB_ASSERT(mt->kind == Type_Matrix);
  582. lbAddr res = lb_add_local_generated(p, type, true);
  583. i64 row_count = mt->Matrix.row_count;
  584. i64 column_count = mt->Matrix.column_count;
  585. TEMPORARY_ALLOCATOR_GUARD();
  586. auto srcs = array_make<lbValue>(temporary_allocator(), 0, row_count*column_count);
  587. auto dsts = array_make<lbValue>(temporary_allocator(), 0, row_count*column_count);
  588. for (i64 j = 0; j < column_count; j++) {
  589. for (i64 i = 0; i < row_count; i++) {
  590. lbValue src = lb_emit_matrix_ev(p, m, i, j);
  591. array_add(&srcs, src);
  592. }
  593. }
  594. for (i64 j = 0; j < column_count; j++) {
  595. for (i64 i = 0; i < row_count; i++) {
  596. lbValue dst = lb_emit_array_epi(p, res.addr, i + j*row_count);
  597. array_add(&dsts, dst);
  598. }
  599. }
  600. GB_ASSERT(srcs.count == dsts.count);
  601. for_array(i, srcs) {
  602. lb_emit_store(p, dsts[i], srcs[i]);
  603. }
  604. return lb_addr_load(p, res);
  605. }
  606. gb_internal lbValue lb_emit_outer_product(lbProcedure *p, lbValue a, lbValue b, Type *type) {
  607. Type *mt = base_type(type);
  608. Type *at = base_type(a.type);
  609. Type *bt = base_type(b.type);
  610. GB_ASSERT(mt->kind == Type_Matrix);
  611. GB_ASSERT(at->kind == Type_Array);
  612. GB_ASSERT(bt->kind == Type_Array);
  613. i64 row_count = mt->Matrix.row_count;
  614. i64 column_count = mt->Matrix.column_count;
  615. GB_ASSERT(row_count == at->Array.count);
  616. GB_ASSERT(column_count == bt->Array.count);
  617. lbAddr res = lb_add_local_generated(p, type, true);
  618. for (i64 j = 0; j < column_count; j++) {
  619. for (i64 i = 0; i < row_count; i++) {
  620. lbValue x = lb_emit_struct_ev(p, a, cast(i32)i);
  621. lbValue y = lb_emit_struct_ev(p, b, cast(i32)j);
  622. lbValue src = lb_emit_arith(p, Token_Mul, x, y, mt->Matrix.elem);
  623. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  624. lb_emit_store(p, dst, src);
  625. }
  626. }
  627. return lb_addr_load(p, res);
  628. }
  629. gb_internal lbValue lb_emit_matrix_mul(lbProcedure *p, lbValue lhs, lbValue rhs, Type *type) {
  630. // TODO(bill): Handle edge case for f16 types on x86(-64) platforms
  631. Type *xt = base_type(lhs.type);
  632. Type *yt = base_type(rhs.type);
  633. GB_ASSERT(is_type_matrix(type));
  634. GB_ASSERT(is_type_matrix(xt));
  635. GB_ASSERT(is_type_matrix(yt));
  636. GB_ASSERT(xt->Matrix.column_count == yt->Matrix.row_count);
  637. GB_ASSERT(are_types_identical(xt->Matrix.elem, yt->Matrix.elem));
  638. GB_ASSERT(xt->Matrix.is_row_major == yt->Matrix.is_row_major);
  639. Type *elem = xt->Matrix.elem;
  640. unsigned outer_rows = cast(unsigned)xt->Matrix.row_count;
  641. unsigned inner = cast(unsigned)xt->Matrix.column_count;
  642. unsigned outer_columns = cast(unsigned)yt->Matrix.column_count;
  643. if (!xt->Matrix.is_row_major && lb_is_matrix_simdable(xt)) {
  644. unsigned x_stride = cast(unsigned)matrix_type_stride_in_elems(xt);
  645. unsigned y_stride = cast(unsigned)matrix_type_stride_in_elems(yt);
  646. auto x_rows = slice_make<LLVMValueRef>(permanent_allocator(), outer_rows);
  647. auto y_columns = slice_make<LLVMValueRef>(permanent_allocator(), outer_columns);
  648. LLVMValueRef x_vector = lb_matrix_to_vector(p, lhs);
  649. LLVMValueRef y_vector = lb_matrix_to_vector(p, rhs);
  650. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), inner);
  651. for (unsigned i = 0; i < outer_rows; i++) {
  652. for (unsigned j = 0; j < inner; j++) {
  653. unsigned offset = x_stride*j + i;
  654. mask_elems[j] = lb_const_int(p->module, t_u32, offset).value;
  655. }
  656. // transpose mask
  657. LLVMValueRef mask = LLVMConstVector(mask_elems.data, inner);
  658. LLVMValueRef row = llvm_basic_shuffle(p, x_vector, mask);
  659. x_rows[i] = row;
  660. }
  661. for (unsigned i = 0; i < outer_columns; i++) {
  662. LLVMValueRef mask = llvm_mask_iota(p->module, y_stride*i, inner);
  663. LLVMValueRef column = llvm_basic_shuffle(p, y_vector, mask);
  664. y_columns[i] = column;
  665. }
  666. lbAddr res = lb_add_local_generated(p, type, true);
  667. for_array(i, x_rows) {
  668. LLVMValueRef x_row = x_rows[i];
  669. for_array(j, y_columns) {
  670. LLVMValueRef y_column = y_columns[j];
  671. LLVMValueRef elem = llvm_vector_dot(p, x_row, y_column);
  672. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  673. LLVMBuildStore(p->builder, elem, dst.value);
  674. }
  675. }
  676. return lb_addr_load(p, res);
  677. }
  678. if (!xt->Matrix.is_row_major) {
  679. lbAddr res = lb_add_local_generated(p, type, true);
  680. auto inners = slice_make<lbValue[2]>(permanent_allocator(), inner);
  681. for (unsigned j = 0; j < outer_columns; j++) {
  682. for (unsigned i = 0; i < outer_rows; i++) {
  683. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  684. for (unsigned k = 0; k < inner; k++) {
  685. inners[k][0] = lb_emit_matrix_ev(p, lhs, i, k);
  686. inners[k][1] = lb_emit_matrix_ev(p, rhs, k, j);
  687. }
  688. lbValue sum = lb_const_nil(p->module, elem);
  689. for (unsigned k = 0; k < inner; k++) {
  690. lbValue a = inners[k][0];
  691. lbValue b = inners[k][1];
  692. sum = lb_emit_mul_add(p, a, b, sum, elem);
  693. }
  694. lb_emit_store(p, dst, sum);
  695. }
  696. }
  697. return lb_addr_load(p, res);
  698. } else {
  699. lbAddr res = lb_add_local_generated(p, type, true);
  700. auto inners = slice_make<lbValue[2]>(permanent_allocator(), inner);
  701. for (unsigned i = 0; i < outer_rows; i++) {
  702. for (unsigned j = 0; j < outer_columns; j++) {
  703. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, j);
  704. for (unsigned k = 0; k < inner; k++) {
  705. inners[k][0] = lb_emit_matrix_ev(p, lhs, i, k);
  706. inners[k][1] = lb_emit_matrix_ev(p, rhs, k, j);
  707. }
  708. lbValue sum = lb_const_nil(p->module, elem);
  709. for (unsigned k = 0; k < inner; k++) {
  710. lbValue a = inners[k][0];
  711. lbValue b = inners[k][1];
  712. sum = lb_emit_mul_add(p, a, b, sum, elem);
  713. }
  714. lb_emit_store(p, dst, sum);
  715. }
  716. }
  717. return lb_addr_load(p, res);
  718. }
  719. }
  720. gb_internal lbValue lb_emit_matrix_mul_vector(lbProcedure *p, lbValue lhs, lbValue rhs, Type *type) {
  721. // TODO(bill): Handle edge case for f16 types on x86(-64) platforms
  722. Type *mt = base_type(lhs.type);
  723. Type *vt = base_type(rhs.type);
  724. GB_ASSERT(is_type_matrix(mt));
  725. GB_ASSERT(is_type_array_like(vt));
  726. i64 vector_count = get_array_type_count(vt);
  727. GB_ASSERT(mt->Matrix.column_count == vector_count);
  728. GB_ASSERT(are_types_identical(mt->Matrix.elem, base_array_type(vt)));
  729. Type *elem = mt->Matrix.elem;
  730. if (!mt->Matrix.is_row_major && lb_is_matrix_simdable(mt)) {
  731. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  732. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  733. unsigned column_count = cast(unsigned)mt->Matrix.column_count;
  734. auto m_columns = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  735. auto v_rows = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  736. LLVMValueRef matrix_vector = lb_matrix_to_vector(p, lhs);
  737. for (unsigned column_index = 0; column_index < column_count; column_index++) {
  738. LLVMValueRef mask = llvm_mask_iota(p->module, stride*column_index, row_count);
  739. LLVMValueRef column = llvm_basic_shuffle(p, matrix_vector, mask);
  740. m_columns[column_index] = column;
  741. }
  742. for (unsigned row_index = 0; row_index < column_count; row_index++) {
  743. LLVMValueRef value = lb_emit_struct_ev(p, rhs, row_index).value;
  744. LLVMValueRef row = llvm_vector_broadcast(p, value, row_count);
  745. v_rows[row_index] = row;
  746. }
  747. GB_ASSERT(column_count > 0);
  748. LLVMValueRef vector = nullptr;
  749. for (i64 i = 0; i < column_count; i++) {
  750. if (i == 0) {
  751. vector = llvm_vector_mul(p, m_columns[i], v_rows[i]);
  752. } else {
  753. vector = llvm_vector_mul_add(p, m_columns[i], v_rows[i], vector);
  754. }
  755. }
  756. return lb_matrix_cast_vector_to_type(p, vector, type);
  757. }
  758. lbAddr res = lb_add_local_generated(p, type, true);
  759. for (i64 i = 0; i < mt->Matrix.row_count; i++) {
  760. for (i64 j = 0; j < mt->Matrix.column_count; j++) {
  761. lbValue dst = lb_emit_matrix_epi(p, res.addr, i, 0);
  762. lbValue d0 = lb_emit_load(p, dst);
  763. lbValue a = lb_emit_matrix_ev(p, lhs, i, j);
  764. lbValue b = lb_emit_struct_ev(p, rhs, cast(i32)j);
  765. lbValue c = lb_emit_mul_add(p, a, b, d0, elem);
  766. lb_emit_store(p, dst, c);
  767. }
  768. }
  769. return lb_addr_load(p, res);
  770. }
  771. gb_internal lbValue lb_emit_vector_mul_matrix(lbProcedure *p, lbValue lhs, lbValue rhs, Type *type) {
  772. // TODO(bill): Handle edge case for f16 types on x86(-64) platforms
  773. Type *mt = base_type(rhs.type);
  774. Type *vt = base_type(lhs.type);
  775. GB_ASSERT(is_type_matrix(mt));
  776. GB_ASSERT(is_type_array_like(vt));
  777. i64 vector_count = get_array_type_count(vt);
  778. GB_ASSERT(vector_count == mt->Matrix.row_count);
  779. GB_ASSERT(are_types_identical(mt->Matrix.elem, base_array_type(vt)));
  780. Type *elem = mt->Matrix.elem;
  781. if (!mt->Matrix.is_row_major && lb_is_matrix_simdable(mt)) {
  782. unsigned stride = cast(unsigned)matrix_type_stride_in_elems(mt);
  783. unsigned row_count = cast(unsigned)mt->Matrix.row_count;
  784. unsigned column_count = cast(unsigned)mt->Matrix.column_count; gb_unused(column_count);
  785. auto m_columns = slice_make<LLVMValueRef>(permanent_allocator(), row_count);
  786. auto v_rows = slice_make<LLVMValueRef>(permanent_allocator(), row_count);
  787. LLVMValueRef matrix_vector = lb_matrix_to_vector(p, rhs);
  788. auto mask_elems = slice_make<LLVMValueRef>(permanent_allocator(), column_count);
  789. for (unsigned row_index = 0; row_index < row_count; row_index++) {
  790. for (unsigned column_index = 0; column_index < column_count; column_index++) {
  791. unsigned offset = row_index + column_index*stride;
  792. mask_elems[column_index] = lb_const_int(p->module, t_u32, offset).value;
  793. }
  794. // transpose mask
  795. LLVMValueRef mask = LLVMConstVector(mask_elems.data, column_count);
  796. LLVMValueRef column = llvm_basic_shuffle(p, matrix_vector, mask);
  797. m_columns[row_index] = column;
  798. }
  799. for (unsigned column_index = 0; column_index < row_count; column_index++) {
  800. LLVMValueRef value = lb_emit_struct_ev(p, lhs, column_index).value;
  801. LLVMValueRef row = llvm_vector_broadcast(p, value, column_count);
  802. v_rows[column_index] = row;
  803. }
  804. GB_ASSERT(row_count > 0);
  805. LLVMValueRef vector = nullptr;
  806. for (i64 i = 0; i < row_count; i++) {
  807. if (i == 0) {
  808. vector = llvm_vector_mul(p, v_rows[i], m_columns[i]);
  809. } else {
  810. vector = llvm_vector_mul_add(p, v_rows[i], m_columns[i], vector);
  811. }
  812. }
  813. lbAddr res = lb_add_local_generated(p, type, true);
  814. LLVMValueRef res_ptr = res.addr.value;
  815. unsigned alignment = cast(unsigned)gb_max(type_align_of(type), lb_alignof(LLVMTypeOf(vector)));
  816. LLVMSetAlignment(res_ptr, alignment);
  817. res_ptr = LLVMBuildPointerCast(p->builder, res_ptr, LLVMPointerType(LLVMTypeOf(vector), 0), "");
  818. LLVMBuildStore(p->builder, vector, res_ptr);
  819. return lb_addr_load(p, res);
  820. }
  821. lbAddr res = lb_add_local_generated(p, type, true);
  822. for (i64 j = 0; j < mt->Matrix.column_count; j++) {
  823. for (i64 k = 0; k < mt->Matrix.row_count; k++) {
  824. lbValue dst = lb_emit_matrix_epi(p, res.addr, 0, j);
  825. lbValue d0 = lb_emit_load(p, dst);
  826. lbValue a = lb_emit_struct_ev(p, lhs, cast(i32)k);
  827. lbValue b = lb_emit_matrix_ev(p, rhs, k, j);
  828. lbValue c = lb_emit_mul_add(p, a, b, d0, elem);
  829. lb_emit_store(p, dst, c);
  830. }
  831. }
  832. return lb_addr_load(p, res);
  833. }
  834. gb_internal lbValue lb_emit_arith_matrix(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type, bool component_wise) {
  835. GB_ASSERT(is_type_matrix(lhs.type) || is_type_matrix(rhs.type));
  836. if (op == Token_Mul && !component_wise) {
  837. Type *xt = base_type(lhs.type);
  838. Type *yt = base_type(rhs.type);
  839. if (xt->kind == Type_Matrix) {
  840. if (yt->kind == Type_Matrix) {
  841. return lb_emit_matrix_mul(p, lhs, rhs, type);
  842. } else if (is_type_array_like(yt)) {
  843. return lb_emit_matrix_mul_vector(p, lhs, rhs, type);
  844. }
  845. } else if (is_type_array_like(xt)) {
  846. GB_ASSERT(yt->kind == Type_Matrix);
  847. return lb_emit_vector_mul_matrix(p, lhs, rhs, type);
  848. } else {
  849. GB_ASSERT(xt->kind == Type_Basic);
  850. GB_ASSERT(yt->kind == Type_Matrix);
  851. GB_ASSERT(is_type_matrix(type));
  852. Type *array_type = alloc_type_array(yt->Matrix.elem, matrix_type_total_internal_elems(yt));
  853. GB_ASSERT(type_size_of(array_type) == type_size_of(yt));
  854. lbValue array_lhs = lb_emit_conv(p, lhs, array_type);
  855. lbValue array_rhs = rhs;
  856. array_rhs.type = array_type;
  857. lbValue array = lb_emit_arith(p, op, array_lhs, array_rhs, array_type);
  858. array.type = type;
  859. return array;
  860. }
  861. } else {
  862. if (is_type_matrix(lhs.type)) {
  863. rhs = lb_emit_conv(p, rhs, lhs.type);
  864. } else {
  865. lhs = lb_emit_conv(p, lhs, rhs.type);
  866. }
  867. Type *xt = base_type(lhs.type);
  868. Type *yt = base_type(rhs.type);
  869. GB_ASSERT_MSG(are_types_identical(xt, yt), "%s %.*s %s", type_to_string(lhs.type), LIT(token_strings[op]), type_to_string(rhs.type));
  870. GB_ASSERT(xt->kind == Type_Matrix);
  871. // element-wise arithmetic
  872. // pretend it is an array
  873. lbValue array_lhs = lhs;
  874. lbValue array_rhs = rhs;
  875. Type *array_type = alloc_type_array(xt->Matrix.elem, matrix_type_total_internal_elems(xt));
  876. GB_ASSERT(type_size_of(array_type) == type_size_of(xt));
  877. array_lhs.type = array_type;
  878. array_rhs.type = array_type;
  879. if (token_is_comparison(op)) {
  880. lbValue res = lb_emit_comp(p, op, array_lhs, array_rhs);
  881. return lb_emit_conv(p, res, type);
  882. } else {
  883. lbValue array = lb_emit_arith(p, op, array_lhs, array_rhs, array_type);
  884. array.type = type;
  885. return array;
  886. }
  887. }
  888. GB_PANIC("TODO: lb_emit_arith_matrix");
  889. return {};
  890. }
  891. gb_internal lbValue lb_emit_arith(lbProcedure *p, TokenKind op, lbValue lhs, lbValue rhs, Type *type) {
  892. if (is_type_array_like(lhs.type) || is_type_array_like(rhs.type)) {
  893. return lb_emit_arith_array(p, op, lhs, rhs, type);
  894. } else if (is_type_matrix(lhs.type) || is_type_matrix(rhs.type)) {
  895. return lb_emit_arith_matrix(p, op, lhs, rhs, type, false);
  896. } else if (is_type_complex(type)) {
  897. lhs = lb_emit_conv(p, lhs, type);
  898. rhs = lb_emit_conv(p, rhs, type);
  899. Type *ft = base_complex_elem_type(type);
  900. if (op == Token_Quo) {
  901. TEMPORARY_ALLOCATOR_GUARD();
  902. auto args = array_make<lbValue>(temporary_allocator(), 2);
  903. args[0] = lhs;
  904. args[1] = rhs;
  905. switch (type_size_of(ft)) {
  906. case 2: return lb_emit_runtime_call(p, "quo_complex32", args);
  907. case 4: return lb_emit_runtime_call(p, "quo_complex64", args);
  908. case 8: return lb_emit_runtime_call(p, "quo_complex128", args);
  909. default: GB_PANIC("Unknown float type"); break;
  910. }
  911. }
  912. lbAddr res = lb_add_local_generated(p, type, false); // NOTE: initialized in full later
  913. lbValue a = lb_emit_struct_ev(p, lhs, 0);
  914. lbValue b = lb_emit_struct_ev(p, lhs, 1);
  915. lbValue c = lb_emit_struct_ev(p, rhs, 0);
  916. lbValue d = lb_emit_struct_ev(p, rhs, 1);
  917. lbValue real = {};
  918. lbValue imag = {};
  919. switch (op) {
  920. case Token_Add:
  921. case Token_Sub:
  922. if (type_size_of(ft) == 2) {
  923. a = lb_emit_conv(p, a, t_f32);
  924. b = lb_emit_conv(p, b, t_f32);
  925. c = lb_emit_conv(p, c, t_f32);
  926. d = lb_emit_conv(p, d, t_f32);
  927. real = lb_emit_arith(p, op, a, c, t_f32);
  928. imag = lb_emit_arith(p, op, b, d, t_f32);
  929. real = lb_emit_conv(p, real, ft);
  930. imag = lb_emit_conv(p, imag, ft);
  931. } else {
  932. real = lb_emit_arith(p, op, a, c, ft);
  933. imag = lb_emit_arith(p, op, b, d, ft);
  934. }
  935. break;
  936. case Token_Mul: {
  937. lbValue x = lb_emit_arith(p, Token_Mul, a, c, ft);
  938. lbValue y = lb_emit_arith(p, Token_Mul, b, d, ft);
  939. real = lb_emit_arith(p, Token_Sub, x, y, ft);
  940. lbValue z = lb_emit_arith(p, Token_Mul, b, c, ft);
  941. lbValue w = lb_emit_arith(p, Token_Mul, a, d, ft);
  942. imag = lb_emit_arith(p, Token_Add, z, w, ft);
  943. break;
  944. }
  945. }
  946. lb_emit_store(p, lb_emit_struct_ep(p, res.addr, 0), real);
  947. lb_emit_store(p, lb_emit_struct_ep(p, res.addr, 1), imag);
  948. return lb_addr_load(p, res);
  949. } else if (is_type_quaternion(type)) {
  950. lhs = lb_emit_conv(p, lhs, type);
  951. rhs = lb_emit_conv(p, rhs, type);
  952. Type *ft = base_complex_elem_type(type);
  953. if (op == Token_Add || op == Token_Sub) {
  954. Type *immediate_type = ft;
  955. if (type_size_of(ft) == 2) {
  956. immediate_type = t_f32;
  957. }
  958. lbAddr res = lb_add_local_generated(p, type, false); // NOTE: initialized in full later
  959. lbValue x0 = lb_emit_struct_ev(p, lhs, 0);
  960. lbValue x1 = lb_emit_struct_ev(p, lhs, 1);
  961. lbValue x2 = lb_emit_struct_ev(p, lhs, 2);
  962. lbValue x3 = lb_emit_struct_ev(p, lhs, 3);
  963. lbValue y0 = lb_emit_struct_ev(p, rhs, 0);
  964. lbValue y1 = lb_emit_struct_ev(p, rhs, 1);
  965. lbValue y2 = lb_emit_struct_ev(p, rhs, 2);
  966. lbValue y3 = lb_emit_struct_ev(p, rhs, 3);
  967. if (immediate_type != ft) {
  968. x0 = lb_emit_conv(p, x0, immediate_type);
  969. x1 = lb_emit_conv(p, x1, immediate_type);
  970. x2 = lb_emit_conv(p, x2, immediate_type);
  971. x3 = lb_emit_conv(p, x3, immediate_type);
  972. y0 = lb_emit_conv(p, y0, immediate_type);
  973. y1 = lb_emit_conv(p, y1, immediate_type);
  974. y2 = lb_emit_conv(p, y2, immediate_type);
  975. y3 = lb_emit_conv(p, y3, immediate_type);
  976. }
  977. lbValue z0 = lb_emit_arith(p, op, x0, y0, immediate_type);
  978. lbValue z1 = lb_emit_arith(p, op, x1, y1, immediate_type);
  979. lbValue z2 = lb_emit_arith(p, op, x2, y2, immediate_type);
  980. lbValue z3 = lb_emit_arith(p, op, x3, y3, immediate_type);
  981. lbValue d0 = lb_emit_struct_ep(p, res.addr, 0);
  982. lbValue d1 = lb_emit_struct_ep(p, res.addr, 1);
  983. lbValue d2 = lb_emit_struct_ep(p, res.addr, 2);
  984. lbValue d3 = lb_emit_struct_ep(p, res.addr, 3);
  985. if (immediate_type != ft) {
  986. d0 = lb_emit_conv(p, d0, ft);
  987. d1 = lb_emit_conv(p, d1, ft);
  988. d2 = lb_emit_conv(p, d2, ft);
  989. d3 = lb_emit_conv(p, d3, ft);
  990. }
  991. lb_emit_store(p, d0, z0);
  992. lb_emit_store(p, d1, z1);
  993. lb_emit_store(p, d2, z2);
  994. lb_emit_store(p, d3, z3);
  995. return lb_addr_load(p, res);
  996. } else if (op == Token_Mul) {
  997. TEMPORARY_ALLOCATOR_GUARD();
  998. auto args = array_make<lbValue>(temporary_allocator(), 2);
  999. args[0] = lhs;
  1000. args[1] = rhs;
  1001. switch (8*type_size_of(ft)) {
  1002. case 16: return lb_emit_runtime_call(p, "mul_quaternion64", args);
  1003. case 32: return lb_emit_runtime_call(p, "mul_quaternion128", args);
  1004. case 64: return lb_emit_runtime_call(p, "mul_quaternion256", args);
  1005. default: GB_PANIC("Unknown float type"); break;
  1006. }
  1007. } else if (op == Token_Quo) {
  1008. TEMPORARY_ALLOCATOR_GUARD();
  1009. auto args = array_make<lbValue>(temporary_allocator(), 2);
  1010. args[0] = lhs;
  1011. args[1] = rhs;
  1012. switch (8*type_size_of(ft)) {
  1013. case 16: return lb_emit_runtime_call(p, "quo_quaternion64", args);
  1014. case 32: return lb_emit_runtime_call(p, "quo_quaternion128", args);
  1015. case 64: return lb_emit_runtime_call(p, "quo_quaternion256", args);
  1016. default: GB_PANIC("Unknown float type"); break;
  1017. }
  1018. }
  1019. }
  1020. lhs = lb_emit_conv(p, lhs, type);
  1021. rhs = lb_emit_conv(p, rhs, type);
  1022. if (is_type_integer(type) && is_type_different_to_arch_endianness(type)) {
  1023. switch (op) {
  1024. case Token_AndNot:
  1025. case Token_And:
  1026. case Token_Or:
  1027. case Token_Xor:
  1028. goto handle_op;
  1029. }
  1030. Type *platform_type = integer_endian_type_to_platform_type(type);
  1031. lbValue x = lb_emit_byte_swap(p, lhs, integer_endian_type_to_platform_type(lhs.type));
  1032. lbValue y = lb_emit_byte_swap(p, rhs, integer_endian_type_to_platform_type(rhs.type));
  1033. lbValue res = lb_emit_arith(p, op, x, y, platform_type);
  1034. return lb_emit_byte_swap(p, res, type);
  1035. }
  1036. if (is_type_float(type) && is_type_different_to_arch_endianness(type)) {
  1037. Type *platform_type = integer_endian_type_to_platform_type(type);
  1038. lbValue x = lb_emit_conv(p, lhs, integer_endian_type_to_platform_type(lhs.type));
  1039. lbValue y = lb_emit_conv(p, rhs, integer_endian_type_to_platform_type(rhs.type));
  1040. lbValue res = lb_emit_arith(p, op, x, y, platform_type);
  1041. return lb_emit_byte_swap(p, res, type);
  1042. }
  1043. handle_op:;
  1044. lbValue res = {};
  1045. res.type = type;
  1046. // NOTE(bill): Bit Set Aliases for + and -
  1047. if (is_type_bit_set(type)) {
  1048. switch (op) {
  1049. case Token_Add: op = Token_Or; break;
  1050. case Token_Sub: op = Token_AndNot; break;
  1051. }
  1052. Type *u = bit_set_to_int(type);
  1053. if (is_type_array(u)) {
  1054. lhs.type = u;
  1055. rhs.type = u;
  1056. res = lb_emit_arith(p, op, lhs, rhs, u);
  1057. res.type = type;
  1058. return res;
  1059. }
  1060. }
  1061. Type *integral_type = type;
  1062. if (is_type_simd_vector(integral_type)) {
  1063. integral_type = core_array_type(integral_type);
  1064. }
  1065. switch (op) {
  1066. case Token_Add:
  1067. if (is_type_float(integral_type)) {
  1068. res.value = LLVMBuildFAdd(p->builder, lhs.value, rhs.value, "");
  1069. return res;
  1070. }
  1071. res.value = LLVMBuildAdd(p->builder, lhs.value, rhs.value, "");
  1072. return res;
  1073. case Token_Sub:
  1074. if (is_type_float(integral_type)) {
  1075. res.value = LLVMBuildFSub(p->builder, lhs.value, rhs.value, "");
  1076. return res;
  1077. }
  1078. res.value = LLVMBuildSub(p->builder, lhs.value, rhs.value, "");
  1079. return res;
  1080. case Token_Mul:
  1081. if (is_type_float(integral_type)) {
  1082. res.value = LLVMBuildFMul(p->builder, lhs.value, rhs.value, "");
  1083. return res;
  1084. }
  1085. res.value = LLVMBuildMul(p->builder, lhs.value, rhs.value, "");
  1086. return res;
  1087. case Token_Quo:
  1088. if (is_type_float(integral_type)) {
  1089. res.value = LLVMBuildFDiv(p->builder, lhs.value, rhs.value, "");
  1090. return res;
  1091. } else if (is_type_unsigned(integral_type)) {
  1092. res.value = LLVMBuildUDiv(p->builder, lhs.value, rhs.value, "");
  1093. return res;
  1094. }
  1095. res.value = LLVMBuildSDiv(p->builder, lhs.value, rhs.value, "");
  1096. return res;
  1097. case Token_Mod:
  1098. if (is_type_float(integral_type)) {
  1099. res.value = LLVMBuildFRem(p->builder, lhs.value, rhs.value, "");
  1100. return res;
  1101. } else if (is_type_unsigned(integral_type)) {
  1102. res.value = LLVMBuildURem(p->builder, lhs.value, rhs.value, "");
  1103. return res;
  1104. }
  1105. res.value = LLVMBuildSRem(p->builder, lhs.value, rhs.value, "");
  1106. return res;
  1107. case Token_ModMod:
  1108. if (is_type_unsigned(integral_type)) {
  1109. res.value = LLVMBuildURem(p->builder, lhs.value, rhs.value, "");
  1110. return res;
  1111. } else {
  1112. LLVMValueRef a = LLVMBuildSRem(p->builder, lhs.value, rhs.value, "");
  1113. LLVMValueRef b = LLVMBuildAdd(p->builder, a, rhs.value, "");
  1114. LLVMValueRef c = LLVMBuildSRem(p->builder, b, rhs.value, "");
  1115. res.value = c;
  1116. return res;
  1117. }
  1118. case Token_And:
  1119. res.value = LLVMBuildAnd(p->builder, lhs.value, rhs.value, "");
  1120. return res;
  1121. case Token_Or:
  1122. res.value = LLVMBuildOr(p->builder, lhs.value, rhs.value, "");
  1123. return res;
  1124. case Token_Xor:
  1125. res.value = LLVMBuildXor(p->builder, lhs.value, rhs.value, "");
  1126. return res;
  1127. case Token_Shl:
  1128. {
  1129. rhs = lb_emit_conv(p, rhs, lhs.type);
  1130. LLVMValueRef lhsval = lhs.value;
  1131. LLVMValueRef bits = rhs.value;
  1132. LLVMValueRef bit_size = LLVMConstInt(lb_type(p->module, rhs.type), 8*type_size_of(lhs.type), false);
  1133. LLVMValueRef width_test = LLVMBuildICmp(p->builder, LLVMIntULT, bits, bit_size, "");
  1134. res.value = LLVMBuildShl(p->builder, lhsval, bits, "");
  1135. LLVMValueRef zero = LLVMConstNull(lb_type(p->module, lhs.type));
  1136. res.value = LLVMBuildSelect(p->builder, width_test, res.value, zero, "");
  1137. return res;
  1138. }
  1139. case Token_Shr:
  1140. {
  1141. rhs = lb_emit_conv(p, rhs, lhs.type);
  1142. LLVMValueRef lhsval = lhs.value;
  1143. LLVMValueRef bits = rhs.value;
  1144. bool is_unsigned = is_type_unsigned(integral_type);
  1145. LLVMValueRef bit_size = LLVMConstInt(lb_type(p->module, rhs.type), 8*type_size_of(lhs.type), false);
  1146. LLVMValueRef width_test = LLVMBuildICmp(p->builder, LLVMIntULT, bits, bit_size, "");
  1147. if (is_unsigned) {
  1148. res.value = LLVMBuildLShr(p->builder, lhsval, bits, "");
  1149. } else {
  1150. res.value = LLVMBuildAShr(p->builder, lhsval, bits, "");
  1151. }
  1152. LLVMValueRef zero = LLVMConstNull(lb_type(p->module, lhs.type));
  1153. res.value = LLVMBuildSelect(p->builder, width_test, res.value, zero, "");
  1154. return res;
  1155. }
  1156. case Token_AndNot:
  1157. {
  1158. LLVMValueRef new_rhs = LLVMBuildNot(p->builder, rhs.value, "");
  1159. res.value = LLVMBuildAnd(p->builder, lhs.value, new_rhs, "");
  1160. return res;
  1161. }
  1162. break;
  1163. }
  1164. GB_PANIC("unhandled operator of lb_emit_arith");
  1165. return {};
  1166. }
  1167. gb_internal bool lb_is_empty_string_constant(Ast *expr) {
  1168. if (expr->tav.value.kind == ExactValue_String &&
  1169. is_type_string(expr->tav.type)) {
  1170. String s = expr->tav.value.value_string;
  1171. return s.len == 0;
  1172. }
  1173. return false;
  1174. }
  1175. gb_internal lbValue lb_build_binary_in(lbProcedure *p, lbValue left, lbValue right, TokenKind op) {
  1176. Type *rt = base_type(right.type);
  1177. if (is_type_pointer(rt)) {
  1178. right = lb_emit_load(p, right);
  1179. rt = base_type(type_deref(rt));
  1180. }
  1181. switch (rt->kind) {
  1182. case Type_Map:
  1183. {
  1184. lbValue map_ptr = lb_address_from_load_or_generate_local(p, right);
  1185. lbValue key = left;
  1186. lbValue ptr = lb_internal_dynamic_map_get_ptr(p, map_ptr, key);
  1187. if (op == Token_in) {
  1188. return lb_emit_conv(p, lb_emit_comp_against_nil(p, Token_NotEq, ptr), t_bool);
  1189. } else {
  1190. return lb_emit_conv(p, lb_emit_comp_against_nil(p, Token_CmpEq, ptr), t_bool);
  1191. }
  1192. }
  1193. break;
  1194. case Type_BitSet:
  1195. {
  1196. Type *key_type = rt->BitSet.elem;
  1197. GB_ASSERT(are_types_identical(left.type, key_type));
  1198. Type *it = bit_set_to_int(rt);
  1199. left = lb_emit_conv(p, left, it);
  1200. if (is_type_different_to_arch_endianness(it)) {
  1201. left = lb_emit_byte_swap(p, left, integer_endian_type_to_platform_type(it));
  1202. }
  1203. lbValue lower = lb_const_value(p->module, left.type, exact_value_i64(rt->BitSet.lower));
  1204. lbValue key = lb_emit_arith(p, Token_Sub, left, lower, left.type);
  1205. lbValue bit = lb_emit_arith(p, Token_Shl, lb_const_int(p->module, left.type, 1), key, left.type);
  1206. bit = lb_emit_conv(p, bit, it);
  1207. lbValue old_value = lb_emit_transmute(p, right, it);
  1208. lbValue new_value = lb_emit_arith(p, Token_And, old_value, bit, it);
  1209. if (op == Token_in) {
  1210. return lb_emit_conv(p, lb_emit_comp(p, Token_NotEq, new_value, lb_const_int(p->module, new_value.type, 0)), t_bool);
  1211. } else {
  1212. return lb_emit_conv(p, lb_emit_comp(p, Token_CmpEq, new_value, lb_const_int(p->module, new_value.type, 0)), t_bool);
  1213. }
  1214. }
  1215. break;
  1216. }
  1217. GB_PANIC("Invalid 'in' type");
  1218. return {};
  1219. }
  1220. gb_internal lbValue lb_build_binary_expr(lbProcedure *p, Ast *expr) {
  1221. ast_node(be, BinaryExpr, expr);
  1222. TypeAndValue tv = type_and_value_of_expr(expr);
  1223. if (is_type_matrix(be->left->tav.type) || is_type_matrix(be->right->tav.type)) {
  1224. lbValue left = lb_build_expr(p, be->left);
  1225. lbValue right = lb_build_expr(p, be->right);
  1226. return lb_emit_arith_matrix(p, be->op.kind, left, right, default_type(tv.type), false);
  1227. }
  1228. switch (be->op.kind) {
  1229. case Token_Add:
  1230. case Token_Sub:
  1231. case Token_Mul:
  1232. case Token_Quo:
  1233. case Token_Mod:
  1234. case Token_ModMod:
  1235. case Token_And:
  1236. case Token_Or:
  1237. case Token_Xor:
  1238. case Token_AndNot: {
  1239. Type *type = default_type(tv.type);
  1240. lbValue left = lb_build_expr(p, be->left);
  1241. lbValue right = lb_build_expr(p, be->right);
  1242. return lb_emit_arith(p, be->op.kind, left, right, type);
  1243. }
  1244. case Token_Shl:
  1245. case Token_Shr: {
  1246. lbValue left, right;
  1247. Type *type = default_type(tv.type);
  1248. left = lb_build_expr(p, be->left);
  1249. if (lb_is_expr_untyped_const(be->right)) {
  1250. // NOTE(bill): RHS shift operands can still be untyped
  1251. // Just bypass the standard lb_build_expr
  1252. right = lb_expr_untyped_const_to_typed(p->module, be->right, type);
  1253. } else {
  1254. right = lb_build_expr(p, be->right);
  1255. }
  1256. return lb_emit_arith(p, be->op.kind, left, right, type);
  1257. }
  1258. case Token_CmpEq:
  1259. case Token_NotEq:
  1260. if (is_type_untyped_nil(be->right->tav.type)) {
  1261. // `x == nil` or `x != nil`
  1262. lbValue left = lb_build_expr(p, be->left);
  1263. lbValue cmp = lb_emit_comp_against_nil(p, be->op.kind, left);
  1264. Type *type = default_type(tv.type);
  1265. return lb_emit_conv(p, cmp, type);
  1266. } else if (is_type_untyped_nil(be->left->tav.type)) {
  1267. // `nil == x` or `nil != x`
  1268. lbValue right = lb_build_expr(p, be->right);
  1269. lbValue cmp = lb_emit_comp_against_nil(p, be->op.kind, right);
  1270. Type *type = default_type(tv.type);
  1271. return lb_emit_conv(p, cmp, type);
  1272. } else if (lb_is_empty_string_constant(be->right)) {
  1273. // `x == ""` or `x != ""`
  1274. lbValue s = lb_build_expr(p, be->left);
  1275. s = lb_emit_conv(p, s, t_string);
  1276. lbValue len = lb_string_len(p, s);
  1277. lbValue cmp = lb_emit_comp(p, be->op.kind, len, lb_const_int(p->module, t_int, 0));
  1278. Type *type = default_type(tv.type);
  1279. return lb_emit_conv(p, cmp, type);
  1280. } else if (lb_is_empty_string_constant(be->left)) {
  1281. // `"" == x` or `"" != x`
  1282. lbValue s = lb_build_expr(p, be->right);
  1283. s = lb_emit_conv(p, s, t_string);
  1284. lbValue len = lb_string_len(p, s);
  1285. lbValue cmp = lb_emit_comp(p, be->op.kind, len, lb_const_int(p->module, t_int, 0));
  1286. Type *type = default_type(tv.type);
  1287. return lb_emit_conv(p, cmp, type);
  1288. }
  1289. /*fallthrough*/
  1290. case Token_Lt:
  1291. case Token_LtEq:
  1292. case Token_Gt:
  1293. case Token_GtEq:
  1294. {
  1295. lbValue left = {};
  1296. lbValue right = {};
  1297. if (be->left->tav.mode == Addressing_Type) {
  1298. left = lb_typeid(p->module, be->left->tav.type);
  1299. }
  1300. if (be->right->tav.mode == Addressing_Type) {
  1301. right = lb_typeid(p->module, be->right->tav.type);
  1302. }
  1303. if (left.value == nullptr) left = lb_build_expr(p, be->left);
  1304. if (right.value == nullptr) right = lb_build_expr(p, be->right);
  1305. lbValue cmp = lb_emit_comp(p, be->op.kind, left, right);
  1306. Type *type = default_type(tv.type);
  1307. return lb_emit_conv(p, cmp, type);
  1308. }
  1309. case Token_CmpAnd:
  1310. case Token_CmpOr:
  1311. return lb_emit_logical_binary_expr(p, be->op.kind, be->left, be->right, tv.type);
  1312. case Token_in:
  1313. case Token_not_in:
  1314. {
  1315. lbValue left = lb_build_expr(p, be->left);
  1316. lbValue right = lb_build_expr(p, be->right);
  1317. return lb_build_binary_in(p, left, right, be->op.kind);
  1318. }
  1319. default:
  1320. GB_PANIC("Invalid binary expression");
  1321. break;
  1322. }
  1323. return {};
  1324. }
  1325. gb_internal lbValue lb_emit_conv(lbProcedure *p, lbValue value, Type *t) {
  1326. lbModule *m = p->module;
  1327. t = reduce_tuple_to_single_type(t);
  1328. Type *src_type = value.type;
  1329. if (are_types_identical(t, src_type)) {
  1330. return value;
  1331. }
  1332. Type *src = core_type(src_type);
  1333. Type *dst = core_type(t);
  1334. GB_ASSERT(src != nullptr);
  1335. GB_ASSERT(dst != nullptr);
  1336. if (is_type_untyped_uninit(src)) {
  1337. return lb_const_undef(m, t);
  1338. }
  1339. if (is_type_untyped_nil(src)) {
  1340. return lb_const_nil(m, t);
  1341. }
  1342. if (LLVMIsConstant(value.value)) {
  1343. if (is_type_any(dst)) {
  1344. Type *st = default_type(src_type);
  1345. lbAddr default_value = lb_add_local_generated(p, st, false);
  1346. lb_addr_store(p, default_value, value);
  1347. lbValue data = lb_emit_conv(p, default_value.addr, t_rawptr);
  1348. lbValue id = lb_typeid(m, st);
  1349. lbAddr res = lb_add_local_generated(p, t, false);
  1350. lbValue a0 = lb_emit_struct_ep(p, res.addr, 0);
  1351. lbValue a1 = lb_emit_struct_ep(p, res.addr, 1);
  1352. lb_emit_store(p, a0, data);
  1353. lb_emit_store(p, a1, id);
  1354. return lb_addr_load(p, res);
  1355. } else if (dst->kind == Type_Basic) {
  1356. if (src->Basic.kind == Basic_string && dst->Basic.kind == Basic_cstring) {
  1357. String str = lb_get_const_string(m, value);
  1358. lbValue res = {};
  1359. res.type = t;
  1360. res.value = llvm_cstring(m, str);
  1361. return res;
  1362. }
  1363. // if (is_type_float(dst)) {
  1364. // return value;
  1365. // } else if (is_type_integer(dst)) {
  1366. // return value;
  1367. // }
  1368. // ExactValue ev = value->Constant.value;
  1369. // if (is_type_float(dst)) {
  1370. // ev = exact_value_to_float(ev);
  1371. // } else if (is_type_complex(dst)) {
  1372. // ev = exact_value_to_complex(ev);
  1373. // } else if (is_type_quaternion(dst)) {
  1374. // ev = exact_value_to_quaternion(ev);
  1375. // } else if (is_type_string(dst)) {
  1376. // // Handled elsewhere
  1377. // GB_ASSERT_MSG(ev.kind == ExactValue_String, "%d", ev.kind);
  1378. // } else if (is_type_integer(dst)) {
  1379. // ev = exact_value_to_integer(ev);
  1380. // } else if (is_type_pointer(dst)) {
  1381. // // IMPORTANT NOTE(bill): LLVM doesn't support pointer constants expect 'null'
  1382. // lbValue i = lb_add_module_constant(p->module, t_uintptr, ev);
  1383. // return lb_emit(p, lb_instr_conv(p, irConv_inttoptr, i, t_uintptr, dst));
  1384. // }
  1385. // return lb_const_value(p->module, t, ev);
  1386. }
  1387. }
  1388. if (are_types_identical(src, dst)) {
  1389. if (!are_types_identical(src_type, t)) {
  1390. return lb_emit_transmute(p, value, t);
  1391. }
  1392. return value;
  1393. }
  1394. // bool <-> llvm bool
  1395. if (is_type_boolean(src) && dst == t_llvm_bool) {
  1396. lbValue res = {};
  1397. res.value = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(lb_type(m, src)), "");
  1398. res.type = t;
  1399. return res;
  1400. }
  1401. if (src == t_llvm_bool && is_type_boolean(dst)) {
  1402. lbValue res = {};
  1403. res.value = LLVMBuildZExt(p->builder, value.value, lb_type(m, dst), "");
  1404. res.type = t;
  1405. return res;
  1406. }
  1407. // integer -> integer
  1408. if (is_type_integer(src) && is_type_integer(dst)) {
  1409. GB_ASSERT(src->kind == Type_Basic &&
  1410. dst->kind == Type_Basic);
  1411. i64 sz = type_size_of(default_type(src));
  1412. i64 dz = type_size_of(default_type(dst));
  1413. if (sz == dz) {
  1414. if (dz > 1 && !types_have_same_internal_endian(src, dst)) {
  1415. return lb_emit_byte_swap(p, value, t);
  1416. }
  1417. lbValue res = {};
  1418. res.value = value.value;
  1419. res.type = t;
  1420. return res;
  1421. }
  1422. if (sz > 1 && is_type_different_to_arch_endianness(src)) {
  1423. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1424. value = lb_emit_byte_swap(p, value, platform_src_type);
  1425. }
  1426. LLVMOpcode op = LLVMTrunc;
  1427. if (dz < sz) {
  1428. op = LLVMTrunc;
  1429. } else if (dz == sz) {
  1430. // NOTE(bill): In LLVM, all integers are signed and rely upon 2's compliment
  1431. // NOTE(bill): Copy the value just for type correctness
  1432. op = LLVMBitCast;
  1433. } else if (dz > sz) {
  1434. op = is_type_unsigned(src) ? LLVMZExt : LLVMSExt; // zero extent
  1435. }
  1436. if (dz > 1 && is_type_different_to_arch_endianness(dst)) {
  1437. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1438. lbValue res = {};
  1439. res.value = LLVMBuildCast(p->builder, op, value.value, lb_type(m, platform_dst_type), "");
  1440. res.type = t;
  1441. return lb_emit_byte_swap(p, res, t);
  1442. } else {
  1443. lbValue res = {};
  1444. res.value = LLVMBuildCast(p->builder, op, value.value, lb_type(m, t), "");
  1445. res.type = t;
  1446. return res;
  1447. }
  1448. }
  1449. // boolean -> boolean/integer
  1450. if (is_type_boolean(src) && (is_type_boolean(dst) || is_type_integer(dst))) {
  1451. LLVMValueRef b = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(lb_type(m, value.type)), "");
  1452. lbValue res = {};
  1453. res.value = LLVMBuildIntCast2(p->builder, b, lb_type(m, t), false, "");
  1454. res.type = t;
  1455. return res;
  1456. }
  1457. if (is_type_cstring(src) && is_type_u8_ptr(dst)) {
  1458. return lb_emit_transmute(p, value, dst);
  1459. }
  1460. if (is_type_u8_ptr(src) && is_type_cstring(dst)) {
  1461. return lb_emit_transmute(p, value, dst);
  1462. }
  1463. if (is_type_cstring(src) && is_type_u8_multi_ptr(dst)) {
  1464. return lb_emit_transmute(p, value, dst);
  1465. }
  1466. if (is_type_u8_multi_ptr(src) && is_type_cstring(dst)) {
  1467. return lb_emit_transmute(p, value, dst);
  1468. }
  1469. if (is_type_cstring(src) && is_type_rawptr(dst)) {
  1470. return lb_emit_transmute(p, value, dst);
  1471. }
  1472. if (is_type_rawptr(src) && is_type_cstring(dst)) {
  1473. return lb_emit_transmute(p, value, dst);
  1474. }
  1475. if (are_types_identical(src, t_cstring) && are_types_identical(dst, t_string)) {
  1476. TEMPORARY_ALLOCATOR_GUARD();
  1477. lbValue c = lb_emit_conv(p, value, t_cstring);
  1478. auto args = array_make<lbValue>(temporary_allocator(), 1);
  1479. args[0] = c;
  1480. lbValue s = lb_emit_runtime_call(p, "cstring_to_string", args);
  1481. return lb_emit_conv(p, s, dst);
  1482. }
  1483. // integer -> boolean
  1484. if (is_type_integer(src) && is_type_boolean(dst)) {
  1485. lbValue res = {};
  1486. res.value = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(lb_type(m, value.type)), "");
  1487. res.type = t_llvm_bool;
  1488. return lb_emit_conv(p, res, t);
  1489. }
  1490. // float -> float
  1491. if (is_type_float(src) && is_type_float(dst)) {
  1492. i64 sz = type_size_of(src);
  1493. i64 dz = type_size_of(dst);
  1494. if (dz == sz) {
  1495. if (types_have_same_internal_endian(src, dst)) {
  1496. lbValue res = {};
  1497. res.type = t;
  1498. res.value = value.value;
  1499. return res;
  1500. } else {
  1501. return lb_emit_byte_swap(p, value, t);
  1502. }
  1503. }
  1504. if (is_type_different_to_arch_endianness(src) || is_type_different_to_arch_endianness(dst)) {
  1505. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1506. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1507. lbValue res = {};
  1508. res = lb_emit_conv(p, value, platform_src_type);
  1509. res = lb_emit_conv(p, res, platform_dst_type);
  1510. if (is_type_different_to_arch_endianness(dst)) {
  1511. res = lb_emit_byte_swap(p, res, t);
  1512. }
  1513. return lb_emit_conv(p, res, t);
  1514. }
  1515. lbValue res = {};
  1516. res.type = t;
  1517. if (dz >= sz) {
  1518. res.value = LLVMBuildFPExt(p->builder, value.value, lb_type(m, t), "");
  1519. } else {
  1520. res.value = LLVMBuildFPTrunc(p->builder, value.value, lb_type(m, t), "");
  1521. }
  1522. return res;
  1523. }
  1524. if (is_type_complex(src) && is_type_complex(dst)) {
  1525. Type *ft = base_complex_elem_type(dst);
  1526. lbAddr gen = lb_add_local_generated(p, t, false);
  1527. lbValue gp = lb_addr_get_ptr(p, gen);
  1528. lbValue real = lb_emit_conv(p, lb_emit_struct_ev(p, value, 0), ft);
  1529. lbValue imag = lb_emit_conv(p, lb_emit_struct_ev(p, value, 1), ft);
  1530. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), real);
  1531. lb_emit_store(p, lb_emit_struct_ep(p, gp, 1), imag);
  1532. return lb_addr_load(p, gen);
  1533. }
  1534. if (is_type_quaternion(src) && is_type_quaternion(dst)) {
  1535. // @QuaternionLayout
  1536. Type *ft = base_complex_elem_type(dst);
  1537. lbAddr gen = lb_add_local_generated(p, t, false);
  1538. lbValue gp = lb_addr_get_ptr(p, gen);
  1539. lbValue q0 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 0), ft);
  1540. lbValue q1 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 1), ft);
  1541. lbValue q2 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 2), ft);
  1542. lbValue q3 = lb_emit_conv(p, lb_emit_struct_ev(p, value, 3), ft);
  1543. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), q0);
  1544. lb_emit_store(p, lb_emit_struct_ep(p, gp, 1), q1);
  1545. lb_emit_store(p, lb_emit_struct_ep(p, gp, 2), q2);
  1546. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), q3);
  1547. return lb_addr_load(p, gen);
  1548. }
  1549. if (is_type_integer(src) && is_type_complex(dst)) {
  1550. Type *ft = base_complex_elem_type(dst);
  1551. lbAddr gen = lb_add_local_generated(p, t, true);
  1552. lbValue gp = lb_addr_get_ptr(p, gen);
  1553. lbValue real = lb_emit_conv(p, value, ft);
  1554. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), real);
  1555. return lb_addr_load(p, gen);
  1556. }
  1557. if (is_type_float(src) && is_type_complex(dst)) {
  1558. Type *ft = base_complex_elem_type(dst);
  1559. lbAddr gen = lb_add_local_generated(p, t, true);
  1560. lbValue gp = lb_addr_get_ptr(p, gen);
  1561. lbValue real = lb_emit_conv(p, value, ft);
  1562. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), real);
  1563. return lb_addr_load(p, gen);
  1564. }
  1565. if (is_type_integer(src) && is_type_quaternion(dst)) {
  1566. Type *ft = base_complex_elem_type(dst);
  1567. lbAddr gen = lb_add_local_generated(p, t, true);
  1568. lbValue gp = lb_addr_get_ptr(p, gen);
  1569. lbValue real = lb_emit_conv(p, value, ft);
  1570. // @QuaternionLayout
  1571. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), real);
  1572. return lb_addr_load(p, gen);
  1573. }
  1574. if (is_type_float(src) && is_type_quaternion(dst)) {
  1575. Type *ft = base_complex_elem_type(dst);
  1576. lbAddr gen = lb_add_local_generated(p, t, true);
  1577. lbValue gp = lb_addr_get_ptr(p, gen);
  1578. lbValue real = lb_emit_conv(p, value, ft);
  1579. // @QuaternionLayout
  1580. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), real);
  1581. return lb_addr_load(p, gen);
  1582. }
  1583. if (is_type_complex(src) && is_type_quaternion(dst)) {
  1584. Type *ft = base_complex_elem_type(dst);
  1585. lbAddr gen = lb_add_local_generated(p, t, true);
  1586. lbValue gp = lb_addr_get_ptr(p, gen);
  1587. lbValue real = lb_emit_conv(p, lb_emit_struct_ev(p, value, 0), ft);
  1588. lbValue imag = lb_emit_conv(p, lb_emit_struct_ev(p, value, 1), ft);
  1589. // @QuaternionLayout
  1590. lb_emit_store(p, lb_emit_struct_ep(p, gp, 3), real);
  1591. lb_emit_store(p, lb_emit_struct_ep(p, gp, 0), imag);
  1592. return lb_addr_load(p, gen);
  1593. }
  1594. // float <-> integer
  1595. if (is_type_float(src) && is_type_integer(dst)) {
  1596. if (is_type_different_to_arch_endianness(src) || is_type_different_to_arch_endianness(dst)) {
  1597. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1598. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1599. lbValue res = {};
  1600. res = lb_emit_conv(p, value, platform_src_type);
  1601. res = lb_emit_conv(p, res, platform_dst_type);
  1602. return lb_emit_conv(p, res, t);
  1603. }
  1604. if (is_type_integer_128bit(dst)) {
  1605. TEMPORARY_ALLOCATOR_GUARD();
  1606. auto args = array_make<lbValue>(temporary_allocator(), 1);
  1607. args[0] = value;
  1608. char const *call = "fixunsdfdi";
  1609. if (is_type_unsigned(dst)) {
  1610. call = "fixunsdfti";
  1611. }
  1612. lbValue res_i128 = lb_emit_runtime_call(p, call, args);
  1613. return lb_emit_conv(p, res_i128, t);
  1614. }
  1615. i64 sz = type_size_of(src);
  1616. lbValue res = {};
  1617. res.type = t;
  1618. if (is_type_unsigned(dst)) {
  1619. switch (sz) {
  1620. case 2:
  1621. case 4:
  1622. res.value = LLVMBuildFPToUI(p->builder, value.value, lb_type(m, t_u32), "");
  1623. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), false, "");
  1624. break;
  1625. case 8:
  1626. res.value = LLVMBuildFPToUI(p->builder, value.value, lb_type(m, t_u64), "");
  1627. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), false, "");
  1628. break;
  1629. default:
  1630. GB_PANIC("Unhandled float type");
  1631. break;
  1632. }
  1633. } else {
  1634. switch (sz) {
  1635. case 2:
  1636. case 4:
  1637. res.value = LLVMBuildFPToSI(p->builder, value.value, lb_type(m, t_i32), "");
  1638. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), true, "");
  1639. break;
  1640. case 8:
  1641. res.value = LLVMBuildFPToSI(p->builder, value.value, lb_type(m, t_i64), "");
  1642. res.value = LLVMBuildIntCast2(p->builder, res.value, lb_type(m, t), true, "");
  1643. break;
  1644. default:
  1645. GB_PANIC("Unhandled float type");
  1646. break;
  1647. }
  1648. }
  1649. return res;
  1650. }
  1651. if (is_type_integer(src) && is_type_float(dst)) {
  1652. if (is_type_different_to_arch_endianness(src) || is_type_different_to_arch_endianness(dst)) {
  1653. Type *platform_src_type = integer_endian_type_to_platform_type(src);
  1654. Type *platform_dst_type = integer_endian_type_to_platform_type(dst);
  1655. lbValue res = {};
  1656. res = lb_emit_conv(p, value, platform_src_type);
  1657. res = lb_emit_conv(p, res, platform_dst_type);
  1658. if (is_type_different_to_arch_endianness(dst)) {
  1659. res = lb_emit_byte_swap(p, res, t);
  1660. }
  1661. return lb_emit_conv(p, res, t);
  1662. }
  1663. if (is_type_integer_128bit(src)) {
  1664. TEMPORARY_ALLOCATOR_GUARD();
  1665. auto args = array_make<lbValue>(temporary_allocator(), 1);
  1666. args[0] = value;
  1667. char const *call = "floattidf";
  1668. if (is_type_unsigned(src)) {
  1669. call = "floattidf_unsigned";
  1670. }
  1671. lbValue res_f64 = lb_emit_runtime_call(p, call, args);
  1672. return lb_emit_conv(p, res_f64, t);
  1673. }
  1674. lbValue res = {};
  1675. res.type = t;
  1676. if (is_type_unsigned(src)) {
  1677. res.value = LLVMBuildUIToFP(p->builder, value.value, lb_type(m, t), "");
  1678. } else {
  1679. res.value = LLVMBuildSIToFP(p->builder, value.value, lb_type(m, t), "");
  1680. }
  1681. return res;
  1682. }
  1683. if (is_type_simd_vector(dst)) {
  1684. Type *et = base_array_type(dst);
  1685. if (is_type_simd_vector(src)) {
  1686. Type *src_elem = core_array_type(src);
  1687. Type *dst_elem = core_array_type(dst);
  1688. GB_ASSERT(src->SimdVector.count == dst->SimdVector.count);
  1689. lbValue res = {};
  1690. res.type = t;
  1691. if (are_types_identical(src_elem, dst_elem)) {
  1692. res.value = value.value;
  1693. } else if (is_type_float(src_elem) && is_type_integer(dst_elem)) {
  1694. if (is_type_unsigned(dst_elem)) {
  1695. res.value = LLVMBuildFPToUI(p->builder, value.value, lb_type(m, t), "");
  1696. } else {
  1697. res.value = LLVMBuildFPToSI(p->builder, value.value, lb_type(m, t), "");
  1698. }
  1699. } else if (is_type_integer(src_elem) && is_type_float(dst_elem)) {
  1700. if (is_type_unsigned(src_elem)) {
  1701. res.value = LLVMBuildUIToFP(p->builder, value.value, lb_type(m, t), "");
  1702. } else {
  1703. res.value = LLVMBuildSIToFP(p->builder, value.value, lb_type(m, t), "");
  1704. }
  1705. } else if ((is_type_integer(src_elem) || is_type_boolean(src_elem)) && is_type_integer(dst_elem)) {
  1706. res.value = LLVMBuildIntCast2(p->builder, value.value, lb_type(m, t), !is_type_unsigned(src_elem), "");
  1707. } else if (is_type_float(src_elem) && is_type_float(dst_elem)) {
  1708. res.value = LLVMBuildFPCast(p->builder, value.value, lb_type(m, t), "");
  1709. } else if (is_type_integer(src_elem) && is_type_boolean(dst_elem)) {
  1710. LLVMValueRef i1vector = LLVMBuildICmp(p->builder, LLVMIntNE, value.value, LLVMConstNull(LLVMTypeOf(value.value)), "");
  1711. res.value = LLVMBuildIntCast2(p->builder, i1vector, lb_type(m, t), !is_type_unsigned(src_elem), "");
  1712. } else if (is_type_pointer(src_elem) && is_type_integer(dst_elem)) {
  1713. res.value = LLVMBuildPtrToInt(p->builder, value.value, lb_type(m, t), "");
  1714. } else if (is_type_integer(src_elem) && is_type_pointer(dst_elem)) {
  1715. res.value = LLVMBuildIntToPtr(p->builder, value.value, lb_type(m, t), "");
  1716. }else {
  1717. GB_PANIC("Unhandled simd vector conversion: %s -> %s", type_to_string(src), type_to_string(dst));
  1718. }
  1719. return res;
  1720. } else {
  1721. i64 count = get_array_type_count(dst);
  1722. LLVMTypeRef vt = lb_type(m, t);
  1723. LLVMTypeRef llvm_u32 = lb_type(m, t_u32);
  1724. LLVMValueRef elem = lb_emit_conv(p, value, et).value;
  1725. LLVMValueRef vector = LLVMConstNull(vt);
  1726. for (i64 i = 0; i < count; i++) {
  1727. LLVMValueRef idx = LLVMConstInt(llvm_u32, i, false);
  1728. vector = LLVMBuildInsertElement(p->builder, vector, elem, idx, "");
  1729. }
  1730. lbValue res = {};
  1731. res.type = t;
  1732. res.value = vector;
  1733. return res;
  1734. }
  1735. }
  1736. // bit_field <-> backing type
  1737. if (is_type_bit_field(src)) {
  1738. if (are_types_identical(src->BitField.backing_type, dst)) {
  1739. lbValue res = {};
  1740. res.type = t;
  1741. res.value = value.value;
  1742. return res;
  1743. }
  1744. }
  1745. if (is_type_bit_field(dst)) {
  1746. if (are_types_identical(src, dst->BitField.backing_type)) {
  1747. lbValue res = {};
  1748. res.type = t;
  1749. res.value = value.value;
  1750. return res;
  1751. }
  1752. }
  1753. // bit_set <-> backing type
  1754. if (is_type_bit_set(src)) {
  1755. Type *backing = bit_set_to_int(src);
  1756. if (are_types_identical(backing, dst)) {
  1757. lbValue res = {};
  1758. res.type = t;
  1759. res.value = value.value;
  1760. return res;
  1761. }
  1762. }
  1763. if (is_type_bit_set(dst)) {
  1764. Type *backing = bit_set_to_int(dst);
  1765. if (are_types_identical(src, backing)) {
  1766. lbValue res = {};
  1767. res.type = t;
  1768. res.value = value.value;
  1769. return res;
  1770. }
  1771. }
  1772. // Pointer <-> uintptr
  1773. if (is_type_pointer(src) && is_type_uintptr(dst)) {
  1774. lbValue res = {};
  1775. res.type = t;
  1776. res.value = LLVMBuildPtrToInt(p->builder, value.value, lb_type(m, t), "");
  1777. return res;
  1778. }
  1779. if (is_type_uintptr(src) && is_type_pointer(dst)) {
  1780. lbValue res = {};
  1781. res.type = t;
  1782. res.value = LLVMBuildIntToPtr(p->builder, value.value, lb_type(m, t), "");
  1783. return res;
  1784. }
  1785. if (is_type_multi_pointer(src) && is_type_uintptr(dst)) {
  1786. lbValue res = {};
  1787. res.type = t;
  1788. res.value = LLVMBuildPtrToInt(p->builder, value.value, lb_type(m, t), "");
  1789. return res;
  1790. }
  1791. if (is_type_uintptr(src) && is_type_multi_pointer(dst)) {
  1792. lbValue res = {};
  1793. res.type = t;
  1794. res.value = LLVMBuildIntToPtr(p->builder, value.value, lb_type(m, t), "");
  1795. return res;
  1796. }
  1797. if (is_type_union(dst)) {
  1798. if (dst->Union.variants.count == 1) {
  1799. Type *vt = dst->Union.variants[0];
  1800. if (internal_check_is_assignable_to(src_type, vt)) {
  1801. value = lb_emit_conv(p, value, vt);
  1802. lbAddr parent = lb_add_local_generated(p, t, true);
  1803. lb_emit_store_union_variant(p, parent.addr, value, vt);
  1804. return lb_addr_load(p, parent);
  1805. }
  1806. }
  1807. for (Type *vt : dst->Union.variants) {
  1808. if (are_types_identical(src_type, vt)) {
  1809. lbAddr parent = lb_add_local_generated(p, t, true);
  1810. lb_emit_store_union_variant(p, parent.addr, value, vt);
  1811. return lb_addr_load(p, parent);
  1812. }
  1813. }
  1814. ValidIndexAndScore *valids = gb_alloc_array(temporary_allocator(), ValidIndexAndScore, dst->Union.variants.count);
  1815. isize valid_count = 0;
  1816. isize first_success_index = -1;
  1817. for_array(i, dst->Union.variants) {
  1818. Type *vt = dst->Union.variants[i];
  1819. i64 score = 0;
  1820. if (internal_check_is_assignable_to(src_type, vt)) {
  1821. valids[valid_count].index = i;
  1822. valids[valid_count].score = score;
  1823. valid_count += 1;
  1824. if (first_success_index < 0) {
  1825. first_success_index = i;
  1826. }
  1827. }
  1828. }
  1829. if (valid_count > 1) {
  1830. gb_sort_array(valids, valid_count, valid_index_and_score_cmp);
  1831. i64 best_score = valids[0].score;
  1832. for (isize i = 1; i < valid_count; i++) {
  1833. auto v = valids[i];
  1834. if (best_score > v.score) {
  1835. valid_count = i;
  1836. break;
  1837. }
  1838. best_score = v.score;
  1839. }
  1840. first_success_index = valids[0].index;
  1841. }
  1842. if (valid_count == 1) {
  1843. Type *vt = dst->Union.variants[first_success_index];
  1844. value = lb_emit_conv(p, value, vt);
  1845. lbAddr parent = lb_add_local_generated(p, t, true);
  1846. lb_emit_store_union_variant(p, parent.addr, value, vt);
  1847. return lb_addr_load(p, parent);
  1848. }
  1849. }
  1850. // NOTE(bill): This has to be done before 'Pointer <-> Pointer' as it's
  1851. // subtype polymorphism casting
  1852. if (check_is_assignable_to_using_subtype(src_type, t)) {
  1853. Type *st = type_deref(src_type);
  1854. st = type_deref(st);
  1855. bool st_is_ptr = is_type_pointer(src_type);
  1856. st = base_type(st);
  1857. Type *dt = t;
  1858. GB_ASSERT(is_type_struct(st) || is_type_raw_union(st));
  1859. Selection sel = {};
  1860. sel.index.allocator = heap_allocator();
  1861. defer (array_free(&sel.index));
  1862. if (lookup_subtype_polymorphic_selection(t, src_type, &sel)) {
  1863. if (sel.entity == nullptr) {
  1864. GB_PANIC("invalid subtype cast %s -> ", type_to_string(src_type), type_to_string(t));
  1865. }
  1866. if (st_is_ptr) {
  1867. lbValue res = lb_emit_deep_field_gep(p, value, sel);
  1868. Type *rt = res.type;
  1869. if (!are_types_identical(rt, dt) && are_types_identical(type_deref(rt), dt)) {
  1870. res = lb_emit_load(p, res);
  1871. }
  1872. return res;
  1873. } else {
  1874. if (is_type_pointer(value.type)) {
  1875. Type *rt = value.type;
  1876. if (!are_types_identical(rt, dt) && are_types_identical(type_deref(rt), dt)) {
  1877. value = lb_emit_load(p, value);
  1878. } else {
  1879. value = lb_emit_deep_field_gep(p, value, sel);
  1880. return lb_emit_load(p, value);
  1881. }
  1882. }
  1883. return lb_emit_deep_field_ev(p, value, sel);
  1884. }
  1885. }
  1886. }
  1887. // Pointer <-> Pointer
  1888. if (is_type_pointer(src) && is_type_pointer(dst)) {
  1889. lbValue res = {};
  1890. res.type = t;
  1891. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1892. return res;
  1893. }
  1894. if (is_type_multi_pointer(src) && is_type_pointer(dst)) {
  1895. lbValue res = {};
  1896. res.type = t;
  1897. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1898. return res;
  1899. }
  1900. if (is_type_pointer(src) && is_type_multi_pointer(dst)) {
  1901. lbValue res = {};
  1902. res.type = t;
  1903. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1904. return res;
  1905. }
  1906. if (is_type_multi_pointer(src) && is_type_multi_pointer(dst)) {
  1907. lbValue res = {};
  1908. res.type = t;
  1909. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1910. return res;
  1911. }
  1912. // proc <-> proc
  1913. if (is_type_proc(src) && is_type_proc(dst)) {
  1914. lbValue res = {};
  1915. res.type = t;
  1916. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1917. return res;
  1918. }
  1919. // pointer -> proc
  1920. if (is_type_pointer(src) && is_type_proc(dst)) {
  1921. lbValue res = {};
  1922. res.type = t;
  1923. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1924. return res;
  1925. }
  1926. // proc -> pointer
  1927. if (is_type_proc(src) && is_type_pointer(dst)) {
  1928. lbValue res = {};
  1929. res.type = t;
  1930. res.value = LLVMBuildPointerCast(p->builder, value.value, lb_type(m, t), "");
  1931. return res;
  1932. }
  1933. // []byte/[]u8 <-> string
  1934. if (is_type_u8_slice(src) && is_type_string(dst)) {
  1935. return lb_emit_transmute(p, value, t);
  1936. }
  1937. if (is_type_string(src) && is_type_u8_slice(dst)) {
  1938. return lb_emit_transmute(p, value, t);
  1939. }
  1940. if (is_type_array_like(dst)) {
  1941. Type *elem = base_array_type(dst);
  1942. isize index_count = cast(isize)get_array_type_count(dst);
  1943. isize inlineable = type_size_of(dst) <= build_context.max_simd_align;
  1944. lbValue e = lb_emit_conv(p, value, elem);
  1945. if (inlineable && lb_is_const(e)) {
  1946. lbAddr v = {};
  1947. if (e.value) {
  1948. TEMPORARY_ALLOCATOR_GUARD();
  1949. LLVMValueRef *values = gb_alloc_array(temporary_allocator(), LLVMValueRef, index_count);
  1950. for (isize i = 0; i < index_count; i++) {
  1951. values[i] = e.value;
  1952. }
  1953. lbValue array_const_value = {};
  1954. array_const_value.type = t;
  1955. array_const_value.value = LLVMConstArray(lb_type(m, elem), values, cast(unsigned)index_count);
  1956. v = lb_add_global_generated(m, t, array_const_value);
  1957. } else {
  1958. v = lb_add_global_generated(m, t);
  1959. }
  1960. lb_make_global_private_const(v);
  1961. return lb_addr_load(p, v);
  1962. }
  1963. // NOTE(bill): Doesn't need to be zero because it will be initialized in the loops
  1964. lbAddr v = lb_add_local_generated(p, t, false);
  1965. if (!inlineable) {
  1966. auto loop_data = lb_loop_start(p, index_count, t_int);
  1967. lbValue elem = lb_emit_array_ep(p, v.addr, loop_data.idx);
  1968. lb_emit_store(p, elem, e);
  1969. lb_loop_end(p, loop_data);
  1970. } else {
  1971. for (isize i = 0; i < index_count; i++) {
  1972. lbValue elem = lb_emit_array_epi(p, v.addr, i);
  1973. lb_emit_store(p, elem, e);
  1974. }
  1975. }
  1976. return lb_addr_load(p, v);
  1977. }
  1978. if (is_type_matrix(dst) && !is_type_matrix(src)) {
  1979. GB_ASSERT_MSG(dst->Matrix.row_count == dst->Matrix.column_count, "%s <- %s", type_to_string(dst), type_to_string(src));
  1980. Type *elem = base_array_type(dst);
  1981. lbValue e = lb_emit_conv(p, value, elem);
  1982. lbAddr v = lb_add_local_generated(p, t, false);
  1983. lbValue zero = lb_const_value(p->module, elem, exact_value_i64(0), true);
  1984. for (i64 j = 0; j < dst->Matrix.column_count; j++) {
  1985. for (i64 i = 0; i < dst->Matrix.row_count; i++) {
  1986. lbValue ptr = lb_emit_matrix_epi(p, v.addr, i, j);
  1987. lb_emit_store(p, ptr, i == j ? e : zero);
  1988. }
  1989. }
  1990. return lb_addr_load(p, v);
  1991. }
  1992. if (is_type_matrix(dst) && is_type_matrix(src)) {
  1993. GB_ASSERT(dst->kind == Type_Matrix);
  1994. GB_ASSERT(src->kind == Type_Matrix);
  1995. lbAddr v = lb_add_local_generated(p, t, true);
  1996. if (is_matrix_square(dst) && is_matrix_square(dst)) {
  1997. for (i64 j = 0; j < dst->Matrix.column_count; j++) {
  1998. for (i64 i = 0; i < dst->Matrix.row_count; i++) {
  1999. if (i < src->Matrix.row_count && j < src->Matrix.column_count) {
  2000. lbValue d = lb_emit_matrix_epi(p, v.addr, i, j);
  2001. lbValue s = lb_emit_matrix_ev(p, value, i, j);
  2002. lb_emit_store(p, d, s);
  2003. } else if (i == j) {
  2004. lbValue d = lb_emit_matrix_epi(p, v.addr, i, j);
  2005. lbValue s = lb_const_value(p->module, dst->Matrix.elem, exact_value_i64(1), true);
  2006. lb_emit_store(p, d, s);
  2007. }
  2008. }
  2009. }
  2010. } else {
  2011. i64 dst_count = dst->Matrix.row_count*dst->Matrix.column_count;
  2012. i64 src_count = src->Matrix.row_count*src->Matrix.column_count;
  2013. GB_ASSERT(dst_count == src_count);
  2014. lbValue pdst = v.addr;
  2015. lbValue psrc = lb_address_from_load_or_generate_local(p, value);
  2016. bool same_elem_base_types = are_types_identical(
  2017. base_type(dst->Matrix.elem),
  2018. base_type(src->Matrix.elem)
  2019. );
  2020. if (same_elem_base_types && type_size_of(dst) == type_size_of(src)) {
  2021. lb_mem_copy_overlapping(p, v.addr, psrc, lb_const_int(p->module, t_int, type_size_of(dst)));
  2022. } else {
  2023. for (i64 i = 0; i < src_count; i++) {
  2024. lbValue dp = lb_emit_array_epi(p, v.addr, matrix_column_major_index_to_offset(dst, i));
  2025. lbValue sp = lb_emit_array_epi(p, psrc, matrix_column_major_index_to_offset(src, i));
  2026. lbValue s = lb_emit_load(p, sp);
  2027. s = lb_emit_conv(p, s, dst->Matrix.elem);
  2028. lb_emit_store(p, dp, s);
  2029. }
  2030. }
  2031. }
  2032. return lb_addr_load(p, v);
  2033. }
  2034. if (is_type_any(dst)) {
  2035. if (is_type_untyped_uninit(src)) {
  2036. return lb_const_undef(p->module, t);
  2037. }
  2038. if (is_type_untyped_nil(src)) {
  2039. return lb_const_nil(p->module, t);
  2040. }
  2041. lbAddr result = lb_add_local_generated(p, t, true);
  2042. Type *st = default_type(src_type);
  2043. lbValue data = lb_address_from_load_or_generate_local(p, value);
  2044. GB_ASSERT_MSG(is_type_pointer(data.type), "%s", type_to_string(data.type));
  2045. GB_ASSERT_MSG(is_type_typed(st), "%s", type_to_string(st));
  2046. data = lb_emit_conv(p, data, t_rawptr);
  2047. lbValue id = lb_typeid(p->module, st);
  2048. lbValue any_data = lb_emit_struct_ep(p, result.addr, 0);
  2049. lbValue any_id = lb_emit_struct_ep(p, result.addr, 1);
  2050. lb_emit_store(p, any_data, data);
  2051. lb_emit_store(p, any_id, id);
  2052. return lb_addr_load(p, result);
  2053. }
  2054. i64 src_sz = type_size_of(src);
  2055. i64 dst_sz = type_size_of(dst);
  2056. if (src_sz == dst_sz) {
  2057. // bit_set <-> integer
  2058. if (is_type_integer(src) && is_type_bit_set(dst)) {
  2059. lbValue res = lb_emit_conv(p, value, bit_set_to_int(dst));
  2060. res.type = t;
  2061. return res;
  2062. }
  2063. if (is_type_bit_set(src) && is_type_integer(dst)) {
  2064. lbValue bs = value;
  2065. bs.type = bit_set_to_int(src);
  2066. return lb_emit_conv(p, bs, dst);
  2067. }
  2068. // typeid <-> integer
  2069. if (is_type_integer(src) && is_type_typeid(dst)) {
  2070. return lb_emit_transmute(p, value, dst);
  2071. }
  2072. if (is_type_typeid(src) && is_type_integer(dst)) {
  2073. return lb_emit_transmute(p, value, dst);
  2074. }
  2075. }
  2076. if (is_type_untyped(src)) {
  2077. if (is_type_string(src) && is_type_string(dst)) {
  2078. lbAddr result = lb_add_local_generated(p, t, false);
  2079. lb_addr_store(p, result, value);
  2080. return lb_addr_load(p, result);
  2081. }
  2082. }
  2083. gb_printf_err("%.*s\n", LIT(p->name));
  2084. gb_printf_err("lb_emit_conv: src -> dst\n");
  2085. gb_printf_err("Not Identical %s != %s\n", type_to_string(src_type), type_to_string(t));
  2086. gb_printf_err("Not Identical %s != %s\n", type_to_string(src), type_to_string(dst));
  2087. gb_printf_err("Not Identical %p != %p\n", src_type, t);
  2088. gb_printf_err("Not Identical %p != %p\n", src, dst);
  2089. GB_PANIC("Invalid type conversion: '%s' to '%s' for procedure '%.*s'",
  2090. type_to_string(src_type), type_to_string(t),
  2091. LIT(p->name));
  2092. return {};
  2093. }
  2094. gb_internal lbValue lb_emit_c_vararg(lbProcedure *p, lbValue arg, Type *type) {
  2095. Type *core = core_type(type);
  2096. if (core->kind == Type_BitSet) {
  2097. core = core_type(bit_set_to_int(core));
  2098. arg = lb_emit_transmute(p, arg, core);
  2099. }
  2100. Type *promoted = c_vararg_promote_type(core);
  2101. return lb_emit_conv(p, arg, promoted);
  2102. }
  2103. gb_internal lbValue lb_compare_records(lbProcedure *p, TokenKind op_kind, lbValue left, lbValue right, Type *type) {
  2104. GB_ASSERT((is_type_struct(type) || is_type_union(type)) && is_type_comparable(type));
  2105. lbValue left_ptr = lb_address_from_load_or_generate_local(p, left);
  2106. lbValue right_ptr = lb_address_from_load_or_generate_local(p, right);
  2107. lbValue res = {};
  2108. if (type_size_of(type) == 0) {
  2109. switch (op_kind) {
  2110. case Token_CmpEq:
  2111. return lb_const_bool(p->module, t_bool, true);
  2112. case Token_NotEq:
  2113. return lb_const_bool(p->module, t_bool, false);
  2114. }
  2115. GB_PANIC("invalid operator");
  2116. }
  2117. TEMPORARY_ALLOCATOR_GUARD();
  2118. if (is_type_simple_compare(type)) {
  2119. // TODO(bill): Test to see if this is actually faster!!!!
  2120. auto args = array_make<lbValue>(temporary_allocator(), 3);
  2121. args[0] = lb_emit_conv(p, left_ptr, t_rawptr);
  2122. args[1] = lb_emit_conv(p, right_ptr, t_rawptr);
  2123. args[2] = lb_const_int(p->module, t_int, type_size_of(type));
  2124. res = lb_emit_runtime_call(p, "memory_equal", args);
  2125. } else {
  2126. lbValue value = lb_equal_proc_for_type(p->module, type);
  2127. auto args = array_make<lbValue>(temporary_allocator(), 2);
  2128. args[0] = lb_emit_conv(p, left_ptr, t_rawptr);
  2129. args[1] = lb_emit_conv(p, right_ptr, t_rawptr);
  2130. res = lb_emit_call(p, value, args);
  2131. }
  2132. if (op_kind == Token_NotEq) {
  2133. res = lb_emit_unary_arith(p, Token_Not, res, res.type);
  2134. }
  2135. return res;
  2136. }
  2137. gb_internal lbValue lb_emit_comp(lbProcedure *p, TokenKind op_kind, lbValue left, lbValue right) {
  2138. Type *a = core_type(left.type);
  2139. Type *b = core_type(right.type);
  2140. GB_ASSERT(gb_is_between(op_kind, Token__ComparisonBegin+1, Token__ComparisonEnd-1));
  2141. lbValue nil_check = {};
  2142. if (is_type_array_like(left.type) || is_type_array_like(right.type)) {
  2143. // don't do `nil` check if it is array-like
  2144. } else if (is_type_untyped_nil(left.type)) {
  2145. nil_check = lb_emit_comp_against_nil(p, op_kind, right);
  2146. } else if (is_type_untyped_nil(right.type)) {
  2147. nil_check = lb_emit_comp_against_nil(p, op_kind, left);
  2148. }
  2149. if (nil_check.value != nullptr) {
  2150. return nil_check;
  2151. }
  2152. if (are_types_identical(a, b)) {
  2153. // NOTE(bill): No need for a conversion
  2154. } else if (lb_is_const(left) || lb_is_const_nil(left)) {
  2155. if (lb_is_const_nil(left)) {
  2156. return lb_emit_comp_against_nil(p, op_kind, right);
  2157. }
  2158. left = lb_emit_conv(p, left, right.type);
  2159. } else if (lb_is_const(right) || lb_is_const_nil(right)) {
  2160. if (lb_is_const_nil(right)) {
  2161. return lb_emit_comp_against_nil(p, op_kind, left);
  2162. }
  2163. right = lb_emit_conv(p, right, left.type);
  2164. } else {
  2165. Type *lt = left.type;
  2166. Type *rt = right.type;
  2167. lt = left.type;
  2168. rt = right.type;
  2169. i64 ls = type_size_of(lt);
  2170. i64 rs = type_size_of(rt);
  2171. // NOTE(bill): Quick heuristic, larger types are usually the target type
  2172. if (ls < rs) {
  2173. left = lb_emit_conv(p, left, rt);
  2174. } else if (ls > rs) {
  2175. right = lb_emit_conv(p, right, lt);
  2176. } else {
  2177. if (is_type_union(rt)) {
  2178. left = lb_emit_conv(p, left, rt);
  2179. } else {
  2180. right = lb_emit_conv(p, right, lt);
  2181. }
  2182. }
  2183. }
  2184. a = core_type(left.type);
  2185. b = core_type(right.type);
  2186. if (is_type_matrix(a) && (op_kind == Token_CmpEq || op_kind == Token_NotEq)) {
  2187. Type *tl = base_type(a);
  2188. lbValue lhs = lb_address_from_load_or_generate_local(p, left);
  2189. lbValue rhs = lb_address_from_load_or_generate_local(p, right);
  2190. // TODO(bill): Test to see if this is actually faster!!!!
  2191. auto args = array_make<lbValue>(permanent_allocator(), 3);
  2192. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2193. args[1] = lb_emit_conv(p, rhs, t_rawptr);
  2194. args[2] = lb_const_int(p->module, t_int, type_size_of(tl));
  2195. lbValue val = lb_emit_runtime_call(p, "memory_compare", args);
  2196. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_nil(p->module, val.type));
  2197. return lb_emit_conv(p, res, t_bool);
  2198. }
  2199. if (is_type_array_like(a)) {
  2200. Type *tl = base_type(a);
  2201. lbValue lhs = lb_address_from_load_or_generate_local(p, left);
  2202. lbValue rhs = lb_address_from_load_or_generate_local(p, right);
  2203. TokenKind cmp_op = Token_And;
  2204. lbValue res = lb_const_bool(p->module, t_llvm_bool, true);
  2205. if (op_kind == Token_NotEq) {
  2206. res = lb_const_bool(p->module, t_llvm_bool, false);
  2207. cmp_op = Token_Or;
  2208. } else if (op_kind == Token_CmpEq) {
  2209. res = lb_const_bool(p->module, t_llvm_bool, true);
  2210. cmp_op = Token_And;
  2211. }
  2212. bool inline_array_arith = lb_can_try_to_inline_array_arith(tl);
  2213. i32 count = 0;
  2214. switch (tl->kind) {
  2215. case Type_Array: count = cast(i32)tl->Array.count; break;
  2216. case Type_EnumeratedArray: count = cast(i32)tl->EnumeratedArray.count; break;
  2217. }
  2218. if (inline_array_arith) {
  2219. // inline
  2220. lbAddr val = lb_add_local_generated(p, t_bool, false);
  2221. lb_addr_store(p, val, res);
  2222. for (i32 i = 0; i < count; i++) {
  2223. lbValue x = lb_emit_load(p, lb_emit_array_epi(p, lhs, i));
  2224. lbValue y = lb_emit_load(p, lb_emit_array_epi(p, rhs, i));
  2225. lbValue cmp = lb_emit_comp(p, op_kind, x, y);
  2226. lbValue new_res = lb_emit_arith(p, cmp_op, lb_addr_load(p, val), cmp, t_bool);
  2227. lb_addr_store(p, val, lb_emit_conv(p, new_res, t_bool));
  2228. }
  2229. return lb_addr_load(p, val);
  2230. } else {
  2231. if (is_type_simple_compare(tl) && (op_kind == Token_CmpEq || op_kind == Token_NotEq)) {
  2232. // TODO(bill): Test to see if this is actually faster!!!!
  2233. auto args = array_make<lbValue>(permanent_allocator(), 3);
  2234. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2235. args[1] = lb_emit_conv(p, rhs, t_rawptr);
  2236. args[2] = lb_const_int(p->module, t_int, type_size_of(tl));
  2237. lbValue val = lb_emit_runtime_call(p, "memory_compare", args);
  2238. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_nil(p->module, val.type));
  2239. return lb_emit_conv(p, res, t_bool);
  2240. } else {
  2241. lbAddr val = lb_add_local_generated(p, t_bool, false);
  2242. lb_addr_store(p, val, res);
  2243. auto loop_data = lb_loop_start(p, count, t_i32);
  2244. {
  2245. lbValue i = loop_data.idx;
  2246. lbValue x = lb_emit_load(p, lb_emit_array_ep(p, lhs, i));
  2247. lbValue y = lb_emit_load(p, lb_emit_array_ep(p, rhs, i));
  2248. lbValue cmp = lb_emit_comp(p, op_kind, x, y);
  2249. lbValue new_res = lb_emit_arith(p, cmp_op, lb_addr_load(p, val), cmp, t_bool);
  2250. lb_addr_store(p, val, lb_emit_conv(p, new_res, t_bool));
  2251. }
  2252. lb_loop_end(p, loop_data);
  2253. return lb_addr_load(p, val);
  2254. }
  2255. }
  2256. }
  2257. if ((is_type_struct(a) || is_type_union(a)) && is_type_comparable(a)) {
  2258. return lb_compare_records(p, op_kind, left, right, a);
  2259. }
  2260. if ((is_type_struct(b) || is_type_union(b)) && is_type_comparable(b)) {
  2261. return lb_compare_records(p, op_kind, left, right, b);
  2262. }
  2263. if (is_type_string(a)) {
  2264. if (is_type_cstring(a) && is_type_cstring(b)) {
  2265. left = lb_emit_conv(p, left, t_cstring);
  2266. right = lb_emit_conv(p, right, t_cstring);
  2267. char const *runtime_procedure = nullptr;
  2268. switch (op_kind) {
  2269. case Token_CmpEq: runtime_procedure = "cstring_eq"; break;
  2270. case Token_NotEq: runtime_procedure = "cstring_ne"; break;
  2271. case Token_Lt: runtime_procedure = "cstring_lt"; break;
  2272. case Token_Gt: runtime_procedure = "cstring_gt"; break;
  2273. case Token_LtEq: runtime_procedure = "cstring_le"; break;
  2274. case Token_GtEq: runtime_procedure = "cstring_ge"; break;
  2275. }
  2276. GB_ASSERT(runtime_procedure != nullptr);
  2277. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2278. args[0] = left;
  2279. args[1] = right;
  2280. return lb_emit_runtime_call(p, runtime_procedure, args);
  2281. }
  2282. if (is_type_cstring(a) ^ is_type_cstring(b)) {
  2283. left = lb_emit_conv(p, left, t_string);
  2284. right = lb_emit_conv(p, right, t_string);
  2285. }
  2286. char const *runtime_procedure = nullptr;
  2287. switch (op_kind) {
  2288. case Token_CmpEq: runtime_procedure = "string_eq"; break;
  2289. case Token_NotEq: runtime_procedure = "string_ne"; break;
  2290. case Token_Lt: runtime_procedure = "string_lt"; break;
  2291. case Token_Gt: runtime_procedure = "string_gt"; break;
  2292. case Token_LtEq: runtime_procedure = "string_le"; break;
  2293. case Token_GtEq: runtime_procedure = "string_ge"; break;
  2294. }
  2295. GB_ASSERT(runtime_procedure != nullptr);
  2296. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2297. args[0] = left;
  2298. args[1] = right;
  2299. return lb_emit_runtime_call(p, runtime_procedure, args);
  2300. }
  2301. if (is_type_complex(a)) {
  2302. char const *runtime_procedure = "";
  2303. i64 sz = 8*type_size_of(a);
  2304. switch (sz) {
  2305. case 32:
  2306. switch (op_kind) {
  2307. case Token_CmpEq: runtime_procedure = "complex32_eq"; break;
  2308. case Token_NotEq: runtime_procedure = "complex32_ne"; break;
  2309. }
  2310. break;
  2311. case 64:
  2312. switch (op_kind) {
  2313. case Token_CmpEq: runtime_procedure = "complex64_eq"; break;
  2314. case Token_NotEq: runtime_procedure = "complex64_ne"; break;
  2315. }
  2316. break;
  2317. case 128:
  2318. switch (op_kind) {
  2319. case Token_CmpEq: runtime_procedure = "complex128_eq"; break;
  2320. case Token_NotEq: runtime_procedure = "complex128_ne"; break;
  2321. }
  2322. break;
  2323. }
  2324. GB_ASSERT(runtime_procedure != nullptr);
  2325. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2326. args[0] = left;
  2327. args[1] = right;
  2328. return lb_emit_runtime_call(p, runtime_procedure, args);
  2329. }
  2330. if (is_type_quaternion(a)) {
  2331. char const *runtime_procedure = "";
  2332. i64 sz = 8*type_size_of(a);
  2333. switch (sz) {
  2334. case 64:
  2335. switch (op_kind) {
  2336. case Token_CmpEq: runtime_procedure = "quaternion64_eq"; break;
  2337. case Token_NotEq: runtime_procedure = "quaternion64_ne"; break;
  2338. }
  2339. break;
  2340. case 128:
  2341. switch (op_kind) {
  2342. case Token_CmpEq: runtime_procedure = "quaternion128_eq"; break;
  2343. case Token_NotEq: runtime_procedure = "quaternion128_ne"; break;
  2344. }
  2345. break;
  2346. case 256:
  2347. switch (op_kind) {
  2348. case Token_CmpEq: runtime_procedure = "quaternion256_eq"; break;
  2349. case Token_NotEq: runtime_procedure = "quaternion256_ne"; break;
  2350. }
  2351. break;
  2352. }
  2353. GB_ASSERT(runtime_procedure != nullptr);
  2354. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2355. args[0] = left;
  2356. args[1] = right;
  2357. return lb_emit_runtime_call(p, runtime_procedure, args);
  2358. }
  2359. if (is_type_bit_set(a)) {
  2360. switch (op_kind) {
  2361. case Token_Lt:
  2362. case Token_LtEq:
  2363. case Token_Gt:
  2364. case Token_GtEq:
  2365. {
  2366. Type *it = bit_set_to_int(a);
  2367. lbValue lhs = lb_emit_transmute(p, left, it);
  2368. lbValue rhs = lb_emit_transmute(p, right, it);
  2369. lbValue res = lb_emit_arith(p, Token_And, lhs, rhs, it);
  2370. if (op_kind == Token_Lt || op_kind == Token_LtEq) {
  2371. // (lhs & rhs) == lhs
  2372. res.value = LLVMBuildICmp(p->builder, LLVMIntEQ, res.value, lhs.value, "");
  2373. res.type = t_llvm_bool;
  2374. } else if (op_kind == Token_Gt || op_kind == Token_GtEq) {
  2375. // (lhs & rhs) == rhs
  2376. res.value = LLVMBuildICmp(p->builder, LLVMIntEQ, res.value, rhs.value, "");
  2377. res.type = t_llvm_bool;
  2378. }
  2379. // NOTE(bill): Strict subsets
  2380. if (op_kind == Token_Lt || op_kind == Token_Gt) {
  2381. // res &~ (lhs == rhs)
  2382. lbValue eq = {};
  2383. eq.value = LLVMBuildICmp(p->builder, LLVMIntEQ, lhs.value, rhs.value, "");
  2384. eq.type = t_llvm_bool;
  2385. res = lb_emit_arith(p, Token_AndNot, res, eq, t_llvm_bool);
  2386. }
  2387. return res;
  2388. }
  2389. case Token_CmpEq:
  2390. case Token_NotEq:
  2391. {
  2392. LLVMIntPredicate pred = {};
  2393. switch (op_kind) {
  2394. case Token_CmpEq: pred = LLVMIntEQ; break;
  2395. case Token_NotEq: pred = LLVMIntNE; break;
  2396. }
  2397. lbValue res = {};
  2398. res.type = t_llvm_bool;
  2399. res.value = LLVMBuildICmp(p->builder, pred, left.value, right.value, "");
  2400. return res;
  2401. }
  2402. }
  2403. }
  2404. if (op_kind != Token_CmpEq && op_kind != Token_NotEq) {
  2405. Type *t = left.type;
  2406. if (is_type_integer(t) && is_type_different_to_arch_endianness(t)) {
  2407. Type *platform_type = integer_endian_type_to_platform_type(t);
  2408. lbValue x = lb_emit_byte_swap(p, left, platform_type);
  2409. lbValue y = lb_emit_byte_swap(p, right, platform_type);
  2410. left = x;
  2411. right = y;
  2412. } else if (is_type_float(t) && is_type_different_to_arch_endianness(t)) {
  2413. Type *platform_type = integer_endian_type_to_platform_type(t);
  2414. lbValue x = lb_emit_conv(p, left, platform_type);
  2415. lbValue y = lb_emit_conv(p, right, platform_type);
  2416. left = x;
  2417. right = y;
  2418. }
  2419. }
  2420. a = core_type(left.type);
  2421. b = core_type(right.type);
  2422. lbValue res = {};
  2423. res.type = t_llvm_bool;
  2424. if (is_type_integer(a) ||
  2425. is_type_boolean(a) ||
  2426. is_type_pointer(a) ||
  2427. is_type_multi_pointer(a) ||
  2428. is_type_proc(a) ||
  2429. is_type_enum(a)) {
  2430. LLVMIntPredicate pred = {};
  2431. if (is_type_unsigned(left.type)) {
  2432. switch (op_kind) {
  2433. case Token_Gt: pred = LLVMIntUGT; break;
  2434. case Token_GtEq: pred = LLVMIntUGE; break;
  2435. case Token_Lt: pred = LLVMIntULT; break;
  2436. case Token_LtEq: pred = LLVMIntULE; break;
  2437. }
  2438. } else {
  2439. switch (op_kind) {
  2440. case Token_Gt: pred = LLVMIntSGT; break;
  2441. case Token_GtEq: pred = LLVMIntSGE; break;
  2442. case Token_Lt: pred = LLVMIntSLT; break;
  2443. case Token_LtEq: pred = LLVMIntSLE; break;
  2444. }
  2445. }
  2446. switch (op_kind) {
  2447. case Token_CmpEq: pred = LLVMIntEQ; break;
  2448. case Token_NotEq: pred = LLVMIntNE; break;
  2449. }
  2450. LLVMValueRef lhs = left.value;
  2451. LLVMValueRef rhs = right.value;
  2452. if (LLVMTypeOf(lhs) != LLVMTypeOf(rhs)) {
  2453. if (lb_is_type_kind(LLVMTypeOf(lhs), LLVMPointerTypeKind)) {
  2454. rhs = LLVMBuildPointerCast(p->builder, rhs, LLVMTypeOf(lhs), "");
  2455. }
  2456. }
  2457. res.value = LLVMBuildICmp(p->builder, pred, lhs, rhs, "");
  2458. } else if (is_type_float(a)) {
  2459. LLVMRealPredicate pred = {};
  2460. switch (op_kind) {
  2461. case Token_CmpEq: pred = LLVMRealOEQ; break;
  2462. case Token_Gt: pred = LLVMRealOGT; break;
  2463. case Token_GtEq: pred = LLVMRealOGE; break;
  2464. case Token_Lt: pred = LLVMRealOLT; break;
  2465. case Token_LtEq: pred = LLVMRealOLE; break;
  2466. case Token_NotEq: pred = LLVMRealONE; break;
  2467. }
  2468. res.value = LLVMBuildFCmp(p->builder, pred, left.value, right.value, "");
  2469. } else if (is_type_typeid(a)) {
  2470. LLVMIntPredicate pred = {};
  2471. switch (op_kind) {
  2472. case Token_Gt: pred = LLVMIntUGT; break;
  2473. case Token_GtEq: pred = LLVMIntUGE; break;
  2474. case Token_Lt: pred = LLVMIntULT; break;
  2475. case Token_LtEq: pred = LLVMIntULE; break;
  2476. case Token_CmpEq: pred = LLVMIntEQ; break;
  2477. case Token_NotEq: pred = LLVMIntNE; break;
  2478. }
  2479. res.value = LLVMBuildICmp(p->builder, pred, left.value, right.value, "");
  2480. } else if (is_type_simd_vector(a)) {
  2481. LLVMValueRef mask = nullptr;
  2482. Type *elem = base_array_type(a);
  2483. if (is_type_float(elem)) {
  2484. LLVMRealPredicate pred = {};
  2485. switch (op_kind) {
  2486. case Token_CmpEq: pred = LLVMRealOEQ; break;
  2487. case Token_NotEq: pred = LLVMRealONE; break;
  2488. }
  2489. mask = LLVMBuildFCmp(p->builder, pred, left.value, right.value, "");
  2490. } else {
  2491. LLVMIntPredicate pred = {};
  2492. switch (op_kind) {
  2493. case Token_CmpEq: pred = LLVMIntEQ; break;
  2494. case Token_NotEq: pred = LLVMIntNE; break;
  2495. }
  2496. mask = LLVMBuildICmp(p->builder, pred, left.value, right.value, "");
  2497. }
  2498. GB_ASSERT_MSG(mask != nullptr, "Unhandled comparison kind %s (%s) %.*s %s (%s)", type_to_string(left.type), type_to_string(base_type(left.type)), LIT(token_strings[op_kind]), type_to_string(right.type), type_to_string(base_type(right.type)));
  2499. /* NOTE(bill, 2022-05-28):
  2500. Thanks to Per Vognsen, sign extending <N x i1> to
  2501. a vector of the same width as the input vector, bit casting to an integer,
  2502. and then comparing against zero is the better option
  2503. See: https://lists.llvm.org/pipermail/llvm-dev/2012-September/053046.html
  2504. // Example assuming 128-bit vector
  2505. %1 = <4 x float> ...
  2506. %2 = <4 x float> ...
  2507. %3 = fcmp oeq <4 x float> %1, %2
  2508. %4 = sext <4 x i1> %3 to <4 x i32>
  2509. %5 = bitcast <4 x i32> %4 to i128
  2510. %6 = icmp ne i128 %5, 0
  2511. br i1 %6, label %true1, label %false2
  2512. This will result in 1 cmpps + 1 ptest + 1 br
  2513. (even without SSE4.1, contrary to what the mail list states, because of pmovmskb)
  2514. */
  2515. unsigned count = cast(unsigned)get_array_type_count(a);
  2516. unsigned elem_sz = cast(unsigned)(type_size_of(elem)*8);
  2517. LLVMTypeRef mask_type = LLVMVectorType(LLVMIntTypeInContext(p->module->ctx, elem_sz), count);
  2518. mask = LLVMBuildSExtOrBitCast(p->builder, mask, mask_type, "");
  2519. LLVMTypeRef mask_int_type = LLVMIntTypeInContext(p->module->ctx, cast(unsigned)(8*type_size_of(a)));
  2520. LLVMValueRef mask_int = LLVMBuildBitCast(p->builder, mask, mask_int_type, "");
  2521. res.value = LLVMBuildICmp(p->builder, LLVMIntNE, mask_int, LLVMConstNull(LLVMTypeOf(mask_int)), "");
  2522. return res;
  2523. } else {
  2524. GB_PANIC("Unhandled comparison kind %s (%s) %.*s %s (%s)", type_to_string(left.type), type_to_string(base_type(left.type)), LIT(token_strings[op_kind]), type_to_string(right.type), type_to_string(base_type(right.type)));
  2525. }
  2526. return res;
  2527. }
  2528. gb_internal lbValue lb_emit_comp_against_nil(lbProcedure *p, TokenKind op_kind, lbValue x) {
  2529. lbValue res = {};
  2530. res.type = t_llvm_bool;
  2531. Type *t = x.type;
  2532. Type *bt = base_type(t);
  2533. TypeKind type_kind = bt->kind;
  2534. switch (type_kind) {
  2535. case Type_Basic:
  2536. switch (bt->Basic.kind) {
  2537. case Basic_rawptr:
  2538. case Basic_cstring:
  2539. if (op_kind == Token_CmpEq) {
  2540. res.value = LLVMBuildIsNull(p->builder, x.value, "");
  2541. } else if (op_kind == Token_NotEq) {
  2542. res.value = LLVMBuildIsNotNull(p->builder, x.value, "");
  2543. }
  2544. return res;
  2545. case Basic_any:
  2546. {
  2547. // TODO(bill): is this correct behaviour for nil comparison for any?
  2548. lbValue data = lb_emit_struct_ev(p, x, 0);
  2549. lbValue ti = lb_emit_struct_ev(p, x, 1);
  2550. if (op_kind == Token_CmpEq) {
  2551. LLVMValueRef a = LLVMBuildIsNull(p->builder, data.value, "");
  2552. LLVMValueRef b = LLVMBuildIsNull(p->builder, ti.value, "");
  2553. res.value = LLVMBuildOr(p->builder, a, b, "");
  2554. return res;
  2555. } else if (op_kind == Token_NotEq) {
  2556. LLVMValueRef a = LLVMBuildIsNotNull(p->builder, data.value, "");
  2557. LLVMValueRef b = LLVMBuildIsNotNull(p->builder, ti.value, "");
  2558. res.value = LLVMBuildAnd(p->builder, a, b, "");
  2559. return res;
  2560. }
  2561. }
  2562. break;
  2563. case Basic_typeid:
  2564. lbValue invalid_typeid = lb_const_value(p->module, t_typeid, exact_value_i64(0));
  2565. return lb_emit_comp(p, op_kind, x, invalid_typeid);
  2566. }
  2567. break;
  2568. case Type_Enum:
  2569. case Type_Pointer:
  2570. case Type_MultiPointer:
  2571. case Type_Proc:
  2572. if (op_kind == Token_CmpEq) {
  2573. res.value = LLVMBuildIsNull(p->builder, x.value, "");
  2574. } else if (op_kind == Token_NotEq) {
  2575. res.value = LLVMBuildIsNotNull(p->builder, x.value, "");
  2576. }
  2577. return res;
  2578. case Type_BitSet:
  2579. {
  2580. Type *u = bit_set_to_int(bt);
  2581. if (is_type_array(u)) {
  2582. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2583. lbValue lhs = lb_address_from_load_or_generate_local(p, x);
  2584. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2585. args[1] = lb_const_int(p->module, t_int, type_size_of(t));
  2586. lbValue val = lb_emit_runtime_call(p, "memory_compare_zero", args);
  2587. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_int(p->module, t_int, 0));
  2588. return res;
  2589. } else {
  2590. if (op_kind == Token_CmpEq) {
  2591. res.value = LLVMBuildIsNull(p->builder, x.value, "");
  2592. } else if (op_kind == Token_NotEq) {
  2593. res.value = LLVMBuildIsNotNull(p->builder, x.value, "");
  2594. }
  2595. }
  2596. return res;
  2597. }
  2598. case Type_Slice:
  2599. {
  2600. lbValue data = lb_emit_struct_ev(p, x, 0);
  2601. if (op_kind == Token_CmpEq) {
  2602. res.value = LLVMBuildIsNull(p->builder, data.value, "");
  2603. return res;
  2604. } else if (op_kind == Token_NotEq) {
  2605. res.value = LLVMBuildIsNotNull(p->builder, data.value, "");
  2606. return res;
  2607. }
  2608. }
  2609. break;
  2610. case Type_DynamicArray:
  2611. {
  2612. lbValue data = lb_emit_struct_ev(p, x, 0);
  2613. if (op_kind == Token_CmpEq) {
  2614. res.value = LLVMBuildIsNull(p->builder, data.value, "");
  2615. return res;
  2616. } else if (op_kind == Token_NotEq) {
  2617. res.value = LLVMBuildIsNotNull(p->builder, data.value, "");
  2618. return res;
  2619. }
  2620. }
  2621. break;
  2622. case Type_Map:
  2623. {
  2624. lbValue data_ptr = lb_emit_struct_ev(p, x, 0);
  2625. if (op_kind == Token_CmpEq) {
  2626. res.value = LLVMBuildIsNull(p->builder, data_ptr.value, "");
  2627. return res;
  2628. } else {
  2629. res.value = LLVMBuildIsNotNull(p->builder, data_ptr.value, "");
  2630. return res;
  2631. }
  2632. }
  2633. break;
  2634. case Type_Union:
  2635. {
  2636. if (type_size_of(t) == 0) {
  2637. if (op_kind == Token_CmpEq) {
  2638. return lb_const_bool(p->module, t_llvm_bool, true);
  2639. } else if (op_kind == Token_NotEq) {
  2640. return lb_const_bool(p->module, t_llvm_bool, false);
  2641. }
  2642. } else if (is_type_union_maybe_pointer(t)) {
  2643. lbValue tag = lb_emit_transmute(p, x, t_rawptr);
  2644. return lb_emit_comp_against_nil(p, op_kind, tag);
  2645. } else {
  2646. lbValue tag = lb_emit_union_tag_value(p, x);
  2647. return lb_emit_comp(p, op_kind, tag, lb_zero(p->module, tag.type));
  2648. }
  2649. }
  2650. case Type_Struct:
  2651. if (is_type_soa_struct(t)) {
  2652. Type *bt = base_type(t);
  2653. if (bt->Struct.soa_kind == StructSoa_Slice) {
  2654. LLVMValueRef the_value = {};
  2655. if (bt->Struct.fields.count == 0) {
  2656. lbValue len = lb_soa_struct_len(p, x);
  2657. the_value = len.value;
  2658. } else {
  2659. lbValue first_field = lb_emit_struct_ev(p, x, 0);
  2660. the_value = first_field.value;
  2661. }
  2662. if (op_kind == Token_CmpEq) {
  2663. res.value = LLVMBuildIsNull(p->builder, the_value, "");
  2664. return res;
  2665. } else if (op_kind == Token_NotEq) {
  2666. res.value = LLVMBuildIsNotNull(p->builder, the_value, "");
  2667. return res;
  2668. }
  2669. } else if (bt->Struct.soa_kind == StructSoa_Dynamic) {
  2670. LLVMValueRef the_value = {};
  2671. if (bt->Struct.fields.count == 0) {
  2672. lbValue cap = lb_soa_struct_cap(p, x);
  2673. the_value = cap.value;
  2674. } else {
  2675. lbValue first_field = lb_emit_struct_ev(p, x, 0);
  2676. the_value = first_field.value;
  2677. }
  2678. if (op_kind == Token_CmpEq) {
  2679. res.value = LLVMBuildIsNull(p->builder, the_value, "");
  2680. return res;
  2681. } else if (op_kind == Token_NotEq) {
  2682. res.value = LLVMBuildIsNotNull(p->builder, the_value, "");
  2683. return res;
  2684. }
  2685. }
  2686. } else if (is_type_struct(t) && type_has_nil(t)) {
  2687. auto args = array_make<lbValue>(permanent_allocator(), 2);
  2688. lbValue lhs = lb_address_from_load_or_generate_local(p, x);
  2689. args[0] = lb_emit_conv(p, lhs, t_rawptr);
  2690. args[1] = lb_const_int(p->module, t_int, type_size_of(t));
  2691. lbValue val = lb_emit_runtime_call(p, "memory_compare_zero", args);
  2692. lbValue res = lb_emit_comp(p, op_kind, val, lb_const_int(p->module, t_int, 0));
  2693. return res;
  2694. }
  2695. break;
  2696. }
  2697. GB_PANIC("Unknown handled type: %s -> %s", type_to_string(t), type_to_string(bt));
  2698. return {};
  2699. }
  2700. gb_internal lbValue lb_build_unary_and(lbProcedure *p, Ast *expr) {
  2701. ast_node(ue, UnaryExpr, expr);
  2702. auto tv = type_and_value_of_expr(expr);
  2703. Ast *ue_expr = unparen_expr(ue->expr);
  2704. if (ue_expr->kind == Ast_IndexExpr && tv.mode == Addressing_OptionalOkPtr && is_type_tuple(tv.type)) {
  2705. Type *tuple = tv.type;
  2706. Type *map_type = type_of_expr(ue_expr->IndexExpr.expr);
  2707. Type *ot = base_type(map_type);
  2708. Type *t = base_type(type_deref(ot));
  2709. bool deref = t != ot;
  2710. GB_ASSERT(t->kind == Type_Map);
  2711. ast_node(ie, IndexExpr, ue_expr);
  2712. lbValue map_val = lb_build_addr_ptr(p, ie->expr);
  2713. if (deref) {
  2714. map_val = lb_emit_load(p, map_val);
  2715. }
  2716. lbValue key = lb_build_expr(p, ie->index);
  2717. key = lb_emit_conv(p, key, t->Map.key);
  2718. lbAddr addr = lb_addr_map(map_val, key, t, alloc_type_pointer(t->Map.value));
  2719. lbValue ptr = lb_addr_get_ptr(p, addr);
  2720. lbValue ok = lb_emit_comp_against_nil(p, Token_NotEq, ptr);
  2721. ok = lb_emit_conv(p, ok, tuple->Tuple.variables[1]->type);
  2722. lbAddr res = lb_add_local_generated(p, tuple, false);
  2723. lbValue gep0 = lb_emit_struct_ep(p, res.addr, 0);
  2724. lbValue gep1 = lb_emit_struct_ep(p, res.addr, 1);
  2725. lb_emit_store(p, gep0, ptr);
  2726. lb_emit_store(p, gep1, ok);
  2727. return lb_addr_load(p, res);
  2728. } else if (is_type_soa_pointer(tv.type)) {
  2729. ast_node(ie, IndexExpr, ue_expr);
  2730. lbValue addr = lb_build_addr_ptr(p, ie->expr);
  2731. if (is_type_pointer(type_deref(addr.type))) {
  2732. addr = lb_emit_load(p, addr);
  2733. }
  2734. GB_ASSERT(is_type_pointer(addr.type));
  2735. lbValue index = lb_build_expr(p, ie->index);
  2736. if (!build_context.no_bounds_check) {
  2737. // TODO(bill): soa bounds checking
  2738. }
  2739. return lb_make_soa_pointer(p, tv.type, addr, index);
  2740. } else if (ue_expr->kind == Ast_CompoundLit) {
  2741. lbValue v = lb_build_expr(p, ue->expr);
  2742. Type *type = v.type;
  2743. lbAddr addr = {};
  2744. if (p->is_startup) {
  2745. addr = lb_add_global_generated(p->module, type, v);
  2746. } else {
  2747. addr = lb_add_local_generated(p, type, false);
  2748. }
  2749. lb_addr_store(p, addr, v);
  2750. return addr.addr;
  2751. } else if (ue_expr->kind == Ast_TypeAssertion) {
  2752. if (is_type_tuple(tv.type)) {
  2753. Type *tuple = tv.type;
  2754. Type *ptr_type = tuple->Tuple.variables[0]->type;
  2755. Type *ok_type = tuple->Tuple.variables[1]->type;
  2756. ast_node(ta, TypeAssertion, ue_expr);
  2757. TokenPos pos = ast_token(expr).pos;
  2758. Type *type = type_of_expr(ue_expr);
  2759. GB_ASSERT(!is_type_tuple(type));
  2760. lbValue e = lb_build_expr(p, ta->expr);
  2761. Type *t = type_deref(e.type);
  2762. if (is_type_union(t)) {
  2763. lbValue v = e;
  2764. if (!is_type_pointer(v.type)) {
  2765. v = lb_address_from_load_or_generate_local(p, v);
  2766. }
  2767. Type *src_type = type_deref(v.type);
  2768. Type *dst_type = type;
  2769. lbValue src_tag = {};
  2770. lbValue dst_tag = {};
  2771. if (is_type_union_maybe_pointer(src_type)) {
  2772. src_tag = lb_emit_comp_against_nil(p, Token_NotEq, v);
  2773. dst_tag = lb_const_bool(p->module, t_bool, true);
  2774. } else {
  2775. src_tag = lb_emit_load(p, lb_emit_union_tag_ptr(p, v));
  2776. dst_tag = lb_const_union_tag(p->module, src_type, dst_type);
  2777. }
  2778. lbValue ok = lb_emit_comp(p, Token_CmpEq, src_tag, dst_tag);
  2779. lbValue data_ptr = lb_emit_conv(p, v, ptr_type);
  2780. lbAddr res = lb_add_local_generated(p, tuple, true);
  2781. lbValue gep0 = lb_emit_struct_ep(p, res.addr, 0);
  2782. lbValue gep1 = lb_emit_struct_ep(p, res.addr, 1);
  2783. lb_emit_store(p, gep0, lb_emit_select(p, ok, data_ptr, lb_const_nil(p->module, ptr_type)));
  2784. lb_emit_store(p, gep1, lb_emit_conv(p, ok, ok_type));
  2785. return lb_addr_load(p, res);
  2786. } else if (is_type_any(t)) {
  2787. lbValue v = e;
  2788. if (is_type_pointer(v.type)) {
  2789. v = lb_emit_load(p, v);
  2790. }
  2791. lbValue data_ptr = lb_emit_conv(p, lb_emit_struct_ev(p, v, 0), ptr_type);
  2792. lbValue any_id = lb_emit_struct_ev(p, v, 1);
  2793. lbValue id = lb_typeid(p->module, type);
  2794. lbValue ok = lb_emit_comp(p, Token_CmpEq, any_id, id);
  2795. lbAddr res = lb_add_local_generated(p, tuple, false);
  2796. lbValue gep0 = lb_emit_struct_ep(p, res.addr, 0);
  2797. lbValue gep1 = lb_emit_struct_ep(p, res.addr, 1);
  2798. lb_emit_store(p, gep0, lb_emit_select(p, ok, data_ptr, lb_const_nil(p->module, ptr_type)));
  2799. lb_emit_store(p, gep1, lb_emit_conv(p, ok, ok_type));
  2800. return lb_addr_load(p, res);
  2801. } else {
  2802. GB_PANIC("TODO(bill): type assertion %s", type_to_string(type));
  2803. }
  2804. } else {
  2805. GB_ASSERT(is_type_pointer(tv.type));
  2806. ast_node(ta, TypeAssertion, ue_expr);
  2807. TokenPos pos = ast_token(expr).pos;
  2808. Type *type = type_of_expr(ue_expr);
  2809. GB_ASSERT(!is_type_tuple(type));
  2810. lbValue e = lb_build_expr(p, ta->expr);
  2811. Type *t = type_deref(e.type);
  2812. if (is_type_union(t)) {
  2813. lbValue v = e;
  2814. if (!is_type_pointer(v.type)) {
  2815. v = lb_address_from_load_or_generate_local(p, v);
  2816. }
  2817. Type *src_type = type_deref(v.type);
  2818. Type *dst_type = type;
  2819. if (!build_context.no_type_assert && (p->state_flags & StateFlag_no_type_assert) == 0) {
  2820. lbValue src_tag = {};
  2821. lbValue dst_tag = {};
  2822. if (is_type_union_maybe_pointer(src_type)) {
  2823. src_tag = lb_emit_comp_against_nil(p, Token_NotEq, v);
  2824. dst_tag = lb_const_bool(p->module, t_bool, true);
  2825. } else {
  2826. src_tag = lb_emit_load(p, lb_emit_union_tag_ptr(p, v));
  2827. dst_tag = lb_const_union_tag(p->module, src_type, dst_type);
  2828. }
  2829. isize arg_count = 6;
  2830. if (build_context.no_rtti) {
  2831. arg_count = 4;
  2832. }
  2833. lbValue ok = lb_emit_comp(p, Token_CmpEq, src_tag, dst_tag);
  2834. auto args = array_make<lbValue>(permanent_allocator(), arg_count);
  2835. args[0] = ok;
  2836. args[1] = lb_find_or_add_entity_string(p->module, get_file_path_string(pos.file_id));
  2837. args[2] = lb_const_int(p->module, t_i32, pos.line);
  2838. args[3] = lb_const_int(p->module, t_i32, pos.column);
  2839. if (!build_context.no_rtti) {
  2840. args[4] = lb_typeid(p->module, src_type);
  2841. args[5] = lb_typeid(p->module, dst_type);
  2842. }
  2843. lb_emit_runtime_call(p, "type_assertion_check", args);
  2844. }
  2845. lbValue data_ptr = v;
  2846. return lb_emit_conv(p, data_ptr, tv.type);
  2847. } else if (is_type_any(t)) {
  2848. lbValue v = e;
  2849. if (is_type_pointer(v.type)) {
  2850. v = lb_emit_load(p, v);
  2851. }
  2852. lbValue data_ptr = lb_emit_struct_ev(p, v, 0);
  2853. if (!build_context.no_type_assert && (p->state_flags & StateFlag_no_type_assert) == 0) {
  2854. GB_ASSERT(!build_context.no_rtti);
  2855. lbValue any_id = lb_emit_struct_ev(p, v, 1);
  2856. lbValue id = lb_typeid(p->module, type);
  2857. lbValue ok = lb_emit_comp(p, Token_CmpEq, any_id, id);
  2858. auto args = array_make<lbValue>(permanent_allocator(), 6);
  2859. args[0] = ok;
  2860. args[1] = lb_find_or_add_entity_string(p->module, get_file_path_string(pos.file_id));
  2861. args[2] = lb_const_int(p->module, t_i32, pos.line);
  2862. args[3] = lb_const_int(p->module, t_i32, pos.column);
  2863. args[4] = any_id;
  2864. args[5] = id;
  2865. lb_emit_runtime_call(p, "type_assertion_check", args);
  2866. }
  2867. return lb_emit_conv(p, data_ptr, tv.type);
  2868. } else {
  2869. GB_PANIC("TODO(bill): type assertion %s", type_to_string(type));
  2870. }
  2871. }
  2872. }
  2873. return lb_build_addr_ptr(p, ue->expr);
  2874. }
  2875. gb_internal lbValue lb_build_expr_internal(lbProcedure *p, Ast *expr);
  2876. gb_internal lbValue lb_build_expr(lbProcedure *p, Ast *expr) {
  2877. u16 prev_state_flags = p->state_flags;
  2878. defer (p->state_flags = prev_state_flags);
  2879. if (expr->state_flags != 0) {
  2880. u16 in = expr->state_flags;
  2881. u16 out = p->state_flags;
  2882. if (in & StateFlag_bounds_check) {
  2883. out |= StateFlag_bounds_check;
  2884. out &= ~StateFlag_no_bounds_check;
  2885. } else if (in & StateFlag_no_bounds_check) {
  2886. out |= StateFlag_no_bounds_check;
  2887. out &= ~StateFlag_bounds_check;
  2888. }
  2889. if (in & StateFlag_type_assert) {
  2890. out |= StateFlag_type_assert;
  2891. out &= ~StateFlag_no_type_assert;
  2892. } else if (in & StateFlag_no_type_assert) {
  2893. out |= StateFlag_no_type_assert;
  2894. out &= ~StateFlag_type_assert;
  2895. }
  2896. p->state_flags = out;
  2897. }
  2898. // IMPORTANT NOTE(bill):
  2899. // Selector Call Expressions (foo->bar(...))
  2900. // must only evaluate `foo` once as it gets transformed into
  2901. // `foo.bar(foo, ...)`
  2902. // And if `foo` is a procedure call or something more complex, storing the value
  2903. // once is a very good idea
  2904. // If a stored value is found, it must be removed from the cache
  2905. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  2906. lbValue *pp = map_get(&p->selector_values, expr);
  2907. if (pp != nullptr) {
  2908. lbValue res = *pp;
  2909. map_remove(&p->selector_values, expr);
  2910. return res;
  2911. }
  2912. lbAddr *pa = map_get(&p->selector_addr, expr);
  2913. if (pa != nullptr) {
  2914. lbAddr res = *pa;
  2915. map_remove(&p->selector_addr, expr);
  2916. return lb_addr_load(p, res);
  2917. }
  2918. }
  2919. lbValue res = lb_build_expr_internal(p, expr);
  2920. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  2921. map_set(&p->selector_values, expr, res);
  2922. }
  2923. return res;
  2924. }
  2925. gb_internal lbValue lb_build_expr_internal(lbProcedure *p, Ast *expr) {
  2926. lbModule *m = p->module;
  2927. expr = unparen_expr(expr);
  2928. TokenPos expr_pos = ast_token(expr).pos;
  2929. TypeAndValue tv = type_and_value_of_expr(expr);
  2930. Type *type = type_of_expr(expr);
  2931. GB_ASSERT_MSG(tv.mode != Addressing_Invalid, "invalid expression '%s' (tv.mode = %d, tv.type = %s) @ %s\n Current Proc: %.*s : %s", expr_to_string(expr), tv.mode, type_to_string(tv.type), token_pos_to_string(expr_pos), LIT(p->name), type_to_string(p->type));
  2932. if (tv.value.kind != ExactValue_Invalid) {
  2933. // NOTE(bill): Short on constant values
  2934. return lb_const_value(p->module, type, tv.value);
  2935. } else if (tv.mode == Addressing_Type) {
  2936. // NOTE(bill, 2023-01-16): is this correct? I hope so at least
  2937. return lb_typeid(m, tv.type);
  2938. }
  2939. switch (expr->kind) {
  2940. case_ast_node(bl, BasicLit, expr);
  2941. TokenPos pos = bl->token.pos;
  2942. GB_PANIC("Non-constant basic literal %s - %.*s", token_pos_to_string(pos), LIT(token_strings[bl->token.kind]));
  2943. case_end;
  2944. case_ast_node(bd, BasicDirective, expr);
  2945. TokenPos pos = bd->token.pos;
  2946. GB_PANIC("Non-constant basic literal %s - %.*s", token_pos_to_string(pos), LIT(bd->name.string));
  2947. case_end;
  2948. case_ast_node(i, Implicit, expr);
  2949. return lb_addr_load(p, lb_build_addr(p, expr));
  2950. case_end;
  2951. case_ast_node(u, Uninit, expr)
  2952. lbValue res = {};
  2953. if (is_type_untyped(type)) {
  2954. res.value = nullptr;
  2955. res.type = t_untyped_uninit;
  2956. } else {
  2957. res.value = LLVMGetUndef(lb_type(m, type));
  2958. res.type = type;
  2959. }
  2960. return res;
  2961. case_end;
  2962. case_ast_node(i, Ident, expr);
  2963. Entity *e = entity_from_expr(expr);
  2964. e = strip_entity_wrapping(e);
  2965. GB_ASSERT_MSG(e != nullptr, "%s in %.*s %p", expr_to_string(expr), LIT(p->name), expr);
  2966. if (e->kind == Entity_Builtin) {
  2967. Token token = ast_token(expr);
  2968. GB_PANIC("TODO(bill): lb_build_expr Entity_Builtin '%.*s'\n"
  2969. "\t at %s", LIT(builtin_procs[e->Builtin.id].name),
  2970. token_pos_to_string(token.pos));
  2971. return {};
  2972. } else if (e->kind == Entity_Nil) {
  2973. lbValue res = {};
  2974. res.value = nullptr;
  2975. res.type = e->type;
  2976. return res;
  2977. }
  2978. GB_ASSERT(e->kind != Entity_ProcGroup);
  2979. return lb_find_ident(p, m, e, expr);
  2980. case_end;
  2981. case_ast_node(de, DerefExpr, expr);
  2982. return lb_addr_load(p, lb_build_addr(p, expr));
  2983. case_end;
  2984. case_ast_node(se, SelectorExpr, expr);
  2985. TypeAndValue tav = type_and_value_of_expr(expr);
  2986. GB_ASSERT(tav.mode != Addressing_Invalid);
  2987. return lb_addr_load(p, lb_build_addr(p, expr));
  2988. case_end;
  2989. case_ast_node(ise, ImplicitSelectorExpr, expr);
  2990. TypeAndValue tav = type_and_value_of_expr(expr);
  2991. GB_ASSERT(tav.mode == Addressing_Constant);
  2992. return lb_const_value(p->module, type, tv.value);
  2993. case_end;
  2994. case_ast_node(se, SelectorCallExpr, expr);
  2995. GB_ASSERT(se->modified_call);
  2996. return lb_build_call_expr(p, se->call);
  2997. case_end;
  2998. case_ast_node(te, TernaryIfExpr, expr);
  2999. LLVMValueRef incoming_values[2] = {};
  3000. LLVMBasicBlockRef incoming_blocks[2] = {};
  3001. GB_ASSERT(te->y != nullptr);
  3002. lbBlock *then = lb_create_block(p, "if.then");
  3003. lbBlock *done = lb_create_block(p, "if.done"); // NOTE(bill): Append later
  3004. lbBlock *else_ = lb_create_block(p, "if.else");
  3005. lb_build_cond(p, te->cond, then, else_);
  3006. lb_start_block(p, then);
  3007. Type *type = default_type(type_of_expr(expr));
  3008. LLVMTypeRef llvm_type = lb_type(p->module, type);
  3009. incoming_values[0] = lb_emit_conv(p, lb_build_expr(p, te->x), type).value;
  3010. if (is_type_internally_pointer_like(type)) {
  3011. incoming_values[0] = LLVMBuildBitCast(p->builder, incoming_values[0], llvm_type, "");
  3012. }
  3013. lb_emit_jump(p, done);
  3014. lb_start_block(p, else_);
  3015. incoming_values[1] = lb_emit_conv(p, lb_build_expr(p, te->y), type).value;
  3016. if (is_type_internally_pointer_like(type)) {
  3017. incoming_values[1] = LLVMBuildBitCast(p->builder, incoming_values[1], llvm_type, "");
  3018. }
  3019. lb_emit_jump(p, done);
  3020. lb_start_block(p, done);
  3021. lbValue res = {};
  3022. res.value = LLVMBuildPhi(p->builder, llvm_type, "");
  3023. res.type = type;
  3024. GB_ASSERT(p->curr_block->preds.count >= 2);
  3025. incoming_blocks[0] = p->curr_block->preds[0]->block;
  3026. incoming_blocks[1] = p->curr_block->preds[1]->block;
  3027. LLVMAddIncoming(res.value, incoming_values, incoming_blocks, 2);
  3028. return res;
  3029. case_end;
  3030. case_ast_node(te, TernaryWhenExpr, expr);
  3031. TypeAndValue tav = type_and_value_of_expr(te->cond);
  3032. GB_ASSERT(tav.mode == Addressing_Constant);
  3033. GB_ASSERT(tav.value.kind == ExactValue_Bool);
  3034. if (tav.value.value_bool) {
  3035. return lb_build_expr(p, te->x);
  3036. } else {
  3037. return lb_build_expr(p, te->y);
  3038. }
  3039. case_end;
  3040. case_ast_node(oe, OrElseExpr, expr);
  3041. return lb_emit_or_else(p, oe->x, oe->y, tv);
  3042. case_end;
  3043. case_ast_node(oe, OrReturnExpr, expr);
  3044. return lb_emit_or_return(p, oe->expr, tv);
  3045. case_end;
  3046. case_ast_node(be, OrBranchExpr, expr);
  3047. lbBlock *block = nullptr;
  3048. if (be->label != nullptr) {
  3049. lbBranchBlocks bb = lb_lookup_branch_blocks(p, be->label);
  3050. switch (be->token.kind) {
  3051. case Token_or_break: block = bb.break_; break;
  3052. case Token_or_continue: block = bb.continue_; break;
  3053. }
  3054. } else {
  3055. for (lbTargetList *t = p->target_list; t != nullptr && block == nullptr; t = t->prev) {
  3056. if (t->is_block) {
  3057. continue;
  3058. }
  3059. switch (be->token.kind) {
  3060. case Token_or_break: block = t->break_; break;
  3061. case Token_or_continue: block = t->continue_; break;
  3062. }
  3063. }
  3064. }
  3065. GB_ASSERT(block != nullptr);
  3066. lbValue lhs = {};
  3067. lbValue rhs = {};
  3068. lb_emit_try_lhs_rhs(p, be->expr, tv, &lhs, &rhs);
  3069. Type *type = default_type(tv.type);
  3070. if (lhs.value) {
  3071. lhs = lb_emit_conv(p, lhs, type);
  3072. } else if (type != nullptr && type != t_invalid) {
  3073. lhs = lb_const_nil(p->module, type);
  3074. }
  3075. lbBlock *then = lb_create_block(p, "or_branch.then");
  3076. lbBlock *else_ = lb_create_block(p, "or_branch.else");
  3077. lb_emit_if(p, lb_emit_try_has_value(p, rhs), then, else_);
  3078. lb_start_block(p, else_);
  3079. lb_emit_defer_stmts(p, lbDeferExit_Branch, block);
  3080. lb_emit_jump(p, block);
  3081. lb_start_block(p, then);
  3082. return lhs;
  3083. case_end;
  3084. case_ast_node(ta, TypeAssertion, expr);
  3085. TokenPos pos = ast_token(expr).pos;
  3086. lbValue e = lb_build_expr(p, ta->expr);
  3087. Type *t = type_deref(e.type);
  3088. if (is_type_union(t)) {
  3089. if (ta->ignores[0]) {
  3090. // NOTE(bill): This is not needed for optimization levels other than 0
  3091. return lb_emit_union_cast_only_ok_check(p, e, type, pos);
  3092. }
  3093. return lb_emit_union_cast(p, e, type, pos);
  3094. } else if (is_type_any(t)) {
  3095. return lb_emit_any_cast(p, e, type, pos);
  3096. } else {
  3097. GB_PANIC("TODO(bill): type assertion %s", type_to_string(e.type));
  3098. }
  3099. case_end;
  3100. case_ast_node(tc, TypeCast, expr);
  3101. lbValue e = lb_build_expr(p, tc->expr);
  3102. switch (tc->token.kind) {
  3103. case Token_cast:
  3104. return lb_emit_conv(p, e, type);
  3105. case Token_transmute:
  3106. return lb_emit_transmute(p, e, type);
  3107. }
  3108. GB_PANIC("Invalid AST TypeCast");
  3109. case_end;
  3110. case_ast_node(ac, AutoCast, expr);
  3111. lbValue value = lb_build_expr(p, ac->expr);
  3112. return lb_emit_conv(p, value, type);
  3113. case_end;
  3114. case_ast_node(ue, UnaryExpr, expr);
  3115. switch (ue->op.kind) {
  3116. case Token_And:
  3117. return lb_build_unary_and(p, expr);
  3118. default:
  3119. {
  3120. lbValue v = lb_build_expr(p, ue->expr);
  3121. return lb_emit_unary_arith(p, ue->op.kind, v, type);
  3122. }
  3123. }
  3124. case_end;
  3125. case_ast_node(be, BinaryExpr, expr);
  3126. return lb_build_binary_expr(p, expr);
  3127. case_end;
  3128. case_ast_node(pl, ProcLit, expr);
  3129. return lb_generate_anonymous_proc_lit(p->module, p->name, expr, p);
  3130. case_end;
  3131. case_ast_node(cl, CompoundLit, expr);
  3132. return lb_addr_load(p, lb_build_addr(p, expr));
  3133. case_end;
  3134. case_ast_node(ce, CallExpr, expr);
  3135. return lb_build_call_expr(p, expr);
  3136. case_end;
  3137. case_ast_node(se, SliceExpr, expr);
  3138. if (is_type_slice(type_of_expr(se->expr))) {
  3139. // NOTE(bill): Quick optimization
  3140. if (se->high == nullptr &&
  3141. (se->low == nullptr || lb_is_expr_constant_zero(se->low))) {
  3142. return lb_build_expr(p, se->expr);
  3143. }
  3144. }
  3145. return lb_addr_load(p, lb_build_addr(p, expr));
  3146. case_end;
  3147. case_ast_node(ie, IndexExpr, expr);
  3148. return lb_addr_load(p, lb_build_addr(p, expr));
  3149. case_end;
  3150. case_ast_node(ie, MatrixIndexExpr, expr);
  3151. return lb_addr_load(p, lb_build_addr(p, expr));
  3152. case_end;
  3153. case_ast_node(ia, InlineAsmExpr, expr);
  3154. Type *t = type_of_expr(expr);
  3155. GB_ASSERT(is_type_asm_proc(t));
  3156. String asm_string = {};
  3157. String constraints_string = {};
  3158. TypeAndValue tav;
  3159. tav = type_and_value_of_expr(ia->asm_string);
  3160. GB_ASSERT(is_type_string(tav.type));
  3161. GB_ASSERT(tav.value.kind == ExactValue_String);
  3162. asm_string = tav.value.value_string;
  3163. tav = type_and_value_of_expr(ia->constraints_string);
  3164. GB_ASSERT(is_type_string(tav.type));
  3165. GB_ASSERT(tav.value.kind == ExactValue_String);
  3166. constraints_string = tav.value.value_string;
  3167. LLVMInlineAsmDialect dialect = LLVMInlineAsmDialectATT;
  3168. switch (ia->dialect) {
  3169. case InlineAsmDialect_Default: dialect = LLVMInlineAsmDialectATT; break;
  3170. case InlineAsmDialect_ATT: dialect = LLVMInlineAsmDialectATT; break;
  3171. case InlineAsmDialect_Intel: dialect = LLVMInlineAsmDialectIntel; break;
  3172. default: GB_PANIC("Unhandled inline asm dialect"); break;
  3173. }
  3174. LLVMTypeRef func_type = lb_type_internal_for_procedures_raw(p->module, t);
  3175. LLVMValueRef the_asm = llvm_get_inline_asm(func_type, asm_string, constraints_string, ia->has_side_effects, ia->has_side_effects, dialect);
  3176. GB_ASSERT(the_asm != nullptr);
  3177. return {the_asm, t};
  3178. case_end;
  3179. }
  3180. GB_PANIC("lb_build_expr: %.*s", LIT(ast_strings[expr->kind]));
  3181. return {};
  3182. }
  3183. gb_internal lbAddr lb_get_soa_variable_addr(lbProcedure *p, Entity *e) {
  3184. return map_must_get(&p->module->soa_values, e);
  3185. }
  3186. gb_internal lbValue lb_get_using_variable(lbProcedure *p, Entity *e) {
  3187. GB_ASSERT(e->kind == Entity_Variable && e->flags & EntityFlag_Using);
  3188. String name = e->token.string;
  3189. Entity *parent = e->using_parent;
  3190. Selection sel = lookup_field(parent->type, name, false);
  3191. GB_ASSERT(sel.entity != nullptr);
  3192. lbValue *pv = map_get(&p->module->values, parent);
  3193. lbValue v = {};
  3194. bool is_soa = false;
  3195. if (pv == nullptr && parent->flags & EntityFlag_SoaPtrField) {
  3196. is_soa = true;
  3197. // NOTE(bill): using SOA value (probably from for-in statement)
  3198. lbAddr parent_addr = lb_get_soa_variable_addr(p, parent);
  3199. v = lb_addr_get_ptr(p, parent_addr);
  3200. } else if (pv != nullptr) {
  3201. v = *pv;
  3202. } else {
  3203. GB_ASSERT_MSG(e->using_expr != nullptr, "%.*s", LIT(name));
  3204. v = lb_build_addr_ptr(p, e->using_expr);
  3205. }
  3206. GB_ASSERT(v.value != nullptr);
  3207. GB_ASSERT_MSG(is_soa || parent->type == type_deref(v.type), "%s %s", type_to_string(parent->type), type_to_string(v.type));
  3208. lbValue ptr = lb_emit_deep_field_gep(p, v, sel);
  3209. if (parent->scope) {
  3210. if ((parent->scope->flags & (ScopeFlag_File|ScopeFlag_Pkg)) == 0) {
  3211. lb_add_debug_local_variable(p, ptr.value, e->type, e->token);
  3212. }
  3213. } else {
  3214. lb_add_debug_local_variable(p, ptr.value, e->type, e->token);
  3215. }
  3216. return ptr;
  3217. }
  3218. gb_internal lbAddr lb_build_addr_from_entity(lbProcedure *p, Entity *e, Ast *expr) {
  3219. GB_ASSERT(e != nullptr);
  3220. if (e->kind == Entity_Constant) {
  3221. Type *t = default_type(type_of_expr(expr));
  3222. lbValue v = lb_const_value(p->module, t, e->Constant.value);
  3223. if (LLVMIsConstant(v.value)) {
  3224. lbAddr g = lb_add_global_generated(p->module, t, v);
  3225. return g;
  3226. }
  3227. GB_ASSERT(LLVMIsALoadInst(v.value));
  3228. lbValue ptr = {};
  3229. ptr.value = LLVMGetOperand(v.value, 0);
  3230. ptr.type = alloc_type_pointer(t);
  3231. return lb_addr(ptr);
  3232. }
  3233. lbValue v = {};
  3234. lbValue *found = map_get(&p->module->values, e);
  3235. if (found) {
  3236. v = *found;
  3237. } else if (e->kind == Entity_Variable && e->flags & EntityFlag_Using) {
  3238. // NOTE(bill): Calculate the using variable every time
  3239. v = lb_get_using_variable(p, e);
  3240. } else if (e->flags & EntityFlag_SoaPtrField) {
  3241. return lb_get_soa_variable_addr(p, e);
  3242. }
  3243. if (v.value == nullptr) {
  3244. return lb_addr(lb_find_value_from_entity(p->module, e));
  3245. // error(expr, "%.*s Unknown value: %.*s, entity: %p %.*s",
  3246. // LIT(p->name),
  3247. // LIT(e->token.string), e, LIT(entity_strings[e->kind]));
  3248. // GB_PANIC("Unknown value");
  3249. }
  3250. return lb_addr(v);
  3251. }
  3252. gb_internal lbAddr lb_build_array_swizzle_addr(lbProcedure *p, AstCallExpr *ce, TypeAndValue const &tv) {
  3253. isize index_count = ce->args.count-1;
  3254. lbAddr addr = lb_build_addr(p, ce->args[0]);
  3255. if (index_count == 0) {
  3256. return addr;
  3257. }
  3258. Type *type = base_type(lb_addr_type(addr));
  3259. GB_ASSERT(type->kind == Type_Array);
  3260. i64 count = type->Array.count;
  3261. if (count <= 4 && index_count <= 4) {
  3262. u8 indices[4] = {};
  3263. u8 index_count = 0;
  3264. for (i32 i = 1; i < ce->args.count; i++) {
  3265. TypeAndValue tv = type_and_value_of_expr(ce->args[i]);
  3266. GB_ASSERT(is_type_integer(tv.type));
  3267. GB_ASSERT(tv.value.kind == ExactValue_Integer);
  3268. i64 src_index = big_int_to_i64(&tv.value.value_integer);
  3269. indices[index_count++] = cast(u8)src_index;
  3270. }
  3271. return lb_addr_swizzle(lb_addr_get_ptr(p, addr), tv.type, index_count, indices);
  3272. }
  3273. auto indices = slice_make<i32>(permanent_allocator(), ce->args.count-1);
  3274. isize index_index = 0;
  3275. for (i32 i = 1; i < ce->args.count; i++) {
  3276. TypeAndValue tv = type_and_value_of_expr(ce->args[i]);
  3277. GB_ASSERT(is_type_integer(tv.type));
  3278. GB_ASSERT(tv.value.kind == ExactValue_Integer);
  3279. i64 src_index = big_int_to_i64(&tv.value.value_integer);
  3280. indices[index_index++] = cast(i32)src_index;
  3281. }
  3282. return lb_addr_swizzle_large(lb_addr_get_ptr(p, addr), tv.type, indices);
  3283. }
  3284. gb_internal lbAddr lb_build_addr_internal(lbProcedure *p, Ast *expr);
  3285. gb_internal lbAddr lb_build_addr(lbProcedure *p, Ast *expr) {
  3286. expr = unparen_expr(expr);
  3287. // IMPORTANT NOTE(bill):
  3288. // Selector Call Expressions (foo->bar(...))
  3289. // must only evaluate `foo` once as it gets transformed into
  3290. // `foo.bar(foo, ...)`
  3291. // And if `foo` is a procedure call or something more complex, storing the value
  3292. // once is a very good idea
  3293. // If a stored value is found, it must be removed from the cache
  3294. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  3295. lbAddr *pp = map_get(&p->selector_addr, expr);
  3296. if (pp != nullptr) {
  3297. lbAddr res = *pp;
  3298. map_remove(&p->selector_addr, expr);
  3299. return res;
  3300. }
  3301. }
  3302. lbAddr addr = lb_build_addr_internal(p, expr);
  3303. if (expr->state_flags & StateFlag_SelectorCallExpr) {
  3304. map_set(&p->selector_addr, expr, addr);
  3305. }
  3306. return addr;
  3307. }
  3308. gb_internal void lb_build_addr_compound_lit_populate(lbProcedure *p, Slice<Ast *> const &elems, Array<lbCompoundLitElemTempData> *temp_data, Type *compound_type) {
  3309. Type *bt = base_type(compound_type);
  3310. Type *et = nullptr;
  3311. switch (bt->kind) {
  3312. case Type_Array: et = bt->Array.elem; break;
  3313. case Type_EnumeratedArray: et = bt->EnumeratedArray.elem; break;
  3314. case Type_Slice: et = bt->Slice.elem; break;
  3315. case Type_BitSet: et = bt->BitSet.elem; break;
  3316. case Type_DynamicArray: et = bt->DynamicArray.elem; break;
  3317. case Type_SimdVector: et = bt->SimdVector.elem; break;
  3318. case Type_Matrix: et = bt->Matrix.elem; break;
  3319. }
  3320. GB_ASSERT(et != nullptr);
  3321. // NOTE(bill): Separate value, gep, store into their own chunks
  3322. for_array(i, elems) {
  3323. Ast *elem = elems[i];
  3324. if (elem->kind == Ast_FieldValue) {
  3325. ast_node(fv, FieldValue, elem);
  3326. if (bt->kind != Type_DynamicArray && lb_is_elem_const(fv->value, et)) {
  3327. continue;
  3328. }
  3329. if (is_ast_range(fv->field)) {
  3330. ast_node(ie, BinaryExpr, fv->field);
  3331. TypeAndValue lo_tav = ie->left->tav;
  3332. TypeAndValue hi_tav = ie->right->tav;
  3333. GB_ASSERT(lo_tav.mode == Addressing_Constant);
  3334. GB_ASSERT(hi_tav.mode == Addressing_Constant);
  3335. TokenKind op = ie->op.kind;
  3336. i64 lo = exact_value_to_i64(lo_tav.value);
  3337. i64 hi = exact_value_to_i64(hi_tav.value);
  3338. if (op != Token_RangeHalf) {
  3339. hi += 1;
  3340. }
  3341. lbValue value = lb_emit_conv(p, lb_build_expr(p, fv->value), et);
  3342. GB_ASSERT((hi-lo) > 0);
  3343. if (bt->kind == Type_Matrix) {
  3344. for (i64 k = lo; k < hi; k++) {
  3345. lbCompoundLitElemTempData data = {};
  3346. data.value = value;
  3347. data.elem_index = matrix_row_major_index_to_offset(bt, k);
  3348. array_add(temp_data, data);
  3349. }
  3350. } else {
  3351. enum {MAX_ELEMENT_AMOUNT = 32};
  3352. if ((hi-lo) <= MAX_ELEMENT_AMOUNT) {
  3353. for (i64 k = lo; k < hi; k++) {
  3354. lbCompoundLitElemTempData data = {};
  3355. data.value = value;
  3356. data.elem_index = k;
  3357. array_add(temp_data, data);
  3358. }
  3359. } else {
  3360. lbCompoundLitElemTempData data = {};
  3361. data.value = value;
  3362. data.elem_index = lo;
  3363. data.elem_length = hi-lo;
  3364. array_add(temp_data, data);
  3365. }
  3366. }
  3367. } else {
  3368. auto tav = fv->field->tav;
  3369. GB_ASSERT(tav.mode == Addressing_Constant);
  3370. i64 index = exact_value_to_i64(tav.value);
  3371. lbValue value = lb_emit_conv(p, lb_build_expr(p, fv->value), et);
  3372. GB_ASSERT(!is_type_tuple(value.type));
  3373. lbCompoundLitElemTempData data = {};
  3374. data.value = value;
  3375. data.expr = fv->value;
  3376. if (bt->kind == Type_Matrix) {
  3377. data.elem_index = matrix_row_major_index_to_offset(bt, index);
  3378. } else {
  3379. data.elem_index = index;
  3380. }
  3381. array_add(temp_data, data);
  3382. }
  3383. } else {
  3384. if (bt->kind != Type_DynamicArray && lb_is_elem_const(elem, et)) {
  3385. continue;
  3386. }
  3387. lbValue field_expr = lb_build_expr(p, elem);
  3388. GB_ASSERT(!is_type_tuple(field_expr.type));
  3389. lbValue ev = lb_emit_conv(p, field_expr, et);
  3390. lbCompoundLitElemTempData data = {};
  3391. data.value = ev;
  3392. if (bt->kind == Type_Matrix) {
  3393. data.elem_index = matrix_row_major_index_to_offset(bt, i);
  3394. } else {
  3395. data.elem_index = i;
  3396. }
  3397. array_add(temp_data, data);
  3398. }
  3399. }
  3400. }
  3401. gb_internal void lb_build_addr_compound_lit_assign_array(lbProcedure *p, Array<lbCompoundLitElemTempData> const &temp_data) {
  3402. for (auto const &td : temp_data) {
  3403. if (td.value.value != nullptr) {
  3404. if (td.elem_length > 0) {
  3405. auto loop_data = lb_loop_start(p, cast(isize)td.elem_length, t_i32);
  3406. {
  3407. lbValue dst = td.gep;
  3408. dst = lb_emit_ptr_offset(p, dst, loop_data.idx);
  3409. lb_emit_store(p, dst, td.value);
  3410. }
  3411. lb_loop_end(p, loop_data);
  3412. } else {
  3413. lb_emit_store(p, td.gep, td.value);
  3414. }
  3415. }
  3416. }
  3417. }
  3418. gb_internal lbAddr lb_build_addr_index_expr(lbProcedure *p, Ast *expr) {
  3419. ast_node(ie, IndexExpr, expr);
  3420. Type *t = base_type(type_of_expr(ie->expr));
  3421. bool deref = is_type_pointer(t);
  3422. t = base_type(type_deref(t));
  3423. if (is_type_soa_struct(t)) {
  3424. // SOA STRUCTURES!!!!
  3425. lbValue val = lb_build_addr_ptr(p, ie->expr);
  3426. if (deref) {
  3427. val = lb_emit_load(p, val);
  3428. }
  3429. lbValue index = lb_build_expr(p, ie->index);
  3430. return lb_addr_soa_variable(val, index, ie->index);
  3431. }
  3432. if (ie->expr->tav.mode == Addressing_SoaVariable) {
  3433. // SOA Structures for slices/dynamic arrays
  3434. GB_ASSERT_MSG(is_type_multi_pointer(type_of_expr(ie->expr)), "%s", type_to_string(type_of_expr(ie->expr)));
  3435. lbValue field = lb_build_expr(p, ie->expr);
  3436. lbValue index = lb_build_expr(p, ie->index);
  3437. if (!build_context.no_bounds_check) {
  3438. Ast *se_expr = unparen_expr(ie->expr);
  3439. if (se_expr->kind == Ast_SelectorExpr) {
  3440. ast_node(se, SelectorExpr, se_expr);
  3441. lbValue len = {};
  3442. Type *type = base_type(type_deref(type_of_expr(se->expr)));
  3443. GB_ASSERT_MSG(is_type_soa_struct(type), "%s", type_to_string(type));
  3444. if (type->Struct.soa_kind == StructSoa_Fixed) {
  3445. len = lb_const_int(p->module, t_int, type->Struct.soa_count);
  3446. } else {
  3447. lbAddr *found = map_get(&p->selector_addr, se_expr);
  3448. if (found) {
  3449. lbAddr addr = *found;
  3450. lbValue parent = lb_addr_get_ptr(p, addr);
  3451. if (is_type_pointer(type_deref(parent.type))) {
  3452. parent = lb_emit_load(p, parent);
  3453. }
  3454. len = lb_soa_struct_len(p, parent);
  3455. }
  3456. }
  3457. if (len.value) {
  3458. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3459. }
  3460. } else {
  3461. // TODO(bill): how do you even do bounds checking here?
  3462. }
  3463. }
  3464. lbValue val = lb_emit_ptr_offset(p, field, index);
  3465. return lb_addr(val);
  3466. }
  3467. GB_ASSERT_MSG(is_type_indexable(t), "%s %s", type_to_string(t), expr_to_string(expr));
  3468. if (is_type_map(t)) {
  3469. lbAddr map_addr = lb_build_addr(p, ie->expr);
  3470. lbValue key = lb_build_expr(p, ie->index);
  3471. key = lb_emit_conv(p, key, t->Map.key);
  3472. Type *result_type = type_of_expr(expr);
  3473. lbValue map_ptr = lb_addr_get_ptr(p, map_addr);
  3474. if (is_type_pointer(type_deref(map_ptr.type))) {
  3475. map_ptr = lb_emit_load(p, map_ptr);
  3476. }
  3477. return lb_addr_map(map_ptr, key, t, result_type);
  3478. }
  3479. switch (t->kind) {
  3480. case Type_Array: {
  3481. lbValue array = {};
  3482. array = lb_build_addr_ptr(p, ie->expr);
  3483. if (deref) {
  3484. array = lb_emit_load(p, array);
  3485. }
  3486. lbValue index = lb_build_expr(p, ie->index);
  3487. index = lb_emit_conv(p, index, t_int);
  3488. lbValue elem = lb_emit_array_ep(p, array, index);
  3489. auto index_tv = type_and_value_of_expr(ie->index);
  3490. if (index_tv.mode != Addressing_Constant) {
  3491. lbValue len = lb_const_int(p->module, t_int, t->Array.count);
  3492. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3493. }
  3494. return lb_addr(elem);
  3495. }
  3496. case Type_EnumeratedArray: {
  3497. lbValue array = {};
  3498. array = lb_build_addr_ptr(p, ie->expr);
  3499. if (deref) {
  3500. array = lb_emit_load(p, array);
  3501. }
  3502. Type *index_type = t->EnumeratedArray.index;
  3503. auto index_tv = type_and_value_of_expr(ie->index);
  3504. lbValue index = {};
  3505. if (compare_exact_values(Token_NotEq, *t->EnumeratedArray.min_value, exact_value_i64(0))) {
  3506. if (index_tv.mode == Addressing_Constant) {
  3507. ExactValue idx = exact_value_sub(index_tv.value, *t->EnumeratedArray.min_value);
  3508. index = lb_const_value(p->module, index_type, idx);
  3509. } else {
  3510. index = lb_emit_arith(p, Token_Sub,
  3511. lb_build_expr(p, ie->index),
  3512. lb_const_value(p->module, index_type, *t->EnumeratedArray.min_value),
  3513. index_type);
  3514. index = lb_emit_conv(p, index, t_int);
  3515. }
  3516. } else {
  3517. index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3518. }
  3519. lbValue elem = lb_emit_array_ep(p, array, index);
  3520. if (index_tv.mode != Addressing_Constant) {
  3521. lbValue len = lb_const_int(p->module, t_int, t->EnumeratedArray.count);
  3522. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3523. }
  3524. return lb_addr(elem);
  3525. }
  3526. case Type_Slice: {
  3527. lbValue slice = {};
  3528. slice = lb_build_expr(p, ie->expr);
  3529. if (deref) {
  3530. slice = lb_emit_load(p, slice);
  3531. }
  3532. lbValue elem = lb_slice_elem(p, slice);
  3533. lbValue index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3534. lbValue len = lb_slice_len(p, slice);
  3535. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3536. lbValue v = lb_emit_ptr_offset(p, elem, index);
  3537. return lb_addr(v);
  3538. }
  3539. case Type_MultiPointer: {
  3540. lbValue multi_ptr = {};
  3541. multi_ptr = lb_build_expr(p, ie->expr);
  3542. if (deref) {
  3543. multi_ptr = lb_emit_load(p, multi_ptr);
  3544. }
  3545. lbValue index = lb_build_expr(p, ie->index);
  3546. index = lb_emit_conv(p, index, t_int);
  3547. lbValue v = {};
  3548. LLVMValueRef indices[1] = {index.value};
  3549. v.value = LLVMBuildGEP2(p->builder, lb_type(p->module, t->MultiPointer.elem), multi_ptr.value, indices, 1, "");
  3550. v.type = alloc_type_pointer(t->MultiPointer.elem);
  3551. return lb_addr(v);
  3552. }
  3553. case Type_RelativeMultiPointer: {
  3554. lbAddr rel_ptr_addr = {};
  3555. if (deref) {
  3556. lbValue rel_ptr_ptr = lb_build_expr(p, ie->expr);
  3557. rel_ptr_addr = lb_addr(rel_ptr_ptr);
  3558. } else {
  3559. rel_ptr_addr = lb_build_addr(p, ie->expr);
  3560. }
  3561. lbValue rel_ptr = lb_relative_pointer_to_pointer(p, rel_ptr_addr);
  3562. lbValue index = lb_build_expr(p, ie->index);
  3563. index = lb_emit_conv(p, index, t_int);
  3564. lbValue v = {};
  3565. Type *pointer_type = base_type(t->RelativeMultiPointer.pointer_type);
  3566. GB_ASSERT(pointer_type->kind == Type_MultiPointer);
  3567. Type *elem = pointer_type->MultiPointer.elem;
  3568. LLVMValueRef indices[1] = {index.value};
  3569. v.value = LLVMBuildGEP2(p->builder, lb_type(p->module, elem), rel_ptr.value, indices, 1, "");
  3570. v.type = alloc_type_pointer(elem);
  3571. return lb_addr(v);
  3572. }
  3573. case Type_DynamicArray: {
  3574. lbValue dynamic_array = {};
  3575. dynamic_array = lb_build_expr(p, ie->expr);
  3576. if (deref) {
  3577. dynamic_array = lb_emit_load(p, dynamic_array);
  3578. }
  3579. lbValue elem = lb_dynamic_array_elem(p, dynamic_array);
  3580. lbValue len = lb_dynamic_array_len(p, dynamic_array);
  3581. lbValue index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3582. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3583. lbValue v = lb_emit_ptr_offset(p, elem, index);
  3584. return lb_addr(v);
  3585. }
  3586. case Type_Matrix: {
  3587. lbValue matrix = {};
  3588. matrix = lb_build_addr_ptr(p, ie->expr);
  3589. if (deref) {
  3590. matrix = lb_emit_load(p, matrix);
  3591. }
  3592. lbValue index = lb_build_expr(p, ie->index);
  3593. index = lb_emit_conv(p, index, t_int);
  3594. isize bounds_len = 0;
  3595. lbValue elem = {};
  3596. if (t->Matrix.is_row_major) {
  3597. bounds_len = t->Matrix.row_count;
  3598. elem = lb_emit_matrix_ep(p, matrix, index, lb_const_int(p->module, t_int, 0));
  3599. } else {
  3600. bounds_len = t->Matrix.column_count;
  3601. elem = lb_emit_matrix_ep(p, matrix, lb_const_int(p->module, t_int, 0), index);
  3602. }
  3603. elem = lb_emit_conv(p, elem, alloc_type_pointer(type_of_expr(expr)));
  3604. auto index_tv = type_and_value_of_expr(ie->index);
  3605. if (index_tv.mode != Addressing_Constant) {
  3606. lbValue len = lb_const_int(p->module, t_int, bounds_len);
  3607. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3608. }
  3609. return lb_addr(elem);
  3610. }
  3611. case Type_Basic: { // Basic_string
  3612. lbValue str;
  3613. lbValue elem;
  3614. lbValue len;
  3615. lbValue index;
  3616. str = lb_build_expr(p, ie->expr);
  3617. if (deref) {
  3618. str = lb_emit_load(p, str);
  3619. }
  3620. elem = lb_string_elem(p, str);
  3621. len = lb_string_len(p, str);
  3622. index = lb_emit_conv(p, lb_build_expr(p, ie->index), t_int);
  3623. lb_emit_bounds_check(p, ast_token(ie->index), index, len);
  3624. return lb_addr(lb_emit_ptr_offset(p, elem, index));
  3625. }
  3626. }
  3627. return {};
  3628. }
  3629. gb_internal lbAddr lb_build_addr_slice_expr(lbProcedure *p, Ast *expr) {
  3630. ast_node(se, SliceExpr, expr);
  3631. lbValue low = lb_const_int(p->module, t_int, 0);
  3632. lbValue high = {};
  3633. if (se->low != nullptr) {
  3634. low = lb_correct_endianness(p, lb_build_expr(p, se->low));
  3635. }
  3636. if (se->high != nullptr) {
  3637. high = lb_correct_endianness(p, lb_build_expr(p, se->high));
  3638. }
  3639. bool no_indices = se->low == nullptr && se->high == nullptr;
  3640. lbAddr addr = lb_build_addr(p, se->expr);
  3641. lbValue base = lb_addr_load(p, addr);
  3642. Type *type = base_type(base.type);
  3643. if (is_type_pointer(type)) {
  3644. type = base_type(type_deref(type));
  3645. addr = lb_addr(base);
  3646. base = lb_addr_load(p, addr);
  3647. }
  3648. switch (type->kind) {
  3649. case Type_Slice: {
  3650. Type *slice_type = type;
  3651. lbValue len = lb_slice_len(p, base);
  3652. if (high.value == nullptr) high = len;
  3653. if (!no_indices) {
  3654. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3655. }
  3656. lbValue elem = lb_emit_ptr_offset(p, lb_slice_elem(p, base), low);
  3657. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3658. lbAddr slice = lb_add_local_generated(p, slice_type, false);
  3659. lb_fill_slice(p, slice, elem, new_len);
  3660. return slice;
  3661. }
  3662. case Type_RelativePointer:
  3663. GB_PANIC("TODO(bill): Type_RelativePointer should be handled above already on the lb_addr_load");
  3664. break;
  3665. case Type_RelativeMultiPointer:
  3666. GB_PANIC("TODO(bill): Type_RelativeMultiPointer should be handled above already on the lb_addr_load");
  3667. break;
  3668. case Type_DynamicArray: {
  3669. Type *elem_type = type->DynamicArray.elem;
  3670. Type *slice_type = alloc_type_slice(elem_type);
  3671. lbValue len = lb_dynamic_array_len(p, base);
  3672. if (high.value == nullptr) high = len;
  3673. if (!no_indices) {
  3674. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3675. }
  3676. lbValue elem = lb_emit_ptr_offset(p, lb_dynamic_array_elem(p, base), low);
  3677. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3678. lbAddr slice = lb_add_local_generated(p, slice_type, false);
  3679. lb_fill_slice(p, slice, elem, new_len);
  3680. return slice;
  3681. }
  3682. case Type_MultiPointer: {
  3683. lbAddr res = lb_add_local_generated(p, type_of_expr(expr), false);
  3684. if (se->high == nullptr) {
  3685. lbValue offset = base;
  3686. LLVMValueRef indices[1] = {low.value};
  3687. offset.value = LLVMBuildGEP2(p->builder, lb_type(p->module, base_type(offset.type)->MultiPointer.elem), offset.value, indices, 1, "");
  3688. lb_addr_store(p, res, offset);
  3689. } else {
  3690. low = lb_emit_conv(p, low, t_int);
  3691. high = lb_emit_conv(p, high, t_int);
  3692. lb_emit_multi_pointer_slice_bounds_check(p, se->open, low, high);
  3693. LLVMValueRef indices[1] = {low.value};
  3694. LLVMValueRef ptr = LLVMBuildGEP2(p->builder, lb_type(p->module, base_type(base.type)->MultiPointer.elem), base.value, indices, 1, "");
  3695. LLVMValueRef len = LLVMBuildSub(p->builder, high.value, low.value, "");
  3696. LLVMValueRef gep0 = lb_emit_struct_ep(p, res.addr, 0).value;
  3697. LLVMValueRef gep1 = lb_emit_struct_ep(p, res.addr, 1).value;
  3698. LLVMBuildStore(p->builder, ptr, gep0);
  3699. LLVMBuildStore(p->builder, len, gep1);
  3700. }
  3701. return res;
  3702. }
  3703. case Type_Array: {
  3704. Type *slice_type = alloc_type_slice(type->Array.elem);
  3705. lbValue len = lb_const_int(p->module, t_int, type->Array.count);
  3706. if (high.value == nullptr) high = len;
  3707. bool low_const = type_and_value_of_expr(se->low).mode == Addressing_Constant;
  3708. bool high_const = type_and_value_of_expr(se->high).mode == Addressing_Constant;
  3709. if (!low_const || !high_const) {
  3710. if (!no_indices) {
  3711. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3712. }
  3713. }
  3714. lbValue elem = lb_emit_ptr_offset(p, lb_array_elem(p, lb_addr_get_ptr(p, addr)), low);
  3715. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3716. lbAddr slice = lb_add_local_generated(p, slice_type, false);
  3717. lb_fill_slice(p, slice, elem, new_len);
  3718. return slice;
  3719. }
  3720. case Type_Basic: {
  3721. GB_ASSERT_MSG(are_types_identical(type, t_string), "got %s", type_to_string(type));
  3722. lbValue len = lb_string_len(p, base);
  3723. if (high.value == nullptr) high = len;
  3724. if (!no_indices) {
  3725. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3726. }
  3727. lbValue elem = lb_emit_ptr_offset(p, lb_string_elem(p, base), low);
  3728. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3729. lbAddr str = lb_add_local_generated(p, t_string, false);
  3730. lb_fill_string(p, str, elem, new_len);
  3731. return str;
  3732. }
  3733. case Type_Struct:
  3734. if (is_type_soa_struct(type)) {
  3735. lbValue len = lb_soa_struct_len(p, lb_addr_get_ptr(p, addr));
  3736. if (high.value == nullptr) high = len;
  3737. if (!no_indices) {
  3738. lb_emit_slice_bounds_check(p, se->open, low, high, len, se->low != nullptr);
  3739. }
  3740. #if 1
  3741. lbAddr dst = lb_add_local_generated(p, type_of_expr(expr), true);
  3742. if (type->Struct.soa_kind == StructSoa_Fixed) {
  3743. i32 field_count = cast(i32)type->Struct.fields.count;
  3744. for (i32 i = 0; i < field_count; i++) {
  3745. lbValue field_dst = lb_emit_struct_ep(p, dst.addr, i);
  3746. lbValue field_src = lb_emit_struct_ep(p, lb_addr_get_ptr(p, addr), i);
  3747. field_src = lb_emit_array_ep(p, field_src, low);
  3748. field_src = lb_emit_conv(p, field_src, type_deref(field_dst.type));
  3749. lb_emit_store(p, field_dst, field_src);
  3750. }
  3751. lbValue len_dst = lb_emit_struct_ep(p, dst.addr, field_count);
  3752. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3753. lb_emit_store(p, len_dst, new_len);
  3754. } else if (type->Struct.soa_kind == StructSoa_Slice) {
  3755. if (no_indices) {
  3756. lb_addr_store(p, dst, base);
  3757. } else {
  3758. i32 field_count = cast(i32)type->Struct.fields.count - 1;
  3759. for (i32 i = 0; i < field_count; i++) {
  3760. lbValue field_dst = lb_emit_struct_ep(p, dst.addr, i);
  3761. lbValue field_src = lb_emit_struct_ev(p, base, i);
  3762. field_src = lb_emit_ptr_offset(p, field_src, low);
  3763. field_src = lb_emit_conv(p, field_src, type_deref(field_dst.type));
  3764. lb_emit_store(p, field_dst, field_src);
  3765. }
  3766. lbValue len_dst = lb_emit_struct_ep(p, dst.addr, field_count);
  3767. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3768. lb_emit_store(p, len_dst, new_len);
  3769. }
  3770. } else if (type->Struct.soa_kind == StructSoa_Dynamic) {
  3771. i32 field_count = cast(i32)type->Struct.fields.count - 3;
  3772. for (i32 i = 0; i < field_count; i++) {
  3773. lbValue field_dst = lb_emit_struct_ep(p, dst.addr, i);
  3774. lbValue field_src = lb_emit_struct_ev(p, base, i);
  3775. field_src = lb_emit_ptr_offset(p, field_src, low);
  3776. field_src = lb_emit_conv(p, field_src, type_deref(field_dst.type));
  3777. lb_emit_store(p, field_dst, field_src);
  3778. }
  3779. lbValue len_dst = lb_emit_struct_ep(p, dst.addr, field_count);
  3780. lbValue new_len = lb_emit_arith(p, Token_Sub, high, low, t_int);
  3781. lb_emit_store(p, len_dst, new_len);
  3782. }
  3783. return dst;
  3784. #endif
  3785. }
  3786. break;
  3787. }
  3788. GB_PANIC("Unknown slicable type");
  3789. return {};
  3790. }
  3791. gb_internal lbAddr lb_build_addr_compound_lit(lbProcedure *p, Ast *expr) {
  3792. ast_node(cl, CompoundLit, expr);
  3793. Type *type = type_of_expr(expr);
  3794. Type *bt = base_type(type);
  3795. lbAddr v = lb_add_local_generated(p, type, true);
  3796. TEMPORARY_ALLOCATOR_GUARD();
  3797. Type *et = nullptr;
  3798. switch (bt->kind) {
  3799. case Type_Array: et = bt->Array.elem; break;
  3800. case Type_EnumeratedArray: et = bt->EnumeratedArray.elem; break;
  3801. case Type_Slice: et = bt->Slice.elem; break;
  3802. case Type_BitSet: et = bt->BitSet.elem; break;
  3803. case Type_SimdVector: et = bt->SimdVector.elem; break;
  3804. case Type_Matrix: et = bt->Matrix.elem; break;
  3805. }
  3806. String proc_name = {};
  3807. if (p->entity) {
  3808. proc_name = p->entity->token.string;
  3809. }
  3810. TokenPos pos = ast_token(expr).pos;
  3811. switch (bt->kind) {
  3812. default: GB_PANIC("Unknown CompoundLit type: %s", type_to_string(type)); break;
  3813. case Type_BitField: {
  3814. TEMPORARY_ALLOCATOR_GUARD();
  3815. // Type *backing_type = core_type(bt->BitField.backing_type);
  3816. struct FieldData {
  3817. Type *field_type;
  3818. u64 bit_offset;
  3819. u64 bit_size;
  3820. };
  3821. auto values = array_make<lbValue>(temporary_allocator(), 0, cl->elems.count);
  3822. auto fields = array_make<FieldData>(temporary_allocator(), 0, cl->elems.count);
  3823. for (Ast *elem : cl->elems) {
  3824. ast_node(fv, FieldValue, elem);
  3825. String name = fv->field->Ident.token.string;
  3826. Selection sel = lookup_field(bt, name, false);
  3827. GB_ASSERT(sel.is_bit_field);
  3828. GB_ASSERT(!sel.indirect);
  3829. GB_ASSERT(sel.index.count == 1);
  3830. GB_ASSERT(sel.entity != nullptr);
  3831. i64 index = sel.index[0];
  3832. Entity *f = bt->BitField.fields[index];
  3833. GB_ASSERT(f == sel.entity);
  3834. i64 bit_offset = bt->BitField.bit_offsets[index];
  3835. i64 bit_size = bt->BitField.bit_sizes[index];
  3836. GB_ASSERT(bit_size > 0);
  3837. Type *field_type = sel.entity->type;
  3838. lbValue field_expr = lb_build_expr(p, fv->value);
  3839. field_expr = lb_emit_conv(p, field_expr, field_type);
  3840. array_add(&values, field_expr);
  3841. array_add(&fields, FieldData{field_type, cast(u64)bit_offset, cast(u64)bit_size});
  3842. }
  3843. // NOTE(bill): inline insertion sort should be good enough, right?
  3844. for (isize i = 1; i < values.count; i++) {
  3845. for (isize j = i;
  3846. j > 0 && fields[i].bit_offset < fields[j].bit_offset;
  3847. j--) {
  3848. auto vtmp = values[j];
  3849. values[j] = values[j-1];
  3850. values[j-1] = vtmp;
  3851. auto ftmp = fields[j];
  3852. fields[j] = fields[j-1];
  3853. fields[j-1] = ftmp;
  3854. }
  3855. }
  3856. bool any_fields_different_endian = false;
  3857. for (auto const &f : fields) {
  3858. if (is_type_different_to_arch_endianness(f.field_type)) {
  3859. // NOTE(bill): Just be slow for this, to be correct
  3860. any_fields_different_endian = true;
  3861. break;
  3862. }
  3863. }
  3864. if (!any_fields_different_endian &&
  3865. fields.count == bt->BitField.fields.count) {
  3866. // SINGLE INTEGER BACKING ONLY
  3867. Type *backing_type = core_type(bt->BitField.backing_type);
  3868. GB_ASSERT(is_type_integer(backing_type) ||
  3869. (is_type_array(backing_type) && is_type_integer(backing_type->Array.elem)));
  3870. // NOTE(bill): all fields are present
  3871. // this means no masking is necessary since on write, the bits will be overridden
  3872. lbValue dst_byte_ptr = lb_emit_conv(p, v.addr, t_u8_ptr);
  3873. u64 total_bit_size = cast(u64)(8*type_size_of(bt));
  3874. if (is_type_integer(backing_type)) {
  3875. LLVMTypeRef lit = lb_type(p->module, backing_type);
  3876. LLVMValueRef res = LLVMConstInt(lit, 0, false);
  3877. for (isize i = 0; i < fields.count; i++) {
  3878. auto const &f = fields[i];
  3879. LLVMValueRef mask = LLVMConstInt(lit, 1, false);
  3880. mask = LLVMConstShl(mask, LLVMConstInt(lit, f.bit_size, false));
  3881. mask = LLVMConstSub(mask, LLVMConstInt(lit, 1, false));
  3882. LLVMValueRef elem = values[i].value;
  3883. if (lb_sizeof(lit) < lb_sizeof(LLVMTypeOf(elem))) {
  3884. elem = LLVMBuildTrunc(p->builder, elem, lit, "");
  3885. } else {
  3886. elem = LLVMBuildZExt(p->builder, elem, lit, "");
  3887. }
  3888. elem = LLVMBuildAnd(p->builder, elem, mask, "");
  3889. elem = LLVMBuildShl(p->builder, elem, LLVMConstInt(lit, f.bit_offset, false), "");
  3890. res = LLVMBuildOr(p->builder, res, elem, "");
  3891. }
  3892. LLVMBuildStore(p->builder, res, v.addr.value);
  3893. } else if (is_type_array(backing_type)) {
  3894. // ARRAY OF INTEGER BACKING
  3895. i64 array_count = backing_type->Array.count;
  3896. LLVMTypeRef lit = lb_type(p->module, core_type(backing_type->Array.elem));
  3897. gb_unused(array_count);
  3898. gb_unused(lit);
  3899. LLVMValueRef *elems = gb_alloc_array(temporary_allocator(), LLVMValueRef, array_count);
  3900. for (i64 i = 0; i < array_count; i++) {
  3901. elems[i] = LLVMConstInt(lit, 0, false);
  3902. }
  3903. u64 elem_bit_size = cast(u64)(8*type_size_of(backing_type->Array.elem));
  3904. u64 curr_bit_offset = 0;
  3905. for (isize i = 0; i < fields.count; i++) {
  3906. auto const &f = fields[i];
  3907. LLVMValueRef val = values[i].value;
  3908. LLVMTypeRef vt = lb_type(p->module, values[i].type);
  3909. for (u64 bits_to_set = f.bit_size;
  3910. bits_to_set > 0;
  3911. /**/) {
  3912. i64 elem_idx = curr_bit_offset/elem_bit_size;
  3913. u64 elem_bit_offset = curr_bit_offset%elem_bit_size;
  3914. u64 mask_width = gb_min(bits_to_set, elem_bit_size-elem_bit_offset);
  3915. GB_ASSERT(mask_width > 0);
  3916. bits_to_set -= mask_width;
  3917. LLVMValueRef mask = LLVMConstInt(vt, 1, false);
  3918. mask = LLVMConstShl(mask, LLVMConstInt(vt, mask_width, false));
  3919. mask = LLVMConstSub(mask, LLVMConstInt(vt, 1, false));
  3920. LLVMValueRef to_set = LLVMBuildAnd(p->builder, val, mask, "");
  3921. if (elem_bit_offset != 0) {
  3922. to_set = LLVMBuildShl(p->builder, to_set, LLVMConstInt(vt, elem_bit_offset, false), "");
  3923. }
  3924. to_set = LLVMBuildTrunc(p->builder, to_set, lit, "");
  3925. if (LLVMIsNull(elems[elem_idx])) {
  3926. elems[elem_idx] = to_set; // don't even bother doing `0 | to_set`
  3927. } else {
  3928. elems[elem_idx] = LLVMBuildOr(p->builder, elems[elem_idx], to_set, "");
  3929. }
  3930. if (mask_width != 0) {
  3931. val = LLVMBuildLShr(p->builder, val, LLVMConstInt(vt, mask_width, false), "");
  3932. }
  3933. curr_bit_offset += mask_width;
  3934. }
  3935. GB_ASSERT(curr_bit_offset == f.bit_offset + f.bit_size);
  3936. }
  3937. for (i64 i = 0; i < array_count; i++) {
  3938. LLVMValueRef elem_ptr = LLVMBuildStructGEP2(p->builder, lb_type(p->module, backing_type), v.addr.value, cast(unsigned)i, "");
  3939. LLVMBuildStore(p->builder, elems[i], elem_ptr);
  3940. }
  3941. } else {
  3942. // SLOW STORAGE
  3943. for_array(i, fields) {
  3944. auto const &f = fields[i];
  3945. if ((f.bit_offset & 7) == 0) {
  3946. u64 unpacked_bit_size = cast(u64)(8*type_size_of(f.field_type));
  3947. u64 byte_size = (f.bit_size+7)/8;
  3948. if (f.bit_offset + unpacked_bit_size <= total_bit_size) {
  3949. byte_size = unpacked_bit_size/8;
  3950. }
  3951. lbValue dst = lb_emit_ptr_offset(p, dst_byte_ptr, lb_const_int(p->module, t_int, f.bit_offset/8));
  3952. lbValue src = lb_address_from_load_or_generate_local(p, values[i]);
  3953. lb_mem_copy_non_overlapping(p, dst, src, lb_const_int(p->module, t_uintptr, byte_size));
  3954. } else {
  3955. lbAddr dst = lb_addr_bit_field(v.addr, f.field_type, f.bit_offset, f.bit_size);
  3956. lb_addr_store(p, dst, values[i]);
  3957. }
  3958. }
  3959. }
  3960. } else {
  3961. // individual storing
  3962. for_array(i, values) {
  3963. auto const &f = fields[i];
  3964. lbAddr dst = lb_addr_bit_field(v.addr, f.field_type, f.bit_offset, f.bit_size);
  3965. lb_addr_store(p, dst, values[i]);
  3966. }
  3967. }
  3968. return v;
  3969. }
  3970. case Type_Struct: {
  3971. // TODO(bill): "constant" '#raw_union's are not initialized constantly at the moment.
  3972. // NOTE(bill): This is due to the layout of the unions when printed to LLVM-IR
  3973. bool is_raw_union = is_type_raw_union(bt);
  3974. GB_ASSERT(is_type_struct(bt) || is_raw_union);
  3975. TypeStruct *st = &bt->Struct;
  3976. if (cl->elems.count > 0) {
  3977. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  3978. lbValue comp_lit_ptr = lb_addr_get_ptr(p, v);
  3979. for_array(field_index, cl->elems) {
  3980. Ast *elem = cl->elems[field_index];
  3981. lbValue field_expr = {};
  3982. Entity *field = nullptr;
  3983. isize index = field_index;
  3984. if (elem->kind == Ast_FieldValue) {
  3985. ast_node(fv, FieldValue, elem);
  3986. String name = fv->field->Ident.token.string;
  3987. Selection sel = lookup_field(bt, name, false);
  3988. GB_ASSERT(!sel.indirect);
  3989. elem = fv->value;
  3990. if (sel.index.count > 1) {
  3991. if (lb_is_nested_possibly_constant(type, sel, elem)) {
  3992. continue;
  3993. }
  3994. field_expr = lb_build_expr(p, elem);
  3995. field_expr = lb_emit_conv(p, field_expr, sel.entity->type);
  3996. if (sel.is_bit_field) {
  3997. Selection sub_sel = trim_selection(sel);
  3998. lbValue trimmed_dst = lb_emit_deep_field_gep(p, comp_lit_ptr, sub_sel);
  3999. Type *bf = base_type(type_deref(trimmed_dst.type));
  4000. if (is_type_pointer(bf)) {
  4001. trimmed_dst = lb_emit_load(p, trimmed_dst);
  4002. bf = base_type(type_deref(trimmed_dst.type));
  4003. }
  4004. GB_ASSERT(bf->kind == Type_BitField);
  4005. isize idx = sel.index[sel.index.count-1];
  4006. lbAddr dst = lb_addr_bit_field(trimmed_dst, bf->BitField.fields[idx]->type, bf->BitField.bit_offsets[idx], bf->BitField.bit_sizes[idx]);
  4007. lb_addr_store(p, dst, field_expr);
  4008. } else {
  4009. lbValue dst = lb_emit_deep_field_gep(p, comp_lit_ptr, sel);
  4010. lb_emit_store(p, dst, field_expr);
  4011. }
  4012. continue;
  4013. }
  4014. index = sel.index[0];
  4015. } else {
  4016. Selection sel = lookup_field_from_index(bt, st->fields[field_index]->Variable.field_index);
  4017. GB_ASSERT(sel.index.count == 1);
  4018. GB_ASSERT(!sel.indirect);
  4019. index = sel.index[0];
  4020. }
  4021. field = st->fields[index];
  4022. Type *ft = field->type;
  4023. if (!is_raw_union && !is_type_typeid(ft) && lb_is_elem_const(elem, ft)) {
  4024. continue;
  4025. }
  4026. field_expr = lb_build_expr(p, elem);
  4027. lbValue gep = {};
  4028. if (is_raw_union) {
  4029. gep = lb_emit_conv(p, comp_lit_ptr, alloc_type_pointer(ft));
  4030. } else {
  4031. gep = lb_emit_struct_ep(p, comp_lit_ptr, cast(i32)index);
  4032. }
  4033. Type *fet = field_expr.type;
  4034. GB_ASSERT(fet->kind != Type_Tuple);
  4035. // HACK TODO(bill): THIS IS A MASSIVE HACK!!!!
  4036. if (is_type_union(ft) && !are_types_identical(fet, ft) && !is_type_untyped(fet)) {
  4037. GB_ASSERT_MSG(union_variant_index(ft, fet) >= 0, "%s", type_to_string(fet));
  4038. lb_emit_store_union_variant(p, gep, field_expr, fet);
  4039. } else {
  4040. lbValue fv = lb_emit_conv(p, field_expr, ft);
  4041. lb_emit_store(p, gep, fv);
  4042. }
  4043. }
  4044. }
  4045. break;
  4046. }
  4047. case Type_Map: {
  4048. if (cl->elems.count == 0) {
  4049. break;
  4050. }
  4051. GB_ASSERT(!build_context.no_dynamic_literals);
  4052. lbValue err = lb_dynamic_map_reserve(p, v.addr, 2*cl->elems.count, pos);
  4053. gb_unused(err);
  4054. for (Ast *elem : cl->elems) {
  4055. ast_node(fv, FieldValue, elem);
  4056. lbValue key = lb_build_expr(p, fv->field);
  4057. lbValue value = lb_build_expr(p, fv->value);
  4058. lb_internal_dynamic_map_set(p, v.addr, type, key, value, elem);
  4059. }
  4060. break;
  4061. }
  4062. case Type_Array: {
  4063. if (cl->elems.count > 0) {
  4064. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4065. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4066. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4067. lbValue dst_ptr = lb_addr_get_ptr(p, v);
  4068. for_array(i, temp_data) {
  4069. i32 index = cast(i32)(temp_data[i].elem_index);
  4070. temp_data[i].gep = lb_emit_array_epi(p, dst_ptr, index);
  4071. }
  4072. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4073. }
  4074. break;
  4075. }
  4076. case Type_EnumeratedArray: {
  4077. if (cl->elems.count > 0) {
  4078. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4079. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4080. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4081. lbValue dst_ptr = lb_addr_get_ptr(p, v);
  4082. i64 index_offset = exact_value_to_i64(*bt->EnumeratedArray.min_value);
  4083. for_array(i, temp_data) {
  4084. i32 index = cast(i32)(temp_data[i].elem_index - index_offset);
  4085. temp_data[i].gep = lb_emit_array_epi(p, dst_ptr, index);
  4086. }
  4087. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4088. }
  4089. break;
  4090. }
  4091. case Type_Slice: {
  4092. if (cl->elems.count > 0) {
  4093. lbValue slice = lb_const_value(p->module, type, exact_value_compound(expr));
  4094. lbValue data = lb_slice_elem(p, slice);
  4095. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4096. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4097. for_array(i, temp_data) {
  4098. temp_data[i].gep = lb_emit_ptr_offset(p, data, lb_const_int(p->module, t_int, temp_data[i].elem_index));
  4099. }
  4100. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4101. {
  4102. lbValue count = {};
  4103. count.type = t_int;
  4104. unsigned len_index = lb_convert_struct_index(p->module, type, 1);
  4105. if (lb_is_const(slice)) {
  4106. unsigned indices[1] = {len_index};
  4107. count.value = llvm_const_extract_value(p->module, slice.value, indices, gb_count_of(indices));
  4108. } else {
  4109. count.value = LLVMBuildExtractValue(p->builder, slice.value, len_index, "");
  4110. }
  4111. lb_fill_slice(p, v, data, count);
  4112. }
  4113. }
  4114. break;
  4115. }
  4116. case Type_DynamicArray: {
  4117. if (cl->elems.count == 0) {
  4118. break;
  4119. }
  4120. GB_ASSERT(!build_context.no_dynamic_literals);
  4121. Type *et = bt->DynamicArray.elem;
  4122. lbValue size = lb_const_int(p->module, t_int, type_size_of(et));
  4123. lbValue align = lb_const_int(p->module, t_int, type_align_of(et));
  4124. i64 item_count = gb_max(cl->max_count, cl->elems.count);
  4125. {
  4126. auto args = array_make<lbValue>(temporary_allocator(), 5);
  4127. args[0] = lb_emit_conv(p, lb_addr_get_ptr(p, v), t_rawptr);
  4128. args[1] = size;
  4129. args[2] = align;
  4130. args[3] = lb_const_int(p->module, t_int, item_count);
  4131. args[4] = lb_emit_source_code_location_as_global(p, proc_name, pos);
  4132. lb_emit_runtime_call(p, "__dynamic_array_reserve", args);
  4133. }
  4134. lbValue items = lb_generate_local_array(p, et, item_count);
  4135. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4136. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4137. for_array(i, temp_data) {
  4138. temp_data[i].gep = lb_emit_array_epi(p, items, temp_data[i].elem_index);
  4139. }
  4140. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4141. {
  4142. auto args = array_make<lbValue>(temporary_allocator(), 6);
  4143. args[0] = lb_emit_conv(p, v.addr, t_rawptr);
  4144. args[1] = size;
  4145. args[2] = align;
  4146. args[3] = lb_emit_conv(p, items, t_rawptr);
  4147. args[4] = lb_const_int(p->module, t_int, item_count);
  4148. args[5] = lb_emit_source_code_location_as_global(p, proc_name, pos);
  4149. lb_emit_runtime_call(p, "__dynamic_array_append", args);
  4150. }
  4151. break;
  4152. }
  4153. case Type_Basic: {
  4154. GB_ASSERT(is_type_any(bt));
  4155. if (cl->elems.count > 0) {
  4156. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4157. String field_names[2] = {
  4158. str_lit("data"),
  4159. str_lit("id"),
  4160. };
  4161. Type *field_types[2] = {
  4162. t_rawptr,
  4163. t_typeid,
  4164. };
  4165. for_array(field_index, cl->elems) {
  4166. Ast *elem = cl->elems[field_index];
  4167. lbValue field_expr = {};
  4168. isize index = field_index;
  4169. if (elem->kind == Ast_FieldValue) {
  4170. ast_node(fv, FieldValue, elem);
  4171. Selection sel = lookup_field(bt, fv->field->Ident.token.string, false);
  4172. index = sel.index[0];
  4173. elem = fv->value;
  4174. } else {
  4175. TypeAndValue tav = type_and_value_of_expr(elem);
  4176. Selection sel = lookup_field(bt, field_names[field_index], false);
  4177. index = sel.index[0];
  4178. }
  4179. field_expr = lb_build_expr(p, elem);
  4180. GB_ASSERT(field_expr.type->kind != Type_Tuple);
  4181. Type *ft = field_types[index];
  4182. lbValue fv = lb_emit_conv(p, field_expr, ft);
  4183. lbValue gep = lb_emit_struct_ep(p, lb_addr_get_ptr(p, v), cast(i32)index);
  4184. lb_emit_store(p, gep, fv);
  4185. }
  4186. }
  4187. break;
  4188. }
  4189. case Type_BitSet: {
  4190. i64 sz = type_size_of(type);
  4191. if (cl->elems.count > 0 && sz > 0) {
  4192. lbValue lower = lb_const_value(p->module, t_int, exact_value_i64(bt->BitSet.lower));
  4193. Type *backing = bit_set_to_int(type);
  4194. if (is_type_array(backing)) {
  4195. GB_PANIC("TODO: bit_set [N]T");
  4196. Type *base_it = core_array_type(backing);
  4197. i64 bits_per_elem = 8*type_size_of(base_it);
  4198. gb_unused(bits_per_elem);
  4199. lbValue one = lb_const_value(p->module, t_i64, exact_value_i64(1));
  4200. for (Ast *elem : cl->elems) {
  4201. GB_ASSERT(elem->kind != Ast_FieldValue);
  4202. lbValue expr = lb_build_expr(p, elem);
  4203. GB_ASSERT(expr.type->kind != Type_Tuple);
  4204. lbValue e = lb_emit_conv(p, expr, t_i64);
  4205. e = lb_emit_arith(p, Token_Sub, e, lower, t_i64);
  4206. // lbValue idx = lb_emit_arith(p, Token_Div, e, bits_per_elem, t_i64);
  4207. // lbValue val = lb_emit_arith(p, Token_Div, e, bits_per_elem, t_i64);
  4208. }
  4209. } else {
  4210. Type *it = bit_set_to_int(bt);
  4211. lbValue one = lb_const_value(p->module, it, exact_value_i64(1));
  4212. for (Ast *elem : cl->elems) {
  4213. GB_ASSERT(elem->kind != Ast_FieldValue);
  4214. lbValue expr = lb_build_expr(p, elem);
  4215. GB_ASSERT(expr.type->kind != Type_Tuple);
  4216. lbValue e = lb_emit_conv(p, expr, it);
  4217. e = lb_emit_arith(p, Token_Sub, e, lower, it);
  4218. e = lb_emit_arith(p, Token_Shl, one, e, it);
  4219. lbValue old_value = lb_emit_transmute(p, lb_addr_load(p, v), it);
  4220. lbValue new_value = lb_emit_arith(p, Token_Or, old_value, e, it);
  4221. new_value = lb_emit_transmute(p, new_value, type);
  4222. lb_addr_store(p, v, new_value);
  4223. }
  4224. }
  4225. }
  4226. break;
  4227. }
  4228. case Type_Matrix: {
  4229. if (cl->elems.count > 0) {
  4230. lb_addr_store(p, v, lb_const_value(p->module, type, exact_value_compound(expr)));
  4231. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4232. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4233. lbValue dst_ptr = lb_addr_get_ptr(p, v);
  4234. for_array(i, temp_data) {
  4235. temp_data[i].gep = lb_emit_array_epi(p, dst_ptr, temp_data[i].elem_index);
  4236. }
  4237. lb_build_addr_compound_lit_assign_array(p, temp_data);
  4238. }
  4239. break;
  4240. }
  4241. case Type_SimdVector: {
  4242. if (cl->elems.count > 0) {
  4243. lbValue vector_value = lb_const_value(p->module, type, exact_value_compound(expr));
  4244. defer (lb_addr_store(p, v, vector_value));
  4245. auto temp_data = array_make<lbCompoundLitElemTempData>(temporary_allocator(), 0, cl->elems.count);
  4246. lb_build_addr_compound_lit_populate(p, cl->elems, &temp_data, type);
  4247. // TODO(bill): reduce the need for individual `insertelement` if a `shufflevector`
  4248. // might be a better option
  4249. for (auto const &td : temp_data) {
  4250. if (td.value.value != nullptr) {
  4251. if (td.elem_length > 0) {
  4252. for (i64 k = 0; k < td.elem_length; k++) {
  4253. LLVMValueRef index = lb_const_int(p->module, t_u32, td.elem_index + k).value;
  4254. vector_value.value = LLVMBuildInsertElement(p->builder, vector_value.value, td.value.value, index, "");
  4255. }
  4256. } else {
  4257. LLVMValueRef index = lb_const_int(p->module, t_u32, td.elem_index).value;
  4258. vector_value.value = LLVMBuildInsertElement(p->builder, vector_value.value, td.value.value, index, "");
  4259. }
  4260. }
  4261. }
  4262. }
  4263. break;
  4264. }
  4265. }
  4266. return v;
  4267. }
  4268. gb_internal lbAddr lb_build_addr_internal(lbProcedure *p, Ast *expr) {
  4269. switch (expr->kind) {
  4270. case_ast_node(i, Implicit, expr);
  4271. lbAddr v = {};
  4272. switch (i->kind) {
  4273. case Token_context:
  4274. v = lb_find_or_generate_context_ptr(p);
  4275. break;
  4276. }
  4277. GB_ASSERT(v.addr.value != nullptr);
  4278. return v;
  4279. case_end;
  4280. case_ast_node(i, Ident, expr);
  4281. if (is_blank_ident(expr)) {
  4282. lbAddr val = {};
  4283. return val;
  4284. }
  4285. String name = i->token.string;
  4286. Entity *e = entity_of_node(expr);
  4287. return lb_build_addr_from_entity(p, e, expr);
  4288. case_end;
  4289. case_ast_node(se, SelectorExpr, expr);
  4290. Ast *sel_node = unparen_expr(se->selector);
  4291. if (sel_node->kind == Ast_Ident) {
  4292. String selector = sel_node->Ident.token.string;
  4293. TypeAndValue tav = type_and_value_of_expr(se->expr);
  4294. if (tav.mode == Addressing_Invalid) {
  4295. // NOTE(bill): Imports
  4296. Entity *imp = entity_of_node(se->expr);
  4297. if (imp != nullptr) {
  4298. GB_ASSERT(imp->kind == Entity_ImportName);
  4299. }
  4300. return lb_build_addr(p, unparen_expr(se->selector));
  4301. }
  4302. Type *type = base_type(tav.type);
  4303. if (tav.mode == Addressing_Type) { // Addressing_Type
  4304. Selection sel = lookup_field(tav.type, selector, true);
  4305. if (sel.pseudo_field) {
  4306. GB_ASSERT(sel.entity->kind == Entity_Procedure || sel.entity->kind == Entity_ProcGroup);
  4307. Entity *e = entity_of_node(sel_node);
  4308. GB_ASSERT(e->kind == Entity_Procedure);
  4309. return lb_addr(lb_find_value_from_entity(p->module, e));
  4310. }
  4311. GB_PANIC("Unreachable %.*s", LIT(selector));
  4312. }
  4313. if (se->swizzle_count > 0) {
  4314. Type *array_type = base_type(type_deref(tav.type));
  4315. GB_ASSERT(array_type->kind == Type_Array || array_type->kind == Type_SimdVector);
  4316. u8 swizzle_count = se->swizzle_count;
  4317. u8 swizzle_indices_raw = se->swizzle_indices;
  4318. u8 swizzle_indices[4] = {};
  4319. for (u8 i = 0; i < swizzle_count; i++) {
  4320. u8 index = swizzle_indices_raw>>(i*2) & 3;
  4321. swizzle_indices[i] = index;
  4322. }
  4323. lbValue a = {};
  4324. if (is_type_pointer(tav.type)) {
  4325. a = lb_build_expr(p, se->expr);
  4326. } else {
  4327. lbAddr addr = lb_build_addr(p, se->expr);
  4328. a = lb_addr_get_ptr(p, addr);
  4329. }
  4330. Type *type = type_deref(expr->tav.type);
  4331. GB_ASSERT(is_type_array(type) || is_type_simd_vector(type));
  4332. return lb_addr_swizzle(a, type, swizzle_count, swizzle_indices);
  4333. }
  4334. Selection sel = lookup_field(type, selector, false);
  4335. GB_ASSERT(sel.entity != nullptr);
  4336. if (sel.pseudo_field) {
  4337. GB_ASSERT(sel.entity->kind == Entity_Procedure || sel.entity->kind == Entity_ProcGroup);
  4338. Entity *e = entity_of_node(sel_node);
  4339. GB_ASSERT(e->kind == Entity_Procedure);
  4340. return lb_addr(lb_find_value_from_entity(p->module, e));
  4341. }
  4342. if (sel.is_bit_field) {
  4343. lbAddr addr = lb_build_addr(p, se->expr);
  4344. Selection sub_sel = sel;
  4345. sub_sel.index.count -= 1;
  4346. lbValue ptr = lb_addr_get_ptr(p, addr);
  4347. if (sub_sel.index.count > 0) {
  4348. ptr = lb_emit_deep_field_gep(p, ptr, sub_sel);
  4349. }
  4350. if (is_type_pointer(type_deref(ptr.type))) {
  4351. ptr = lb_emit_load(p, ptr);
  4352. }
  4353. Type *bf_type = type_deref(ptr.type);
  4354. bf_type = base_type(bf_type);
  4355. GB_ASSERT(bf_type->kind == Type_BitField);
  4356. i32 index = sel.index[sel.index.count-1];
  4357. Entity *f = bf_type->BitField.fields[index];
  4358. u8 bit_size = bf_type->BitField.bit_sizes[index];
  4359. i64 bit_offset = bf_type->BitField.bit_offsets[index];
  4360. return lb_addr_bit_field(ptr, f->type, bit_offset, bit_size);
  4361. }
  4362. {
  4363. lbAddr addr = lb_build_addr(p, se->expr);
  4364. if (addr.kind == lbAddr_Map) {
  4365. lbValue v = lb_addr_load(p, addr);
  4366. lbValue a = lb_address_from_load_or_generate_local(p, v);
  4367. a = lb_emit_deep_field_gep(p, a, sel);
  4368. return lb_addr(a);
  4369. } else if (addr.kind == lbAddr_Context) {
  4370. GB_ASSERT(sel.index.count > 0);
  4371. if (addr.ctx.sel.index.count >= 0) {
  4372. sel = selection_combine(addr.ctx.sel, sel);
  4373. }
  4374. addr.ctx.sel = sel;
  4375. addr.kind = lbAddr_Context;
  4376. return addr;
  4377. } else if (addr.kind == lbAddr_SoaVariable) {
  4378. lbValue index = addr.soa.index;
  4379. i32 first_index = sel.index[0];
  4380. Selection sub_sel = sel;
  4381. sub_sel.index.data += 1;
  4382. sub_sel.index.count -= 1;
  4383. lbValue arr = lb_emit_struct_ep(p, addr.addr, first_index);
  4384. Type *t = base_type(type_deref(addr.addr.type));
  4385. GB_ASSERT(is_type_soa_struct(t));
  4386. if (addr.soa.index_expr != nullptr && (!lb_is_const(addr.soa.index) || t->Struct.soa_kind != StructSoa_Fixed)) {
  4387. lbValue len = lb_soa_struct_len(p, addr.addr);
  4388. lb_emit_bounds_check(p, ast_token(addr.soa.index_expr), addr.soa.index, len);
  4389. }
  4390. lbValue item = {};
  4391. if (t->Struct.soa_kind == StructSoa_Fixed) {
  4392. item = lb_emit_array_ep(p, arr, index);
  4393. } else {
  4394. item = lb_emit_ptr_offset(p, lb_emit_load(p, arr), index);
  4395. }
  4396. if (sub_sel.index.count > 0) {
  4397. item = lb_emit_deep_field_gep(p, item, sub_sel);
  4398. }
  4399. // make sure it's ^T and not [^]T
  4400. item.type = alloc_type_multi_pointer_to_pointer(item.type);
  4401. return lb_addr(item);
  4402. } else if (addr.kind == lbAddr_Swizzle) {
  4403. GB_ASSERT(sel.index.count > 0);
  4404. // NOTE(bill): just patch the index in place
  4405. sel.index[0] = addr.swizzle.indices[sel.index[0]];
  4406. } else if (addr.kind == lbAddr_SwizzleLarge) {
  4407. GB_ASSERT(sel.index.count > 0);
  4408. // NOTE(bill): just patch the index in place
  4409. sel.index[0] = addr.swizzle.indices[sel.index[0]];
  4410. }
  4411. Type *atype = type_deref(lb_addr_type(addr));
  4412. if (is_type_soa_struct(atype)) {
  4413. map_set(&p->selector_addr, expr, addr);
  4414. }
  4415. lbValue a = lb_addr_get_ptr(p, addr);
  4416. a = lb_emit_deep_field_gep(p, a, sel);
  4417. return lb_addr(a);
  4418. }
  4419. } else {
  4420. GB_PANIC("Unsupported selector expression");
  4421. }
  4422. case_end;
  4423. case_ast_node(se, SelectorCallExpr, expr);
  4424. lbValue e = lb_build_expr(p, expr);
  4425. return lb_addr(lb_address_from_load_or_generate_local(p, e));
  4426. case_end;
  4427. case_ast_node(ta, TypeAssertion, expr);
  4428. TokenPos pos = ast_token(expr).pos;
  4429. lbValue e = lb_build_expr(p, ta->expr);
  4430. Type *t = type_deref(e.type);
  4431. if (is_type_union(t)) {
  4432. Type *type = type_of_expr(expr);
  4433. lbAddr v = lb_add_local_generated(p, type, false);
  4434. lb_addr_store(p, v, lb_emit_union_cast(p, lb_build_expr(p, ta->expr), type, pos));
  4435. return v;
  4436. } else if (is_type_any(t)) {
  4437. Type *type = type_of_expr(expr);
  4438. return lb_emit_any_cast_addr(p, lb_build_expr(p, ta->expr), type, pos);
  4439. } else {
  4440. GB_PANIC("TODO(bill): type assertion %s", type_to_string(e.type));
  4441. }
  4442. case_end;
  4443. case_ast_node(ue, UnaryExpr, expr);
  4444. switch (ue->op.kind) {
  4445. case Token_And: {
  4446. lbValue ptr = lb_build_expr(p, expr);
  4447. return lb_addr(lb_address_from_load_or_generate_local(p, ptr));
  4448. }
  4449. default:
  4450. GB_PANIC("Invalid unary expression for lb_build_addr");
  4451. }
  4452. case_end;
  4453. case_ast_node(be, BinaryExpr, expr);
  4454. lbValue v = lb_build_expr(p, expr);
  4455. Type *t = v.type;
  4456. if (is_type_pointer(t)) {
  4457. return lb_addr(v);
  4458. }
  4459. return lb_addr(lb_address_from_load_or_generate_local(p, v));
  4460. case_end;
  4461. case_ast_node(ie, IndexExpr, expr);
  4462. return lb_build_addr_index_expr(p, expr);
  4463. case_end;
  4464. case_ast_node(ie, MatrixIndexExpr, expr);
  4465. Type *t = base_type(type_of_expr(ie->expr));
  4466. bool deref = is_type_pointer(t);
  4467. t = base_type(type_deref(t));
  4468. lbValue m = {};
  4469. m = lb_build_addr_ptr(p, ie->expr);
  4470. if (deref) {
  4471. m = lb_emit_load(p, m);
  4472. }
  4473. lbValue row_index = lb_build_expr(p, ie->row_index);
  4474. lbValue column_index = lb_build_expr(p, ie->column_index);
  4475. row_index = lb_emit_conv(p, row_index, t_int);
  4476. column_index = lb_emit_conv(p, column_index, t_int);
  4477. lbValue elem = lb_emit_matrix_ep(p, m, row_index, column_index);
  4478. auto row_index_tv = type_and_value_of_expr(ie->row_index);
  4479. auto column_index_tv = type_and_value_of_expr(ie->column_index);
  4480. if (row_index_tv.mode != Addressing_Constant || column_index_tv.mode != Addressing_Constant) {
  4481. lbValue row_count = lb_const_int(p->module, t_int, t->Matrix.row_count);
  4482. lbValue column_count = lb_const_int(p->module, t_int, t->Matrix.column_count);
  4483. lb_emit_matrix_bounds_check(p, ast_token(ie->row_index), row_index, column_index, row_count, column_count);
  4484. }
  4485. return lb_addr(elem);
  4486. case_end;
  4487. case_ast_node(se, SliceExpr, expr);
  4488. return lb_build_addr_slice_expr(p, expr);
  4489. case_end;
  4490. case_ast_node(de, DerefExpr, expr);
  4491. Type *t = type_of_expr(de->expr);
  4492. if (is_type_relative_pointer(t)) {
  4493. lbAddr addr = lb_build_addr(p, de->expr);
  4494. addr.relative.deref = true;
  4495. return addr;
  4496. } else if (is_type_soa_pointer(t)) {
  4497. lbValue value = lb_build_expr(p, de->expr);
  4498. lbValue ptr = lb_emit_struct_ev(p, value, 0);
  4499. lbValue idx = lb_emit_struct_ev(p, value, 1);
  4500. return lb_addr_soa_variable(ptr, idx, nullptr);
  4501. }
  4502. lbValue addr = lb_build_expr(p, de->expr);
  4503. return lb_addr(addr);
  4504. case_end;
  4505. case_ast_node(ce, CallExpr, expr);
  4506. BuiltinProcId builtin_id = BuiltinProc_Invalid;
  4507. if (ce->proc->tav.mode == Addressing_Builtin) {
  4508. Entity *e = entity_of_node(ce->proc);
  4509. if (e != nullptr) {
  4510. builtin_id = cast(BuiltinProcId)e->Builtin.id;
  4511. } else {
  4512. builtin_id = BuiltinProc_DIRECTIVE;
  4513. }
  4514. }
  4515. auto const &tv = expr->tav;
  4516. if (builtin_id == BuiltinProc_swizzle &&
  4517. is_type_array(tv.type)) {
  4518. // NOTE(bill, 2021-08-09): `swizzle` has some bizarre semantics so it needs to be
  4519. // specialized here for to be addressable
  4520. return lb_build_array_swizzle_addr(p, ce, tv);
  4521. }
  4522. // NOTE(bill): This is make sure you never need to have an 'array_ev'
  4523. lbValue e = lb_build_expr(p, expr);
  4524. #if 1
  4525. return lb_addr(lb_address_from_load_or_generate_local(p, e));
  4526. #else
  4527. lbAddr v = lb_add_local_generated(p, e.type, false);
  4528. lb_addr_store(p, v, e);
  4529. return v;
  4530. #endif
  4531. case_end;
  4532. case_ast_node(cl, CompoundLit, expr);
  4533. return lb_build_addr_compound_lit(p, expr);
  4534. case_end;
  4535. case_ast_node(tc, TypeCast, expr);
  4536. Type *type = type_of_expr(expr);
  4537. lbValue x = lb_build_expr(p, tc->expr);
  4538. lbValue e = {};
  4539. switch (tc->token.kind) {
  4540. case Token_cast:
  4541. e = lb_emit_conv(p, x, type);
  4542. break;
  4543. case Token_transmute:
  4544. e = lb_emit_transmute(p, x, type);
  4545. break;
  4546. default:
  4547. GB_PANIC("Invalid AST TypeCast");
  4548. }
  4549. lbAddr v = lb_add_local_generated(p, type, false);
  4550. lb_addr_store(p, v, e);
  4551. return v;
  4552. case_end;
  4553. case_ast_node(ac, AutoCast, expr);
  4554. return lb_build_addr(p, ac->expr);
  4555. case_end;
  4556. case_ast_node(te, TernaryIfExpr, expr);
  4557. LLVMValueRef incoming_values[2] = {};
  4558. LLVMBasicBlockRef incoming_blocks[2] = {};
  4559. GB_ASSERT(te->y != nullptr);
  4560. lbBlock *then = lb_create_block(p, "if.then");
  4561. lbBlock *done = lb_create_block(p, "if.done"); // NOTE(bill): Append later
  4562. lbBlock *else_ = lb_create_block(p, "if.else");
  4563. lb_build_cond(p, te->cond, then, else_);
  4564. lb_start_block(p, then);
  4565. Type *ptr_type = alloc_type_pointer(default_type(type_of_expr(expr)));
  4566. incoming_values[0] = lb_emit_conv(p, lb_build_addr_ptr(p, te->x), ptr_type).value;
  4567. lb_emit_jump(p, done);
  4568. lb_start_block(p, else_);
  4569. incoming_values[1] = lb_emit_conv(p, lb_build_addr_ptr(p, te->y), ptr_type).value;
  4570. lb_emit_jump(p, done);
  4571. lb_start_block(p, done);
  4572. lbValue res = {};
  4573. res.value = LLVMBuildPhi(p->builder, lb_type(p->module, ptr_type), "");
  4574. res.type = ptr_type;
  4575. GB_ASSERT(p->curr_block->preds.count >= 2);
  4576. incoming_blocks[0] = p->curr_block->preds[0]->block;
  4577. incoming_blocks[1] = p->curr_block->preds[1]->block;
  4578. LLVMAddIncoming(res.value, incoming_values, incoming_blocks, 2);
  4579. return lb_addr(res);
  4580. case_end;
  4581. case_ast_node(oe, OrElseExpr, expr);
  4582. lbValue ptr = lb_address_from_load_or_generate_local(p, lb_build_expr(p, expr));
  4583. return lb_addr(ptr);
  4584. case_end;
  4585. case_ast_node(oe, OrReturnExpr, expr);
  4586. lbValue ptr = lb_address_from_load_or_generate_local(p, lb_build_expr(p, expr));
  4587. return lb_addr(ptr);
  4588. case_end;
  4589. case_ast_node(be, OrBranchExpr, expr);
  4590. lbBlock *block = nullptr;
  4591. if (be->label != nullptr) {
  4592. lbBranchBlocks bb = lb_lookup_branch_blocks(p, be->label);
  4593. switch (be->token.kind) {
  4594. case Token_or_break: block = bb.break_; break;
  4595. case Token_or_continue: block = bb.continue_; break;
  4596. }
  4597. } else {
  4598. for (lbTargetList *t = p->target_list; t != nullptr && block == nullptr; t = t->prev) {
  4599. if (t->is_block) {
  4600. continue;
  4601. }
  4602. switch (be->token.kind) {
  4603. case Token_or_break: block = t->break_; break;
  4604. case Token_or_continue: block = t->continue_; break;
  4605. }
  4606. }
  4607. }
  4608. GB_ASSERT(block != nullptr);
  4609. TypeAndValue tv = expr->tav;
  4610. lbValue lhs = {};
  4611. lbValue rhs = {};
  4612. lb_emit_try_lhs_rhs(p, be->expr, tv, &lhs, &rhs);
  4613. Type *type = default_type(tv.type);
  4614. if (lhs.value) {
  4615. lhs = lb_emit_conv(p, lhs, type);
  4616. } else if (type != nullptr && type != t_invalid) {
  4617. lhs = lb_const_nil(p->module, type);
  4618. }
  4619. lbBlock *then = lb_create_block(p, "or_branch.then");
  4620. lbBlock *else_ = lb_create_block(p, "or_branch.else");
  4621. lb_emit_if(p, lb_emit_try_has_value(p, rhs), then, else_);
  4622. lb_start_block(p, else_);
  4623. lb_emit_defer_stmts(p, lbDeferExit_Branch, block);
  4624. lb_emit_jump(p, block);
  4625. lb_start_block(p, then);
  4626. return lb_addr(lb_address_from_load_or_generate_local(p, lhs));
  4627. case_end;
  4628. }
  4629. TokenPos token_pos = ast_token(expr).pos;
  4630. GB_PANIC("Unexpected address expression\n"
  4631. "\tAst: %.*s @ "
  4632. "%s\n",
  4633. LIT(ast_strings[expr->kind]),
  4634. token_pos_to_string(token_pos));
  4635. return {};
  4636. }